00001
00002
00003
00004
00005
00006
00007
00008
00009
00010
00011
00012
00013
00014
00015
00016
00017
00018
00019
00020
00021
00022
00023
00024
00025
00026
00027
00028
00029
00030
00031
00032
00033
00034
00035
00036
00037
00038
00039
00040
00041
00042
00043
00044
00045
00046
00047
00048
00049
00050
00051
00052
00053
00054
00055 #if !defined(ALIZE_GMMTokenizer_cpp)
00056 #define ALIZE_GMMTokenizer_cpp
00057
00058 #include <iostream>
00059 #include <fstream>
00060 #include <cstdio>
00061 #include <cassert>
00062 #include <cmath>
00063 #include "GmmTokenizer.h"
00064 #include "liatools.h"
00065
00066 using namespace alize;
00067 using namespace std;
00068
00069 void computeConfusionMatrix(Feature & f,StatServer &ss, MixtureGDStat &acc, unsigned long & nBest, Matrix <unsigned long> & mce_matrix) {
00070
00071 acc.computeAndAccumulateLLK(f,1.0,DETERMINE_TOP_DISTRIBS);
00072 const LKVector& v = ss.getTopDistribIndexVector();
00073 const unsigned long bestDistrib=v[0].idx;
00074 for (unsigned long i=0; i<nBest;i++)
00075 mce_matrix(bestDistrib,v[i].idx)++;
00076 acc.resetLLK();
00077 }
00078
00079 void computeConfusionMatrix(Seg * seg, FeatureServer & fs, StatServer & ss, MixtureGDStat & acc, unsigned long & nBest,Matrix <unsigned long> &mce_matrix) {
00080 unsigned long idxBeginFrame=seg->begin()+fs.getFirstFeatureIndexOfASource(seg->sourceName());
00081 fs.seekFeature(idxBeginFrame);
00082 Feature f;
00083 for (unsigned long idxFrame=0;idxFrame<seg->length();idxFrame++){
00084 fs.readFeature(f);
00085 computeConfusionMatrix(f,ss,acc,nBest,mce_matrix);
00086 }
00087 }
00088
00089 void computeConfusionMatrix(SegCluster & selectedSegments, FeatureServer & fs, StatServer & ss, MixtureGD & world, unsigned long & nBest, Matrix <unsigned long> & mce_matrix) {
00090 MixtureGDStat &acc=ss.createAndStoreMixtureGDStat(world);
00091 Seg* seg;
00092 selectedSegments.rewind();
00093 while((seg=selectedSegments.getSeg())!=NULL){
00094 computeConfusionMatrix(seg, fs, ss,acc,nBest, mce_matrix) ;
00095 }
00096 }
00097
00098
00099 void computeSymbols(Feature & f, MixtureGD & world, StatServer & ss, ULongVector & stream, Config & config) {
00100 ss.computeAndAccumulateLLK(world, f,DETERMINE_TOP_DISTRIBS);
00101 const LKVector& v = ss.getTopDistribIndexVector();
00102 const unsigned long bestDistrib=v[0].idx;
00103 stream.addValue(bestDistrib);
00104 }
00105
00106
00107 void computeSymbols(Seg* seg, FeatureServer & fs, MixtureGD & world, StatServer & ss, ULongVector & stream,Config & config) {
00108 unsigned long idxBeginFrame=seg->begin()+fs.getFirstFeatureIndexOfASource(seg->sourceName());
00109 fs.seekFeature(idxBeginFrame);
00110 Feature f;
00111 for (unsigned long idxFrame=0;idxFrame<seg->length();idxFrame++){
00112 fs.readFeature(f);
00113 computeSymbols(f,world,ss,stream,config);
00114 }
00115 }
00116
00117 void computeSymbols(SegCluster & selectedSegments, FeatureServer & fs, MixtureGD & world, StatServer & ss, ULongVector & stream, Config & config) {
00118 Seg* seg;
00119 selectedSegments.rewind();
00120 while((seg=selectedSegments.getSeg())!=NULL){
00121 computeSymbols(seg, fs, world, ss, stream, config);
00122 }
00123 }
00124
00125 int GaussianConfusionMatrix(Config & config)
00126 {
00127 String inputNDXFileName = config.getParam("inputFeatureFilename");
00128 String inputWorldFilename = config.getParam("inputWorldModelName");
00129 String labelSelectedFrames =config.getParam("labelSelectedFrames");
00130
00131 String matrixName=config.getParam("matrixOutputName");
00132 unsigned long nBest =config.getParam("topDistribsCount").toLong();
00133
00134 try{
00135 XList ndx(inputNDXFileName,config);
00136 XLine *linep;
00137 ndx.getLine(0);
00138 MixtureServer ms(config);
00139 StatServer ss(config, ms);
00140 MixtureGD& world = ms.loadMixtureGD(inputWorldFilename);
00141 if (verbose) cout << "Confusion Matrix Memory Allocation" << endl;
00142 unsigned long model_size=world.getDistribCount();
00143 Matrix <unsigned long> mce_matrix;
00144 mce_matrix.setDimensions(model_size,model_size);
00145
00146 while ((linep=ndx.getLine()) != NULL){
00147 String &featureFileName=linep->getElement(0);
00148 FeatureServer fs(config,featureFileName);
00149 SegServer segmentsServer;
00150 LabelServer labelServer;
00151 initializeClusters(featureFileName,segmentsServer,labelServer,config);
00152 verifyClusterFile(segmentsServer,fs,config);
00153 unsigned long codeSelectedFrame=labelServer.getLabelIndexByString(labelSelectedFrames);
00154 SegCluster& selectedSegments=segmentsServer.getCluster(codeSelectedFrame);
00155 if (verbose) cout << "test seg["<<featureFileName<<"]"<< endl;
00156 computeConfusionMatrix(selectedSegments, fs, ss, world, nBest, mce_matrix);
00157 }
00158 mce_matrix.save(matrixName,config);
00159
00160 }
00161
00162 catch (Exception& e){
00163 cout << e.toString().c_str() << endl;
00164 }
00165 return 0;
00166
00167 }
00168
00169
00170 int GMMTokenizer(Config & config)
00171 {
00172 String inputNDXFileName = config.getParam("inputFeatureFilename");
00173 String inputWorldFilename = config.getParam("inputWorldModelName");
00174 String labelSelectedFrames =config.getParam("labelSelectedFrames");
00175 String matrixName, symbolsFilesPath;
00176 symbolsFilesPath=config.getParam("symbolsFilesPath");
00177
00178 try{
00179 XList ndx(inputNDXFileName,config);
00180 XLine *linep;
00181 ndx.getLine(0);
00182 MixtureServer ms(config);
00183 StatServer ss(config, ms);
00184 MixtureGD& world = ms.loadMixtureGD(inputWorldFilename);
00185
00186 while ((linep=ndx.getLine()) != NULL){
00187 String &featureFileName=linep->getElement(0);
00188 FeatureServer fs(config,featureFileName);
00189 SegServer segmentsServer;
00190 LabelServer labelServer;
00191 initializeClusters(featureFileName,segmentsServer,labelServer,config);
00192 verifyClusterFile(segmentsServer,fs,config);
00193 unsigned long codeSelectedFrame=labelServer.getLabelIndexByString(labelSelectedFrames);
00194 SegCluster& selectedSegments=segmentsServer.getCluster(codeSelectedFrame);
00195 if (verbose) cout << "test seg["<<featureFileName<<"]"<< endl;
00196 ULongVector stream;
00197 computeSymbols(selectedSegments, fs, world, ss, stream,config);
00198 String output="./"+symbolsFilesPath+"/"+featureFileName+".sym";
00199 stream.save(output);
00200 }
00201 }
00202
00203 catch (Exception& e){
00204 cout << e.toString().c_str() << endl;
00205 }
00206 return 0;
00207
00208 }
00209
00210 #endif //!defined(ALIZE_GMMTokenizer_cpp)