modelToSvMain.cpp

Go to the documentation of this file.
00001 /*
00002 This file is part of LIA_RAL which is a set of software based on ALIZE
00003 toolkit for speaker recognition. ALIZE toolkit is required to use LIA_RAL.
00004 
00005 LIA_RAL project is a development project was initiated by the computer
00006 science laboratory of Avignon / France (Laboratoire Informatique d'Avignon -
00007 LIA) [http://lia.univ-avignon.fr <http://lia.univ-avignon.fr/>]. Then it
00008 was supported by two national projects of the French Research Ministry:
00009         - TECHNOLANGUE program [http://www.technolangue.net]
00010         - MISTRAL program [http://mistral.univ-avignon.fr]
00011 
00012 LIA_RAL is free software: you can redistribute it and/or modify
00013 it under the terms of the GNU Lesser General Public License as
00014 published by the Free Software Foundation, either version 3 of
00015 the License, or any later version.
00016 
00017 LIA_RAL is distributed in the hope that it will be useful,
00018 but WITHOUT ANY WARRANTY; without even the implied warranty of
00019 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
00020 GNU Lesser General Public License for more details.
00021 
00022 You should have received a copy of the GNU Lesser General Public
00023 License along with LIA_RAL.
00024 If not, see [http://www.gnu.org/licenses/].
00025 
00026 The LIA team as well as the LIA_RAL project team wants to highlight the
00027 limits of voice authentication in a forensic context.
00028 The "Person Authentification by Voice: A Need of Caution" paper
00029 proposes a good overview of this point (cf. "Person
00030 Authentification by Voice: A Need of Caution", Bonastre J.F.,
00031 Bimbot F., Boe L.J., Campbell J.P., Douglas D.A., Magrin-
00032 chagnolleau I., Eurospeech 2003, Genova].
00033 The conclusion of the paper of the paper is proposed bellow:
00034 [Currently, it is not possible to completely determine whether the
00035 similarity between two recordings is due to the speaker or to other
00036 factors, especially when: (a) the speaker does not cooperate, (b) there
00037 is no control over recording equipment, (c) recording conditions are not
00038 known, (d) one does not know whether the voice was disguised and, to a
00039 lesser extent, (e) the linguistic content of the message is not
00040 controlled. Caution and judgment must be exercised when applying speaker
00041 recognition techniques, whether human or automatic, to account for these
00042 uncontrolled factors. Under more constrained or calibrated situations,
00043 or as an aid for investigative purposes, judicious application of these
00044 techniques may be suitable, provided they are not considered as infallible.
00045 At the present time, there is no scientific process that enables one to
00046 uniquely characterize a persones voice or to identify with absolute
00047 certainty an individual from his or her voice.]
00048 
00049 Copyright (C) 2004-2010
00050 Laboratoire d'informatique d'Avignon [http://lia.univ-avignon.fr]
00051 LIA_RAL admin [alize@univ-avignon.fr]
00052 Jean-Francois Bonastre [jean-francois.bonastre@univ-avignon.fr]
00053 */
00054 
00055 #include <iostream>
00056 #include "liatools.h"
00057 
00058 void getMeanNorm(RealVector <double>& norm,MixtureGD & UBM) {
00059     unsigned long mSize=UBM.getDistribCount();
00060     unsigned long vSize=UBM.getVectSize();            
00061     norm.setSize(mSize*vSize);    
00062     for (unsigned long i=0;i<mSize;i++) {
00063         DistribGD & d=UBM.getDistrib(i);
00064         double w=UBM.weight(i);
00065         for (unsigned long j=0;j<vSize;j++)
00066             norm[i*vSize+j]=sqrt(w*d.getCovInv(j)); 
00067     }
00068 }
00069 
00070 void getWeightNorm(RealVector <double>& norm,MixtureGD & UBM) {
00071     unsigned long mSize=UBM.getDistribCount();    
00072     norm.setSize(mSize);       
00073     for (unsigned long i=0;i<mSize;i++) 
00074         norm[i]=1/sqrt(UBM.weight(i));
00075 }
00076 
00077 int main(int argc, char* argv[]){
00078 
00079     ConfigChecker cc;
00080     cc.addStringParam("config", false, true, "default config filename");    
00081     cc.addBooleanParam("meanSv", true, true, "output Mean vector");
00082     cc.addBooleanParam("weightSv", true, true, "output Weight vector");    
00083     cc.addBooleanParam("normSv", true, true, "normalize vector (need UBM)");
00084     cc.addBooleanParam("vectors", false, true, "read from vectors");       
00085     try{
00086     CmdLine cmdLine(argc, argv);
00087     Config tmp;
00088     cmdLine.copyIntoConfig(tmp);
00089     Config config;
00090     if (tmp.existsParam("config")) config.load(tmp.getParam("config"));
00091     cmdLine.copyIntoConfig(config);
00092     cc.check(config);
00093     debug=config.getParam_debug();
00094     if (config.existsParam("verbose"))verbose=config.getParam("verbose").toBool();else verbose=false;
00095     if (verbose) verboseLevel=1;else verboseLevel=0;
00096     if (config.existsParam("verboseLevel"))verboseLevel=config.getParam("verboseLevel").toLong();
00097     if (verboseLevel>0) verbose=true;
00098 
00099     // Begins here
00100     bool mean=config.getParam("meanSv").toBool();
00101     bool weight=config.getParam("weightSv").toBool();
00102     if (!(weight^mean)) throw Exception("weightSv and meanSv have same value !",__FILE__,__LINE__);
00103     bool norm=config.getParam("normSv").toBool();    
00104     bool vectors=false;
00105     if (config.existsParam("vectors")) vectors=true; // read either from models or vectors
00106     bool gmm=!vectors;
00107     if (verbose) {
00108         if (mean) cout << "(modelToSv) MeanSv"<<endl;
00109         if (weight) cout << "(modelToSv) WeightSv"<<endl;
00110         if (norm) cout << "(modelToSv) NormSv: Normalizing vector with UBM model "<<endl;
00111         if (norm && !(weight||mean)) cout << "(modelToSv) NormSv: only normalize vectors" << endl;
00112         }
00113     XList inputList(config.getParam("inputFilename"));
00114     String vPath=config.getParam("vectorFilesPath");
00115     String vExt=config.getParam("vectorFilesExtension");        
00116     MixtureServer ms(config);
00117     MixtureGD UBM=ms.loadMixtureGD(config.getParam("inputWorldFilename"));
00118     RealVector <double> normVector;
00119     if (norm) {
00120         if (verbose)  cout << "(modelToSv) Compute normalisation vector"<<endl;
00121         if(mean) getMeanNorm(normVector,UBM); // do seometing better, if only want to normalize assume it's mean
00122         if (weight) getWeightNorm(normVector,UBM);     
00123         String normFile=vPath+"norm"+vExt; 
00124         if (debug ) {
00125             ((Matrix<double>)normVector).save(normFile,config);
00126             cout<<"(modelToSv) Saving normalisation vector to ["<<normFile<<"]"<<endl;
00127         }
00128     }
00129          
00130     for (unsigned long r=0;r<inputList.getLineCount();r++) {
00131             String out=vPath+inputList.getLine(r).getElement(0)+vExt;         
00132             if (verbose) cout << "(modelToSv) Processing ["<<inputList.getLine(r).getElement(0)<<"] to ["<<out<<"]"<<endl;         
00133             RealVector <double> sv;        
00134             if (gmm) { // read from models
00135                 if (verbose) cout << "(modelToSv) Read from GMM models"<<endl;
00136                 MixtureGD &curr=ms.loadMixtureGD(inputList.getLine(r).getElement(0));
00137                 if (mean) modelToSv(curr,sv);
00138                 if (weight) {
00139                     unsigned long mSize=curr.getDistribCount();
00140                     sv.setSize(mSize);        
00141                     for (unsigned long i=0;i<mSize;i++)
00142                         sv[i]=curr.weight(i);
00143                 }
00144                 ms.deleteMixture(curr);
00145                 ms.deleteUnusedDistribs();  
00146             }
00147             else if (vectors) {//read from vectors (mean and weight at false)
00148                 if (verbose) cout << "(modelToSv) Read from SV from vectors"<<endl;     
00149                 String vIExt=config.getParam("inputVectorFilesExtension"); 
00150                 String in=vPath+inputList.getLine(r).getElement(0)+vIExt;   
00151                 Matrix <double> a;
00152                 a.load(in,config);   
00153                 sv.setSize(a.cols());
00154                 for (unsigned long i=0;i<sv.size();i++)
00155                     sv[i]=a(0,i);
00156             }
00157             if(norm) {
00158                 for (unsigned long i=0;i<sv.size();i++) 
00159                     sv[i]*=normVector[i];
00160             }
00161             ((Matrix<double>)sv).save(out,config);        
00162     }
00163     return 0;
00164   }
00165   catch(alize::Exception & e){ cout <<"modelToSv"<< e.toString() << endl << cc.getParamList()<<endl;}
00166 }