00001 /* 00002 This file is part of LIA_RAL which is a set of software based on ALIZE 00003 toolkit for speaker recognition. ALIZE toolkit is required to use LIA_RAL. 00004 00005 LIA_RAL project is a development project was initiated by the computer 00006 science laboratory of Avignon / France (Laboratoire Informatique d'Avignon - 00007 LIA) [http://lia.univ-avignon.fr <http://lia.univ-avignon.fr/>]. Then it 00008 was supported by two national projects of the French Research Ministry: 00009 - TECHNOLANGUE program [http://www.technolangue.net] 00010 - MISTRAL program [http://mistral.univ-avignon.fr] 00011 00012 LIA_RAL is free software: you can redistribute it and/or modify 00013 it under the terms of the GNU Lesser General Public License as 00014 published by the Free Software Foundation, either version 3 of 00015 the License, or any later version. 00016 00017 LIA_RAL is distributed in the hope that it will be useful, 00018 but WITHOUT ANY WARRANTY; without even the implied warranty of 00019 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the 00020 GNU Lesser General Public License for more details. 00021 00022 You should have received a copy of the GNU Lesser General Public 00023 License along with LIA_RAL. 00024 If not, see [http://www.gnu.org/licenses/]. 00025 00026 The LIA team as well as the LIA_RAL project team wants to highlight the 00027 limits of voice authentication in a forensic context. 00028 The "Person Authentification by Voice: A Need of Caution" paper 00029 proposes a good overview of this point (cf. "Person 00030 Authentification by Voice: A Need of Caution", Bonastre J.F., 00031 Bimbot F., Boe L.J., Campbell J.P., Douglas D.A., Magrin- 00032 chagnolleau I., Eurospeech 2003, Genova]. 00033 The conclusion of the paper of the paper is proposed bellow: 00034 [Currently, it is not possible to completely determine whether the 00035 similarity between two recordings is due to the speaker or to other 00036 factors, especially when: (a) the speaker does not cooperate, (b) there 00037 is no control over recording equipment, (c) recording conditions are not 00038 known, (d) one does not know whether the voice was disguised and, to a 00039 lesser extent, (e) the linguistic content of the message is not 00040 controlled. Caution and judgment must be exercised when applying speaker 00041 recognition techniques, whether human or automatic, to account for these 00042 uncontrolled factors. Under more constrained or calibrated situations, 00043 or as an aid for investigative purposes, judicious application of these 00044 techniques may be suitable, provided they are not considered as infallible. 00045 At the present time, there is no scientific process that enables one to 00046 uniquely characterize a persones voice or to identify with absolute 00047 certainty an individual from his or her voice.] 00048 00049 Copyright (C) 2004-2010 00050 Laboratoire d'informatique d'Avignon [http://lia.univ-avignon.fr] 00051 LIA_RAL admin [alize@univ-avignon.fr] 00052 Jean-Francois Bonastre [jean-francois.bonastre@univ-avignon.fr] 00053 */ 00054 00055 00056 #if !defined(ALIZE_EigenVoice_cpp) 00057 #define ALIZE_EigenVoice_cpp 00058 00059 #include <iostream> 00060 #include <fstream> 00061 #include <cstdio> 00062 #include <cassert> 00063 #include <cmath> 00064 #include <liatools.h> 00065 #include "EigenVoice.h" 00066 #include "AccumulateJFAStat.h" 00067 00068 using namespace std; 00069 using namespace alize; 00070 00071 00072 //----------------------------------------------------------------------------------------------------------------------------------------------------------- 00073 int EigenVoice(Config & config){ 00074 00075 cerr<<"entering Eigenvoices"<<endl; 00076 00077 //Read the NDX file 00078 String ndxFilename = config.getParam("ndxFilename"); 00079 00080 //Create and initialise the accumulator 00081 JFAAcc jfaAcc(ndxFilename, config); 00082 00083 //Option used to check the Likelihood at each iteration 00084 bool _checkLLK = false; 00085 if (config.existsParam("checkLLK")) _checkLLK= config.getParam("checkLLK").toBool(); 00086 00087 //Statistics 00088 if((config.existsParam("loadAccs")) && config.getParam("loadAccs").toBool()){ //load pre-computed statistics 00089 cerr<<"load accumulators"<<endl; 00090 jfaAcc.loadN(config); 00091 jfaAcc.loadN_h(config); 00092 jfaAcc.loadF_X(config); 00093 jfaAcc.loadF_X_h(config); 00094 } 00095 else{ //Compute statistics if they don't exists 00096 jfaAcc.computeAndAccumulateJFAStat(config); 00097 jfaAcc.saveAccs(config); 00098 } 00099 00100 //Initialise the EV Matrix 00101 bool loadInitEigenVoiceMatrix = false; 00102 if(config.existsParam("loadInitEigenVoiceMatrix")) loadInitEigenVoiceMatrix = config.getParam("loadInitEigenVoiceMatrix").toBool(); 00103 if(loadInitEigenVoiceMatrix){ //Load the EV matrix when existing 00104 jfaAcc.loadEV(config.getParam("initEigenVoiceMatrix"), config); 00105 } 00106 else{ //Initialise the EV matrix randomly if does not exists 00107 jfaAcc.initEV(config); 00108 } 00109 00110 //Save the initial V matrix to be able restart the process with the same initialisation 00111 if(config.existsParam("saveInitEigenVoiceMatrix") && config.getParam("saveInitEigenVoiceMatrix").toBool()){ 00112 String initV = config.getParam("eigenVoiceMatrix")+"_init"; 00113 jfaAcc.saveV(initV, config); 00114 cout<<" (EigenVoice) Save the initial EigenVoice Matrix in "<<initV<<endl; 00115 } 00116 00117 //iteratively retrain the EV matrix 00118 unsigned long nbIt = config.getParam("nbIt").toULong(); 00119 00120 jfaAcc.storeAccs(); 00121 for(unsigned long it=0; it<nbIt; it++){ 00122 00123 cout<<" (EigenVoices) --------- start iteration "<<it<<" --------"<<endl; 00124 if (_checkLLK) jfaAcc.verifyEMLK(config); 00125 00126 //On calcules les matrices vEvT 00127 jfaAcc.estimateVEVT(config); 00128 00129 //On calcules les matrices L et on les inverse (on integre la boucle sur tous les locuteurs dans cette fonction) 00130 jfaAcc.estimateAndInverseL_EV(config); 00131 00132 //On soustrait les statistiques du locuteur (M+DZ)*Ns pour chaque locuteur 00133 jfaAcc.substractMplusDZ(config); 00134 00135 //On soustrait pour chaque locuteur la composante canal de chaque session 00136 jfaAcc.substractUX(config); 00137 00138 //On update Y pour tous les locuteurs 00139 jfaAcc.estimateYandV(config); 00140 00141 //Update _V 00142 jfaAcc.updateVestimate(); 00143 00144 //Reinitialise the accumulators 00145 jfaAcc.resetTmpAcc(); 00146 jfaAcc.restoreAccs(); 00147 00148 //Save the V matrix at the end of the iteration 00149 bool saveAllEVMatrices = false; 00150 if(config.existsParam("saveAllEVMatrices")) saveAllEVMatrices=config.getParam("saveAllEVMatrices").toBool(); 00151 if(saveAllEVMatrices){ 00152 String s; 00153 String output = config.getParam("eigenVoiceMatrix") + s.valueOf(it); 00154 jfaAcc.saveV(output, config); 00155 } 00156 } 00157 00158 cout<<" (EigenVoices) --------- save EigenVoices Matrix --------"<<endl; 00159 jfaAcc.saveV(config.getParam("eigenVoiceMatrix"), config); 00160 cout<<" (EigenVoices) --------- end of process --------"<<endl; 00161 00162 return 0; 00163 } 00164 #endif
1.7.2