EigenVoice.cpp

Go to the documentation of this file.
00001 /*
00002 This file is part of LIA_RAL which is a set of software based on ALIZE
00003 toolkit for speaker recognition. ALIZE toolkit is required to use LIA_RAL.
00004 
00005 LIA_RAL project is a development project was initiated by the computer
00006 science laboratory of Avignon / France (Laboratoire Informatique d'Avignon -
00007 LIA) [http://lia.univ-avignon.fr <http://lia.univ-avignon.fr/>]. Then it
00008 was supported by two national projects of the French Research Ministry:
00009         - TECHNOLANGUE program [http://www.technolangue.net]
00010         - MISTRAL program [http://mistral.univ-avignon.fr]
00011 
00012 LIA_RAL is free software: you can redistribute it and/or modify
00013 it under the terms of the GNU Lesser General Public License as
00014 published by the Free Software Foundation, either version 3 of
00015 the License, or any later version.
00016 
00017 LIA_RAL is distributed in the hope that it will be useful,
00018 but WITHOUT ANY WARRANTY; without even the implied warranty of
00019 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
00020 GNU Lesser General Public License for more details.
00021 
00022 You should have received a copy of the GNU Lesser General Public
00023 License along with LIA_RAL.
00024 If not, see [http://www.gnu.org/licenses/].
00025 
00026 The LIA team as well as the LIA_RAL project team wants to highlight the
00027 limits of voice authentication in a forensic context.
00028 The "Person Authentification by Voice: A Need of Caution" paper
00029 proposes a good overview of this point (cf. "Person
00030 Authentification by Voice: A Need of Caution", Bonastre J.F.,
00031 Bimbot F., Boe L.J., Campbell J.P., Douglas D.A., Magrin-
00032 chagnolleau I., Eurospeech 2003, Genova].
00033 The conclusion of the paper of the paper is proposed bellow:
00034 [Currently, it is not possible to completely determine whether the
00035 similarity between two recordings is due to the speaker or to other
00036 factors, especially when: (a) the speaker does not cooperate, (b) there
00037 is no control over recording equipment, (c) recording conditions are not
00038 known, (d) one does not know whether the voice was disguised and, to a
00039 lesser extent, (e) the linguistic content of the message is not
00040 controlled. Caution and judgment must be exercised when applying speaker
00041 recognition techniques, whether human or automatic, to account for these
00042 uncontrolled factors. Under more constrained or calibrated situations,
00043 or as an aid for investigative purposes, judicious application of these
00044 techniques may be suitable, provided they are not considered as infallible.
00045 At the present time, there is no scientific process that enables one to
00046 uniquely characterize a persones voice or to identify with absolute
00047 certainty an individual from his or her voice.]
00048 
00049 Copyright (C) 2004-2010
00050 Laboratoire d'informatique d'Avignon [http://lia.univ-avignon.fr]
00051 LIA_RAL admin [alize@univ-avignon.fr]
00052 Jean-Francois Bonastre [jean-francois.bonastre@univ-avignon.fr]
00053 */
00054 
00055 
00056 #if !defined(ALIZE_EigenVoice_cpp)
00057 #define ALIZE_EigenVoice_cpp
00058 
00059 #include <iostream>
00060 #include <fstream>
00061 #include <cstdio>
00062 #include <cassert>
00063 #include <cmath>
00064 #include <liatools.h>
00065 #include "EigenVoice.h"
00066 #include "AccumulateJFAStat.h"
00067 
00068 using namespace std;
00069 using namespace alize;
00070 
00071 
00072 //-----------------------------------------------------------------------------------------------------------------------------------------------------------
00073 int EigenVoice(Config & config){
00074         
00075         cerr<<"entering Eigenvoices"<<endl;
00076 
00077         //Read the NDX file
00078         String ndxFilename = config.getParam("ndxFilename");
00079         
00080         //Create and initialise the accumulator
00081         JFAAcc jfaAcc(ndxFilename, config);
00082 
00083         //Option used to check the Likelihood at each iteration
00084         bool _checkLLK = false;
00085         if (config.existsParam("checkLLK")) _checkLLK= config.getParam("checkLLK").toBool();
00086         
00087         //Statistics
00088         if((config.existsParam("loadAccs")) && config.getParam("loadAccs").toBool()){   //load pre-computed statistics
00089                 cerr<<"load accumulators"<<endl;
00090                 jfaAcc.loadN(config);
00091                 jfaAcc.loadN_h(config);
00092                 jfaAcc.loadF_X(config);
00093                 jfaAcc.loadF_X_h(config);
00094         }
00095         else{                                                                                                                   //Compute statistics if they don't exists
00096                 jfaAcc.computeAndAccumulateJFAStat(config);
00097                 jfaAcc.saveAccs(config);
00098         }
00099         
00100         //Initialise the EV Matrix
00101         bool loadInitEigenVoiceMatrix = false;
00102         if(config.existsParam("loadInitEigenVoiceMatrix")) loadInitEigenVoiceMatrix = config.getParam("loadInitEigenVoiceMatrix").toBool();
00103         if(loadInitEigenVoiceMatrix){   //Load the EV matrix when existing
00104                 jfaAcc.loadEV(config.getParam("initEigenVoiceMatrix"), config);
00105         }
00106         else{   //Initialise the EV matrix randomly if does not exists
00107                 jfaAcc.initEV(config);
00108         }
00109         
00110         //Save the initial V matrix to be able restart the process with the same initialisation
00111         if(config.existsParam("saveInitEigenVoiceMatrix") && config.getParam("saveInitEigenVoiceMatrix").toBool()){
00112                 String initV = config.getParam("eigenVoiceMatrix")+"_init";
00113                 jfaAcc.saveV(initV, config);
00114                 cout<<" (EigenVoice) Save the initial EigenVoice Matrix in "<<initV<<endl;
00115         }
00116 
00117         //iteratively retrain the EV matrix
00118         unsigned long nbIt = config.getParam("nbIt").toULong();
00119         
00120         jfaAcc.storeAccs();
00121         for(unsigned long it=0; it<nbIt; it++){
00122                 
00123                 cout<<" (EigenVoices) --------- start iteration "<<it<<" --------"<<endl;
00124                 if (_checkLLK) jfaAcc.verifyEMLK(config);
00125                 
00126                 //On calcules les matrices vEvT
00127                 jfaAcc.estimateVEVT(config);
00128 
00129                 //On calcules les matrices L et on les inverse (on integre la boucle sur tous les locuteurs dans cette fonction)
00130                 jfaAcc.estimateAndInverseL_EV(config);
00131 
00132                 //On soustrait les statistiques du locuteur (M+DZ)*Ns pour chaque locuteur
00133                 jfaAcc.substractMplusDZ(config);
00134                 
00135                 //On soustrait pour chaque locuteur la composante canal de chaque session
00136                 jfaAcc.substractUX(config);
00137                 
00138                 //On update Y pour tous les locuteurs
00139                 jfaAcc.estimateYandV(config);
00140                 
00141                 //Update _V
00142                 jfaAcc.updateVestimate();
00143 
00144                 //Reinitialise the accumulators
00145                 jfaAcc.resetTmpAcc();
00146                 jfaAcc.restoreAccs();
00147                 
00148                 //Save the V matrix at the end of the iteration
00149                 bool saveAllEVMatrices = false;
00150                 if(config.existsParam("saveAllEVMatrices")) saveAllEVMatrices=config.getParam("saveAllEVMatrices").toBool();
00151                 if(saveAllEVMatrices){
00152                         String s;
00153                         String output = config.getParam("eigenVoiceMatrix") + s.valueOf(it);
00154                         jfaAcc.saveV(output, config);
00155                 }
00156         }
00157 
00158         cout<<" (EigenVoices) --------- save EigenVoices Matrix --------"<<endl;
00159         jfaAcc.saveV(config.getParam("eigenVoiceMatrix"), config);
00160         cout<<" (EigenVoices) --------- end of process --------"<<endl;
00161 
00162 return 0;
00163 }
00164 #endif