EnergyDetectorMain.cpp

Go to the documentation of this file.
00001 /*
00002 This file is part of LIA_RAL which is a set of software based on ALIZE
00003 toolkit for speaker recognition. ALIZE toolkit is required to use LIA_RAL.
00004 
00005 LIA_RAL project is a development project was initiated by the computer
00006 science laboratory of Avignon / France (Laboratoire Informatique d'Avignon -
00007 LIA) [http://lia.univ-avignon.fr <http://lia.univ-avignon.fr/>]. Then it
00008 was supported by two national projects of the French Research Ministry:
00009         - TECHNOLANGUE program [http://www.technolangue.net]
00010         - MISTRAL program [http://mistral.univ-avignon.fr]
00011 
00012 LIA_RAL is free software: you can redistribute it and/or modify
00013 it under the terms of the GNU Lesser General Public License as
00014 published by the Free Software Foundation, either version 3 of
00015 the License, or any later version.
00016 
00017 LIA_RAL is distributed in the hope that it will be useful,
00018 but WITHOUT ANY WARRANTY; without even the implied warranty of
00019 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
00020 GNU Lesser General Public License for more details.
00021 
00022 You should have received a copy of the GNU Lesser General Public
00023 License along with LIA_RAL.
00024 If not, see [http://www.gnu.org/licenses/].
00025 
00026 The LIA team as well as the LIA_RAL project team wants to highlight the
00027 limits of voice authentication in a forensic context.
00028 The "Person Authentification by Voice: A Need of Caution" paper
00029 proposes a good overview of this point (cf. "Person
00030 Authentification by Voice: A Need of Caution", Bonastre J.F.,
00031 Bimbot F., Boe L.J., Campbell J.P., Douglas D.A., Magrin-
00032 chagnolleau I., Eurospeech 2003, Genova].
00033 The conclusion of the paper of the paper is proposed bellow:
00034 [Currently, it is not possible to completely determine whether the
00035 similarity between two recordings is due to the speaker or to other
00036 factors, especially when: (a) the speaker does not cooperate, (b) there
00037 is no control over recording equipment, (c) recording conditions are not
00038 known, (d) one does not know whether the voice was disguised and, to a
00039 lesser extent, (e) the linguistic content of the message is not
00040 controlled. Caution and judgment must be exercised when applying speaker
00041 recognition techniques, whether human or automatic, to account for these
00042 uncontrolled factors. Under more constrained or calibrated situations,
00043 or as an aid for investigative purposes, judicious application of these
00044 techniques may be suitable, provided they are not considered as infallible.
00045 At the present time, there is no scientific process that enables one to
00046 uniquely characterize a persones voice or to identify with absolute
00047 certainty an individual from his or her voice.]
00048 
00049 Copyright (C) 2004-2010
00050 Laboratoire d'informatique d'Avignon [http://lia.univ-avignon.fr]
00051 LIA_RAL admin [alize@univ-avignon.fr]
00052 Jean-Francois Bonastre [jean-francois.bonastre@univ-avignon.fr]
00053 */
00054 
00055 #include <liatools.h>
00056 #include "alize.h"
00057 #include "EnergyDetector.h"
00058 
00059 //---------------------------------------------------------------------------------------------------------------
00060 // Energy detector
00061 // Input : Xlist        Format: File1 File2 on separate or same lines
00062 
00063 int main (int argc, char *argv[])
00064 {
00065   using namespace std;
00066   using namespace alize;
00067 
00068     ConfigChecker cc;
00069     cc.addStringParam("config", false, true, "default config filename");
00070     cc.addStringParam("inputFeatureFilename",true,true,"input feature - could be a simple feature file or a list of filename");
00071     cc.addStringParam("labelFilesPath",false,true,"path of input and output labels");
00072     cc.addStringParam("saveLabelFileExtension",true,true,"output labelFile extension");
00073     cc.addStringParam("labelOutputFrames",true,true,"output label tag");
00074     cc.addFloatParam("alpha",true,true,"threshold giving the percentage of data of the middle Gaussian to take into account");
00075     cc.addStringParam("segmentalMode",true,true,"file to have a file by file behaviour");
00076 
00077     // gestion du thresholdMode obligatoire
00078     cc.addStringParam("thresholdMode",true,true,"this parameter must be set to select 3 top gaussian. It's a default parameter");
00079 
00080   try
00081   {
00082     CmdLine cmdLine (argc, argv);
00083     if (cmdLine.displayHelpRequired ()){        // --help
00084         cout << "************************************" << endl;
00085         cout << "********** EnergyDetector.exe *********" << endl;
00086         cout << "************************************" << endl;
00087         cout << endl;
00088         cout << "Speech/Non Speech Detector." << endl;
00089         cout<<cc.getParamList()<<endl;
00090       }
00091     else if (cmdLine.displayVersionRequired ())
00092       cout << "Version 2beta" << endl;
00093     else{
00094       // copy parameters from command line into config
00095       Config tmp;
00096       cmdLine.copyIntoConfig (tmp);
00097       Config config;
00098       if (tmp.existsParam("config")) config.load(tmp.getParam("config"));
00099       cmdLine.copyIntoConfig(config);
00100       cc.check(config);
00101       debug=config.getParam_debug();
00102       if (config.existsParam("verbose")) verbose=config.getParam("verbose").toBool();
00103       else verbose=false;
00104       if (verbose) verboseLevel=1;else verboseLevel=0;
00105       if (config.existsParam("verboseLevel"))verboseLevel=config.getParam("verboseLevel").toLong();
00106       if (verboseLevel>0) verbose=true;
00107               
00108         bool energy=true;
00109         if (config.existsParam("turnDetection")) energy=false;                 // choice between energy detection or GLR turn detection
00110         String inputFeatureFileName =config.getParam("inputFeatureFilename");  // input feature - could be a simple feature file or a list of filename
00111         String extOutput=".lbl";                                               // the extension of the output files    
00112         if (config.existsParam("saveLabelFileExtension")) extOutput=config.getParam("saveLabelFileExtension");   
00113         String pathOutput="./";                                                // the path of the output files    
00114         if (config.existsParam("labelFilesPath")) pathOutput=config.getParam("labelFilesPath");
00115         XLine inputFeatureFileNameList;                                        // The (feature) input filename list - list of files to process
00116             try{                                            
00117               XList inputFileNameXList(inputFeatureFileName,config);               // Read the filename list file if it is really a list
00118               inputFeatureFileNameList=inputFileNameXList.getAllElements();        // And put the filename in a list if the file is a list of feature filenames
00119             }
00120             catch(FileNotFoundException& e){                                       // It was a simple feature file and not a filename list
00121               inputFeatureFileNameList.addElement(inputFeatureFileName);           // add the filename in the list
00122             }
00123       String *file;
00124       while ((file=inputFeatureFileNameList.getElement())!= NULL){         // Loop on each feature file
00125         String & fileName=*file;                                           // current input file basename 
00126         SegServer segServer;                                               // Create the segment server for dealing with selected/unselected segments
00127         if (energy){                                                       // The energy detector
00128           SegCluster &outputSeg=energyDetector(config,segServer,fileName); 
00129           outputLabelFile(outputSeg,pathOutput+fileName+extOutput,config); 
00130         }
00131       }                                                                    // end of file loop
00132     }
00133   }
00134   catch (alize::Exception & e) {cout << e.toString () << endl << cc.getParamList() << endl;}
00135 return 0;
00136 }
00137