FeatureFileReaderSingle.h

Go to the documentation of this file.
00001 /*
00002         This file is part of ALIZE which is an open-source tool for 
00003         speaker recognition.
00004 
00005     ALIZE is free software: you can redistribute it and/or modify
00006     it under the terms of the GNU Lesser General Public License as 
00007     published by the Free Software Foundation, either version 3 of 
00008     the License, or any later version.
00009 
00010     ALIZE is distributed in the hope that it will be useful,
00011     but WITHOUT ANY WARRANTY; without even the implied warranty of
00012     MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
00013     GNU Lesser General Public License for more details.
00014 
00015     You should have received a copy of the GNU Lesser General Public 
00016     License along with ALIZE.
00017     If not, see <http://www.gnu.org/licenses/>.
00018         
00019         ALIZE is a development project initiated by the ELISA consortium
00020         [alize.univ-avignon.fr/] and funded by the French Research 
00021         Ministry in the framework of the TECHNOLANGUE program 
00022         [www.technolangue.net]
00023 
00024         The ALIZE project team wants to highlight the limits of voice
00025         authentication in a forensic context.
00026         The "Person  Authentification by Voice: A Need of Caution" paper 
00027         proposes a good overview of this point (cf. "Person  
00028         Authentification by Voice: A Need of Caution", Bonastre J.F., 
00029         Bimbot F., Boe L.J., Campbell J.P., Douglas D.A., Magrin-
00030         Chagnolleau I., Eurospeech 2003, Geneva).
00031         The conclusion of the paper is reproduced below:
00032         [Currently, it is not possible to completely determine whether the 
00033         similarity between two recordings is due to the speaker or to other 
00034         factors, especially when: (a) the speaker does not cooperate, (b) there 
00035         is no control over recording equipment, (c) recording conditions are not 
00036         known, (d) one does not know whether the voice was disguised and, to a 
00037         lesser extent, (e) the linguistic content of the message is not 
00038         controlled. Caution and judgment must be exercised when applying speaker 
00039         recognition techniques, whether human or automatic, to account for these 
00040         uncontrolled factors. Under more constrained or calibrated situations, 
00041         or as an aid for investigative purposes, judicious application of these 
00042         techniques may be suitable, provided they are not considered as infallible.
00043         At the present time, there is no scientific process that enables one to 
00044         uniquely characterize a person's voice or to identify with absolute 
00045         certainty an individual from his or her voice.]
00046         Contact Jean-Francois Bonastre for more information about the licence or
00047         the use of ALIZE
00048 
00049         Copyright (C) 2003-2010
00050         Laboratoire d'informatique d'Avignon [lia.univ-avignon.fr]
00051         ALIZE admin [alize@univ-avignon.fr]
00052         Jean-Francois Bonastre [jean-francois.bonastre@univ-avignon.fr]
00053 */
00054 
00055 #if !defined(ALIZE_FeatureFileReaderSingle_h)
00056 #define ALIZE_FeatureFileReaderSingle_h
00057 
00058 #if defined(_WIN32) // ALIZE_API: decoration placed on exported class declarations in this header
00059 #if defined(ALIZE_EXPORTS) // presumably defined only while building the ALIZE library itself - confirm in the build files
00060 #define ALIZE_API __declspec(dllexport)
00061 #else // ALIZE_EXPORTS not defined: declarations are marked as imported from the DLL
00062 #define ALIZE_API __declspec(dllimport)
00063 #endif
00064 #else // not _WIN32: ALIZE_API expands to nothing
00065 #define ALIZE_API
00066 #endif
00067 
00068 #include "FeatureFileReaderAbstract.h"
00069 #include "Feature.h"
00070 #include "RealVector.h"
00071 
00072 namespace alize
00073 {
00074   class Config; // forward declaration: only used as `const Config&` in this header
00075   class FileReader; // forward declaration: only used as `FileReader*` in this header
00076   
00081 
00082   class ALIZE_API FeatureFileReaderSingle : public FeatureFileReaderAbstract
00083   {
        // Feature file reader derived from FeatureFileReaderAbstract and
        // exported through ALIZE_API.
        // NOTE(review): the name suggests it handles one single feature file
        // (as opposed to a list of files) - confirm against the implementation.
        // This listing only shows declarations; the behaviour of every member
        // function lives in the corresponding .cpp file.

00084     friend class TestFeatureFileReader; // gives this class access to protected/private members (presumably the unit test)
00085 
00086   public :
00087 
          // Constructor. Only bufferSize and historicSize are named here; the
          // role of the other arguments must be read from the implementation.
          // NOTE(review): ownership of the FileReader*, FeatureInputStream*
          // and LabelServer* arguments is not visible in this header - confirm
          // who deletes them before changing lifetime handling.
00088     FeatureFileReaderSingle(FileReader*, FeatureInputStream*, 
00089           const Config&, LabelServer*, BufferUsage, unsigned long bufferSize,
00090           HistoricUsage, unsigned long historicSize);
00091     virtual ~FeatureFileReaderSingle();
00092 
00095     virtual void close();
00096 
          // Feature access. `step` defaults to 1 in both functions.
          // NOTE(review): the meaning of the bool result (success / end of
          // data) is not stated in this header - confirm in the .cpp.
00097     virtual bool readFeature(Feature&, unsigned long step = 1);
00098     virtual bool writeFeature(const Feature& f, unsigned long step = 1);

          // Source queries. Each per-source query is overloaded so a source
          // can be designated either by index (srcIdx) or by name (srcName).
00099     virtual unsigned long getSourceCount();
00100     virtual unsigned long getFeatureCountOfASource(unsigned long srcIdx);
00101     virtual unsigned long getFeatureCountOfASource(const String& srcName);
00102     virtual unsigned long getFirstFeatureIndexOfASource(unsigned long srcIdx);
00103     virtual unsigned long getFirstFeatureIndexOfASource(const String& srcName);
00104     virtual const String& getNameOfASource(unsigned long srcIdx); // returns a reference, not a copy
00105 
00106     virtual void setExternalBufferToUse(FloatVector& v); // presumably makes the reader use `v` instead of its own buffer - TODO confirm
00107     
00108     virtual String toString() const;
00109 
00110   protected :
00111 
00112     FileReader*     _pReader;
00113     FeatureInputStream* _pFeatureInputStream; // useful to read audio file
00114     Feature*        _pFeature;
          // NOTE(review): the next fields look like values describing the
          // feature file (header size, number of features, vector size, flags,
          // sample rate) - confirm where they are filled in.
00115     unsigned long   _headerLength;
00116     unsigned long   _featureCount;
00117     unsigned long   _vectSize;
00118     FeatureFlags    _flags;
00119     real_t          _sampleRate;
00120     unsigned long   _featureIndex;
00121     unsigned long   _lastFeatureIndex;
00122     // feature buffer
00123     unsigned long   _featureIndexOfBuffer;
00124     unsigned long   _nbStored;
00125     FloatVector*    _pBuffer;
00126     Feature         _f;
00127 
          // Const helpers that take the Config (and a FileName or BigEndian
          // value) and return a String / bool; how the result is derived is
          // not visible in this header.
00128     String getPath(const FileName&, const Config&) const;
00129     String getExt(const FileName&, const Config&) const;
00130     bool getBigEndian(const Config&, BigEndian) const;
00131 
00132   private :
00133 
00134     virtual unsigned long getHeaderLength(); // private but virtual
00135     bool featureWantedIsInHistoric() const; // const query; "historic" presumably relates to the HistoricUsage/historicSize constructor arguments - confirm
00136   };
00137 
00138 } // end namespace alize
00139 
00140 #endif // !defined(ALIZE_FeatureFileReaderSingle_h)
00141