00001 /* 00002 This file is part of ALIZE which is an open-source tool for 00003 speaker recognition. 00004 00005 ALIZE is free software: you can redistribute it and/or modify 00006 it under the terms of the GNU Lesser General Public License as 00007 published by the Free Software Foundation, either version 3 of 00008 the License, or any later version. 00009 00010 ALIZE is distributed in the hope that it will be useful, 00011 but WITHOUT ANY WARRANTY; without even the implied warranty of 00012 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the 00013 GNU Lesser General Public License for more details. 00014 00015 You should have received a copy of the GNU Lesser General Public 00016 License along with ALIZE. 00017 If not, see <http://www.gnu.org/licenses/>. 00018 00019 ALIZE is a development project initiated by the ELISA consortium 00020 [alize.univ-avignon.fr/] and funded by the French Research 00021 Ministry in the framework of the TECHNOLANGUE program 00022 [www.technolangue.net] 00023 00024 The ALIZE project team wants to highlight the limits of voice 00025 authentication in a forensic context. 00026 The "Person Authentification by Voice: A Need of Caution" paper 00027 proposes a good overview of this point (cf. "Person 00028 Authentification by Voice: A Need of Caution", Bonastre J.F., 00029 Bimbot F., Boe L.J., Campbell J.P., Douglas D.A., Magrin- 00030 chagnolleau I., Eurospeech 2003, Genova]. 00031 The conclusion of the paper of the paper is proposed bellow: 00032 [Currently, it is not possible to completely determine whether the 00033 similarity between two recordings is due to the speaker or to other 00034 factors, especially when: (a) the speaker does not cooperate, (b) there 00035 is no control over recording equipment, (c) recording conditions are not 00036 known, (d) one does not know whether the voice was disguised and, to a 00037 lesser extent, (e) the linguistic content of the message is not 00038 controlled. Caution and judgment must be exercised when applying speaker 00039 recognition techniques, whether human or automatic, to account for these 00040 uncontrolled factors. Under more constrained or calibrated situations, 00041 or as an aid for investigative purposes, judicious application of these 00042 techniques may be suitable, provided they are not considered as infallible. 00043 At the present time, there is no scientific process that enables one to 00044 uniquely characterize a person=92s voice or to identify with absolute 00045 certainty an individual from his or her voice.] 00046 Contact Jean-Francois Bonastre for more information about the licence or 00047 the use of ALIZE 00048 00049 Copyright (C) 2003-2010 00050 Laboratoire d'informatique d'Avignon [lia.univ-avignon.fr] 00051 ALIZE admin [alize@univ-avignon.fr] 00052 Jean-Francois Bonastre [jean-francois.bonastre@univ-avignon.fr] 00053 */ 00054 00055 #if !defined(ALIZE_AudioFileReader_h) 00056 #define ALIZE_AudioFileReader_h 00057 00058 #if defined(_WIN32) 00059 #if defined(ALIZE_EXPORTS) 00060 #define ALIZE_API __declspec(dllexport) 00061 #else 00062 #define ALIZE_API __declspec(dllimport) 00063 #endif 00064 #else 00065 #define ALIZE_API 00066 #endif 00067 00068 #include "AudioInputStream.h" 00069 00070 namespace alize 00071 { 00072 class AudioFrame; 00073 class Config; 00074 class FileReader; 00075 00083 class ALIZE_API AudioFileReader : public AudioInputStream 00084 { 00085 friend class TestAudioFileReader; 00086 00087 public : 00088 00094 explicit AudioFileReader(const FileName& f, const Config& c, 00095 BigEndian be = BIGENDIAN_AUTO); 00096 static AudioFileReader& create(const FileName& f, const Config& c, 00097 BigEndian be = BIGENDIAN_AUTO); 00098 virtual ~AudioFileReader(); 00099 virtual bool readFrame(AudioFrame& f); 00100 virtual void seekFrame(unsigned long pos); 00101 00105 virtual void reset(); 00106 00109 virtual void close(); 00110 00114 unsigned long getFrameCount(); 00115 00119 virtual unsigned long getChannelCount(); 00120 00124 virtual unsigned long getSampleBytes(); 00125 00129 virtual real_t getFrameRate(); 00130 00134 virtual unsigned long getSourceCount(); 00135 00136 virtual String getClassName() const; 00137 String toString() const; 00138 00139 private : 00140 00141 String getPath(const FileName&, const Config&) const; 00142 String getExt(const FileName&, const Config&) const; 00143 unsigned long getChannel(const Config&) const; 00144 bool getBigEndian(const Config&, BigEndian) const; 00145 void readParams(); 00146 unsigned long getHeaderLength(); 00147 00148 FileReader* _pReader; 00149 unsigned long _frameCount; 00150 unsigned long _frameIndex; 00151 unsigned long _headerLength; 00152 unsigned long _channelCount; 00153 unsigned long _sampleBytes; 00154 real_t _frameRate; 00155 bool _paramDefined; 00156 bool _seekWanted; 00157 unsigned long _seekWantedIdx; 00158 }; 00159 00160 } // end namespace alize 00161 00162 #endif // !defined(ALIZE_AudioFileReader_h) 00163
1.7.2