FeatureInputStream.h

Go to the documentation of this file.
00001 /*
00002         This file is part of ALIZE which is an open-source tool for 
00003         speaker recognition.
00004 
00005     ALIZE is free software: you can redistribute it and/or modify
00006     it under the terms of the GNU Lesser General Public License as 
00007     published by the Free Software Foundation, either version 3 of 
00008     the License, or any later version.
00009 
00010     ALIZE is distributed in the hope that it will be useful,
00011     but WITHOUT ANY WARRANTY; without even the implied warranty of
00012     MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
00013     GNU Lesser General Public License for more details.
00014 
00015     You should have received a copy of the GNU Lesser General Public 
00016     License along with ALIZE.
00017     If not, see <http://www.gnu.org/licenses/>.
00018         
00019         ALIZE is a development project initiated by the ELISA consortium
00020         [alize.univ-avignon.fr/] and funded by the French Research 
00021         Ministry in the framework of the TECHNOLANGUE program 
00022         [www.technolangue.net]
00023 
00024         The ALIZE project team wants to highlight the limits of voice
00025         authentication in a forensic context.
00026         The paper "Person Authentication by Voice: A Need for Caution"
00027         gives a good overview of this point (cf. "Person
00028         Authentication by Voice: A Need for Caution", Bonastre J.F.,
00029         Bimbot F., Boe L.J., Campbell J.P., Douglas D.A., Magrin-
00030         Chagnolleau I., Eurospeech 2003, Geneva).
00031         The conclusion of the paper is reproduced below:
00032         [Currently, it is not possible to completely determine whether the 
00033         similarity between two recordings is due to the speaker or to other 
00034         factors, especially when: (a) the speaker does not cooperate, (b) there 
00035         is no control over recording equipment, (c) recording conditions are not 
00036         known, (d) one does not know whether the voice was disguised and, to a 
00037         lesser extent, (e) the linguistic content of the message is not 
00038         controlled. Caution and judgment must be exercised when applying speaker 
00039         recognition techniques, whether human or automatic, to account for these 
00040         uncontrolled factors. Under more constrained or calibrated situations, 
00041         or as an aid for investigative purposes, judicious application of these 
00042         techniques may be suitable, provided they are not considered as infallible.
00043         At the present time, there is no scientific process that enables one to 
00044         uniquely characterize a person's voice or to identify with absolute 
00045         certainty an individual from his or her voice.]
00046         Contact Jean-Francois Bonastre for more information about the licence or
00047         the use of ALIZE
00048 
00049         Copyright (C) 2003-2010
00050         Laboratoire d'informatique d'Avignon [lia.univ-avignon.fr]
00051         ALIZE admin [alize@univ-avignon.fr]
00052         Jean-Francois Bonastre [jean-francois.bonastre@univ-avignon.fr]
00053 */
00054 
00055 #if !defined(ALIZE_FeatureInputStream_h)
00056 #define ALIZE_FeatureInputStream_h
00057 
// ALIZE_API: decoration placed on exported classes (see its use on
// FeatureInputStream below).
//   - _WIN32 with ALIZE_EXPORTS defined : __declspec(dllexport)
//   - _WIN32 without ALIZE_EXPORTS      : __declspec(dllimport)
//   - any other platform                : expands to nothing
// NOTE(review): ALIZE_EXPORTS is presumably defined only while building the
// ALIZE library itself - confirm against the build files.
00058 #if defined(_WIN32)
00059 #if defined(ALIZE_EXPORTS)
00060 #define ALIZE_API __declspec(dllexport)
00061 #else
00062 #define ALIZE_API __declspec(dllimport)
00063 #endif
00064 #else
00065 #define ALIZE_API
00066 #endif
00067 
00068 #include "Object.h"
00069 #include "FeatureFlags.h"
00070 #include "alizeString.h"
00071 
00072 namespace alize
00073 {
00074   class Feature;     // forward declaration: only used by reference in this header
00075   class LabelServer; // forward declaration: only used through a pointer in this header
00076   class Config;      // forward declaration: only used by reference/pointer in this header
00077   
00095   class ALIZE_API FeatureInputStream : public Object
00096   {
          // Abstract base class (it declares pure virtual members) for
          // objects from which Feature objects are read. Concrete streams
          // must implement every member declared "= 0" below.
          //
          // NOTE(review): the per-member documentation of the original header
          // is not present in this listing. Statements introduced by
          // "presumably" are inferred from names only and must be confirmed
          // against the implementation.
00097 
00098   public :
00099 
          // Status codes returned by getError().
          // NOTE(review): NO_ERROR is also the name of a macro in the Windows
          // SDK (winerror.h); including <windows.h> before this header would
          // presumably break this enumerator - verify on _WIN32 builds.
00100     enum Error
00101     {
00102       NO_ERROR,
            // presumably: the requested feature is no longer available in the
            // stream's history/buffer - TODO confirm.
00103       FEATURE_OUT_OF_HISTORY,
00104     };
00105     
          // Default constructor: no Config is supplied (see existsConfig()).
00106     explicit FeatureInputStream();
00107     
          // Constructs the stream from a configuration and an optional label
          // server (ls defaults to NULL).
          // NOTE(review): ownership of ls is not visible here - presumably
          // the stream does not take ownership; confirm.
00112     explicit FeatureInputStream(const Config& c, LabelServer* ls = NULL);
00113 
          // Returns the configuration as a const reference.
          // NOTE(review): the configuration is held through a pointer
          // (_pConfig), so callers should presumably check existsConfig()
          // first - confirm what happens when no configuration was given.
00114     const Config& getConfig() const;
          // Tells whether a configuration is available (see getConfig()).
00115     bool existsConfig() const;
00116 
          // Virtual destructor: derived streams can be destroyed through a
          // FeatureInputStream pointer.
00117     virtual ~FeatureInputStream();
00118 
          // Reads a feature into f. Pure virtual.
          // s defaults to 1 - presumably a step (number of features to
          // advance); the bool result presumably signals whether a feature
          // was read - TODO confirm both.
00127     virtual bool readFeature(Feature& f, unsigned long s = 1) = 0;
00128 
          // Writes the feature f. Virtual but NOT pure: a base-class
          // implementation is declared here (its definition is not in this
          // file). s defaults to 1 - presumably a step, as in readFeature().
          // NOTE(review): presumably related to _featuresAreWritable - confirm.
00137     virtual bool writeFeature(const Feature& f, unsigned long s = 1);
00138 
          // Pure virtual. presumably: rewinds the stream to its initial
          // state - TODO confirm.
00139     virtual void reset() = 0;
          // Pure virtual. presumably: releases the underlying source(s) -
          // TODO confirm.
00140     virtual void close() = 0;
00141 
00142 
          // Pure virtual. presumably: dimension of the feature vectors
          // delivered by the stream - TODO confirm.
00149     virtual unsigned long getVectSize() = 0;
00150 
          // Pure virtual. Returns the FeatureFlags of the stream by const
          // reference.
00157     virtual const FeatureFlags& getFeatureFlags() = 0;
00158 
          // Pure virtual. Returns the sample rate as a real_t (unit not
          // visible here - TODO confirm).
00165     virtual real_t getSampleRate() = 0;
00166 
          // Pure virtual. presumably: total number of features in the
          // stream, all sources included - TODO confirm.
00172     virtual unsigned long getFeatureCount() = 0;
00173 
          // Pure virtual. Requests a move to feature index pos; srcName
          // defaults to the empty string.
          // NOTE(review): presumably pos is relative to the named source when
          // srcName is not empty, and to the whole stream otherwise - confirm.
00179     virtual void seekFeature(unsigned long pos, const String& srcName = "") = 0;
00180 
          // Pure virtual. presumably: number of sources (e.g. files) behind
          // the stream - TODO confirm.
00184     virtual unsigned long getSourceCount() = 0;
00185 
          // Pure virtual. Feature count of one source, selected by index.
00190     virtual unsigned long getFeatureCountOfASource(unsigned long srcIdx) = 0;
00191 
          // Pure virtual. Feature count of one source, selected by name.
00196     virtual unsigned long getFeatureCountOfASource(const String& srcName) = 0;
00197 
          // Pure virtual. Index of the first feature of one source, selected
          // by index. presumably the index is global to the stream - confirm.
00203     virtual unsigned long getFirstFeatureIndexOfASource(unsigned long srcIdx) = 0;
00204 
          // Pure virtual. Index of the first feature of one source, selected
          // by name.
00210     virtual unsigned long getFirstFeatureIndexOfASource(const String& srcName) = 0;
00211 
          // Pure virtual. Name of the source at index srcIdx, returned by
          // const reference.
00217     virtual const String& getNameOfASource(unsigned long srcIdx) = 0;
00218 
          // Returns an Error code (see enum Error); presumably the value of
          // _error - confirm in the implementation.
00222     Error getError();
00223 
          // Pure virtual. Returns the class name as a String.
00224     virtual String getClassName() const = 0;
00225 
00226   protected :
          // State shared with derived classes.
          // Label server pointer; presumably the one passed to the
          // constructor or to init() - confirm.
00227     LabelServer*  _pLabelServer;
          // Error status; presumably what getError() reports - confirm.
00228     Error         _error;
          // presumably: a pending seek request recorded by seekFeature()
          // (flag, target index, target source name) - TODO confirm.
00229     bool          _seekWanted;
00230     unsigned long _seekWantedIdx;
00231     String        _seekWantedSrcName;
          // presumably: whether writeFeature() is permitted - TODO confirm.
00232     bool          _featuresAreWritable;
          // Initialisation helper taking the same arguments as the
          // two-argument constructor.
00233     void init(const Config& c, LabelServer* ls = NULL);
00234 
00235   private :
          // Pointer to the configuration; private, so derived classes go
          // through getConfig() / existsConfig().
00236     const Config* _pConfig;
00237   };
00238 
00239 } // end namespace alize
00240 
00241 #endif // !defined(ALIZE_FeatureInputStream_h)
00242