ViterbiAccum.h

Go to the documentation of this file.
00001 /*
00002         This file is part of ALIZE which is an open-source tool for 
00003         speaker recognition.
00004 
00005     ALIZE is free software: you can redistribute it and/or modify
00006     it under the terms of the GNU Lesser General Public License as 
00007     published by the Free Software Foundation, either version 3 of 
00008     the License, or any later version.
00009 
00010     ALIZE is distributed in the hope that it will be useful,
00011     but WITHOUT ANY WARRANTY; without even the implied warranty of
00012     MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
00013     GNU Lesser General Public License for more details.
00014 
00015     You should have received a copy of the GNU Lesser General Public 
00016     License along with ALIZE.
00017     If not, see <http://www.gnu.org/licenses/>.
00018         
00019         ALIZE is a development project initiated by the ELISA consortium
00020         [alize.univ-avignon.fr/] and funded by the French Research 
00021         Ministry in the framework of the TECHNOLANGUE program 
00022         [www.technolangue.net]
00023 
00024         The ALIZE project team wants to highlight the limits of voice
00025         authentication in a forensic context.
00026         The "Person  Authentification by Voice: A Need of Caution" paper 
00027         proposes a good overview of this point (cf. "Person  
00028         Authentification by Voice: A Need of Caution", Bonastre J.F., 
00029         Bimbot F., Boe L.J., Campbell J.P., Douglas D.A., Magrin-
00030         chagnolleau I., Eurospeech 2003, Genova].
00031         The conclusion of the paper of the paper is proposed bellow:
00032         [Currently, it is not possible to completely determine whether the 
00033         similarity between two recordings is due to the speaker or to other 
00034         factors, especially when: (a) the speaker does not cooperate, (b) there 
00035         is no control over recording equipment, (c) recording conditions are not 
00036         known, (d) one does not know whether the voice was disguised and, to a 
00037         lesser extent, (e) the linguistic content of the message is not 
00038         controlled. Caution and judgment must be exercised when applying speaker 
00039         recognition techniques, whether human or automatic, to account for these 
00040         uncontrolled factors. Under more constrained or calibrated situations, 
00041         or as an aid for investigative purposes, judicious application of these 
00042         techniques may be suitable, provided they are not considered as infallible.
00043         At the present time, there is no scientific process that enables one to 
00044         uniquely characterize a person=92s voice or to identify with absolute 
00045         certainty an individual from his or her voice.]
00046         Contact Jean-Francois Bonastre for more information about the licence or
00047         the use of ALIZE
00048 
00049         Copyright (C) 2003-2010
00050         Laboratoire d'informatique d'Avignon [lia.univ-avignon.fr]
00051         ALIZE admin [alize@univ-avignon.fr]
00052         Jean-Francois Bonastre [jean-francois.bonastre@univ-avignon.fr]
00053 */
00054 
00055 #if !defined(ALIZE_ViterbiAccum_h)
00056 #define ALIZE_ViterbiAccum_h
00057 
00058 #if defined(_WIN32)
00059 #if defined(ALIZE_EXPORTS)
00060 #define ALIZE_API __declspec(dllexport)
00061 #else
00062 #define ALIZE_API __declspec(dllimport)
00063 #endif
00064 #else
00065 #define ALIZE_API
00066 #endif
00067 
00068 #include "Object.h"
00069 #include "RefVector.h"
00070 #include "ULongVector.h"
00071 #include "RealVector.h"
00072 #include "FeatureServer.h"
00073 #include <iostream>
00074 
00075 
00076 namespace alize
00077 {
00078     class Mixture;
00079     class Config;
00080     class Feature;
00081     class StatServer;
00082 
00095     class ALIZE_API ViterbiAccum : public Object
00096     {
00097         friend class TestViterbiAccum;
00098 
00099     public :
00100 
00101 
00105         void addState(Mixture& m);
00106 
00113         real_t& logTransition(unsigned long i1, unsigned long i2);
00114         real_t logTransition(unsigned long i1, unsigned long i2) const;
00115 
00121         Mixture& getState(unsigned long i) const;
00122 
00126         unsigned long getStateCount() const;
00127 
00128         // -----------
00129         // Computation
00130         // -----------
00131 
00134         void reset();
00135 
00141               void computeAndAccumulate(const Feature& f, double llkW = 0);
00142         
00146               void computeAndAccumulate(FeatureServer& fs,
00147                      unsigned long start, unsigned long count, double fudge);
00148         
00152         void computeAndAccumulate(FeatureServer& fs, DoubleVector& llk,
00153                                    unsigned long start, unsigned long count);
00154         
00158         void computeAndAccumulate(const Feature& f, double fudge,
00159                                                             double penality);
00160 
00163         unsigned long getFeatureCount() const;
00164 
00165         // -------
00166         // Results
00167         // -------
00168         
00172         const ULongVector& getPath();
00173 
00178         real_t getLlp() const;
00179 
00180         virtual String getClassName() const;
00181         virtual String toString() const;
00182 
00183         // inaccessible for user
00184         static ViterbiAccum& create(StatServer&, const Config&, const K&);
00185         virtual ~ViterbiAccum();
00186 
00187     private :
00188 
00189         const Config*      _pConfig;
00190 
00191         RefVector<Mixture> _stateVect;
00192         DoubleVector       _transMatrix;
00193 
00194         DoubleVector       _llpVect;
00195         DoubleVector       _tmpLLKVect;
00196         DoubleVector       _tmpllpVect;
00197         ULongVector        _tmpTab;
00198         unsigned long      _featureCount;
00199 
00200         ULongVector        _path;
00201         bool               _pathDefined;
00202         real_t             _llp;
00203         bool               _llpDefined;
00204         StatServer*        _pStatServer;
00205 
00206         lk_t computeStateLLK(unsigned long stateIndex, const Feature&) const;
00207         ViterbiAccum(StatServer&, const Config&);
00208         ViterbiAccum(const ViterbiAccum&);            
00209         const ViterbiAccum& operator=(const ViterbiAccum& c);
00211         bool operator==(const ViterbiAccum& c) const; 
00212         bool operator!=(const ViterbiAccum& c) const; 
00213     };   
00214 
00215 } // end namespace alize
00216 
00217 #endif // !defined(ALIZE_ViterbiAccum_h)