ToPS
GeneralizedHiddenMarkovModel.hpp
00001 /*
00002  *       GeneralizedHiddenMarkovModel.hpp
00003  *
00004  *       Copyright 2011 Andre Yoshiaki Kashiwabara <akashiwabara@usp.br>
00005  *                      Ígor Bonádio <ibonadio@ime.usp.br>
00006  *                      Vitor Onuchic <vitoronuchic@gmail.com>
00007  *                      Alan Mitchell Durham <aland@usp.br>
00008  *
00009  *       This program is free software; you can redistribute it and/or modify
00010  *       it under the terms of the GNU  General Public License as published by
00011  *       the Free Software Foundation; either version 3 of the License, or
00012  *       (at your option) any later version.
00013  *
00014  *       This program is distributed in the hope that it will be useful,
00015  *       but WITHOUT ANY WARRANTY; without even the implied warranty of
00016  *       MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
00017  *       GNU General Public License for more details.
00018  *
00019  *       You should have received a copy of the GNU General Public License
00020  *       along with this program; if not, write to the Free Software
00021  *       Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston,
00022  *       MA 02110-1301, USA.
00023  */
00024 
00025 #ifndef GENERALIZED_HIDDEN_MARKOV_MODEL_H
00026 #define GENERALIZED_HIDDEN_MARKOV_MODEL_H
00027 
00028 #include "crossplatform.hpp"
00029 
00030 #include <set>
00031 
00032 #include "DiscreteIIDModel.hpp"
00033 #include "ProbabilisticModel.hpp"
00034 #include "Sequence.hpp"
00035 #include "Alphabet.hpp"
00036 #include "DecodableModel.hpp"
00037 #include "GHMMStates.hpp"
00038 #include "util.hpp"
00039 #include "SparseMatrix.hpp"
00040 
00041 namespace tops {
00042 
00043 
00045   class DLLEXPORT GeneralizedHiddenMarkovModel: public DecodableModel {
00046   private:
00047       Matrix _alpha;
00048       Sequence _last;
00049       DiscreteIIDModelPtr _last_state_probabilities;
00050       DiscreteIIDModelPtr _duration_state_probabilities;
00051     DiscreteIIDModelPtr _initial_probabilities;
00052     DiscreteIIDModelPtr _terminal_probabilities;
00053     GHMMStates _all_states;
00054     AlphabetPtr _state_names;
00055     int _nclasses;
00056     GHMMStates _geometric_duration_states;
00057     GHMMSignalStates _signal_states;
00058     GHMMExplicitDurationStates _explicit_duration_states;
00059     void initialize_prefix_sum_arrays(const Sequence & s) const;
00060     void buildDoubleParameterValue(DiscreteIIDModelPtr distr, ProbabilisticModelParameters & answer, const char *) const;
00061     void restore_model(std::string & model_name, const ProbabilisticModelParameters & parameters);
00062     std::map<std::string, ProbabilisticModelPtr> _models;
00063   public:
00064     GeneralizedHiddenMarkovModel() {
00065     }
00066 
00067     virtual ~GeneralizedHiddenMarkovModel() {
00068     }
00069 
00070     void fixStatesPredecessorSuccessor();
00071 
00072     virtual double inefficient_forward(const Sequence & s, Matrix &alpha) const;
00073 
00074     virtual std::string print_graph () const ;
00075 
00077     virtual double forward(const Sequence & s, Matrix &alpha) const;
00078 
00080     virtual double backward(const Sequence & s, Matrix &beta) const;
00081 
00082     virtual void posteriorProbabilitiesWithClasses (const Sequence &s, SparseMatrixPtr probabilities) const;
00083 
00084     virtual void posteriorProbabilitiesNoClasses (const Sequence &s, fMatrix &probabilities) const;
00085     void posteriorProbabilities(const Sequence &s, fMatrix &postProbs) const;
00086 
00087 
00088     float MEAPred(const Sequence &s, Sequence &path);
00089     float MEAPred(const Sequence &s, Sequence &path, SparseMatrixPtr ppPred);
00090 
00091 
00092     virtual void setNumClasses(int nclasses);
00093 
00094     virtual int getNumClasses();
00095 
00097     virtual double
00098     viterbi(const Sequence &s, Sequence &path, Matrix & gamma) const;
00099 
00101       virtual void choosePath(const Sequence &s, Sequence &path) ;
00102 
00103       virtual void initializeChoosePathAlgorithm(const Sequence &s);
00104 
00106     virtual double _viterbi(const Sequence &s, Sequence &path, Matrix & gamma) const;
00107 
00109     virtual Sequence & chooseObservation(Sequence & h, int i, int state) const;
00110 
00112     virtual int chooseState(int state) const;
00113 
00115     virtual int chooseFirstState() const;
00116 
00118     virtual DiscreteIIDModelPtr getInitialProbabilities() const {
00119       return _initial_probabilities;
00120     }
00121 
00123     virtual std::string getStateName(int state) const;
00124 
00126     virtual AlphabetPtr getStateNames() const;
00127     virtual std::string model_name() const {
00128       return "GeneralizedHiddenMarkovModel";
00129     }
00130 
00131     virtual ProbabilisticModelCreatorPtr getFactory() const;
00132     virtual std::string str() const;
00133 
00134     virtual DecodableModel * decodable() {
00135       return this;
00136     }
00137     int configureExplicitDurationState(std::string observation_model_name, DiscreteIIDModelPtr transition_distr,
00138                std::string duration_model_name, std::string state_name, int iphase, int ophase, std::vector<int> classes);
00139 
00140     int configureSignalState(std::string observation_model_name,
00141            DiscreteIIDModelPtr transition_distr,
00142            int size, std::string state_name, int iphase, int ophase, std::vector<int> classes);
00143 
00144     int configureGeometricDurationState(std::string observation_model_name,
00145                                          DiscreteIIDModelPtr transition_distr,
00146           std::string state_name, int iphase, int ophase, std::vector<int> classes);
00147     void setInitialProbability(DiscreteIIDModelPtr init);
00148     void setTerminalProbability(DiscreteIIDModelPtr term);
00149     void setObservationSymbols(AlphabetPtr obs) {
00150       setAlphabet(obs);
00151     }
00152     void setStateNames(AlphabetPtr alphabet);
00153     virtual ProbabilisticModelParameters parameters() const ;
00154     virtual void initialize(const ProbabilisticModelParameters & p) ;
00155 
00156 
00157   };
00158 
00159   typedef boost::shared_ptr<GeneralizedHiddenMarkovModel>
00160   GeneralizedHiddenMarkovModelPtr;
00161 }
00162 #endif