diff options
Diffstat (limited to 'GIZA++-v2/hmm.h')
-rw-r--r-- | GIZA++-v2/hmm.h | 88 |
1 files changed, 88 insertions, 0 deletions
diff --git a/GIZA++-v2/hmm.h b/GIZA++-v2/hmm.h new file mode 100644 index 0000000..d4f3301 --- /dev/null +++ b/GIZA++-v2/hmm.h @@ -0,0 +1,88 @@ +/* + +EGYPT Toolkit for Statistical Machine Translation +Written by Yaser Al-Onaizan, Jan Curin, Michael Jahr, Kevin Knight, John Lafferty, Dan Melamed, David Purdy, Franz Och, Noah Smith, and David Yarowsky. + +This program is free software; you can redistribute it and/or +modify it under the terms of the GNU General Public License +as published by the Free Software Foundation; either version 2 +of the License, or (at your option) any later version. + +This program is distributed in the hope that it will be useful, +but WITHOUT ANY WARRANTY; without even the implied warranty of +MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +GNU General Public License for more details. + +You should have received a copy of the GNU General Public License +along with this program; if not, write to the Free Software +Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, +USA. + +*/ +#ifndef _hmm_h +#define _hmm_h 1 + +#include <assert.h> + +#include <iostream> +#include <algorithm> +#include <functional> +#include <map> +#include <set> +#include "Vector.h" +#include <utility> + +#if __GNUC__>2 +#include <ext/hash_map> +using __gnu_cxx::hash_map; +#else +#include <hash_map> +#endif +#include <fstream.h> +#include <math.h> +#include <time.h> + +#include "TTables.h" +#include "ATables.h" +#include "getSentence.h" +#include "defs.h" +#include "model2.h" +#include "Perplexity.h" +#include "vocab.h" +#include "WordClasses.h" +#include "HMMTables.h" +#include "ForwardBackward.h" + +class hmm : public model2 +{ + private: + WordClasses ewordclasses; + WordClasses fwordclasses; + HMMTables<int,WordClasses> counts,probs; + public: + template<class MAPPER> + void makeWordClasses(const MAPPER&m1,const MAPPER&m2,string efile,string ffile) + { + ifstream estrm(efile.c_str()),fstrm(ffile.c_str()); + if( !estrm ) + { + cerr << "ERROR: can not read " << efile << endl; + } + else + ewordclasses.read(estrm,m1); + if( !fstrm ) + cerr << "ERROR: can not read " << ffile << endl; + else + fwordclasses.read(fstrm,m2); + } + hmm(model2&m2); + void initialize_table_uniformly(sentenceHandler&); + int em_with_tricks(int); + void load_table(const char* aname); + void em_loop(Perplexity& perp, sentenceHandler& sHandler1, bool dump_files, + const char* alignfile, Perplexity&, bool test,bool doInit,int iter); + HMMNetwork *makeHMMNetwork(const Vector<WordIndex>& es,const Vector<WordIndex>&fs,bool doInit)const; + friend class model3; +}; + +#endif |