/*********************************************************************** Moses - factored phrase-based language decoder Copyright (C) 2006 University of Edinburgh This library is free software; you can redistribute it and/or modify it under the terms of the GNU Lesser General Public License as published by the Free Software Foundation; either version 2.1 of the License, or (at your option) any later version. This library is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU Lesser General Public License for more details. You should have received a copy of the GNU Lesser General Public License along with this library; if not, write to the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA ***********************************************************************/ #ifndef moses_TypeDef_h #define moses_TypeDef_h #include #include #include #include #ifdef WIN32 #include #else #include typedef uint32_t UINT32; typedef uint64_t UINT64; #endif namespace Moses { #define PROJECT_NAME "moses" #ifndef BOS_ #define BOS_ "" //Beginning of sentence symbol #endif #ifndef EOS_ #define EOS_ "" //End of sentence symbol #endif #define UNKNOWN_FACTOR "UNK" #define EPSILON "*EPS*" #define NOT_FOUND std::numeric_limits::max() #define MAX_NGRAM_SIZE 20 const size_t DEFAULT_CUBE_PRUNING_POP_LIMIT = 1000; const size_t DEFAULT_CUBE_PRUNING_DIVERSITY = 0; const size_t DEFAULT_MAX_HYPOSTACK_SIZE = 200; const size_t DEFAULT_MAX_TRANS_OPT_CACHE_SIZE = 10000; const size_t DEFAULT_MAX_TRANS_OPT_SIZE = 5000; const size_t DEFAULT_MAX_PART_TRANS_OPT_SIZE = 10000; const size_t DEFAULT_MAX_PHRASE_LENGTH = 20; const size_t DEFAULT_MAX_CHART_SPAN = 10; const size_t ARRAY_SIZE_INCR = 10; //amount by which a phrase gets resized when necessary const float LOWEST_SCORE = -100.0f; const float DEFAULT_BEAM_WIDTH = 0.00001f; const float DEFAULT_EARLY_DISCARDING_THRESHOLD = 0.0f; const float DEFAULT_TRANSLATION_OPTION_THRESHOLD = 0.0f; const size_t DEFAULT_VERBOSE_LEVEL = 1; // enums. // must be 0, 1, 2, ..., unless otherwise stated // can only be 2 at the moment const int NUM_LANGUAGES = 2; const size_t MAX_NUM_FACTORS = 4; enum FactorDirection { Input, //! Source factors Output //! Target factors }; enum DecodeType { Translate ,Generate ,InsertNullFertilityWord //! an optional step that attempts to insert a few closed-class words to improve LM scores }; namespace LexReorderType { enum LexReorderType { // explain values Backward ,Forward ,Bidirectional ,Fe ,F }; } namespace DistortionOrientationType { enum DistortionOrientationOptions { Monotone, //distinguish only between monotone and non-monotone as possible orientations Msd //further separate non-monotone into swapped and discontinuous }; } enum LMType { SingleFactor ,MultiFactor }; enum LMImplementation { SRI = 0 ,IRST = 1 // ,Skip = 2 ,Joint = 3 // ,Internal = 4 ,RandLM = 5 ,Remote = 6 ,ParallelBackoff = 7 ,Ken = 8 ,LazyKen = 9 ,ORLM = 10 ,LDHTLM = 11 }; enum PhraseTableImplementation { Memory = 0 ,Binary = 1 ,OnDisk = 2 //,GlueRule = 3 //,Joshua = 4 //,MemorySourceLabel = 5 ,SCFG = 6 //,BerkeleyDb = 7 ,SuffixArray = 8 ,Hiero = 9 ,ALSuffixArray = 10 }; enum InputTypeEnum { SentenceInput = 0 ,ConfusionNetworkInput = 1 ,WordLatticeInput = 2 ,TreeInputType = 3 ,WordLatticeInput2 = 4 }; enum XmlInputType { XmlPassThrough = 0, XmlIgnore = 1, XmlExclusive = 2, XmlInclusive = 3 }; enum DictionaryFind { Best = 0 ,All = 1 }; enum ParsingAlgorithm { ParseCYKPlus = 0, ParseScope3 = 1 }; enum SearchAlgorithm { Normal = 0 ,CubePruning = 1 ,CubeGrowing = 2 ,ChartDecoding= 3 }; enum SourceLabelOverlap { SourceLabelOverlapAdd = 0 ,SourceLabelOverlapReplace = 1 ,SourceLabelOverlapDiscard = 2 }; enum WordAlignmentSort { NoSort = 0 ,TargetOrder = 1 }; // typedef typedef size_t FactorType; typedef std::vector Scores; typedef std::vector WordAlignments; typedef std::vector FactorList; typedef std::pair,Scores > StringTgtCand; typedef std::pair,WordAlignments > StringWordAlignmentCand; } #endif