Welcome to mirror list, hosted at ThFree Co, Russian Federation.

tables-core.h « phrase-extract - github.com/moses-smt/mosesdecoder.git - Unnamed repository; edit this file 'description' to name the repository.
summaryrefslogtreecommitdiff
blob: 9662ced2a63a5b6493a3aa4c9c6a753be43218ba (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
// $Id$

#ifndef _TABLES_H
#define _TABLES_H

#include <iostream>
#include <fstream>
#include <assert.h>
#include <stdlib.h>
#include <string>
#include <queue>
#include <map>
#include <cmath>

extern std::vector<std::string> tokenize( const char*);

namespace MosesTraining
{

typedef std::string WORD;
typedef unsigned int WORD_ID;

class Vocabulary
{
public:
  std::map<WORD, WORD_ID>  lookup;
  std::vector< WORD > vocab;
  WORD_ID storeIfNew( const WORD& );
  WORD_ID getWordID( const WORD& );
  inline WORD &getWord( const WORD_ID id ) {
    return vocab[ id ];
  }
};

typedef std::vector< WORD_ID > PHRASE;
typedef unsigned int PHRASE_ID;

class PhraseTable
{
public:
  std::map< PHRASE, PHRASE_ID > lookup;
  std::vector< PHRASE > phraseTable;
  PHRASE_ID storeIfNew( const PHRASE& );
  PHRASE_ID getPhraseID( const PHRASE& );
  void clear();
  inline PHRASE &getPhrase( const PHRASE_ID id ) {
    return phraseTable[ id ];
  }
};

typedef std::vector< std::pair< PHRASE_ID, double > > PHRASEPROBVEC;

class TTable
{
public:
  std::map< PHRASE_ID, std::vector< std::pair< PHRASE_ID, double > > > ttable;
  std::map< PHRASE_ID, std::vector< std::pair< PHRASE_ID, std::vector< double > > > > ttableMulti;
};

class DTable
{
public:
  std::map< int, double > dtable;
  void init();
  void load( const std::string& );
  double get( int );
};

}

#endif