Welcome to mirror list, hosted at ThFree Co, Russian Federation.

Word.h « OnDiskPt - github.com/moses-smt/mosesdecoder.git - Unnamed repository; edit this file 'description' to name the repository.
summaryrefslogtreecommitdiff
blob: 53253fa241cc290aa20861e4bf8a97ff0f589056 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
#pragma once
// $Id$
/***********************************************************************
 Moses - factored phrase-based, hierarchical and syntactic language decoder
 Copyright (C) 2009 Hieu Hoang

 This library is free software; you can redistribute it and/or
 modify it under the terms of the GNU Lesser General Public
 License as published by the Free Software Foundation; either
 version 2.1 of the License, or (at your option) any later version.

 This library is distributed in the hope that it will be useful,
 but WITHOUT ANY WARRANTY; without even the implied warranty of
 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 Lesser General Public License for more details.

 You should have received a copy of the GNU Lesser General Public
 License along with this library; if not, write to the Free Software
 Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301  USA
 ***********************************************************************/
#include <string>
#include <vector>
#include <iostream>
#include <fstream>
#include <boost/shared_ptr.hpp>
#include "Vocab.h"

// Forward declaration only: this header refers to Moses::Word solely by
// reference (the output parameter of OnDiskPt::Word::ConvertToMoses), so the
// full class definition is not required here.
namespace Moses
{
class Word;
}

namespace OnDiskPt
{
// Forward declaration of the vocabulary class used throughout Word's interface.
// NOTE(review): "Vocab.h" is already included above and the inline
// Word::GetString() calls a Vocab member, so this declaration is presumably
// redundant - confirm before removing.
class Vocab;

/* A wrapper around a vocab id, and a boolean indicating whther it is a term or non-term.
 * Factors can be represented by using a vocab string with | character, eg go|VB
 */
class Word
{
  friend std::ostream& operator<<(std::ostream&, const Word&);

private:
  bool m_isNonTerminal;
  UINT64 m_vocabId;

public:
  explicit Word() {
  }

  explicit Word(bool isNonTerminal)
    :m_isNonTerminal(isNonTerminal)
    ,m_vocabId(0) {
  }

  Word(const Word &copy);
  ~Word();


  void CreateFromString(const std::string &inString, Vocab &vocab);
  bool IsNonTerminal() const {
    return m_isNonTerminal;
  }

  size_t WriteToMemory(char *mem) const;
  size_t ReadFromMemory(const char *mem);
  size_t ReadFromFile(std::fstream &file);

  void SetVocabId(UINT32 vocabId) {
    m_vocabId = vocabId;
  }

  void ConvertToMoses(
    const std::vector<Moses::FactorType> &outputFactorsVec,
    const Vocab &vocab,
    Moses::Word &overwrite) const;

  void DebugPrint(std::ostream &out, const Vocab &vocab) const;
  inline const std::string &GetString(const Vocab &vocab) const {
    return vocab.GetString(m_vocabId);
  }

  int Compare(const Word &compare) const;
  bool operator<(const Word &compare) const;
  bool operator==(const Word &compare) const;

};

// Shared-ownership (boost::shared_ptr) handle to a Word.
typedef boost::shared_ptr<Word> WordPtr;
}