Welcome to mirror list, hosted at ThFree Co, Russian Federation.

TreeInput.h « moses - github.com/moses-smt/mosesdecoder.git - Unnamed repository; edit this file 'description' to name the repository.
summaryrefslogtreecommitdiff
blob: 0d79516ab2796c71b39b44788b9c664038c946f6 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
// -*- c++ -*-
#ifndef moses_TreeInput_h
#define moses_TreeInput_h


#include <vector>
#include "Sentence.h"

namespace Moses
{
class TranslationTask;
/** A label paired with the Range it is attached to.
 *  TreeInput keeps a vector of these in m_labelledSpans, and
 *  TreeInput::ProcessAndStripXMLTags() takes a vector of them as its
 *  sourceLabels argument.
 *  Both members are public and are initialised by the constructor.
 */
class XMLParseOutput
{
public:
  std::string m_label;  //!< label text
  Range m_range;        //!< range the label is attached to

  //! Store copies of the given label and range.
  XMLParseOutput(const std::string &label, const Range &range)
    : m_label(label), m_range(range)
  {}
};

/** An input to the decoder that represents a parse tree.
 *  It is a Sentence that additionally holds non-terminal labels over
 *  certain ranges, kept in a chart of NonTerminalSet objects.
 *  Nothing in this representation forces the labelled ranges to form a
 *  tree; a user who really wants a tree has to make sure of that.
 *  @todo Needs a rewrite for a packed forest, or a packed forest over a
 *        lattice - not sure whether that could inherit from this class.
 */
class TreeInput : public Sentence
{
  friend std::ostream& operator<<(std::ostream&, const TreeInput&);

protected:
  //! Label sets, indexed as [startPos][endPos - startPos].
  std::vector<std::vector<NonTerminalSet> > m_sourceChart;
  //! Labelled spans, exposed read-only through GetLabelledSpans().
  std::vector<XMLParseOutput> m_labelledSpans;

  // The two AddChartLabel overloads differ only in how the label is given
  // (as text or as a Word). Both are defined outside this header.
  // NOTE(review): presumably they add the label to the chart cell for
  // startPos/endPos - confirm against the implementation.
  void AddChartLabel(size_t startPos, size_t endPos, const std::string &label);
  void AddChartLabel(size_t startPos, size_t endPos, const Word &label);

  //! Mutable access to the chart cell for startPos/endPos.
  //! Uses plain operator[] on both levels, so no bounds checking is done.
  NonTerminalSet &GetLabelSet(size_t startPos, size_t endPos) {
    std::vector<NonTerminalSet> &row = m_sourceChart[startPos];
    return row[endPos - startPos];
  }

  // Defined outside this header.
  // NOTE(review): judging by the name and the non-const reference
  // parameters, this strips XML markup from line and fills sourceLabels and
  // res; the meaning of the bool result is not visible here - confirm.
  bool ProcessAndStripXMLTags(AllOptions const& opts,
                              std::string &line,
                              std::vector<XMLParseOutput> &sourceLabels,
                              std::vector<XmlOption const*> &res);

public:
  //! Construct from decoder options; they are passed straight to Sentence.
  TreeInput(AllOptions::ptr const& opts)
    : Sentence(opts)
  {}

  //! Identify this input as TreeInputType.
  InputTypeEnum GetType() const { return TreeInputType; }

  //! Populate this InputType with data read from the stream in.
  //! NOTE(review): meaning of the int result is not visible here.
  virtual int Read(std::istream& in);

  //! Write debugging info to the given stream.
  virtual void Print(std::ostream&) const;

  //! Create the translation option collection specific to this InputType.
  //! NOTE(review): ownership of the returned pointer is not visible here.
  virtual TranslationOptionCollection* CreateTranslationOptionCollection() const;

  //! Read-only access to the chart cell for startPos/endPos.
  //! Uses plain operator[] on both levels, so no bounds checking is done.
  virtual const NonTerminalSet &GetLabelSet(size_t startPos, size_t endPos) const {
    const std::vector<NonTerminalSet> &row = m_sourceChart[startPos];
    return row[endPos - startPos];
  }

  //! The XMLParseOutput objects, in the order they were created.
  const std::vector<XMLParseOutput> &GetLabelledSpans() const {
    return m_labelledSpans;
  }
};

}

#endif