1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
|
// -*- c++ -*-
#ifndef moses_TreeInput_h
#define moses_TreeInput_h
#include <vector>
#include "Sentence.h"
namespace Moses
{
class TranslationTask;
//! @todo what is this?
class XMLParseOutput
{
public:
std::string m_label;
Range m_range;
XMLParseOutput(const std::string &label, const Range &range)
: m_label(label)
, m_range(range) {
}
};
/** An input to the decoder that represent a parse tree.
* Implemented as a sentence with non-terminal labels over certain ranges.
* This representation doesn't necessarily have to form a tree, it's up to the user to make sure it does if they really want a tree.
* @todo Need to rewrite if you want packed forest, or packed forest over lattice - not sure if can inherit from this
*/
class TreeInput : public Sentence
{
friend std::ostream& operator<<(std::ostream&, const TreeInput&);
protected:
std::vector<std::vector<NonTerminalSet> > m_sourceChart;
std::vector<XMLParseOutput> m_labelledSpans;
void AddChartLabel(size_t startPos, size_t endPos, const std::string &label);
void AddChartLabel(size_t startPos, size_t endPos, const Word &label);
NonTerminalSet &GetLabelSet(size_t startPos, size_t endPos) {
return m_sourceChart[startPos][endPos - startPos];
}
bool ProcessAndStripXMLTags(AllOptions const& opts, std::string &line,
std::vector<XMLParseOutput> &sourceLabels,
std::vector<XmlOption const*> &res);
public:
TreeInput(AllOptions::ptr const& opts) : Sentence(opts) { }
InputTypeEnum GetType() const {
return TreeInputType;
}
//! populate this InputType with data from in stream
virtual int
Read(std::istream& in);
//! Output debugging info to stream out
virtual void Print(std::ostream&) const;
//! create trans options specific to this InputType
virtual TranslationOptionCollection* CreateTranslationOptionCollection() const;
virtual const NonTerminalSet &GetLabelSet(size_t startPos, size_t endPos) const {
return m_sourceChart[startPos][endPos - startPos];
}
//! Get the XMLParseOutput objects in the order they were created.
const std::vector<XMLParseOutput> &GetLabelledSpans() const {
return m_labelledSpans;
}
};
}
#endif
|