Welcome to mirror list, hosted at ThFree Co, Russian Federation.

line_splitter.hh « ProbingPT « TranslationModel « moses - github.com/moses-smt/mosesdecoder.git - Unnamed repository; edit this file 'description' to name the repository.
summaryrefslogtreecommitdiff
blob: cec0a5f4596545bc499d471b25402738521a6c4e (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
#pragma once

#include "util/string_piece.hh"
#include "util/tokenize_piece.hh"
#include "util/file_piece.hh"
#include <vector>
#include <cstdlib> //atof
#include "util/string_piece.hh"  //Tokenization and work with StringPiece
#include "util/tokenize_piece.hh"
#include <vector>

namespace Moses
{

//Struct for holding processed line
struct line_text
{
  StringPiece source_phrase;
  StringPiece target_phrase;
  StringPiece prob;
  StringPiece word_align;
  StringPiece counts;
  StringPiece sparse_score;
  StringPiece property;
  std::string property_to_be_binarized;
};

//Struct for holding processed line
struct target_text
{
  std::vector<unsigned int> target_phrase;
  std::vector<float> prob;
  std::vector<size_t> word_align_term;
  std::vector<size_t> word_align_non_term;
  std::vector<char> counts;
  std::vector<char> sparse_score;
  std::vector<char> property;

  /*
  void Reset()
  {
    target_phrase.clear();
    prob.clear();
    word_all1.clear();
    counts.clear();
    sparse_score.clear();
    property.clear();
  }
  */
};

//Ask if it's better to have it receive a pointer to a line_text struct
line_text splitLine(const StringPiece &textin, bool scfg);
void reformatSCFG(line_text &output);

std::vector<unsigned char> splitWordAll1(const StringPiece &textin);

}