Welcome to mirror list, hosted at ThFree Co, Russian Federation.

PhrasePairCollection.h « biconcor « ems « scripts - github.com/moses-smt/mosesdecoder.git - Unnamed repository; edit this file 'description' to name the repository.
summaryrefslogtreecommitdiff
blob: b2473515eddb8a9f521b2bd9cd644e0eee47ac87 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
#include "Vocabulary.h"
#include "SuffixArray.h"
#include "TargetCorpus.h"
#include "Alignment.h"
#include "PhrasePair.h"
#include "Mismatch.h"

#pragma once

// Declaration of a collection of phrase pairs.
//
// An instance is constructed from pointers to a SuffixArray, a TargetCorpus
// and an Alignment. GetCollection() takes a source string given as a vector
// of strings and reports a bool; Print() and PrintHTML() take no arguments.
// All member functions are only declared here; their definitions live
// outside this header.
//
// NOTE(review): the class declares a destructor and holds raw pointers, but
// no copy constructor or assignment operator is declared -- confirm that
// instances are never copied, or that copying is safe.
class PhrasePairCollection
{
public:
  // Unsigned integer type exported as PhrasePairCollection::INDEX.
  typedef unsigned int INDEX;

private:
  // Raw pointers of the same types as the three constructor parameters.
  // NOTE(review): presumably these store the constructor arguments and are
  // not owned by this object -- confirm against the implementation file.
  SuffixArray *m_suffixArray;
  TargetCorpus *m_targetCorpus;
  Alignment *m_alignment;

  // Two-level container of PhrasePair pointers (a vector of vectors).
  // NOTE(review): the grouping criterion for the inner vectors is not
  // visible in this header.
  vector<vector<PhrasePair *> > m_collection;

  // Two separate lists of Mismatch pointers.
  vector<Mismatch *> m_mismatch;
  vector<Mismatch *> m_unaligned;

  // Integer state; the names suggest a size counter and several upper
  // limits, but their values and use are set outside this header.
  int m_size;
  int m_max_lookup;
  int m_max_pp_target;
  int m_max_pp;

public:
  PhrasePairCollection(SuffixArray *suffixArray,
                       TargetCorpus *targetCorpus,
                       Alignment *alignment);
  ~PhrasePairCollection();

  // Takes the source string as a vector of strings (passed by value).
  // NOTE(review): the meaning of the bool result is defined in the
  // implementation file -- confirm there.
  bool GetCollection(const vector<string> sourceString);

  // Output routines; presumably plain-text and HTML renderings of the
  // collection -- confirm against the implementation file.
  void Print();
  void PrintHTML();
};

// Sorting helper: a comparator that ranks containers by element count in
// descending order, i.e. cmp(a, b) is true exactly when a holds more
// elements than b. Containers of equal size compare as equivalent.
//
// Both arguments are taken by const reference so that a comparison never
// copies the containers. The call operator is a template, so it accepts
// vector<PhrasePair*> as well as any other type that provides size().
struct CompareBySize {
  template <typename Container>
  bool operator()(const Container &a, const Container &b) const {
    return a.size() > b.size();
  }
};