summaryrefslogtreecommitdiff
path: root/extractor/alignment.h
blob: 4596f92b595b7885b99405e059825c1e8dee42b3 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
#ifndef _ALIGNMENT_H_
#define _ALIGNMENT_H_

#include <string>
#include <vector>

#include <boost/filesystem.hpp>

namespace fs = boost::filesystem;
using namespace std;

namespace extractor {

/**
 * Holds the word alignments of a parallel corpus, one list of links per
 * sentence.
 *
 * Each link is a pair of integers; presumably (source word position, target
 * word position) -- confirm against the implementation file.
 */
class Alignment {
 public:
  /// Builds the alignment by reading it from the text file `filename`.
  Alignment(const std::string& filename);

  /// Returns, by value, the list of links for the sentence at
  /// `sentence_index`. Declared virtual, so subclasses may override it.
  virtual std::vector<std::pair<int, int>> GetLinks(int sentence_index) const;

  /// Serializes the alignment in binary format to the file at `filepath`.
  void WriteBinary(const fs::path& filepath);

  /// Virtual so that destroying a derived object through an `Alignment`
  /// pointer is well defined.
  virtual ~Alignment();

 protected:
  /// Default constructor, reachable only from subclasses; it takes no input
  /// file.
  Alignment();

 private:
  /// Links of every sentence in the corpus, one inner vector per sentence.
  std::vector<std::vector<std::pair<int, int>>> alignments;
};

} // namespace extractor

#endif