summaryrefslogtreecommitdiff
path: root/utils/alignment_io.cc
blob: 460fbd3f1d23bdc29303f80dc9833950a8f9de1b (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
#include "utils/alignment_io.h"

using namespace std;

// Returns true iff `x` is one of the ASCII decimal digits '0'..'9'.
static bool is_digit(char x) {
  if (x < '0') return false;
  return x <= '9';
}

boost::shared_ptr<Array2D<bool> > AlignmentIO::ReadPharaohAlignmentGrid(const string& al) {
  int max_x = 0;
  int max_y = 0;
  unsigned i = 0;
  size_t pos = al.rfind(" ||| ");
  if (pos != string::npos) { i = pos + 5; }
  while (i < al.size()) {
    if (al[i] == '\n' || al[i] == '\r') break;
    int x = 0;
    while(i < al.size() && is_digit(al[i])) {
      x *= 10;
      x += al[i] - '0';
      ++i;
    }
    if (x > max_x) max_x = x;
    assert(i < al.size());
    if(al[i] != '-') {
      cerr << "BAD ALIGNMENT: " << al << endl;
      abort();
    }
    ++i;
    int y = 0;
    while(i < al.size() && is_digit(al[i])) {
      y *= 10;
      y += al[i] - '0';
      ++i;
    }
    if (y > max_y) max_y = y;
    while(i < al.size() && al[i] == ' ') { ++i; }
  }

  boost::shared_ptr<Array2D<bool> > grid(new Array2D<bool>(max_x + 1, max_y + 1));
  i = 0;
  if (pos != string::npos) { i = pos + 5; }
  while (i < al.size()) {
    if (al[i] == '\n' || al[i] == '\r') break;
    int x = 0;
    while(i < al.size() && is_digit(al[i])) {
      x *= 10;
      x += al[i] - '0';
      ++i;
    }
    assert(i < al.size());
    assert(al[i] == '-');
    ++i;
    int y = 0;
    while(i < al.size() && is_digit(al[i])) {
      y *= 10;
      y += al[i] - '0';
      ++i;
    }
    (*grid)(x, y) = true;
    while(i < al.size() && al[i] == ' ') { ++i; }
  }
  // cerr << *grid << endl;
  return grid;
}

// Writes every true cell of `alignment` to `*o` as "i-j", where i is the first
// index (0 .. width()-1, outer loop) and j the second (0 .. height()-1, inner
// loop). Points are separated by single spaces and the line is terminated
// with endl, so the stream is flushed even when no point was written.
void AlignmentIO::SerializePharaohFormat(const Array2D<bool>& alignment, ostream* o) {
  ostream& out = *o;
  bool first = true;
  for (unsigned x = 0; x < alignment.width(); ++x) {
    for (unsigned y = 0; y < alignment.height(); ++y) {
      if (!alignment(x, y)) continue;
      // Separator goes before every point except the first one.
      if (first) {
        first = false;
      } else {
        out << ' ';
      }
      out << x << '-' << y;
    }
  }
  out << endl;
}

void AlignmentIO::SerializeTypedAlignment(const Array2D<AlignmentType>& alignment, ostream* o) {
  ostream& out = *o;
  bool need_space = false;
  for (unsigned i = 0; i < alignment.width(); ++i)
    for (unsigned j = 0; j < alignment.height(); ++j) {
      const AlignmentType& aij = alignment(i,j);
      if (aij != kNONE) {
        if (need_space) out << ' '; else need_space = true;
        if (aij == kTRANSLATION) {}
        else if (aij == kTRANSLITERATION) {
          out << 'T' << ':';
        } else {
          cerr << "\nUnexpected alignment point type: " << static_cast<int>(aij) << endl;
          abort();
        }
        out << i << '-' << j;
      }
    }
  out << endl;
}