summaryrefslogtreecommitdiff
path: root/extools/sentence_pair.cc
diff options
context:
space:
mode:
authorredpony <redpony@ec762483-ff6d-05da-a07a-a48fb63a330f>2010-08-26 21:49:45 +0000
committerredpony <redpony@ec762483-ff6d-05da-a07a-a48fb63a330f>2010-08-26 21:49:45 +0000
commit6ddaff1341e565dd91dca7ea763d0ea4d897f4c7 (patch)
tree884fe1de5075cfaf6897b3b31b51586c1a0cb09a /extools/sentence_pair.cc
parent81e37133c966e8de993ec922b0008c405b29fe02 (diff)
some experimental stuff
git-svn-id: https://ws10smt.googlecode.com/svn/trunk@625 ec762483-ff6d-05da-a07a-a48fb63a330f
Diffstat (limited to 'extools/sentence_pair.cc')
-rw-r--r--extools/sentence_pair.cc21
1 files changed, 9 insertions, 12 deletions
diff --git a/extools/sentence_pair.cc b/extools/sentence_pair.cc
index 55609db4..d5ebe48f 100644
--- a/extools/sentence_pair.cc
+++ b/extools/sentence_pair.cc
@@ -117,6 +117,14 @@ int AnnotatedParallelSentence::ReadAlignmentPoint(const char* buf,
return ch;
}
+void AnnotatedParallelSentence::Align(const short a, const short b) {
+ aligned(a,b) = true;
+ ++f_aligned[a];
+ ++e_aligned[b];
+ aligns_by_fword[a].push_back(make_pair(a,b));
+ // cerr << a << " " << b << endl;
+}
+
void AnnotatedParallelSentence::ParseAlignmentPoint(const char* buf, int start, int end) {
short a, b;
ReadAlignmentPoint(buf, start, end, false, &a, &b, 0, 0);
@@ -124,11 +132,7 @@ void AnnotatedParallelSentence::ParseAlignmentPoint(const char* buf, int start,
cerr << "(" << a << ',' << b << ") is out of bounds. INPUT=\n" << buf << endl;
exit(1);
}
- aligned(a,b) = true;
- ++f_aligned[a];
- ++e_aligned[b];
- aligns_by_fword[a].push_back(make_pair(a,b));
- // cerr << a << " " << b << endl;
+ Align(a,b);
}
void AnnotatedParallelSentence::ParseSpanLabel(const char* buf, int start, int end) {
@@ -191,12 +195,5 @@ void AnnotatedParallelSentence::ParseInputLine(const char* buf) {
default: cerr << "Can't happen\n"; abort();
}
}
- if (state < 2) {
- cerr << "Not enough fields: " << buf << endl;
- abort();
- }
- if (e.empty() || f.empty()) {
- cerr << "Sentences must not be empty: " << buf << endl;
- }
}