diff options
Diffstat (limited to 'extools')
-rw-r--r-- | extools/extractor.cc | 1 |
-rwxr-xr-x | extools/simple-extract.sh | 2 |
2 files changed, 2 insertions, 1 deletion
diff --git a/extools/extractor.cc b/extools/extractor.cc index 7279f745..71778d49 100644 --- a/extools/extractor.cc +++ b/extools/extractor.cc @@ -396,6 +396,7 @@ int main(int argc, char** argv) { ++line; in.getline(buf, MAX_LINE_LENGTH); if (buf[0] == 0) continue; + //cerr << "line #" << line << " = " << buf << endl; if (!silent) { if (line % 200 == 0) cerr << '.'; if (line % 8000 == 0) cerr << " [" << line << "]\n" << flush; diff --git a/extools/simple-extract.sh b/extools/simple-extract.sh index 7d9f439d..ec5c5276 100755 --- a/extools/simple-extract.sh +++ b/extools/simple-extract.sh @@ -6,6 +6,6 @@ date date # -p = compute phrase marginals # -b = bidirectional rules (starting with F or E) were extracted -gzcat ex.output.gz | ./mr_stripe_rule_reduce -p -b | sort -t $'\t' -k 1 | ./mr_stripe_rule_reduce | gzip > phrase-table.gz +zcat ex.output.gz | ./mr_stripe_rule_reduce -p -b | sort -t $'\t' -k 1 | ./mr_stripe_rule_reduce | gzip > phrase-table.gz date |