summary | refs | log | tree | commit | diff
path: root/extools
diff options
context:
space:
mode:
author trevor.cohn <trevor.cohn@ec762483-ff6d-05da-a07a-a48fb63a330f> 2010-07-18 22:43:24 +0000
committer trevor.cohn <trevor.cohn@ec762483-ff6d-05da-a07a-a48fb63a330f> 2010-07-18 22:43:24 +0000
commit 241a0317966f00546aaf3b5c02c137097cfaccda (patch)
tree 9a36ff04e56df33aa4230b25b6c46a3286d8421f /extools
parent c150bdea83a9f599b34832072a70af525e40b77a (diff)
??
git-svn-id: https://ws10smt.googlecode.com/svn/trunk@312 ec762483-ff6d-05da-a07a-a48fb63a330f
Diffstat (limited to 'extools')
-rw-r--r-- extools/extractor.cc 1
-rwxr-xr-x extools/simple-extract.sh 2
2 files changed, 2 insertions, 1 deletions
diff --git a/extools/extractor.cc b/extools/extractor.cc
index 7279f745..71778d49 100644
--- a/extools/extractor.cc
+++ b/extools/extractor.cc
@@ -396,6 +396,7 @@ int main(int argc, char** argv) {
++line;
in.getline(buf, MAX_LINE_LENGTH);
if (buf[0] == 0) continue;
+ //cerr << "line #" << line << " = " << buf << endl;
if (!silent) {
if (line % 200 == 0) cerr << '.';
if (line % 8000 == 0) cerr << " [" << line << "]\n" << flush;
diff --git a/extools/simple-extract.sh b/extools/simple-extract.sh
index 7d9f439d..ec5c5276 100755
--- a/extools/simple-extract.sh
+++ b/extools/simple-extract.sh
@@ -6,6 +6,6 @@ date
date
# -p = compute phrase marginals
# -b = bidirectional rules (starting with F or E) were extracted
-gzcat ex.output.gz | ./mr_stripe_rule_reduce -p -b | sort -t $'\t' -k 1 | ./mr_stripe_rule_reduce | gzip > phrase-table.gz
+zcat ex.output.gz | ./mr_stripe_rule_reduce -p -b | sort -t $'\t' -k 1 | ./mr_stripe_rule_reduce | gzip > phrase-table.gz
date