summary | refs | log | tree | commit | diff
path: root/extools
diff options
context:
space:
mode:
author: trevor.cohn <trevor.cohn@ec762483-ff6d-05da-a07a-a48fb63a330f> 2010-07-18 22:43:24 +0000
committer: trevor.cohn <trevor.cohn@ec762483-ff6d-05da-a07a-a48fb63a330f> 2010-07-18 22:43:24 +0000
commit: 1eccc03d43ae00fb913d7e648dd2d9b62c20eb81 (patch)
tree: 68570ab7e32a1f63aaccfd4ad6ae09aba2689f75 /extools
parent: bd1019e31893ecd4799f4cb1c3000582d291c7a5 (diff)
??
git-svn-id: https://ws10smt.googlecode.com/svn/trunk@312 ec762483-ff6d-05da-a07a-a48fb63a330f
Diffstat (limited to 'extools')
-rw-r--r--  extools/extractor.cc       1
-rwxr-xr-x  extools/simple-extract.sh  2
2 files changed, 2 insertions, 1 deletions
diff --git a/extools/extractor.cc b/extools/extractor.cc
index 7279f745..71778d49 100644
--- a/extools/extractor.cc
+++ b/extools/extractor.cc
@@ -396,6 +396,7 @@ int main(int argc, char** argv) {
++line;
in.getline(buf, MAX_LINE_LENGTH);
if (buf[0] == 0) continue;
+ //cerr << "line #" << line << " = " << buf << endl;
if (!silent) {
if (line % 200 == 0) cerr << '.';
if (line % 8000 == 0) cerr << " [" << line << "]\n" << flush;
diff --git a/extools/simple-extract.sh b/extools/simple-extract.sh
index 7d9f439d..ec5c5276 100755
--- a/extools/simple-extract.sh
+++ b/extools/simple-extract.sh
@@ -6,6 +6,6 @@ date
date
# -p = compute phrase marginals
# -b = bidirectional rules (starting with F or E) were extracted
-gzcat ex.output.gz | ./mr_stripe_rule_reduce -p -b | sort -t $'\t' -k 1 | ./mr_stripe_rule_reduce | gzip > phrase-table.gz
+zcat ex.output.gz | ./mr_stripe_rule_reduce -p -b | sort -t $'\t' -k 1 | ./mr_stripe_rule_reduce | gzip > phrase-table.gz
date