summary | refs | log | tree | commit | diff
path: root/preprocess
diff options
context:
space:
mode:
author: Patrick Simianer <p@simianer.de> 2014-03-17 13:50:41 +0100
committer: Patrick Simianer <p@simianer.de> 2014-03-17 13:50:41 +0100
commit: b08be6207a78fc3639231489b74b4c72d78221d7 (patch)
tree: 7aa57fd79a5c4c848ac16663256fabc2778fa780 /preprocess
parent: 3bbbd92fc7b1f9d0d61f8573fee0d0b2f40960d3 (diff)
fix
Diffstat (limited to 'preprocess')
-rwxr-xr-x preprocess 2
1 file changed, 1 insertion, 1 deletion
diff --git a/preprocess b/preprocess
index 69eaa54..b034e48 100755
--- a/preprocess
+++ b/preprocess
@@ -1,5 +1,5 @@
#!/bin/bash
LANG=$1
-/toolbox/scripts/no_non_printables | sed "s|[-,\.]\{4,\}|...|" | /toolbox/scripts/htmlentities 2>htmlentities.$LANG.err | /toolbox/scripts/normalize_punctuation 2>normalize-punctuation.$LANG.err | /toolbox/moses/scripts/tokenizer/tokenizer.no-escape.perl -a -b -threads 1 -l $LANG 2>tokenizer.$LANG.err | /toolbox/moses/scripts/tokenizer/lowercase.perl 2>lowercase.$LANG.err
+/toolbox/scripts/no_non_printables | sed "s|[-,\.]\{4,\}|...|g" | /toolbox/scripts/htmlentities 2>htmlentities.$LANG.err | /toolbox/scripts/normalize_punctuation 2>normalize-punctuation.$LANG.err | /toolbox/moses/scripts/tokenizer/tokenizer.no-escape.perl -a -b -threads 1 -l $LANG 2>tokenizer.$LANG.err | /toolbox/moses/scripts/tokenizer/lowercase.perl 2>lowercase.$LANG.err