summary | refs | log | tree | commit | diff
path: root/preprocess_nolow
diff options
context:
space:
mode:
author: Patrick Simianer <p@simianer.de> 2013-12-05 07:56:38 +0100
committer: Patrick Simianer <p@simianer.de> 2013-12-05 07:56:38 +0100
commit: db6a6ecfa350cae29739c59df1210d8f76a479c9 (patch)
tree: f137a001f57f170455c28ce97b5abb2726006cf6 /preprocess_nolow
init
Diffstat (limited to 'preprocess_nolow')
-rwxr-xr-x preprocess_nolow 5
1 file changed, 5 insertions, 0 deletions
diff --git a/preprocess_nolow b/preprocess_nolow
new file mode 100755
index 0000000..fc466b6
--- /dev/null
+++ b/preprocess_nolow
@@ -0,0 +1,5 @@
+#!/bin/zsh
+
+LANG=$1
+~/scripts/htmlentities 2>htmlentities.$LANG.err | ~/scripts/normalize-punctuation 2>normalize-punctuation.$LANG.err | ~/moses/scripts/tokenizer/tokenizer.perl -a -b -threads 1 -l $LANG 2>tokenizer.$LANG.err
+