summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
-rwxr-xr-xadd-ln (renamed from add_ln)0
-rwxr-xr-xadd-seg (renamed from add_seg)0
-rwxr-xr-xadd-start-end (renamed from add_start_end)0
-rwxr-xr-xavg-weights (renamed from avg_weights)0
-rwxr-xr-xcdec-hg-to-json (renamed from cdec_hg_to_json)0
-rwxr-xr-xconvert-to-svm-light-format (renamed from convert_to_svmlight_format)0
-rw-r--r--dense-features.txt (renamed from dense_features.txt)0
-rwxr-xr-xfake-svm-light (renamed from fake_svm_light)0
-rwxr-xr-xfeature-dict (renamed from feature_dict)0
-rwxr-xr-xfilter-by-rule-shape (renamed from filter_by_rule_shape)0
-rwxr-xr-xfilter-features (renamed from filter_features)0
-rwxr-xr-xfirst-lower (renamed from first_lower)0
-rwxr-xr-xgigaword-collapse-tags (renamed from gigaword_collapse_tags)0
-rwxr-xr-xhadoop-uniq (renamed from hadoop_uniq)0
-rwxr-xr-xkbest-bleu-oracles (renamed from kbest_bleu_oracles)0
-rwxr-xr-xkendalls-tau (renamed from kendalls_tau)0
-rwxr-xr-xkey-count (renamed from key_count)0
-rwxr-xr-xlin-reg (renamed from lin_reg)0
-rwxr-xr-xlog-reg (renamed from log_reg)0
-rwxr-xr-xmake-rule-features (renamed from make_rule_features)0
-rwxr-xr-xmax-len (renamed from max_len)0
-rwxr-xr-xmem-usage (renamed from mem_usage)0
-rwxr-xr-xmerge-files (renamed from merge_files)0
-rwxr-xr-xmerge-ttable (renamed from merge_ttable)0
-rwxr-xr-xmin-max (renamed from min_max)0
-rwxr-xr-xmoses-1best (renamed from moses_1best)0
-rwxr-xr-xno-empty (renamed from no_empty)0
-rwxr-xr-xno-non-printables (renamed from no_non_printables)0
-rwxr-xr-xnorm-german (renamed from norm_german)0
-rwxr-xr-xnorm-hyphens (renamed from norm_hyphens)0
-rwxr-xr-xnormalize-punctuation (renamed from normalize_punctuation)0
-rwxr-xr-xnum-tok (renamed from num_tok)0
-rwxr-xr-xpaste-pairs (renamed from paste_pairs)0
-rwxr-xr-xper-sentence-bleu (renamed from per_sentence_bleu)0
-rwxr-xr-xper-sentence-bleu-kbest (renamed from per_sentence_bleu_kbest)0
-rwxr-xr-xper-sentence-ter (renamed from per_sentence_ter)0
-rwxr-xr-xpreprocess2
-rwxr-xr-xpreprocess-no-lower (renamed from preprocess_no_lower)2
-rwxr-xr-xpt-bloom (renamed from pt_bloom)0
-rwxr-xr-xpush-rules (renamed from push_rules)0
-rwxr-xr-xruby-eval (renamed from ruby_eval)0
-rwxr-xr-xrule-shapes (renamed from rule_shapes)0
-rwxr-xr-xselect-from (renamed from select_from)0
-rwxr-xr-xsort-features (renamed from sort_features)0
-rwxr-xr-xsource-sides (renamed from source_sides)0
-rwxr-xr-xsplit-kbest (renamed from split_kbest)0
-rwxr-xr-xsplit-lines (renamed from split_lines)0
-rwxr-xr-xsplit-pipes (renamed from split_pipes)0
-rwxr-xr-xstanford-parser-run (renamed from stanford_parser_run)0
-rw-r--r--test/cdec-hg-to-json/cdec.ini (renamed from test/cdec_hg_to_json/cdec.ini)0
-rw-r--r--test/cdec-hg-to-json/grammar.gz (renamed from test/cdec_hg_to_json/grammar.gz)bin1399915 -> 1399915 bytes
-rw-r--r--test/cdec-hg-to-json/hg.json.gz (renamed from test/cdec_hg_to_json/hg.json.gz)bin318029 -> 318029 bytes
-rw-r--r--test/cdec-hg-to-json/hg.meta (renamed from test/cdec_hg_to_json/hg.meta)0
-rw-r--r--test/cdec-hg-to-json/in (renamed from test/cdec_hg_to_json/in)0
-rw-r--r--test/cdec-hg-to-json/toy.cdec.ini (renamed from test/cdec_hg_to_json/toy.cdec.ini)0
-rw-r--r--test/cdec-hg-to-json/toy.grammar (renamed from test/cdec_hg_to_json/toy.grammar)0
-rw-r--r--test/cdec-hg-to-json/toy.in (renamed from test/cdec_hg_to_json/toy.in)0
-rw-r--r--test/cdec-hg-to-json/toy.weights (renamed from test/cdec_hg_to_json/toy.weights)0
-rw-r--r--test/cdec-hg-to-json/weights (renamed from test/cdec_hg_to_json/weights)0
-rw-r--r--test/kbest-bleu-oracles/debug.kbests (renamed from test/kbest_bleu_oracles/debug.kbests)0
-rw-r--r--test/kbest-bleu-oracles/debug.refs (renamed from test/kbest_bleu_oracles/debug.refs)0
-rw-r--r--test/kbest-bleu-oracles/example.kbests (renamed from test/kbest_bleu_oracles/example.kbests)0
-rw-r--r--test/kbest-bleu-oracles/example.refs (renamed from test/kbest_bleu_oracles/example.refs)0
-rw-r--r--test/kbest-bleu-oracles/example.src (renamed from test/kbest_bleu_oracles/example.src)0
-rw-r--r--test/lin-reg/exptected.txt (renamed from test/lin_reg/exptected.txt)0
-rw-r--r--test/lin-reg/input.dat (renamed from test/lin_reg/input.dat)0
-rw-r--r--test/lin-reg/output.dat (renamed from test/lin_reg/output.dat)0
-rw-r--r--test/log-reg/expected.txt (renamed from test/log_reg/expected.txt)0
-rw-r--r--test/log-reg/input.dat (renamed from test/log_reg/input.dat)0
-rw-r--r--test/log-reg/output.dat (renamed from test/log_reg/output.dat)0
-rwxr-xr-xto-ascii (renamed from to_ascii)0
-rwxr-xr-xtoks-per-line (renamed from toks_per_line)0
-rwxr-xr-xtrain-test-split (renamed from train_test_split)0
73 files changed, 2 insertions, 2 deletions
diff --git a/add_ln b/add-ln
index 35bc44d..35bc44d 100755
--- a/add_ln
+++ b/add-ln
diff --git a/add_seg b/add-seg
index e5db580..e5db580 100755
--- a/add_seg
+++ b/add-seg
diff --git a/add_start_end b/add-start-end
index 30deaec..30deaec 100755
--- a/add_start_end
+++ b/add-start-end
diff --git a/avg_weights b/avg-weights
index 36b051a..36b051a 100755
--- a/avg_weights
+++ b/avg-weights
diff --git a/cdec_hg_to_json b/cdec-hg-to-json
index 5a26cf7..5a26cf7 100755
--- a/cdec_hg_to_json
+++ b/cdec-hg-to-json
diff --git a/convert_to_svmlight_format b/convert-to-svm-light-format
index a9ce98f..a9ce98f 100755
--- a/convert_to_svmlight_format
+++ b/convert-to-svm-light-format
diff --git a/dense_features.txt b/dense-features.txt
index daae8d1..daae8d1 100644
--- a/dense_features.txt
+++ b/dense-features.txt
diff --git a/fake_svm_light b/fake-svm-light
index eb074c1..eb074c1 100755
--- a/fake_svm_light
+++ b/fake-svm-light
diff --git a/feature_dict b/feature-dict
index 6849769..6849769 100755
--- a/feature_dict
+++ b/feature-dict
diff --git a/filter_by_rule_shape b/filter-by-rule-shape
index 695edec..695edec 100755
--- a/filter_by_rule_shape
+++ b/filter-by-rule-shape
diff --git a/filter_features b/filter-features
index fc21f6c..fc21f6c 100755
--- a/filter_features
+++ b/filter-features
diff --git a/first_lower b/first-lower
index 1cddb8e..1cddb8e 100755
--- a/first_lower
+++ b/first-lower
diff --git a/gigaword_collapse_tags b/gigaword-collapse-tags
index cbaf7d7..cbaf7d7 100755
--- a/gigaword_collapse_tags
+++ b/gigaword-collapse-tags
diff --git a/hadoop_uniq b/hadoop-uniq
index 5052419..5052419 100755
--- a/hadoop_uniq
+++ b/hadoop-uniq
diff --git a/kbest_bleu_oracles b/kbest-bleu-oracles
index a36c345..a36c345 100755
--- a/kbest_bleu_oracles
+++ b/kbest-bleu-oracles
diff --git a/kendalls_tau b/kendalls-tau
index c0c20be..c0c20be 100755
--- a/kendalls_tau
+++ b/kendalls-tau
diff --git a/key_count b/key-count
index deaa522..deaa522 100755
--- a/key_count
+++ b/key-count
diff --git a/lin_reg b/lin-reg
index 7a8e614..7a8e614 100755
--- a/lin_reg
+++ b/lin-reg
diff --git a/log_reg b/log-reg
index 82dc353..82dc353 100755
--- a/log_reg
+++ b/log-reg
diff --git a/make_rule_features b/make-rule-features
index 7adb6e9..7adb6e9 100755
--- a/make_rule_features
+++ b/make-rule-features
diff --git a/max_len b/max-len
index 69013b5..69013b5 100755
--- a/max_len
+++ b/max-len
diff --git a/mem_usage b/mem-usage
index 5c2104f..5c2104f 100755
--- a/mem_usage
+++ b/mem-usage
diff --git a/merge_files b/merge-files
index 714b57d..714b57d 100755
--- a/merge_files
+++ b/merge-files
diff --git a/merge_ttable b/merge-ttable
index ac10903..ac10903 100755
--- a/merge_ttable
+++ b/merge-ttable
diff --git a/min_max b/min-max
index 1dbfd40..1dbfd40 100755
--- a/min_max
+++ b/min-max
diff --git a/moses_1best b/moses-1best
index fd35cf8..fd35cf8 100755
--- a/moses_1best
+++ b/moses-1best
diff --git a/no_empty b/no-empty
index da57e23..da57e23 100755
--- a/no_empty
+++ b/no-empty
diff --git a/no_non_printables b/no-non-printables
index 9f9e3f9..9f9e3f9 100755
--- a/no_non_printables
+++ b/no-non-printables
diff --git a/norm_german b/norm-german
index cf9c060..cf9c060 100755
--- a/norm_german
+++ b/norm-german
diff --git a/norm_hyphens b/norm-hyphens
index 4a152a1..4a152a1 100755
--- a/norm_hyphens
+++ b/norm-hyphens
diff --git a/normalize_punctuation b/normalize-punctuation
index 108de44..108de44 100755
--- a/normalize_punctuation
+++ b/normalize-punctuation
diff --git a/num_tok b/num-tok
index 56cbae9..56cbae9 100755
--- a/num_tok
+++ b/num-tok
diff --git a/paste_pairs b/paste-pairs
index f6b8b31..f6b8b31 100755
--- a/paste_pairs
+++ b/paste-pairs
diff --git a/per_sentence_bleu b/per-sentence-bleu
index 402f364..402f364 100755
--- a/per_sentence_bleu
+++ b/per-sentence-bleu
diff --git a/per_sentence_bleu_kbest b/per-sentence-bleu-kbest
index f8bd860..f8bd860 100755
--- a/per_sentence_bleu_kbest
+++ b/per-sentence-bleu-kbest
diff --git a/per_sentence_ter b/per-sentence-ter
index fa283ef..fa283ef 100755
--- a/per_sentence_ter
+++ b/per-sentence-ter
diff --git a/preprocess b/preprocess
index 6531bf1..a46b0a8 100755
--- a/preprocess
+++ b/preprocess
@@ -5,5 +5,5 @@ P=`pwd -P`
popd > /dev/null
LANG=$1
-$P/no_non_printables | sed "s|[-,\.]\{4,\}|...|g" | $P/htmlentities 2>htmlentities.$LANG.err | $P/normalize_punctuation 2>normalize-punctuation.$LANG.err | $P/tokenizer-no-escape.perl -a -b -threads 1 -l $LANG 2>tokenizer.$LANG.err | $P/lowercase.perl 2>lowercase.$LANG.err
+$P/no-non-printables | sed "s|[-,\.]\{4,\}|...|g" | $P/htmlentities 2>htmlentities.$LANG.err | $P/normalize-punctuation 2>normalize-punctuation.$LANG.err | $P/tokenizer-no-escape.perl -a -b -threads 1 -l $LANG 2>tokenizer.$LANG.err | $P/lowercase.perl 2>lowercase.$LANG.err
diff --git a/preprocess_no_lower b/preprocess-no-lower
index 3a4d358..afd87e9 100755
--- a/preprocess_no_lower
+++ b/preprocess-no-lower
@@ -5,5 +5,5 @@ P=`pwd -P`
popd > /dev/null
LANG=$1
-$P/no_non_printables | sed "s|[-,\.]\{4,\}|...|g" | $P/htmlentities 2>htmlentities.$LANG.err | $P/normalize_punctuation 2>normalize-punctuation.$LANG.err | $P/tokenizer-no-escape.perl -a -b -threads 1 -l $LANG 2>tokenizer.$LANG.err
+$P/no-non-printables | sed "s|[-,\.]\{4,\}|...|g" | $P/htmlentities 2>htmlentities.$LANG.err | $P/normalize-punctuation 2>normalize-punctuation.$LANG.err | $P/tokenizer-no-escape.perl -a -b -threads 1 -l $LANG 2>tokenizer.$LANG.err
diff --git a/pt_bloom b/pt-bloom
index 5c2cf01..5c2cf01 100755
--- a/pt_bloom
+++ b/pt-bloom
diff --git a/push_rules b/push-rules
index c97ab80..c97ab80 100755
--- a/push_rules
+++ b/push-rules
diff --git a/ruby_eval b/ruby-eval
index fe0d181..fe0d181 100755
--- a/ruby_eval
+++ b/ruby-eval
diff --git a/rule_shapes b/rule-shapes
index 589a670..589a670 100755
--- a/rule_shapes
+++ b/rule-shapes
diff --git a/select_from b/select-from
index 7ab40e7..7ab40e7 100755
--- a/select_from
+++ b/select-from
diff --git a/sort_features b/sort-features
index 88bd779..88bd779 100755
--- a/sort_features
+++ b/sort-features
diff --git a/source_sides b/source-sides
index b4490c6..b4490c6 100755
--- a/source_sides
+++ b/source-sides
diff --git a/split_kbest b/split-kbest
index ab425b0..ab425b0 100755
--- a/split_kbest
+++ b/split-kbest
diff --git a/split_lines b/split-lines
index 14b3a0f..14b3a0f 100755
--- a/split_lines
+++ b/split-lines
diff --git a/split_pipes b/split-pipes
index ce8f018..ce8f018 100755
--- a/split_pipes
+++ b/split-pipes
diff --git a/stanford_parser_run b/stanford-parser-run
index f8d4210..f8d4210 100755
--- a/stanford_parser_run
+++ b/stanford-parser-run
diff --git a/test/cdec_hg_to_json/cdec.ini b/test/cdec-hg-to-json/cdec.ini
index 1ad25b5..1ad25b5 100644
--- a/test/cdec_hg_to_json/cdec.ini
+++ b/test/cdec-hg-to-json/cdec.ini
diff --git a/test/cdec_hg_to_json/grammar.gz b/test/cdec-hg-to-json/grammar.gz
index 78dda98..78dda98 100644
--- a/test/cdec_hg_to_json/grammar.gz
+++ b/test/cdec-hg-to-json/grammar.gz
Binary files differ
diff --git a/test/cdec_hg_to_json/hg.json.gz b/test/cdec-hg-to-json/hg.json.gz
index ed178c6..ed178c6 100644
--- a/test/cdec_hg_to_json/hg.json.gz
+++ b/test/cdec-hg-to-json/hg.json.gz
Binary files differ
diff --git a/test/cdec_hg_to_json/hg.meta b/test/cdec-hg-to-json/hg.meta
index d33a54c..d33a54c 100644
--- a/test/cdec_hg_to_json/hg.meta
+++ b/test/cdec-hg-to-json/hg.meta
diff --git a/test/cdec_hg_to_json/in b/test/cdec-hg-to-json/in
index 7dc411d..7dc411d 100644
--- a/test/cdec_hg_to_json/in
+++ b/test/cdec-hg-to-json/in
diff --git a/test/cdec_hg_to_json/toy.cdec.ini b/test/cdec-hg-to-json/toy.cdec.ini
index d4a2896..d4a2896 100644
--- a/test/cdec_hg_to_json/toy.cdec.ini
+++ b/test/cdec-hg-to-json/toy.cdec.ini
diff --git a/test/cdec_hg_to_json/toy.grammar b/test/cdec-hg-to-json/toy.grammar
index 382c94f..382c94f 100644
--- a/test/cdec_hg_to_json/toy.grammar
+++ b/test/cdec-hg-to-json/toy.grammar
diff --git a/test/cdec_hg_to_json/toy.in b/test/cdec-hg-to-json/toy.in
index e6df927..e6df927 100644
--- a/test/cdec_hg_to_json/toy.in
+++ b/test/cdec-hg-to-json/toy.in
diff --git a/test/cdec_hg_to_json/toy.weights b/test/cdec-hg-to-json/toy.weights
index 70075b7..70075b7 100644
--- a/test/cdec_hg_to_json/toy.weights
+++ b/test/cdec-hg-to-json/toy.weights
diff --git a/test/cdec_hg_to_json/weights b/test/cdec-hg-to-json/weights
index 7f96f1d..7f96f1d 100644
--- a/test/cdec_hg_to_json/weights
+++ b/test/cdec-hg-to-json/weights
diff --git a/test/kbest_bleu_oracles/debug.kbests b/test/kbest-bleu-oracles/debug.kbests
index 1e9c894..1e9c894 100644
--- a/test/kbest_bleu_oracles/debug.kbests
+++ b/test/kbest-bleu-oracles/debug.kbests
diff --git a/test/kbest_bleu_oracles/debug.refs b/test/kbest-bleu-oracles/debug.refs
index 8e13e46..8e13e46 100644
--- a/test/kbest_bleu_oracles/debug.refs
+++ b/test/kbest-bleu-oracles/debug.refs
diff --git a/test/kbest_bleu_oracles/example.kbests b/test/kbest-bleu-oracles/example.kbests
index 1126f1f..1126f1f 100644
--- a/test/kbest_bleu_oracles/example.kbests
+++ b/test/kbest-bleu-oracles/example.kbests
diff --git a/test/kbest_bleu_oracles/example.refs b/test/kbest-bleu-oracles/example.refs
index 632e27b..632e27b 100644
--- a/test/kbest_bleu_oracles/example.refs
+++ b/test/kbest-bleu-oracles/example.refs
diff --git a/test/kbest_bleu_oracles/example.src b/test/kbest-bleu-oracles/example.src
index f5b910d..f5b910d 100644
--- a/test/kbest_bleu_oracles/example.src
+++ b/test/kbest-bleu-oracles/example.src
diff --git a/test/lin_reg/exptected.txt b/test/lin-reg/exptected.txt
index 13de1fc..13de1fc 100644
--- a/test/lin_reg/exptected.txt
+++ b/test/lin-reg/exptected.txt
diff --git a/test/lin_reg/input.dat b/test/lin-reg/input.dat
index 3d93394..3d93394 100644
--- a/test/lin_reg/input.dat
+++ b/test/lin-reg/input.dat
diff --git a/test/lin_reg/output.dat b/test/lin-reg/output.dat
index 1f4f963..1f4f963 100644
--- a/test/lin_reg/output.dat
+++ b/test/lin-reg/output.dat
diff --git a/test/log_reg/expected.txt b/test/log-reg/expected.txt
index 46a03ef..46a03ef 100644
--- a/test/log_reg/expected.txt
+++ b/test/log-reg/expected.txt
diff --git a/test/log_reg/input.dat b/test/log-reg/input.dat
index eed0ab1..eed0ab1 100644
--- a/test/log_reg/input.dat
+++ b/test/log-reg/input.dat
diff --git a/test/log_reg/output.dat b/test/log-reg/output.dat
index 51283c0..51283c0 100644
--- a/test/log_reg/output.dat
+++ b/test/log-reg/output.dat
diff --git a/to_ascii b/to-ascii
index 10fd1c2..10fd1c2 100755
--- a/to_ascii
+++ b/to-ascii
diff --git a/toks_per_line b/toks-per-line
index 012caac..012caac 100755
--- a/toks_per_line
+++ b/toks-per-line
diff --git a/train_test_split b/train-test-split
index 4d8153a..4d8153a 100755
--- a/train_test_split
+++ b/train-test-split