diff options
Diffstat (limited to 'tests/system_tests')
32 files changed, 346 insertions, 0 deletions
diff --git a/tests/system_tests/australia-align/australia.scfg.gz b/tests/system_tests/australia-align/australia.scfg.gz Binary files differnew file mode 100644 index 00000000..0cd70f1f --- /dev/null +++ b/tests/system_tests/australia-align/australia.scfg.gz diff --git a/tests/system_tests/australia-align/cdec.ini b/tests/system_tests/australia-align/cdec.ini new file mode 100644 index 00000000..eba98941 --- /dev/null +++ b/tests/system_tests/australia-align/cdec.ini @@ -0,0 +1,3 @@ +formalism=scfg +grammar=australia.scfg.gz +aligner=true diff --git a/tests/system_tests/australia-align/gold.statistics b/tests/system_tests/australia-align/gold.statistics new file mode 100644 index 00000000..8101bd40 --- /dev/null +++ b/tests/system_tests/australia-align/gold.statistics @@ -0,0 +1,8 @@ +-lm_nodes 77 +-lm_edges 244232 +-lm_paths 3.79555e+28 +-lm_trans australia is have diplomatic relations with north korea one of the few countries . +-lm_viterbi -12.7893 +constr_nodes 111 +constr_edges 305 +constr_paths 9899 diff --git a/tests/system_tests/australia-align/gold.stdout b/tests/system_tests/australia-align/gold.stdout new file mode 100644 index 00000000..310ac348 --- /dev/null +++ b/tests/system_tests/australia-align/gold.stdout @@ -0,0 +1 @@ +0-0 1-1 2-11 3-12 3-13 4-7 4-8 5-9 5-10 6-4 7-5 8-6 9-2 9-3 10-14 diff --git a/tests/system_tests/australia-align/input.txt b/tests/system_tests/australia-align/input.txt new file mode 100644 index 00000000..482d3e4b --- /dev/null +++ b/tests/system_tests/australia-align/input.txt @@ -0,0 +1 @@ +澳洲 是 与 北韩 有 邦交 的 少数 国家 之一 。 ||| australia is one of the few countries that has diplomatic relations with north korea . diff --git a/tests/system_tests/australia-align/stderr b/tests/system_tests/australia-align/stderr new file mode 100644 index 00000000..c49e3bd0 --- /dev/null +++ b/tests/system_tests/australia-align/stderr @@ -0,0 +1,48 @@ +cdec v1.0 (c) 2009 by Chris Dyer +Configuration file: cdec.ini +Reading SCFG grammar from australia.scfg.gz + 33737 rules read. +Reading weights from weights +Loaded 7 feature weights +Reading input from input.txt + +INPUT: 澳洲 是 与 北韩 有 邦交 的 少数 国家 之一 。 ||| australia is one of the few ... + id = 0 + Goal category: [S] + ........... + -LM forest (nodes/edges): 77/244232 + -LM forest (paths): 3.79555e+28 + -LM Viterbi: australia is have diplomatic relations with north korea one of the few countries . + -LM Viterbi: -12.7893 + Goal category: [CAT_76] + ............... + Constr. forest (nodes/edges): 111/305 + Constr. forest (paths): 9899 + Constr. VitTree: (CAT_76 (CAT_75 (CAT_73 (CAT_13 (CAT_12 australia is)) (CAT_66 (CAT_55 (CAT_40 one of the few countries) (CAT_5 that has) diplomatic relations) with north korea)) (CAT_11 .))) + 1 0.367526 0 0 0 0 0 0 0 0 0 0 0 0 0 + 0.367526 0.999979 0.100222 0.0997905 0.0210297 0 0 0.00481735 8.02707e-12 0 0 0 0 0 0.0587194 + 0 9.42288e-12 0 8.53331e-07 3.77376e-06 0 0 8.02707e-12 0.0310404 0 0 0.999994 0.947965 0.947965 9.71274e-07 + 0 0 0 0 0 0 0 0 0 0 0 0.947965 1 1 0 + 0 0 7.54036e-06 6.96573e-05 0 0 0 0.742293 0.999244 0 0 0.0310422 0 0 0.000677908 + 0 0 0 0 0 0 0 0 0 1 1 0 0 0 0 + 0 0.02397 0.328274 0.330722 0.961649 0.321117 0.263254 0.257688 0.000755969 0 0 3.82289e-06 0 0 0.0265549 + 0 0 0.130232 0.130232 0.321285 1 0.565141 0 0 0 0 0 0 0 0 + 0 0 0.108129 0.10919 0.260861 0.565141 1 0 0 0 0 0 0 0 2.53515e-12 + 0 0.100047 0.999815 0.996401 0.365844 0.130232 0.108128 0 0 0 0 0 0 0 0.112835 + 0 0.058724 0.112814 0.112464 0.0214041 0 0 0.00590826 0 0 0 0 0 0 1 + + 012345678901234 +0*..............0 +1.*.............1 +2...........*...2 +3............**.3 +4.......**......4 +5.........**....5 +6....*..........6 +7.....*.........7 +8......*........8 +9..**...........9 +0..............*0 + 012345678901234 + +Translation: 1.41218 secs (1 calls) diff --git a/tests/system_tests/australia-align/weights b/tests/system_tests/australia-align/weights new file mode 100644 index 00000000..a280184c --- /dev/null +++ b/tests/system_tests/australia-align/weights @@ -0,0 +1,7 @@ +WordPenalty -2.844814 +LanguageModel 1.0 +PhraseModel_0 -1.066893 +PhraseModel_1 -0.752247 +PhraseModel_2 -0.589793 +PassThrough -20.0 +Glue 0 diff --git a/tests/system_tests/australia/australia.scfg.gz b/tests/system_tests/australia/australia.scfg.gz Binary files differnew file mode 100644 index 00000000..0cd70f1f --- /dev/null +++ b/tests/system_tests/australia/australia.scfg.gz diff --git a/tests/system_tests/australia/cdec.ini b/tests/system_tests/australia/cdec.ini new file mode 100644 index 00000000..dfc3cb20 --- /dev/null +++ b/tests/system_tests/australia/cdec.ini @@ -0,0 +1,2 @@ +formalism=scfg +grammar=australia.scfg.gz diff --git a/tests/system_tests/australia/gold.statistics b/tests/system_tests/australia/gold.statistics new file mode 100644 index 00000000..050d12dd --- /dev/null +++ b/tests/system_tests/australia/gold.statistics @@ -0,0 +1,8 @@ +-lm_nodes 77 +-lm_edges 244232 +-lm_paths 3.79555e+28 +-lm_trans australia is have diplomatic relations with north korea one of the few countries . +-lm_viterbi -12.7893 +constr_nodes 185 +constr_edges 827 +constr_paths 279358 diff --git a/tests/system_tests/australia/gold.stdout b/tests/system_tests/australia/gold.stdout new file mode 100644 index 00000000..e69de29b --- /dev/null +++ b/tests/system_tests/australia/gold.stdout diff --git a/tests/system_tests/australia/input.txt b/tests/system_tests/australia/input.txt new file mode 100644 index 00000000..f14bf535 --- /dev/null +++ b/tests/system_tests/australia/input.txt @@ -0,0 +1 @@ +澳洲 是 与 北韩 有 邦交 的 少数 国家 之一 。 ||| ((('australia',0,1),),(('is',0,1),),(('one',0,1),),(('of',0,1),),(('the',0,4),('a',0,4),('a',0,1),('the',0,1),),(('small',0,1),('tiny',0,1),('miniscule',0,1),('handful',0,2),),(('number',0,1),('group',0,1),),(('of',0,2),),(('few',0,1),),(('countries',0,1),),(('that',0,1),),(('has',0,1),('have',0,1),),(('diplomatic',0,1),),(('relations',0,1),),(('with',0,1),),(('north',0,1),),(('korea',0,1),),(('.',0,1),),) diff --git a/tests/system_tests/australia/stderr b/tests/system_tests/australia/stderr new file mode 100644 index 00000000..c41fb9fb --- /dev/null +++ b/tests/system_tests/australia/stderr @@ -0,0 +1,22 @@ +cdec v1.0 (c) 2009 by Chris Dyer +Configuration file: cdec.ini +Reading SCFG grammar from australia.scfg.gz + 33737 rules read. +Reading weights from weights +Loaded 7 feature weights +Reading input from input.txt + +INPUT: 澳洲 是 与 北韩 有 邦交 的 少数 国家 之一 。 ||| ... + id = 0 + Goal category: [S] + ........... + -LM forest (nodes/edges): 77/244232 + -LM forest (paths): 3.79555e+28 + -LM Viterbi: australia is have diplomatic relations with north korea one of the few countries . + -LM Viterbi: -12.7893 + Goal category: [CAT_76] + .................. + Constr. forest (nodes/edges): 185/827 + Constr. forest (paths): 279358 + Constr. VitTree: (CAT_76 (CAT_75 (CAT_1 (CAT_0 australia)) (CAT_74 is (CAT_31 one of (CAT_20 a few countries)) that (CAT_36 have diplomatic relations (CAT_15 with north korea)) .))) +Translation: 2.69099 secs (1 calls) diff --git a/tests/system_tests/australia/weights b/tests/system_tests/australia/weights new file mode 100644 index 00000000..a280184c --- /dev/null +++ b/tests/system_tests/australia/weights @@ -0,0 +1,7 @@ +WordPenalty -2.844814 +LanguageModel 1.0 +PhraseModel_0 -1.066893 +PhraseModel_1 -0.752247 +PhraseModel_2 -0.589793 +PassThrough -20.0 +Glue 0 diff --git a/tests/system_tests/controlled_synparse/cdec.ini b/tests/system_tests/controlled_synparse/cdec.ini new file mode 100644 index 00000000..b5c7d4d8 --- /dev/null +++ b/tests/system_tests/controlled_synparse/cdec.ini @@ -0,0 +1,3 @@ +formalism=scfg +grammar=scfg.biparse.gz +k_best=100 diff --git a/tests/system_tests/controlled_synparse/gold.statistics b/tests/system_tests/controlled_synparse/gold.statistics new file mode 100644 index 00000000..3885cf94 --- /dev/null +++ b/tests/system_tests/controlled_synparse/gold.statistics @@ -0,0 +1,16 @@ +-lm_nodes 11 +-lm_edges 18 +-lm_paths 18 +-lm_trans a d c b +-lm_trans 0 +constr_nodes 8 +constr_edges 8 +constr_paths 1 +-lm_nodes 11 +-lm_edges 18 +-lm_paths 18 +-lm_trans a d c b +-lm_trans 0 +constr_nodes 12 +constr_edges 14 +constr_paths 3 diff --git a/tests/system_tests/controlled_synparse/gold.stdout b/tests/system_tests/controlled_synparse/gold.stdout new file mode 100644 index 00000000..f3e0ce08 --- /dev/null +++ b/tests/system_tests/controlled_synparse/gold.stdout @@ -0,0 +1,36 @@ +0 ||| c b c d ||| F1bad2=1;F5=1;F6=1;F7=1;Glue=3 +0 ||| c d c b e ||| F1bad2=1;F4=1;F5=1;F7=1;Glue=1 +0 ||| c b c d ||| F1bad2=1;F6=1;F7=1;F9=1;Glue=2 +0 ||| b d c b e ||| F1bad1=1;F4=1;F5=1;F7=1;Glue=1 +0 ||| c b c d ||| F1bad2=1;F3=1;F5=1;F7=1;Glue=1 +0 ||| a d c b e ||| F1=1;F4=1;F5=1;F7=1;Glue=1 +0 ||| b b c d ||| F1bad1=1;F3=1;F5=1;F7=1;Glue=1 +0 ||| c d c b ||| F1bad2=1;F2=1;F5=1;F7=1;Glue=1 +0 ||| a b c d ||| F1=1;F3=1;F5=1;F7=1;Glue=1 +0 ||| b b c d ||| F1bad1=1;F5=1;F6=1;F7=1;Glue=3 +0 ||| b d c b ||| F1bad1=1;F2=1;F5=1;F7=1;Glue=1 +0 ||| a d c b ||| F1=1;F2=1;F5=1;F7=1;Glue=1 +0 ||| b b c d ||| F1bad1=1;F6=1;F7=1;F9=1;Glue=2 +0 ||| c c b d ||| F1bad2=1;F6=1;F7=1;F8=1;Glue=2 +0 ||| a b c d ||| F1=1;F6=1;F7=1;F9=1;Glue=2 +0 ||| a b c d ||| F1=1;F5=1;F6=1;F7=1;Glue=3 +0 ||| b c b d ||| F1bad1=1;F6=1;F7=1;F8=1;Glue=2 +0 ||| a c b d ||| F1=1;F6=1;F7=1;F8=1;Glue=2 +1 ||| c b c d ||| F1bad2=1;F5=1;F6=1;F7=1;Glue=3 +1 ||| c d c b e ||| F1bad2=1;F4=1;F5=1;F7=1;Glue=1 +1 ||| c b c d ||| F1bad2=1;F6=1;F7=1;F9=1;Glue=2 +1 ||| b d c b e ||| F1bad1=1;F4=1;F5=1;F7=1;Glue=1 +1 ||| c b c d ||| F1bad2=1;F3=1;F5=1;F7=1;Glue=1 +1 ||| a d c b e ||| F1=1;F4=1;F5=1;F7=1;Glue=1 +1 ||| b b c d ||| F1bad1=1;F3=1;F5=1;F7=1;Glue=1 +1 ||| c d c b ||| F1bad2=1;F2=1;F5=1;F7=1;Glue=1 +1 ||| a b c d ||| F1=1;F3=1;F5=1;F7=1;Glue=1 +1 ||| b b c d ||| F1bad1=1;F5=1;F6=1;F7=1;Glue=3 +1 ||| b d c b ||| F1bad1=1;F2=1;F5=1;F7=1;Glue=1 +1 ||| a d c b ||| F1=1;F2=1;F5=1;F7=1;Glue=1 +1 ||| b b c d ||| F1bad1=1;F6=1;F7=1;F9=1;Glue=2 +1 ||| c c b d ||| F1bad2=1;F6=1;F7=1;F8=1;Glue=2 +1 ||| a b c d ||| F1=1;F6=1;F7=1;F9=1;Glue=2 +1 ||| a b c d ||| F1=1;F5=1;F6=1;F7=1;Glue=3 +1 ||| b c b d ||| F1bad1=1;F6=1;F7=1;F8=1;Glue=2 +1 ||| a c b d ||| F1=1;F6=1;F7=1;F8=1;Glue=2 diff --git a/tests/system_tests/controlled_synparse/input.txt b/tests/system_tests/controlled_synparse/input.txt new file mode 100644 index 00000000..2dbc09c8 --- /dev/null +++ b/tests/system_tests/controlled_synparse/input.txt @@ -0,0 +1,2 @@ +A B C D ||| a d c b +A B C D ||| a b c d diff --git a/tests/system_tests/controlled_synparse/scfg.biparse.gz b/tests/system_tests/controlled_synparse/scfg.biparse.gz Binary files differnew file mode 100644 index 00000000..aaf1c41d --- /dev/null +++ b/tests/system_tests/controlled_synparse/scfg.biparse.gz diff --git a/tests/system_tests/ftrans/cdec.ini b/tests/system_tests/ftrans/cdec.ini new file mode 100644 index 00000000..e8e004d6 --- /dev/null +++ b/tests/system_tests/ftrans/cdec.ini @@ -0,0 +1,3 @@ +formalism=fst +k_best=1000 +grammar=ftrans.pt diff --git a/tests/system_tests/ftrans/ftrans.pt b/tests/system_tests/ftrans/ftrans.pt new file mode 100644 index 00000000..7e8c6f59 --- /dev/null +++ b/tests/system_tests/ftrans/ftrans.pt @@ -0,0 +1,4 @@ +b ||| B ||| F1=1 OtherFeat=1 +c ||| C ||| F2=0.2 +b c ||| BC ||| F3=0.4 +c b ||| CB ||| F4=1 diff --git a/tests/system_tests/ftrans/gold.statistics b/tests/system_tests/ftrans/gold.statistics new file mode 100644 index 00000000..40cdfd4c --- /dev/null +++ b/tests/system_tests/ftrans/gold.statistics @@ -0,0 +1,5 @@ +-lm_nodes 13 +-lm_edges 16 +-lm_paths 4 +-lm_trans CB +-lm_viterbi 101 diff --git a/tests/system_tests/ftrans/gold.stdout b/tests/system_tests/ftrans/gold.stdout new file mode 100644 index 00000000..25c615d1 --- /dev/null +++ b/tests/system_tests/ftrans/gold.stdout @@ -0,0 +1,4 @@ +0 ||| CB ||| F4=1;Inv=1 +0 ||| BC ||| F3=0.4;Mono=1 +0 ||| B C ||| F1=1;OtherFeat=1;F2=0.2;Mono=1 +0 ||| C B ||| F1=1;OtherFeat=1;F2=0.2;Inv=1 diff --git a/tests/system_tests/ftrans/input.cfg b/tests/system_tests/ftrans/input.cfg new file mode 100644 index 00000000..b602c1cb --- /dev/null +++ b/tests/system_tests/ftrans/input.cfg @@ -0,0 +1,5 @@ +[S] ||| [A] +[A] ||| [B] [C] ||| Mono=1 +[A] ||| [C] [B] ||| Inv=1 +[B] ||| b +[C] ||| c diff --git a/tests/system_tests/ftrans/input.txt b/tests/system_tests/ftrans/input.txt new file mode 100644 index 00000000..aa37b2e7 --- /dev/null +++ b/tests/system_tests/ftrans/input.txt @@ -0,0 +1 @@ +{"rules":[1,"[B] ||| b ||| b",2,"[C] ||| c ||| c",3,"[A] ||| [B,1] [C,2] ||| [1] [2] ||| Mono=1",4,"[A] ||| [C,1] [B,2] ||| [1] [2] ||| Inv=1",5,"[S] ||| [A,1] ||| [1]"],"features":["Mono","Inv"],"edges":[{"tail":[],"feats":[],"rule":1}],"node":{"in_edges":[0],"cat":"B"},"edges":[{"tail":[],"feats":[],"rule":2}],"node":{"in_edges":[1],"cat":"C"},"edges":[{"tail":[0,1],"feats":[0,1],"rule":3},{"tail":[1,0],"feats":[1,1],"rule":4}],"node":{"in_edges":[2,3],"cat":"A"},"edges":[{"tail":[2],"feats":[],"rule":5}],"node":{"in_edges":[4],"cat":"S"}} diff --git a/tests/system_tests/ftrans/weights b/tests/system_tests/ftrans/weights new file mode 100644 index 00000000..89d3a6d3 --- /dev/null +++ b/tests/system_tests/ftrans/weights @@ -0,0 +1,5 @@ +F1 1 +F3 10 +F4 100 +Mono 2 +Inv 1 diff --git a/tests/system_tests/unsup-align/cdec.ini b/tests/system_tests/unsup-align/cdec.ini new file mode 100644 index 00000000..4016a201 --- /dev/null +++ b/tests/system_tests/unsup-align/cdec.ini @@ -0,0 +1,6 @@ +aligner=true +grammar=unsup-align.lex-grammar +cubepruning_pop_limit=1000000 +formalism=lexcrf +feature_function=RelativeSentencePosition +feature_function=MarkovJump diff --git a/tests/system_tests/unsup-align/gold.statistics b/tests/system_tests/unsup-align/gold.statistics new file mode 100644 index 00000000..afc49bfc --- /dev/null +++ b/tests/system_tests/unsup-align/gold.statistics @@ -0,0 +1,96 @@ +-lm_nodes 2 +-lm_edges 3 +-lm_paths 2 +-lm_trans blue +-lm_trans 0.4528 ++lm_nodes 2 ++lm_edges 3 ++lm_paths 2 ++lm_trans blue +constr_nodes 3 +constr_edges 3 +constr_paths 1 +-lm_nodes 2 +-lm_edges 4 +-lm_paths 3 +-lm_trans house +-lm_trans 0.673643 ++lm_nodes 2 ++lm_edges 4 ++lm_paths 3 ++lm_trans house +constr_nodes 3 +constr_edges 3 +constr_paths 1 +-lm_nodes 4 +-lm_edges 16 +-lm_paths 49 +-lm_trans the the +-lm_viterbi 1.42559 ++lm_nodes 7 ++lm_edges 20 ++lm_paths 49 ++lm_trans the house +constr_nodes 8 +constr_edges 11 +constr_paths 4 +-lm_nodes 4 +-lm_edges 12 +-lm_paths 25 +-lm_trans house house +-lm_viterbi 1.34729 ++lm_nodes 7 ++lm_edges 16 ++lm_paths 25 ++lm_trans house blue +constr_nodes 8 +constr_edges 11 +constr_paths 4 +-lm_nodes 4 +-lm_edges 14 +-lm_paths 36 +-lm_trans the the +-lm_viterbi 1.42559 ++lm_nodes 7 ++lm_edges 18 ++lm_paths 36 ++lm_trans the the +constr_nodes 8 +constr_edges 11 +constr_paths 4 +-lm_nodes 2 +-lm_edges 5 +-lm_paths 4 +-lm_trans the +-lm_trans 0.712796 ++lm_nodes 2 ++lm_edges 5 ++lm_paths 4 ++lm_trans the +constr_nodes 3 +constr_edges 3 +constr_paths 1 +-lm_nodes 4 +-lm_edges 14 +-lm_paths 36 +-lm_trans the the +-lm_viterbi 1.42559 ++lm_nodes 7 ++lm_edges 18 ++lm_paths 36 ++lm_trans the the +constr_nodes 8 +constr_edges 11 +constr_paths 4 +-lm_nodes 4 +-lm_edges 10 +-lm_paths 16 +-lm_trans thet thet +-lm_trans 0 ++lm_nodes 7 ++lm_edges 14 ++lm_paths 16 ++lm_trans end thet +constr_nodes 8 +constr_edges 11 +constr_paths 4 diff --git a/tests/system_tests/unsup-align/gold.stdout b/tests/system_tests/unsup-align/gold.stdout new file mode 100644 index 00000000..b94ab862 --- /dev/null +++ b/tests/system_tests/unsup-align/gold.stdout @@ -0,0 +1,8 @@ +0-0 +0-0 +0-0 1-1 +0-1 1-0 +0-0 1-1 +0-0 +0-0 1-1 +0-0 1-1 diff --git a/tests/system_tests/unsup-align/input.txt b/tests/system_tests/unsup-align/input.txt new file mode 100644 index 00000000..b97f81cf --- /dev/null +++ b/tests/system_tests/unsup-align/input.txt @@ -0,0 +1,8 @@ +bleue ||| blue +maison ||| house +la maison ||| the house +maison bleue ||| blue house +la fleur ||| the flower +la ||| the +la bouche ||| the mouth +le fin ||| thet end diff --git a/tests/system_tests/unsup-align/unsup-align.lex-grammar b/tests/system_tests/unsup-align/unsup-align.lex-grammar new file mode 100644 index 00000000..30b1a61a --- /dev/null +++ b/tests/system_tests/unsup-align/unsup-align.lex-grammar @@ -0,0 +1,17 @@ +bleue ||| blue ||| F1000001=1 +bleue ||| house ||| F1000002=1 +bouche ||| the ||| F1000003=1 +bouche ||| mouth ||| F1000004=1 +fin ||| thet ||| F1000005=1 +fin ||| end ||| F1000006=1 +fleur ||| the ||| F1000007=1 +fleur ||| flower ||| F1000008=1 +la ||| the ||| F1000009=1 +la ||| house ||| F1000010=1 +la ||| flower ||| F1000011=1 +la ||| mouth ||| F1000012=1 +le ||| thet ||| F1000013=1 +le ||| end ||| F1000014=1 +maison ||| house ||| F1000015=1 +maison ||| the ||| F1000016=1 +maison ||| blue ||| F1000017=1 diff --git a/tests/system_tests/unsup-align/weights b/tests/system_tests/unsup-align/weights new file mode 100644 index 00000000..7d9012c5 --- /dev/null +++ b/tests/system_tests/unsup-align/weights @@ -0,0 +1,19 @@ +RelativeSentencePosition -0.1 +MarkovJump -0.2 +F1000001 0.45280036748928199 +F1000002 -0.30603801277140658 +F1000003 0.0087200168696079348 +F1000004 0.25201383750998718 +F1000005 0 +F1000006 0 +F1000007 0.0087200038242073886 +F1000008 0.25201333505199081 +F1000009 0.7127956550520711 +F1000010 -0.4803381673023227 +F1000011 -0.42444387021307117 +F1000012 -0.42444295555037082 +F1000013 0 +F1000014 0 +F1000015 0.67364292245615709 +F1000016 -0.38087265233441997 +F1000017 -0.34457059973906817 |