diff options
author | vladimir.eidelman <vladimir.eidelman@ec762483-ff6d-05da-a07a-a48fb63a330f> | 2010-09-12 19:54:11 +0000 |
---|---|---|
committer | vladimir.eidelman <vladimir.eidelman@ec762483-ff6d-05da-a07a-a48fb63a330f> | 2010-09-12 19:54:11 +0000 |
commit | aade3dd1721837b2fadf33bcb2c0a8a59529d685 (patch) | |
tree | 1e450271901569d551ba6c6e56a35814b68ff0f7 /tests/system_tests | |
parent | 0f15af337a3544ea59a70a65daa912e6fbba42b3 (diff) |
tagger example
git-svn-id: https://ws10smt.googlecode.com/svn/trunk@644 ec762483-ff6d-05da-a07a-a48fb63a330f
Diffstat (limited to 'tests/system_tests')
-rw-r--r-- | tests/system_tests/tagger/TRAIN | 1 | ||||
-rw-r--r-- | tests/system_tests/tagger/cdec.ini | 5 | ||||
-rw-r--r-- | tests/system_tests/tagger/input.txt | 2 | ||||
-rw-r--r-- | tests/system_tests/tagger/pos.grammar | 4 | ||||
-rw-r--r-- | tests/system_tests/tagger/tagset | 1 | ||||
-rw-r--r-- | tests/system_tests/tagger/weights | 2 |
6 files changed, 15 insertions, 0 deletions
```diff
diff --git a/tests/system_tests/tagger/TRAIN b/tests/system_tests/tagger/TRAIN
new file mode 100644
index 00000000..c4bb433a
--- /dev/null
+++ b/tests/system_tests/tagger/TRAIN
@@ -0,0 +1 @@
+../../../training/cluster-ptrain.pl cdec.ini pos.grammar weights --gaussian_prior --sigma_squared 1 &> training.log &
\ No newline at end of file
diff --git a/tests/system_tests/tagger/cdec.ini b/tests/system_tests/tagger/cdec.ini
new file mode 100644
index 00000000..15cc930d
--- /dev/null
+++ b/tests/system_tests/tagger/cdec.ini
@@ -0,0 +1,5 @@
+formalism=tagger
+feature_function=Tagger_BigramIdentity
+feature_function=LexicalPairIdentity
+intersection_strategy=full
+tagger_tagset=tagset
\ No newline at end of file
diff --git a/tests/system_tests/tagger/input.txt b/tests/system_tests/tagger/input.txt
new file mode 100644
index 00000000..fe5cb58d
--- /dev/null
+++ b/tests/system_tests/tagger/input.txt
@@ -0,0 +1,2 @@
+A B C
+A
\ No newline at end of file
diff --git a/tests/system_tests/tagger/pos.grammar b/tests/system_tests/tagger/pos.grammar
new file mode 100644
index 00000000..3415854b
--- /dev/null
+++ b/tests/system_tests/tagger/pos.grammar
@@ -0,0 +1,4 @@
+[X] ||| A B C ||| a b c
+[X] ||| A ||| a
+[X] ||| A ||| b
+[X] ||| B C ||| b c
\ No newline at end of file
diff --git a/tests/system_tests/tagger/tagset b/tests/system_tests/tagger/tagset
new file mode 100644
index 00000000..3774da60
--- /dev/null
+++ b/tests/system_tests/tagger/tagset
@@ -0,0 +1 @@
+a b c
diff --git a/tests/system_tests/tagger/weights b/tests/system_tests/tagger/weights
new file mode 100644
index 00000000..ec8358f3
--- /dev/null
+++ b/tests/system_tests/tagger/weights
@@ -0,0 +1,2 @@
+Tagger_BigramIdentity 1
+LexicalPairIdentity 1
\ No newline at end of file
```