Merge branch 'master' of github.com:redpony/cdec

author: Chris Dyer <cdyer@allegro.clab.cs.cmu.edu> 2012-11-18 17:41:32 -0500
committer: Chris Dyer <cdyer@allegro.clab.cs.cmu.edu> 2012-11-18 17:41:32 -0500
commit: 4e8985437a7ac81fac2569b5afc13e5b5c7238ba (patch)
tree: 70c5890befba1842e94d5ccb76b685f7b05a7a51
parent: c3a0f085f678b0186b977c8e97dbc9175676f9bd (diff)
parent: 61ede617e3eaa15e0005965d1da2e462659b0f7d (diff)
2 files changed, 50 insertions, 1 deletions
diff --git a/.travis.yml b/.travis.yml
index cbfd8fb9..f3c418b5 100644
--- a/.travis.yml
+++ b/.travis.yml
@@ -1,3 +1,6 @@
+language: python
+python:
+ - "2.7"
 before_script:
  - sudo apt-get install libboost-program-options-dev
  - sudo apt-get install libboost-serialization-dev
@@ -7,7 +10,12 @@ before_script:
  - sudo apt-get install flex
  - autoreconf -ifv
  - ./configure
-script: make
+script:
+ - make
+ - cd python
+ - python setup.py install
+ - cd ..
 after_script:
  - make check
  - ./tests/run-system-tests.pl
+ - nosetests python/tests
diff --git a/python/tests/test_decoder.py b/python/tests/test_decoder.py
new file mode 100644
index 00000000..a74e6268
--- /dev/null
+++ b/python/tests/test_decoder.py
@@ -0,0 +1,41 @@
+#coding:utf8
+import os
+import gzip
+import cdec
+import unittest
+from nose.tools import assert_almost_equals, assert_equal
+
+weights = os.path.dirname(__file__)+'/../../tests/system_tests/australia/weights'
+ref_weights = {'WordPenalty': -2.844814, 'LanguageModel':  1.0, 'PhraseModel_0': -1.066893, 'PhraseModel_1': -0.752247, 'PhraseModel_2': -0.589793, 'PassThrough': -20.0, 'Glue': 0}
+
+grammar_file = os.path.dirname(__file__)+'/../../tests/system_tests/australia/australia.scfg.gz'
+
+input_sentence = u'澳洲 是 与 北韩 有 邦交 的 少数 国家 之一 。'
+ref_output_sentence = u'australia is have diplomatic relations with north korea one of the few countries .'
+ref_f_tree = u'(S (S (S (S (X 澳洲 是)) (X (X 与 北韩) 有 邦交)) (X 的 少数 国家 之一)) (X 。))'
+ref_e_tree = u'(S (S (S (S (X australia is)) (X have diplomatic relations (X with north korea))) (X one of the few countries)) (X .))'
+ref_fvector = {'PhraseModel_2': 7.082652, 'Glue': 3.0, 'PhraseModel_0': 2.014353, 'PhraseModel_1': 8.591477}
+
+def assert_fvector_equal(vec, ref):
+    vecd = dict(vec)
+    assert_equal(set(vecd.keys()), set(ref.keys()))
+    for k, v in ref.items():
+        assert_almost_equals(vec[k], v, 6)
+
+class TestDecoder(unittest.TestCase):
+    def setUp(self):
+        self.decoder = cdec.Decoder(formalism='scfg')
+        self.decoder.read_weights(weights)
+        with gzip.open(grammar_file) as f:
+            self.grammar = f.read()
+
+    def test_weights(self):
+        assert_fvector_equal(self.decoder.weights, ref_weights)
+
+    def test_translate(self):
+        forest = self.decoder.translate(input_sentence, grammar=self.grammar)
+        assert_equal(forest.viterbi(), ref_output_sentence)
+        f_tree, e_tree = forest.viterbi_trees()
+        assert_equal(f_tree, ref_f_tree)
+        assert_equal(e_tree, ref_e_tree)
+        assert_fvector_equal(forest.viterbi_features(), ref_fvector)
author	Chris Dyer <cdyer@allegro.clab.cs.cmu.edu>	2012-11-18 17:41:32 -0500
committer	Chris Dyer <cdyer@allegro.clab.cs.cmu.edu>	2012-11-18 17:41:32 -0500
commit	4e8985437a7ac81fac2569b5afc13e5b5c7238ba (patch)
tree	70c5890befba1842e94d5ccb76b685f7b05a7a51
parent	c3a0f085f678b0186b977c8e97dbc9175676f9bd (diff)
parent	61ede617e3eaa15e0005965d1da2e462659b0f7d (diff)