diff options
author | Paul Baltescu <pauldb89@gmail.com> | 2013-02-14 23:17:15 +0000 |
---|---|---|
committer | Paul Baltescu <pauldb89@gmail.com> | 2013-02-14 23:17:15 +0000 |
commit | 63b30ed9c8510da8c8e2f6a456576424fddacc0e (patch) | |
tree | 1b5278fb5a4480b7f7a965bb6de8f6f9e9c4d333 /extractor/grammar_extractor.h | |
parent | 0a53f7eca74c165b5ce1c238f1999ddf1febea55 (diff) |
Working version of the grammar extractor.
Diffstat (limited to 'extractor/grammar_extractor.h')
-rw-r--r-- | extractor/grammar_extractor.h | 8 |
1 file changed, 7 insertions, 1 deletion
```diff
diff --git a/extractor/grammar_extractor.h b/extractor/grammar_extractor.h
index 243f33cf..5f87faa7 100644
--- a/extractor/grammar_extractor.h
+++ b/extractor/grammar_extractor.h
@@ -32,13 +32,19 @@ class GrammarExtractor {
       bool use_baeza_yates,
       bool require_tight_phrases);
 
+  // For testing only.
+  GrammarExtractor(shared_ptr<Vocabulary> vocabulary,
+                   shared_ptr<HieroCachingRuleFactory> rule_factory);
+
   Grammar GetGrammar(const string& sentence);
 
  private:
+  vector<string> TokenizeSentence(const string& sentence);
+
   vector<int> AnnotateWords(const vector<string>& words);
 
   shared_ptr<Vocabulary> vocabulary;
-  HieroCachingRuleFactory rule_factory;
+  shared_ptr<HieroCachingRuleFactory> rule_factory;
 };
 
 #endif
```