diff options
| author | Chris Dyer <cdyer@allegro.clab.cs.cmu.edu> | 2013-04-23 19:35:18 -0400 | 
|---|---|---|
| committer | Chris Dyer <cdyer@allegro.clab.cs.cmu.edu> | 2013-04-23 19:35:18 -0400 | 
| commit | 6d347f1ce078dede3da0e1498f75e357351c6543 (patch) | |
| tree | 8e872b8747c530e741e55e25e9917c1bd8b32c5b /extractor/vocabulary.cc | |
| parent | d11b76def6899790161c47a73018146311356d8b (diff) | |
| parent | 5e9605b65202f4e5fc59843b197d88c4774f0ac8 (diff) | |
merge paul's extractor code
Diffstat (limited to 'extractor/vocabulary.cc')
| -rw-r--r-- | extractor/vocabulary.cc | 37 | 
1 files changed, 37 insertions, 0 deletions
| diff --git a/extractor/vocabulary.cc b/extractor/vocabulary.cc new file mode 100644 index 00000000..15795d1e --- /dev/null +++ b/extractor/vocabulary.cc @@ -0,0 +1,37 @@ +#include "vocabulary.h" + +namespace extractor { + +Vocabulary::~Vocabulary() {} + +int Vocabulary::GetTerminalIndex(const string& word) { +  int word_id = -1; +  #pragma omp critical (vocabulary) +  { +    if (!dictionary.count(word)) { +      word_id = words.size(); +      dictionary[word] = word_id; +      words.push_back(word); +    } else { +      word_id = dictionary[word]; +    } +  } +  return word_id; +} + +int Vocabulary::GetNonterminalIndex(int position) { +  return -position; +} + +bool Vocabulary::IsTerminal(int symbol) { +  return symbol >= 0; +} + +string Vocabulary::GetTerminalValue(int symbol) { +  string word; +  #pragma omp critical (vocabulary) +  word = words[symbol]; +  return word; +} + +} // namespace extractor | 
