diff options
author | Chris Dyer <cdyer@cs.cmu.edu> | 2011-10-12 14:57:15 +0100 |
---|---|---|
committer | Chris Dyer <cdyer@cs.cmu.edu> | 2011-10-12 14:57:15 +0100 |
commit | ee84ab027c0be54800cac0c9bff62dd097354f6d (patch) | |
tree | 30344f4307d3efbafb3276807a6879c4eeeab173 /gi/pf/corpus.h | |
parent | a32cd0131c6325e364c82e5f6bbefc03b61e437f (diff) |
model length properly, clean up
Diffstat (limited to 'gi/pf/corpus.h')
-rw-r--r-- | gi/pf/corpus.h | 19 |
1 files changed, 19 insertions, 0 deletions
diff --git a/gi/pf/corpus.h b/gi/pf/corpus.h new file mode 100644 index 00000000..e7febdb7 --- /dev/null +++ b/gi/pf/corpus.h @@ -0,0 +1,19 @@ +#ifndef _CORPUS_H_ +#define _CORPUS_H_ + +#include <string> +#include <vector> +#include <set> +#include "wordid.h" + +namespace corpus { + +void ReadParallelCorpus(const std::string& filename, + std::vector<std::vector<WordID> >* f, + std::vector<std::vector<WordID> >* e, + std::set<WordID>* vocab_f, + std::set<WordID>* vocab_e); + +} + +#endif |