diff options
Diffstat (limited to 'rst_parser/dep_training.h')
-rw-r--r-- | rst_parser/dep_training.h | 19 |
1 files changed, 19 insertions, 0 deletions
diff --git a/rst_parser/dep_training.h b/rst_parser/dep_training.h new file mode 100644 index 00000000..3eeee22e --- /dev/null +++ b/rst_parser/dep_training.h @@ -0,0 +1,19 @@ +#ifndef _DEP_TRAINING_H_ +#define _DEP_TRAINING_H_ + +#include <iostream> +#include <string> +#include <vector> +#include "arc_factored.h" +#include "weights.h" + +struct TrainingInstance { + TaggedSentence ts; + EdgeSubset tree; + SparseVector<weight_t> features; + // reads a "Jsent" formatted dependency file + static bool ReadInstance(std::istream* in, TrainingInstance* instance); // returns false at EOF + static void ReadTrainingCorpus(const std::string& fname, std::vector<TrainingInstance>* corpus, int rank = 0, int size = 1); +}; + +#endif |