summary | refs | log | tree | commit | diff
path: root/rst_parser/dep_training.h
diff options
context:
space:
mode:
author: Patrick Simianer <p@simianer.de> 2012-04-23 21:44:02 +0200
committer: Patrick Simianer <p@simianer.de> 2012-04-23 21:44:02 +0200
commit: 1c733723583862a5fcee5352433022008a9dc4e0 (patch)
tree: d4f9a17498d6bc9210e0e3cebbcfc3635736b669 /rst_parser/dep_training.h
parent: d3aa71d1095a5c45c1d3ca3155259e5fe0b58df2 (diff)
parent: 44508c1ad1bf88b1568713317b4a1e0be78804f8 (diff)
Merge remote-tracking branch 'upstream/master'
Conflicts: Makefile.am configure.ac
Diffstat (limited to 'rst_parser/dep_training.h')
-rw-r--r-- rst_parser/dep_training.h 19
1 files changed, 19 insertions, 0 deletions
diff --git a/rst_parser/dep_training.h b/rst_parser/dep_training.h
new file mode 100644
index 00000000..3eeee22e
--- /dev/null
+++ b/rst_parser/dep_training.h
@@ -0,0 +1,19 @@
+#ifndef _DEP_TRAINING_H_
+#define _DEP_TRAINING_H_
+
+#include <iostream>
+#include <string>
+#include <vector>
+#include "arc_factored.h"
+#include "weights.h"
+
+struct TrainingInstance {  // one training example, plus static loaders that read examples from a stream or a named file
+ TaggedSentence ts;  // TaggedSentence is declared outside this header; presumably the tagged input sentence -- TODO confirm
+ EdgeSubset tree;  // EdgeSubset is declared outside this header; presumably the reference dependency tree -- TODO confirm
+ SparseVector<weight_t> features;  // sparse vector with weight_t values; where it gets populated is not visible in this header
+ // Reads a "Jsent" formatted dependency file from *in; presumably one instance per call, stored into *instance (confirm in the implementation).
+ static bool ReadInstance(std::istream* in, TrainingInstance* instance); // returns false at EOF
+ static void ReadTrainingCorpus(const std::string& fname, std::vector<TrainingInstance>* corpus, int rank = 0, int size = 1);  // reads from the file named fname into *corpus; rank/size default to 0/1 and presumably select this process's share of a size-way split -- TODO confirm in the implementation
+};
+
+#endif