summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorChris Dyer <cdyer@cs.cmu.edu>2011-06-08 00:39:09 -0400
committerChris Dyer <cdyer@cs.cmu.edu>2011-06-08 00:39:09 -0400
commitdc9cd6987abdfc703f50e924fa9e55dc702d5242 (patch)
tree53520110c90fa9e087efed2378ecae80b76404fb
parent925d74ce8a92ec6e73f41a4f0685bf3ca7b865d1 (diff)
external MT evaluator client code. most logic in place, needs to be integrated. actually, the whole evaluation architecture needs to be trashed and rewritten from scratch. what a disaster it is
-rw-r--r--mteval/Makefile.am2
-rw-r--r--mteval/external_scorer.cc150
-rw-r--r--mteval/external_scorer.h35
3 files changed, 186 insertions, 1 deletions
diff --git a/mteval/Makefile.am b/mteval/Makefile.am
index f9277779..95845090 100644
--- a/mteval/Makefile.am
+++ b/mteval/Makefile.am
@@ -10,7 +10,7 @@ endif
noinst_LIBRARIES = libmteval.a
-libmteval_a_SOURCES = ter.cc comb_scorer.cc aer_scorer.cc scorer.cc
+libmteval_a_SOURCES = ter.cc comb_scorer.cc aer_scorer.cc scorer.cc external_scorer.cc
fast_score_SOURCES = fast_score.cc
fast_score_LDADD = libmteval.a $(top_srcdir)/utils/libutils.a -lz
diff --git a/mteval/external_scorer.cc b/mteval/external_scorer.cc
new file mode 100644
index 00000000..4327ce9b
--- /dev/null
+++ b/mteval/external_scorer.cc
@@ -0,0 +1,150 @@
+#include "external_scorer.h"
+
+#include <cstdio> // popen
+#include <cstdlib>
+#include <sstream>
+#include <iostream>
+#include <cassert>
+
+#include "tdict.h"
+
+using namespace std;
+
+ScoreServer::ScoreServer(const string& cmd) : pipe_() {
+ cerr << "Invoking " << cmd << " ..." << endl;
+ pipe_ = popen(cmd.c_str(), "r+");
+ assert(pipe_);
+ string dummy;
+ RequestResponse("EVAL ||| Reference initialization string . ||| Testing initialization string .\n", &dummy);
+ assert(dummy.size() > 0);
+ cerr << "Connection established.\n";
+}
+
+ScoreServer::~ScoreServer() {
+ pclose(pipe_);
+}
+
+double ScoreServer::ComputeScore(const vector<float>& fields) {
+ ostringstream os;
+ os << "EVAL";
+ for (unsigned i = 0; i < fields.size(); ++i)
+ os << ' ' << fields[i];
+ os << endl;
+ string sres;
+ RequestResponse(os.str(), &sres);
+ return strtod(sres.c_str(), NULL);
+}
+
+void ScoreServer::Evaluate(const vector<vector<WordID> >& refs, const vector<WordID>& hyp, vector<float>* fields) {
+ ostringstream os;
+ os << "SCORE";
+ for (unsigned i = 0; i < refs.size(); ++i) {
+ os << " |||";
+ for (unsigned j = 0; j < refs[i].size(); ++j) {
+ os << ' ' << TD::Convert(refs[i][j]);
+ }
+ }
+ os << " |||";
+ for (unsigned i = 0; i < hyp.size(); ++i) {
+ os << ' ' << TD::Convert(hyp[i]);
+ }
+ os << endl;
+ string sres;
+ RequestResponse(os.str(), &sres);
+ istringstream is(sres);
+ double val;
+ fields->clear();
+ while(is >> val) {
+ fields->push_back(val);
+ }
+}
+
+#define MAX_BUF 16000
+
+void ScoreServer::RequestResponse(const string& request, string* response) {
+ fprintf(pipe_, "%s", request.c_str());
+ fflush(pipe_);
+ char buf[MAX_BUF];
+ size_t cr = fread(buf, 1, MAX_BUF, pipe_);
+ if (cr == 0) {
+ cerr << "Read error. Request: " << request << endl;
+ abort();
+ }
+ while (buf[cr-1] != '\n') {
+ size_t n = fread(&buf[cr], 1, MAX_BUF-cr, pipe_);
+ assert(n > 0);
+ cr += n;
+ assert(cr < MAX_BUF);
+ }
+ buf[cr - 1] = 0;
+ *response = buf;
+}
+
+struct ExternalScore : public ScoreBase<ExternalScore> {
+ ExternalScore() : score_server() {}
+ explicit ExternalScore(const ScoreServer* s) : score_server(s), fields() {}
+ ExternalScore(const ScoreServer* s, const vector<float>& f) : score_server(s), fields(f) {}
+ float ComputePartialScore() const { return 0.0;}
+ float ComputeScore() const {
+ // TODO make EVAL call
+ assert(!"not implemented");
+ }
+ void ScoreDetails(string* details) const {
+ ostringstream os;
+ os << "EXT=" << ComputeScore() << " <";
+ for (unsigned i = 0; i < fields.size(); ++i)
+ os << (i ? " " : "") << fields[i];
+ os << '>';
+ *details = os.str();
+ }
+ void PlusPartialEquals(const Score&, int, int, int){
+ assert(!"not implemented"); // no idea
+ }
+ void PlusEquals(const Score& delta, const float scale) {
+ assert(!"not implemented"); // don't even know what this is
+ }
+ void PlusEquals(const Score& delta) {
+ if (static_cast<const ExternalScore&>(delta).score_server) score_server = static_cast<const ExternalScore&>(delta).score_server;
+ if (fields.size() != static_cast<const ExternalScore&>(delta).fields.size())
+ fields.resize(max(fields.size(), static_cast<const ExternalScore&>(delta).fields.size()));
+ for (unsigned i = 0; i < static_cast<const ExternalScore&>(delta).fields.size(); ++i)
+ fields[i] += static_cast<const ExternalScore&>(delta).fields[i];
+ }
+ ScoreP GetZero() const {
+ return ScoreP(new ExternalScore(score_server));
+ }
+ ScoreP GetOne() const {
+ return ScoreP(new ExternalScore(score_server));
+ }
+ void Subtract(const Score& rhs, Score* res) const {
+ static_cast<ExternalScore*>(res)->score_server = score_server;
+ vector<float>& rf = static_cast<ExternalScore*>(res)->fields;
+ rf.resize(max(fields.size(), static_cast<const ExternalScore&>(rhs).fields.size()));
+ for (unsigned i = 0; i < rf.size(); ++i) {
+ rf[i] = (i < fields.size() ? fields[i] : 0.0f) -
+ (i < static_cast<const ExternalScore&>(rhs).fields.size() ? static_cast<const ExternalScore&>(rhs).fields[i] : 0.0f);
+ }
+ }
+ void Encode(string* out) const {
+ ostringstream os;
+ }
+ bool IsAdditiveIdentity() const {
+ for (int i = 0; i < fields.size(); ++i)
+ if (fields[i]) return false;
+ return true;
+ }
+
+ const ScoreServer* score_server;
+ vector<float> fields;
+};
+
+ScoreP ExternalSentenceScorer::ScoreCandidate(const Sentence& hyp) const {
+ ExternalScore* res = new ExternalScore(eval_server);
+ eval_server->Evaluate(refs, hyp, &res->fields);
+ return ScoreP(res);
+}
+
+ScoreP ExternalSentenceScorer::ScoreCCandidate(const Sentence& hyp) const {
+ assert(!"not implemented");
+}
+
diff --git a/mteval/external_scorer.h b/mteval/external_scorer.h
new file mode 100644
index 00000000..a2c91960
--- /dev/null
+++ b/mteval/external_scorer.h
@@ -0,0 +1,35 @@
+#ifndef _EXTERNAL_SCORER_H_
+#define _EXTERNAL_SCORER_H_
+
+#include <vector>
+#include <cstdio>
+
+#include "scorer.h"
+
+class ScoreServer {
+ public:
+ explicit ScoreServer(const std::string& cmd);
+ virtual ~ScoreServer();
+
+ double ComputeScore(const std::vector<float>& fields);
+ void Evaluate(const std::vector<std::vector<WordID> >& refs, const std::vector<WordID>& hyp, std::vector<float>* fields);
+
+ private:
+ void RequestResponse(const std::string& request, std::string* response);
+ FILE* pipe_;
+};
+
+class ExternalSentenceScorer : public SentenceScorer {
+ public:
+ virtual ScoreP ScoreCandidate(const Sentence& hyp) const = 0;
+ virtual ScoreP ScoreCCandidate(const Sentence& hyp) const =0;
+ protected:
+ ScoreServer* eval_server;
+};
+
+class METEORServer : public ScoreServer {
+ public:
+ METEORServer() : ScoreServer("java -Xmx1024m -jar meteor-1.3.jar - - -mira -lower") {}
+};
+
+#endif