summaryrefslogtreecommitdiff
path: root/mteval/scorer.h
diff options
context:
space:
mode:
authorredpony <redpony@ec762483-ff6d-05da-a07a-a48fb63a330f>2010-08-11 02:37:10 +0000
committerredpony <redpony@ec762483-ff6d-05da-a07a-a48fb63a330f>2010-08-11 02:37:10 +0000
commita53461650fbdcd3cfe7543d28af9647ac3e5e47e (patch)
treee812756c733b34f9c16894265204acfa9f9998a9 /mteval/scorer.h
parent19b59489bb600f438ad96f04ec5d5c5b6616c9c2 (diff)
major refactor, break bad circular deps
git-svn-id: https://ws10smt.googlecode.com/svn/trunk@509 ec762483-ff6d-05da-a07a-a48fb63a330f
Diffstat (limited to 'mteval/scorer.h')
-rw-r--r--mteval/scorer.h110
1 files changed, 110 insertions, 0 deletions
diff --git a/mteval/scorer.h b/mteval/scorer.h
new file mode 100644
index 00000000..f18c8c7f
--- /dev/null
+++ b/mteval/scorer.h
@@ -0,0 +1,110 @@
+#ifndef SCORER_H_
+#define SCORER_H_
+#include <vector>
+#include <string>
+#include <boost/shared_ptr.hpp>
+//TODO: use intrusive shared_ptr in Score (because there are many of them on ErrorSurfaces)
+#include "wordid.h"
+#include "intrusive_refcount.hpp"
+
+class Score;
+class SentenceScorer;
+typedef boost::intrusive_ptr<Score> ScoreP;
+typedef boost::shared_ptr<SentenceScorer> ScorerP;
+
+class ViterbiEnvelope;
+class ErrorSurface;
+class Hypergraph; // needed for alignment
+
+//TODO: BLEU N (N separate arg, not part of enum)?
+enum ScoreType { IBM_BLEU, NIST_BLEU, Koehn_BLEU, TER, BLEU_minus_TER_over_2, SER, AER, IBM_BLEU_3 };
+ScoreType ScoreTypeFromString(const std::string& st);
+std::string StringFromScoreType(ScoreType st);
+
+class Score : public boost::intrusive_refcount<Score> {
+ public:
+ virtual ~Score();
+ virtual float ComputeScore() const = 0;
+ virtual float ComputePartialScore() const =0;
+ virtual void ScoreDetails(std::string* details) const = 0;
+ std::string ScoreDetails() {
+ std::string d;
+ ScoreDetails(&d);
+ return d;
+ }
+ virtual void TimesEquals(float scale); // only for bleu; for mira oracle
+ /// same as rhs.TimesEquals(scale);PlusEquals(rhs) except doesn't modify rhs.
+ virtual void PlusEquals(const Score& rhs, const float scale) = 0;
+ virtual void PlusEquals(const Score& rhs) = 0;
+ virtual void PlusPartialEquals(const Score& rhs, int oracle_e_cover, int oracle_f_cover, int src_len) = 0;
+ virtual void Subtract(const Score& rhs, Score *res) const = 0;
+ virtual ScoreP GetZero() const = 0;
+ virtual ScoreP GetOne() const = 0;
+ virtual bool IsAdditiveIdentity() const = 0; // returns true if adding this delta
+ // to another score results in no score change
+ // under any circumstances
+ virtual void Encode(std::string* out) const = 0;
+ static ScoreP GetZero(ScoreType type);
+ static ScoreP GetOne(ScoreType type);
+ virtual ScoreP Clone() const = 0;
+protected:
+ Score() { } // we define these explicitly because refcount is noncopyable
+ Score(Score const&) { }
+};
+
+//TODO: make sure default copy ctors for score types do what we want.
+template <class Derived>
+struct ScoreBase : public Score {
+ ScoreP Clone() const {
+ return ScoreP(new Derived(dynamic_cast<Derived const&>(*this)));
+ }
+};
+
+class SentenceScorer {
+ public:
+ typedef std::vector<WordID> Sentence;
+ typedef std::vector<Sentence> Sentences;
+ std::string desc;
+ Sentences refs;
+ SentenceScorer(std::string desc="SentenceScorer_unknown", Sentences const& refs=Sentences()) : desc(desc),refs(refs) { }
+ std::string verbose_desc() const;
+ virtual float ComputeRefLength(const Sentence& hyp) const; // default: avg of refs.length
+ virtual ~SentenceScorer();
+ virtual ScoreP GetOne() const;
+ virtual ScoreP GetZero() const;
+ virtual ScoreP ScoreCandidate(const Sentence& hyp) const = 0;
+ virtual ScoreP ScoreCCandidate(const Sentence& hyp) const =0;
+ virtual const std::string* GetSource() const;
+ static ScoreP CreateScoreFromString(const ScoreType type, const std::string& in);
+ static ScorerP CreateSentenceScorer(const ScoreType type,
+ const std::vector<Sentence >& refs,
+ const std::string& src = "");
+};
+
+//TODO: should be able to GetOne GetZero without supplying sentence (just type)
+class DocScorer {
+ public:
+ ~DocScorer();
+ DocScorer() { }
+ void Init(const ScoreType type,
+ const std::vector<std::string>& ref_files,
+ const std::string& src_file = "",
+ bool verbose=false
+ );
+ DocScorer(const ScoreType type,
+ const std::vector<std::string>& ref_files,
+ const std::string& src_file = "",
+ bool verbose=false
+ )
+ {
+ Init(type,ref_files,src_file,verbose);
+ }
+
+ int size() const { return scorers_.size(); }
+ ScorerP operator[](size_t i) const { return scorers_[i]; }
+ private:
+ std::vector<ScorerP> scorers_;
+};
+
+
+#endif