#ifndef _DTRAIN_SAMPLE_NET_H_ #define _DTRAIN_SAMPLE_NET_H_ #include "kbest.h" #include "score_net_interface.h" namespace dtrain { struct ScoredKbest : public DecoderObserver { const size_t k_; size_t feature_count_, effective_sz_; vector samples_; PerSentenceBleuScorer* scorer_; vector* ref_ngs_; vector* ref_ls_; bool dont_score; ScoredKbest(const size_t k, PerSentenceBleuScorer* scorer) : k_(k), scorer_(scorer), dont_score(false) {} virtual void NotifyTranslationForest(const SentenceMetadata& smeta, Hypergraph* hg) { samples_.clear(); effective_sz_ = feature_count_ = 0; KBest::KBestDerivations, ESentenceTraversal, KBest::FilterUnique, prob_t, EdgeProb> kbest(*hg, k_); for (size_t i = 0; i < k_; ++i) { const KBest::KBestDerivations, ESentenceTraversal, KBest::FilterUnique, prob_t, EdgeProb>::Derivation* d = kbest.LazyKthBest(hg->nodes_.size() - 1, i); if (!d) break; ScoredHyp h; h.w = d->yield; h.f = d->feature_values; h.model = log(d->score); h.rank = i; if (!dont_score) h.gold = scorer_->Score(h.w, *ref_ngs_, *ref_ls_); samples_.push_back(h); effective_sz_++; feature_count_ += h.f.size(); } } vector* GetSamples() { return &samples_; } inline void SetReference(vector& ngs, vector& ls) { ref_ngs_ = &ngs; ref_ls_ = &ls; } inline size_t GetFeatureCount() { return feature_count_; } inline size_t GetSize() { return effective_sz_; } }; } // namespace #endif