summaryrefslogtreecommitdiff
path: root/dtrain/ksampler.h
blob: ac88b643eaaeadc56166f34f90ae0d926dc5e5c8 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
#ifndef _DTRAIN_KSAMPLER_H_
#define _DTRAIN_KSAMPLER_H_

#include <cmath>
#include <cstddef>
#include <vector>

#include "hgsampler.h"
#include "kbest.h" // cdec
#include "sampler.h"

namespace dtrain
{


/*
 * KSampler
 *
 */
struct KSampler : public HypoSampler
{
  const size_t k_;
  Samples s;
  MT19937* rng;

  explicit KSampler( const size_t k, MT19937* prng ) :
    k_(k), rng(prng) {}

  virtual void
  NotifyTranslationForest( const SentenceMetadata& smeta, Hypergraph* hg )
  {
    Sample( *hg );
  }

  Samples* GetSamples() { return &s; }

  void Sample( const Hypergraph& forest ) {
    s.sents.clear();
    s.feats.clear();
    s.model_scores.clear();
    s.scores.clear();
    std::vector<HypergraphSampler::Hypothesis> samples;
    HypergraphSampler::sample_hypotheses(forest, k_, rng, &samples);
    for ( size_t i = 0; i < k_; ++i ) {
      s.sents.push_back( samples[i].words );
      s.feats.push_back( samples[i].fmap );
      s.model_scores.push_back( log(samples[i].model_score) );
    }
  }
};


} // namespace

#endif