summaryrefslogtreecommitdiff
path: root/gi/pf/pyp_tm.h
blob: 2b076a25fee1df59f86b20e93a23181cb5175063 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
#ifndef PYP_LEX_TRANS
#define PYP_LEX_TRANS

#include <vector>
#include "wordid.h"
#include "prob.h"
#include "sampler.h"
#include "freqdict.h"
#include "poisson_uniform_word_model.h"

struct FreqBinner;
template <typename T, class B> struct ConditionalPYPWordModel;

struct PYPLexicalTranslation {
  explicit PYPLexicalTranslation(const std::vector<std::vector<WordID> >& lets,
                                 const unsigned vocab_size,
                                 const unsigned num_letters);

  prob_t Likelihood() const;

  void ResampleHyperparameters(MT19937* rng);
  prob_t Prob(WordID src, WordID trg) const;  // return p(trg | src)
  void Summary() const;
  void Increment(WordID src, WordID trg, MT19937* rng);
  void Decrement(WordID src, WordID trg, MT19937* rng);
  unsigned UniqueConditioningContexts() const;

 private:
  const std::vector<std::vector<WordID> >& letters;   // spelling dictionary
  PoissonUniformWordModel base;  // "generator" of English types
  ConditionalPYPWordModel<PoissonUniformWordModel, FreqBinner>* tmodel;  // translation distributions
                      // (model English word | French word)
  const WordID kX;
};

#endif