summaryrefslogtreecommitdiff
path: root/gi/pf/hpyp_tm.h
blob: af3215badadc7574df208ec01e6cc2e6d701c5e7 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
#ifndef HPYP_LEX_TRANS
#define HPYP_LEX_TRANS

#include <vector>
#include "wordid.h"
#include "prob.h"
#include "sampler.h"
#include "freqdict.h"
#include "poisson_uniform_word_model.h"

struct FreqBinner;
template <class B> struct PYPWordModel;
template <typename T, class B> struct ConditionalPYPWordModel;

struct HPYPLexicalTranslation {
  explicit HPYPLexicalTranslation(const std::vector<std::vector<WordID> >& lets,
                                 const unsigned vocab_size,
                                 const unsigned num_letters);

  prob_t Likelihood() const;

  void ResampleHyperparameters(MT19937* rng);
  prob_t Prob(WordID src, WordID trg) const;  // return p(trg | src)
  void Summary() const;
  void Increment(WordID src, WordID trg, MT19937* rng);
  void Decrement(WordID src, WordID trg, MT19937* rng);
  unsigned UniqueConditioningContexts() const;

 private:
  const std::vector<std::vector<WordID> >& letters;   // spelling dictionary
  PoissonUniformWordModel base;  // "generator" of English types
  PYPWordModel<PoissonUniformWordModel>* up0;  // model English lexicon
  ConditionalPYPWordModel<PYPWordModel<PoissonUniformWordModel>, FreqBinner>* tmodel;  // translation distributions
                      // (model English word | French word)
  const WordID kX;
};

#endif