// path: root/decoder/cfg_options.h
// blob: 7b59c05c0bc12e4f744826df2b52b286e0f1f1c3
#ifndef CFG_OPTIONS_H
#define CFG_OPTIONS_H

#include "filelib.h"
#include "hg_cfg.h"
#include "cfg_format.h"
#include "cfg_binarize.h"
//#include "program_options.h"

// Bundle of command-line options controlling CFG output (printing, rule
// de-duplication and binarization), plus the helpers that act on them.
struct CFGOptions {
  CFGFormat format;      // print format; also supplies features / goal_nt() for the source CFG
  CFGBinarize binarize;  // options handed to CFG::Binarize
  // Output file names; an empty name means "do not write that output".
  std::string out,source_out,unbin_out;
  bool uniq;             // cfg_uniq: de-duplicate rules before binarizing

  // Resets every option (including the nested format/binarize ones) to its default:
  // no output files, no rule de-duplication.
  void set_defaults() {
    format.set_defaults();
    binarize.set_defaults();
    out=source_out=unbin_out="";
    uniq=false;
  }

  CFGOptions() { set_defaults(); }

  // Registers the CFG options on *opts, then lets binarize and format register theirs.
  template <class Opts> // template to support both printable_opts and boost nonprintable
  void AddOptions(Opts *opts) {
    opts->add_options()
      ("cfg_output", defaulted_value(&out),"write final target CFG (before FSA rescoring) to this file")
      ("source_cfg_output", defaulted_value(&source_out),"write source CFG (after prelm-scoring, prelm-prune) to this file")
      ("cfg_unbin_output", defaulted_value(&unbin_out),"write pre-binarization CFG to this file") //TODO:
      ("cfg_uniq", defaulted_value(&uniq),"in case of duplicate rules, keep only the one with highest prob")

    ;
    binarize.AddOptions(opts);
    format.AddOptions(opts);
  }

  // Delegates validation to the nested option groups.
  void Validate() {
    format.Validate();
    binarize.Validate();
  }

  // If source_cfg_output was given, builds a CFG from hg and prints it to that file.
  // Does nothing when source_out is empty.
  void maybe_output_source(Hypergraph const& hg) {
    if (source_out.empty()) return;
    std::cerr<<"Printing source CFG to "<<source_out<<": "<<format<<'\n';
    WriteFile o(source_out);
    CFG cfg(hg,false,format.features,format.goal_nt());
    cfg.Print(o.get(),format);
  }

  // executes all options except source_cfg_output, building target hgcfg
  //
  // No-op unless cfg_output or cfg_unbin_output was requested. Otherwise, in order:
  // print the pre-binarization CFG (if unbin_out is set), de-duplicate rules
  // (if cfg_uniq is set), binarize, and print the final CFG (if out is set).
  void prepare(HgCFG &hgcfg) {
    if (out.empty() && unbin_out.empty()) return;
    CFG &cfg=hgcfg.GetCFG();
    maybe_print(cfg,unbin_out);
    maybe_uniq(hgcfg);
    maybe_binarize(hgcfg);
    maybe_print(cfg,out,"");
  }

  // Heading for this option group.
  char const* description() const {
    return "CFG output options";
  }

  // Prints cfg to the file named cfg_output using `format`; does nothing when the
  // name is empty. `desc` is spliced into the progress message on stderr
  // ("Printing target<desc> CFG to ...").
  // The name is taken by const reference so no string copy is made per call.
  void maybe_print(CFG &cfg,std::string const& cfg_output,char const* desc=" unbinarized") {
    if (cfg_output.empty()) return;
    WriteFile o(cfg_output);
    std::cerr<<"Printing target"<<desc<<" CFG to "<<cfg_output<<": "<<format<<'\n';
    cfg.Print(o.get(),format);
  }

  // De-duplicates the rules of hgcfg's CFG, at most once per HgCFG, and only when
  // the cfg_uniq option is set. (The flag used to be ignored here, so rules were
  // de-duplicated even when the user had not asked for it.)
  void maybe_uniq(HgCFG &hgcfg) {
    if (!uniq || hgcfg.uniqed) return;
    hgcfg.GetCFG().UniqRules();
    hgcfg.uniqed=true;
  }

  // Binarizes hgcfg's CFG with the `binarize` options, at most once per HgCFG.
  void maybe_binarize(HgCFG &hgcfg) {
    if (hgcfg.binarized) return;
    hgcfg.GetCFG().Binarize(binarize);
    hgcfg.binarized=true;
  }
};


#endif