1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
|
#ifndef CFG_OPTIONS_H
#define CFG_OPTIONS_H
#include "hg_cfg.h"
#include "cfg_format.h"
#include "cfg_binarize.h"
//#include "program_options.h"
struct CFGOptions {
CFGFormat format;
CFGBinarize binarize;
std::string out,source_out,unbin_out;
bool uniq;
void set_defaults() {
format.set_defaults();
binarize.set_defaults();
out=source_out=unbin_out="";
uniq=false;
}
CFGOptions() { set_defaults(); }
template <class Opts> // template to support both printable_opts and boost nonprintable
void AddOptions(Opts *opts) {
opts->add_options()
("cfg_output", defaulted_value(&out),"write final target CFG (before FSA rescoring) to this file")
("source_cfg_output", defaulted_value(&source_out),"write source CFG (after prelm-scoring, prelm-prune) to this file")
("cfg_unbin_output", defaulted_value(&unbin_out),"write pre-binarization CFG to this file") //TODO:
("cfg_uniq", defaulted_value(&uniq),"in case of duplicate rules, keep only the one with highest prob")
;
binarize.AddOptions(opts);
format.AddOptions(opts);
}
void Validate() {
format.Validate();
binarize.Validate();
}
void maybe_output_source(Hypergraph const& hg) {
if (source_out.empty()) return;
std::cerr<<"Printing source CFG to "<<source_out<<": "<<format<<'\n';
WriteFile o(source_out);
CFG cfg(hg,false,format.features,format.goal_nt());
cfg.Print(o.get(),format);
}
// executes all options except source_cfg_output, building target hgcfg
void prepare(HgCFG &hgcfg) {
if (out.empty() && unbin_out.empty()) return;
CFG &cfg=hgcfg.GetCFG();
maybe_print(cfg,unbin_out);
maybe_uniq(hgcfg);
maybe_binarize(hgcfg);
maybe_print(cfg,out,"");
}
char const* description() const {
return "CFG output options";
}
void maybe_print(CFG &cfg,std::string cfg_output,char const* desc=" unbinarized") {
if (cfg_output.empty()) return;
WriteFile o(cfg_output);
std::cerr<<"Printing target"<<desc<<" CFG to "<<cfg_output<<": "<<format<<'\n';
cfg.Print(o.get(),format);
}
void maybe_uniq(HgCFG &hgcfg) {
if (hgcfg.uniqed) return;
hgcfg.GetCFG().UniqRules();
hgcfg.uniqed=true;
}
void maybe_binarize(HgCFG &hgcfg) {
if (hgcfg.binarized) return;
hgcfg.GetCFG().Binarize(binarize);
hgcfg.binarized=true;
}
};
#endif
|