1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
|
#include "cfg.h"
#include "hg.h"
#include "cfg_format.h"
#include "cfg_binarize.h"
using namespace std;
void CFG::Binarize(CFGBinarize const& b) {
if (!b.Binarizing()) return;
if (!b.bin_l2r) {
assert(b.bin_l2r);
return;
}
// l2r only so far:
cerr << "Binarizing "<<b<<endl;
//TODO.
}
void CFG::Init(Hypergraph const& hg,bool target_side,bool copy_features,bool push_weights) {
uninit=false;
hg_=&hg;
Hypergraph::NodeProbs np;
goal_inside=hg.ComputeNodeViterbi(&np);
pushed_inside=push_weights ? goal_inside : prob_t(1);
int nn=hg.nodes_.size(),ne=hg.edges_.size();
nts.resize(nn);
goal_nt=nn-1;
rules.resize(ne);
for (int i=0;i<nn;++i) {
nts[i].ruleids=hg.nodes_[i].in_edges_;
hg.SetNodeOrigin(i,nts[i].from);
}
for (int i=0;i<ne;++i) {
Rule &cfgr=rules[i];
Hypergraph::Edge const& e=hg.edges_[i];
TRule const& er=*e.rule_; vector<WordID> const& rule_rhs=target_side?er.e():er.f();
RHS &rhs=cfgr.rhs;
prob_t &crp=cfgr.p;
crp=e.edge_prob_;
cfgr.lhs=e.head_node_;
#if CFG_DEBUG
cfgr.rule=e.rule_;
#endif
if (copy_features) cfgr.f=e.feature_values_;
if (push_weights) crp /=np[e.head_node_];
int nr=rule_rhs.size();
rhs.resize(nr);
for (int j=0;j<nr;++j) {
WordID w=rule_rhs[j];
if (w>0)
rhs[j]=w;
else {
int n=e.tail_nodes_[-w];
if (push_weights) crp*=np[n];
rhs[j]=n;
}
}
}
}
void CFG::Clear() {
rules.clear();
nts.clear();
goal_nt=-1;
hg_=0;
}
void CFG::PrintRule(std::ostream &o,RuleHandle rulei,CFGFormat const& f) const {
Rule const& r=rules[rulei];
f.print_lhs(o,*this,r.lhs);
f.print_rhs(o,*this,r.rhs.begin(),r.rhs.end());
f.print_features(o,r.p,r.f);
#if CFG_DEBUG
o<<f.partsep<<*r.rule;
#endif
}
void CFG::Print(std::ostream &o,CFGFormat const& f) const {
assert(!uninit);
if (!f.goal_nt_name.empty()) {
o << '['<<f.goal_nt_name <<']';
WordID rhs=-goal_nt;
f.print_rhs(o,*this,&rhs,&rhs+1);
if (pushed_inside!=1)
f.print_features(o,pushed_inside);
o<<'\n';
}
for (int i=0;i<nts.size();++i) {
Ruleids const& ntr=nts[i].ruleids;
for (Ruleids::const_iterator j=ntr.begin(),jj=ntr.end();j!=jj;++j) {
PrintRule(o,*j,f);
o<<'\n';
}
}
}
|