summary | refs | log | tree | commit | diff
path: root/gi/scfg/abc/scfg.cpp
diff options
context:
space:
mode:
author linh.kitty <linh.kitty@ec762483-ff6d-05da-a07a-a48fb63a330f> 2010-07-16 20:34:09 +0000
committer linh.kitty <linh.kitty@ec762483-ff6d-05da-a07a-a48fb63a330f> 2010-07-16 20:34:09 +0000
commit 1c47931c5669099899e2d2667f87e191e7aa2dbd (patch)
tree f31833bd02be45dbfdd6315e331b4c52e1fa8b69 /gi/scfg/abc/scfg.cpp
parent fd8d56e7b04f956dbb036a21e3ba5f33eb183cbc (diff)
add
git-svn-id: https://ws10smt.googlecode.com/svn/trunk@291 ec762483-ff6d-05da-a07a-a48fb63a330f
Diffstat (limited to 'gi/scfg/abc/scfg.cpp')
-rw-r--r-- gi/scfg/abc/scfg.cpp | 6
1 files changed, 6 insertions, 0 deletions
diff --git a/gi/scfg/abc/scfg.cpp b/gi/scfg/abc/scfg.cpp
index b3dbad34..1e59fb4a 100644
--- a/gi/scfg/abc/scfg.cpp
+++ b/gi/scfg/abc/scfg.cpp
@@ -145,6 +145,7 @@ int main(int argc, char** argv){
}
cerr<<"get parametters\n\n\n";
+
string grammar_file = params.asString("grammar_file", "./grammar.pr");
string input_file = params.asString("input_file", "parallel_corpora");
@@ -186,6 +187,7 @@ int main(int argc, char** argv){
Hypergraph hg;
int data_size = src_corpus.size();
+ int cnt_unparsed =0;
for (int i =0; i <split_iters; i++){
cerr<<"Split Nonterminals, iteration "<<(i+1)<<endl;
@@ -208,13 +210,17 @@ int main(int argc, char** argv){
if (! parseSentencePair(goal_sym, src, tgt, g, hg) ){
cerr<<"target sentence is not parsed by the grammar!\n";
//return 1;
+ cnt_unparsed++;
continue;
}
+
cerr<<"update edge posterior prob"<<endl;
boost::static_pointer_cast<aGrammar>(g)->UpdateHgProsteriorProb(hg);
hg.clear();
+ if (k%1000 ==0 ) cerr<<"sentences "<<k<<endl;
}
+ cerr<<"cnt_unparased="<<cnt_unparsed<<endl;
boost::static_pointer_cast<aGrammar>(g)->UpdateScore();
}
boost::static_pointer_cast<aGrammar>(g)->PrintAllRules(output_file+".e" + itos(i+1));