diff options
author | graehl <graehl@ec762483-ff6d-05da-a07a-a48fb63a330f> | 2010-07-05 16:01:51 +0000 |
---|---|---|
committer | graehl <graehl@ec762483-ff6d-05da-a07a-a48fb63a330f> | 2010-07-05 16:01:51 +0000 |
commit | 137425bf3baa43e4fa1a7e9b519d41d94276d34c (patch) | |
tree | 1bdec1b1a25495f870d579eea036e70cd9231aee /decoder | |
parent | 8974cd8f215599e27647bd9fa11baa89365e5214 (diff) |
TODO (mostly low priority) notes
git-svn-id: https://ws10smt.googlecode.com/svn/trunk@128 ec762483-ff6d-05da-a07a-a48fb63a330f
Diffstat (limited to 'decoder')
-rw-r--r-- | decoder/ff.cc | 2 | ||||
-rw-r--r-- | decoder/ff_lm.cc | 2 | ||||
-rw-r--r-- | decoder/hg.cc | 2 | ||||
-rw-r--r-- | decoder/scfg_translator.cc | 20 |
4 files changed, 18 insertions, 8 deletions
diff --git a/decoder/ff.cc b/decoder/ff.cc index 61f4f0b6..95bd9665 100644 --- a/decoder/ff.cc +++ b/decoder/ff.cc @@ -1,3 +1,5 @@ +//TODO: 0 size state != rule-local feature, i.e. still may depend on source span loc/context. identify truly rule-local features so if we want they can be added to grammar rules (minor speedup) + #include "ff.h" #include "tdict.h" diff --git a/decoder/ff_lm.cc b/decoder/ff_lm.cc index 66b00448..21c05cf2 100644 --- a/decoder/ff_lm.cc +++ b/decoder/ff_lm.cc @@ -1,3 +1,5 @@ +//TODO: allow features to reorder by heuristic*weight the rules' terminal phrases (or of hyperedges'). if first pass has pruning, then compute over whole ruleset as part of heuristic + #include "ff_lm.h" #include <sstream> diff --git a/decoder/hg.cc b/decoder/hg.cc index 4da0beb3..e57f7807 100644 --- a/decoder/hg.cc +++ b/decoder/hg.cc @@ -1,3 +1,5 @@ +//TODO: lazily generate feature vectors for hyperarcs (because some of them will be pruned). this means 1) storing ref to rule for those features 2) providing ff interface for regenerating its feature vector from hyperedge+states and probably 3) still caching feat. vect on hyperedge once it's been generated. ff would normally just contribute its weighted score and result state, not component features. + #include "hg.h" #include <algorithm> diff --git a/decoder/scfg_translator.cc b/decoder/scfg_translator.cc index c215eea6..866c2721 100644 --- a/decoder/scfg_translator.cc +++ b/decoder/scfg_translator.cc @@ -1,3 +1,7 @@ +//TODO: bottom-up pruning, with actual final models' (appropriately weighted) heuristics and local scores. + +//TODO: grammar heuristic (min cost of reachable rule set) for binarizations (active edges) if we wish to prune those also + #include "translator.h" #include <vector> @@ -26,11 +30,11 @@ struct SCFGTranslatorImpl { g->SetMaxSpan(max_span_limit); g->SetGrammarName(gfiles[i]); grammars.push_back(GrammarPtr(g)); - + } } if (!conf.count("scfg_no_hiero_glue_grammar")) - { + { GlueGrammar* g = new GlueGrammar(goal, default_nt); g->SetGrammarName("GlueGrammar"); grammars.push_back(GrammarPtr(g)); @@ -39,7 +43,7 @@ struct SCFGTranslatorImpl { if (conf.count("scfg_extra_glue_grammar")) { GlueGrammar* g = new GlueGrammar(conf["scfg_extra_glue_grammar"].as<string>()); - g->SetGrammarName("ExtraGlueGrammar"); + g->SetGrammarName("ExtraGlueGrammar"); grammars.push_back(GrammarPtr(g)); cerr << "Adding extra glue grammar" << endl; } @@ -69,7 +73,7 @@ struct SCFGTranslatorImpl { if(printGrammarsUsed){ //Iterate trough grammars we have for this sentence and list them - for (int gi = 0; gi < glist.size(); ++gi) + for (int gi = 0; gi < glist.size(); ++gi) { cerr << "Using grammar::" << glist[gi]->GetGrammarName() << endl; } @@ -96,7 +100,7 @@ bool SCFGTranslator::TranslateImpl(const string& input, SentenceMetadata* smeta, const vector<double>& weights, Hypergraph* minus_lm_forest) { - + return pimpl_->Translate(input, smeta, weights, minus_lm_forest); } @@ -105,10 +109,10 @@ Check for grammar pointer in the sentence markup, for use with sentence specific */ void SCFGTranslator::ProcessMarkupHintsImpl(const map<string, string>& kv) { map<string,string>::const_iterator it = kv.find("grammar"); - - + + if (it == kv.end()) { - usingSentenceGrammar= false; + usingSentenceGrammar= false; return; } //Create sentence specific grammar from specified file name and load grammar into list of grammars |