1 files changed, 70 insertions, 70 deletions
diff --git a/training/dtrain/dtrain.cc b/training/dtrain/dtrain.cc
index 4f29c499..4c5972a1 100644
--- a/training/dtrain/dtrain.cc
+++ b/training/dtrain/dtrain.cc
@@ -8,7 +8,7 @@ using namespace dtrain;
 
 
 bool
-dtrain_init(int argc, char** argv, po::variables_map* cfg)
+dtrain_init(int argc, char** argv, po::variables_map* conf)
 {
   po::options_description ini("Configuration File Options");
   ini.add_options()
@@ -51,49 +51,49 @@ dtrain_init(int argc, char** argv, po::variables_map* cfg)
     ("quiet,q",          po::value<bool>()->zero_tokens(),           "be quiet")
     ("verbose,v",        po::value<bool>()->zero_tokens(),         "be verbose");
   cl.add(ini);
-  po::store(parse_command_line(argc, argv, cl), *cfg);
-  if (cfg->count("config")) {
-    ifstream ini_f((*cfg)["config"].as<string>().c_str());
-    po::store(po::parse_config_file(ini_f, ini), *cfg);
+  po::store(parse_command_line(argc, argv, cl), *conf);
+  if (conf->count("config")) {
+    ifstream ini_f((*conf)["config"].as<string>().c_str());
+    po::store(po::parse_config_file(ini_f, ini), *conf);
   }
-  po::notify(*cfg);
-  if (!cfg->count("decoder_config")) {
+  po::notify(*conf);
+  if (!conf->count("decoder_config")) {
     cerr << cl << endl;
     return false;
   }
-  if ((*cfg)["sample_from"].as<string>() != "kbest"
-       && (*cfg)["sample_from"].as<string>() != "forest") {
-    cerr << "Wrong 'sample_from' param: '" << (*cfg)["sample_from"].as<string>() << "', use 'kbest' or 'forest'." << endl;
+  if ((*conf)["sample_from"].as<string>() != "kbest"
+       && (*conf)["sample_from"].as<string>() != "forest") {
+    cerr << "Wrong 'sample_from' param: '" << (*conf)["sample_from"].as<string>() << "', use 'kbest' or 'forest'." << endl;
     return false;
   }
-  if ((*cfg)["sample_from"].as<string>() == "kbest" && (*cfg)["filter"].as<string>() != "uniq" &&
-        (*cfg)["filter"].as<string>() != "not") {
-    cerr << "Wrong 'filter' param: '" << (*cfg)["filter"].as<string>() << "', use 'uniq' or 'not'." << endl;
+  if ((*conf)["sample_from"].as<string>() == "kbest" && (*conf)["filter"].as<string>() != "uniq" &&
+        (*conf)["filter"].as<string>() != "not") {
+    cerr << "Wrong 'filter' param: '" << (*conf)["filter"].as<string>() << "', use 'uniq' or 'not'." << endl;
     return false;
   }
-  if ((*cfg)["pair_sampling"].as<string>() != "all" && (*cfg)["pair_sampling"].as<string>() != "XYX" &&
-        (*cfg)["pair_sampling"].as<string>() != "PRO" && (*cfg)["pair_sampling"].as<string>() != "output_pairs") {
-    cerr << "Wrong 'pair_sampling' param: '" << (*cfg)["pair_sampling"].as<string>() << "'." << endl;
+  if ((*conf)["pair_sampling"].as<string>() != "all" && (*conf)["pair_sampling"].as<string>() != "XYX" &&
+        (*conf)["pair_sampling"].as<string>() != "PRO" && (*conf)["pair_sampling"].as<string>() != "output_pairs") {
+    cerr << "Wrong 'pair_sampling' param: '" << (*conf)["pair_sampling"].as<string>() << "'." << endl;
     return false;
   }
-  if (cfg->count("hi_lo") && (*cfg)["pair_sampling"].as<string>() != "XYX") {
+  if (conf->count("hi_lo") && (*conf)["pair_sampling"].as<string>() != "XYX") {
     cerr << "Warning: hi_lo only works with pair_sampling XYX." << endl;
   }
-  if ((*cfg)["hi_lo"].as<float>() > 0.5 || (*cfg)["hi_lo"].as<float>() < 0.01) {
+  if ((*conf)["hi_lo"].as<float>() > 0.5 || (*conf)["hi_lo"].as<float>() < 0.01) {
     cerr << "hi_lo must lie in [0.01, 0.5]" << endl;
     return false;
   }
-  if (!cfg->count("bitext")) {
+  if (!conf->count("bitext")) {
     cerr << "No training data given." << endl;
     return false;
   }
-  if ((*cfg)["pair_threshold"].as<score_t>() < 0) {
+  if ((*conf)["pair_threshold"].as<score_t>() < 0) {
     cerr << "The threshold must be >= 0!" << endl;
     return false;
   }
-  if ((*cfg)["select_weights"].as<string>() != "last" && (*cfg)["select_weights"].as<string>() != "best" &&
-        (*cfg)["select_weights"].as<string>() != "avg" && (*cfg)["select_weights"].as<string>() != "VOID") {
-    cerr << "Wrong 'select_weights' param: '" << (*cfg)["select_weights"].as<string>() << "', use 'last' or 'best'." << endl;
+  if ((*conf)["select_weights"].as<string>() != "last" && (*conf)["select_weights"].as<string>() != "best" &&
+        (*conf)["select_weights"].as<string>() != "avg" && (*conf)["select_weights"].as<string>() != "VOID") {
+    cerr << "Wrong 'select_weights' param: '" << (*conf)["select_weights"].as<string>() << "', use 'last' or 'best'." << endl;
     return false;
   }
   return true;
@@ -103,60 +103,60 @@ int
 main(int argc, char** argv)
 {
   // handle most parameters
-  po::variables_map cfg;
-  if (!dtrain_init(argc, argv, &cfg)) exit(1); // something is wrong
+  po::variables_map conf;
+  if (!dtrain_init(argc, argv, &conf)) exit(1); // something is wrong
 
   bool quiet = false;
-  if (cfg.count("quiet")) quiet = true;
+  if (conf.count("quiet")) quiet = true;
   bool verbose = false;
-  if (cfg.count("verbose")) verbose = true;
+  if (conf.count("verbose")) verbose = true;
   bool noup = false;
-  if (cfg.count("noup")) noup = true;
+  if (conf.count("noup")) noup = true;
   bool rescale = false;
-  if (cfg.count("rescale")) rescale = true;
+  if (conf.count("rescale")) rescale = true;
   bool keep = false;
-  if (cfg.count("keep")) keep = true;
+  if (conf.count("keep")) keep = true;
   bool fix_features = false;
-  if (cfg.count("fix_features")) fix_features = true;
-
-  const unsigned k = cfg["k"].as<unsigned>();
-  const unsigned N = cfg["N"].as<unsigned>();
-  const unsigned T = cfg["epochs"].as<unsigned>();
-  const unsigned stop_after = cfg["stop_after"].as<unsigned>();
-  const string filter_type = cfg["filter"].as<string>();
-  const string sample_from = cfg["sample_from"].as<string>();
-  const string pair_sampling = cfg["pair_sampling"].as<string>();
-  const score_t pair_threshold = cfg["pair_threshold"].as<score_t>();
-  const string select_weights = cfg["select_weights"].as<string>();
-  const string output_ranking = cfg["output_ranking"].as<string>();
-  const float hi_lo = cfg["hi_lo"].as<float>();
-  const score_t approx_bleu_d = cfg["approx_bleu_d"].as<score_t>();
-  const unsigned max_pairs = cfg["max_pairs"].as<unsigned>();
-  int repeat = cfg["repeat"].as<unsigned>();
+  if (conf.count("fix_features")) fix_features = true;
+
+  const unsigned k = conf["k"].as<unsigned>();
+  const unsigned N = conf["N"].as<unsigned>();
+  const unsigned T = conf["epochs"].as<unsigned>();
+  const unsigned stop_after = conf["stop_after"].as<unsigned>();
+  const string filter_type = conf["filter"].as<string>();
+  const string sample_from = conf["sample_from"].as<string>();
+  const string pair_sampling = conf["pair_sampling"].as<string>();
+  const score_t pair_threshold = conf["pair_threshold"].as<score_t>();
+  const string select_weights = conf["select_weights"].as<string>();
+  const string output_ranking = conf["output_ranking"].as<string>();
+  const float hi_lo = conf["hi_lo"].as<float>();
+  const score_t approx_bleu_d = conf["approx_bleu_d"].as<score_t>();
+  const unsigned max_pairs = conf["max_pairs"].as<unsigned>();
+  int repeat = conf["repeat"].as<unsigned>();
   bool check = false;
-  if (cfg.count("check")) check = true;
-  weight_t loss_margin = cfg["loss_margin"].as<weight_t>();
+  if (conf.count("check")) check = true;
+  weight_t loss_margin = conf["loss_margin"].as<weight_t>();
   bool batch = false;
-  if (cfg.count("batch")) batch = true;
+  if (conf.count("batch")) batch = true;
   if (loss_margin > 9998.) loss_margin = std::numeric_limits<float>::max();
-  const string pclr = cfg["pclr"].as<string>();
+  const string pclr = conf["pclr"].as<string>();
   bool average = false;
   if (select_weights == "avg")
     average = true;
   vector<string> print_weights;
-  if (cfg.count("print_weights"))
-    boost::split(print_weights, cfg["print_weights"].as<string>(), boost::is_any_of(" "));
+  if (conf.count("print_weights"))
+    boost::split(print_weights, conf["print_weights"].as<string>(), boost::is_any_of(" "));
 
   // setup decoder
   register_feature_functions();
   SetSilent(true);
-  ReadFile ini_rf(cfg["decoder_config"].as<string>());
+  ReadFile ini_rf(conf["decoder_config"].as<string>());
   if (!quiet)
-    cerr << setw(25) << "cdec cfg " << "'" << cfg["decoder_config"].as<string>() << "'" << endl;
+    cerr << setw(25) << "cdec conf " << "'" << conf["decoder_config"].as<string>() << "'" << endl;
   Decoder decoder(ini_rf.stream());
 
   // scoring metric/scorer
-  string scorer_str = cfg["scorer"].as<string>();
+  string scorer_str = conf["scorer"].as<string>();
   LocalScorer* scorer;
   if (scorer_str == "bleu") {
     scorer = static_cast<BleuScorer*>(new BleuScorer);
@@ -196,8 +196,8 @@ main(int argc, char** argv)
   vector<weight_t>& decoder_weights = decoder.CurrentWeightVector();
 
   SparseVector<weight_t> lambdas, cumulative_penalties, w_average, fixed;
-  if (cfg.count("input_weights")) {
-    Weights::InitFromFile(cfg["input_weights"].as<string>(), &decoder_weights);
+  if (conf.count("input_weights")) {
+    Weights::InitFromFile(conf["input_weights"].as<string>(), &decoder_weights);
     if (fix_features) {
       Weights::InitSparseVector(decoder_weights, &fixed);
       SparseVector<weight_t>::iterator it = fixed.begin();
@@ -209,8 +209,8 @@ main(int argc, char** argv)
   Weights::InitSparseVector(decoder_weights, &lambdas);
 
   // meta params for perceptron, SVM
-  weight_t eta = cfg["learning_rate"].as<weight_t>();
-  weight_t gamma = cfg["gamma"].as<weight_t>();
+  weight_t eta = conf["learning_rate"].as<weight_t>();
+  weight_t gamma = conf["gamma"].as<weight_t>();
 
   // faster perceptron: consider only misranked pairs, see
   bool faster_perceptron = false;
@@ -221,19 +221,19 @@ main(int argc, char** argv)
   bool l1clip = false;
   bool l1cumul = false;
   weight_t l1_reg = 0;
-  if (cfg["l1_reg"].as<string>() != "none") {
-    string s = cfg["l1_reg"].as<string>();
+  if (conf["l1_reg"].as<string>() != "none") {
+    string s = conf["l1_reg"].as<string>();
     if (s == "naive") l1naive = true;
     else if (s == "clip") l1clip = true;
     else if (s == "cumul") l1cumul = true;
-    l1_reg = cfg["l1_reg_strength"].as<weight_t>();
+    l1_reg = conf["l1_reg_strength"].as<weight_t>();
   }
 
   // output
-  string output_fn = cfg["output"].as<string>();
+  string output_fn = conf["output"].as<string>();
   // input
   string input_fn;
-  ReadFile input(cfg["bitext"].as<string>());
+  ReadFile input(conf["bitext"].as<string>());
   // buffer input for t > 0
   vector<string> src_str_buf;          // source strings (decoder takes only strings)
   vector<vector<vector<WordID> > > refs_as_ids_buf; // references as WordID vecs
@@ -244,7 +244,7 @@ main(int argc, char** argv)
   unsigned best_it = 0;
   float overall_time = 0.;
 
-  // output cfg
+  // output conf
   if (!quiet) {
     cerr << _p5;
     cerr << endl << "dtrain" << endl << "Parameters:" << endl;
@@ -267,19 +267,19 @@ main(int argc, char** argv)
       cerr << setw(25) << "hi lo " << hi_lo << endl;
     cerr << setw(25) << "pair threshold " << pair_threshold << endl;
     cerr << setw(25) << "select weights " << "'" << select_weights << "'" << endl;
-    if (cfg.count("l1_reg"))
-      cerr << setw(25) << "l1 reg " << l1_reg << " '" << cfg["l1_reg"].as<string>() << "'" << endl;
+    if (conf.count("l1_reg"))
+      cerr << setw(25) << "l1 reg " << l1_reg << " '" << conf["l1_reg"].as<string>() << "'" << endl;
     if (rescale)
       cerr << setw(25) << "rescale " << rescale << endl;
     cerr << setw(25) << "pclr " << pclr << endl;
     cerr << setw(25) << "max pairs " << max_pairs << endl;
     cerr << setw(25) << "repeat " << repeat << endl;
     //cerr << setw(25) << "test k-best " << test_k_best << endl;
-    cerr << setw(25) << "cdec cfg " << "'" << cfg["decoder_config"].as<string>() << "'" << endl;
+    cerr << setw(25) << "cdec conf " << "'" << conf["decoder_config"].as<string>() << "'" << endl;
     cerr << setw(25) << "input " << "'" << input_fn << "'" << endl;
     cerr << setw(25) << "output " << "'" << output_fn << "'" << endl;
-    if (cfg.count("input_weights"))
-      cerr << setw(25) << "weights in " << "'" << cfg["input_weights"].as<string>() << "'" << endl;
+    if (conf.count("input_weights"))
+      cerr << setw(25) << "weights in " << "'" << conf["input_weights"].as<string>() << "'" << endl;
     if (stop_after > 0)
       cerr << setw(25) << "stop_after " << stop_after << endl;
     if (!verbose) cerr << "(a dot represents " << DTRAIN_DOTS << " inputs)" << endl;