summaryrefslogtreecommitdiff
path: root/decoder/minimal_decoder.cc
blob: 2592267421b247c464cef41a7651b458c70628da (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
#include <ctime>
#include <fstream>
#include <iostream>
#include <sstream>
#include <string>
#include <vector>

#include "fdict.h"
#include "filelib.h"
#include "hg.h"
#include "hg_io.h"
#include "sparse_vector.h"
#include "viterbi.h"

using namespace std;

/*
 * Returns the processor time, in seconds, that has elapsed since `start`,
 * where `start` is a value previously obtained from clock().
 */
static double
SecondsSince(clock_t start)
{
  return static_cast<double>(clock() - start) / CLOCKS_PER_SEC;
}

/*
 * Reads hypergraph from JSON file argv[1],
 * reweights it using weights from argv[2],
 * and outputs viterbi translation.
 *
 * The weights file is read line by line; each line is expected to hold
 * a feature name followed by its weight, separated by whitespace.
 * Lines that do not parse as such are skipped.
 *
 * The translation is written to stdout; per-stage timings (measured with
 * clock()) are written to stderr.
 *
 * Returns 0 on success, 1 if the arguments are missing, the weights file
 * cannot be opened, or the hypergraph contains no nodes.
 */
int
main(int argc, char** argv)
{
  // Both input paths are mandatory; without this check argv[1]/argv[2]
  // would be dereferenced even when they were not supplied.
  if (argc < 3) {
    cerr << "Usage: " << (argc > 0 ? argv[0] : "minimal_decoder")
         << " <hypergraph.json> <weights>" << endl;
    return 1;
  }

  const clock_t begin_total = clock();

  // read hg
  const clock_t begin_read = clock();
  ReadFile rf(argv[1]);
  Hypergraph hg;
  HypergraphIO::ReadFromJSON(rf.stream(), &hg);
  cerr << "read hg " << SecondsSince(begin_read) << " s" << endl;

  // The topological sort below uses the last node as the goal, so an
  // empty hypergraph would yield an invalid goal index.
  if (hg.NumberOfNodes() < 1) {
    cerr << "No hypergraph nodes read from " << argv[1] << endl;
    return 1;
  }

  // read weights
  const clock_t begin_weights = clock();
  SparseVector<double> v;
  ifstream f(argv[2]);
  if (!f) {
    cerr << "Cannot open weights file " << argv[2] << endl;
    return 1;
  }
  string line;
  while (getline(f, line)) {
    istringstream ss(line);
    string k;
    weight_t w;
    // Only use the pair when both fields were extracted; otherwise `w`
    // may never have been written (e.g. on a blank line).
    if (!(ss >> k >> w)) {
      if (!k.empty())
        cerr << "Skipping malformed weights line: " << line << endl;
      continue;
    }
    v.add_value(FD::Convert(k), w);
  }
  cerr << "read weights " << SecondsSince(begin_weights) << " s" << endl;

  // reweight hg
  const clock_t begin_reweight = clock();
  hg.Reweight(v);
  cerr << "reweight " << SecondsSince(begin_reweight) << " s" << endl;

  // topsort, using the last node as the goal node
  const clock_t begin_top = clock();
  hg.TopologicallySortNodesAndEdges(hg.NumberOfNodes()-1);
  cerr << "topsort " << SecondsSince(begin_top) << " s" << endl;

  // viterbi
  const clock_t begin_viterbi = clock();
  vector<WordID> trans;
  ViterbiESentence(hg, &trans);
  cout << TD::GetString(trans) << endl;  // endl already flushes
  cerr << "viterbi " << SecondsSince(begin_viterbi) << " s" << endl;

  // total
  cerr << "total " << SecondsSince(begin_total) << " s" << endl;

  return 0;
}