#include <iostream>
#define BOOST_TEST_MODULE ScoreTest
#include <boost/test/unit_test.hpp>
#include <boost/test/floating_point_comparison.hpp>

#include "ns.h"
#include "tdict.h"
#include "scorer.h"
#include "aer_scorer.h"
#include "kernel_string_subseq.h"

using namespace std;

struct Stuff {
 Stuff() {
     refs0.resize(4);
     refs1.resize(4);
     TD::ConvertSentence("export of high-tech products in guangdong in first two months this year reached 3.76 billion us dollars", &refs0[0]);
     TD::ConvertSentence("guangdong's export of new high technology products amounts to us $ 3.76 billion in first two months of this year", &refs0[1]);
     TD::ConvertSentence("guangdong exports us $ 3.76 billion worth of high technology products in the first two months of this year", &refs0[2]);
     TD::ConvertSentence("in the first 2 months this year , the export volume of new hi-tech products in guangdong province reached 3.76 billion us dollars .", &refs0[3]);
     TD::ConvertSentence("xinhua news agency , guangzhou , march 16 ( reporter chen ji ) the latest statistics show that from january through february this year , the export of high-tech products in guangdong province reached 3.76 billion us dollars , up 34.8 \% over the same period last year and accounted for 25.5 \% of the total export in the province .", &refs1[0]);
     TD::ConvertSentence("xinhua news agency , guangzhou , march 16 ( reporter : chen ji ) -- latest statistic indicates that guangdong's export of new high technology products amounts to us $ 3.76 billion , up 34.8 \% over corresponding period and accounts for 25.5 \% of the total exports of the province .", &refs1[1]);
     TD::ConvertSentence("xinhua news agency report of march 16 from guangzhou ( by staff reporter chen ji ) - latest statistics indicate guangdong province exported us $ 3.76 billion worth of high technology products , up 34.8 percent from the same period last year , which account for 25.5 percent of the total exports of the province .", &refs1[2]);
     TD::ConvertSentence("guangdong , march 16 , ( xinhua ) -- ( chen ji reports ) as the newest statistics shows , in january and feberuary this year , the export volume of new hi-tech products in guangdong province reached 3.76 billion us dollars , up 34.8 \% than last year , making up 25.5 \% of the province's total .", &refs1[3]);
     TD::ConvertSentence("one guangdong province will next export us $ 3.76 high-tech product two months first this year 3.76 billion us dollars", &hyp1);
     TD::ConvertSentence("xinhua news agency , guangzhou , 16th of march ( reporter chen ) -- latest statistics suggest that guangdong exports new advanced technology product totals $ 3.76 million , 34.8 percent last corresponding period and accounts for 25.5 percent of the total export province .", &hyp2);
   }

  vector<vector<WordID> > refs0;
  vector<vector<WordID> > refs1;
  vector<WordID> hyp1;
  vector<WordID> hyp2;
};

BOOST_FIXTURE_TEST_SUITE( s, Stuff );

BOOST_AUTO_TEST_CASE(TestCreateFromFiles) {
  std::string path(boost::unit_test::framework::master_test_suite().argc == 2 ? boost::unit_test::framework::master_test_suite().argv[1] : "test_data");
  vector<string> files;
  files.push_back(path + "/re.txt.0");
  files.push_back(path + "/re.txt.1");
  files.push_back(path + "/re.txt.2");
  files.push_back(path + "/re.txt.3");
  DocScorer ds(IBM_BLEU, files);
}

BOOST_AUTO_TEST_CASE(TestBLEUScorer) {
  ScorerP s1 = SentenceScorer::CreateSentenceScorer(IBM_BLEU, refs0);
  ScorerP s2 = SentenceScorer::CreateSentenceScorer(IBM_BLEU, refs1);
  ScoreP b1 = s1->ScoreCandidate(hyp1);
  BOOST_CHECK_CLOSE(0.23185077, b1->ComputeScore(), 1e-4);
  ScoreP b2 = s2->ScoreCandidate(hyp2);
  BOOST_CHECK_CLOSE(0.38101241, b2->ComputeScore(), 1e-4);
  b1->PlusEquals(*b2);
  BOOST_CHECK_CLOSE(0.348854, b1->ComputeScore(), 1e-4);
  BOOST_CHECK(!b1->IsAdditiveIdentity());
  string details;
  b1->ScoreDetails(&details);
  BOOST_CHECK_EQUAL("BLEU = 34.89, 81.5|50.8|29.5|18.6 (brev=0.898)", details);
  cerr << details << endl;
  string enc;
  b1->Encode(&enc);
  ScoreP b3 = SentenceScorer::CreateScoreFromString(IBM_BLEU, enc);
  details.clear();
  cerr << "Encoded BLEU score size: " << enc.size() << endl;
  b3->ScoreDetails(&details);
  cerr << details << endl;
  BOOST_CHECK(!b3->IsAdditiveIdentity());
  BOOST_CHECK_EQUAL("BLEU = 34.89, 81.5|50.8|29.5|18.6 (brev=0.898)", details);
  ScoreP bz = b3->GetZero();
  BOOST_CHECK(bz->IsAdditiveIdentity());
}

BOOST_AUTO_TEST_CASE(TestTERScorer) {
  ScorerP s1 = SentenceScorer::CreateSentenceScorer(TER, refs0);
  ScorerP s2 = SentenceScorer::CreateSentenceScorer(TER, refs1);
  string details;
  ScoreP t1 = s1->ScoreCandidate(hyp1);
  t1->ScoreDetails(&details);
  cerr << "DETAILS: " << details << endl;
  cerr << t1->ComputeScore() << endl;
  ScoreP t2 = s2->ScoreCandidate(hyp2);
  t2->ScoreDetails(&details);
  cerr << "DETAILS: " << details << endl;
  cerr << t2->ComputeScore() << endl;
  t1->PlusEquals(*t2);
  cerr << t1->ComputeScore() << endl;
  t1->ScoreDetails(&details);
  cerr << "DETAILS: " << details << endl;
  BOOST_CHECK_EQUAL("TER = 44.16,   4|  8| 16|  6 (len=77)", details);
  string enc;
  t1->Encode(&enc);
  ScoreP t3 = SentenceScorer::CreateScoreFromString(TER, enc);
  details.clear();
  t3->ScoreDetails(&details);
  BOOST_CHECK_EQUAL("TER = 44.16,   4|  8| 16|  6 (len=77)", details);
  BOOST_CHECK(!t3->IsAdditiveIdentity());
  ScoreP tz = t3->GetZero();
  BOOST_CHECK(tz->IsAdditiveIdentity());
}

BOOST_AUTO_TEST_CASE(TestTERScorerSimple) {
  vector<vector<WordID> > ref(1);
  TD::ConvertSentence("1 2 3 A B", &ref[0]);
  vector<WordID> hyp;
  TD::ConvertSentence("A B 1 2 3", &hyp);
  ScorerP s1 = SentenceScorer::CreateSentenceScorer(TER, ref);
  string details;
  ScoreP t1 = s1->ScoreCandidate(hyp);
  t1->ScoreDetails(&details);
  cerr << "DETAILS: " << details << endl;
}

BOOST_AUTO_TEST_CASE(TestSERScorerSimple) {
  vector<vector<WordID> > ref(1);
  TD::ConvertSentence("A B C D", &ref[0]);
  vector<WordID> hyp1;
  TD::ConvertSentence("A B C", &hyp1);
  vector<WordID> hyp2;
  TD::ConvertSentence("A B C D", &hyp2);
  ScorerP s1 = SentenceScorer::CreateSentenceScorer(SER, ref);
  string details;
  ScoreP t1 = s1->ScoreCandidate(hyp1);
  t1->ScoreDetails(&details);
  cerr << "DETAILS: " << details << endl;
  ScoreP t2 = s1->ScoreCandidate(hyp2);
  t2->ScoreDetails(&details);
  cerr << "DETAILS: " << details << endl;
  t2->PlusEquals(*t1);
  t2->ScoreDetails(&details);
  cerr << "DETAILS: " << details << endl;
}

BOOST_AUTO_TEST_CASE(TestCombiScorer) {
  ScorerP s1 = SentenceScorer::CreateSentenceScorer(BLEU_minus_TER_over_2, refs0);
  string details;
  ScoreP t1 = s1->ScoreCandidate(hyp1);
  t1->ScoreDetails(&details);
  cerr << "DETAILS: " << details << endl;
  cerr << t1->ComputeScore() << endl;
  string enc;
  t1->Encode(&enc);
  ScoreP t2 = SentenceScorer::CreateScoreFromString(BLEU_minus_TER_over_2, enc);
  details.clear();
  t2->ScoreDetails(&details);
  cerr << "DETAILS: " << details << endl;
  ScoreP cz = t2->GetZero();
  BOOST_CHECK(!t2->IsAdditiveIdentity());
  BOOST_CHECK(cz->IsAdditiveIdentity());
  cz->PlusEquals(*t2);
  BOOST_CHECK(!cz->IsAdditiveIdentity());
  string d2;
  cz->ScoreDetails(&d2);
  BOOST_CHECK_EQUAL(d2, details);
}

BOOST_AUTO_TEST_CASE(AERTest) {
  vector<vector<WordID> > refs0(1);
  TD::ConvertSentence("0-0 2-1 1-2 3-3", &refs0[0]);

  vector<WordID> hyp;
  TD::ConvertSentence("0-0 1-1", &hyp);
  AERScorer* as = new AERScorer(refs0);
  ScoreP x = as->ScoreCandidate(hyp);
  string details;
  x->ScoreDetails(&details);
  cerr << details << endl;
  string enc;
  x->Encode(&enc);
  delete as;
  cerr << "ENC size: " << enc.size() << endl;
  ScoreP y = SentenceScorer::CreateScoreFromString(AER, enc);
  string d2;
  y->ScoreDetails(&d2);
  cerr << d2 << endl;
  BOOST_CHECK_EQUAL(d2, details);
}

BOOST_AUTO_TEST_CASE(Kernel) {
  for (int i = 1; i < 10; ++i) {
    const float l = (i / 10.0);
    float f = ssk<4>(refs0[0], hyp1, l) +
              ssk<4>(refs0[1], hyp1, l) +
              ssk<4>(refs0[2], hyp1, l) +
              ssk<4>(refs0[3], hyp1, l);
    float f2= ssk<4>(refs1[0], hyp2, l) +
              ssk<4>(refs1[1], hyp2, l) +
              ssk<4>(refs1[2], hyp2, l) +
              ssk<4>(refs1[3], hyp2, l);
    f /= 4;
    f2 /= 4;
    float f3= ssk<4>(refs0[0], hyp2, l) +
              ssk<4>(refs0[1], hyp2, l) +
              ssk<4>(refs0[2], hyp2, l) +
              ssk<4>(refs0[3], hyp2, l);
    float f4= ssk<4>(refs1[0], hyp1, l) +
              ssk<4>(refs1[1], hyp1, l) +
              ssk<4>(refs1[2], hyp1, l) +
              ssk<4>(refs1[3], hyp1, l);
    f3 += f4;
    f3 /= 8;
    cerr << "LAMBDA=" << l << "\t" << f << " " << f2 << "\tf=" << ((f + f2)/2 - f3) << " (bad=" << f3 << ")" << endl;
  }
}

BOOST_AUTO_TEST_CASE(NewScoreAPI) {
  //EvaluationMetric* metric = EvaluationMetric::Instance("IBM_BLEU");
  //EvaluationMetric* metric = EvaluationMetric::Instance("METEOR");
  EvaluationMetric* metric = EvaluationMetric::Instance("COMB:IBM_BLEU=0.5;TER=-0.5");
  boost::shared_ptr<SegmentEvaluator> e1 = metric->CreateSegmentEvaluator(refs0);
  boost::shared_ptr<SegmentEvaluator> e2 = metric->CreateSegmentEvaluator(refs1);
  SufficientStats stats1;
  e1->Evaluate(hyp1, &stats1);
  SufficientStats stats2;
  e2->Evaluate(hyp2, &stats2);
  stats1 += stats2;
  string ss;
  stats1.Encode(&ss);
  cerr << "SS: " << ss << endl;
  cerr << metric->ComputeScore(stats1) << endl;
  //SufficientStats statse("IBM_BLEU 53 32 18 11 65 63 61 59 65 72");
  //cerr << metric->ComputeScore(statse) << endl;
}

BOOST_AUTO_TEST_SUITE_END()