From aa5f96417ff81408b15b54aab35a3c16b845adf8 Mon Sep 17 00:00:00 2001 From: Patrick Simianer Date: Mon, 29 Aug 2011 22:02:45 +0200 Subject: big update: working iterating, pretty output, test scripts and more --- dtrain/learner.h | 96 -------------------------------------------------------- 1 file changed, 96 deletions(-) delete mode 100644 dtrain/learner.h (limited to 'dtrain/learner.h') diff --git a/dtrain/learner.h b/dtrain/learner.h deleted file mode 100644 index 038749e2..00000000 --- a/dtrain/learner.h +++ /dev/null @@ -1,96 +0,0 @@ -#ifndef _DTRAIN_LEARNER_H_ -#define _DTRAIN_LEARNER_H_ - -#include -#include -#include - -#include "sparse_vector.h" -#include "score.h" - - -namespace dtrain -{ - - -class Learner -{ - public: - virtual void Init( const vector >& kbest, const Scores& scores, - const bool invert_score = false ) {}; - virtual void Update( SparseVector& lambdas ) {}; -}; - - -class SofiaLearner : public Learner -{ - public: - void - Init( const size_t sid, const vector >& kbest, /*const FIXME*/ Scores& scores, - const bool invert_score = false ) - { - assert( kbest.size() == scores.size() ); - ofstream o; - unlink( "/tmp/sofia_ml_training" ); - o.open( "/tmp/sofia_ml_training", ios::trunc ); // TODO randomize, filename exists - int fid = 0; - map::iterator ff; - - double score; - for ( size_t k = 0; k < kbest.size(); ++k ) { - map m; - SparseVector::const_iterator it = kbest[k].begin(); - score = scores[k].GetScore(); - if ( invert_score ) score = -score; - o << score; - for ( ; it != kbest[k].end(); ++it ) { - ff = fmap.find( it->first ); - if ( ff == fmap.end() ) { - fmap.insert( pair(it->first, fid) ); - fmap1.insert( pair(fid, it->first) ); - fid++; - } - m.insert( pair(fmap[it->first], it->second) ); - } - map::iterator ti = m.begin(); - for ( ; ti != m.end(); ++ti ) { - o << " " << ti->first << ":" << ti->second; - } - o << endl; - } - o.close(); - } - - void - Update(SparseVector& lambdas) - { - string call = "./sofia-ml --training_file /tmp/sofia_ml_training --model_out /tmp/sofia_ml_model --loop_type stochastic --lambda 100 --dimensionality "; - std::stringstream out; - out << fmap.size(); - call += out.str(); - call += " &>/dev/null"; - system ( call.c_str() ); - ifstream i; - unlink( "/tmp/sofia_ml_model" ); - i.open( "/tmp/sofia_ml_model", ios::in ); - string model; - getline( i, model ); - vector strs; - boost::split( strs, model, boost::is_any_of(" ") ); - int j = 0; - for ( vector::iterator it = strs.begin(); it != strs.end(); ++it ) { - lambdas.set_value(fmap1[j], atof( it->c_str() ) ); - j++; - } - } - - private: - map fmap; - map fmap1; -}; - - -} // namespace - -#endif - -- cgit v1.2.3