From 2af5a445f3905c69c42be5c758c52a2f21b17446 Mon Sep 17 00:00:00 2001 From: graehl Date: Tue, 31 Aug 2010 01:08:42 +0000 Subject: l2r bugfixes git-svn-id: https://ws10smt.googlecode.com/svn/trunk@634 ec762483-ff6d-05da-a07a-a48fb63a330f --- utils/d_ary_heap.h | 4 +- utils/hash.h | 27 ++++++++- utils/intern_pool.h | 26 ++++++++- utils/show.h | 12 +++- utils/stringlib.h | 4 -- utils/tdict.h | 3 +- utils/wordid.h | 6 ++ utils/writer.h | 155 ++++++++++++++++++++++++++++++++++++++++++++++++++++ 8 files changed, 227 insertions(+), 10 deletions(-) create mode 100644 utils/writer.h (limited to 'utils') diff --git a/utils/d_ary_heap.h b/utils/d_ary_heap.h index 10d04782..eee8efe0 100644 --- a/utils/d_ary_heap.h +++ b/utils/d_ary_heap.h @@ -8,8 +8,8 @@ #define D_ARY_UP_GRAEHL 0 // untested #define D_ARY_APPEND_ALWAYS_PUSH 1 // heapify (0) is untested. otherwise switch between push and heapify depending on size (cache effects, existing items vs. # appended ones) -#define D_ARY_TRACK_OUT_OF_HEAP 0 // shouldn't need to track, because in contains() false positives looking up stale or random loc map values are impossible - we just check key -#define D_ARY_VERIFY_HEAP 0 +#define D_ARY_TRACK_OUT_OF_HEAP 1 // shouldn't need to track, because in contains() false positives looking up stale or random loc map values are impossible - we just check key +#define D_ARY_VERIFY_HEAP 1 // This is a very expensive test so it should be disabled even when NDEBUG is not defined /* adapted from boost/graph/detail/d_ary_heap.hpp diff --git a/utils/hash.h b/utils/hash.h index 2062578f..2290bc34 100755 --- a/utils/hash.h +++ b/utils/hash.h @@ -95,7 +95,6 @@ typename H::mapped_type & get_or_call(H &ht,K const& k,F const& f) { } } - // the below could also return a ref to the mapped max/min. they have the advantage of not falsely claiming an improvement when an equal value already existed. otherwise you could just modify the get_default and if equal assume new. template bool improve_mapped_max(H &ht,K const& k,typename H::mapped_type const& v) { @@ -110,6 +109,32 @@ bool improve_mapped_max(H &ht,K const& k,typename H::mapped_type const& v) { return false; } + +// return true if there was no old value. like ht[k]=v but lets you know whether it was a new addition +template +bool put(H &ht,K const& k,typename H::mapped_type const& v) { + std::pair inew=ht.insert(typename H::value_type(k,v)); + if (inew.second) + return true; + inew.first->second=v; + return false; +} + +// does not update old value (returns false) if one exists, otherwise add +template +bool maybe_add(H &ht,K const& k,typename H::mapped_type const& v) { + std::pair inew=ht.insert(typename H::value_type(k,v)); + return inew.second; +} + +// ht[k] must not exist (yet) +template +void add(H &ht,K const& k,typename H::mapped_type const& v) { + bool fresh=maybe_add(ht,k,v); + assert(fresh); +} + + template bool improve_mapped_min(H &ht,K const& k,typename H::mapped_type const& v) { std::pair inew=ht.insert(typename H::value_type(k,v)); diff --git a/utils/intern_pool.h b/utils/intern_pool.h index d9890ae6..7c739add 100755 --- a/utils/intern_pool.h +++ b/utils/intern_pool.h @@ -57,6 +57,30 @@ struct compose_indirect { } +}; + +template +struct equal_indirect { + typedef Arg *argument_type; // we also accept Arg & + KeyF kf; + F f; + typedef bool result_type; + + result_type operator()(Arg const& a1,Arg const& a2) const { + return f(kf(a1),kf(a2)); + } + result_type operator()(Arg & a1,Arg & a2) const { + return f(kf(a1),kf(a2)); + } + result_type operator()(Arg * a1,Arg * a2) const { + return a1==a2||(a1&&a2&&f(kf(*a1),kf(*a2))); + } + template + result_type operator()(V const& v,W const&w) const { + return v==w||(v&&w&&f(kf(*v),kf(*w))); + } + + }; /* @@ -79,7 +103,7 @@ struct intern_pool : Pool { typedef typename KeyF::result_type Key; typedef Item *Handle; typedef compose_indirect HashDeep; - typedef compose_indirect EqDeep; + typedef equal_indirect EqDeep; typedef HASH_SET Canonical; typedef typename Canonical::iterator CFind; typedef std::pair CInsert; diff --git a/utils/show.h b/utils/show.h index 1b645c83..95cad253 100755 --- a/utils/show.h +++ b/utils/show.h @@ -1,12 +1,19 @@ #ifndef UTILS__SHOW_H #define UTILS__SHOW_H + +//usage: string s=OSTR(1<<" "<(ostringstream()<(f(ostringstream()<(f(ostringstream()<(f(ostringstream()< #define SHOWS std::cerr #endif - #define SELF_TYPE_PRINT \ template \ inline friend std::basic_ostream & operator <<(std::basic_ostream &o, self_type const& me) \ @@ -26,6 +33,8 @@ #define PRINT_SELF(self) typedef self self_type; SELF_TYPE_PRINT_OSTREAM + + #undef SHOWALWAYS #define SHOWALWAYS(x) x @@ -62,6 +71,7 @@ careful: none of this is wrapped in a block. so you can't use one of these macr #define SHOW7(IF,x,y0,y1,y2,y3,y4,y5) SHOW1(IF,x) SHOW6(IF,y0,y1,y2,y3,y4,y5) #define SHOWM(IF,m,x) SHOWP(IF,m<<": ") SHOW(IF,x) +#define SHOWM1(IF,m,x) SHOWM(IF,m,x) #define SHOWM2(IF,m,x0,x1) SHOWP(IF,m<<": ") SHOW2(IF,x0,x1) #define SHOWM3(IF,m,x0,x1,x2) SHOWP(IF,m<<": ") SHOW3(IF,x0,x1,x2) #define SHOWM4(IF,m,x0,x1,x2,x3) SHOWP(IF,m<<": ") SHOW4(IF,x0,x1,x2,x3) diff --git a/utils/stringlib.h b/utils/stringlib.h index 4f79eb31..8022bb88 100644 --- a/utils/stringlib.h +++ b/utils/stringlib.h @@ -1,10 +1,6 @@ #ifndef CDEC_STRINGLIB_H_ #define CDEC_STRINGLIB_H_ -//usage: string s=MAKESTRE(1<<" "<(ostringstream()< #define SLIBDBG(x) do { std::cerr<<"DBG(stringlib): "<"; static char const* const se_str; //=""; static char const* const unk_str; //=""; diff --git a/utils/wordid.h b/utils/wordid.h index fb50bcc1..714dcd0b 100644 --- a/utils/wordid.h +++ b/utils/wordid.h @@ -1,6 +1,12 @@ #ifndef _WORD_ID_H_ #define _WORD_ID_H_ +#include + typedef int WordID; +//namespace { +static const WordID null_wordid=std::numeric_limits::max(); +//} + #endif diff --git a/utils/writer.h b/utils/writer.h new file mode 100644 index 00000000..d21b74d6 --- /dev/null +++ b/utils/writer.h @@ -0,0 +1,155 @@ +#ifndef WRITER_H +#define WRITER_H + +#include + +struct Writer +{ + template + std::basic_ostream& + operator()(std::basic_ostream& o,const value_type &l) const { + return o << l; + } +}; + +struct LineWriter +{ + template + std::basic_ostream& + operator()(std::basic_ostream& o,const Label &l) const { + return o << l << std::endl; + } +}; + +template inline +std::ios_base::iostate write_range_iostate(O& o,T begin, T end,W writer,bool multiline=false,bool parens=true,char open_paren='(',char close_paren=')',char space=' ') +{ + static const char *const MULTILINE_SEP="\n"; + if (parens) { + o << open_paren; + if (multiline) + o << MULTILINE_SEP; + } + if (multiline) { + for (;begin!=end;++begin) { + o << space; + writer(o,*begin); + o << MULTILINE_SEP; + } + } else { + for (T i=begin;i!=end;++i) { + if (i!=begin) o< +struct range_formatter { + Ib i; + Ie e; + W w; + bool multiline; + bool parens; + range_formatter(Ib i,Ie e,W w=W(),bool multiline=false,bool parens=true) : + i(i),e(e),w(w),multiline(multiline),parens(parens) {} + + template + std::basic_ostream & + operator()(std::basic_ostream &o) const { + write_range_iostate(o,i,e,w,multiline,parens); + return o; + } + + template + friend inline + std::basic_ostream & + operator<<(std::basic_ostream &o,range_formatter const& w) { + return w(o); + } +}; + +template +range_formatter +wrange(Ib i,Ie e,W const& w,bool multiline=false,bool parens=true) +{ + return range_formatter(i,e,w,multiline,parens); +} + +template +range_formatter +prange(Ib i,Ie e,bool multiline=false,bool parens=true) +{ + return range_formatter(i,e,Writer(),multiline,parens); +} + + +template inline +std::basic_ostream & write_range(std::basic_ostream& o,T begin, T end,W writer,bool multiline=false,bool parens=true,char open_paren='(',char close_paren=')') +{ + write_range_iostate(o,begin,end,writer,multiline,parens,open_paren,close_paren); + return o; +} + +template +inline std::ios_base::iostate print_range(O& o,T begin,T end,bool multiline=false,bool parens=true,char open_paren='(',char close_paren=')') { + return write_range_iostate(o,begin,end,Writer(),multiline,parens,open_paren,close_paren); +} + +template +inline std::ios_base::iostate print_range_i(O& o,C const&c,unsigned from,unsigned to,bool multiline=false,bool parens=true,char open_paren='(',char close_paren=')') { + return write_range_iostate(o,c.begin()+from,c.begin()+to,Writer(),multiline,parens,open_paren,close_paren); +} + + +template +struct bound_printer +{ + O *po; + template + void operator()(T const& t) const + { + *po << t; + } +}; + +template +bound_printer +make_bound_printer(O &o) +{ + bound_printer ret; + ret.po=&o; + return ret; +} + +template +struct bound_writer +{ + W const& w; + bound_writer(W const& w) : w(w) {} + bound_writer(bound_writer const& o) :w(o.w) {} + template + void operator()(O &o,V const& v) const + { + v.print(o,w); + } +}; + + +template +bound_writer +make_bound_writer(W const& w) +{ + return bound_writer(w); +} + + + +#endif -- cgit v1.2.3