wasp

author: Patrick Simianer <simianer@cl.uni-heidelberg.de> 2014-04-14 16:25:44 +0200
committer: Patrick Simianer <simianer@cl.uni-heidelberg.de> 2014-04-14 16:25:44 +0200
commit: 056969a3d9dda06248afd0eaaa6eb1da2f174ea7 (patch)
tree: 722cd71d802be877d3679152f6dffe6eba76c0ea
parent: b0bff4f48b2de88560199be09e5a29feecaa267c (diff)
3 files changed, 404 insertions, 1 deletions
diff --git a/data/geoquery/README b/data/geoquery/README
index 86d6e0a..8e147fa 100644
--- a/data/geoquery/README
+++ b/data/geoquery/README
@@ -1,6 +1,5 @@
 corpus.xml         : corpus-true.xml of Jacob Andreas, without non-printable chars
 delete.ids         : references that give empty answers although they shouldn't
-eval.pl            : modified eval script from wasp-1.0
 folds600           : splits for cross-validation
 geoquery.de        : slightly corrected German part
 geoquery.en        : English part
@@ -15,4 +14,5 @@ split880.train.ids : 880 train/test split train ids
 ../weights.init : initial weights
 
 smt-semparse/ : slightly adapted code for Andreas' smt-semparse
+wasp/         : adapted stuff from wasp-1.0
 
diff --git a/data/geoquery/eval.pl b/data/geoquery/wasp/eval.pl
index e00a067..e00a067 100644
--- a/data/geoquery/eval.pl
+++ b/data/geoquery/wasp/eval.pl
diff --git a/data/geoquery/wasp/geoquery.pl b/data/geoquery/wasp/geoquery.pl
new file mode 100644
index 0000000..5d5d9bc
--- /dev/null
+++ b/data/geoquery/wasp/geoquery.pl
@@ -0,0 +1,403 @@
+:- ensure_loaded(library('lists')).
+:- ensure_loaded(library('ordsets')).
+:- ensure_loaded(geobase).
+
+% Entity type checks.  Entities are wrapped in id terms (countryid/1,
+% stateid/1, cityid/2, riverid/1, placeid/1).  The facts state/10, city/4,
+% river/3, highlow/6, mountain/4 and lake/3 are not defined in this file
+% (presumably they come from geobase, which is loaded above).
+
+% The only country known to this file.
+country(countryid(usa)).
+
+% A state id is valid when some state/10 fact carries that name.
+state(stateid(Name)) :-
+	state(Name,_,_,_,_,_,_,_,_,_).
+
+% A city is identified by its name (3rd field of city/4) plus the 2nd field.
+city(cityid(Name,StateKey)) :-
+	city(_,StateKey,Name,_).
+
+% A river id is valid when some river/3 fact carries that name.
+river(riverid(Name)) :-
+	river(Name,_,_).
+
+% Places are taken from the 3rd and then the 5th field of highlow/6.
+place(placeid(Name)) :-
+	highlow(_,_,Name,_,_,_).
+place(placeid(Name)) :-
+	highlow(_,_,_,_,Name,_).
+
+% Added by Rohit: mountains and lakes are given by bare name, without a wrapper.
+mountain(Name) :-
+	mountain(Name,_,_,_).
+lake(Name) :-
+	lake(Name,_,_).
+
+% abbreviation(?StateId, ?Abbrev): Abbrev is the second field of the
+% state/10 fact of the state.
+abbreviation(stateid(Name), Abbrev) :-
+	state(Name,Abbrev,_,_,_,_,_,_,_,_).
+% abbreviation(?Abbrev): Abbrev is the abbreviation of some state.
+abbreviation(Abbrev) :-
+	abbreviation(_,Abbrev).
+
+% capital(?StateId, ?CityId): the city id is built from the third field of
+% state/10 (city name) and the second field (used as the city's state key).
+capital(stateid(Name), cityid(CapName,Abbrev)) :-
+	state(Name,Abbrev,CapName,_,_,_,_,_,_,_).
+% capital(?CityId): CityId is the capital of some state.
+capital(City) :-
+	capital(_,City).
+
+% print_name(+Term, -Printable)
+% Strips the id wrapper from an entity (a city also loses its state key),
+% evaluates an arithmetic expression whose principal operator is /, *, + or -,
+% and returns any other term unchanged.
+print_name(stateid(Name), Name) :- !.
+print_name(cityid(Name,_), Name) :- !.
+print_name(riverid(Name), Name) :- !.
+print_name(placeid(Name), Name) :- !.
+print_name(Expr, Value) :- Expr = _/_, !, Value is Expr.
+print_name(Expr, Value) :- Expr = _*_, !, Value is Expr.
+print_name(Expr, Value) :- Expr = _+_, !, Value is Expr.
+print_name(Expr, Value) :- Expr = _-_, !, Value is Expr.
+print_name(Other, Other).
+
+% loc(?Entity, ?Container): Entity is located in Container.
+% Every city, state, river and place (tried in that order) is in the USA.
+loc(X, countryid(usa)) :- city(X).
+loc(X, countryid(usa)) :- state(X).
+loc(X, countryid(usa)) :- river(X).
+loc(X, countryid(usa)) :- place(X).
+% A city is in the state named by the first field of its city/4 fact.
+loc(cityid(Name,StateKey), stateid(State)) :-
+	city(State,StateKey,Name,_).
+% Rohit: a place is in the state whose highlow/6 fact lists it, looking at the
+% 3rd field first and the 5th field second (both may succeed).
+loc(placeid(Place), stateid(State)) :- highlow(State,_,Place,_,_,_).
+loc(placeid(Place), stateid(State)) :- highlow(State,_,_,_,Place,_).
+% Earlier formulation, kept for reference (it committed to the first match):
+%loc(placeid(P), stateid(S)) :-
+%	( highlow(S,_,P,_,_,_) ->
+%	      true
+%	; highlow(S,_,_,_,P,_)
+%	).
+% A river is in every state listed in the third field of its river/3 fact.
+loc(riverid(River), stateid(State)) :-
+	river(River,_,States),
+	member(State,States).
+
+% traverse(?RiverId, ?StateId): the state is a member of the list held in the
+% third field of the river's river/3 fact.
+traverse(riverid(River), stateid(State)) :-
+	river(River,_,Crossed),
+	member(State,Crossed).
+
+% high_point(?Region, ?PlaceId): the country's high point is hard-coded;
+% a state's high point is the third field of its highlow/6 fact.
+high_point(countryid(usa), placeid('mount mckinley')).
+high_point(stateid(State), placeid(Place)) :-
+	highlow(State,_,Place,_,_,_).
+
+% low_point(?Region, ?PlaceId): the country's low point is hard-coded;
+% a state's low point is the fifth field of its highlow/6 fact.
+low_point(countryid(usa), placeid('death valley')).
+low_point(stateid(State), placeid(Place)) :-
+	highlow(State,_,_,_,Place,_).
+
+% area(?StateId, -Area): the fifth field of the state's state/10 fact,
+% converted to a float.
+area(stateid(Name), AreaFloat) :-
+	state(Name,_,_,_,RawArea,_,_,_,_,_),
+	AreaFloat is float(RawArea).
+
+% major(?Entity): a city whose population exceeds 150000, or a river whose
+% length exceeds 750 (in whatever units the underlying facts use).
+major(cityid(Name,StateKey)) :-
+	city(cityid(Name,StateKey)),
+	population(cityid(Name,StateKey), Pop),
+	Pop > 150000.
+major(riverid(Name)) :-
+	river(riverid(Name)),
+	len(riverid(Name), Length),
+	Length > 750.
+	
+% first(:Goal): succeeds at most once, with the first solution of Goal.
+first(Goal) :- call(Goal), !.
+
+% n_solutions(+N, :Goal): enumerates on backtracking the first N solutions of
+% Goal; fails if Goal has fewer than N solutions.
+n_solutions(N, Goal) :-
+	findall(Goal, Goal, All),
+	length(Prefix, N),
+	append(Prefix, _, All),
+	member(Goal, Prefix).
+
+% nth_solution(?N, :Goal): Goal is unified with the N-th element of the list
+% of all its solutions.  Relies on nth/3, which this file does not define
+% (presumably supplied by library(lists); its index base is not visible here).
+nth_solution(N, Goal) :-
+	findall(Goal, Goal, Solutions),
+	nth(N, Solutions, Goal).
+
+% population(?Entity, ?Pop): the fourth field of state/10 for a state, the
+% fourth field of city/4 for a city.
+population(stateid(Name), Pop) :-
+	state(Name,_,_,Pop,_,_,_,_,_,_).
+population(cityid(Name,StateKey), Pop) :-
+	city(_,StateKey,Name,Pop).
+
+% len(?RiverId, ?Length): the second field of the river's river/3 fact.
+len(riverid(Name), Length) :-
+	river(Name,Length,_).
+
+% elevation(?PlaceId, ?Elevation)  (Rohit)
+% Looks the place up first in the (5th, 6th) fields of highlow/6 and then in
+% the (3rd, 4th) fields; a place present in both yields two solutions.
+elevation(placeid(Place), Elev) :-
+	highlow(_,_,_,_,Place,Elev).
+elevation(placeid(Place), Elev) :-
+	highlow(_,_,Place,Elev,_,_).
+% Previous single-clause version, kept for reference:
+%elevation(placeid(P),E) :-
+%	( highlow(_,_,P,E,_,_)
+%	; highlow(_,_,_,_,P,E)
+%	).
+
+% size(?Thing, ?Size): a generic measure.  It is the area of a state, the
+% population of a city, the length of a river, the elevation of a place, and
+% a number is its own size.
+size(stateid(Name), Size) :- area(stateid(Name), Size).
+size(cityid(Name,StateKey), Size) :- population(cityid(Name,StateKey), Size).
+size(riverid(Name), Size) :- len(riverid(Name), Size).
+size(placeid(Name), Size) :- elevation(placeid(Name), Size).
+size(Number, Number) :- number(Number).
+	
+% next_to(?StateId1, ?StateId2): the second state is a member of the list in
+% the third field of the first state's border/3 fact (border/3 is not defined
+% in this file).
+next_to(stateid(State), stateid(Neighbour)) :-
+	border(State,_,Neighbours),
+	member(Neighbour,Neighbours).
+
+% density(?Region, -Density): population divided by area.  Only states can
+% succeed, because area/2 has a clause for stateid terms alone.
+density(Region, Density) :-
+	population(Region, Pop),
+	area(Region, Area),
+	Density is Pop / Area.
+
+% largest(?Var, :Goal)
+% Collects every solution of Goal paired with size(Var), then unifies Goal
+% with the solution of greatest size (the earliest one on ties).  Fails when
+% Goal has no solution.
+largest(Var, Goal) :-
+	findall(Measure-Goal, (Goal, size(Var,Measure)), Candidates),
+	max_key(Candidates, Goal).
+
+% max_key(+Pairs, -Value): Value belongs to the Key-Value pair with the
+% greatest key; the earliest such pair wins ties.  Fails on an empty list.
+max_key([FirstKey-FirstValue|Others], Best) :-
+	max_key(Others, FirstKey, FirstValue, Best).
+
+% max_key(+Pairs, +BestKeySoFar, +BestValueSoFar, -Best)
+max_key([], _, Best, Best).
+max_key([K-V|T], BestKey, _, Best) :-
+	K > BestKey, !,		% strictly greater: a tie keeps the earlier pair
+	max_key(T, K, V, Best).
+max_key([_-_|T], BestKey, BestValue, Best) :-
+	max_key(T, BestKey, BestValue, Best).
+
+% smallest(?Var, :Goal)
+% Collects every solution of Goal paired with size(Var), then unifies Goal
+% with the solution of least size (the earliest one on ties).  Fails when
+% Goal has no solution.
+smallest(Var, Goal) :-
+	findall(Measure-Goal, (Goal, size(Var,Measure)), Candidates),
+	min_key(Candidates, Goal).
+
+% min_key(+Pairs, -Value): Value belongs to the Key-Value pair with the
+% least key; the earliest such pair wins ties.  Fails on an empty list.
+min_key([FirstKey-FirstValue|Others], Best) :-
+	min_key(Others, FirstKey, FirstValue, Best).
+
+% min_key(+Pairs, +BestKeySoFar, +BestValueSoFar, -Best)
+min_key([], _, Best, Best).
+min_key([K-V|T], BestKey, _, Best) :-
+	K < BestKey, !,		% strictly smaller: a tie keeps the earlier pair
+	min_key(T, K, V, Best).
+min_key([_-_|T], BestKey, BestValue, Best) :-
+	min_key(T, BestKey, BestValue, Best).
+
+% count(?Template, :Goal, -N): N is the number of distinct instances of
+% Template over all solutions of Goal (0 when Goal has none).
+count(Template, Goal, N) :-
+	findall(Template, Goal, Instances),
+	sort(Instances, Distinct),	% sort/2 also removes duplicates
+	length(Distinct, N).
+
+% at_least(+Min, ?V, :Goal)
+% True when Goal has at least Min distinct instances of V.  count/3 takes the
+% goal as its SECOND argument and returns the number in its third; passing
+% them the other way round hands findall/3 an unbound goal.
+% Goal is then run again so that its variables are bound for the caller (one
+% solution per backtrack).  Original note on that call: "This is a hack to
+% instantiate N, making this order independent" (presumably it refers to
+% variables, such as Min, that Goal itself may bind; verify against callers).
+at_least(Min,V,Goal) :-
+	count(V,Goal,N),
+	Goal,
+	N >= Min.
+
+% at_most(+Max, ?V, :Goal): Goal has no more than Max distinct instances of V.
+% Goal's variables are left unbound, since count/3 works on copies.
+at_most(Max, V, Goal) :-
+	count(V, Goal, Total),
+	Total =< Max.
+
+% execute_query(+Query, -Answers)
+% Rewrites Query with tq/2 into answer(Var,Goal), collects the printable name
+% of Var for every solution of Goal, and returns the names sorted with
+% duplicates removed.
+execute_query(Query, Answers) :-
+	tq(Query, answer(Var,Goal)),
+	findall(Printable, (Goal, print_name(Var,Printable)), Raw),
+	sort(Raw, Answers).
+%---------------------------------------------------------------------------
+% tq(+Query, -Translated)
+% Rewrites a query term before it is executed.  Superlative sub-goals
+% (largest/2, smallest/2, highest/2, most/3, fewest/3) are replaced by their
+% 4- or 5-argument counterparts, which run the goal on a renamed copy and only
+% afterwards unify the original variables (Vars) with the copies (DVars).
+% Every other term is rebuilt with the same functor and recursively
+% translated arguments.
+
+% An unbound term is passed through untouched.
+tq(G,G) :-
+	var(G), !.
+% largest(V,Goal): collect the variables of Goal, copy them together with V
+% and Goal, and translate the copied goal.
+tq(largest(V,Goal), largest(Vars, DVars, DV, DGoal)) :-
+	!,
+	variables_in(Goal, Vars),
+	copy_term((Vars,V,Goal),(DVars,DV,Goal1)),
+	tq(Goal1,DGoal).
+% smallest(V,Goal): same scheme as largest.
+tq(smallest(V,Goal), smallest(Vars, DVars, DV, DGoal)) :-
+	!,
+	variables_in(Goal, Vars),
+	copy_term((Vars,V,Goal),(DVars,DV,Goal1)),
+	tq(Goal1,DGoal).
+% highest(V,Goal): same scheme as largest.
+tq(highest(V,Goal), highest(Vars, DVars, DV, DGoal)) :-
+	!,
+	variables_in(Goal, Vars),
+	copy_term((Vars,V,Goal),(DVars,DV,Goal1)),
+	tq(Goal1,DGoal).
+% most(I,V,Goal): as above, with the index variable I copied as well.
+tq(most(I,V,Goal), most(Vars, DVars, DI, DV, DGoal)) :-
+	!,
+	variables_in(Goal, Vars),
+	copy_term((Vars,I,V,Goal),(DVars,DI,DV,Goal1)),
+	tq(Goal1,DGoal).
+% fewest(I,V,Goal): same scheme as most.
+tq(fewest(I,V,Goal), fewest(Vars, DVars, DI, DV, DGoal)) :-
+	!,
+	variables_in(Goal, Vars),
+	copy_term((Vars,I,V,Goal),(DVars,DI,DV,Goal1)),
+	tq(Goal1,DGoal).
+% Any other term (atoms and numbers included, which have arity 0): build a
+% skeleton with the same name and arity, then translate argument by argument.
+tq(Goal,TGoal) :-
+	functor(Goal,F,N),
+	functor(TGoal,F,N),
+	tq_args(N,Goal,TGoal).
+
+% tq_args(+N, +Goal, ?TGoal)
+% Translates arguments N, N-1, ..., 1 of Goal with tq/2 and unifies each
+% result with the argument of TGoal at the same position.
+tq_args(N,Goal,TGoal) :-
+	( N =:= 0 ->
+	     true			% no arguments left
+	; arg(N,Goal,GArg),
+	  arg(N,TGoal,TArg),
+	  tq(GArg,TArg),
+	  N1 is N - 1,
+	  tq_args(N1,Goal,TGoal)
+	).
+
+% variables_in(+Term, -Vars)
+% Vars is a duplicate-free list of the variables occurring in Term.
+variables_in(A, Vs) :- variables_in(A, [], Vs).
+	
+% variables_in(+Term, +Vars0, -Vars): accumulator version; Vars extends Vars0
+% with the variables of Term that are not already in it.
+variables_in(A, V0, V) :-
+	var(A), !, add_var(V0, A, V).
+% A ground term contributes nothing, so it is not traversed.
+variables_in(A, V0, V) :-
+	ground(A), !, V = V0. 
+% A non-ground compound term: visit its arguments.
+variables_in(Term, V0, V) :-
+	functor(Term, _, N),
+	variables_in_args(N, Term, V0, V).
+
+% variables_in_args(+N, +Term, +Vars0, -Vars)
+% Collects the variables of arguments N, N-1, ..., 1 of Term, in that order.
+variables_in_args(N, Term, V0, V) :-
+	( N =:= 0 ->
+	      V = V0
+	; arg(N, Term, Arg),
+	  variables_in(Arg, V0, V1),
+	  N1 is N-1,
+	  variables_in_args(N1, Term, V1, V)
+	).
+
+% add_var(+Vars0, +Var, -Vars): Vars is Vars0 when Var already occurs in it,
+% otherwise Vars0 with Var added at the front.
+add_var(Vars0, Var, Vars) :-
+	contains_var(Var, Vars0), !,
+	Vars = Vars0.
+add_var(Vars0, Var, Vars) :-
+	Vars = [Var|Vars0].
+
+
+%   contains_var(+Variable, +Term)
+%   is true when Term contains a sub-term identical (==) to Variable; it is
+%   defined as the negation of free_of_var/2 and therefore binds nothing.
+contains_var(Variable, Term) :-
+	\+ free_of_var(Variable, Term).
+
+%   free_of_var(+Variable, +Term)
+%   is true when the given Term contains no sub-term identical to the
+%   given Variable (which may actually be any term, not just a var).
+%   For variables, this is precisely the "occurs check" which is
+%   needed for sound unification.
+
+% The term itself is the thing looked for: not free of it.
+free_of_var(Variable, Term) :-
+	Term == Variable,
+	!,
+	fail.
+% A compound term is free of Variable when every argument is.
+free_of_var(Variable, Term) :-
+	compound(Term),
+	!,
+	functor(Term, _, Arity),
+	free_of_var(Arity, Term, Variable).
+% Anything else (a different variable or an atomic term) is free of it.
+free_of_var(_, _).
+
+%   free_of_var(+N, +Term, +Variable)
+%   checks arguments N, N-1, ..., 1 of Term; note the different argument
+%   order compared with free_of_var/2.
+free_of_var(1, Term, Variable) :- !,
+	arg(1, Term, Argument),
+	free_of_var(Variable, Argument).
+free_of_var(N, Term, Variable) :-
+	arg(N, Term, Argument),
+	free_of_var(Variable, Argument),
+	M is N-1, !,
+	free_of_var(M, Term, Variable).
+
+%---------------------------------------------------------------------------
+/*
+execute_query(answer(Var, Goal), Unique) :-
+	findall(Name,(Goal,print_name(Var,Name)),Answers),
+	sort(Answers,Unique).
+*/
+% answer(?Var, :Goal)
+% Prints two newlines, then "Answer = " followed by the sorted, duplicate-free
+% list of printable names of Var over all solutions of Goal.
+answer(Var, Goal) :-
+	nl, nl,
+	findall(Printable, (Goal, print_name(Var,Printable)), Raw),
+	sort(Raw, Names),
+	format('Answer = ~w~n', [Names]).
+
+% sum(?Template, :Goal, -Total): Total is the sum of the instances of Template
+% over all solutions of Goal, duplicates included; 0 when there are none.
+sum(Template, Goal, Total) :-
+	findall(Template, Goal, Terms),
+	sumlist(Terms, 0, Total).
+
+% highest(+Vars, +DVars, ?DV, :Goal)
+% Four-argument form generated by tq/2: commits to the first solution of
+% highest(DV, Goal), which works on renamed copies, and then unifies the
+% original variables Vars with their copies DVars.
+highest(Vars, DVars, DV, Goal) :-
+	( highest(DV, Goal) ->
+	     Vars = DVars
+	).
+
+% highest(?Place, :Goal): the solution of Goal in which Place has the
+% greatest elevation.
+highest(Place, Goal) :-
+	largest(Elev, (Goal, elevation(Place,Elev))).
+/*CAT. bug
+lowest(X,Goal) :-
+	largest(Y, (Goal, elevation(X,Y))).
+*/
+% lowest(?Place, :Goal): the solution of Goal in which Place has the least
+% elevation.
+lowest(Place, Goal) :-
+	smallest(Elev, (Goal, elevation(Place,Elev))).
+
+% shortest(?River, :Goal): the solution of Goal in which River has the least
+% length.
+shortest(River, Goal) :-
+	smallest(Length, (Goal, len(River,Length))).
+
+% longest(?River, :Goal): the solution of Goal in which River has the
+% greatest length.
+longest(River, Goal) :-
+	largest(Length, (Goal, len(River,Length))).
+
+
+% higher(?A, ?B): the elevation of A is greater than that of B.
+higher(A, B) :-
+	elevation(A, ElevA),
+	elevation(B, ElevB),
+	ElevA > ElevB.
+
+%---------------------------------
+% Added by CAT: the remaining comparison predicates.
+
+% lower(?A, ?B): the elevation of A is less than that of B.
+lower(A, B) :-
+	elevation(A, ElevA),
+	elevation(B, ElevB),
+	ElevA < ElevB.
+
+% longer(?A, ?B): the length of A is greater than that of B.
+longer(A, B) :-
+	len(A, LenA),
+	len(B, LenB),
+	LenA > LenB.
+
+% shorter(?A, ?B): the length of A is less than that of B.
+shorter(A, B) :-
+	len(A, LenA),
+	len(B, LenB),
+	LenA < LenB.
+
+% more(+A, +B): plain arithmetic comparison, A > B.
+more(A, B) :-
+	A > B.
+%---------------------------------
+
+% Arithmetic constructors: the third argument is the UNEVALUATED expression
+% term; print_name/2 evaluates such terms when an answer is printed.
+divide(Left, Right, Left/Right).
+multiply(Left, Right, Left*Right).
+add(Left, Right, Left+Right).
+%subtract(X,Y,X-Y).
+
+% sumlist(+Numbers, +Acc0, -Sum): Sum is Acc0 plus all elements of Numbers.
+sumlist([], Total, Total).
+sumlist([Number|Numbers], Acc0, Total) :-
+	Acc is Acc0 + Number,
+	sumlist(Numbers, Acc, Total).
+
+% const(?X, ?Y): plain unification of the two arguments.
+const(Value, Value).
+
+% Wrappers generated by tq/2.  Each one commits to the first solution of the
+% underlying predicate, which runs on renamed copies (DVars, DV, DI, DGoal),
+% and only then unifies the original variables Vars with the copies DVars.
+
+largest(Vars, DVars, DV, DGoal) :-
+	( largest(DV, DGoal) ->
+	     Vars = DVars
+	).
+
+smallest(Vars, DVars, DV, DGoal) :-
+	( smallest(DV, DGoal) ->
+	     Vars = DVars
+	).
+
+most(Vars, DVars, DI, DV, DGoal) :-
+	( most(DI, DV, DGoal) ->
+	     Vars = DVars
+	).
+
+fewest(Vars, DVars, DI, DV, DGoal) :-
+	( fewest(DI, DV, DGoal) ->
+	     Vars = DVars
+	).
+
+% most(?Index, ?Var, :Goal)
+% Index is the value that occurs with the greatest number of distinct Var
+% values among the solutions of Goal.  Fails when Goal has no solution,
+% because setof/3 does.
+most(Index, Var, Goal) :-
+	setof(Index-Var, Goal, Pairs),
+	keysort(Pairs, ByKey),
+	maximum_run(ByKey, Index).
+
+% maximum_run(+KeySortedPairs, -Index)
+% Index is the key of the longest run of consecutive pairs sharing a key; the
+% earliest run wins ties.  The scan starts from the placeholder key foo with
+% count 0, so an empty list yields foo.
+maximum_run(Solutions, Index) :-
+	maximum_run(Solutions, foo, 0, Index).
+
+% maximum_run(+Pairs, +BestIndexSoFar, +BestCountSoFar, -BestIndex)
+maximum_run([], Index, _Count, Index) :- !.
+maximum_run([Index1-_|Rest], BestIndex0, Count0, BestIndex) :-
+	% measure the run that starts at the head of the list
+	first_run(Rest, Index1, 1, Count1, Rest1),
+	( Count1 > Count0 ->
+	     BestIndex2 = Index1,
+	     Count2 = Count1
+	; BestIndex2 = BestIndex0,
+	  Count2 = Count0
+	),
+	maximum_run(Rest1, BestIndex2, Count2, BestIndex).
+
+% first_run(+Pairs, +Target, +N0, -N, -Rest)
+% Consumes the leading pairs of Pairs whose key unifies with Target, adding
+% one to the counter for each.  N is the final count and Rest the unconsumed
+% remainder, beginning with the first pair whose key does not unify.
+% NOTE(review): the test is unification (=), not identity (==), so a
+% non-ground key would be bound by the comparison.
+first_run([], _Index, N, N, []).
+first_run([Index-G|Rest0], Target, N0, N, Rest) :-
+	( Target = Index ->
+	     N1 is N0 + 1,
+	     first_run(Rest0, Target, N1, N, Rest)
+	; N = N0,
+	  Rest = [Index-G|Rest0]
+	).
+
+% fewest(?Index, ?Var, :Goal)
+% Index is the value that occurs with the smallest number of distinct Var
+% values among the solutions of Goal.  Fails when Goal has no solution,
+% because setof/3 does.
+fewest(Index, Var, Goal) :-
+	setof(Index-Var, Goal, Pairs),
+	keysort(Pairs, ByKey),
+	minimum_run(ByKey, Index).
+
+% minimum_run(+KeySortedPairs, -Index)
+% Index is the key of the shortest run of consecutive pairs sharing a key; the
+% earliest run wins ties.  The search is seeded with the first run itself
+% rather than with a fixed upper bound on the run length, so the result is
+% correct however long the runs are.  For backward compatibility an empty
+% list still yields the placeholder foo.
+minimum_run([], foo).
+minimum_run([Index1-_|Rest], Index) :-
+	first_run(Rest, Index1, 1, Count1, Rest1),
+	minimum_run(Rest1, Index1, Count1, Index).
+
+% minimum_run(+Pairs, +BestIndexSoFar, +BestCountSoFar, -BestIndex)
+minimum_run([], Index, _Count, Index) :- !.
+minimum_run([Index1-_|Rest], BestIndex0, Count0, BestIndex) :-
+	% measure the run that starts at the head of the list
+	first_run(Rest, Index1, 1, Count1, Rest1),
+	( Count1 < Count0 ->	% strictly shorter: a tie keeps the earlier run
+	     BestIndex2 = Index1,
+	     Count2 = Count1
+	; BestIndex2 = BestIndex0,
+	  Count2 = Count0
+	),
+	minimum_run(Rest1, BestIndex2, Count2, BestIndex).
+
+
author	Patrick Simianer <simianer@cl.uni-heidelberg.de>	2014-04-14 16:25:44 +0200
committer	Patrick Simianer <simianer@cl.uni-heidelberg.de>	2014-04-14 16:25:44 +0200
commit	056969a3d9dda06248afd0eaaa6eb1da2f174ea7 (patch)
tree	722cd71d802be877d3679152f6dffe6eba76c0ea
parent	b0bff4f48b2de88560199be09e5a29feecaa267c (diff)