2004-07-15 17:23:44 +01:00
|
|
|
/***********************************
|
|
|
|
|
|
|
|
Variable Elimination in Prolog
|
|
|
|
|
|
|
|
How to do it
|
|
|
|
|
|
|
|
|
|
|
|
Three steps:
|
|
|
|
build the graph:
|
|
|
|
- for all variables, find out
|
|
|
|
all tables they connect to;
|
|
|
|
multiply their size
|
|
|
|
order by size
|
|
|
|
|
|
|
|
*********************************/
|
|
|
|
|
|
|
|
:- module(vel, [vel/3,
|
|
|
|
check_if_vel_done/1]).
|
|
|
|
|
2007-07-07 02:52:57 +01:00
|
|
|
:- attribute size/1, all_diffs/1.
|
2004-07-15 17:23:44 +01:00
|
|
|
|
2004-12-16 06:07:07 +00:00
|
|
|
:- use_module(library(ordsets), [ord_union/3]).
|
2004-07-15 17:23:44 +01:00
|
|
|
|
2004-12-11 19:53:43 +00:00
|
|
|
:- use_module(library('clpbn/xbif'), [clpbn2xbif/3]).
|
|
|
|
|
|
|
|
:- use_module(library('clpbn/graphviz'), [clpbn2gviz/4]).
|
2004-12-08 22:32:34 +00:00
|
|
|
|
2007-11-28 23:52:14 +00:00
|
|
|
:- use_module(library('clpbn/dists'),
|
|
|
|
[
|
|
|
|
get_dist_domain_size/2,
|
|
|
|
get_dist_matrix/5]).
|
2007-07-13 01:52:54 +01:00
|
|
|
|
2004-12-16 06:07:07 +00:00
|
|
|
:- use_module(library('clpbn/utils'), [
|
|
|
|
clpbn_not_var_member/2,
|
|
|
|
check_for_hidden_vars/3]).
|
|
|
|
|
2007-07-07 02:52:57 +01:00
|
|
|
:- use_module(library('clpbn/display'), [
|
|
|
|
clpbn_bind_vals/3]).
|
|
|
|
|
2007-11-16 14:58:41 +00:00
|
|
|
:- use_module(library('clpbn/matrix_cpt_utils'),
|
|
|
|
[project_from_CPT/3,
|
|
|
|
reorder_CPT/5,
|
2007-11-28 23:52:14 +00:00
|
|
|
multiply_CPTs/4,
|
2007-11-16 14:58:41 +00:00
|
|
|
normalise_CPT/2,
|
|
|
|
list_from_CPT/2]).
|
2005-04-27 21:09:26 +01:00
|
|
|
|
2004-07-15 17:23:44 +01:00
|
|
|
:- use_module(library(lists),
|
|
|
|
[
|
2007-07-07 02:52:57 +01:00
|
|
|
append/3
|
2004-07-15 17:23:44 +01:00
|
|
|
]).
|
|
|
|
|
|
|
|
check_if_vel_done(Var) :-
|
|
|
|
get_atts(Var, [size(_)]), !.
|
|
|
|
|
2008-03-13 14:38:02 +00:00
|
|
|
%
|
|
|
|
% implementation of the well known variable elimination algorithm
|
|
|
|
%
|
2008-10-22 00:44:02 +01:00
|
|
|
vel([[]],_,_) :- !.
|
|
|
|
vel([LVs],Vs0,AllDiffs) :-
|
2004-07-15 17:23:44 +01:00
|
|
|
check_for_hidden_vars(Vs0, Vs0, Vs1),
|
|
|
|
sort(Vs1,Vs),
|
2008-03-13 14:38:02 +00:00
|
|
|
% LVi will have a list of CLPBN variables
|
|
|
|
% Tables0 will have the full data on each variable
|
2004-12-08 22:32:34 +00:00
|
|
|
find_all_clpbn_vars(Vs, LV0, LVi, Tables0),
|
2008-03-13 14:38:02 +00:00
|
|
|
% construct the graph
|
2004-07-15 17:23:44 +01:00
|
|
|
find_all_table_deps(Tables0, LV0),
|
2004-12-16 06:07:07 +00:00
|
|
|
(clpbn:output(xbif(XBifStream)) -> clpbn2xbif(XBifStream,vel,Vs) ; true),
|
|
|
|
(clpbn:output(gviz(XBifStream)) -> clpbn2gviz(XBifStream,vel,Vs,LVs) ; true),
|
2008-03-13 14:38:02 +00:00
|
|
|
% variable elimination proper
|
2004-12-08 22:32:34 +00:00
|
|
|
process(LVi, LVs, tab(Dist,_,_)),
|
2008-03-13 14:38:02 +00:00
|
|
|
% move from potentials back to probabilities
|
2007-11-16 14:58:41 +00:00
|
|
|
normalise_CPT(Dist,Ps),
|
2008-03-13 14:38:02 +00:00
|
|
|
% from array to list
|
2007-11-16 14:58:41 +00:00
|
|
|
list_from_CPT(Ps, LPs),
|
2008-03-13 14:38:02 +00:00
|
|
|
% bind Probs back to variables so that they can be output.
|
2008-10-29 18:24:50 +00:00
|
|
|
clpbn_bind_vals([LVs],[LPs],AllDiffs).
|
2004-07-15 17:23:44 +01:00
|
|
|
|
2008-03-13 14:38:02 +00:00
|
|
|
%
|
|
|
|
% just get a list of variables plus associated tables
|
|
|
|
%
|
2004-12-08 22:32:34 +00:00
|
|
|
find_all_clpbn_vars([], [], [], []) :- !.
|
2005-02-08 04:05:39 +00:00
|
|
|
find_all_clpbn_vars([V|Vs], [Var|LV], ProcessedVars, [table(I,Table,Parents,Sizes)|Tables]) :-
|
|
|
|
var_with_deps(V, Table, Parents, Sizes, Ev, Vals), !,
|
2004-12-08 22:32:34 +00:00
|
|
|
% variables with evidence should not be processed.
|
|
|
|
(var(Ev) ->
|
2005-02-08 04:05:39 +00:00
|
|
|
Var = var(V,I,Sz,Vals,Parents,Ev,_,_),
|
2005-04-27 21:09:26 +01:00
|
|
|
vel_get_dist_size(V,Sz),
|
2004-12-08 22:32:34 +00:00
|
|
|
ProcessedVars = [Var|ProcessedVars0]
|
|
|
|
;
|
|
|
|
ProcessedVars = ProcessedVars0
|
|
|
|
),
|
|
|
|
find_all_clpbn_vars(Vs, LV, ProcessedVars0, Tables).
|
2004-07-15 17:23:44 +01:00
|
|
|
|
2004-12-05 05:01:45 +00:00
|
|
|
var_with_deps(V, Table, Deps, Sizes, Ev, Vals) :-
|
2007-07-13 01:52:54 +01:00
|
|
|
clpbn:get_atts(V, [dist(Id,Parents)]),
|
2007-11-16 14:58:41 +00:00
|
|
|
get_dist_matrix(Id,Parents,_,Vals,TAB0),
|
2008-02-13 11:57:46 +00:00
|
|
|
( clpbn:get_atts(V, [evidence(Ev)]) -> true ; true),
|
2008-03-13 14:38:02 +00:00
|
|
|
% set CPT in canonical form
|
2007-11-16 14:58:41 +00:00
|
|
|
reorder_CPT([V|Parents],TAB0,Deps0,TAB1,Sizes1),
|
2008-03-13 14:38:02 +00:00
|
|
|
% remove evidence.
|
2007-11-16 14:58:41 +00:00
|
|
|
simplify_evidence(Deps0, TAB1, Deps0, Sizes1, Table, Deps, Sizes).
|
2004-07-15 17:23:44 +01:00
|
|
|
|
|
|
|
find_all_table_deps(Tables0, LV) :-
|
|
|
|
find_dep_graph(Tables0, DepGraph0),
|
|
|
|
sort(DepGraph0, DepGraph),
|
|
|
|
add_table_deps_to_variables(LV, DepGraph).
|
|
|
|
|
|
|
|
find_dep_graph([], []).
|
|
|
|
find_dep_graph([table(I,Tab,Deps,Sizes)|Tables], DepGraph) :-
|
|
|
|
add_table_deps(Deps, I, Deps, Tab, Sizes, DepGraph0, DepGraph),
|
|
|
|
find_dep_graph(Tables, DepGraph0).
|
|
|
|
|
|
|
|
add_table_deps([], _, _, _, _, DepGraph, DepGraph).
|
|
|
|
add_table_deps([V|Deps], I, Deps0, Table, Sizes, DepGraph0, [V-tab(Table,Deps0,Sizes)|DepGraph]) :-
|
|
|
|
add_table_deps(Deps, I, Deps0, Table, Sizes, DepGraph0, DepGraph).
|
|
|
|
|
|
|
|
add_table_deps_to_variables([], []).
|
2005-02-08 04:05:39 +00:00
|
|
|
add_table_deps_to_variables([var(V,_,_,_,_,_,Deps,K)|LV], DepGraph) :-
|
2004-07-15 17:23:44 +01:00
|
|
|
steal_deps_for_variable(DepGraph, V, NDepGraph, Deps),
|
|
|
|
compute_size(Deps,[],K),
|
2005-12-05 17:16:12 +00:00
|
|
|
% ( clpbn:get_atts(V,[key(Key)]) -> format('~w:~w~n',[Key,K]) ; true),
|
2004-07-15 17:23:44 +01:00
|
|
|
add_table_deps_to_variables(LV, NDepGraph).
|
|
|
|
|
|
|
|
steal_deps_for_variable([V-Info|DepGraph], V0, NDepGraph, [Info|Deps]) :-
|
|
|
|
V == V0, !,
|
|
|
|
steal_deps_for_variable(DepGraph, V0, NDepGraph, Deps).
|
|
|
|
steal_deps_for_variable(DepGraph, _, DepGraph, []).
|
|
|
|
|
|
|
|
compute_size([],Vs,K) :-
|
|
|
|
% use sizes now
|
2004-12-20 21:44:58 +00:00
|
|
|
% length(Vs,K).
|
|
|
|
multiply_sizes(Vs,1,K).
|
2004-07-15 17:23:44 +01:00
|
|
|
compute_size([tab(_,Vs,_)|Tabs],Vs0,K) :-
|
|
|
|
ord_union(Vs,Vs0,VsI),
|
|
|
|
compute_size(Tabs,VsI,K).
|
|
|
|
|
|
|
|
multiply_sizes([],K,K).
|
|
|
|
multiply_sizes([V|Vs],K0,K) :-
|
2005-04-27 21:09:26 +01:00
|
|
|
vel_get_dist_size(V, Sz),
|
2004-07-15 17:23:44 +01:00
|
|
|
KI is K0*Sz,
|
|
|
|
multiply_sizes(Vs,KI,K).
|
|
|
|
|
|
|
|
process(LV0, InputVs, Out) :-
|
2004-12-20 21:44:58 +00:00
|
|
|
find_best(LV0, V0, -1, V, WorkTables, LVI, InputVs),
|
2004-07-15 17:23:44 +01:00
|
|
|
V \== V0, !,
|
2007-11-20 15:51:39 +00:00
|
|
|
% format('1 ~w: ~w~n',[V,WorkTables]),
|
2005-08-02 04:09:52 +01:00
|
|
|
multiply_tables(WorkTables, tab(Tab0,Deps0,_)),
|
2007-11-16 14:58:41 +00:00
|
|
|
reorder_CPT(Deps0,Tab0,Deps,Tab,Sizes),
|
2005-08-02 04:09:52 +01:00
|
|
|
Table = tab(Tab,Deps,Sizes),
|
2007-11-20 15:51:39 +00:00
|
|
|
% format('2 ~w: ~w~n',[V,Table]),
|
2005-04-27 21:09:26 +01:00
|
|
|
project_from_CPT(V,Table,NewTable),
|
2007-11-20 15:51:39 +00:00
|
|
|
% format('3 ~w: ~w~n',[V,NewTable]),
|
2004-07-15 17:23:44 +01:00
|
|
|
include(LVI,NewTable,V,LV2),
|
|
|
|
process(LV2, InputVs, Out).
|
|
|
|
process(LV0, _, Out) :-
|
|
|
|
fetch_tables(LV0, WorkTables),
|
|
|
|
multiply_tables(WorkTables, Out).
|
|
|
|
|
2005-12-05 17:16:12 +00:00
|
|
|
|
2004-12-20 21:44:58 +00:00
|
|
|
find_best([], V, _TF, V, _, [], _).
|
|
|
|
%:-
|
|
|
|
% clpbn:get_atts(V,[key(K)]), write(chosen:K:TF), nl.
|
2005-02-08 04:05:39 +00:00
|
|
|
% root_with_single_child
|
|
|
|
%find_best([var(V,I,_,_,[],Ev,[Dep],K)|LV], _, _, V, [Dep], LVF, Inputs) :- !.
|
|
|
|
find_best([var(V,I,Sz,Vals,Parents,Ev,Deps,K)|LV], _, Threshold, VF, NWorktables, LVF, Inputs) :-
|
2004-12-20 21:44:58 +00:00
|
|
|
( K < Threshold ; Threshold < 0),
|
2004-12-16 06:07:07 +00:00
|
|
|
clpbn_not_var_member(Inputs, V), !,
|
2004-07-15 17:23:44 +01:00
|
|
|
find_best(LV, V, K, VF, WorkTables,LV0, Inputs),
|
|
|
|
(V == VF ->
|
|
|
|
LVF = LV0, Deps = NWorktables
|
|
|
|
;
|
2005-02-08 04:05:39 +00:00
|
|
|
LVF = [var(V,I,Sz,Vals,Parents,Ev,Deps,K)|LV0], WorkTables = NWorktables
|
2004-07-15 17:23:44 +01:00
|
|
|
).
|
|
|
|
find_best([V|LV], V0, Threshold, VF, WorkTables, [V|LVF], Inputs) :-
|
|
|
|
find_best(LV, V0, Threshold, VF, WorkTables, LVF, Inputs).
|
|
|
|
|
|
|
|
multiply_tables([Table], Table) :- !.
|
2007-11-16 14:58:41 +00:00
|
|
|
multiply_tables([TAB1, TAB2| Tables], Out) :-
|
2007-11-28 23:52:14 +00:00
|
|
|
multiply_CPTs(TAB1, TAB2, TAB, _),
|
2007-11-16 14:58:41 +00:00
|
|
|
multiply_tables([TAB| Tables], Out).
|
2004-07-15 17:23:44 +01:00
|
|
|
|
|
|
|
|
2004-12-08 22:32:34 +00:00
|
|
|
simplify_evidence([], Table, Deps, Sizes, Table, Deps, Sizes).
|
|
|
|
simplify_evidence([V|VDeps], Table0, Deps0, Sizes0, Table, Deps, Sizes) :-
|
2005-04-27 21:09:26 +01:00
|
|
|
clpbn:get_atts(V, [evidence(_)]), !,
|
|
|
|
project_from_CPT(V,tab(Table0,Deps0,Sizes0),tab(NewTable,Deps1,Sizes1)),
|
2004-12-08 22:32:34 +00:00
|
|
|
simplify_evidence(VDeps, NewTable, Deps1, Sizes1, Table, Deps, Sizes).
|
|
|
|
simplify_evidence([_|VDeps], Table0, Deps0, Sizes0, Table, Deps, Sizes) :-
|
|
|
|
simplify_evidence(VDeps, Table0, Deps0, Sizes0, Table, Deps, Sizes).
|
|
|
|
|
2004-07-15 17:23:44 +01:00
|
|
|
fetch_tables([], []).
|
2005-02-08 04:05:39 +00:00
|
|
|
fetch_tables([var(_,_,_,_,_,_,Deps,_)|LV0], Tables) :-
|
2004-07-15 17:23:44 +01:00
|
|
|
append(Deps,Tables0,Tables),
|
|
|
|
fetch_tables(LV0, Tables0).
|
|
|
|
%
|
|
|
|
include([],_,_,[]).
|
2005-02-08 04:05:39 +00:00
|
|
|
include([var(V,P,VSz,D,Parents,Ev,Tabs,Est)|LV],tab(T,Vs,Sz),V1,[var(V,P,VSz,D,Parents,Ev,Tabs,Est)|NLV]) :-
|
2004-12-16 06:07:07 +00:00
|
|
|
clpbn_not_var_member(Vs,V), !,
|
2004-07-15 17:23:44 +01:00
|
|
|
include(LV,tab(T,Vs,Sz),V1,NLV).
|
2005-02-08 04:05:39 +00:00
|
|
|
include([var(V,P,VSz,D,Parents,Ev,Tabs,_)|LV],Table,NV,[var(V,P,VSz,D,Parents,Ev,NTabs,NEst)|NLV]) :-
|
2004-12-20 21:44:58 +00:00
|
|
|
update_tables(Tabs,NTabs,Table,NV),
|
|
|
|
compute_size(NTabs, [], NEst),
|
2004-07-15 17:23:44 +01:00
|
|
|
include(LV,Table,NV,NLV).
|
|
|
|
|
2004-12-20 21:44:58 +00:00
|
|
|
update_tables([],[Table],Table,_).
|
|
|
|
update_tables([tab(Tab0,Vs,Sz)|Tabs],[tab(Tab0,Vs,Sz)|NTabs],Table,V) :-
|
2004-12-16 06:07:07 +00:00
|
|
|
clpbn_not_var_member(Vs,V), !,
|
2004-12-20 21:44:58 +00:00
|
|
|
update_tables(Tabs,NTabs,Table,V).
|
|
|
|
update_tables([_|Tabs],NTabs,Table,V) :-
|
|
|
|
update_tables(Tabs,NTabs,Table,V).
|
2004-07-15 17:23:44 +01:00
|
|
|
|
2005-04-27 21:09:26 +01:00
|
|
|
vel_get_dist_size(V,Sz) :-
|
2004-12-16 06:07:07 +00:00
|
|
|
get_atts(V, [size(Sz)]), !.
|
2005-04-27 21:09:26 +01:00
|
|
|
vel_get_dist_size(V,Sz) :-
|
2007-07-13 01:52:54 +01:00
|
|
|
clpbn:get_atts(V,dist(Id,_)), !,
|
|
|
|
get_dist_domain_size(Id,Sz),
|
2004-12-16 06:07:07 +00:00
|
|
|
put_atts(V, [size(Sz)]).
|
|
|
|
|