2009-02-16 12:23:29 +00:00
|
|
|
%
|
|
|
|
% Maximum likelihood estimator and friends.
|
|
|
|
%
|
|
|
|
%
|
|
|
|
% This assumes we have a single big example.
|
|
|
|
%
|
|
|
|
|
2012-12-17 17:57:00 +00:00
|
|
|
:- module(clpbn_mle,
|
|
|
|
[learn_parameters/2,
|
|
|
|
learn_parameters/3,
|
|
|
|
parameters_from_evidence/3
|
|
|
|
]).
|
2009-02-16 12:23:29 +00:00
|
|
|
|
|
|
|
:- use_module(library('clpbn')).
|
2012-12-17 17:57:00 +00:00
|
|
|
|
2009-02-16 12:23:29 +00:00
|
|
|
:- use_module(library('clpbn/learning/learn_utils'),
|
2012-12-17 17:57:00 +00:00
|
|
|
[run_all/1,
|
|
|
|
clpbn_vars/2,
|
|
|
|
normalise_counts/2,
|
|
|
|
soften_table/2,
|
|
|
|
normalise_counts/2
|
|
|
|
]).
|
2009-02-16 12:23:29 +00:00
|
|
|
|
|
|
|
:- use_module(library('clpbn/dists'),
|
2012-12-17 17:57:00 +00:00
|
|
|
[empty_dist/2,
|
|
|
|
dist_new_table/2
|
|
|
|
]).
|
2009-02-16 12:23:29 +00:00
|
|
|
|
|
|
|
:- use_module(library(matrix),
|
2012-12-17 17:57:00 +00:00
|
|
|
[matrix_inc/2]).
|
2009-02-16 12:23:29 +00:00
|
|
|
|
|
|
|
|
|
|
|
learn_parameters(Items, Tables) :-
|
|
|
|
learn_parameters(Items, Tables, []).
|
|
|
|
|
|
|
|
%
|
|
|
|
% full evidence learning
|
|
|
|
%
|
|
|
|
learn_parameters(Items, Tables, Extras) :-
|
|
|
|
run_all(Items),
|
|
|
|
attributes:all_attvars(AVars),
|
|
|
|
% sort and incorporate evidence
|
|
|
|
clpbn_vars(AVars, AllVars),
|
|
|
|
mk_sample(AllVars, Sample),
|
|
|
|
compute_tables(Extras, Sample, Tables).
|
|
|
|
|
|
|
|
parameters_from_evidence(AllVars, Sample, Extras) :-
|
|
|
|
mk_sample_from_evidence(AllVars, Sample),
|
|
|
|
compute_tables(Extras, Sample, Tables).
|
|
|
|
|
|
|
|
mk_sample_from_evidence(AllVars, SortedSample) :-
|
|
|
|
add_evidence2sample(AllVars, Sample),
|
|
|
|
msort(Sample, SortedSample).
|
|
|
|
|
|
|
|
mk_sample(AllVars, SortedSample) :-
|
|
|
|
add2sample(AllVars, Sample),
|
|
|
|
msort(Sample, SortedSample).
|
|
|
|
|
|
|
|
%
|
|
|
|
% assumes we have full data, meaning evidence for every variable
|
|
|
|
%
|
|
|
|
add2sample([], []).
|
|
|
|
add2sample([V|Vs],[val(Id,[Ev|EParents])|Vals]) :-
|
|
|
|
clpbn:get_atts(V, [evidence(Ev),dist(Id,Parents)]),
|
|
|
|
get_eparents(Parents, EParents),
|
|
|
|
add2sample(Vs, Vals).
|
|
|
|
|
|
|
|
get_eparents([P|Parents], [E|EParents]) :-
|
|
|
|
clpbn:get_atts(P, [evidence(E)]),
|
|
|
|
get_eparents(Parents, EParents).
|
|
|
|
get_eparents([], []).
|
|
|
|
|
|
|
|
|
|
|
|
%
|
|
|
|
% assumes we ignore variables without evidence or without evidence
|
|
|
|
% on a parent!
|
|
|
|
%
|
|
|
|
add_evidence2sample([], []).
|
|
|
|
add_evidence2sample([V|Vs],[val(Id,[Ev|EParents])|Vals]) :-
|
|
|
|
clpbn:get_atts(V, [evidence(Ev),dist(Id,Parents)]),
|
|
|
|
get_eveparents(Parents, EParents), !,
|
|
|
|
add_evidence2sample(Vs, Vals).
|
|
|
|
add_evidence2sample([_|Vs],Vals) :-
|
|
|
|
add_evidence2sample(Vs, Vals).
|
|
|
|
|
|
|
|
get_eveparents([P|Parents], [E|EParents]) :-
|
|
|
|
clpbn:get_atts(P, [evidence(E)]),
|
|
|
|
get_eparents(Parents, EParents).
|
|
|
|
get_eveparents([], []).
|
|
|
|
|
|
|
|
|
|
|
|
compute_tables(Parameters, Sample, NewTables) :-
|
|
|
|
estimator(Sample, Tables),
|
|
|
|
add_priors(Parameters, Tables, NewTables).
|
|
|
|
|
|
|
|
estimator([], []).
|
|
|
|
estimator([val(Id,Sample)|Samples], [NewDist|Tables]) :-
|
|
|
|
empty_dist(Id, NewTable),
|
|
|
|
id_samples(Id, Samples, IdSamples, MoreSamples),
|
|
|
|
mle([Sample|IdSamples], NewTable),
|
|
|
|
soften_table(NewTable, SoftenedTable),
|
|
|
|
normalise_counts(SoftenedTable, NewDist),
|
|
|
|
% replace matrix in distribution
|
|
|
|
dist_new_table(Id, NewDist),
|
|
|
|
estimator(MoreSamples, Tables).
|
|
|
|
|
|
|
|
|
|
|
|
id_samples(_, [], [], []).
|
|
|
|
id_samples(Id, [val(Id,Sample)|Samples], [Sample|IdSamples], MoreSamples) :- !,
|
|
|
|
id_samples(Id, Samples, IdSamples, MoreSamples).
|
|
|
|
id_samples(_, Samples, [], Samples).
|
|
|
|
|
|
|
|
mle([Sample|IdSamples], Table) :-
|
|
|
|
matrix_inc(Table, Sample),
|
|
|
|
mle(IdSamples, Table).
|
|
|
|
mle([], _).
|
|
|
|
|