yap-6.3/packages/cplint/em/em.pl

/*

CEM

Copyright (c) 2011, Fabrizio Riguzzi

*/
%:- set_prolog_flag(unknown,error).
%:- set_prolog_flag(profiling,on).
%:- set_prolog_flag(debug,on).
:- set_prolog_flag(discontiguous_warnings,on).
:- set_prolog_flag(single_var_warnings,on).
:- set_prolog_flag(unknown,fail).
%:-source.
%:-yap_flag(gc_trace,very_verbose).
:- use_module(inference,
[find_deriv_inf1/3]).
%:-consult(inference).
:-use_module(library(rbtrees)).
:-use_module(library(random)).
:-use_module(library(avl)).
:-use_module(library(lists)).

%:-use_module(library(lpadsld)).
:-load_foreign_files(['cplint'],[],init_my_predicates).

:-dynamic setting/2,rule/5.


/* Default values of the learner's parameters. They are dynamic facts and
can be replaced at run time with set/2. */
setting(depth,3).
setting(single_var,false).

setting(sample_size,1000).
/* Total number of examples in the case in which the models in the kb file
contain a prob(P). fact. In that case, one model corresponds to
sample_size*P examples
*/
setting(equivalent_sample_size,100).
/* equivalent sample size for computing the BD score of the network refinements.
It is indicated with NPrime in the formulas in the Heckerman, Geiger & Chickering
paper */
setting(epsilon_em,0.1).
setting(epsilon_em_fraction,0.01).
/* if the difference in log likelihood between two successive em iterations is
smaller than epsilon_em, or smaller than -CLL*epsilon_em_fraction where CLL is
the log likelihood of the previous iteration, then em stops */
setting(epsilon_sem,2).
setting(random_restarts_number,1).
/* number of random restarts of em */
setting(verbosity,1).


/* em(File): entry point of the learner. File is the common stem of the
input/output files: File.l is reconsulted, the models are loaded from
File.kb, the initial program is read from File.cpl and the result is
written to File.rules.
The final CLL, the execution time, the sufficient statistics, the settings
and the learned model are printed on user_output; the same information is
written to File.rules, where everything but the model is enclosed in a
comment. */
em(File):-
  generate_file_names(File,FileKB,FileOut,FileL,FileLPAD),
  reconsult(FileL),
  load_models(FileKB,DB),
  load_initial_model(FileLPAD,Model0),!,
  % the verbosity configured so far is overridden here
  set(verbosity,3),
  % first timing call: its result is discarded; presumably it only resets
  % the "time since the previous call" counter -- TODO confirm with the YAP manual
  statistics(cputime,[_,_]),
  gen_ex(DB,[],DBE),
  compute_parameters_EM(Model0,Model,SuffStats,CLL,DBE),
  statistics(cputime,[_,CT]),
  % presumably CT is in milliseconds, so CTS is in seconds -- TODO confirm
  CTS is CT/1000,
  format("Final CLL ~f~n",[CLL]),
  format("Execution time ~f~n",[CTS]),
  write_stats(user_output,SuffStats),
  listing(setting/2),
  format("Model:~n",[]),
  write_model(Model,user_output),
  open(FileOut,write,Stream),
  format(Stream,"/* Final CLL ~f~n",[CLL]),
  format(Stream,"Execution time ~f~n",[CTS]),
  % listing/1 takes no stream argument: make Stream the current output
  tell(Stream),
  listing(setting/2),
  write_stats(Stream,SuffStats),
  format(Stream,"*/~n",[]),
  write_model(Model,Stream),
  % closes the current output, i.e. the stream selected by tell/1 above
  told.

/* gen_ex(Models,Acc,Examples): for every model identifier in Models the
goals built by generate_goal/4 for the output predicates are appended to
the accumulator Acc; Examples is the final accumulator. */
gen_ex([],Examples,Examples).

gen_ex([Model|Models],Acc0,Examples):-
  get_ouptut_atoms(OutputPreds),
  generate_goal(OutputPreds,Model,[],ModelGoals),
  append(Acc0,ModelGoals,Acc1),
  gen_ex(Models,Acc1,Examples).


/* cycle_head(Stats0,Stats,Rule,Subst,HeadIdx,PG,CSets,Weight): walks the
list of per-head statistics Stats0 of the grounding (Rule,Subst), starting
from head index HeadIdx. For each head the C sets returned by
extract_relevant_C_sets/5 are turned into a formula; when there are none
the statistic is left unchanged, otherwise Prob/PG*Weight is added, where
Prob is the probability computed by compute_prob/4 for that formula. */
cycle_head([],[],_Rule,_Subst,_Idx,_PG,_CSets,_Weight):-!.

cycle_head([Old|Olds],[New|News],Rule,Subst,Idx,PG,CSets,Weight):-
  extract_relevant_C_sets(Rule,Subst,Idx,CSets,Relevant),
  ( Relevant=[] ->
      New is Old
  ;   build_formula(Relevant,Formula,[],Vars),
      var2numbers(Vars,0,NumberedVars),
      compute_prob(NumberedVars,Formula,Prob,0),
      New is Old+Prob/PG*Weight
  ),
  NextIdx is Idx+1,
  cycle_head(Olds,News,Rule,Subst,NextIdx,PG,CSets,Weight).

/* cycle_head_neg(Stats0,Stats,Rule,Subst,HeadIdx,NHeads,PG,CSets,Weight):
counterpart of cycle_head/8 for negative examples. The relevant C sets are
obtained with extract_relevant_C_sets_neg/6 and, when there are any,
(1-Prob)/PG*Weight is added to the statistic of the current head. A
diagnostic line is printed if the computed probability exceeds 1. */
cycle_head_neg([],[],_Rule,_Subst,_Idx,_NHeads,_PG,_CSets,_Weight):-!.

cycle_head_neg([Old|Olds],[New|News],Rule,Subst,Idx,NHeads,PG,CSets,Weight):-
  extract_relevant_C_sets_neg(Rule,Subst,Idx,NHeads,CSets,Relevant),
  ( Relevant=[] ->
      New is Old
  ;   build_formula(Relevant,Formula,[],Vars),
      var2numbers(Vars,0,NumberedVars),
      compute_prob(NumberedVars,Formula,Prob,0),
      % a probability above 1 should not happen: report it and go on
      ( Prob>1 ->
          write(cyc),write(Prob),write(NumberedVars),nl
      ;   true
      ),
      New is Old+(1-Prob)/PG*Weight
  ),
  NextIdx is Idx+1,
  cycle_head_neg(Olds,News,Rule,Subst,NextIdx,NHeads,PG,CSets,Weight).

/* extract_relevant_C_sets_neg(Rule,Subst,HeadIdx,NHeads,CSets,CSetsOut):
CSetsOut is CSets followed by the singleton C sets produced by
neg_choice/6, one for every head index of (Rule,Subst) in 0..NHeads-1
different from HeadIdx. */
extract_relevant_C_sets_neg(Rule,Subst,HeadIdx,NHeads,CSets,CSetsOut):-
  neg_choice(0,NHeads,HeadIdx,Rule,Subst,OtherHeads),
  append(CSets,OtherHeads,CSetsOut).

/* neg_choice(Idx,NHeads,Skip,Rule,Subst,CSets): CSets is the list of
singleton C sets [(I,Rule,Subst)] for I from Idx up to NHeads-1, leaving
out I = Skip. */
neg_choice(Last,Last,_Skip,_Rule,_Subst,[]):-!.

neg_choice(Skip,NHeads,Skip,Rule,Subst,CSets):-!,
  Next is Skip+1,
  neg_choice(Next,NHeads,Skip,Rule,Subst,CSets).

neg_choice(Idx,NHeads,Skip,Rule,Subst,[[(Idx,Rule,Subst)]|CSets]):-
  Next is Idx+1,
  neg_choice(Next,NHeads,Skip,Rule,Subst,CSets).

/* extract_relevant_C_sets(Rule,Subst,HeadIdx,CSets,Relevant): scans the C
sets one by one. A C set that already contains a choice for (Rule,Subst)
is handed to extract_relevant_C_sets1/7, which keeps it only if the chosen
head is HeadIdx; a C set with no choice for (Rule,Subst) is kept with
(HeadIdx,Rule,Subst) appended to it. */
extract_relevant_C_sets(_Rule,_Subst,_HeadIdx,[],[]):-!.

extract_relevant_C_sets(Rule,Subst,HeadIdx,[CSet|CSets],Relevant):-
  member((Chosen,Rule,Subst),CSet),!,
  extract_relevant_C_sets1(Rule,Subst,HeadIdx,Chosen,CSet,CSets,Relevant).

extract_relevant_C_sets(Rule,Subst,HeadIdx,[CSet|CSets],[Extended|Relevant]):-
  append(CSet,[(HeadIdx,Rule,Subst)],Extended),
  extract_relevant_C_sets(Rule,Subst,HeadIdx,CSets,Relevant).

/* extract_relevant_C_sets1(Rule,Subst,HeadIdx,Chosen,CSet,CSets,Relevant):
helper of extract_relevant_C_sets/5 for a C set CSet that selects head
Chosen for (Rule,Subst). CSet is dropped when Chosen does not unify with
HeadIdx and kept otherwise; the remaining C sets are then processed. */
extract_relevant_C_sets1(Rule,Subst,HeadIdx,Chosen,_CSet,CSets,Relevant):-
  Chosen\=HeadIdx,!,
  extract_relevant_C_sets(Rule,Subst,HeadIdx,CSets,Relevant).

extract_relevant_C_sets1(Rule,Subst,HeadIdx,_Chosen,CSet,CSets,[CSet|Relevant]):-
  extract_relevant_C_sets(Rule,Subst,HeadIdx,CSets,Relevant).


/* EM start */
/* compute_parameters_EM(Model0,Model1,SuffStats1,CLL1,DB): learns the
parameters of Model0 on the examples DB. The parameters are randomized, a
first run of EM is performed and then random_restarts/8 is called with the
number given by setting random_restarts_number. Model1, SuffStats1 and CLL1
are the model, sufficient statistics and log likelihood it returns.
An empty model yields an empty model, an empty red-black tree of
statistics and a log likelihood of -1e200. Progress messages depend on
setting verbosity. */
compute_parameters_EM([],[],SuffStats,-1e200,_DB):-!,
  rb_new(SuffStats).

compute_parameters_EM(Model0,Model1,SuffStats1,CLL1,DB):-
  setting(verbosity,Verb),
  ( Verb>0 ->
      format("EM computation ~nInitial model:~n",[]),
      write_model(Model0,user_output),
      flush_output
  ;   true
  ),
  ( Verb>2 ->
      format("Initial EM Iteration ~n",[]),
      flush_output
  ;   true
  ),
  randomize(Model0,Start),
  em_iteration(Start,Learned,Stats,Score,DB),
  ( Verb>2 ->
      format("CLL ~f~n",[Score])
  ;   true
  ),
  flush_output,
  setting(random_restarts_number,Restarts),
  random_restarts(Restarts,Learned,Stats,Score,Model1,SuffStats1,CLL1,DB),
  ( Verb>0 ->
      format("Final CLL ~f~n",[CLL1]),
      flush_output
  ;   true
  ).

/* random_restarts(N,Model0,SS0,CLL0,Model1,SS1,CLL1,DB): N is the number
of EM runs still to be accounted for, the one that produced Model0, SS0
and CLL0 included. While N is greater than 1 the parameters are
randomized again, EM is rerun and the result replaces the current best
when its log likelihood is strictly greater. Model1, SS1 and CLL1 are the
best model, sufficient statistics and log likelihood found.
The base case accepts every N =< 1, so that a random_restarts_number of 0
or less terminates immediately instead of counting down forever. */
random_restarts(N,Model,SS,CLL,Model,SS,CLL,_DB):-
  N=<1,!.

random_restarts(N,Model0,SS0,CLL0,Model1,SS1,CLL1,DB):-
  setting(verbosity,Ver),
  (Ver>2->
    setting(random_restarts_number,NMax),
    % restarts are numbered upwards while N counts down
    Num is NMax-N+1,
    format("Restart number ~d~n",[Num]),
    flush_output
  ;
    true
  ),
  randomize(Model0,ModelR),
  em_iteration(ModelR,ModelR1,SSR,CLLR,DB),
  (Ver>2->
    format("CLL ~f~n",[CLLR])
  ;
    true
  ),
  N1 is N-1,
  (CLLR>CLL0->
    random_restarts(N1,ModelR1,SSR,CLLR,Model1,SS1,CLL1,DB)
  ;
    random_restarts(N1,Model0,SS0,CLL0,Model1,SS1,CLL1,DB)
  ).

/* randomize(Model0,Model): Model is Model0 where the head annotations of
every rule have been replaced by the values chosen by randomize_head/4. */
randomize([],[]):-!.

randomize([rule(Id,Vars,HeadIdxs,Head0,Body,LogF)|Rules0],
          [rule(Id,Vars,HeadIdxs,Head,Body,LogF)|Rules]):-
  length(Head0,NHeads),
  Step is 1.0/NHeads,
  randomize_head(Step,Head0,0,Head),
  randomize(Rules0,Rules).

/* randomize_head(Int,Head0,Used,Head): Head is Head0 with new annotations.
Used is the probability mass assigned so far. Every atom before the final
null atom '' gets a value drawn with random(0,1.0-Used,_); the null atom
gets what is left, or 0.0 if that is negative. Int is not used. */
randomize_head(_Int,['':_],Used,['':NullProb]):-!,
  Left is 1.0-Used,
  ( Left>=0.0 ->
      NullProb=Left
  ;   NullProb=0.0
  ).

randomize_head(Int,[Atom:_|Atoms],Used,[Atom:Prob|NewAtoms]):-
  Available is 1.0-Used,
  random(0,Available,Prob),
  Used1 is Used+Prob,
  randomize_head(Int,Atoms,Used1,NewAtoms).


/* em_iteration(Model0,ModelPar,SuffStats1,CLL1,DB): one run of EM from
the parameters in Model0. The log likelihood and the sufficient statistics
of Model0 are computed first, then cycle_EM/8 iterates starting from
iteration number 1. */
em_iteration(Model0,ModelPar,SuffStats1,CLL1,DB):-
  compute_CLL_stats(Model0,DB,StartCLL,StartStats),
  cycle_EM(Model0,StartStats,StartCLL,ModelPar,SuffStats1,CLL1,DB,1).

/* cycle_EM(Model0,SuffStats0,CLL0,ModelPar,SuffStats,CLL,DB,N): iteration
number N of EM. The parameters are updated from SuffStats0 with m_step/3
and the log likelihood and statistics of the updated model are computed.
The loop ends when the improvement over CLL0 is below epsilon_em or below
-CLL0*epsilon_em_fraction; otherwise the next iteration is started from
the updated model. */
cycle_EM(Model0,SuffStats0,CLL0,ModelPar,SuffStats,CLL,DB,N):-
  m_step(Model0,SuffStats0,Updated),
  compute_CLL_stats(Updated,DB,NewCLL,NewStats),
  setting(verbosity,Verb),
  ( Verb>2 ->
      format("Iteration: ~d CLL ~f~n",[N,NewCLL])
  ;   true
  ),
  flush_output,
  setting(epsilon_em,Eps),
  setting(epsilon_em_fraction,EpsFrac),
  Gain is NewCLL-CLL0,
  ( ( Gain<Eps ; Gain< - CLL0*EpsFrac ) ->
      ModelPar=Updated,
      SuffStats=NewStats,
      CLL=NewCLL,!
  ;   Next is N+1,!,
      cycle_EM(Updated,NewStats,NewCLL,ModelPar,SuffStats,CLL,DB,Next)
  ).

/* write_stats(S,SS): writes on stream S a "Suff stats" header followed by
the entries of the red-black tree SS. */
write_stats(S,SS):-
  rb_visit(SS,Entries),
  format(S,"Suff stats~n",[]),
  write_stats_list(S,Entries).

/* write_stats_list(S,Pairs): writes on stream S one line for each pair
Rule-d(Distr,N,I), then two empty lines. */
write_stats_list(S,[]):-
  nl(S),
  nl(S),!.

write_stats_list(S,[Rule-d(Distr,Count,Inst)|Pairs]):-
  format(S,"~d,~p,~f,~d~n",[Rule,Distr,Count,Inst]),
  write_stats_list(S,Pairs).

/* m_step(Model0,SS,Model): maximization step. For every rule of Model0
that has an entry d(Distr,_,_) in the red-black tree SS, the head
annotations are replaced by the elements of Distr divided by their sum.
A rule with no entry in SS, or whose expected counts sum to zero, keeps
its current annotations: dividing by a zero total would raise an
evaluation error or give meaningless parameters. */
m_step([],_SS,[]):-!.

m_step([rule(N,V,NH,HL,BL,LogF)|T],SS,[rule(N,V,NH,HL1,BL,LogF)|T1]):-
  (rb_lookup(N,d(Distr,_NBT,_NI),SS),
   sum_list(Distr,NBT),
   NBT=\=0 ->
    update_head(HL,Distr,NBT,HL1)
  ;
    HL1=HL
  ),
  m_step(T,SS,T1).

/* update_head(Head0,Counts,Total,Head): Head is Head0 where the annotation
of the i-th atom is the i-th element of Counts divided by Total. */
update_head([],[],_Total,[]).

update_head([Atom:_Old|Atoms],[Count|Counts],Total,[Atom:Prob|NewAtoms]):-
  Prob is Count/Total,
  update_head(Atoms,Counts,Total,NewAtoms).


/* EM end */


/* Start of computation of log likelihood and sufficient stats */
/* compute_CLL_stats(Model,DB,CLL,SuffStats1): asserts the rules of Model,
computes the log likelihood CLL and the sufficient statistics SuffStats1
of the examples DB, then retracts the asserted rules. */
compute_CLL_stats(Model,DB,CLL,SuffStats1):-
  assert_model(Model),
  compute_CLL_stats_examples(DB,CLL,SuffStats1),
  retract_model.

/* assert_model(Model): for every rule of Model asserts one rule/8 fact per
non-null head atom (through assert_rules/7) and one rule_by_num/5 fact. */
assert_model([]):-!.

assert_model([rule(Id,Vars,HeadIdxs,Head,Body,_LogF)|Rules]):-
  assert_rules(Head,0,Head,Body,HeadIdxs,Id,Vars),
  assertz(rule_by_num(Id,Vars,HeadIdxs,Head,Body)),
  assert_model(Rules).

/* retract_model: removes every rule_by_num/5 and rule/8 fact, i.e. what
assert_model/1 added. */
retract_model:-
  retractall(rule_by_num(_Id,_Vars,_HeadIdxs,_Head,_Body)),
  retractall(rule(_,_,_,_,_,_,_,_)).

/* assert_rules(Atoms,Pos,Head,Body,HeadIdxs,Id,Vars): asserts a fact
rule(Atom,Prob,Pos,Id,Vars,HeadIdxs,Head,Body) for every Atom:Prob of
Atoms, with Pos counting up from the given position. It stops at the end
of the list or when only the null atom '' is left. */
assert_rules([],_Pos,_Head,_Body,_HeadIdxs,_Id,_Vars):-!.

assert_rules(['':_Prob],_Pos,_Head,_Body,_HeadIdxs,_Id,_Vars):-!.

assert_rules([Atom:Prob|Atoms],Pos,Head,Body,HeadIdxs,Id,Vars):-
  assertz(rule(Atom,Prob,Pos,Id,Vars,HeadIdxs,Head,Body)),
  NextPos is Pos+1,
  assert_rules(Atoms,NextPos,Head,Body,HeadIdxs,Id,Vars).

/* compute_CLL_stats_examples(DB,CLL,SuffStats1): log likelihood and
sufficient statistics of the examples DB, starting from a log likelihood
of 0 and an empty red-black tree. */
compute_CLL_stats_examples(DB,CLL,SuffStats1):-
  rb_new(EmptyStats),
  compute_CLL_stats_cplint(DB,0,CLL,EmptyStats,SuffStats1).

/* get_ouptut_atoms(O): O is the list of the Name/Arity terms declared with
output/1 facts. */
get_ouptut_atoms(O):-
  findall(Name/Arity,output(Name/Arity),O).

/* generate_goal(Preds,Model,Goals0,Goals): for every Name/Arity of Preds
collects the solutions of Name(Model,...) as positive goals and the
solutions of neg(Name(Model,...)) as goals of the form \+ Atom, where the
atom has Model as extra first argument. For each predicate the positive
goals come first; everything is appended to Goals0. */
generate_goal([],_Model,Goals,Goals):-!.

generate_goal([Name/Arity|Preds],Model,Goals0,Goals):-
  functor(Template,Name,Arity),
  Template=..[Name|Args],
  Query=..[Name,Model|Args],
  findall(Query,call(Query),Positives),
  findall(\+ Query,call(neg(Query)),Negatives),
  append(Goals0,Positives,Goals1),
  append(Goals1,Negatives,Goals2),
  generate_goal(Preds,Model,Goals2,Goals).

/* compute_CLL_stats_cplint(Examples,CLL0,CLL1,Stats0,Stats1): accumulates
the log likelihood and the sufficient statistics over the list of
examples. An example is either an atom H or \+ H.
For each example the probability PG of H is computed with s/4. A positive
example contributes log(PG)*N, a negative one log(1-PG)*N, where N is
P*sample_size if a fact prob(H,P) exists and 1 otherwise. Examples whose
log would be log(0) (PG equal to 0 for a positive example, to 1 for a
negative one) are skipped and leave CLL and statistics unchanged.
Both tests are arithmetic comparisons, so that an integer or negative
zero is recognized as well. With verbosity above 3 every example is
echoed on user_error. */
compute_CLL_stats_cplint([],CLL,CLL,S,S):-!.

compute_CLL_stats_cplint([\+ H|T],CLL0,CLL1,Stats0,Stats1):-!,
  setting(verbosity,V),
  (V>3->
    write(user_error,(\+ H)),nl(user_error),flush_output
  ;
    true
  ),
  s([H],CL,CSetList,PG),!,
  (PG=:=1.0->
    CLL2=CLL0,
    Stats2=Stats0
  ;
    (prob(H,P)->
      setting(sample_size,NTot),
      N is P*NTot
    ;
      N=1
    ),
    % probability of the negative example
    PG1 is 1-PG,
    CLL2 is CLL0+log(PG1)*N,
    collect_stats_cplint_neg(CL,PG1,CSetList,N,Stats0,Stats2)
  ),
  compute_CLL_stats_cplint(T,CLL2,CLL1,Stats2,Stats1).

compute_CLL_stats_cplint([H|T],CLL0,CLL1,Stats0,Stats1):-
  setting(verbosity,V),
  (V>3->
    write(user_error,H),nl(user_error),flush_output
  ;
    true
  ),
  s([H],CL,CSetList,PG),!,
  (PG=:=0.0->
    CLL2=CLL0,
    Stats2=Stats0
  ;
    (prob(H,P)->
      setting(sample_size,NTot),
      N is P*NTot
    ;
      N=1
    ),
    CLL2 is CLL0+log(PG)*N,
    collect_stats_cplint(CL,PG,CSetList,N,Stats0,Stats2)
  ),
  compute_CLL_stats_cplint(T,CLL2,CLL1,Stats2,Stats1).


/* s(Goals,GroundLpad,CSets,Prob): short name for solve/4. */
s(Goals,GroundLpad,CSets,Prob):-
  solve(Goals,GroundLpad,CSets,Prob).

/* solve(GoalsList,GroundLpad,LDup,Prob): LDup is the list of all the
derivations of GoalsList found by inference:find_deriv_inf1/3 with the
depth given by setting depth. With no derivation Prob is 0.0 and
GroundLpad is empty. Otherwise GroundLpad describes the distinct
(Rule,Substitution) pairs occurring in the derivations and Prob is the
probability computed by compute_prob/4 for the formula built from LDup. */
solve(GoalsList,GroundLpad,LDup,Prob):-
  setting(depth,Depth),
  findall(Deriv,inference:find_deriv_inf1(GoalsList,Depth,Deriv),LDup),
  ( LDup=[] ->
      Prob=0.0,
      GroundLpad=[]
  ;   append(LDup,Choices),
      remove_head(Choices,Groundings),
      remove_duplicates(Groundings,Distinct),
      build_ground_lpad(Distinct,GroundLpad),
      build_formula(LDup,Formula,[],Vars),
      var2numbers(Vars,0,NumberedVars),
      compute_prob(NumberedVars,Formula,Prob,0)
  ).

/* collect_stats_cplint(GroundLpad,PG,CSetList,N,Stats0,Stats1): updates
the red-black tree of sufficient statistics with a positive example of
weight N and probability PG. For every (Rule,Subst,Head,Body) the entry
d(Distr,Total,Inst) of Rule is updated with cycle_head/8 and Total is
increased by N; a rule seen for the first time starts from a list of
zeros, one for each element of Head, and gets Inst = 1. */
collect_stats_cplint([],_PG,_CSetList,_N,Stats,Stats):-!.

collect_stats_cplint([(Rule,Subst,Head,_Body)|Rest],PG,CSetList,N,Stats0,Stats1):-
  ( rb_lookup(Rule,d(Counts0,Total0,Inst),Stats0) ->
      cycle_head(Counts0,Counts,Rule,Subst,0,PG,CSetList,N),
      Total is N+Total0,
      rb_update(Stats0,Rule,d(Counts,Total,Inst),StatsNext)
  ;   length(Head,NHeads),
      list0(0,NHeads,Zeros),
      cycle_head(Zeros,Counts,Rule,Subst,0,PG,CSetList,N),
      rb_insert(Stats0,Rule,d(Counts,N,1),StatsNext)
  ),
  collect_stats_cplint(Rest,PG,CSetList,N,StatsNext,Stats1).

/* collect_stats_cplint_neg(GroundLpad,PG,CSetList,N,Stats0,Stats1):
counterpart of collect_stats_cplint/6 for negative examples: the
per-head statistics are updated with cycle_head_neg/9, which also needs
the number of elements of the head. */
collect_stats_cplint_neg([],_PG,_CSetList,_N,Stats,Stats):-!.

collect_stats_cplint_neg([(Rule,Subst,Head,_Body)|Rest],PG,CSetList,N,Stats0,Stats1):-
  length(Head,NHeads),
  ( rb_lookup(Rule,d(Counts0,Total0,Inst),Stats0) ->
      cycle_head_neg(Counts0,Counts,Rule,Subst,0,NHeads,PG,CSetList,N),
      Total is N+Total0,
      rb_update(Stats0,Rule,d(Counts,Total,Inst),StatsNext)
  ;   list0(0,NHeads,Zeros),
      cycle_head_neg(Zeros,Counts,Rule,Subst,0,NHeads,PG,CSetList,N),
      rb_insert(Stats0,Rule,d(Counts,N,1),StatsNext)
  ),
  collect_stats_cplint_neg(Rest,PG,CSetList,N,StatsNext,Stats1).

/* build_formula(LC,Formula,VarIn,VarOut) takes as input a list of C sets
LC and a list of variables VarIn and returns the formula and a new list
of variables VarOut.
Formula is of the form [Term1,...,Termn]
Termi is of the form [Factor1,...,Factorm]
Factorj is of the form [Var,Value] where Var is the index of
the multivalued variable Var and Value is the index of the value
*/
/* build_formula(CSets,Formula,VarIn,VarOut,Count0,Count): same as
build_formula/4; in addition Count is Count0 plus the total number of
elements of the C sets. */
build_formula([],[],Vars,Vars,Count,Count).

build_formula([CSet|CSets],[Term|Terms],VarIn,VarOut,Count0,Count):-
  length(CSet,Size),
  Count1 is Count0+Size,
  build_term(CSet,Term,VarIn,VarMid),
  build_formula(CSets,Terms,VarMid,VarOut,Count1,Count).

/* build_formula(CSets,Formula,VarIn,VarOut): Formula has one term, built
by build_term/4, for each C set; the list of variables is threaded from
VarIn to VarOut. */
build_formula([],[],Vars,Vars).

build_formula([CSet|CSets],[Term|Terms],VarIn,VarOut):-
  build_term(CSet,Term,VarIn,VarMid),
  build_formula(CSets,Terms,VarMid,VarOut).

/* build_term(CSet,Term,VarIn,VarOut): Term contains a factor [VarIdx,Head]
for each choice (Head,Rule,Subst) of CSet, where VarIdx is the position
of (Rule,Subst) in the list of variables; a pair not yet in the list is
added at its end. Choices whose rule is the atom pruned produce no
factor. */
build_term([],[],Vars,Vars).

build_term([(_,pruned,_)|Choices],Factors,VarIn,VarOut):-!,
  build_term(Choices,Factors,VarIn,VarOut).

build_term([(Head,Rule,Subst)|Choices],[[VarIdx,Head]|Factors],VarIn,VarOut):-
  ( nth0_eq(0,VarIdx,VarIn,(Rule,Subst)) ->
      VarMid=VarIn
  ;   append(VarIn,[(Rule,Subst)],VarMid),
      % the new variable takes the first free index
      length(VarIn,VarIdx)
  ),
  build_term(Choices,Factors,VarMid,VarOut).

/* nth0_eq(PosIn,PosOut,List,El): PosOut is the position of the first
element of List that is identical (==) to El, where the first element of
List has position PosIn. Fails if there is no such element.
*/
nth0_eq(Pos,Pos,[Candidate|_Rest],El):-
  Candidate==El,!.

nth0_eq(Pos,Found,[_Skipped|Rest],El):-
  Next is Pos+1,
  nth0_eq(Next,Found,Rest,El).

/* var2numbers(Vars,N,Numbered) converts a list of couples
(Rule,Substitution) into a list of elements
[Index,NumberOfValues,ListOfProbabilities], where Index is an integer
counting up from N and the probabilities are those returned by
find_probs/3 */
var2numbers([],_Index,[]).

var2numbers([(Rule,Subst)|Vars],Index,[[Index,NValues,Probs]|Numbered]):-
  find_probs(Rule,Subst,Probs),
  length(Probs,NValues),
  Next is Index+1,
  var2numbers(Vars,Next,Numbered).

/* find_probs(Rule,Subst,Probs): Probs are the probabilities of the head
of the rule_by_num/5 fact for Rule and Subst. */
find_probs(Rule,Subst,Probs):-
  rule_by_num(Rule,Subst,_HeadIdxs,Head,_Body),
  get_probs(Head,Probs).

/* get_probs(Head,Probs): Probs is the list of the evaluated annotations
of Head. For a head of the form uniform(_:1/Num,_,_) it is a list of Num
elements, all equal to 1/Num. */
get_probs(uniform(_Atom:1/Num,_Pred,_Number),Probs):-
  Each is 1/Num,
  list_el(Num,Each,Probs).

get_probs([],[]).

get_probs([_Atom:Ann|Atoms],[Prob|Probs]):-
  Prob is Ann,
  get_probs(Atoms,Probs).

/* list_el(N,El,List): List is made of N copies of El. */
list_el(0,_El,[]):-!.

list_el(Count,El,[El|Rest]):-
  Left is Count-1,
  list_el(Left,El,Rest).

/* sum(NS,L0,L1,L2): the i-th element of L2 is the i-th element of L0 plus
NS times the i-th element of L1. */
sum(_Scale,[],[],[]):-!.

sum(Scale,[A|As],[B|Bs],[C|Cs]):-
  C is A+B*Scale,
  sum(Scale,As,Bs,Cs).

/* times(NS,L0,L1): every element of L1 is the corresponding element of L0
multiplied by NS. */
times(_Scale,[],[]):-!.

times(Scale,[A|As],[B|Bs]):-
  B is A*Scale,
  times(Scale,As,Bs).

/* End of computation of log likelihood and sufficient stats */

/* Utility predicates */
/* generate_file_names(File,FileKB,FileOut,FileL,FileLPAD): the four file
names are File followed by the extensions .kb, .rules, .l and .cpl
respectively. */
generate_file_names(File,FileKB,FileOut,FileL,FileLPAD):-
    generate_file_name(File,".kb",FileKB),
    generate_file_name(File,".l",FileL),
    generate_file_name(File,".cpl",FileLPAD),
    generate_file_name(File,".rules",FileOut).

/* generate_file_name(File,Ext,FileExt): FileExt is the name obtained by
appending the list of character codes Ext to the characters of File. */
generate_file_name(File,Ext,FileExt):-
    name(File,StemCodes),
    append(StemCodes,Ext,FullCodes),
    name(FileExt,FullCodes).


/* set(Parameter,Value): makes Value the value of setting Parameter.
Every previous value of Parameter is removed first, so exactly one
setting/2 fact for Parameter exists afterwards. Unlike a plain retract/1,
retractall/1 succeeds also when Parameter has no value yet and leaves no
choice point, so set/2 is deterministic and can introduce new
parameters. */
set(Parameter,Value):-
  retractall(setting(Parameter,_)),
  assert(setting(Parameter,Value)).

/* load_initial_model(File,Model): reads the clauses of File and turns
them into the list of rules Model; rules are numbered from 1. */
load_initial_model(File,Model):-
  open(File,read,In),
  read_clauses(In,Clauses),
  close(In),
  process_clauses(Clauses,1,_NextId,[],Model).

/* process_clauses(Clauses,N,N2,Model0,Model1): converts the list of
(Clause,VariableNames) couples produced by read_clauses/2 into a list of
terms rule(Number,Vars,HeadIndexes,HeadList,BodyList,0).
N is the number given to the first rule and N2 the first number left
unused. Model0 is the tail of the resulting list Model1.
In every rule HeadIndexes is the list 0..L-1, where L is the length of
HeadList, and Vars is [] when setting single_var is true, the list of
variable names of the clause otherwise.
The order of the clauses matters: each of them commits with a cut (or, for
the last one, is tried only after all the others). */

/* end of the input: the couple for end_of_file must be the last one */
process_clauses([(end_of_file,[])],N,N,Model,Model).

/* db(A):-B is not part of the model: A:-B is asserted as an ordinary
clause and no rule number is used */
process_clauses([((H:-B),_V)|T],N,N2,Model0,Model1):-
        H=(db(A)),!,
  assert((A:-B)),
  process_clauses(T,N,N2,Model0,Model1).

/* rule with a body whose head is a disjunction */
process_clauses([((H:-B),V)|T],N,N2,Model0,[rule(N,V1,NH,HL,BL,0)|Model1]):-
  H=(_;_),!,
  list2or(HL1,H),
  process_head(HL1,HL,VI),
  list2and(BL0,B),
  add_int_atom(BL0,BL,VI),
  length(HL,LH),
  listN(0,LH,NH),
  N1 is N+1,
  (setting(single_var,true)->
    V1=[]
  ;
    V1=V
  ),
%  assertz(rule(N,V,NH,HL,BL)),
  process_clauses(T,N1,N2,Model0,Model1).

/* rule with a body whose head is a single annotated atom */
process_clauses([((H:-B),V)|T],N,N2,Model0,[rule(N,V1,NH,HL,BL,0)|Model1]):-
  H=(_:_),!,
  list2or(HL1,H),
  process_head(HL1,HL,VI),
  list2and(BL0,B),
  add_int_atom(BL0,BL,VI),
  length(HL,LH),
  listN(0,LH,NH),
  (setting(single_var,true)->
    V1=[]
  ;
    V1=V
  ),
  N1 is N+1,
%  assertz(rule(N,V1,NH,HL,BL)),
  process_clauses(T,N1,N2,Model0,Model1).

/* rule with a body and a head with no annotation: the head is given
annotation 1.0 */
process_clauses([((H:-B),V)|T],N,N2,Model0,[rule(N,V1,NH,HL,BL,0)|Model1]):-!,
  process_head([H:1.0],HL,VI),
  list2and(BL0,B),
  add_int_atom(BL0,BL,VI),
  length(HL,LH),
  listN(0,LH,NH),
  (setting(single_var,true)->
    V1=[]
  ;
    V1=V
  ),
  N1 is N+1,
%  assertz(rule(N,V1,NH,HL,BL)),
  process_clauses(T,N1,N2,Model0,Model1).

/* fact whose head is a disjunction: the body list is empty */
process_clauses([(H,V)|T],N,N2,Model0,[rule(N,V1,NH,HL,[],0)|Model1]):-
  H=(_;_),!,
  list2or(HL1,H),
  process_head(HL1,HL,_VI),
  length(HL,LH),
  listN(0,LH,NH),
  (setting(single_var,true)->
    V1=[]
  ;
    V1=V
  ),
  N1 is N+1,
%  assertz(rule(N,V,NH,HL,[])),
  process_clauses(T,N1,N2,Model0,Model1).

/* fact made of a single annotated atom */
process_clauses([(H,V)|T],N,N2,Model0,[rule(N,V1,NH,HL,[],0)|Model1]):-
  H=(_:_),!,
  list2or(HL1,H),
  process_head(HL1,HL,_VI),
  length(HL,LH),
  listN(0,LH,NH),
  (setting(single_var,true)->
    V1=[]
  ;
    V1=V
  ),
  N1 is N+1,
%  assertz(rule(N,V,NH,HL,[])),
  process_clauses(T,N1,N2,Model0,Model1).

/* fact with no annotation: it is given annotation 1.0 */
process_clauses([(H,V)|T],N,N2,Model0,[rule(N,V1,NH,HL,[],0)|Model1]):-
  process_head([H:1.0],HL,_VI),
  length(HL,LH),
  listN(0,LH,NH),
  (setting(single_var,true)->
    V1=[]
  ;
    V1=V
  ),
  N1 is N+1,
%  assertz(rule(N,V,NH,HL,[])),
  process_clauses(T,N1,N2,Model0,Model1).


/* if the annotation in the head are not ground, the null atom is not added
and the eventual formulas are not evaluated */

/* process_head(HeadList,NewHeadList,VI): a head list whose first element
is annotated (Atom:Prob) is handled by process_head_prob/4, any other
head list by process_head_random/4. In both cases the accumulated
probability starts from 0.0. */
process_head(HeadList,NewHeadList,VI):-
    HeadList=[_Atom:_Prob|_Rest],!,
    process_head_prob(HeadList,0.0,NewHeadList,VI).

process_head(HeadList,NewHeadList,VI):-
    process_head_random(HeadList,0.0,NewHeadList,VI).

/* process_head_random(Atoms,Used,NewHead,VI): builds a head from atoms
with no annotation. Every atom gets the extra argument VI (through
add_int_atom/3) and a value drawn with random(0,1.0-Used,_), Used being
the mass assigned so far. The list is closed by the null atom '' with the
remaining mass, or 0.0 if that is negative. */
process_head_random([],Used,['':NullProb],_VI):-
  Left is 1.0-Used,
  ( Left>=0.0 ->
      NullProb=Left
  ;   NullProb=0.0
  ).

process_head_random([Atom|Atoms],Used,[NewAtom:Prob|NewHead],VI):-
  add_int_atom([Atom],[NewAtom],VI),
  Available is 1.0-Used,
  random(0,Available,Prob),
  Used1 is Used+Prob,
  process_head_random(Atoms,Used1,NewHead,VI).


/* process_head_prob(Atoms,Used,NewHead,VI): builds a head from annotated
atoms. Every atom gets the extra argument VI (through add_int_atom/3) and
its annotation is evaluated. After the last atom the null atom '' is
added with probability 1.0 minus the sum of the annotations, or 0.0 if
that is negative. */
process_head_prob([Atom:Ann],Used,[NewAtom:Prob,'':NullProb],VI):-
  add_int_atom([Atom],[NewAtom],VI),
  Prob is Ann,
  Left is 1.0-Used-Prob,
  ( Left>=0.0 ->
      NullProb=Left
  ;   NullProb=0.0
  ).

process_head_prob([Atom:Ann|Atoms],Used,[NewAtom:Prob|NewHead],VI):-
  add_int_atom([Atom],[NewAtom],VI),
  Prob is Ann,
  Used1 is Used+Prob,
  process_head_prob(Atoms,Used1,NewHead,VI).


/* add_int_atom(Literals,NewLiterals,VI): adds VI as first argument of the
atom of every literal, positive or negated with \+, except for those whose
atom satisfies inference:builtin/1, which are copied unchanged. */
add_int_atom([],[],_VI).

add_int_atom([\+ Atom|Lits],[\+ Atom|NewLits],VI):-
  inference:builtin(Atom),!,
  add_int_atom(Lits,NewLits,VI).

add_int_atom([\+ Atom|Lits],[\+ NewAtom|NewLits],VI):-!,
  Atom=..[Functor|Args],
  NewAtom=..[Functor,VI|Args],
  add_int_atom(Lits,NewLits,VI).

add_int_atom([Atom|Lits],[Atom|NewLits],VI):-
  inference:builtin(Atom),!,
  add_int_atom(Lits,NewLits,VI).

add_int_atom([Atom|Lits],[NewAtom|NewLits],VI):-
  Atom=..[Functor|Args],
  NewAtom=..[Functor,VI|Args],
  add_int_atom(Lits,NewLits,VI).

/* predicates for reading in the program clauses */
/* read_clauses(S,Clauses): reads all the clauses available on stream S;
see read_clauses_ground_body/2 for the format of Clauses. */
read_clauses(Stream,Clauses):-
    read_clauses_ground_body(Stream,Clauses).


/* read_clauses_ground_body(S,Clauses): reads terms from stream S up to
the end of file. Clauses contains a couple (Term,VariableNames) for each
term read; the last couple is the one for end_of_file. */
read_clauses_ground_body(S,[(Term,Names)|Rest]):-
  read_term(S,Term,[variable_names(Names)]),
  ( Term=end_of_file ->
      Rest=[]
  ;   read_clauses_ground_body(S,Rest)
  ).


/* listN(From,To,List): List is the list of the integers From..To-1. */
listN(End,End,[]):-!.

listN(Current,End,[Current|Rest]):-
  Next is Current+1,
  listN(Next,End,Rest).

/* list0(From,To,List): List is a list of To-From zeros. */
list0(End,End,[]):-!.

list0(Current,End,[0|Rest]):-
  Next is Current+1,
  list0(Next,End,Rest).

/* end of predicates for parsing an input file containing a program */


/* load_models(File,ModulesList): reads the models contained in File with
read_models/2; ModulesList is the list of their names. */
load_models(File,ModulesList):-
    open(File,read,In),
    read_models(In,ModulesList),
    close(In).

/* read_models(Stream,Names): reads models from Stream as long as the next
term is begin(model(Name)). The atoms of each model are loaded with
read_all_atoms/2. Names is the list of the model names, where a numeric
name is replaced by the atom made of the letter i followed by the
number. */
read_models(Stream,[ModelId|Ids]):-
    read(Stream,begin(model(RawId))),!,
    ( number(RawId) ->
        name(RawId,Digits),
        append("i",Digits,IdCodes),
        name(ModelId,IdCodes)
    ;   ModelId=RawId
    ),
    read_all_atoms(Stream,ModelId),
    read_models(Stream,Ids).

read_models(_Stream,[]).

/* read_all_atoms(Stream,Name): reads the terms of a model from Stream up
to end(model(_)) and asserts them with Name as extra first argument. A
term neg(Atom) is asserted as neg(Atom1), where Atom1 is Atom with the
extra argument.
Reading stops also at the end of the file. Without that test a model
with no closing end(model(_)) would make the predicate assert
end_of_file(Name) forever, since read/1 keeps returning end_of_file. */
read_all_atoms(Stream,Name):-
    read(Stream,At),
    At \== end_of_file,
    At \=end(model(_Name)),!,
    (At=neg(Atom)->
      Atom=..[Pred|Args],
      Atom1=..[Pred,Name|Args],
      assertz(neg(Atom1))
    ;
      At=..[Pred|Args],
      Atom1=..[Pred,Name|Args],
      assertz(Atom1)
    ),
    read_all_atoms(Stream,Name).

read_all_atoms(_S,_N).


/* list2or(List,Disjunction): relates a list to the disjunction (;) of its
elements; the empty list corresponds to true. */
list2or([],true):-!.

list2or([Single],Single):-
    Single\=(_ ; _),!.

list2or([First|Others],(First ; Disj)):-!,
    list2or(Others,Disj).

/* list2and(List,Conjunction): relates a list to the conjunction (,) of
its elements; the empty list corresponds to true. */
list2and([],true):-!.

list2and([Single],Single):-
    Single\=(_ , _),!.

list2and([First|Others],(First,Conj)):-!,
    list2and(Others,Conj).


/* write_model(Model,Stream): writes the rules of Model on Stream, each
followed by a full stop and an empty line. The variables of a rule are
numbered on a copy, so the rule itself is left unbound. */
write_model([],_Stream):-!.

write_model([rule(_Id,_Vars,_HeadIdxs,Head,Body,_LogF)|Rules],Stream):-
    copy_term((Head,Body),(HeadCopy,BodyCopy)),
    numbervars((HeadCopy,BodyCopy),0,_End),
    write_disj_clause(Stream,(HeadCopy:-BodyCopy)),
    format(Stream,".~n~n",[]),
    write_model(Rules,Stream).


/* write_disj_clause(S,(Head:-Body)): writes the head on S and, unless
Body is the empty list, ' :-', a newline and the body. */
write_disj_clause(S,(Head:-[])):-!,
  write_head(S,Head).

write_disj_clause(S,(Head:-Body)):-
  write_head(S,Head),
  write(S,' :-'),
  nl(S),
  write_body(S,Body).

/* write_head(S,Head): writes a head list on S. The extra first argument
of every atom is removed before printing. An atom with annotation 1.0 is
written alone and with no annotation; otherwise the atoms are written as
Atom:Prob separated by ' ; ', and the null atom closing the list is not
written. */
write_head(S,[Atom:1.0|_Rest]):-!,
    remove_int_atom(Atom,Plain),
    format(S,"~p",[Plain]).

write_head(S,[Atom:Prob,'':_NullProb]):-!,
    remove_int_atom(Atom,Plain),
    format(S,"~p:~f",[Plain,Prob]).

write_head(S,[Atom:Prob|Atoms]):-
    remove_int_atom(Atom,Plain),
    format(S,"~p:~f ; ",[Plain,Prob]),
    write_head(S,Atoms).

/* write_body(S,Body): writes the literals of a non-empty body on S, one
per line, each preceded by a tab and separated by commas. The extra first
argument of every atom is removed before printing. */
write_body(S,[\+ Atom]):-!,
    remove_int_atom(Atom,Plain),
    format(S,"\t\\+ ~p",[Plain]).

write_body(S,[Atom]):-!,
    remove_int_atom(Atom,Plain),
    format(S,"\t~p",[Plain]).

write_body(S,[\+ Atom|Lits]):-!,
    remove_int_atom(Atom,Plain),
    format(S,"\t\\+ ~p,~n",[Plain]),
    write_body(S,Lits).

write_body(S,[Atom|Lits]):-
    remove_int_atom(Atom,Plain),
    format(S,"\t~p,~n",[Plain]),
    write_body(S,Lits).


/* remove_int_atom(A,A1): A1 is A without its first argument. */
remove_int_atom(Atom,Plain):-
  Atom=..[Functor,_First|Args],
  Plain=..[Functor|Args].

/* build_ground_lpad(Groundings,GroundLpad): adds to every couple
(Rule,Subst) the head and the body of the matching user:rule_by_num/5
fact. */
build_ground_lpad([],[]):-!.

build_ground_lpad([(Rule,Subst)|Groundings],[(Rule,Subst,Head,Body)|Ground]):-
  user:rule_by_num(Rule,Subst,_HeadIdxs,Head,Body),
  build_ground_lpad(Groundings,Ground).


/* remove_head(Choices,Groundings): drops the head index from every
triple (HeadIdx,Rule,Subst), leaving the couple (Rule,Subst). */
remove_head([],[]).

remove_head([(_HeadIdx,Rule,Subst)|Choices],[(Rule,Subst)|Groundings]):-
  remove_head(Choices,Groundings).


/* append_all(Lists,Acc,Result): Result is Acc followed by the elements of
all the lists of Lists, in order. */
append_all([],Result,Result):-!.

append_all([List|Lists],Acc,Result):-
  append(Acc,List,Acc1),
  append_all(Lists,Acc1,Result).