%%% -*- Mode: Prolog; -*-

%  $Date: 2011-11-28 14:41:26 +0100 (Mon, 28 Nov 2011) $
%  $Revision: 6764 $
%  This file is part of ProbLog
%  http://dtai.cs.kuleuven.be/problog
%  ProbLog was developed at Katholieke Universiteit Leuven
%  Copyright 2008, 2009, 2010
%  Katholieke Universiteit Leuven
%  Main authors of this file:
%  Theofrastos Mantadelis
% Module hash_table.
% Maps tuples of form (x1,x2,...,xn) to incremental IDs.
% Ensures lookup time for a tuple is O(n), with n being the size of the tuple;
% lookup time is independent of the number of entries in the table when +Size
% is big. If +Size is not big enough, lookup time is linear per +Size entries.
% Mapping an ID back to its tuple is again constant time, but based on +TupleSize.
% Exports:
% hash_table_init(+Size, -HashTable)
% hash_table_init(+Size, +TupleSize, -HashTable)
%   Initializes a hash table with internal array size of +Size, and #tuples
%   of +TupleSize.
%   +Size ~> # of problog different prob facts.
%   +TupleSize ~> estimated tuples to be used.
% hash_table_set_domain_size(+HashTable, +Tuple, +TupleSize)
%   Useful to define that a specific +Tuple mask will have a specific internal
%   size. It also pre-initializes an array for the ID.
%   Examples: if problog fact ID1 is non-ground and we know that it has
%   1000 possible groundings then: hash_table_set_domain_size(HT, ID1, 1000).
%   If problog fact ID2 is an mvs with 5 possible values and each is non-ground
%   with 100 possible values then: hash_table_set_domain_size(HT, ID2, 5),
%   hash_table_set_domain_size(HT, (ID2,'*'), 100).
%   When omitted, the internal array will assume the defined size from its father.
% hash_table_delete(+HashTable)
%   Clears the +HashTable
% hash_table_display(+HashTable, +ColSize, +PaneSize)
%   Debug only purposes currently.
% hash_table_lookup(+HashTable, +Tuple, -ID)
% hash_table_lookup(+HashTable, -Tuple, +ID)
%   This is the lookup function. It either takes a +Tuple and returns an -ID,
%   or vice versa. Handles collisions and automatically grows the array by a
%   chain of arrays.
% hash_table_contains(+HashTable, +Tuple, -ID)
%   Similar with lookup but only checks if +Tuple has been seen and returns -ID.
% hash_table_get_entries(+HashTable, -Count)
%   Returns the # of tuples seen up to now.
% problog_key_to_tuple(+Key, -Tuple)
%   Takes a +Key of format "ID1_ID2" and makes a tuple (ID1, ID2)
% IMPORTANT: Currently it under performs for some reason...
% Public interface of the module. The export list follows the "Exports"
% section of the header comment, plus hash_table_reset/1 which is defined
% and documented further down in this file.
:- module(hash_table, [hash_table_init/2,
                       hash_table_init/3,
                       hash_table_set_domain_size/3,
                       hash_table_delete/1,
                       hash_table_reset/1,
                       hash_table_lookup/3,
                       hash_table_contains/3,
                       hash_table_get_entries/2,
                       hash_table_display/3,
                       problog_key_to_tuple/2]).

:- use_module(library(lists), [member/2]).
% General use predicates

% int(-N)
%   Enumerates the integers 0, 1, 2, ... on backtracking (never terminates
%   on its own; the caller has to cut).
int(N):-
  int(0, N).

% int(+From, -N)
%   Enumerates From, From+1, From+2, ... on backtracking.
int(N, N).
int(P, R):-
  N is P + 1,
  int(N, R).

% get_digits(+Num, -Digits)
%   Digits is the number of times Num has to be divided by 10 until it
%   drops below 10, plus one, i.e. the count of decimal digits of a
%   non-negative integer. Any Num below 10 counts as one digit.
get_digits(Num, Digits):-
  get_digits(Num, Digits, 1).

% get_digits(+Value, -Count, +SoFar): accumulator version, SoFar is the
% number of digits counted up to now.
get_digits(Value, Count, Count):-
  Value < 10, !.
get_digits(Value, Count, SoFar):-
  Next is SoFar + 1,
  Shrunk is Value / 10,
  get_digits(Shrunk, Count, Next).

% Simple Counters
% The blackboard key array_count holds the numeric ID that the next array
% will receive; it is set to 1 when the file is loaded.
:- initialization(bb_put(array_count, 1)).

% get_next_array(-ID, -Name)
%   Hands out the current value of array_count as ID, advances the counter
%   by one and returns Name, the atom made from ID with number_atom/2.
get_next_array(ID, Name):-
  bb_get(array_count, Current),
  ID = Current,
  Following is Current + 1,
  bb_put(array_count, Following),
  number_atom(Current, Name).

% get_next_identifier(+Identifier, -Next)
%   Reads the counter stored on the blackboard under Identifier, returns it
%   as Next and stores the incremented value back.
get_next_identifier(Identifier, Next):-
  bb_get(Identifier, Current),
  Next = Current,
  Bumped is Current + 1,
  bb_put(Identifier, Bumped).

% Syntactic Sugar
% get_array_name(?ID, ?Array)
%   Relates a numeric array ID to the atom used as the array's name
%   (conversion done by number_atom/2).
%   NOTE: get_next_array/2 builds names the same way; if the naming scheme
%   is changed here it must be changed there too. Schemes tried before:
%   char_code(Array, ID) and atomic_concat(array, ID, Array).
get_array_name(ArrayID, ArrayName):-
  number_atom(ArrayID, ArrayName).

% get_array_identifier(+ID, -Identifier)
%   Builds the blackboard key of a table's entry counter by appending the
%   array ID to the prefix array_identifier.
get_array_identifier(ArrayID, Key):-
  atomic_concat(array_identifier, ArrayID, Key).

% hash_table_init(+Size, -HashTable)
% hash_table_init(+Size, +RevSize, -HashTable)
%   Creates a hash table whose forward (tuple -> ID) array has Size usable
%   positions and whose reverse (ID -> tuple) array has RevSize usable
%   positions; with two arguments both sizes are Size.
%   Each array is allocated with one extra position (index Size / RevSize).
%   Collisions are handled by expanding into a new array that is kept in
%   that last array element.
%   HashTable is the database reference of the hash/5 record describing
%   the table.
hash_table_init(Size, HashTable):-
  hash_table_init(Size, Size, HashTable).

hash_table_init(Size, RevSize, HashTable):-
  Slots is Size + 1,
  get_next_array(ForwardID, Forward),
  get_array_identifier(ForwardID, Counter),
  static_array(Forward, Slots, int),
  % the entry counter starts at 1 because 0 marks an empty slot
  bb_put(Counter, 1),
  RevSlots is RevSize + 1,
  get_next_array(_, Reverse),
  static_array(Reverse, RevSlots, term),
  recordz(hash_table, hash(Forward, Size, Counter, Reverse, RevSize), HashTable).

% hash_table_expand_array(+Array, +Size, -NewArray)
%   Allocates a fresh int array NewArray with Size + 1 positions and links
%   it to Array by writing its numeric ID into Array's last position
%   (index Size).
hash_table_expand_array(Array, Size, NewArray):-
  Slots is Size + 1,
  get_next_array(ChainID, NewArray),
  static_array(NewArray, Slots, int),
  update_array(Array, Size, ChainID).

% hash_table_sub_array_init(+Array, +Index, -NewArray, +Size)
%   Allocates a fresh int array NewArray with Size + 1 positions, records
%   it in the hash_table_arrays database as a child of Array and stores its
%   numeric ID at position Index of Array.
hash_table_sub_array_init(Array, Index, NewArray, Size):-
  Slots is Size + 1,
  get_next_array(ChildID, NewArray),
  static_array(NewArray, Slots, int),
  recordz(hash_table_arrays, array(ChildID, NewArray, Size, Array), _),
  update_array(Array, Index, ChildID).

% hash_table_set_domain_size(+HashTable, +Index, +DomainSize)
%   Looks up the forward array of HashTable and delegates to
%   hash_table_set_domain_size/4 to declare the domain size for Index.
hash_table_set_domain_size(HashTable, Index, DomainSize):-
  recorded(hash_table, hash(Root, RootSize, _, _, _), HashTable),
  hash_table_set_domain_size(Root, RootSize, Index, DomainSize).

% hash_table_set_domain_size(+Array, +Size, +Index, +DomainSize)
%   Pre-creates the sub array (with DomainSize positions) hanging below the
%   position described by Index, starting the search at Array which has
%   Size usable positions. Index is one of:
%     - an integer: position in Array, or further down the chain of
%       overflow arrays when Index >= Size;
%     - '*': every position 0 .. Size-1 of Array;
%     - (Index, Rest): descend into the sub array at Index, then treat Rest.
%   Throws hash_table_exception(set_domain_size_fail(Reason)) when the
%   position already has a sub array (duplicate_definition) or when a
%   tuple prefix has no sub array yet (sub_array_missing).

% Integer index inside this array. The integer/1 guard lets '*' and
% tuples fall through instead of raising a type error in </2.
hash_table_set_domain_size(Array, Size, Index, DomainSize):-
  integer(Index),
  Index < Size, !,
  array_element(Array, Index, A),
  (A =:= 0 ->
    hash_table_sub_array_init(Array, Index, _NewArray, DomainSize)
  ;
    throw(hash_table_exception(set_domain_size_fail(duplicate_definition(Index, DomainSize))))
  ).

% Integer index beyond this array: follow (or create) the overflow chain
% kept in the last position.
hash_table_set_domain_size(Array, Size, Index, DomainSize):-
  integer(Index), !,
  NewIndex is Index - Size,
  array_element(Array, Size, SubArrayID),
  (SubArrayID =:= 0 ->
    hash_table_expand_array(Array, Size, NewArray)
  ;
    get_array_name(SubArrayID, NewArray)
  ),
  hash_table_set_domain_size(NewArray, Size, NewIndex, DomainSize).

% Wildcard: apply the definition to every position of this array.
hash_table_set_domain_size(Array, Size, Index, DomainSize):-
  Index == '*', !,
  hash_table_set_domain_size_all(0, Array, Size, DomainSize).

% Tuple whose first component lies inside this array.
hash_table_set_domain_size(Array, Size, (Index, Rest), DomainSize):-
  Index < Size, !,
  array_element(Array, Index, SubArrayID),
  (SubArrayID =:= 0 ->
    throw(hash_table_exception(set_domain_size_fail(sub_array_missing((Index, Rest), DomainSize))))
  ;
    recorded(hash_table_arrays, array(SubArrayID, SubArray, SubArraySize, Array), _)
  ),
  hash_table_set_domain_size(SubArray, SubArraySize, Rest, DomainSize).

% Tuple whose first component lies beyond this array: follow the chain.
hash_table_set_domain_size(Array, Size, (Index, Rest), DomainSize):-
  NewIndex is Index - Size,
  array_element(Array, Size, SubArrayID),
  (SubArrayID =:= 0 ->
    hash_table_expand_array(Array, Size, NewArray)
  ;
    get_array_name(SubArrayID, NewArray)
  ),
  hash_table_set_domain_size(NewArray, Size, (NewIndex, Rest), DomainSize).

% hash_table_set_domain_size_all(+From, +Array, +Size, +DomainSize)
%   Helper for the '*' case: sets the domain size for positions
%   From .. Size-1 of Array, one after the other.
hash_table_set_domain_size_all(Index, _Array, Size, _DomainSize):-
  Index >= Size, !.
hash_table_set_domain_size_all(Index, Array, Size, DomainSize):-
  hash_table_set_domain_size(Array, Size, Index, DomainSize),
  Next is Index + 1,
  hash_table_set_domain_size_all(Next, Array, Size, DomainSize).

% hash_table_delete(+HashTable)
% deletes the arrays, records, and blackboard variables related with the hashtable
%   HashTable is the database reference returned by hash_table_init/2,3.
%   The entry counter is removed from the blackboard, the forward array
%   (with its chains and sub arrays) and the reverse array are deleted and
%   finally the hash/5 record itself is erased.
hash_table_delete(HashTable):-
  recorded(hash_table, hash(Array, Size, Identifier, RevArray, RevSize), HashTable),
  bb_delete(Identifier, _),
  hash_table_delete_array(Array, Size),
  hash_table_delete_rev_array(RevArray, RevSize),
  erase(HashTable).

% hash_table_delete_array(+Array, +Size)
%   Deletes a forward array: first the overflow chain reachable through its
%   last position, then every sub array recorded as its child, and finally
%   the array itself (close_static_array/1).
hash_table_delete_array(Array, Size):-
  hash_table_delete_chain(Array, Size),
  hash_table_delete_subarrays(Array),
  close_static_array(Array).

% hash_table_delete_chain(+Array, +Size)
%   Deletes the overflow array linked from position Size of Array, if any.
%   A stored 0 means that no overflow array was ever created.
hash_table_delete_chain(Array, Size):-
  array_element(Array, Size, ChainArrayID),
  (ChainArrayID =:= 0 ->
    true
  ;
    get_array_name(ChainArrayID, ChainArray),
    hash_table_delete_array(ChainArray, Size)
  ).

% hash_table_delete_subarrays(+Array)
%   For every hash_table_arrays record naming Array as parent: erases the
%   record and deletes the child array.
%   Possible performance improvement: keep a second record keyed on the
%   parent array so that the children need not be found by scanning.
hash_table_delete_subarrays(Array):-
  forall(
    recorded(hash_table_arrays, array(_, Child, ChildSize, Array), Ref),
    ( erase(Ref),
      hash_table_delete_array(Child, ChildSize)
    )
  ).

% hash_table_delete_rev_array(+Array, +Size)
%   Deletes a reverse (ID -> tuple) array. If its last position (index
%   Size) holds the name of an overflow array, that one is deleted first;
%   afterwards the array itself is released with close_static_array/1.
%   NOTE(review): relies on array_element/3 failing for a term slot that
%   was never written - the same assumption the other rev-array predicates
%   of this file make.
hash_table_delete_rev_array(Array, Size):-
  (array_element(Array, Size, ChainArray) ->
    hash_table_delete_rev_array(ChainArray, Size)
  ;
    true
  ),
  close_static_array(Array).

% hash_table_reset(+HashTable)
% resets the table values, retains the structure
%   Every tuple stored so far (IDs 0 .. Count-1) is read back from the
%   reverse array and its slot in the forward arrays is set to 0. Then the
%   reverse arrays are reset and the entry counter is put back to 1.
%   Chains and sub arrays stay allocated.
hash_table_reset(HashTable):-
  recorded(hash_table, hash(Array, Size, Identifier, RevArray, RevSize), HashTable),
  hash_table_get_entries(HashTable, Count),
  hash_table_reset_entries(0, Count, Array, Size, RevArray, RevSize),
  hash_table_reset_rev_array(RevArray, RevSize),
  bb_put(Identifier, 1).

% hash_table_reset_entries(+Index, +Count, +Array, +Size, +RevArray, +RevSize)
%   Clears the forward slot of the tuples with IDs Index .. Count-1.
hash_table_reset_entries(Index, Count, _Array, _Size, _RevArray, _RevSize):-
  Index >= Count, !.
hash_table_reset_entries(Index, Count, Array, Size, RevArray, RevSize):-
  hash_table_element_rev_array(RevArray, RevSize, Index, Tuple),
  hash_table_reset_element(Array, Size, Tuple),
  Next is Index + 1,
  hash_table_reset_entries(Next, Count, Array, Size, RevArray, RevSize).

% hash_table_reset_element(+Array, +Size, +Tuple)
%   Sets the forward slot of Tuple back to 0 (empty). Tuple is either an
%   integer index or (Index, Rest); indices >= Size are resolved through
%   the overflow chain stored at position Size, tuple prefixes through the
%   sub arrays recorded in hash_table_arrays.

% Integer index inside this array. The integer/1 guard lets tuples reach
% the tuple clauses instead of raising a type error in </2.
hash_table_reset_element(Array, Size, Index):-
  integer(Index),
  Index < Size, !,
  update_array(Array, Index, 0).

% Integer index beyond this array: continue in the overflow array.
hash_table_reset_element(Array, Size, Index):-
  integer(Index), !,
  NewIndex is Index - Size,
  array_element(Array, Size, SubArrayID),
  get_array_name(SubArrayID, SubArray),
  hash_table_reset_element(SubArray, Size, NewIndex).

% Tuple whose first component lies inside this array: descend.
hash_table_reset_element(Array, Size, (Index, Rest)):-
  Index < Size, !,
  array_element(Array, Index, SubArrayID),
  recorded(hash_table_arrays, array(SubArrayID, SubArray, SubArraySize, Array), _),
  hash_table_reset_element(SubArray, SubArraySize, Rest).

% Tuple whose first component lies beyond this array: follow the chain.
hash_table_reset_element(Array, Size, (Index, Rest)):-
  NewIndex is Index - Size,
  array_element(Array, Size, SubArrayID),
  get_array_name(SubArrayID, SubArray),
  hash_table_reset_element(SubArray, Size, (NewIndex, Rest)).
% hash_table_reset_rev_array(+RevArray, +RevSize)
%   Clears a reverse (ID -> tuple) array and all arrays chained to it.
%   When the last position (index RevSize) names an overflow array, that
%   link is remembered, the array is reset with reset_static_array/1, the
%   link is written back and the overflow array is processed in turn.
%   An array without overflow link is simply reset.
hash_table_reset_rev_array(RevArray, RevSize):-
  array_element(RevArray, RevSize, ChainArray), !,
  reset_static_array(RevArray),
  update_array(RevArray, RevSize, ChainArray),
  hash_table_reset_rev_array(ChainArray, RevSize).
hash_table_reset_rev_array(RevArray, _RevSize):-
  reset_static_array(RevArray).

% hash_table_lookup(+HashTable, +Tuple, -ID)
% hash_table_lookup(+HashTable, -Tuple, +ID)
% lookup Tuple in HashTable and insert, return ID
% lookup ID in HashTable and return Tuple
% Known bug: If HashTable contains a Tuple of form (ID, _) looking up ID succeeds
%            and returns the SubArrayID.
%            This is safe under the assumption that ID is unique to start from.

% Forward mode: Tuple is given. The clause commits only when Tuple is
% ground, so a call with an unbound Tuple reaches the reverse mode below.
% After the ID has been found or assigned, the tuple is stored at that ID
% in the reverse array.
hash_table_lookup(HashTable, Tuple, ID):-
  ground(HashTable),
  ground(Tuple), !,
  recorded(hash_table, hash(Array, Size, Identifier, RevArray, RevSize), HashTable),
  hash_table_lookup(Array, Size, Identifier, Tuple, ID),
  hash_table_update_rev_array(RevArray, RevSize, ID, Tuple).

% Reverse mode: ID is given, Tuple is read from the reverse array.
hash_table_lookup(HashTable, Tuple, ID):-
  recorded(hash_table, hash(_Array, _Size, _Identifier, RevArray, RevSize), HashTable),
  hash_table_element_rev_array(RevArray, RevSize, ID, Tuple).

% hash_table_lookup(+Array, +Size, +Identifier, +Tuple, -ID)
%   Finds the ID of Tuple starting at Array (Size usable positions),
%   assigning the next free ID from the counter Identifier when the slot is
%   still empty. IDs are stored 1-based in the arrays (0 marks an empty
%   slot) and returned 0-based. Missing overflow arrays and sub arrays are
%   created on the way.

% Integer index inside this array. The integer/1 guard lets tuples reach
% the tuple clauses instead of raising a type error in </2.
hash_table_lookup(Array, Size, Identifier, Index, RID):-
  integer(Index),
  Index < Size, !,
  array_element(Array, Index, StoredID),
  (StoredID =:= 0 ->
    get_next_identifier(Identifier, ID),
    update_array(Array, Index, ID)
  ;
    ID = StoredID
  ),
  RID is ID - 1.

% Integer index beyond this array: follow (or create) the overflow chain.
hash_table_lookup(Array, Size, Identifier, Index, ID):-
  integer(Index), !,
  NewIndex is Index - Size,
  array_element(Array, Size, ArrayID),
  (ArrayID =:= 0 ->
    hash_table_expand_array(Array, Size, SubArray)
  ;
    get_array_name(ArrayID, SubArray)
  ),
  hash_table_lookup(SubArray, Size, Identifier, NewIndex, ID).

% Tuple whose first component lies inside this array: descend into the
% sub array, creating it with the parent's size when it does not exist.
hash_table_lookup(Array, Size, Identifier, (Index,Tuple), ID):-
  Index < Size, !,
  array_element(Array, Index, ArrayID),
  (ArrayID =:= 0 ->
    NewSize = Size,
    hash_table_sub_array_init(Array, Index, SubArray, Size)
  ;
    recorded(hash_table_arrays, array(ArrayID, SubArray, NewSize, Array), _)
  ),
  hash_table_lookup(SubArray, NewSize, Identifier, Tuple, ID).

% Tuple whose first component lies beyond this array: follow the chain.
hash_table_lookup(Array, Size, Identifier, (Index,Tuple), ID):-
  NewIndex is Index - Size,
  array_element(Array, Size, ArrayID),
  (ArrayID =:= 0 ->
    hash_table_expand_array(Array, Size, SubArray)
  ;
    get_array_name(ArrayID, SubArray)
  ),
  hash_table_lookup(SubArray, Size, Identifier, (NewIndex, Tuple), ID).

% hash_table_update_rev_array(+Array, +Size, +Index, +Tuple)
%   Stores Tuple at position Index of the reverse (ID -> tuple) array.
%   Indices >= Size live in overflow arrays: the name of the next array is
%   kept at position Size; it is reused when present and otherwise a new
%   term array with Size + 1 positions is created and linked.
hash_table_update_rev_array(Array, Size, Index, Tuple):-
  Index < Size, !,
  update_array(Array, Index, Tuple).

hash_table_update_rev_array(Array, Size, Index, Tuple):-
  NewIndex is Index - Size,
  (array_element(Array, Size, SubArray) ->
    % overflow array already exists, just continue there
    true
  ;
    SubArraySize is Size + 1,
    get_next_array(_SubArrayID, SubArray),
    static_array(SubArray, SubArraySize, term),
    update_array(Array, Size, SubArray)
  ),
  hash_table_update_rev_array(SubArray, Size, NewIndex, Tuple).

% hash_table_element_rev_array(+Array, +Size, +Index, -Tuple)
%   Reads the tuple stored for Index in the reverse array. An Index below
%   Size is read from Array itself; otherwise the search continues, with
%   Index reduced by Size, in the array named at position Size.
hash_table_element_rev_array(Array, Size, Index, Tuple):-
  ( Index < Size ->
    array_element(Array, Index, Tuple)
  ;
    Offset is Index - Size,
    array_element(Array, Size, Overflow),
    hash_table_element_rev_array(Overflow, Size, Offset, Tuple)
  ).

% hash_table_contains(+HashTable, +Tuple, -ID)
%   Succeeds with the ID of Tuple when Tuple has already been entered in
%   HashTable; nothing is inserted. Fails when HashTable is not ground.
% Known bug: if HashTable contains a Tuple of form (ID, _), asking whether
%            it contains ID succeeds.
%            This is safe under the assumption that ID is unique to start from.
hash_table_contains(HashTable, Tuple, ID):-
  ground(HashTable), !,
  recorded(hash_table, hash(Root, RootSize, _, _, _), HashTable),
  hash_table_contains(Root, RootSize, Tuple, ID).

% hash_table_contains(+Array, +Size, +Tuple, -ID)
%   Read-only search for Tuple starting at Array (Size usable positions).
%   Fails as soon as a needed slot, overflow array or sub array is empty
%   (stored value 0). Stored IDs are 1-based, the returned ID is 0-based.

% Integer index inside this array. The integer/1 guard lets tuples reach
% the tuple clauses instead of raising a type error in </2.
hash_table_contains(Array, Size, Index, RID):-
  integer(Index),
  Index < Size, !,
  array_element(Array, Index, ID),
  ID > 0,
  RID is ID - 1.

% Integer index beyond this array: continue in the overflow array.
hash_table_contains(Array, Size, Index, ID):-
  integer(Index), !,
  NewIndex is Index - Size,
  array_element(Array, Size, SubArrayID),
  SubArrayID > 0,
  get_array_name(SubArrayID, SubArray),
  hash_table_contains(SubArray, Size, NewIndex, ID).

% Tuple whose first component lies inside this array: descend.
hash_table_contains(Array, Size, (Index,Tuple), ID):-
  Index < Size, !,
  array_element(Array, Index, SubArrayID),
  SubArrayID > 0,
  recorded(hash_table_arrays, array(SubArrayID, SubArray, NewSize, Array), _),
  hash_table_contains(SubArray, NewSize, Tuple, ID).

% Tuple whose first component lies beyond this array: follow the chain.
hash_table_contains(Array, Size, (Index,Tuple), ID):-
  NewIndex is Index - Size,
  array_element(Array, Size, SubArrayID),
  SubArrayID > 0,
  get_array_name(SubArrayID, SubArray),
  hash_table_contains(SubArray, Size, (NewIndex, Tuple), ID).

% hash_table_get_entries(+HashTable, -Count)
%   Count is the number of tuples entered so far: the table's blackboard
%   counter holds the next ID to hand out, so Count is that value minus 1.
hash_table_get_entries(HashTable, Count):-
  recorded(hash_table, hash(_, _, Counter, _, _), HashTable),
  bb_get(Counter, NextID),
  Count is NextID - 1.

% hash_table_display(+HashTable, +ColSize, +PaneSize)
%   Debugging aid. Prints the table reference, entry count and counter
%   key, then the forward array structure and the stored tuples.
%   Requires a ground HashTable and integers ColSize =< PaneSize; fails
%   otherwise.
hash_table_display(HashTable, ColSize, PaneSize):-
  ground(HashTable),
  integer(ColSize),
  integer(PaneSize),
  ColSize =< PaneSize,
  recorded(hash_table, hash(Forward, FwdSize, Counter, Reverse, RevSize), HashTable),
  hash_table_get_entries(HashTable, Entries),
  format('Hash Table: ~q~n  Entries: ~d~n  Identifier: ~w~n', [HashTable, Entries, Counter]),
  hash_table_display_array(Forward, FwdSize),
  hash_table_display_rev_array(Reverse, RevSize, Counter, ColSize, PaneSize).

% hash_table_display_array(+Array, +Size)
%   Debugging aid. Prints the name and size of Array, the overflow arrays
%   chained to it and the sub arrays recorded as its children, then prints
%   each sub array recursively.
hash_table_display_array(Array, Size):-
  hash_table_get_chains(Array, Size, Chains),
  findall(SubArray, recorded(hash_table_arrays, array(_, SubArray, _, Array),_), SubArrays),
  format('Array: ~q~n  Size: ~d~n  Chains: ~q~n  Sub Arrays: ~q~n',[Array, Size, Chains, SubArrays]),
  forall(member(SubArray, SubArrays), (
    recorded(hash_table_arrays, array(_, SubArray, SubSize, Array),_),
    hash_table_display_array(SubArray, SubSize)
  )).

% hash_table_display_rev_array(+RevArray, +RevSize, +Identifier, +ColSize, +PaneSize)
%   Debugging aid. Prints name, size and chain of the reverse array, then
%   the stored tuples in columns. The width used for the index column is
%   the digit count of the current value of the counter Identifier.
hash_table_display_rev_array(RevArray, RevSize, Identifier, ColSize, PaneSize):-
  hash_table_get_chains(RevArray, RevSize, Chains),
  format('Array: ~q~n  Size: ~d~n  Chains: ~q~n', [RevArray, RevSize, Chains]),
  bb_get(Identifier, NextID),
  get_digits(NextID, Width),
  hash_table_get_elements(RevArray, RevSize, 0, Stored),
  hash_table_display_elements(0, Stored, Width, ColSize, PaneSize).

% hash_table_get_elements(+RevArray, +RevSize, +Current, -Tuples)
%   Collects the tuples stored in the reverse array from position Current
%   onwards. Collection stops at the first position below RevSize for
%   which array_element/3 does not succeed. When position RevSize is
%   reached, collection continues in the array stored there, if any.
hash_table_get_elements(RevArray, RevSize, Pos, [Tuple|More]):-
  Pos < RevSize,
  array_element(RevArray, Pos, Tuple), !,
  Following is Pos + 1,
  hash_table_get_elements(RevArray, RevSize, Following, More).
% position inside the array without a readable element: end of the list
hash_table_get_elements(_, RevSize, Pos, []):-
  Pos < RevSize, !.
% last position reached: continue in the chained array when there is one
hash_table_get_elements(RevArray, RevSize, RevSize, More):-
  array_element(RevArray, RevSize, Chained), !,
  hash_table_get_elements(Chained, RevSize, 0, More).
hash_table_get_elements(_, RevSize, RevSize, []).

% hash_table_get_chains(+Array, +Size, -Chains)
%   Chains is the list of array names reachable from Array through the
%   link kept at position Size. A link may be a numeric array ID (it is
%   then converted with get_array_name/2) or already an array name. A
%   missing link, or the value 0, ends the chain.
hash_table_get_chains(Array, Size, Chains):-
  ((array_element(Array, Size, ChainID), ChainID \== 0) ->
    (integer(ChainID) ->
      get_array_name(ChainID, ChainName)
    ;
      ChainName = ChainID
    ),
    hash_table_get_chains(ChainName, Size, RestChains),
    Chains = [ChainName|RestChains]
  ;
    Chains = []
  ).

% hash_table_display_elements(+Index, +Elements, +Digits, +ColSize, +PaneSize)
%   Debugging aid. Prints the list Elements as "Index = Element" cells,
%   numbering from Index. Each row holds integer(PaneSize / ColSize) cells;
%   Digits is the width reserved for the index. A final newline is printed
%   after the last element.
hash_table_display_elements(_Index, [], _Digits, _ColSize, _PaneSize):-
  format('~n',[]), !.
hash_table_display_elements(Index, [Element|Others], Digits, ColSize, PaneSize):-
  Column is Index mod integer(PaneSize / ColSize),
  CellWidth is ColSize - Digits - 3,
  % start a new row before every first cell of a row, except the very first
  ( Column =< 0, Index =\= 0 ->
    format('~n',[])
  ;
    true
  ),
  format('~t~d~*+ = ~q~*+', [Index, Digits, Element, CellWidth]),
  Following is Index + 1,
  hash_table_display_elements(Following, Others, Digits, ColSize, PaneSize).

% problog_key_to_tuple(+Key, -Tuple)
% This should be removed in new implementation
%   An integer Key is returned unchanged. Otherwise Key is an atom of the
%   form 'ID1_ID2' and Tuple is (ID1, ID2) with both parts converted to
%   numbers. The key is split at its first underscore.
%   The text is handled as character codes (atom_codes/2, number_codes/2)
%   so that the separator code 95 matches whether or not atom_chars/2
%   yields one-character atoms.
problog_key_to_tuple(Key, Key):-
  integer(Key), !.
problog_key_to_tuple(Key, (PID, SID)):-
  atom_codes(Key, ID_Codes),
  break_list_at(ID_Codes, 95, Part1, Part2), % 95 = '_'
  number_codes(PID, Part1),
  number_codes(SID, Part2).

% break_list_at(+List, +At, -Before, -After)
%   Splits List at the first element that unifies with At: Before gets the
%   elements in front of it, After the elements behind it. The separator
%   itself is dropped. Fails when no element unifies with At.
break_list_at([First|Others], Separator, Prefix, Suffix):-
  First = Separator,
  Prefix = [],
  Suffix = Others, !.
break_list_at([First|Others], Separator, [First|PrefixTail], Suffix):-
  break_list_at(Others, Separator, PrefixTail, Suffix).