This repository has been archived on 2023-08-20. You can view files and clone it, but cannot push or open issues or pull requests.
yap-6.3/library/MYDDAS/myddas_prolog2sql.ypp
tiagosoares 174a2c4518 MYDDAS: Enhanced statistics ability
git-svn-id: https://yap.svn.sf.net/svnroot/yap/trunk@1628 b08c6af1-5177-4d33-ba66-4b1c6b8b522a
2006-05-03 18:02:29 +00:00

1374 lines
44 KiB
Prolog
Executable File

% -*- Mode: Prolog -*-
% --------------------------------------------------------------------------------------
%
% This Prolog to SQL compiler may be distributed free of charge provided that it is
% not used in commercial applications without written consent of the author, and
% that the copyright notice remains unchanged.
%
% (C) Copyright by Christoph Draxler, Munich
% Version 1.1 of Dec. 21st 1992
%
% I would like to keep in my hands the further development and distribution of the
% compiler. This does not mean that I don't want other people to suggest or even
% implement improvements - quite on the contrary: I greatly appreciate contributions
% and if they make sense to me I will incorporate them into the compiler (with due
% credits given!).
%
% For further development of the compiler, address your requests, comments and
% criticism to the author:
%
% Christoph Draxler
% CIS Centre for Information and Speech Processing
% Ludwig-Maximilians-University Munich
% Wagmuellerstr. 23
% D 80538 Munich
% Tel : ++49 / +89 / 211 06 64 (-60)
% Fax : ++49 / +89 / 211 06 74
% Mail: draxler@cis.uni-muenchen.de
%
%
% A report describing the implementation is available upon request from the
% author.
%
%
% RELEASE INFORMATION
% ===================
% Current version is v. 1.1 of Dec. 21st 1992.
% Version 1.0 Sept. 3 1992
% --------------------------------------------------------------------------------------
:- module(myddas_prolog2sql,[
translate/3,
queries_atom/2
]).
:- use_module(lists,[
append/3,
member/2
]).
:- use_module(myddas_prolog2sql_optimizer,[
optimize_sql/2
]).
% --------------------------------------------------------------------------------------
%
% Top level predicate translate/3 organizes the compilation and constructs a
% Prolog term representation of the SQL query.
%
% --------------------------------------------------------------------------------------
#ifdef MYDDAS_STATS
translate(ProjectionTerm,DatabaseGoal,SQLQueryTermOpt):-
c_db_stats_walltime(Start),
translate_(ProjectionTerm,DatabaseGoal,SQLQueryTermOpt),
c_db_stats_walltime(End),
c_db_stats_translate(Start,End).
translate_(ProjectionTerm,DatabaseGoal,SQLQueryTermOpt):-
#else
translate(ProjectionTerm,DatabaseGoal,SQLQueryTermOpt):-
#endif
% --- initialize variable identifiers and range variables for relations -----
init_gensym(var),
init_gensym(rel),
% --- tokenize projection term and database goal ----------------------------
tokenize_term(DatabaseGoal,TokenDatabaseGoal),
tokenize_term(ProjectionTerm,TokenProjectionTerm),
% --- lexical analysis: reordering of goals for disjunctive normalized form -
disjunction(TokenDatabaseGoal,Disjunction),
% --- code generation ---------------------------------------------------------------
query_generation(Disjunction,TokenProjectionTerm,SQLQueryTerm),
% --- optimize sql ------------------------------------------------------------------
optimize_sql(SQLQueryTerm,SQLQueryTermOpt).
% --- disjunction(Goal,Disjunction) ----------------------------------------------------
%
% turns original goal into disjunctive normalized form by computing all conjunctions
% and collecting them in a list
%
% --------------------------------------------------------------------------------------
disjunction(Goal,Disjunction):-
findall(Conjunction,linearize(Goal,Conjunction),Disjunction).
% --- linearize(Goal,ConjunctionList) --------------------------------------------------
%
% Returns a conjunction of base goals for a complex disjunctive or conjunctive goal
% Yields several solutions upon backtracking for disjunctive goals
%
% --------------------------------------------------------------------------------------
linearize(((A,B),C),(LinA,(LinB,LinC))):-
% --- transform left-linear to right-linear conjunction (',' is associative) ----
linearize(A,LinA),
linearize(B,LinB),
linearize(C,LinC).
linearize((A,B),(LinA,LinB)):-
A \= (_,_),
% --- make sure A is not a conjunction ------------------------------------------
linearize(A,LinA),
linearize(B,LinB).
% ILP
%linearize((A;B),LinA):-
linearize((A;_),LinA):-
linearize(A,LinA).
% ILP
%linearize((A;B),LinB):-
linearize((_;B),LinB):-
linearize(B,LinB).
linearize(not A, not LinA):-
linearize(A,LinA).
linearize(Var^A, Var^LinA):-
linearize(A,LinA).
linearize(A,A):-
A \= (_,_),
A \= (_;_),
A \= _^_,
A \= not(_).
% --- tokenize_term(Term,TokenizedTerm) -------------------------------------------------
%
% If Term is a
%
% - variable, then this variable is instantiated with a unique identifier
% of the form '$var$'(VarId), and TokenizedTerm is bound to the same
% term '$var$'(VarId).
%
% - constant, then TokenizedTerm is bound to '$const$'(Term).
%
% - complex term, then the term is decomposed, its arguments are tokenized,
% and TokenizedTerm is bound to the result of the composition of the original
% functor and the tokenized arguments.
%
% --------------------------------------------------------------------------------------
tokenize_term('$var$'(VarId),'$var$'(VarId)):-
var(VarId),
% --- uninstantiated variable: instantiate it with unique identifier.
gensym(var,VarId).
tokenize_term('$var$'(VarId),'$var$'(VarId)):-
nonvar(VarId).
tokenize_term(Constant,'$const$'(Constant)):-
nonvar(Constant),
functor(Constant,_,0).
tokenize_term(Term,TokenizedTerm):-
nonvar(Term),
Term \= '$var$'(_),
Term \= '$const$'(_),
Term =.. [Functor|Arguments],
Arguments \= [],
tokenize_arguments(Arguments,TokenArguments),
TokenizedTerm =.. [Functor|TokenArguments].
% --- tokenize_arguments(Arguments,TokenizedArguments) ---------------------------------
%
% organizes tokenization of arguments by traversing list and calling tokenize_term
% for each element of the list.
%
% --------------------------------------------------------------------------------------
tokenize_arguments([],[]).
tokenize_arguments([FirstArg|RestArgs],[TokFirstArg|TokRestArgs]):-
tokenize_term(FirstArg,TokFirstArg),
tokenize_arguments(RestArgs,TokRestArgs).
% --- query_generation(ListOfConjunctions, ProjectionTerm, ListOfQueries) --------------
%
% For each Conjunction translate the pair (ProjectionTerm,Conjunction) to an SQL query
% and connect each such query through a UNION-operator to result in the ListOfQueries.
%
% A Conjunction consists of positive or negative subgoals. Each subgoal is translated
% as follows:
% - the functor of a goal that is not a comparison operation is translated to
% a relation name with a range variable
% - negated goals are translated to NOT EXISTS-subqueries with * projection
% - comparison operations are translated to comparison operations in the WHERE-clause
% - aggregate function terms are translated to aggregate function (sub)queries
%
% The arguments of a goal are translated as follows:
% - variables of a goal are translated to qualified attributes
% - variables occurring in several goals are translated to equality comparisons
% (equi join) in the WHERE-clause
% - constant arguments are translated to equality comparisons in the WHERE-clause
%
% Special treatment of arithmetic functions:
% - arithmetic functions are identified through the Prolog is/2 operator
% - an arithmetic function may contain an unbound variable only on its left side
% - the right side of the is/2 operator may consist of
% * bound variables (bound through occurrence within a positive database goal, or
% bound through preceeding arithmetic function), or of
% * constants (numbers, i.e. integers, reals)
%
% The following RESTRICTION holds:
%
% - the binding of variables follows Prolog: variables are bound by positive base goals
% and on the left side of the is/2 predicate - comparison operations, negated goals
% and right sides of the is/2 predicate do not return variable bindings and may even
% require all arguments to be bound for a safe evaluation.
%
% --------------------------------------------------------------------------------------
query_generation([],_,[]).
query_generation([Conjunction|Conjunctions],ProjectionTerm,[Query|Queries]):-
projection_term_variables(ProjectionTerm,InitDict),
( Conjunction =.. [once|Arguments] ->
[Args] = Arguments,
translate_conjunction(Args,SQLFrom,SQLWhereTemp,InitDict,Dict),
append(SQLWhereTemp,[once],SQLWhere)
;
translate_conjunction(Conjunction,SQLFrom,SQLWhere,InitDict,Dict)
),
translate_projection(ProjectionTerm,Dict,SQLSelect),
Query = query(SQLSelect,SQLFrom,SQLWhere),
query_generation(Conjunctions,ProjectionTerm,Queries).
% --- translate_goal(Goal,SQLFrom,SQLWhere,Dict,NewDict) -------------------------------
%
% translates a
%
% - positive database goal to the associated FROM- and WHERE clause of an SQL query
% - a negated goal to a negated existential subquery
% - an arithmetic goal to an arithmetic expression or an aggregate function query
% - a comparison goal to a comparison expression
% - a negated comparison goal to a comparison expression with the opposite comparison
% operator
%
% --------------------------------------------------------------------------------------
translate_goal(SimpleGoal,[SQLFrom],SQLWhere,Dict,NewDict):-
% --- positive goal binds variables - these bindings are held in the dictionary -----
functor(SimpleGoal,Functor,Arity),
translate_functor(Functor,Arity,SQLFrom),
SimpleGoal =.. [Functor|Arguments],
translate_arguments(Arguments,SQLFrom,1,SQLWhere,Dict,NewDict).
translate_goal(Result is Expression,[],SQLWhere,Dict,NewDict):-
translate_arithmetic_function(Result,Expression,SQLWhere,Dict,NewDict).
translate_goal(not NegatedGoals,[],SQLNegatedSubquery,Dict,Dict):-
% --- negated goals do not bind variables - hence Dict is returned unchanged --------
functor(NegatedGoals,Functor,_),
not comparison(Functor,_),
translate_conjunction(NegatedGoals,SQLFrom,SQLWhere,Dict,_),
SQLNegatedSubquery = [negated_existential_subquery([*],SQLFrom,SQLWhere)].
translate_goal(not ComparisonGoal,[],SQLCompOp,Dict,Dict):-
% --- comparison operations do not bind variables - Dict is returned unchanged ------
ComparisonGoal =.. [ComparisonOperator,LeftArg,RightArg],
comparison(ComparisonOperator,SQLOperator),
negated_comparison(SQLOperator,SQLNegOperator),
translate_comparison(LeftArg,RightArg,SQLNegOperator,Dict,SQLCompOp).
%% EXAMPLE: db_prolog_select([Gene1],(once((eval(Gene1,_,_),exists(eval(Gene1),eval(Gene1,_,_)))))).
translate_goal(exists(ProjectionTerm,ExistsGoals),SQLFrom,SQLExistsSubquery,Dict,Dict):-
% --- exists goals do not bind variables - hence Dict is returned unchanged --------
functor(ExistsGoals,Functor,_),
not comparison(Functor,_),
translate_projection(ProjectionTerm,Dict,SQLSelect),
translate_conjunction(ExistsGoals,SQLFrom,SQLWhere,Dict,_),
SQLExistsSubquery = [existential_subquery(SQLSelect,SQLFrom,SQLWhere)].
translate_goal(exists(ExistsGoals),SQLFrom,SQLExistsSubquery,Dict,Dict):-
% --- exists goals do not bind variables - hence Dict is returned unchanged --------
functor(ExistsGoals,Functor,_),
not comparison(Functor,_),
translate_conjunction(ExistsGoals,SQLFrom,SQLWhere,Dict,_),
SQLExistsSubquery = [existential_subquery([*],SQLFrom,SQLWhere)].
translate_goal(ComparisonGoal,[],SQLCompOp,Dict,Dict):-
% --- comparison operations do not bind variables - Dict is returned unchanged ------
ComparisonGoal =.. [ComparisonOperator,LeftArg,RightArg],
comparison(ComparisonOperator,SQLOperator),
translate_comparison(LeftArg,RightArg,SQLOperator,Dict,SQLCompOp).
%DISTINCT
translate_goal(distinct(Goal),List,SQL,Dict,DistinctDict):-!,
translate_goal(Goal,List,SQL,Dict,NewDict),
add_distinct_statement(NewDict,DistinctDict).
%DEBUG
add_distinct_statement(Dict,Dict):-
append([_],[1,2],_).
% --- translate_conjunction(Conjunction,SQLFrom,SQLWhere,Dict,NewDict) -----------------
%
% translates a conjunction of goals (represented as a list of goals preceeded by
% existentially quantified variables) to FROM- and WHERE-clause of an SQL query.
% A dictionary containing the associated SQL table and attribute names is built up
% as an accumulator pair (arguments Dict and NewDict)
%
% --------------------------------------------------------------------------------------
translate_conjunction('$var$'(VarId)^Goal,SQLFrom,SQLWhere,Dict,NewDict):-
#ifdef DEBUG_TRANSLATE
write('translate_conjuntion clause 1'),nl,
#endif
% --- add info on existentially quantified variables to dictionary here -------------
add_to_dictionary(VarId,_,_,_,existential,Dict,TmpDict),
translate_conjunction(Goal,SQLFrom,SQLWhere,TmpDict,NewDict).
translate_conjunction(Goal,SQLFrom,SQLWhere,Dict,NewDict):-
#ifdef DEBUG_TRANSLATE
write('translate_conjuntion clause 2'),nl,
#endif
Goal \= (_,_),
translate_goal(Goal,SQLFrom,SQLWhere,Dict,NewDict).
translate_conjunction((Goal,Conjunction),SQLFrom,SQLWhere,Dict,NewDict):-
#ifdef DEBUG_TRANSLATE
write('translate_conjuntion clause 3'),nl,
#endif
translate_goal(Goal,FromBegin,WhereBegin,Dict,TmpDict),
translate_conjunction(Conjunction,FromRest,WhereRest,TmpDict,NewDict),
append(FromBegin,FromRest,SQLFrom),
append(WhereBegin,WhereRest,SQLWhere).
% --- translate_arithmetic_function(Result,Expression,SQLWhere,Dict,NewDict) -----------
%
% Arithmetic functions (left side of is/2 operator is bound to value of expression on
% right side) may be called with either
%
% - Result unbound: then Result is bound to the value of the evaluation of Expression
% - Result bound: then an equality condition is returned between the value of Result
% and the value of the evaluation of Expression.
%
% Only the equality test shows up in the WHERE clause of an SQLquery.
%
% --------------------------------------------------------------------------------------
translate_arithmetic_function('$var$'(VarId),Expression,[],Dict,NewDict):-
% assigment of value of arithmetic expression to variable - does not
% show up in WHERE-part, but expression corresponding to
% variable must be stored in Dict for projection translation
evaluable_expression(Expression,Dict,ArithExpression,Type),
add_to_dictionary(VarId,is,ArithExpression,Type,all,Dict,NewDict).
translate_arithmetic_function('$var$'(VarId),Expression,ArithComparison,Dict,Dict):-
% --- test whether left side evaluates to right side: return equality comparison ----
% Left side consists of qualified attribute, i.e. range variable must not be
% arithmetic operator is/2
lookup(VarId,Dict,PrevRangeVar,PrevAtt,PrevType),
not (PrevRangeVar = is),
% test whether type of attribute is numeric - if not, there's no sense in
% continuing the translation
%type_compatible(PrevType,number),
evaluable_expression(Expression,Dict,ArithExpression,ExprType),
%type_compatible(ExprType,number),
ArithComparison = [comp(att(PrevRangeVar,PrevAtt),'=',ArithExpression)].
translate_arithmetic_function('$var$'(VarId),Expression,ArithComparison,Dict,Dict):-
% --- test whether left side evaluates to right side: return equality comparison ----
% Left side consists of arithmetic expression, i.e. VarId is stored in Dict as
% belonging to arithmetic expression which is expressed as RangeVar-argument
% of lookup returning is/2. Type information is implicit through the is/2 functor
lookup(VarId,Dict,is,LeftExpr,Type),
%type_compatible(Type,number),
evaluable_expression(Expression,Dict,RightExpr,ExprType),
%type_compatible(ExprType,number),
ArithComparison = [comp(LeftExpr,'=',RightExpr)].
translate_arithmetic_function('$const$'(Constant),Expression,ArithComparison,Dict,Dict):-
% --- is/2 used to test whether left side evaluates to right side -------------------
get_type('$const$'(Constant),ConstantType),
%type_compatible(ConstantType,number),
evaluable_expression(Expression,Dict,ArithExpression,ExprType),
%type_compatible(ExprType,number),
ArithComparison = [comp('$const$'(Constant),'=',ArithExpression)].
% --- translate_comparison(LeftArg,RightArg,CompOp,Dict,SQLComparison) ---------
%
% translates the left and right arguments of a comparison term into the
% appropriate comparison operation in SQL. The result type of each
% argument expression is checked for type compatibility
%
% ------------------------------------------------------------------------------
translate_comparison(LeftArg,RightArg,CompOp,Dict,Comparison):-
evaluable_expression(LeftArg,Dict,LeftTerm,LeftArgType),
evaluable_expression(RightArg,Dict,RightTerm,RightArgType),
%type_compatible(LeftArgType,RightArgType),
Comparison = [comp(LeftTerm,CompOp,RightTerm)].
% --- translate_functor(Functor,QualifiedTableName) ------------------------------------
%
% translate_functor searches for the matching relation table name for
% a given functor and creates a unique range variable to result in
% a unique qualified relation table name.
%
% --------------------------------------------------------------------------------------
translate_functor(Functor,Arity,rel(TableName,RangeVariable)):-
relation(Functor,Arity,TableName),
gensym(rel,RangeVariable).
% --- translate_arguments(Arguments,RelTable,ArgPos,Conditions,Dict) -------------------
%
% translate_arguments organizes the translation of term arguments. One
% term argument after the other is taken from the list of term arguments
% until the list is exhausted.
%
% --------------------------------------------------------------------------------------
translate_arguments([],_,_,[],Dict,Dict).
translate_arguments([Arg|Args],SQLTable,Position,SQLWhere,Dict,NewDict):-
translate_argument(Arg,SQLTable,Position,Where,Dict,TmpDict),
NewPosition is Position + 1,
translate_arguments(Args,SQLTable,NewPosition,RestWhere,TmpDict,NewDict),
append(Where,RestWhere,SQLWhere).
% --- translate_argument(Argument,RelTable,Position,Condition,Dict) --------------------
%
% The first occurrence of a variable leads to its associated SQL attribute information
% to be recorded in the Dict. Any further occurrence creates an equi-join condition
% between the current attribute and the previously recorded attribute.
% Constant arguments always translate to equality comparisons between an attribute and
% the constant value.
%
% --------------------------------------------------------------------------------------
translate_argument('$var$'(VarId),rel(SQLTable,RangeVar),Position,[],Dict,NewDict):-
attribute(Position,SQLTable,Attribute,Type),
add_to_dictionary(VarId,RangeVar,Attribute,Type,all,Dict,NewDict).
translate_argument('$var$'(VarId),rel(SQLTable,RangeVar),Position,AttComparison,Dict,Dict):-
% --- Variable occurred previously - retrieve first occurrence data from dictionary -
lookup(VarId,Dict,PrevRangeVar,PrevAtt,PrevType),
attribute(Position,SQLTable,Attribute,Type),
% type_compatible(PrevType,Type),
AttComparison = [comp(att(RangeVar,Attribute),=,att(PrevRangeVar,PrevAtt))].
translate_argument('$const$'(Constant),rel(SQLTable,RangeVar),Position,ConstComparison,Dict,Dict):-
% --- Equality comparison of constant value and attribute in table ------------------
attribute(Position,SQLTable,Attribute,Type),
%get_type('$const$'(Constant),ConstType),
%type_compatible(ConstType,Type),
ConstComparison = [comp(att(RangeVar,Attribute),=,'$const$'(Constant))].
% --- projection_term_variables(ProjectionTerm,Dict) -----------------------------------
%
% extracts all variables from the ProjectionTerm and places them into the
% Dict as a dict/4 term with their Identifier, a non instantiated RangeVar and
% Attribute argument, and the keyword existential for the type of quantification
%
% --------------------------------------------------------------------------------------
%% ERRO??
%projection_term_variables('$const(_)$',[]).
projection_term_variables('$const$'(_),[]).
projection_term_variables('$var$'(VarId),[dict(VarId,_,_,_,existential)]).
projection_term_variables(ProjectionTerm,ProjectionTermVariables):-
ProjectionTerm =.. [Functor|ProjectionTermList],
not (Functor = '$var$'),
not (ProjectionTermList = []),
projection_list_vars(ProjectionTermList,ProjectionTermVariables).
projection_list_vars([],[]).
projection_list_vars(['$var$'(VarId)|RestArgs],[dict(VarId,_,_,_,existential)|RestVars]):-
projection_list_vars(RestArgs,RestVars).
projection_list_vars(['$const$'(_)|RestArgs],Vars):-
projection_list_vars(RestArgs,Vars).
% --------------------------------------------------------------------------------------
% RESTRICTION! ProjectionTerm underlies the following restrictions:
%
% - ProjectionTerm must have a functor other than the built-in
% operators, i.e. ',',';', etc. are not allowed
%
% - only variables and constants are allowed as arguments,
% i.e. no structured terms
%
% --------------------------------------------------------------------------------------
translate_projection('$var$'(VarId),Dict,SelectList):-
projection_arguments(['$var$'(VarId)],SelectList,Dict).
translate_projection('$const$'(Const),_,['$const$'(Const)]).
translate_projection(ProjectionTerm,Dict,SelectList):-
ProjectionTerm =.. [Functor|Arguments],
not (Functor = '$var$'),
not (Functor = '$const$'),
not (Arguments = []),
projection_arguments(Arguments,SelectList,Dict).
projection_arguments([],[],_).
projection_arguments([Arg|RestArgs],[Att|RestAtts],Dict):-
retrieve_argument(Arg,Att,Dict),
projection_arguments(RestArgs,RestAtts,Dict).
% - retrieve_argument(Argument,SQLAttribute,Dictionary) --------------------------------
%
% retrieves the mapping of an argument to the appropriate SQL construct, i.e.
%
% - qualified attribute names for variables in base goals
% - arithmetic expressions for variables in arithmetic goals
% - constant values for constants
%
% --------------------------------------------------------------------------------------
retrieve_argument('$var$'(VarId),Attribute,Dict):-
lookup(VarId,Dict,TableName,AttName,_),
(
TableName = is ->
Attribute = AttName
;
Attribute = att(TableName,AttName)
).
retrieve_argument('$const$'(Constant),'$const$'(Constant),_).
% --- lookup(Key,Dict,Value) -----------------------------------------------------------
lookup(VarId,Dict,RangeVar,Attribute,Type):-
member(dict(VarId,RangeVar,Attribute,Type,Quant),Dict),
(
Quant = all ->
true
;
nonvar(RangeVar),
nonvar(Attribute)
).
% --- add_to_dictionary(Key,RangeVar,Attribute,Quantifier,Dict,NewDict) ----------------
add_to_dictionary(Key,RangeVar,Attribute,Type,_,Dict,Dict):-
member(dict(Key,RangeVar,Attribute,Type,existential),Dict).
add_to_dictionary(Key,RangeVar,Attribute,Type,Quantifier,Dict,NewDict):-
not member(dict(Key,_,_,_,_),Dict),
NewDict = [dict(Key,RangeVar,Attribute,Type,Quantifier)|Dict].
% --- aggregate_function(AggregateFunctionTerm,Dict,AggregateFunctionQuery) ------------
%
% aggregate_function discerns five Prolog aggregate function terms: count, avg, min,
% max, and sum. Each such term is has two arguments: a variable indicating the attribute
% over which the function is to be computed, and a goal argument which must contain in
% at least one argument position the variable:
%
% e.g. avg(Seats,plane(Type,Seats))
%
% These aggregate function terms correspond to the SQL built-in aggregate functions.
%
% RESTRICTION: AggregateGoal may only be conjunction of (positive or negative) base
% goals
%
% --------------------------------------------------------------------------------------
aggregate_function(AggregateFunctionTerm,Dict,AggregateFunctionExpression):-
AggregateFunctionTerm =..[AggFunctor,AggVar,AggGoal],
aggregate_functor(AggFunctor,SQLFunction),
conjunction(AggGoal,AggConjunction),
aggregate_query_generation(SQLFunction,AggVar,AggConjunction,Dict,AggregateFunctionExpression).
conjunction(Goal,Conjunction):-
disjunction(Goal,[Conjunction]).
% --- aggregate_query_generation(Function,FunctionVariable,AggGoal,Dict,AggregateQuery)
%
% compiles the function variable (representing the attribute over which the aggregate
% function is to be computed) and the aggregate goal (representing the selection and
% join conditions for the computation of the aggregate function) to an SQL aggregate
% function subquery.
%
% --------------------------------------------------------------------------------------
% ILP
% aggregate_query_generation(count,'$const$'('*'),AggGoal,Dict,AggregateQuery):-
% translate_conjunction(AggGoal,SQLFrom,SQLWhere,Dict,TmpDict),
% AggregateQuery = agg_query(Function,(count,['$const$'(*)]),SQLFrom,SQLWhere,[]).
aggregate_query_generation(count,'$const$'('*'),AggGoal,Dict,AggregateQuery):-
translate_conjunction(AggGoal,SQLFrom,SQLWhere,Dict,_),
% ATTENTION! It is assumed that in count(*) aggregate query terms there cannot be
% free variables because '*' stands for "all arguments"
AggregateQuery = agg_query(_,(count,['$const$'(*)]),SQLFrom,SQLWhere,[]).
%DISTINCT
aggregate_query_generation(countdistinct,'$const$'('*'),AggGoal,Dict,AggregateQuery):-
translate_conjunction(AggGoal,SQLFrom,SQLWhere,Dict,_),
% ATTENTION! It is assumed that in count(*) aggregate query terms there cannot be
% free variables because '*' stands for "all arguments"
AggregateQuery = agg_query(_,(countdistinct,['$const$'(*)]),SQLFrom,SQLWhere,[]).
aggregate_query_generation(Function,FunctionVariable,AggGoal,Dict,AggregateQuery):-
translate_conjunction(AggGoal,SQLFrom,SQLWhere,Dict,TmpDict),
% --- only variables occurring in the aggregate goal are relevant to the translation
% of the function variable and the free variables in the goal.
% Thus subtract from TmpDict all entries of Dict
set_difference(TmpDict,Dict,AggDict),
translate_projection(FunctionVariable,AggDict,SQLSelect),
translate_grouping(FunctionVariable,AggDict,SQLGroup),
AggregateQuery = agg_query(Function,SQLSelect,SQLFrom,SQLWhere,SQLGroup).
% --- translate_grouping(FunctionVariable,Dict,SQLGroup) -------------------------------
%
% finds the free variables in the aggregate function term and collects their
% corresponding SQL qualified attributes in the SQLGroup list.
%
% --------------------------------------------------------------------------------------
translate_grouping(FunctionVariable,Dict,SQLGroup):-
free_vars(FunctionVariable,Dict,FreeVariables),
translate_free_vars(FreeVariables,SQLGroup).
% --- free_vars(FunctionVariable,Dict,FreeVarList) -------------------------------------
%
% A Variable is free if it neither occurs as the FunctionVariable, nor is stored as
% existentially quantified (through ^/2 in the original goal) in the dictionary
%
% FreeVars contains for each variable the relevant attribute and relation information
% contained in the dictionary
%
% --------------------------------------------------------------------------------------
% ILP
% free_vars(FunctionVariable,Dict,FreeVarList):-
% projection_term_variables(FunctionVariable,FunctionVariableList),
% findall((Var,Table,Attribute),
% (member(dict(Var,Table,Attribute,Type,all),Dict),
% not member(dict(Var,_,_,_,_),FunctionVariableList)
% ),
% FreeVarList).
free_vars(FunctionVariable,Dict,FreeVarList):-
projection_term_variables(FunctionVariable,FunctionVariableList),
findall((Var,Table,Attribute),
(member(dict(Var,Table,Attribute,_,all),Dict),
not member(dict(Var,_,_,_,_),FunctionVariableList)
),
FreeVarList).
% --- function_variable_list(FunctionVariable,FunctionVariableList) --------------------
%
% extracts the list of variables which occur in the function variable term
%
% RESTRICTION: FunctionVariable may only contain one single variable.
%
% --------------------------------------------------------------------------------------
function_variable_list('$var$'(VarId),[VarId]).
% --- translate_free_vars(FreeVars,SQLGroup) -------------------------------------------
%
% translates dictionary information on free variables to SQLGroup of aggregate
% function query
%
% --------------------------------------------------------------------------------------
translate_free_vars([],[]).
% ILP
%translate_free_vars([(VarId,Table,Attribute)|FreeVars],[att(Table,Attribute)|SQLGroups]):-
translate_free_vars([(_,Table,Attribute)|FreeVars],[att(Table,Attribute)|SQLGroups]):-
translate_free_vars(FreeVars,SQLGroups).
% --- evaluable_expression(ExpressionTerm,Dictionary,Expression,Type) --------------------
%
% evaluable_expression constructs SQL arithmetic expressions with qualified attribute names
% from the Prolog arithmetic expression term and the information stored in the dictionary.
%
% The type of an evaluable function is returned in the argument Type.
%
% The dictionary is not changed because it is used for lookup only.
%
evaluable_expression(AggregateFunctionTerm,Dictionary,AggregateFunctionExpression,number):-
aggregate_function(AggregateFunctionTerm,Dictionary,AggregateFunctionExpression).
evaluable_expression(LeftExp + RightExp,Dictionary,LeftAr + RightAr,number):-
evaluable_expression(LeftExp,Dictionary,LeftAr,number),
evaluable_expression(RightExp,Dictionary,RightAr,number).
evaluable_expression(LeftExp - RightExp,Dictionary,LeftAr - RightAr,number):-
evaluable_expression(LeftExp,Dictionary,LeftAr,number),
evaluable_expression(RightExp,Dictionary,RightAr,number).
evaluable_expression(LeftExp * RightExp,Dictionary,LeftAr * RightAr,number):-
evaluable_expression(LeftExp,Dictionary,LeftAr,number),
evaluable_expression(RightExp,Dictionary,RightAr,number).
evaluable_expression(LeftExp / RightExp,Dictionary, LeftAr / RightAr,number):-
evaluable_expression(LeftExp,Dictionary,LeftAr,number),
evaluable_expression(RightExp,Dictionary,RightAr,number).
evaluable_expression('$var$'(VarId),Dictionary,att(RangeVar,Attribute),Type):-
lookup(VarId,Dictionary,RangeVar,Attribute,Type),
RangeVar \= is.
evaluable_expression('$var$'(VarId),Dictionary,ArithmeticExpression,Type):-
lookup(VarId,Dictionary,is,ArithmeticExpression,Type).
evaluable_expression('$const$'(Const),_,'$const$'(Const),ConstType):-
get_type('$const$'(Const),ConstType).
% --------------------------------------------------------------------------------------
%
% Output to screen predicates - rather crude at the moment
%
% --------------------------------------------------------------------------------------
% --- printqueries(Code) ---------------------------------------------------------------
printqueries([Query]):-
nl,
print_query(Query),
write(';'),
nl,
nl.
printqueries([Query|Queries]):-
not (Queries = []),
nl,
print_query(Query),
nl,
write('UNION '),
nl,
printqueries(Queries).
% --- print_query(QueryCode) -----------------------------------------------------------
print_query(query([agg_query(Function,Select,From,Where,Group)],_,_)):-
% --- ugly rule here: aggregate function only in SELECT Part of query ----
!,
print_query(agg_query(Function,Select,From,Where,Group)).
print_query(query(Select,From,Where)):-
print_clause('SELECT',Select,','),
nl,
print_clause('FROM',From,','),
nl,
print_clause('WHERE',Where,'AND'),
nl.
print_query(agg_query(Function,Select,From,Where,Group)):-
print_clause('SELECT',Function,Select,','),
nl,
print_clause('FROM',From,','),
nl,
print_clause('WHERE',Where,'AND'),
nl,
print_clause('GROUP BY',Group,',').
print_query(negated_existential_subquery(Select,From,Where)):-
write('NOT EXISTS'),
nl,
write('('),
print_clause('SELECT',Select,','),
nl,
print_clause('FROM',From,','),
nl,
print_clause('WHERE',Where,'AND'),
nl,
write(')').
print_query(existential_subquery(Select,From,Where)):-
write('EXISTS'),
nl,
write('('),
print_clause('SELECT',Select,','),
nl,
print_clause('FROM',From,','),
nl,
print_clause('WHERE',Where,'AND'),
nl,
write(')').
% --- print_clause(Keyword,ClauseCode,Separator) ---------------------------------------
%
% with
% Keyword one of SELECT, FROM, WHERE, or GROUP BY,
% ClauseCode the code corresponding to the appropriate clause of an SQL query, and
% Separator indicating the character(s) through which the items of a clause
% are separated from each other (',' or 'AND').
%
% --------------------------------------------------------------------------------------
% ILP
% print_clause(Keyword,[],_).
print_clause(_,[],_).
print_clause(Keyword,[Column|RestColumns],Separator):-
write(Keyword),
write(' '),
print_clause([Column|RestColumns],Separator).
print_clause(Keyword,Function,[Column],Separator):-
write(Keyword),
write(' '),
write(Function),
write('('),
print_clause([Column],Separator),
write(')').
% --- print_clause(ClauseCode,Separator) -----------------------------------------------
print_clause([Item],_):-
print_column(Item).
print_clause([Item,NextItem|RestItems],Separator):-
print_column(Item),
write(' '),
write(Separator),
write(' '),
print_clause([NextItem|RestItems],Separator).
% --- print_column(ColumnCode) --------------------------------
print_column('*'):-
write('*').
print_column(att(RangeVar,Attribute)):-
write(RangeVar),
write('.'),
write(Attribute).
print_column(rel(Relation,RangeVar)):-
write(Relation),
write(' '),
write(RangeVar).
print_column('$const$'(String)):-
get_type('$const$'(String),string),
write('"'),
write(String),
write('"').
print_column('$const$'(Number)):-
get_type('$const$'(Number),NumType),
type_compatible(NumType,number),
write(Number).
print_column(comp(LeftArg,Operator,RightArg)):-
print_column(LeftArg),
write(' '),
write(Operator),
write(' '),
print_column(RightArg).
print_column(LeftExpr * RightExpr):-
print_column(LeftExpr),
write('*'),
print_column(RightExpr).
print_column(LeftExpr / RightExpr):-
print_column(LeftExpr),
write('/'),
print_column(RightExpr).
print_column(LeftExpr + RightExpr):-
print_column(LeftExpr),
write('+'),
print_column(RightExpr).
print_column(LeftExpr - RightExpr):-
print_column(LeftExpr),
write('-'),
print_column(RightExpr).
print_column(agg_query(Function,Select,From,Where,Group)):-
nl,
write('('),
print_query(agg_query(Function,Select,From,Where,Group)),
write(')').
print_column(negated_existential_subquery(Select,From,Where)):-
print_query(negated_existential_subquery(Select,From,Where)).
print_column(existential_subquery(Select,From,Where)):-
print_query(existential_subquery(Select,From,Where)).
% --- queries_atom(Queries,QueryAtom) ----------------------------
%
% queries_atom(Queries,QueryAtom) returns in its second argument
% the SQL query as a Prolog atom. For efficiency reasons, a list
% of ASCII codes is ceated as a difference list, and it is then
% transformed to an atom by name/2
% ----------------------------------------------------------------
queries_atom(Queries,QueryAtom):-
queries_atom(Queries,QueryList,[]),
name(QueryAtom,QueryList).
queries_atom([Query],QueryList,Diff):-
query_atom(Query,QueryList,Diff).
queries_atom([Query|Queries],QueryList,Diff):-
Queries \= [],
query_atom(Query,QueryList,X1),
column_atom('UNION ',X1,X2),
queries_atom(Queries,X2,Diff).
% --- query_atom(QueryCode) --------------------------------
query_atom(query([agg_query(Function,Select,From,Where,Group)],_,_),QueryList,Diff):-
% --- ugly rule here: aggregate function only in SELECT Part of query ----
!,
query_atom(agg_query(Function,Select,From,Where,Group),QueryList,Diff).
query_atom(query(Select,From,Where),QueryList,Diff):-
clause_atom('SELECT',Select,',',QueryList,X1),
clause_atom('FROM',From,',',X1,X2),
clause_atom('WHERE',Where,'AND',X2,Diff).
query_atom(agg_query(Function,Select,From,Where,Group),QueryList,Diff):-
clause_atom('SELECT',Function,Select,',',QueryList,X1),
clause_atom('FROM',From,',',X1,X2),
clause_atom('WHERE',Where,'AND',X2,X3),
%ILP : PARA NAO POR OS GROUP BYS. FAZER FLAG PARA ISTO
clause_atom('GROUP BY',Group,',',X3,Diff).
query_atom(negated_existential_subquery(Select,From,Where),QueryList,Diff):-
column_atom('NOT EXISTS(',QueryList,X1),
clause_atom('SELECT',Select,',',X1,X2),
clause_atom('FROM',From,',',X2,X3),
clause_atom('WHERE',Where,'AND',X3,X4),
column_atom(')',X4,Diff).
query_atom(existential_subquery(Select,From,Where),QueryList,Diff):-
column_atom('EXISTS(',QueryList,X1),
clause_atom('SELECT',Select,',',X1,X2),
clause_atom('FROM',From,',',X2,X3),
clause_atom('WHERE',Where,'AND',X3,X4),
column_atom('LIMIT 1)',X4,Diff).
% --- clause_atom(Keyword,ClauseCode,Junctor,CurrAtom,QueryAtom) -------------
%
% with
% Keyword one of SELECT, FROM, WHERE, or GROUP BY,
% ClauseCode the code corresponding to the appropriate clause of an SQL query, and
% Junctor indicating the character(s) through which the items of a clause
% are separated from each other (',' or 'AND').
% ILP
% clause_atom(Keyword,[],_,QueryList,QueryList).
clause_atom(_,[],_,QueryList,QueryList).
% case there is no WHERE condition
clause_atom(_,[once],_,QueryList,Diff):-!,
column_atom(' ',QueryList,X1),
column_atom('LIMIT 1',X1,X2),
column_atom(' ',X2,Diff).
clause_atom(Keyword,[Column|RestColumns],Junctor,QueryList,Diff):-
column_atom(Keyword,QueryList,X1),
column_atom(' ',X1,X2),
clause_atom([Column|RestColumns],Junctor,X2,X3),
column_atom(' ',X3,Diff).
%DISTINCT
clause_atom(Keyword,'COUNTDISTINCT',[Column],Junctor,QueryList,Diff):-!,
column_atom(Keyword,QueryList,X1),
column_atom(' ',X1,X2),
column_atom('COUNT',X2,X3),
column_atom('(DISTINCT ',X3,X4),
clause_atom([Column],Junctor,X4,X5),
column_atom(') ',X5,Diff).
clause_atom(Keyword,Function,[Column],Junctor,QueryList,Diff):-
column_atom(Keyword,QueryList,X1),
column_atom(' ',X1,X2),
column_atom(Function,X2,X3),
column_atom('(',X3,X4),
clause_atom([Column],Junctor,X4,X5),
column_atom(') ',X5,Diff).
% --- clause_atom(ClauseCode,Junctor) --------------------------------
clause_atom([once],_,QueryList,Diff):-!,
column_atom(' LIMIT 1 ',QueryList,Diff).
clause_atom([Item],_,QueryList,Diff):-
column_atom(Item,QueryList,Diff).
clause_atom([Item,NextItem|RestItems],Junctor,QueryList,Diff):-
column_atom(Item,QueryList,X1),
column_atom(' ',X1,X2),
( NextItem = once ->
X4 = X2
;
column_atom(Junctor,X2,X3),
column_atom(' ',X3,X4)
),
clause_atom([NextItem|RestItems],Junctor,X4,Diff).
column_atom(att(RangeVar,Attribute),QueryList,Diff):-
column_atom(RangeVar,QueryList,X1),
column_atom('.',X1,X2),
column_atom(Attribute,X2,Diff).
column_atom(rel(Relation,RangeVar),QueryList,Diff):-
column_atom('`',QueryList,X0),
column_atom(Relation,X0,X1),
column_atom('` ',X1,X2),
column_atom(RangeVar,X2,Diff).
column_atom('$const$'(String),QueryList,Diff):-
get_type('$const$'(String),string),
column_atom('"',QueryList,X1),
column_atom(String,X1,X2),
column_atom('"',X2,Diff).
column_atom('$const$'(Number),QueryList,Diff):-
get_type('$const$'(Number),NumType),
type_compatible(NumType,number),
column_atom(Number,QueryList,Diff).
column_atom(comp(LeftArg,Operator,RightArg),QueryList,Diff):-
column_atom(LeftArg,QueryList,X1),
column_atom(' ',X1,X2),
column_atom(Operator,X2,X3),
column_atom(' ',X3,X4),
column_atom(RightArg,X4,Diff).
column_atom(LeftExpr * RightExpr,QueryList,Diff):-
column_atom(LeftExpr,QueryList,X1),
column_atom('*',X1,X2),
column_atom(RightExpr,X2,Diff).
column_atom(LeftExpr + RightExpr,QueryList,Diff):-
column_atom(LeftExpr,QueryList,X1),
column_atom('+',X1,X2),
column_atom(RightExpr,X2,Diff).
column_atom(LeftExpr - RightExpr,QueryList,Diff):-
column_atom(LeftExpr,QueryList,X1),
column_atom('-',X1,X2),
column_atom(RightExpr,X2,Diff).
column_atom(LeftExpr / RightExpr,QueryList,Diff):-
column_atom(LeftExpr,QueryList,X1),
column_atom('/',X1,X2),
column_atom(RightExpr,X2,Diff).
column_atom(agg_query(Function,Select,From,Where,Group),QueryList,Diff):-
column_atom('(',QueryList,X1),
query_atom(agg_query(Function,Select,From,Where,Group),X1,X2),
column_atom(')',X2,Diff).
column_atom(negated_existential_subquery(Select,From,Where),QueryList,Diff):-
query_atom(negated_existential_subquery(Select,From,Where),QueryList,Diff).
column_atom(existential_subquery(Select,From,Where),QueryList,Diff):-
query_atom(existential_subquery(Select,From,Where),QueryList,Diff).
column_atom(Atom,List,Diff):-
atom(Atom),
name(Atom,X1),
append(X1,Diff,List).
column_atom(Number,List,Diff) :-
number(Number),
name(Number,X1),
append(X1,Diff,List).
% --- gensym(Root,Symbol) ----------------------------------------------------
%
% SEPIA 3.2. version - other Prolog implementations provide gensym/2
% and init_gensym/1 as built-ins. */
%
% (C) Christoph Draxler, Aug. 1992
%
%
init_gensym(Atom) :-
set_value(Atom,'@').
gensym(Atom,Var) :-
var(Var),
get_value(Atom,Value),
char_code(Value,Code),
NewCode is Code + 1,
char_code(Var,NewCode),
set_value(Atom,Var).
% --- auxiliary predicates (some of them may be built-in... --------------------
repeat_n(N):-
integer(N),
N > 0,
repeat_1(N).
repeat_1(1):-!.
repeat_1(_).
repeat_1(N):-
N1 is N-1,
repeat_1(N1).
% --- set_difference(SetA,SetB,Difference) --------------------------------------------
%
% SetA - SetB = Difference
set_difference([],_,[]).
set_difference([Element|RestSet],Set,[Element|RestDifference]):-
not member(Element,Set),
set_difference(RestSet,Set,RestDifference).
set_difference([Element|RestSet],Set,RestDifference):-
member(Element,Set),
set_difference(RestSet,Set,RestDifference).
% --- Mapping of Prolog operators to SQL operators -------------------------------------
comparison(=,=).
comparison(<,<).
comparison(=<,'<=').
comparison(>=,'>=').
comparison(>,>).
comparison(@<,<).
comparison(@>,>).
negated_comparison(=,'<>').
negated_comparison(\=,=).
negated_comparison(>,'<=').
negated_comparison(=<,>).
negated_comparison(<,>=).
negated_comparison(>=,<).
% --- aggregate_function(PrologFunctor,SQLFunction) -----------------
aggregate_functor(avg,'AVG').
aggregate_functor(min,'MIN').
aggregate_functor(max,'MAX').
aggregate_functor(sum,'SUM').
aggregate_functor(count,'COUNT').
aggregate_functor(countdistinct,'COUNTDISTINCT').
% --- type system --------------------------------------------------------------
%
% A rudimentary type system is provided for consistency checking during the
% translation and for output formatting
%
% The basic types are string and number. number has the subtypes integer and
% real.
%
% ------------------------------------------------------------------------------
type_compatible(Type,Type):-
is_type(Type).
type_compatible(SubType,Type):-
subtype(SubType,Type).
type_compatible(Type,SubType):-
subtype(SubType,Type).
% --- subtype(SubType,SuperType) -----------------------------------------------
%
% Simple type hierarchy checking
%
% ------------------------------------------------------------------------------
subtype(SubType,SuperType):-
is_subtype(SubType,SuperType).
subtype(SubType,SuperType):-
is_subtype(SubType,InterType),
subtype(InterType,SuperType).
% --- is_type(Type) ------------------------------------------------------------
%
% Type names
%
% ------------------------------------------------------------------------------
is_type(number).
is_type(integer).
is_type(real).
is_type(string).
is_type(natural).
% --- is_subtype(SubType,SuperType) --------------------------------------------
%
% Simple type hierarchy for numeric types
%
% ------------------------------------------------------------------------------
is_subtype(integer,number).
is_subtype(real,number).
is_subtype(natural,integer).
% --- get_type(Constant,Type) --------------------------------------------------
%
% Prolog implementation specific definition of type retrieval
% sepia Prolog version given here
%
% ------------------------------------------------------------------------------
get_type('$const$'(Constant),integer):-
integer(Constant),!.
get_type('$const$'(Constant),real):-
number(Constant),!.
get_type('$const$'(Constant),string):-
atom(Constant).