500 lines
		
	
	
		
			22 KiB
		
	
	
	
		
			Prolog
		
	
	
	
	
	
			
		
		
	
	
			500 lines
		
	
	
		
			22 KiB
		
	
	
	
		
			Prolog
		
	
	
	
	
	
| /* XML Utilities
 | |
| 
 | |
|  *
 | |
| 
 | |
|  * Copyright (C) 2001-2005 Binding Time Limited
 | |
| 
 | |
|  * Copyright (C) 2005-2011 John Fletcher
 | |
| 
 | |
|  *
 | |
| 
 | |
|  * Current Release: $Revision: 3.4 $
 | |
| 
 | |
|  * 
 | |
| 
 | |
|  * TERMS AND CONDITIONS:
 | |
| 
 | |
|  *
 | |
| 
 | |
|  * This program is offered free of charge, as unsupported source code. You may
 | |
| 
 | |
|  * use it, copy it, distribute it, modify it or sell it without restriction,
 | |
| 
 | |
|  * but entirely at your own risk.
 | |
| 
 | |
|  */
 | |
| 
 | |
| 
 | |
| 
 | |
| % Entity and Namespace map operations: these maps are usually quite small, so
 | |
| 
 | |
| % a linear list lookup is okay. They could be substituted by a logarithmic
 | |
| 
 | |
| % data structure - in extremis.
 | |
| 
 | |
| 
 | |
| 
 | |
| /* empty_map( ?Map ) is true if Map is a null map.
 | |
| 
 | |
|  */
 | |
| 
 | |
| empty_map( [] ).
 | |
| 
 | |
| 
 | |
| 
 | |
| /* map_member( +Key, +Map, ?Data ) is true if Map is a ordered map structure
 | |
| 
 | |
|  * which records the pair Key-Data. Key must be ground.
 | |
| 
 | |
|  */
 | |
| 
 | |
| map_member( Key0, [Key1-Data1|Rest], Data0 ) :-
 | |
| 
 | |
| 	( Key0 == Key1 ->
 | |
| 
 | |
| 		Data0 = Data1
 | |
| 
 | |
| 	; Key0 @> Key1 ->
 | |
| 
 | |
| 		map_member( Key0, Rest, Data0 )
 | |
| 
 | |
| 	).
 | |
| 
 | |
| 
 | |
| 
 | |
| /* map_store( +Map0, +Key, +Data, ?Map1 ) is true if Map0 is an ordered map
 | |
| 
 | |
|  * structure, Key must be ground, and Map1 is identical to Map0 except that
 | |
| 
 | |
|  * the pair Key-Data is recorded by Map1.
 | |
| 
 | |
|  */
 | |
| 
 | |
| map_store( [], Key, Data, [Key-Data] ).
 | |
| 
 | |
| map_store( [Key0-Data0|Map0], Key, Data, Map ) :-
 | |
| 
 | |
| 	( Key == Key0 ->
 | |
| 
 | |
| 		Map = [Key-Data|Map0]
 | |
| 
 | |
| 	; Key @< Key0 ->
 | |
| 
 | |
| 		Map = [Key-Data,Key0-Data0|Map0]
 | |
| 
 | |
| 	; otherwise -> % >
 | |
| 
 | |
| 		Map = [Key0-Data0|Map1],
 | |
| 
 | |
| 		map_store( Map0, Key, Data, Map1 )
 | |
| 
 | |
| 	).
 | |
| 
 | |
| 
 | |
| 
 | |
| /* context(?Element, ?PreserveSpace, ?CurrentNS, ?DefaultNS, ?Entities, ?Namespaces )
 | |
| 
 | |
|  * is an ADT hiding the "state" arguments for XML Acquisition
 | |
| 
 | |
|  */
 | |
| 
 | |
| initial_context(
 | |
| 
 | |
| 		Controls,
 | |
| 
 | |
| 		context(void,PreserveSpace,'','',Entities,Empty,
 | |
| 
 | |
| 			RemoveAttributePrefixes,AllowAmpersand)
 | |
| 
 | |
| 		) :-
 | |
| 
 | |
| 	empty_map( Empty ),
 | |
| 
 | |
| 	( member( extended_characters(false), Controls ) ->
 | |
| 
 | |
| 		Entities = Empty
 | |
| 
 | |
| 	; otherwise ->
 | |
| 
 | |
| 		extended_character_entities(Entities)
 | |
| 
 | |
| 	),
 | |
| 
 | |
| 	( member( format(false), Controls ) ->
 | |
| 
 | |
| 		PreserveSpace = true
 | |
| 
 | |
| 	; otherwise ->
 | |
| 
 | |
| 		PreserveSpace = false
 | |
| 
 | |
| 	),
 | |
| 
 | |
| 	( member( remove_attribute_prefixes(true), Controls ) ->
 | |
| 
 | |
| 		RemoveAttributePrefixes = true
 | |
| 
 | |
| 	; otherwise ->
 | |
| 
 | |
| 		RemoveAttributePrefixes = false
 | |
| 
 | |
| 	),
 | |
| 
 | |
| 	( member( allow_ampersand(true), Controls ) ->
 | |
| 
 | |
| 		AllowAmpersand = true
 | |
| 
 | |
| 	; otherwise ->
 | |
| 
 | |
| 		AllowAmpersand = false
 | |
| 
 | |
| 	).
 | |
| 
 | |
| 
 | |
| 
 | |
| context_update( current_namespace, Context0, URI, Context1 ) :-
 | |
| 
 | |
| 	Context0 = context(Element,Preserve,_Current,Default,Entities,
 | |
| 
 | |
| 		Namespaces,RemoveAttributePrefixes,Amp),
 | |
| 
 | |
| 	Context1 = context(Element,Preserve,URI,Default,Entities,
 | |
| 
 | |
| 		Namespaces,RemoveAttributePrefixes,Amp).
 | |
| 
 | |
| context_update( element, Context0, Tag, Context1 ) :-
 | |
| 
 | |
| 	Context0 = context(_Element,Preserve,Current,Default,Entities,
 | |
| 
 | |
| 		Namespaces,RemoveAttributePrefixes,Amp),
 | |
| 
 | |
| 	Context1 = context(tag(Tag),Preserve,Current,Default,Entities,
 | |
| 
 | |
| 		Namespaces,RemoveAttributePrefixes,Amp).
 | |
| 
 | |
| context_update( default_namespace, Context0, URI, Context1 ):-
 | |
| 
 | |
| 	Context0 = context(Element,Preserve,Current,_Default,Entities,
 | |
| 
 | |
| 		Namespaces,RemoveAttributePrefixes,Amp),
 | |
| 
 | |
| 	Context1 = context(Element,Preserve,Current,URI,Entities,
 | |
| 
 | |
| 		Namespaces,RemoveAttributePrefixes,Amp).
 | |
| 
 | |
| context_update( space_preserve, Context0, Boolean, Context1 ):-
 | |
| 
 | |
| 	Context0 = context(Element,_Preserve,Current,Default,Entities,
 | |
| 
 | |
| 		Namespaces,RemoveAttributePrefixes,Amp),
 | |
| 
 | |
| 	Context1 = context(Element,Boolean,Current,Default,Entities,
 | |
| 
 | |
| 		Namespaces,RemoveAttributePrefixes,Amp).
 | |
| 
 | |
| context_update( ns_prefix(Prefix), Context0, URI, Context1 ) :-
 | |
| 
 | |
| 	Context0 = context(Element,Preserve,Current,Default,Entities,
 | |
| 
 | |
| 		Namespaces0,RemoveAttributePrefixes,Amp),
 | |
| 
 | |
| 	Context1 = context(Element,Preserve,Current,Default,Entities,
 | |
| 
 | |
| 		Namespaces1,RemoveAttributePrefixes,Amp),
 | |
| 
 | |
| 	map_store( Namespaces0, Prefix, URI, Namespaces1 ).
 | |
| 
 | |
| context_update( entity(Name), Context0, String, Context1 ) :-
 | |
| 
 | |
| 	Context0 = context(Element,Preserve,Current,Default,Entities0,
 | |
| 
 | |
| 		Namespaces,RemoveAttributePrefixes,Amp),
 | |
| 
 | |
| 	Context1 = context(Element,Preserve,Current,Default,Entities1,
 | |
| 
 | |
| 		Namespaces,RemoveAttributePrefixes,Amp),
 | |
| 
 | |
| 	map_store( Entities0, Name, String, Entities1 ).
 | |
| 
 | |
| 
 | |
| 
 | |
| remove_attribute_prefixes( Context ) :-
 | |
| 
 | |
| 	Context = context(_Element,_Preserve,_Current,_Default,_Entities,
 | |
| 
 | |
| 		_Namespaces,true,_Amp).
 | |
| 
 | |
| 
 | |
| 
 | |
| current_tag( Context, Tag ) :-
 | |
| 
 | |
| 	Context = context(tag(Tag),_Preserve,_Current,_Default,_Entities,
 | |
| 
 | |
| 		_Namespaces,_RPFA,_Amp).
 | |
| 
 | |
| 
 | |
| 
 | |
| current_namespace( Context, Current ) :-
 | |
| 
 | |
| 	Context = context(_Element,_Preserve,Current,_Default,_Entities,
 | |
| 
 | |
| 		_Namespaces,_RPFA,_Amp).
 | |
| 
 | |
| 
 | |
| 
 | |
| default_namespace( Context, Default ) :-
 | |
| 
 | |
| 	Context = context(_Element,_Preserve,_Current,Default,_Entities,
 | |
| 
 | |
| 		_Namespaces,_RPFA,_Amp).
 | |
| 
 | |
| 
 | |
| 
 | |
| space_preserve( Context ) :-
 | |
| 
 | |
| 	Context = context(tag(_Tag),true,_Current,_Default,_Entities,
 | |
| 
 | |
| 		_Namespaces,_RPFA,_Amp).
 | |
| 
 | |
| 
 | |
| 
 | |
| specific_namespace( Prefix, Context, URI ) :-
 | |
| 
 | |
| 	Context = context(_Element,_Preserve,_Current,_Default,_Entities,
 | |
| 
 | |
| 		Namespaces,_RPFA,_Amp),
 | |
| 
 | |
| 	map_member( Prefix, Namespaces, URI ).
 | |
| 
 | |
| 
 | |
| 
 | |
| defined_entity( Reference, Context, String ) :-
 | |
| 
 | |
| 	Context = context(_Element,_Preserve,_Current,_Default,Entities,
 | |
| 
 | |
| 		_Namespaces,_RPFA,_Amp),
 | |
| 
 | |
| 	map_member( Reference, Entities, String ).
 | |
| 
 | |
| 	
 | |
| 
 | |
| close_context( Context, Terms, WellFormed ) :-
 | |
| 
 | |
| 	Context = context(Element,_Preserve,_Current,_Default,_Entities,
 | |
| 
 | |
| 		_Namespaces,_RPFA,_Amp),
 | |
| 
 | |
| 	close_context1( Element, Terms, WellFormed ).
 | |
| 
 | |
| 
 | |
| 
 | |
| close_context1( void, [], true ).
 | |
| 
 | |
| close_context1( tag(TagChars), [out_of_context(Tag)], false ) :-
 | |
| 
 | |
| 	atom_chars( Tag, TagChars ).
 | |
| 
 | |
| 
 | |
| 
 | |
| void_context(
 | |
| 
 | |
| 	context(void,_Preserve,_Current,_Default,_Entities,_Names,_RPFA,_Amp)
 | |
| 
 | |
| 	).
 | |
| 
 | |
| 
 | |
| 
 | |
| allow_ampersand(
 | |
| 
 | |
| 	context(_Void,_Preserve,_Current,_Default,_Entities,_Names,_RPFA,true)
 | |
| 
 | |
| 	).
 | |
| 
 | |
| 
 | |
| 
 | |
| /* pp_string( +String ) prints String onto the current output stream.
 | |
| 
 | |
|  * If String contains only 7-bit chars it is printed in shorthand quoted
 | |
| 
 | |
|  * format, otherwise it is written as a list.
 | |
| 
 | |
|  * If your Prolog uses " to delimit a special string type, just use write/1.
 | |
| 
 | |
|  */
 | |
| 
 | |
| pp_string( Chars ) :-
 | |
| 
 | |
| 	( member( Char, Chars ),
 | |
| 
 | |
| 	  not_shorthand( Char ) ->
 | |
| 
 | |
| 		write( Chars )
 | |
| 
 | |
| 	; otherwise ->
 | |
| 
 | |
| 		put_quote,
 | |
| 
 | |
| 		pp_string1( Chars ),
 | |
| 
 | |
| 		put_quote
 | |
| 
 | |
| 	).
 | |
| 
 | |
| 
 | |
| 
 | |
| not_shorthand( Char ) :-
 | |
| 
 | |
| 	Char > 255.
 | |
| 
 | |
| not_shorthand( Char ) :-
 | |
| 
 | |
| 	Char < 9.
 | |
| 
 | |
| not_shorthand( 126 ).	% ~ gives syntax errors in LPA Prolog
 | |
| 
 | |
| 
 | |
| 
 | |
| put_quote :-
 | |
| 
 | |
| 	put( 0'" ). % '
 | |
| 
 | |
| 
 | |
| 
 | |
| pp_string1( [] ).
 | |
| 
 | |
| pp_string1( [Char|Chars] ) :-
 | |
| 
 | |
| 	( Char =:= """"  -> % Meta-quote
 | |
| 
 | |
| 		put( Char ),
 | |
| 
 | |
| 		put( Char ),
 | |
| 
 | |
| 		pp_string1( Chars )
 | |
| 
 | |
| 	; Char =:= 13,	% Handle Windows border-settings
 | |
| 
 | |
| 	  Chars = [10|Chars1] ->
 | |
| 
 | |
| 		put( 10 ),
 | |
| 
 | |
| 		pp_string1( Chars1 )
 | |
| 
 | |
| 	; otherwise ->
 | |
| 
 | |
| 		put( Char ),
 | |
| 
 | |
| 		pp_string1( Chars )
 | |
| 
 | |
| 	).
 | |
| 
 | |
| 
 | |
| 
 | |
| xml_declaration_attributes_valid( [] ).
 | |
| 
 | |
| xml_declaration_attributes_valid( [Name=Value|Attributes] ) :-
 | |
| 
 | |
| 	xml_declaration_attribute_valid( Name, Value ),
 | |
| 
 | |
| 	xml_declaration_attributes_valid( Attributes ).
 | |
| 
 | |
| 
 | |
| 
 | |
| xml_declaration_attribute_valid( Name, Value ) :-
 | |
| 
 | |
| 	lowercase( Value, Lowercase ),
 | |
| 
 | |
| 	canonical_xml_declaration_attribute( Name, Lowercase ).
 | |
| 
 | |
| 
 | |
| 
 | |
| canonical_xml_declaration_attribute( version, "1.0" ).
 | |
| 
 | |
| canonical_xml_declaration_attribute( standalone, "yes" ).
 | |
| 
 | |
| canonical_xml_declaration_attribute( standalone, "no" ).
 | |
| 
 | |
| % The encodings here are all valid for the output produced.
 | |
| 
 | |
| canonical_xml_declaration_attribute( encoding, "utf-8" ).
 | |
| 
 | |
| % canonical_xml_declaration_attribute( encoding, "utf-16" ).
 | |
| 
 | |
| % This is erroneous for the output of this library
 | |
| 
 | |
| canonical_xml_declaration_attribute( encoding, "us-ascii" ).
 | |
| 
 | |
| canonical_xml_declaration_attribute( encoding, "ascii" ).
 | |
| 
 | |
| canonical_xml_declaration_attribute( encoding, "iso-8859-1" ).
 | |
| 
 | |
| canonical_xml_declaration_attribute( encoding, "iso-8859-2" ).
 | |
| 
 | |
| canonical_xml_declaration_attribute( encoding, "iso-8859-15" ).
 | |
| 
 | |
| canonical_xml_declaration_attribute( encoding, "windows-1252" ).
 | |
| 
 | |
| % In general, it's better not to specify an encoding.
 | |
| 
 | |
| 
 | |
| 
 | |
| /* lowercase( +MixedCase, ?Lowercase ) holds when Lowercase and MixedCase are
 | |
| 
 | |
|  * lists of character codes, and Lowercase is identical to MixedCase with
 | |
| 
 | |
|  * every uppercase character replaced by its lowercase equivalent.
 | |
| 
 | |
|  */
 | |
| 
 | |
| lowercase( [], [] ).
 | |
| 
 | |
| lowercase( [Char|Chars], [Lower|LowerCase] ) :-
 | |
| 
 | |
| 	( Char >= "A", Char =< "Z" ->
 | |
| 
 | |
| 		Lower is Char + "a" - "A"
 | |
| 
 | |
| 	; otherwise ->
 | |
| 
 | |
| 		Lower = Char
 | |
| 
 | |
| 	),
 | |
| 
 | |
| 	lowercase( Chars, LowerCase ).
 | |
| 
 | |
| 
 | |
| 
 | |
| extended_character_entities( [
 | |
| 
 | |
| 	"AElig"-[198],		% latin capital letter AE
 | |
| 
 | |
| 	"Aacute"-[193],		% latin capital letter A with acute,
 | |
| 
 | |
| 	"Acirc"-[194],		% latin capital letter A with circumflex,
 | |
| 
 | |
| 	"Agrave"-[192],		% latin capital letter A with grave
 | |
| 
 | |
| 	"Alpha"-[913],		% greek capital letter alpha, U+0391
 | |
| 
 | |
| 	"Aring"-[197],		% latin capital letter A with ring above
 | |
| 
 | |
| 	"Atilde"-[195],		% latin capital letter A with tilde,
 | |
| 
 | |
| 	"Auml"-[196],		% latin capital letter A with diaeresis,
 | |
| 
 | |
| 	"Beta"-[914],		% greek capital letter beta, U+0392
 | |
| 
 | |
| 	"Ccedil"-[199],		% latin capital letter C with cedilla,
 | |
| 
 | |
| 	"Chi"-[935],		% greek capital letter chi, U+03A7
 | |
| 
 | |
| 	"Dagger"-[8225],	% double dagger, U+2021 ISOpub
 | |
| 
 | |
| 	"Delta"-[916],		% greek capital letter delta,
 | |
| 
 | |
| 	"ETH"-[208],		% latin capital letter ETH, U+00D0 ISOlat1>
 | |
| 
 | |
| 	"Eacute"-[201],		% latin capital letter E with acute,
 | |
| 
 | |
| 	"Ecirc"-[202],		% latin capital letter E with circumflex,
 | |
| 
 | |
| 	"Egrave"-[200],		% latin capital letter E with grave,
 | |
| 
 | |
| 	"Epsilon"-[917],	% greek capital letter epsilon, U+0395
 | |
| 
 | |
| 	"Eta"-[919],		% greek capital letter eta, U+0397
 | |
| 
 | |
| 	"Euml"-[203],		% latin capital letter E with diaeresis,
 | |
| 
 | |
| 	"Gamma"-[915],		% greek capital letter gamma,
 | |
| 
 | |
| 	"Iacute"-[205],		% latin capital letter I with acute,
 | |
| 
 | |
| 	"Icirc"-[206],		% latin capital letter I with circumflex,
 | |
| 
 | |
| 	"Igrave"-[204],		% latin capital letter I with grave,
 | |
| 
 | |
| 	"Iota"-[921],		% greek capital letter iota, U+0399
 | |
| 
 | |
| 	"Iuml"-[207],		% latin capital letter I with diaeresis,
 | |
| 
 | |
| 	"Kappa"-[922],		% greek capital letter kappa, U+039A
 | |
| 
 | |
| 	"Lambda"-[923],		% greek capital letter lambda,
 | |
| 
 | |
| 	"Mu"-[924],			% greek capital letter mu, U+039C
 | |
| 
 | |
| 	"Ntilde"-[209],		% latin capital letter N with tilde,
 | |
| 
 | |
| 	"Nu"-[925],			% greek capital letter nu, U+039D
 | |
| 
 | |
| 	"OElig"-[338],		% latin capital ligature OE,
 | |
| 
 | |
| 	"Oacute"-[211],		% latin capital letter O with acute,
 | |
| 
 | |
| 	"Ocirc"-[212],		% latin capital letter O with circumflex,
 | |
| 
 | |
| 	"Ograve"-[210],		% latin capital letter O with grave,
 | |
| 
 | |
| 	"Omega"-[937],		% greek capital letter omega,
 | |
| 
 | |
| 	"Omicron"-[927],	% greek capital letter omicron, U+039F
 | |
| 
 | |
| 	"Oslash"-[216],		% latin capital letter O with stroke
 | |
| 
 | |
| 	"Otilde"-[213],		% latin capital letter O with tilde,
 | |
| 
 | |
| 	"Ouml"-[214],		% latin capital letter O with diaeresis,
 | |
| 
 | |
| 	"Phi"-[934],		% greek capital letter phi,
 | |
| 
 | |
| 	"Pi"-[928],			% greek capital letter pi, U+03A0 ISOgrk3
 | |
| 
 | |
| 	"Prime"-[8243],		% double prime = seconds = inches,
 | |
| 
 | |
| 	"Psi"-[936],		% greek capital letter psi,
 | |
| 
 | |
| 	"Rho"-[929],		% greek capital letter rho, U+03A1
 | |
| 
 | |
| 	"Scaron"-[352],		% latin capital letter S with caron,
 | |
| 
 | |
| 	"Sigma"-[931],		% greek capital letter sigma,
 | |
| 
 | |
| 	"THORN"-[222],		% latin capital letter THORN,
 | |
| 
 | |
| 	"Tau"-[932],		% greek capital letter tau, U+03A4
 | |
| 
 | |
| 	"Theta"-[920],		% greek capital letter theta,
 | |
| 
 | |
| 	"Uacute"-[218],		% latin capital letter U with acute,
 | |
| 
 | |
| 	"Ucirc"-[219],		% latin capital letter U with circumflex,
 | |
| 
 | |
| 	"Ugrave"-[217],		% latin capital letter U with grave,
 | |
| 
 | |
| 	"Upsilon"-[933],	% greek capital letter upsilon,
 | |
| 
 | |
| 	"Uuml"-[220],		% latin capital letter U with diaeresis,
 | |
| 
 | |
| 	"Xi"-[926],			% greek capital letter xi, U+039E ISOgrk3
 | |
| 
 | |
| 	"Yacute"-[221],		% latin capital letter Y with acute,
 | |
| 
 | |
| 	"Yuml"-[376],		% latin capital letter Y with diaeresis,
 | |
| 
 | |
| 	"Zeta"-[918],		% greek capital letter zeta, U+0396
 | |
| 
 | |
| 	"aacute"-[225],		% latin small letter a with acute,
 | |
| 
 | |
| 	"acirc"-[226],		% latin small letter a with circumflex,
 | |
| 
 | |
| 	"acute"-[180],		% acute accent = spacing acute,
 | |
| 
 | |
| 	"aelig"-[230],		% latin small letter ae
 | |
| 
 | |
| 	"agrave"-[224],		% latin small letter a with grave
 | |
| 
 | |
| 	"alefsym"-[8501],	% alef symbol = first transfinite cardinal,
 | |
| 
 | |
| 	"alpha"-[945],		% greek small letter alpha,
 | |
| 
 | |
| 	"and"-[8743],		% logical and = wedge, U+2227 ISOtech
 | |
| 
 | |
| 	"ang"-[8736],		% angle, U+2220 ISOamso
 | |
| 
 | |
| 	"aring"-[229],		% latin small letter a with ring above
 | |
| 
 | |
| 	"asymp"-[8776],		% almost equal to = asymptotic to,
 | |
| 
 | |
| 	"atilde"-[227],		% latin small letter a with tilde,
 | |
| 
 | |
| 	"auml"-[228],		% latin small letter a with diaeresis,
 | |
| 
 | |
| 	"bdquo"-[8222],		% double low-9 quotation mark, U+201E NEW
 | |
| 
 | |
| 	"beta"-[946],		% greek small letter beta, U+03B2 ISOgrk3
 | |
| 
 | |
| 	"brvbar"-[166],		% broken bar = broken vertical bar,
 | |
| 
 | |
| 	"bull"-[8226],		% bullet = black small circle,
 | |
| 
 | |
| 	"cap"-[8745],		% intersection = cap, U+2229 ISOtech
 | |
| 
 | |
| 	"ccedil"-[231],		% latin small letter c with cedilla,
 | |
| 
 | |
| 	"cedil"-[184],		% cedilla = spacing cedilla, U+00B8 ISOdia>
 | |
| 
 | |
| 	"cent"-[162],		% cent sign, U+00A2 ISOnum>
 | |
| 
 | |
| 	"chi"-[967],		% greek small letter chi, U+03C7 ISOgrk3
 | |
| 
 | |
| 	"circ"-[710],		% modifier letter circumflex accent,
 | |
| 
 | |
| 	"clubs"-[9827],		% black club suit = shamrock,
 | |
| 
 | |
| 	"cong"-[8773],		% approximately equal to, U+2245 ISOtech
 | |
| 
 | |
| 	"copy"-[169],		% copyright sign, U+00A9 ISOnum>
 | |
| 
 | |
| 	"crarr"-[8629],		% downwards arrow with corner leftwards
 | |
| 
 | |
| 	"cup"-[8746],		% union = cup, U+222A ISOtech
 | |
| 
 | |
| 	"curren"-[164],		% currency sign, U+00A4 ISOnum>
 | |
| 
 | |
| 	"dArr"-[8659],		% downwards double arrow, U+21D3 ISOamsa
 | |
| 
 | |
| 	"dagger"-[8224],	% dagger, U+2020 ISOpub
 | |
| 
 | |
| 	"darr"-[8595],		% downwards arrow, U+2193 ISOnum
 | |
| 
 | |
| 	"deg"-[176],		% degree sign, U+00B0 ISOnum>
 | |
| 
 | |
| 	"delta"-[948],		% greek small letter delta,
 | |
| 
 | |
| 	"diams"-[9830],		% black diamond suit, U+2666 ISOpub
 | |
| 
 | |
| 	"divide"-[247],		% division sign, U+00F7 ISOnum>
 | |
| 
 | |
| 	"eacute"-[233],		% latin small letter e with acute,
 | |
| 
 | |
| 	"ecirc"-[234],		% latin small letter e with circumflex,
 | |
| 
 | |
| 	"egrave"-[232],		% latin small letter e with grave,
 | |
| 
 | |
| 	"empty"-[8709],		% empty set = null set = diameter,
 | |
| 
 | |
| 	"emsp"-[8195],		% em space, U+2003 ISOpub
 | |
| 
 | |
| 	"ensp"-[8194],		% en space, U+2002 ISOpub
 | |
| 
 | |
| 	"epsilon"-[949],	% greek small letter epsilon,
 | |
| 
 | |
| 	"equiv"-[8801],		% identical to, U+2261 ISOtech
 | |
| 
 | |
| 	"eta"-[951],		% greek small letter eta, U+03B7 ISOgrk3
 | |
| 
 | |
| 	"eth"-[240],		% latin small letter eth, U+00F0 ISOlat1>
 | |
| 
 | |
| 	"euml"-[235],		% latin small letter e with diaeresis,
 | |
| 
 | |
| 	"euro"-[8364],		% euro sign, U+20AC NEW
 | |
| 
 | |
| 	"exist"-[8707],		% there exists, U+2203 ISOtech
 | |
| 
 | |
| 	"fnof"-[402],		% latin small f with hook = function
 | |
| 
 | |
| 	"forall"-[8704],	% for all, U+2200 ISOtech
 | |
| 
 | |
| 	"frac12"-[189],		% vulgar fraction one half
 | |
| 
 | |
| 	"frac14"-[188],		% vulgar fraction one quarter
 | |
| 
 | |
| 	"frac34"-[190],		% vulgar fraction three quarters
 | |
| 
 | |
| 	"frasl"-[8260],		% fraction slash, U+2044 NEW
 | |
| 
 | |
| 	"gamma"-[947],		% greek small letter gamma,
 | |
| 
 | |
| 	"ge"-[8805],		% greater-than or equal to,
 | |
| 
 | |
| 	"hArr"-[8660],		% left right double arrow,
 | |
| 
 | |
| 	"harr"-[8596],		% left right arrow, U+2194 ISOamsa
 | |
| 
 | |
| 	"hearts"-[9829],	% black heart suit = valentine,
 | |
| 
 | |
| 	"hellip"-[8230],	% horizontal ellipsis = three dot leader,
 | |
| 
 | |
| 	"iacute"-[237],		% latin small letter i with acute,
 | |
| 
 | |
| 	"icirc"-[238],		% latin small letter i with circumflex,
 | |
| 
 | |
| 	"iexcl"-[161],		% inverted exclamation mark, U+00A1 ISOnum>
 | |
| 
 | |
| 	"igrave"-[236],		% latin small letter i with grave,
 | |
| 
 | |
| 	"image"-[8465],		% blackletter capital I = imaginary part,
 | |
| 
 | |
| 	"infin"-[8734],		% infinity, U+221E ISOtech
 | |
| 
 | |
| 	"int"-[8747],		% integral, U+222B ISOtech
 | |
| 
 | |
| 	"iota"-[953],		% greek small letter iota, U+03B9 ISOgrk3
 | |
| 
 | |
| 	"iquest"-[191],		% inverted question mark
 | |
| 
 | |
| 	"isin"-[8712],		% element of, U+2208 ISOtech
 | |
| 
 | |
| 	"iuml"-[239],		% latin small letter i with diaeresis,
 | |
| 
 | |
| 	"kappa"-[954],		% greek small letter kappa,
 | |
| 
 | |
| 	"lArr"-[8656],		% leftwards double arrow, U+21D0 ISOtech
 | |
| 
 | |
| 	"lambda"-[955],		% greek small letter lambda,
 | |
| 
 | |
| 	"lang"-[9001],		% left-pointing angle bracket = bra,
 | |
| 
 | |
| 	"laquo"-[171],		% left-pointing double angle quotation mark
 | |
| 
 | |
| 	"larr"-[8592],		% leftwards arrow, U+2190 ISOnum
 | |
| 
 | |
| 	"lceil"-[8968],		% left ceiling = apl upstile,
 | |
| 
 | |
| 	"ldquo"-[8220],		% left double quotation mark,
 | |
| 
 | |
| 	"le"-[8804],		% less-than or equal to, U+2264 ISOtech
 | |
| 
 | |
| 	"lfloor"-[8970],	% left floor = apl downstile,
 | |
| 
 | |
| 	"lowast"-[8727],	% asterisk operator, U+2217 ISOtech
 | |
| 
 | |
| 	"loz"-[9674],		% lozenge, U+25CA ISOpub
 | |
| 
 | |
| 	"lrm"-[8206],		% left-to-right mark, U+200E NEW RFC 2070
 | |
| 
 | |
| 	"lsaquo"-[8249],	% single left-pointing angle quotation mark,
 | |
| 
 | |
| 	"lsquo"-[8216],		% left single quotation mark,
 | |
| 
 | |
| 	"macr"-[175],		% macron = spacing macron = overline
 | |
| 
 | |
| 	"mdash"-[8212],		% em dash, U+2014 ISOpub
 | |
| 
 | |
| 	"micro"-[181],		% micro sign, U+00B5 ISOnum>
 | |
| 
 | |
| 	"middot"-[183],		% middle dot = Georgian comma
 | |
| 
 | |
| 	"minus"-[8722],		% minus sign, U+2212 ISOtech
 | |
| 
 | |
| 	"mu"-[956],			% greek small letter mu, U+03BC ISOgrk3
 | |
| 
 | |
| 	"nabla"-[8711],		% nabla = backward difference,
 | |
| 
 | |
| 	"nbsp"-[160],		% no-break space = non-breaking space,
 | |
| 
 | |
| 	"ndash"-[8211],		% en dash, U+2013 ISOpub
 | |
| 
 | |
| 	"ne"-[8800],		% not equal to, U+2260 ISOtech
 | |
| 
 | |
| 	"ni"-[8715],		% contains as member, U+220B ISOtech
 | |
| 
 | |
| 	"not"-[172],		% not sign, U+00AC ISOnum>
 | |
| 
 | |
| 	"notin"-[8713],		% not an element of, U+2209 ISOtech
 | |
| 
 | |
| 	"nsub"-[8836],		% not a subset of, U+2284 ISOamsn
 | |
| 
 | |
| 	"ntilde"-[241],		% latin small letter n with tilde,
 | |
| 
 | |
| 	"nu"-[957],			% greek small letter nu, U+03BD ISOgrk3
 | |
| 
 | |
| 	"oacute"-[243],		% latin small letter o with acute,
 | |
| 
 | |
| 	"ocirc"-[244],		% latin small letter o with circumflex,
 | |
| 
 | |
| 	"oelig"-[339],		% latin small ligature oe, U+0153 ISOlat2
 | |
| 
 | |
| 	"ograve"-[242],		% latin small letter o with grave,
 | |
| 
 | |
| 	"oline"-[8254],		% overline = spacing overscore,
 | |
| 
 | |
| 	"omega"-[969],		% greek small letter omega,
 | |
| 
 | |
| 	"omicron"-[959],	% greek small letter omicron, U+03BF NEW
 | |
| 
 | |
| 	"oplus"-[8853],		% circled plus = direct sum,
 | |
| 
 | |
| 	"or"-[8744],		% logical or = vee, U+2228 ISOtech
 | |
| 
 | |
| 	"ordf"-[170],		% feminine ordinal indicator, U+00AA ISOnum>
 | |
| 
 | |
| 	"ordm"-[186],		% masculine ordinal indicator,
 | |
| 
 | |
| 	"oslash"-[248],		% latin small letter o with stroke,
 | |
| 
 | |
| 	"otilde"-[245],		% latin small letter o with tilde,
 | |
| 
 | |
| 	"otimes"-[8855],	% circled times = vector product,
 | |
| 
 | |
| 	"ouml"-[246],		% latin small letter o with diaeresis,
 | |
| 
 | |
| 	"para"-[182],		% pilcrow sign = paragraph sign,
 | |
| 
 | |
| 	"part"-[8706],		% partial differential, U+2202 ISOtech
 | |
| 
 | |
| 	"permil"-[8240],	% per mille sign, U+2030 ISOtech
 | |
| 
 | |
| 	"perp"-[8869],		% up tack = orthogonal to = perpendicular,
 | |
| 
 | |
| 	"phi"-[966],		% greek small letter phi, U+03C6 ISOgrk3
 | |
| 
 | |
| 	"pi"-[960],			% greek small letter pi, U+03C0 ISOgrk3
 | |
| 
 | |
| 	"piv"-[982],		% greek pi symbol, U+03D6 ISOgrk3
 | |
| 
 | |
| 	"plusmn"-[177],		% plus-minus sign = plus-or-minus sign,
 | |
| 
 | |
| 	"pound"-[163],		% pound sign, U+00A3 ISOnum>
 | |
| 
 | |
| 	"prime"-[8242],		% prime = minutes = feet, U+2032 ISOtech
 | |
| 
 | |
| 	"prod"-[8719],		% n-ary product = product sign,
 | |
| 
 | |
| 	"prop"-[8733],		% proportional to, U+221D ISOtech
 | |
| 
 | |
| 	"psi"-[968],		% greek small letter psi, U+03C8 ISOgrk3
 | |
| 
 | |
| 	"rArr"-[8658],		% rightwards double arrow,
 | |
| 
 | |
| 	"radic"-[8730],		% square root = radical sign,
 | |
| 
 | |
| 	"rang"-[9002],		% right-pointing angle bracket = ket,
 | |
| 
 | |
| 	"raquo"-[187],		% right-pointing double angle quotation mark
 | |
| 
 | |
| 	"rarr"-[8594],		% rightwards arrow, U+2192 ISOnum
 | |
| 
 | |
| 	"rceil"-[8969],		% right ceiling, U+2309 ISOamsc
 | |
| 
 | |
| 	"rdquo"-[8221],		% right double quotation mark,
 | |
| 
 | |
| 	"real"-[8476],		% blackletter capital R = real part symbol,
 | |
| 
 | |
| 	"reg"-[174],		% registered sign = registered trade mark sign,
 | |
| 
 | |
| 	"rfloor"-[8971],	% right floor, U+230B ISOamsc
 | |
| 
 | |
| 	"rho"-[961],		% greek small letter rho, U+03C1 ISOgrk3
 | |
| 
 | |
| 	"rlm"-[8207],		% right-to-left mark, U+200F NEW RFC 2070
 | |
| 
 | |
| 	"rsaquo"-[8250],	% single right-pointing angle quotation mark,
 | |
| 
 | |
| 	"rsquo"-[8217],		% right single quotation mark,
 | |
| 
 | |
| 	"sbquo"-[8218],		% single low-9 quotation mark, U+201A NEW
 | |
| 
 | |
| 	"scaron"-[353],		% latin small letter s with caron,
 | |
| 
 | |
| 	"sdot"-[8901],		% dot operator, U+22C5 ISOamsb
 | |
| 
 | |
| 	"sect"-[167],		% section sign, U+00A7 ISOnum>
 | |
| 
 | |
| 	"shy"-[173],		% soft hyphen = discretionary hyphen,
 | |
| 
 | |
| 	"sigma"-[963],		% greek small letter sigma,
 | |
| 
 | |
| 	"sigmaf"-[962],		% greek small letter final sigma,
 | |
| 
 | |
| 	"sim"-[8764],		% tilde operator = varies with = similar to,
 | |
| 
 | |
| 	"spades"-[9824],	% black spade suit, U+2660 ISOpub
 | |
| 
 | |
| 	"sub"-[8834],		% subset of, U+2282 ISOtech
 | |
| 
 | |
| 	"sube"-[8838],		% subset of or equal to, U+2286 ISOtech
 | |
| 
 | |
| 	"sum"-[8721],		% n-ary sumation, U+2211 ISOamsb
 | |
| 
 | |
| 	"sup"-[8835],		% superset of, U+2283 ISOtech
 | |
| 
 | |
| 	"sup1"-[185],		% superscript one = superscript digit one,
 | |
| 
 | |
| 	"sup2"-[178],		% superscript two = superscript digit two
 | |
| 
 | |
| 	"sup3"-[179],		% superscript three = superscript digit three
 | |
| 
 | |
| 	"supe"-[8839],		% superset of or equal to,
 | |
| 
 | |
| 	"szlig"-[223],		% latin small letter sharp s = ess-zed,
 | |
| 
 | |
| 	"tau"-[964],		% greek small letter tau, U+03C4 ISOgrk3
 | |
| 
 | |
| 	"there4"-[8756],	% therefore, U+2234 ISOtech
 | |
| 
 | |
| 	"theta"-[952],		% greek small letter theta,
 | |
| 
 | |
| 	"thetasym"-[977],	% greek small letter theta symbol,
 | |
| 
 | |
| 	"thinsp"-[8201],	% thin space, U+2009 ISOpub
 | |
| 
 | |
| 	"thorn"-[254],		% latin small letter thorn with,
 | |
| 
 | |
| 	"tilde"-[732],		% small tilde, U+02DC ISOdia
 | |
| 
 | |
| 	"times"-[215],		% multiplication sign, U+00D7 ISOnum>
 | |
| 
 | |
| 	"trade"-[8482],		% trade mark sign, U+2122 ISOnum
 | |
| 
 | |
| 	"uArr"-[8657],		% upwards double arrow, U+21D1 ISOamsa
 | |
| 
 | |
| 	"uacute"-[250],		% latin small letter u with acute,
 | |
| 
 | |
| 	"uarr"-[8593],		% upwards arrow, U+2191 ISOnum
 | |
| 
 | |
| 	"ucirc"-[251],		% latin small letter u with circumflex,
 | |
| 
 | |
| 	"ugrave"-[249],		% latin small letter u with grave,
 | |
| 
 | |
| 	"uml"-[168],		% diaeresis = spacing diaeresis,
 | |
| 
 | |
| 	"upsih"-[978],		% greek upsilon with hook symbol,
 | |
| 
 | |
| 	"upsilon"-[965],	% greek small letter upsilon,
 | |
| 
 | |
| 	"uuml"-[252],		% latin small letter u with diaeresis,
 | |
| 
 | |
| 	"weierp"-[8472],	% script capital P = power set
 | |
| 
 | |
| 	"xi"-[958],			% greek small letter xi, U+03BE ISOgrk3
 | |
| 
 | |
| 	"yacute"-[253],		% latin small letter y with acute,
 | |
| 
 | |
| 	"yen"-[165],		% yen sign = yuan sign, U+00A5 ISOnum>
 | |
| 
 | |
| 	"yuml"-[255],		% latin small letter y with diaeresis,
 | |
| 
 | |
| 	"zeta"-[950],		% greek small letter zeta, U+03B6 ISOgrk3
 | |
| 
 | |
| 	"zwj"-[8205],		% zero width joiner, U+200D NEW RFC 2070
 | |
| 
 | |
| 	"zwnj"-[8204]		% zero width non-joiner,
 | |
| 
 | |
| 	] ).
 | |
| 
 | |
| 
 | |
| 
 | |
| /* chars( ?Chars, ?Plus, ?Minus ) used as chars( ?Chars ) in a DCG to
 | |
| 
 | |
|  * copy the list Chars inline.
 | |
| 
 | |
|  *
 | |
| 
 | |
|  * This is best expressed in terms of append/3 where append/3 is built-in.
 | |
| 
 | |
|  * For other Prologs, a straightforward specification can be used:
 | |
| 
 | |
|  *
 | |
| 
 | |
|  *	chars( [] ) --> "".
 | |
| 
 | |
|  *	chars( [Char|Chars] ) -->
 | |
| 
 | |
|  *		[Char],
 | |
| 
 | |
|  *		chars( Chars ).
 | |
| 
 | |
|  */
 | |
| 
 | |
| 
 | |
| 
 | |
| chars( Chars, Plus, Minus ) :-
 | |
| 
 | |
| 	append( Chars, Minus, Plus ).
 | |
| 
 | |
| 
 | |
| 
 |