| 
									
										
										
										
											2009-03-13 19:39:06 +00:00
										 |  |  | /*  $Id$
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     Part of SWI-Prolog | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     Author:        Jan Wielemaker | 
					
						
							|  |  |  |     E-mail:        jan@swi.psy.uva.nl | 
					
						
							|  |  |  |     WWW:           http://www.swi-prolog.org
 | 
					
						
							|  |  |  |     Copyright (C): 1985-2002, University of Amsterdam | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     This library is free software; you can redistribute it and/or | 
					
						
							|  |  |  |     modify it under the terms of the GNU Lesser General Public | 
					
						
							|  |  |  |     License as published by the Free Software Foundation; either | 
					
						
							|  |  |  |     version 2.1 of the License, or (at your option) any later version. | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     This library is distributed in the hope that it will be useful, | 
					
						
							|  |  |  |     but WITHOUT ANY WARRANTY; without even the implied warranty of | 
					
						
							|  |  |  |     MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU | 
					
						
							|  |  |  |     Lesser General Public License for more details. | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     You should have received a copy of the GNU Lesser General Public | 
					
						
							|  |  |  |     License along with this library; if not, write to the Free Software | 
					
						
							|  |  |  |     Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA | 
					
						
							|  |  |  | */ | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #include <stdio.h>
 | 
					
						
							|  |  |  | #include <stdlib.h>
 | 
					
						
							|  |  |  | #include "dtd.h"
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | static void | 
					
						
							|  |  |  | char_range(dtd_charclass *map, int from, int to, int msk) | 
					
						
							|  |  |  | { unsigned char *ca; | 
					
						
							|  |  |  |   int i; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   for(i=from, ca=map->class+i; i++<=to; ) | 
					
						
							|  |  |  |     *ca++ |= msk; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | dtd_charclass * | 
					
						
							|  |  |  | new_charclass() | 
					
						
							|  |  |  | { dtd_charclass *map = sgml_calloc(1, sizeof(*map)); | 
					
						
							|  |  |  |   unsigned char *ca = map->class; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   char_range(map, 'a', 'z', CH_LCLETTER); | 
					
						
							|  |  |  |   char_range(map, 'A', 'Z', CH_LCLETTER); | 
					
						
							|  |  |  |   char_range(map, '0', '9', CH_DIGIT); | 
					
						
							| 
									
										
										
										
											2010-05-06 10:59:09 +01:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2009-03-13 19:39:06 +00:00
										 |  |  |   ca['.'] |= CH_CNM; | 
					
						
							|  |  |  |   ca['-'] |= CH_CNM; | 
					
						
							|  |  |  |   ca[183] |= CH_CNM;			/* XML */ | 
					
						
							|  |  |  |   ca[':'] |= CH_CNMSTRT;		/* HTML and XML */ | 
					
						
							|  |  |  |   ca['_'] |= CH_CNMSTRT;		/* HTML and XML */ | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   char_range(map, 192, 214, CH_CNMSTRT); /* XML ISO-LATIN-1 accented chars */ | 
					
						
							|  |  |  |   char_range(map, 216, 246, CH_CNMSTRT); | 
					
						
							|  |  |  |   char_range(map, 248, 255, CH_CNMSTRT); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   ca['\t'] |= CH_WHITE; | 
					
						
							|  |  |  |   ca[' ']  |= CH_WHITE; | 
					
						
							|  |  |  |   ca['\r'] |= CH_RE; | 
					
						
							|  |  |  |   ca['\n'] |= CH_RS; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   return map; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | dtd_charfunc * | 
					
						
							|  |  |  | new_charfunc() | 
					
						
							|  |  |  | { dtd_charfunc *f = sgml_calloc(1, sizeof(*f)); | 
					
						
							|  |  |  |   ichar *cf = f->func; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   cf[CF_STAGO]	= '<'; | 
					
						
							|  |  |  |   cf[CF_STAGC]	= '>'; | 
					
						
							|  |  |  |   cf[CF_ETAGO1]	= '<'; | 
					
						
							|  |  |  |   cf[CF_ETAGO2]	= '/'; | 
					
						
							|  |  |  |   cf[CF_VI]	= '='; | 
					
						
							|  |  |  |   cf[CF_NS]     = ':'; | 
					
						
							|  |  |  |   cf[CF_LIT]	= '"'; | 
					
						
							|  |  |  |   cf[CF_LITA]	= '\''; | 
					
						
							|  |  |  |   cf[CF_PERO]	= '%'; | 
					
						
							|  |  |  |   cf[CF_ERO]	= '&'; | 
					
						
							|  |  |  |   cf[CF_ERC]	= ';'; | 
					
						
							|  |  |  |   cf[CF_MDO1]	= '<'; | 
					
						
							|  |  |  |   cf[CF_MDO2]	= '!'; | 
					
						
							|  |  |  |   cf[CF_MDC]	= '>'; | 
					
						
							|  |  |  |   cf[CF_PRO1]	= '<'; | 
					
						
							|  |  |  |   cf[CF_PRO2]	= '?'; | 
					
						
							|  |  |  |   cf[CF_PRC]	= '>'; | 
					
						
							|  |  |  |   cf[CF_GRPO]	= '('; | 
					
						
							|  |  |  |   cf[CF_GRPC]	= ')'; | 
					
						
							|  |  |  |   cf[CF_SEQ]	= ','; | 
					
						
							|  |  |  |   cf[CF_AND]	= '&'; | 
					
						
							|  |  |  |   cf[CF_OR]	= '|'; | 
					
						
							|  |  |  |   cf[CF_OPT]	= '?'; | 
					
						
							|  |  |  |   cf[CF_PLUS]	= '+'; | 
					
						
							|  |  |  |   cf[CF_DSO]	= '['; | 
					
						
							|  |  |  |   cf[CF_DSC]	= ']'; | 
					
						
							|  |  |  |   cf[CF_REP]	= '*'; | 
					
						
							|  |  |  |   cf[CF_RS]	= '\n'; | 
					
						
							|  |  |  |   cf[CF_RE]	= '\r'; | 
					
						
							|  |  |  |   cf[CF_CMT]	= '-'; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   return f; | 
					
						
							|  |  |  | } |