/*-
 * Copyright (c) 1992, 1993, 1994 Henry Spencer.
 * Copyright (c) 1992, 1993, 1994
 *	The Regents of the University of California.  All rights reserved.
 *
 * This code is derived from software contributed to Berkeley by
 * Henry Spencer.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 * 3. All advertising materials mentioning features or use of this software
 *    must display the following acknowledgement:
 *	This product includes software developed by the University of
 *	California, Berkeley and its contributors.
 * 4. Neither the name of the University nor the names of its contributors
 *    may be used to endorse or promote products derived from this software
 *    without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 *
 *	@(#)regexec.c	8.3 (Berkeley) 3/20/94
 */
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #if defined(LIBC_SCCS) && !defined(lint)
 | 
					
						
							|  |  |  | static char sccsid[] = "@(#)regexec.c	8.3 (Berkeley) 3/20/94"; | 
					
						
							|  |  |  | #endif /* LIBC_SCCS and not lint */
 | 
					
						
							|  |  |  | 
 | 
					
						
/*
 * the outer shell of regexec()
 *
 * This file includes engine.c *twice*, after muchos fiddling with the
 * macros that code uses.  This lets the same code operate on two different
 * representations for state sets.
 */
					
						
							| 
									
										
										
										
											2002-03-12 15:54:01 +00:00
										 |  |  | #include "config.h"
 | 
					
						
							| 
									
										
										
										
											2016-04-18 16:41:30 +01:00
										 |  |  | 
 | 
					
						
							|  |  |  | #ifndef HAVE_REGEXEC
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2002-03-12 15:54:01 +00:00
										 |  |  | #include "c_interface.h"
 | 
					
						
							|  |  |  | #if HAVE_SYS_TYPES_H
 | 
					
						
							| 
									
										
										
										
											2001-04-09 19:54:03 +00:00
										 |  |  | #include <sys/types.h>
 | 
					
						
							| 
									
										
										
										
											2002-03-12 15:54:01 +00:00
										 |  |  | #endif
 | 
					
						
							| 
									
										
										
										
											2001-04-09 19:54:03 +00:00
										 |  |  | #include <stdio.h>
 | 
					
						
							|  |  |  | #include <stdlib.h>
 | 
					
						
							| 
									
										
										
										
											2004-12-16 06:08:57 +00:00
										 |  |  | #if HAVE_CTYPE_H
 | 
					
						
							| 
									
										
										
										
											2002-03-12 15:54:01 +00:00
										 |  |  | #include <ctype.h>
 | 
					
						
							|  |  |  | #endif
 | 
					
						
							|  |  |  | #if HAVE_STRING_H
 | 
					
						
							| 
									
										
										
										
											2001-04-09 19:54:03 +00:00
										 |  |  | #include <string.h>
 | 
					
						
							| 
									
										
										
										
											2002-03-12 15:54:01 +00:00
										 |  |  | #endif
 | 
					
						
							|  |  |  | #if HAVE_LIMITS_H
 | 
					
						
							| 
									
										
										
										
											2001-04-09 19:54:03 +00:00
										 |  |  | #include <limits.h>
 | 
					
						
							| 
									
										
										
										
											2002-03-12 15:54:01 +00:00
										 |  |  | #endif
 | 
					
						
							| 
									
										
										
										
											2001-04-09 19:54:03 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  | #include "regex2.h"
 | 
					
						
							| 
									
										
										
										
											2016-04-18 16:41:30 +01:00
										 |  |  | #include "utils.h"
 | 
					
						
							|  |  |  | #include "yapregex.h"
 | 
					
						
							| 
									
										
										
										
											2001-04-09 19:54:03 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2004-11-04 18:22:36 +00:00
										 |  |  | #if used
 | 
					
						
							| 
									
										
										
										
											2016-04-18 16:41:30 +01:00
										 |  |  | static int nope = 0; /* for use in asserts; shuts lint up */ | 
					
						
							| 
									
										
										
										
											2004-11-04 18:22:36 +00:00
										 |  |  | #endif
 | 
					
						
							| 
									
										
										
										
											2001-04-09 19:54:03 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  | /* macros for manipulating states, small version */ | 
					
						
							| 
									
										
										
										
											2016-04-18 16:41:30 +01:00
										 |  |  | #define states long
 | 
					
						
							|  |  |  | #define states1 states /* for later use in regexec() decision */
 | 
					
						
							|  |  |  | #define CLEAR(v) ((v) = 0)
 | 
					
						
							|  |  |  | #define SET0(v, n) ((v) &= ~((unsigned long)1 << (n)))
 | 
					
						
							|  |  |  | #define SET1(v, n) ((v) |= (unsigned long)1 << (n))
 | 
					
						
							|  |  |  | #define ISSET(v, n) (((v) & ((unsigned long)1 << (n))) != 0)
 | 
					
						
							|  |  |  | #define ASSIGN(d, s) ((d) = (s))
 | 
					
						
							|  |  |  | #define EQ(a, b) ((a) == (b))
 | 
					
						
							|  |  |  | #define STATEVARS long dummy /* dummy version */
 | 
					
						
							|  |  |  | #define STATESETUP(m, n)     /* nothing */
 | 
					
						
							|  |  |  | #define STATETEARDOWN(m)     /* nothing */
 | 
					
						
							|  |  |  | #define SETUP(v) ((v) = 0)
 | 
					
						
							|  |  |  | #define onestate long
 | 
					
						
							|  |  |  | #define INIT(o, n) ((o) = (unsigned long)1 << (n))
 | 
					
						
							|  |  |  | #define INC(o) ((o) <<= 1)
 | 
					
						
							|  |  |  | #define ISSTATEIN(v, o) (((v) & (o)) != 0)
 | 
					
						
							| 
									
										
										
										
											2001-04-09 19:54:03 +00:00
										 |  |  | /* some abbreviations; note that some of these know variable names! */ | 
					
						
							|  |  |  | /* do "if I'm here, I can also be there" etc without branches */ | 
					
						
							| 
									
										
										
										
											2016-04-18 16:41:30 +01:00
										 |  |  | #define FWD(dst, src, n) ((dst) |= ((unsigned long)(src) & (here)) << (n))
 | 
					
						
							|  |  |  | #define BACK(dst, src, n) ((dst) |= ((unsigned long)(src) & (here)) >> (n))
 | 
					
						
							|  |  |  | #define ISSETBACK(v, n) (((v) & ((unsigned long)here >> (n))) != 0)
 | 
					
						
							| 
									
										
										
										
											2001-04-09 19:54:03 +00:00
										 |  |  | /* function names */ | 
					
						
							| 
									
										
										
										
											2016-04-18 16:41:30 +01:00
										 |  |  | #define SNAMES /* engine.c looks after details */
 | 
					
						
							| 
									
										
										
										
											2001-04-09 19:54:03 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  | #include "engine.c"
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | /* now undo things */ | 
					
						
							| 
									
										
										
										
											2016-04-18 16:41:30 +01:00
										 |  |  | #undef states
 | 
					
						
							|  |  |  | #undef CLEAR
 | 
					
						
							|  |  |  | #undef SET0
 | 
					
						
							|  |  |  | #undef SET1
 | 
					
						
							|  |  |  | #undef ISSET
 | 
					
						
							|  |  |  | #undef ASSIGN
 | 
					
						
							|  |  |  | #undef EQ
 | 
					
						
							|  |  |  | #undef STATEVARS
 | 
					
						
							|  |  |  | #undef STATESETUP
 | 
					
						
							|  |  |  | #undef STATETEARDOWN
 | 
					
						
							|  |  |  | #undef SETUP
 | 
					
						
							|  |  |  | #undef onestate
 | 
					
						
							|  |  |  | #undef INIT
 | 
					
						
							|  |  |  | #undef INC
 | 
					
						
							|  |  |  | #undef ISSTATEIN
 | 
					
						
							|  |  |  | #undef FWD
 | 
					
						
							|  |  |  | #undef BACK
 | 
					
						
							|  |  |  | #undef ISSETBACK
 | 
					
						
							|  |  |  | #undef SNAMES
 | 
					
						
							| 
									
										
										
										
											2001-04-09 19:54:03 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  | /* macros for manipulating states, large version */ | 
					
						
							| 
									
										
										
										
											2016-04-18 16:41:30 +01:00
										 |  |  | #define states char *
 | 
					
						
							|  |  |  | #define CLEAR(v) memset(v, 0, m->g->nstates)
 | 
					
						
							|  |  |  | #define SET0(v, n) ((v)[n] = 0)
 | 
					
						
							|  |  |  | #define SET1(v, n) ((v)[n] = 1)
 | 
					
						
							|  |  |  | #define ISSET(v, n) ((v)[n])
 | 
					
						
							|  |  |  | #define ASSIGN(d, s) memcpy(d, s, m->g->nstates)
 | 
					
						
							|  |  |  | #define EQ(a, b) (memcmp(a, b, m->g->nstates) == 0)
 | 
					
						
							|  |  |  | #define STATEVARS                                                              \
 | 
					
						
							|  |  |  |   long vn;                                                                     \ | 
					
						
							|  |  |  |   char *space | 
					
						
							|  |  |  | #define STATESETUP(m, nv)                                                      \
 | 
					
						
							|  |  |  |   {                                                                            \ | 
					
						
							|  |  |  |     (m)->space = malloc((nv) * (m)->g->nstates);                               \ | 
					
						
							|  |  |  |     if ((m)->space == NULL)                                                    \ | 
					
						
							|  |  |  |       return (REG_ESPACE);                                                     \ | 
					
						
							|  |  |  |     (m)->vn = 0;                                                               \ | 
					
						
							|  |  |  |   } | 
					
						
							|  |  |  | #define STATETEARDOWN(m)                                                       \
 | 
					
						
							|  |  |  |   { free((m)->space); } | 
					
						
							|  |  |  | #define SETUP(v) ((v) = &m->space[m->vn++ * m->g->nstates])
 | 
					
						
							|  |  |  | #define onestate long
 | 
					
						
							|  |  |  | #define INIT(o, n) ((o) = (n))
 | 
					
						
							|  |  |  | #define INC(o) ((o)++)
 | 
					
						
							|  |  |  | #define ISSTATEIN(v, o) ((v)[o])
 | 
					
						
							| 
									
										
										
										
											2001-04-09 19:54:03 +00:00
										 |  |  | /* some abbreviations; note that some of these know variable names! */ | 
					
						
							|  |  |  | /* do "if I'm here, I can also be there" etc without branches */ | 
					
						
							| 
									
										
										
										
											2016-04-18 16:41:30 +01:00
										 |  |  | #define FWD(dst, src, n) ((dst)[here + (n)] |= (src)[here])
 | 
					
						
							|  |  |  | #define BACK(dst, src, n) ((dst)[here - (n)] |= (src)[here])
 | 
					
						
							|  |  |  | #define ISSETBACK(v, n) ((v)[here - (n)])
 | 
					
						
							| 
									
										
										
										
											2001-04-09 19:54:03 +00:00
										 |  |  | /* function names */ | 
					
						
							| 
									
										
										
										
											2016-04-18 16:41:30 +01:00
										 |  |  | #define LNAMES /* flag */
 | 
					
						
							| 
									
										
										
										
											2001-04-09 19:54:03 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  | #include "engine.c"
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | /*
 | 
					
						
							|  |  |  |  - regexec - interface for matching | 
					
						
							|  |  |  |  = extern int regexec(const regex_t *, const char *, size_t, \ | 
					
						
							|  |  |  |  =					regmatch_t [], int); | 
					
						
							|  |  |  |  = #define	REG_NOTBOL	00001 | 
					
						
							|  |  |  |  = #define	REG_NOTEOL	00002 | 
					
						
							|  |  |  |  = #define	REG_STARTEND	00004 | 
					
						
							|  |  |  |  = #define	REG_TRACE	00400	// tracing of execution
 | 
					
						
							|  |  |  |  = #define	REG_LARGE	01000	// force large representation
 | 
					
						
							|  |  |  |  = #define	REG_BACKR	02000	// force use of backref code
 | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * We put this here so we can exploit knowledge of the state representation | 
					
						
							|  |  |  |  * when choosing which matcher to call.  Also, by this point the matchers | 
					
						
							|  |  |  |  * have been prototyped. | 
					
						
							|  |  |  |  */ | 
					
						
							| 
									
										
										
										
											2016-04-18 16:41:30 +01:00
										 |  |  | int /* 0 success, REG_NOMATCH failure */ | 
					
						
							|  |  |  |     yap_regexec(preg, string, nmatch, pmatch, eflags) const regex_t *preg; | 
					
						
							| 
									
										
										
										
											2001-04-09 19:54:03 +00:00
										 |  |  | const char *string; | 
					
						
							|  |  |  | size_t nmatch; | 
					
						
							|  |  |  | regmatch_t pmatch[]; | 
					
						
							|  |  |  | int eflags; | 
					
						
							|  |  |  | { | 
					
						
							| 
									
										
										
										
											2016-04-18 16:41:30 +01:00
										 |  |  |   register struct re_guts *g = preg->re_g; | 
					
						
							| 
									
										
										
										
											2001-04-09 19:54:03 +00:00
										 |  |  | #ifdef REDEBUG
 | 
					
						
							| 
									
										
										
										
											2016-04-18 16:41:30 +01:00
										 |  |  | #define GOODFLAGS(f) (f)
 | 
					
						
							| 
									
										
										
										
											2001-04-09 19:54:03 +00:00
										 |  |  | #else
 | 
					
						
							| 
									
										
										
										
											2016-04-18 16:41:30 +01:00
										 |  |  | #define GOODFLAGS(f) ((f) & (REG_NOTBOL | REG_NOTEOL | REG_STARTEND))
 | 
					
						
							| 
									
										
										
										
											2001-04-09 19:54:03 +00:00
										 |  |  | #endif
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2016-04-18 16:41:30 +01:00
										 |  |  |   if (preg->re_magic != MAGIC1 || g->magic != MAGIC2) | 
					
						
							|  |  |  |     return (REG_BADPAT); | 
					
						
							|  |  |  |   assert(!(g->iflags & BAD)); | 
					
						
							|  |  |  |   if (g->iflags & BAD) /* backstop for no-debug case */ | 
					
						
							|  |  |  |     return (REG_BADPAT); | 
					
						
							|  |  |  |   eflags = GOODFLAGS(eflags); | 
					
						
							| 
									
										
										
										
											2001-04-09 19:54:03 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2016-04-18 16:41:30 +01:00
										 |  |  |   if (g->nstates <= CHAR_BIT * sizeof(states1) && !(eflags & REG_LARGE)) | 
					
						
							|  |  |  |     return (smatcher(g, (char *)string, nmatch, pmatch, eflags)); | 
					
						
							|  |  |  |   else | 
					
						
							|  |  |  |     return (lmatcher(g, (char *)string, nmatch, pmatch, eflags)); | 
					
						
							| 
									
										
										
										
											2001-04-09 19:54:03 +00:00
										 |  |  | } | 
					
						
							| 
									
										
										
										
											2016-04-18 16:41:30 +01:00
										 |  |  | 
 | 
					
						
							|  |  |  | #endif
 |