Guido van Rossum | b700df9 | 2000-03-31 14:59:30 +0000 | [diff] [blame] | 1 | /* |
| 2 | * Secret Labs' Regular Expression Engine |
| 3 | * $Id$ |
| 4 | * |
| 5 | * simple regular expression matching engine |
| 6 | * |
| 7 | * Copyright (c) 1997-2000 by Secret Labs AB. All rights reserved. |
| 8 | * |
| 9 | * See the _sre.c file for information on usage and redistribution. |
| 10 | */ |
| 11 | |
| 12 | #ifndef SRE_INCLUDED |
| 13 | #define SRE_INCLUDED |
| 14 | |
| 15 | #include "sre_constants.h" |
| 16 | |
/*
 * Type used for a single code word.  Any replacement type must be at
 * least as wide as unsigned short.
 */
#define SRE_CODE unsigned short
| 19 | |
Guido van Rossum | b700df9 | 2000-03-31 14:59:30 +0000 | [diff] [blame] | 20 | typedef struct { |
| 21 | PyObject_HEAD |
| 22 | PyObject* code; /* link to the code string object */ |
Guido van Rossum | b700df9 | 2000-03-31 14:59:30 +0000 | [diff] [blame] | 23 | int groups; |
| 24 | PyObject* groupindex; |
Jeremy Hylton | b1aa195 | 2000-06-01 17:39:12 +0000 | [diff] [blame] | 25 | /* compatibility */ |
| 26 | PyObject* pattern; /* pattern source (or None) */ |
| 27 | int flags; /* flags used when compiling pattern source */ |
Guido van Rossum | b700df9 | 2000-03-31 14:59:30 +0000 | [diff] [blame] | 28 | } PatternObject; |
| 29 | |
/*
 * Casts o to PatternObject*, applies PyString_AS_STRING to its code
 * field, and yields the result as a void*.
 */
#define PatternObject_GetCode(o) \
    ((void*) PyString_AS_STRING(((PatternObject*)(o))->code))
Guido van Rossum | b700df9 | 2000-03-31 14:59:30 +0000 | [diff] [blame] | 32 | |
| 33 | typedef struct { |
| 34 | PyObject_HEAD |
| 35 | PyObject* string; /* link to the target string */ |
| 36 | PatternObject* pattern; /* link to the regex (pattern) object */ |
| 37 | int groups; /* number of groups (start/end marks) */ |
| 38 | int mark[2]; |
| 39 | } MatchObject; |
| 40 | |
/*
 * Pointer to a hook function that takes an unsigned int (ch) and returns
 * an unsigned int.
 * NOTE(review): by its name this maps a character code to lower case --
 * confirm against the implementations installed by the engine.
 */
typedef unsigned int (*SRE_TOLOWER_HOOK)(unsigned int ch);
| 42 | |
| 43 | typedef struct { |
| 44 | /* stack elements */ |
| 45 | SRE_CODE* pattern; |
| 46 | void* ptr; |
| 47 | } SRE_STACK; |
| 48 | |
Jeremy Hylton | b1aa195 | 2000-06-01 17:39:12 +0000 | [diff] [blame] | 49 | typedef struct { |
| 50 | /* string pointers */ |
| 51 | void* ptr; /* current position (also end of current slice) */ |
| 52 | void* beginning; /* start of original string */ |
| 53 | void* start; /* start of current slice */ |
| 54 | void* end; /* end of original string */ |
| 55 | /* character size */ |
| 56 | int charsize; |
| 57 | /* registers */ |
Fredrik Lundh | 102f3ad | 2000-06-29 08:55:54 +0000 | [diff] [blame] | 58 | int lastmark; |
Jeremy Hylton | b1aa195 | 2000-06-01 17:39:12 +0000 | [diff] [blame] | 59 | void* mark[64]; /* FIXME: <fl> should be dynamically allocated! */ |
| 60 | /* backtracking stack */ |
Fredrik Lundh | 102f3ad | 2000-06-29 08:55:54 +0000 | [diff] [blame] | 61 | SRE_STACK* stack; |
Jeremy Hylton | b1aa195 | 2000-06-01 17:39:12 +0000 | [diff] [blame] | 62 | int stacksize; |
| 63 | int stackbase; |
Fredrik Lundh | 102f3ad | 2000-06-29 08:55:54 +0000 | [diff] [blame] | 64 | /* hooks */ |
Fredrik Lundh | b389df3 | 2000-06-29 12:48:37 +0000 | [diff] [blame^] | 65 | SRE_TOLOWER_HOOK lower; |
Jeremy Hylton | b1aa195 | 2000-06-01 17:39:12 +0000 | [diff] [blame] | 66 | } SRE_STATE; |
Guido van Rossum | b700df9 | 2000-03-31 14:59:30 +0000 | [diff] [blame] | 67 | |
Jeremy Hylton | b1aa195 | 2000-06-01 17:39:12 +0000 | [diff] [blame] | 68 | typedef struct { |
Fredrik Lundh | 102f3ad | 2000-06-29 08:55:54 +0000 | [diff] [blame] | 69 | /* search helper */ |
Jeremy Hylton | b1aa195 | 2000-06-01 17:39:12 +0000 | [diff] [blame] | 70 | PyObject_HEAD |
| 71 | PyObject* pattern; |
| 72 | PyObject* string; |
| 73 | SRE_STATE state; |
| 74 | } CursorObject; |
| 75 | |
| 76 | #endif |