X-Git-Url: http://git.shadowcat.co.uk/gitweb/gitweb.cgi?a=blobdiff_plain;f=regexp.h;h=2f7aa02b3d393a019b8274f0cbdb94c3de6fdec4;hb=0a5d5e8be390bda2f9b7684490082d428228d28f;hp=33d9e3250e8a0c6fce8879e501ed16c8e8f23728;hpb=55204971972392ce5a252fbbd6d78b1c48ed70e3;p=p5sagit%2Fp5-mst-13.2.git diff --git a/regexp.h b/regexp.h index 33d9e32..2f7aa02 100644 --- a/regexp.h +++ b/regexp.h @@ -1,3 +1,6 @@ +/* regexp.h + */ + /* * Definitions etc. for regexp(3) routines. * @@ -5,46 +8,64 @@ * not the System V one. */ -/* $RCSfile: regexp.h,v $$Revision: 4.0.1.2 $$Date: 91/11/05 18:24:31 $ - * - * $Log: regexp.h,v $ - * Revision 4.0.1.2 91/11/05 18:24:31 lwall - * patch11: minimum match length calculation in regexp is now cumulative - * patch11: initial .* in pattern had dependency on value of $* - * - * Revision 4.0.1.1 91/06/07 11:51:18 lwall - * patch4: new copyright notice - * patch4: // wouldn't use previous pattern if it started with a null character - * patch4: $` was busted inside s/// - * - * Revision 4.0 91/03/20 01:39:23 lwall - * 4.0 baseline. - * - */ + +struct regnode { + U8 flags; + U8 type; + U16 next_off; +}; + +typedef struct regnode regnode; typedef struct regexp { + I32 refcnt; char **startp; char **endp; - STR *regstart; /* Internal use only. */ - char *regstclass; - STR *regmust; /* Internal use only. */ - int regback; /* Can regmust locate first try? */ - int minlen; /* mininum possible length of $& */ - int prelen; /* length of precomp */ + regnode *regstclass; + I32 minlen; /* mininum possible length of $& */ + I32 prelen; /* length of precomp */ + U32 nparens; /* number of parentheses */ + U32 lastparen; /* last paren matched */ char *precomp; /* pre-compilation regular expression */ char *subbase; /* saved string so \digit works forever */ char *subbeg; /* same, but not responsible for allocation */ char *subend; /* end of subbase */ - char reganch; /* Internal use only. */ - char do_folding; /* do case-insensitive match? */ - char lastparen; /* last paren matched */ - char nparens; /* number of parentheses */ - char program[1]; /* Unwarranted chumminess with compiler. */ + U16 naughty; /* how exponential is this pattern? */ + U16 reganch; /* Internal use only + + Tainted information used by regexec? */ + SV *anchored_substr; /* Substring at fixed position wrt start. */ + I32 anchored_offset; /* Position of it. */ + SV *float_substr; /* Substring at variable position wrt start. */ + I32 float_min_offset; /* Minimal position of it. */ + I32 float_max_offset; /* Maximal position of it. */ + SV *check_substr; /* Substring to check before matching. */ + I32 check_offset_min; /* Offset of the above. */ + I32 check_offset_max; /* Offset of the above. */ + struct reg_data *data; /* Additional data. */ + regnode program[1]; /* Unwarranted chumminess with compiler. */ } regexp; -#define ROPT_ANCH 1 -#define ROPT_SKIP 2 -#define ROPT_IMPLICIT 4 +#define ROPT_ANCH (ROPT_ANCH_BOL|ROPT_ANCH_MBOL|ROPT_ANCH_GPOS) +#define ROPT_ANCH_SINGLE (ROPT_ANCH_BOL|ROPT_ANCH_GPOS) +#define ROPT_ANCH_BOL 1 +#define ROPT_ANCH_MBOL 2 +#define ROPT_ANCH_GPOS 4 +#define ROPT_SKIP 8 +#define ROPT_IMPLICIT 0x10 /* Converted .* to ^.* */ +#define ROPT_NOSCAN 0x20 /* Check-string always at start. */ +#define ROPT_GPOS_SEEN 0x40 +#define ROPT_CHECK_ALL 0x80 +#define ROPT_LOOKBEHIND_SEEN 0x100 + +#define ROPT_TAINTED_SEEN 0x8000 + +#define RX_MATCH_TAINTED(prog) ((prog)->reganch & ROPT_TAINTED_SEEN) +#define RX_MATCH_TAINTED_SET(prog, t) ((t) \ + ? ((prog)->reganch |= ROPT_TAINTED_SEEN) \ + : ((prog)->reganch &= ~ROPT_TAINTED_SEEN)) + +#define REXEC_COPY_STR 1 /* Need to copy the string. */ +#define REXEC_CHECKED 2 /* check_substr already checked. */ -regexp *regcomp(); -int regexec(); +#define ReREFCNT_inc(re) ((re && re->refcnt++), re) +#define ReREFCNT_dec(re) pregfree(re)