1 /* $RCSfile: toke.c,v $$Revision: 4.1 $$Date: 92/08/07 18:28:39 $
3 * Copyright (c) 1991, Larry Wall
5 * You may distribute under the terms of either the GNU General Public
6 * License or the Artistic License, as specified in the README file.
9 * Revision 4.1 92/08/07 18:28:39 lwall
11 * Revision 4.0.1.7 92/06/11 21:16:30 lwall
12 * patch34: expect incorrectly set to indicate start of program or block
14 * Revision 4.0.1.6 92/06/08 16:03:49 lwall
15 * patch20: an EXPR may now start with a bareword
16 * patch20: print $fh EXPR can now expect term rather than operator in EXPR
17 * patch20: added ... as variant on ..
18 * patch20: new warning on spurious backslash
19 * patch20: new warning on missing $ for foreach variable
20 * patch20: "foo"x1024 now legal without space after x
21 * patch20: new warning on print accidentally used as function
22 * patch20: tr/stuff// wasn't working right
23 * patch20: 2. now eats the dot
24 * patch20: <@ARGV> now notices @ARGV
25 * patch20: tr/// now lets you say \-
27 * Revision 4.0.1.5 91/11/11 16:45:51 lwall
28 * patch19: default arg for shift was wrong after first subroutine definition
30 * Revision 4.0.1.4 91/11/05 19:02:48 lwall
31 * patch11: \x and \c were subject to double interpretation in regexps
32 * patch11: prepared for ctype implementations that don't define isascii()
33 * patch11: nested list operators could miscount parens
34 * patch11: once-thru blocks didn't display right in the debugger
35 * patch11: sort eval "whatever" didn't work
36 * patch11: underscore is now allowed within literal octal and hex numbers
38 * Revision 4.0.1.3 91/06/10 01:32:26 lwall
39 * patch10: m'$foo' now treats string as single quoted
40 * patch10: certain pattern optimizations were botched
42 * Revision 4.0.1.2 91/06/07 12:05:56 lwall
43 * patch4: new copyright notice
44 * patch4: debugger lost track of lines in eval
45 * patch4: //o and s///o now optimize themselves fully at runtime
46 * patch4: added global modifier for pattern matches
48 * Revision 4.0.1.1 91/04/12 09:18:18 lwall
49 * patch1: perl -de "print" wouldn't stop at the first statement
51 * Revision 4.0 91/03/20 01:42:14 lwall
60 static void set_csh();
62 /* The following are arranged oddly so that the guard on the switch statement
63 * can get by with a single comparison (if the compiler is smart enough).
67 #define LEX_INTERPNORMAL 7 /* handled by the same yylex case as LEX_NORMAL */
68 #define LEX_INTERPCASEMOD 6 /* yylex requires bufptr at buffer end or at a backslash here */
69 #define LEX_INTERPSTART 5 /* buffer end => sublex_done(); otherwise moves on to LEX_INTERPNORMAL */
70 #define LEX_INTERPEND 4 /* entered from LEX_INTERPNORMAL when lex_brackets drops to 0 */
71 #define LEX_INTERPENDMAYBE 3 /* intuit_more() decides whether the expression continues */
72 #define LEX_INTERPCONCAT 2 /* scanning constant text with scan_const() */
73 #define LEX_INTERPCONST 1 /* NOTE(review): no use visible in this excerpt -- confirm */
74 #define LEX_KNOWNEXT 0 /* next token is already queued in nextval[]/nexttype[] */
/* File-scope tokener state; saved and restored around nested (sub)lexing. */
76 static U32 lex_state = LEX_NORMAL; /* current lexer state, one of the LEX_* values */
77 static U32 lex_defer; /* state to resume after a LEX_KNOWNEXT token is returned */
78 static I32 lex_brackets; /* bracket count */
79 static I32 lex_fakebrack; /* outer bracket is mere delimiter */
80 static I32 lex_casemods; /* casemod count */
81 static I32 lex_dojoin; /* doing an array interpolation (item starts with '@') */
82 static I32 lex_starts; /* how many interps done on level */
83 static SV * lex_stuff; /* runtime pattern from m// or s/// */
84 static SV * lex_repl; /* runtime replacement from s/// */
85 static OP * lex_op; /* extra info to pass back on op */
86 static I32 lex_inpat; /* in pattern $) and $| are special */
87 static I32 lex_inwhat; /* what kind of quoting are we in (an op type, e.g. OP_MATCH, OP_SUBST, OP_TRANS) */
89 /* What we know when we're in LEX_KNOWNEXT state. */
90 static YYSTYPE nextval[5]; /* value of next token, if any */
91 static I32 nexttype[5]; /* type of next token */
92 static I32 nexttoke = 0; /* index into nextval[]/nexttype[] for the queued token */
105 #include "keywords.h"
/* CLINE lowers copline to the current cop's line number when that is smaller,
 * and evaluates to the resulting copline. */
112 #define CLINE (copline = (curcop->cop_line < copline ? curcop->cop_line : copline))
/* PERL_META and META both yield c with bit 0x80 (128) set; the expansions are identical. */
115 #define PERL_META(c) ((c) | 128)
117 #define META(c) ((c) | 128)
/*
 * Token-return helpers.  Each macro expands to a `return` statement that,
 * through the comma operator:
 *   - stores an op number in yylval.ival (only the macros taking `f`),
 *   - sets `expect` for the token that follows (every macro except TOKEN),
 *   - records the scan position with bufptr = s,
 *   - yields the token type cast to int.
 * TERM additionally evaluates CLINE first.
 * NOTE(review): macro arguments are used unparenthesized, so pass only
 * simple expressions (identifiers, constants, function calls).
 */
120 #define TOKEN(retval) return (bufptr = s,(int)retval)
121 #define OPERATOR(retval) return (expect = XTERM,bufptr = s,(int)retval)
122 #define PREBLOCK(retval) return (expect = XBLOCK,bufptr = s,(int)retval)
123 #define PREREF(retval) return (expect = XREF,bufptr = s,(int)retval)
124 #define TERM(retval) return (CLINE, expect = XOPERATOR,bufptr = s,(int)retval)
125 #define LOOPX(f) return(yylval.ival=f,expect = XOPERATOR,bufptr = s,(int)LOOPEX)
126 #define FTST(f) return(yylval.ival=f,expect = XTERM,bufptr = s,(int)UNIOP)
127 #define FUN0(f) return(yylval.ival = f,expect = XOPERATOR,bufptr = s,(int)FUNC0)
128 #define FUN1(f) return(yylval.ival = f,expect = XOPERATOR,bufptr = s,(int)FUNC1)
129 #define BOop(f) return(yylval.ival=f,expect = XTERM,bufptr = s,(int)BITOROP)
130 #define BAop(f) return(yylval.ival=f,expect = XTERM,bufptr = s,(int)BITANDOP)
131 #define SHop(f) return(yylval.ival=f,expect = XTERM,bufptr = s,(int)SHIFTOP)
132 #define PWop(f) return(yylval.ival=f,expect = XTERM,bufptr = s,(int)POWOP)
133 #define PMop(f) return(yylval.ival=f,expect = XTERM,bufptr = s,(int)MATCHOP)
134 #define Aop(f) return(yylval.ival=f,expect = XTERM,bufptr = s,(int)ADDOP)
135 #define Mop(f) return(yylval.ival=f,expect = XTERM,bufptr = s,(int)MULOP)
136 #define Eop(f) return(yylval.ival=f,expect = XTERM,bufptr = s,(int)EQOP)
137 #define Rop(f) return(yylval.ival=f,expect = XTERM,bufptr = s,(int)RELOP)
139 /* This bit of chicanery makes a unary function followed by
140 * a parenthesis into a function with one argument, highest precedence.
142 #define UNI(f) return(yylval.ival = f, \
145 last_uni = oldbufptr, \
146 (*s == '(' || (s = skipspace(s), *s == '(') ? (int)FUNC1 : (int)UNIOP) )
148 #define UNIBRACK(f) return(yylval.ival = f, \
150 last_uni = oldbufptr, \
151 (*s == '(' || (s = skipspace(s), *s == '(') ? (int)FUNC1 : (int)UNIOP) )
153 /* This does similarly for list operators */
154 #define LOP(f) return(yylval.ival = f, \
158 last_lop = oldbufptr, \
159 (*s == '(' || (s = skipspace(s), *s == '(') ? (int)FUNC : (int)LSTOP) )
161 /* grandfather return to old style */
162 #define OLDLOP(f) return(yylval.ival=f,expect = XTERM,bufptr = s,(int)LSTOP)
166 while (s < bufend && isALNUM(*s)) \
173 lex_state = LEX_NORMAL;
188 oldoldbufptr = oldbufptr = bufptr = SvPVn(linestr);
189 bufend = bufptr + SvCUR(linestr);
196 while (s < bufend && isSPACE(*s))
206 if (oldoldbufptr != last_uni)
208 while (isSPACE(*last_uni))
210 for (s = last_uni; isALNUM(*s) || *s == '-'; s++) ;
213 warn("Warning: Use of \"%s\" without parens is ambiguous", last_uni);
221 #define UNI(f) return uni(f,s)
222 #define LOP(f) return lop(f,s)
232 last_uni = oldbufptr;
251 last_uni = oldbufptr;
261 #endif /* CRIPPLED_CC */
267 nexttype[nexttoke] = type;
269 if (lex_state != LEX_KNOWNEXT) {
270 lex_defer = lex_state;
271 lex_state = LEX_KNOWNEXT;
283 if (isIDFIRST(*s) || *s == '\'') {
286 while (s < bufend && *s == '\'' && isIDFIRST(s[1])) {
290 nextval[nexttoke].opval = (OP*)newSVOP(OP_CONST, 0, newSVpv(tokenbuf,0));
301 nextval[nexttoke].opval = (OP*)newSVOP(OP_CONST, 0, newSVpv(s,0));
319 send = s + SvCUR(sv);
320 while (s < send && *s != '\\')
325 delim = SvSTORAGE(sv);
328 if (s + 1 < send && (s[1] == '\\' || s[1] == delim))
329 s++; /* all that, just for this */
334 SvCUR_set(sv, d - SvPV(sv));
342 register I32 op_type = yylval.ival;
345 if (op_type == OP_NULL) {
346 yylval.opval = lex_op;
350 if (op_type == OP_CONST || op_type == OP_READLINE) {
351 yylval.opval = (OP*)newSVOP(op_type, 0, q(lex_stuff));
358 SAVEINT(lex_brackets);
359 SAVEINT(lex_fakebrack);
360 SAVEINT(lex_casemods);
365 SAVEINT(curcop->cop_line);
368 SAVESPTR(oldoldbufptr);
374 bufend = bufptr = oldbufptr = oldoldbufptr = SvPVn(linestr);
375 bufend += SvCUR(linestr);
382 lex_state = LEX_INTERPCONCAT;
383 curcop->cop_line = multi_start;
385 lex_inwhat = op_type;
386 if (op_type == OP_MATCH || op_type == OP_SUBST)
393 yylval.opval = lex_op;
406 yylval.opval = (OP*)newSVOP(OP_CONST, 0, NEWSV(94,1));
410 if (lex_casemods) { /* oops, we've got some unbalanced "parens": case modifiers still pending */
411 lex_state = LEX_INTERPCASEMOD;
416 /* Is there a right-hand side to take care of? */
417 if (lex_repl && (lex_inwhat == OP_SUBST || lex_inwhat == OP_TRANS)) {
420 bufend = bufptr = oldbufptr = oldoldbufptr = SvPVn(linestr);
421 bufend += SvCUR(linestr);
427 if (SvCOMPILED(lex_repl)) {
428 lex_state = LEX_INTERPNORMAL;
432 lex_state = LEX_INTERPCONCAT;
438 bufend = SvPVn(linestr);
439 bufend += SvCUR(linestr);
449 register char *send = bufend;
450 SV *sv = NEWSV(93, send - start);
451 register char *s = start;
452 register char *d = SvPV(sv);
453 char delim = SvSTORAGE(linestr);
454 bool dorange = FALSE;
458 ? "\\.^$@dDwWsSbB+*?|()-nrtfeaxc0123456789[{]}"
459 : (lex_inwhat & OP_TRANS)
463 while (s < send || dorange) {
464 if (lex_inwhat == OP_TRANS) {
469 SvGROW(sv, SvLEN(sv) + 256);
473 for (i = (*d & 0377); i <= max; i++)
478 else if (*s == '-' && s+1 < send && s != start) {
485 else if (*s == '$') {
486 if (!lex_inpat) /* not a regexp, so $ must be var */
488 if (s + 1 < send && s[1] != ')' && s[1] != '|')
489 break; /* in regexp, $ might be tail anchor */
491 if (*s == '\\' && s+1 < send) {
497 if (*s && index(leave, *s)) {
502 if (lex_inwhat == OP_SUBST && !lex_inpat &&
503 isDIGIT(*s) && !isDIGIT(s[1]))
508 if (lex_inwhat != OP_TRANS && *s && index("lLuUE", *s)) {
514 if (lex_inwhat == OP_TRANS) {
522 case '0': case '1': case '2': case '3':
523 case '4': case '5': case '6': case '7':
524 *d++ = scan_oct(s, 3, &len);
528 *d++ = scan_hex(++s, 2, &len);
566 SvCUR_set(sv, d - SvPV(sv));
569 if (SvCUR(sv) + 5 < SvLEN(sv)) {
570 SvLEN_set(sv, SvCUR(sv) + 1);
571 Renew(SvPV(sv), SvLEN(sv), char);
574 yylval.opval = (OP*)newSVOP(OP_CONST, 0, sv);
580 /* This is the one truly awful dwimmer necessary to conflate C and sed. */
587 if (*s == '-' && s[1] == '>' && (s[2] == '[' || s[2] == '{'))
589 if (*s != '{' && *s != '[')
594 /* In a pattern, so maybe we have {n,m}. */
611 /* On the other hand, maybe we have a character class */
614 if (*s == ']' || *s == '^')
617 int weight = 2; /* let's weigh the evidence */
619 unsigned char un_char = 0, last_un_char;
620 char *send = index(s,']');
623 if (!send) /* has to be an expression */
629 else if (isDIGIT(*s)) {
631 if (isDIGIT(s[1]) && s[2] == ']')
637 for (; s < send; s++) {
638 last_un_char = un_char;
639 un_char = (unsigned char)*s;
644 weight -= seen[un_char] * 10;
646 scan_ident(s,send,tmpbuf,FALSE);
647 if (strlen(tmpbuf) > 1 && gv_fetchpv(tmpbuf,FALSE))
652 else if (*s == '$' && s[1] &&
653 index("[#!%*<>()-=",s[1])) {
654 if (/*{*/ index("])} =",s[2]))
663 if (index("wds]",s[1]))
665 else if (seen['\''] || seen['"'])
667 else if (index("rnftbxcav",s[1]))
669 else if (isDIGIT(s[1])) {
671 while (s[1] && isDIGIT(s[1]))
681 if (index("aA01! ",last_un_char))
683 if (index("zZ79~",s[1]))
687 if (!isALNUM(last_un_char) && !index("$@&",last_un_char) &&
688 isALPHA(*s) && s[1] && isALPHA(s[1])) {
693 if (keyword(tmpbuf, d - tmpbuf))
696 if (un_char == last_un_char + 1)
698 weight -= seen[un_char];
703 if (weight >= 0) /* probably a character class */
716 extern int yychar; /* last token */
720 case LEX_NORMAL: /* Some compilers will produce faster */
721 case LEX_INTERPNORMAL: /* code if we comment these out. */
727 yylval = nextval[nexttoke];
729 lex_state = lex_defer;
730 return(nexttype[nexttoke]);
732 case LEX_INTERPCASEMOD:
734 if (bufptr != bufend && *bufptr != '\\')
735 fatal("panic: INTERPCASEMOD");
737 if (bufptr == bufend || bufptr[1] == 'E') {
738 if (lex_casemods <= 1) {
739 if (bufptr != bufend)
741 lex_state = LEX_INTERPSTART;
751 if (strnEQ(s, "L\\u", 3) || strnEQ(s, "U\\l", 3))
752 tmp = *s, *s = s[2], s[2] = tmp; /* misordered... */
754 lex_state = LEX_INTERPCONCAT;
755 nextval[nexttoke].ival = 0;
758 nextval[nexttoke].ival = OP_LCFIRST;
760 nextval[nexttoke].ival = OP_UCFIRST;
762 nextval[nexttoke].ival = OP_LC;
764 nextval[nexttoke].ival = OP_UC;
766 fatal("panic: yylex");
777 case LEX_INTERPSTART:
778 if (bufptr == bufend)
779 return sublex_done();
781 lex_dojoin = (*bufptr == '@');
782 lex_state = LEX_INTERPNORMAL;
784 nextval[nexttoke].ival = 0;
787 nextval[nexttoke].ival = 0;
789 nextval[nexttoke].ival = 0;
791 nextval[nexttoke].ival = OP_JOIN; /* emulate join($", ...) */
802 case LEX_INTERPENDMAYBE:
803 if (intuit_more(bufptr)) {
804 lex_state = LEX_INTERPNORMAL; /* false alarm, more expr */
812 lex_state = LEX_INTERPCONCAT;
816 case LEX_INTERPCONCAT:
819 fatal("panic: INTERPCONCAT");
821 if (bufptr == bufend)
822 return sublex_done();
824 if (SvSTORAGE(linestr) == '\'') {
825 SV *sv = newSVsv(linestr);
828 yylval.opval = (OP*)newSVOP(OP_CONST, 0, sv);
832 s = scan_const(bufptr);
834 lex_state = LEX_INTERPCASEMOD;
836 lex_state = LEX_INTERPSTART;
840 nextval[nexttoke] = yylval;
854 oldoldbufptr = oldbufptr;
860 fprintf(stderr,"Tokener at %s",s);
862 fprintf(stderr,"Tokener at %s\n",s);
866 if ((*s & 127) == '}') {
871 warn("Unrecognized character \\%03o ignored", *s++ & 255);
877 if ((*s & 127) == '}') {
882 warn("Unrecognized character \\%03o ignored", *s++ & 255);
886 goto fake_eof; /* emulate EOF on ^D or ^Z */
891 goto retry; /* ignore stray nulls */
896 sv_setpv(linestr,"");
898 char *pdb = getenv("PERLDB");
900 sv_catpv(linestr, pdb ? pdb : "require 'perldb.pl'");
901 sv_catpv(linestr, ";");
903 sv_catpv(linestr, "&BEGIN if defined &BEGIN;");
904 if (minus_n || minus_p) {
905 sv_catpv(linestr, "LINE: while (<>) {");
907 sv_catpv(linestr,"chop;");
909 sv_catpv(linestr,"@F=split(' ');");
911 oldoldbufptr = oldbufptr = s = SvPVn(linestr);
912 bufend = SvPV(linestr) + SvCUR(linestr);
917 #endif /* CRYPTSCRIPT */
919 if ((s = sv_gets(linestr, rsfp, 0)) == Nullch) {
923 (void)my_pclose(rsfp);
924 else if ((FILE*)rsfp == stdin)
930 if (minus_n || minus_p) {
931 sv_setpv(linestr,minus_p ? ";}continue{print" : "");
932 sv_catpv(linestr,";}");
933 oldoldbufptr = oldbufptr = s = SvPVn(linestr);
934 bufend = SvPV(linestr) + SvCUR(linestr);
935 minus_n = minus_p = 0;
938 oldoldbufptr = oldbufptr = s = SvPVn(linestr);
939 sv_setpv(linestr,"");
940 TOKEN(';'); /* not infinite loop because rsfp is NULL now */
942 if (doextract && *SvPV(linestr) == '#')
946 oldoldbufptr = oldbufptr = bufptr = s;
948 SV *sv = NEWSV(85,0);
950 sv_setsv(sv,linestr);
951 av_store(GvAV(curcop->cop_filegv),(I32)curcop->cop_line,sv);
953 bufend = SvPV(linestr) + SvCUR(linestr);
954 if (curcop->cop_line == 1) {
955 while (s < bufend && isSPACE(*s))
957 if (*s == ':') /* for csh's that have to exec sh scripts */
959 if (*s == '#' && s[1] == '!') {
960 if (!in_eval && !instr(s,"perl") && instr(origargv[0],"perl")) {
968 while (s < bufend && !isSPACE(*s))
971 while (s < bufend && isSPACE(*s))
974 Newz(899,newargv,origargc+3,char*);
976 while (s < bufend && !isSPACE(*s))
979 Copy(origargv+1, newargv+2, origargc+1, char*);
985 fatal("Can't exec %s", cmd);
987 if (d = instr(s, "perl -")) {
990 while (d = moreswitches(d)) ;
994 if (in_format && lex_brackets <= 1) {
995 s = scan_formline(s);
1001 case ' ': case '\t': case '\f': case '\r': case 013:
1005 if (preprocess && s == SvPVn(linestr) &&
1006 s[1] == ' ' && (isDIGIT(s[2]) || strnEQ(s+2,"line ",5)) ) {
1007 while (*s && !isDIGIT(*s))
1009 curcop->cop_line = atoi(s)-1;
1013 s[strlen(s)-1] = '\0'; /* wipe out newline */
1016 s[strlen(s)-1] = '\0'; /* wipe out trailing quote */
1019 curcop->cop_filegv = gv_fetchfile(s);
1021 curcop->cop_filegv = gv_fetchfile(origfilename);
1022 oldoldbufptr = oldbufptr = s = SvPVn(linestr);
1026 if (lex_state != LEX_NORMAL || (in_eval && !rsfp)) {
1028 while (s < d && *s != '\n')
1033 if (in_format && lex_brackets <= 1) {
1034 s = scan_formline(s);
1046 if (s[1] && isALPHA(s[1]) && !isALNUM(s[2])) {
1048 last_uni = oldbufptr;
1050 case 'r': FTST(OP_FTEREAD);
1051 case 'w': FTST(OP_FTEWRITE);
1052 case 'x': FTST(OP_FTEEXEC);
1053 case 'o': FTST(OP_FTEOWNED);
1054 case 'R': FTST(OP_FTRREAD);
1055 case 'W': FTST(OP_FTRWRITE);
1056 case 'X': FTST(OP_FTREXEC);
1057 case 'O': FTST(OP_FTROWNED);
1058 case 'e': FTST(OP_FTIS);
1059 case 'z': FTST(OP_FTZERO);
1060 case 's': FTST(OP_FTSIZE);
1061 case 'f': FTST(OP_FTFILE);
1062 case 'd': FTST(OP_FTDIR);
1063 case 'l': FTST(OP_FTLINK);
1064 case 'p': FTST(OP_FTPIPE);
1065 case 'S': FTST(OP_FTSOCK);
1066 case 'u': FTST(OP_FTSUID);
1067 case 'g': FTST(OP_FTSGID);
1068 case 'k': FTST(OP_FTSVTX);
1069 case 'b': FTST(OP_FTBLK);
1070 case 'c': FTST(OP_FTCHR);
1071 case 't': FTST(OP_FTTTY);
1072 case 'T': FTST(OP_FTTEXT);
1073 case 'B': FTST(OP_FTBINARY);
1074 case 'M': gv_fetchpv("\024",TRUE); FTST(OP_FTMTIME);
1075 case 'A': gv_fetchpv("\024",TRUE); FTST(OP_FTATIME);
1076 case 'C': gv_fetchpv("\024",TRUE); FTST(OP_FTCTIME);
1085 if (expect == XOPERATOR)
1090 else if (*s == '>') {
1093 if (isIDFIRST(*s)) {
1095 for (d = s; isALNUM(*d); d++) ;
1096 strncpy(tokenbuf,s,d-s);
1097 tokenbuf[d-s] = '\0';
1098 if (!keyword(tokenbuf, d - s))
1099 s = force_word(s,METHOD);
1103 if (expect == XOPERATOR)
1106 if (isSPACE(*s) || !isSPACE(*bufptr))
1108 OPERATOR('-'); /* unary minus */
1115 if (expect == XOPERATOR)
1120 if (expect == XOPERATOR)
1123 if (isSPACE(*s) || !isSPACE(*bufptr))
1129 if (expect != XOPERATOR) {
1130 s = scan_ident(s, bufend, tokenbuf, TRUE);
1131 force_ident(tokenbuf);
1142 if (expect != XOPERATOR) {
1143 s = scan_ident(s, bufend, tokenbuf, TRUE);
1144 force_ident(tokenbuf);
1163 if (curcop->cop_line < copline)
1164 copline = curcop->cop_line;
1172 if (lex_state == LEX_INTERPNORMAL) {
1173 if (--lex_brackets == 0) {
1174 if (*s != '-' || s[1] != '>')
1175 lex_state = LEX_INTERPEND;
1185 if (expect == XTERM)
1186 OPERATOR(HASHBRACK);
1187 yylval.ival = curcop->cop_line;
1188 if (isSPACE(*s) || *s == '#')
1189 copline = NOLINE; /* invalidate current command line number */
1195 if (lex_state == LEX_INTERPNORMAL) {
1196 if (--lex_brackets == 0) {
1197 if (lex_fakebrack) {
1198 lex_state = LEX_INTERPEND;
1200 return yylex(); /* ignore fake brackets */
1202 if (*s != '-' || s[1] != '>')
1203 lex_state = LEX_INTERPEND;
1214 if (expect == XOPERATOR)
1217 s = scan_ident(s-1, bufend, tokenbuf, TRUE);
1219 force_ident(tokenbuf);
1241 if (in_format == 2 && (tmp == '\n' || s[1] == '\n')) {
1258 if (expect != XOPERATOR) {
1259 if (s[1] != '<' && !index(s,'>'))
1262 s = scan_heredoc(s);
1264 s = scan_inputsymbol(s);
1265 TERM(sublex_start());
1270 SHop(OP_LEFT_SHIFT);
1284 SHop(OP_RIGHT_SHIFT);
1291 if (in_format && expect == XOPERATOR)
1292 OPERATOR(','); /* grandfather non-comma-format format */
1293 if (s[1] == '#' && (isALPHA(s[2]) || s[2] == '_')) {
1294 s = scan_ident(s+1, bufend, tokenbuf, FALSE);
1295 force_ident(tokenbuf);
1298 s = scan_ident(s, bufend, tokenbuf, FALSE);
1300 force_ident(tokenbuf);
1304 if (lex_state == LEX_NORMAL &&
1308 oldoldbufptr < bufptr)
1311 while (isSPACE(*oldoldbufptr))
1313 if (*oldoldbufptr == 'p' && strnEQ(oldoldbufptr,"print",5)) {
1314 if (index("&*<%", *s) && isIDFIRST(s[1]))
1315 expect = XTERM; /* e.g. print $fh &sub */
1316 else if (*s == '.' && isDIGIT(s[1]))
1317 expect = XTERM; /* e.g. print $fh .3 */
1318 else if (index("/?-+", *s) && !isSPACE(s[1]))
1319 expect = XTERM; /* e.g. print $fh -1 */
1325 s = scan_ident(s, bufend, tokenbuf, FALSE);
1327 force_ident(tokenbuf);
1332 case '/': /* may either be division or pattern */
1333 case '?': /* may either be conditional or pattern */
1334 if (expect != XOPERATOR) {
1337 TERM(sublex_start());
1345 if (in_format == 2) {
1349 if (expect == XOPERATOR || !isDIGIT(s[1])) {
1355 yylval.ival = OPf_SPECIAL;
1361 if (expect != XOPERATOR)
1366 case '0': case '1': case '2': case '3': case '4':
1367 case '5': case '6': case '7': case '8': case '9':
1372 if (in_format && expect == XOPERATOR)
1373 OPERATOR(','); /* grandfather non-comma-format format */
1376 fatal("EOF in string");
1377 yylval.ival = OP_CONST;
1378 TERM(sublex_start());
1381 if (in_format && expect == XOPERATOR)
1382 OPERATOR(','); /* grandfather non-comma-format format */
1385 fatal("EOF in string");
1386 yylval.ival = OP_SCALAR;
1387 TERM(sublex_start());
1392 fatal("EOF in backticks");
1393 yylval.ival = OP_BACKTICK;
1395 TERM(sublex_start());
1402 if (isDIGIT(s[1]) && expect == XOPERATOR) {
1440 switch (tmp = keyword(tokenbuf, d - tokenbuf)) {
1442 default: /* not a keyword */
1444 while (*s == '\'' && isIDFIRST(s[1])) {
1448 if (expect == XBLOCK) { /* special case: start of statement */
1449 yylval.pval = savestr(tokenbuf);
1450 while (isSPACE(*s)) s++;
1458 if (oldoldbufptr && oldoldbufptr < bufptr) {
1459 if (oldoldbufptr == last_lop) {
1462 yylval.opval = (OP*)newSVOP(OP_CONST, 0,
1463 newSVpv(tokenbuf,0));
1464 yylval.opval->op_private = OPpCONST_BARE;
1465 for (d = tokenbuf; *d && isLOWER(*d); d++) ;
1468 "\"%s\" may clash with future reserved word",
1473 while (s < bufend && isSPACE(*s))
1478 nextval[nexttoke].opval = (OP*)newSVOP(OP_CONST, 0, newSVpv(tokenbuf,0));
1479 nextval[nexttoke].opval->op_private = OPpCONST_BARE;
1481 LOP( OP_ENTERSUBR );
1485 yylval.opval = (OP*)newSVOP(OP_CONST, 0, newSVpv(tokenbuf,0));
1486 yylval.opval->op_private = OPpCONST_BARE;
1488 if (*s == '$' || *s == '{')
1491 for (d = tokenbuf; *d && isLOWER(*d); d++) ;
1494 "\"%s\" may clash with future reserved word",
1499 case KEY___FILE__: {
1500 if (tokenbuf[2] == 'L')
1501 (void)sprintf(tokenbuf,"%ld",(long)curcop->cop_line);
1503 strcpy(tokenbuf, SvPV(GvSV(curcop->cop_filegv)));
1504 yylval.opval = (OP*)newSVOP(OP_CONST, 0, newSVpv(tokenbuf,0));
1513 if (!in_eval && (gv = gv_fetchpv("DATA",FALSE))) {
1517 GvIO(gv)->ifp = rsfp;
1518 #if defined(HAS_FCNTL) && defined(FFt_SETFD)
1520 fcntl(fd,FFt_SETFD,fd >= 3);
1523 GvIO(gv)->type = '|';
1524 else if ((FILE*)rsfp == stdin)
1525 GvIO(gv)->type = '-';
1527 GvIO(gv)->type = '<';
1536 if (minus_p || minus_n || *s == '{' ) {
1537 nextval[nexttoke].opval =
1538 (OP*)newSVOP(OP_CONST, 0, newSVpv(tokenbuf,0));
1569 (void)gv_fetchpv("ENV",TRUE); /* may use HOME */
1611 s = force_word(s,WORD);
1636 yylval.ival = curcop->cop_line;
1646 allgvs = TRUE; /* must initialize everything since */
1648 expect = (*s == '{') ? XBLOCK : XTERM;
1649 UNIBRACK(OP_ENTEREVAL); /* we don't know what will be used */
1664 case KEY_endhostent:
1670 case KEY_endservent:
1673 case KEY_endprotoent:
1684 yylval.ival = curcop->cop_line;
1685 while (s < bufend && isSPACE(*s))
1688 fatal("Missing $ on loop variable");
1730 case KEY_getpriority:
1731 LOP(OP_GETPRIORITY);
1733 case KEY_getprotobyname:
1736 case KEY_getprotobynumber:
1739 case KEY_getprotoent:
1751 case KEY_getpeername:
1752 UNI(OP_GETPEERNAME);
1754 case KEY_gethostbyname:
1757 case KEY_gethostbyaddr:
1760 case KEY_gethostent:
1763 case KEY_getnetbyname:
1766 case KEY_getnetbyaddr:
1772 case KEY_getservbyname:
1775 case KEY_getservbyport:
1778 case KEY_getservent:
1781 case KEY_getsockname:
1782 UNI(OP_GETSOCKNAME);
1784 case KEY_getsockopt:
1803 yylval.ival = curcop->cop_line;
1862 TERM(sublex_start());
1898 checkcomma(s,tokenbuf,"filehandle");
1902 checkcomma(s,tokenbuf,"filehandle");
1915 s = force_word(s,WORD);
1924 fatal("EOF in string");
1925 yylval.ival = OP_CONST;
1926 TERM(sublex_start());
1931 fatal("EOF in string");
1932 yylval.ival = OP_SCALAR;
1933 if (SvSTORAGE(lex_stuff) == '\'')
1934 SvSTORAGE(lex_stuff) = 0; /* qq'$foo' should interpolate */
1935 TERM(sublex_start());
1940 fatal("EOF in string");
1941 yylval.ival = OP_BACKTICK;
1943 TERM(sublex_start());
1949 allgvs = TRUE; /* must initialize everything since */
1950 UNI(OP_REQUIRE); /* we don't know what will be used */
1994 TERM(sublex_start());
1996 TOKEN(1); /* force error */
2022 case KEY_setpriority:
2023 LOP(OP_SETPRIORITY);
2025 case KEY_sethostent:
2031 case KEY_setservent:
2034 case KEY_setprotoent:
2046 case KEY_setsockopt:
2076 case KEY_socketpair:
2080 checkcomma(s,tokenbuf,"subroutine name");
2082 if (*s == ';' || *s == ')') /* probably a close */
2083 fatal("sort is now a reserved word");
2084 if (isIDFIRST(*s)) {
2086 for (d = s; isALNUM(*d); d++) ;
2087 strncpy(tokenbuf,s,d-s);
2088 tokenbuf[d-s] = '\0';
2089 if (!keyword(tokenbuf, d - s) || strEQ(tokenbuf,"reverse"))
2090 s = force_word(s,WORD);
2121 yylval.ival = savestack_ix; /* restore stuff on reduce */
2128 av_push(comppad, Nullsv);
2129 curpad = AvARRAY(comppad);
2132 subline = curcop->cop_line;
2134 if (isIDFIRST(*s) || *s == '\'') {
2135 sv_setsv(subname,curstname);
2136 sv_catpvn(subname,"'",1);
2137 for (d = s+1; isALNUM(*d) || *d == '\''; d++)
2142 sv_catpvn(subname,s,d-s);
2143 s = force_word(s,WORD);
2146 sv_setpv(subname,"?");
2173 TERM(sublex_start());
2197 yylval.ival = curcop->cop_line;
2201 yylval.ival = curcop->cop_line;
2230 yylval.ival = curcop->cop_line;
2249 if (expect == XOPERATOR)
2256 TERM(sublex_start());
2269 if (strEQ(d,"__LINE__")) return KEY___LINE__;
2270 if (strEQ(d,"__FILE__")) return KEY___FILE__;
2271 if (strEQ(d,"__END__")) return KEY___END__;
2275 if (strEQ(d,"alarm")) return KEY_alarm;
2276 if (strEQ(d,"accept")) return KEY_accept;
2277 if (strEQ(d,"atan2")) return KEY_atan2;
2280 if (strEQ(d,"BEGIN")) return KEY_BEGIN;
2282 if (strEQ(d,"bless")) return KEY_bless;
2283 if (strEQ(d,"bind")) return KEY_bind;
2284 if (strEQ(d,"binmode")) return KEY_binmode;
2289 if (strEQ(d,"cmp")) return KEY_cmp;
2290 if (strEQ(d,"cos")) return KEY_cos;
2293 if (strEQ(d,"chop")) return KEY_chop;
2296 if (strEQ(d,"close")) return KEY_close;
2297 if (strEQ(d,"chdir")) return KEY_chdir;
2298 if (strEQ(d,"chmod")) return KEY_chmod;
2299 if (strEQ(d,"chown")) return KEY_chown;
2300 if (strEQ(d,"crypt")) return KEY_crypt;
2303 if (strEQ(d,"chroot")) return KEY_chroot;
2304 if (strEQ(d,"caller")) return KEY_caller;
2307 if (strEQ(d,"connect")) return KEY_connect;
2310 if (strEQ(d,"closedir")) return KEY_closedir;
2311 if (strEQ(d,"continue")) return KEY_continue;
2318 if (strEQ(d,"do")) return KEY_do;
2321 if (strEQ(d,"die")) return KEY_die;
2324 if (strEQ(d,"dump")) return KEY_dump;
2327 if (strEQ(d,"delete")) return KEY_delete;
2330 if (strEQ(d,"defined")) return KEY_defined;
2331 if (strEQ(d,"dbmopen")) return KEY_dbmopen;
2334 if (strEQ(d,"dbmclose")) return KEY_dbmclose;
2339 if (strEQ(d,"EQ")) return KEY_eq;
2340 if (strEQ(d,"END")) return KEY_END;
2345 if (strEQ(d,"eq")) return KEY_eq;
2348 if (strEQ(d,"eof")) return KEY_eof;
2349 if (strEQ(d,"exp")) return KEY_exp;
2352 if (strEQ(d,"else")) return KEY_else;
2353 if (strEQ(d,"exit")) return KEY_exit;
2354 if (strEQ(d,"eval")) return KEY_eval;
2355 if (strEQ(d,"exec")) return KEY_exec;
2356 if (strEQ(d,"each")) return KEY_each;
2359 if (strEQ(d,"elsif")) return KEY_elsif;
2362 if (strEQ(d,"endgrent")) return KEY_endgrent;
2363 if (strEQ(d,"endpwent")) return KEY_endpwent;
2366 if (strEQ(d,"endnetent")) return KEY_endnetent;
2369 if (strEQ(d,"endhostent")) return KEY_endhostent;
2370 if (strEQ(d,"endservent")) return KEY_endservent;
2373 if (strEQ(d,"endprotoent")) return KEY_endprotoent;
2380 if (strEQ(d,"for")) return KEY_for;
2383 if (strEQ(d,"fork")) return KEY_fork;
2386 if (strEQ(d,"fcntl")) return KEY_fcntl;
2387 if (strEQ(d,"flock")) return KEY_flock;
2390 if (strEQ(d,"format")) return KEY_format;
2391 if (strEQ(d,"fileno")) return KEY_fileno;
2394 if (strEQ(d,"foreach")) return KEY_foreach;
2397 if (strEQ(d,"formline")) return KEY_formline;
2403 if (strEQ(d,"GT")) return KEY_gt;
2404 if (strEQ(d,"GE")) return KEY_ge;
2408 if (strnEQ(d,"get",3)) {
2413 if (strEQ(d,"ppid")) return KEY_getppid;
2414 if (strEQ(d,"pgrp")) return KEY_getpgrp;
2417 if (strEQ(d,"pwent")) return KEY_getpwent;
2418 if (strEQ(d,"pwnam")) return KEY_getpwnam;
2419 if (strEQ(d,"pwuid")) return KEY_getpwuid;
2422 if (strEQ(d,"peername")) return KEY_getpeername;
2423 if (strEQ(d,"protoent")) return KEY_getprotoent;
2424 if (strEQ(d,"priority")) return KEY_getpriority;
2427 if (strEQ(d,"protobyname")) return KEY_getprotobyname;
2430 if (strEQ(d,"protobynumber"))return KEY_getprotobynumber;
2434 else if (*d == 'h') {
2435 if (strEQ(d,"hostbyname")) return KEY_gethostbyname;
2436 if (strEQ(d,"hostbyaddr")) return KEY_gethostbyaddr;
2437 if (strEQ(d,"hostent")) return KEY_gethostent;
2439 else if (*d == 'n') {
2440 if (strEQ(d,"netbyname")) return KEY_getnetbyname;
2441 if (strEQ(d,"netbyaddr")) return KEY_getnetbyaddr;
2442 if (strEQ(d,"netent")) return KEY_getnetent;
2444 else if (*d == 's') {
2445 if (strEQ(d,"servbyname")) return KEY_getservbyname;
2446 if (strEQ(d,"servbyport")) return KEY_getservbyport;
2447 if (strEQ(d,"servent")) return KEY_getservent;
2448 if (strEQ(d,"sockname")) return KEY_getsockname;
2449 if (strEQ(d,"sockopt")) return KEY_getsockopt;
2451 else if (*d == 'g') {
2452 if (strEQ(d,"grent")) return KEY_getgrent;
2453 if (strEQ(d,"grnam")) return KEY_getgrnam;
2454 if (strEQ(d,"grgid")) return KEY_getgrgid;
2456 else if (*d == 'l') {
2457 if (strEQ(d,"login")) return KEY_getlogin;
2463 if (strEQ(d,"gt")) return KEY_gt;
2464 if (strEQ(d,"ge")) return KEY_ge;
2467 if (strEQ(d,"grep")) return KEY_grep;
2468 if (strEQ(d,"goto")) return KEY_goto;
2469 if (strEQ(d,"getc")) return KEY_getc;
2472 if (strEQ(d,"gmtime")) return KEY_gmtime;
2477 if (strEQ(d,"hex")) return KEY_hex;
2482 if (strEQ(d,"if")) return KEY_if;
2485 if (strEQ(d,"int")) return KEY_int;
2488 if (strEQ(d,"index")) return KEY_index;
2489 if (strEQ(d,"ioctl")) return KEY_ioctl;
2494 if (strEQ(d,"join")) return KEY_join;
2498 if (strEQ(d,"keys")) return KEY_keys;
2499 if (strEQ(d,"kill")) return KEY_kill;
2504 if (strEQ(d,"LT")) return KEY_lt;
2505 if (strEQ(d,"LE")) return KEY_le;
2511 if (strEQ(d,"lt")) return KEY_lt;
2512 if (strEQ(d,"le")) return KEY_le;
2513 if (strEQ(d,"lc")) return KEY_lc;
2516 if (strEQ(d,"log")) return KEY_log;
2519 if (strEQ(d,"last")) return KEY_last;
2520 if (strEQ(d,"link")) return KEY_link;
2523 if (strEQ(d,"local")) return KEY_local;
2524 if (strEQ(d,"lstat")) return KEY_lstat;
2527 if (strEQ(d,"length")) return KEY_length;
2528 if (strEQ(d,"listen")) return KEY_listen;
2531 if (strEQ(d,"lcfirst")) return KEY_lcfirst;
2534 if (strEQ(d,"localtime")) return KEY_localtime;
2540 case 1: return KEY_m;
2542 if (strEQ(d,"mkdir")) return KEY_mkdir;
2545 if (strEQ(d,"msgctl")) return KEY_msgctl;
2546 if (strEQ(d,"msgget")) return KEY_msgget;
2547 if (strEQ(d,"msgrcv")) return KEY_msgrcv;
2548 if (strEQ(d,"msgsnd")) return KEY_msgsnd;
2553 if (strEQ(d,"NE")) return KEY_ne;
2556 if (strEQ(d,"next")) return KEY_next;
2557 if (strEQ(d,"ne")) return KEY_ne;
2562 if (strEQ(d,"ord")) return KEY_ord;
2563 if (strEQ(d,"oct")) return KEY_oct;
2566 if (strEQ(d,"open")) return KEY_open;
2569 if (strEQ(d,"opendir")) return KEY_opendir;
2576 if (strEQ(d,"pop")) return KEY_pop;
2579 if (strEQ(d,"push")) return KEY_push;
2580 if (strEQ(d,"pack")) return KEY_pack;
2581 if (strEQ(d,"pipe")) return KEY_pipe;
2584 if (strEQ(d,"print")) return KEY_print;
2587 if (strEQ(d,"printf")) return KEY_printf;
2590 if (strEQ(d,"package")) return KEY_package;
2596 if (strEQ(d,"q")) return KEY_q;
2597 if (strEQ(d,"qq")) return KEY_qq;
2598 if (strEQ(d,"qx")) return KEY_qx;
2604 if (strEQ(d,"ref")) return KEY_ref;
2607 if (strEQ(d,"read")) return KEY_read;
2608 if (strEQ(d,"rand")) return KEY_rand;
2609 if (strEQ(d,"recv")) return KEY_recv;
2610 if (strEQ(d,"redo")) return KEY_redo;
2613 if (strEQ(d,"rmdir")) return KEY_rmdir;
2614 if (strEQ(d,"reset")) return KEY_reset;
2617 if (strEQ(d,"return")) return KEY_return;
2618 if (strEQ(d,"rename")) return KEY_rename;
2619 if (strEQ(d,"rindex")) return KEY_rindex;
2622 if (strEQ(d,"require")) return KEY_require;
2623 if (strEQ(d,"reverse")) return KEY_reverse;
2624 if (strEQ(d,"readdir")) return KEY_readdir;
2627 if (strEQ(d,"readlink")) return KEY_readlink;
2630 if (strEQ(d,"rewinddir")) return KEY_rewinddir;
2636 case 0: return KEY_s;
2638 if (strEQ(d,"scalar")) return KEY_scalar;
2643 if (strEQ(d,"seek")) return KEY_seek;
2644 if (strEQ(d,"send")) return KEY_send;
2647 if (strEQ(d,"semop")) return KEY_semop;
2650 if (strEQ(d,"select")) return KEY_select;
2651 if (strEQ(d,"semctl")) return KEY_semctl;
2652 if (strEQ(d,"semget")) return KEY_semget;
2655 if (strEQ(d,"setpgrp")) return KEY_setpgrp;
2656 if (strEQ(d,"seekdir")) return KEY_seekdir;
2659 if (strEQ(d,"setpwent")) return KEY_setpwent;
2660 if (strEQ(d,"setgrent")) return KEY_setgrent;
2663 if (strEQ(d,"setnetent")) return KEY_setnetent;
2666 if (strEQ(d,"setsockopt")) return KEY_setsockopt;
2667 if (strEQ(d,"sethostent")) return KEY_sethostent;
2668 if (strEQ(d,"setservent")) return KEY_setservent;
2671 if (strEQ(d,"setpriority")) return KEY_setpriority;
2672 if (strEQ(d,"setprotoent")) return KEY_setprotoent;
2679 if (strEQ(d,"shift")) return KEY_shift;
2682 if (strEQ(d,"shmctl")) return KEY_shmctl;
2683 if (strEQ(d,"shmget")) return KEY_shmget;
2686 if (strEQ(d,"shmread")) return KEY_shmread;
2689 if (strEQ(d,"shmwrite")) return KEY_shmwrite;
2690 if (strEQ(d,"shutdown")) return KEY_shutdown;
2695 if (strEQ(d,"sin")) return KEY_sin;
2698 if (strEQ(d,"sleep")) return KEY_sleep;
2701 if (strEQ(d,"sort")) return KEY_sort;
2702 if (strEQ(d,"socket")) return KEY_socket;
2703 if (strEQ(d,"socketpair")) return KEY_socketpair;
2706 if (strEQ(d,"split")) return KEY_split;
2707 if (strEQ(d,"sprintf")) return KEY_sprintf;
2708 if (strEQ(d,"splice")) return KEY_splice;
2711 if (strEQ(d,"sqrt")) return KEY_sqrt;
2714 if (strEQ(d,"srand")) return KEY_srand;
2717 if (strEQ(d,"stat")) return KEY_stat;
2718 if (strEQ(d,"study")) return KEY_study;
2721 if (strEQ(d,"substr")) return KEY_substr;
2722 if (strEQ(d,"sub")) return KEY_sub;
2727 if (strEQ(d,"system")) return KEY_system;
2730 if (strEQ(d,"sysread")) return KEY_sysread;
2731 if (strEQ(d,"symlink")) return KEY_symlink;
2732 if (strEQ(d,"syscall")) return KEY_syscall;
2735 if (strEQ(d,"syswrite")) return KEY_syswrite;
2744 if (strEQ(d,"tr")) return KEY_tr;
2747 if (strEQ(d,"tell")) return KEY_tell;
2748 if (strEQ(d,"time")) return KEY_time;
2751 if (strEQ(d,"times")) return KEY_times;
2754 if (strEQ(d,"telldir")) return KEY_telldir;
2757 if (strEQ(d,"truncate")) return KEY_truncate;
2764 if (strEQ(d,"uc")) return KEY_uc;
2767 if (strEQ(d,"undef")) return KEY_undef;
2768 if (strEQ(d,"until")) return KEY_until;
2769 if (strEQ(d,"utime")) return KEY_utime;
2770 if (strEQ(d,"umask")) return KEY_umask;
2773 if (strEQ(d,"unless")) return KEY_unless;
2774 if (strEQ(d,"unpack")) return KEY_unpack;
2775 if (strEQ(d,"unlink")) return KEY_unlink;
2778 if (strEQ(d,"unshift")) return KEY_unshift;
2779 if (strEQ(d,"ucfirst")) return KEY_ucfirst;
2784 if (strEQ(d,"values")) return KEY_values;
2785 if (strEQ(d,"vec")) return KEY_vec;
2790 if (strEQ(d,"warn")) return KEY_warn;
2791 if (strEQ(d,"wait")) return KEY_wait;
2794 if (strEQ(d,"while")) return KEY_while;
2795 if (strEQ(d,"write")) return KEY_write;
2798 if (strEQ(d,"waitpid")) return KEY_waitpid;
2801 if (strEQ(d,"wantarray")) return KEY_wantarray;
2806 if (len == 1) return KEY_x;
2809 if (len == 1) return KEY_y;
/*
 * checkcomma(s,name,what): checks the text that follows a list operator
 * name.  Only part of the routine is present in this excerpt (loop bodies
 * and declarations are missing), so the notes below describe just what
 * the visible statements establish.
 */
2818 checkcomma(s,name,what)
/* With warnings enabled (dowarn) and the text at s being a space followed
 * by an opening paren, advance w over whitespace and warn unless the
 * character it stops on is one of ; | or }. */
2825 if (dowarn && *s == ' ' && s[1] == '(') {
2828 for (w++; *w && isSPACE(*w); w++) ;
2829 if (!w || !*w || !index(";|}", *w)) /* an advisory hack only... */
2830 warn("%s (...) interpreted as function",name);
/* Whitespace tests bounded by bufend; the loop bodies are not part of
 * this excerpt. */
2832 while (s < bufend && isSPACE(*s))
2836 while (s < bufend && isSPACE(*s))
/* Branch taken when s sits on a character that may start an identifier. */
2838 if (isIDFIRST(*s)) {
2842 while (s < bufend && isSPACE(*s))
/* The literal below is one space-separated word list continued over two
 * source lines with a backslash.  NOTE(review): presumably these are
 * operator names exempt from the comma check -- the call that consumes
 * the list is not visible here; confirm against the full file. */
2847 "tell eof times getlogin wait length shift umask getppid \
2848 cos exp int log rand sin sqrt ord wantarray",
/* Fatal error; the caller-supplied what string is placed in the message. */
2853 fatal("No comma allowed after %s", what);
/*
 * scan_ident(s,send,dest,ck_uni): scans a variable name starting at s.
 * The visible statements use d and dest as output pointers and update
 * the lexer state variables lex_state and lex_fakebrack.  Declarations
 * and several statements are missing from this excerpt.
 */
2859 scan_ident(s,send,dest,ck_uni)
2861 register char *send;
2868 if (lex_brackets == 0)
/* Name characters are alphanumerics plus the single quote. */
2877 while (isALNUM(*s) || *s == '\'')
/* Examines trailing single quotes in the output, never backing up past
 * dest+1.  NOTE(review): the loop body is not shown; presumably it
 * un-reads those quotes. */
2880 while (d > dest+1 && d[-1] == '\'')
/* Any lexer state other than LEX_NORMAL becomes LEX_INTERPENDMAYBE. */
2885 if (lex_state != LEX_NORMAL)
2886 lex_state = LEX_INTERPENDMAYBE;
/* Tail of a condition begun on a line outside this excerpt: a dollar
 * sign followed by a letter, another dollar sign, or an underscore. */
2890 (*s == '$' && (isALPHA(s[1]) || s[1] == '$' || s[1] == '_')))
/* A caret in the output followed by an uppercase letter or one of the
 * characters [ \ ] ^ _ ? is handled specially (body not shown). */
2901 if (*d == '^' && (isUPPER(*s) || index("[\\]^_?", *s))) {
/* The collected name starts with a letter or underscore. */
2907 if (isALPHA(*d) || *d == '_') {
/* A subscript opener directly after the name.  The guard for the fatal
 * call below is on a line not present in this excerpt. */
2912 if (*s == '[' || *s == '{') {
2914 fatal("Can't use delimiter brackets within expression");
2915 lex_fakebrack = TRUE;
/* When interpolating with no open brackets, mark the end of the
 * interpolated variable. */
2923 if (lex_state == LEX_INTERPNORMAL && !lex_brackets)
2924 lex_state = LEX_INTERPEND;
2927 s = bracket; /* let the parser handle it */
/* Same state change, additionally requiring that intuit_more(s) be false. */
2931 else if (lex_state == LEX_INTERPNORMAL && !lex_brackets && !intuit_more(s))
2932 lex_state = LEX_INTERPEND;
/*
 * scan_prefix(pm,string,len): derives a literal string from the pattern
 * text in string (len bytes) and stores it on the pattern op as
 * op_pmshort, with its length in op_pmslen.  Parts of the routine are
 * missing from this excerpt.
 */
2937 scan_prefix(pm,string,len)
2942 register SV *tmpstr;
/* Remember the start of the pattern for the anchor test near the end. */
2946 char *origstring = string;
/* Looks for the one-character sequence at vert inside the pattern.
 * NOTE(review): vert presumably holds a vertical bar; its definition and
 * the action taken on a hit are not visible here. */
2948 if (ninstr(string, string+len, vert, vert+1))
/* Working copy of the pattern, upgraded to type SVt_PVBM. */
2952 tmpstr = NEWSV(86,len);
2953 sv_upgrade(tmpstr, SVt_PVBM);
2954 sv_setpvn(tmpstr,string,len);
2957 BmUSEFUL(tmpstr) = 100;
/* Walk the copy from t to e; d is advanced inside the body. */
2958 for (d=t; d < e; ) {
/* Regular expression metacharacters. */
2966 case '.': case '[': case '$': case '(': case ')': case '|': case '+':
/* Next character is one of the listed escape letters or a digit. */
2971 if (d[1] && index("wWbB0123456789sSdDlLuUExc",d[1])) {
/* Shift the remainder of the buffer down by one character. */
2975 Move(d+1,d,e-d,char);
/* Next character is followed by a star, a brace-zero, or a question mark.
 * NOTE(review): presumably because such a quantifier makes the character
 * optional -- the body is not shown. */
3000 if (d[1] == '*' || (d[1] == '{' && d[2] == '0') || d[1] == '?') {
/* Cut the copy off at the point the scan reached. */
3012 SvCUR_set(tmpstr, d - t);
/* NOTE(review): the condition guarding PMf_ALL is not in this excerpt. */
3014 pm->op_pmflags |= PMf_ALL;
/* A pattern that does not begin with a caret gets PMf_SCANFIRST. */
3015 if (*origstring != '^')
3016 pm->op_pmflags |= PMf_SCANFIRST;
3017 pm->op_pmshort = tmpstr;
3018 pm->op_pmslen = d - t;
/*
 * Match pattern scanner (the function header lies outside this excerpt).
 * Reads the delimited pattern with scan_str, builds an OP_MATCH pattern
 * op, applies trailing modifier letters, and reports OP_MATCH through
 * yylval.ival.
 */
/* Record the line on which the construct starts. */
3028 multi_start = curcop->cop_line;
3030 s = scan_str(start);
/* NOTE(review): the test guarding this fatal call is not shown;
 * presumably a failed scan_str. */
3035 fatal("Search pattern not terminated");
3037 pm = (PMOP*)newPMOP(OP_MATCH, 0);
/* NOTE(review): the condition under which PMf_ONCE is set is not shown. */
3039 pm->op_pmflags |= PMf_ONCE;
/* Consume modifier letters i, o and g.  The case labels are missing from
 * this excerpt; presumably they map to FOLD, KEEP and GLOBAL in that
 * order. */
3041 while (*s == 'i' || *s == 'o' || *s == 'g') {
3045 pm->op_pmflags |= PMf_FOLD;
3049 pm->op_pmflags |= PMf_KEEP;
3053 pm->op_pmflags |= PMf_GLOBAL;
3058 yylval.ival = OP_MATCH;
/*
 * Substitution scanner (the function header lies outside this excerpt).
 * Scans the pattern and replacement parts, builds an OP_SUBST pattern
 * op, applies trailing modifier letters, and reports OP_SUBST through
 * yylval.ival.
 */
3066 register char *s = start;
/* Record the starting line; yylval.ival is OP_NULL until the end. */
3070 multi_start = curcop->cop_line;
3071 yylval.ival = OP_NULL;
3079 fatal("Substitution pattern not terminated");
/* True when the character just before s equals the opening delimiter.
 * NOTE(review): the statement this guards is not shown. */
3082 if (s[-1] == *start)
3093 fatal("Substitution replacement not terminated");
3096 pm = (PMOP*)newPMOP(OP_SUBST, 0);
/* Consume modifier letters g, i, e and o.  The case labels are missing;
 * presumably they map to GLOBAL, FOLD, EVAL and KEEP respectively. */
3097 while (*s == 'g' || *s == 'i' || *s == 'e' || *s == 'o') {
3104 pm->op_pmflags |= PMf_GLOBAL;
3109 pm->op_pmflags |= PMf_FOLD;
3113 pm->op_pmflags |= PMf_KEEP;
3119 pm->op_pmflags |= PMf_EVAL;
/* Build replacement source text in repl: the word eval, an opening
 * brace, the saved replacement lex_repl, then a closing brace. */
3123 sv_catpvn(repl, "eval ", 5);
3125 sv_catpvn(repl, "{ ", 2);
3126 sv_catsv(repl, lex_repl);
/* NOTE(review): the literal below is three characters but the count is 2,
 * so if the last argument is a byte count (as the two calls above
 * suggest) the semicolon is never appended.  Confirm whether intended. */
3127 sv_catpvn(repl, " };", 2);
3128 SvCOMPILED_on(repl);
3134 yylval.ival = OP_SUBST;
/*
 * Pattern short-string selection (the function header lies outside this
 * excerpt).  Chooses which of the compiled regexp strings, regstart or
 * regmust, becomes the op_pmshort string on pm, and sets PMf_SCANFIRST
 * to match.  Some statements are missing from this excerpt.
 */
/* No short string yet, a regstart exists, and either there is no regmust
 * or the regexp has the ROPT_ANCH bit set. */
3142 if (!pm->op_pmshort && pm->op_pmregexp->regstart &&
3143 (!pm->op_pmregexp->regmust || pm->op_pmregexp->reganch & ROPT_ANCH)
/* Without the ROPT_ANCH bit the string gets PMf_SCANFIRST. */
3145 if (!(pm->op_pmregexp->reganch & ROPT_ANCH))
3146 pm->op_pmflags |= PMf_SCANFIRST;
/* NOTE(review): the statement run for the PMf_FOLD case is not shown. */
3147 else if (pm->op_pmflags & PMf_FOLD)
/* Use regstart as the short string, obtained through sv_ref. */
3149 pm->op_pmshort = sv_ref(pm->op_pmregexp->regstart);
3151 else if (pm->op_pmregexp->regmust) {/* is there a better short-circuit? */
/* Short string and regmust have equal contents, so one is redundant. */
3152 if (pm->op_pmshort &&
3153 sv_eq(pm->op_pmshort,pm->op_pmregexp->regmust))
/* With PMf_SCANFIRST set, the short string is the one released. */
3155 if (pm->op_pmflags & PMf_SCANFIRST) {
3156 sv_free(pm->op_pmshort);
3157 pm->op_pmshort = Nullsv;
/* NOTE(review): presumably the other branch, releasing regmust instead;
 * the else line is not in this excerpt. */
3160 sv_free(pm->op_pmregexp->regmust);
3161 pm->op_pmregexp->regmust = Nullsv;
/* Move regmust into op_pmshort when there is no short string, or when
 * PMf_SCANFIRST is set and regmust is the longer of the two. */
3165 if (!pm->op_pmshort || /* promote the better string */
3166 ((pm->op_pmflags & PMf_SCANFIRST) &&
3167 (SvCUR(pm->op_pmshort) < SvCUR(pm->op_pmregexp->regmust)) )){
3168 sv_free(pm->op_pmshort); /* ok if null */
3169 pm->op_pmshort = pm->op_pmregexp->regmust;
3170 pm->op_pmregexp->regmust = Nullsv;
3171 pm->op_pmflags |= PMf_SCANFIRST;
/*
 * Translation scanner (the function header lies outside this excerpt).
 * Scans the search and replacement lists, allocates the translation
 * table, builds an OP_TRANS op, records modifier letters in op_private,
 * and reports OP_TRANS through yylval.ival.
 */
3180 register char *s = start;
/* yylval.ival is OP_NULL until the end of the routine. */
3187 yylval.ival = OP_NULL;
3194 fatal("Translation pattern not terminated");
/* True when the character just before s equals the opening delimiter.
 * NOTE(review): the statement this guards is not shown. */
3196 if (s[-1] == *start)
/* NOTE(review): scan_str is called with one argument elsewhere in this
 * file and with two here; confirm which signature is current. */
3199 s = scan_str(s, SCAN_TR|SCAN_REPL);
3207 fatal("Translation replacement not terminated");
/* Table of 256 shorts, handed to the new op as its pointer payload. */
3210 New(803,tbl,256,short);
3211 op = newPVOP(OP_TRANS, 0, (char*)tbl);
/* Consume modifier letters c, d and s.  The case labels are missing;
 * presumably they map to complement, delete and squash respectively. */
3213 complement = delete = squash = 0;
3214 while (*s == 'c' || *s == 'd' || *s == 's') {
3216 complement = OPpTRANS_COMPLEMENT;
3218 delete = OPpTRANS_DELETE;
3220 squash = OPpTRANS_SQUASH;
/* Combine the three modifier bits into the private flags of the op. */
3223 op->op_private = delete|squash|complement;
3226 yylval.ival = OP_TRANS;
/*
 * Here-document scanner (the function header lies outside this excerpt).
 * Collects text into tmpstr until a line that begins with the terminator
 * held in tokenbuf (len bytes), reading further lines from rsfp when the
 * current buffer runs out.  The resulting op type is reported through
 * yylval.ival.
 */
/* Default result type; changed to OP_BACKTICK further down. */
3235 I32 op_type = OP_SCALAR;
/* The terminator is written with one of three quote characters:
 * backtick, single quote, or double quote. */
3245 if (*s && index("`'\"",*s)) {
/* Copy text up to the character term into d, storing its length in len. */
3247 s = cpytill(d,s,bufend,term,&len);
3259 } /* assuming tokenbuf won't clobber */
/* Save the remainder of the current line in herewas: all of it up to
 * bufend when reading from a file or when the ninstr search fails,
 * otherwise only up to the match at d. */
3264 if (rsfp || !(d=ninstr(s,bufend,d,d+1)))
3265 herewas = newSVpv(s,bufend-s);
3267 s--, herewas = newSVpv(s,d-s);
3268 s += SvCUR(herewas);
/* NOTE(review): the condition is not shown; presumably a backtick
 * terminator. */
3272 op_type = OP_BACKTICK;
/* Record the start line and use the less-than sign as both delimiters. */
3275 multi_start = curcop->cop_line;
3276 multi_open = multi_close = '<';
3277 tmpstr = NEWSV(87,80);
/* Scan within the current buffer for text that begins with the
 * terminator. */
3281 while (s < bufend &&
3282 (*s != term || bcmp(s,tokenbuf,len) != 0) ) {
/* Point the error at the line on which the here-document started. */
3287 curcop->cop_line = multi_start;
3288 fatal("EOF in string");
/* Body found inside the buffer: store it, then make the saved line
 * remainder plus the text after the terminator the new line buffer. */
3290 sv_setpvn(tmpstr,d+1,s-d);
3292 sv_catpvn(herewas,s,bufend-s);
3293 sv_setsv(linestr,herewas);
3294 oldoldbufptr = oldbufptr = bufptr = s = SvPVn(linestr);
3295 bufend = SvPV(linestr) + SvCUR(linestr);
3298 sv_setpvn(tmpstr,"",0); /* avoid "uninitialized" warning */
3299 while (s >= bufend) { /* multiple line string? */
/* Tail of a condition begun on a missing line: fetch the next line into
 * linestr; a null result from sv_gets leads to the fatal error below. */
3301 !(oldoldbufptr = oldbufptr = s = sv_gets(linestr, rsfp, 0))) {
3302 curcop->cop_line = multi_start;
3303 fatal("EOF in string");
/* Store a copy of the line in the array of the current file glob, indexed
 * by line number.  NOTE(review): the guard is not shown; presumably this
 * happens only under the debugger. */
3307 SV *sv = NEWSV(88,0);
3309 sv_setsv(sv,linestr);
3310 av_store(GvAV(curcop->cop_filegv),
3311 (I32)curcop->cop_line,sv);
3313 bufend = SvPV(linestr) + SvCUR(linestr);
/* Terminator line reached: append the saved line remainder to the buffer. */
3314 if (*s == term && bcmp(s,tokenbuf,len) == 0) {
3317 sv_catsv(linestr,herewas);
3318 bufend = SvPV(linestr) + SvCUR(linestr);
/* Otherwise the line is part of the body. */
3322 sv_catsv(tmpstr,linestr);
3325 multi_end = curcop->cop_line;
/* Shrink the buffer to the used length plus one byte when more than five
 * bytes would otherwise be left unused. */
3327 if (SvCUR(tmpstr) + 5 < SvLEN(tmpstr)) {
3328 SvLEN_set(tmpstr, SvCUR(tmpstr) + 1);
3329 Renew(SvPV(tmpstr), SvLEN(tmpstr), char);
3333 yylval.ival = op_type;
/*
 * scan_inputsymbol(start): scans an angle-bracket construct.  Depending
 * on what lies between the brackets it yields either a glob (OP_GLOB) or
 * a prebuilt OP_READLINE tree in lex_op with OP_NULL in yylval.ival.
 * Several lines are missing from this excerpt.
 */
3338 scan_inputsymbol(start)
3341 register char *s = start;
/* Copy the text after the opening bracket, up to the closing one, into d
 * and store its length in len. */
3346 s = cpytill(d, s+1, bufend, '>', &len);
3350 fatal("Unterminated <> operator");
/* Tests for identifier characters, single quote included; the loop body
 * is not shown. */
3353 while (*d && (isALNUM(*d) || *d == '\''))
/* The identifier scan did not cover the whole content, so treat the
 * construct as a glob and rescan it from start with scan_str. */
3355 if (d - tokenbuf != len) {
3356 yylval.ival = OP_GLOB;
3358 s = scan_str(start);
3360 fatal("Glob not terminated");
/* NOTE(review): the condition is not shown; presumably empty brackets
 * default to the ARGV handle. */
3366 (void)strcpy(d,"ARGV");
/* Name looked up from d+1, and the handle is reached through a scalar:
 * READLINE over RV2GV over RV2SV over the glob.  NOTE(review): presumably
 * d[0] is a dollar sign here; the test is not visible. */
3368 GV *gv = gv_fetchpv(d+1,TRUE);
3369 lex_op = (OP*)newUNOP(OP_READLINE, 0,
3370 newUNOP(OP_RV2GV, 0,
3371 newUNOP(OP_RV2SV, 0,
3372 newGVOP(OP_GV, 0, gv))));
3373 yylval.ival = OP_NULL;
/* Plain handle name: READLINE directly over the glob.  The ARGV handle
 * additionally gets the IOf_ARGV and IOf_START flags. */
3378 GV *gv = gv_fetchpv(d,TRUE);
3380 if (strEQ(d,"ARGV")) {
3382 io->flags |= IOf_ARGV|IOf_START;
3384 lex_op = (OP*)newUNOP(OP_READLINE, 0, newGVOP(OP_GV, 0, gv));
3385 yylval.ival = OP_NULL;
/*
 * Delimited string scanner (the function header lies outside this
 * excerpt).  Takes the character at start as the delimiter, appends text
 * to tmpstr up to the terminator, and keeps reading lines from rsfp while
 * the terminator has not been found in the current buffer.
 */
3397 register char *s = start;
3398 register char term = *s;
/* Record the line on which the string starts. */
3401 multi_start = curcop->cop_line;
/* Bracket lookup table: each opener sits five characters before its
 * closer, and each closer five before itself.  NOTE(review): the
 * statement that uses tmps is not shown; presumably it replaces term
 * with the matching closer. */
3403 if (term && (tmps = index("([{< )]}> )]}>",term)))
3407 tmpstr = NEWSV(87,80);
3408 SvSTORAGE(tmpstr) = term;
/* First pass over the rest of the current buffer, skipping the opening
 * delimiter. */
3409 s = sv_append_till(tmpstr, s+1, bufend, term, Nullch);
3411 while (s >= bufend) { /* multiple line string? */
/* Tail of a condition begun on a missing line: fetch the next line into
 * linestr; a null result from sv_gets is the failure case. */
3413 !(oldoldbufptr = oldbufptr = s = sv_gets(linestr, rsfp, 0))) {
/* On failure, restore the starting line number. */
3414 curcop->cop_line = multi_start;
/* Store a copy of the line in the array of the current file glob, indexed
 * by line number.  NOTE(review): the guard is not shown; presumably this
 * happens only under the debugger. */
3419 SV *sv = NEWSV(88,0);
3421 sv_setsv(sv,linestr);
3422 av_store(GvAV(curcop->cop_filegv),
3423 (I32)curcop->cop_line, sv);
/* Continue appending from the freshly read line. */
3425 bufend = SvPV(linestr) + SvCUR(linestr);
3426 s = sv_append_till(tmpstr, s, bufend, term, Nullch);
3428 multi_end = curcop->cop_line;
/* Shrink the buffer to the used length plus one byte when more than five
 * bytes would otherwise be left unused. */
3430 if (SvCUR(tmpstr) + 5 < SvLEN(tmpstr)) {
3431 SvLEN_set(tmpstr, SvCUR(tmpstr) + 1);
3432 Renew(SvPV(tmpstr), SvLEN(tmpstr), char);
/*
 * Numeric literal scanner (the function header lies outside this
 * excerpt; the name scan_num appears in the panic message).  Handles a
 * digit-by-digit integer path with octal and hex digits, and a decimal
 * path converted with atof.  The value is stored in sv and returned as
 * an OP_CONST op through yylval.opval.
 */
3445 register char *s = start;
3454 fatal("panic: scan_num");
3464 else if (s[1] == '.')
3478 yyerror("Illegal octal digit");
/* Digits valid in octal. */
3480 case '0': case '1': case '2': case '3': case '4':
3481 case '5': case '6': case '7':
/* Hex letters in either case. */
3485 case 'a': case 'b': case 'c': case 'd': case 'e': case 'f':
3486 case 'A': case 'B': case 'C': case 'D': case 'E': case 'F':
/* In ASCII the low three bits of a..f and A..F are 1..6, so adding 9
 * yields the digit values 10..15. */
3490 i += (*s++ & 7) + 9;
/* Store as an integer when the value survives the I32 conversion and is
 * non-negative; the double form below is the alternative. */
3497 if (tryi32 == i && tryi32 >= 0)
3498 sv_setiv(sv,tryi32);
3500 sv_setnv(sv,(double)i);
/* Decimal literals: a leading nonzero digit or a dot. */
3503 case '1': case '2': case '3': case '4': case '5':
3504 case '6': case '7': case '8': case '9': case '.':
/* Integer part; underscores are accepted between digits. */
3508 while (isDIGIT(*s) || *s == '_') {
/* A decimal point that is not the first of two consecutive dots. */
3514 if (*s == '.' && s[1] != '.') {
3517 while (isDIGIT(*s) || *s == '_') {
/* Exponent: e or E followed by a sign or a digit. */
3524 if (*s && index("eE",*s) && index("+-0123456789",s[1])) {
3527 *d++ = 'e'; /* At least some Mach atof()s don't grok 'E' */
3528 if (*s == '+' || *s == '-')
/* Convert the text gathered in tokenbuf.  Store as an integer only when
 * floatit is clear and the I32 round trip is exact. */
3535 value = atof(tokenbuf);
3536 tryi32 = (I32)value;
3537 if (!floatit && (double)tryi32 == value)
3538 sv_setiv(sv,tryi32);
3544 yylval.opval = newSVOP(OP_CONST, 0, sv);
/*
 * Format line scanner (the function header lies outside this excerpt).
 * Accumulates format text in stuff, reading further lines as needed, and
 * queues tokens in nextval, including an OP_CONST holding the text and
 * an OP_FORMLINE marker.
 */
3555 SV *stuff = NEWSV(0,0);
3556 bool needargs = FALSE;
/* Advance t past spaces and tabs after the first character at s. */
3561 for (t = s+1; *t == ' ' || *t == '\t'; t++) ;
/* Inside an eval with no file handle, the line ends at the next newline
 * in the buffer. */
3565 if (in_eval && !rsfp) {
3566 eol = index(s,'\n');
/* Line end and bufend are both set to the end of linestr. */
3571 eol = bufend = SvPV(linestr) + SvCUR(linestr);
/* Append the current line to the accumulated format text. */
3573 sv_catpvn(stuff, s, eol-s);
/* Line starts with an at-sign or a caret.  NOTE(review): the body is not
 * shown; presumably it sets needargs. */
3575 if (*s == '@' || *s == '^') {
/* Fetch the next line and reset the buffer pointers to its start. */
3584 s = sv_gets(linestr, rsfp, 0);
3585 oldoldbufptr = oldbufptr = bufptr = SvPVn(linestr);
3588 yyerror("Format not terminated");
/* Queue pending tokens for the parser; the surrounding bookkeeping is
 * not in this excerpt. */
3596 nextval[nexttoke].ival = 0;
3601 nextval[nexttoke].opval = (OP*)newSVOP(OP_CONST, 0, stuff);
3603 nextval[nexttoke].ival = OP_FORMLINE;
3619 cshlen = strlen(cshname);