1 /* $RCSfile: toke.c,v $$Revision: 4.1 $$Date: 92/08/07 18:28:39 $
3 * Copyright (c) 1991, Larry Wall
5 * You may distribute under the terms of either the GNU General Public
6 * License or the Artistic License, as specified in the README file.
9 * Revision 4.1 92/08/07 18:28:39 lwall
11 * Revision 4.0.1.7 92/06/11 21:16:30 lwall
12 * patch34: expect incorrectly set to indicate start of program or block
14 * Revision 4.0.1.6 92/06/08 16:03:49 lwall
15 * patch20: an EXPR may now start with a bareword
16 * patch20: print $fh EXPR can now expect term rather than operator in EXPR
17 * patch20: added ... as variant on ..
18 * patch20: new warning on spurious backslash
19 * patch20: new warning on missing $ for foreach variable
20 * patch20: "foo"x1024 now legal without space after x
21 * patch20: new warning on print accidentally used as function
22 * patch20: tr/stuff// wasn't working right
23 * patch20: 2. now eats the dot
24 * patch20: <@ARGV> now notices @ARGV
25 * patch20: tr/// now lets you say \-
27 * Revision 4.0.1.5 91/11/11 16:45:51 lwall
28 * patch19: default arg for shift was wrong after first subroutine definition
30 * Revision 4.0.1.4 91/11/05 19:02:48 lwall
31 * patch11: \x and \c were subject to double interpretation in regexps
32 * patch11: prepared for ctype implementations that don't define isascii()
33 * patch11: nested list operators could miscount parens
34 * patch11: once-thru blocks didn't display right in the debugger
35 * patch11: sort eval "whatever" didn't work
36 * patch11: underscore is now allowed within literal octal and hex numbers
38 * Revision 4.0.1.3 91/06/10 01:32:26 lwall
39 * patch10: m'$foo' now treats string as single quoted
40 * patch10: certain pattern optimizations were botched
42 * Revision 4.0.1.2 91/06/07 12:05:56 lwall
43 * patch4: new copyright notice
44 * patch4: debugger lost track of lines in eval
45 * patch4: //o and s///o now optimize themselves fully at runtime
46 * patch4: added global modifier for pattern matches
48 * Revision 4.0.1.1 91/04/12 09:18:18 lwall
49 * patch1: perl -de "print" wouldn't stop at the first statement
51 * Revision 4.0 91/03/20 01:42:14 lwall
60 static void set_csh();
62 /* The following are arranged oddly so that the guard on the switch statement
63 * can get by with a single comparison (if the compiler is smart enough).
67 #define LEX_INTERPNORMAL 7 /* tokenizing an interpolated expression; shares the tokenizer case with LEX_NORMAL */
68 #define LEX_INTERPCASEMOD 6 /* at a case-modifier escape: handles \E and queues OP_LC/OP_UC/OP_LCFIRST/OP_UCFIRST */
69 #define LEX_INTERPSTART 5 /* at the start of an interpolation: records '@' in lex_dojoin, then goes to LEX_INTERPNORMAL */
70 #define LEX_INTERPEND 4 /* entered from LEX_INTERPNORMAL once brackets balance and no "->" follows */
71 #define LEX_INTERPENDMAYBE 3 /* intuit_more() is asked whether the expression continues */
72 #define LEX_INTERPCONCAT 2 /* scanning literal text with scan_const(); sublex_done() at end of buffer */
73 #define LEX_INTERPCONST 1 /* NOTE(review): not referenced in the visible part of this file -- confirm use */
74 #define LEX_KNOWNEXT 0 /* a forced token waits in nextval[]/nexttype[]; the prior state is parked in lex_defer */
76 static U32 lex_state = LEX_NORMAL; /* next token is determined */
77 static U32 lex_defer; /* state after determined token */
78 static expectation lex_expect; /* expect after determined token */
79 static I32 lex_brackets; /* bracket count */
80 static I32 lex_fakebrack; /* outer bracket is mere delimiter */
81 static I32 lex_casemods; /* casemod count */
82 static I32 lex_dojoin; /* doing an array interpolation */
83 static I32 lex_starts; /* how many interps done on level */
84 static SV * lex_stuff; /* runtime pattern from m// or s/// */
85 static SV * lex_repl; /* runtime replacement from s/// */
86 static OP * lex_op; /* extra info to pass back on op */
87 static I32 lex_inpat; /* in pattern $) and $| are special */
88 static I32 lex_inwhat; /* what kind of quoting are we in */
89 static char * lex_brackstack; /* what kind of brackets to pop */
91 /* What we know when we're in LEX_KNOWNEXT state. */
92 static YYSTYPE nextval[5]; /* value of next token, if any */
93 static I32 nexttype[5]; /* type of next token */
94 static I32 nexttoke = 0;
100 #include <sys/file.h>
107 #include "keywords.h"
114 #define CLINE (copline = (curcop->cop_line < copline ? curcop->cop_line : copline))
117 #define PERL_META(c) ((c) | 128)
119 #define META(c) ((c) | 128)
/* Token-return helpers for the tokenizer.  Each one expands to a complete
 * return statement that copies the scan pointer s back into bufptr and
 * yields the token type as an int.  They differ in the value left in
 * expect and in whether f is first stored in yylval.ival.
 */
122 #define TOKEN(retval) return (bufptr = s,(int)retval) /* expect is left unchanged */
123 #define OPERATOR(retval) return (expect = XTERM,bufptr = s,(int)retval) /* expect becomes XTERM */
124 #define PREBLOCK(retval) return (expect = XBLOCK,bufptr = s,(int)retval) /* expect becomes XBLOCK */
125 #define PREREF(retval) return (expect = XREF,bufptr = s,(int)retval) /* expect becomes XREF */
126 #define TERM(retval) return (CLINE, expect = XOPERATOR,bufptr = s,(int)retval) /* runs CLINE first; expect becomes XOPERATOR */
/* The macros below store f in yylval.ival and return a fixed token type. */
127 #define LOOPX(f) return(yylval.ival=f,expect = XTERM,bufptr = s,(int)LOOPEX)
128 #define FTST(f) return(yylval.ival=f,expect = XTERM,bufptr = s,(int)UNIOP)
/* FUN0 and FUN1 are the only two of this group that set expect to XOPERATOR. */
129 #define FUN0(f) return(yylval.ival = f,expect = XOPERATOR,bufptr = s,(int)FUNC0)
130 #define FUN1(f) return(yylval.ival = f,expect = XOPERATOR,bufptr = s,(int)FUNC1)
/* Binary-operator forms: all set expect to XTERM. */
131 #define BOop(f) return(yylval.ival=f,expect = XTERM,bufptr = s,(int)BITOROP)
132 #define BAop(f) return(yylval.ival=f,expect = XTERM,bufptr = s,(int)BITANDOP)
133 #define SHop(f) return(yylval.ival=f,expect = XTERM,bufptr = s,(int)SHIFTOP)
134 #define PWop(f) return(yylval.ival=f,expect = XTERM,bufptr = s,(int)POWOP)
135 #define PMop(f) return(yylval.ival=f,expect = XTERM,bufptr = s,(int)MATCHOP)
136 #define Aop(f) return(yylval.ival=f,expect = XTERM,bufptr = s,(int)ADDOP)
137 #define Mop(f) return(yylval.ival=f,expect = XTERM,bufptr = s,(int)MULOP)
138 #define Eop(f) return(yylval.ival=f,expect = XTERM,bufptr = s,(int)EQOP)
139 #define Rop(f) return(yylval.ival=f,expect = XTERM,bufptr = s,(int)RELOP)
141 /* This bit of chicanery makes a unary function followed by
142 * a parenthesis into a function with one argument, highest precedence.
144 #define UNI(f) return(yylval.ival = f, \
147 last_uni = oldbufptr, \
148 (*s == '(' || (s = skipspace(s), *s == '(') ? (int)FUNC1 : (int)UNIOP) )
150 #define UNIBRACK(f) return(yylval.ival = f, \
152 last_uni = oldbufptr, \
153 (*s == '(' || (s = skipspace(s), *s == '(') ? (int)FUNC1 : (int)UNIOP) )
155 /* This does similarly for list operators */
156 #define LOP(f) return(yylval.ival = f, \
160 last_lop = oldbufptr, \
161 (*s == '(' || (s = skipspace(s), *s == '(') ? (int)FUNC : (int)LSTOP) )
163 /* grandfather return to old style */
164 #define OLDLOP(f) return(yylval.ival=f,expect = XTERM,bufptr = s,(int)LSTOP)
170 warn("%s found where operator expected", what);
178 SAVEINT(lex_brackets);
179 SAVEINT(lex_fakebrack);
180 SAVEINT(lex_casemods);
185 SAVEINT(curcop->cop_line);
188 SAVESPTR(oldoldbufptr);
190 SAVESPTR(lex_brackstack);
192 lex_state = LEX_NORMAL;
198 SAVESPTR(lex_brackstack);
199 lex_brackstack = malloc(120);
211 oldoldbufptr = oldbufptr = bufptr = SvPVX(linestr);
212 bufend = bufptr + SvCUR(linestr);
222 free(lex_brackstack);
239 while (*s == ' ' || *s == '\t') s++;
240 if (strnEQ(s, "line ", 5)) {
249 while (*s == ' ' || *s == '\t')
251 if (*s == '"' && (t = strchr(s+1, '"')))
255 return; /* false alarm */
256 for (t = s; !isSPACE(*t); t++) ;
261 curcop->cop_filegv = gv_fetchfile(s);
263 curcop->cop_filegv = gv_fetchfile(origfilename);
265 curcop->cop_line = atoi(n)-1;
272 if (in_format && lex_brackets <= 1) {
273 while (s < bufend && (*s == ' ' || *s == '\t'))
278 while (s < bufend && isSPACE(*s))
280 if (s < bufend && *s == '#') {
281 while (s < bufend && *s != '\n')
286 if (s < bufend || !rsfp)
288 if ((s = sv_gets(linestr, rsfp, 0)) == Nullch) {
289 sv_setpv(linestr,"");
290 bufend = oldoldbufptr = oldbufptr = bufptr = s = SvPVX(linestr);
293 oldoldbufptr = oldbufptr = bufptr = s;
294 bufend = bufptr + SvCUR(linestr);
304 if (oldoldbufptr != last_uni)
306 while (isSPACE(*last_uni))
308 for (s = last_uni; isALNUM(*s) || *s == '-'; s++) ;
311 warn("Warning: Use of \"%s\" without parens is ambiguous", last_uni);
319 #define UNI(f) return uni(f,s)
320 #define LOP(f) return lop(f,s)
330 last_uni = oldbufptr;
349 last_uni = oldbufptr;
359 #endif /* CRIPPLED_CC */
365 nexttype[nexttoke] = type;
367 if (lex_state != LEX_KNOWNEXT) {
368 lex_defer = lex_state;
370 lex_state = LEX_KNOWNEXT;
375 force_word(start,token,check_keyword,allow_tick)
376 register char *start;
384 start = skipspace(start);
386 if (isIDFIRST(*s) || (allow_tick && (*s == '\'' || *s == ':'))) {
387 s = scan_word(s, tokenbuf, allow_tick, &len);
388 if (check_keyword && keyword(tokenbuf, len))
390 if (token == METHOD) {
400 nextval[nexttoke].opval = (OP*)newSVOP(OP_CONST,0, newSVpv(tokenbuf,0));
411 nextval[nexttoke].opval = (OP*)newSVOP(OP_CONST, 0, newSVpv(s,0));
431 while (s < send && *s != '\\')
436 delim = SvSTORAGE(sv);
439 if (s + 1 < send && (s[1] == '\\' || s[1] == delim))
440 s++; /* all that, just for this */
445 SvCUR_set(sv, d - SvPVX(sv));
453 register I32 op_type = yylval.ival;
457 if (op_type == OP_NULL) {
458 yylval.opval = lex_op;
462 if (op_type == OP_CONST || op_type == OP_READLINE) {
463 yylval.opval = (OP*)newSVOP(op_type, 0, q(lex_stuff));
470 SAVEINT(lex_brackets);
471 SAVEINT(lex_fakebrack);
472 SAVEINT(lex_casemods);
477 SAVEINT(curcop->cop_line);
480 SAVESPTR(oldoldbufptr);
482 SAVESPTR(lex_brackstack);
487 bufend = bufptr = oldbufptr = oldoldbufptr = SvPVX(linestr);
488 bufend += SvCUR(linestr);
493 lex_brackstack = malloc(120);
496 lex_state = LEX_INTERPCONCAT;
497 curcop->cop_line = multi_start;
499 lex_inwhat = op_type;
500 if (op_type == OP_MATCH || op_type == OP_SUBST)
508 yylval.opval = lex_op;
521 yylval.opval = (OP*)newSVOP(OP_CONST, 0, newSVpv("",0));
525 if (lex_casemods) { /* oops, we've got some unbalanced parens */
526 lex_state = LEX_INTERPCASEMOD;
531 /* Is there a right-hand side to take care of? */
532 if (lex_repl && (lex_inwhat == OP_SUBST || lex_inwhat == OP_TRANS)) {
535 bufend = bufptr = oldbufptr = oldoldbufptr = SvPVX(linestr);
536 bufend += SvCUR(linestr);
542 if (SvCOMPILED(lex_repl)) {
543 lex_state = LEX_INTERPNORMAL;
547 lex_state = LEX_INTERPCONCAT;
553 free(lex_brackstack);
557 bufend = SvPVX(linestr);
558 bufend += SvCUR(linestr);
568 register char *send = bufend;
569 SV *sv = NEWSV(93, send - start);
570 register char *s = start;
571 register char *d = SvPVX(sv);
572 char delim = SvSTORAGE(linestr);
573 bool dorange = FALSE;
577 ? "\\.^$@dDwWsSbB+*?|()-nrtfeaxc0123456789[{]}"
578 : (lex_inwhat & OP_TRANS)
582 while (s < send || dorange) {
583 if (lex_inwhat == OP_TRANS) {
588 SvGROW(sv, SvLEN(sv) + 256);
592 for (i = (*d & 0377); i <= max; i++)
597 else if (*s == '-' && s+1 < send && s != start) {
604 else if (*s == '$') {
605 if (!lex_inpat) /* not a regexp, so $ must be var */
607 if (s + 1 < send && s[1] != ')' && s[1] != '|')
608 break; /* in regexp, $ might be tail anchor */
610 if (*s == '\\' && s+1 < send) {
616 if (*s && strchr(leave, *s)) {
621 if (lex_inwhat == OP_SUBST && !lex_inpat &&
622 isDIGIT(*s) && !isDIGIT(s[1]))
627 if (lex_inwhat != OP_TRANS && *s && strchr("lLuUE", *s)) {
633 if (lex_inwhat == OP_TRANS) {
641 case '0': case '1': case '2': case '3':
642 case '4': case '5': case '6': case '7':
643 *d++ = scan_oct(s, 3, &len);
647 *d++ = scan_hex(++s, 2, &len);
685 SvCUR_set(sv, d - SvPVX(sv));
688 if (SvCUR(sv) + 5 < SvLEN(sv)) {
689 SvLEN_set(sv, SvCUR(sv) + 1);
690 Renew(SvPVX(sv), SvLEN(sv), char);
693 yylval.opval = (OP*)newSVOP(OP_CONST, 0, sv);
699 /* This is the one truly awful dwimmer necessary to conflate C and sed. */
706 if (*s == '-' && s[1] == '>' && (s[2] == '[' || s[2] == '{'))
708 if (*s != '{' && *s != '[')
713 /* In a pattern, so maybe we have {n,m}. */
730 /* On the other hand, maybe we have a character class */
733 if (*s == ']' || *s == '^')
736 int weight = 2; /* let's weigh the evidence */
738 unsigned char un_char = 0, last_un_char;
739 char *send = strchr(s,']');
742 if (!send) /* has to be an expression */
748 else if (isDIGIT(*s)) {
750 if (isDIGIT(s[1]) && s[2] == ']')
756 for (; s < send; s++) {
757 last_un_char = un_char;
758 un_char = (unsigned char)*s;
763 weight -= seen[un_char] * 10;
765 scan_ident(s,send,tmpbuf,FALSE);
766 if (strlen(tmpbuf) > 1 && gv_fetchpv(tmpbuf,FALSE))
771 else if (*s == '$' && s[1] &&
772 strchr("[#!%*<>()-=",s[1])) {
773 if (/*{*/ strchr("])} =",s[2]))
782 if (strchr("wds]",s[1]))
784 else if (seen['\''] || seen['"'])
786 else if (strchr("rnftbxcav",s[1]))
788 else if (isDIGIT(s[1])) {
790 while (s[1] && isDIGIT(s[1]))
800 if (strchr("aA01! ",last_un_char))
802 if (strchr("zZ79~",s[1]))
806 if (!isALNUM(last_un_char) && !strchr("$@&",last_un_char) &&
807 isALPHA(*s) && s[1] && isALPHA(s[1])) {
812 if (keyword(tmpbuf, d - tmpbuf))
815 if (un_char == last_un_char + 1)
817 weight -= seen[un_char];
822 if (weight >= 0) /* probably a character class */
829 static char* exp_name[] = { "OPERATOR", "TERM", "BLOCK", "REF" };
831 extern int yychar; /* last token */
843 case LEX_NORMAL: /* Some compilers will produce faster */
844 case LEX_INTERPNORMAL: /* code if we comment these out. */
850 yylval = nextval[nexttoke];
852 lex_state = lex_defer;
855 return(nexttype[nexttoke]);
857 case LEX_INTERPCASEMOD:
859 if (bufptr != bufend && *bufptr != '\\')
860 croak("panic: INTERPCASEMOD");
862 if (bufptr == bufend || bufptr[1] == 'E') {
863 if (lex_casemods <= 1) {
864 if (bufptr != bufend)
866 lex_state = LEX_INTERPSTART;
874 else if (lex_casemods) {
880 if (strnEQ(s, "L\\u", 3) || strnEQ(s, "U\\l", 3))
881 tmp = *s, *s = s[2], s[2] = tmp; /* misordered... */
883 lex_state = LEX_INTERPCONCAT;
884 nextval[nexttoke].ival = 0;
887 nextval[nexttoke].ival = OP_LCFIRST;
889 nextval[nexttoke].ival = OP_UCFIRST;
891 nextval[nexttoke].ival = OP_LC;
893 nextval[nexttoke].ival = OP_UC;
895 croak("panic: yylex");
907 case LEX_INTERPSTART:
908 if (bufptr == bufend)
909 return sublex_done();
911 lex_dojoin = (*bufptr == '@');
912 lex_state = LEX_INTERPNORMAL;
914 nextval[nexttoke].ival = 0;
917 nextval[nexttoke].ival = 0;
919 nextval[nexttoke].ival = 0;
921 nextval[nexttoke].ival = OP_JOIN; /* emulate join($", ...) */
932 case LEX_INTERPENDMAYBE:
933 if (intuit_more(bufptr)) {
934 lex_state = LEX_INTERPNORMAL; /* false alarm, more expr */
942 lex_state = LEX_INTERPCONCAT;
946 case LEX_INTERPCONCAT:
949 croak("panic: INTERPCONCAT");
951 if (bufptr == bufend)
952 return sublex_done();
954 if (SvSTORAGE(linestr) == '\'') {
955 SV *sv = newSVsv(linestr);
958 yylval.opval = (OP*)newSVOP(OP_CONST, 0, sv);
962 s = scan_const(bufptr);
964 lex_state = LEX_INTERPCASEMOD;
966 lex_state = LEX_INTERPSTART;
970 nextval[nexttoke] = yylval;
985 oldoldbufptr = oldbufptr;
988 fprintf(stderr,"### Tokener expecting %s at %s\n", exp_name[expect], s);
994 if ((*s & 127) == '}') {
999 warn("Unrecognized character \\%03o ignored", *s++ & 255);
1005 if ((*s & 127) == '}') {
1010 warn("Unrecognized character \\%03o ignored", *s++ & 255);
1014 goto fake_eof; /* emulate EOF on ^D or ^Z */
1018 yyerror("Missing right bracket");
1022 goto retry; /* ignore stray nulls */
1027 sv_setpv(linestr,"");
1029 char *pdb = getenv("PERLDB");
1031 sv_catpv(linestr,"{");
1032 sv_catpv(linestr, pdb ? pdb : "require 'perldb.pl'");
1033 sv_catpv(linestr, "}");
1035 if (minus_n || minus_p) {
1036 sv_catpv(linestr, "LINE: while (<>) {");
1038 sv_catpv(linestr,"chop;");
1040 sv_catpv(linestr,"@F=split(' ');");
1042 oldoldbufptr = oldbufptr = s = SvPVX(linestr);
1043 bufend = SvPVX(linestr) + SvCUR(linestr);
1048 #endif /* CRYPTSCRIPT */
1050 if ((s = sv_gets(linestr, rsfp, 0)) == Nullch) {
1054 (void)my_pclose(rsfp);
1055 else if ((FILE*)rsfp == stdin)
1061 if (minus_n || minus_p) {
1062 sv_setpv(linestr,minus_p ? ";}continue{print" : "");
1063 sv_catpv(linestr,";}");
1064 oldoldbufptr = oldbufptr = s = SvPVX(linestr);
1065 bufend = SvPVX(linestr) + SvCUR(linestr);
1066 minus_n = minus_p = 0;
1069 oldoldbufptr = oldbufptr = s = SvPVX(linestr);
1070 sv_setpv(linestr,"");
1071 TOKEN(';'); /* not infinite loop because rsfp is NULL now */
1073 if (doextract && *s == '#')
1076 } while (doextract);
1077 oldoldbufptr = oldbufptr = bufptr = s;
1079 SV *sv = NEWSV(85,0);
1081 sv_upgrade(sv, SVt_PVMG);
1082 sv_setsv(sv,linestr);
1083 av_store(GvAV(curcop->cop_filegv),(I32)curcop->cop_line,sv);
1085 bufend = SvPVX(linestr) + SvCUR(linestr);
1086 if (curcop->cop_line == 1) {
1087 while (s < bufend && isSPACE(*s))
1089 if (*s == ':') /* for csh's that have to exec sh scripts */
1091 if (*s == '#' && s[1] == '!') {
1092 if (!in_eval && !instr(s,"perl") && instr(origargv[0],"perl")) {
1100 while (s < bufend && !isSPACE(*s))
1103 while (s < bufend && isSPACE(*s))
1106 Newz(899,newargv,origargc+3,char*);
1108 while (s < bufend && !isSPACE(*s))
1111 Copy(origargv+1, newargv+2, origargc+1, char*);
1117 croak("Can't exec %s", cmd);
1119 if (d = instr(s, "perl -")) {
1122 while (d = moreswitches(d)) ;
1126 if (in_format && lex_brackets <= 1) {
1127 s = scan_formline(s);
1133 case ' ': case '\t': case '\f': case '\r': case 013:
1138 if (lex_state != LEX_NORMAL || (in_eval && !rsfp)) {
1140 while (s < d && *s != '\n')
1145 if (in_format && lex_brackets <= 1) {
1146 s = scan_formline(s);
1158 if (s[1] && isALPHA(s[1]) && !isALNUM(s[2])) {
1160 last_uni = oldbufptr;
1162 case 'r': FTST(OP_FTEREAD);
1163 case 'w': FTST(OP_FTEWRITE);
1164 case 'x': FTST(OP_FTEEXEC);
1165 case 'o': FTST(OP_FTEOWNED);
1166 case 'R': FTST(OP_FTRREAD);
1167 case 'W': FTST(OP_FTRWRITE);
1168 case 'X': FTST(OP_FTREXEC);
1169 case 'O': FTST(OP_FTROWNED);
1170 case 'e': FTST(OP_FTIS);
1171 case 'z': FTST(OP_FTZERO);
1172 case 's': FTST(OP_FTSIZE);
1173 case 'f': FTST(OP_FTFILE);
1174 case 'd': FTST(OP_FTDIR);
1175 case 'l': FTST(OP_FTLINK);
1176 case 'p': FTST(OP_FTPIPE);
1177 case 'S': FTST(OP_FTSOCK);
1178 case 'u': FTST(OP_FTSUID);
1179 case 'g': FTST(OP_FTSGID);
1180 case 'k': FTST(OP_FTSVTX);
1181 case 'b': FTST(OP_FTBLK);
1182 case 'c': FTST(OP_FTCHR);
1183 case 't': FTST(OP_FTTTY);
1184 case 'T': FTST(OP_FTTEXT);
1185 case 'B': FTST(OP_FTBINARY);
1186 case 'M': gv_fetchpv("\024",TRUE); FTST(OP_FTMTIME);
1187 case 'A': gv_fetchpv("\024",TRUE); FTST(OP_FTATIME);
1188 case 'C': gv_fetchpv("\024",TRUE); FTST(OP_FTCTIME);
1197 if (expect == XOPERATOR)
1202 else if (*s == '>') {
1205 if (isIDFIRST(*s)) {
1206 s = force_word(s,METHOD,TRUE,FALSE);
1212 if (expect == XOPERATOR)
1215 if (isSPACE(*s) || !isSPACE(*bufptr))
1217 OPERATOR('-'); /* unary minus */
1224 if (expect == XOPERATOR)
1229 if (expect == XOPERATOR)
1232 if (isSPACE(*s) || !isSPACE(*bufptr))
1238 if (expect != XOPERATOR) {
1239 s = scan_ident(s, bufend, tokenbuf, TRUE);
1241 force_ident(tokenbuf);
1252 if (expect != XOPERATOR) {
1253 s = scan_ident(s, bufend, tokenbuf + 1, TRUE);
1258 if (strchr(tokenbuf,':'))
1259 croak("\"my\" variable %s can't be in a package",tokenbuf);
1260 nextval[nexttoke].opval = newOP(OP_PADHV, 0);
1261 nextval[nexttoke].opval->op_targ = pad_allocmy(tokenbuf);
1262 force_next(PRIVATEREF);
1265 if (!strchr(tokenbuf,':')) {
1266 if (tmp = pad_findmy(tokenbuf)) {
1267 nextval[nexttoke].opval = newOP(OP_PADHV, 0);
1268 nextval[nexttoke].opval->op_targ = tmp;
1269 force_next(PRIVATEREF);
1273 force_ident(tokenbuf + 1);
1295 if (curcop->cop_line < copline)
1296 copline = curcop->cop_line;
1304 if (lex_brackets <= 0)
1305 yyerror("Unmatched right bracket");
1308 if (lex_state == LEX_INTERPNORMAL) {
1309 if (lex_brackets == 0) {
1310 if (*s != '-' || s[1] != '>')
1311 lex_state = LEX_INTERPEND;
1320 if (lex_brackets > 100)
1321 realloc(lex_brackstack, lex_brackets + 1);
1322 if (oldoldbufptr == last_lop)
1323 lex_brackstack[lex_brackets++] = XTERM;
1325 lex_brackstack[lex_brackets++] = XOPERATOR;
1326 if (expect == XTERM)
1327 OPERATOR(HASHBRACK);
1328 else if (expect == XREF) {
1332 OPERATOR(HASHBRACK);
1335 (isSPACE(*t) || isALPHA(*t) || *t == '"' || *t == '\'');
1337 if (*t == ',' || (*t == '=' && t[1] == '>'))
1338 OPERATOR(HASHBRACK);
1342 lex_brackstack[lex_brackets-1] = XBLOCK;
1345 yylval.ival = curcop->cop_line;
1346 if (isSPACE(*s) || *s == '#')
1347 copline = NOLINE; /* invalidate current command line number */
1352 if (lex_brackets <= 0)
1353 yyerror("Unmatched right bracket");
1355 expect = (expectation)lex_brackstack[--lex_brackets];
1356 if (lex_state == LEX_INTERPNORMAL) {
1357 if (lex_brackets == 0) {
1358 if (lex_fakebrack) {
1359 lex_state = LEX_INTERPEND;
1361 return yylex(); /* ignore fake brackets */
1363 if (*s != '-' || s[1] != '>')
1364 lex_state = LEX_INTERPEND;
1375 if (expect == XOPERATOR) {
1376 if (dowarn && isALPHA(*s) && bufptr == SvPVX(linestr)) {
1384 s = scan_ident(s-1, bufend, tokenbuf, TRUE);
1387 force_ident(tokenbuf);
1409 if (dowarn && tmp && isSPACE(*s) && strchr("+-*/%.^&|<",tmp))
1410 warn("Reversed %c= operator",tmp);
1412 if (in_format == 2 && (tmp == '\n' || s[1] == '\n')) {
1429 if (expect != XOPERATOR) {
1430 if (s[1] != '<' && !strchr(s,'>'))
1433 s = scan_heredoc(s);
1435 s = scan_inputsymbol(s);
1436 TERM(sublex_start());
1441 SHop(OP_LEFT_SHIFT);
1455 SHop(OP_RIGHT_SHIFT);
1462 if (expect == XOPERATOR) {
1464 OPERATOR(','); /* grandfather non-comma-format format */
1468 if (s[1] == '#' && (isALPHA(s[2]) || s[2] == '_' || s[2] == '{')) {
1469 s = scan_ident(s+1, bufend, tokenbuf, FALSE);
1471 force_ident(tokenbuf);
1474 s = scan_ident(s, bufend, tokenbuf+1, FALSE);
1477 if (dowarn && *s == '[') {
1479 for (t = s+1; isSPACE(*t) || isALNUM(*t) || *t == '$'; t++) ;
1481 bufptr = skipspace(bufptr);
1482 while (t < bufend && *t != ']') t++;
1483 warn("Multidimensional syntax %.*s not supported",
1484 t-bufptr+1, bufptr);
1488 if (lex_state == LEX_NORMAL && isSPACE(*s)) {
1489 bool islop = (last_lop == oldoldbufptr);
1491 if (strchr("$@\"'`q", *s))
1492 expect = XTERM; /* e.g. print $fh "foo" */
1495 else if (strchr("&*<%", *s) && isIDFIRST(s[1]))
1496 expect = XTERM; /* e.g. print $fh &sub */
1497 else if (isDIGIT(*s))
1498 expect = XTERM; /* e.g. print $fh 3 */
1499 else if (*s == '.' && isDIGIT(s[1]))
1500 expect = XTERM; /* e.g. print $fh .3 */
1501 else if (strchr("/?-+", *s) && !isSPACE(s[1]))
1502 expect = XTERM; /* e.g. print $fh -1 */
1503 else if (*s == '<' && s[1] == '<' && !isSPACE(s[2]))
1504 expect = XTERM; /* print $fh <<"EOF" */
1507 if (strchr(tokenbuf,':'))
1508 croak("\"my\" variable %s can't be in a package",tokenbuf);
1509 nextval[nexttoke].opval = newOP(OP_PADSV, 0);
1510 nextval[nexttoke].opval->op_targ = pad_allocmy(tokenbuf);
1511 force_next(PRIVATEREF);
1513 else if (!strchr(tokenbuf,':')) {
1514 I32 optype = OP_PADSV;
1519 else if (*s == '{') {
1523 if (tmp = pad_findmy(tokenbuf)) {
1524 nextval[nexttoke].opval = newOP(optype, 0);
1525 nextval[nexttoke].opval->op_targ = tmp;
1526 force_next(PRIVATEREF);
1529 force_ident(tokenbuf+1);
1532 force_ident(tokenbuf+1);
1536 yyerror("Final $ should be \\$ or $name");
1542 if (expect == XOPERATOR)
1544 s = scan_ident(s, bufend, tokenbuf+1, FALSE);
1549 if (strchr(tokenbuf,':'))
1550 croak("\"my\" variable %s can't be in a package",tokenbuf);
1551 nextval[nexttoke].opval = newOP(OP_PADAV, 0);
1552 nextval[nexttoke].opval->op_targ = pad_allocmy(tokenbuf);
1553 force_next(PRIVATEREF);
1556 else if (!strchr(tokenbuf,':')) {
1557 I32 optype = OP_PADAV;
1562 if (tmp = pad_findmy(tokenbuf)) {
1563 nextval[nexttoke].opval = newOP(optype, 0);
1564 nextval[nexttoke].opval->op_targ = tmp;
1565 force_next(PRIVATEREF);
1569 if (dowarn && *s == '[') {
1571 for (t = s+1; isSPACE(*t) || isALNUM(*t) || *t == '$'; t++) ;
1573 bufptr = skipspace(bufptr);
1574 warn("Scalar value %.*s better written as $%.*s",
1575 t-bufptr, bufptr, t-bufptr-1, bufptr+1);
1578 force_ident(tokenbuf+1);
1582 yyerror("Final @ should be \\@ or @name");
1587 case '/': /* may either be division or pattern */
1588 case '?': /* may either be conditional or pattern */
1589 if (expect != XOPERATOR) {
1592 TERM(sublex_start());
1600 if (in_format == 2) {
1605 if (expect == XOPERATOR || !isDIGIT(s[1])) {
1611 yylval.ival = OPf_SPECIAL;
1617 if (expect != XOPERATOR)
1622 case '0': case '1': case '2': case '3': case '4':
1623 case '5': case '6': case '7': case '8': case '9':
1624 if (expect == XOPERATOR)
1630 if (expect == XOPERATOR) {
1632 OPERATOR(','); /* grandfather non-comma-format format */
1638 croak("EOF in string");
1639 yylval.ival = OP_CONST;
1640 TERM(sublex_start());
1643 if (expect == XOPERATOR) {
1645 OPERATOR(','); /* grandfather non-comma-format format */
1651 croak("EOF in string");
1652 yylval.ival = OP_SCALAR;
1653 TERM(sublex_start());
1656 if (expect == XOPERATOR)
1660 croak("EOF in backticks");
1661 yylval.ival = OP_BACKTICK;
1663 TERM(sublex_start());
1666 if (expect == XOPERATOR)
1672 if (isDIGIT(s[1]) && expect == XOPERATOR) {
1708 s = scan_word(s, tokenbuf, FALSE, &len);
1710 switch (tmp = keyword(tokenbuf, len)) {
1712 default: /* not a keyword */
1715 if (*s == '\'' || *s == ':')
1716 s = scan_word(s, tokenbuf + len, TRUE, &len);
1717 if (expect == XBLOCK) { /* special case: start of statement */
1718 while (isSPACE(*s)) s++;
1720 yylval.pval = savestr(tokenbuf);
1726 else if (dowarn && expect == XOPERATOR) {
1727 if (bufptr == SvPVX(linestr)) {
1735 gv = gv_fetchpv(tokenbuf,FALSE);
1736 if (gv && GvCV(gv)) {
1737 nextval[nexttoke].opval =
1738 (OP*)newSVOP(OP_CONST, 0, newSVpv(tokenbuf,0));
1739 nextval[nexttoke].opval->op_private = OPpCONST_BARE;
1747 last_lop = oldbufptr;
1754 if (oldoldbufptr && oldoldbufptr < bufptr) {
1755 if (oldoldbufptr == last_lop) {
1758 yylval.opval = (OP*)newSVOP(OP_CONST, 0,
1759 newSVpv(tokenbuf,0));
1760 yylval.opval->op_private = OPpCONST_BARE;
1761 for (d = tokenbuf; *d && isLOWER(*d); d++) ;
1763 warn(warn_reserved, tokenbuf);
1767 while (s < bufend && isSPACE(*s))
1771 nextval[nexttoke].opval =
1772 (OP*)newSVOP(OP_CONST, 0, newSVpv(tokenbuf,0));
1773 nextval[nexttoke].opval->op_private = OPpCONST_BARE;
1779 yylval.opval = (OP*)newSVOP(OP_CONST, 0, newSVpv(tokenbuf,0));
1780 yylval.opval->op_private = OPpCONST_BARE;
1782 if (*s == '$' || *s == '{') {
1783 last_lop = oldbufptr;
1790 s = scan_word(s, tmpbuf, TRUE, &len);
1791 if (!keyword(tmpbuf, len)) {
1792 gv = gv_fetchpv(tmpbuf,FALSE);
1793 if (!gv || !GvCV(gv)) {
1794 nextval[nexttoke].opval =
1795 (OP*)newSVOP(OP_CONST, 0, newSVpv(tmpbuf,0));
1796 nextval[nexttoke].opval->op_private = OPpCONST_BARE;
1805 for (d = tokenbuf; *d && isLOWER(*d); d++) ;
1807 warn(warn_reserved, tokenbuf);
1812 case KEY___FILE__: {
1813 if (tokenbuf[2] == 'L')
1814 (void)sprintf(tokenbuf,"%ld",(long)curcop->cop_line);
1816 strcpy(tokenbuf, SvPVX(GvSV(curcop->cop_filegv)));
1817 yylval.opval = (OP*)newSVOP(OP_CONST, 0, newSVpv(tokenbuf,0));
1826 if (!in_eval && (gv = gv_fetchpv("DATA",FALSE))) {
1830 GvIO(gv)->ifp = rsfp;
1831 #if defined(HAS_FCNTL) && defined(FFt_SETFD)
1833 fcntl(fd,FFt_SETFD,fd >= 3);
1836 GvIO(gv)->type = '|';
1837 else if ((FILE*)rsfp == stdin)
1838 GvIO(gv)->type = '-';
1840 GvIO(gv)->type = '<';
1849 if (expect == XBLOCK && (minus_p || minus_n || *s == '{' )) {
1886 (void)gv_fetchpv("ENV",TRUE); /* may use HOME */
1910 if (dowarn && *s != '0' && isDIGIT(*s))
1911 warn("chmod: mode argument is missing initial 0");
1934 s = force_word(s,WORD,FALSE,TRUE);
1959 yylval.ival = curcop->cop_line;
1970 expect = (*s == '{') ? XBLOCK : XTERM;
1971 UNIBRACK(OP_ENTEREVAL);
1986 case KEY_endhostent:
1992 case KEY_endservent:
1995 case KEY_endprotoent:
2006 yylval.ival = curcop->cop_line;
2007 while (s < bufend && isSPACE(*s))
2010 croak("Missing $ on loop variable");
2052 case KEY_getpriority:
2053 LOP(OP_GETPRIORITY);
2055 case KEY_getprotobyname:
2058 case KEY_getprotobynumber:
2061 case KEY_getprotoent:
2073 case KEY_getpeername:
2074 UNI(OP_GETPEERNAME);
2076 case KEY_gethostbyname:
2079 case KEY_gethostbyaddr:
2082 case KEY_gethostent:
2085 case KEY_getnetbyname:
2088 case KEY_getnetbyaddr:
2094 case KEY_getservbyname:
2097 case KEY_getservbyport:
2100 case KEY_getservent:
2103 case KEY_getsockname:
2104 UNI(OP_GETSOCKNAME);
2106 case KEY_getsockopt:
2128 yylval.ival = curcop->cop_line;
2150 s = force_word(s,WORD,TRUE,FALSE);
2189 TERM(sublex_start());
2212 s = force_word(s,WORD,TRUE,FALSE);
2220 if (isIDFIRST(*s)) {
2222 for (d = s; isALNUM(*d); d++) ;
2224 if (strchr("|&*+-=!?:.", *t))
2225 warn("Precedence problem: open %.*s should be open(%.*s)",
2243 checkcomma(s,tokenbuf,"filehandle");
2247 checkcomma(s,tokenbuf,"filehandle");
2260 s = force_word(s,WORD,FALSE,TRUE);
2269 croak("EOF in string");
2270 yylval.ival = OP_CONST;
2271 TERM(sublex_start());
2276 croak("EOF in string");
2277 yylval.ival = OP_SCALAR;
2278 if (SvSTORAGE(lex_stuff) == '\'')
2279 SvSTORAGE(lex_stuff) = 0; /* qq'$foo' should interpolate */
2280 TERM(sublex_start());
2285 croak("EOF in string");
2286 yylval.ival = OP_BACKTICK;
2288 TERM(sublex_start());
2300 s = force_word(s,WORD,TRUE,FALSE);
2347 TERM(sublex_start());
2349 TOKEN(1); /* force error */
2375 case KEY_setpriority:
2376 LOP(OP_SETPRIORITY);
2378 case KEY_sethostent:
2384 case KEY_setservent:
2387 case KEY_setprotoent:
2399 case KEY_setsockopt:
2429 case KEY_socketpair:
2433 checkcomma(s,tokenbuf,"subroutine name");
2435 if (*s == ';' || *s == ')') /* probably a close */
2436 croak("sort is now a reserved word");
2438 s = force_word(s,WORD,TRUE,TRUE);
2469 yylval.ival = savestack_ix; /* restore stuff on reduce */
2475 SAVESPTR(comppadname);
2476 SAVEINT(comppadnamefill);
2478 comppadname = newAV();
2479 comppadnamefill = -1;
2480 av_push(comppad, Nullsv);
2481 curpad = AvARRAY(comppad);
2484 subline = curcop->cop_line;
2486 if (tmp == KEY_format)
2490 if (isIDFIRST(*s) || *s == '\'' || *s == ':') {
2492 d = scan_word(s, tmpbuf, TRUE, &len);
2493 if (strchr(tmpbuf, ':'))
2494 sv_setpv(subname, tmpbuf);
2496 sv_setsv(subname,curstname);
2497 sv_catpvn(subname,"'",1);
2498 sv_catpvn(subname,tmpbuf,len);
2500 s = force_word(s,WORD,FALSE,TRUE);
2503 sv_setpv(subname,"?");
2505 if (tmp != KEY_format)
2530 TERM(sublex_start());
2560 yylval.ival = curcop->cop_line;
2564 yylval.ival = curcop->cop_line;
2581 if (dowarn && *s != '0' && isDIGIT(*s))
2582 warn("umask: argument is missing initial 0");
2596 yylval.ival = curcop->cop_line;
2615 if (expect == XOPERATOR)
2622 TERM(sublex_start());
2635 if (strEQ(d,"__LINE__")) return KEY___LINE__;
2636 if (strEQ(d,"__FILE__")) return KEY___FILE__;
2637 if (strEQ(d,"__END__")) return KEY___END__;
2643 if (strEQ(d,"and")) return KEY_and;
2644 if (strEQ(d,"abs")) return KEY_abs;
2647 if (strEQ(d,"alarm")) return KEY_alarm;
2648 if (strEQ(d,"atan2")) return KEY_atan2;
2651 if (strEQ(d,"accept")) return KEY_accept;
2656 if (strEQ(d,"BEGIN")) return KEY_BEGIN;
2659 if (strEQ(d,"bless")) return KEY_bless;
2660 if (strEQ(d,"bind")) return KEY_bind;
2661 if (strEQ(d,"binmode")) return KEY_binmode;
2666 if (strEQ(d,"cmp")) return KEY_cmp;
2667 if (strEQ(d,"chr")) return KEY_chr;
2668 if (strEQ(d,"cos")) return KEY_cos;
2671 if (strEQ(d,"chop")) return KEY_chop;
2674 if (strEQ(d,"close")) return KEY_close;
2675 if (strEQ(d,"chdir")) return KEY_chdir;
2676 if (strEQ(d,"chmod")) return KEY_chmod;
2677 if (strEQ(d,"chown")) return KEY_chown;
2678 if (strEQ(d,"crypt")) return KEY_crypt;
2681 if (strEQ(d,"chroot")) return KEY_chroot;
2682 if (strEQ(d,"caller")) return KEY_caller;
2685 if (strEQ(d,"connect")) return KEY_connect;
2688 if (strEQ(d,"closedir")) return KEY_closedir;
2689 if (strEQ(d,"continue")) return KEY_continue;
2696 if (strEQ(d,"do")) return KEY_do;
2699 if (strEQ(d,"die")) return KEY_die;
2702 if (strEQ(d,"dump")) return KEY_dump;
2705 if (strEQ(d,"delete")) return KEY_delete;
2708 if (strEQ(d,"defined")) return KEY_defined;
2709 if (strEQ(d,"dbmopen")) return KEY_dbmopen;
2712 if (strEQ(d,"dbmclose")) return KEY_dbmclose;
2717 if (strEQ(d,"EQ")) return KEY_eq;
2718 if (strEQ(d,"END")) return KEY_END;
2723 if (strEQ(d,"eq")) return KEY_eq;
2726 if (strEQ(d,"eof")) return KEY_eof;
2727 if (strEQ(d,"exp")) return KEY_exp;
2730 if (strEQ(d,"else")) return KEY_else;
2731 if (strEQ(d,"exit")) return KEY_exit;
2732 if (strEQ(d,"eval")) return KEY_eval;
2733 if (strEQ(d,"exec")) return KEY_exec;
2734 if (strEQ(d,"each")) return KEY_each;
2737 if (strEQ(d,"elsif")) return KEY_elsif;
2740 if (strEQ(d,"endgrent")) return KEY_endgrent;
2741 if (strEQ(d,"endpwent")) return KEY_endpwent;
2744 if (strEQ(d,"endnetent")) return KEY_endnetent;
2747 if (strEQ(d,"endhostent")) return KEY_endhostent;
2748 if (strEQ(d,"endservent")) return KEY_endservent;
2751 if (strEQ(d,"endprotoent")) return KEY_endprotoent;
2758 if (strEQ(d,"for")) return KEY_for;
2761 if (strEQ(d,"fork")) return KEY_fork;
2764 if (strEQ(d,"fcntl")) return KEY_fcntl;
2765 if (strEQ(d,"flock")) return KEY_flock;
2768 if (strEQ(d,"format")) return KEY_format;
2769 if (strEQ(d,"fileno")) return KEY_fileno;
2772 if (strEQ(d,"foreach")) return KEY_foreach;
2775 if (strEQ(d,"formline")) return KEY_formline;
2781 if (strEQ(d,"GT")) return KEY_gt;
2782 if (strEQ(d,"GE")) return KEY_ge;
2786 if (strnEQ(d,"get",3)) {
2791 if (strEQ(d,"ppid")) return KEY_getppid;
2792 if (strEQ(d,"pgrp")) return KEY_getpgrp;
2795 if (strEQ(d,"pwent")) return KEY_getpwent;
2796 if (strEQ(d,"pwnam")) return KEY_getpwnam;
2797 if (strEQ(d,"pwuid")) return KEY_getpwuid;
2800 if (strEQ(d,"peername")) return KEY_getpeername;
2801 if (strEQ(d,"protoent")) return KEY_getprotoent;
2802 if (strEQ(d,"priority")) return KEY_getpriority;
2805 if (strEQ(d,"protobyname")) return KEY_getprotobyname;
2808 if (strEQ(d,"protobynumber"))return KEY_getprotobynumber;
2812 else if (*d == 'h') {
2813 if (strEQ(d,"hostbyname")) return KEY_gethostbyname;
2814 if (strEQ(d,"hostbyaddr")) return KEY_gethostbyaddr;
2815 if (strEQ(d,"hostent")) return KEY_gethostent;
2817 else if (*d == 'n') {
2818 if (strEQ(d,"netbyname")) return KEY_getnetbyname;
2819 if (strEQ(d,"netbyaddr")) return KEY_getnetbyaddr;
2820 if (strEQ(d,"netent")) return KEY_getnetent;
2822 else if (*d == 's') {
2823 if (strEQ(d,"servbyname")) return KEY_getservbyname;
2824 if (strEQ(d,"servbyport")) return KEY_getservbyport;
2825 if (strEQ(d,"servent")) return KEY_getservent;
2826 if (strEQ(d,"sockname")) return KEY_getsockname;
2827 if (strEQ(d,"sockopt")) return KEY_getsockopt;
2829 else if (*d == 'g') {
2830 if (strEQ(d,"grent")) return KEY_getgrent;
2831 if (strEQ(d,"grnam")) return KEY_getgrnam;
2832 if (strEQ(d,"grgid")) return KEY_getgrgid;
2834 else if (*d == 'l') {
2835 if (strEQ(d,"login")) return KEY_getlogin;
2837 else if (strEQ(d,"c")) return KEY_getc;
2842 if (strEQ(d,"gt")) return KEY_gt;
2843 if (strEQ(d,"ge")) return KEY_ge;
2846 if (strEQ(d,"grep")) return KEY_grep;
2847 if (strEQ(d,"goto")) return KEY_goto;
2848 if (strEQ(d,"glob")) return KEY_glob;
2851 if (strEQ(d,"gmtime")) return KEY_gmtime;
2856 if (strEQ(d,"hex")) return KEY_hex;
2861 if (strEQ(d,"if")) return KEY_if;
2864 if (strEQ(d,"int")) return KEY_int;
2867 if (strEQ(d,"index")) return KEY_index;
2868 if (strEQ(d,"ioctl")) return KEY_ioctl;
2873 if (strEQ(d,"join")) return KEY_join;
2877 if (strEQ(d,"keys")) return KEY_keys;
2878 if (strEQ(d,"kill")) return KEY_kill;
2883 if (strEQ(d,"LT")) return KEY_lt;
2884 if (strEQ(d,"LE")) return KEY_le;
2890 if (strEQ(d,"lt")) return KEY_lt;
2891 if (strEQ(d,"le")) return KEY_le;
2892 if (strEQ(d,"lc")) return KEY_lc;
2895 if (strEQ(d,"log")) return KEY_log;
2898 if (strEQ(d,"last")) return KEY_last;
2899 if (strEQ(d,"link")) return KEY_link;
2902 if (strEQ(d,"local")) return KEY_local;
2903 if (strEQ(d,"lstat")) return KEY_lstat;
2906 if (strEQ(d,"length")) return KEY_length;
2907 if (strEQ(d,"listen")) return KEY_listen;
2910 if (strEQ(d,"lcfirst")) return KEY_lcfirst;
2913 if (strEQ(d,"localtime")) return KEY_localtime;
2919 case 1: return KEY_m;
2921 if (strEQ(d,"my")) return KEY_my;
2924 if (strEQ(d,"mkdir")) return KEY_mkdir;
2927 if (strEQ(d,"msgctl")) return KEY_msgctl;
2928 if (strEQ(d,"msgget")) return KEY_msgget;
2929 if (strEQ(d,"msgrcv")) return KEY_msgrcv;
2930 if (strEQ(d,"msgsnd")) return KEY_msgsnd;
2935 if (strEQ(d,"NE")) return KEY_ne;
2938 if (strEQ(d,"next")) return KEY_next;
2939 if (strEQ(d,"ne")) return KEY_ne;
2944 if (strEQ(d,"or")) return KEY_or;
2947 if (strEQ(d,"ord")) return KEY_ord;
2948 if (strEQ(d,"oct")) return KEY_oct;
2951 if (strEQ(d,"open")) return KEY_open;
2954 if (strEQ(d,"opendir")) return KEY_opendir;
2961 if (strEQ(d,"pop")) return KEY_pop;
2964 if (strEQ(d,"push")) return KEY_push;
2965 if (strEQ(d,"pack")) return KEY_pack;
2966 if (strEQ(d,"pipe")) return KEY_pipe;
2969 if (strEQ(d,"print")) return KEY_print;
2972 if (strEQ(d,"printf")) return KEY_printf;
2975 if (strEQ(d,"package")) return KEY_package;
2981 if (strEQ(d,"q")) return KEY_q;
2982 if (strEQ(d,"qq")) return KEY_qq;
2983 if (strEQ(d,"qx")) return KEY_qx;
2989 if (strEQ(d,"ref")) return KEY_ref;
2992 if (strEQ(d,"read")) return KEY_read;
2993 if (strEQ(d,"rand")) return KEY_rand;
2994 if (strEQ(d,"recv")) return KEY_recv;
2995 if (strEQ(d,"redo")) return KEY_redo;
2998 if (strEQ(d,"rmdir")) return KEY_rmdir;
2999 if (strEQ(d,"reset")) return KEY_reset;
3002 if (strEQ(d,"return")) return KEY_return;
3003 if (strEQ(d,"rename")) return KEY_rename;
3004 if (strEQ(d,"rindex")) return KEY_rindex;
3007 if (strEQ(d,"require")) return KEY_require;
3008 if (strEQ(d,"reverse")) return KEY_reverse;
3009 if (strEQ(d,"readdir")) return KEY_readdir;
3012 if (strEQ(d,"readlink")) return KEY_readlink;
3013 if (strEQ(d,"readline")) return KEY_readline;
3014 if (strEQ(d,"readpipe")) return KEY_readpipe;
3017 if (strEQ(d,"rewinddir")) return KEY_rewinddir;
3023 case 0: return KEY_s;
3025 if (strEQ(d,"scalar")) return KEY_scalar;
3030 if (strEQ(d,"seek")) return KEY_seek;
3031 if (strEQ(d,"send")) return KEY_send;
3034 if (strEQ(d,"semop")) return KEY_semop;
3037 if (strEQ(d,"select")) return KEY_select;
3038 if (strEQ(d,"semctl")) return KEY_semctl;
3039 if (strEQ(d,"semget")) return KEY_semget;
3042 if (strEQ(d,"setpgrp")) return KEY_setpgrp;
3043 if (strEQ(d,"seekdir")) return KEY_seekdir;
3046 if (strEQ(d,"setpwent")) return KEY_setpwent;
3047 if (strEQ(d,"setgrent")) return KEY_setgrent;
3050 if (strEQ(d,"setnetent")) return KEY_setnetent;
3053 if (strEQ(d,"setsockopt")) return KEY_setsockopt;
3054 if (strEQ(d,"sethostent")) return KEY_sethostent;
3055 if (strEQ(d,"setservent")) return KEY_setservent;
3058 if (strEQ(d,"setpriority")) return KEY_setpriority;
3059 if (strEQ(d,"setprotoent")) return KEY_setprotoent;
3066 if (strEQ(d,"shift")) return KEY_shift;
3069 if (strEQ(d,"shmctl")) return KEY_shmctl;
3070 if (strEQ(d,"shmget")) return KEY_shmget;
3073 if (strEQ(d,"shmread")) return KEY_shmread;
3076 if (strEQ(d,"shmwrite")) return KEY_shmwrite;
3077 if (strEQ(d,"shutdown")) return KEY_shutdown;
3082 if (strEQ(d,"sin")) return KEY_sin;
3085 if (strEQ(d,"sleep")) return KEY_sleep;
3088 if (strEQ(d,"sort")) return KEY_sort;
3089 if (strEQ(d,"socket")) return KEY_socket;
3090 if (strEQ(d,"socketpair")) return KEY_socketpair;
3093 if (strEQ(d,"split")) return KEY_split;
3094 if (strEQ(d,"sprintf")) return KEY_sprintf;
3095 if (strEQ(d,"splice")) return KEY_splice;
3098 if (strEQ(d,"sqrt")) return KEY_sqrt;
3101 if (strEQ(d,"srand")) return KEY_srand;
3104 if (strEQ(d,"stat")) return KEY_stat;
3105 if (strEQ(d,"study")) return KEY_study;
3108 if (strEQ(d,"substr")) return KEY_substr;
3109 if (strEQ(d,"sub")) return KEY_sub;
3114 if (strEQ(d,"system")) return KEY_system;
3117 if (strEQ(d,"sysread")) return KEY_sysread;
3118 if (strEQ(d,"symlink")) return KEY_symlink;
3119 if (strEQ(d,"syscall")) return KEY_syscall;
3122 if (strEQ(d,"syswrite")) return KEY_syswrite;
3131 if (strEQ(d,"tr")) return KEY_tr;
3134 if (strEQ(d,"tie")) return KEY_tie;
3137 if (strEQ(d,"tell")) return KEY_tell;
3138 if (strEQ(d,"time")) return KEY_time;
3141 if (strEQ(d,"times")) return KEY_times;
3144 if (strEQ(d,"telldir")) return KEY_telldir;
3147 if (strEQ(d,"truncate")) return KEY_truncate;
3154 if (strEQ(d,"uc")) return KEY_uc;
3157 if (strEQ(d,"undef")) return KEY_undef;
3158 if (strEQ(d,"until")) return KEY_until;
3159 if (strEQ(d,"untie")) return KEY_untie;
3160 if (strEQ(d,"utime")) return KEY_utime;
3161 if (strEQ(d,"umask")) return KEY_umask;
3164 if (strEQ(d,"unless")) return KEY_unless;
3165 if (strEQ(d,"unpack")) return KEY_unpack;
3166 if (strEQ(d,"unlink")) return KEY_unlink;
3169 if (strEQ(d,"unshift")) return KEY_unshift;
3170 if (strEQ(d,"ucfirst")) return KEY_ucfirst;
3175 if (strEQ(d,"values")) return KEY_values;
3176 if (strEQ(d,"vec")) return KEY_vec;
3181 if (strEQ(d,"warn")) return KEY_warn;
3182 if (strEQ(d,"wait")) return KEY_wait;
3185 if (strEQ(d,"while")) return KEY_while;
3186 if (strEQ(d,"write")) return KEY_write;
3189 if (strEQ(d,"waitpid")) return KEY_waitpid;
3192 if (strEQ(d,"wantarray")) return KEY_wantarray;
3197 if (len == 1) return KEY_x;
3200 if (len == 1) return KEY_y;
/*
 * checkcomma(s,name,what) -- sanity checks on the text at s that follows
 * an operator called `name' (described as `what' in the fatal message).
 * Only part of the body is visible in this excerpt; the notes below
 * describe just the statements shown.
 */
3209 checkcomma(s,name,what)
/* With warnings enabled and s sitting on " (", scan on from w (its
 * starting position is set on a line not shown here) past whitespace. */
3216 if (dowarn && *s == ' ' && s[1] == '(') { /* XXX gotta be a better way */
3219 for (w++; *w && isSPACE(*w); w++) ;
/* Warn unless the next non-blank character is one of ';', '|' or '}'.
 * NOTE(review): w has already been dereferenced by the loop above, so
 * the !w test cannot protect anything at this point. */
3220 if (!w || !*w || !strchr(";|}", *w)) /* an advisory hack only... */
3221 warn("%s (...) interpreted as function",name);
/* Whitespace is skipped (never past bufend) before each later test. */
3223 while (s < bufend && isSPACE(*s))
3227 while (s < bufend && isSPACE(*s))
/* A character that can start an identifier begins a word ... */
3229 if (isIDFIRST(*s)) {
3233 while (s < bufend && isSPACE(*s))
/* ... which is looked up as a reserved word; w..s delimits the word. */
3238 kw = keyword(w, s - w);
/* Fatal error; the exact condition guarding it is not visible here. */
3242 croak("No comma allowed after %s", what);
/*
 * scan_word(s, dest, allow_package, slp) -- scans a word starting at s,
 * using dest as the output buffer.  The loop around the tests below and
 * the use of slp are not visible in this excerpt.
 */
3248 scan_word(s, dest, allow_package, slp)
/* d is the write cursor into dest. */
3254 register char *d = dest;
/* Only when allow_package is set: a single quote followed by an
 * identifier-start character is recognised inside the word
 * (presumably the old-style package separator -- TODO confirm). */
3258 else if (*s == '\'' && allow_package && isIDFIRST(s[1])) {
/* Likewise "::" followed by an identifier-start character. */
3263 else if (*s == ':' && s[1] == ':' && allow_package && isIDFIRST(s[2])) {
/*
 * scan_ident(s,send,dest,ck_uni) -- scans a variable name starting at s
 * (send is a limit pointer, dest the output buffer) and adjusts the
 * lexer's interpolation state.  Many lines of the body are missing from
 * this excerpt; comments cover only what is shown.
 */
3276 scan_ident(s,send,dest,ck_uni)
3278 register char *send;
/* Special handling when no brackets are currently open (body not shown). */
3285 if (lex_brackets == 0)
/* Package separators are accepted unconditionally here: a single quote
 * or "::" when followed by an identifier-start character. */
3297 else if (*s == '\'' && isIDFIRST(s[1])) {
3302 else if (*s == ':' && s[1] == ':' && isIDFIRST(s[2])) {
/* Outside LEX_NORMAL the lexer is told interpolation may be ending. */
3313 if (lex_state != LEX_NORMAL)
3314 lex_state = LEX_INTERPENDMAYBE;
/* Second half of a condition: '$' followed by a letter, '$' or '_'. */
3318 (*s == '$' && (isALPHA(s[1]) || s[1] == '$' || s[1] == '_')))
/* '^' followed by an upper-case letter or one of [ \ ] ^ _ ?
 * (presumably the control-character variable names -- TODO confirm). */
3329 if (*d == '^' && (isUPPER(*s) || strchr("[\\]^_?", *s))) {
/* The name collected so far starts with a letter or underscore. */
3335 if (isALPHA(*d) || *d == '_') {
/* A subscript opener directly follows the name. */
3340 if (*s == '[' || *s == '{') {
3342 croak("Can't use delimiter brackets within expression");
/* Remember that the bracket seen was only a name delimiter. */
3343 lex_fakebrack = TRUE;
/* In an interpolated string with no open brackets, the variable ends here. */
3351 if (lex_state == LEX_INTERPNORMAL && !lex_brackets)
3352 lex_state = LEX_INTERPEND;
3355 s = bracket; /* let the parser handle it */
/* Otherwise end interpolation unless intuit_more() says more follows. */
3359 else if (lex_state == LEX_INTERPNORMAL && !lex_brackets && !intuit_more(s))
3360 lex_state = LEX_INTERPEND;
/*
 * scan_prefix(pm,string,len) -- derives a literal string from the start
 * of a pattern (string, len) and records it on the pattern op pm as
 * op_pmshort.  The switch structure and several guards are missing from
 * this excerpt.
 */
3365 scan_prefix(pm,string,len)
3370 register SV *tmpstr;
/* Kept so the first pattern character can be tested after scanning. */
3374 char *origstring = string;
/* Searches the pattern for the one-character string at vert; what is
 * done on a hit is not visible (vert presumably holds "|"). */
3376 if (ninstr(string, string+len, vert, vert+1))
/* Working copy of the pattern, upgraded to the SVt_PVBM type. */
3380 tmpstr = NEWSV(86,len);
3381 sv_upgrade(tmpstr, SVt_PVBM);
3382 sv_setpvn(tmpstr,string,len);
3385 BmUSEFUL(tmpstr) = 100;
/* Walk the copy from t to e (both set on lines not shown). */
3386 for (d=t; d < e; ) {
/* Characters that get special treatment in this scan. */
3394 case '.': case '[': case '$': case '(': case ')': case '|': case '+':
/* Backslash followed by one of these letters/digits is handled
 * differently from a backslash followed by anything else. */
3399 if (d[1] && strchr("wWbB0123456789sSdDlLuUExc",d[1])) {
/* Slide the tail down one place, dropping the character at d. */
3403 Move(d+1,d,e-d,char);
/* Next character is '*', '?', or "{0" -- quantifiers that permit zero
 * occurrences of the current character. */
3428 if (d[1] == '*' || (d[1] == '{' && d[2] == '0') || d[1] == '?') {
/* Truncate the copy to the part scanned so far. */
3440 SvCUR_set(tmpstr, d - t);
/* NOTE(review): any guard on the PMf_ALL line is not visible here. */
3442 pm->op_pmflags |= PMf_ALL;
/* A pattern not starting with '^' also gets PMf_SCANFIRST. */
3443 if (*origstring != '^')
3444 pm->op_pmflags |= PMf_SCANFIRST;
3445 pm->op_pmshort = tmpstr;
3446 pm->op_pmslen = d - t;
/*
 * Match-pattern scanner (function header not visible in this excerpt;
 * presumably scan_pat).  Reads the delimited pattern, builds an OP_MATCH
 * pattern op and applies trailing modifier letters.
 */
/* Remember the line the construct starts on. */
3456 multi_start = curcop->cop_line;
/* scan_str() consumes the delimited text starting at start. */
3458 s = scan_str(start);
3463 croak("Search pattern not terminated");
3465 pm = (PMOP*)newPMOP(OP_MATCH, 0);
/* Condition guarding PMf_ONCE is not visible here. */
3467 pm->op_pmflags |= PMf_ONCE;
/* Consume any run of the modifier letters i, o and g.  The flags below
 * are presumably set for i, o and g respectively -- the case labels are
 * missing from this excerpt. */
3469 while (*s == 'i' || *s == 'o' || *s == 'g') {
3473 pm->op_pmflags |= PMf_FOLD;
3477 pm->op_pmflags |= PMf_KEEP;
3481 pm->op_pmflags |= PMf_GLOBAL;
/* Token value handed back through yylval. */
3486 yylval.ival = OP_MATCH;
/*
 * Substitution scanner (function header not visible in this excerpt;
 * presumably scan_subst).  Reads pattern and replacement, builds an
 * OP_SUBST pattern op and applies trailing modifier letters.
 */
3494 register char *s = start;
3498 multi_start = curcop->cop_line;
/* Default token value until the construct has been fully read. */
3499 yylval.ival = OP_NULL;
3507 croak("Substitution pattern not terminated");
/* True when the character just consumed equals the opening delimiter
 * (the action taken is not visible here). */
3510 if (s[-1] == *start)
3521 croak("Substitution replacement not terminated");
3524 pm = (PMOP*)newPMOP(OP_SUBST, 0);
/* Consume any run of the modifier letters g, i, e and o.  The flags
 * below are presumably set for g, i, o and e in turn -- the case labels
 * are missing from this excerpt. */
3525 while (*s == 'g' || *s == 'i' || *s == 'e' || *s == 'o') {
3532 pm->op_pmflags |= PMf_GLOBAL;
3537 pm->op_pmflags |= PMf_FOLD;
3541 pm->op_pmflags |= PMf_KEEP;
/* Evaluated replacement: wrap the replacement text lex_repl in a block,
 * optionally prefixed with "eval " (the guard is not visible). */
3547 pm->op_pmflags |= PMf_EVAL;
3548 repl = newSVpv("",0);
3550 sv_catpvn(repl, "eval ", 5);
3551 sv_catpvn(repl, "{ ", 2);
3552 sv_catsv(repl, lex_repl);
/* NOTE(review): the length argument is 2, so only " }" of the
 * three-character literal is appended; confirm the ';' is meant to be
 * left off. */
3553 sv_catpvn(repl, " };", 2);
3554 SvCOMPILED_on(repl);
/* Token value handed back through yylval. */
3560 yylval.ival = OP_SUBST;
/*
 * Chooses the literal string stored in pm->op_pmshort from the strings
 * held by the compiled regexp: regstart and regmust.  (Function header
 * not visible in this excerpt; presumably hoistmust.)
 */
/* Case 1: no short string yet, the regexp has a regstart string, and
 * either there is no regmust or the regexp is anchored. */
3568 if (!pm->op_pmshort && pm->op_pmregexp->regstart &&
3569 (!pm->op_pmregexp->regmust || pm->op_pmregexp->reganch & ROPT_ANCH)
/* Unanchored patterns get PMf_SCANFIRST. */
3571 if (!(pm->op_pmregexp->reganch & ROPT_ANCH))
3572 pm->op_pmflags |= PMf_SCANFIRST;
/* Anchored and case-folding: action not visible here. */
3573 else if (pm->op_pmflags & PMf_FOLD)
/* Use regstart as the short string. */
3575 pm->op_pmshort = sv_ref(pm->op_pmregexp->regstart);
/* Case 2: the regexp has a regmust string. */
3577 else if (pm->op_pmregexp->regmust) {/* is there a better short-circuit? */
/* Short string and regmust hold equal text: keep only one of them.
 * The else separating the two frees below is presumably on a missing
 * line -- TODO confirm. */
3578 if (pm->op_pmshort &&
3579 sv_eq(pm->op_pmshort,pm->op_pmregexp->regmust))
3581 if (pm->op_pmflags & PMf_SCANFIRST) {
3582 sv_free(pm->op_pmshort);
3583 pm->op_pmshort = Nullsv;
3586 sv_free(pm->op_pmregexp->regmust);
3587 pm->op_pmregexp->regmust = Nullsv;
/* Move regmust into op_pmshort when there is no short string, or when
 * scanning and the current short string is the shorter of the two. */
3591 if (!pm->op_pmshort || /* promote the better string */
3592 ((pm->op_pmflags & PMf_SCANFIRST) &&
3593 (SvCUR(pm->op_pmshort) < SvCUR(pm->op_pmregexp->regmust)) )){
3594 sv_free(pm->op_pmshort); /* ok if null */
3595 pm->op_pmshort = pm->op_pmregexp->regmust;
/* Ownership moved to op_pmshort, so clear the regexp's pointer. */
3596 pm->op_pmregexp->regmust = Nullsv;
3597 pm->op_pmflags |= PMf_SCANFIRST;
/*
 * Transliteration scanner (function header not visible in this excerpt;
 * presumably scan_trans).  Reads both halves of the construct, allocates
 * the translation table and builds an OP_TRANS op.
 */
3606 register char *s = start;
/* Default token value until the construct has been fully read. */
3613 yylval.ival = OP_NULL;
3620 croak("Translation pattern not terminated");
/* True when the character just consumed equals the opening delimiter
 * (the action taken is not visible here). */
3622 if (s[-1] == *start)
3633 croak("Translation replacement not terminated");
/* Table of 256 shorts, attached to the new op as its pointer payload. */
3636 New(803,tbl,256,short);
3637 op = newPVOP(OP_TRANS, 0, (char*)tbl);
/* Modifier letters c, d and s; the assignments below are presumably
 * made for c, d and s respectively (case labels are missing). */
3639 complement = delete = squash = 0;
3640 while (*s == 'c' || *s == 'd' || *s == 's') {
3642 complement = OPpTRANS_COMPLEMENT;
3644 delete = OPpTRANS_DELETE;
3646 squash = OPpTRANS_SQUASH;
/* The three option bits are combined into the op's private flags. */
3649 op->op_private = delete|squash|complement;
/* Token value handed back through yylval. */
3652 yylval.ival = OP_TRANS;
/*
 * Here-document scanner (function header not visible in this excerpt;
 * presumably scan_heredoc).  Collects the lines up to the terminator
 * word held in tokenbuf into tmpstr and restores the rest of the
 * introducing line (herewas) so lexing can continue after it.
 */
/* Default result type; may be changed to OP_BACKTICK below. */
3661 I32 op_type = OP_SCALAR;
/* The terminator word is written inside backquotes or quotes. */
3671 if (*s && strchr("`'\"",*s)) {
/* Copy up to the closing quote `term' into d; its length goes to len. */
3673 s = cpytill(d,s,bufend,term,&len);
3685 } /* assuming tokenbuf won't clobber */
/* Save the remainder of the current line in herewas: the whole rest of
 * the buffer when reading from a file or when no match for the single
 * character at d is found, otherwise only up to that match. */
3690 if (rsfp || !(d=ninstr(s,bufend,d,d+1)))
3691 herewas = newSVpv(s,bufend-s);
3693 s--, herewas = newSVpv(s,d-s);
3694 s += SvCUR(herewas);
/* Guard for the backtick type is not visible here. */
3698 op_type = OP_BACKTICK;
/* Bookkeeping used by error messages about runaway strings. */
3701 multi_start = curcop->cop_line;
3702 multi_open = multi_close = '<';
3703 tmpstr = NEWSV(87,80);
/* In-memory source: advance until s sits on the terminator, i.e. the
 * first character is term and len bytes match tokenbuf. */
3707 while (s < bufend &&
3708 (*s != term || bcmp(s,tokenbuf,len) != 0) ) {
/* Report the failure against the line where the here-doc began. */
3713 curcop->cop_line = multi_start;
3714 croak("EOF in string");
/* Body text is what lies between d and the terminator. */
3716 sv_setpvn(tmpstr,d+1,s-d);
/* Splice: saved line remainder + text after the terminator becomes the
 * new line buffer, and all buffer pointers are reset to its start. */
3718 sv_catpvn(herewas,s,bufend-s);
3719 sv_setsv(linestr,herewas);
3720 oldoldbufptr = oldbufptr = bufptr = s = SvPVX(linestr);
3721 bufend = SvPVX(linestr) + SvCUR(linestr);
3724 sv_setpvn(tmpstr,"",0); /* avoid "uninitialized" warning */
/* File source: keep reading lines with sv_gets() until the terminator. */
3725 while (s >= bufend) { /* multiple line string? */
3727 !(oldoldbufptr = oldbufptr = s = sv_gets(linestr, rsfp, 0))) {
3728 curcop->cop_line = multi_start;
3729 croak("EOF in string");
/* A copy of the line is stored in the file's line array at the current
 * line number (the guard for this is not visible here). */
3733 SV *sv = NEWSV(88,0);
3735 sv_upgrade(sv, SVt_PVMG);
3736 sv_setsv(sv,linestr);
3737 av_store(GvAV(curcop->cop_filegv),
3738 (I32)curcop->cop_line,sv);
3740 bufend = SvPVX(linestr) + SvCUR(linestr);
/* Terminator line reached: append the saved remainder of the
 * introducing line so the lexer resumes there. */
3741 if (*s == term && bcmp(s,tokenbuf,len) == 0) {
3744 sv_catsv(linestr,herewas);
3745 bufend = SvPVX(linestr) + SvCUR(linestr);
/* Otherwise the line is part of the body. */
3749 sv_catsv(tmpstr,linestr);
3752 multi_end = curcop->cop_line;
/* Give back surplus allocation when more than 5 bytes are unused. */
3754 if (SvCUR(tmpstr) + 5 < SvLEN(tmpstr)) {
3755 SvLEN_set(tmpstr, SvCUR(tmpstr) + 1);
3756 Renew(SvPVX(tmpstr), SvLEN(tmpstr), char);
/* Token value handed back through yylval. */
3760 yylval.ival = op_type;
/*
 * scan_inputsymbol(start) -- handles text written between '<' and '>'.
 * Depending on the contents it yields a glob (OP_GLOB) or builds an
 * OP_READLINE op tree in lex_op.  Several guards are missing from this
 * excerpt.
 */
3765 scan_inputsymbol(start)
3768 register char *s = start;
/* Copy everything after the '<' up to '>' into d; length goes to len. */
3773 s = cpytill(d, s+1, bufend, '>', &len);
3777 croak("Unterminated <> operator");
/* Advance d over word characters and single quotes. */
3780 while (*d && (isALNUM(*d) || *d == '\''))
/* Did not reach the end of the copied text, so it contains some other
 * character: treat the whole thing as a glob and rescan it as a string. */
3782 if (d - tokenbuf != len) {
3783 yylval.ival = OP_GLOB;
3785 s = scan_str(start);
3787 croak("Glob not terminated");
/* Substitutes the name ARGV (guard not visible; presumably for an
 * empty <> -- TODO confirm). */
3793 (void)strcpy(d,"ARGV");
/* Name looked up from d+1, skipping the first character (presumably a
 * leading '$' -- TODO confirm): read a line from the handle found by
 * dereferencing that scalar. */
3795 GV *gv = gv_fetchpv(d+1,TRUE);
3796 lex_op = (OP*)newUNOP(OP_READLINE, 0,
3797 newUNOP(OP_RV2GV, 0,
3798 newUNOP(OP_RV2SV, 0,
3799 newGVOP(OP_GV, 0, gv))));
3800 yylval.ival = OP_NULL;
/* Plain name: read a line directly from that glob. */
3805 GV *gv = gv_fetchpv(d,TRUE);
/* The name ARGV additionally gets the IOf_ARGV and IOf_START flags. */
3807 if (strEQ(d,"ARGV")) {
3809 io->flags |= IOf_ARGV|IOf_START;
3811 lex_op = (OP*)newUNOP(OP_READLINE, 0, newGVOP(OP_GV, 0, gv));
3812 yylval.ival = OP_NULL;
/*
 * Delimited-string scanner (function header not visible in this excerpt;
 * presumably scan_str).  Copies text from the line buffer into sv until
 * the closing delimiter, reading further lines when needed.
 */
3824 register char *s = start;
/* The first character is the delimiter. */
3825 register char term = *s;
3830 multi_start = curcop->cop_line;
/* Look the delimiter up among the opening brackets ( [ { <; the use
 * made of tmps is on a line not shown (presumably selecting the
 * matching closer -- TODO confirm). */
3832 if (term && (tmps = strchr("([{< )]}> )]}>",term)))
/* Result SV: plain string type, with the delimiter recorded on it. */
3837 sv_upgrade(sv, SVt_PV);
3838 SvSTORAGE(sv) = term;
3839 SvPOK_only(sv); /* validate pointer */
/* Make room for everything left in the buffer; `to' is the write cursor. */
3842 SvGROW(sv, SvCUR(sv) + (bufend - s) + 1);
3843 to = SvPVX(sv)+SvCUR(sv);
/* Same character opens and closes: no nesting to track. */
3844 if (multi_open == multi_close) {
3845 for (; s < bufend; s++,to++) {
/* Newline while not reading from a file (action not visible). */
3846 if (*s == '\n' && !rsfp)
/* Backslash with a following character, unless backslash itself is
 * the delimiter. */
3848 if (*s == '\\' && s+1 < bufend && term != '\\')
3850 else if (*s == term)
/* Distinct open/close characters: nesting depth is kept in brackets. */
3856 for (; s < bufend; s++,to++) {
3857 if (*s == '\n' && !rsfp)
3859 if (*s == '\\' && s+1 < bufend && term != '\\')
/* A closer that brings the depth to zero or below ends the string. */
3861 else if (*s == term && --brackets <= 0)
3863 else if (*s == multi_open)
/* Record how much has been copied so far. */
3869 SvCUR_set(sv, to - SvPVX(sv));
3871 if (s < bufend) break; /* string ends on this line? */
/* Need another line; on failure the line number is restored to where
 * the string began. */
3874 !(oldoldbufptr = oldbufptr = s = sv_gets(linestr, rsfp, 0))) {
3875 curcop->cop_line = multi_start;
/* A copy of the line is stored in the file's line array at the current
 * line number (the guard for this is not visible here). */
3880 SV *sv = NEWSV(88,0);
3882 sv_upgrade(sv, SVt_PVMG);
3883 sv_setsv(sv,linestr);
3884 av_store(GvAV(curcop->cop_filegv),
3885 (I32)curcop->cop_line, sv);
3887 bufend = SvPVX(linestr) + SvCUR(linestr);
3889 multi_end = curcop->cop_line;
/* Give back surplus allocation when more than 5 bytes are unused. */
3891 if (SvCUR(sv) + 5 < SvLEN(sv)) {
3892 SvLEN_set(sv, SvCUR(sv) + 1);
3893 Renew(SvPVX(sv), SvLEN(sv), char);
/*
 * Numeric-literal scanner (function header not visible in this excerpt;
 * presumably scan_num).  Converts the literal at start into an SV and
 * returns it as an OP_CONST op in yylval.opval.
 */
3906 register char *s = start;
/* Reached only for a first character no case handles. */
3916 croak("panic: scan_num");
3926 else if (s[1] == '.')
3940 yyerror("Illegal octal digit");
3942 case '0': case '1': case '2': case '3': case '4':
3943 case '5': case '6': case '7':
3947 case 'a': case 'b': case 'c': case 'd': case 'e': case 'f':
3948 case 'A': case 'B': case 'C': case 'D': case 'E': case 'F':
/* The low three bits of a..f / A..F are 1..6, so this adds 10..15. */
3952 i += (*s++ & 7) + 9;
/* Store as an integer when the value survives conversion to a
 * non-negative I32, otherwise as a double. */
3959 if (tryi32 == i && tryi32 >= 0)
3960 sv_setiv(sv,tryi32);
3962 sv_setnv(sv,(double)i);
/* Decimal literals, including ones that begin with '.'. */
3965 case '1': case '2': case '3': case '4': case '5':
3966 case '6': case '7': case '8': case '9': case '.':
/* Integer part: digits with optional '_' separators. */
3970 while (isDIGIT(*s) || *s == '_') {
/* With warnings on, complain when the distance from the last
 * underscore (lastub) is not exactly 3 characters. */
3972 if (dowarn && lastub && s - lastub != 3)
3973 warn("Misplaced _");
3979 if (dowarn && lastub && s - lastub != 3)
3980 warn("Misplaced _");
/* A '.' counts as a decimal point only when not followed by a second
 * '.' (presumably so a following ".." operator is left alone). */
3981 if (*s == '.' && s[1] != '.') {
3984 while (isDIGIT(*s) || *s == '_') {
/* Exponent: 'e' or 'E' followed by a sign or a digit. */
3991 if (*s && strchr("eE",*s) && strchr("+-0123456789",s[1])) {
3994 *d++ = 'e'; /* At least some Mach atof()s don't grok 'E' */
3995 if (*s == '+' || *s == '-')
/* Convert the cleaned-up text in tokenbuf. */
4002 value = atof(tokenbuf);
4003 tryi32 = (I32)value;
/* Integer result only when no float syntax was seen (floatit) and the
 * value round-trips through I32 unchanged. */
4004 if (!floatit && (double)tryi32 == value)
4005 sv_setiv(sv,tryi32);
4011 yylval.opval = newSVOP(OP_CONST, 0, sv);
/*
 * Format-line scanner (function header not visible in this excerpt;
 * presumably scan_formline).  Accumulates lines of a format body in
 * `stuff' and queues tokens for the parser through nextval[].
 */
/* Accumulator for the collected text. */
4022 SV *stuff = newSV(0);
4023 bool needargs = FALSE;
/* t skips blanks and tabs after the first character of the line. */
4028 for (t = s+1; *t == ' ' || *t == '\t'; t++) ;
/* Inside an eval with no input file the line end is found by searching
 * for '\n'; otherwise it is the end of the line buffer. */
4032 if (in_eval && !rsfp) {
4033 eol = strchr(s,'\n');
4038 eol = bufend = SvPVX(linestr) + SvCUR(linestr);
/* Append the current line to the accumulated text. */
4040 sv_catpvn(stuff, s, eol-s);
/* '@' or '^' is tested for here (action not visible; presumably sets
 * needargs -- TODO confirm). */
4042 if (*s == '@' || *s == '^') {
/* Fetch the next line and reset the buffer pointers to its start. */
4051 s = sv_gets(linestr, rsfp, 0);
4052 oldoldbufptr = oldbufptr = bufptr = SvPVX(linestr);
4055 yyerror("Format not terminated");
/* Queue token values for the parser. */
4064 nextval[nexttoke].ival = 0;
/* The accumulated text is wrapped in a constant op. */
4069 nextval[nexttoke].opval = (OP*)newSVOP(OP_CONST, 0, stuff);
4071 nextval[nexttoke].ival = OP_FORMLINE;
/* Cache the length of cshname in cshlen.  (The enclosing function is
 * not visible in this excerpt; presumably set_csh.) */
4087 cshlen = strlen(cshname);
/*
 * Error reporter (function header and end not visible in this excerpt;
 * presumably yyerror).  Builds a description of where the error was
 * noticed (tname), formats the full message into buf, and croaks once
 * ten errors have accumulated.
 * NOTE(review): every sprintf/strcpy below writes into fixed buffers
 * whose sizes are not visible here; confirm they cannot overflow.
 */
/* tname normally points into tmpbuf; one branch repoints it to a literal. */
4097 char *tname = tmpbuf;
/* Best case: quote the text from two tokens back up to the current
 * position, provided the three pointers are distinct and the span is
 * under 200 bytes. */
4099 if (bufptr > oldoldbufptr && bufptr - oldoldbufptr < 200 &&
4100 oldoldbufptr != oldbufptr && oldbufptr != bufptr) {
/* Leading whitespace is skipped before copying. */
4101 while (isSPACE(*oldoldbufptr))
4103 cpy7bit(tmp2buf, oldoldbufptr, bufptr - oldoldbufptr);
4104 sprintf(tname,"near \"%s\"",tmp2buf);
/* Next best: quote from the previous token only. */
4106 else if (bufptr > oldbufptr && bufptr - oldbufptr < 200 &&
4107 oldbufptr != bufptr) {
4108 while (isSPACE(*oldbufptr))
4110 cpy7bit(tmp2buf, oldbufptr, bufptr - oldbufptr);
4111 sprintf(tname,"near \"%s\"",tmp2buf);
/* No usable text: describe the lookahead token yychar instead. */
4113 else if (yychar > 255)
4114 tname = "next token ???";
4115 else if (!yychar || (yychar == ';' && !rsfp))
4116 (void)strcpy(tname,"at EOF");
/* Low seven bits all set: wording depends on the lexer state. */
4117 else if ((yychar & 127) == 127) {
4118 if (lex_state == LEX_NORMAL ||
4119 (lex_state == LEX_KNOWNEXT && lex_defer == LEX_NORMAL))
4120 (void)strcpy(tname,"at end of line");
4122 (void)strcpy(tname,"at end of string");
/* Values below 32 are shown in ^X notation. */
4124 else if (yychar < 32)
4125 (void)sprintf(tname,"next char ^%c",yychar+64);
4127 (void)sprintf(tname,"next char %c",yychar);
/* Full message: text, file name, line number, then the location note. */
4128 (void)sprintf(buf, "%s at %s line %d, %s\n",
4129 s,SvPVX(GvSV(curcop->cop_filegv)),curcop->cop_line,tname);
/* If the error is on the line where a multi-line string ended, add a
 * hint naming its delimiters and starting line. */
4130 if (curcop->cop_line == multi_end && multi_start < multi_end)
4131 sprintf(buf+strlen(buf),
4132 " (Might be a runaway multi-line %c%c string starting on line %d)\n",
4133 multi_open,multi_close,multi_start);
/* Append the message to the scalar named "@" (guard not visible here). */
4135 sv_catpv(GvSV(gv_fetchpv("@",TRUE)),buf);
/* Give up after the tenth error. */
4138 if (++error_count >= 10)
4139 croak("%s has too many errors.\n",
4140 SvPVX(GvSV(curcop->cop_filegv)));