3 * Copyright (c) 1991-1997, Larry Wall
5 * You may distribute under the terms of either the GNU General Public
6 * License or the Artistic License, as specified in the README file.
11 * "It all comes from here, the stench and the peril." --Frodo
17 static void check_uni _((void));
18 static void force_next _((I32 type));
19 static char *force_version _((char *start));
20 static char *force_word _((char *start, int token, int check_keyword, int allow_pack, int allow_tick));
21 static SV *q _((SV *sv));
22 static char *scan_const _((char *start));
23 static char *scan_formline _((char *s));
24 static char *scan_heredoc _((char *s));
25 static char *scan_ident _((char *s, char *send, char *dest, STRLEN destlen,
27 static char *scan_inputsymbol _((char *start));
28 static char *scan_pat _((char *start));
29 static char *scan_str _((char *start));
30 static char *scan_subst _((char *start));
31 static char *scan_trans _((char *start));
32 static char *scan_word _((char *s, char *dest, STRLEN destlen,
33 int allow_package, STRLEN *slp));
34 static char *skipspace _((char *s));
35 static void checkcomma _((char *s, char *name, char *what));
36 static void force_ident _((char *s, int kind));
37 static void incline _((char *s));
38 static int intuit_method _((char *s, GV *gv));
39 static int intuit_more _((char *s));
40 static I32 lop _((I32 f, expectation x, char *s));
41 static void missingterm _((char *s));
42 static void no_op _((char *what, char *s));
43 static void set_csh _((void));
44 static I32 sublex_done _((void));
45 static I32 sublex_push _((void));
46 static I32 sublex_start _((void));
48 static int uni _((I32 f, char *s));
50 static char * filter_gets _((SV *sv, PerlIO *fp, STRLEN append));
51 static void restore_rsfp _((void *f));
53 static char ident_too_long[] = "Identifier too long";
55 static char *linestart; /* beg. of most recently read line */
57 static char pending_ident; /* pending identifier lookup */
60 I32 super_state; /* lexer state to save */
61 I32 sub_inwhat; /* "lex_inwhat" to use */
62 OP *sub_op; /* "lex_op" to use */
65 /* The following are arranged oddly so that the guard on the switch statement
66 * can get by with a single comparison (if the compiler is smart enough).
69 /* #define LEX_NOTPARSING 11 is done in perl.h. */
/* Values taken by lex_state, which yylex() switches on.  The notes describe
 * only what the code in this file shows for each state. */
72 #define LEX_INTERPNORMAL 9 /* shares its yylex() case with LEX_NORMAL; entered from LEX_INTERPSTART */
73 #define LEX_INTERPCASEMOD 8 /* bufptr is at a backslash case-modifier escape, or at bufend */
74 #define LEX_INTERPPUSH 7 /* yylex() returns sublex_push() */
75 #define LEX_INTERPSTART 6 /* sublex_done() at bufend, otherwise on to LEX_INTERPNORMAL */
76 #define LEX_INTERPEND 5 /* set in LEX_INTERPNORMAL when lex_brackets is 0 and no '[', '{' or "->" follows */
77 #define LEX_INTERPENDMAYBE 4 /* intuit_more(bufptr) decides whether the expression continues */
78 #define LEX_INTERPCONCAT 3 /* sublex_done() at bufend, otherwise text is scanned by scan_const() */
79 #define LEX_INTERPCONST 2
80 #define LEX_FORMLINE 1 /* set when lex_formbrack is on and lex_brackets <= lex_formbrack */
81 #define LEX_KNOWNEXT 0 /* a token is queued in nexttype[]/nextval[]; yylex() returns it */
90 /* XXX If this causes problems, set i_unistd=undef in the hint file. */
92 # include <unistd.h> /* Needed for execv() */
100 #include "keywords.h"
/* CLINE lowers copline to curcop->cop_line when the latter is smaller, and
 * yields the resulting copline. */
105 #define CLINE (copline = (curcop->cop_line < copline ? curcop->cop_line : copline))
/* Token-return helpers.  Each one expands to a return statement, so using it
 * ends the enclosing function.  All of them store s into bufptr and return a
 * token type cast to int.  Apart from TOKEN they also set expect for the
 * token that follows.  The ones taking f store it in yylval.ival first.
 * Those written as "return ao((...))" pass the token type through ao()
 * before returning it.  TERM additionally evaluates CLINE. */
107 #define TOKEN(retval) return (bufptr = s,(int)retval)
108 #define OPERATOR(retval) return (expect = XTERM,bufptr = s,(int)retval)
109 #define AOPERATOR(retval) return ao((expect = XTERM,bufptr = s,(int)retval))
110 #define PREBLOCK(retval) return (expect = XBLOCK,bufptr = s,(int)retval)
111 #define PRETERMBLOCK(retval) return (expect = XTERMBLOCK,bufptr = s,(int)retval)
112 #define PREREF(retval) return (expect = XREF,bufptr = s,(int)retval)
113 #define TERM(retval) return (CLINE, expect = XOPERATOR,bufptr = s,(int)retval)
114 #define LOOPX(f) return(yylval.ival=f,expect = XTERM,bufptr = s,(int)LOOPEX)
115 #define FTST(f) return(yylval.ival=f,expect = XTERM,bufptr = s,(int)UNIOP)
116 #define FUN0(f) return(yylval.ival = f,expect = XOPERATOR,bufptr = s,(int)FUNC0)
117 #define FUN1(f) return(yylval.ival = f,expect = XOPERATOR,bufptr = s,(int)FUNC1)
118 #define BOop(f) return ao((yylval.ival=f,expect = XTERM,bufptr = s,(int)BITOROP))
119 #define BAop(f) return ao((yylval.ival=f,expect = XTERM,bufptr = s,(int)BITANDOP))
120 #define SHop(f) return ao((yylval.ival=f,expect = XTERM,bufptr = s,(int)SHIFTOP))
121 #define PWop(f) return ao((yylval.ival=f,expect = XTERM,bufptr = s,(int)POWOP))
122 #define PMop(f) return(yylval.ival=f,expect = XTERM,bufptr = s,(int)MATCHOP)
123 #define Aop(f) return ao((yylval.ival=f,expect = XTERM,bufptr = s,(int)ADDOP))
124 #define Mop(f) return ao((yylval.ival=f,expect = XTERM,bufptr = s,(int)MULOP))
125 #define Eop(f) return(yylval.ival=f,expect = XTERM,bufptr = s,(int)EQOP)
126 #define Rop(f) return(yylval.ival=f,expect = XTERM,bufptr = s,(int)RELOP)
128 /* This bit of chicanery makes a unary function followed by
129 * a parenthesis into a function with one argument, highest precedence.
131 #define UNI(f) return(yylval.ival = f, \
134 last_uni = oldbufptr, \
136 (*s == '(' || (s = skipspace(s), *s == '(') ? (int)FUNC1 : (int)UNIOP) )
138 #define UNIBRACK(f) return(yylval.ival = f, \
140 last_uni = oldbufptr, \
141 (*s == '(' || (s = skipspace(s), *s == '(') ? (int)FUNC1 : (int)UNIOP) )
143 /* grandfather return to old style */
144 #define OLDLOP(f) return(yylval.ival=f,expect = XTERM,bufptr = s,(int)LSTOP)
149 if (*bufptr == '=') {
151 if (toketype == ANDAND)
152 yylval.ival = OP_ANDASSIGN;
153 else if (toketype == OROR)
154 yylval.ival = OP_ORASSIGN;
/* Report that `what` turned up where an operator was expected, then add a
 * hint chosen from the state of the input buffer.
 *   what - description of the offending token, used in the yywarn() message
 *   s    - end of the text (starting at bufptr) quoted in the
 *          "Missing operator before" hint
 */
161 no_op(char *what, char *s)
163 char *oldbp = bufptr;
164 bool is_first = (oldbufptr == linestart); /* oldbufptr sits at the start of the line */
167 yywarn(form("%s found where operator expected", what));
169 warn("\t(Missing semicolon on previous line?)\n");
170 else if (oldoldbufptr && isIDFIRST(*oldoldbufptr)) {
/* walk over the identifier (word characters and ':') that begins at oldoldbufptr */
172 for (t = oldoldbufptr; *t && (isALNUM(*t) || *t == ':'); t++) ;
173 if (t < bufptr && isSPACE(*t))
/* NOTE(review): "%.*s" takes an int precision, but t - oldoldbufptr is a
 * pointer difference; a cast to int looks needed here -- confirm. */
174 warn("\t(Do you need to predeclare %.*s?)\n",
175 t - oldoldbufptr, oldoldbufptr);
/* NOTE(review): same precision-type concern for s - oldbp below. */
179 warn("\t(Missing operator before %.*s?)\n", s - oldbp, oldbp);
189 char *nl = strrchr(s,'\n');
193 else if (multi_close < 32 || multi_close == 127) {
195 tmpbuf[1] = toCTRL(multi_close);
201 *tmpbuf = multi_close;
205 q = strchr(s,'"') ? '\'' : '"';
206 croak("Can't find string terminator %c%s%c anywhere before EOF",q,s,q);
213 warn("Use of %s is deprecated", s);
219 deprecate("comma-less variable list");
230 SAVEI32(lex_brackets);
231 SAVEI32(lex_fakebrack);
232 SAVEI32(lex_casemods);
237 SAVEI16(curcop->cop_line);
241 SAVEPPTR(oldoldbufptr);
244 SAVEPPTR(lex_brackstack);
245 SAVEPPTR(lex_casestack);
246 SAVEDESTRUCTOR(restore_rsfp, rsfp);
248 lex_state = LEX_NORMAL;
253 New(899, lex_brackstack, 120, char);
254 New(899, lex_casestack, 12, char);
255 SAVEFREEPV(lex_brackstack);
256 SAVEFREEPV(lex_casestack);
258 *lex_casestack = '\0';
262 SvREFCNT_dec(lex_stuff);
265 SvREFCNT_dec(lex_repl);
270 if (SvREADONLY(linestr))
271 linestr = sv_2mortal(newSVsv(linestr));
272 s = SvPV(linestr, len);
273 if (len && s[len-1] != ';') {
274 if (!(SvFLAGS(linestr) & SVs_TEMP))
275 linestr = sv_2mortal(newSVsv(linestr));
276 sv_catpvn(linestr, "\n;", 2);
279 oldoldbufptr = oldbufptr = bufptr = linestart = SvPVX(linestr);
280 bufend = bufptr + SvCUR(linestr);
282 rs = newSVpv("\n", 1);
/* Cleanup callback; this file registers it with
 * SAVEDESTRUCTOR(restore_rsfp, rsfp).
 *   f - opaque pointer, treated here as the PerlIO handle that was saved
 */
293 restore_rsfp(void *f)
295 PerlIO *fp = (PerlIO*)f;
/* when the current handle is stdin, only its error state is cleared */
297 if (rsfp == PerlIO_stdin())
298 PerlIO_clearerr(rsfp);
/* otherwise act only if a handle is open and it differs from the saved one */
299 else if (rsfp && (rsfp != fp))
316 while (*s == ' ' || *s == '\t') s++;
317 if (strnEQ(s, "line ", 5)) {
326 while (*s == ' ' || *s == '\t')
328 if (*s == '"' && (t = strchr(s+1, '"')))
332 return; /* false alarm */
333 for (t = s; !isSPACE(*t); t++) ;
338 curcop->cop_filegv = gv_fetchfile(s);
340 curcop->cop_filegv = gv_fetchfile(origfilename);
342 curcop->cop_line = atoi(n)-1;
/* Advance s past whitespace and '#' comments in the current buffer, pulling
 * in further input through filter_gets() when the buffer is used up.
 *   s - current scan position inside linestr's buffer
 * Declared earlier in this file as returning char *.
 */
346 skipspace(register char *s)
/* in format context (lex_formbrack set, brackets no deeper than it) only
 * blanks and tabs are skipped */
349 if (lex_formbrack && lex_brackets <= lex_formbrack) {
350 while (s < bufend && (*s == ' ' || *s == '\t'))
356 while (s < bufend && isSPACE(*s))
/* a '#' comment runs up to the newline */
358 if (s < bufend && *s == '#') {
359 while (s < bufend && *s != '\n')
/* NOTE(review): presumably returns here; the refill below looks reachable only
 * when s reached bufend, rsfp is set and lex_state is LEX_NORMAL -- confirm. */
364 if (s < bufend || !rsfp || lex_state != LEX_NORMAL)
/* read more input, passing the current length of linestr as the append offset */
366 if ((s = filter_gets(linestr, rsfp, (prevlen = SvCUR(linestr)))) == Nullch) {
/* no more input: under -n/-p supply closing text for the generated loop */
367 if (minus_n || minus_p) {
368 sv_setpv(linestr,minus_p ?
369 ";}continue{print or die qq(-p destination: $!\\n)" :
371 sv_catpv(linestr,";}");
372 minus_n = minus_p = 0;
375 sv_setpv(linestr,";");
/* point every buffer cursor at the replacement text */
376 oldoldbufptr = oldbufptr = bufptr = s = linestart = SvPVX(linestr);
377 bufend = SvPVX(linestr) + SvCUR(linestr);
/* dispose of the source handle: pclose, clear stdin's error state, or close */
378 if (preprocess && !in_eval)
379 (void)my_pclose(rsfp);
380 else if ((PerlIO*)rsfp == PerlIO_stdin())
381 PerlIO_clearerr(rsfp);
383 (void)PerlIO_close(rsfp);
/* the newly read text begins prevlen bytes into the buffer */
389 linestart = bufptr = s + prevlen;
390 bufend = s + SvCUR(linestr);
/* with PERLDB_LINE on and outside debstash, store a copy of the new text in
 * the array of curcop->cop_filegv at index cop_line */
393 if (PERLDB_LINE && curstash != debstash) {
394 SV *sv = NEWSV(85,0);
396 sv_upgrade(sv, SVt_PVMG);
397 sv_setpvn(sv,bufptr,bufend-bufptr);
398 av_store(GvAV(curcop->cop_filegv),(I32)curcop->cop_line,sv);
409 if (oldoldbufptr != last_uni)
411 while (isSPACE(*last_uni))
413 for (s = last_uni; isALNUM(*s) || *s == '-'; s++) ;
414 if ((t = strchr(s, '(')) && t < bufptr)
418 warn("Warning: Use of \"%s\" without parens is ambiguous", last_uni);
425 #define UNI(f) return uni(f,s)
433 last_uni = oldbufptr;
444 #endif /* CRIPPLED_CC */
446 #define LOP(f,x) return lop(f,x,s)
451 (I32 f, expectation x, char *s)
457 #endif /* CAN_PROTOTYPE */
464 last_lop = oldbufptr;
480 nexttype[nexttoke] = type;
482 if (lex_state != LEX_KNOWNEXT) {
483 lex_defer = lex_state;
485 lex_state = LEX_KNOWNEXT;
490 force_word(register char *start, int token, int check_keyword, int allow_pack, int allow_tick)
495 start = skipspace(start);
498 (allow_pack && *s == ':') ||
499 (allow_tick && *s == '\'') )
501 s = scan_word(s, tokenbuf, sizeof tokenbuf, allow_pack, &len);
502 if (check_keyword && keyword(tokenbuf, len))
504 if (token == METHOD) {
514 nextval[nexttoke].opval = (OP*)newSVOP(OP_CONST,0, newSVpv(tokenbuf,0));
515 nextval[nexttoke].opval->op_private |= OPpCONST_BARE;
522 force_ident(register char *s, int kind)
525 OP* o = (OP*)newSVOP(OP_CONST, 0, newSVpv(s,0));
526 nextval[nexttoke].opval = o;
529 dTHR; /* just for in_eval */
530 o->op_private = OPpCONST_ENTERED;
531 /* XXX see note in pp_entereval() for why we forgo typo
532 warnings if the symbol must be introduced in an eval.
534 gv_fetchpv(s, in_eval ? GV_ADDMULTI : TRUE,
535 kind == '$' ? SVt_PV :
536 kind == '@' ? SVt_PVAV :
537 kind == '%' ? SVt_PVHV :
545 force_version(char *s)
547 OP *version = Nullop;
551 /* default VERSION number -- GBARR */
556 for( d=s, c = 1; isDIGIT(*d) || *d == '_' || (*d == '.' && c--); d++);
557 if((*d == ';' || isSPACE(*d)) && *(skipspace(d)) != ',') {
559 /* real VERSION number -- GBARR */
560 version = yylval.opval;
564 /* NOTE: The parser sees the package name and the VERSION swapped */
565 nextval[nexttoke].opval = version;
582 s = SvPV_force(sv, len);
586 while (s < send && *s != '\\')
593 if (s + 1 < send && (s[1] == '\\'))
594 s++; /* all that, just for this */
599 SvCUR_set(sv, d - SvPVX(sv));
607 register I32 op_type = yylval.ival;
609 if (op_type == OP_NULL) {
610 yylval.opval = lex_op;
614 if (op_type == OP_CONST || op_type == OP_READLINE) {
615 SV *sv = q(lex_stuff);
617 char *p = SvPV(sv, len);
618 yylval.opval = (OP*)newSVOP(op_type, 0, newSVpv(p, len));
624 sublex_info.super_state = lex_state;
625 sublex_info.sub_inwhat = op_type;
626 sublex_info.sub_op = lex_op;
627 lex_state = LEX_INTERPPUSH;
631 yylval.opval = lex_op;
645 lex_state = sublex_info.super_state;
647 SAVEI32(lex_brackets);
648 SAVEI32(lex_fakebrack);
649 SAVEI32(lex_casemods);
654 SAVEI16(curcop->cop_line);
657 SAVEPPTR(oldoldbufptr);
660 SAVEPPTR(lex_brackstack);
661 SAVEPPTR(lex_casestack);
666 bufend = bufptr = oldbufptr = oldoldbufptr = linestart = SvPVX(linestr);
667 bufend += SvCUR(linestr);
673 New(899, lex_brackstack, 120, char);
674 New(899, lex_casestack, 12, char);
675 SAVEFREEPV(lex_brackstack);
676 SAVEFREEPV(lex_casestack);
678 *lex_casestack = '\0';
680 lex_state = LEX_INTERPCONCAT;
681 curcop->cop_line = multi_start;
683 lex_inwhat = sublex_info.sub_inwhat;
684 if (lex_inwhat == OP_MATCH || lex_inwhat == OP_SUBST)
685 lex_inpat = sublex_info.sub_op;
697 yylval.opval = (OP*)newSVOP(OP_CONST, 0, newSVpv("",0));
701 if (lex_casemods) { /* oops, we've got some unbalanced parens */
702 lex_state = LEX_INTERPCASEMOD;
706 /* Is there a right-hand side to take care of? */
707 if (lex_repl && (lex_inwhat == OP_SUBST || lex_inwhat == OP_TRANS)) {
710 bufend = bufptr = oldbufptr = oldoldbufptr = linestart = SvPVX(linestr);
711 bufend += SvCUR(linestr);
717 *lex_casestack = '\0';
719 if (SvCOMPILED(lex_repl)) {
720 lex_state = LEX_INTERPNORMAL;
724 lex_state = LEX_INTERPCONCAT;
730 bufend = SvPVX(linestr);
731 bufend += SvCUR(linestr);
738 scan_const(char *start)
740 register char *send = bufend;
741 SV *sv = NEWSV(93, send - start);
742 register char *s = start;
743 register char *d = SvPVX(sv);
744 bool dorange = FALSE;
748 ? "\\.^$@AGZdDwWsSbB+*?|()-nrtfeaxc0123456789[{]} \t\n\r\f\v#"
749 : (lex_inwhat & OP_TRANS)
753 while (s < send || dorange) {
754 if (lex_inwhat == OP_TRANS) {
759 SvGROW(sv, SvLEN(sv) + 256);
763 for (i = (U8)*d; i <= max; i++)
768 else if (*s == '-' && s+1 < send && s != start) {
773 else if (*s == '(' && lex_inpat && s[1] == '?' && s[2] == '#') {
774 while (s < send && *s != ')')
777 else if (*s == '#' && lex_inpat &&
778 ((PMOP*)lex_inpat)->op_pmflags & PMf_EXTENDED) {
779 while (s+1 < send && *s != '\n')
782 else if (*s == '@' && s[1] && (isALNUM(s[1]) || strchr(":'{$", s[1])))
784 else if (*s == '$') {
785 if (!lex_inpat) /* not a regexp, so $ must be var */
787 if (s + 1 < send && !strchr(")| \n\t", s[1]))
788 break; /* in regexp, $ might be tail anchor */
790 if (*s == '\\' && s+1 < send) {
792 if (*s && strchr(leaveit, *s)) {
797 if (lex_inwhat == OP_SUBST && !lex_inpat &&
798 isDIGIT(*s) && *s != '0' && !isDIGIT(s[1]))
801 warn("\\%c better written as $%c", *s, *s);
805 if (lex_inwhat != OP_TRANS && *s && strchr("lLuUEQ", *s)) {
811 if (lex_inwhat == OP_TRANS) {
819 case '0': case '1': case '2': case '3':
820 case '4': case '5': case '6': case '7':
821 *d++ = scan_oct(s, 3, &len);
825 *d++ = scan_hex(++s, 2, &len);
861 SvCUR_set(sv, d - SvPVX(sv));
864 if (SvCUR(sv) + 5 < SvLEN(sv)) {
865 SvLEN_set(sv, SvCUR(sv) + 1);
866 Renew(SvPVX(sv), SvLEN(sv), char);
869 yylval.opval = (OP*)newSVOP(OP_CONST, 0, sv);
875 /* This is the one truly awful dwimmer necessary to conflate C and sed. */
877 intuit_more(register char *s)
881 if (*s == '-' && s[1] == '>' && (s[2] == '[' || s[2] == '{'))
883 if (*s != '{' && *s != '[')
888 /* In a pattern, so maybe we have {n,m}. */
905 /* On the other hand, maybe we have a character class */
908 if (*s == ']' || *s == '^')
911 int weight = 2; /* let's weigh the evidence */
913 unsigned char un_char = 0, last_un_char;
914 char *send = strchr(s,']');
915 char tmpbuf[sizeof tokenbuf * 4];
917 if (!send) /* has to be an expression */
923 else if (isDIGIT(*s)) {
925 if (isDIGIT(s[1]) && s[2] == ']')
931 for (; s < send; s++) {
932 last_un_char = un_char;
933 un_char = (unsigned char)*s;
938 weight -= seen[un_char] * 10;
940 scan_ident(s, send, tmpbuf, sizeof tmpbuf, FALSE);
941 if ((int)strlen(tmpbuf) > 1 && gv_fetchpv(tmpbuf,FALSE, SVt_PV))
946 else if (*s == '$' && s[1] &&
947 strchr("[#!%*<>()-=",s[1])) {
948 if (/*{*/ strchr("])} =",s[2]))
957 if (strchr("wds]",s[1]))
959 else if (seen['\''] || seen['"'])
961 else if (strchr("rnftbxcav",s[1]))
963 else if (isDIGIT(s[1])) {
965 while (s[1] && isDIGIT(s[1]))
975 if (strchr("aA01! ",last_un_char))
977 if (strchr("zZ79~",s[1]))
981 if (!isALNUM(last_un_char) && !strchr("$@&",last_un_char) &&
982 isALPHA(*s) && s[1] && isALPHA(s[1])) {
987 if (keyword(tmpbuf, d - tmpbuf))
990 if (un_char == last_un_char + 1)
992 weight -= seen[un_char];
997 if (weight >= 0) /* probably a character class */
/* Guess whether the word scanned from `start` should be treated as a method.
 *   start - text to examine; a leading '$' is stepped over before scan_word()
 *   gv    - glob supplied by the caller; a non-NULL value counts as evidence
 *           in the '$' branch and is tested again in the bareword branch
 * Returns 0 when no assumption is made (at least when "=>" follows the word),
 * otherwise FUNCMETH if '(' follows and METHOD if it does not.
 */
1005 intuit_method(char *start, GV *gv)
1007 char *s = start + (*start == '$');
1008 char tmpbuf[sizeof tokenbuf];
1018 s = scan_word(s, tmpbuf, sizeof tmpbuf, TRUE, &len);
1019 if (*start == '$') {
1020 if (gv || last_lop_op == OP_PRINT || isUPPER(*tokenbuf))
1025 return *s == '(' ? FUNCMETH : METHOD;
1027 if (!keyword(tmpbuf, len)) {
/* look the word up as a subroutine name without creating the glob */
1028 indirgv = gv_fetchpv(tmpbuf,FALSE, SVt_PVCV);
1029 if (indirgv && GvCVu(indirgv))
1031 /* filehandle or package name makes it a method */
1032 if (!gv || GvIO(indirgv) || gv_stashpvn(tmpbuf, len, FALSE)) {
1034 if ((bufend - s) >= 2 && *s == '=' && *(s+1) == '>')
1035 return 0; /* no assumptions -- "=>" quotes bareword */
/* queue the word as an OP_CONST for the next token */
1036 nextval[nexttoke].opval =
1037 (OP*)newSVOP(OP_CONST, 0,
1039 nextval[nexttoke].opval->op_private =
1044 return *s == '(' ? FUNCMETH : METHOD;
1054 char *pdb = getenv("PERL5DB");
1058 return "BEGIN { require 'perl5db.pl' }";
1064 /* Encoded script support. filter_add() effectively inserts a
1065 * 'pre-processing' function into the current source input stream.
1066 * Note that the filter function only applies to the current source file
1067 * (e.g., it will not affect files 'require'd or 'use'd by this one).
1069 * The datasv parameter (which may be NULL) can be used to pass
1070 * private data to this instance of the filter. The filter function
1071 * can recover the SV using the FILTER_DATA macro and use it to
1072 * store private buffers and state information.
1074 * The supplied datasv parameter is upgraded to a PVIO type
1075 * and the IoDIRP field is used to store the function pointer.
1076 * Note that IoTOP_NAME, IoFMT_NAME, IoBOTTOM_NAME, if set for
1077 * private use must be set using malloc'd pointers.
1079 static int filter_debug = 0;
1082 filter_add(filter_t funcp, SV *datasv)
1084 if (!funcp){ /* temporary handy debugging hack to be deleted */
1085 filter_debug = atoi((char*)datasv);
1089 rsfp_filters = newAV();
1092 if (!SvUPGRADE(datasv, SVt_PVIO))
1093 die("Can't upgrade filter_add data to SVt_PVIO");
1094 IoDIRP(datasv) = (DIR*)funcp; /* stash funcp into spare field */
1096 warn("filter_add func %p (%s)", funcp, SvPV(datasv,na));
1097 av_unshift(rsfp_filters, 1);
1098 av_store(rsfp_filters, 0, datasv) ;
1103 /* Delete most recently added instance of this filter function. */
/*   funcp - filter function to remove; it is compared with the function
 *           pointer kept in the IoDIRP field of FILTER_DATA(0)
 * Only the entry at position 0 can be removed; any other case ends in die().
 */
1105 filter_del(filter_t funcp)
1108 warn("filter_del func %p", funcp);
/* nothing to delete when no filter array exists or it is empty */
1109 if (!rsfp_filters || AvFILL(rsfp_filters)<0)
1111 /* if filter is on top of stack (usual case) just pop it off */
1112 if (IoDIRP(FILTER_DATA(0)) == (void*)funcp){
/* filter_add() stores new entries at index 0, so the entry is removed with
 * av_shift rather than av_pop */
1113 /* sv_free(av_pop(rsfp_filters)); */
1114 sv_free(av_shift(rsfp_filters));
1118 /* we need to search for the correct entry and clear it */
1119 die("filter_del can only delete in reverse order (currently)");
1123 /* Invoke the n'th filter function for the current rsfp. */
/*   idx    - position in rsfp_filters of the filter to run; an index past the
 *            last entry selects the built-in read from rsfp
 *   buf_sv - scalar that receives the data; the built-in read appends to it
 *   maxlen - byte count for the PerlIO_read() form of the built-in read
 * The built-in read returns -1 on error, 0 at end of file, and otherwise
 * SvCUR(buf_sv).  For a real filter the filter function's result is returned.
 * NOTE(review): the test choosing between the PerlIO_read() and sv_gets()
 * forms is not visible here; presumably it is maxlen != 0 -- confirm.
 */
1125 filter_read(int idx, SV *buf_sv, int maxlen)
1128 /* 0 = read one text line */
1135 if (idx > AvFILL(rsfp_filters)){ /* Any more filters? */
1136 /* Provide a default input filter to make life easy. */
1137 /* Note that we append to the line. This is handy. */
1139 warn("filter_read %d: from rsfp\n", idx);
1143 int old_len = SvCUR(buf_sv) ;
1145 /* ensure buf_sv is large enough */
1146 SvGROW(buf_sv, old_len + maxlen) ;
/* block read: up to maxlen bytes placed after the existing contents */
1147 if ((len = PerlIO_read(rsfp, SvPVX(buf_sv) + old_len, maxlen)) <= 0){
1148 if (PerlIO_error(rsfp))
1149 return -1; /* error */
1151 return 0 ; /* end of file */
1153 SvCUR_set(buf_sv, old_len + len) ;
/* line read: sv_gets() appends at the current end of buf_sv */
1156 if (sv_gets(buf_sv, rsfp, SvCUR(buf_sv)) == NULL) {
1157 if (PerlIO_error(rsfp))
1158 return -1; /* error */
1160 return 0 ; /* end of file */
1163 return SvCUR(buf_sv);
1165 /* Skip this filter slot if filter has been deleted */
1166 if ( (datasv = FILTER_DATA(idx)) == &sv_undef){
1168 warn("filter_read %d: skipped (filter deleted)\n", idx);
1169 return FILTER_READ(idx+1, buf_sv, maxlen); /* recurse */
1171 /* Get function pointer hidden within datasv */
1172 funcp = (filter_t)IoDIRP(datasv);
1174 warn("filter_read %d: via function %p (%s)\n",
1175 idx, funcp, SvPV(datasv,na));
1176 /* Call function. The function is expected to */
1177 /* call "FILTER_READ(idx+1, buf_sv)" first. */
1178 /* Return: <0:error, =0:eof, >0:not eof */
1179 return (*funcp)(idx, buf_sv, maxlen);
/* Fetch input into sv, either through the filter chain with FILTER_READ(0, ...)
 * or directly with sv_gets().
 *   sv     - scalar that receives the text
 *   fp     - handle handed to sv_gets() on the direct path
 *   append - offset handed to sv_gets() on the direct path
 * Returns SvPVX(sv) when the filter chain produced data, or the result of
 * sv_gets() on the direct path.
 * NOTE(review): the forward declaration of filter_gets in this file gives the
 * second parameter as PerlIO *fp, while this definition says FILE *fp; the two
 * only agree where PerlIO is FILE -- confirm and align.
 */
1183 filter_gets(register SV *sv, register FILE *fp, STRLEN append)
1188 SvCUR_set(sv, 0); /* start with empty line */
/* filter 0 is asked for one line (maxlen 0) */
1189 if (FILTER_READ(0, sv, 0) > 0)
1190 return ( SvPVX(sv) ) ;
1195 return (sv_gets(sv, fp, append));
1201 static char* exp_name[] =
1202 { "OPERATOR", "TERM", "REF", "STATE", "BLOCK", "TERMBLOCK" };
1205 EXT int yychar; /* last token */
1216 if (pending_ident) {
1217 char pit = pending_ident;
1221 if (strchr(tokenbuf,':'))
1222 croak(no_myglob,tokenbuf);
1223 yylval.opval = newOP(OP_PADANY, 0);
1224 yylval.opval->op_targ = pad_allocmy(tokenbuf);
1228 if (!strchr(tokenbuf,':')) {
1230 /* Check for single character per-thread magicals */
1231 if (tokenbuf[0] == '$' && tokenbuf[2] == '\0'
1232 && !isALPHA(tokenbuf[1]) /* Rule out obvious non-magicals */
1233 && (tmp = find_thread_magical(&tokenbuf[1])) != NOT_IN_PAD)
1235 yylval.opval = newOP(OP_THREADSV, 0);
1236 yylval.opval->op_targ = tmp;
1239 #endif /* USE_THREADS */
1240 if ((tmp = pad_findmy(tokenbuf)) != NOT_IN_PAD) {
1241 if (last_lop_op == OP_SORT &&
1242 tokenbuf[0] == '$' &&
1243 (tokenbuf[1] == 'a' || tokenbuf[1] == 'b')
1246 for (d = in_eval ? oldoldbufptr : linestart;
1247 d < bufend && *d != '\n';
1250 if (strnEQ(d,"<=>",3) || strnEQ(d,"cmp",3)) {
1251 croak("Can't use \"my %s\" in sort comparison",
1257 yylval.opval = newOP(OP_PADANY, 0);
1258 yylval.opval->op_targ = tmp;
1263 /* Force them to make up their mind on "@foo". */
1264 if (pit == '@' && lex_state != LEX_NORMAL && !lex_brackets) {
1265 GV *gv = gv_fetchpv(tokenbuf+1, FALSE, SVt_PVAV);
1266 if (!gv || ((tokenbuf[0] == '@') ? !GvAV(gv) : !GvHV(gv)))
1267 yyerror(form("In string, %s now must be written as \\%s",
1268 tokenbuf, tokenbuf));
1271 yylval.opval = (OP*)newSVOP(OP_CONST, 0, newSVpv(tokenbuf+1, 0));
1272 yylval.opval->op_private = OPpCONST_ENTERED;
1273 gv_fetchpv(tokenbuf+1, in_eval ? GV_ADDMULTI : TRUE,
1274 ((tokenbuf[0] == '$') ? SVt_PV
1275 : (tokenbuf[0] == '@') ? SVt_PVAV
1280 switch (lex_state) {
1282 case LEX_NORMAL: /* Some compilers will produce faster */
1283 case LEX_INTERPNORMAL: /* code if we comment these out. */
1289 yylval = nextval[nexttoke];
1291 lex_state = lex_defer;
1292 expect = lex_expect;
1293 lex_defer = LEX_NORMAL;
1295 return(nexttype[nexttoke]);
1297 case LEX_INTERPCASEMOD:
1299 if (bufptr != bufend && *bufptr != '\\')
1300 croak("panic: INTERPCASEMOD");
1302 if (bufptr == bufend || bufptr[1] == 'E') {
1305 oldmod = lex_casestack[--lex_casemods];
1306 lex_casestack[lex_casemods] = '\0';
1307 if (bufptr != bufend && strchr("LUQ", oldmod)) {
1309 lex_state = LEX_INTERPCONCAT;
1313 if (bufptr != bufend)
1315 lex_state = LEX_INTERPCONCAT;
1320 if (strnEQ(s, "L\\u", 3) || strnEQ(s, "U\\l", 3))
1321 tmp = *s, *s = s[2], s[2] = tmp; /* misordered... */
1322 if (strchr("LU", *s) &&
1323 (strchr(lex_casestack, 'L') || strchr(lex_casestack, 'U')))
1325 lex_casestack[--lex_casemods] = '\0';
1328 if (lex_casemods > 10) {
1329 char* newlb = Renew(lex_casestack, lex_casemods + 2, char);
1330 if (newlb != lex_casestack) {
1332 lex_casestack = newlb;
1335 lex_casestack[lex_casemods++] = *s;
1336 lex_casestack[lex_casemods] = '\0';
1337 lex_state = LEX_INTERPCONCAT;
1338 nextval[nexttoke].ival = 0;
1341 nextval[nexttoke].ival = OP_LCFIRST;
1343 nextval[nexttoke].ival = OP_UCFIRST;
1345 nextval[nexttoke].ival = OP_LC;
1347 nextval[nexttoke].ival = OP_UC;
1349 nextval[nexttoke].ival = OP_QUOTEMETA;
1351 croak("panic: yylex");
1363 case LEX_INTERPPUSH:
1364 return sublex_push();
1366 case LEX_INTERPSTART:
1367 if (bufptr == bufend)
1368 return sublex_done();
1370 lex_dojoin = (*bufptr == '@');
1371 lex_state = LEX_INTERPNORMAL;
1373 nextval[nexttoke].ival = 0;
1376 nextval[nexttoke].opval = newOP(OP_THREADSV, 0);
1377 nextval[nexttoke].opval->op_targ = find_thread_magical("\"");
1378 force_next(PRIVATEREF);
1380 force_ident("\"", '$');
1381 #endif /* USE_THREADS */
1382 nextval[nexttoke].ival = 0;
1384 nextval[nexttoke].ival = 0;
1386 nextval[nexttoke].ival = OP_JOIN; /* emulate join($", ...) */
1395 case LEX_INTERPENDMAYBE:
1396 if (intuit_more(bufptr)) {
1397 lex_state = LEX_INTERPNORMAL; /* false alarm, more expr */
1405 lex_state = LEX_INTERPCONCAT;
1409 case LEX_INTERPCONCAT:
1412 croak("panic: INTERPCONCAT");
1414 if (bufptr == bufend)
1415 return sublex_done();
1417 if (SvIVX(linestr) == '\'') {
1418 SV *sv = newSVsv(linestr);
1421 yylval.opval = (OP*)newSVOP(OP_CONST, 0, sv);
1425 s = scan_const(bufptr);
1427 lex_state = LEX_INTERPCASEMOD;
1429 lex_state = LEX_INTERPSTART;
1433 nextval[nexttoke] = yylval;
1446 lex_state = LEX_NORMAL;
1447 s = scan_formline(bufptr);
1454 oldoldbufptr = oldbufptr;
1457 PerlIO_printf(PerlIO_stderr(), "### Tokener expecting %s at %s\n", exp_name[expect], s);
1463 croak("Unrecognized character \\%03o", *s & 255);
1466 goto fake_eof; /* emulate EOF on ^D or ^Z */
1472 yyerror("Missing right bracket");
1476 goto retry; /* ignore stray nulls */
1479 if (!in_eval && !preambled) {
1481 sv_setpv(linestr,incl_perldb());
1483 sv_catpv(linestr,";");
1485 while(AvFILL(preambleav) >= 0) {
1486 SV *tmpsv = av_shift(preambleav);
1487 sv_catsv(linestr, tmpsv);
1488 sv_catpv(linestr, ";");
1491 sv_free((SV*)preambleav);
1494 if (minus_n || minus_p) {
1495 sv_catpv(linestr, "LINE: while (<>) {");
1497 sv_catpv(linestr,"chomp;");
1499 GV* gv = gv_fetchpv("::F", TRUE, SVt_PVAV);
1501 GvIMPORTED_AV_on(gv);
1503 if (strchr("/'\"", *splitstr)
1504 && strchr(splitstr + 1, *splitstr))
1505 sv_catpvf(linestr, "@F=split(%s);", splitstr);
1508 s = "'~#\200\1'"; /* surely one char is unused...*/
1509 while (s[1] && strchr(splitstr, *s)) s++;
1511 sv_catpvf(linestr, "@F=split(%s%c",
1512 "q" + (delim == '\''), delim);
1513 for (s = splitstr; *s; s++) {
1515 sv_catpvn(linestr, "\\", 1);
1516 sv_catpvn(linestr, s, 1);
1518 sv_catpvf(linestr, "%c);", delim);
1522 sv_catpv(linestr,"@F=split(' ');");
1525 sv_catpv(linestr, "\n");
1526 oldoldbufptr = oldbufptr = s = linestart = SvPVX(linestr);
1527 bufend = SvPVX(linestr) + SvCUR(linestr);
1528 if (PERLDB_LINE && curstash != debstash) {
1529 SV *sv = NEWSV(85,0);
1531 sv_upgrade(sv, SVt_PVMG);
1532 sv_setsv(sv,linestr);
1533 av_store(GvAV(curcop->cop_filegv),(I32)curcop->cop_line,sv);
1538 if ((s = filter_gets(linestr, rsfp, 0)) == Nullch) {
1541 if (preprocess && !in_eval)
1542 (void)my_pclose(rsfp);
1543 else if ((PerlIO *)rsfp == PerlIO_stdin())
1544 PerlIO_clearerr(rsfp);
1546 (void)PerlIO_close(rsfp);
1551 if (!in_eval && (minus_n || minus_p)) {
1552 sv_setpv(linestr,minus_p ? ";}continue{print" : "");
1553 sv_catpv(linestr,";}");
1554 oldoldbufptr = oldbufptr = s = linestart = SvPVX(linestr);
1555 bufend = SvPVX(linestr) + SvCUR(linestr);
1556 minus_n = minus_p = 0;
1559 oldoldbufptr = oldbufptr = s = linestart = SvPVX(linestr);
1560 sv_setpv(linestr,"");
1561 TOKEN(';'); /* not infinite loop because rsfp is NULL now */
1564 if (*s == '#' && s[1] == '!' && instr(s,"perl"))
1567 /* Incest with pod. */
1568 if (*s == '=' && strnEQ(s, "=cut", 4)) {
1569 sv_setpv(linestr, "");
1570 oldoldbufptr = oldbufptr = s = linestart = SvPVX(linestr);
1571 bufend = SvPVX(linestr) + SvCUR(linestr);
1576 } while (doextract);
1577 oldoldbufptr = oldbufptr = bufptr = linestart = s;
1578 if (PERLDB_LINE && curstash != debstash) {
1579 SV *sv = NEWSV(85,0);
1581 sv_upgrade(sv, SVt_PVMG);
1582 sv_setsv(sv,linestr);
1583 av_store(GvAV(curcop->cop_filegv),(I32)curcop->cop_line,sv);
1585 bufend = SvPVX(linestr) + SvCUR(linestr);
1586 if (curcop->cop_line == 1) {
1587 while (s < bufend && isSPACE(*s))
1589 if (*s == ':' && s[1] != ':') /* for csh execing sh scripts */
1593 if (*s == '#' && *(s+1) == '!')
1595 #ifdef ALTERNATE_SHEBANG
1597 static char as[] = ALTERNATE_SHEBANG;
1598 if (*s == as[0] && strnEQ(s, as, sizeof(as) - 1))
1599 d = s + (sizeof(as) - 1);
1601 #endif /* ALTERNATE_SHEBANG */
1610 while (*d && !isSPACE(*d))
1614 #ifdef ARG_ZERO_IS_SCRIPT
1615 if (ipathend > ipath) {
1617 * HP-UX (at least) sets argv[0] to the script name,
1618 * which makes $^X incorrect. And Digital UNIX and Linux,
1619 * at least, set argv[0] to the basename of the Perl
1620 * interpreter. So, having found "#!", we'll set it right.
1622 SV *x = GvSV(gv_fetchpv("\030", TRUE, SVt_PV));
1623 assert(SvPOK(x) || SvGMAGICAL(x));
1624 if (sv_eq(x, GvSV(curcop->cop_filegv))) {
1625 sv_setpvn(x, ipath, ipathend - ipath);
1628 TAINT_NOT; /* $^X is always tainted, but that's OK */
1630 #endif /* ARG_ZERO_IS_SCRIPT */
1635 d = instr(s,"perl -");
1637 d = instr(s,"perl");
1638 #ifdef ALTERNATE_SHEBANG
1640 * If the ALTERNATE_SHEBANG on this system starts with a
1641 * character that can be part of a Perl expression, then if
1642 * we see it but not "perl", we're probably looking at the
1643 * start of Perl code, not a request to hand off to some
1644 * other interpreter. Similarly, if "perl" is there, but
1645 * not in the first 'word' of the line, we assume the line
1646 * contains the start of the Perl program.
1648 if (d && *s != '#') {
1650 while (*c && !strchr("; \t\r\n\f\v#", *c))
1653 d = Nullch; /* "perl" not in first word; ignore */
1655 *s = '#'; /* Don't try to parse shebang line */
1657 #endif /* ALTERNATE_SHEBANG */
1662 !instr(s,"indir") &&
1663 instr(origargv[0],"perl"))
1669 while (s < bufend && isSPACE(*s))
1672 Newz(899,newargv,origargc+3,char*);
1674 while (s < bufend && !isSPACE(*s))
1677 Copy(origargv+1, newargv+2, origargc+1, char*);
1682 execv(ipath, newargv);
1683 croak("Can't exec %s", ipath);
1686 U32 oldpdb = perldb;
1687 bool oldn = minus_n;
1688 bool oldp = minus_p;
1690 while (*d && !isSPACE(*d)) d++;
1691 while (*d == ' ' || *d == '\t') d++;
1695 if (*d == 'M' || *d == 'm') {
1697 while (*d && !isSPACE(*d)) d++;
1698 croak("Too late for \"-%.*s\" option",
1701 d = moreswitches(d);
1703 if (PERLDB_LINE && !oldpdb ||
1704 ( minus_n || minus_p ) && !(oldn || oldp) )
1705 /* if we have already added "LINE: while (<>) {",
1706 we must not do it again */
1708 sv_setpv(linestr, "");
1709 oldoldbufptr = oldbufptr = s = linestart = SvPVX(linestr);
1710 bufend = SvPVX(linestr) + SvCUR(linestr);
1713 (void)gv_fetchfile(origfilename);
1720 if (lex_formbrack && lex_brackets <= lex_formbrack) {
1722 lex_state = LEX_FORMLINE;
1727 warn("Illegal character \\%03o (carriage return)", '\r');
1729 "(Maybe you didn't strip carriage returns after a network transfer?)\n");
1730 case ' ': case '\t': case '\f': case 013:
1735 if (lex_state != LEX_NORMAL || (in_eval && !rsfp)) {
1737 while (s < d && *s != '\n')
1742 if (lex_formbrack && lex_brackets <= lex_formbrack) {
1744 lex_state = LEX_FORMLINE;
1754 if (s[1] && isALPHA(s[1]) && !isALNUM(s[2])) {
1759 while (s < bufend && (*s == ' ' || *s == '\t'))
1762 if (strnEQ(s,"=>",2)) {
1764 warn("Ambiguous use of -%c => resolved to \"-%c\" =>",
1765 (int)tmp, (int)tmp);
1766 s = force_word(bufptr,WORD,FALSE,FALSE,FALSE);
1767 OPERATOR('-'); /* unary minus */
1769 last_uni = oldbufptr;
1770 last_lop_op = OP_FTEREAD; /* good enough */
1772 case 'r': FTST(OP_FTEREAD);
1773 case 'w': FTST(OP_FTEWRITE);
1774 case 'x': FTST(OP_FTEEXEC);
1775 case 'o': FTST(OP_FTEOWNED);
1776 case 'R': FTST(OP_FTRREAD);
1777 case 'W': FTST(OP_FTRWRITE);
1778 case 'X': FTST(OP_FTREXEC);
1779 case 'O': FTST(OP_FTROWNED);
1780 case 'e': FTST(OP_FTIS);
1781 case 'z': FTST(OP_FTZERO);
1782 case 's': FTST(OP_FTSIZE);
1783 case 'f': FTST(OP_FTFILE);
1784 case 'd': FTST(OP_FTDIR);
1785 case 'l': FTST(OP_FTLINK);
1786 case 'p': FTST(OP_FTPIPE);
1787 case 'S': FTST(OP_FTSOCK);
1788 case 'u': FTST(OP_FTSUID);
1789 case 'g': FTST(OP_FTSGID);
1790 case 'k': FTST(OP_FTSVTX);
1791 case 'b': FTST(OP_FTBLK);
1792 case 'c': FTST(OP_FTCHR);
1793 case 't': FTST(OP_FTTTY);
1794 case 'T': FTST(OP_FTTEXT);
1795 case 'B': FTST(OP_FTBINARY);
1796 case 'M': gv_fetchpv("\024",TRUE, SVt_PV); FTST(OP_FTMTIME);
1797 case 'A': gv_fetchpv("\024",TRUE, SVt_PV); FTST(OP_FTATIME);
1798 case 'C': gv_fetchpv("\024",TRUE, SVt_PV); FTST(OP_FTCTIME);
1800 croak("Unrecognized file test: -%c", (int)tmp);
1807 if (expect == XOPERATOR)
1812 else if (*s == '>') {
1815 if (isIDFIRST(*s)) {
1816 s = force_word(s,METHOD,FALSE,TRUE,FALSE);
1824 if (expect == XOPERATOR)
1827 if (isSPACE(*s) || !isSPACE(*bufptr))
1829 OPERATOR('-'); /* unary minus */
1836 if (expect == XOPERATOR)
1841 if (expect == XOPERATOR)
1844 if (isSPACE(*s) || !isSPACE(*bufptr))
1850 if (expect != XOPERATOR) {
1851 s = scan_ident(s, bufend, tokenbuf, sizeof tokenbuf, TRUE);
1853 force_ident(tokenbuf, '*');
1866 if (expect == XOPERATOR) {
1871 s = scan_ident(s, bufend, tokenbuf + 1, sizeof tokenbuf - 1, TRUE);
1874 yyerror("Final % should be \\% or %name");
1877 pending_ident = '%';
1899 if (last_lop == oldoldbufptr || last_uni == oldoldbufptr)
1900 oldbufptr = oldoldbufptr; /* allow print(STDOUT 123) */
1905 if (curcop->cop_line < copline)
1906 copline = curcop->cop_line;
1917 if (lex_brackets <= 0)
1918 yyerror("Unmatched right bracket");
1921 if (lex_state == LEX_INTERPNORMAL) {
1922 if (lex_brackets == 0) {
1923 if (*s != '[' && *s != '{' && (*s != '-' || s[1] != '>'))
1924 lex_state = LEX_INTERPEND;
1931 if (lex_brackets > 100) {
1932 char* newlb = Renew(lex_brackstack, lex_brackets + 1, char);
1933 if (newlb != lex_brackstack) {
1935 lex_brackstack = newlb;
1940 if (lex_formbrack) {
1944 if (oldoldbufptr == last_lop)
1945 lex_brackstack[lex_brackets++] = XTERM;
1947 lex_brackstack[lex_brackets++] = XOPERATOR;
1948 OPERATOR(HASHBRACK);
1950 while (s < bufend && (*s == ' ' || *s == '\t'))
1954 if (d < bufend && *d == '-') {
1957 while (d < bufend && (*d == ' ' || *d == '\t'))
1960 if (d < bufend && isIDFIRST(*d)) {
1961 d = scan_word(d, tokenbuf + 1, sizeof tokenbuf - 1,
1963 while (d < bufend && (*d == ' ' || *d == '\t'))
1966 char minus = (tokenbuf[0] == '-');
1968 (keyword(tokenbuf + 1, len) ||
1969 (minus && len == 1 && isALPHA(tokenbuf[1])) ||
1970 perl_get_cv(tokenbuf + 1, FALSE) ))
1971 warn("Ambiguous use of {%s} resolved to {\"%s\"}",
1972 tokenbuf + !minus, tokenbuf + !minus);
1973 s = force_word(s + minus, WORD, FALSE, TRUE, FALSE);
1980 lex_brackstack[lex_brackets++] = XSTATE;
1984 lex_brackstack[lex_brackets++] = XOPERATOR;
1989 if (oldoldbufptr == last_lop)
1990 lex_brackstack[lex_brackets++] = XTERM;
1992 lex_brackstack[lex_brackets++] = XOPERATOR;
1995 OPERATOR(HASHBRACK);
1996 /* This hack serves to disambiguate a pair of curlies
1997 * as being a block or an anon hash. Normally, expectation
1998 * determines that, but in cases where we're not in a
1999 * position to expect anything in particular (like inside
2000 * eval"") we have to resolve the ambiguity. This code
2001 * covers the case where the first term in the curlies is a
2002 * quoted string. Most other cases need to be explicitly
2003 * disambiguated by prepending a `+' before the opening
2004 * curly in order to force resolution as an anon hash.
2006 * XXX should probably propagate the outer expectation
2007 * into eval"" to rely less on this hack, but that could
2008 * potentially break current behavior of eval"".
2012 if (*s == '\'' || *s == '"' || *s == '`') {
2013 /* common case: get past first string, handling escapes */
2014 for (t++; t < bufend && *t != *s;)
2015 if (*t++ == '\\' && (*t == '\\' || *t == *s))
2019 else if (*s == 'q') {
2022 || ((*t == 'q' || *t == 'x') && ++t < bufend
2023 && !isALNUM(*t)))) {
2025 char open, close, term;
2028 while (t < bufend && isSPACE(*t))
2032 if (term && (tmps = strchr("([{< )]}> )]}>",term)))
2036 for (t++; t < bufend; t++) {
2037 if (*t == '\\' && t+1 < bufend && open != '\\')
2039 else if (*t == open)
2043 for (t++; t < bufend; t++) {
2044 if (*t == '\\' && t+1 < bufend)
2046 else if (*t == close && --brackets <= 0)
2048 else if (*t == open)
2054 else if (isALPHA(*s)) {
2055 for (t++; t < bufend && isALNUM(*t); t++) ;
2057 while (t < bufend && isSPACE(*t))
2059 /* if comma follows first term, call it an anon hash */
2060 /* XXX it could be a comma expression with loop modifiers */
2061 if (t < bufend && ((*t == ',' && (*s == 'q' || !isLOWER(*s)))
2062 || (*t == '=' && t[1] == '>')))
2063 OPERATOR(HASHBRACK);
2067 lex_brackstack[lex_brackets-1] = XSTATE;
2073 yylval.ival = curcop->cop_line;
2074 if (isSPACE(*s) || *s == '#')
2075 copline = NOLINE; /* invalidate current command line number */
2080 if (lex_brackets <= 0)
2081 yyerror("Unmatched right bracket");
2083 expect = (expectation)lex_brackstack[--lex_brackets];
2084 if (lex_brackets < lex_formbrack)
2086 if (lex_state == LEX_INTERPNORMAL) {
2087 if (lex_brackets == 0) {
2088 if (lex_fakebrack) {
2089 lex_state = LEX_INTERPEND;
2091 return yylex(); /* ignore fake brackets */
2093 if (*s == '-' && s[1] == '>')
2094 lex_state = LEX_INTERPENDMAYBE;
2095 else if (*s != '[' && *s != '{')
2096 lex_state = LEX_INTERPEND;
2099 if (lex_brackets < lex_fakebrack) {
2102 return yylex(); /* ignore fake brackets */
2112 if (expect == XOPERATOR) {
2113 if (dowarn && isALPHA(*s) && bufptr == linestart) {
2121 s = scan_ident(s - 1, bufend, tokenbuf, sizeof tokenbuf, TRUE);
2124 force_ident(tokenbuf, '&');
2128 yylval.ival = (OPpENTERSUB_AMPER<<8);
2147 if (dowarn && tmp && isSPACE(*s) && strchr("+-*/%.^&|<",tmp))
2148 warn("Reversed %c= operator",(int)tmp);
2150 if (expect == XSTATE && isALPHA(tmp) &&
2151 (s == linestart+1 || s[-2] == '\n') )
2153 if (in_eval && !rsfp) {
2158 if (strnEQ(s,"=cut",4)) {
2175 if (lex_brackets < lex_formbrack) {
2177 for (t = s; *t == ' ' || *t == '\t'; t++) ;
2178 if (*t == '\n' || *t == '#') {
2196 if (expect != XOPERATOR) {
2197 if (s[1] != '<' && !strchr(s,'>'))
2200 s = scan_heredoc(s);
2202 s = scan_inputsymbol(s);
2203 TERM(sublex_start());
2208 SHop(OP_LEFT_SHIFT);
2222 SHop(OP_RIGHT_SHIFT);
2231 if (expect == XOPERATOR) {
2232 if (lex_formbrack && lex_brackets == lex_formbrack) {
2235 return ','; /* grandfather non-comma-format format */
2239 if (s[1] == '#' && (isALPHA(s[2]) || strchr("_{$:", s[2]))) {
2240 if (expect == XOPERATOR)
2241 no_op("Array length", bufptr);
2243 s = scan_ident(s + 1, bufend, tokenbuf + 1, sizeof tokenbuf - 1,
2248 pending_ident = '#';
2252 if (expect == XOPERATOR)
2253 no_op("Scalar", bufptr);
2255 s = scan_ident(s, bufend, tokenbuf + 1, sizeof tokenbuf - 1, FALSE);
2258 yyerror("Final $ should be \\$ or $name");
2262 /* This kludge not intended to be bulletproof. */
2263 if (tokenbuf[1] == '[' && !tokenbuf[2]) {
2264 yylval.opval = newSVOP(OP_CONST, 0,
2265 newSViv((IV)compiling.cop_arybase));
2266 yylval.opval->op_private = OPpCONST_ARYBASE;
2271 if (lex_state == LEX_NORMAL)
2274 if ((expect != XREF || oldoldbufptr == last_lop) && intuit_more(s)) {
2280 isSPACE(*t) || isALNUM(*t) || *t == '$';
2283 bufptr = skipspace(bufptr);
2284 while (t < bufend && *t != ']')
2286 warn("Multidimensional syntax %.*s not supported",
2287 (t - bufptr) + 1, bufptr);
2291 else if (*s == '{') {
2293 if (dowarn && strEQ(tokenbuf+1, "SIG") &&
2294 (t = strchr(s, '}')) && (t = strchr(t, '=')))
2296 char tmpbuf[sizeof tokenbuf];
2298 for (t++; isSPACE(*t); t++) ;
2299 if (isIDFIRST(*t)) {
2300 t = scan_word(t, tmpbuf, sizeof tmpbuf, TRUE, &len);
2301 if (*t != '(' && perl_get_cv(tmpbuf, FALSE))
2302 warn("You need to quote \"%s\"", tmpbuf);
2309 if (lex_state == LEX_NORMAL && isSPACE(*d)) {
2310 bool islop = (last_lop == oldoldbufptr);
2311 if (!islop || last_lop_op == OP_GREPSTART)
2313 else if (strchr("$@\"'`q", *s))
2314 expect = XTERM; /* e.g. print $fh "foo" */
2315 else if (strchr("&*<%", *s) && isIDFIRST(s[1]))
2316 expect = XTERM; /* e.g. print $fh &sub */
2317 else if (isIDFIRST(*s)) {
2318 char tmpbuf[sizeof tokenbuf];
2319 scan_word(s, tmpbuf, sizeof tmpbuf, TRUE, &len);
2320 if (tmp = keyword(tmpbuf, len)) {
2321 /* binary operators exclude handle interpretations */
2333 expect = XTERM; /* e.g. print $fh length() */
2338 GV *gv = gv_fetchpv(tmpbuf, FALSE, SVt_PVCV);
2339 if (gv && GvCVu(gv))
2340 expect = XTERM; /* e.g. print $fh subr() */
2343 else if (isDIGIT(*s))
2344 expect = XTERM; /* e.g. print $fh 3 */
2345 else if (*s == '.' && isDIGIT(s[1]))
2346 expect = XTERM; /* e.g. print $fh .3 */
2347 else if (strchr("/?-+", *s) && !isSPACE(s[1]))
2348 expect = XTERM; /* e.g. print $fh -1 */
2349 else if (*s == '<' && s[1] == '<' && !isSPACE(s[2]))
2350 expect = XTERM; /* print $fh <<"EOF" */
2352 pending_ident = '$';
2356 if (expect == XOPERATOR)
2359 s = scan_ident(s, bufend, tokenbuf + 1, sizeof tokenbuf - 1, FALSE);
2362 yyerror("Final @ should be \\@ or @name");
2365 if (lex_state == LEX_NORMAL)
2367 if ((expect != XREF || oldoldbufptr == last_lop) && intuit_more(s)) {
2371 /* Warn about @ where they meant $. */
2373 if (*s == '[' || *s == '{') {
2375 while (*t && (isALNUM(*t) || strchr(" \t$#+-'\"", *t)))
2377 if (*t == '}' || *t == ']') {
2379 bufptr = skipspace(bufptr);
2380 warn("Scalar value %.*s better written as $%.*s",
2381 t-bufptr, bufptr, t-bufptr-1, bufptr+1);
2386 pending_ident = '@';
2389 case '/': /* may either be division or pattern */
2390 case '?': /* may either be conditional or pattern */
2391 if (expect != XOPERATOR) {
2394 TERM(sublex_start());
2402 if (lex_formbrack && lex_brackets == lex_formbrack && s[1] == '\n' &&
2403 (s == linestart || s[-1] == '\n') ) {
2408 if (expect == XOPERATOR || !isDIGIT(s[1])) {
2414 yylval.ival = OPf_SPECIAL;
2420 if (expect != XOPERATOR)
2425 case '0': case '1': case '2': case '3': case '4':
2426 case '5': case '6': case '7': case '8': case '9':
2428 if (expect == XOPERATOR)
2434 if (expect == XOPERATOR) {
2435 if (lex_formbrack && lex_brackets == lex_formbrack) {
2438 return ','; /* grandfather non-comma-format format */
2444 missingterm((char*)0);
2445 yylval.ival = OP_CONST;
2446 TERM(sublex_start());
2450 if (expect == XOPERATOR) {
2451 if (lex_formbrack && lex_brackets == lex_formbrack) {
2454 return ','; /* grandfather non-comma-format format */
2460 missingterm((char*)0);
2461 yylval.ival = OP_CONST;
2462 for (d = SvPV(lex_stuff, len); len; len--, d++) {
2463 if (*d == '$' || *d == '@' || *d == '\\') {
2464 yylval.ival = OP_STRINGIFY;
2468 TERM(sublex_start());
2472 if (expect == XOPERATOR)
2473 no_op("Backticks",s);
2475 missingterm((char*)0);
2476 yylval.ival = OP_BACKTICK;
2478 TERM(sublex_start());
2482 if (dowarn && lex_inwhat && isDIGIT(*s))
2483 warn("Can't use \\%c to mean $%c in expression", *s, *s);
2484 if (expect == XOPERATOR)
2485 no_op("Backslash",s);
2489 if (isDIGIT(s[1]) && expect == XOPERATOR) {
2528 s = scan_word(s, tokenbuf, sizeof tokenbuf, FALSE, &len);
2530 /* Some keywords can be followed by any delimiter, including ':' */
2531 tmp = (len == 1 && strchr("msyq", tokenbuf[0]) ||
2532 len == 2 && ((tokenbuf[0] == 't' && tokenbuf[1] == 'r') ||
2533 (tokenbuf[0] == 'q' &&
2534 strchr("qwx", tokenbuf[1]))));
2536 /* x::* is just a word, unless x is "CORE" */
2537 if (!tmp && *s == ':' && s[1] == ':' && strNE(tokenbuf, "CORE"))
2541 while (d < bufend && isSPACE(*d))
2542 d++; /* no comments skipped here, or s### is misparsed */
2544 /* Is this a label? */
2545 if (!tmp && expect == XSTATE
2546 && d < bufend && *d == ':' && *(d + 1) != ':') {
2548 yylval.pval = savepv(tokenbuf);
2553 /* Check for keywords */
2554 tmp = keyword(tokenbuf, len);
2556 /* Is this a word before a => operator? */
2557 if (strnEQ(d,"=>",2)) {
2559 if (dowarn && (tmp || perl_get_cv(tokenbuf, FALSE)))
2560 warn("Ambiguous use of %s => resolved to \"%s\" =>",
2561 tokenbuf, tokenbuf);
2562 yylval.opval = (OP*)newSVOP(OP_CONST, 0, newSVpv(tokenbuf,0));
2563 yylval.opval->op_private = OPpCONST_BARE;
2567 if (tmp < 0) { /* second-class keyword? */
2568 if (expect != XOPERATOR && (*s != ':' || s[1] != ':') &&
2569 (((gv = gv_fetchpv(tokenbuf, FALSE, SVt_PVCV)) &&
2570 GvCVu(gv) && GvIMPORTED_CV(gv)) ||
2571 ((gvp = (GV**)hv_fetch(globalstash,tokenbuf,len,FALSE)) &&
2572 (gv = *gvp) != (GV*)&sv_undef &&
2573 GvCVu(gv) && GvIMPORTED_CV(gv))))
2575 tmp = 0; /* overridden by importation */
2578 && -tmp==KEY_lock /* XXX generalizable kludge */
2579 && !hv_fetch(GvHVn(incgv), "Thread.pm", 9, FALSE))
2581 tmp = 0; /* any sub overrides "weak" keyword */
2584 tmp = -tmp; gv = Nullgv; gvp = 0;
2591 default: /* not a keyword */
2594 char lastchar = (bufptr == oldoldbufptr ? 0 : bufptr[-1]);
2596 /* Get the rest if it looks like a package qualifier */
2598 if (*s == '\'' || *s == ':' && s[1] == ':') {
2599 s = scan_word(s, tokenbuf + len, sizeof tokenbuf - len,
2602 croak("Bad name after %s::", tokenbuf);
2605 if (expect == XOPERATOR) {
2606 if (bufptr == linestart) {
2612 no_op("Bareword",s);
2615 /* Look for a subroutine with this name in current package. */
2618 sv = newSVpv("CORE::GLOBAL::",14);
2619 sv_catpv(sv,tokenbuf);
2622 sv = newSVpv(tokenbuf,0);
2624 gv = gv_fetchpv(tokenbuf,FALSE, SVt_PVCV);
2626 /* Presume this is going to be a bareword of some sort. */
2629 yylval.opval = (OP*)newSVOP(OP_CONST, 0, sv);
2630 yylval.opval->op_private = OPpCONST_BARE;
2632 /* See if it's the indirect object for a list operator. */
2635 oldoldbufptr < bufptr &&
2636 (oldoldbufptr == last_lop || oldoldbufptr == last_uni) &&
2637 /* NO SKIPSPACE BEFORE HERE! */
2639 ((opargs[last_lop_op] >> OASHIFT)& 7) == OA_FILEREF) )
2641 bool immediate_paren = *s == '(';
2643 /* (Now we can afford to cross potential line boundary.) */
2646 /* Two barewords in a row may indicate method call. */
2648 if ((isALPHA(*s) || *s == '$') && (tmp=intuit_method(s,gv)))
2651 /* If not a declared subroutine, it's an indirect object. */
2652 /* (But it's an indir obj regardless for sort.) */
2654 if ((last_lop_op == OP_SORT ||
2655 (!immediate_paren && (!gv || !GvCVu(gv))) ) &&
2656 (last_lop_op != OP_MAPSTART && last_lop_op != OP_GREPSTART)){
2657 expect = (last_lop == oldoldbufptr) ? XTERM : XOPERATOR;
2662 /* If followed by a paren, it's certainly a subroutine. */
2668 if (gv && GvCVu(gv)) {
2669 for (d = s + 1; *d == ' ' || *d == '\t'; d++) ;
2670 if (*d == ')' && (sv = cv_const_sv(GvCV(gv)))) {
2675 nextval[nexttoke].opval = yylval.opval;
2682 /* If followed by var or block, call it a method (unless sub) */
2684 if ((*s == '$' || *s == '{') && (!gv || !GvCVu(gv))) {
2685 last_lop = oldbufptr;
2686 last_lop_op = OP_METHOD;
2690 /* If followed by a bareword, see if it looks like indir obj. */
2692 if ((isALPHA(*s) || *s == '$') && (tmp = intuit_method(s,gv)))
2695 /* Not a method, so call it a subroutine (if defined) */
2697 if (gv && GvCVu(gv)) {
2699 if (lastchar == '-')
2700 warn("Ambiguous use of -%s resolved as -&%s()",
2701 tokenbuf, tokenbuf);
2702 last_lop = oldbufptr;
2703 last_lop_op = OP_ENTERSUB;
2704 /* Check for a constant sub */
2706 if ((sv = cv_const_sv(cv))) {
2708 SvREFCNT_dec(((SVOP*)yylval.opval)->op_sv);
2709 ((SVOP*)yylval.opval)->op_sv = SvREFCNT_inc(sv);
2710 yylval.opval->op_private = 0;
2714 /* Resolve to GV now. */
2715 op_free(yylval.opval);
2716 yylval.opval = newCVREF(0, newGVOP(OP_GV, 0, gv));
2717 /* Is there a prototype? */
2720 char *proto = SvPV((SV*)cv, len);
2723 if (strEQ(proto, "$"))
2725 if (*proto == '&' && *s == '{') {
2726 sv_setpv(subname,"__ANON__");
2730 nextval[nexttoke].opval = yylval.opval;
2736 if (hints & HINT_STRICT_SUBS &&
2739 last_lop_op != OP_TRUNCATE && /* S/F prototype in opcode.pl */
2740 last_lop_op != OP_ACCEPT &&
2741 last_lop_op != OP_PIPE_OP &&
2742 last_lop_op != OP_SOCKPAIR)
2745 "Bareword \"%s\" not allowed while \"strict subs\" in use",
2750 /* Call it a bare word */
2754 if (lastchar != '-') {
2755 for (d = tokenbuf; *d && isLOWER(*d); d++) ;
2757 warn(warn_reserved, tokenbuf);
2760 if (lastchar && strchr("*%&", lastchar)) {
2761 warn("Operator or semicolon missing before %c%s",
2762 lastchar, tokenbuf);
2763 warn("Ambiguous use of %c resolved as operator %c",
2764 lastchar, lastchar);
2770 yylval.opval = (OP*)newSVOP(OP_CONST, 0,
2771 newSVsv(GvSV(curcop->cop_filegv)));
2775 yylval.opval = (OP*)newSVOP(OP_CONST, 0,
2776 newSVpvf("%ld", (long)curcop->cop_line));
2779 case KEY___PACKAGE__:
2780 yylval.opval = (OP*)newSVOP(OP_CONST, 0,
2782 ? newSVsv(curstname)
2791 if (rsfp && (!in_eval || tokenbuf[2] == 'D')) {
2792 char *pname = "main";
2793 if (tokenbuf[2] == 'D')
2794 pname = HvNAME(curstash ? curstash : defstash);
2795 gv = gv_fetchpv(form("%s::DATA", pname), TRUE, SVt_PVIO);
2798 GvIOp(gv) = newIO();
2799 IoIFP(GvIOp(gv)) = rsfp;
2800 #if defined(HAS_FCNTL) && defined(F_SETFD)
2802 int fd = PerlIO_fileno(rsfp);
2803 fcntl(fd,F_SETFD,fd >= 3);
2806 /* Mark this internal pseudo-handle as clean */
2807 IoFLAGS(GvIOp(gv)) |= IOf_UNTAINT;
2809 IoTYPE(GvIOp(gv)) = '|';
2810 else if ((PerlIO*)rsfp == PerlIO_stdin())
2811 IoTYPE(GvIOp(gv)) = '-';
2813 IoTYPE(GvIOp(gv)) = '<';
2824 if (expect == XSTATE) {
2831 if (*s == ':' && s[1] == ':') {
2834 s = scan_word(s, tokenbuf, sizeof tokenbuf, FALSE, &len);
2835 tmp = keyword(tokenbuf, len);
2849 LOP(OP_ACCEPT,XTERM);
2855 LOP(OP_ATAN2,XTERM);
2864 LOP(OP_BLESS,XTERM);
2873 (void)gv_fetchpv("ENV",TRUE, SVt_PVHV); /* may use HOME */
2893 LOP(OP_CRYPT,XTERM);
2897 for (d = s; d < bufend && (isSPACE(*d) || *d == '('); d++) ;
2898 if (*d != '0' && isDIGIT(*d))
2899 yywarn("chmod: mode argument is missing initial 0");
2901 LOP(OP_CHMOD,XTERM);
2904 LOP(OP_CHOWN,XTERM);
2907 LOP(OP_CONNECT,XTERM);
2923 s = force_word(s,WORD,FALSE,TRUE,FALSE);
2927 hints |= HINT_BLOCK_SCOPE;
2937 gv_fetchpv("AnyDBM_File::ISA", GV_ADDMULTI, SVt_PVAV);
2938 LOP(OP_DBMOPEN,XTERM);
2944 s = force_word(s,WORD,TRUE,FALSE,FALSE);
2951 yylval.ival = curcop->cop_line;
2965 expect = (*s == '{') ? XTERMBLOCK : XTERM;
2966 UNIBRACK(OP_ENTEREVAL);
2981 case KEY_endhostent:
2987 case KEY_endservent:
2990 case KEY_endprotoent:
3001 yylval.ival = curcop->cop_line;
3003 if (isIDFIRST(*s)) {
3005 if ((bufend - p) >= 3 &&
3006 strnEQ(p, "my", 2) && isSPACE(*(p + 2)))
3010 croak("Missing $ on loop variable");
3015 LOP(OP_FORMLINE,XTERM);
3021 LOP(OP_FCNTL,XTERM);
3027 LOP(OP_FLOCK,XTERM);
3036 LOP(OP_GREPSTART, *s == '(' ? XTERM : XREF);
3039 s = force_word(s,WORD,TRUE,FALSE,FALSE);
3054 case KEY_getpriority:
3055 LOP(OP_GETPRIORITY,XTERM);
3057 case KEY_getprotobyname:
3060 case KEY_getprotobynumber:
3061 LOP(OP_GPBYNUMBER,XTERM);
3063 case KEY_getprotoent:
3075 case KEY_getpeername:
3076 UNI(OP_GETPEERNAME);
3078 case KEY_gethostbyname:
3081 case KEY_gethostbyaddr:
3082 LOP(OP_GHBYADDR,XTERM);
3084 case KEY_gethostent:
3087 case KEY_getnetbyname:
3090 case KEY_getnetbyaddr:
3091 LOP(OP_GNBYADDR,XTERM);
3096 case KEY_getservbyname:
3097 LOP(OP_GSBYNAME,XTERM);
3099 case KEY_getservbyport:
3100 LOP(OP_GSBYPORT,XTERM);
3102 case KEY_getservent:
3105 case KEY_getsockname:
3106 UNI(OP_GETSOCKNAME);
3108 case KEY_getsockopt:
3109 LOP(OP_GSOCKOPT,XTERM);
3131 yylval.ival = curcop->cop_line;
3135 LOP(OP_INDEX,XTERM);
3141 LOP(OP_IOCTL,XTERM);
3153 s = force_word(s,WORD,TRUE,FALSE,FALSE);
3184 LOP(OP_LISTEN,XTERM);
3194 TERM(sublex_start());
3197 LOP(OP_MAPSTART,XREF);
3200 LOP(OP_MKDIR,XTERM);
3203 LOP(OP_MSGCTL,XTERM);
3206 LOP(OP_MSGGET,XTERM);
3209 LOP(OP_MSGRCV,XTERM);
3212 LOP(OP_MSGSND,XTERM);
3217 if (isIDFIRST(*s)) {
3218 s = scan_word(s, tokenbuf, sizeof tokenbuf, TRUE, &len);
3219 in_my_stash = gv_stashpv(tokenbuf, FALSE);
3223 sprintf(tmpbuf, "No such class %.1000s", tokenbuf);
3230 s = force_word(s,WORD,TRUE,FALSE,FALSE);
3237 if (expect != XSTATE)
3238 yyerror("\"no\" not allowed in expression");
3239 s = force_word(s,WORD,FALSE,TRUE,FALSE);
3240 s = force_version(s);
3249 if (isIDFIRST(*s)) {
3251 for (d = s; isALNUM(*d); d++) ;
3253 if (strchr("|&*+-=!?:.", *t))
3254 warn("Precedence problem: open %.*s should be open(%.*s)",
3260 yylval.ival = OP_OR;
3270 LOP(OP_OPEN_DIR,XTERM);
3273 checkcomma(s,tokenbuf,"filehandle");
3277 checkcomma(s,tokenbuf,"filehandle");
3296 s = force_word(s,WORD,FALSE,TRUE,FALSE);
3300 LOP(OP_PIPE_OP,XTERM);
3305 missingterm((char*)0);
3306 yylval.ival = OP_CONST;
3307 TERM(sublex_start());
3315 missingterm((char*)0);
3316 if (dowarn && SvLEN(lex_stuff)) {
3317 d = SvPV_force(lex_stuff, len);
3318 for (; len; --len, ++d) {
3320 warn("Possible attempt to separate words with commas");
3324 warn("Possible attempt to put comments in qw() list");
3330 nextval[nexttoke].opval = (OP*)newSVOP(OP_CONST, 0, q(lex_stuff));
3334 nextval[nexttoke].opval = (OP*)newSVOP(OP_CONST, 0, newSVpv(" ",1));
3337 yylval.ival = OP_SPLIT;
3341 last_lop = oldbufptr;
3342 last_lop_op = OP_SPLIT;
3348 missingterm((char*)0);
3349 yylval.ival = OP_STRINGIFY;
3350 if (SvIVX(lex_stuff) == '\'')
3351 SvIVX(lex_stuff) = 0; /* qq'$foo' should interpolate */
3352 TERM(sublex_start());
3357 missingterm((char*)0);
3358 yylval.ival = OP_BACKTICK;
3360 TERM(sublex_start());
3367 s = force_word(s,WORD,TRUE,TRUE,FALSE);
3368 if (isIDFIRST(*tokenbuf))
3369 gv_stashpvn(tokenbuf, strlen(tokenbuf), TRUE);
3371 yyerror("<> should be quotes");
3378 s = force_word(s,WORD,TRUE,FALSE,FALSE);
3382 LOP(OP_RENAME,XTERM);
3391 LOP(OP_RINDEX,XTERM);
3414 LOP(OP_REVERSE,XTERM);
3425 TERM(sublex_start());
3427 TOKEN(1); /* force error */
3436 LOP(OP_SELECT,XTERM);
3442 LOP(OP_SEMCTL,XTERM);
3445 LOP(OP_SEMGET,XTERM);
3448 LOP(OP_SEMOP,XTERM);
3454 LOP(OP_SETPGRP,XTERM);
3456 case KEY_setpriority:
3457 LOP(OP_SETPRIORITY,XTERM);
3459 case KEY_sethostent:
3465 case KEY_setservent:
3468 case KEY_setprotoent:
3478 LOP(OP_SEEKDIR,XTERM);
3480 case KEY_setsockopt:
3481 LOP(OP_SSOCKOPT,XTERM);
3487 LOP(OP_SHMCTL,XTERM);
3490 LOP(OP_SHMGET,XTERM);
3493 LOP(OP_SHMREAD,XTERM);
3496 LOP(OP_SHMWRITE,XTERM);
3499 LOP(OP_SHUTDOWN,XTERM);
3508 LOP(OP_SOCKET,XTERM);
3510 case KEY_socketpair:
3511 LOP(OP_SOCKPAIR,XTERM);
3514 checkcomma(s,tokenbuf,"subroutine name");
3516 if (*s == ';' || *s == ')') /* probably a close */
3517 croak("sort is now a reserved word");
3519 s = force_word(s,WORD,TRUE,TRUE,TRUE);
3523 LOP(OP_SPLIT,XTERM);
3526 LOP(OP_SPRINTF,XTERM);
3529 LOP(OP_SPLICE,XTERM);
3545 LOP(OP_SUBSTR,XTERM);
3552 if (isIDFIRST(*s) || *s == '\'' || *s == ':') {
3553 char tmpbuf[sizeof tokenbuf];
3555 d = scan_word(s, tmpbuf, sizeof tmpbuf, TRUE, &len);
3556 if (strchr(tmpbuf, ':'))
3557 sv_setpv(subname, tmpbuf);
3559 sv_setsv(subname,curstname);
3560 sv_catpvn(subname,"::",2);
3561 sv_catpvn(subname,tmpbuf,len);
3563 s = force_word(s,WORD,FALSE,TRUE,TRUE);
3567 expect = XTERMBLOCK;
3568 sv_setpv(subname,"?");
3571 if (tmp == KEY_format) {
3574 lex_formbrack = lex_brackets + 1;
3578 /* Look for a prototype */
3585 SvREFCNT_dec(lex_stuff);
3587 croak("Prototype not terminated");
3590 d = SvPVX(lex_stuff);
3592 for (p = d; *p; ++p) {
3597 SvCUR(lex_stuff) = tmp;
3600 nextval[1] = nextval[0];
3601 nexttype[1] = nexttype[0];
3602 nextval[0].opval = (OP*)newSVOP(OP_CONST, 0, lex_stuff);
3603 nexttype[0] = THING;
3604 if (nexttoke == 1) {
3605 lex_defer = lex_state;
3606 lex_expect = expect;
3607 lex_state = LEX_KNOWNEXT;
3612 if (*SvPV(subname,na) == '?') {
3613 sv_setpv(subname,"__ANON__");
3620 LOP(OP_SYSTEM,XREF);
3623 LOP(OP_SYMLINK,XTERM);
3626 LOP(OP_SYSCALL,XTERM);
3629 LOP(OP_SYSOPEN,XTERM);
3632 LOP(OP_SYSSEEK,XTERM);
3635 LOP(OP_SYSREAD,XTERM);
3638 LOP(OP_SYSWRITE,XTERM);
3642 TERM(sublex_start());
3663 LOP(OP_TRUNCATE,XTERM);
3675 yylval.ival = curcop->cop_line;
3679 yylval.ival = curcop->cop_line;
3683 LOP(OP_UNLINK,XTERM);
3689 LOP(OP_UNPACK,XTERM);
3692 LOP(OP_UTIME,XTERM);
3696 for (d = s; d < bufend && (isSPACE(*d) || *d == '('); d++) ;
3697 if (*d != '0' && isDIGIT(*d))
3698 yywarn("umask: argument is missing initial 0");
3703 LOP(OP_UNSHIFT,XTERM);
3706 if (expect != XSTATE)
3707 yyerror("\"use\" not allowed in expression");
3710 s = force_version(s);
3711 if(*s == ';' || (s = skipspace(s), *s == ';')) {
3712 nextval[nexttoke].opval = Nullop;
3717 s = force_word(s,WORD,FALSE,TRUE,FALSE);
3718 s = force_version(s);
3731 yylval.ival = curcop->cop_line;
3735 hints |= HINT_BLOCK_SCOPE;
3742 LOP(OP_WAITPID,XTERM);
3748 gv_fetchpv("\f",TRUE, SVt_PV); /* Make sure $^L is defined */
3752 if (expect == XOPERATOR)
3758 yylval.ival = OP_XOR;
3763 TERM(sublex_start());
3769 keyword(register char *d, I32 len)
3774 if (strEQ(d,"__FILE__")) return -KEY___FILE__;
3775 if (strEQ(d,"__LINE__")) return -KEY___LINE__;
3776 if (strEQ(d,"__PACKAGE__")) return -KEY___PACKAGE__;
3777 if (strEQ(d,"__DATA__")) return KEY___DATA__;
3778 if (strEQ(d,"__END__")) return KEY___END__;
3782 if (strEQ(d,"AUTOLOAD")) return KEY_AUTOLOAD;
3787 if (strEQ(d,"and")) return -KEY_and;
3788 if (strEQ(d,"abs")) return -KEY_abs;
3791 if (strEQ(d,"alarm")) return -KEY_alarm;
3792 if (strEQ(d,"atan2")) return -KEY_atan2;
3795 if (strEQ(d,"accept")) return -KEY_accept;
3800 if (strEQ(d,"BEGIN")) return KEY_BEGIN;
3803 if (strEQ(d,"bless")) return -KEY_bless;
3804 if (strEQ(d,"bind")) return -KEY_bind;
3805 if (strEQ(d,"binmode")) return -KEY_binmode;
3808 if (strEQ(d,"CORE")) return -KEY_CORE;
3813 if (strEQ(d,"cmp")) return -KEY_cmp;
3814 if (strEQ(d,"chr")) return -KEY_chr;
3815 if (strEQ(d,"cos")) return -KEY_cos;
3818 if (strEQ(d,"chop")) return KEY_chop;
3821 if (strEQ(d,"close")) return -KEY_close;
3822 if (strEQ(d,"chdir")) return -KEY_chdir;
3823 if (strEQ(d,"chomp")) return KEY_chomp;
3824 if (strEQ(d,"chmod")) return -KEY_chmod;
3825 if (strEQ(d,"chown")) return -KEY_chown;
3826 if (strEQ(d,"crypt")) return -KEY_crypt;
3829 if (strEQ(d,"chroot")) return -KEY_chroot;
3830 if (strEQ(d,"caller")) return -KEY_caller;
3833 if (strEQ(d,"connect")) return -KEY_connect;
3836 if (strEQ(d,"closedir")) return -KEY_closedir;
3837 if (strEQ(d,"continue")) return -KEY_continue;
3842 if (strEQ(d,"DESTROY")) return KEY_DESTROY;
3847 if (strEQ(d,"do")) return KEY_do;
3850 if (strEQ(d,"die")) return -KEY_die;
3853 if (strEQ(d,"dump")) return -KEY_dump;
3856 if (strEQ(d,"delete")) return KEY_delete;
3859 if (strEQ(d,"defined")) return KEY_defined;
3860 if (strEQ(d,"dbmopen")) return -KEY_dbmopen;
3863 if (strEQ(d,"dbmclose")) return -KEY_dbmclose;
3868 if (strEQ(d,"EQ")) { deprecate(d); return -KEY_eq;}
3869 if (strEQ(d,"END")) return KEY_END;
3874 if (strEQ(d,"eq")) return -KEY_eq;
3877 if (strEQ(d,"eof")) return -KEY_eof;
3878 if (strEQ(d,"exp")) return -KEY_exp;
3881 if (strEQ(d,"else")) return KEY_else;
3882 if (strEQ(d,"exit")) return -KEY_exit;
3883 if (strEQ(d,"eval")) return KEY_eval;
3884 if (strEQ(d,"exec")) return -KEY_exec;
3885 if (strEQ(d,"each")) return KEY_each;
3888 if (strEQ(d,"elsif")) return KEY_elsif;
3891 if (strEQ(d,"exists")) return KEY_exists;
3892 if (strEQ(d,"elseif")) warn("elseif should be elsif");
3895 if (strEQ(d,"endgrent")) return -KEY_endgrent;
3896 if (strEQ(d,"endpwent")) return -KEY_endpwent;
3899 if (strEQ(d,"endnetent")) return -KEY_endnetent;
3902 if (strEQ(d,"endhostent")) return -KEY_endhostent;
3903 if (strEQ(d,"endservent")) return -KEY_endservent;
3906 if (strEQ(d,"endprotoent")) return -KEY_endprotoent;
3913 if (strEQ(d,"for")) return KEY_for;
3916 if (strEQ(d,"fork")) return -KEY_fork;
3919 if (strEQ(d,"fcntl")) return -KEY_fcntl;
3920 if (strEQ(d,"flock")) return -KEY_flock;
3923 if (strEQ(d,"format")) return KEY_format;
3924 if (strEQ(d,"fileno")) return -KEY_fileno;
3927 if (strEQ(d,"foreach")) return KEY_foreach;
3930 if (strEQ(d,"formline")) return -KEY_formline;
3936 if (strEQ(d,"GT")) { deprecate(d); return -KEY_gt;}
3937 if (strEQ(d,"GE")) { deprecate(d); return -KEY_ge;}
3941 if (strnEQ(d,"get",3)) {
3946 if (strEQ(d,"ppid")) return -KEY_getppid;
3947 if (strEQ(d,"pgrp")) return -KEY_getpgrp;
3950 if (strEQ(d,"pwent")) return -KEY_getpwent;
3951 if (strEQ(d,"pwnam")) return -KEY_getpwnam;
3952 if (strEQ(d,"pwuid")) return -KEY_getpwuid;
3955 if (strEQ(d,"peername")) return -KEY_getpeername;
3956 if (strEQ(d,"protoent")) return -KEY_getprotoent;
3957 if (strEQ(d,"priority")) return -KEY_getpriority;
3960 if (strEQ(d,"protobyname")) return -KEY_getprotobyname;
3963 if (strEQ(d,"protobynumber"))return -KEY_getprotobynumber;
3967 else if (*d == 'h') {
3968 if (strEQ(d,"hostbyname")) return -KEY_gethostbyname;
3969 if (strEQ(d,"hostbyaddr")) return -KEY_gethostbyaddr;
3970 if (strEQ(d,"hostent")) return -KEY_gethostent;
3972 else if (*d == 'n') {
3973 if (strEQ(d,"netbyname")) return -KEY_getnetbyname;
3974 if (strEQ(d,"netbyaddr")) return -KEY_getnetbyaddr;
3975 if (strEQ(d,"netent")) return -KEY_getnetent;
3977 else if (*d == 's') {
3978 if (strEQ(d,"servbyname")) return -KEY_getservbyname;
3979 if (strEQ(d,"servbyport")) return -KEY_getservbyport;
3980 if (strEQ(d,"servent")) return -KEY_getservent;
3981 if (strEQ(d,"sockname")) return -KEY_getsockname;
3982 if (strEQ(d,"sockopt")) return -KEY_getsockopt;
3984 else if (*d == 'g') {
3985 if (strEQ(d,"grent")) return -KEY_getgrent;
3986 if (strEQ(d,"grnam")) return -KEY_getgrnam;
3987 if (strEQ(d,"grgid")) return -KEY_getgrgid;
3989 else if (*d == 'l') {
3990 if (strEQ(d,"login")) return -KEY_getlogin;
3992 else if (strEQ(d,"c")) return -KEY_getc;
3997 if (strEQ(d,"gt")) return -KEY_gt;
3998 if (strEQ(d,"ge")) return -KEY_ge;
4001 if (strEQ(d,"grep")) return KEY_grep;
4002 if (strEQ(d,"goto")) return KEY_goto;
4003 if (strEQ(d,"glob")) return KEY_glob;
4006 if (strEQ(d,"gmtime")) return -KEY_gmtime;
4011 if (strEQ(d,"hex")) return -KEY_hex;
4014 if (strEQ(d,"INIT")) return KEY_INIT;
4019 if (strEQ(d,"if")) return KEY_if;
4022 if (strEQ(d,"int")) return -KEY_int;
4025 if (strEQ(d,"index")) return -KEY_index;
4026 if (strEQ(d,"ioctl")) return -KEY_ioctl;
4031 if (strEQ(d,"join")) return -KEY_join;
4035 if (strEQ(d,"keys")) return KEY_keys;
4036 if (strEQ(d,"kill")) return -KEY_kill;
4041 if (strEQ(d,"LT")) { deprecate(d); return -KEY_lt;}
4042 if (strEQ(d,"LE")) { deprecate(d); return -KEY_le;}
4048 if (strEQ(d,"lt")) return -KEY_lt;
4049 if (strEQ(d,"le")) return -KEY_le;
4050 if (strEQ(d,"lc")) return -KEY_lc;
4053 if (strEQ(d,"log")) return -KEY_log;
4056 if (strEQ(d,"last")) return KEY_last;
4057 if (strEQ(d,"link")) return -KEY_link;
4058 if (strEQ(d,"lock")) return -KEY_lock;
4061 if (strEQ(d,"local")) return KEY_local;
4062 if (strEQ(d,"lstat")) return -KEY_lstat;
4065 if (strEQ(d,"length")) return -KEY_length;
4066 if (strEQ(d,"listen")) return -KEY_listen;
4069 if (strEQ(d,"lcfirst")) return -KEY_lcfirst;
4072 if (strEQ(d,"localtime")) return -KEY_localtime;
4078 case 1: return KEY_m;
4080 if (strEQ(d,"my")) return KEY_my;
4083 if (strEQ(d,"map")) return KEY_map;
4086 if (strEQ(d,"mkdir")) return -KEY_mkdir;
4089 if (strEQ(d,"msgctl")) return -KEY_msgctl;
4090 if (strEQ(d,"msgget")) return -KEY_msgget;
4091 if (strEQ(d,"msgrcv")) return -KEY_msgrcv;
4092 if (strEQ(d,"msgsnd")) return -KEY_msgsnd;
4097 if (strEQ(d,"NE")) { deprecate(d); return -KEY_ne;}
4100 if (strEQ(d,"next")) return KEY_next;
4101 if (strEQ(d,"ne")) return -KEY_ne;
4102 if (strEQ(d,"not")) return -KEY_not;
4103 if (strEQ(d,"no")) return KEY_no;
4108 if (strEQ(d,"or")) return -KEY_or;
4111 if (strEQ(d,"ord")) return -KEY_ord;
4112 if (strEQ(d,"oct")) return -KEY_oct;
4115 if (strEQ(d,"open")) return -KEY_open;
4118 if (strEQ(d,"opendir")) return -KEY_opendir;
4125 if (strEQ(d,"pop")) return KEY_pop;
4126 if (strEQ(d,"pos")) return KEY_pos;
4129 if (strEQ(d,"push")) return KEY_push;
4130 if (strEQ(d,"pack")) return -KEY_pack;
4131 if (strEQ(d,"pipe")) return -KEY_pipe;
4134 if (strEQ(d,"print")) return KEY_print;
4137 if (strEQ(d,"printf")) return KEY_printf;
4140 if (strEQ(d,"package")) return KEY_package;
4143 if (strEQ(d,"prototype")) return KEY_prototype;
4148 if (strEQ(d,"q")) return KEY_q;
4149 if (strEQ(d,"qq")) return KEY_qq;
4150 if (strEQ(d,"qw")) return KEY_qw;
4151 if (strEQ(d,"qx")) return KEY_qx;
4153 else if (strEQ(d,"quotemeta")) return -KEY_quotemeta;
4158 if (strEQ(d,"ref")) return -KEY_ref;
4161 if (strEQ(d,"read")) return -KEY_read;
4162 if (strEQ(d,"rand")) return -KEY_rand;
4163 if (strEQ(d,"recv")) return -KEY_recv;
4164 if (strEQ(d,"redo")) return KEY_redo;
4167 if (strEQ(d,"rmdir")) return -KEY_rmdir;
4168 if (strEQ(d,"reset")) return -KEY_reset;
4171 if (strEQ(d,"return")) return KEY_return;
4172 if (strEQ(d,"rename")) return -KEY_rename;
4173 if (strEQ(d,"rindex")) return -KEY_rindex;
4176 if (strEQ(d,"require")) return -KEY_require;
4177 if (strEQ(d,"reverse")) return -KEY_reverse;
4178 if (strEQ(d,"readdir")) return -KEY_readdir;
4181 if (strEQ(d,"readlink")) return -KEY_readlink;
4182 if (strEQ(d,"readline")) return -KEY_readline;
4183 if (strEQ(d,"readpipe")) return -KEY_readpipe;
4186 if (strEQ(d,"rewinddir")) return -KEY_rewinddir;
4192 case 0: return KEY_s;
4194 if (strEQ(d,"scalar")) return KEY_scalar;
4199 if (strEQ(d,"seek")) return -KEY_seek;
4200 if (strEQ(d,"send")) return -KEY_send;
4203 if (strEQ(d,"semop")) return -KEY_semop;
4206 if (strEQ(d,"select")) return -KEY_select;
4207 if (strEQ(d,"semctl")) return -KEY_semctl;
4208 if (strEQ(d,"semget")) return -KEY_semget;
4211 if (strEQ(d,"setpgrp")) return -KEY_setpgrp;
4212 if (strEQ(d,"seekdir")) return -KEY_seekdir;
4215 if (strEQ(d,"setpwent")) return -KEY_setpwent;
4216 if (strEQ(d,"setgrent")) return -KEY_setgrent;
4219 if (strEQ(d,"setnetent")) return -KEY_setnetent;
4222 if (strEQ(d,"setsockopt")) return -KEY_setsockopt;
4223 if (strEQ(d,"sethostent")) return -KEY_sethostent;
4224 if (strEQ(d,"setservent")) return -KEY_setservent;
4227 if (strEQ(d,"setpriority")) return -KEY_setpriority;
4228 if (strEQ(d,"setprotoent")) return -KEY_setprotoent;
4235 if (strEQ(d,"shift")) return KEY_shift;
4238 if (strEQ(d,"shmctl")) return -KEY_shmctl;
4239 if (strEQ(d,"shmget")) return -KEY_shmget;
4242 if (strEQ(d,"shmread")) return -KEY_shmread;
4245 if (strEQ(d,"shmwrite")) return -KEY_shmwrite;
4246 if (strEQ(d,"shutdown")) return -KEY_shutdown;
4251 if (strEQ(d,"sin")) return -KEY_sin;
4254 if (strEQ(d,"sleep")) return -KEY_sleep;
4257 if (strEQ(d,"sort")) return KEY_sort;
4258 if (strEQ(d,"socket")) return -KEY_socket;
4259 if (strEQ(d,"socketpair")) return -KEY_socketpair;
4262 if (strEQ(d,"split")) return KEY_split;
4263 if (strEQ(d,"sprintf")) return -KEY_sprintf;
4264 if (strEQ(d,"splice")) return KEY_splice;
4267 if (strEQ(d,"sqrt")) return -KEY_sqrt;
4270 if (strEQ(d,"srand")) return -KEY_srand;
4273 if (strEQ(d,"stat")) return -KEY_stat;
4274 if (strEQ(d,"study")) return KEY_study;
4277 if (strEQ(d,"substr")) return -KEY_substr;
4278 if (strEQ(d,"sub")) return KEY_sub;
4283 if (strEQ(d,"system")) return -KEY_system;
4286 if (strEQ(d,"symlink")) return -KEY_symlink;
4287 if (strEQ(d,"syscall")) return -KEY_syscall;
4288 if (strEQ(d,"sysopen")) return -KEY_sysopen;
4289 if (strEQ(d,"sysread")) return -KEY_sysread;
4290 if (strEQ(d,"sysseek")) return -KEY_sysseek;
4293 if (strEQ(d,"syswrite")) return -KEY_syswrite;
4302 if (strEQ(d,"tr")) return KEY_tr;
4305 if (strEQ(d,"tie")) return KEY_tie;
4308 if (strEQ(d,"tell")) return -KEY_tell;
4309 if (strEQ(d,"tied")) return KEY_tied;
4310 if (strEQ(d,"time")) return -KEY_time;
4313 if (strEQ(d,"times")) return -KEY_times;
4316 if (strEQ(d,"telldir")) return -KEY_telldir;
4319 if (strEQ(d,"truncate")) return -KEY_truncate;
4326 if (strEQ(d,"uc")) return -KEY_uc;
4329 if (strEQ(d,"use")) return KEY_use;
4332 if (strEQ(d,"undef")) return KEY_undef;
4333 if (strEQ(d,"until")) return KEY_until;
4334 if (strEQ(d,"untie")) return KEY_untie;
4335 if (strEQ(d,"utime")) return -KEY_utime;
4336 if (strEQ(d,"umask")) return -KEY_umask;
4339 if (strEQ(d,"unless")) return KEY_unless;
4340 if (strEQ(d,"unpack")) return -KEY_unpack;
4341 if (strEQ(d,"unlink")) return -KEY_unlink;
4344 if (strEQ(d,"unshift")) return KEY_unshift;
4345 if (strEQ(d,"ucfirst")) return -KEY_ucfirst;
4350 if (strEQ(d,"values")) return -KEY_values;
4351 if (strEQ(d,"vec")) return -KEY_vec;
4356 if (strEQ(d,"warn")) return -KEY_warn;
4357 if (strEQ(d,"wait")) return -KEY_wait;
4360 if (strEQ(d,"while")) return KEY_while;
4361 if (strEQ(d,"write")) return -KEY_write;
4364 if (strEQ(d,"waitpid")) return -KEY_waitpid;
4367 if (strEQ(d,"wantarray")) return -KEY_wantarray;
4372 if (len == 1) return -KEY_x;
4373 if (strEQ(d,"xor")) return -KEY_xor;
4376 if (len == 1) return KEY_y;
/*
 * checkcomma: advisory check on the text at `s` that follows the operator
 * called `name`; `what` is only used in the fatal "No comma allowed"
 * message.
 * NOTE(review): several lines of this routine (declarations, loop bodies,
 * the condition guarding the croak) are not visible in this listing; the
 * comments below describe only what the shown lines do.
 */
4385 checkcomma(register char *s, char *name, char *what)
/* Only when warnings are on and the text begins with " (". */
4389 if (dowarn && *s == ' ' && s[1] == '(') { /* XXX gotta be a better way */
/* Scan forward from just past the '(' for as long as `level` is non-zero. */
4391 for (w = s+2; *w && level; w++) {
/*
 * Skip whitespace after the scanned region, then warn unless the next
 * character is one of ;|})]oaiuw!= (end of string also warns).
 */
4398 for (; *w && isSPACE(*w); w++) ;
4399 if (!*w || !strchr(";|})]oaiuw!=", *w)) /* an advisory hack only... */
4400 warn("%s (...) interpreted as function",name);
/* Whitespace is skipped (bounded by bufend) before each inspection of *s. */
4402 while (s < bufend && isSPACE(*s))
4406 while (s < bufend && isSPACE(*s))
4408 if (isIDFIRST(*s)) {
4412 while (s < bufend && isSPACE(*s))
/* kw is non-zero when the word is a keyword or perl_get_cv() returns non-null. */
4417 kw = keyword(w, s - w) || perl_get_cv(w, FALSE) != 0;
4421 croak("No comma allowed after %s", what);
/*
 * scan_word: copy a word starting at `s` into `dest` (capacity `destlen`).
 * Package separators (' and ::) are accepted only when `allow_package` is
 * set and an identifier-start character follows them.  Overlong input is
 * fatal ("Identifier too long").
 * NOTE(review): the copy loop, the use of `slp`, and the return value are
 * not visible in this listing -- presumably *slp receives the word length
 * and the updated `s` is returned; confirm against the full source.
 */
4427 scan_word(register char *s, char *dest, STRLEN destlen, int allow_package, STRLEN *slp)
4429 register char *d = dest;
/* `e` is the write limit: three bytes short of the end of dest. */
4430 register char *e = d + destlen - 3; /* two-character token, ending NUL */
4433 croak(ident_too_long);
/* Old-style package separator: a single quote followed by an identifier start. */
4436 else if (*s == '\'' && allow_package && isIDFIRST(s[1])) {
/* New-style package separator: "::" followed by an identifier start. */
4441 else if (*s == ':' && s[1] == ':' && allow_package && isIDFIRST(s[2])) {
/*
 * scan_ident: scan a variable name beginning at `s` (not past `send`) and
 * copy it into `dest` (capacity `destlen`).  Handles all-digit names,
 * package-qualified names, a `$` followed by another sigil-like character,
 * ^X style names and the bracketed ${name} form, adjusting lex_state for
 * interpolation contexts along the way.  Overlong names are fatal
 * ("Identifier too long").
 * NOTE(review): many lines (declarations, loop bodies, the use of `ck_uni`,
 * the return statement) are not visible in this listing; comments describe
 * only what the shown lines do.
 */
4454 scan_ident(register char *s, register char *send, char *dest, STRLEN destlen, I32 ck_uni)
4461 if (lex_brackets == 0)
/* `e` is the write limit: three bytes short of the end of dest. */
4466 e = d + destlen - 3; /* two-character token, ending NUL */
/* Name made of digits. */
4468 while (isDIGIT(*s)) {
4470 croak(ident_too_long);
4477 croak(ident_too_long);
/* Package separators: ' followed by an identifier start, or "::". */
4480 else if (*s == '\'' && isIDFIRST(s[1])) {
4485 else if (*s == ':' && s[1] == ':') {
/* Outside normal lexing, flag that the interpolated expression may end here. */
4496 if (lex_state != LEX_NORMAL)
4497 lex_state = LEX_INTERPENDMAYBE;
/*
 * A '$' followed by an alphanumeric, '$', '{' or "::".  "$$<digit>" inside
 * an interpolating context draws a deprecation warning.
 */
4500 if (*s == '$' && s[1] &&
4501 (isALNUM(s[1]) || strchr("${", s[1]) || strnEQ(s+1,"::",2)) )
4503 if (isDIGIT(s[1]) && lex_state == LEX_INTERPNORMAL)
4504 deprecate("\"$$<digit>\" to mean \"${$}<digit>\"");
/* Caret form: '^' followed by an uppercase letter or one of [ \ ] ^ _ ? */
4517 if (*d == '^' && *s && (isUPPER(*s) || strchr("[\\]^_?", *s))) {
4522 if (isSPACE(s[-1])) {
4525 if (ch != ' ' && ch != '\t') {
/* Identifier collected into dest: consume the rest of the name (and ':'). */
4531 if (isIDFIRST(*d)) {
4533 while (isALNUM(*s) || *s == ':')
/* Skip blanks, then look for a subscript that follows the name. */
4536 while (s < send && (*s == ' ' || *s == '\t')) s++;
/* '[' always counts; '{' counts unless the name is exactly "sub". */
4537 if ((*s == '[' || (*s == '{' && strNE(dest, "sub")))) {
/* With warnings on, a name that is also a keyword is reported as ambiguous. */
4538 if (dowarn && keyword(dest, d - dest)) {
4539 char *brack = *s == '[' ? "[...]" : "{...}";
4540 warn("Ambiguous use of %c{%s%s} resolved to %c%s%s",
4541 funny, dest, brack, funny, dest, brack);
/* Record a fake bracket level and push XOPERATOR on the bracket stack. */
4543 lex_fakebrack = lex_brackets+1;
4545 lex_brackstack[lex_brackets++] = XOPERATOR;
/* In an interpolating context with no open brackets the expression ends. */
4551 if (lex_state == LEX_INTERPNORMAL && !lex_brackets)
4552 lex_state = LEX_INTERPEND;
/*
 * In normal code with warnings on, a braced name that is a keyword or for
 * which perl_get_cv() returns non-null is reported as ambiguous.
 */
4555 if (dowarn && lex_state == LEX_NORMAL &&
4556 (keyword(dest, d - dest) || perl_get_cv(dest, FALSE)))
4557 warn("Ambiguous use of %c{%s} resolved to %c%s",
4558 funny, dest, funny, dest);
4561 s = bracket; /* let the parser handle it */
/* Unbracketed name while interpolating: stop if intuit_more() says no more. */
4565 else if (lex_state == LEX_INTERPNORMAL && !lex_brackets && !intuit_more(s))
4566 lex_state = LEX_INTERPEND;
/*
 * pmflag: OR one pattern-match flag into *pmfl according to the modifier
 * character `ch`.
 * NOTE(review): the lines selecting which flag goes with which character
 * are not visible in this listing; only the flag assignments are shown.
 * The callers in this file feed it characters drawn from "iogcmsx" and
 * "iogcmsex".
 */
4570 void pmflag(U16 *pmfl, int ch)
4575 *pmfl |= PMf_GLOBAL;
4577 *pmfl |= PMf_CONTINUE;
4581 *pmfl |= PMf_MULTILINE;
4583 *pmfl |= PMf_SINGLELINE;
4585 *pmfl |= PMf_EXTENDED;
/*
 * scan_pat: scan a match pattern beginning at `start`.  The delimited text
 * is read with scan_str(); failure to terminate is fatal ("Search pattern
 * not terminated").  Builds an OP_MATCH PMOP, applies trailing modifier
 * characters, and sets yylval.ival to OP_MATCH.
 * NOTE(review): some lines (declarations, the failure test, the return) are
 * not visible in this listing.
 */
4589 scan_pat(char *start)
4594 s = scan_str(start);
/* Failure path: drop the partially collected text before croaking. */
4597 SvREFCNT_dec(lex_stuff);
4599 croak("Search pattern not terminated");
4602 pm = (PMOP*)newPMOP(OP_MATCH, 0);
/* A '?' opening delimiter marks the match as PMf_ONCE. */
4603 if (multi_open == '?')
4604 pm->op_pmflags |= PMf_ONCE;
/* Consume trailing modifier letters, folding each into the flags. */
4605 while (*s && strchr("iogcmsx", *s))
4606 pmflag(&pm->op_pmflags,*s++);
/* Keep a copy of the flags as the "permanent" set. */
4607 pm->op_pmpermflags = pm->op_pmflags;
4610 yylval.ival = OP_MATCH;
/*
 * scan_subst: scan a substitution beginning at `start`.  The pattern and
 * the replacement are each read with scan_str(); an unterminated part is
 * fatal.  Builds an OP_SUBST PMOP, applies trailing modifier characters,
 * wraps the replacement in "eval { ... }" or "do { ... }" text for the
 * evaluated-replacement case, and sets yylval.ival to OP_SUBST.
 * NOTE(review): a number of lines (declarations, failure tests, handling of
 * the 'e' modifier count, the return) are not visible in this listing.
 */
4615 scan_subst(char *start)
4622 yylval.ival = OP_NULL;
4624 s = scan_str(start);
/* Pattern half failed to terminate: release what was collected and die. */
4628 SvREFCNT_dec(lex_stuff);
4630 croak("Substitution pattern not terminated");
4633 if (s[-1] == multi_open)
/* Remember where the first half started so it can be restored below. */
4636 first_start = multi_start;
/* Replacement half failed to terminate: release both halves and die. */
4640 SvREFCNT_dec(lex_stuff);
4643 SvREFCNT_dec(lex_repl);
4645 croak("Substitution replacement not terminated");
4647 multi_start = first_start; /* so whole substitution is taken together */
4649 pm = (PMOP*)newPMOP(OP_SUBST, 0);
/* Consume trailing modifier letters; 'e' is accepted here in addition. */
4650 while (*s && strchr("iogcmsex", *s)) {
4656 pmflag(&pm->op_pmflags,*s++);
/* Evaluated replacement: rebuild it as "eval { ... }" or "do { ... }". */
4661 pm->op_pmflags |= PMf_EVAL;
4662 repl = newSVpv("",0);
4664 sv_catpv(repl, es ? "eval " : "do ");
4665 sv_catpvn(repl, "{ ", 2);
4666 sv_catsv(repl, lex_repl);
/*
 * NOTE(review): the literal below is three characters but the length passed
 * is 2, so presumably only " }" is appended and the ';' is never used --
 * confirm whether that is intended.
 */
4667 sv_catpvn(repl, " };", 2);
4668 SvCOMPILED_on(repl);
4669 SvREFCNT_dec(lex_repl);
/* Keep a copy of the flags as the "permanent" set. */
4673 pm->op_pmpermflags = pm->op_pmflags;
4675 yylval.ival = OP_SUBST;
/*
 * hoistmust: choose which fixed string of the compiled regexp attached to
 * `pm` becomes op_pmshort (with op_pmslen set to its length), picking
 * between the regexp's `regstart` and `regmust` strings and setting
 * PMf_SCANFIRST where the visible conditions call for it.
 * NOTE(review): a few lines (braces, possibly early returns) are not
 * visible in this listing.
 */
4680 hoistmust(register PMOP *pm)
/*
 * No short string yet and the regexp has a start string: use it when there
 * is no must-string or the regexp is anchored.
 */
4683 if (!pm->op_pmshort && pm->op_pmregexp->regstart &&
4684 (!pm->op_pmregexp->regmust || pm->op_pmregexp->reganch & ROPT_ANCH)
/* SCANFIRST is set only for the unanchored case. */
4686 if (!(pm->op_pmregexp->reganch & ROPT_ANCH))
4687 pm->op_pmflags |= PMf_SCANFIRST;
4688 pm->op_pmshort = SvREFCNT_inc(pm->op_pmregexp->regstart);
4689 pm->op_pmslen = SvCUR(pm->op_pmshort);
4691 else if (pm->op_pmregexp->regmust) {/* is there a better short-circuit? */
/* Short string and must-string are equal: one of the two is released. */
4692 if (pm->op_pmshort &&
4693 sv_eq(pm->op_pmshort,pm->op_pmregexp->regmust))
4695 if (pm->op_pmflags & PMf_SCANFIRST) {
4696 SvREFCNT_dec(pm->op_pmshort);
4697 pm->op_pmshort = Nullsv;
4700 SvREFCNT_dec(pm->op_pmregexp->regmust);
4701 pm->op_pmregexp->regmust = Nullsv;
4705 /* promote the better string */
/*
 * Promote regmust when there is no short string (and the regexp is not
 * GPOS-anchored), or when the current SCANFIRST string is shorter than it.
 */
4706 if ((!pm->op_pmshort &&
4707 !(pm->op_pmregexp->reganch & ROPT_ANCH_GPOS)) ||
4708 ((pm->op_pmflags & PMf_SCANFIRST) &&
4709 (SvCUR(pm->op_pmshort) < SvCUR(pm->op_pmregexp->regmust)))) {
4710 SvREFCNT_dec(pm->op_pmshort); /* ok if null */
/* Ownership of the must-string moves from the regexp to the op. */
4711 pm->op_pmshort = pm->op_pmregexp->regmust;
4712 pm->op_pmslen = SvCUR(pm->op_pmshort);
4713 pm->op_pmregexp->regmust = Nullsv;
4714 pm->op_pmflags |= PMf_SCANFIRST;
/*
 * scan_trans: scan a transliteration beginning at `start`.  The search list
 * and the replacement list are each read with scan_str(); an unterminated
 * part is fatal.  Allocates a 256-entry table of shorts, builds an OP_TRANS
 * op around it, records the c/d/s modifiers in op_private, and sets
 * yylval.ival to OP_TRANS.
 * NOTE(review): some lines (declarations, failure tests, the per-modifier
 * branching, the return) are not visible in this listing.
 */
4720 scan_trans(char *start)
4729 yylval.ival = OP_NULL;
4731 s = scan_str(start);
/* Search list failed to terminate: release what was collected and die. */
4734 SvREFCNT_dec(lex_stuff);
4736 croak("Translation pattern not terminated");
4738 if (s[-1] == multi_open)
/* Replacement list failed to terminate: release both parts and die. */
4744 SvREFCNT_dec(lex_stuff);
4747 SvREFCNT_dec(lex_repl);
4749 croak("Translation replacement not terminated");
/* The translation table is handed to the op as its PV payload. */
4752 New(803,tbl,256,short);
4753 o = newPVOP(OP_TRANS, 0, (char*)tbl);
/* Collect trailing modifier letters c, d and s in any order. */
4755 complement = Delete = squash = 0;
4756 while (*s == 'c' || *s == 'd' || *s == 's') {
4758 complement = OPpTRANS_COMPLEMENT;
4760 Delete = OPpTRANS_DELETE;
4762 squash = OPpTRANS_SQUASH;
4765 o->op_private = Delete|squash|complement;
4768 yylval.ival = OP_TRANS;
/*
 * scan_heredoc: scan a here-document whose introducer is at `s`.  The
 * terminator is collected into tokenbuf, the remainder of the introducing
 * line is saved in `herewas`, and the document body is accumulated in
 * `tmpstr`, either from the current buffer or by reading further lines with
 * filter_gets().  A missing terminator is reported through missingterm().
 * On success yylval.ival is set to the op type (OP_SCALAR by default,
 * OP_BACKTICK for a backtick-quoted terminator).
 * NOTE(review): many lines (declarations, loop bodies, the return) are not
 * visible in this listing; comments describe only what the shown lines do.
 */
4773 scan_heredoc(register char *s)
4777 I32 op_type = OP_SCALAR;
/* True when there is an input handle and we are not inside lex_inwhat. */
4784 int outer = (rsfp && !lex_inwhat);
4788 e = tokenbuf + sizeof tokenbuf - 1;
/* Look past blanks for a quoted terminator (backtick, single or double quote). */
4791 for (peek = s; *peek == ' ' || *peek == '\t'; peek++) ;
4792 if (*peek && strchr("`'\"",*peek)) {
4795 s = delimcpy(d, e, s, bufend, term, &len);
/* Unquoted terminator: a bare << is deprecated; copy the word characters. */
4806 deprecate("bare << to mean <<\"\"");
4807 for (; isALNUM(*s); s++) {
4812 if (d >= tokenbuf + sizeof tokenbuf - 1)
4813 croak("Delimiter for here document is too long");
/* Save the rest of the introducing line so it can be re-lexed afterwards. */
4818 if (outer || !(d=ninstr(s,bufend,d,d+1)))
4819 herewas = newSVpv(s,bufend-s);
4821 s--, herewas = newSVpv(s,d-s);
4822 s += SvCUR(herewas);
/* Body accumulator. */
4824 tmpstr = NEWSV(87,80);
4825 sv_upgrade(tmpstr, SVt_PVIV);
4830 else if (term == '`') {
4831 op_type = OP_BACKTICK;
4832 SvIVX(tmpstr) = '\\';
/* Record where the construct starts for later diagnostics. */
4836 multi_start = curcop->cop_line;
4837 multi_open = multi_close = '<';
/* Search within the current buffer for a line matching the terminator. */
4841 while (s < bufend &&
4842 (*s != term || memNE(s,tokenbuf,len)) ) {
4847 curcop->cop_line = multi_start;
4848 missingterm(tokenbuf);
4850 sv_setpvn(tmpstr,d+1,s-d);
/* Splice the saved remainder back in and reset the buffer pointers. */
4852 sv_catpvn(herewas,s,bufend-s);
4853 sv_setsv(linestr,herewas);
4854 oldoldbufptr = oldbufptr = bufptr = s = linestart = SvPVX(linestr);
4855 bufend = SvPVX(linestr) + SvCUR(linestr);
4858 sv_setpvn(tmpstr,"",0); /* avoid "uninitialized" warning */
4859 while (s >= bufend) { /* multiple line string? */
4861 !(oldoldbufptr = oldbufptr = s = linestart = filter_gets(linestr, rsfp, 0))) {
4862 curcop->cop_line = multi_start;
4863 missingterm(tokenbuf);
/* Under the line debugger, store a copy of each line read by line number. */
4866 if (PERLDB_LINE && curstash != debstash) {
4867 SV *sv = NEWSV(88,0);
4869 sv_upgrade(sv, SVt_PVMG);
4870 sv_setsv(sv,linestr);
4871 av_store(GvAV(curcop->cop_filegv),
4872 (I32)curcop->cop_line,sv);
4874 bufend = SvPVX(linestr) + SvCUR(linestr);
/* Terminator line found: append the saved remainder; otherwise keep the line. */
4875 if (*s == term && memEQ(s,tokenbuf,len)) {
4878 sv_catsv(linestr,herewas);
4879 bufend = SvPVX(linestr) + SvCUR(linestr);
4883 sv_catsv(tmpstr,linestr);
4886 multi_end = curcop->cop_line;
/* Shrink the body's allocation when more than 5 bytes would go unused. */
4888 if (SvCUR(tmpstr) + 5 < SvLEN(tmpstr)) {
4889 SvLEN_set(tmpstr, SvCUR(tmpstr) + 1);
4890 Renew(SvPVX(tmpstr), SvLEN(tmpstr), char);
4892 SvREFCNT_dec(herewas);
4894 yylval.ival = op_type;
/*
 * scan_inputsymbol: scan a <...> construct beginning at `start`.  The text
 * up to '>' is copied into tokenbuf.  If it is not purely an optional '$'
 * followed by word, quote and colon characters, it is treated as a glob
 * (OP_GLOB) and rescanned with scan_str().  Otherwise a readline op is
 * built in lex_op, on a lexical, a scalar variable or a named handle, and
 * yylval.ival is set to OP_NULL.
 * NOTE(review): several lines (declarations, some branch conditions, the
 * return) are not visible in this listing.
 */
4899 scan_inputsymbol(char *start)
4901 register char *s = start;
/* Copy everything up to the closing '>' into tokenbuf. */
4907 e = tokenbuf + sizeof tokenbuf;
4908 s = delimcpy(d, e, s + 1, bufend, '>', &len);
4909 if (len >= sizeof tokenbuf)
4910 croak("Excessively long <> operator");
4912 croak("Unterminated <> operator");
/* Skip an optional leading '$', then word characters, quotes and colons. */
4914 if (*d == '$' && d[1]) d++;
4915 while (*d && (isALNUM(*d) || *d == '\'' || *d == ':'))
/* Anything left over means this is not a simple handle name: treat as glob. */
4917 if (d - tokenbuf != len) {
4918 yylval.ival = OP_GLOB;
4920 s = scan_str(start);
4922 croak("Glob not terminated");
/* NOTE(review): the condition guarding this default to "ARGV" is not visible. */
4928 (void)strcpy(d,"ARGV");
/* Name found in the pad: read through the lexical. */
4931 if ((tmp = pad_findmy(d)) != NOT_IN_PAD) {
4932 OP *o = newOP(OP_PADSV, 0);
4934 lex_op = (OP*)newUNOP(OP_READLINE, 0, newUNOP(OP_RV2GV, 0, o));
/* Otherwise look up the name after its first character as a scalar. */
4937 GV *gv = gv_fetchpv(d+1,TRUE, SVt_PV);
4938 lex_op = (OP*)newUNOP(OP_READLINE, 0,
4939 newUNOP(OP_RV2GV, 0,
4940 newUNOP(OP_RV2SV, 0,
4941 newGVOP(OP_GV, 0, gv))));
4943 yylval.ival = OP_NULL;
/* Plain name: fetch it as an IO-typed glob and read from it directly. */
4946 GV *gv = gv_fetchpv(d,TRUE, SVt_PVIO);
4947 lex_op = (OP*)newUNOP(OP_READLINE, 0, newGVOP(OP_GV, 0, gv));
4948 yylval.ival = OP_NULL;
/*
 * scan_str: scan a delimited string beginning at `start`, accumulating its
 * contents in an SV and reading further input lines with filter_gets() when
 * the closing delimiter is not on the current line.  Two copy loops are
 * used: one when the opening and closing delimiters are the same character,
 * and one for bracketing pairs, where nesting is counted.
 * NOTE(review): many lines (declarations, loop bodies, where the result SV
 * is stored, the return) are not visible in this listing.
 */
4955 scan_str(char *start)
4960 register char *s = start;
/* Remember the starting line for diagnostics. */
4969 multi_start = curcop->cop_line;
/* Look the opening delimiter up in the table of bracketing pairs. */
4971 if (term && (tmps = strchr("([{< )]}> )]}>",term)))
4976 sv_upgrade(sv, SVt_PVIV);
4978 (void)SvPOK_only(sv); /* validate pointer */
/* Make room for the rest of the current buffer, then append at the end. */
4981 SvGROW(sv, SvCUR(sv) + (bufend - s) + 1);
4982 to = SvPVX(sv)+SvCUR(sv);
/* Same opening and closing delimiter: no nesting to track. */
4983 if (multi_open == multi_close) {
4984 for (; s < bufend; s++,to++) {
4985 if (*s == '\n' && !rsfp)
/* Backslash handling is skipped when the delimiter itself is a backslash. */
4987 if (*s == '\\' && s+1 < bufend && term != '\\') {
4993 else if (*s == term)
/* Bracketing delimiters: track nesting depth in `brackets`. */
4999 for (; s < bufend; s++,to++) {
5000 if (*s == '\n' && !rsfp)
5002 if (*s == '\\' && s+1 < bufend) {
5003 if ((s[1] == multi_open) || (s[1] == multi_close))
5008 else if (*s == multi_close && --brackets <= 0)
5010 else if (*s == multi_open)
/* Commit the length of what has been copied so far. */
5016 SvCUR_set(sv, to - SvPVX(sv));
5018 if (s < bufend) break; /* string ends on this line? */
5021 !(oldoldbufptr = oldbufptr = s = linestart = filter_gets(linestr, rsfp, 0))) {
5023 curcop->cop_line = multi_start;
/* Under the line debugger, store a copy of each line read by line number. */
5027 if (PERLDB_LINE && curstash != debstash) {
5028 SV *sv = NEWSV(88,0);
5030 sv_upgrade(sv, SVt_PVMG);
5031 sv_setsv(sv,linestr);
5032 av_store(GvAV(curcop->cop_filegv),
5033 (I32)curcop->cop_line, sv);
5035 bufend = SvPVX(linestr) + SvCUR(linestr);
5037 multi_end = curcop->cop_line;
/* Shrink the allocation when more than 5 bytes would go unused. */
5039 if (SvCUR(sv) + 5 < SvLEN(sv)) {
5040 SvLEN_set(sv, SvCUR(sv) + 1);
5041 Renew(SvPVX(sv), SvLEN(sv), char);
/*
 * scan_num: scan a numeric literal beginning at `start` and leave an
 * OP_CONST op holding its value in yylval.opval.  One branch handles hex
 * and octal digits with an overflow warning; the other copies decimal
 * digits, an optional fraction and an optional exponent into tokenbuf and
 * converts the text with atof().  A literal that does not fit in tokenbuf
 * is fatal ("Number too long").
 * NOTE(review): many lines (declarations, switch heads, loop bodies, the
 * return) are not visible in this listing.
 */
5051 scan_num(char *start)
5053 register char *s = start;
5061 static char number_too_long[] = "Number too long";
5065 croak("panic: scan_num");
/* Hex/octal branch: `overflowed` ensures the warning is issued only once. */
5070 bool overflowed = FALSE;
5076 else if (s[1] == '.')
5092 yyerror("Illegal octal digit");
5094 case '0': case '1': case '2': case '3': case '4':
5095 case '5': case '6': case '7':
5098 case 'a': case 'b': case 'c': case 'd': case 'e': case 'f':
5099 case 'A': case 'B': case 'C': case 'D': case 'E': case 'F':
/* Shifting back must reproduce the previous value, else bits were lost. */
5105 if (!overflowed && (n >> shift) != u) {
5106 warn("Integer overflow in %s number",
5107 (shift == 4) ? "hex" : "octal");
5119 case '1': case '2': case '3': case '4': case '5':
5120 case '6': case '7': case '8': case '9': case '.':
5123 e = tokenbuf + sizeof tokenbuf - 6; /* room for various punctuation */
/* Integer part: digits and underscores. */
5125 while (isDIGIT(*s) || *s == '_') {
/* With warnings on, an underscore not 3 characters after the last one is flagged. */
5127 if (dowarn && lastub && s - lastub != 3)
5128 warn("Misplaced _ in number");
5133 croak(number_too_long);
5137 if (dowarn && lastub && s - lastub != 3)
5138 warn("Misplaced _ in number");
/* Fraction: a '.' that is not immediately followed by another '.'. */
5139 if (*s == '.' && s[1] != '.') {
5142 for (; isDIGIT(*s) || *s == '_'; s++) {
5144 croak(number_too_long);
/* Exponent: 'e' or 'E' followed by a sign or a digit. */
5149 if (*s && strchr("eE",*s) && strchr("+-0123456789",s[1])) {
5152 *d++ = 'e'; /* At least some Mach atof()s don't grok 'E' */
5153 if (*s == '+' || *s == '-')
5155 while (isDIGIT(*s)) {
5157 croak(number_too_long);
/* Convert the collected text. */
5163 SET_NUMERIC_STANDARD();
5164 value = atof(tokenbuf);
/* Store as an integer when no fraction/exponent was seen and it round-trips. */
5166 if (!floatit && (double)tryiv == value)
5167 sv_setiv(sv, tryiv);
5169 sv_setnv(sv, value);
5173 yylval.opval = newSVOP(OP_CONST, 0, sv);
/*
 * scan_formline: collect format picture lines starting at `s` into the SV
 * `stuff`, reading further input with filter_gets() as needed, then queue
 * tokens in nextval[] for the parser and set lex_state accordingly.  A
 * format that runs off the end of input is reported with
 * yyerror("Format not terminated").
 * NOTE(review): many lines (declarations, loop structure, branch
 * conditions, force_next calls, the return) are not visible in this listing.
 */
5179 scan_formline(register char *s)
5184 SV *stuff = newSVpv("",0);
5185 bool needargs = FALSE;
/* A line starting with '.' or '}' is inspected as a possible terminator. */
5188 if (*s == '.' || *s == '}') {
5190 for (t = s+1; *t == ' ' || *t == '\t'; t++) ;
/* Inside an eval with no input handle, lines are found by searching for '\n'. */
5194 if (in_eval && !rsfp) {
5195 eol = strchr(s,'\n');
5200 eol = bufend = SvPVX(linestr) + SvCUR(linestr);
/* Scan the line for "~~" and for field markers '@' and '^'. */
5202 for (t = s; t < eol; t++) {
5203 if (*t == '~' && t[1] == '~' && SvCUR(stuff)) {
5205 goto enough; /* ~~ must be first line in formline */
5207 if (*t == '@' || *t == '^')
5210 sv_catpvn(stuff, s, eol-s);
/* Fetch the next input line and reset the buffer pointers. */
5214 s = filter_gets(linestr, rsfp, 0);
5215 oldoldbufptr = oldbufptr = bufptr = linestart = SvPVX(linestr);
5216 bufend = bufptr + SvCUR(linestr);
5219 yyerror("Format not terminated");
/* Queue the collected text as an OP_CONST and an OP_FORMLINE token. */
5229 lex_state = LEX_NORMAL;
5230 nextval[nexttoke].ival = 0;
5234 lex_state = LEX_FORMLINE;
5235 nextval[nexttoke].opval = (OP*)newSVOP(OP_CONST, 0, stuff);
5237 nextval[nexttoke].ival = OP_FORMLINE;
/* Path on which the collected text is not handed to an op: release it. */
5241 SvREFCNT_dec(stuff);
5253 cshlen = strlen(cshname);
/*
 * start_subparse: begin compiling a new sub or format.  Saves the current
 * pad-related compile state on the save stack, creates a fresh compcv
 * (SVt_PVFM when `is_format` is true, otherwise SVt_PVCV) with `flags` ORed
 * into its CvFLAGS, sets up a new pad and pad-name list, and links the new
 * CV to the enclosing one through CvOUTSIDE.
 * Returns the save-stack index as it was on entry.
 * NOTE(review): some lines (further SAVE* calls, the creation of comppad,
 * the preprocessor conditionals that open the threaded sections) are not
 * visible in this listing.
 */
5258 start_subparse(I32 is_format, U32 flags)
/* Captured before any SAVE* call so the caller can unwind to this point. */
5261 I32 oldsavestack_ix = savestack_ix;
5262 CV* outsidecv = compcv;
5266 assert(SvTYPE(compcv) == SVt_PVCV);
5273 SAVESPTR(comppad_name);
5275 SAVEI32(comppad_name_fill);
5276 SAVEI32(min_intro_pending);
5277 SAVEI32(max_intro_pending);
5278 SAVEI32(pad_reset_pending);
/* Fresh CV for the code about to be compiled. */
5280 compcv = (CV*)NEWSV(1104,0);
5281 sv_upgrade((SV *)compcv, is_format ? SVt_PVFM : SVt_PVCV);
5282 CvFLAGS(compcv) |= flags;
/* Slot 0 of the new pad starts out empty. */
5285 av_push(comppad, Nullsv);
5286 curpad = AvARRAY(comppad);
5287 comppad_name = newAV();
5288 comppad_name_fill = 0;
5289 min_intro_pending = 0;
5291 subline = curcop->cop_line;
/* Threaded section: pad slot 0 is named "@_" and holds a new AV. */
5293 av_store(comppad_name, 0, newSVpv("@_", 2));
5294 curpad[0] = (SV*)newAV();
5295 SvPADMY_on(curpad[0]); /* XXX Needed? */
5296 CvOWNER(compcv) = 0;
5297 New(666, CvMUTEXP(compcv), 1, perl_mutex);
5298 MUTEX_INIT(CvMUTEXP(compcv));
5299 #endif /* USE_THREADS */
/* The padlist is a two-element AV: names at index 0, values at index 1. */
5301 comppadlist = newAV();
5302 AvREAL_off(comppadlist);
5303 av_store(comppadlist, 0, (SV*)comppad_name);
5304 av_store(comppadlist, 1, (SV*)comppad);
5306 CvPADLIST(compcv) = comppadlist;
5307 CvOUTSIDE(compcv) = (CV*)SvREFCNT_inc(outsidecv);
/*
 * NOTE(review): this CvOWNER/New/MUTEX_INIT sequence repeats the one a few
 * lines above.  If both are compiled under the same condition, the second
 * New() overwrites the pointer to the first mutex -- confirm and consider
 * removing one copy.
 */
5309 CvOWNER(compcv) = 0;
5310 New(666, CvMUTEXP(compcv), 1, perl_mutex);
5311 MUTEX_INIT(CvMUTEXP(compcv));
5312 #endif /* USE_THREADS */
5314 return oldsavestack_ix;
5333 char *context = NULL;
5337 if (!yychar || (yychar == ';' && !rsfp))
5339 else if (bufptr > oldoldbufptr && bufptr - oldoldbufptr < 200 &&
5340 oldoldbufptr != oldbufptr && oldbufptr != bufptr) {
5341 while (isSPACE(*oldoldbufptr))
5343 context = oldoldbufptr;
5344 contlen = bufptr - oldoldbufptr;
5346 else if (bufptr > oldbufptr && bufptr - oldbufptr < 200 &&
5347 oldbufptr != bufptr) {
5348 while (isSPACE(*oldbufptr))
5350 context = oldbufptr;
5351 contlen = bufptr - oldbufptr;
5353 else if (yychar > 255)
5354 where = "next token ???";
5355 else if ((yychar & 127) == 127) {
5356 if (lex_state == LEX_NORMAL ||
5357 (lex_state == LEX_KNOWNEXT && lex_defer == LEX_NORMAL))
5358 where = "at end of line";
5360 where = "within pattern";
5362 where = "within string";
5365 SV *where_sv = sv_2mortal(newSVpv("next char ", 0));
5367 sv_catpvf(where_sv, "^%c", toCTRL(yychar));
5368 else if (isPRINT_LC(yychar))
5369 sv_catpvf(where_sv, "%c", yychar);
5371 sv_catpvf(where_sv, "\\%03o", yychar & 255);
5372 where = SvPVX(where_sv);
5374 msg = sv_2mortal(newSVpv(s, 0));
5375 sv_catpvf(msg, " at %_ line %ld, ",
5376 GvSV(curcop->cop_filegv), (long)curcop->cop_line);
5378 sv_catpvf(msg, "near \"%.*s\"\n", contlen, context);
5380 sv_catpvf(msg, "%s\n", where);
5381 if (multi_start < multi_end && (U32)(curcop->cop_line - multi_end) <= 1) {
5383 " (Might be a runaway multi-line %c%c string starting on line %ld)\n",
5384 (int)multi_open,(int)multi_close,(long)multi_start);
5390 sv_catsv(ERRSV, msg);
5392 PerlIO_write(PerlIO_stderr(), SvPVX(msg), SvCUR(msg));
5393 if (++error_count >= 10)
5394 croak("%_ has too many errors.\n", GvSV(curcop->cop_filegv));
5396 in_my_stash = Nullhv;