X-Git-Url: http://git.shadowcat.co.uk/gitweb/gitweb.cgi?a=blobdiff_plain;f=Parameters.xs;h=bb306931316c1630808b9420304b74b9f7e693a9;hb=31534187f6c934412c03d27eb4eb05993950855c;hp=5372f04024cbb6c9d7cd1f5c7f9e73d919bc2ab5;hpb=abccbe865a63e6620c5f24d8cbd7872247e68b1b;p=p5sagit%2FFunction-Parameters.git diff --git a/Parameters.xs b/Parameters.xs index 5372f04..bb30693 100644 --- a/Parameters.xs +++ b/Parameters.xs @@ -156,9 +156,6 @@ static int kw_flags(pTHX_ const char *kw_ptr, STRLEN kw_len, KWSpec *spec) { } -#include "toke_on_crack.c.inc" - - static void free_defspec(pTHX_ void *vp) { DefaultParamSpec *dp = vp; op_free(dp->init); @@ -216,11 +213,235 @@ enum { MY_ATTR_SPECIAL = 0x04 }; +static void my_sv_cat_c(pTHX_ SV *sv, U32 c) { + char ds[UTF8_MAXBYTES + 1], *d; + d = uvchr_to_utf8(ds, c); + if (d - ds > 1) { + sv_utf8_upgrade(sv); + } + sv_catpvn(sv, ds, d - ds); +} + +static bool my_is_uni_xidfirst(pTHX_ UV c) { + U8 tmpbuf[UTF8_MAXBYTES + 1]; + uvchr_to_utf8(tmpbuf, c); + return is_utf8_xidfirst(tmpbuf); +} + +static bool my_is_uni_xidcont(pTHX_ UV c) { + U8 tmpbuf[UTF8_MAXBYTES + 1]; + uvchr_to_utf8(tmpbuf, c); + return is_utf8_xidcont(tmpbuf); +} + +static SV *my_scan_word(pTHX_ bool allow_package) { + bool at_start, at_substart; + I32 c; + SV *sv = sv_2mortal(newSVpvs("")); + if (lex_bufutf8()) { + SvUTF8_on(sv); + } + + at_start = at_substart = TRUE; + c = lex_peek_unichar(0); + + while (c != -1) { + if (at_substart ? my_is_uni_xidfirst(aTHX_ c) : my_is_uni_xidcont(aTHX_ c)) { + lex_read_unichar(0); + my_sv_cat_c(aTHX_ sv, c); + at_substart = FALSE; + c = lex_peek_unichar(0); + } else if (allow_package && !at_substart && c == '\'') { + lex_read_unichar(0); + c = lex_peek_unichar(0); + if (!my_is_uni_xidfirst(aTHX_ c)) { + lex_stuff_pvs("'", 0); + break; + } + sv_catpvs(sv, "'"); + at_substart = TRUE; + } else if (allow_package && (at_start || !at_substart) && c == ':') { + lex_read_unichar(0); + if (lex_peek_unichar(0) != ':') { + lex_stuff_pvs(":", 0); + break; + } + lex_read_unichar(0); + c = lex_peek_unichar(0); + if (!my_is_uni_xidfirst(aTHX_ c)) { + lex_stuff_pvs("::", 0); + break; + } + sv_catpvs(sv, "::"); + at_substart = TRUE; + } else { + break; + } + at_start = FALSE; + } + + return SvCUR(sv) ? sv : NULL; +} + +static SV *my_scan_parens_tail(pTHX_ bool keep_backslash) { + I32 c, nesting; + SV *sv; + line_t start; + + start = CopLINE(PL_curcop); + + sv = sv_2mortal(newSVpvs("")); + if (lex_bufutf8()) { + SvUTF8_on(sv); + } + + nesting = 0; + for (;;) { + c = lex_read_unichar(0); + if (c == EOF) { + CopLINE_set(PL_curcop, start); + return NULL; + } + + if (c == '\\') { + c = lex_read_unichar(0); + if (c == EOF) { + CopLINE_set(PL_curcop, start); + return NULL; + } + if (keep_backslash || (c != '(' && c != ')')) { + sv_catpvs(sv, "\\"); + } + } else if (c == '(') { + nesting++; + } else if (c == ')') { + if (!nesting) { + break; + } + nesting--; + } + + my_sv_cat_c(aTHX_ sv, c); + } + + return sv; +} + +static void my_check_prototype(pTHX_ const SV *declarator, SV *proto) { + char *start, *r, *w, *end; + STRLEN len; + + /* strip spaces */ + start = SvPV(proto, len); + end = start + len; + + for (w = r = start; r < end; r++) { + if (!isSPACE(*r)) { + *w++ = *r; + } + } + *w = '\0'; + SvCUR_set(proto, w - start); + end = w; + len = end - start; + + if (!ckWARN(WARN_ILLEGALPROTO)) { + return; + } + + /* check for bad characters */ + if (strspn(start, "$@%*;[]&\\_+") != len) { + SV *dsv = newSVpvs_flags("", SVs_TEMP); + warner( + packWARN(WARN_ILLEGALPROTO), + "Illegal character in prototype for %"SVf" : %s", + SVfARG(declarator), + SvUTF8(proto) + ? sv_uni_display( + dsv, + proto, + len, + UNI_DISPLAY_ISPRINT + ) + : pv_pretty(dsv, start, len, 60, NULL, NULL, + PERL_PV_ESCAPE_NONASCII + ) + ); + return; + } + + for (r = start; r < end; r++) { + switch (*r) { + default: + warner( + packWARN(WARN_ILLEGALPROTO), + "Illegal character in prototype for %"SVf" : %s", + SVfARG(declarator), r + ); + return; + + case '_': + if (r[1] && !strchr(";@%", *r)) { + warner( + packWARN(WARN_ILLEGALPROTO), + "Illegal character after '_' in prototype for %"SVf" : %s", + SVfARG(declarator), r + ); + return; + } + break; + + case '@': + case '%': + if (r[1]) { + warner( + packWARN(WARN_ILLEGALPROTO), + "prototype after '%c' for %"SVf": %s", + *r, SVfARG(declarator), r + 1 + ); + return; + } + break; + + case '\\': + r++; + if (strchr("$@%&*", *r)) { + break; + } + if (*r == '[') { + r++; + for (; r < end && *r != ']'; r++) { + if (!strchr("$@%&*", *r)) { + break; + } + } + if (*r == ']' && r[-1] != '[') { + break; + } + } + warner( + packWARN(WARN_ILLEGALPROTO), + "Illegal character after '\\' in prototype for %"SVf" : %s", + SVfARG(declarator), r + ); + return; + + case '$': + case '*': + case '&': + case ';': + case '+': + break; + } + } +} + static int parse_fun(pTHX_ OP **pop, const char *keyword_ptr, STRLEN keyword_len, const KWSpec *spec) { SV *declarator; I32 floor_ix; int save_ix; SV *saw_name; + OP **prelude_sentinel; AV *params; DefaultParamSpec *defaults; int args_min, args_max; @@ -228,7 +449,6 @@ static int parse_fun(pTHX_ OP **pop, const char *keyword_ptr, STRLEN keyword_len OP **attrs_sentinel, *body; unsigned builtin_attrs; STRLEN len; - char *s; I32 c; declarator = sv_2mortal(newSVpvn(keyword_ptr, keyword_len)); @@ -239,9 +459,7 @@ static int parse_fun(pTHX_ OP **pop, const char *keyword_ptr, STRLEN keyword_len /* function name */ saw_name = NULL; - s = PL_parser->bufptr; - if ((spec->flags & FLAG_NAME_OK) && (len = S_scan_word(aTHX_ s, TRUE))) { - saw_name = sv_2mortal(newSVpvn_flags(s, len, PARSING_UTF ? SVf_UTF8 : 0)); + if ((spec->flags & FLAG_NAME_OK) && (saw_name = my_scan_word(aTHX_ TRUE))) { if (PL_parser->expect != XSTATE) { /* bail out early so we don't predeclare $saw_name */ @@ -261,10 +479,9 @@ static int parse_fun(pTHX_ OP **pop, const char *keyword_ptr, STRLEN keyword_len builtin_attrs |= MY_ATTR_SPECIAL; } - lex_read_to(s + len); lex_read_space(0); } else if (!(spec->flags & FLAG_ANON_OK)) { - croak("I was expecting a function name, not \"%.*s\"", (int)(PL_parser->bufend - s), s); + croak("I was expecting a function name, not \"%.*s\"", (int)(PL_parser->bufend - PL_parser->bufptr), PL_parser->bufptr); } else { sv_catpvs(declarator, " (anon)"); } @@ -276,12 +493,27 @@ static int parse_fun(pTHX_ OP **pop, const char *keyword_ptr, STRLEN keyword_len /* create outer block: '{' */ save_ix = S_block_start(aTHX_ TRUE); + /* initialize synthetic optree */ + Newx(prelude_sentinel, 1, OP *); + *prelude_sentinel = NULL; + SAVEDESTRUCTOR_X(free_ptr_op, prelude_sentinel); + /* parameters */ params = NULL; defaults = NULL; args_min = 0; args_max = -1; + /* my $self; */ + if (SvTRUE(spec->shift)) { + OP *var; + + var = newOP(OP_PADSV, OPf_MOD | (OPpLVAL_INTRO << 8)); + var->op_targ = pad_add_name_sv(spec->shift, 0, NULL, NULL); + + *prelude_sentinel = op_append_list(OP_LINESEQ, *prelude_sentinel, newSTATEOP(0, NULL, var)); + } + c = lex_peek_unichar(0); if (c == '(') { DefaultParamSpec **pdefaults_tail = &defaults; @@ -306,11 +538,10 @@ static int parse_fun(pTHX_ OP **pop, const char *keyword_ptr, STRLEN keyword_len lex_read_unichar(0); lex_read_space(0); - s = PL_parser->bufptr; - if (!(len = S_scan_word(aTHX_ s, FALSE))) { + if (!(param = my_scan_word(aTHX_ FALSE))) { croak("In %"SVf": missing identifier", SVfARG(declarator)); } - param = sv_2mortal(newSVpvf("%c%.*s", sigil, (int)len, s)); + sv_insert(param, 0, 0, &sigil, 1); if (saw_slurpy) { croak("In %"SVf": I was expecting \")\" after \"%"SVf"\", not \"%"SVf"\"", SVfARG(declarator), SVfARG(saw_slurpy), SVfARG(param)); } @@ -321,7 +552,6 @@ static int parse_fun(pTHX_ OP **pop, const char *keyword_ptr, STRLEN keyword_len saw_slurpy = param; } av_push(params, SvREFCNT_inc_simple_NN(param)); - lex_read_to(s + len); lex_read_space(0); c = lex_peek_unichar(0); @@ -356,6 +586,16 @@ static int parse_fun(pTHX_ OP **pop, const char *keyword_ptr, STRLEN keyword_len c = lex_peek_unichar(0); } + /* my $param; */ + { + OP *var; + + var = newOP(OP_PADSV, OPf_MOD | (OPpLVAL_INTRO << 8)); + var->op_targ = pad_add_name_sv(param, 0, NULL, NULL); + + *prelude_sentinel = op_append_list(OP_LINESEQ, *prelude_sentinel, newSTATEOP(0, NULL, var)); + } + if (c == ',') { lex_read_unichar(0); lex_read_space(0); @@ -388,11 +628,11 @@ static int parse_fun(pTHX_ OP **pop, const char *keyword_ptr, STRLEN keyword_len lex_stuff_pvs(":", 0); c = ':'; } else { - proto = sv_2mortal(newSVpvs("")); - if (!S_scan_str(aTHX_ proto, FALSE, FALSE)) { + lex_read_unichar(0); + if (!(proto = my_scan_parens_tail(aTHX_ FALSE))) { croak("In %"SVf": prototype not terminated", SVfARG(declarator)); } - S_check_prototype(aTHX_ declarator, proto); + my_check_prototype(aTHX_ declarator, proto); lex_read_space(0); c = lex_peek_unichar(0); } @@ -419,14 +659,10 @@ static int parse_fun(pTHX_ OP **pop, const char *keyword_ptr, STRLEN keyword_len for (;;) { SV *attr; - s = PL_parser->bufptr; - if (!(len = S_scan_word(aTHX_ s, FALSE))) { + if (!(attr = my_scan_word(aTHX_ FALSE))) { break; } - attr = sv_2mortal(newSVpvn_flags(s, len, PARSING_UTF ? SVf_UTF8 : 0)); - - lex_read_to(s + len); lex_read_space(0); c = lex_peek_unichar(0); @@ -439,11 +675,14 @@ static int parse_fun(pTHX_ OP **pop, const char *keyword_ptr, STRLEN keyword_len attr = NULL; } } else { - SV *sv = sv_2mortal(newSVpvs("")); - if (!S_scan_str(aTHX_ sv, TRUE, TRUE)) { + SV *sv; + lex_read_unichar(0); + if (!(sv = my_scan_parens_tail(aTHX_ TRUE))) { croak("In %"SVf": unterminated attribute parameter in attribute list", SVfARG(declarator)); } + sv_catpvs(attr, "("); sv_catsv(attr, sv); + sv_catpvs(attr, ")"); lex_read_space(0); c = lex_peek_unichar(0); @@ -485,7 +724,6 @@ static int parse_fun(pTHX_ OP **pop, const char *keyword_ptr, STRLEN keyword_len ); } - if (builtin_attrs & MY_ATTR_LVALUE) { CvLVALUE_on(PL_compcv); } @@ -496,136 +734,132 @@ static int parse_fun(pTHX_ OP **pop, const char *keyword_ptr, STRLEN keyword_len CvSPECIAL_on(PL_compcv); } - /* munge */ - { - OP *prelude = NULL; - - /* min/max argument count checks */ - if (spec->flags & FLAG_CHECK_NARGS) { - if (SvTRUE(spec->shift)) { - args_min++; - if (args_max != -1) { - args_max++; - } + /* min/max argument count checks */ + if (spec->flags & FLAG_CHECK_NARGS) { + if (SvTRUE(spec->shift)) { + args_min++; + if (args_max != -1) { + args_max++; } + } - if (args_min > 0) { - OP *chk, *cond, *err, *croak; + if (args_min > 0) { + OP *chk, *cond, *err, *croak; - err = newSVOP(OP_CONST, 0, - newSVpvf("Not enough arguments for %"SVf, SVfARG(declarator))); + err = newSVOP(OP_CONST, 0, + newSVpvf("Not enough arguments for %"SVf, SVfARG(declarator))); - croak = newCVREF(OPf_WANT_SCALAR, - newGVOP(OP_GV, 0, gv_fetchpvs("Carp::croak", 0, SVt_PVCV))); - err = newUNOP(OP_ENTERSUB, OPf_STACKED, - op_append_elem(OP_LIST, err, croak)); + croak = newCVREF(OPf_WANT_SCALAR, + newGVOP(OP_GV, 0, gv_fetchpvs("Carp::croak", 0, SVt_PVCV))); + err = newUNOP(OP_ENTERSUB, OPf_STACKED, + op_append_elem(OP_LIST, err, croak)); - cond = newBINOP(OP_LT, 0, - newAVREF(newGVOP(OP_GV, 0, PL_defgv)), - newSVOP(OP_CONST, 0, newSViv(args_min))); - chk = newLOGOP(OP_AND, 0, cond, err); + cond = newBINOP(OP_LT, 0, + newAVREF(newGVOP(OP_GV, 0, PL_defgv)), + newSVOP(OP_CONST, 0, newSViv(args_min))); + chk = newLOGOP(OP_AND, 0, cond, err); - prelude = op_append_list(OP_LINESEQ, prelude, newSTATEOP(0, NULL, chk)); - } - if (args_max != -1) { - OP *chk, *cond, *err, *croak; + *prelude_sentinel = op_append_list(OP_LINESEQ, *prelude_sentinel, newSTATEOP(0, NULL, chk)); + } + if (args_max != -1) { + OP *chk, *cond, *err, *croak; - err = newSVOP(OP_CONST, 0, - newSVpvf("Too many arguments for %"SVf, SVfARG(declarator))); + err = newSVOP(OP_CONST, 0, + newSVpvf("Too many arguments for %"SVf, SVfARG(declarator))); - croak = newCVREF(OPf_WANT_SCALAR, - newGVOP(OP_GV, 0, gv_fetchpvs("Carp::croak", 0, SVt_PVCV))); - err = newUNOP(OP_ENTERSUB, OPf_STACKED, - op_append_elem(OP_LIST, err, croak)); + croak = newCVREF(OPf_WANT_SCALAR, + newGVOP(OP_GV, 0, gv_fetchpvs("Carp::croak", 0, SVt_PVCV))); + err = newUNOP(OP_ENTERSUB, OPf_STACKED, + op_append_elem(OP_LIST, err, croak)); - cond = newBINOP(OP_GT, 0, - newAVREF(newGVOP(OP_GV, 0, PL_defgv)), - newSVOP(OP_CONST, 0, newSViv(args_max))); - chk = newLOGOP(OP_AND, 0, cond, err); + cond = newBINOP(OP_GT, 0, + newAVREF(newGVOP(OP_GV, 0, PL_defgv)), + newSVOP(OP_CONST, 0, newSViv(args_max))); + chk = newLOGOP(OP_AND, 0, cond, err); - prelude = op_append_list(OP_LINESEQ, prelude, newSTATEOP(0, NULL, chk)); - } + *prelude_sentinel = op_append_list(OP_LINESEQ, *prelude_sentinel, newSTATEOP(0, NULL, chk)); } + } - /* my $self = shift; */ - if (SvTRUE(spec->shift)) { - OP *var, *shift; - - var = newOP(OP_PADSV, OPf_WANT_SCALAR | (OPpLVAL_INTRO << 8)); - var->op_targ = pad_add_name_sv(spec->shift, 0, NULL, NULL); + /* $self = shift; */ + if (SvTRUE(spec->shift)) { + OP *var, *shift; - shift = newASSIGNOP(OPf_STACKED, var, 0, newOP(OP_SHIFT, 0)); - prelude = op_append_list(OP_LINESEQ, prelude, newSTATEOP(0, NULL, shift)); - } + var = newOP(OP_PADSV, OPf_WANT_SCALAR); + var->op_targ = pad_findmy_sv(spec->shift, 0); - /* my (PARAMS) = @_; */ - if (params && av_len(params) > -1) { - SV *param; - OP *init_param, *left, *right; - - left = NULL; - while ((param = av_shift(params)) != &PL_sv_undef) { - OP *const var = newOP(OP_PADSV, OPf_WANT_LIST | (OPpLVAL_INTRO << 8)); - var->op_targ = pad_add_name_sv(param, 0, NULL, NULL); - SvREFCNT_dec(param); - left = op_append_elem(OP_LIST, left, var); - } - - left->op_flags |= OPf_PARENS; - right = newAVREF(newGVOP(OP_GV, 0, PL_defgv)); - init_param = newASSIGNOP(OPf_STACKED, left, 0, right); - init_param = newSTATEOP(0, NULL, init_param); + shift = newASSIGNOP(OPf_STACKED, var, 0, newOP(OP_SHIFT, 0)); + *prelude_sentinel = op_append_list(OP_LINESEQ, *prelude_sentinel, newSTATEOP(0, NULL, shift)); + } - prelude = op_append_list(OP_LINESEQ, prelude, init_param); + /* (PARAMS) = @_; */ + if (params && av_len(params) > -1) { + SV *param; + OP *init_param, *left, *right; + + left = NULL; + while ((param = av_shift(params)) != &PL_sv_undef) { + OP *const var = newOP(OP_PADSV, OPf_WANT_LIST); + var->op_targ = pad_findmy_sv(param, 0); + SvREFCNT_dec(param); + left = op_append_elem(OP_LIST, left, var); } - /* defaults */ - { - OP *gen = NULL; - DefaultParamSpec *dp; + left->op_flags |= OPf_PARENS; + right = newAVREF(newGVOP(OP_GV, 0, PL_defgv)); + init_param = newASSIGNOP(OPf_STACKED, left, 0, right); + init_param = newSTATEOP(0, NULL, init_param); - for (dp = defaults; dp; dp = dp->next) { - OP *init = dp->init; - OP *var, *args, *cond; + *prelude_sentinel = op_append_list(OP_LINESEQ, *prelude_sentinel, init_param); + } + + /* defaults */ + { + OP *gen = NULL; + DefaultParamSpec *dp; - /* var = `$,name */ - var = newOP(OP_PADSV, 0); - var->op_targ = pad_findmy_sv(dp->name, 0); + for (dp = defaults; dp; dp = dp->next) { + OP *init = dp->init; + OP *var, *args, *cond; - /* init = `,var = ,init */ - init = newASSIGNOP(OPf_STACKED, var, 0, init); + /* var = `$,name */ + var = newOP(OP_PADSV, 0); + var->op_targ = pad_findmy_sv(dp->name, 0); - /* args = `@_ */ - args = newAVREF(newGVOP(OP_GV, 0, PL_defgv)); + /* init = `,var = ,init */ + init = newASSIGNOP(OPf_STACKED, var, 0, init); - /* cond = `,args < ,index */ - cond = newBINOP(OP_LT, 0, args, newSVOP(OP_CONST, 0, newSViv(dp->limit))); + /* args = `@_ */ + args = newAVREF(newGVOP(OP_GV, 0, PL_defgv)); - /* init = `,init if ,cond */ - init = newLOGOP(OP_AND, 0, cond, init); + /* cond = `,args < ,index */ + cond = newBINOP(OP_LT, 0, args, newSVOP(OP_CONST, 0, newSViv(dp->limit))); - /* gen = `,gen ; ,init */ - gen = op_append_list(OP_LINESEQ, gen, newSTATEOP(0, NULL, init)); + /* init = `,init if ,cond */ + init = newLOGOP(OP_AND, 0, cond, init); - dp->init = NULL; - } + /* gen = `,gen ; ,init */ + gen = op_append_list(OP_LINESEQ, gen, newSTATEOP(0, NULL, init)); - prelude = op_append_list(OP_LINESEQ, prelude, gen); + dp->init = NULL; } - /* finally let perl parse the actual subroutine body */ - body = parse_block(0); + *prelude_sentinel = op_append_list(OP_LINESEQ, *prelude_sentinel, gen); + } - /* add '();' to make function return nothing by default */ - /* (otherwise the invisible parameter initialization can "leak" into - the return value: fun ($x) {}->("asdf", 0) == 2) */ - if (prelude) { - body = newSTATEOP(0, NULL, body); - } + /* finally let perl parse the actual subroutine body */ + body = parse_block(0); - body = op_append_list(OP_LINESEQ, prelude, body); + /* add '();' to make function return nothing by default */ + /* (otherwise the invisible parameter initialization can "leak" into + the return value: fun ($x) {}->("asdf", 0) == 2) */ + if (*prelude_sentinel) { + body = newSTATEOP(0, NULL, body); } + body = op_append_list(OP_LINESEQ, *prelude_sentinel, body); + *prelude_sentinel = NULL; + /* it's go time. */ { OP *const attrs = *attrs_sentinel;