6 require Config; import Config;
15 ok( $_ eq '$x', ":$_: eq :\$x:" );
19 ok( $_ eq 'foo', ":$_: eq :foo:" );
23 ok( $_ eq '$x foo', ":$_: eq :\$x foo:" );
26 ($a = 'abcdef') =~ s<(b${b}e)>'\n$1';
27 ok( $1 eq 'bcde' && $a eq 'a\n$1f', ":$1: eq :bcde: ; :$a: eq :a\\n\$1f:" );
30 ok( ($a =~ s/a/x/g) == 4 && $a eq 'xbxcxdx' );
32 ok( ($a =~ s/a/y/g) == 0 && $a eq 'xbxcxdx' );
34 ok( ($a =~ s/b/y/g) == 1 && $a eq 'xyxcxdx' );
37 ok( /a/i && s///gi && $_ eq 'BCD' );
40 ok( length($_) == 4 );
42 ok( $_ eq '\\' x 8 && $snum == 4 );
45 ok( length($_) == 8 );
47 ok( $_ eq '\\//' x 4 && $snum == 4 );
48 ok( length($_) == 12 );
52 ok( $_ eq 'aaXXXXbbb' );
56 ok( $_ eq 'aaXXXXbbb' );
60 ok( $_ eq 'baaXXXXbbb' );
64 ok( $_ eq 'baaXXXXbbb' );
68 ok( $_ eq 'aXXXXbbb' );
72 ok( $_ eq 'baXXXXbbb' );
76 ok( $_ eq 'aaaXXXXbb' );
80 ok( $_ eq 'aaaXXXXbb' );
84 ok( $_ eq 'aaaXXXXb' );
88 ok( $_ eq 'aayXXXbbb' );
92 ok( $_ eq 'aaaXXXzbb' );
100 ok( $_ eq 'aaaXXXXxb' );
102 # now for some unoptimized versions of the same.
106 ok( $_ eq 'aaXXXXbbb' );
110 ok( $_ eq 'aaXXXXbbb' );
114 ok( $_ eq 'baaXXXXbbb' );
118 ok( $_ eq 'baaXXXXbbb' );
122 ok( $_ eq 'aXXXXbbb' );
126 ok( $_ eq 'baXXXXbbb' );
130 ok( $_ eq 'aaaXXXXbb' );
134 ok( $_ eq 'aaaXXXXbb' );
138 ok( $_ eq 'aaaXXXXb' );
142 ok( $_ eq 'aayXXXbbb' );
146 ok( $_ eq 'aaaXXXzbb' );
149 $x ne $x || s/aaX.*Xbb//;
154 ok( $_ eq 'aaaXXXXxb' );
157 s/(\d+)/$1*2/e; # yields 'abc246xyz'
158 ok( $_ eq 'abc246xyz' );
159 s/(\d+)/sprintf("%5d",$1)/e; # yields 'abc 246xyz'
160 ok( $_ eq 'abc 246xyz' );
161 s/(\w)/$1 x 2/eg; # yields 'aabbcc 224466xxyyzz'
162 ok( $_ eq 'aabbcc 224466xxyyzz' );
173 $_ = "Now is the %#*! time for all good men...";
174 ok( ($x=(y/a-zA-Z //cd)) == 7 );
177 $_ = 'abcdefghijklmnopqrstuvwxyz0123456789';
180 ok( $_ eq 'ABCDEFGHIJKLMNOPQRSTUVWXYZ0123456789' );
182 # same as tr/A-Z/a-z/;
183 if (defined $Config{ebcdic} && $Config{ebcdic} eq 'define') { # EBCDIC.
185 y[\301-\351][\201-\251];
186 } else { # Ye Olde ASCII. Or something like it.
187 y[\101-\132][\141-\172];
190 ok( $_ eq 'abcdefghijklmnopqrstuvwxyz0123456789' );
193 skip("not ASCII",1) unless (ord("+") == ord(",") - 1
194 && ord(",") == ord("-") - 1
195 && ord("a") == ord("b") - 1
196 && ord("b") == ord("c") - 1);
211 # test recursive substitutions
212 # code based on the recursive expansion of makefile variables
215 AAAAA => '$(B)', B=>'$(C)', C => 'D', # long->short
216 E => '$(F)', F=>'p $(G) q', G => 'HHHHH', # short->long
217 DIR => '$(UNDEFINEDNAME)/xxx',
220 my($var,$level) = @_;
221 return "\$($var)" unless exists $MK{$var};
222 return exp_vars($MK{$var}, $level+1); # can recurse
225 my($str,$level) = @_;
226 $str =~ s/\$\((\w+)\)/var($1, $level+1)/ge; # can recurse
227 #warn "exp_vars $level = '$str'\n";
231 ok( exp_vars('$(AAAAA)',0) eq 'D' );
232 ok( exp_vars('$(E)',0) eq 'p HHHHH q' );
233 ok( exp_vars('$(DIR)',0) eq '$(UNDEFINEDNAME)/xxx' );
234 ok( exp_vars('foo $(DIR)/yyy bar',0) eq 'foo $(UNDEFINEDNAME)/xxx/yyy bar' );
237 s/(..)/$x = $1, m#.#/eg;
238 ok( $x eq "cd", 'a match nested in the RHS of a substitution' );
240 # Subst and lookbehind
243 $snum = s/(?<!x)c/x/g;
244 ok( $_ eq "xxxxx" && $snum == 5 );
247 $snum = s/(?<!x)(c)/x/g;
248 ok( $_ eq "xxxxx" && $snum == 5 );
251 $snum = s/(?<!r)foobbar/foobar/g;
252 ok( $_ eq "foobarfoobbar" && $snum == 1 );
255 $snum = s/(?<!ar)(foobbar)/foobar/g;
256 ok( $_ eq "foobarfoobbar" && $snum == 1 );
259 $snum = s/(?<!ar)foobbar/foobar/g;
260 ok( $_ eq "foobarfoobbar" && $snum == 1 );
262 eval 's{foo} # this is a comment, not a delimiter
264 ok( ! @?, 'parsing of split subst with comment' );
266 $snum = eval '$_="exactly"; s sxsys;m 3(yactl)3;$1';
267 is( $snum, 'yactl', 'alpha delimiters are allowed' );
271 ok( $_ eq "bbcbb" && $snum == 4,
272 'check if squashing works at the end of string' );
278 $url = new URI::URL "http://www/"; die if $url eq "xXx";
282 $foo = ' $@%#lowercase $@%# lowercase UPPERCASE$@%#UPPERCASE' .
283 ' $@%#lowercase$@%#lowercase$@%# lowercase lowercase $@%#lowercase' .
284 ' lowercase $@%#MiXeD$@%# ';
287 s{ \d+ \b [,.;]? (?{ 'digits' })
289 [a-z]+ \b [,.;]? (?{ 'lowercase' })
291 [A-Z]+ \b [,.;]? (?{ 'UPPERCASE' })
293 [A-Z] [a-z]+ \b [,.;]? (?{ 'Capitalized' })
295 [A-Za-z]+ \b [,.;]? (?{ 'MiXeD' })
297 [A-Za-z0-9]+ \b [,.;]? (?{ 'alphanumeric' })
301 [^A-Za-z0-9\s]+ (?{ '$@%#' })
308 ok( $_ eq '' && $snum == 6 );
311 $snum = s/(\d*|x)/<$1>/g;
312 $foo = '<>' . ('<x><>' x 20) ;
313 ok( $_ eq $foo && $snum == 41 );
320 ok( $_ eq 'aaaaaaxxxxxx' && $snum == 3 );
325 ok( $_ eq 'aaaaaaxxx' && $snum == 3 );
330 ok( $_ eq 'aaaaaaxxaa' );
335 ok( $_ eq 'aaaaaaxaa' );
339 ok( $_ eq 'xxxxxxxxxxxxxxxxxx' && $snum == 9 );
343 ok( $_ eq 'xxxxxxxxx' && $snum == 9 );
347 ok( $_ eq 'xxaaaaaaaa' );
351 ok( $_ eq 'xaaaaaaaa' );
355 ok( $_ eq '.aaa' && $snum == 1 );
357 eval q% s/a/"b"}/e %;
358 ok( $@ =~ /Bad evalled substitution/ );
359 eval q% ($_ = "x") =~ s/(.)/"$1 "/e %;
360 ok( $_ eq "x " and !length $@ );
362 eval q% ($_ = "x") =~ s/x(($x)*)/"$1"/e %;
363 ok( $_ eq '' and !length $@ );
366 ok( !s/^([a-z]:)/\u$1/ );
368 $_ = "Charles Bronson";
370 ok( $_ eq "C B" && $snum == 12 );
374 my $s = "H\303\266he";
378 is($l, $r, "use utf8 \\w");
381 my $pv1 = my $pv2 = "Andreas J. K\303\266nig";
382 $pv1 =~ s/A/\x{100}/;
383 substr($pv2,0,1) = "\x{100}";
387 skip("EBCDIC", 3) if ord("A") == 193;
390 # Gregor Chrupala <gregor.chrupala@star-group.net>
392 $a = 'España';
394 like($a, qr/ñ/, "use utf8 RHS");
399 $a = 'España España';
401 like($a, qr/ñ/, "use utf8 LHS");
408 like($a, qr/ñ/, "use utf8 LHS and RHS");
413 # SADAHIRO Tomoyuki <bqw10602@nifty.com>
415 $a = "\x{100}\x{101}";
416 $a =~ s/\x{101}/\xFF/;
418 is(length($a), 2, "SADAHIRO utf8 s///");
420 $a = "\x{100}\x{101}";
421 $a =~ s/\x{101}/"\xFF"/e;
425 $a = "\x{100}\x{101}";
426 $a =~ s/\x{101}/\xFF\xFF\xFF/;
427 like($a, qr/\xFF\xFF\xFF/);
430 $a = "\x{100}\x{101}";
431 $a =~ s/\x{101}/"\xFF\xFF\xFF"/e;
432 like($a, qr/\xFF\xFF\xFF/);
436 $a =~ s/\xFF/\x{100}/;
437 like($a, qr/\x{100}/);
441 $a =~ s/\xFF/"\x{100}"/e;
442 like($a, qr/\x{100}/);
446 $a =~ s/\xFF/\x{100}/;
447 like($a, qr/\x{100}/);
451 $a =~ s/\xFF/"\x{100}"/e;
452 like($a, qr/\x{100}/);
457 # subst with mixed utf8/non-utf8 type
458 my($ua, $ub, $uc, $ud) = ("\x{101}", "\x{102}", "\x{103}", "\x{104}");
459 my($na, $nb) = ("\x{ff}", "\x{fe}");
462 ($b = $a) =~ s/--/$na/;
463 is($b, "$ua$na$ub", "s///: replace non-utf8 into utf8");
464 ($b = $a) =~ s/--/--$na--/;
465 is($b, "$ua--$na--$ub", "s///: replace long non-utf8 into utf8");
466 ($b = $a) =~ s/--/$uc/;
467 is($b, "$ua$uc$ub", "s///: replace utf8 into utf8");
468 ($b = $a) =~ s/--/--$uc--/;
469 is($b, "$ua--$uc--$ub", "s///: replace long utf8 into utf8");
471 ($b = $a) =~ s/--/$ua/;
472 is($b, "$na$ua$nb", "s///: replace utf8 into non-utf8");
473 ($b = $a) =~ s/--/--$ua--/;
474 is($b, "$na--$ua--$nb", "s///: replace long utf8 into non-utf8");
476 # now with utf8 pattern
478 ($b = $a) =~ s/-($ud)?-/$na/;
479 is($b, "$ua$na$ub", "s///: replace non-utf8 into utf8 (utf8 pattern)");
480 ($b = $a) =~ s/-($ud)?-/--$na--/;
481 is($b, "$ua--$na--$ub", "s///: replace long non-utf8 into utf8 (utf8 pattern)");
482 ($b = $a) =~ s/-($ud)?-/$uc/;
483 is($b, "$ua$uc$ub", "s///: replace utf8 into utf8 (utf8 pattern)");
484 ($b = $a) =~ s/-($ud)?-/--$uc--/;
485 is($b, "$ua--$uc--$ub", "s///: replace long utf8 into utf8 (utf8 pattern)");
487 ($b = $a) =~ s/-($ud)?-/$ua/;
488 is($b, "$na$ua$nb", "s///: replace utf8 into non-utf8 (utf8 pattern)");
489 ($b = $a) =~ s/-($ud)?-/--$ua--/;
490 is($b, "$na--$ua--$nb", "s///: replace long utf8 into non-utf8 (utf8 pattern)");
491 ($b = $a) =~ s/-($ud)?-/$na/;
492 is($b, "$na$na$nb", "s///: replace non-utf8 into non-utf8 (utf8 pattern)");
493 ($b = $a) =~ s/-($ud)?-/--$na--/;
494 is($b, "$na--$na--$nb", "s///: replace long non-utf8 into non-utf8 (utf8 pattern)");
500 is("<$_> <$s>", "<xxxx> <4>", "[perl #7806]");
504 is("<$_> <$s>", "<> <4>", "[perl #7806]");
506 # [perl #19048] Coredump in silly replacement
511 is($_, "\n", "[perl #19048]");
514 # [perl #17757] interaction between saw_ampersand and study
516 my $f = eval q{ $& };
520 is($f, "yy", "[perl #17757]");
523 # [perl #20684] returned a zero count
525 is(s/(??{1})/2/eg, 4, '#20684 s/// with (??{..}) inside');
527 # [perl #20682] @- not visible in replacement
529 /(2)/; # seed @- with something else
530 s/(1)(2)(3)/$#- (@-)/;
531 is($_, "3 (0 0 1 2)", '#20682 @- not visible in replacement');
533 # [perl #20682] $^N not visible in replacement
535 /(a)/; s/(b)|(c)/-$^N/g;
536 is($_,'a-b-c','#20682 $^N not visible in replacement');
538 # [perl #22351] perl bug with 'e' substitution modifier
541 no warnings 'uninitialized';
544 is($name, "cis", q[#22351 bug with 'e' substitution modifier]);
547 # [perl #34171] $1 didn't honour 'use bytes' in s//e
555 is(length($x), 2, '[perl #34171]');
559 { # [perl #27940] perlbug: [\x00-\x1f] works, [\c@-\c_] does not
562 ($c = "\x20\c@\x30\cA\x40\cZ\x50\c_\x60") =~ s/[\c@-\c_]//g;
563 is($c, "\x20\x30\x40\x50\x60", "s/[\\c\@-\\c_]//g");
565 ($c = "\x20\x00\x30\x01\x40\x1A\x50\x1F\x60") =~ s/[\x00-\x1f]//g;
566 is($c, "\x20\x30\x40\x50\x60", "s/[\\x00-\\x1f]//g");
570 no warnings 'uninitialized';
571 /(((((((((x)))))))))(z)/; # clear $10
572 s/(((((((((x)))))))))(y)/${10}/;
573 is($_,"y","RT#6006: \$_ eq '$_'");
575 s/(((((((((x)))))))))(r)/fooba${10}/;
576 is($_,"foobar","RT#6006: \$_ eq '$_'");
579 my $want=("\n" x 11).("B\n" x 11)."B";
586 is($want,$_,"RT#17542");
590 my @tests = ('ABC', "\xA3\xA4\xA5", "\x{410}\x{411}\x{412}");
594 is($_, "012", "RT#52104: $id");
598 fresh_perl_is( '$_=q(foo);s/(.)\G//g;print' => 'foo', '[perl #69056] positive GPOS regex segfault' );
599 fresh_perl_is( '$_="abcef"; s/bc|(.)\G(.)/$1 ? "[$1-$2]" : "XX"/ge; print' => 'aXX[c-e][e-f]f', 'positive GPOS regex substitution failure' );