Commit | Line | Data |
8d063cd8 |
1 | #!./perl |
8d37f932 |
2 | # |
3 | # This is a home for regular expression tests that don't fit into |
4 | # the format supported by op/regexp.t. If you want to add a test |
5 | # that does fit that format, add it to op/re_tests, not here. |
8d063cd8 |
6 | |
79072805 |
7 | # $RCSfile: pat.t,v $$Revision: 4.1 $$Date: 92/08/07 18:28:12 $ |
378cc40b |
8 | |
e4d48cc9 |
9 | print "1..124\n"; |
8d37f932 |
10 | |
e4d48cc9 |
11 | BEGIN { |
12 | chdir 't' if -d 't'; |
13 | @INC = "../lib" if -d "../lib"; |
14 | } |
8d37f932 |
15 | eval 'use Config'; # Defaults assumed if this fails |
e4d48cc9 |
16 | use re 'eval'; |
8d063cd8 |
17 | |
18 | $x = "abc\ndef\n"; |
19 | |
20 | if ($x =~ /^abc/) {print "ok 1\n";} else {print "not ok 1\n";} |
21 | if ($x !~ /^def/) {print "ok 2\n";} else {print "not ok 2\n";} |
22 | |
23 | $* = 1; |
24 | if ($x =~ /^def/) {print "ok 3\n";} else {print "not ok 3\n";} |
25 | $* = 0; |
26 | |
27 | $_ = '123'; |
28 | if (/^([0-9][0-9]*)/) {print "ok 4\n";} else {print "not ok 4\n";} |
29 | |
30 | if ($x =~ /^xxx/) {print "not ok 5\n";} else {print "ok 5\n";} |
31 | if ($x !~ /^abc/) {print "not ok 6\n";} else {print "ok 6\n";} |
32 | |
33 | if ($x =~ /def/) {print "ok 7\n";} else {print "not ok 7\n";} |
34 | if ($x !~ /def/) {print "not ok 8\n";} else {print "ok 8\n";} |
35 | |
36 | if ($x !~ /.def/) {print "ok 9\n";} else {print "not ok 9\n";} |
37 | if ($x =~ /.def/) {print "not ok 10\n";} else {print "ok 10\n";} |
38 | |
39 | if ($x =~ /\ndef/) {print "ok 11\n";} else {print "not ok 11\n";} |
40 | if ($x !~ /\ndef/) {print "not ok 12\n";} else {print "ok 12\n";} |
41 | |
42 | $_ = 'aaabbbccc'; |
43 | if (/(a*b*)(c*)/ && $1 eq 'aaabbb' && $2 eq 'ccc') { |
44 | print "ok 13\n"; |
45 | } else { |
46 | print "not ok 13\n"; |
47 | } |
48 | if (/(a+b+c+)/ && $1 eq 'aaabbbccc') { |
49 | print "ok 14\n"; |
50 | } else { |
51 | print "not ok 14\n"; |
52 | } |
53 | |
54 | if (/a+b?c+/) {print "not ok 15\n";} else {print "ok 15\n";} |
55 | |
56 | $_ = 'aaabccc'; |
57 | if (/a+b?c+/) {print "ok 16\n";} else {print "not ok 16\n";} |
58 | if (/a*b+c*/) {print "ok 17\n";} else {print "not ok 17\n";} |
59 | |
60 | $_ = 'aaaccc'; |
61 | if (/a*b?c*/) {print "ok 18\n";} else {print "not ok 18\n";} |
62 | if (/a*b+c*/) {print "not ok 19\n";} else {print "ok 19\n";} |
63 | |
64 | $_ = 'abcdef'; |
65 | if (/bcd|xyz/) {print "ok 20\n";} else {print "not ok 20\n";} |
66 | if (/xyz|bcd/) {print "ok 21\n";} else {print "not ok 21\n";} |
67 | |
68 | if (m|bc/*d|) {print "ok 22\n";} else {print "not ok 22\n";} |
378cc40b |
69 | |
70 | if (/^$_$/) {print "ok 23\n";} else {print "not ok 23\n";} |
71 | |
72 | $* = 1; # test 3 only tested the optimized version--this one is for real |
73 | if ("ab\ncd\n" =~ /^cd/) {print "ok 24\n";} else {print "not ok 24\n";} |
74 | $* = 0; |
75 | |
76 | $XXX{123} = 123; |
77 | $XXX{234} = 234; |
78 | $XXX{345} = 345; |
79 | |
80 | @XXX = ('ok 25','not ok 25', 'ok 26','not ok 26','not ok 27'); |
c6aa4a32 |
81 | while ($_ = shift(@XXX)) { |
378cc40b |
82 | ?(.*)? && (print $1,"\n"); |
83 | /not/ && reset; |
84 | /not ok 26/ && reset 'X'; |
85 | } |
86 | |
a0d0e21e |
87 | while (($key,$val) = each(%XXX)) { |
378cc40b |
88 | print "not ok 27\n"; |
89 | exit; |
90 | } |
91 | |
92 | print "ok 27\n"; |
93 | |
94 | 'cde' =~ /[^ab]*/; |
95 | 'xyz' =~ //; |
96 | if ($& eq 'xyz') {print "ok 28\n";} else {print "not ok 28\n";} |
97 | |
98 | $foo = '[^ab]*'; |
99 | 'cde' =~ /$foo/; |
100 | 'xyz' =~ //; |
101 | if ($& eq 'xyz') {print "ok 29\n";} else {print "not ok 29\n";} |
102 | |
103 | $foo = '[^ab]*'; |
104 | 'cde' =~ /$foo/; |
105 | 'xyz' =~ /$null/; |
106 | if ($& eq 'xyz') {print "ok 30\n";} else {print "not ok 30\n";} |
a687059c |
107 | |
108 | $_ = 'abcdefghi'; |
109 | /def/; # optimized up to cmd |
110 | if ("$`:$&:$'" eq 'abc:def:ghi') {print "ok 31\n";} else {print "not ok 31\n";} |
111 | |
112 | /cde/ + 0; # optimized only to spat |
113 | if ("$`:$&:$'" eq 'ab:cde:fghi') {print "ok 32\n";} else {print "not ok 32\n";} |
114 | |
115 | /[d][e][f]/; # not optimized |
116 | if ("$`:$&:$'" eq 'abc:def:ghi') {print "ok 33\n";} else {print "not ok 33\n";} |
117 | |
118 | $_ = 'now is the {time for all} good men to come to.'; |
119 | / {([^}]*)}/; |
120 | if ($1 eq 'time for all') {print "ok 34\n";} else {print "not ok 34 $1\n";} |
121 | |
122 | $_ = 'xxx {3,4} yyy zzz'; |
123 | print /( {3,4})/ ? "ok 35\n" : "not ok 35\n"; |
124 | print $1 eq ' ' ? "ok 36\n" : "not ok 36\n"; |
125 | print /( {4,})/ ? "not ok 37\n" : "ok 37\n"; |
126 | print /( {2,3}.)/ ? "ok 38\n" : "not ok 38\n"; |
127 | print $1 eq ' y' ? "ok 39\n" : "not ok 39\n"; |
128 | print /(y{2,3}.)/ ? "ok 40\n" : "not ok 40\n"; |
129 | print $1 eq 'yyy ' ? "ok 41\n" : "not ok 41\n"; |
130 | print /x {3,4}/ ? "not ok 42\n" : "ok 42\n"; |
131 | print /^xxx {3,4}/ ? "not ok 43\n" : "ok 43\n"; |
352d5a3a |
132 | |
133 | $_ = "now is the time for all good men to come to."; |
134 | @words = /(\w+)/g; |
135 | print join(':',@words) eq "now:is:the:time:for:all:good:men:to:come:to" |
136 | ? "ok 44\n" |
137 | : "not ok 44\n"; |
138 | |
139 | @words = (); |
140 | while (/\w+/g) { |
141 | push(@words, $&); |
142 | } |
143 | print join(':',@words) eq "now:is:the:time:for:all:good:men:to:come:to" |
144 | ? "ok 45\n" |
145 | : "not ok 45\n"; |
146 | |
147 | @words = (); |
71be2cbc |
148 | pos = 0; |
352d5a3a |
149 | while (/to/g) { |
150 | push(@words, $&); |
151 | } |
152 | print join(':',@words) eq "to:to" |
153 | ? "ok 46\n" |
71be2cbc |
154 | : "not ok 46 `@words'\n"; |
352d5a3a |
155 | |
71be2cbc |
156 | pos $_ = 0; |
352d5a3a |
157 | @words = /to/g; |
158 | print join(':',@words) eq "to:to" |
159 | ? "ok 47\n" |
71be2cbc |
160 | : "not ok 47 `@words'\n"; |
352d5a3a |
161 | |
162 | $_ = "abcdefghi"; |
163 | |
164 | $pat1 = 'def'; |
165 | $pat2 = '^def'; |
166 | $pat3 = '.def.'; |
167 | $pat4 = 'abc'; |
168 | $pat5 = '^abc'; |
169 | $pat6 = 'abc$'; |
170 | $pat7 = 'ghi'; |
171 | $pat8 = '\w*ghi'; |
172 | $pat9 = 'ghi$'; |
173 | |
174 | $t1=$t2=$t3=$t4=$t5=$t6=$t7=$t8=$t9=0; |
175 | |
176 | for $iter (1..5) { |
177 | $t1++ if /$pat1/o; |
178 | $t2++ if /$pat2/o; |
179 | $t3++ if /$pat3/o; |
180 | $t4++ if /$pat4/o; |
181 | $t5++ if /$pat5/o; |
182 | $t6++ if /$pat6/o; |
183 | $t7++ if /$pat7/o; |
184 | $t8++ if /$pat8/o; |
185 | $t9++ if /$pat9/o; |
186 | } |
187 | |
188 | $x = "$t1$t2$t3$t4$t5$t6$t7$t8$t9"; |
189 | print $x eq '505550555' ? "ok 48\n" : "not ok 48 $x\n"; |
1462b684 |
190 | |
191 | $xyz = 'xyz'; |
192 | print "abc" =~ /^abc$|$xyz/ ? "ok 49\n" : "not ok 49\n"; |
193 | |
194 | # perl 4.009 says "unmatched ()" |
195 | eval '"abc" =~ /a(bc$)|$xyz/; $result = "$&:$1"'; |
196 | print $@ eq "" ? "ok 50\n" : "not ok 50\n"; |
197 | print $result eq "abc:bc" ? "ok 51\n" : "not ok 51\n"; |
a0d0e21e |
198 | |
199 | |
200 | $_="abcfooabcbar"; |
201 | $x=/abc/g; |
202 | print $` eq "" ? "ok 52\n" : "not ok 52\n" if $x; |
203 | $x=/abc/g; |
204 | print $` eq "abcfoo" ? "ok 53\n" : "not ok 53\n" if $x; |
205 | $x=/abc/g; |
206 | print $x == 0 ? "ok 54\n" : "not ok 54\n"; |
71be2cbc |
207 | pos = 0; |
a0d0e21e |
208 | $x=/ABC/gi; |
209 | print $` eq "" ? "ok 55\n" : "not ok 55\n" if $x; |
210 | $x=/ABC/gi; |
211 | print $` eq "abcfoo" ? "ok 56\n" : "not ok 56\n" if $x; |
212 | $x=/ABC/gi; |
213 | print $x == 0 ? "ok 57\n" : "not ok 57\n"; |
71be2cbc |
214 | pos = 0; |
a0d0e21e |
215 | $x=/abc/g; |
216 | print $' eq "fooabcbar" ? "ok 58\n" : "not ok 58\n" if $x; |
217 | $x=/abc/g; |
218 | print $' eq "bar" ? "ok 59\n" : "not ok 59\n" if $x; |
219 | $_ .= ''; |
220 | @x=/abc/g; |
221 | print scalar @x == 2 ? "ok 60\n" : "not ok 60\n"; |
71be2cbc |
222 | |
223 | $_ = "abdc"; |
224 | pos $_ = 2; |
c90c0ff4 |
225 | /\Gc/gc; |
71be2cbc |
226 | print "not " if (pos $_) != 2; |
227 | print "ok 61\n"; |
c90c0ff4 |
228 | /\Gc/g; |
229 | print "not " if defined pos $_; |
230 | print "ok 62\n"; |
c277df42 |
231 | |
232 | $out = 1; |
233 | 'abc' =~ m'a(?{ $out = 2 })b'; |
234 | print "not " if $out != 2; |
235 | print "ok 63\n"; |
236 | |
237 | $out = 1; |
238 | 'abc' =~ m'a(?{ $out = 3 })c'; |
239 | print "not " if $out != 1; |
240 | print "ok 64\n"; |
241 | |
242 | $_ = 'foobar1 bar2 foobar3 barfoobar5 foobar6'; |
243 | @out = /(?<!foo)bar./g; |
244 | print "not " if "@out" ne 'bar2 barf'; |
245 | print "ok 65\n"; |
246 | |
8d37f932 |
247 | # Tests which depend on REG_INFTY |
248 | $reg_infty = defined $Config{reg_infty} ? $Config{reg_infty} : 32767; |
249 | $reg_infty_m = $reg_infty - 1; $reg_infty_p = $reg_infty + 1; |
250 | |
251 | # As well as failing if the pattern matches do unexpected things, the |
252 | # next three tests will fail if you should have picked up a lower-than- |
253 | # default value for $reg_infty from Config.pm, but have not. |
254 | |
255 | undef $@; |
256 | print "not " if eval q(('aaa' =~ /(a{1,$reg_infty_m})/)[0] ne 'aaa') || $@; |
257 | print "ok 66\n"; |
258 | |
259 | undef $@; |
260 | print "not " if eval q(('a' x $reg_infty_m) !~ /a{$reg_infty_m}/) || $@; |
261 | print "ok 67\n"; |
262 | |
263 | undef $@; |
264 | print "not " if eval q(('a' x ($reg_infty_m - 1)) =~ /a{$reg_infty_m}/) || $@; |
265 | print "ok 68\n"; |
266 | |
267 | undef $@; |
268 | eval "'aaa' =~ /a{1,$reg_infty}/"; |
269 | print "not " if $@ !~ m%^\Q/a{1,$reg_infty}/: Quantifier in {,} bigger than%; |
270 | print "ok 69\n"; |
271 | |
272 | eval "'aaa' =~ /a{1,$reg_infty_p}/"; |
273 | print "not " |
274 | if $@ !~ m%^\Q/a{1,$reg_infty_p}/: Quantifier in {,} bigger than%; |
275 | print "ok 70\n"; |
276 | undef $@; |
277 | |
278 | # Poke a couple more parse failures |
279 | |
280 | $context = 'x' x 256; |
281 | eval qq("${context}y" =~ /(?<=$context)y/); |
282 | print "not " if $@ !~ m%^\Q/(?<=\Ex+/: lookbehind longer than 255 not%; |
283 | print "ok 71\n"; |
284 | |
285 | # This one will fail when POSIX character classes do get implemented |
286 | { |
287 | my $w; |
288 | local $^W = 1; |
289 | local $SIG{__WARN__} = sub{$w = shift}; |
290 | eval q('a' =~ /[[:alpha:]]/); |
291 | print "not " if $w !~ /^\QCharacter class syntax [: :] is reserved/; |
292 | } |
293 | print "ok 72\n"; |
294 | |
c277df42 |
295 | # Long Monsters |
8d37f932 |
296 | $test = 73; |
c277df42 |
297 | for $l (125, 140, 250, 270, 300000, 30) { # Ordered to free memory |
298 | $a = 'a' x $l; |
299 | print "# length=$l\nnot " unless "ba$a=" =~ /a$a=/; |
300 | print "ok $test\n"; |
301 | $test++; |
302 | |
303 | print "not " if "b$a=" =~ /a$a=/; |
304 | print "ok $test\n"; |
305 | $test++; |
306 | } |
307 | |
308 | # 20000 nodes, each taking 3 words per string, and 1 per branch |
309 | $long_constant_len = join '|', 12120 .. 32645; |
310 | $long_var_len = join '|', 8120 .. 28645; |
311 | %ans = ( 'ax13876y25677lbc' => 1, |
312 | 'ax13876y25677mcb' => 0, # not b. |
313 | 'ax13876y35677nbc' => 0, # Num too big |
314 | 'ax13876y25677y21378obc' => 1, |
315 | 'ax13876y25677y21378zbc' => 0, # Not followed by [k-o] |
316 | 'ax13876y25677y21378y21378kbc' => 1, |
317 | 'ax13876y25677y21378y21378kcb' => 0, # Not b. |
318 | 'ax13876y25677y21378y21378y21378kbc' => 0, # 5 runs |
319 | ); |
320 | |
321 | for ( keys %ans ) { |
322 | print "# const-len `$_' not => $ans{$_}\nnot " |
323 | if $ans{$_} xor /a(?=([yx]($long_constant_len)){2,4}[k-o]).*b./o; |
324 | print "ok $test\n"; |
325 | $test++; |
326 | print "# var-len `$_' not => $ans{$_}\nnot " |
327 | if $ans{$_} xor /a(?=([yx]($long_var_len)){2,4}[k-o]).*b./o; |
328 | print "ok $test\n"; |
329 | $test++; |
330 | } |
331 | |
332 | $_ = " a (bla()) and x(y b((l)u((e))) and b(l(e)e)e"; |
333 | $expect = "(bla()) ((l)u((e))) (l(e)e)"; |
334 | |
335 | sub matchit { |
cc6b7395 |
336 | m/ |
c277df42 |
337 | ( |
338 | \( |
339 | (?{ $c = 1 }) # Initialize |
340 | (?: |
341 | (?(?{ $c == 0 }) # PREVIOUS iteration was OK, stop the loop |
342 | (?! |
343 | ) # Fail: will unwind one iteration back |
344 | ) |
345 | (?: |
346 | [^()]+ # Match a big chunk |
347 | (?= |
348 | [()] |
349 | ) # Do not try to match subchunks |
350 | | |
351 | \( |
352 | (?{ ++$c }) |
353 | | |
354 | \) |
355 | (?{ --$c }) |
356 | ) |
357 | )+ # This may not match with different subblocks |
358 | ) |
359 | (?(?{ $c != 0 }) |
360 | (?! |
361 | ) # Fail |
362 | ) # Otherwise the chunk 1 may succeed with $c>0 |
cc6b7395 |
363 | /xg; |
c277df42 |
364 | } |
365 | |
366 | push @ans, $res while $res = matchit; |
367 | |
368 | print "# ans='@ans'\n# expect='$expect'\nnot " if "@ans" ne "1 1 1"; |
369 | print "ok $test\n"; |
370 | $test++; |
371 | |
372 | @ans = matchit; |
373 | |
374 | print "# ans='@ans'\n# expect='$expect'\nnot " if "@ans" ne $expect; |
375 | print "ok $test\n"; |
376 | $test++; |
377 | |
378 | @ans = ('a/b' =~ m%(.*/)?(.*)%); # Stack may be bad |
379 | print "not " if "@ans" ne 'a/ b'; |
380 | print "ok $test\n"; |
381 | $test++; |
382 | |
cc6b7395 |
383 | $code = '{$blah = 45}'; |
c277df42 |
384 | $blah = 12; |
e4d48cc9 |
385 | eval { /(?$code)/ }; |
386 | print "not " unless $@ and $@ =~ /not allowed at run time/ and $blah == 12; |
387 | print "ok $test\n"; |
388 | $test++; |
389 | |
390 | $code = '{$blah = 45}'; |
391 | $blah = 12; |
392 | eval "/(?$code)/"; |
cc6b7395 |
393 | print "not " if $blah != 45; |
394 | print "ok $test\n"; |
395 | $test++; |
396 | |
397 | $blah = 12; |
398 | /(?{$blah = 45})/; |
c277df42 |
399 | print "not " if $blah != 45; |
400 | print "ok $test\n"; |
401 | $test++; |
402 | |
74d6a13a |
403 | $x = 'banana'; |
404 | $x =~ /.a/g; |
405 | print "not " unless pos($x) == 2; |
406 | print "ok $test\n"; |
407 | $test++; |
408 | |
409 | $x =~ /.z/gc; |
410 | print "not " unless pos($x) == 2; |
411 | print "ok $test\n"; |
412 | $test++; |
413 | |
414 | sub f { |
415 | my $p = $_[0]; |
416 | return $p; |
417 | } |
418 | |
419 | $x =~ /.a/g; |
420 | print "not " unless f(pos($x)) == 4; |
421 | print "ok $test\n"; |
422 | $test++; |
4599a1de |
423 | |
ce862d02 |
424 | $x = $^R = 67; |
425 | 'foot' =~ /foo(?{$x = 12; 75})[t]/; |
426 | print "not " unless $^R eq '75'; |
427 | print "ok $test\n"; |
428 | $test++; |
429 | |
430 | $x = $^R = 67; |
431 | 'foot' =~ /foo(?{$x = 12; 75})[xy]/; |
432 | print "not " unless $^R eq '67' and $x eq '12'; |
433 | print "ok $test\n"; |
434 | $test++; |
435 | |
436 | $x = $^R = 67; |
437 | 'foot' =~ /foo(?{ $^R + 12 })((?{ $x = 12; $^R + 17 })[xy])?/; |
438 | print "not " unless $^R eq '79' and $x eq '12'; |
439 | print "ok $test\n"; |
440 | $test++; |
441 | |
97197631 |
442 | # This should be changed to qr/\b\v$/ ASAP |
1bd3ad17 |
443 | print "not " unless study(/\b\v$/) eq '(?:\bv$)'; |
97197631 |
444 | print "ok $test\n"; |
445 | $test++; |
446 | |
7e5428c5 |
447 | $_ = 'xabcx'; |
448 | foreach $ans ('', 'c') { |
449 | /(?<=(?=a)..)((?=c)|.)/g; |
450 | print "not " unless $1 eq $ans; |
451 | print "ok $test\n"; |
452 | $test++; |
453 | } |
454 | |
455 | $_ = 'a'; |
456 | foreach $ans ('', 'a', '') { |
457 | /^|a|$/g; |
458 | print "not " unless $& eq $ans; |
459 | print "ok $test\n"; |
460 | $test++; |
461 | } |
462 | |
09f25ae4 |
463 | sub prefixify { |
464 | my($v,$a,$b,$res) = @_; |
465 | $v =~ s/\Q$a\E/$b/; |
466 | print "not " unless $res eq $v; |
467 | print "ok $test\n"; |
468 | $test++; |
469 | } |
470 | prefixify('/a/b/lib/arch', "/a/b/lib", 'X/lib', 'X/lib/arch'); |
471 | prefixify('/a/b/man/arch', "/a/b/man", 'X/man', 'X/man/arch'); |
472 | |
473 | $_ = 'var="foo"'; |
474 | /(\")/; |
475 | print "not " unless $1 and /$1/; |
476 | print "ok $test\n"; |
477 | $test++; |
478 | |
4599a1de |
479 | sub must_warn_pat { |
480 | my $warn_pat = shift; |
481 | return sub { print "not " unless $_[0] =~ /$warn_pat/ } |
482 | } |
483 | |
484 | sub must_warn { |
485 | my ($warn_pat, $code) = @_; |
486 | local $^W; local %SIG; |
487 | eval 'BEGIN { $^W = 1; $SIG{__WARN__} = $warn_pat };' . $code; |
488 | print "ok $test\n"; |
489 | $test++; |
490 | } |
491 | |
492 | |
493 | sub make_must_warn { |
494 | my $warn_pat = shift; |
495 | return sub { must_warn(must_warn_pat($warn_pat)) } |
496 | } |
497 | |
498 | my $for_future = make_must_warn('reserved for future extensions'); |
499 | |
500 | &$for_future('q(a:[b]:) =~ /[x[:foo:]]/'); |
501 | &$for_future('q(a=[b]=) =~ /[x[=foo=]]/'); |
502 | &$for_future('q(a.[b].) =~ /[x[.foo.]]/'); |