Better add new files to MANIFEST, too.
[p5sagit/p5-mst-13.2.git] / t / op / tr.t
CommitLineData
c8e3bb4c 1# tr.t
2
# Compile-time setup: enter the t/ directory when one exists below the
# current directory, then replace @INC with the single entry '../lib'.
BEGIN {
    if (-d 't') {
        chdir 't';
    }
    @INC = ('../lib');
}
a5095b95 7
# TAP plan: this script emits 70 test results.
print "1..70\n";

# 1-3: plain range transliteration applied to $_ - lower to upper, back to
# lower, and finally an inner range that leaves the first and last letters
# alone.
$_ = "abcdefghijklmnopqrstuvwxyz";

$_ =~ tr/a-z/A-Z/;
print(($_ eq "ABCDEFGHIJKLMNOPQRSTUVWXYZ") ? '' : 'not ', "ok 1\n");

$_ =~ tr/A-Z/a-z/;
print(($_ eq "abcdefghijklmnopqrstuvwxyz") ? '' : 'not ', "ok 2\n");

$_ =~ tr/b-y/B-Y/;
print(($_ eq "aBCDEFGHIJKLMNOPQRSTUVWXYz") ? '' : 'not ', "ok 3\n");
26
# 4: In EBCDIC 'I' is \xc9 and 'J' is \xd1, 'i' is \x89 and 'j' is \x91.
# Yes, the letter ranges have discontinuities.  Regardless of platform, the
# \xca in the string below must stay untouched (and must not become \x8a).
{
    no utf8;
    $_ = "I\xcaJ";

    $_ =~ tr/I-J/i-j/;

    print(($_ eq "i\xcaj") ? '' : 'not ', "ok 4\n");
}
c8e3bb4c 39#
2de7b02f 40
# 5: tr must cancel IOK and NOK.  Each variable is assigned a number and
# then transliterated in the same expression; the arithmetic below only
# adds up to 71 (32 + 32 + 3.5 + 3.5) if the numeric value is taken from
# the transliterated string.  Both package variables and lexicals are
# exercised.  $y is deliberately a file-scoped lexical: later tests reuse it.
($x = 12) =~ tr/1/3/;
($f = 1.5) =~ tr/1/3/;
(my $y = 12) =~ tr/1/3/;
(my $g = 1.5) =~ tr/1/3/;
print((71 == $x + $y + $f + $g) ? '' : 'not ', "ok 5\n");
48
# 6: tr must be harmless when it is not updating - see [ID 20000511.005].
# A match captures into $1, a tr with an empty replacement list is applied
# to $1, and a following substitution that captures again must still
# produce 'Fred'.
$_ = 'fred';
$_ =~ /([a-z]{2})/;
$1 =~ tr/A-Z//;
$_ =~ s/^(\s*)f/$1F/;
print(($_ eq 'Fred') ? '' : 'not ', "ok 6\n");
56
# 7-8: check that tr handles UTF8 correctly.  256.65.258 is a bare v-string
# literal: a three-character string with code points 256, 65 and 258.
# tr/a/b/ has nothing to change in it.
($x = 256.65.258) =~ tr/a/b/;
print "not " unless $x eq 256.65.258 and length($x) == 3;
print "ok 7\n";

# tr/A/B/ changes code point 65 to 66 only where ord("\t") == 9 (ASCII);
# on other platforms the string is expected to stay as it was.
$x =~ tr/A/B/;
print "not " unless length($x) == 3
    and $x eq (ord("\t") == 9 ? 256.66.258 : 256.65.258);
print "ok 8\n";

# 9-10: EBCDIC variants of the above tests, using code point 193 in the
# middle.  Here the expectations are mirrored: unchanged on ASCII, 193
# becoming 194 elsewhere.
($x = 256.193.258) =~ tr/a/b/;
print "not " unless $x eq 256.193.258 and length($x) == 3;
print "ok 9\n";

$x =~ tr/A/B/;
print "not " unless length($x) == 3
    and $x eq (ord("\t") == 9 ? 256.193.258 : 256.194.258);
print "ok 10\n";
036b4402 81
# 11-17: transliteration between byte-range and wide (> 255) characters.
# The strings are bare v-string literals (e.g. 200.300.400 is the three
# characters with code points 200, 300 and 400).  On failure tests 11-14
# also print the actual code points via %vd.  $x is a package variable;
# $y is the file-scoped lexical declared earlier in the script.
# (The original block declared two lexicals, $l and $r, that nothing read;
# they have been dropped.)
{
    # 11 - changing UTF8 characters in a UTF8 string, same length.
    $x = 200.300.400;
    $x =~ tr/\x{12c}/\x{190}/;
    printf "not (%vd) ", $x if $x ne 200.400.400 or length $x != 3;
    print "ok 11\n";

    # 12 - changing UTF8 characters in UTF8 string, more bytes.
    $x = 200.300.400;
    $x =~ tr/\x{12c}/\x{be8}/;
    printf "not (%vd) ", $x if $x ne 200.3048.400 or length $x != 3;
    print "ok 12\n";

    # 13 - introducing UTF8 characters to non-UTF8 string.
    $x = 100.125.60;
    $x =~ tr/\x{64}/\x{190}/;
    printf "not (%vd) ", $x if $x ne 400.125.60 or length $x != 3;
    print "ok 13\n";

    # 14 - removing UTF8 characters from UTF8 string
    $x = 400.125.60;
    $x =~ tr/\x{190}/\x{64}/;
    printf "not (%vd) ", $x if $x ne 100.125.60 or length $x != 3;
    print "ok 14\n";

    # 15 - counting UTF8 chars in UTF8 string
    $x = 400.125.60.400;
    $y = $x =~ tr/\x{190}/\x{190}/;
    print "not " if $y != 2;
    print "ok 15\n";

    # 16 - counting non-UTF8 chars in UTF8 string
    $x = 60.400.125.60.400;
    $y = $x =~ tr/\x{3c}/\x{3c}/;
    print "not " if $y != 2;
    print "ok 16\n";

    # 17 - counting UTF8 chars in non-UTF8 string
    $x = 200.125.60;
    $y = $x =~ tr/\x{190}/\x{190}/;
    print "not " if $y != 0;
    print "ok 17\n";
}
c2e66d9e 126
# 18: test brokenness with tr/a-z-9//; - a range that continues with a
# second hyphen must be rejected when the string is compiled.
$_ = "abcdefghijklmnopqrstuvwxyz";
eval "tr/a-z-9/ /";
print "not " unless $@ =~ /^Ambiguous range in transliteration operator/;
print "ok 18\n";

# 19-21: Make sure leading and trailing hyphens still work - they stand for
# a literal '-' and the a-m range is still honoured.
$_ = "car-rot9";
$_ =~ tr/-a-m/./;
print "not " unless $_ eq '..r.rot9';
print "ok 19\n";

$_ = "car-rot9";
$_ =~ tr/a-m-/./;
print "not " unless $_ eq '..r.rot9';
print "ok 20\n";

$_ = "car-rot9";
$_ =~ tr/-a-m-/./;
print "not " unless $_ eq '..r.rot9';
print "ok 21\n";

# 22-24: single characters mixed with one or more ranges.
$_ = "abcdefghijklmnop";
$_ =~ tr/ae-hn/./;
print "not " unless $_ eq '.bcd....ijklm.op';
print "ok 22\n";

$_ = "abcdefghijklmnop";
$_ =~ tr/a-cf-kn-p/./;
print "not " unless $_ eq '...de......lm...';
print "ok 23\n";

$_ = "abcdefghijklmnop";
$_ =~ tr/a-ceg-ikm-o/./;
print "not " unless $_ eq '...d.f...j.l...p';
print "ok 24\n";

# 25: Test reversed range check
# 20000705 MJD
eval "tr/m-d/ /";
print "not "
    unless $@ =~ /^Invalid \[\] range "m-d" in transliteration operator/;
print "ok 25\n";
c2e66d9e 163
# 26: test cannot update if read-only - an updating tr on $1 must die.
eval '$1 =~ tr/x/y/';
print "not " unless $@ =~ /^Modification of a read-only value attempted/;
print "ok 26\n";

# 27: test can count read-only - a counting tr on $1 ("bcd") returns 3.
'abcdef' =~ /(bcd)/;
print "not " unless eval('$1 =~ tr/abcd//') == 3;
print "ok 27\n";

# 28: test lhs OK if not updating - counting in a string constant is fine.
print "not " unless eval('"123" =~ tr/12//') == 2;
print "ok 28\n";

# 29: test lhs bad if updating - an updating tr on a constant is rejected.
eval '"123" =~ tr/1/1/';
print "not "
    unless $@ =~ m|^Can't modify constant item in transliteration \(tr///\)|;
print "ok 29\n";
d897a58d 180
# v300 (0x12c) is UTF-8-encoded as 196 172 (0xc4 0xac)
# v400 (0x190) is UTF-8-encoded as 198 144 (0xc6 0x90)
#
# The strings below therefore contain both the wide character 300 and the
# two separate characters 196, 172.

# 30-33: Transliterate a byte to a byte, all four ways: each side of the
# tr is written once as \xHH and once as \x{HH}.  Input and expected
# result are the same for all four.
{
    my $input  = v300.196.172.300.196.172;
    my $expect = v300.197.172.300.197.172;

    ($a = $input) =~ tr/\xc4/\xc5/;
    print(($a eq $expect) ? '' : 'not ', "ok 30\n");

    ($a = $input) =~ tr/\xc4/\x{c5}/;
    print(($a eq $expect) ? '' : 'not ', "ok 31\n");

    ($a = $input) =~ tr/\x{c4}/\xc5/;
    print(($a eq $expect) ? '' : 'not ', "ok 32\n");

    ($a = $input) =~ tr/\x{c4}/\x{c5}/;
    print(($a eq $expect) ? '' : 'not ', "ok 33\n");
}
201
# 34: Transliterate a byte to a wide character.
$a = v300.196.172.300.196.172;
$a =~ tr/\xc4/\x{12d}/;
print(($a eq v300.301.172.300.301.172) ? '' : 'not ', "ok 34\n");

# 35: Transliterate a wide character to a byte.
$a = v300.196.172.300.196.172;
$a =~ tr/\x{12c}/\xc3/;
print(($a eq v195.196.172.195.196.172) ? '' : 'not ', "ok 35\n");

# 36: Transliterate a wide character to a wide character.
$a = v300.196.172.300.196.172;
$a =~ tr/\x{12c}/\x{12d}/;
print(($a eq v301.196.172.301.196.172) ? '' : 'not ', "ok 36\n");

# 37: Transliterate both ways.
$a = v300.196.172.300.196.172;
$a =~ tr/\xc4\x{12c}/\x{12d}\xc3/;
print(($a eq v195.301.172.195.301.172) ? '' : 'not ', "ok 37\n");

# 38: Transliterate all (four) ways.  Only 172, 196, 300 and 400 are in the
# search list, so the trailing 198.144 must come through unchanged.
$a = v300.196.172.300.196.172.400.198.144;
$a =~ tr/\xac\xc4\x{12c}\x{190}/\xad\x{12d}\xc5\x{191}/;
print(($a eq v197.301.173.197.301.173.401.198.144) ? '' : 'not ', "ok 38\n");
232
# 39-40: Transliterate and count.  The return value of an updating tr is
# the number of characters it matched: two for the byte 196 and two for
# the wide character 300.
{
    my $hits = ($a = v300.196.172.300.196.172) =~ tr/\xc4/\xc5/;
    print "not " if $hits != 2;
    print "ok 39\n";
}

{
    my $hits = ($a = v300.196.172.300.196.172) =~ tr/\x{12c}/\x{12d}/;
    print "not " if $hits != 2;
    print "ok 40\n";
}
242
# 41-42: Transliterate with complement (/c): everything except the listed
# character is replaced.
$a = v300.196.172.300.196.172;
$a =~ tr/\xc4/\x{12d}/c;
print(($a eq v301.196.301.301.196.301) ? '' : 'not ', "ok 41\n");

$a = v300.196.172.300.196.172;
$a =~ tr/\x{12c}/\xc5/c;
print(($a eq v300.197.197.300.197.197) ? '' : 'not ', "ok 42\n");

# 43-44: Transliterate with deletion (/d): the listed character is removed.
$a = v300.196.172.300.196.172;
$a =~ tr/\xc4//d;
print(($a eq v300.172.300.172) ? '' : 'not ', "ok 43\n");

$a = v300.196.172.300.196.172;
$a =~ tr/\x{12c}//d;
print(($a eq v196.172.196.172) ? '' : 'not ', "ok 44\n");

# 45-46: Transliterate with squeeze (/s): runs of the translated character
# collapse to one; runs of other characters are left alone.
$a = v196.196.172.300.300.196.172;
$a =~ tr/\xc4/\xc5/s;
print(($a eq v197.172.300.300.197.172) ? '' : 'not ', "ok 45\n");

$a = v196.172.300.300.196.172.172;
$a =~ tr/\x{12c}/\x{12d}/s;
print(($a eq v196.172.301.196.172.172) ? '' : 'not ', "ok 46\n");
272
# 47-49: Tricky cases by Simon Cozens.  The string holds the characters
# 196 and 172 but no character 300, so a tr that targets \x{12c} must
# leave it untouched whether it replaces, maps to itself, or deletes.
$a = v196.172.200;
$a =~ tr/\x{12c}/a/;
print((sprintf("%vd", $a) eq '196.172.200') ? '' : 'not ', "ok 47\n");

$a = v196.172.200;
$a =~ tr/\x{12c}/\x{12c}/;
print((sprintf("%vd", $a) eq '196.172.200') ? '' : 'not ', "ok 48\n");

$a = v196.172.200;
$a =~ tr/\x{12c}//d;
print((sprintf("%vd", $a) eq '196.172.200') ? '' : 'not ', "ok 49\n");

# 50-51: UTF8 range tests from Inaba Hiroto - a wide range mapped onto a
# byte range and the reverse.
# Not working in EBCDIC as of 12674.
$a = v300.196.172.302.197.172;
$a =~ tr/\x{12c}-\x{130}/\xc0-\xc4/;
print(($a eq v192.196.172.194.197.172) ? '' : 'not ', "ok 50\n");

$a = v300.196.172.302.197.172;
$a =~ tr/\xc4-\xc8/\x{12c}-\x{130}/;
print(($a eq v300.300.172.302.301.172) ? '' : 'not ', "ok 51\n");
8973db79 297
# 52-55: UTF8 range tests from Karsten Sperling (patch #9008 required).
# A range that ends on \x{100}, and complemented byte ranges, must each
# turn the single character 256 into "X".
$a = "\x{0100}";
$a =~ tr/\x00-\x{100}/X/;
print(($a eq "X") ? '' : 'not ', "ok 52\n");

$a = "\x{0100}";
$a =~ tr/\x{0000}-\x{00ff}/X/c;
print(($a eq "X") ? '' : 'not ', "ok 53\n");

$a = "\x{0100}";
$a =~ tr/\x{0000}-\x{00ff}\x{0101}/X/c;
print(($a eq "X") ? '' : 'not ', "ok 54\n");

# Same as 54, with the input written as a v-string.
$a = v256;
$a =~ tr/\x{0000}-\x{00ff}\x{0101}/X/c;
print(($a eq "X") ? '' : 'not ', "ok 55\n");

# 56-57: UTF8 range tests from Inaba Hiroto - complement of a range that
# crosses the 255/256 boundary, without and with squeeze.
$a = "\x{200}";
$a =~ tr/\x00-\x{100}/X/c;
print(($a eq "X") ? '' : 'not ', "ok 56\n");

$a = "\x{200}";
$a =~ tr/\x00-\x{100}/X/cs;
print(($a eq "X") ? '' : 'not ', "ok 57\n");
325
# Tricky on EBCDIC: while [a-z] [A-Z] must not match the gap characters,
# (i-j, r-s, I-J, R-S), [\x89-\x91] [\xc9-\xd1] has to match them,
# from Karsten Sperling.

# 58: a range given by code point covers all eight characters of the string.
# Not working in EBCDIC as of 12674.
$c = ($a = "\x89\x8a\x8b\x8c\x8d\x8f\x90\x91") =~ tr/\x89-\x91/X/;
print(($c == 8 && $a eq "XXXXXXXX") ? '' : 'not ', "ok 58\n");

# 59: likewise for the \xc9-\xd1 range.
# Not working in EBCDIC as of 12674.
$c = ($a = "\xc9\xca\xcb\xcc\xcd\xcf\xd0\xd1") =~ tr/\xc9-\xd1/X/;
print(($c == 8 && $a eq "XXXXXXXX") ? '' : 'not ', "ok 59\n");
339
# 60-61: only meaningful where 'i' is \x89 and 'J' is \xd1 (EBCDIC).  There
# the letter ranges i-j and I-J must match just their two end points and
# leave the gap characters between them alone.  Everywhere else both tests
# are reported as skipped.
# The platform probe uses logical && (the original used bitwise &, which
# gave the same answer here but is not the operator for combining two
# conditions and does not short-circuit).
if (ord('i') == 0x89 && ord('J') == 0xd1) {

    $c = ($a = "\x89\x8a\x8b\x8c\x8d\x8f\x90\x91") =~ tr/i-j/X/;
    print "not " unless $c == 2 and $a eq "X\x8a\x8b\x8c\x8d\x8f\x90X";
    print "ok 60\n";

    $c = ($a = "\xc9\xca\xcb\xcc\xcd\xcf\xd0\xd1") =~ tr/I-J/X/;
    print "not " unless $c == 2 and $a eq "X\xca\xcb\xcc\xcd\xcf\xd0X";
    print "ok 61\n";

}
else {
    for (60..61) { print "ok $_ # Skip: not EBCDIC\n" }
}
1ed601ec 353
# 62-63: complement of the full byte range applied to the single character
# 256, without and with squeeze; the result is compared by code point.
$a = "\x{100}";
$a =~ tr/\x00-\xff/X/c;
print((ord($a) == ord("X")) ? '' : 'not ', "ok 62\n");

$a = "\x{100}";
$a =~ tr/\x00-\xff/X/cs;
print((ord($a) == ord("X")) ? '' : 'not ', "ok 63\n");

# 64-65: complemented wide range with an empty replacement list.  Without
# /s the string is expected unchanged; with /s the two identical
# characters are expected to be squeezed into one.
$a = "\x{100}\x{100}";
$a =~ tr/\x{101}-\x{200}//c;
print(($a eq "\x{100}\x{100}") ? '' : 'not ', "ok 64\n");

$a = "\x{100}\x{100}";
$a =~ tr/\x{101}-\x{200}//cs;
print(($a eq "\x{100}") ? '' : 'not ', "ok 65\n");

# 66: two bytes each mapped to a different wide character.
$a = "\xfe\xff";
$a =~ tr/\xfe\xff/\x{1ff}\x{1fe}/;
print(($a eq "\x{1ff}\x{1fe}") ? '' : 'not ', "ok 66\n");
76ef7183 373
# 67: From David Dyck - after deleting 'R' and '_' the remaining "0001"
# must read as the hexadecimal number 1.
$a = "R0_001";
$a =~ tr/R_//d;
print((hex($a) == 1) ? '' : 'not ', "ok 67\n");

# 68-69: From Inaba Hiroto.  The map/for constructs are the subject of the
# test and are kept exactly as written.
# 68: y/// applied through "for $_" inside map changes the array elements.
@a = (1,2); map { y/1/./ for $_ } @a;
print(("@a" eq ". 2") ? '' : 'not ', "ok 68\n");

# 69: applied to the expression $_.'' instead, the array must stay intact.
@a = (1,2); map { y/1/./ for $_.'' } @a;
print(("@a" eq "1 2") ? '' : 'not ', "ok 69\n");

# 70: Additional test for Inaba Hiroto patch (robin@kitsite.com) -
# complemented byte range with a three-character replacement list.
$a = "\x{100}\x{102}\x{101}";
$a =~ tr/\x00-\377/XYZ/c;
print(($a eq "XZY") ? '' : 'not ', "ok 70\n");
392
393