integrate from perlio: changes #17709, #17795, #17796, #18032
[p5sagit/p5-mst-13.2.git] / lib / charnames.t
CommitLineData
423cee85 1#!./perl
2
52ea3e69 3my @WARN;
4
423cee85 5BEGIN {
6 unless(grep /blib/, @INC) {
7 chdir 't' if -d 't';
20822f61 8 @INC = '../lib';
423cee85 9 }
52ea3e69 10 $SIG{__WARN__} = sub { push @WARN, @_ };
423cee85 11}
12
13$| = 1;
822ebcc8 14
35c0985d 15print "1..69\n";
423cee85 16
17use charnames ':full';
18
93979888 19print "not " unless "Here\N{EXCLAMATION MARK}?" eq "Here!?";
423cee85 20print "ok 1\n";
21
c82a54e6 22{
5d9a6404 23 use bytes; # TEST -utf8 can switch utf8 on
c82a54e6 24
25 print "# \$res=$res \$\@='$@'\nnot "
26 if $res = eval <<'EOE'
423cee85 27use charnames ":full";
4a2d328f 28"Here: \N{CYRILLIC SMALL LETTER BE}!";
423cee85 291
30EOE
c82a54e6 31 or $@ !~ /above 0xFF/;
32 print "ok 2\n";
33 # print "# \$res=$res \$\@='$@'\n";
423cee85 34
c82a54e6 35 print "# \$res=$res \$\@='$@'\nnot "
36 if $res = eval <<'EOE'
423cee85 37use charnames 'cyrillic';
4a2d328f 38"Here: \N{Be}!";
423cee85 391
40EOE
c82a54e6 41 or $@ !~ /CYRILLIC CAPITAL LETTER BE.*above 0xFF/;
42 print "ok 3\n";
43}
423cee85 44
45# If octal representation of unicode char is \0xyzt, then the utf8 is \3xy\2zt
210db7fc 46if (ord('A') == 65) { # as on ASCII or UTF-8 machines
47 $encoded_be = "\320\261";
48 $encoded_alpha = "\316\261";
49 $encoded_bet = "\327\221";
50 $encoded_deseng = "\360\220\221\215";
51}
52else { # EBCDIC where UTF-EBCDIC may be used (this may be 1047 specific since
53 # UTF-EBCDIC is codepage specific)
54 $encoded_be = "\270\102\130";
55 $encoded_alpha = "\264\130";
56 $encoded_bet = "\270\125\130";
57 $encoded_deseng = "\336\102\103\124";
58}
c5cc3500 59
60sub to_bytes {
f9a63242 61 pack"a*", shift;
c5cc3500 62}
63
423cee85 64{
65 use charnames ':full';
423cee85 66
c5cc3500 67 print "not " unless to_bytes("\N{CYRILLIC SMALL LETTER BE}") eq $encoded_be;
423cee85 68 print "ok 4\n";
69
70 use charnames qw(cyrillic greek :short);
71
c5cc3500 72 print "not " unless to_bytes("\N{be},\N{alpha},\N{hebrew:bet}")
423cee85 73 eq "$encoded_be,$encoded_alpha,$encoded_bet";
74 print "ok 5\n";
75}
e1992b6d 76
77{
78 use charnames ':full';
79 print "not " unless "\x{263a}" eq "\N{WHITE SMILING FACE}";
80 print "ok 6\n";
81 print "not " unless length("\x{263a}") == 1;
82 print "ok 7\n";
83 print "not " unless length("\N{WHITE SMILING FACE}") == 1;
84 print "ok 8\n";
85 print "not " unless sprintf("%vx", "\x{263a}") eq "263a";
86 print "ok 9\n";
87 print "not " unless sprintf("%vx", "\N{WHITE SMILING FACE}") eq "263a";
88 print "ok 10\n";
f08d6ad9 89 print "not " unless sprintf("%vx", "\xFF\N{WHITE SMILING FACE}") eq "ff.263a";
90 print "ok 11\n";
91 print "not " unless sprintf("%vx", "\x{ff}\N{WHITE SMILING FACE}") eq "ff.263a";
92 print "ok 12\n";
e1992b6d 93}
c00525d4 94
95{
96 use charnames qw(:full);
55eda711 97 use utf8;
c00525d4 98
99 my $x = "\x{221b}";
100 my $named = "\N{CUBE ROOT}";
101
102 print "not " unless ord($x) == ord($named);
103 print "ok 13\n";
104}
105
f9a63242 106{
107 use charnames qw(:full);
55eda711 108 use utf8;
f9a63242 109 print "not " unless "\x{100}\N{CENT SIGN}" eq "\x{100}"."\N{CENT SIGN}";
110 print "ok 14\n";
111}
112
b896c7a5 113{
114 use charnames ':full';
115
116 print "not "
117 unless to_bytes("\N{DESERET SMALL LETTER ENG}") eq $encoded_deseng;
118 print "ok 15\n";
4765795a 119}
b896c7a5 120
4765795a 121{
122 # 20001114.001
123
4c53e876 124 no utf8; # naked Latin-1
3ba0e062 125
4765795a 126 if (ord("Ä") == 0xc4) { # Try to do this only on Latin-1.
127 use charnames ':full';
128 my $text = "\N{LATIN CAPITAL LETTER A WITH DIAERESIS}";
129 print "not " unless $text eq "\xc4" && ord($text) == 0xc4;
130 print "ok 16\n";
131 } else {
132 print "ok 16 # Skip: not Latin-1\n";
133 }
b896c7a5 134}
135
daf0d493 136{
137 print "not " unless charnames::viacode(0x1234) eq "ETHIOPIC SYLLABLE SEE";
138 print "ok 17\n";
139
a23c04e4 140 # Unused Hebrew.
11881cb4 141 print "not " if defined charnames::viacode(0x0590);
daf0d493 142 print "ok 18\n";
143}
144
145{
146 print "not " unless
51b0dbc4 147 sprintf("%04X", charnames::vianame("GOTHIC LETTER AHSA")) eq "10330";
daf0d493 148 print "ok 19\n";
149
150 print "not " if
151 defined charnames::vianame("NONE SUCH");
152 print "ok 20\n";
153}
4e2cda5d 154
155{
156 # check that caching at least hasn't broken anything
157
158 print "not " unless charnames::viacode(0x1234) eq "ETHIOPIC SYLLABLE SEE";
159 print "ok 21\n";
160
161 print "not " unless
51b0dbc4 162 sprintf("%04X", charnames::vianame("GOTHIC LETTER AHSA")) eq "10330";
4e2cda5d 163 print "ok 22\n";
164
165}
301a3cda 166
822ebcc8 167print "not " unless "\N{CHARACTER TABULATION}" eq "\t";
301a3cda 168print "ok 23\n";
169
170print "not " unless "\N{ESCAPE}" eq "\e";
171print "ok 24\n";
172
173print "not " unless "\N{NULL}" eq "\c@";
174print "ok 25\n";
175
eb380778 176if ($^O eq 'MacOS')
177{
178 print "not " unless "\N{CARRIAGE RETURN (CR)}" eq "\n";
179 print "ok 26\n";
180
181 print "not " unless "\N{CARRIAGE RETURN}" eq "\n";
182 print "ok 27\n";
183
184 print "not " unless "\N{CR}" eq "\n";
185 print "ok 28\n";
186}
187else
188{
189 print "not " unless "\N{LINE FEED (LF)}" eq "\n";
190 print "ok 26\n";
52ea3e69 191
eb380778 192 print "not " unless "\N{LINE FEED}" eq "\n";
193 print "ok 27\n";
52ea3e69 194
eb380778 195 print "not " unless "\N{LF}" eq "\n";
196 print "ok 28\n";
197}
52ea3e69 198
a2e77dd4 199my $nel = ord("A") == 193 ? qr/^(?:\x15|\x25)$/ : qr/^\x85$/;
200
201print "not " unless "\N{NEXT LINE (NEL)}" =~ $nel;
52ea3e69 202print "ok 29\n";
203
a2e77dd4 204print "not " unless "\N{NEXT LINE}" =~ $nel;
52ea3e69 205print "ok 30\n";
206
a2e77dd4 207print "not " unless "\N{NEL}" =~ $nel;
51e9e896 208print "ok 31\n";
209
274085e3 210print "not " unless "\N{BYTE ORDER MARK}" eq chr(0xFEFF);
51e9e896 211print "ok 32\n";
212
d7d589a8 213print "not " unless "\N{BOM}" eq chr(0xFEFF);
51e9e896 214print "ok 33\n";
215
52ea3e69 216{
217 use warnings 'deprecated';
218
219 print "not " unless "\N{HORIZONTAL TABULATION}" eq "\t";
51e9e896 220 print "ok 34\n";
52ea3e69 221
222 print "not " unless grep { /"HORIZONTAL TABULATION" is deprecated/ } @WARN;
51e9e896 223 print "ok 35\n";
822ebcc8 224
52ea3e69 225 no warnings 'deprecated';
226
227 print "not " unless "\N{VERTICAL TABULATION}" eq "\013";
51e9e896 228 print "ok 36\n";
52ea3e69 229
230 print "not " if grep { /"VERTICAL TABULATION" is deprecated/ } @WARN;
51e9e896 231 print "ok 37\n";
52ea3e69 232}
822ebcc8 233
274085e3 234print "not " unless charnames::viacode(0xFEFF) eq "ZERO WIDTH NO-BREAK SPACE";
a23c04e4 235print "ok 38\n";
236
872c91ae 237{
238 use warnings;
239 print "not " unless ord("\N{BOM}") == 0xFEFF;
240 print "ok 39\n";
241}
242
24b5d5cc 243print "not " unless ord("\N{ZWNJ}") == 0x200C;
244print "ok 40\n";
245
246print "not " unless ord("\N{ZWJ}") == 0x200D;
247print "ok 41\n";
dbc0d4f2 248
249print "not " unless "\N{U+263A}" eq "\N{WHITE SMILING FACE}";
250print "ok 42\n";
251
51b0dbc4 252{
253 print "not " unless
254 0x3093 == charnames::vianame("HIRAGANA LETTER N");
255 print "ok 43\n";
256
257 print "not " unless
258 0x0397 == charnames::vianame("GREEK CAPITAL LETTER ETA");
259 print "ok 44\n";
260}
261
00d835f2 262print "not " if defined charnames::viacode(0x110000);
51b0dbc4 263print "ok 45\n";
00d835f2 264
265print "not " if grep { /you asked for U+110000/ } @WARN;
51b0dbc4 266print "ok 46\n";
35c0985d 267
268
269# ---- Alias extensions
270
271my $tmpfile = "tmp0000";
272my $alifile = "../lib/unicore/xyzzy_alias.pl";
273my $i = 0;
2741 while -e ++$tmpfile;
275END { if ($tmpfile) { 1 while unlink $tmpfile; } }
276
277my @prgs;
278{ local $/ = undef;
279 @prgs = split "\n########\n", <DATA>;
280 }
281
282my $i = 46;
283for (@prgs) {
284 my ($code, $exp) = ((split m/\nEXPECT\n/), '$');
285 my ($prog, $fil) = ((split m/\nFILE\n/, $code), "");
286 open my $tmp, "> $tmpfile" or die "Could not open $tmpfile: $!";
287 print $tmp $prog, "\n";
288 close $tmp or die "Could not close $tmpfile: $!";
289 if ($fil) {
290 $fil .= "\n";
291 open my $ali, "> $alifile" or die "Could not open $alifile: $!";
292 print $ali $fil;
293 close $ali or die "Could not close $alifile: $!";
294 }
295 my $res =
296 $^O eq "MSWin32" ? `.\\perl -I../lib $switch $tmpfile 2>&1` :
297 $^O eq "NetWare" ? `perl -I../lib $switch $tmpfile 2>&1` :
298 $^O eq "MacOS" ? `$^X -I::lib -MMac::err=unix $switch $tmpfile` :
299 `./perl -I. -I../lib $switch $tmpfile 2>&1`;
300 my $status = $?;
301 $res =~ s/[\r\n]+$//;
302 $res =~ s/tmp\d+/-/g; # fake $prog from STDIN
303 $res =~ s/\n%[A-Z]+-[SIWEF]-.*$// # clip off DCL status msg
304 if $^O eq "VMS";
305 $exp =~ s/[\r\n]+$//;
306 if ($^O eq "MacOS") {
307 $exp =~ s{(\./)?abc\.pm}{:abc.pm}g;
308 $exp =~ s{./abc} {:abc}g;
309 }
310 my $pfx = ($res =~ s/^PREFIX\n//);
311 my $rexp = qr{^$exp};
312 if ($res =~ s/^SKIPPED\n//) {
313 print "$results\n";
314 }
315 elsif (($pfx and $res !~ /^\Q$expected/) or
316 (!$pfx and $res !~ $rexp)) {
317 print STDERR
318 "PROG:\n$prog\n",
319 "FILE:\n$fil",
320 "EXPECTED:\n$exp\n",
321 "GOT:\n$res\n";
322 print "not ";
323 }
324 print "ok ", ++$i, "\n";
325 1 while unlink $tmpfile;
326 $fil or next;
327 1 while unlink $alifile;
328 }
329
330__END__
331# wrong type of alias (missing colon)
332use charnames "alias";
333"Here: \N{e_ACUTE}!\n";
334EXPECT
335Unknown charname 'e_ACUTE' at
336########
337# alias without an argument
338use charnames ":alias";
339"Here: \N{e_ACUTE}!\n";
340EXPECT
341Unknown charname 'e_ACUTE' at
342########
343# alias with hashref but no :full
344use charnames ":alias" => { e_ACUTE => "LATIN SMALL LETTER E WITH ACUTE" };
345"Here: \N{e_ACUTE}!\n";
346EXPECT
347Unknown charname 'LATIN SMALL LETTER E WITH ACUTE' at
348########
349# alias with hashref but with :short
350use charnames ":short", ":alias" => { e_ACUTE => "LATIN SMALL LETTER E WITH ACUTE" };
351"Here: \N{e_ACUTE}!\n";
352EXPECT
353Unknown charname 'LATIN SMALL LETTER E WITH ACUTE' at
354########
355# alias with hashref to :full OK
356use charnames ":full", ":alias" => { e_ACUTE => "LATIN SMALL LETTER E WITH ACUTE" };
357"Here: \N{e_ACUTE}!\n";
358EXPECT
359$
360########
361# alias with hashref to :short but using :full
362use charnames ":full", ":alias" => { e_ACUTE => "LATIN:e WITH ACUTE" };
363"Here: \N{e_ACUTE}!\n";
364EXPECT
365Unknown charname 'LATIN:e WITH ACUTE' at
366########
367# alias with hashref to :short OK
368use charnames ":short", ":alias" => { e_ACUTE => "LATIN:e WITH ACUTE" };
369"Here: \N{e_ACUTE}!\n";
370EXPECT
371$
372########
373# alias with bad hashref
374use charnames ":short", ":alias" => "e_ACUTE";
375"Here: \N{e_ACUTE}\N{a_ACUTE}!\n";
376EXPECT
377Odd number of elements in anonymous hash at
378########
379# alias with arrayref
380use charnames ":short", ":alias" => [ e_ACUTE => "LATIN:e WITH ACUTE" ];
381"Here: \N{e_ACUTE}!\n";
382EXPECT
383Only HASH reference supported as argument to :alias at
384########
385# alias with bad hashref
386use charnames ":short", ":alias" => { e_ACUTE => "LATIN:e WITH ACUTE", "a_ACUTE" };
387"Here: \N{e_ACUTE}\N{a_ACUTE}!\n";
388EXPECT
389Use of uninitialized value in string eq at
390########
391# alias with hashref two aliases
392use charnames ":short", ":alias" => {
393 e_ACUTE => "LATIN:e WITH ACUTE",
394 a_ACUTE => "",
395 };
396"Here: \N{e_ACUTE}\N{a_ACUTE}!\n";
397EXPECT
398Unknown charname '' at
399########
400# alias with hashref two aliases
401use charnames ":short", ":alias" => {
402 e_ACUTE => "LATIN:e WITH ACUTE",
403 a_ACUTE => "LATIN:a WITH ACUTE",
404 };
405"Here: \N{e_ACUTE}\N{a_ACUTE}!\n";
406EXPECT
407$
408########
409# alias with hashref using mixed aliasses
410use charnames ":short", ":alias" => {
411 e_ACUTE => "LATIN:e WITH ACUTE",
412 a_ACUTE => "LATIN SMALL LETTER A WITH ACUT",
413 };
414"Here: \N{e_ACUTE}\N{a_ACUTE}!\n";
415EXPECT
416Unknown charname 'LATIN SMALL LETTER A WITH ACUT' at
417########
418# alias with hashref using mixed aliasses
419use charnames ":short", ":alias" => {
420 e_ACUTE => "LATIN:e WITH ACUTE",
421 a_ACUTE => "LATIN SMALL LETTER A WITH ACUTE",
422 };
423"Here: \N{e_ACUTE}\N{a_ACUTE}!\n";
424EXPECT
425Unknown charname 'LATIN SMALL LETTER A WITH ACUTE' at
426########
427# alias with hashref using mixed aliasses
428use charnames ":full", ":alias" => {
429 e_ACUTE => "LATIN:e WITH ACUTE",
430 a_ACUTE => "LATIN SMALL LETTER A WITH ACUTE",
431 };
432"Here: \N{e_ACUTE}\N{a_ACUTE}!\n";
433EXPECT
434Unknown charname 'LATIN:e WITH ACUTE' at
435########
436# alias with nonexisting file
437use charnames ":full", ":alias" => "xyzzy";
438"Here: \N{e_ACUTE}\N{a_ACUTE}!\n";
439EXPECT
440Odd number of elements in anonymous hash at
441########
442# alias with bad file
443use charnames ":full", ":alias" => "xyzzy";
444"Here: \N{e_ACUTE}\N{a_ACUTE}!\n";
445FILE
446#!perl
4470;
448EXPECT
449Odd number of elements in anonymous hash at
450########
451# alias with file with empty list
452use charnames ":full", ":alias" => "xyzzy";
453"Here: \N{e_ACUTE}\N{a_ACUTE}!\n";
454FILE
455#!perl
456();
457EXPECT
458Unknown charname 'e_ACUTE' at
459########
460# alias with file OK but file has :short aliasses
461use charnames ":full", ":alias" => "xyzzy";
462"Here: \N{e_ACUTE}\N{a_ACUTE}!\n";
463FILE
464#!perl
465( e_ACUTE => "LATIN:e WITH ACUTE",
466 a_ACUTE => "LATIN:a WITH ACUTE",
467 );
468EXPECT
469Unknown charname 'LATIN:e WITH ACUTE' at
470########
471# alias with :short and file OK
472use charnames ":short", ":alias" => "xyzzy";
473"Here: \N{e_ACUTE}\N{a_ACUTE}!\n";
474FILE
475#!perl
476( e_ACUTE => "LATIN:e WITH ACUTE",
477 a_ACUTE => "LATIN:a WITH ACUTE",
478 );
479EXPECT
480$
481########
482# alias with :short and file OK has :long aliasses
483use charnames ":short", ":alias" => "xyzzy";
484"Here: \N{e_ACUTE}\N{a_ACUTE}!\n";
485FILE
486#!perl
487( e_ACUTE => "LATIN SMALL LETTER E WITH ACUTE",
488 a_ACUTE => "LATIN SMALL LETTER A WITH ACUTE",
489 );
490EXPECT
491Unknown charname 'LATIN SMALL LETTER E WITH ACUTE' at
492########
493# alias with file implicit :full but file has :short aliasses
494use charnames ":alias" => ":xyzzy";
495"Here: \N{e_ACUTE}\N{a_ACUTE}!\n";
496FILE
497#!perl
498( e_ACUTE => "LATIN:e WITH ACUTE",
499 a_ACUTE => "LATIN:a WITH ACUTE",
500 );
501EXPECT
502Unknown charname 'LATIN:e WITH ACUTE' at
503########
504# alias with file implicit :full and file has :long aliasses
505use charnames ":alias" => ":xyzzy";
506"Here: \N{e_ACUTE}\N{a_ACUTE}!\n";
507FILE
508#!perl
509( e_ACUTE => "LATIN SMALL LETTER E WITH ACUTE",
510 a_ACUTE => "LATIN SMALL LETTER A WITH ACUTE",
511 );
512EXPECT
513$