Integrate (@snapshot)
[p5sagit/p5-mst-13.2.git] / t / io / utf8.t
CommitLineData
7d59b7e4 1#!./perl
2
3BEGIN {
4 chdir 't' if -d 't';
5 @INC = '../lib';
f6c77cf1 6 unless (defined &perlio::import) {
7d59b7e4 7 print "1..0 # Skip: not perlio\n";
8 exit 0;
9 }
10}
11
12$| = 1;
360eb788 13print "1..25\n";
7d59b7e4 14
15open(F,"+>:utf8",'a');
16print F chr(0x100).'£';
17print '#'.tell(F)."\n";
18print "not " unless tell(F) == 4;
19print "ok 1\n";
20print F "\n";
21print '#'.tell(F)."\n";
22print "not " unless tell(F) >= 5;
23print "ok 2\n";
24seek(F,0,0);
25print "not " unless getc(F) eq chr(0x100);
26print "ok 3\n";
27print "not " unless getc(F) eq "£";
28print "ok 4\n";
29print "not " unless getc(F) eq "\n";
30print "ok 5\n";
31seek(F,0,0);
32binmode(F,":bytes");
33print "not " unless getc(F) eq chr(0xc4);
34print "ok 6\n";
35print "not " unless getc(F) eq chr(0x80);
36print "ok 7\n";
37print "not " unless getc(F) eq chr(0xc2);
38print "ok 8\n";
39print "not " unless getc(F) eq chr(0xa3);
40print "ok 9\n";
41print "not " unless getc(F) eq "\n";
42print "ok 10\n";
43seek(F,0,0);
44binmode(F,":utf8");
45print "not " unless scalar(<F>) eq "\x{100}£\n";
46print "ok 11\n";
eb5c063a 47seek(F,0,0);
48$buf = chr(0x200);
49$count = read(F,$buf,2,1);
50print "not " unless $count == 2;
51print "ok 12\n";
52print "not " unless $buf eq "\x{200}\x{100}£";
53print "ok 13\n";
7d59b7e4 54close(F);
55
360eb788 56{
57$a = chr(300); # This *is* UTF-encoded
58$b = chr(130); # This is not.
59
60open F, ">:utf8", 'a' or die $!;
61print F $a,"\n";
62close F;
63
64open F, "<:utf8", 'a' or die $!;
65$x = <F>;
66chomp($x);
67print "not " unless $x eq chr(300);
68print "ok 14\n";
69
70open F, "a" or die $!; # Not UTF
71$x = <F>;
72chomp($x);
73print "not " unless $x eq chr(196).chr(172);
74print "ok 15\n";
75close F;
76
77open F, ">:utf8", 'a' or die $!;
79086a00 78binmode(F); # we write a "\n" and then tell() - avoid CRLF issues.
360eb788 79print F $a;
80my $y;
f6c77cf1 81{ my $x = tell(F);
360eb788 82 { use bytes; $y = length($a);}
83 print "not " unless $x == $y;
84 print "ok 16\n";
85}
86
87{ # Check byte length of $b
88use bytes; my $y = length($b);
89print "not " unless $y == 1;
90print "ok 17\n";
91}
92
f9a63242 93print F $b,"\n"; # Don't upgrades $b
360eb788 94
95{ # Check byte length of $b
96use bytes; my $y = length($b);
f9a63242 97print "not ($y) " unless $y == 1;
360eb788 98print "ok 18\n";
99}
100
f6c77cf1 101{ my $x = tell(F);
360eb788 102 { use bytes; $y += 3;}
f9a63242 103 print "not ($x,$y) " unless $x == $y;
360eb788 104 print "ok 19\n";
105}
106
107close F;
108
109open F, "a" or die $!; # Not UTF
110$x = <F>;
111chomp($x);
f9a63242 112printf "not (%vd) ", $x unless $x eq v196.172.194.130;
360eb788 113print "ok 20\n";
114
115open F, "<:utf8", "a" or die $!;
116$x = <F>;
117chomp($x);
118close F;
f9a63242 119printf "not (%vd) ", $x unless $x eq chr(300).chr(130);
360eb788 120print "ok 21\n";
121
122# Now let's make it suffer.
123open F, ">", "a" or die $!;
124eval { print F $a; };
125print "not " unless $@ and $@ =~ /Wide character in print/i;
126print "ok 22\n";
127}
128
129# Hm. Time to get more evil.
130open F, ">:utf8", "a" or die $!;
131print F $a;
132binmode(F, ":bytes");
133print F chr(130)."\n";
134close F;
135
136open F, "<", "a" or die $!;
137$x = <F>; chomp $x;
138print "not " unless $x eq v196.172.130;
139print "ok 23\n";
140
141# Right.
142open F, ">:utf8", "a" or die $!;
143print F $a;
144close F;
145open F, ">>", "a" or die $!;
146print F chr(130)."\n";
147close F;
148
149open F, "<", "a" or die $!;
150$x = <F>; chomp $x;
151print "not " unless $x eq v196.172.130;
152print "ok 24\n";
153
154# Now we have a deformed file.
155open F, "<:utf8", "a" or die $!;
156$x = <F>; chomp $x;
157{ local $SIG{__WARN__} = sub { print "ok 25\n"; };
158eval { sprintf "%vd\n", $x; }
159}
160
161unlink('a');
7d59b7e4 162