Needs to be conditional on SunOS 4.
[p5sagit/p5-mst-13.2.git] / t / pragma / utf8.t
index 16a1586..2b208cc 100755 (executable)
@@ -2,7 +2,7 @@
 
 BEGIN {
     chdir 't' if -d 't';
-    unshift @INC, '../lib';
+    @INC = '../lib';
     $ENV{PERL5LIB} = '../lib';
     if ( ord("\t") != 9 ) { # skip on ebcdic platforms
         print "1..0 # Skip utf8 tests on ebcdic platform.\n";
@@ -10,7 +10,7 @@ BEGIN {
     }
 }
 
-print "1..61\n";
+print "1..75\n";
 
 my $test = 1;
 
@@ -20,6 +20,26 @@ sub ok {
     print "ok $test\n";
 }
 
+sub nok {
+    my ($got,$expect) = @_;
+    print "# expected not [$expect], got [$got]\nnot " if $got eq $expect;
+    print "ok $test\n";
+}
+
+sub ok_bytes {
+    use bytes;
+    my ($got,$expect) = @_;
+    print "# expected [$expect], got [$got]\nnot " if $got ne $expect;
+    print "ok $test\n";
+}
+
+sub nok_bytes {
+    use bytes;
+    my ($got,$expect) = @_;
+    print "# expected not [$expect], got [$got]\nnot " if $got eq $expect;
+    print "ok $test\n";
+}
+
 {
     use utf8;
     $_ = ">\x{263A}<"; 
@@ -120,9 +140,9 @@ sub ok {
     $test++;                           # 22
 
     {
-        use bytes;
+       use bytes;
 
-        my $tmp = $&;
+       my $tmp = $&;
        ok $tmp, pack("C*", ord(">"), 0342, 0230, 0272);
        $test++;                                # 23
 
@@ -139,39 +159,51 @@ sub ok {
        $test++;                                # 26
     }
 
+    ok_bytes $&, pack("C*", ord(">"), 0342, 0230, 0272);
+    $test++;                           # 27
+
+    ok_bytes $', pack("C*", 0342, 0230, 0272);
+    $test++;                           # 28
+
+    ok_bytes $`, pack("C*", 0342, 0230, 0272);
+    $test++;                           # 29
+
+    ok_bytes $1, pack("C*", 0342, 0230, 0272);
+    $test++;                           # 30
+
     {
        use bytes;
        no utf8;
 
        ok length, 10;
-       $test++;                                # 27
+       $test++;                                # 31
 
        ok length((m/>(.)/)[0]), 1;
-       $test++;                                # 28
+       $test++;                                # 32
 
        ok length($&), 2;
-       $test++;                                # 29
+       $test++;                                # 33
 
        ok length($'), 5;
-       $test++;                                # 30
+       $test++;                                # 34
 
        ok length($`), 3;
-       $test++;                                # 31
+       $test++;                                # 35
 
        ok length($1), 1;
-       $test++;                                # 32
+       $test++;                                # 36
 
        ok $&, pack("C*", ord(">"), 0342);
-       $test++;                                # 33
+       $test++;                                # 37
 
        ok $', pack("C*", 0230, 0272, 0342, 0230, 0272);
-       $test++;                                # 34
+       $test++;                                # 38
 
        ok $`, pack("C*", 0342, 0230, 0272);
-       $test++;                                # 35
+       $test++;                                # 39
 
        ok $1, pack("C*", 0342);
-       $test++;                                # 36
+       $test++;                                # 40
 
     }
 
@@ -182,90 +214,163 @@ sub ok {
     }
 
     ok length, 10;
-    $test++;                           # 37
+    $test++;                           # 41
 
     ok length((m/>(.)/)[0]), 1;
-    $test++;                           # 38
+    $test++;                           # 42
 
     ok length($&), 2;
-    $test++;                           # 39
+    $test++;                           # 43
 
     ok length($'), 1;
-    $test++;                           # 40
+    $test++;                           # 44
 
     ok length($`), 1;
-    $test++;                           # 41
+    $test++;                           # 45
 
     ok length($1), 1;
-    $test++;                           # 42
+    $test++;                           # 46
 
     ok length($tmp=$&), 2;
-    $test++;                           # 43
+    $test++;                           # 47
 
     ok length($tmp=$'), 1;
-    $test++;                           # 44
+    $test++;                           # 48
 
     ok length($tmp=$`), 1;
-    $test++;                           # 45
+    $test++;                           # 49
 
     ok length($tmp=$1), 1;
-    $test++;                           # 46
+    $test++;                           # 50
 
     {
        use bytes;
 
         my $tmp = $&;
        ok $tmp, pack("C*", ord(">"), 0342, 0230, 0272);
-       $test++;                                # 47
+       $test++;                                # 51
 
         $tmp = $';
        ok $tmp, pack("C*", 0342, 0230, 0272);
-       $test++;                                # 48
+       $test++;                                # 52
 
         $tmp = $`;
        ok $tmp, pack("C*", 0342, 0230, 0272);
-       $test++;                                # 49
+       $test++;                                # 53
 
         $tmp = $1;
        ok $tmp, pack("C*", 0342, 0230, 0272);
-       $test++;                                # 50
+       $test++;                                # 54
     }
     {
        use bytes;
        no utf8;
 
        ok length, 10;
-       $test++;                                # 51
+       $test++;                                # 55
 
        ok length((m/>(.)/)[0]), 1;
-       $test++;                                # 52
+       $test++;                                # 56
 
        ok length($&), 2;
-       $test++;                                # 53
+       $test++;                                # 57
 
        ok length($'), 5;
-       $test++;                                # 54
+       $test++;                                # 58
 
        ok length($`), 3;
-       $test++;                                # 55
+       $test++;                                # 59
 
        ok length($1), 1;
-       $test++;                                # 56
+       $test++;                                # 60
 
        ok $&, pack("C*", ord(">"), 0342);
-       $test++;                                # 57
+       $test++;                                # 61
 
        ok $', pack("C*", 0230, 0272, 0342, 0230, 0272);
-       $test++;                                # 58
+       $test++;                                # 62
 
        ok $`, pack("C*", 0342, 0230, 0272);
-       $test++;                                # 59
+       $test++;                                # 63
 
        ok $1, pack("C*", 0342);
-       $test++;                                # 60
+       $test++;                                # 64
 
     }
 
     ok "\x{ab}" =~ /^\x{ab}$/, 1;
-    $test++;                                   # 61
+    $test++;                                   # 65
+}
+
+{
+    use utf8;
+    ok_bytes chr(0xe2), pack("C*", 0xc3, 0xa2);
+    $test++;                # 66
+}
+
+{
+    use utf8;
+    my @a = map ord, split(//, join("", map chr, (1234, 123, 2345)));
+    ok "@a", "1234 123 2345";
+    $test++;                # 67
+}
+
+{
+    use utf8;
+    my $x = chr(123);
+    my @a = map ord, split(/$x/, join("", map chr, (1234, 123, 2345)));
+    ok "@a", "1234 2345";
+    $test++;                # 68
+}
+
+{
+  my($a,$b);
+  { use bytes; $a = "\xc3\xa4"; }  
+  { use utf8;  $b = "\xe4"; }
+  { use bytes; ok_bytes $a, $b; $test++; } # 69
+  { use utf8;  nok      $a, $b; $test++; } # 70
+}
+
+{
+    my @x = ("stra\337e 138","stra\337e 138");
+    for (@x) {
+       s/(\d+)\s*([\w\-]+)/$1 . uc $2/e;
+       my($latin) = /^(.+)(?:\s+\d)/;
+       print $latin eq "stra\337e" ? "ok $test\n" :
+           "#latin[$latin]\nnot ok $test\n";
+       $test++;
+       $latin =~ s/stra\337e/straße/; # \303\237 after the 2nd a
+       use utf8;
+       $latin =~ s!(s)tr(?:aß|s+e)!$1tr.!; # \303\237 after the a
+    }
+}
+
+{
+    $_ = $dx = "\x{10f2}";
+    s/($dx)/$dx$1/;
+    {
+       use bytes;
+       print "not " unless $_ eq "$dx$dx";
+       print "ok $test\n";
+       $test++;
+    }
+
+    $_ = $dx = "\x{10f2}";
+    s/($dx)/$1$dx/;
+    {
+       use bytes;
+       print "not " unless $_ eq "$dx$dx";
+       print "ok $test\n";
+       $test++;
+    }
+
+    $dx = "\x{10f2}";
+    $_  = "\x{10f2}\x{10f2}";
+    s/($dx)($dx)/$1$2/;
+    {
+       use bytes;
+       print "not " unless $_ eq "$dx$dx";
+       print "ok $test\n";
+       $test++;
+    }
 }