2 # $Id: jperl.t,v 1.24 2002/04/26 03:02:04 dankogai Exp $
4 # This script is written in euc-jp
7 require Config; import Config;
8 if ($Config{'extensions'} !~ /\bEncode\b/) {
9 print "1..0 # Skip: Encode was not built\n";
12 unless (find PerlIO::Layer 'perlio') {
13 print "1..0 # Skip: PerlIO was not built\n";
16 if (ord("A") == 193) {
17 print "1..0 # Skip: EBCDIC\n";
23 no utf8; # we have raw Japanese encodings here
26 use Test::More tests => 18;
30 my $Enamae = "\xbe\xae\xbb\xf4\x20\xc3\xc6"; # euc-jp, with \x escapes
31 use encoding "euc-jp";
33 my $Namae = "¾®»ô ÃÆ"; # in Japanese, in euc-jp
34 my $Name = "Dan Kogai"; # in English
35 # euc-jp in \x format but after the pragma. But this one will be converted!
36 my $Ynamae = "\xbe\xae\xbb\xf4\x20\xc3\xc6";
39 my $str = $Namae; $str =~ s/¾®»ô ÃÆ/Dan Kogai/o;
40 is($str, $Name, q{regex});
41 $str = $Namae; $str =~ s/$Namae/Dan Kogai/o;
42 is($str, $Name, q{regex - with variable});
43 is(length($Namae), 4, q{utf8:length});
46 # converted to UTF-8 so 3*3+1
47 is(length($Namae), 10, q{bytes:length});
49 is(length($Enamae), 7, q{euc:length}); # 2*3+1
50 is ($Namae, $Ynamae, q{literal conversions});
51 isnt($Enamae, $Ynamae, q{before and after});
52 is($Enamae, Encode::encode('euc-jp', $Namae));
54 # let's test the scope as well. Must be in utf8 realm
55 is(length($Namae), 4, q{utf8:length});
59 ok(! defined(${^ENCODING}), q{no encoding;});
61 # should've been isnt() but no scoping is suported -- yet
62 ok(! defined(${^ENCODING}), q{not scoped yet});
64 # now let's try some real black magic!
65 local(${^ENCODING}) = Encode::find_encoding("euc-jp");
66 my $str = "\xbe\xae\xbb\xf4\x20\xc3\xc6";
67 is (length($str), 4, q{black magic:length});
68 is ($str, $Enamae, q{black magic:eq});
70 ok(! defined(${^ENCODING}), q{out of black magic});
72 is (length($Namae), 10);
75 # now something completely different!
78 use encoding "euc-jp", Filter=>1;
81 no strict 'vars'; # fools
82 # doesn't work w/ "my" as of this writing.
83 # because of buggy strict.pm and utf8.pm
85 # ^^U+4eba, "human" in CJK ideograph
86 $¿Í++; # a child is born
88 is ($people, 3, "Filter:utf8 identifier");