Encode simply needs more work on EBCDIC.
[p5sagit/p5-mst-13.2.git] / ext / Encode / t / Aliases.t
CommitLineData
5d030b67 1#!../perl
2
67d7b5ef 3BEGIN {
037b88d6 4 if ($ENV{'PERL_CORE'}){
5 chdir 't';
6 unshift @INC, '../lib';
7 }
67d7b5ef 8 require Config; import Config;
9 if ($Config{'extensions'} !~ /\bEncode\b/) {
10 print "1..0 # Skip: Encode was not built\n";
11 exit 0;
12 }
13}
14
5d030b67 15use strict;
5129552c 16use Encode;
17use Encode::Alias;
a63c962f 18my %a2c;
19my $ON_EBCDIC;
5d030b67 20
a999c27c 21sub init_a2c{
a63c962f 22 %a2c = (
a999c27c 23 'US-ascii' => 'ascii',
2d06ad02 24 'ISO-646-US' => 'ascii',
a999c27c 25 'UTF-8' => 'utf8',
80a5d8e7 26 'UCS-2' => 'UCS-2BE',
27 'UCS2' => 'UCS-2BE',
28 'iso-10646-1' => 'UCS-2BE',
29 'ucs2-le' => 'UCS-2LE',
eaac0a15 30 'ucs2-be' => 'UCS-2BE',
80a5d8e7 31 'utf16' => 'UTF-16',
32 'utf32' => 'UTF-32',
33 'utf16-be' => 'UTF-16BE',
34 'utf32-be' => 'UTF-32BE',
35 'utf16-le' => 'UTF-16LE',
36 'utf32-le' => 'UTF-32LE',
126bf8bf 37 'UCS4-BE' => 'UTF-32BE',
38 'UCS-4-LE' => 'UTF-32LE',
a63c962f 39 'cyrillic' => 'iso-8859-5',
40 'arabic' => 'iso-8859-6',
41 'greek' => 'iso-8859-7',
42 'hebrew' => 'iso-8859-8',
43 'thai' => 'iso-8859-11',
44 'tis620' => 'iso-8859-11',
45 'WinLatin1' => 'cp1252',
46 'WinLatin2' => 'cp1250',
47 'WinCyrillic' => 'cp1251',
48 'WinGreek' => 'cp1253',
49 'WinTurkish' => 'cp1254',
50 'WinHebrew' => 'cp1255',
51 'WinArabic' => 'cp1256',
52 'WinBaltic' => 'cp1257',
53 'WinVietnamese' => 'cp1258',
54 'ja_JP.euc' => $ON_EBCDIC ? '' : 'euc-jp',
55 'x-euc-jp' => $ON_EBCDIC ? '' : 'euc-jp',
56 'zh_CN.euc' => $ON_EBCDIC ? '' : 'euc-cn',
57 'x-euc-cn' => $ON_EBCDIC ? '' : 'euc-cn',
58 'ko_KR.euc' => $ON_EBCDIC ? '' : 'euc-kr',
59 'x-euc-kr' => $ON_EBCDIC ? '' : 'euc-kr',
60 'ujis' => $ON_EBCDIC ? '' : 'euc-jp',
61 'Shift_JIS' => $ON_EBCDIC ? '' : 'shiftjis',
62 'x-sjis' => $ON_EBCDIC ? '' : 'shiftjis',
63 'jis' => $ON_EBCDIC ? '' : '7bit-jis',
b0b300a3 64 'big-5' => $ON_EBCDIC ? '' : 'big5-eten',
65 'zh_TW.Big5' => $ON_EBCDIC ? '' : 'big5-eten',
2d06ad02 66 'tca-big5' => $ON_EBCDIC ? '' : 'big5-eten',
a63c962f 67 'big5-hk' => $ON_EBCDIC ? '' : 'big5-hkscs',
2d06ad02 68 'hkscs-big5' => $ON_EBCDIC ? '' : 'big5-hkscs',
67d7b5ef 69 'GB_2312-80' => $ON_EBCDIC ? '' : 'euc-cn',
67d7b5ef 70 'KS_C_5601-1987' => $ON_EBCDIC ? '' : 'cp949',
80a5d8e7 71 #
72 'gb12345-raw' => $ON_EBCDIC ? '' : 'gb12345-raw',
73 'gb2312-raw' => $ON_EBCDIC ? '' : 'gb2312-raw',
74 'jis0201-raw' => $ON_EBCDIC ? '' : 'jis0201-raw',
75 'jis0208-raw' => $ON_EBCDIC ? '' : 'jis0208-raw',
76 'jis0212-raw' => $ON_EBCDIC ? '' : 'jis0212-raw',
77 'ksc5601-raw' => $ON_EBCDIC ? '' : 'ksc5601-raw',
78 );
a63c962f 79
80 for my $i (1..11,13..16){
81 $a2c{"ISO 8859 $i"} = "iso-8859-$i";
82 }
83 for my $i (1..10){
84 $a2c{"ISO Latin $i"} = "iso-8859-$Encode::Alias::Latin2iso[$i]";
85 }
86 for my $k (keys %Encode::Alias::Winlatin2cp){
87 my $v = $Encode::Alias::Winlatin2cp{$k};
88 $a2c{"Win" . ucfirst($k)} = "cp" . $v;
89 $a2c{"IBM-$v"} = $a2c{"MS-$v"} = "cp" . $v;
2d06ad02 90 $a2c{"cp-" . $v} = "cp" . $v;
9d2ff094 91 }
a999c27c 92 my @a2c = keys %a2c;
93 for my $k (@a2c){
94 $a2c{uc($k)} = $a2c{$k};
95 $a2c{lc($k)} = $a2c{$k};
96 $a2c{lcfirst($k)} = $a2c{$k};
97 $a2c{ucfirst($k)} = $a2c{$k};
98 }
99}
100
101BEGIN{
102 $ON_EBCDIC = ord("A") == 193;
103 @ARGV and $ON_EBCDIC = $ARGV[0] eq 'EBCDIC';
104 $Encode::ON_EBCDIC = $ON_EBCDIC;
105 init_a2c();
9d2ff094 106}
107
a63c962f 108if ($ON_EBCDIC){
109 delete @Encode::ExtModule{
a999c27c 110 qw(euc-cn gb2312 gb12345 gbk cp936 iso-ir-165 MacChineseSimp
67d7b5ef 111 euc-jp iso-2022-jp 7bit-jis shiftjis MacJapanese cp932
a999c27c 112 euc-kr ksc5601 cp949 MacKorean
113 big5 big5-hkscs cp950 MacChineseTrad
a63c962f 114 gb18030 big5plus euc-tw)
115 };
5d030b67 116}
117
a999c27c 118use Test::More tests => (scalar keys %a2c) * 4;
5d030b67 119
a63c962f 120print "# alias test; \$ON_EBCDIC == $ON_EBCDIC\n";
5d030b67 121
eaac0a15 122foreach my $a (keys %a2c){
5d030b67 123 my $e = Encode::find_encoding($a);
eaac0a15 124 is((defined($e) and $e->name), $a2c{$a},$a)
a999c27c 125 or warn "alias was $a";;
5d030b67 126}
127
128# now we override some of the aliases and see if it works fine
129
a999c27c 130define_alias(
131 qr/ascii/i => 'WinLatin1',
132 qr/cyrillic/i => 'WinCyrillic',
133 qr/arabic/i => 'WinArabic',
134 qr/greek/i => 'WinGreek',
135 qr/hebrew/i => 'WinHebrew'
136 );
5d030b67 137
138print "# alias test with alias overrides\n";
139
eaac0a15 140foreach my $a (keys %a2c){
5d030b67 141 my $e = Encode::find_encoding($a);
eaac0a15 142 is((defined($e) and $e->name), $a2c{$a}, "Override $a")
67d7b5ef 143 or warn "alias was $a";
5d030b67 144}
145
5129552c 146print "# alias undef test\n";
147
148Encode::Alias->undef_aliases;
eaac0a15 149foreach my $a (keys %a2c){
5129552c 150 my $e = Encode::find_encoding($a);
eaac0a15 151 ok(!defined($e) || $e->name =~ /-raw$/o,"Undef $a")
a999c27c 152 or warn "alias was $a";
5129552c 153}
154
a999c27c 155print "# alias reinit test\n";
156
157Encode::Alias->init_aliases;
158init_a2c();
eaac0a15 159foreach my $a (keys %a2c){
a999c27c 160 my $e = Encode::find_encoding($a);
eaac0a15 161 is((defined($e) and $e->name), $a2c{$a}, "Reinit $a")
a999c27c 162 or warn "alias was $a";
163}
5d030b67 164__END__
a999c27c 165for my $k (keys %a2c){
166 $k =~ /[A-Z]/ and next;
167 print "$k => $a2c{$k}\n";
5d030b67 168}
169
170
a999c27c 171