On Win32 the end.t failure should be gone now.
[p5sagit/p5-mst-13.2.git] / ext / Encode / TW / TW.pm
CommitLineData
0e567a6c 1package Encode::TW;
071db25d 2BEGIN {
3 if (ord("A") == 193) {
4 die "Encode::TW not supported on EBCDIC\n";
5 }
6}
0ab8f81e 7our $VERSION = do { my @r = (q$Revision: 1.24 $ =~ /\d+/g); sprintf "%d."."%02d" x $#r, @r };
c0d88b76 8
9use Encode;
0e567a6c 10use XSLoader;
b2704119 11XSLoader::load(__PACKAGE__,$VERSION);
0e567a6c 12
131;
14__END__
67d7b5ef 15
b2729934 16=head1 NAME
17
18Encode::TW - Taiwan-based Chinese Encodings
19
20=head1 SYNOPSIS
21
1b2c56c8 22 use Encode qw/encode decode/;
2b217bf7 23 $big5 = encode("big5", $utf8); # loads Encode::TW implicitly
ee981de6 24 $utf8 = decode("big5", $big5); # ditto
b2729934 25
26=head1 DESCRIPTION
27
0ab8f81e 28This module implements traditional Chinese charset encodings as used
29in Taiwan and Hong Kong.
b2729934 30Encodings supported are as follows.
31
1b2c56c8 32 Canonical Alias Description
33 --------------------------------------------------------------------
b0b300a3 34 big5-eten /\bbig-?5$/i Big5 encoding (with ETen extensions)
35 /\bbig5-?et(en)?$/i
36 big5-hkscs /\bbig5-?hk(scs)?$/i
37 Big5 + Cantonese characters in Hong Kong
a999c27c 38 MacChineseTrad Big5 + Apple Vendor Mappings
1b2c56c8 39 cp950 Code Page 950
a999c27c 40 = Big5 + Microsoft vendor mappings
5129552c 41 --------------------------------------------------------------------
42
0ab8f81e 43To find out how to use this module in detail, see L<Encode>.
b2729934 44
45=head1 NOTES
46
85982a32 47Due to size concerns, C<EUC-TW> (Extended Unix Code), C<CCCII>
b0b300a3 48(Chinese Character Code for Information Interchange), C<BIG5PLUS>
49(CMEX's Big5+) and C<BIG5EXT> (CMEX's Big5e) are distributed separately
50on CPAN, under the name L<Encode::HanExtra>. That module also contains
51extra China-based encodings.
b2729934 52
53=head1 BUGS
54
b0b300a3 55Since the original C<big5> encoding (1984) is not supported anywhere
56(glibc and DOS-based systems use C<big5> to mean C<big5-eten>; Microsoft
0ab8f81e 57uses C<big5> to mean C<cp950>), a conscious decision was made to alias
b0b300a3 58C<big5> to C<big5-eten>, which is the de facto superset of the original
59big5.
60
85982a32 61The C<CNS11643> encoding files are not complete. For common C<CNS11643>
b2729934 62manipulation, please use C<EUC-TW> in L<Encode::HanExtra>, which contains
0ab8f81e 63planes 1-7.
b2729934 64
0ab8f81e 65The ASCII region (0x00-0x7f) is preserved for all encodings, even
66though this conflicts with mappings by the Unicode Consortium. See
b2729934 67
a63c962f 68L<http://www.debian.or.jp/~kubota/unicode-symbols.html.en>
b2729934 69
0ab8f81e 70to find out why it is implemented that way.
b2729934 71
72=head1 SEE ALSO
73
85982a32 74L<Encode>
b2729934 75
76=cut