Upgrade to Encode 2.00.
[p5sagit/p5-mst-13.2.git] / ext / Encode / TW / TW.pm
CommitLineData
# Encode::TW - Taiwan-based Chinese encodings (full description in the POD
# after __END__).
0e567a6c 1package Encode::TW;
# Refuse to load, at compile time, on EBCDIC platforms: there ord("A") is
# 193, whereas on ASCII-based platforms it is 65.
071db25d 2BEGIN {
3 if (ord("A") == 193) {
4 die "Encode::TW not supported on EBCDIC\n";
5 }
6}
# Derive $VERSION from the RCS Revision keyword: the first number is
# formatted with %d and each following number as a two-digit, zero-padded
# field, so "Revision: 2.0" yields "2.00".
7237418a 7our $VERSION = do { my @r = (q$Revision: 2.0 $ =~ /\d+/g); sprintf "%d."."%02d" x $#r, @r };
c0d88b76 8
9use Encode;
0e567a6c 10use XSLoader;
# Ask XSLoader to load the compiled part of this package, passing $VERSION.
b2704119 11XSLoader::load(__PACKAGE__,$VERSION);
0e567a6c 12
# A module file must finish with a true value so that use/require succeeds.
131;
14__END__
67d7b5ef 15
b2729934 16=head1 NAME
17
18Encode::TW - Taiwan-based Chinese Encodings
19
20=head1 SYNOPSIS
21
1b2c56c8 22 use Encode qw/encode decode/;
2b217bf7 23 $big5 = encode("big5", $utf8); # loads Encode::TW implicitly
ee981de6 24 $utf8 = decode("big5", $big5); # ditto
b2729934 25
26=head1 DESCRIPTION
27
0ab8f81e 28This module implements traditional Chinese charset encodings as used
29in Taiwan and Hong Kong.
b2729934 30Encodings supported are as follows.
31
1b2c56c8 32 Canonical Alias Description
33 --------------------------------------------------------------------
b0b300a3 34 big5-eten /\bbig-?5$/i Big5 encoding (with ETen extensions)
35 /\bbig5-?et(en)?$/i
2d06ad02 36 /\btca-?big5$/i
b0b300a3 37 big5-hkscs /\bbig5-?hk(scs)?$/i
2d06ad02 38 /\bhk(scs)?-?big5$/i
b0b300a3 39 Big5 + Cantonese characters in Hong Kong
ef175861 40 MacChineseTrad Big5 + Apple Vendor Mappings
1b2c56c8 41 cp950 Code Page 950
a999c27c 42 = Big5 + Microsoft vendor mappings
5129552c 43 --------------------------------------------------------------------
44
0ab8f81e 45To find out how to use this module in detail, see L<Encode>.
b2729934 46
47=head1 NOTES
48
85982a32 49Due to size concerns, C<EUC-TW> (Extended Unix Code), C<CCCII>
b0b300a3 50(Chinese Character Code for Information Interchange), C<BIG5PLUS>
51(CMEX's Big5+) and C<BIG5EXT> (CMEX's Big5e) are distributed separately
52on CPAN, under the name L<Encode::HanExtra>. That module also contains
53extra China-based encodings.
b2729934 54
55=head1 BUGS
56
b0b300a3 57Since the original C<big5> encoding (1984) is not supported anywhere
58(glibc and DOS-based systems use C<big5> to mean C<big5-eten>; Microsoft
0ab8f81e 59uses C<big5> to mean C<cp950>), a conscious decision was made to alias
b0b300a3 60C<big5> to C<big5-eten>, which is the de facto superset of the original
61big5.
62
85982a32 63The C<CNS11643> encoding files are not complete. For common C<CNS11643>
b2729934 64manipulation, please use C<EUC-TW> in L<Encode::HanExtra>, which contains
0ab8f81e 65planes 1-7.
b2729934 66
0ab8f81e 67The ASCII region (0x00-0x7f) is preserved for all encodings, even
68though this conflicts with mappings by the Unicode Consortium. See
b2729934 69
a63c962f 70L<http://www.debian.or.jp/~kubota/unicode-symbols.html.en>
b2729934 71
0ab8f81e 72to find out why it is implemented that way.
b2729934 73
74=head1 SEE ALSO
75
85982a32 76L<Encode>
b2729934 77
78=cut