Updated Encode to CPAN release 2.38
[p5sagit/p5-mst-13.2.git] / cpan / Encode / TW / TW.pm
CommitLineData
# Encode::TW: loader for the XS-implemented Taiwan/Hong Kong Chinese encodings.
0e567a6c 1package Encode::TW;
# Compile-time guard: ord("A") is 193 on EBCDIC platforms, where this module
# refuses to load. The trailing "\n" keeps file/line info out of the message.
071db25d 2BEGIN {
d1256cb1 3 if ( ord("A") == 193 ) {
4 die "Encode::TW not supported on EBCDIC\n";
071db25d 5 }
6}
656ebd29 7use strict;
8use warnings;
c0d88b76 9use Encode;
# Derive $VERSION from the revision keyword string: pull out every run of
# digits, print the first as-is and each following one zero-padded to two
# digits (so revision 2.3 becomes "2.03").
b2deda17 10our $VERSION = do { my @r = ( q$Revision: 2.3 $ =~ /\d+/g ); sprintf "%d." . "%02d" x $#r, @r };
0e567a6c 11use XSLoader;
# Load the compiled (XS) part of this package, passing $VERSION to the loader.
d1256cb1 12XSLoader::load( __PACKAGE__, $VERSION );
0e567a6c 13
# A module file must end by returning a true value.
141;
15__END__
67d7b5ef 16
b2729934 17=head1 NAME
18
19Encode::TW - Taiwan-based Chinese Encodings
20
21=head1 SYNOPSIS
22
1b2c56c8 23 use Encode qw/encode decode/;
2b217bf7 24 $big5 = encode("big5", $utf8); # loads Encode::TW implicitly
ee981de6 25 $utf8 = decode("big5", $big5); # ditto
b2729934 26
27=head1 DESCRIPTION
28
0ab8f81e 29This module implements traditional Chinese charset encodings as used
30in Taiwan and Hong Kong.
b2729934 31Encodings supported are as follows.
32
1b2c56c8 33 Canonical Alias Description
34 --------------------------------------------------------------------
b0b300a3 35 big5-eten /\bbig-?5$/i Big5 encoding (with ETen extensions)
d1256cb1 36 /\bbig5-?et(en)?$/i
37 /\btca-?big5$/i
b0b300a3 38 big5-hkscs /\bbig5-?hk(scs)?$/i
2d06ad02 39 /\bhk(scs)?-?big5$/i
b0b300a3 40 Big5 + Cantonese characters in Hong Kong
ef175861 41 MacChineseTrad Big5 + Apple Vendor Mappings
1b2c56c8 42 cp950 Code Page 950
a999c27c 43 = Big5 + Microsoft vendor mappings
5129552c 44 --------------------------------------------------------------------
45
0ab8f81e 46To find out how to use this module in detail, see L<Encode>.
b2729934 47
48=head1 NOTES
49
85982a32 50Due to size concerns, C<EUC-TW> (Extended Unix Code), C<CCCII>
b0b300a3 51(Chinese Character Code for Information Interchange), C<BIG5PLUS>
52(CMEX's Big5+) and C<BIG5EXT> (CMEX's Big5e) are distributed separately
53on CPAN, under the name L<Encode::HanExtra>. That module also contains
54extra China-based encodings.
b2729934 55
56=head1 BUGS
57
b0b300a3 58Since the original C<big5> encoding (1984) is not supported anywhere
59(glibc and DOS-based systems use C<big5> to mean C<big5-eten>; Microsoft
0ab8f81e 60uses C<big5> to mean C<cp950>), a conscious decision was made to alias
b0b300a3 61C<big5> to C<big5-eten>, which is the de facto superset of the original
62big5.
63
85982a32 64The C<CNS11643> encoding files are not complete. For common C<CNS11643>
b2729934 65manipulation, please use C<EUC-TW> in L<Encode::HanExtra>, which contains
0ab8f81e 66planes 1-7.
b2729934 67
0ab8f81e 68The ASCII region (0x00-0x7f) is preserved for all encodings, even
b2deda17 69though this conflicts with mappings by the Unicode Consortium.
b2729934 70
71=head1 SEE ALSO
72
85982a32 73L<Encode>
b2729934 74
75=cut