1 # Before `make install' is performed this script should be runnable with
2 # `make test'. After `make install' it should work as `perl test.pl'
4 #########################
7 BEGIN { plan tests => 50 };
9 ok(1); # If we made it this far, we're ok.
11 #########################
13 my $Collator = Unicode::Collate->new(
15 normalization => undef,
18 ok(ref $Collator, "Unicode::Collate");
21 join(':', $Collator->sort(
22 qw/ lib strict Carp ExtUtils CGI Time warnings Math overload Pod CPAN /
25 qw/ Carp CGI CPAN ExtUtils lib Math overload Pod strict Time warnings /
29 my $A_acute = pack('U', 0x00C1);
30 my $acute = pack('U', 0x0301);
32 ok($Collator->cmp("A$acute", $A_acute), -1);
34 ok($Collator->cmp("", ""), 0);
35 ok(! $Collator->ne("", "") );
36 ok( $Collator->eq("", "") );
38 ok($Collator->cmp("", "perl"), -1);
40 eval "use Unicode::Normalize";
43 my $NFD = Unicode::Collate->new(
46 ok($NFD->cmp("A$acute", $A_acute), 0);
52 my $tr = Unicode::Collate->new(
54 normalization => undef,
55 ignoreName => qr/^(?:HANGUL|HIRAGANA|KATAKANA|BOPOMOFO)$/,
57 0063 0068 ; [.0893.0020.0002.0063] # "ch" in traditional Spanish
58 0043 0068 ; [.0893.0020.0008.0043] # "Ch" in traditional Spanish
59 00DF ; [.09F3.0154.0004.00DF] [.09F3.0020.0004.00DF] # eszet in Germany
65 qw/ acha aca ada acia acka /
68 qw/ aca acia acka acha ada /
73 join(':', $Collator->sort(
74 qw/ acha aca ada acia acka /
77 qw/ aca acha acia acka ada /
81 my $old_level = $Collator->{level};
82 my $hiragana = "\x{3042}\x{3044}";
83 my $katakana = "\x{30A2}\x{30A4}";
85 $Collator->{level} = 2;
87 ok( $Collator->cmp("ABC","abc"), 0);
88 ok( $Collator->eq("ABC","abc") );
89 ok( $Collator->le("ABC","abc") );
90 ok( $Collator->cmp($hiragana, $katakana), 0);
91 ok( $Collator->eq($hiragana, $katakana) );
92 ok( $Collator->ge($hiragana, $katakana) );
95 ok( $Collator->eq("a\x{AC00}b", "a\x{1100}\x{1161}b") );
96 ok( $Collator->eq("a\x{AE00}b", "a\x{1100}\x{1173}\x{11AF}b") );
97 ok( $Collator->gt("a\x{AE00}b", "a\x{1100}\x{1173}b\x{11AF}") );
98 ok( $Collator->lt("a\x{AC00}b", "a\x{AE00}b") );
99 ok( $Collator->gt("a\x{D7A3}b", "a\x{C544}b") );
100 ok( $Collator->lt("a\x{C544}b", "a\x{30A2}b") ); # hangul < hiragana
102 $Collator->{level} = $old_level;
104 $Collator->{katakana_before_hiragana} = 1;
106 ok( $Collator->cmp("abc", "ABC"), -1);
107 ok( $Collator->ne("abc", "ABC") );
108 ok( $Collator->lt("abc", "ABC") );
109 ok( $Collator->le("abc", "ABC") );
110 ok( $Collator->cmp($hiragana, $katakana), 1);
111 ok( $Collator->ne($hiragana, $katakana) );
112 ok( $Collator->gt($hiragana, $katakana) );
113 ok( $Collator->ge($hiragana, $katakana) );
115 $Collator->{upper_before_lower} = 1;
117 ok( $Collator->cmp("abc", "ABC"), 1);
118 ok( $Collator->ge("abc", "ABC"), 1);
119 ok( $Collator->gt("abc", "ABC"), 1);
120 ok( $Collator->cmp($hiragana, $katakana), 1);
121 ok( $Collator->ge($hiragana, $katakana), 1);
122 ok( $Collator->gt($hiragana, $katakana), 1);
124 $Collator->{katakana_before_hiragana} = 0;
126 ok( $Collator->cmp("abc", "ABC"), 1);
127 ok( $Collator->cmp($hiragana, $katakana), -1);
129 $Collator->{upper_before_lower} = 0;
131 ok( $Collator->cmp("abc", "ABC"), -1);
132 ok( $Collator->le("abc", "ABC") );
133 ok( $Collator->cmp($hiragana, $katakana), -1);
134 ok( $Collator->lt($hiragana, $katakana) );
136 my $ign = Unicode::Collate->new(
138 normalization => undef,
139 ignoreChar => qr/^[ae]$/,
142 ok( $ign->cmp("element","lament"), 0);
144 $Collator->{level} = 2;
148 my $orig = "This is a Perl book.";
151 my $ret = "This is a camel book.";
154 if(my($pos,$len) = $Collator->index($str, $sub)){
155 substr($str, $pos, $len, $rep);
160 $Collator->{level} = $old_level;
163 if(my($pos,$len) = $Collator->index($str, $sub)){
164 substr($str, $pos, $len, $rep);
171 $str = "Ich mu\x{00DF} studieren.";
172 $sub = "m\x{00FC}ss";
174 if(my($pos, $len) = $tr->index($str, $sub)){
175 $match = substr($str, $pos, $len);
177 ok($match, "mu\x{00DF}");
179 $tr->{level} = $old_level;
181 $str = "Ich mu\x{00DF} studieren.";
182 $sub = "m\x{00FC}ss";
184 if(my($pos, $len) = $tr->index($str, $sub)){
185 $match = substr($str, $pos, $len);
190 if(my($pos,$len) = $Collator->index("", "")){
191 $match = substr("", $pos, $len);
196 if(my($pos,$len) = $Collator->index("", "abc")){
197 $match = substr("", $pos, $len);