[p5sagit/p5-mst-13.2.git] / t / pragma / locale.t

#!./perl -wT

BEGIN {
    chdir 't' if -d 't';
    @INC = '../lib';
}

use strict;

my $have_setlocale = 0;
eval {
    require POSIX;
    import POSIX ':locale_h';
    $have_setlocale++;
};

print "1..", ($have_setlocale ? 104 : 98), "\n";

use vars qw($a
	    $English $German $French $Spanish
	    @C @English @German @French @Spanish
	    $Locale @Locale %iLocale %UPPER %lower @Neoalpha);

$a = 'abc %';

sub ok {
    my ($n, $result) = @_;

    print 'not ' unless ($result);
    print "ok $n\n";
}

# First we'll do a lot of taint checking for locales.
# This is the easiest to test, actually, as any locale,
# even the default locale will taint under 'use locale'.

sub is_tainted { # hello, camel two.
    my $dummy;
    not eval { $dummy = join("", @_), kill 0; 1 }
}

sub check_taint ($$) {
    ok $_[0], is_tainted($_[1]);
}

sub check_taint_not ($$) {
    ok $_[0], not is_tainted($_[1]);
}

use locale;	# engage locale and therefore locale taint.

check_taint_not   1, $a;

check_taint       2, uc($a);
check_taint       3, "\U$a";
check_taint       4, ucfirst($a);
check_taint       5, "\u$a";
check_taint       6, lc($a);
check_taint       7, "\L$a";
check_taint       8, lcfirst($a);
check_taint       9, "\l$a";

check_taint      10, sprintf('%e', 123.456);
check_taint      11, sprintf('%f', 123.456);
check_taint      12, sprintf('%g', 123.456);
check_taint_not  13, sprintf('%d', 123.456);
check_taint_not  14, sprintf('%x', 123.456);

$_ = $a;	# untaint $_

$_ = uc($a);	# taint $_

check_taint      15, $_;

/(\w)/;	# taint $&, $`, $', $+, $1.
check_taint      16, $&;
check_taint      17, $`;
check_taint      18, $';
check_taint      19, $+;
check_taint      20, $1;
check_taint_not  21, $2;

/(.)/;	# untaint $&, $`, $', $+, $1.
check_taint_not  22, $&;
check_taint_not  23, $`;
check_taint_not  24, $';
check_taint_not  25, $+;
check_taint_not  26, $1;
check_taint_not  27, $2;

/(\W)/;	# taint $&, $`, $', $+, $1.
check_taint      28, $&;
check_taint      29, $`;
check_taint      30, $';
check_taint      31, $+;
check_taint      32, $1;
check_taint_not  33, $2;

/(\s)/;	# taint $&, $`, $', $+, $1.
check_taint      34, $&;
check_taint      35, $`;
check_taint      36, $';
check_taint      37, $+;
check_taint      38, $1;
check_taint_not  39, $2;

/(\S)/;	# taint $&, $`, $', $+, $1.
check_taint      40, $&;
check_taint      41, $`;
check_taint      42, $';
check_taint      43, $+;
check_taint      44, $1;
check_taint_not  45, $2;

$_ = $a;	# untaint $_

check_taint_not  46, $_;

/(b)/;		# this must not taint
check_taint_not  47, $&;
check_taint_not  48, $`;
check_taint_not  49, $';
check_taint_not  50, $+;
check_taint_not  51, $1;
check_taint_not  52, $2;

$_ = $a;	# untaint $_

check_taint_not  53, $_;

$b = uc($a);	# taint $b
s/(.+)/$b/;	# this must taint only the $_

check_taint      54, $_;
check_taint_not  55, $&;
check_taint_not  56, $`;
check_taint_not  57, $';
check_taint_not  58, $+;
check_taint_not  59, $1;
check_taint_not  60, $2;

$_ = $a;	# untaint $_

s/(.+)/b/;	# this must not taint
check_taint_not  61, $_;
check_taint_not  62, $&;
check_taint_not  63, $`;
check_taint_not  64, $';
check_taint_not  65, $+;
check_taint_not  66, $1;
check_taint_not  67, $2;

$b = $a;	# untaint $b

($b = $a) =~ s/\w/$&/;
check_taint      68, $b;	# $b should be tainted.
check_taint_not  69, $a;	# $a should be not.

$_ = $a;	# untaint $_

s/(\w)/\l$1/;	# this must taint
check_taint      70, $_;
check_taint      71, $&;
check_taint      72, $`;
check_taint      73, $';
check_taint      74, $+;
check_taint      75, $1;
check_taint_not  76, $2;

$_ = $a;	# untaint $_

s/(\w)/\L$1/;	# this must taint
check_taint      77, $_;
check_taint      78, $&;
check_taint      79, $`;
check_taint      80, $';
check_taint      81, $+;
check_taint      82, $1;
check_taint_not  83, $2;

$_ = $a;	# untaint $_

s/(\w)/\u$1/;	# this must taint
check_taint      84, $_;
check_taint      85, $&;
check_taint      86, $`;
check_taint      87, $';
check_taint      88, $+;
check_taint      89, $1;
check_taint_not  90, $2;

$_ = $a;	# untaint $_

s/(\w)/\U$1/;	# this must taint
check_taint      91, $_;
check_taint      92, $&;
check_taint      93, $`;
check_taint      94, $';
check_taint      95, $+;
check_taint      96, $1;
check_taint_not  97, $2;

# After all this tainting $a should be cool.

check_taint_not  98, $a;

# I think we've seen quite enough of taint.
# Let us do some *real* locale work now,
#  unless setlocale() is missing (i.e. minitest).

exit unless $have_setlocale;

sub getalnum {
    sort grep /\w/, map { chr } 0..255
}

sub locatelocale ($$@) {
    my ($lcall, $alnum, @try) = @_;

    undef $$lcall;

    for (@try) {
	local $^W = 0; # suppress "Subroutine LC_ALL redefined"
	if (setlocale(&LC_ALL, $_)) {
	    $$lcall = $_;
	    @$alnum = &getalnum;
	    last;
	}
    }

    @$alnum = () unless (defined $$lcall);
}

# Find some default locale

locatelocale(\$Locale, \@Locale, qw(C POSIX));

# Find some English locale

locatelocale(\$English, \@English,
	     qw(en_US.ISO8859-1 en_GB.ISO8859-1
		en en_US en_UK en_IE en_CA en_AU en_NZ
		english english.iso88591
		american american.iso88591
		british british.iso88591
		));

# Find some German locale

locatelocale(\$German, \@German,
	     qw(de_DE.ISO8859-1 de_AT.ISO8859-1 de_CH.ISO8859-1
		de de_DE de_AT de_CH
		german german.iso88591));

# Find some French locale

locatelocale(\$French, \@French,
	     qw(fr_FR.ISO8859-1 fr_BE.ISO8859-1 fr_CA.ISO8859-1 fr_CH.ISO8859-1
		fr fr_FR fr_BE fr_CA fr_CH
		french french.iso88591));

# Find some Spanish locale

locatelocale(\$Spanish, \@Spanish,
	     qw(es_AR.ISO8859-1 es_BO.ISO8859-1 es_CL.ISO8859-1
		es_CO.ISO8859-1 es_CR.ISO8859-1 es_EC.ISO8859-1
		es_ES.ISO8859-1 es_GT.ISO8859-1 es_MX.ISO8859-1
		es_NI.ISO8859-1 es_PA.ISO8859-1 es_PE.ISO8859-1
		es_PY.ISO8859-1 es_SV.ISO8859-1 es_UY.ISO8859-1 es_VE.ISO8859-1
		es es_AR es_BO es_CL
		es_CO es_CR es_EC
		es_ES es_GT es_MX
		es_NI es_PA es_PE
		es_PY es_SV es_UY es_VE
		spanish spanish.iso88591));

# Select the largest of the alpha(num)bets.

($Locale, @Locale) = ($English, @English)
    if (length(@English) > length(@Locale));
($Locale, @Locale) = ($German, @German)
    if (length(@German)  > length(@Locale));
($Locale, @Locale) = ($French, @French)
    if (length(@French)  > length(@Locale));
($Locale, @Locale) = ($Spanish, @Spanish)
    if (length(@Spanish) > length(@Locale));

print "# Locale = $Locale\n";
print "# Alnum_ = @Locale\n";

{
    local $^W = 0;
    setlocale(&LC_ALL, $Locale);
}

{
    my $i = 0;

    for (@Locale) {
	$iLocale{$_} = $i++;
    }
}

# Sieve the uppercase and the lowercase.

for (@Locale) {
    if (/[^\d_]/) { # skip digits and the _
	if (lc eq $_) {
	    $UPPER{$_} = uc;
	} else {
	    $lower{$_} = lc;
	}
    }
}

# Cross-check the upper and the lower.
# Yes, this is broken when the upper<->lower changes the number of
# the glyphs (e.g. the German sharp-s aka double-s aka sz-ligature,
# or the Dutch IJ or the Spanish LL or ...)
# But so far all the implementations do this wrong so we can do it wrong too.

for (keys %UPPER) {
    if (defined $lower{$UPPER{$_}}) {
	if ($_ ne $lower{$UPPER{$_}}) {
	    print 'not ';
	    last;
	}
    }
}
print "ok 99\n";

for (keys %lower) {
    if (defined $UPPER{$lower{$_}}) {
	if ($_ ne $UPPER{$lower{$_}}) {
	    print 'not ';
	    last;
	}
    }
}
print "ok 100\n";

# Find the alphabets that are not alphabets in the default locale.

{
    no locale;
    
    for (keys %UPPER, keys %lower) {
	push(@Neoalpha, $_) if (/\W/);
    }
}

@Neoalpha = sort @Neoalpha;

# Test \w.

{
    my $word = join('', @Neoalpha);

    $word =~ /^(\w*)$/;

    print 'not ' if ($1 ne $word);
}
print "ok 101\n";

# Find places where the collation order differs from the default locale.

print "# testing 102\n";
{
    my (@k, $i, $j, @d);

    {
	no locale;

	@k = sort (keys %UPPER, keys %lower); 
    }

    for ($i = 0; $i < @k; $i++) {
	for ($j = $i + 1; $j < @k; $j++) {
	    if ($iLocale{$k[$j]} < $iLocale{$k[$i]}) {
		push(@d, [$k[$j], $k[$i]]);
	    }
	}
    }

    # Cross-check those places.

    for (@d) {
	($i, $j) = @$_;
	if ($i gt $j) {
	    print "# failed 102 at:\n";
	    print "# i = $i, j = $j, i ",
	          $i le $j ? 'le' : 'gt', " j\n";
	    print 'not ';
	    last;
	}
    }
}
print "ok 102\n";

# Cross-check whole character set.

print "# testing 103\n";
for (map { chr } 0..255) {
    if (/\w/ and /\W/) { print 'not '; last }
    if (/\d/ and /\D/) { print 'not '; last }
    if (/\s/ and /\S/) { print 'not '; last }
    if (/\w/ and /\D/ and not /_/ and
	not (exists $UPPER{$_} or exists $lower{$_})) {
	print "# failed 103 at:\n";
	print "# ", ord($_), " '$_'\n";
	print 'not ';
	last;
    }
}
print "ok 103\n";

# The @Locale should be internally consistent.

print "# testing 104\n";
{
    my ($from, $to, $lesser, $greater, @test, %test, $test);

    for (0..9) {
	# Select a slice.
	$from = int(($_*@Locale)/10);
	$to = $from + int(@Locale/10);
        $to = $#Locale if ($to > $#Locale);
	$lesser  = join('', @Locale[$from..$to]);
	# Select a slice one character on.
	$from++; $to++;
        $to = $#Locale if ($to > $#Locale);
	$greater = join('', @Locale[$from..$to]);
	@test = 
	    (
	     'not ($lesser  lt $greater)', # 0
	     'not ($lesser  le $greater)', # 1
	     'not ($lesser  ne $greater)', # 2
	     '    ($lesser  eq $greater)', # 3
	     '    ($lesser  ge $greater)', # 4
	     '    ($lesser  gt $greater)', # 5
	     '    ($greater lt $lesser )', # 6
	     '    ($greater le $lesser )', # 7
	     'not ($greater ne $lesser )', # 8
	     '    ($greater eq $lesser )', # 9
	     'not ($greater ge $lesser )', # 10
	     'not ($greater gt $lesser )', # 11
	     # Well, these two are sort of redundant
	     # because @Locale was derived using cmp.
	     'not (($lesser  cmp $greater) == -1)', # 12
	     'not (($greater cmp $lesser ) ==  1)'  # 13
	     );
	@test{@test} = 0 x @test;
	$test = 0;
	for my $ti (@test) { $test{$ti} = eval $ti ; $test ||= $test{$ti} }
	if ($test) {
	    print "# failed 104 at:\n";
	    print "# lesser  = '$lesser'\n";
	    print "# greater = '$greater'\n";
	    print "# (greater) from = $from, to = $to\n";
	    for my $ti (@test) {
		printf("# %-40s %-4s", $ti,
		       $test{$ti} ? 'FAIL' : 'ok');
		if ($ti =~ /\(\.*(\$.+ +cmp +\$[^\)]+)\.*\)/) {
		    printf("(%s == %4d)", $1, eval $1);
	        }
		print "\n";
	    }

	    print 'not ';
	    last;
	}
    }
}
print "ok 104\n";
Commit	Line	Data
8ebc5c01	1	#!./perl -wT
	2
	3	BEGIN {
	4	chdir 't' if -d 't';
	5	@INC = '../lib';
	6	}
	7
	8	use strict;
	9
	10	my $have_setlocale = 0;
	11	eval {
	12	require POSIX;
	13	import POSIX ':locale_h';
	14	$have_setlocale++;
	15	};
	16
	17	print "1..", ($have_setlocale ? 104 : 98), "\n";
	18
	19	use vars qw($a
	20	$English $German $French $Spanish
	21	@C @English @German @French @Spanish
	22	$Locale @Locale %iLocale %UPPER %lower @Neoalpha);
	23
	24	$a = 'abc %';
	25
	26	sub ok {
	27	my ($n, $result) = @_;
	28
	29	print 'not ' unless ($result);
	30	print "ok $n\n";
	31	}
	32
	33	# First we'll do a lot of taint checking for locales.
	34	# This is the easiest to test, actually, as any locale,
	35	# even the default locale will taint under 'use locale'.
	36
	37	sub is_tainted { # hello, camel two.
	38	my $dummy;
	39	not eval { $dummy = join("", @_), kill 0; 1 }
	40	}
	41
	42	sub check_taint ($$) {
	43	ok $_[0], is_tainted($_[1]);
	44	}
	45
	46	sub check_taint_not ($$) {
	47	ok $_[0], not is_tainted($_[1]);
	48	}
	49
	50	use locale; # engage locale and therefore locale taint.
	51
	52	check_taint_not 1, $a;
	53
	54	check_taint 2, uc($a);
	55	check_taint 3, "\U$a";
	56	check_taint 4, ucfirst($a);
	57	check_taint 5, "\u$a";
	58	check_taint 6, lc($a);
	59	check_taint 7, "\L$a";
	60	check_taint 8, lcfirst($a);
	61	check_taint 9, "\l$a";
	62
	63	check_taint 10, sprintf('%e', 123.456);
	64	check_taint 11, sprintf('%f', 123.456);
65	check_taint 12, sprintf('%g', 123.456);
66	check_taint_not 13, sprintf('%d', 123.456);
67	check_taint_not 14, sprintf('%x', 123.456);
68
69	$_ = $a; # untaint $_
70
71	$_ = uc($a); # taint $_
72
73	check_taint 15, $_;
74
75	/(\w)/; # taint $&, $`, $', $+, $1.
76	check_taint 16, $&;
77	check_taint 17, $`;
78	check_taint 18, $';
79	check_taint 19, $+;
80	check_taint 20, $1;
81	check_taint_not 21, $2;
82
83	/(.)/; # untaint $&, $`, $', $+, $1.
84	check_taint_not 22, $&;
85	check_taint_not 23, $`;
86	check_taint_not 24, $';
87	check_taint_not 25, $+;
88	check_taint_not 26, $1;
89	check_taint_not 27, $2;
90
91	/(\W)/; # taint $&, $`, $', $+, $1.
92	check_taint 28, $&;
93	check_taint 29, $`;
94	check_taint 30, $';
95	check_taint 31, $+;
96	check_taint 32, $1;
97	check_taint_not 33, $2;
98
99	/(\s)/; # taint $&, $`, $', $+, $1.
100	check_taint 34, $&;
101	check_taint 35, $`;
102	check_taint 36, $';
103	check_taint 37, $+;
104	check_taint 38, $1;
105	check_taint_not 39, $2;
106
107	/(\S)/; # taint $&, $`, $', $+, $1.
108	check_taint 40, $&;
109	check_taint 41, $`;
110	check_taint 42, $';
111	check_taint 43, $+;
112	check_taint 44, $1;
113	check_taint_not 45, $2;
114
115	$_ = $a; # untaint $_
116
117	check_taint_not 46, $_;
118
119	/(b)/; # this must not taint
120	check_taint_not 47, $&;
121	check_taint_not 48, $`;
122	check_taint_not 49, $';
123	check_taint_not 50, $+;
124	check_taint_not 51, $1;
125	check_taint_not 52, $2;
126
127	$_ = $a; # untaint $_
128
129	check_taint_not 53, $_;
130
131	$b = uc($a); # taint $b
132	s/(.+)/$b/; # this must taint only the $_
133
134	check_taint 54, $_;
135	check_taint_not 55, $&;
136	check_taint_not 56, $`;
137	check_taint_not 57, $';
138	check_taint_not 58, $+;
139	check_taint_not 59, $1;
140	check_taint_not 60, $2;
141
142	$_ = $a; # untaint $_
143
144	s/(.+)/b/; # this must not taint
145	check_taint_not 61, $_;
146	check_taint_not 62, $&;
147	check_taint_not 63, $`;
148	check_taint_not 64, $';
149	check_taint_not 65, $+;
150	check_taint_not 66, $1;
151	check_taint_not 67, $2;
152
153	$b = $a; # untaint $b
154
155	($b = $a) =~ s/\w/$&/;
156	check_taint 68, $b; # $b should be tainted.
157	check_taint_not 69, $a; # $a should be not.
158
159	$_ = $a; # untaint $_
160
161	s/(\w)/\l$1/; # this must taint
162	check_taint 70, $_;
163	check_taint 71, $&;
164	check_taint 72, $`;
165	check_taint 73, $';
166	check_taint 74, $+;
167	check_taint 75, $1;
168	check_taint_not 76, $2;
169
170	$_ = $a; # untaint $_
171
172	s/(\w)/\L$1/; # this must taint
173	check_taint 77, $_;
174	check_taint 78, $&;
175	check_taint 79, $`;
176	check_taint 80, $';
177	check_taint 81, $+;
178	check_taint 82, $1;
179	check_taint_not 83, $2;
180
181	$_ = $a; # untaint $_
182
183	s/(\w)/\u$1/; # this must taint
184	check_taint 84, $_;
185	check_taint 85, $&;
186	check_taint 86, $`;
187	check_taint 87, $';
188	check_taint 88, $+;
189	check_taint 89, $1;
190	check_taint_not 90, $2;
191
192	$_ = $a; # untaint $_
193
194	s/(\w)/\U$1/; # this must taint
195	check_taint 91, $_;
196	check_taint 92, $&;
197	check_taint 93, $`;
198	check_taint 94, $';
199	check_taint 95, $+;
200	check_taint 96, $1;
201	check_taint_not 97, $2;
202
203	# After all this tainting $a should be cool.
204
205	check_taint_not 98, $a;
206
207	# I think we've seen quite enough of taint.
208	# Let us do some real locale work now,
209	# unless setlocale() is missing (i.e. minitest).
210
211	exit unless $have_setlocale;
212
213	sub getalnum {
214	sort grep /\w/, map { chr } 0..255
215	}
216
217	sub locatelocale ($$@) {
218	my ($lcall, $alnum, @try) = @_;
219
220	undef $$lcall;
221
222	for (@try) {
223	local $^W = 0; # suppress "Subroutine LC_ALL redefined"
224	if (setlocale(&LC_ALL, $_)) {
225	$$lcall = $_;
226	@$alnum = &getalnum;
227	last;
228	}
229	}
230
231	@$alnum = () unless (defined $$lcall);
232	}
233
234	# Find some default locale
235
236	locatelocale(\$Locale, \@Locale, qw(C POSIX));
237
238	# Find some English locale
239
240	locatelocale(\$English, \@English,
241	qw(en_US.ISO8859-1 en_GB.ISO8859-1
242	en en_US en_UK en_IE en_CA en_AU en_NZ
243	english english.iso88591
244	american american.iso88591
245	british british.iso88591
246	));
247
248	# Find some German locale
249
250	locatelocale(\$German, \@German,
251	qw(de_DE.ISO8859-1 de_AT.ISO8859-1 de_CH.ISO8859-1
252	de de_DE de_AT de_CH
253	german german.iso88591));
254
255	# Find some French locale
256
257	locatelocale(\$French, \@French,
258	qw(fr_FR.ISO8859-1 fr_BE.ISO8859-1 fr_CA.ISO8859-1 fr_CH.ISO8859-1
259	fr fr_FR fr_BE fr_CA fr_CH
260	french french.iso88591));
261
262	# Find some Spanish locale
263
264	locatelocale(\$Spanish, \@Spanish,
265	qw(es_AR.ISO8859-1 es_BO.ISO8859-1 es_CL.ISO8859-1
266	es_CO.ISO8859-1 es_CR.ISO8859-1 es_EC.ISO8859-1
267	es_ES.ISO8859-1 es_GT.ISO8859-1 es_MX.ISO8859-1
268	es_NI.ISO8859-1 es_PA.ISO8859-1 es_PE.ISO8859-1
269	es_PY.ISO8859-1 es_SV.ISO8859-1 es_UY.ISO8859-1 es_VE.ISO8859-1
270	es es_AR es_BO es_CL
271	es_CO es_CR es_EC
272	es_ES es_GT es_MX
273	es_NI es_PA es_PE
274	es_PY es_SV es_UY es_VE
275	spanish spanish.iso88591));
276
277	# Select the largest of the alpha(num)bets.
278
279	($Locale, @Locale) = ($English, @English)
280	if (length(@English) > length(@Locale));
281	($Locale, @Locale) = ($German, @German)
282	if (length(@German) > length(@Locale));
283	($Locale, @Locale) = ($French, @French)
284	if (length(@French) > length(@Locale));
285	($Locale, @Locale) = ($Spanish, @Spanish)
286	if (length(@Spanish) > length(@Locale));
287
288	print "# Locale = $Locale\n";
289	print "# Alnum_ = @Locale\n";
290
291	{
292	local $^W = 0;
293	setlocale(&LC_ALL, $Locale);
294	}
295
296	{
297	my $i = 0;
298
299	for (@Locale) {
300	$iLocale{$_} = $i++;
301	}
302	}
303
304	# Sieve the uppercase and the lowercase.
305
306	for (@Locale) {
307	if (/[^\d_]/) { # skip digits and the _
308	if (lc eq $_) {
309	$UPPER{$_} = uc;
310	} else {
311	$lower{$_} = lc;
312	}
313	}
314	}
315
316	# Cross-check the upper and the lower.
317	# Yes, this is broken when the upper<->lower changes the number of
318	# the glyphs (e.g. the German sharp-s aka double-s aka sz-ligature,
319	# or the Dutch IJ or the Spanish LL or ...)
320	# But so far all the implementations do this wrong so we can do it wrong too.
321
322	for (keys %UPPER) {
323	if (defined $lower{$UPPER{$_}}) {
324	if ($_ ne $lower{$UPPER{$_}}) {
325	print 'not ';
326	last;
327	}
328	}
329	}
330	print "ok 99\n";
331
332	for (keys %lower) {
333	if (defined $UPPER{$lower{$_}}) {
334	if ($_ ne $UPPER{$lower{$_}}) {
335	print 'not ';
336	last;
337	}
338	}
339	}
340	print "ok 100\n";
341
342	# Find the alphabets that are not alphabets in the default locale.
343
344	{
345	no locale;
346
347	for (keys %UPPER, keys %lower) {
348	push(@Neoalpha, $_) if (/\W/);
349	}
350	}
351
352	@Neoalpha = sort @Neoalpha;
353
354	# Test \w.
355
356	{
357	my $word = join('', @Neoalpha);
358
359	$word =~ /^(\w*)$/;
360
361	print 'not ' if ($1 ne $word);
362	}
363	print "ok 101\n";
364
365	# Find places where the collation order differs from the default locale.
366
774d564b	367	print "# testing 102\n";
8ebc5c01	368	{
	369	my (@k, $i, $j, @d);
	370
	371	{
	372	no locale;
	373
	374	@k = sort (keys %UPPER, keys %lower);
	375	}
	376
	377	for ($i = 0; $i < @k; $i++) {
	378	for ($j = $i + 1; $j < @k; $j++) {
	379	if ($iLocale{$k[$j]} < $iLocale{$k[$i]}) {
	380	push(@d, [$k[$j], $k[$i]]);
	381	}
	382	}
	383	}
	384
	385	# Cross-check those places.
	386
	387	for (@d) {
	388	($i, $j) = @$_;
	389	if ($i gt $j) {
774d564b	390	print "# failed 102 at:\n";
8ebc5c01	391	print "# i = $i, j = $j, i ",
	392	$i le $j ? 'le' : 'gt', " j\n";
	393	print 'not ';
	394	last;
	395	}
	396	}
	397	}
	398	print "ok 102\n";
	399
	400	# Cross-check whole character set.
	401
774d564b	402	print "# testing 103\n";
8ebc5c01	403	for (map { chr } 0..255) {
	404	if (/\w/ and /\W/) { print 'not '; last }
	405	if (/\d/ and /\D/) { print 'not '; last }
	406	if (/\s/ and /\S/) { print 'not '; last }
	407	if (/\w/ and /\D/ and not /_/ and
	408	not (exists $UPPER{$_} or exists $lower{$_})) {
774d564b	409	print "# failed 103 at:\n";
774d564b	410	print "# ", ord($_), " '$_'\n";
8ebc5c01	411	print 'not ';
	412	last;
	413	}
	414	}
	415	print "ok 103\n";
	416
	417	# The @Locale should be internally consistent.
	418
774d564b	419	print "# testing 104\n";
8ebc5c01	420	{
774d564b	421	my ($from, $to, $lesser, $greater, @test, %test, $test);
8ebc5c01	422
	423	for (0..9) {
	424	# Select a slice.
	425	$from = int(($_*@Locale)/10);
	426	$to = $from + int(@Locale/10);
	427	$to = $#Locale if ($to > $#Locale);
	428	$lesser = join('', @Locale[$from..$to]);
	429	# Select a slice one character on.
	430	$from++; $to++;
	431	$to = $#Locale if ($to > $#Locale);
	432	$greater = join('', @Locale[$from..$to]);
774d564b	433	@test =
	434	(
	435	'not ($lesser lt $greater)', # 0
	436	'not ($lesser le $greater)', # 1
	437	'not ($lesser ne $greater)', # 2
	438	' ($lesser eq $greater)', # 3
	439	' ($lesser ge $greater)', # 4
	440	' ($lesser gt $greater)', # 5
	441	' ($greater lt $lesser )', # 6
	442	' ($greater le $lesser )', # 7
	443	'not ($greater ne $lesser )', # 8
	444	' ($greater eq $lesser )', # 9
	445	'not ($greater ge $lesser )', # 10
	446	'not ($greater gt $lesser )', # 11
	447	# Well, these two are sort of redundant
	448	# because @Locale was derived using cmp.
	449	'not (($lesser cmp $greater) == -1)', # 12
	450	'not (($greater cmp $lesser ) == 1)' # 13
	451	);
	452	@test{@test} = 0 x @test;
	453	$test = 0;
	454	for my $ti (@test) { $test{$ti} = eval $ti ; $test \|\|= $test{$ti} }
	455	if ($test) {
	456	print "# failed 104 at:\n";
	457	print "# lesser = '$lesser'\n";
	458	print "# greater = '$greater'\n";
	459	print "# (greater) from = $from, to = $to\n";
	460	for my $ti (@test) {
	461	printf("# %-40s %-4s", $ti,
	462	$test{$ti} ? 'FAIL' : 'ok');
	463	if ($ti =~ /\(\.(\$.+ +cmp +\$[^\)]+)\.\)/) {
	464	printf("(%s == %4d)", $1, eval $1);
	465	}
	466	print "\n";
	467	}
	468
8ebc5c01	469	print 'not ';
	470	last;
	471	}
	472	}
	473	}
	474	print "ok 104\n";