15 my $Is_EBCDIC = (defined $Config{ebcdic} && $Config{ebcdic} eq 'define');
16 my $Perl = which_perl();
19 my @result = map {_qq($_)} @_;
23 return '(' . join (', ', @result) . ')';
29 return unless @$l == @$r;
31 if (defined $l->[$i]) {
32 return unless defined ($r->[$i]) && $l->[$i] eq $r->[$i];
34 return if defined $r->[$i]
40 ##############################################################################
42 # Here starteth the tests
46 my $format = "c2 x5 C C x s d i l a6";
47 # Need the expression in here to force ary[5] to be numeric. This avoids
48 # test2 failing because ary2 goes str->numeric->str and ary doesn't.
49 my @ary = (1,-100,127,128,32767,987.654321098 / 100.0,12345,123456,
51 my $foo = pack($format,@ary);
52 my @ary2 = unpack($format,$foo);
56 my $out1=join(':',@ary);
57 my $out2=join(':',@ary2);
58 # Using long double NVs may introduce greater accuracy than wanted.
59 $out1 =~ s/:9\.87654321097999\d*:/:9.87654321098:/;
60 $out2 =~ s/:9\.87654321097999\d*:/:9.87654321098:/;
65 # How about counting bits?
69 is( ($x = unpack("%32B*", "\001\002\004\010\020\040\100\200\377")), 16 );
71 is( ($x = unpack("%32b69", "\001\002\004\010\020\040\100\200\017")), 12 );
73 is( ($x = unpack("%32B69", "\001\002\004\010\020\040\100\200\017")), 9 );
77 my $sum = 129; # ASCII
78 $sum = 103 if $Is_EBCDIC;
81 is( ($x = unpack("%32B*", "Now is the time for all good blurfl")), $sum );
84 open(BIN, $Perl) || die "Can't open $Perl: $!\n";
85 sysread BIN, $foo, 8192;
88 $sum = unpack("%32b*", $foo);
89 my $longway = unpack("b*", $foo);
90 is( $sum, $longway =~ tr/1/1/ );
95 is( ($x = unpack("I",pack("I", 0xFFFFFFFF))), 0xFFFFFFFF );
100 my @x = (5,130,256,560,32000,3097152,268435455,1073741844, 2**33,
101 '4503599627365785','23728385234614992549757750638446');
102 my $x = pack('w*', @x);
103 my $y = pack 'H*', '0581028200843081fa0081bd8440ffffff7f8480808014A0808'.
104 '0800087ffffffffffdb19caefe8e1eeeea0c2e1e3e8ede1ee6e';
108 my @y = unpack('w*', $y);
110 while ($a = pop @x) {
115 @y = unpack('w2', $x);
125 eval { $x = unpack 'w', pack 'C*', 0xff, 0xff};
126 like($@, qr/^Unterminated compressed integer/);
128 eval { $x = unpack 'w', pack 'C*', 0xff, 0xff, 0xff, 0xff};
129 like($@, qr/^Unterminated compressed integer/);
131 eval { $x = unpack 'w', pack 'C*', 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff};
132 like($@, qr/^Unterminated compressed integer/);
136 # test the "p" template
139 is(unpack("p",pack("p","foo")), "foo");
142 is(unpack("p",pack("p",239)), 239);
145 sub foo { my $a = "a"; return $a . $a++ . $a++ }
149 local $SIG{__WARN__} = sub {
152 my $junk = pack("p", &foo);
154 like($warning, qr/temporary val/);
157 # undef should give null pointer
158 like(pack("p", undef), qr/^\0+/);
160 # Check for optimizer bug (e.g. Digital Unix GEM cc with -O4 on DU V4.0B gives
161 # 4294967295 instead of -1)
162 # see #ifdef __osf__ in pp.c pp_unpack
163 is((unpack("i",pack("i",-1))), -1);
165 # test the pack lengths of s S i I l L
166 # test the pack lengths of n N v V
167 my @lengths = qw(s 2 S 2 i -4 I -4 l 4 L 4 n 2 N 4 v 2 V 4);
168 while (my ($format, $expect) = splice @lengths, 0, 2) {
169 my $len = length(pack($format, 0));
171 is($expect, $len, "format '$format'");
174 ok ($len >= $expect, "format '$format'") ||
175 print "# format '$format' has length $len, expected >= $expect\n";
180 # test unpack-pack lengths
181 my @templates = qw(c C i I s S l L n N v V f d q Q);
183 foreach my $t (@templates) {
185 my @t = eval { unpack("$t*", pack("$t*", 12, 34)) };
187 # quads not supported everywhere
188 skip "Quads not supported", 4 if $@ =~ /Invalid type in pack/;
194 skip "$t not expected to work for some reason", 2 if $t =~ /[nv]/i;
205 # Note that first uuencoding known 'text' data and then checking the
206 # binary values of the uuencoded version would not be portable between
207 # character sets. Uuencoding is meant for encoding binary data, not
210 my $in = pack 'C*', 0 .. 255;
212 # just to be anal, we do some random tr/`/ /
214 M` $"`P0%!@<("0H+# T.#Q`1$A,4%187&!D:&QP='A\@(2(C)"4F)R@I*BLL
215 M+2XO,#$R,S0U-C<X.3H[/#T^/T!!0D-$149'2$E*2TQ-3D]045)35%565UA9
216 M6EM<75Y?8&%B8V1E9F=H:6IK;&UN;W!Q<G-T=79W>'EZ>WQ]?G^`@8*#A(6&
217 MAXB)BHN,C8Z/D)&2DY25EI>8F9J;G)V>GZ"AHJ.DI::GJ*FJJZRMKJ^PL;*S
218 MM+6VM[BYNKN\O;Z_P,'"P\3%QL?(R<K+S,W.S]#1TM/4U=;7V-G:V]S=WM_@
219 ?X>+CY.7FY^CIZNOL[>[O\/'R\_3U]O?X^?K[_/W^_P `
225 is(pack('u', $in), $_);
227 is(unpack('u', $uu), $in);
229 $in = "\x1f\x8b\x08\x08\x58\xdc\xc4\x35\x02\x03\x4a\x41\x50\x55\x00\xf3\x2a\x2d\x2e\x51\x48\xcc\xcb\x2f\xc9\x48\x2d\x52\x08\x48\x2d\xca\x51\x28\x2d\x4d\xce\x4f\x49\x2d\xe2\x02\x00\x64\x66\x60\x5c\x1a\x00\x00\x00";
231 M'XL("%C<Q#4"`TI!4%4`\RHM+E%(S,LOR4@M4@A(+<I1*"U-SD])+>("`&1F
235 is(unpack('u', $uu), $in);
237 # This is identical to the above except that backquotes have been
241 M'XL("%C<Q#4" TI!4%4 \RHM+E%(S,LOR4@M4@A(+<I1*"U-SD])+>(" &1F
246 is(unpack('u', $uu), $in);
250 # test the ascii template types (A, a, Z)
253 ['p', 'A*', "foo\0bar\0 ", "foo\0bar\0 "],
254 ['p', 'A11', "foo\0bar\0 ", "foo\0bar\0 "],
255 ['u', 'A*', "foo\0bar \0", "foo\0bar"],
256 ['u', 'A8', "foo\0bar \0", "foo\0bar"],
257 ['p', 'a*', "foo\0bar\0 ", "foo\0bar\0 "],
258 ['p', 'a11', "foo\0bar\0 ", "foo\0bar\0 \0\0"],
259 ['u', 'a*', "foo\0bar \0", "foo\0bar \0"],
260 ['u', 'a8', "foo\0bar \0", "foo\0bar "],
261 ['p', 'Z*', "foo\0bar\0 ", "foo\0bar\0 \0"],
262 ['p', 'Z11', "foo\0bar\0 ", "foo\0bar\0 \0\0"],
263 ['p', 'Z3', "foo", "fo\0"],
264 ['u', 'Z*', "foo\0bar \0", "foo"],
265 ['u', 'Z8', "foo\0bar \0", "foo"],
268 my ($what, $template, $in, $out) = @$_;
269 my $got = $what eq 'u' ? (unpack $template, $in) : (pack $template, $in);
270 unless (is($got, $out)) {
271 my $un = $what eq 'u' ? 'un' : '';
272 print "# ${un}pack ('$template', "._qq($in).') gave '._qq($out).
273 ' not '._qq($got)."\n";
277 # packing native shorts/ints/longs
279 is(length(pack("s!", 0)), $Config{shortsize});
280 is(length(pack("i!", 0)), $Config{intsize});
281 is(length(pack("l!", 0)), $Config{longsize});
282 ok(length(pack("s!", 0)) <= length(pack("i!", 0)));
283 ok(length(pack("i!", 0)) <= length(pack("l!", 0)));
284 is(length(pack("i!", 0)), length(pack("i", 0)));
288 return numbers_with_total ($format, undef, @_);
291 sub numbers_with_total {
294 if (!defined $total) {
301 my $out = eval {unpack($format, pack($format, $_))};
302 skip "cannot pack '$format' on this perl", 2 if
303 $@ =~ /Invalid type in pack: '$format'/;
310 my $skip_if_longer_than = ~0; # "Infinity"
312 # If we're running with -DNO_PERLPRESERVE_IVUV and NVs don't preserve all
313 # UVs (in which case ~0 is NV, ~0-1 will be the same NV) then we can't
314 # correctly in perl calculate UV totals for long checksums, as pp_unpack
315 # is using UV maths, and we've only got NVs.
316 $skip_if_longer_than = $Config{d_nv_preserves_uv_bits};
319 foreach ('', 1, 2, 3, 15, 16, 17, 31, 32, 33, 53, 54, 63, 64, 65) {
321 my $sum = eval {unpack "%$_$format*", pack "$format*", @_};
322 skip "cannot pack '$format' on this perl", 3
323 if $@ =~ /Invalid type in pack: '$format'/;
328 my $len = $_; # Copy, so that we can reassign ''
329 $len = 16 unless length $len;
332 skip "cannot test checksums over $skip_if_longer_than bits", 1
333 if $len > $skip_if_longer_than;
335 # Our problem with testing this portably is that the checksum code in
336 # pp_unpack is able to cast signed to unsigned, and do modulo 2**n
337 # arithmetic in unsigned ints, which perl has no operators to do.
338 # (use integer; does signed ints, which won't wrap on UTS, which is just
339 # fine with ANSI, but not with most people's assumptions.)
340 # This is why we need to supply the totals for 'Q' as there's no way in
341 # perl to calculate them, short of unpack '%0Q' (is that documented?)
342 # ** returns NVs; make sure it's IV.
343 my $max = 1 + 2 * (int (2 ** ($len-1))-1); # The max possible checksum
344 my $max_p1 = $max + 1;
345 my ($max_is_integer, $max_p1_is_integer);
346 $max_p1_is_integer = 1 unless $max_p1 + 1 == $max_p1;
347 $max_is_integer = 1 if $max - 1 < ~0;
351 $calc_sum = &$total($len);
354 # Shift into range by some multiple of the total
355 my $mult = int ($total / $max_p1);
356 # Need this to make sure that -1 + (~0+1) is ~0 (ie still integer)
357 $calc_sum = $total - $mult;
358 $calc_sum -= $mult * $max;
364 if ($calc_sum == $calc_sum - 1 && $calc_sum == $max_p1) {
365 # we're into floating point (either by getting out of the range of
366 # UV arithmetic, or because we're doing a floating point checksum)
367 # and our calculation of the checksum has become rounded up to
372 if ($calc_sum == $sum) { # HAS to be ==, not eq (so no is()).
373 pass ("unpack '%$_$format' gave $sum"); # pass(), not ok(): the string is the test name, not the condition being tested
375 my $delta = 1.000001;
376 if ($format =~ tr /dDfF//
377 && ($calc_sum <= $sum * $delta && $calc_sum >= $sum / $delta)) {
378 pass ("unpack '%$_$format' gave $sum, expected $calc_sum");
380 my $text = ref $total ? &$total($len) : $total;
382 print "# For list (" . join (", ", @_) . ") (total $text)"
383 . " packed with $format unpack '%$_$format' gave $sum,"
384 . " expected $calc_sum\n";
392 numbers ('c', -128, -1, 0, 1, 127);
393 numbers ('C', 0, 1, 127, 128, 255);
394 numbers ('s', -32768, -1, 0, 1, 32767);
395 numbers ('S', 0, 1, 32767, 32768, 65535);
396 numbers ('i', -2147483648, -1, 0, 1, 2147483647);
397 numbers ('I', 0, 1, 2147483647, 2147483648, 4294967295);
398 numbers ('l', -2147483648, -1, 0, 1, 2147483647);
399 numbers ('L', 0, 1, 2147483647, 2147483648, 4294967295);
400 numbers ('s!', -32768, -1, 0, 1, 32767);
401 numbers ('S!', 0, 1, 32767, 32768, 65535);
402 numbers ('i!', -2147483648, -1, 0, 1, 2147483647);
403 numbers ('I!', 0, 1, 2147483647, 2147483648, 4294967295);
404 numbers ('l!', -2147483648, -1, 0, 1, 2147483647);
405 numbers ('L!', 0, 1, 2147483647, 2147483648, 4294967295);
406 numbers ('n', 0, 1, 32767, 32768, 65535);
407 numbers ('v', 0, 1, 32767, 32768, 65535);
408 numbers ('N', 0, 1, 2147483647, 2147483648, 4294967295);
409 numbers ('V', 0, 1, 2147483647, 2147483648, 4294967295);
410 # All these should have exact binary representations:
411 numbers ('f', -1, 0, 0.5, 42, 2**34);
412 numbers ('d', -(2**34), -1, 0, 1, 2**34);
413 ## These don't, but 'd' is NV. XXX wrong, it's double
414 #numbers ('d', -1, 0, 1, 1-exp(-1), -exp(1));
416 numbers_with_total ('q', -1,
417 -9223372036854775808, -1, 0, 1,9223372036854775807);
418 # This total is icky, but the true total is 2**65-1, and we need a way to generate
419 # the expected checksum on any system including those where NVs can preserve
420 # 65 bits. (long double is 128 bits on sparc, so they certainly can)
421 # or where rounding is down not up on binary conversion (crays)
422 numbers_with_total ('Q', sub {
424 $len = 65 if $len > 65; # unmasked total is 2**65-1 here
425 my $total = 1 + 2 * (int (2**($len - 1)) - 1);
426 return 0 if $total == $total - 1; # Overflowed integers
427 return $total; # NVs still accurate to nearest integer
429 0, 1,9223372036854775807, 9223372036854775808,
430 18446744073709551615);
432 # pack nvNV byteorders
434 is(pack("n", 0xdead), "\xde\xad");
435 is(pack("v", 0xdead), "\xad\xde");
436 is(pack("N", 0xdeadbeef), "\xde\xad\xbe\xef");
437 is(pack("V", 0xdeadbeef), "\xef\xbe\xad\xde");
443 eval { ($x) = unpack '/a*','hello' };
444 like($@, qr!/ must follow a numeric type!);
446 eval { $x = unpack '/a*','hello' };
447 like($@, qr!/ must follow a numeric type!);
450 eval { ($z,$x,$y) = unpack 'a3/A C/a* C/Z', "003ok \003yes\004z\000abc" };
456 eval { $z = unpack 'a3/A C/a* C/Z', "003ok \003yes\004z\000abc" };
462 eval { ($x) = pack '/a*','hello' };
463 like($@, qr!Invalid type in pack: '/'!);
465 eval { $x = pack '/a*','hello' };
466 like($@, qr!Invalid type in pack: '/'!);
468 $z = pack 'n/a* N/Z* w/A*','string','hi there ','etc';
469 my $expect = "\000\006string\0\0\0\012hi there \000\003etc";
473 $expect = 'hello world';
474 eval { ($x) = unpack ("w/a", chr (11) . "hello world!")};
479 # Doing this in scalar context used to fail.
480 eval { $x = unpack ("w/a", chr (11) . "hello world!")};
485 ['a/a*/a*', '212ab345678901234567','ab3456789012'],
486 ['a/a*/a*', '3012ab345678901234567', 'ab3456789012'],
487 ['a/a*/b*', '212ab', $Is_EBCDIC ? '100000010100' : '100001100100'],
490 my ($pat, $in, $expect) = @$_;
492 eval { ($x) = unpack $pat, $in };
495 printf "# list unpack ('$pat', '$in') gave %s, expected '$expect'\n",
499 eval { $x = unpack $pat, $in };
502 printf "# scalar unpack ('$pat', '$in') gave %s, expected '$expect'\n",
508 my $pattern = <<'EOU';
509 a3/A # Count in ASCII
510 C/a* # Count in a C char
511 C/Z # Count in a C char but skip after \0
515 eval { ($z,$x,$y) = unpack $pattern, "003ok \003yes\004z\000abc" };
521 eval { $z = unpack $pattern, "003ok \003yes\004z\000abc" };
526 n/a* # Count as network short
527 w/A* # Count a BER integer
529 $expect = "\000\006string\003etc";
530 $z = pack $pattern,'string','etc';
534 is("1.20.300.4000", sprintf "%vd", pack("U*",1,20,300,4000));
535 is("1.20.300.4000", sprintf "%vd", pack(" U*",1,20,300,4000));
536 isnt("1.20.300.4000", sprintf "%vd", pack("C0U*",1,20,300,4000)); # compare against the dotted text %vd yields for U*; a v-string could never equal it, making the test vacuous
538 my $rslt = $Is_EBCDIC ? "156 67" : "199 162";
539 is(join(" ", unpack("C*", chr(0x1e2))), $rslt);
541 # does pack U create Unicode?
542 is(ord(pack('U', 300)), 300);
544 # does unpack U deref Unicode?
545 is((unpack('U', chr(300)))[0], 300);
547 # is unpack U the reverse of pack U for Unicode string?
548 is("@{[unpack('U*', pack('U*', 100, 200, 300))]}", "100 200 300");
550 # is unpack U the reverse of pack U for byte string?
551 is("@{[unpack('U*', pack('U*', 100, 200))]}", "100 200");
555 skip "Not for EBCDIC", 4 if $Is_EBCDIC;
557 # does unpack C unravel pack U?
558 is("@{[unpack('C*', pack('U*', 100, 200))]}", "100 195 136");
560 # does pack U0C create Unicode?
561 is("@{[pack('U0C*', 100, 195, 136)]}", v100.v200);
563 # does pack C0U create characters?
564 is("@{[pack('C0U*', 100, 200)]}", pack("C*", 100, 195, 136));
566 # does unpack U0U on byte data warn?
568 local $SIG{__WARN__} = sub { $@ = "@_" }; # stash the warning text in $@ so it can be inspected below
569 my @null = unpack('U0U', chr(255)); # result is unused; only the warning emitted here matters
570 like($@, qr/^Malformed UTF-8 character /); # qr// hands like() a pattern; a bare /.../ would be matched against $_ first
575 my $p = pack 'i*', -2147483648, ~0, 0, 1, 2147483647;
577 # bug - % had to be at the start of the pattern, no leading whitespace or
578 # comments. %i! didn't work at all.
579 foreach my $pat ('%32i*', ' %32i*', "# Muhahahaha\n%32i*", '%32i* ',
580 '%32i!*', ' %32i!*', "\n#\n#\n\r \t\f%32i!*", '%32i!*#') {
581 @a = unpack $pat, $p;
582 is($a[0], 0xFFFFFFFF) || print "# $pat\n";
583 @a = scalar unpack $pat, $p;
584 is($a[0], 0xFFFFFFFF) || print "# $pat\n";
588 $p = pack 'I*', 42, 12;
589 # Multiline patterns in scalar context failed.
590 foreach my $pat ('I', <<EOPOEMSNIPPET, 'I#I', 'I # I', 'I # !!!') {
591 # On the Ning Nang Nong
592 # Where the Cows go Bong!
593 # And the Monkeys all say Boo!
596 @a = unpack $pat, $p;
599 @a = scalar unpack $pat, $p;
604 # shorts (of all flavours) didn't calculate checksums > 32 bits with floating
605 # point, so a pathologically long pattern would wrap at 32 bits.
606 my $pat = "\xff\xff"x65538; # Start with it long, to save any copying.
607 foreach (4,3,2,1,0) {
608 my $len = 65534 + $_;
609 is(unpack ("%33n$len", $pat), 65535 * $len);
619 ['xXa*', "Nick", "Nick"],
620 ['a5Xa5', "cameL", "llama", "camellama"],
622 ['a*@8a*', 'Camel', 'Dromedary', "Camel\0\0\0Dromedary"],
623 ['a*@4a', 'Perl rules', '!', 'Perl!'],
626 my ($template, @in) = @$_;
628 my $got = eval {pack $template, @in};
631 printf "# pack ('$template', %s) gave %s expected %s\n",
632 encode_list (@in), encode_list ($got), encode_list ($out);
639 ['xXa*', "Nick", "Nick"],
640 ['a5Xa5', "camellama", "camel", "llama"],
642 ['@2a2', "water", "te"],
643 ['a*@1a3', "steam", "steam", "tea"],
646 my ($template, $in, @out) = @$_;
647 my @got = eval {unpack $template, $in};
649 list_eq (\@got, \@out) ||
650 printf "# list unpack ('$template', %s) gave %s expected %s\n",
651 _qq($in), encode_list (@got), encode_list (@out);
653 my $got = eval {unpack $template, $in};
655 @out ? is( $got, $out[0] ) # 1 or more items; should get first
656 : ok( !defined $got ) # 0 items; should get undef
657 or printf "# scalar unpack ('$template', %s) gave %s expected %s\n",
658 _qq($in), encode_list ($got), encode_list ($out[0]);
663 my ($u, $v) = qw(foo xyzzy);
664 my $p = pack($t, $u, $v);
665 my @u = unpack($t, $p);
672 is((unpack("w/a*", "\x02abc"))[0], "ab");
674 # "w/a*" should be seen as one unit
676 is(scalar unpack("w/a*", "\x02abc"), "ab");
680 # from Wolfgang Laun: fix in change #13163
684 my $buf = pack( 'Z*/A* C', $s, $x );
688 $h =~ s/[^[:print:]]/./g;
689 ( $s, $y ) = unpack( "Z*/A* C", $buf );
690 is($h, "30.ABCABCABCABCABCABCABCABCABCABC*");
692 is($s, "ABCABCABCABCABCABCABCABCABCABC");
697 # from Wolfgang Laun: fix in change #13288
699 eval { my $t=unpack("P*", "abc") };
700 like($@, qr/P must have an explicit size/);