Re: perl@14647
[p5sagit/p5-mst-13.2.git] / ext / Data / Dumper / Dumper.pm
CommitLineData
823edd99 1#
2# Data/Dumper.pm
3#
4# convert perl data structures into perl syntax suitable for both printing
5# and eval
6#
7# Documentation at the __END__
8#
9
10package Data::Dumper;
11
8e5f9a6e 12$VERSION = '2.12';
823edd99 13
14#$| = 1;
15
3b825e41 16use 5.006_001;
823edd99 17require Exporter;
9426adcd 18use XSLoader ();
823edd99 19require overload;
20
21use Carp;
22
9426adcd 23@ISA = qw(Exporter);
823edd99 24@EXPORT = qw(Dumper);
25@EXPORT_OK = qw(DumperX);
26
9426adcd 27XSLoader::load 'Data::Dumper';
823edd99 28
29# module vars and their defaults
30$Indent = 2 unless defined $Indent;
31$Purity = 0 unless defined $Purity;
32$Pad = "" unless defined $Pad;
33$Varname = "VAR" unless defined $Varname;
34$Useqq = 0 unless defined $Useqq;
35$Terse = 0 unless defined $Terse;
36$Freezer = "" unless defined $Freezer;
37$Toaster = "" unless defined $Toaster;
38$Deepcopy = 0 unless defined $Deepcopy;
39$Quotekeys = 1 unless defined $Quotekeys;
40$Bless = "bless" unless defined $Bless;
41#$Expdepth = 0 unless defined $Expdepth;
a2126434 42$Maxdepth = 0 unless defined $Maxdepth;
31a725b3 43$Useperl = 0 unless defined $Useperl;
44$Sortkeys = 0 unless defined $Sortkeys;
8e5f9a6e 45$Deparse = 0 unless defined $Deparse;
823edd99 46
47#
48# expects an arrayref of values to be dumped.
49# can optionally pass an arrayref of names for the values.
50# names must have leading $ sign stripped. begin the name with *
51# to cause output of arrays and hashes rather than refs.
52#
53sub new {
54 my($c, $v, $n) = @_;
55
56 croak "Usage: PACKAGE->new(ARRAYREF, [ARRAYREF])"
57 unless (defined($v) && (ref($v) eq 'ARRAY'));
58 $n = [] unless (defined($n) && (ref($v) eq 'ARRAY'));
59
60 my($s) = {
61 level => 0, # current recursive depth
62 indent => $Indent, # various styles of indenting
63 pad => $Pad, # all lines prefixed by this string
64 xpad => "", # padding-per-level
65 apad => "", # added padding for hash keys n such
66 sep => "", # list separator
67 seen => {}, # local (nested) refs (id => [name, val])
68 todump => $v, # values to dump []
69 names => $n, # optional names for values []
70 varname => $Varname, # prefix to use for tagging nameless ones
71 purity => $Purity, # degree to which output is evalable
72 useqq => $Useqq, # use "" for strings (backslashitis ensues)
73 terse => $Terse, # avoid name output (where feasible)
74 freezer => $Freezer, # name of Freezer method for objects
75 toaster => $Toaster, # name of method to revive objects
76 deepcopy => $Deepcopy, # dont cross-ref, except to stop recursion
77 quotekeys => $Quotekeys, # quote hash keys
78 'bless' => $Bless, # keyword to use for "bless"
79# expdepth => $Expdepth, # cutoff depth for explicit dumping
a2126434 80 maxdepth => $Maxdepth, # depth beyond which we give up
31a725b3 81 useperl => $Useperl, # use the pure Perl implementation
82 sortkeys => $Sortkeys, # flag or filter for sorting hash keys
8e5f9a6e 83 deparse => $Deparse, # use B::Deparse for coderefs
823edd99 84 };
85
86 if ($Indent > 0) {
87 $s->{xpad} = " ";
88 $s->{sep} = "\n";
89 }
90 return bless($s, $c);
91}
92
93#
94# add-to or query the table of already seen references
95#
96sub Seen {
97 my($s, $g) = @_;
98 if (defined($g) && (ref($g) eq 'HASH')) {
99 my($k, $v, $id);
100 while (($k, $v) = each %$g) {
101 if (defined $v and ref $v) {
102 ($id) = (overload::StrVal($v) =~ /\((.*)\)$/);
103 if ($k =~ /^[*](.*)$/) {
104 $k = (ref $v eq 'ARRAY') ? ( "\\\@" . $1 ) :
105 (ref $v eq 'HASH') ? ( "\\\%" . $1 ) :
106 (ref $v eq 'CODE') ? ( "\\\&" . $1 ) :
107 ( "\$" . $1 ) ;
108 }
109 elsif ($k !~ /^\$/) {
110 $k = "\$" . $k;
111 }
112 $s->{seen}{$id} = [$k, $v];
113 }
114 else {
115 carp "Only refs supported, ignoring non-ref item \$$k";
116 }
117 }
118 return $s;
119 }
120 else {
121 return map { @$_ } values %{$s->{seen}};
122 }
123}
124
125#
126# set or query the values to be dumped
127#
128sub Values {
129 my($s, $v) = @_;
130 if (defined($v) && (ref($v) eq 'ARRAY')) {
131 $s->{todump} = [@$v]; # make a copy
132 return $s;
133 }
134 else {
135 return @{$s->{todump}};
136 }
137}
138
139#
140# set or query the names of the values to be dumped
141#
142sub Names {
143 my($s, $n) = @_;
144 if (defined($n) && (ref($n) eq 'ARRAY')) {
145 $s->{names} = [@$n]; # make a copy
146 return $s;
147 }
148 else {
149 return @{$s->{names}};
150 }
151}
152
153sub DESTROY {}
154
0f1923bd 155sub Dump {
156 return &Dumpxs
31a725b3 157 unless $Data::Dumper::Useperl || (ref($_[0]) && $_[0]->{useperl}) ||
8e5f9a6e 158 $Data::Dumper::Useqq || (ref($_[0]) && $_[0]->{useqq}) ||
159 $Data::Dumper::Deparse || (ref($_[0]) && $_[0]->{deparse});
0f1923bd 160 return &Dumpperl;
161}
162
823edd99 163#
164# dump the refs in the current dumper object.
165# expects same args as new() if called via package name.
166#
0f1923bd 167sub Dumpperl {
823edd99 168 my($s) = shift;
169 my(@out, $val, $name);
170 my($i) = 0;
171 local(@post);
172
173 $s = $s->new(@_) unless ref $s;
174
175 for $val (@{$s->{todump}}) {
176 my $out = "";
177 @post = ();
178 $name = $s->{names}[$i++];
179 if (defined $name) {
180 if ($name =~ /^[*](.*)$/) {
181 if (defined $val) {
182 $name = (ref $val eq 'ARRAY') ? ( "\@" . $1 ) :
183 (ref $val eq 'HASH') ? ( "\%" . $1 ) :
184 (ref $val eq 'CODE') ? ( "\*" . $1 ) :
185 ( "\$" . $1 ) ;
186 }
187 else {
188 $name = "\$" . $1;
189 }
190 }
191 elsif ($name !~ /^\$/) {
192 $name = "\$" . $name;
193 }
194 }
195 else {
196 $name = "\$" . $s->{varname} . $i;
197 }
198
199 my $valstr;
200 {
201 local($s->{apad}) = $s->{apad};
202 $s->{apad} .= ' ' x (length($name) + 3) if $s->{indent} >= 2;
203 $valstr = $s->_dump($val, $name);
204 }
205
206 $valstr = "$name = " . $valstr . ';' if @post or !$s->{terse};
207 $out .= $s->{pad} . $valstr . $s->{sep};
208 $out .= $s->{pad} . join(';' . $s->{sep} . $s->{pad}, @post)
209 . ';' . $s->{sep} if @post;
210
211 push @out, $out;
212 }
213 return wantarray ? @out : join('', @out);
214}
215
216#
217# twist, toil and turn;
218# and recurse, of course.
31a725b3 219# sometimes sordidly;
220# and curse if no recourse.
823edd99 221#
222sub _dump {
223 my($s, $val, $name) = @_;
224 my($sname);
225 my($out, $realpack, $realtype, $type, $ipad, $id, $blesspad);
226
823edd99 227 $type = ref $val;
228 $out = "";
229
230 if ($type) {
231
232 # prep it, if it looks like an object
982af928 233 if (my $freezer = $s->{freezer}) {
234 $val->$freezer() if UNIVERSAL::can($val, $freezer);
823edd99 235 }
236
237 ($realpack, $realtype, $id) =
238 (overload::StrVal($val) =~ /^(?:(.*)\=)?([^=]*)\(([^\(]*)\)$/);
a2126434 239
7820172a 240 # if it has a name, we need to either look it up, or keep a tab
241 # on it so we know when we hit it later
242 if (defined($name) and length($name)) {
243 # keep a tab on it so that we dont fall into recursive pit
244 if (exists $s->{seen}{$id}) {
245# if ($s->{expdepth} < $s->{level}) {
246 if ($s->{purity} and $s->{level} > 0) {
247 $out = ($realtype eq 'HASH') ? '{}' :
248 ($realtype eq 'ARRAY') ? '[]' :
5df59fb6 249 'do{my $o}' ;
7820172a 250 push @post, $name . " = " . $s->{seen}{$id}[0];
823edd99 251 }
252 else {
7820172a 253 $out = $s->{seen}{$id}[0];
254 if ($name =~ /^([\@\%])/) {
255 my $start = $1;
256 if ($out =~ /^\\$start/) {
257 $out = substr($out, 1);
258 }
259 else {
260 $out = $start . '{' . $out . '}';
261 }
262 }
263 }
264 return $out;
265# }
266 }
267 else {
268 # store our name
269 $s->{seen}{$id} = [ (($name =~ /^[@%]/) ? ('\\' . $name ) :
270 ($realtype eq 'CODE' and
271 $name =~ /^[*](.*)$/) ? ('\\&' . $1 ) :
272 $name ),
273 $val ];
823edd99 274 }
823edd99 275 }
276
a2126434 277 if ($realpack and $realpack eq 'Regexp') {
7894fbab 278 $out = "$val";
279 $out =~ s,/,\\/,g;
280 return "qr/$out/";
a2126434 281 }
282
283 # If purity is not set and maxdepth is set, then check depth:
284 # if we have reached maximum depth, return the string
285 # representation of the thing we are currently examining
286 # at this depth (i.e., 'Foo=ARRAY(0xdeadbeef)').
287 if (!$s->{purity}
288 and $s->{maxdepth} > 0
289 and $s->{level} >= $s->{maxdepth})
290 {
291 return qq['$val'];
292 }
293
294 # we have a blessed ref
295 if ($realpack) {
296 $out = $s->{'bless'} . '( ';
297 $blesspad = $s->{apad};
298 $s->{apad} .= ' ' if ($s->{indent} >= 2);
7894fbab 299 }
300
823edd99 301 $s->{level}++;
302 $ipad = $s->{xpad} x $s->{level};
303
54964f74 304 if ($realtype eq 'SCALAR' || $realtype eq 'REF') {
823edd99 305 if ($realpack) {
7820172a 306 $out .= 'do{\\(my $o = ' . $s->_dump($$val, "\${$name}") . ')}';
823edd99 307 }
308 else {
7820172a 309 $out .= '\\' . $s->_dump($$val, "\${$name}");
823edd99 310 }
311 }
312 elsif ($realtype eq 'GLOB') {
7820172a 313 $out .= '\\' . $s->_dump($$val, "*{$name}");
823edd99 314 }
315 elsif ($realtype eq 'ARRAY') {
316 my($v, $pad, $mname);
317 my($i) = 0;
318 $out .= ($name =~ /^\@/) ? '(' : '[';
319 $pad = $s->{sep} . $s->{pad} . $s->{apad};
320 ($name =~ /^\@(.*)$/) ? ($mname = "\$" . $1) :
7820172a 321 # omit -> if $foo->[0]->{bar}, but not ${$foo->[0]}->{bar}
322 ($name =~ /^\\?[\%\@\*\$][^{].*[]}]$/) ? ($mname = $name) :
323 ($mname = $name . '->');
823edd99 324 $mname .= '->' if $mname =~ /^\*.+\{[A-Z]+\}$/;
325 for $v (@$val) {
326 $sname = $mname . '[' . $i . ']';
327 $out .= $pad . $ipad . '#' . $i if $s->{indent} >= 3;
328 $out .= $pad . $ipad . $s->_dump($v, $sname);
329 $out .= "," if $i++ < $#$val;
330 }
331 $out .= $pad . ($s->{xpad} x ($s->{level} - 1)) if $i;
332 $out .= ($name =~ /^\@/) ? ')' : ']';
333 }
334 elsif ($realtype eq 'HASH') {
335 my($k, $v, $pad, $lpad, $mname);
336 $out .= ($name =~ /^\%/) ? '(' : '{';
337 $pad = $s->{sep} . $s->{pad} . $s->{apad};
338 $lpad = $s->{apad};
7820172a 339 ($name =~ /^\%(.*)$/) ? ($mname = "\$" . $1) :
340 # omit -> if $foo->[0]->{bar}, but not ${$foo->[0]}->{bar}
341 ($name =~ /^\\?[\%\@\*\$][^{].*[]}]$/) ? ($mname = $name) :
342 ($mname = $name . '->');
823edd99 343 $mname .= '->' if $mname =~ /^\*.+\{[A-Z]+\}$/;
31a725b3 344 my ($sortkeys, $keys, $key) = ("$s->{sortkeys}");
345 if ($sortkeys) {
346 if (ref($s->{sortkeys}) eq 'CODE') {
347 $keys = $s->{sortkeys}($val);
348 unless (ref($keys) eq 'ARRAY') {
349 carp "Sortkeys subroutine did not return ARRAYREF";
350 $keys = [];
351 }
352 }
353 else {
354 $keys = [ sort keys %$val ];
355 }
356 }
357 while (($k, $v) = ! $sortkeys ? (each %$val) :
358 @$keys ? ($key = shift(@$keys), $val->{$key}) :
359 () )
360 {
823edd99 361 my $nk = $s->_dump($k, "");
362 $nk = $1 if !$s->{quotekeys} and $nk =~ /^[\"\']([A-Za-z_]\w*)[\"\']$/;
363 $sname = $mname . '{' . $nk . '}';
364 $out .= $pad . $ipad . $nk . " => ";
365
366 # temporarily alter apad
367 $s->{apad} .= (" " x (length($nk) + 4)) if $s->{indent} >= 2;
368 $out .= $s->_dump($val->{$k}, $sname) . ",";
369 $s->{apad} = $lpad if $s->{indent} >= 2;
370 }
371 if (substr($out, -1) eq ',') {
372 chop $out;
373 $out .= $pad . ($s->{xpad} x ($s->{level} - 1));
374 }
375 $out .= ($name =~ /^\%/) ? ')' : '}';
376 }
377 elsif ($realtype eq 'CODE') {
8e5f9a6e 378 if ($s->{deparse}) {
379 require B::Deparse;
380 my $sub = 'sub ' . (B::Deparse->new)->coderef2text($val);
381 $pad = $s->{sep} . $s->{pad} . $s->{xpad} . $s->{apad} . ' ';
382 $sub =~ s/\n/$pad/gse;
383 $out .= $sub;
384 } else {
385 $out .= 'sub { "DUMMY" }';
386 carp "Encountered CODE ref, using dummy placeholder" if $s->{purity};
387 }
823edd99 388 }
389 else {
390 croak "Can\'t handle $realtype type.";
391 }
392
393 if ($realpack) { # we have a blessed ref
394 $out .= ', \'' . $realpack . '\'' . ' )';
395 $out .= '->' . $s->{toaster} . '()' if $s->{toaster} ne '';
396 $s->{apad} = $blesspad;
397 }
398 $s->{level}--;
399
400 }
401 else { # simple scalar
402
403 my $ref = \$_[1];
404 # first, catalog the scalar
405 if ($name ne '') {
406 ($id) = ("$ref" =~ /\(([^\(]*)\)$/);
407 if (exists $s->{seen}{$id}) {
7820172a 408 if ($s->{seen}{$id}[2]) {
409 $out = $s->{seen}{$id}[0];
410 #warn "[<$out]\n";
411 return "\${$out}";
412 }
823edd99 413 }
414 else {
7820172a 415 #warn "[>\\$name]\n";
416 $s->{seen}{$id} = ["\\$name", $ref];
823edd99 417 }
418 }
419 if (ref($ref) eq 'GLOB' or "$ref" =~ /=GLOB\([^()]+\)$/) { # glob
420 my $name = substr($val, 1);
421 if ($name =~ /^[A-Za-z_][\w:]*$/) {
422 $name =~ s/^main::/::/;
423 $sname = $name;
424 }
425 else {
426 $sname = $s->_dump($name, "");
427 $sname = '{' . $sname . '}';
428 }
429 if ($s->{purity}) {
430 my $k;
431 local ($s->{level}) = 0;
432 for $k (qw(SCALAR ARRAY HASH)) {
7820172a 433 my $gval = *$val{$k};
434 next unless defined $gval;
435 next if $k eq "SCALAR" && ! defined $$gval; # always there
436
823edd99 437 # _dump can push into @post, so we hold our place using $postlen
438 my $postlen = scalar @post;
439 $post[$postlen] = "\*$sname = ";
440 local ($s->{apad}) = " " x length($post[$postlen]) if $s->{indent} >= 2;
7820172a 441 $post[$postlen] .= $s->_dump($gval, "\*$sname\{$k\}");
823edd99 442 }
443 }
444 $out .= '*' . $sname;
445 }
7820172a 446 elsif (!defined($val)) {
447 $out .= "undef";
448 }
45b49486 449 elsif ($val =~ /^(?:0|-?[1-9]\d{0,8})$/) { # safe decimal number
823edd99 450 $out .= $val;
451 }
452 else { # string
453 if ($s->{useqq}) {
7820172a 454 $out .= qquote($val, $s->{useqq});
823edd99 455 }
456 else {
457 $val =~ s/([\\\'])/\\$1/g;
458 $out .= '\'' . $val . '\'';
459 }
460 }
461 }
7820172a 462 if ($id) {
463 # if we made it this far, $id was added to seen list at current
464 # level, so remove it to get deep copies
465 if ($s->{deepcopy}) {
466 delete($s->{seen}{$id});
467 }
468 elsif ($name) {
469 $s->{seen}{$id}[2] = 1;
470 }
471 }
823edd99 472 return $out;
473}
474
475#
476# non-OO style of earlier version
477#
478sub Dumper {
479 return Data::Dumper->Dump([@_]);
480}
481
0f1923bd 482# compat stub
823edd99 483sub DumperX {
484 return Data::Dumper->Dumpxs([@_], []);
485}
486
487sub Dumpf { return Data::Dumper->Dump(@_) }
488
489sub Dumpp { print Data::Dumper->Dump(@_) }
490
491#
492# reset the "seen" cache
493#
494sub Reset {
495 my($s) = shift;
496 $s->{seen} = {};
497 return $s;
498}
499
500sub Indent {
501 my($s, $v) = @_;
502 if (defined($v)) {
503 if ($v == 0) {
504 $s->{xpad} = "";
505 $s->{sep} = "";
506 }
507 else {
508 $s->{xpad} = " ";
509 $s->{sep} = "\n";
510 }
511 $s->{indent} = $v;
512 return $s;
513 }
514 else {
515 return $s->{indent};
516 }
517}
518
519sub Pad {
520 my($s, $v) = @_;
521 defined($v) ? (($s->{pad} = $v), return $s) : $s->{pad};
522}
523
524sub Varname {
525 my($s, $v) = @_;
526 defined($v) ? (($s->{varname} = $v), return $s) : $s->{varname};
527}
528
529sub Purity {
530 my($s, $v) = @_;
531 defined($v) ? (($s->{purity} = $v), return $s) : $s->{purity};
532}
533
534sub Useqq {
535 my($s, $v) = @_;
536 defined($v) ? (($s->{useqq} = $v), return $s) : $s->{useqq};
537}
538
539sub Terse {
540 my($s, $v) = @_;
541 defined($v) ? (($s->{terse} = $v), return $s) : $s->{terse};
542}
543
544sub Freezer {
545 my($s, $v) = @_;
546 defined($v) ? (($s->{freezer} = $v), return $s) : $s->{freezer};
547}
548
549sub Toaster {
550 my($s, $v) = @_;
551 defined($v) ? (($s->{toaster} = $v), return $s) : $s->{toaster};
552}
553
554sub Deepcopy {
555 my($s, $v) = @_;
556 defined($v) ? (($s->{deepcopy} = $v), return $s) : $s->{deepcopy};
557}
558
559sub Quotekeys {
560 my($s, $v) = @_;
561 defined($v) ? (($s->{quotekeys} = $v), return $s) : $s->{quotekeys};
562}
563
564sub Bless {
565 my($s, $v) = @_;
566 defined($v) ? (($s->{'bless'} = $v), return $s) : $s->{'bless'};
567}
568
a2126434 569sub Maxdepth {
570 my($s, $v) = @_;
571 defined($v) ? (($s->{'maxdepth'} = $v), return $s) : $s->{'maxdepth'};
572}
573
31a725b3 574sub Useperl {
575 my($s, $v) = @_;
576 defined($v) ? (($s->{'useperl'} = $v), return $s) : $s->{'useperl'};
577}
578
579sub Sortkeys {
580 my($s, $v) = @_;
581 defined($v) ? (($s->{'sortkeys'} = $v), return $s) : $s->{'sortkeys'};
582}
583
8e5f9a6e 584sub Deparse {
585 my($s, $v) = @_;
586 defined($v) ? (($s->{'deparse'} = $v), return $s) : $s->{'deparse'};
587}
a2126434 588
7820172a 589# used by qquote below
590my %esc = (
591 "\a" => "\\a",
592 "\b" => "\\b",
593 "\t" => "\\t",
594 "\n" => "\\n",
595 "\f" => "\\f",
596 "\r" => "\\r",
597 "\e" => "\\e",
598);
599
823edd99 600# put a string value in double quotes
601sub qquote {
602 local($_) = shift;
7820172a 603 s/([\\\"\@\$])/\\$1/g;
dc71dc59 604 my $bytes; { use bytes; $bytes = length }
605 s/([^\x00-\x7f])/'\x{'.sprintf("%x",ord($1)).'}'/ge if $bytes > length;
0407a77b 606 return qq("$_") unless
607 /[^ !"\#\$%&'()*+,\-.\/0-9:;<=>?\@A-Z[\\\]^_`a-z{|}~]/; # fast exit
7820172a 608
609 my $high = shift || "";
610 s/([\a\b\t\n\f\r\e])/$esc{$1}/g;
611
0407a77b 612 if (ord('^')==94) { # ascii
613 # no need for 3 digits in escape for these
614 s/([\0-\037])(?!\d)/'\\'.sprintf('%o',ord($1))/eg;
615 s/([\0-\037\177])/'\\'.sprintf('%03o',ord($1))/eg;
43948175 616 # all but last branch below not supported --BEHAVIOR SUBJECT TO CHANGE--
0407a77b 617 if ($high eq "iso8859") {
618 s/([\200-\240])/'\\'.sprintf('%o',ord($1))/eg;
619 } elsif ($high eq "utf8") {
620# use utf8;
621# $str =~ s/([^\040-\176])/sprintf "\\x{%04x}", ord($1)/ge;
622 } elsif ($high eq "8bit") {
623 # leave it as it is
624 } else {
625 s/([\200-\377])/'\\'.sprintf('%03o',ord($1))/eg;
626 }
627 }
628 else { # ebcdic
43948175 629 s{([^ !"\#\$%&'()*+,\-.\/0-9:;<=>?\@A-Z[\\\]^_`a-z{|}~])(?!\d)}
630 {my $v = ord($1); '\\'.sprintf(($v <= 037 ? '%o' : '%03o'), $v)}eg;
631 s{([^ !"\#\$%&'()*+,\-.\/0-9:;<=>?\@A-Z[\\\]^_`a-z{|}~])}
632 {'\\'.sprintf('%03o',ord($1))}eg;
7820172a 633 }
0407a77b 634
7820172a 635 return qq("$_");
823edd99 636}
637
6381;
639__END__
640
641=head1 NAME
642
643Data::Dumper - stringified perl data structures, suitable for both printing and C<eval>
644
823edd99 645=head1 SYNOPSIS
646
647 use Data::Dumper;
648
649 # simple procedural interface
650 print Dumper($foo, $bar);
651
652 # extended usage with names
653 print Data::Dumper->Dump([$foo, $bar], [qw(foo *ary)]);
654
655 # configuration variables
656 {
657 local $Data::Dump::Purity = 1;
658 eval Data::Dumper->Dump([$foo, $bar], [qw(foo *ary)]);
659 }
660
661 # OO usage
662 $d = Data::Dumper->new([$foo, $bar], [qw(foo *ary)]);
663 ...
664 print $d->Dump;
665 ...
666 $d->Purity(1)->Terse(1)->Deepcopy(1);
667 eval $d->Dump;
668
669
670=head1 DESCRIPTION
671
672Given a list of scalars or reference variables, writes out their contents in
673perl syntax. The references can also be objects. The contents of each
674variable is output in a single Perl statement. Handles self-referential
675structures correctly.
676
677The return value can be C<eval>ed to get back an identical copy of the
678original reference structure.
679
680Any references that are the same as one of those passed in will be named
681C<$VAR>I<n> (where I<n> is a numeric suffix), and other duplicate references
682to substructures within C<$VAR>I<n> will be appropriately labeled using arrow
683notation. You can specify names for individual values to be dumped if you
684use the C<Dump()> method, or you can change the default C<$VAR> prefix to
685something else. See C<$Data::Dumper::Varname> and C<$Data::Dumper::Terse>
686below.
687
688The default output of self-referential structures can be C<eval>ed, but the
689nested references to C<$VAR>I<n> will be undefined, since a recursive
690structure cannot be constructed using one Perl statement. You should set the
691C<Purity> flag to 1 to get additional statements that will correctly fill in
692these references.
693
694In the extended usage form, the references to be dumped can be given
695user-specified names. If a name begins with a C<*>, the output will
696describe the dereferenced type of the supplied reference for hashes and
697arrays, and coderefs. Output of names will be avoided where possible if
698the C<Terse> flag is set.
699
700In many cases, methods that are used to set the internal state of the
701object will return the object itself, so method calls can be conveniently
702chained together.
703
704Several styles of output are possible, all controlled by setting
705the C<Indent> flag. See L<Configuration Variables or Methods> below
706for details.
707
708
709=head2 Methods
710
711=over 4
712
713=item I<PACKAGE>->new(I<ARRAYREF [>, I<ARRAYREF]>)
714
715Returns a newly created C<Data::Dumper> object. The first argument is an
716anonymous array of values to be dumped. The optional second argument is an
717anonymous array of names for the values. The names need not have a leading
718C<$> sign, and must be comprised of alphanumeric characters. You can begin
719a name with a C<*> to specify that the dereferenced type must be dumped
720instead of the reference itself, for ARRAY and HASH references.
721
722The prefix specified by C<$Data::Dumper::Varname> will be used with a
723numeric suffix if the name for a value is undefined.
724
725Data::Dumper will catalog all references encountered while dumping the
726values. Cross-references (in the form of names of substructures in perl
727syntax) will be inserted at all possible points, preserving any structural
728interdependencies in the original set of values. Structure traversal is
729depth-first, and proceeds in order from the first supplied value to
730the last.
731
732=item I<$OBJ>->Dump I<or> I<PACKAGE>->Dump(I<ARRAYREF [>, I<ARRAYREF]>)
733
734Returns the stringified form of the values stored in the object (preserving
735the order in which they were supplied to C<new>), subject to the
91e74348 736configuration options below. In a list context, it returns a list
823edd99 737of strings corresponding to the supplied values.
738
739The second form, for convenience, simply calls the C<new> method on its
740arguments before dumping the object immediately.
741
823edd99 742=item I<$OBJ>->Seen(I<[HASHREF]>)
743
744Queries or adds to the internal table of already encountered references.
745You must use C<Reset> to explicitly clear the table if needed. Such
746references are not dumped; instead, their names are inserted wherever they
747are encountered subsequently. This is useful especially for properly
748dumping subroutine references.
749
d1be9408 750Expects an anonymous hash of name => value pairs. Same rules apply for names
823edd99 751as in C<new>. If no argument is supplied, will return the "seen" list of
91e74348 752name => value pairs, in a list context. Otherwise, returns the object
823edd99 753itself.
754
755=item I<$OBJ>->Values(I<[ARRAYREF]>)
756
757Queries or replaces the internal array of values that will be dumped.
758When called without arguments, returns the values. Otherwise, returns the
759object itself.
760
761=item I<$OBJ>->Names(I<[ARRAYREF]>)
762
763Queries or replaces the internal array of user supplied names for the values
764that will be dumped. When called without arguments, returns the names.
765Otherwise, returns the object itself.
766
767=item I<$OBJ>->Reset
768
769Clears the internal table of "seen" references and returns the object
770itself.
771
772=back
773
774=head2 Functions
775
776=over 4
777
778=item Dumper(I<LIST>)
779
780Returns the stringified form of the values in the list, subject to the
781configuration options below. The values will be named C<$VAR>I<n> in the
782output, where I<n> is a numeric suffix. Will return a list of strings
91e74348 783in a list context.
823edd99 784
823edd99 785=back
786
787=head2 Configuration Variables or Methods
788
789Several configuration variables can be used to control the kind of output
790generated when using the procedural interface. These variables are usually
791C<local>ized in a block so that other parts of the code are not affected by
792the change.
793
794These variables determine the default state of the object created by calling
795the C<new> method, but cannot be used to alter the state of the object
796thereafter. The equivalent method names should be used instead to query
797or set the internal state of the object.
798
799The method forms return the object itself when called with arguments,
800so that they can be chained together nicely.
801
802=over 4
803
804=item $Data::Dumper::Indent I<or> I<$OBJ>->Indent(I<[NEWVAL]>)
805
806Controls the style of indentation. It can be set to 0, 1, 2 or 3. Style 0
807spews output without any newlines, indentation, or spaces between list
808items. It is the most compact format possible that can still be called
809valid perl. Style 1 outputs a readable form with newlines but no fancy
810indentation (each level in the structure is simply indented by a fixed
811amount of whitespace). Style 2 (the default) outputs a very readable form
812which takes into account the length of hash keys (so the hash value lines
813up). Style 3 is like style 2, but also annotates the elements of arrays
814with their index (but the comment is on its own line, so array output
815consumes twice the number of lines). Style 2 is the default.
816
817=item $Data::Dumper::Purity I<or> I<$OBJ>->Purity(I<[NEWVAL]>)
818
819Controls the degree to which the output can be C<eval>ed to recreate the
820supplied reference structures. Setting it to 1 will output additional perl
821statements that will correctly recreate nested references. The default is
8220.
823
824=item $Data::Dumper::Pad I<or> I<$OBJ>->Pad(I<[NEWVAL]>)
825
826Specifies the string that will be prefixed to every line of the output.
827Empty string by default.
828
829=item $Data::Dumper::Varname I<or> I<$OBJ>->Varname(I<[NEWVAL]>)
830
831Contains the prefix to use for tagging variable names in the output. The
832default is "VAR".
833
834=item $Data::Dumper::Useqq I<or> I<$OBJ>->Useqq(I<[NEWVAL]>)
835
836When set, enables the use of double quotes for representing string values.
837Whitespace other than space will be represented as C<[\n\t\r]>, "unsafe"
838characters will be backslashed, and unprintable characters will be output as
839quoted octal integers. Since setting this variable imposes a performance
0f1923bd 840penalty, the default is 0. C<Dump()> will run slower if this flag is set,
841since the fast XSUB implementation doesn't support it yet.
823edd99 842
843=item $Data::Dumper::Terse I<or> I<$OBJ>->Terse(I<[NEWVAL]>)
844
845When set, Data::Dumper will emit single, non-self-referential values as
846atoms/terms rather than statements. This means that the C<$VAR>I<n> names
847will be avoided where possible, but be advised that such output may not
848always be parseable by C<eval>.
849
850=item $Data::Dumper::Freezer I<or> $I<OBJ>->Freezer(I<[NEWVAL]>)
851
852Can be set to a method name, or to an empty string to disable the feature.
853Data::Dumper will invoke that method via the object before attempting to
854stringify it. This method can alter the contents of the object (if, for
855instance, it contains data allocated from C), and even rebless it in a
856different package. The client is responsible for making sure the specified
857method can be called via the object, and that the object ends up containing
858only perl data types after the method has been called. Defaults to an empty
859string.
860
861=item $Data::Dumper::Toaster I<or> $I<OBJ>->Toaster(I<[NEWVAL]>)
862
863Can be set to a method name, or to an empty string to disable the feature.
864Data::Dumper will emit a method call for any objects that are to be dumped
8e5f9a6e 865using the syntax C<bless(DATA, CLASS)-E<gt>METHOD()>. Note that this means that
823edd99 866the method specified will have to perform any modifications required on the
867object (like creating new state within it, and/or reblessing it in a
868different package) and then return it. The client is responsible for making
869sure the method can be called via the object, and that it returns a valid
870object. Defaults to an empty string.
871
872=item $Data::Dumper::Deepcopy I<or> $I<OBJ>->Deepcopy(I<[NEWVAL]>)
873
874Can be set to a boolean value to enable deep copies of structures.
875Cross-referencing will then only be done when absolutely essential
876(i.e., to break reference cycles). Default is 0.
877
878=item $Data::Dumper::Quotekeys I<or> $I<OBJ>->Quotekeys(I<[NEWVAL]>)
879
880Can be set to a boolean value to control whether hash keys are quoted.
881A false value will avoid quoting hash keys when it looks like a simple
882string. Default is 1, which will always enclose hash keys in quotes.
883
884=item $Data::Dumper::Bless I<or> $I<OBJ>->Bless(I<[NEWVAL]>)
885
886Can be set to a string that specifies an alternative to the C<bless>
887builtin operator used to create objects. A function with the specified
888name should exist, and should accept the same arguments as the builtin.
889Default is C<bless>.
890
a2126434 891=item $Data::Dumper::Maxdepth I<or> $I<OBJ>->Maxdepth(I<[NEWVAL]>)
892
893Can be set to a positive integer that specifies the depth beyond which
894which we don't venture into a structure. Has no effect when
895C<Data::Dumper::Purity> is set. (Useful in debugger when we often don't
896want to see more than enough). Default is 0, which means there is
897no maximum depth.
898
31a725b3 899=item $Data::Dumper::Useperl I<or> $I<OBJ>->Useperl(I<[NEWVAL]>)
900
901Can be set to a boolean value which controls whether the pure Perl
902implementation of C<Data::Dumper> is used. The C<Data::Dumper> module is
903a dual implementation, with almost all functionality written in both
904pure Perl and also in XS ('C'). Since the XS version is much faster, it
905will always be used if possible. This option lets you override the
906default behavior, usually for testing purposes only. Default is 0, which
907means the XS implementation will be used if possible.
908
909=item $Data::Dumper::Sortkeys I<or> $I<OBJ>->Sortkeys(I<[NEWVAL]>)
910
911Can be set to a boolean value to control whether hash keys are dumped in
912sorted order. A true value will cause the keys of all hashes to be
913dumped in Perl's default sort order. Can also be set to a subroutine
914reference which will be called for each hash that is dumped. In this
915case C<Data::Dumper> will call the subroutine once for each hash,
916passing it the reference of the hash. The purpose of the subroutine is
917to return a reference to an array of the keys that will be dumped, in
918the order that they should be dumped. Using this feature, you can
919control both the order of the keys, and which keys are actually used. In
920other words, this subroutine acts as a filter by which you can exclude
921certain keys from being dumped. Default is 0, which means that hash keys
922are not sorted.
923
8e5f9a6e 924=item $Data::Dumper::Deparse I<or> $I<OBJ>->Deparse(I<[NEWVAL]>)
925
926Can be set to a boolean value to control whether code references are
927turned into perl source code. If set to a true value, C<B::Deparse>
928will be used to get the source of the code reference. Using this option
929will force using the Perl implementation of the dumper, since the fast
930XSUB implementation doesn't support it.
931
932Caution : use this option only if you know that your coderefs will be
933properly reconstructed by C<B::Deparse>.
934
823edd99 935=back
936
937=head2 Exports
938
939=over 4
940
941=item Dumper
942
943=back
944
945=head1 EXAMPLES
946
947Run these code snippets to get a quick feel for the behavior of this
948module. When you are through with these examples, you may want to
949add or change the various configuration variables described above,
950to see their behavior. (See the testsuite in the Data::Dumper
951distribution for more examples.)
952
953
954 use Data::Dumper;
955
956 package Foo;
957 sub new {bless {'a' => 1, 'b' => sub { return "foo" }}, $_[0]};
958
959 package Fuz; # a weird REF-REF-SCALAR object
960 sub new {bless \($_ = \ 'fu\'z'), $_[0]};
961
962 package main;
963 $foo = Foo->new;
964 $fuz = Fuz->new;
965 $boo = [ 1, [], "abcd", \*foo,
966 {1 => 'a', 023 => 'b', 0x45 => 'c'},
967 \\"p\q\'r", $foo, $fuz];
3cb6de81 968
823edd99 969 ########
970 # simple usage
971 ########
972
973 $bar = eval(Dumper($boo));
974 print($@) if $@;
975 print Dumper($boo), Dumper($bar); # pretty print (no array indices)
976
977 $Data::Dumper::Terse = 1; # don't output names where feasible
978 $Data::Dumper::Indent = 0; # turn off all pretty print
979 print Dumper($boo), "\n";
980
981 $Data::Dumper::Indent = 1; # mild pretty print
982 print Dumper($boo);
983
984 $Data::Dumper::Indent = 3; # pretty print with array indices
985 print Dumper($boo);
986
987 $Data::Dumper::Useqq = 1; # print strings in double quotes
988 print Dumper($boo);
3cb6de81 989
990
823edd99 991 ########
992 # recursive structures
993 ########
3cb6de81 994
823edd99 995 @c = ('c');
996 $c = \@c;
997 $b = {};
998 $a = [1, $b, $c];
999 $b->{a} = $a;
1000 $b->{b} = $a->[1];
1001 $b->{c} = $a->[2];
1002 print Data::Dumper->Dump([$a,$b,$c], [qw(a b c)]);
3cb6de81 1003
1004
823edd99 1005 $Data::Dumper::Purity = 1; # fill in the holes for eval
1006 print Data::Dumper->Dump([$a, $b], [qw(*a b)]); # print as @a
1007 print Data::Dumper->Dump([$b, $a], [qw(*b a)]); # print as %b
3cb6de81 1008
1009
823edd99 1010 $Data::Dumper::Deepcopy = 1; # avoid cross-refs
1011 print Data::Dumper->Dump([$b, $a], [qw(*b a)]);
3cb6de81 1012
1013
823edd99 1014 $Data::Dumper::Purity = 0; # avoid cross-refs
1015 print Data::Dumper->Dump([$b, $a], [qw(*b a)]);
3cb6de81 1016
a2126434 1017 ########
1018 # deep structures
1019 ########
3cb6de81 1020
a2126434 1021 $a = "pearl";
1022 $b = [ $a ];
1023 $c = { 'b' => $b };
1024 $d = [ $c ];
1025 $e = { 'd' => $d };
1026 $f = { 'e' => $e };
1027 print Data::Dumper->Dump([$f], [qw(f)]);
1028
1029 $Data::Dumper::Maxdepth = 3; # no deeper than 3 refs down
1030 print Data::Dumper->Dump([$f], [qw(f)]);
1031
3cb6de81 1032
823edd99 1033 ########
1034 # object-oriented usage
1035 ########
3cb6de81 1036
823edd99 1037 $d = Data::Dumper->new([$a,$b], [qw(a b)]);
1038 $d->Seen({'*c' => $c}); # stash a ref without printing it
1039 $d->Indent(3);
1040 print $d->Dump;
1041 $d->Reset->Purity(0); # empty the seen cache
1042 print join "----\n", $d->Dump;
3cb6de81 1043
1044
823edd99 1045 ########
1046 # persistence
1047 ########
3cb6de81 1048
823edd99 1049 package Foo;
1050 sub new { bless { state => 'awake' }, shift }
1051 sub Freeze {
1052 my $s = shift;
1053 print STDERR "preparing to sleep\n";
1054 $s->{state} = 'asleep';
1055 return bless $s, 'Foo::ZZZ';
1056 }
3cb6de81 1057
823edd99 1058 package Foo::ZZZ;
1059 sub Thaw {
1060 my $s = shift;
1061 print STDERR "waking up\n";
1062 $s->{state} = 'awake';
1063 return bless $s, 'Foo';
1064 }
3cb6de81 1065
823edd99 1066 package Foo;
1067 use Data::Dumper;
1068 $a = Foo->new;
1069 $b = Data::Dumper->new([$a], ['c']);
1070 $b->Freezer('Freeze');
1071 $b->Toaster('Thaw');
1072 $c = $b->Dump;
1073 print $c;
1074 $d = eval $c;
1075 print Data::Dumper->Dump([$d], ['d']);
3cb6de81 1076
1077
823edd99 1078 ########
1079 # symbol substitution (useful for recreating CODE refs)
1080 ########
3cb6de81 1081
823edd99 1082 sub foo { print "foo speaking\n" }
1083 *other = \&foo;
1084 $bar = [ \&other ];
1085 $d = Data::Dumper->new([\&other,$bar],['*other','bar']);
1086 $d->Seen({ '*foo' => \&foo });
1087 print $d->Dump;
1088
1089
31a725b3 1090 ########
1091 # sorting and filtering hash keys
1092 ########
1093
1094 $Data::Dumper::Sortkeys = \&my_filter;
1095 my $foo = { map { (ord, "$_$_$_") } 'I'..'Q' };
1096 my $bar = { %$foo };
1097 my $baz = { reverse %$foo };
1098 print Dumper [ $foo, $bar, $baz ];
1099
1100 sub my_filter {
1101 my ($hash) = @_;
1102 # return an array ref containing the hash keys to dump
1103 # in the order that you want them to be dumped
1104 return [
1105 # Sort the keys of %$foo in reverse numeric order
1106 $hash eq $foo ? (sort {$b <=> $a} keys %$hash) :
1107 # Only dump the odd number keys of %$bar
1108 $hash eq $bar ? (grep {$_ % 2} keys %$hash) :
1109 # Sort keys in default order for all other hashes
1110 (sort keys %$hash)
1111 ];
1112 }
1113
823edd99 1114=head1 BUGS
1115
1116Due to limitations of Perl subroutine call semantics, you cannot pass an
1117array or hash. Prepend it with a C<\> to pass its reference instead. This
8e5f9a6e 1118will be remedied in time, now that Perl has subroutine prototypes.
1119For now, you need to use the extended usage form, and prepend the
823edd99 1120name with a C<*> to output it as a hash or array.
1121
1122C<Data::Dumper> cheats with CODE references. If a code reference is
8e5f9a6e 1123encountered in the structure being processed (and if you haven't set
1124the C<Deparse> flag), an anonymous subroutine that
823edd99 1125contains the string '"DUMMY"' will be inserted in its place, and a warning
1126will be printed if C<Purity> is set. You can C<eval> the result, but bear
1127in mind that the anonymous sub that gets created is just a placeholder.
1128Someday, perl will have a switch to cache-on-demand the string
1129representation of a compiled piece of code, I hope. If you have prior
1130knowledge of all the code refs that your data structures are likely
1131to have, you can use the C<Seen> method to pre-seed the internal reference
1132table and make the dumped output point to them, instead. See L<EXAMPLES>
1133above.
1134
8e5f9a6e 1135The C<Useqq> and C<Deparse> flags makes Dump() run slower, since the
1136XSUB implementation does not support them.
823edd99 1137
1138SCALAR objects have the weirdest looking C<bless> workaround.
1139
1140
1141=head1 AUTHOR
1142
6e238990 1143Gurusamy Sarathy gsar@activestate.com
823edd99 1144
1145Copyright (c) 1996-98 Gurusamy Sarathy. All rights reserved.
1146This program is free software; you can redistribute it and/or
1147modify it under the same terms as Perl itself.
1148
1149
1150=head1 VERSION
1151
8e5f9a6e 1152Version 2.12 (unreleased)
823edd99 1153
1154=head1 SEE ALSO
1155
1156perl(1)
1157
1158=cut