Implement state array and state hashes. Initialisation assignment
[p5sagit/p5-mst-13.2.git] / ext / B / B / Concise.pm
CommitLineData
c99ca59a 1package B::Concise;
c27ea44e 2# Copyright (C) 2000-2003 Stephen McCamant. All rights reserved.
c99ca59a 3# This program is free software; you can redistribute and/or modify it
4# under the same terms as Perl itself.
5
8ec8fbef 6# Note: we need to keep track of how many use declarations/BEGIN
7# blocks this module uses, so we can avoid printing them when user
8# asks for the BEGIN blocks in her program. Update the comments and
9# the count in concise_specials if you add or delete one. The
10# -MO=Concise counts as use #1.
78ad9108 11
8ec8fbef 12use strict; # use #2
13use warnings; # uses #3 and #4, since warnings uses Carp
78ad9108 14
8ec8fbef 15use Exporter (); # use #5
16
952306ac 17our $VERSION = "0.68";
78ad9108 18our @ISA = qw(Exporter);
cc02ea56 19our @EXPORT_OK = qw( set_style set_style_standard add_callback
20 concise_subref concise_cv concise_main
21 add_style walk_output compile reset_sequence );
22our %EXPORT_TAGS =
23 ( io => [qw( walk_output compile reset_sequence )],
24 style => [qw( add_style set_style_standard )],
25 cb => [qw( add_callback )],
26 mech => [qw( concise_subref concise_cv concise_main )], );
78ad9108 27
8ec8fbef 28# use #6
c99ca59a 29use B qw(class ppname main_start main_root main_cv cstring svref_2object
6a077020 30 SVf_IOK SVf_NOK SVf_POK SVf_IVisUV SVf_FAKE OPf_KIDS OPf_SPECIAL
31 CVf_ANON);
c99ca59a 32
f95e3c3c 33my %style =
c99ca59a 34 ("terse" =>
c3caa09d 35 ["(?(#label =>\n)?)(*( )*)#class (#addr) #name (?([#targ])?) "
36 . "#svclass~(?((#svaddr))?)~#svval~(?(label \"#coplabel\")?)\n",
c99ca59a 37 "(*( )*)goto #class (#addr)\n",
38 "#class pp_#name"],
39 "concise" =>
40 ["#hyphseq2 (*( (x( ;)x))*)<#classsym> "
cc02ea56 41 . "#exname#arg(?([#targarglife])?)~#flags(?(/#private)?)(x(;~->#next)x)\n"
42 , " (*( )*) goto #seq\n",
c99ca59a 43 "(?(<#seq>)?)#exname#arg(?([#targarglife])?)"],
44 "linenoise" =>
45 ["(x(;(*( )*))x)#noise#arg(?([#targarg])?)(x( ;\n)x)",
46 "gt_#seq ",
47 "(?(#seq)?)#noise#arg(?([#targarg])?)"],
48 "debug" =>
49 ["#class (#addr)\n\top_next\t\t#nextaddr\n\top_sibling\t#sibaddr\n\t"
7252851f 50 . "op_ppaddr\tPL_ppaddr[OP_#NAME]\n\top_type\t\t#typenum\n" .
51 ($] > 5.009 ? '' : "\top_seq\t\t#seqnum\n")
2814eb74 52 . "\top_flags\t#flagval\n\top_private\t#privval\n"
c99ca59a 53 . "(?(\top_first\t#firstaddr\n)?)(?(\top_last\t\t#lastaddr\n)?)"
54 . "(?(\top_sv\t\t#svaddr\n)?)",
55 " GOTO #addr\n",
56 "#addr"],
57 "env" => [$ENV{B_CONCISE_FORMAT}, $ENV{B_CONCISE_GOTO_FORMAT},
58 $ENV{B_CONCISE_TREE_FORMAT}],
59 );
60
724aa791 61# Renderings, ie how Concise prints, is controlled by these vars
62# primary:
63our $stylename; # selects current style from %style
64my $order = "basic"; # how optree is walked & printed: basic, exec, tree
65
66# rendering mechanics:
67# these 'formats' are the line-rendering templates
68# they're updated from %style when $stylename changes
69my ($format, $gotofmt, $treefmt);
70
71# lesser players:
72my $base = 36; # how <sequence#> is displayed
73my $big_endian = 1; # more <sequence#> display
74my $tree_style = 0; # tree-order details
75my $banner = 1; # print banner before optree is traversed
cc02ea56 76my $do_main = 0; # force printing of main routine
724aa791 77
cc02ea56 78# another factor: can affect all styles!
724aa791 79our @callbacks; # allow external management
80
81set_style_standard("concise");
82
c99ca59a 83my $curcv;
c27ea44e 84my $cop_seq_base;
78ad9108 85
86sub set_style {
87 ($format, $gotofmt, $treefmt) = @_;
724aa791 88 #warn "set_style: deprecated, use set_style_standard instead\n"; # someday
f95e3c3c 89 die "expecting 3 style-format args\n" unless @_ == 3;
90}
91
92sub add_style {
93 my ($newstyle,@args) = @_;
94 die "style '$newstyle' already exists, choose a new name\n"
95 if exists $style{$newstyle};
96 die "expecting 3 style-format args\n" unless @args == 3;
97 $style{$newstyle} = [@args];
724aa791 98 $stylename = $newstyle; # update rendering state
78ad9108 99}
100
31b49ad4 101sub set_style_standard {
724aa791 102 ($stylename) = @_; # update rendering state
f95e3c3c 103 die "err: style '$stylename' unknown\n" unless exists $style{$stylename};
104 set_style(@{$style{$stylename}});
31b49ad4 105}
106
78ad9108 107sub add_callback {
108 push @callbacks, @_;
109}
c99ca59a 110
f95e3c3c 111# output handle, used with all Concise-output printing
cc02ea56 112our $walkHandle; # public for your convenience
113BEGIN { $walkHandle = \*STDOUT }
f95e3c3c 114
115sub walk_output { # updates $walkHandle
116 my $handle = shift;
cc02ea56 117 return $walkHandle unless $handle; # allow use as accessor
118
f95e3c3c 119 if (ref $handle eq 'SCALAR') {
2ce64696 120 require Config;
121 die "no perlio in this build, can't call walk_output (\\\$scalar)\n"
122 unless $Config::Config{useperlio};
f95e3c3c 123 # in 5.8+, open(FILEHANDLE,MODE,REFERENCE) writes to string
2ce64696 124 open my $tmp, '>', $handle; # but cant re-set existing STDOUT
f95e3c3c 125 $walkHandle = $tmp; # so use my $tmp as intermediate var
cc02ea56 126 return $walkHandle;
f95e3c3c 127 }
cc02ea56 128 my $iotype = ref $handle;
f95e3c3c 129 die "expecting argument/object that can print\n"
cc02ea56 130 unless $iotype eq 'GLOB' or $iotype and $handle->can('print');
131 $walkHandle = $handle;
f95e3c3c 132}
133
8ec8fbef 134sub concise_subref {
c0939cee 135 my($order, $coderef, $name) = @_;
f95e3c3c 136 my $codeobj = svref_2object($coderef);
cc02ea56 137
c0939cee 138 return concise_stashref(@_)
cc02ea56 139 unless ref $codeobj eq 'B::CV';
c0939cee 140 concise_cv_obj($order, $codeobj, $name);
8ec8fbef 141}
142
cc02ea56 143sub concise_stashref {
144 my($order, $h) = @_;
145 foreach my $k (sort keys %$h) {
146 local *s = $h->{$k};
147 my $coderef = *s{CODE} or next;
148 reset_sequence();
149 print "FUNC: ", *s, "\n";
150 my $codeobj = svref_2object($coderef);
151 next unless ref $codeobj eq 'B::CV';
152 eval { concise_cv_obj($order, $codeobj) }
153 or warn "err $@ on $codeobj";
154 }
155}
156
8ec8fbef 157# This should have been called concise_subref, but it was exported
158# under this name in versions before 0.56
c0939cee 159*concise_cv = \&concise_subref;
8ec8fbef 160
161sub concise_cv_obj {
c0939cee 162 my ($order, $cv, $name) = @_;
163 # name is either a string, or a CODE ref (copy of $cv arg??)
164
c99ca59a 165 $curcv = $cv;
d51cf0c9 166
2018a5c3 167 if (ref($cv->XSUBANY) =~ /B::(\w+)/) {
d51cf0c9 168 print $walkHandle "$name is a constant sub, optimized to a $1\n";
169 return;
170 }
c0939cee 171 if ($cv->XSUB) {
172 print $walkHandle "$name is XS code\n";
173 return;
174 }
175 if (class($cv->START) eq "NULL") {
176 no strict 'refs';
177 if (ref $name eq 'CODE') {
178 print $walkHandle "coderef $name has no START\n";
179 }
180 elsif (exists &$name) {
e75702e9 181 print $walkHandle "$name exists in stash, but has no START\n";
c0939cee 182 }
183 else {
184 print $walkHandle "$name not in symbol table\n";
185 }
186 return;
187 }
c27ea44e 188 sequence($cv->START);
c99ca59a 189 if ($order eq "exec") {
190 walk_exec($cv->START);
c0939cee 191 }
192 elsif ($order eq "basic") {
193 # walk_topdown($cv->ROOT, sub { $_[0]->concise($_[1]) }, 0);
194 my $root = $cv->ROOT;
195 unless (ref $root eq 'B::NULL') {
196 walk_topdown($root, sub { $_[0]->concise($_[1]) }, 0);
197 } else {
198 print $walkHandle "B::NULL encountered doing ROOT on $cv. avoiding disaster\n";
199 }
c99ca59a 200 } else {
f95e3c3c 201 print $walkHandle tree($cv->ROOT, 0);
c99ca59a 202 }
203}
204
31b49ad4 205sub concise_main {
206 my($order) = @_;
207 sequence(main_start);
208 $curcv = main_cv;
209 if ($order eq "exec") {
210 return if class(main_start) eq "NULL";
211 walk_exec(main_start);
212 } elsif ($order eq "tree") {
213 return if class(main_root) eq "NULL";
f95e3c3c 214 print $walkHandle tree(main_root, 0);
31b49ad4 215 } elsif ($order eq "basic") {
216 return if class(main_root) eq "NULL";
217 walk_topdown(main_root,
218 sub { $_[0]->concise($_[1]) }, 0);
219 }
220}
221
8ec8fbef 222sub concise_specials {
223 my($name, $order, @cv_s) = @_;
224 my $i = 1;
225 if ($name eq "BEGIN") {
c0939cee 226 splice(@cv_s, 0, 8); # skip 7 BEGIN blocks in this file. NOW 8 ??
8ec8fbef 227 } elsif ($name eq "CHECK") {
228 pop @cv_s; # skip the CHECK block that calls us
229 }
f95e3c3c 230 for my $cv (@cv_s) {
231 print $walkHandle "$name $i:\n";
8ec8fbef 232 $i++;
c0939cee 233 concise_cv_obj($order, $cv, $name);
8ec8fbef 234 }
235}
236
c99ca59a 237my $start_sym = "\e(0"; # "\cN" sometimes also works
238my $end_sym = "\e(B"; # "\cO" respectively
239
f95e3c3c 240my @tree_decorations =
c99ca59a 241 ([" ", "--", "+-", "|-", "| ", "`-", "-", 1],
242 [" ", "-", "+", "+", "|", "`", "", 0],
243 [" ", map("$start_sym$_$end_sym", "qq", "wq", "tq", "x ", "mq", "q"), 1],
244 [" ", map("$start_sym$_$end_sym", "q", "w", "t", "x", "m"), "", 0],
245 );
78ad9108 246
cc02ea56 247
248sub compileOpts {
249 # set rendering state from options and args
c0939cee 250 my (@options,@args);
251 if (@_) {
252 @options = grep(/^-/, @_);
253 @args = grep(!/^-/, @_);
254 }
c99ca59a 255 for my $o (@options) {
cc02ea56 256 # mode/order
c99ca59a 257 if ($o eq "-basic") {
258 $order = "basic";
259 } elsif ($o eq "-exec") {
260 $order = "exec";
261 } elsif ($o eq "-tree") {
262 $order = "tree";
cc02ea56 263 }
264 # tree-specific
265 elsif ($o eq "-compact") {
c99ca59a 266 $tree_style |= 1;
267 } elsif ($o eq "-loose") {
268 $tree_style &= ~1;
269 } elsif ($o eq "-vt") {
270 $tree_style |= 2;
271 } elsif ($o eq "-ascii") {
272 $tree_style &= ~2;
cc02ea56 273 }
274 # sequence numbering
275 elsif ($o =~ /^-base(\d+)$/) {
c99ca59a 276 $base = $1;
277 } elsif ($o eq "-bigendian") {
278 $big_endian = 1;
279 } elsif ($o eq "-littleendian") {
280 $big_endian = 0;
cc02ea56 281 }
282 elsif ($o eq "-nobanner") {
724aa791 283 $banner = 0;
cc02ea56 284 } elsif ($o eq "-banner") {
285 $banner = 1;
286 }
287 elsif ($o eq "-main") {
288 $do_main = 1;
289 } elsif ($o eq "-nomain") {
290 $do_main = 0;
724aa791 291 }
cc02ea56 292 # line-style options
724aa791 293 elsif (exists $style{substr($o, 1)}) {
f95e3c3c 294 $stylename = substr($o, 1);
724aa791 295 set_style_standard($stylename);
c99ca59a 296 } else {
297 warn "Option $o unrecognized";
298 }
299 }
cc02ea56 300 return (@args);
301}
302
303sub compile {
304 my (@args) = compileOpts(@_);
c27ea44e 305 return sub {
cc02ea56 306 my @newargs = compileOpts(@_); # accept new rendering options
307 warn "disregarding non-options: @newargs\n" if @newargs;
308
309 for my $objname (@args) {
59910b6d 310 next unless $objname; # skip null args to avoid noisy responses
311
cc02ea56 312 if ($objname eq "BEGIN") {
313 concise_specials("BEGIN", $order,
c0939cee 314 B::begin_av->isa("B::AV") ?
315 B::begin_av->ARRAY : ());
cc02ea56 316 } elsif ($objname eq "INIT") {
317 concise_specials("INIT", $order,
c0939cee 318 B::init_av->isa("B::AV") ?
319 B::init_av->ARRAY : ());
cc02ea56 320 } elsif ($objname eq "CHECK") {
321 concise_specials("CHECK", $order,
c0939cee 322 B::check_av->isa("B::AV") ?
323 B::check_av->ARRAY : ());
cc02ea56 324 } elsif ($objname eq "END") {
325 concise_specials("END", $order,
c0939cee 326 B::end_av->isa("B::AV") ?
327 B::end_av->ARRAY : ());
cc02ea56 328 }
329 else {
330 # convert function names to subrefs
331 my $objref;
332 if (ref $objname) {
333 print $walkHandle "B::Concise::compile($objname)\n"
334 if $banner;
335 $objref = $objname;
8ec8fbef 336 } else {
cc02ea56 337 $objname = "main::" . $objname unless $objname =~ /::/;
338 print $walkHandle "$objname:\n";
339 no strict 'refs';
c0939cee 340 unless (exists &$objname) {
341 print $walkHandle "err: unknown function ($objname)\n";
342 return;
343 }
cc02ea56 344 $objref = \&$objname;
8ec8fbef 345 }
c0939cee 346 concise_subref($order, $objref, $objname);
c99ca59a 347 }
348 }
c27ea44e 349 if (!@args or $do_main) {
f95e3c3c 350 print $walkHandle "main program:\n" if $do_main;
31b49ad4 351 concise_main($order);
c99ca59a 352 }
cc02ea56 353 return @args; # something
c99ca59a 354 }
355}
356
357my %labels;
724aa791 358my $lastnext; # remembers op-chain, used to insert gotos
c99ca59a 359
360my %opclass = ('OP' => "0", 'UNOP' => "1", 'BINOP' => "2", 'LOGOP' => "|",
361 'LISTOP' => "@", 'PMOP' => "/", 'SVOP' => "\$", 'GVOP' => "*",
051f02e9 362 'PVOP' => '"', 'LOOP' => "{", 'COP' => ";", 'PADOP' => "#");
c99ca59a 363
8ec8fbef 364no warnings 'qw'; # "Possible attempt to put comments..."; use #7
35fc55f1 365my @linenoise =
366 qw'# () sc ( @? 1 $* gv *{ m$ m@ m% m? p/ *$ $ $# & a& pt \\ s\\ rf bl
c99ca59a 367 ` *? <> ?? ?/ r/ c/ // qr s/ /c y/ = @= C sC Cp sp df un BM po +1 +I
368 -1 -I 1+ I+ 1- I- ** * i* / i/ %$ i% x + i+ - i- . " << >> < i<
369 > i> <= i, >= i. == i= != i! <? i? s< s> s, s. s= s! s? b& b^ b| -0 -i
370 ! ~ a2 si cs rd sr e^ lg sq in %x %o ab le ss ve ix ri sf FL od ch cy
371 uf lf uc lc qm @ [f [ @[ eh vl ky dl ex % ${ @{ uk pk st jn ) )[ a@
372 a% sl +] -] [- [+ so rv GS GW MS MW .. f. .f && || ^^ ?: &= |= -> s{ s}
373 v} ca wa di rs ;; ; ;d }{ { } {} f{ it {l l} rt }l }n }r dm }g }e ^o
374 ^c ^| ^# um bm t~ u~ ~d DB db ^s se ^g ^r {w }w pf pr ^O ^K ^R ^W ^d ^v
375 ^e ^t ^k t. fc ic fl .s .p .b .c .l .a .h g1 s1 g2 s2 ?. l? -R -W -X -r
376 -w -x -e -o -O -z -s -M -A -C -S -c -b -f -d -p -l -u -g -k -t -T -B cd
377 co cr u. cm ut r. l@ s@ r@ mD uD oD rD tD sD wD cD f$ w$ p$ sh e$ k$ g3
378 g4 s4 g5 s5 T@ C@ L@ G@ A@ S@ Hg Hc Hr Hw Mg Mc Ms Mr Sg Sc So rq do {e
379 e} {t t} g6 G6 6e g7 G7 7e g8 G8 8e g9 G9 9e 6s 7s 8s 9s 6E 7E 8E 9E Pn
c27ea44e 380 Pu GP SP EP Gn Gg GG SG EG g0 c$ lk t$ ;s n> // /= CO';
c99ca59a 381
382my $chars = "0123456789abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ";
383
19e169bf 384sub op_flags { # common flags (see BASOP.op_flags in op.h)
c99ca59a 385 my($x) = @_;
386 my(@v);
387 push @v, "v" if ($x & 3) == 1;
388 push @v, "s" if ($x & 3) == 2;
389 push @v, "l" if ($x & 3) == 3;
390 push @v, "K" if $x & 4;
391 push @v, "P" if $x & 8;
392 push @v, "R" if $x & 16;
393 push @v, "M" if $x & 32;
394 push @v, "S" if $x & 64;
395 push @v, "*" if $x & 128;
396 return join("", @v);
397}
398
399sub base_n {
400 my $x = shift;
401 return "-" . base_n(-$x) if $x < 0;
402 my $str = "";
403 do { $str .= substr($chars, $x % $base, 1) } while $x = int($x / $base);
404 $str = reverse $str if $big_endian;
405 return $str;
406}
407
c27ea44e 408my %sequence_num;
409my $seq_max = 1;
410
f95e3c3c 411sub reset_sequence {
412 # reset the sequence
413 %sequence_num = ();
414 $seq_max = 1;
cc02ea56 415 $lastnext = 0;
f95e3c3c 416}
417
c27ea44e 418sub seq {
419 my($op) = @_;
420 return "-" if not exists $sequence_num{$$op};
421 return base_n($sequence_num{$$op});
422}
c99ca59a 423
424sub walk_topdown {
425 my($op, $sub, $level) = @_;
426 $sub->($op, $level);
427 if ($op->flags & OPf_KIDS) {
428 for (my $kid = $op->first; $$kid; $kid = $kid->sibling) {
429 walk_topdown($kid, $sub, $level + 1);
430 }
431 }
c0939cee 432 elsif (class($op) eq "PMOP") {
c6e79e55 433 my $maybe_root = $op->pmreplroot;
434 if (ref($maybe_root) and $maybe_root->isa("B::OP")) {
435 # It really is the root of the replacement, not something
436 # else stored here for lack of space elsewhere
437 walk_topdown($maybe_root, $sub, $level + 1);
438 }
c99ca59a 439 }
440}
441
442sub walklines {
443 my($ar, $level) = @_;
444 for my $l (@$ar) {
445 if (ref($l) eq "ARRAY") {
446 walklines($l, $level + 1);
447 } else {
448 $l->concise($level);
449 }
450 }
451}
452
453sub walk_exec {
454 my($top, $level) = @_;
455 my %opsseen;
456 my @lines;
457 my @todo = ([$top, \@lines]);
458 while (@todo and my($op, $targ) = @{shift @todo}) {
459 for (; $$op; $op = $op->next) {
460 last if $opsseen{$$op}++;
461 push @$targ, $op;
462 my $name = $op->name;
62e36f8a 463 if (class($op) eq "LOGOP") {
c99ca59a 464 my $ar = [];
465 push @$targ, $ar;
466 push @todo, [$op->other, $ar];
467 } elsif ($name eq "subst" and $ {$op->pmreplstart}) {
468 my $ar = [];
469 push @$targ, $ar;
470 push @todo, [$op->pmreplstart, $ar];
471 } elsif ($name =~ /^enter(loop|iter)$/) {
7252851f 472 if ($] > 5.009) {
473 $labels{${$op->nextop}} = "NEXT";
474 $labels{${$op->lastop}} = "LAST";
475 $labels{${$op->redoop}} = "REDO";
476 } else {
477 $labels{$op->nextop->seq} = "NEXT";
478 $labels{$op->lastop->seq} = "LAST";
479 $labels{$op->redoop->seq} = "REDO";
480 }
c99ca59a 481 }
482 }
483 }
484 walklines(\@lines, 0);
485}
486
c27ea44e 487# The structure of this routine is purposely modeled after op.c's peep()
488sub sequence {
489 my($op) = @_;
490 my $oldop = 0;
491 return if class($op) eq "NULL" or exists $sequence_num{$$op};
492 for (; $$op; $op = $op->next) {
493 last if exists $sequence_num{$$op};
494 my $name = $op->name;
495 if ($name =~ /^(null|scalar|lineseq|scope)$/) {
496 next if $oldop and $ {$op->next};
497 } else {
498 $sequence_num{$$op} = $seq_max++;
499 if (class($op) eq "LOGOP") {
500 my $other = $op->other;
501 $other = $other->next while $other->name eq "null";
502 sequence($other);
503 } elsif (class($op) eq "LOOP") {
504 my $redoop = $op->redoop;
505 $redoop = $redoop->next while $redoop->name eq "null";
506 sequence($redoop);
507 my $nextop = $op->nextop;
508 $nextop = $nextop->next while $nextop->name eq "null";
509 sequence($nextop);
510 my $lastop = $op->lastop;
511 $lastop = $lastop->next while $lastop->name eq "null";
512 sequence($lastop);
513 } elsif ($name eq "subst" and $ {$op->pmreplstart}) {
514 my $replstart = $op->pmreplstart;
515 $replstart = $replstart->next while $replstart->name eq "null";
516 sequence($replstart);
517 }
518 }
519 $oldop = $op;
520 }
521}
522
724aa791 523sub fmt_line { # generate text-line for op.
cc02ea56 524 my($hr, $op, $text, $level) = @_;
525
526 $_->($hr, $op, \$text, \$level, $stylename) for @callbacks;
527
724aa791 528 return '' if $hr->{SKIP}; # suppress line if a callback said so
cc02ea56 529 return '' if $hr->{goto} and $hr->{goto} eq '-'; # no goto nowhere
f95e3c3c 530
cc02ea56 531 # spec: (?(text1#varText2)?)
c99ca59a 532 $text =~ s/\(\?\(([^\#]*?)\#(\w+)([^\#]*?)\)\?\)/
f95e3c3c 533 $hr->{$2} ? $1.$hr->{$2}.$3 : ""/eg;
534
cc02ea56 535 # spec: (x(exec_text;basic_text)x)
c99ca59a 536 $text =~ s/\(x\((.*?);(.*?)\)x\)/$order eq "exec" ? $1 : $2/egs;
cc02ea56 537
538 # spec: (*(text)*)
c99ca59a 539 $text =~ s/\(\*\(([^;]*?)\)\*\)/$1 x $level/egs;
cc02ea56 540
541 # spec: (*(text1;text2)*)
c99ca59a 542 $text =~ s/\(\*\((.*?);(.*?)\)\*\)/$1 x ($level - 1) . $2 x ($level>0)/egs;
cc02ea56 543
544 # convert #Var to tag=>val form: Var\t#var
545 $text =~ s/\#([A-Z][a-z]+)(\d+)?/\t\u$1\t\L#$1$2/gs;
546
547 # spec: #varN
724aa791 548 $text =~ s/\#([a-zA-Z]+)(\d+)/sprintf("%-$2s", $hr->{$1})/eg;
549
cc02ea56 550 $text =~ s/\#([a-zA-Z]+)/$hr->{$1}/eg; # populate #var's
551 $text =~ s/[ \t]*~+[ \t]*/ /g; # squeeze tildes
f95e3c3c 552 chomp $text;
553 return "$text\n" if $text ne "";
554 return $text; # suppress empty lines
c99ca59a 555}
556
19e169bf 557our %priv; # used to display each opcode's BASEOP.op_private values
558
c99ca59a 559$priv{$_}{128} = "LVINTRO"
560 for ("pos", "substr", "vec", "threadsv", "gvsv", "rv2sv", "rv2hv", "rv2gv",
561 "rv2av", "rv2arylen", "aelem", "helem", "aslice", "hslice", "padsv",
241416b8 562 "padav", "padhv", "enteriter");
c99ca59a 563$priv{$_}{64} = "REFC" for ("leave", "leavesub", "leavesublv", "leavewrite");
564$priv{"aassign"}{64} = "COMMON";
4ac6efe6 565$priv{"aassign"}{32} = "PHASH" if $] < 5.009;
952306ac 566$priv{"sassign"}{32} = "STATE";
c99ca59a 567$priv{"sassign"}{64} = "BKWARD";
7abc42fc 568$priv{$_}{64} = "RTIME" for ("match", "subst", "substcont", "qr");
c99ca59a 569@{$priv{"trans"}}{1,2,4,8,16,64} = ("<UTF", ">UTF", "IDENT", "SQUASH", "DEL",
570 "COMPL", "GROWS");
571$priv{"repeat"}{64} = "DOLIST";
572$priv{"leaveloop"}{64} = "CONT";
573@{$priv{$_}}{32,64,96} = ("DREFAV", "DREFHV", "DREFSV")
314d4778 574 for (qw(rv2gv rv2sv padsv aelem helem));
a5911867 575$priv{$_}{16} = "STATE" for ("padav", "padhv", "padsv");
d4797c1d 576@{$priv{"entersub"}}{16,32,64} = ("DBG","TARG","NOMOD");
c99ca59a 577@{$priv{$_}}{4,8,128} = ("INARGS","AMPER","NO()") for ("entersub", "rv2cv");
578$priv{"gv"}{32} = "EARLYCV";
579$priv{"aelem"}{16} = $priv{"helem"}{16} = "LVDEFER";
241416b8 580$priv{$_}{16} = "OURINTR" for ("gvsv", "rv2sv", "rv2av", "rv2hv", "r2gv",
581 "enteriter");
c99ca59a 582$priv{$_}{16} = "TARGMY"
583 for (map(($_,"s$_"),"chop", "chomp"),
584 map(($_,"i_$_"), "postinc", "postdec", "multiply", "divide", "modulo",
585 "add", "subtract", "negate"), "pow", "concat", "stringify",
586 "left_shift", "right_shift", "bit_and", "bit_xor", "bit_or",
587 "complement", "atan2", "sin", "cos", "rand", "exp", "log", "sqrt",
588 "int", "hex", "oct", "abs", "length", "index", "rindex", "sprintf",
589 "ord", "chr", "crypt", "quotemeta", "join", "push", "unshift", "flock",
590 "chdir", "chown", "chroot", "unlink", "chmod", "utime", "rename",
591 "link", "symlink", "mkdir", "rmdir", "wait", "waitpid", "system",
592 "exec", "kill", "getppid", "getpgrp", "setpgrp", "getpriority",
593 "setpriority", "time", "sleep");
ef3e5ea9 594$priv{$_}{4} = "REVERSED" for ("enteriter", "iter");
d4797c1d 595@{$priv{"const"}}{4,8,16,32,64,128} = ("SHORT","STRICT","ENTERED",'$[',"BARE","WARN");
c99ca59a 596$priv{"flip"}{64} = $priv{"flop"}{64} = "LINENUM";
597$priv{"list"}{64} = "GUESSED";
598$priv{"delete"}{64} = "SLICE";
599$priv{"exists"}{64} = "SUB";
7b9ef140 600@{$priv{"sort"}}{1,2,4,8,16,32,64} = ("NUM", "INT", "REV", "INPLACE","DESC","QSORT","STABLE");
c99ca59a 601$priv{"threadsv"}{64} = "SVREFd";
c27ea44e 602@{$priv{$_}}{16,32,64,128} = ("INBIN","INCR","OUTBIN","OUTCR")
603 for ("open", "backtick");
c99ca59a 604$priv{"exit"}{128} = "VMS";
feaeca78 605$priv{$_}{2} = "FTACCESS"
606 for ("ftrread", "ftrwrite", "ftrexec", "fteread", "ftewrite", "fteexec");
7b9ef140 607$priv{"entereval"}{2} = "HAS_HH";
32454ac8 608if ($] >= 5.009) {
609 # Stacked filetests are post 5.8.x
610 $priv{$_}{4} = "FTSTACKED"
611 for ("ftrread", "ftrwrite", "ftrexec", "fteread", "ftewrite", "fteexec",
612 "ftis", "fteowned", "ftrowned", "ftzero", "ftsize", "ftmtime",
613 "ftatime", "ftctime", "ftsock", "ftchr", "ftblk", "ftfile", "ftdir",
614 "ftpipe", "ftlink", "ftsuid", "ftsgid", "ftsvtx", "fttty", "fttext",
615 "ftbinary");
616 # Lexical $_ is post 5.8.x
617 $priv{$_}{2} = "GREPLEX"
618 for ("mapwhile", "mapstart", "grepwhile", "grepstart");
619}
c99ca59a 620
621sub private_flags {
622 my($name, $x) = @_;
623 my @s;
624 for my $flag (128, 96, 64, 32, 16, 8, 4, 2, 1) {
625 if ($priv{$name}{$flag} and $x & $flag and $x >= $flag) {
626 $x -= $flag;
627 push @s, $priv{$name}{$flag};
628 }
629 }
630 push @s, $x if $x;
631 return join(",", @s);
632}
633
c27ea44e 634sub concise_sv {
2db5ca0a 635 my($sv, $hr, $preferpv) = @_;
c27ea44e 636 $hr->{svclass} = class($sv);
31b49ad4 637 $hr->{svclass} = "UV"
638 if $hr->{svclass} eq "IV" and $sv->FLAGS & SVf_IVisUV;
5b493bdf 639 Carp::cluck("bad concise_sv: $sv") unless $sv and $$sv;
c27ea44e 640 $hr->{svaddr} = sprintf("%#x", $$sv);
641 if ($hr->{svclass} eq "GV") {
642 my $gv = $sv;
643 my $stash = $gv->STASH->NAME;
644 if ($stash eq "main") {
645 $stash = "";
646 } else {
647 $stash = $stash . "::";
648 }
649 $hr->{svval} = "*$stash" . $gv->SAFENAME;
650 return "*$stash" . $gv->SAFENAME;
651 } else {
652 while (class($sv) eq "RV") {
653 $hr->{svval} .= "\\";
654 $sv = $sv->RV;
655 }
656 if (class($sv) eq "SPECIAL") {
40b5b14f 657 $hr->{svval} .= ["Null", "sv_undef", "sv_yes", "sv_no"]->[$$sv];
2db5ca0a 658 } elsif ($preferpv && $sv->FLAGS & SVf_POK) {
659 $hr->{svval} .= cstring($sv->PV);
c27ea44e 660 } elsif ($sv->FLAGS & SVf_NOK) {
40b5b14f 661 $hr->{svval} .= $sv->NV;
c27ea44e 662 } elsif ($sv->FLAGS & SVf_IOK) {
31b49ad4 663 $hr->{svval} .= $sv->int_value;
c27ea44e 664 } elsif ($sv->FLAGS & SVf_POK) {
40b5b14f 665 $hr->{svval} .= cstring($sv->PV);
31b49ad4 666 } elsif (class($sv) eq "HV") {
667 $hr->{svval} .= 'HASH';
c27ea44e 668 }
cc02ea56 669
670 $hr->{svval} = 'undef' unless defined $hr->{svval};
671 my $out = $hr->{svclass};
672 return $out .= " $hr->{svval}" ;
c27ea44e 673 }
674}
675
c99ca59a 676sub concise_op {
677 my ($op, $level, $format) = @_;
678 my %h;
679 $h{exname} = $h{name} = $op->name;
680 $h{NAME} = uc $h{name};
681 $h{class} = class($op);
682 $h{extarg} = $h{targ} = $op->targ;
683 $h{extarg} = "" unless $h{extarg};
684 if ($h{name} eq "null" and $h{targ}) {
8ec8fbef 685 # targ holds the old type
c99ca59a 686 $h{exname} = "ex-" . substr(ppname($h{targ}), 3);
687 $h{extarg} = "";
8ec8fbef 688 } elsif ($op->name =~ /^leave(sub(lv)?|write)?$/) {
689 # targ potentially holds a reference count
690 if ($op->private & 64) {
691 my $refs = "ref" . ($h{targ} != 1 ? "s" : "");
692 $h{targarglife} = $h{targarg} = "$h{targ} $refs";
693 }
c99ca59a 694 } elsif ($h{targ}) {
695 my $padname = (($curcv->PADLIST->ARRAY)[0]->ARRAY)[$h{targ}];
696 if (defined $padname and class($padname) ne "SPECIAL") {
0b40bd6d 697 $h{targarg} = $padname->PVX;
127212b2 698 if ($padname->FLAGS & SVf_FAKE) {
4ac6efe6 699 if ($] < 5.009) {
700 $h{targarglife} = "$h{targarg}:FAKE";
701 } else {
702 # These changes relate to the jumbo closure fix.
703 # See changes 19939 and 20005
704 my $fake = '';
705 $fake .= 'a' if $padname->IVX & 1; # PAD_FAKELEX_ANON
706 $fake .= 'm' if $padname->IVX & 2; # PAD_FAKELEX_MULTI
707 $fake .= ':' . $padname->NVX if $curcv->CvFLAGS & CVf_ANON;
708 $h{targarglife} = "$h{targarg}:FAKE:$fake";
709 }
127212b2 710 }
711 else {
712 my $intro = $padname->NVX - $cop_seq_base;
713 my $finish = int($padname->IVX) - $cop_seq_base;
714 $finish = "end" if $finish == 999999999 - $cop_seq_base;
715 $h{targarglife} = "$h{targarg}:$intro,$finish";
716 }
c99ca59a 717 } else {
718 $h{targarglife} = $h{targarg} = "t" . $h{targ};
719 }
720 }
721 $h{arg} = "";
722 $h{svclass} = $h{svaddr} = $h{svval} = "";
723 if ($h{class} eq "PMOP") {
724 my $precomp = $op->precomp;
7a9b44b9 725 if (defined $precomp) {
c27ea44e 726 $precomp = cstring($precomp); # Escape literal control sequences
727 $precomp = "/$precomp/";
728 } else {
729 $precomp = "";
7a9b44b9 730 }
b2a3cfdd 731 my $pmreplroot = $op->pmreplroot;
34a48b4b 732 my $pmreplstart;
c6e79e55 733 if (ref($pmreplroot) eq "B::GV") {
b2a3cfdd 734 # with C<@stash_array = split(/pat/, str);>,
c6e79e55 735 # *stash_array is stored in /pat/'s pmreplroot.
b2a3cfdd 736 $h{arg} = "($precomp => \@" . $pmreplroot->NAME . ")";
c6e79e55 737 } elsif (!ref($pmreplroot) and $pmreplroot) {
738 # same as the last case, except the value is actually a
739 # pad offset for where the GV is kept (this happens under
740 # ithreads)
741 my $gv = (($curcv->PADLIST->ARRAY)[1]->ARRAY)[$pmreplroot];
742 $h{arg} = "($precomp => \@" . $gv->NAME . ")";
b2a3cfdd 743 } elsif ($ {$op->pmreplstart}) {
c99ca59a 744 undef $lastnext;
745 $pmreplstart = "replstart->" . seq($op->pmreplstart);
746 $h{arg} = "(" . join(" ", $precomp, $pmreplstart) . ")";
747 } else {
748 $h{arg} = "($precomp)";
749 }
750 } elsif ($h{class} eq "PVOP" and $h{name} ne "trans") {
751 $h{arg} = '("' . $op->pv . '")';
752 $h{svval} = '"' . $op->pv . '"';
753 } elsif ($h{class} eq "COP") {
754 my $label = $op->label;
c3caa09d 755 $h{coplabel} = $label;
c99ca59a 756 $label = $label ? "$label: " : "";
757 my $loc = $op->file;
758 $loc =~ s[.*/][];
759 $loc .= ":" . $op->line;
760 my($stash, $cseq) = ($op->stash->NAME, $op->cop_seq - $cop_seq_base);
761 my $arybase = $op->arybase;
762 $arybase = $arybase ? ' $[=' . $arybase : "";
763 $h{arg} = "($label$stash $cseq $loc$arybase)";
764 } elsif ($h{class} eq "LOOP") {
765 $h{arg} = "(next->" . seq($op->nextop) . " last->" . seq($op->lastop)
766 . " redo->" . seq($op->redoop) . ")";
767 } elsif ($h{class} eq "LOGOP") {
768 undef $lastnext;
769 $h{arg} = "(other->" . seq($op->other) . ")";
5b493bdf 770 }
771 elsif ($h{class} eq "SVOP" or $h{class} eq "PADOP") {
6a077020 772 unless ($h{name} eq 'aelemfast' and $op->flags & OPf_SPECIAL) {
5b493bdf 773 my $idx = ($h{class} eq "SVOP") ? $op->targ : $op->padix;
2db5ca0a 774 my $preferpv = $h{name} eq "method_named";
5b493bdf 775 if ($h{class} eq "PADOP" or !${$op->sv}) {
776 my $sv = (($curcv->PADLIST->ARRAY)[1]->ARRAY)[$idx];
2db5ca0a 777 $h{arg} = "[" . concise_sv($sv, \%h, $preferpv) . "]";
6a077020 778 $h{targarglife} = $h{targarg} = "";
779 } else {
2db5ca0a 780 $h{arg} = "(" . concise_sv($op->sv, \%h, $preferpv) . ")";
6a077020 781 }
c99ca59a 782 }
783 }
784 $h{seq} = $h{hyphseq} = seq($op);
785 $h{seq} = "" if $h{seq} eq "-";
7252851f 786 if ($] > 5.009) {
787 $h{opt} = $op->opt;
788 $h{static} = $op->static;
789 $h{label} = $labels{$$op};
790 } else {
791 $h{seqnum} = $op->seq;
792 $h{label} = $labels{$op->seq};
793 }
c99ca59a 794 $h{next} = $op->next;
795 $h{next} = (class($h{next}) eq "NULL") ? "(end)" : seq($h{next});
796 $h{nextaddr} = sprintf("%#x", $ {$op->next});
797 $h{sibaddr} = sprintf("%#x", $ {$op->sibling});
798 $h{firstaddr} = sprintf("%#x", $ {$op->first}) if $op->can("first");
799 $h{lastaddr} = sprintf("%#x", $ {$op->last}) if $op->can("last");
800
801 $h{classsym} = $opclass{$h{class}};
802 $h{flagval} = $op->flags;
803 $h{flags} = op_flags($op->flags);
804 $h{privval} = $op->private;
805 $h{private} = private_flags($h{name}, $op->private);
806 $h{addr} = sprintf("%#x", $$op);
c99ca59a 807 $h{typenum} = $op->type;
808 $h{noise} = $linenoise[$op->type];
f95e3c3c 809
cc02ea56 810 return fmt_line(\%h, $op, $format, $level);
c99ca59a 811}
812
813sub B::OP::concise {
814 my($op, $level) = @_;
815 if ($order eq "exec" and $lastnext and $$lastnext != $$op) {
724aa791 816 # insert a 'goto' line
cc02ea56 817 my $synth = {"seq" => seq($lastnext), "class" => class($lastnext),
818 "addr" => sprintf("%#x", $$lastnext),
819 "goto" => seq($lastnext), # simplify goto '-' removal
820 };
821 print $walkHandle fmt_line($synth, $op, $gotofmt, $level+1);
c99ca59a 822 }
823 $lastnext = $op->next;
f95e3c3c 824 print $walkHandle concise_op($op, $level, $format);
c99ca59a 825}
826
31b49ad4 827# B::OP::terse (see Terse.pm) now just calls this
828sub b_terse {
829 my($op, $level) = @_;
830
831 # This isn't necessarily right, but there's no easy way to get
832 # from an OP to the right CV. This is a limitation of the
833 # ->terse() interface style, and there isn't much to do about
834 # it. In particular, we can die in concise_op if the main pad
835 # isn't long enough, or has the wrong kind of entries, compared to
836 # the pad a sub was compiled with. The fix for that would be to
837 # make a backwards compatible "terse" format that never even
838 # looked at the pad, just like the old B::Terse. I don't think
839 # that's worth the effort, though.
840 $curcv = main_cv unless $curcv;
841
842 if ($order eq "exec" and $lastnext and $$lastnext != $$op) {
724aa791 843 # insert a 'goto'
31b49ad4 844 my $h = {"seq" => seq($lastnext), "class" => class($lastnext),
845 "addr" => sprintf("%#x", $$lastnext)};
cc02ea56 846 print # $walkHandle
847 fmt_line($h, $op, $style{"terse"}[1], $level+1);
31b49ad4 848 }
849 $lastnext = $op->next;
cc02ea56 850 print # $walkHandle
851 concise_op($op, $level, $style{"terse"}[0]);
31b49ad4 852}
853
c99ca59a 854sub tree {
855 my $op = shift;
856 my $level = shift;
857 my $style = $tree_decorations[$tree_style];
858 my($space, $single, $kids, $kid, $nokid, $last, $lead, $size) = @$style;
859 my $name = concise_op($op, $level, $treefmt);
860 if (not $op->flags & OPf_KIDS) {
861 return $name . "\n";
862 }
863 my @lines;
864 for (my $kid = $op->first; $$kid; $kid = $kid->sibling) {
865 push @lines, tree($kid, $level+1);
866 }
867 my $i;
868 for ($i = $#lines; substr($lines[$i], 0, 1) eq " "; $i--) {
869 $lines[$i] = $space . $lines[$i];
870 }
871 if ($i > 0) {
872 $lines[$i] = $last . $lines[$i];
873 while ($i-- > 1) {
874 if (substr($lines[$i], 0, 1) eq " ") {
875 $lines[$i] = $nokid . $lines[$i];
876 } else {
f95e3c3c 877 $lines[$i] = $kid . $lines[$i];
c99ca59a 878 }
879 }
880 $lines[$i] = $kids . $lines[$i];
881 } else {
882 $lines[0] = $single . $lines[0];
883 }
884 return("$name$lead" . shift @lines,
885 map(" " x (length($name)+$size) . $_, @lines));
886}
887
213a1a26 888# *** Warning: fragile kludge ahead ***
889# Because the B::* modules run in the same interpreter as the code
2814eb74 890# they're compiling, their presence tends to distort the view we have of
891# the code we're looking at. In particular, perl gives sequence numbers
892# to COPs. If the program we're looking at were run on its own, this
893# would start at 1. Because all of B::Concise and all the modules it
894# uses are compiled first, though, by the time we get to the user's
895# program the sequence number is already pretty high, which could be
896# distracting if you're trying to tell OPs apart. Therefore we'd like to
897# subtract an offset from all the sequence numbers we display, to
898# restore the simpler view of the world. The trick is to know what that
899# offset will be, when we're still compiling B::Concise! If we
213a1a26 900# hardcoded a value, it would have to change every time B::Concise or
2814eb74 901# other modules we use do. To help a little, what we do here is compile
902# a little code at the end of the module, and compute the base sequence
903# number for the user's program as being a small offset later, so all we
904# have to worry about are changes in the offset.
7252851f 905
906# [For 5.8.x and earlier perl is generating sequence numbers for all ops,
907# and using them to reference labels]
908
909
213a1a26 910# When you say "perl -MO=Concise -e '$a'", the output should look like:
911
912# 4 <@> leave[t1] vKP/REFC ->(end)
913# 1 <0> enter ->2
914 #^ smallest OP sequence number should be 1
915# 2 <;> nextstate(main 1 -e:1) v ->3
916 # ^ smallest COP sequence number should be 1
917# - <1> ex-rv2sv vK/1 ->4
918# 3 <$> gvsv(*a) s ->4
919
c27ea44e 920# If the second of the marked numbers there isn't 1, it means you need
921# to update the corresponding magic number in the next line.
922# Remember, this needs to stay the last things in the module.
e69a2255 923
c27ea44e 924# Why is this different for MacOS? Does it matter?
8ec8fbef 925my $cop_seq_mnum = $^O eq 'MacOS' ? 12 : 11;
e69a2255 926$cop_seq_base = svref_2object(eval 'sub{0;}')->START->cop_seq + $cop_seq_mnum;
c99ca59a 927
9281;
929
930__END__
931
932=head1 NAME
933
934B::Concise - Walk Perl syntax tree, printing concise info about ops
935
936=head1 SYNOPSIS
937
938 perl -MO=Concise[,OPTIONS] foo.pl
939
78ad9108 940 use B::Concise qw(set_style add_callback);
941
c99ca59a 942=head1 DESCRIPTION
943
944This compiler backend prints the internal OPs of a Perl program's syntax
945tree in one of several space-efficient text formats suitable for debugging
946the inner workings of perl or other compiler backends. It can print OPs in
947the order they appear in the OP tree, in the order they will execute, or
948in a text approximation to their tree structure, and the format of the
3c4b39be 949information displayed is customizable. Its function is similar to that of
c99ca59a 950perl's B<-Dx> debugging flag or the B<B::Terse> module, but it is more
951sophisticated and flexible.
952
f8a679e6 953=head1 EXAMPLE
954
f9f861ec 955Here's two outputs (or 'renderings'), using the -exec and -basic
956(i.e. default) formatting conventions on the same code snippet.
19e169bf 957
958 % perl -MO=Concise,-exec -e '$a = $b + 42'
959 1 <0> enter
960 2 <;> nextstate(main 1 -e:1) v
961 3 <#> gvsv[*b] s
962 4 <$> const[IV 42] s
963 * 5 <2> add[t3] sK/2
964 6 <#> gvsv[*a] s
965 7 <2> sassign vKS/2
966 8 <@> leave[1 ref] vKP/REFC
967
f9f861ec 968In this -exec rendering, each opcode is executed in the order shown.
969The add opcode, marked with '*', is discussed in more detail.
19e169bf 970
971The 1st column is the op's sequence number, starting at 1, and is
f9f861ec 972displayed in base 36 by default. Here they're purely linear; the
973sequences are very helpful when looking at code with loops and
974branches.
19e169bf 975
976The symbol between angle brackets indicates the op's type, for
977example; <2> is a BINOP, <@> a LISTOP, and <#> is a PADOP, which is
978used in threaded perls. (see L</"OP class abbreviations">).
979
f9f861ec 980The opname, as in B<'add[t1]'>, may be followed by op-specific
19e169bf 981information in parentheses or brackets (ex B<'[t1]'>).
982
f9f861ec 983The op-flags (ex B<'sK/2'>) are described in (L</"OP flags
19e169bf 984abbreviations">).
f8a679e6 985
986 % perl -MO=Concise -e '$a = $b + 42'
8ec8fbef 987 8 <@> leave[1 ref] vKP/REFC ->(end)
f8a679e6 988 1 <0> enter ->2
989 2 <;> nextstate(main 1 -e:1) v ->3
990 7 <2> sassign vKS/2 ->8
19e169bf 991 * 5 <2> add[t1] sK/2 ->6
f8a679e6 992 - <1> ex-rv2sv sK/1 ->4
993 3 <$> gvsv(*b) s ->4
994 4 <$> const(IV 42) s ->5
995 - <1> ex-rv2sv sKRM*/1 ->7
996 6 <$> gvsv(*a) s ->7
997
19e169bf 998The default rendering is top-down, so they're not in execution order.
999This form reflects the way the stack is used to parse and evaluate
1000expressions; the add operates on the two terms below it in the tree.
f8a679e6 1001
19e169bf 1002Nullops appear as C<ex-opname>, where I<opname> is an op that has been
1003optimized away by perl. They're displayed with a sequence-number of
1004'-', because they are not executed (they don't appear in previous
1005example), they're printed here because they reflect the parse.
f8a679e6 1006
19e169bf 1007The arrow points to the sequence number of the next op; they're not
1008displayed in -exec mode, for obvious reasons.
f8a679e6 1009
19e169bf 1010Note that because this rendering was done on a non-threaded perl, the
1011PADOPs in the previous examples are now SVOPs, and some (but not all)
1012of the square brackets have been replaced by round ones. This is a
1013subtle feature to provide some visual distinction between renderings
1014on threaded and un-threaded perls.
f8a679e6 1015
f8a679e6 1016
c99ca59a 1017=head1 OPTIONS
1018
1019Arguments that don't start with a hyphen are taken to be the names of
8ec8fbef 1020subroutines to print the OPs of; if no such functions are specified,
1021the main body of the program (outside any subroutines, and not
19e169bf 1022including use'd or require'd files) is rendered. Passing C<BEGIN>,
8ec8fbef 1023C<CHECK>, C<INIT>, or C<END> will cause all of the corresponding
1024special blocks to be printed.
c99ca59a 1025
724aa791 1026Options affect how things are rendered (ie printed). They're presented
1027here by their visual effect, 1st being strongest. They're grouped
1028according to how they interrelate; within each group the options are
1029mutually exclusive (unless otherwise stated).
1030
1031=head2 Options for Opcode Ordering
1032
1033These options control the 'vertical display' of opcodes. The display
1034'order' is also called 'mode' elsewhere in this document.
1035
c99ca59a 1036=over 4
1037
1038=item B<-basic>
1039
1040Print OPs in the order they appear in the OP tree (a preorder
1041traversal, starting at the root). The indentation of each OP shows its
19e169bf 1042level in the tree, and the '->' at the end of the line indicates the
1043next opcode in execution order. This mode is the default, so the flag
1044is included simply for completeness.
c99ca59a 1045
1046=item B<-exec>
1047
1048Print OPs in the order they would normally execute (for the majority
1049of constructs this is a postorder traversal of the tree, ending at the
1050root). In most cases the OP that usually follows a given OP will
1051appear directly below it; alternate paths are shown by indentation. In
1052cases like loops when control jumps out of a linear path, a 'goto'
1053line is generated.
1054
1055=item B<-tree>
1056
1057Print OPs in a text approximation of a tree, with the root of the tree
1058at the left and 'left-to-right' order of children transformed into
1059'top-to-bottom'. Because this mode grows both to the right and down,
1060it isn't suitable for large programs (unless you have a very wide
1061terminal).
1062
724aa791 1063=back
1064
1065=head2 Options for Line-Style
1066
1067These options select the line-style (or just style) used to render
1068each opcode, and dictates what info is actually printed into each line.
1069
1070=over 4
1071
1072=item B<-concise>
1073
1074Use the author's favorite set of formatting conventions. This is the
1075default, of course.
1076
1077=item B<-terse>
1078
1079Use formatting conventions that emulate the output of B<B::Terse>. The
1080basic mode is almost indistinguishable from the real B<B::Terse>, and the
1081exec mode looks very similar, but is in a more logical order and lacks
1082curly brackets. B<B::Terse> doesn't have a tree mode, so the tree mode
1083is only vaguely reminiscent of B<B::Terse>.
1084
1085=item B<-linenoise>
1086
1087Use formatting conventions in which the name of each OP, rather than being
1088written out in full, is represented by a one- or two-character abbreviation.
1089This is mainly a joke.
1090
1091=item B<-debug>
1092
1093Use formatting conventions reminiscent of B<B::Debug>; these aren't
1094very concise at all.
1095
1096=item B<-env>
1097
1098Use formatting conventions read from the environment variables
1099C<B_CONCISE_FORMAT>, C<B_CONCISE_GOTO_FORMAT>, and C<B_CONCISE_TREE_FORMAT>.
1100
1101=back
1102
1103=head2 Options for tree-specific formatting
1104
1105=over 4
1106
c99ca59a 1107=item B<-compact>
1108
1109Use a tree format in which the minimum amount of space is used for the
1110lines connecting nodes (one character in most cases). This squeezes out
1111a few precious columns of screen real estate.
1112
1113=item B<-loose>
1114
1115Use a tree format that uses longer edges to separate OP nodes. This format
1116tends to look better than the compact one, especially in ASCII, and is
1117the default.
1118
1119=item B<-vt>
1120
1121Use tree connecting characters drawn from the VT100 line-drawing set.
1122This looks better if your terminal supports it.
1123
1124=item B<-ascii>
1125
1126Draw the tree with standard ASCII characters like C<+> and C<|>. These don't
1127look as clean as the VT100 characters, but they'll work with almost any
1128terminal (or the horizontal scrolling mode of less(1)) and are suitable
1129for text documentation or email. This is the default.
1130
724aa791 1131=back
c99ca59a 1132
724aa791 1133These are pairwise exclusive, i.e. compact or loose, vt or ascii.
1134
1135=head2 Options controlling sequence numbering
1136
1137=over 4
c99ca59a 1138
1139=item B<-base>I<n>
1140
1141Print OP sequence numbers in base I<n>. If I<n> is greater than 10, the
1142digit for 11 will be 'a', and so on. If I<n> is greater than 36, the digit
1143for 37 will be 'A', and so on until 62. Values greater than 62 are not
1144currently supported. The default is 36.
1145
1146=item B<-bigendian>
1147
1148Print sequence numbers with the most significant digit first. This is the
1149usual convention for Arabic numerals, and the default.
1150
1151=item B<-littleendian>
1152
724aa791 1153Print seqence numbers with the least significant digit first. This is
1154obviously mutually exclusive with bigendian.
c99ca59a 1155
724aa791 1156=back
c99ca59a 1157
724aa791 1158=head2 Other options
c99ca59a 1159
cc02ea56 1160These are pairwise exclusive.
1161
724aa791 1162=over 4
c99ca59a 1163
724aa791 1164=item B<-main>
c99ca59a 1165
724aa791 1166Include the main program in the output, even if subroutines were also
cc02ea56 1167specified. This rendering is normally suppressed when a subroutine
1168name or reference is given.
1169
1170=item B<-nomain>
1171
1172This restores the default behavior after you've changed it with '-main'
1173(it's not normally needed). If no subroutine name/ref is given, main is
1174rendered, regardless of this flag.
1175
1176=item B<-nobanner>
1177
1178Renderings usually include a banner line identifying the function name
1179or stringified subref. This suppresses the printing of the banner.
1180
1181TBC: Remove the stringified coderef; while it provides a 'cookie' for
1182each function rendered, the cookies used should be 1,2,3.. not a
1183random hex-address. It also complicates string comparison of two
1184different trees.
c99ca59a 1185
724aa791 1186=item B<-banner>
c99ca59a 1187
cc02ea56 1188restores default banner behavior.
1189
1190=item B<-banneris> => subref
1191
1192TBC: a hookpoint (and an option to set it) for a user-supplied
1193function to produce a banner appropriate for users needs. It's not
1194ideal, because the rendering-state variables, which are a natural
1195candidate for use in concise.t, are unavailable to the user.
c99ca59a 1196
724aa791 1197=back
c99ca59a 1198
724aa791 1199=head2 Option Stickiness
c99ca59a 1200
724aa791 1201If you invoke Concise more than once in a program, you should know that
1202the options are 'sticky'. This means that the options you provide in
1203the first call will be remembered for the 2nd call, unless you
1204re-specify or change them.
c99ca59a 1205
cc02ea56 1206=head1 ABBREVIATIONS
1207
1208The concise style uses symbols to convey maximum info with minimal
1209clutter (like hex addresses). With just a little practice, you can
1210start to see the flowers, not just the branches, in the trees.
1211
1212=head2 OP class abbreviations
1213
1214These symbols appear before the op-name, and indicate the
1215B:: namespace that represents the ops in your Perl code.
1216
1217 0 OP (aka BASEOP) An OP with no children
1218 1 UNOP An OP with one child
1219 2 BINOP An OP with two children
1220 | LOGOP A control branch OP
1221 @ LISTOP An OP that could have lots of children
1222 / PMOP An OP with a regular expression
1223 $ SVOP An OP with an SV
1224 " PVOP An OP with a string
1225 { LOOP An OP that holds pointers for a loop
1226 ; COP An OP that marks the start of a statement
1227 # PADOP An OP with a GV on the pad
1228
1229=head2 OP flags abbreviations
1230
19e169bf 1231OP flags are either public or private. The public flags alter the
1232behavior of each opcode in consistent ways, and are represented by 0
1233or more single characters.
cc02ea56 1234
1235 v OPf_WANT_VOID Want nothing (void context)
1236 s OPf_WANT_SCALAR Want single value (scalar context)
1237 l OPf_WANT_LIST Want list of any length (list context)
19e169bf 1238 Want is unknown
cc02ea56 1239 K OPf_KIDS There is a firstborn child.
1240 P OPf_PARENS This operator was parenthesized.
1241 (Or block needs explicit scope entry.)
1242 R OPf_REF Certified reference.
1243 (Return container, not containee).
1244 M OPf_MOD Will modify (lvalue).
1245 S OPf_STACKED Some arg is arriving on the stack.
1246 * OPf_SPECIAL Do something weird for this op (see op.h)
1247
19e169bf 1248Private flags, if any are set for an opcode, are displayed after a '/'
1249
1250 8 <@> leave[1 ref] vKP/REFC ->(end)
1251 7 <2> sassign vKS/2 ->8
1252
1253They're opcode specific, and occur less often than the public ones, so
1254they're represented by short mnemonics instead of single-chars; see
00baac8f 1255F<op.h> for gory details, or try this quick 2-liner:
19e169bf 1256
1257 $> perl -MB::Concise -de 1
1258 DB<1> |x \%B::Concise::priv
1259
c99ca59a 1260=head1 FORMATTING SPECIFICATIONS
1261
724aa791 1262For each line-style ('concise', 'terse', 'linenoise', etc.) there are
12633 format-specs which control how OPs are rendered.
1264
1265The first is the 'default' format, which is used in both basic and exec
1266modes to print all opcodes. The 2nd, goto-format, is used in exec
1267mode when branches are encountered. They're not real opcodes, and are
1268inserted to look like a closing curly brace. The tree-format is tree
1269specific.
1270
cc02ea56 1271When a line is rendered, the correct format-spec is copied and scanned
1272for the following items; data is substituted in, and other
1273manipulations like basic indenting are done, for each opcode rendered.
1274
1275There are 3 kinds of items that may be populated; special patterns,
1276#vars, and literal text, which is copied verbatim. (Yes, it's a set
1277of s///g steps.)
1278
1279=head2 Special Patterns
1280
1281These items are the primitives used to perform indenting, and to
1282select text from amongst alternatives.
c99ca59a 1283
1284=over 4
1285
1286=item B<(x(>I<exec_text>B<;>I<basic_text>B<)x)>
1287
1288Generates I<exec_text> in exec mode, or I<basic_text> in basic mode.
1289
1290=item B<(*(>I<text>B<)*)>
1291
1292Generates one copy of I<text> for each indentation level.
1293
1294=item B<(*(>I<text1>B<;>I<text2>B<)*)>
1295
1296Generates one fewer copies of I<text1> than the indentation level, followed
1297by one copy of I<text2> if the indentation level is more than 0.
1298
1299=item B<(?(>I<text1>B<#>I<var>I<Text2>B<)?)>
1300
1301If the value of I<var> is true (not empty or zero), generates the
1302value of I<var> surrounded by I<text1> and I<Text2>, otherwise
1303nothing.
1304
cc02ea56 1305=item B<~>
1306
1307Any number of tildes and surrounding whitespace will be collapsed to
1308a single space.
1309
1310=back
1311
1312=head2 # Variables
1313
1314These #vars represent opcode properties that you may want as part of
1315your rendering. The '#' is intended as a private sigil; a #var's
1316value is interpolated into the style-line, much like "read $this".
1317
1318These vars take 3 forms:
1319
1320=over 4
1321
c99ca59a 1322=item B<#>I<var>
1323
cc02ea56 1324A property named 'var' is assumed to exist for the opcodes, and is
1325interpolated into the rendering.
c99ca59a 1326
1327=item B<#>I<var>I<N>
1328
cc02ea56 1329Generates the value of I<var>, left justified to fill I<N> spaces.
1330Note that this means while you can have properties 'foo' and 'foo2',
1331you cannot render 'foo2', but you could with 'foo2a'. You would be
1332wise not to rely on this behavior going forward ;-)
c99ca59a 1333
cc02ea56 1334=item B<#>I<Var>
c99ca59a 1335
cc02ea56 1336This ucfirst form of #var generates a tag-value form of itself for
1337display; it converts '#Var' into a 'Var => #var' style, which is then
1338handled as described above. (Imp-note: #Vars cannot be used for
1339conditional-fills, because the => #var transform is done after the check
1340for #Var's value).
c99ca59a 1341
1342=back
1343
cc02ea56 1344The following variables are 'defined' by B::Concise; when they are
1345used in a style, their respective values are plugged into the
1346rendering of each opcode.
1347
1348Only some of these are used by the standard styles, the others are
1349provided for you to delve into optree mechanics, should you wish to
1350add a new style (see L</add_style> below) that uses them. You can
00baac8f 1351also add new ones using L</add_callback>.
c99ca59a 1352
1353=over 4
1354
1355=item B<#addr>
1356
cc02ea56 1357The address of the OP, in hexadecimal.
c99ca59a 1358
1359=item B<#arg>
1360
1361The OP-specific information of the OP (such as the SV for an SVOP, the
cc02ea56 1362non-local exit pointers for a LOOP, etc.) enclosed in parentheses.
c99ca59a 1363
1364=item B<#class>
1365
1366The B-determined class of the OP, in all caps.
1367
f8a679e6 1368=item B<#classsym>
c99ca59a 1369
1370A single symbol abbreviating the class of the OP.
1371
c3caa09d 1372=item B<#coplabel>
1373
1374The label of the statement or block the OP is the start of, if any.
1375
c99ca59a 1376=item B<#exname>
1377
1378The name of the OP, or 'ex-foo' if the OP is a null that used to be a foo.
1379
1380=item B<#extarg>
1381
1382The target of the OP, or nothing for a nulled OP.
1383
1384=item B<#firstaddr>
1385
19e169bf 1386The address of the OP's first child, in hexadecimal.
c99ca59a 1387
1388=item B<#flags>
1389
1390The OP's flags, abbreviated as a series of symbols.
1391
1392=item B<#flagval>
1393
1394The numeric value of the OP's flags.
1395
f8a679e6 1396=item B<#hyphseq>
c99ca59a 1397
1398The sequence number of the OP, or a hyphen if it doesn't have one.
1399
1400=item B<#label>
1401
1402'NEXT', 'LAST', or 'REDO' if the OP is a target of one of those in exec
1403mode, or empty otherwise.
1404
1405=item B<#lastaddr>
1406
19e169bf 1407The address of the OP's last child, in hexadecimal.
c99ca59a 1408
1409=item B<#name>
1410
1411The OP's name.
1412
1413=item B<#NAME>
1414
1415The OP's name, in all caps.
1416
1417=item B<#next>
1418
1419The sequence number of the OP's next OP.
1420
1421=item B<#nextaddr>
1422
19e169bf 1423The address of the OP's next OP, in hexadecimal.
c99ca59a 1424
1425=item B<#noise>
1426
c27ea44e 1427A one- or two-character abbreviation for the OP's name.
c99ca59a 1428
1429=item B<#private>
1430
1431The OP's private flags, rendered with abbreviated names if possible.
1432
1433=item B<#privval>
1434
1435The numeric value of the OP's private flags.
1436
1437=item B<#seq>
1438
2814eb74 1439The sequence number of the OP. Note that this is a sequence number
1440generated by B::Concise.
c99ca59a 1441
7252851f 1442=item B<#seqnum>
1443
14445.8.x and earlier only. 5.9 and later do not provide this.
1445
1446The real sequence number of the OP, as a regular number and not adjusted
1447to be relative to the start of the real program. (This will generally be
1448a fairly large number because all of B<B::Concise> is compiled before
1449your program is).
1450
2814eb74 1451=item B<#opt>
c99ca59a 1452
2814eb74 1453Whether or not the op has been optimised by the peephole optimiser.
1454
7252851f 1455Only available in 5.9 and later.
1456
2814eb74 1457=item B<#static>
1458
1459Whether or not the op is statically defined. This flag is used by the
1460B::C compiler backend and indicates that the op should not be freed.
c99ca59a 1461
7252851f 1462Only available in 5.9 and later.
1463
c99ca59a 1464=item B<#sibaddr>
1465
19e169bf 1466The address of the OP's next youngest sibling, in hexadecimal.
c99ca59a 1467
1468=item B<#svaddr>
1469
19e169bf 1470The address of the OP's SV, if it has an SV, in hexadecimal.
c99ca59a 1471
1472=item B<#svclass>
1473
1474The class of the OP's SV, if it has one, in all caps (e.g., 'IV').
1475
1476=item B<#svval>
1477
1478The value of the OP's SV, if it has one, in a short human-readable format.
1479
1480=item B<#targ>
1481
1482The numeric value of the OP's targ.
1483
1484=item B<#targarg>
1485
1486The name of the variable the OP's targ refers to, if any, otherwise the
1487letter t followed by the OP's targ in decimal.
1488
1489=item B<#targarglife>
1490
1491Same as B<#targarg>, but followed by the COP sequence numbers that delimit
1492the variable's lifetime (or 'end' for a variable in an open scope) for a
1493variable.
1494
1495=item B<#typenum>
1496
1497The numeric value of the OP's type, in decimal.
1498
1499=back
1500
f9f861ec 1501=head1 One-Liner Command tips
1502
1503=over 4
1504
1505=item perl -MO=Concise,bar foo.pl
1506
1507Renders only bar() from foo.pl. To see main, drop the ',bar'. To see
1508both, add ',-main'
1509
1510=item perl -MDigest::MD5=md5 -MO=Concise,md5 -e1
1511
1512Identifies md5 as an XS function. The export is needed so that BC can
1513find it in main.
1514
1515=item perl -MPOSIX -MO=Concise,_POSIX_ARG_MAX -e1
1516
1517Identifies _POSIX_ARG_MAX as a constant sub, optimized to an IV.
1518Although POSIX isn't entirely consistent across platforms, this is
1519likely to be present in virtually all of them.
1520
1521=item perl -MPOSIX -MO=Concise,a -e 'print _POSIX_SAVED_IDS'
1522
1523This renders a print statement, which includes a call to the function.
1524It's identical to rendering a file with a use call and that single
1525statement, except for the filename which appears in the nextstate ops.
1526
1527=item perl -MPOSIX -MO=Concise,a -e 'sub a{_POSIX_SAVED_IDS}'
1528
1529This is B<very> similar to previous, only the first two ops differ. This
1530subroutine rendering is more representative, insofar as a single main
1531program will have many subs.
1532
1533
1534
78ad9108 1535=head1 Using B::Concise outside of the O framework
1536
cc02ea56 1537The common (and original) usage of B::Concise was for command-line
1538renderings of simple code, as given in EXAMPLE. But you can also use
1539B<B::Concise> from your code, and call compile() directly, and
724aa791 1540repeatedly. By doing so, you can avoid the compile-time only
cc02ea56 1541operation of O.pm, and even use the debugger to step through
1542B::Concise::compile() itself.
f95e3c3c 1543
cc02ea56 1544Once you're doing this, you may alter Concise output by adding new
1545rendering styles, and by optionally adding callback routines which
1546populate new variables, if such were referenced from those (just
1547added) styles.
f95e3c3c 1548
724aa791 1549=head2 Example: Altering Concise Renderings
78ad9108 1550
1551 use B::Concise qw(set_style add_callback);
cc02ea56 1552 add_style($yourStyleName => $defaultfmt, $gotofmt, $treefmt);
78ad9108 1553 add_callback
f95e3c3c 1554 ( sub {
1555 my ($h, $op, $format, $level, $stylename) = @_;
78ad9108 1556 $h->{variable} = some_func($op);
cc02ea56 1557 });
1558 $walker = B::Concise::compile(@options,@subnames,@subrefs);
1559 $walker->();
78ad9108 1560
f95e3c3c 1561=head2 set_style()
1562
724aa791 1563B<set_style> accepts 3 arguments, and updates the three format-specs
1564comprising a line-style (basic-exec, goto, tree). It has one minor
1565drawback though; it doesn't register the style under a new name. This
1566can become an issue if you render more than once and switch styles.
1567Thus you may prefer to use add_style() and/or set_style_standard()
1568instead.
1569
1570=head2 set_style_standard($name)
1571
1572This restores one of the standard line-styles: C<terse>, C<concise>,
1573C<linenoise>, C<debug>, C<env>, into effect. It also accepts style
1574names previously defined with add_style().
f95e3c3c 1575
1576=head2 add_style()
78ad9108 1577
f95e3c3c 1578This subroutine accepts a new style name and three style arguments as
1579above, and creates, registers, and selects the newly named style. It is
1580an error to re-add a style; call set_style_standard() to switch between
1581several styles.
1582
f95e3c3c 1583=head2 add_callback()
1584
19e169bf 1585If your newly minted styles refer to any new #variables, you'll need
1586to define a callback subroutine that will populate (or modify) those
1587variables. They are then available for use in the style you've
1588chosen.
f95e3c3c 1589
1590The callbacks are called for each opcode visited by Concise, in the
1591same order as they are added. Each subroutine is passed five
1592parameters.
1593
1594 1. A hashref, containing the variable names and values which are
1595 populated into the report-line for the op
1596 2. the op, as a B<B::OP> object
1597 3. a reference to the format string
1598 4. the formatting (indent) level
1599 5. the selected stylename
78ad9108 1600
1601To define your own variables, simply add them to the hash, or change
1602existing values if you need to. The level and format are passed in as
1603references to scalars, but it is unlikely that they will need to be
1604changed or even used.
1605
724aa791 1606=head2 Running B::Concise::compile()
f95e3c3c 1607
1608B<compile> accepts options as described above in L</OPTIONS>, and
1609arguments, which are either coderefs, or subroutine names.
1610
cc02ea56 1611It constructs and returns a $treewalker coderef, which when invoked,
1612traverses, or walks, and renders the optrees of the given arguments to
1613STDOUT. You can reuse this, and can change the rendering style used
1614each time; thereafter the coderef renders in the new style.
f95e3c3c 1615
1616B<walk_output> lets you change the print destination from STDOUT to
19e169bf 1617another open filehandle, or into a string passed as a ref (unless
1618you've built perl with -Uuseperlio).
f95e3c3c 1619
cc02ea56 1620 my $walker = B::Concise::compile('-terse','aFuncName', \&aSubRef); # 1
f95e3c3c 1621 walk_output(\my $buf);
cc02ea56 1622 $walker->(); # 1 renders -terse
1623 set_style_standard('concise'); # 2
1624 $walker->(); # 2 renders -concise
1625 $walker->(@new); # 3 renders whatever
1626 print "3 different renderings: terse, concise, and @new: $buf\n";
1627
1628When $walker is called, it traverses the subroutines supplied when it
1629was created, and renders them using the current style. You can change
1630the style afterwards in several different ways:
1631
1632 1. call C<compile>, altering style or mode/order
1633 2. call C<set_style_standard>
1634 3. call $walker, passing @new options
1635
1636Passing new options to the $walker is the easiest way to change
1637amongst any pre-defined styles (the ones you add are automatically
1638recognized as options), and is the only way to alter rendering order
1639without calling compile again. Note however that rendering state is
1640still shared amongst multiple $walker objects, so they must still be
1641used in a coordinated manner.
f95e3c3c 1642
1643=head2 B::Concise::reset_sequence()
1644
1645This function (not exported) lets you reset the sequence numbers (note
1646that they're numbered arbitrarily, their goal being to be human
1647readable). Its purpose is mostly to support testing, i.e. to compare
1648the concise output from two identical anonymous subroutines (but
1649different instances). Without the reset, B::Concise, seeing that
1650they're separate optrees, generates different sequence numbers in
1651the output.
1652
1653=head2 Errors
1654
9a3b3024 1655Errors in rendering (non-existent function-name, non-existent coderef)
1656are written to the STDOUT, or wherever you've set it via
1657walk_output().
31b49ad4 1658
9a3b3024 1659Errors using the various *style* calls, and bad args to walk_output(),
1660result in die(). Use an eval if you wish to catch these errors and
1661continue processing.
78ad9108 1662
c99ca59a 1663=head1 AUTHOR
1664
31b49ad4 1665Stephen McCamant, E<lt>smcc@CSUA.Berkeley.EDUE<gt>.
c99ca59a 1666
1667=cut