Spaces:
Running
Running
# B::Deparse.pm | |
# Copyright (c) 1998-2000, 2002, 2003, 2004, 2005, 2006 Stephen McCamant. | |
# All rights reserved. | |
# This module is free software; you can redistribute and/or modify | |
# it under the same terms as Perl itself. | |
# This is based on the module of the same name by Malcolm Beattie, | |
# but essentially none of his code remains. | |
package B::Deparse; | |
use Carp; | |
use B qw(class main_root main_start main_cv svref_2object opnumber perlstring | |
OPf_WANT OPf_WANT_VOID OPf_WANT_SCALAR OPf_WANT_LIST | |
OPf_KIDS OPf_REF OPf_STACKED OPf_SPECIAL OPf_MOD OPf_PARENS | |
OPpLVAL_INTRO OPpOUR_INTRO OPpENTERSUB_AMPER OPpSLICE OPpKVSLICE | |
OPpCONST_BARE | |
OPpTRANS_SQUASH OPpTRANS_DELETE OPpTRANS_COMPLEMENT OPpTARGET_MY | |
OPpEXISTS_SUB OPpSORT_NUMERIC OPpSORT_INTEGER OPpREPEAT_DOLIST | |
OPpSORT_REVERSE OPpMULTIDEREF_EXISTS OPpMULTIDEREF_DELETE | |
OPpSPLIT_ASSIGN OPpSPLIT_LEX | |
OPpPADHV_ISKEYS OPpRV2HV_ISKEYS | |
OPpCONCAT_NESTED | |
OPpMULTICONCAT_APPEND OPpMULTICONCAT_STRINGIFY OPpMULTICONCAT_FAKE | |
OPpTRUEBOOL OPpINDEX_BOOLNEG | |
SVf_IOK SVf_NOK SVf_ROK SVf_POK SVpad_OUR SVf_FAKE SVs_RMG SVs_SMG | |
SVs_PADTMP SVpad_TYPED | |
CVf_METHOD CVf_LVALUE | |
PMf_KEEP PMf_GLOBAL PMf_CONTINUE PMf_EVAL PMf_ONCE | |
PMf_MULTILINE PMf_SINGLELINE PMf_FOLD PMf_EXTENDED PMf_EXTENDED_MORE | |
PADNAMEt_OUTER | |
MDEREF_reload | |
MDEREF_AV_pop_rv2av_aelem | |
MDEREF_AV_gvsv_vivify_rv2av_aelem | |
MDEREF_AV_padsv_vivify_rv2av_aelem | |
MDEREF_AV_vivify_rv2av_aelem | |
MDEREF_AV_padav_aelem | |
MDEREF_AV_gvav_aelem | |
MDEREF_HV_pop_rv2hv_helem | |
MDEREF_HV_gvsv_vivify_rv2hv_helem | |
MDEREF_HV_padsv_vivify_rv2hv_helem | |
MDEREF_HV_vivify_rv2hv_helem | |
MDEREF_HV_padhv_helem | |
MDEREF_HV_gvhv_helem | |
MDEREF_ACTION_MASK | |
MDEREF_INDEX_none | |
MDEREF_INDEX_const | |
MDEREF_INDEX_padsv | |
MDEREF_INDEX_gvsv | |
MDEREF_INDEX_MASK | |
MDEREF_FLAG_last | |
MDEREF_MASK | |
MDEREF_SHIFT | |
); | |
$VERSION = '1.56'; | |
use strict; | |
our $AUTOLOAD; | |
use warnings (); | |
require feature; | |
use Config; | |
BEGIN { | |
# List version-specific constants here. | |
# Easiest way to keep this code portable between version looks to | |
# be to fake up a dummy constant that will never actually be true. | |
foreach (qw(OPpSORT_INPLACE OPpSORT_DESCEND OPpITER_REVERSED OPpCONST_NOVER | |
OPpPAD_STATE PMf_SKIPWHITE RXf_SKIPWHITE | |
PMf_CHARSET PMf_KEEPCOPY PMf_NOCAPTURE CVf_ANONCONST | |
CVf_LOCKED OPpREVERSE_INPLACE OPpSUBSTR_REPL_FIRST | |
PMf_NONDESTRUCT OPpEVAL_BYTES | |
OPpLVREF_TYPE OPpLVREF_SV OPpLVREF_AV OPpLVREF_HV | |
OPpLVREF_CV OPpLVREF_ELEM SVpad_STATE)) { | |
eval { B->import($_) }; | |
no strict 'refs'; | |
*{$_} = sub () {0} unless *{$_}{CODE}; | |
} | |
} | |
# Todo: | |
# (See also BUGS section at the end of this file) | |
# | |
# - finish tr/// changes | |
# - add option for even more parens (generalize \&foo change) | |
# - left/right context | |
# - copy comments (look at real text with $^P?) | |
# - avoid semis in one-statement blocks | |
# - associativity of &&=, ||=, ?: | |
# - ',' => '=>' (auto-unquote?) | |
# - break long lines ("\r" as discretionary break?) | |
# - configurable syntax highlighting: ANSI color, HTML, TeX, etc. | |
# - more style options: brace style, hex vs. octal, quotes, ... | |
# - print big ints as hex/octal instead of decimal (heuristic?) | |
# - handle 'my $x if 0'? | |
# - version using op_next instead of op_first/sibling? | |
# - avoid string copies (pass arrays, one big join?) | |
# - here-docs? | |
# Current test.deparse failures | |
# comp/hints 6 - location of BEGIN blocks wrt. block openings | |
# run/switchI 1 - missing -I switches entirely | |
# perl -Ifoo -e 'print @INC' | |
# op/caller 2 - warning mask propagates backwards before warnings::register | |
# 'use warnings; BEGIN {${^WARNING_BITS} eq "U"x12;} use warnings::register' | |
# op/getpid 2 - can't assign to shared my() declaration (threads only) | |
# 'my $x : shared = 5' | |
# op/override 7 - parens on overridden require change v-string interpretation | |
# 'BEGIN{*CORE::GLOBAL::require=sub {}} require v5.6' | |
# c.f. 'BEGIN { *f = sub {0} }; f 2' | |
# op/pat 774 - losing Unicode-ness of Latin1-only strings | |
# 'use charnames ":short"; $x="\N{latin:a with acute}"' | |
# op/recurse 12 - missing parens on recursive call makes it look like method | |
# 'sub f { f($x) }' | |
# op/subst 90 - inconsistent handling of utf8 under "use utf8" | |
# op/taint 29 - "use re 'taint'" deparsed in the wrong place wrt. block open | |
# op/tiehandle compile - "use strict" deparsed in the wrong place | |
# uni/tr_ several | |
# ext/B/t/xref 11 - line numbers when we add newlines to one-line subs | |
# ext/Data/Dumper/t/dumper compile | |
# ext/DB_file/several | |
# ext/Encode/several | |
# ext/Ernno/Errno warnings | |
# ext/IO/lib/IO/t/io_sel 23 | |
# ext/PerlIO/t/encoding compile | |
# ext/POSIX/t/posix 6 | |
# ext/Socket/Socket 8 | |
# ext/Storable/t/croak compile | |
# lib/Attribute/Handlers/t/multi compile | |
# lib/bignum/ several | |
# lib/charnames 35 | |
# lib/constant 32 | |
# lib/English 40 | |
# lib/ExtUtils/t/bytes 4 | |
# lib/File/DosGlob compile | |
# lib/Filter/Simple/t/data 1 | |
# lib/Math/BigInt/t/constant 1 | |
# lib/Net/t/config Deparse-warning | |
# lib/overload compile | |
# lib/Switch/ several | |
# lib/Symbol 4 | |
# lib/Test/Simple several | |
# lib/Term/Complete | |
# lib/Tie/File/t/29_downcopy 5 | |
# lib/vars 22 | |
# Object fields: | |
# | |
# in_coderef2text: | |
# True when deparsing via $deparse->coderef2text; false when deparsing the | |
# main program. | |
# | |
# avoid_local: | |
# (local($a), local($b)) and local($a, $b) have the same internal | |
# representation but the short form looks better. We notice we can | |
# use a large-scale local when checking the list, but need to prevent | |
# individual locals too. This hash holds the addresses of OPs that | |
# have already had their local-ness accounted for. The same thing | |
# is done with my(). | |
# | |
# curcv: | |
# CV for current sub (or main program) being deparsed | |
# | |
# curcvlex: | |
# Cached hash of lexical variables for curcv: keys are | |
# names prefixed with "m" or "o" (representing my/our), and | |
# each value is an array with two elements indicating the cop_seq | |
# of scopes in which a var of that name is valid and a third ele- | |
# ment referencing the pad name. | |
# | |
# curcop: | |
# COP for statement being deparsed | |
# | |
# curstash: | |
# name of the current package for deparsed code | |
# | |
# subs_todo: | |
# array of [cop_seq, CV, is_format?, name] for subs and formats we still | |
# want to deparse. The fourth element is a pad name thingy for lexical | |
# subs or a string for special blocks. For other subs, it is undef. For | |
# lexical subs, CV may be undef, indicating a stub declaration. | |
# | |
# protos_todo: | |
# as above, but [name, prototype] for subs that never got a GV | |
# | |
# subs_done, forms_done: | |
# keys are addresses of GVs for subs and formats we've already | |
# deparsed (or at least put into subs_todo) | |
# | |
# subs_declared | |
# keys are names of subs for which we've printed declarations. | |
# That means we can omit parentheses from the arguments. It also means we | |
# need to put CORE:: on core functions of the same name. | |
# | |
# in_subst_repl | |
# True when deparsing the replacement part of a substitution. | |
# | |
# in_refgen | |
# True when deparsing the argument to \. | |
# | |
# parens: -p | |
# linenums: -l | |
# unquote: -q | |
# cuddle: ' ' or '\n', depending on -sC | |
# indent_size: -si | |
# use_tabs: -sT | |
# ex_const: -sv | |
# A little explanation of how precedence contexts and associativity | |
# work: | |
# | |
# deparse() calls each per-op subroutine with an argument $cx (short | |
# for context, but not the same as the cx* in the perl core), which is | |
# a number describing the op's parents in terms of precedence, whether | |
# they're inside an expression or at statement level, etc. (see | |
# chart below). When ops with children call deparse on them, they pass | |
# along their precedence. Fractional values are used to implement | |
# associativity ('($x + $y) + $z' => '$x + $y + $y') and related | |
# parentheses hacks. The major disadvantage of this scheme is that | |
# it doesn't know about right sides and left sides, so say if you | |
# assign a listop to a variable, it can't tell it's allowed to leave | |
# the parens off the listop. | |
# Precedences: | |
# 26 [TODO] inside interpolation context ("") | |
# 25 left terms and list operators (leftward) | |
# 24 left -> | |
# 23 nonassoc ++ -- | |
# 22 right ** | |
# 21 right ! ~ \ and unary + and - | |
# 20 left =~ !~ | |
# 19 left * / % x | |
# 18 left + - . | |
# 17 left << >> | |
# 16 nonassoc named unary operators | |
# 15 nonassoc < > <= >= lt gt le ge | |
# 14 nonassoc == != <=> eq ne cmp | |
# 13 left & | |
# 12 left | ^ | |
# 11 left && | |
# 10 left || | |
# 9 nonassoc .. ... | |
# 8 right ?: | |
# 7 right = += -= *= etc. | |
# 6 left , => | |
# 5 nonassoc list operators (rightward) | |
# 4 right not | |
# 3 left and | |
# 2 left or xor | |
# 1 statement modifiers | |
# 0.5 statements, but still print scopes as do { ... } | |
# 0 statement level | |
# -1 format body | |
# Nonprinting characters with special meaning: | |
# \cS - steal parens (see maybe_parens_unop) | |
# \n - newline and indent | |
# \t - increase indent | |
# \b - decrease indent ('outdent') | |
# \f - flush left (no indent) | |
# \cK - kill following semicolon, if any | |
# Semicolon handling: | |
# - Individual statements are not deparsed with trailing semicolons. | |
# (If necessary, \cK is tacked on to the end.) | |
# - Whatever code joins statements together or emits them (lineseq, | |
# scopeop, deparse_root) is responsible for adding semicolons where | |
# necessary. | |
# - use statements are deparsed with trailing semicolons because they are | |
# immediately concatenated with the following statement. | |
# - indent() removes semicolons wherever it sees \cK. | |
BEGIN { for (qw[ const stringify rv2sv list glob pushmark null aelem | |
kvaslice kvhslice padsv argcheck | |
nextstate dbstate rv2av rv2hv helem custom ]) { | |
eval "sub OP_\U$_ () { " . opnumber($_) . "}" | |
}} | |
# _pessimise_walk(): recursively walk the optree of a sub, | |
# possibly undoing optimisations along the way. | |
sub DEBUG { 0 } | |
use if DEBUG, 'Data::Dumper'; | |
sub _pessimise_walk { | |
my ($self, $startop) = @_; | |
return unless $$startop; | |
my ($op, $prevop); | |
for ($op = $startop; $$op; $prevop = $op, $op = $op->sibling) { | |
my $ppname = $op->name; | |
# pessimisations start here | |
if ($ppname eq "padrange") { | |
# remove PADRANGE: | |
# the original optimisation either (1) changed this: | |
# pushmark -> (various pad and list and null ops) -> the_rest | |
# or (2), for the = @_ case, changed this: | |
# pushmark -> gv[_] -> rv2av -> (pad stuff) -> the_rest | |
# into this: | |
# padrange ----------------------------------------> the_rest | |
# so we just need to convert the padrange back into a | |
# pushmark, and in case (1), set its op_next to op_sibling, | |
# which is the head of the original chain of optimised-away | |
# pad ops, or for (2), set it to sibling->first, which is | |
# the original gv[_]. | |
$B::overlay->{$$op} = { | |
type => OP_PUSHMARK, | |
name => 'pushmark', | |
private => ($op->private & OPpLVAL_INTRO), | |
}; | |
} | |
# pessimisations end here | |
if (class($op) eq 'PMOP') { | |
if (ref($op->pmreplroot) | |
&& ${$op->pmreplroot} | |
&& $op->pmreplroot->isa( 'B::OP' )) | |
{ | |
$self-> _pessimise_walk($op->pmreplroot); | |
} | |
# pessimise any /(?{...})/ code blocks | |
my ($re, $cv); | |
my $code_list = $op->code_list; | |
if ($$code_list) { | |
$self->_pessimise_walk($code_list); | |
} | |
elsif (${$re = $op->pmregexp} && ${$cv = $re->qr_anoncv}) { | |
$code_list = $cv->ROOT # leavesub | |
->first # qr | |
->code_list; # list | |
$self->_pessimise_walk($code_list); | |
} | |
} | |
if ($op->flags & OPf_KIDS) { | |
$self-> _pessimise_walk($op->first); | |
} | |
} | |
} | |
# _pessimise_walk_exe(): recursively walk the op_next chain of a sub, | |
# possibly undoing optimisations along the way. | |
sub _pessimise_walk_exe { | |
my ($self, $startop, $visited) = @_; | |
no warnings 'recursion'; | |
return unless $$startop; | |
return if $visited->{$$startop}; | |
my ($op, $prevop); | |
for ($op = $startop; $$op; $prevop = $op, $op = $op->next) { | |
last if $visited->{$$op}; | |
$visited->{$$op} = 1; | |
my $ppname = $op->name; | |
if ($ppname =~ | |
/^((and|d?or)(assign)?|(map|grep)while|range|cond_expr|once)$/ | |
# entertry is also a logop, but its op_other invariably points | |
# into the same chain as the main execution path, so we skip it | |
) { | |
$self->_pessimise_walk_exe($op->other, $visited); | |
} | |
elsif ($ppname eq "subst") { | |
$self->_pessimise_walk_exe($op->pmreplstart, $visited); | |
} | |
elsif ($ppname =~ /^(enter(loop|iter))$/) { | |
# redoop and nextop will already be covered by the main block | |
# of the loop | |
$self->_pessimise_walk_exe($op->lastop, $visited); | |
} | |
# pessimisations start here | |
} | |
} | |
# Go through an optree and "remove" some optimisations by using an | |
# overlay to selectively modify or un-null some ops. Deparsing in the | |
# absence of those optimisations is then easier. | |
# | |
# Note that older optimisations are not removed, as Deparse was already | |
# written to recognise them before the pessimise/overlay system was added. | |
sub pessimise { | |
my ($self, $root, $start) = @_; | |
no warnings 'recursion'; | |
# walk tree in root-to-branch order | |
$self->_pessimise_walk($root); | |
my %visited; | |
# walk tree in execution order | |
$self->_pessimise_walk_exe($start, \%visited); | |
} | |
sub null { | |
my $op = shift; | |
return class($op) eq "NULL"; | |
} | |
# Add a CV to the list of subs that still need deparsing. | |
sub todo { | |
my $self = shift; | |
my($cv, $is_form, $name) = @_; | |
my $cvfile = $cv->FILE//''; | |
return unless ($cvfile eq $0 || exists $self->{files}{$cvfile}); | |
my $seq; | |
if ($cv->OUTSIDE_SEQ) { | |
$seq = $cv->OUTSIDE_SEQ; | |
} elsif (!null($cv->START) and is_state($cv->START)) { | |
$seq = $cv->START->cop_seq; | |
} else { | |
$seq = 0; | |
} | |
my $stash = $cv->STASH; | |
if (class($stash) eq 'HV') { | |
$self->{packs}{$stash->NAME}++; | |
} | |
push @{$self->{'subs_todo'}}, [$seq, $cv, $is_form, $name]; | |
} | |
# Pop the next sub from the todo list and deparse it | |
sub next_todo { | |
my $self = shift; | |
my $ent = shift @{$self->{'subs_todo'}}; | |
my ($seq, $cv, $is_form, $name) = @$ent; | |
# any 'use strict; package foo' that should come before the sub | |
# declaration to sync with the first COP of the sub | |
my $pragmata = ''; | |
if ($cv and !null($cv->START) and is_state($cv->START)) { | |
$pragmata = $self->pragmata($cv->START); | |
} | |
if (ref $name) { # lexical sub | |
# emit the sub. | |
my @text; | |
my $flags = $name->FLAGS; | |
push @text, | |
!$cv || $seq <= $name->COP_SEQ_RANGE_LOW | |
? $self->keyword($flags & SVpad_OUR | |
? "our" | |
: $flags & SVpad_STATE | |
? "state" | |
: "my") . " " | |
: ""; | |
# XXX We would do $self->keyword("sub"), but ‘my CORE::sub’ | |
# doesn’t work and ‘my sub’ ignores a &sub in scope. I.e., | |
# we have a core bug here. | |
push @text, "sub " . substr $name->PVX, 1; | |
if ($cv) { | |
# my sub foo { } | |
push @text, " " . $self->deparse_sub($cv); | |
$text[-1] =~ s/ ;$/;/; | |
} | |
else { | |
# my sub foo; | |
push @text, ";\n"; | |
} | |
return $pragmata . join "", @text; | |
} | |
my $gv = $cv->GV; | |
$name //= $self->gv_name($gv); | |
if ($is_form) { | |
return $pragmata . $self->keyword("format") . " $name =\n" | |
. $self->deparse_format($cv). "\n"; | |
} else { | |
my $use_dec; | |
if ($name eq "BEGIN") { | |
$use_dec = $self->begin_is_use($cv); | |
if (defined ($use_dec) and $self->{'expand'} < 5) { | |
return $pragmata if 0 == length($use_dec); | |
# XXX bit of a hack: Test::More's use_ok() method | |
# builds a fake use statement which deparses as, e.g. | |
# use Net::Ping (@{$args[0];}); | |
# As well as being superfluous (the use_ok() is deparsed | |
# too) and ugly, it fails under use strict and otherwise | |
# makes use of a lexical var that's not in scope. | |
# So strip it out. | |
return $pragmata | |
if $use_dec =~ | |
m/ | |
\A | |
use \s \S+ \s \(\@\{ | |
( | |
\s*\#line\ \d+\ \".*"\s* | |
)? | |
\$args\[0\];\}\); | |
\n | |
\Z | |
/x; | |
$use_dec =~ s/^(use|no)\b/$self->keyword($1)/e; | |
} | |
} | |
my $l = ''; | |
if ($self->{'linenums'}) { | |
my $line = $gv->LINE; | |
my $file = $gv->FILE; | |
$l = "\n\f#line $line \"$file\"\n"; | |
} | |
my $p = ''; | |
my $stash; | |
if (class($cv->STASH) ne "SPECIAL") { | |
$stash = $cv->STASH->NAME; | |
if ($stash ne $self->{'curstash'}) { | |
$p = $self->keyword("package") . " $stash;\n"; | |
$name = "$self->{'curstash'}::$name" unless $name =~ /::/; | |
$self->{'curstash'} = $stash; | |
} | |
} | |
if ($use_dec) { | |
return "$pragmata$p$l$use_dec"; | |
} | |
if ( $name !~ /::/ and $self->lex_in_scope("&$name") | |
|| $self->lex_in_scope("&$name", 1) ) | |
{ | |
$name = "$self->{'curstash'}::$name"; | |
} elsif (defined $stash) { | |
$name =~ s/^\Q$stash\E::(?!\z|.*::)//; | |
} | |
my $ret = "$pragmata${p}${l}" . $self->keyword("sub") . " $name " | |
. $self->deparse_sub($cv); | |
$self->{'subs_declared'}{$name} = 1; | |
return $ret; | |
} | |
} | |
# Return a "use" declaration for this BEGIN block, if appropriate | |
sub begin_is_use { | |
my ($self, $cv) = @_; | |
my $root = $cv->ROOT; | |
local @$self{qw'curcv curcvlex'} = ($cv); | |
local $B::overlay = {}; | |
$self->pessimise($root, $cv->START); | |
#require B::Debug; | |
#B::walkoptree($cv->ROOT, "debug"); | |
my $lineseq = $root->first; | |
return if $lineseq->name ne "lineseq"; | |
my $req_op = $lineseq->first->sibling; | |
return if $req_op->name ne "require"; | |
# maybe it's C<require expr> rather than C<require 'foo'> | |
return if ($req_op->first->name ne 'const'); | |
my $module; | |
if ($req_op->first->private & OPpCONST_BARE) { | |
# Actually it should always be a bareword | |
$module = $self->const_sv($req_op->first)->PV; | |
$module =~ s[/][::]g; | |
$module =~ s/.pm$//; | |
} | |
else { | |
$module = $self->const($self->const_sv($req_op->first), 6); | |
} | |
my $version; | |
my $version_op = $req_op->sibling; | |
return if class($version_op) eq "NULL"; | |
if ($version_op->name eq "lineseq") { | |
# We have a version parameter; skip nextstate & pushmark | |
my $constop = $version_op->first->next->next; | |
return unless $self->const_sv($constop)->PV eq $module; | |
$constop = $constop->sibling; | |
$version = $self->const_sv($constop); | |
if (class($version) eq "IV") { | |
$version = $version->int_value; | |
} elsif (class($version) eq "NV") { | |
$version = $version->NV; | |
} elsif (class($version) ne "PVMG") { | |
# Includes PVIV and PVNV | |
$version = $version->PV; | |
} else { | |
# version specified as a v-string | |
$version = 'v'.join '.', map ord, split //, $version->PV; | |
} | |
$constop = $constop->sibling; | |
return if $constop->name ne "method_named"; | |
return if $self->meth_sv($constop)->PV ne "VERSION"; | |
} | |
$lineseq = $version_op->sibling; | |
return if $lineseq->name ne "lineseq"; | |
my $entersub = $lineseq->first->sibling; | |
if ($entersub->name eq "stub") { | |
return "use $module $version ();\n" if defined $version; | |
return "use $module ();\n"; | |
} | |
return if $entersub->name ne "entersub"; | |
# See if there are import arguments | |
my $args = ''; | |
my $svop = $entersub->first->sibling; # Skip over pushmark | |
return unless $self->const_sv($svop)->PV eq $module; | |
# Pull out the arguments | |
for ($svop=$svop->sibling; index($svop->name, "method_") != 0; | |
$svop = $svop->sibling) { | |
$args .= ", " if length($args); | |
$args .= $self->deparse($svop, 6); | |
} | |
my $use = 'use'; | |
my $method_named = $svop; | |
return if $method_named->name ne "method_named"; | |
my $method_name = $self->meth_sv($method_named)->PV; | |
if ($method_name eq "unimport") { | |
$use = 'no'; | |
} | |
# Certain pragmas are dealt with using hint bits, | |
# so we ignore them here | |
if ($module eq 'strict' || $module eq 'integer' | |
|| $module eq 'bytes' || $module eq 'warnings' | |
|| $module eq 'feature') { | |
return ""; | |
} | |
if (defined $version && length $args) { | |
return "$use $module $version ($args);\n"; | |
} elsif (defined $version) { | |
return "$use $module $version;\n"; | |
} elsif (length $args) { | |
return "$use $module ($args);\n"; | |
} else { | |
return "$use $module;\n"; | |
} | |
} | |
sub stash_subs { | |
my ($self, $pack, $seen) = @_; | |
my (@ret, $stash); | |
if (!defined $pack) { | |
$pack = ''; | |
$stash = \%::; | |
} | |
else { | |
$pack =~ s/(::)?$/::/; | |
no strict 'refs'; | |
$stash = \%{"main::$pack"}; | |
} | |
return | |
if ($seen ||= {})->{ | |
$INC{"overload.pm"} ? overload::StrVal($stash) : $stash | |
}++; | |
my $stashobj = svref_2object($stash); | |
my %stash = $stashobj->ARRAY; | |
while (my ($key, $val) = each %stash) { | |
my $flags = $val->FLAGS; | |
if ($flags & SVf_ROK) { | |
# A reference. Dump this if it is a reference to a CV. If it | |
# is a constant acting as a proxy for a full subroutine, then | |
# we may or may not have to dump it. If some form of perl- | |
# space visible code must have created it, be it a use | |
# statement, or some direct symbol-table manipulation code that | |
# we will deparse, then we don’t want to dump it. If it is the | |
# result of a declaration like sub f () { 42 } then we *do* | |
# want to dump it. The only way to distinguish these seems | |
# to be the SVs_PADTMP flag on the constant, which is admit- | |
# tedly a hack. | |
my $class = class(my $referent = $val->RV); | |
if ($class eq "CV") { | |
$self->todo($referent, 0); | |
} elsif ( | |
$class !~ /^(AV|HV|CV|FM|IO|SPECIAL)\z/ | |
# A more robust way to write that would be this, but B does | |
# not provide the SVt_ constants: | |
# ($referent->FLAGS & B::SVTYPEMASK) < B::SVt_PVAV | |
and $referent->FLAGS & SVs_PADTMP | |
) { | |
push @{$self->{'protos_todo'}}, [$pack . $key, $val]; | |
} | |
} elsif ($flags & (SVf_POK|SVf_IOK)) { | |
# Just a prototype. As an ugly but fairly effective way | |
# to find out if it belongs here is to see if the AUTOLOAD | |
# (if any) for the stash was defined in one of our files. | |
my $A = $stash{"AUTOLOAD"}; | |
if (defined ($A) && class($A) eq "GV" && defined($A->CV) | |
&& class($A->CV) eq "CV") { | |
my $AF = $A->FILE; | |
next unless $AF eq $0 || exists $self->{'files'}{$AF}; | |
} | |
push @{$self->{'protos_todo'}}, | |
[$pack . $key, $flags & SVf_POK ? $val->PV: undef]; | |
} elsif (class($val) eq "GV") { | |
if (class(my $cv = $val->CV) ne "SPECIAL") { | |
next if $self->{'subs_done'}{$$val}++; | |
# Ignore imposters (aliases etc) | |
my $name = $cv->NAME_HEK; | |
if(defined $name) { | |
# avoid using $cv->GV here because if the $val GV is | |
# an alias, CvGV() could upgrade the real stash entry | |
# from an RV to a GV | |
next unless $name eq $key; | |
next unless $$stashobj == ${$cv->STASH}; | |
} | |
else { | |
next if $$val != ${$cv->GV}; | |
} | |
$self->todo($cv, 0); | |
} | |
if (class(my $cv = $val->FORM) ne "SPECIAL") { | |
next if $self->{'forms_done'}{$$val}++; | |
next if $$val != ${$cv->GV}; # Ignore imposters | |
$self->todo($cv, 1); | |
} | |
if (class($val->HV) ne "SPECIAL" && $key =~ /::$/) { | |
$self->stash_subs($pack . $key, $seen); | |
} | |
} | |
} | |
} | |
sub print_protos { | |
my $self = shift; | |
my $ar; | |
my @ret; | |
foreach $ar (@{$self->{'protos_todo'}}) { | |
if (ref $ar->[1]) { | |
# Only print a constant if it occurs in the same package as a | |
# dumped sub. This is not perfect, but a heuristic that will | |
# hopefully work most of the time. Ideally we would use | |
# CvFILE, but a constant stub has no CvFILE. | |
my $pack = ($ar->[0] =~ /(.*)::/)[0]; | |
next if $pack and !$self->{packs}{$pack} | |
} | |
my $body = defined $ar->[1] | |
? ref $ar->[1] | |
? " () {\n " . $self->const($ar->[1]->RV,0) . ";\n}" | |
: " (". $ar->[1] . ");" | |
: ";"; | |
push @ret, "sub " . $ar->[0] . "$body\n"; | |
} | |
delete $self->{'protos_todo'}; | |
return @ret; | |
} | |
sub style_opts { | |
my $self = shift; | |
my $opts = shift; | |
my $opt; | |
while (length($opt = substr($opts, 0, 1))) { | |
if ($opt eq "C") { | |
$self->{'cuddle'} = " "; | |
$opts = substr($opts, 1); | |
} elsif ($opt eq "i") { | |
$opts =~ s/^i(\d+)//; | |
$self->{'indent_size'} = $1; | |
} elsif ($opt eq "T") { | |
$self->{'use_tabs'} = 1; | |
$opts = substr($opts, 1); | |
} elsif ($opt eq "v") { | |
$opts =~ s/^v([^.]*)(.|$)//; | |
$self->{'ex_const'} = $1; | |
} | |
} | |
} | |
sub new { | |
my $class = shift; | |
my $self = bless {}, $class; | |
$self->{'cuddle'} = "\n"; | |
$self->{'curcop'} = undef; | |
$self->{'curstash'} = "main"; | |
$self->{'ex_const'} = "'???'"; | |
$self->{'expand'} = 0; | |
$self->{'files'} = {}; | |
$self->{'packs'} = {}; | |
$self->{'indent_size'} = 4; | |
$self->{'linenums'} = 0; | |
$self->{'parens'} = 0; | |
$self->{'subs_todo'} = []; | |
$self->{'unquote'} = 0; | |
$self->{'use_dumper'} = 0; | |
$self->{'use_tabs'} = 0; | |
$self->{'ambient_warnings'} = undef; # Assume no lexical warnings | |
$self->{'ambient_hints'} = 0; | |
$self->{'ambient_hinthash'} = undef; | |
$self->init(); | |
while (my $arg = shift @_) { | |
if ($arg eq "-d") { | |
$self->{'use_dumper'} = 1; | |
require Data::Dumper; | |
} elsif ($arg =~ /^-f(.*)/) { | |
$self->{'files'}{$1} = 1; | |
} elsif ($arg eq "-l") { | |
$self->{'linenums'} = 1; | |
} elsif ($arg eq "-p") { | |
$self->{'parens'} = 1; | |
} elsif ($arg eq "-P") { | |
$self->{'noproto'} = 1; | |
} elsif ($arg eq "-q") { | |
$self->{'unquote'} = 1; | |
} elsif (substr($arg, 0, 2) eq "-s") { | |
$self->style_opts(substr $arg, 2); | |
} elsif ($arg =~ /^-x(\d)$/) { | |
$self->{'expand'} = $1; | |
} | |
} | |
return $self; | |
} | |
{ | |
# Mask out the bits that L<warnings::register> uses | |
my $WARN_MASK; | |
BEGIN { | |
$WARN_MASK = $warnings::Bits{all} | $warnings::DeadBits{all}; | |
} | |
sub WARN_MASK () { | |
return $WARN_MASK; | |
} | |
} | |
# Initialise the contextual information, either from | |
# defaults provided with the ambient_pragmas method, | |
# or from perl's own defaults otherwise. | |
sub init { | |
my $self = shift; | |
$self->{'warnings'} = defined ($self->{'ambient_warnings'}) | |
? $self->{'ambient_warnings'} & WARN_MASK | |
: undef; | |
$self->{'hints'} = $self->{'ambient_hints'}; | |
$self->{'hinthash'} = $self->{'ambient_hinthash'}; | |
# also a convenient place to clear out subs_declared | |
delete $self->{'subs_declared'}; | |
} | |
sub compile { | |
my(@args) = @_; | |
return sub { | |
my $self = B::Deparse->new(@args); | |
# First deparse command-line args | |
if (defined $^I) { # deparse -i | |
print q(BEGIN { $^I = ).perlstring($^I).qq(; }\n); | |
} | |
if ($^W) { # deparse -w | |
print qq(BEGIN { \$^W = $^W; }\n); | |
} | |
if ($/ ne "\n" or defined $O::savebackslash) { # deparse -l and -0 | |
my $fs = perlstring($/) || 'undef'; | |
my $bs = perlstring($O::savebackslash) || 'undef'; | |
print qq(BEGIN { \$/ = $fs; \$\\ = $bs; }\n); | |
} | |
my @BEGINs = B::begin_av->isa("B::AV") ? B::begin_av->ARRAY : (); | |
my @UNITCHECKs = B::unitcheck_av->isa("B::AV") | |
? B::unitcheck_av->ARRAY | |
: (); | |
my @CHECKs = B::check_av->isa("B::AV") ? B::check_av->ARRAY : (); | |
my @INITs = B::init_av->isa("B::AV") ? B::init_av->ARRAY : (); | |
my @ENDs = B::end_av->isa("B::AV") ? B::end_av->ARRAY : (); | |
my @names = qw(BEGIN UNITCHECK CHECK INIT END); | |
my @blocks = \(@BEGINs, @UNITCHECKs, @CHECKs, @INITs, @ENDs); | |
while (@names) { | |
my ($name, $blocks) = (shift @names, shift @blocks); | |
for my $block (@$blocks) { | |
$self->todo($block, 0, $name); | |
} | |
} | |
$self->stash_subs(); | |
local($SIG{"__DIE__"}) = | |
sub { | |
if ($self->{'curcop'}) { | |
my $cop = $self->{'curcop'}; | |
my($line, $file) = ($cop->line, $cop->file); | |
print STDERR "While deparsing $file near line $line,\n"; | |
} | |
}; | |
$self->{'curcv'} = main_cv; | |
$self->{'curcvlex'} = undef; | |
print $self->print_protos; | |
@{$self->{'subs_todo'}} = | |
sort {$a->[0] <=> $b->[0]} @{$self->{'subs_todo'}}; | |
my $root = main_root; | |
local $B::overlay = {}; | |
unless (null $root) { | |
$self->pad_subs($self->{'curcv'}); | |
# Check for a stub-followed-by-ex-cop, resulting from a program | |
# consisting solely of sub declarations. For backward-compati- | |
# bility (and sane output) we don’t want to emit the stub. | |
# leave | |
# enter | |
# stub | |
# ex-nextstate (or ex-dbstate) | |
my $kid; | |
if ( $root->name eq 'leave' | |
and ($kid = $root->first)->name eq 'enter' | |
and !null($kid = $kid->sibling) and $kid->name eq 'stub' | |
and !null($kid = $kid->sibling) and $kid->name eq 'null' | |
and class($kid) eq 'COP' and null $kid->sibling ) | |
{ | |
# ignore | |
} else { | |
$self->pessimise($root, main_start); | |
print $self->indent($self->deparse_root($root)), "\n"; | |
} | |
} | |
my @text; | |
while (scalar(@{$self->{'subs_todo'}})) { | |
push @text, $self->next_todo; | |
} | |
print $self->indent(join("", @text)), "\n" if @text; | |
# Print __DATA__ section, if necessary | |
no strict 'refs'; | |
my $laststash = defined $self->{'curcop'} | |
? $self->{'curcop'}->stash->NAME : $self->{'curstash'}; | |
if (defined *{$laststash."::DATA"}{IO}) { | |
print $self->keyword("package") . " $laststash;\n" | |
unless $laststash eq $self->{'curstash'}; | |
print $self->keyword("__DATA__") . "\n"; | |
print readline(*{$laststash."::DATA"}); | |
} | |
} | |
} | |
sub coderef2text { | |
my $self = shift; | |
my $sub = shift; | |
croak "Usage: ->coderef2text(CODEREF)" unless UNIVERSAL::isa($sub, "CODE"); | |
$self->init(); | |
local $self->{in_coderef2text} = 1; | |
return $self->indent($self->deparse_sub(svref_2object($sub))); | |
} | |
my %strict_bits = do { | |
local $^H; | |
map +($_ => strict::bits($_)), qw/refs subs vars/ | |
}; | |
sub ambient_pragmas { | |
my $self = shift; | |
my ($hint_bits, $warning_bits, $hinthash) = (0); | |
while (@_ > 1) { | |
my $name = shift(); | |
my $val = shift(); | |
if ($name eq 'strict') { | |
require strict; | |
if ($val eq 'none') { | |
$hint_bits &= $strict_bits{$_} for qw/refs subs vars/; | |
next(); | |
} | |
my @names; | |
if ($val eq "all") { | |
@names = qw/refs subs vars/; | |
} | |
elsif (ref $val) { | |
@names = @$val; | |
} | |
else { | |
@names = split' ', $val; | |
} | |
$hint_bits |= $strict_bits{$_} for @names; | |
} | |
elsif ($name eq 'integer' | |
|| $name eq 'bytes' | |
|| $name eq 'utf8') { | |
require "$name.pm"; | |
if ($val) { | |
$hint_bits |= ${$::{"${name}::"}{"hint_bits"}}; | |
} | |
else { | |
$hint_bits &= ~${$::{"${name}::"}{"hint_bits"}}; | |
} | |
} | |
elsif ($name eq 're') { | |
require re; | |
if ($val eq 'none') { | |
$hint_bits &= ~re::bits(qw/taint eval/); | |
next(); | |
} | |
my @names; | |
if ($val eq 'all') { | |
@names = qw/taint eval/; | |
} | |
elsif (ref $val) { | |
@names = @$val; | |
} | |
else { | |
@names = split' ',$val; | |
} | |
$hint_bits |= re::bits(@names); | |
} | |
elsif ($name eq 'warnings') { | |
if ($val eq 'none') { | |
$warning_bits = $warnings::NONE; | |
next(); | |
} | |
my @names; | |
if (ref $val) { | |
@names = @$val; | |
} | |
else { | |
@names = split/\s+/, $val; | |
} | |
$warning_bits = $warnings::NONE if !defined ($warning_bits); | |
$warning_bits |= warnings::bits(@names); | |
} | |
elsif ($name eq 'warning_bits') { | |
$warning_bits = $val; | |
} | |
elsif ($name eq 'hint_bits') { | |
$hint_bits = $val; | |
} | |
elsif ($name eq '%^H') { | |
$hinthash = $val; | |
} | |
else { | |
croak "Unknown pragma type: $name"; | |
} | |
} | |
if (@_) { | |
croak "The ambient_pragmas method expects an even number of args"; | |
} | |
$self->{'ambient_warnings'} = $warning_bits; | |
$self->{'ambient_hints'} = $hint_bits; | |
$self->{'ambient_hinthash'} = $hinthash; | |
} | |
# This method is the inner loop, so try to keep it simple | |
sub deparse { | |
my $self = shift; | |
my($op, $cx) = @_; | |
Carp::confess("Null op in deparse") if !defined($op) | |
|| class($op) eq "NULL"; | |
my $meth = "pp_" . $op->name; | |
return $self->$meth($op, $cx); | |
} | |
sub indent { | |
my $self = shift; | |
my $txt = shift; | |
# \cK also swallows a preceding line break when followed by a | |
# semicolon. | |
$txt =~ s/\n\cK;//g; | |
my @lines = split(/\n/, $txt); | |
my $leader = ""; | |
my $level = 0; | |
my $line; | |
for $line (@lines) { | |
my $cmd = substr($line, 0, 1); | |
if ($cmd eq "\t" or $cmd eq "\b") { | |
$level += ($cmd eq "\t" ? 1 : -1) * $self->{'indent_size'}; | |
if ($self->{'use_tabs'}) { | |
$leader = "\t" x ($level / 8) . " " x ($level % 8); | |
} else { | |
$leader = " " x $level; | |
} | |
$line = substr($line, 1); | |
} | |
if (index($line, "\f") > 0) { | |
$line =~ s/\f/\n/; | |
} | |
if (substr($line, 0, 1) eq "\f") { | |
$line = substr($line, 1); # no indent | |
} else { | |
$line = $leader . $line; | |
} | |
$line =~ s/\cK;?//g; | |
} | |
return join("\n", @lines); | |
} | |
sub pad_subs { | |
my ($self, $cv) = @_; | |
my $padlist = $cv->PADLIST; | |
my @names = $padlist->ARRAYelt(0)->ARRAY; | |
my @values = $padlist->ARRAYelt(1)->ARRAY; | |
my @todo; | |
PADENTRY: | |
for my $ix (0.. $#names) { for $_ ($names[$ix]) { | |
next if class($_) eq "SPECIAL"; | |
my $name = $_->PVX; | |
if (defined $name && $name =~ /^&./) { | |
my $low = $_->COP_SEQ_RANGE_LOW; | |
my $flags = $_->FLAGS; | |
my $outer = $flags & PADNAMEt_OUTER; | |
if ($flags & SVpad_OUR) { | |
push @todo, [$low, undef, 0, $_] | |
# [seq, no cv, not format, padname] | |
unless $outer; | |
next; | |
} | |
my $protocv = $flags & SVpad_STATE | |
? $values[$ix] | |
: $_->PROTOCV; | |
if (class ($protocv) ne 'CV') { | |
my $flags = $flags; | |
my $cv = $cv; | |
my $name = $_; | |
while ($flags & PADNAMEt_OUTER && class ($protocv) ne 'CV') | |
{ | |
$cv = $cv->OUTSIDE; | |
next PADENTRY if class($cv) eq 'SPECIAL'; # XXX freed? | |
my $padlist = $cv->PADLIST; | |
my $ix = $name->PARENT_PAD_INDEX; | |
$name = $padlist->NAMES->ARRAYelt($ix); | |
$flags = $name->FLAGS; | |
$protocv = $flags & SVpad_STATE | |
? $padlist->ARRAYelt(1)->ARRAYelt($ix) | |
: $name->PROTOCV; | |
} | |
} | |
my $defined_in_this_sub = ${$protocv->OUTSIDE} == $$cv || do { | |
my $other = $protocv->PADLIST; | |
$$other && $other->outid == $padlist->id; | |
}; | |
if ($flags & PADNAMEt_OUTER) { | |
next unless $defined_in_this_sub; | |
push @todo, [$protocv->OUTSIDE_SEQ, $protocv, 0, $_]; | |
next; | |
} | |
my $outseq = $protocv->OUTSIDE_SEQ; | |
if ($outseq <= $low) { | |
# defined before its name is visible, so it’s gotta be | |
# declared and defined at once: my sub foo { ... } | |
push @todo, [$low, $protocv, 0, $_]; | |
} | |
else { | |
# declared and defined separately: my sub f; sub f { ... } | |
push @todo, [$low, undef, 0, $_]; | |
push @todo, [$outseq, $protocv, 0, $_] | |
if $defined_in_this_sub; | |
} | |
} | |
}} | |
@{$self->{'subs_todo'}} = | |
sort {$a->[0] <=> $b->[0]} @{$self->{'subs_todo'}}, @todo | |
} | |
# deparse_argops(): deparse, if possible, a sequence of argcheck + argelem | |
# ops into a subroutine signature. If successful, return the first op | |
# following the signature ops plus the signature string; else return the | |
# empty list. | |
# | |
# Normally a bunch of argelem ops will have been generated by the | |
# signature parsing, but it's possible that ops have been added manually | |
# or altered. In this case we return "()" and fall back to general | |
# deparsing of the individual sigelems as 'my $x = $_[N]' etc. | |
# | |
# We're only called if the top is an ex-argcheck, which is a placeholder | |
# indicating a signature subtree. | |
# | |
# Return a signature string, or an empty list if no deparseable as a | |
# signature | |
sub deparse_argops { | |
my ($self, $topop, $cv) = @_; | |
my @sig; | |
$topop = $topop->first; | |
return unless $$topop and $topop->name eq 'lineseq'; | |
# last op should be nextstate | |
my $last = $topop->last; | |
return unless $$last | |
and ( _op_is_or_was($last, OP_NEXTSTATE) | |
or _op_is_or_was($last, OP_DBSTATE)); | |
# first OP_NEXTSTATE | |
my $o = $topop->first; | |
return unless $$o; | |
return if $o->label; | |
# OP_ARGCHECK | |
$o = $o->sibling; | |
return unless $$o and $o->name eq 'argcheck'; | |
my ($params, $opt_params, $slurpy) = $o->aux_list($cv); | |
my $mandatory = $params - $opt_params; | |
my $seen_slurpy = 0; | |
my $last_ix = -1; | |
# keep looking for valid nextstate + argelem pairs, terminated | |
# by a final nextstate | |
while (1) { | |
$o = $o->sibling; | |
return unless $$o; | |
# skip trailing nextstate | |
last if $$o == $$last; | |
# OP_NEXTSTATE | |
return unless $o->name =~ /^(next|db)state$/; | |
return if $o->label; | |
# OP_ARGELEM | |
$o = $o->sibling; | |
last unless $$o; | |
if ($o->name eq 'argelem') { | |
my $ix = $o->string($cv); | |
while (++$last_ix < $ix) { | |
push @sig, $last_ix < $mandatory ? '$' : '$='; | |
} | |
my $var = $self->padname($o->targ); | |
if ($var =~ /^[@%]/) { | |
return if $seen_slurpy; | |
$seen_slurpy = 1; | |
return if $ix != $params or !$slurpy | |
or substr($var,0,1) ne $slurpy; | |
} | |
else { | |
return if $ix >= $params; | |
} | |
if ($o->flags & OPf_KIDS) { | |
my $kid = $o->first; | |
return unless $$kid and $kid->name eq 'argdefelem'; | |
my $def = $self->deparse($kid->first, 7); | |
$def = "($def)" if $kid->first->flags & OPf_PARENS; | |
$var .= " = $def"; | |
} | |
push @sig, $var; | |
} | |
elsif ($o->name eq 'null' | |
and ($o->flags & OPf_KIDS) | |
and $o->first->name eq 'argdefelem') | |
{ | |
# special case - a void context default expression: $ = expr | |
my $defop = $o->first; | |
my $ix = $defop->targ; | |
while (++$last_ix < $ix) { | |
push @sig, $last_ix < $mandatory ? '$' : '$='; | |
} | |
return if $last_ix >= $params | |
or $last_ix < $mandatory; | |
my $def = $self->deparse($defop->first, 7); | |
$def = "($def)" if $defop->first->flags & OPf_PARENS; | |
push @sig, '$ = ' . $def; | |
} | |
else { | |
return; | |
} | |
} | |
while (++$last_ix < $params) { | |
push @sig, $last_ix < $mandatory ? '$' : '$='; | |
} | |
push @sig, $slurpy if $slurpy and !$seen_slurpy; | |
return (join(', ', @sig)); | |
} | |
# Deparse a sub. Returns everything except the 'sub foo', | |
# e.g. ($$) : method { ...; } | |
# or : prototype($$) lvalue ($a, $b) { ...; }; | |
sub deparse_sub { | |
my $self = shift; | |
my $cv = shift; | |
my @attrs; | |
my $proto; | |
my $sig; | |
Carp::confess("NULL in deparse_sub") if !defined($cv) || $cv->isa("B::NULL"); | |
Carp::confess("SPECIAL in deparse_sub") if $cv->isa("B::SPECIAL"); | |
local $self->{'curcop'} = $self->{'curcop'}; | |
my $has_sig = $self->{hinthash}{feature_signatures}; | |
if ($cv->FLAGS & SVf_POK) { | |
my $myproto = $cv->PV; | |
if ($has_sig) { | |
push @attrs, "prototype($myproto)"; | |
} | |
else { | |
$proto = $myproto; | |
} | |
} | |
if ($cv->CvFLAGS & (CVf_METHOD|CVf_LOCKED|CVf_LVALUE|CVf_ANONCONST)) { | |
push @attrs, "lvalue" if $cv->CvFLAGS & CVf_LVALUE; | |
push @attrs, "method" if $cv->CvFLAGS & CVf_METHOD; | |
push @attrs, "const" if $cv->CvFLAGS & CVf_ANONCONST; | |
} | |
local($self->{'curcv'}) = $cv; | |
local($self->{'curcvlex'}); | |
local(@$self{qw'curstash warnings hints hinthash'}) | |
= @$self{qw'curstash warnings hints hinthash'}; | |
my $body; | |
my $root = $cv->ROOT; | |
local $B::overlay = {}; | |
if (not null $root) { | |
$self->pad_subs($cv); | |
$self->pessimise($root, $cv->START); | |
my $lineseq = $root->first; | |
# stub sub may have single op rather than list of ops | |
my $is_list = ($lineseq->name eq "lineseq"); | |
my $firstop = $is_list ? $lineseq->first : $lineseq; | |
# Try to deparse first subtree as a signature if possible. | |
# Top of signature subtree has an ex-argcheck as a placeholder | |
if ( $has_sig | |
and $$firstop | |
and $firstop->name eq 'null' | |
and $firstop->targ == OP_ARGCHECK | |
) { | |
my ($mysig) = $self->deparse_argops($firstop, $cv); | |
if (defined $mysig) { | |
$sig = $mysig; | |
$firstop = $is_list ? $firstop->sibling : undef; | |
} | |
} | |
if ($is_list && $firstop) { | |
my @ops; | |
for (my $o = $firstop; $$o; $o=$o->sibling) { | |
push @ops, $o; | |
} | |
$body = $self->lineseq(undef, 0, @ops).";"; | |
if (!$has_sig and $ops[-1]->name =~ /^(next|db)state$/) { | |
# this handles void context in | |
# use feature signatures; sub ($=1) {} | |
$body .= "\n()"; | |
} | |
my $scope_en = $self->find_scope_en($lineseq); | |
if (defined $scope_en) { | |
my $subs = join"", $self->seq_subs($scope_en); | |
$body .= ";\n$subs" if length($subs); | |
} | |
} | |
elsif ($firstop) { | |
$body = $self->deparse($root->first, 0); | |
} | |
else { | |
$body = ';'; # stub sub | |
} | |
my $l = ''; | |
if ($self->{'linenums'}) { | |
# a glob's gp_line is set from the line containing a | |
# sub's closing '}' if the CV is the first use of the GV. | |
# So make sure the linenum is set correctly for '}' | |
my $gv = $cv->GV; | |
my $line = $gv->LINE; | |
my $file = $gv->FILE; | |
$l = "\f#line $line \"$file\"\n"; | |
} | |
$body = "{\n\t$body\n$l\b}"; | |
} | |
else { | |
my $sv = $cv->const_sv; | |
if ($$sv) { | |
# uh-oh. inlinable sub... format it differently | |
$body = "{ " . $self->const($sv, 0) . " }\n"; | |
} else { # XSUB? (or just a declaration) | |
$body = ';' | |
} | |
} | |
$proto = defined $proto ? "($proto) " : ""; | |
$sig = defined $sig ? "($sig) " : ""; | |
my $attrs = ''; | |
$attrs = ': ' . join('', map "$_ ", @attrs) if @attrs; | |
return "$proto$attrs$sig$body\n"; | |
} | |
sub deparse_format { | |
my $self = shift; | |
my $form = shift; | |
my @text; | |
local($self->{'curcv'}) = $form; | |
local($self->{'curcvlex'}); | |
local($self->{'in_format'}) = 1; | |
local(@$self{qw'curstash warnings hints hinthash'}) | |
= @$self{qw'curstash warnings hints hinthash'}; | |
my $op = $form->ROOT; | |
local $B::overlay = {}; | |
$self->pessimise($op, $form->START); | |
my $kid; | |
return "\f." if $op->first->name eq 'stub' | |
|| $op->first->name eq 'nextstate'; | |
$op = $op->first->first; # skip leavewrite, lineseq | |
while (not null $op) { | |
$op = $op->sibling; # skip nextstate | |
my @exprs; | |
$kid = $op->first->sibling; # skip pushmark | |
push @text, "\f".$self->const_sv($kid)->PV; | |
$kid = $kid->sibling; | |
for (; not null $kid; $kid = $kid->sibling) { | |
push @exprs, $self->deparse($kid, -1); | |
$exprs[-1] =~ s/;\z//; | |
} | |
push @text, "\f".join(", ", @exprs)."\n" if @exprs; | |
$op = $op->sibling; | |
} | |
return join("", @text) . "\f."; | |
} | |
sub is_scope { | |
my $op = shift; | |
return $op->name eq "leave" || $op->name eq "scope" | |
|| $op->name eq "lineseq" | |
|| ($op->name eq "null" && class($op) eq "UNOP" | |
&& (is_scope($op->first) || $op->first->name eq "enter")); | |
} | |
sub is_state { | |
my $name = $_[0]->name; | |
return $name eq "nextstate" || $name eq "dbstate" || $name eq "setstate"; | |
} | |
sub is_miniwhile { # check for one-line loop ('foo() while $y--') | |
my $op = shift; | |
return (!null($op) and null($op->sibling) | |
and $op->name eq "null" and class($op) eq "UNOP" | |
and (($op->first->name =~ /^(and|or)$/ | |
and $op->first->first->sibling->name eq "lineseq") | |
or ($op->first->name eq "lineseq" | |
and not null $op->first->first->sibling | |
and $op->first->first->sibling->name eq "unstack") | |
)); | |
} | |
# Check if the op and its sibling are the initialization and the rest of a | |
# for (..;..;..) { ... } loop | |
sub is_for_loop { | |
my $op = shift; | |
# This OP might be almost anything, though it won't be a | |
# nextstate. (It's the initialization, so in the canonical case it | |
# will be an sassign.) The sibling is (old style) a lineseq whose | |
# first child is a nextstate and whose second is a leaveloop, or | |
# (new style) an unstack whose sibling is a leaveloop. | |
my $lseq = $op->sibling; | |
return 0 unless !is_state($op) and !null($lseq); | |
if ($lseq->name eq "lineseq") { | |
if ($lseq->first && !null($lseq->first) && is_state($lseq->first) | |
&& (my $sib = $lseq->first->sibling)) { | |
return (!null($sib) && $sib->name eq "leaveloop"); | |
} | |
} elsif ($lseq->name eq "unstack" && ($lseq->flags & OPf_SPECIAL)) { | |
my $sib = $lseq->sibling; | |
return $sib && !null($sib) && $sib->name eq "leaveloop"; | |
} | |
return 0; | |
} | |
sub is_scalar { | |
my $op = shift; | |
return ($op->name eq "rv2sv" or | |
$op->name eq "padsv" or | |
$op->name eq "gv" or # only in array/hash constructs | |
$op->flags & OPf_KIDS && !null($op->first) | |
&& $op->first->name eq "gvsv"); | |
} | |
sub maybe_parens { | |
my $self = shift; | |
my($text, $cx, $prec) = @_; | |
if ($prec < $cx # unary ops nest just fine | |
or $prec == $cx and $cx != 4 and $cx != 16 and $cx != 21 | |
or $self->{'parens'}) | |
{ | |
$text = "($text)"; | |
# In a unop, let parent reuse our parens; see maybe_parens_unop | |
$text = "\cS" . $text if $cx == 16; | |
return $text; | |
} else { | |
return $text; | |
} | |
} | |
# same as above, but get around the 'if it looks like a function' rule | |
sub maybe_parens_unop { | |
my $self = shift; | |
my($name, $kid, $cx) = @_; | |
if ($cx > 16 or $self->{'parens'}) { | |
$kid = $self->deparse($kid, 1); | |
if ($name eq "umask" && $kid =~ /^\d+$/) { | |
$kid = sprintf("%#o", $kid); | |
} | |
return $self->keyword($name) . "($kid)"; | |
} else { | |
$kid = $self->deparse($kid, 16); | |
if ($name eq "umask" && $kid =~ /^\d+$/) { | |
$kid = sprintf("%#o", $kid); | |
} | |
$name = $self->keyword($name); | |
if (substr($kid, 0, 1) eq "\cS") { | |
# use kid's parens | |
return $name . substr($kid, 1); | |
} elsif (substr($kid, 0, 1) eq "(") { | |
# avoid looks-like-a-function trap with extra parens | |
# ('+' can lead to ambiguities) | |
return "$name(" . $kid . ")"; | |
} else { | |
return "$name $kid"; | |
} | |
} | |
} | |
sub maybe_parens_func { | |
my $self = shift; | |
my($func, $text, $cx, $prec) = @_; | |
if ($prec <= $cx or substr($text, 0, 1) eq "(" or $self->{'parens'}) { | |
return "$func($text)"; | |
} else { | |
return "$func $text"; | |
} | |
} | |
sub find_our_type { | |
my ($self, $name) = @_; | |
$self->populate_curcvlex() if !defined $self->{'curcvlex'}; | |
my $seq = $self->{'curcop'} ? $self->{'curcop'}->cop_seq : 0; | |
for my $a (@{$self->{'curcvlex'}{"o$name"}}) { | |
my ($st, undef, $padname) = @$a; | |
if ($st >= $seq && $padname->FLAGS & SVpad_TYPED) { | |
return $padname->SvSTASH->NAME; | |
} | |
} | |
return ''; | |
} | |
sub maybe_local { | |
my $self = shift; | |
my($op, $cx, $text) = @_; | |
my $name = $op->name; | |
my $our_intro = ($name =~ /^(?:(?:gv|rv2)[ash]v|split|refassign | |
|lv(?:av)?ref)$/x) | |
? OPpOUR_INTRO | |
: 0; | |
my $lval_intro = $name eq 'split' ? 0 : OPpLVAL_INTRO; | |
# The @a in \(@a) isn't in ref context, but only when the | |
# parens are there. | |
my $need_parens = $self->{'in_refgen'} && $name =~ /[ah]v\z/ | |
&& ($op->flags & (OPf_PARENS|OPf_REF)) == OPf_PARENS; | |
if ((my $priv = $op->private) & ($lval_intro|$our_intro)) { | |
my @our_local; | |
push @our_local, "local" if $priv & $lval_intro; | |
push @our_local, "our" if $priv & $our_intro; | |
my $our_local = join " ", map $self->keyword($_), @our_local; | |
if( $our_local[-1] eq 'our' ) { | |
if ( $text !~ /^\W(\w+::)*\w+\z/ | |
and !utf8::decode($text) || $text !~ /^\W(\w+::)*\w+\z/ | |
) { | |
die "Unexpected our($text)\n"; | |
} | |
$text =~ s/(\w+::)+//; | |
if (my $type = $self->find_our_type($text)) { | |
$our_local .= ' ' . $type; | |
} | |
} | |
return $need_parens ? "($text)" : $text | |
if $self->{'avoid_local'}{$$op}; | |
if ($need_parens) { | |
return "$our_local($text)"; | |
} elsif (want_scalar($op) || $our_local eq 'our') { | |
return "$our_local $text"; | |
} else { | |
return $self->maybe_parens_func("$our_local", $text, $cx, 16); | |
} | |
} else { | |
return $need_parens ? "($text)" : $text; | |
} | |
} | |
sub maybe_targmy { | |
my $self = shift; | |
my($op, $cx, $func, @args) = @_; | |
if ($op->private & OPpTARGET_MY) { | |
my $var = $self->padname($op->targ); | |
my $val = $func->($self, $op, 7, @args); | |
return $self->maybe_parens("$var = $val", $cx, 7); | |
} else { | |
return $func->($self, $op, $cx, @args); | |
} | |
} | |
sub padname_sv { | |
my $self = shift; | |
my $targ = shift; | |
return $self->{'curcv'}->PADLIST->ARRAYelt(0)->ARRAYelt($targ); | |
} | |
sub maybe_my { | |
my $self = shift; | |
my($op, $cx, $text, $padname, $forbid_parens) = @_; | |
# The @a in \(@a) isn't in ref context, but only when the | |
# parens are there. | |
my $need_parens = !$forbid_parens && $self->{'in_refgen'} | |
&& $op->name =~ /[ah]v\z/ | |
&& ($op->flags & (OPf_PARENS|OPf_REF)) == OPf_PARENS; | |
# The @a in \my @a must not have parens. | |
if (!$need_parens && $self->{'in_refgen'}) { | |
$forbid_parens = 1; | |
} | |
if ($op->private & OPpLVAL_INTRO and not $self->{'avoid_local'}{$$op}) { | |
# Check $padname->FLAGS for statehood, rather than $op->private, | |
# because enteriter ops do not carry the flag. | |
my $my = | |
$self->keyword($padname->FLAGS & SVpad_STATE ? "state" : "my"); | |
if ($padname->FLAGS & SVpad_TYPED) { | |
$my .= ' ' . $padname->SvSTASH->NAME; | |
} | |
if ($need_parens) { | |
return "$my($text)"; | |
} elsif ($forbid_parens || want_scalar($op)) { | |
return "$my $text"; | |
} else { | |
return $self->maybe_parens_func($my, $text, $cx, 16); | |
} | |
} else { | |
return $need_parens ? "($text)" : $text; | |
} | |
} | |
# The following OPs don't have functions: | |
# pp_padany -- does not exist after parsing | |
sub AUTOLOAD { | |
if ($AUTOLOAD =~ s/^.*::pp_//) { | |
warn "unexpected OP_". | |
($_[1]->type == OP_CUSTOM ? "CUSTOM ($AUTOLOAD)" : uc $AUTOLOAD); | |
return "XXX"; | |
} else { | |
die "Undefined subroutine $AUTOLOAD called"; | |
} | |
} | |
sub DESTROY {} # Do not AUTOLOAD | |
# $root should be the op which represents the root of whatever | |
# we're sequencing here. If it's undefined, then we don't append | |
# any subroutine declarations to the deparsed ops, otherwise we | |
# append appropriate declarations. | |
sub lineseq { | |
my($self, $root, $cx, @ops) = @_; | |
my($expr, @exprs); | |
my $out_cop = $self->{'curcop'}; | |
my $out_seq = defined($out_cop) ? $out_cop->cop_seq : undef; | |
my $limit_seq; | |
if (defined $root) { | |
$limit_seq = $out_seq; | |
my $nseq; | |
$nseq = $self->find_scope_st($root->sibling) if ${$root->sibling}; | |
$limit_seq = $nseq if !defined($limit_seq) | |
or defined($nseq) && $nseq < $limit_seq; | |
} | |
$limit_seq = $self->{'limit_seq'} | |
if defined($self->{'limit_seq'}) | |
&& (!defined($limit_seq) || $self->{'limit_seq'} < $limit_seq); | |
local $self->{'limit_seq'} = $limit_seq; | |
$self->walk_lineseq($root, \@ops, | |
sub { push @exprs, $_[0]} ); | |
my $sep = $cx ? '; ' : ";\n"; | |
my $body = join($sep, grep {length} @exprs); | |
my $subs = ""; | |
if (defined $root && defined $limit_seq && !$self->{'in_format'}) { | |
$subs = join "\n", $self->seq_subs($limit_seq); | |
} | |
return join($sep, grep {length} $body, $subs); | |
} | |
sub scopeop { | |
my($real_block, $self, $op, $cx) = @_; | |
my $kid; | |
my @kids; | |
local(@$self{qw'curstash warnings hints hinthash'}) | |
= @$self{qw'curstash warnings hints hinthash'} if $real_block; | |
if ($real_block) { | |
$kid = $op->first->sibling; # skip enter | |
if (is_miniwhile($kid)) { | |
my $top = $kid->first; | |
my $name = $top->name; | |
if ($name eq "and") { | |
$name = $self->keyword("while"); | |
} elsif ($name eq "or") { | |
$name = $self->keyword("until"); | |
} else { # no conditional -> while 1 or until 0 | |
return $self->deparse($top->first, 1) . " " | |
. $self->keyword("while") . " 1"; | |
} | |
my $cond = $top->first; | |
my $body = $cond->sibling->first; # skip lineseq | |
$cond = $self->deparse($cond, 1); | |
$body = $self->deparse($body, 1); | |
return "$body $name $cond"; | |
} | |
} else { | |
$kid = $op->first; | |
} | |
for (; !null($kid); $kid = $kid->sibling) { | |
push @kids, $kid; | |
} | |
if ($cx > 0) { # inside an expression, (a do {} while for lineseq) | |
my $body = $self->lineseq($op, 0, @kids); | |
return is_lexical_subs(@kids) | |
? $body | |
: ($self->lex_in_scope("&do") ? "CORE::do" : "do") | |
. " {\n\t$body\n\b}"; | |
} else { | |
my $lineseq = $self->lineseq($op, $cx, @kids); | |
return (length ($lineseq) ? "$lineseq;" : ""); | |
} | |
} | |
sub pp_scope { scopeop(0, @_); } | |
sub pp_lineseq { scopeop(0, @_); } | |
sub pp_leave { scopeop(1, @_); } | |
# This is a special case of scopeop and lineseq, for the case of the | |
# main_root. The difference is that we print the output statements as | |
# soon as we get them, for the sake of impatient users. | |
sub deparse_root { | |
my $self = shift; | |
my($op) = @_; | |
local(@$self{qw'curstash warnings hints hinthash'}) | |
= @$self{qw'curstash warnings hints hinthash'}; | |
my @kids; | |
return if null $op->first; # Can happen, e.g., for Bytecode without -k | |
for (my $kid = $op->first->sibling; !null($kid); $kid = $kid->sibling) { | |
push @kids, $kid; | |
} | |
$self->walk_lineseq($op, \@kids, | |
sub { return unless length $_[0]; | |
print $self->indent($_[0].';'); | |
print "\n" | |
unless $_[1] == $#kids; | |
}); | |
} | |
sub walk_lineseq { | |
my ($self, $op, $kids, $callback) = @_; | |
my @kids = @$kids; | |
for (my $i = 0; $i < @kids; $i++) { | |
my $expr = ""; | |
if (is_state $kids[$i]) { | |
$expr = $self->deparse($kids[$i++], 0); | |
if ($i > $#kids) { | |
$callback->($expr, $i); | |
last; | |
} | |
} | |
if (is_for_loop($kids[$i])) { | |
$callback->($expr . $self->for_loop($kids[$i], 0), | |
$i += $kids[$i]->sibling->name eq "unstack" ? 2 : 1); | |
next; | |
} | |
my $expr2 = $self->deparse($kids[$i], (@kids != 1)/2); | |
$expr2 =~ s/^sub :(?!:)/+sub :/; # statement label otherwise | |
$expr .= $expr2; | |
$callback->($expr, $i); | |
} | |
} | |
# The BEGIN {} is used here because otherwise this code isn't executed | |
# when you run B::Deparse on itself. | |
my %globalnames; | |
BEGIN { map($globalnames{$_}++, "SIG", "STDIN", "STDOUT", "STDERR", "INC", | |
"ENV", "ARGV", "ARGVOUT", "_"); } | |
sub gv_name { | |
my $self = shift; | |
my $gv = shift; | |
my $raw = shift; | |
#Carp::confess() unless ref($gv) eq "B::GV"; | |
my $cv = $gv->FLAGS & SVf_ROK ? $gv->RV : 0; | |
my $stash = ($cv || $gv)->STASH->NAME; | |
my $name = $raw | |
? $cv ? $cv->NAME_HEK || $cv->GV->NAME : $gv->NAME | |
: $cv | |
? B::safename($cv->NAME_HEK || $cv->GV->NAME) | |
: $gv->SAFENAME; | |
if ($stash eq 'main' && $name =~ /^::/) { | |
$stash = '::'; | |
} | |
elsif (($stash eq 'main' | |
&& ($globalnames{$name} || $name =~ /^[^A-Za-z_:]/)) | |
or ($stash eq $self->{'curstash'} && !$globalnames{$name} | |
&& ($stash eq 'main' || $name !~ /::/)) | |
) | |
{ | |
$stash = ""; | |
} else { | |
$stash = $stash . "::"; | |
} | |
if (!$raw and $name =~ /^(\^..|{)/) { | |
$name = "{$name}"; # ${^WARNING_BITS}, etc and ${ | |
} | |
return $stash . $name; | |
} | |
# Return the name to use for a stash variable. | |
# If a lexical with the same name is in scope, or | |
# if strictures are enabled, it may need to be | |
# fully-qualified. | |
sub stash_variable { | |
my ($self, $prefix, $name, $cx) = @_; | |
return $prefix.$self->maybe_qualify($prefix, $name) if $name =~ /::/; | |
unless ($prefix eq '$' || $prefix eq '@' || $prefix eq '&' || #' | |
$prefix eq '%' || $prefix eq '$#') { | |
return "$prefix$name"; | |
} | |
if ($name =~ /^[^[:alpha:]_+-]$/) { | |
if (defined $cx && $cx == 26) { | |
if ($prefix eq '@') { | |
return "$prefix\{$name}"; | |
} | |
elsif ($name eq '#') { return '${#}' } # "${#}a" vs "$#a" | |
} | |
if ($prefix eq '$#') { | |
return "\$#{$name}"; | |
} | |
} | |
return $prefix . $self->maybe_qualify($prefix, $name); | |
} | |
my %unctrl = # portable to EBCDIC | |
( | |
"\c@" => '@', # unused | |
"\cA" => 'A', | |
"\cB" => 'B', | |
"\cC" => 'C', | |
"\cD" => 'D', | |
"\cE" => 'E', | |
"\cF" => 'F', | |
"\cG" => 'G', | |
"\cH" => 'H', | |
"\cI" => 'I', | |
"\cJ" => 'J', | |
"\cK" => 'K', | |
"\cL" => 'L', | |
"\cM" => 'M', | |
"\cN" => 'N', | |
"\cO" => 'O', | |
"\cP" => 'P', | |
"\cQ" => 'Q', | |
"\cR" => 'R', | |
"\cS" => 'S', | |
"\cT" => 'T', | |
"\cU" => 'U', | |
"\cV" => 'V', | |
"\cW" => 'W', | |
"\cX" => 'X', | |
"\cY" => 'Y', | |
"\cZ" => 'Z', | |
"\c[" => '[', # unused | |
"\c\\" => '\\', # unused | |
"\c]" => ']', # unused | |
"\c_" => '_', # unused | |
); | |
# Return just the name, without the prefix. It may be returned as a quoted | |
# string. The second return value is a boolean indicating that. | |
sub stash_variable_name { | |
my($self, $prefix, $gv) = @_; | |
my $name = $self->gv_name($gv, 1); | |
$name = $self->maybe_qualify($prefix,$name); | |
if ($name =~ /^(?:\S|(?!\d)[\ca-\cz]?(?:\w|::)*|\d+)\z/) { | |
$name =~ s/^([\ca-\cz])/'^' . $unctrl{$1}/e; | |
$name =~ /^(\^..|{)/ and $name = "{$name}"; | |
return $name, 0; # not quoted | |
} | |
else { | |
single_delim("q", "'", $name, $self), 1; | |
} | |
} | |
sub maybe_qualify { | |
my ($self,$prefix,$name) = @_; | |
my $v = ($prefix eq '$#' ? '@' : $prefix) . $name; | |
if ($prefix eq "") { | |
$name .= "::" if $name =~ /(?:\ACORE::[^:]*|::)\z/; | |
return $name; | |
} | |
return $name if $name =~ /::/; | |
return $self->{'curstash'}.'::'. $name | |
if | |
$name =~ /^(?!\d)\w/ # alphabetic | |
&& $v !~ /^\$[ab]\z/ # not $a or $b | |
&& $v =~ /\A[\$\@\%\&]/ # scalar, array, hash, or sub | |
&& !$globalnames{$name} # not a global name | |
&& $self->{hints} & $strict_bits{vars} # strict vars | |
&& !$self->lex_in_scope($v,1) # no "our" | |
or $self->lex_in_scope($v); # conflicts with "my" variable | |
return $name; | |
} | |
sub lex_in_scope { | |
my ($self, $name, $our) = @_; | |
substr $name, 0, 0, = $our ? 'o' : 'm'; # our/my | |
$self->populate_curcvlex() if !defined $self->{'curcvlex'}; | |
return 0 if !defined($self->{'curcop'}); | |
my $seq = $self->{'curcop'}->cop_seq; | |
return 0 if !exists $self->{'curcvlex'}{$name}; | |
for my $a (@{$self->{'curcvlex'}{$name}}) { | |
my ($st, $en) = @$a; | |
return 1 if $seq > $st && $seq <= $en; | |
} | |
return 0; | |
} | |
sub populate_curcvlex { | |
my $self = shift; | |
for (my $cv = $self->{'curcv'}; class($cv) eq "CV"; $cv = $cv->OUTSIDE) { | |
my $padlist = $cv->PADLIST; | |
# an undef CV still in lexical chain | |
next if class($padlist) eq "SPECIAL"; | |
my @padlist = $padlist->ARRAY; | |
my @ns = $padlist[0]->ARRAY; | |
for (my $i=0; $i<@ns; ++$i) { | |
next if class($ns[$i]) eq "SPECIAL"; | |
if (class($ns[$i]) eq "PV") { | |
# Probably that pesky lexical @_ | |
next; | |
} | |
my $name = $ns[$i]->PVX; | |
next unless defined $name; | |
my ($seq_st, $seq_en) = | |
($ns[$i]->FLAGS & SVf_FAKE) | |
? (0, 999999) | |
: ($ns[$i]->COP_SEQ_RANGE_LOW, $ns[$i]->COP_SEQ_RANGE_HIGH); | |
push @{$self->{'curcvlex'}{ | |
($ns[$i]->FLAGS & SVpad_OUR ? 'o' : 'm') . $name | |
}}, [$seq_st, $seq_en, $ns[$i]]; | |
} | |
} | |
} | |
sub find_scope_st { ((find_scope(@_))[0]); } | |
sub find_scope_en { ((find_scope(@_))[1]); } | |
# Recurses down the tree, looking for pad variable introductions and COPs | |
sub find_scope { | |
my ($self, $op, $scope_st, $scope_en) = @_; | |
carp("Undefined op in find_scope") if !defined $op; | |
return ($scope_st, $scope_en) unless $op->flags & OPf_KIDS; | |
my @queue = ($op); | |
while(my $op = shift @queue ) { | |
for (my $o=$op->first; $$o; $o=$o->sibling) { | |
if ($o->name =~ /^pad.v$/ && $o->private & OPpLVAL_INTRO) { | |
my $s = int($self->padname_sv($o->targ)->COP_SEQ_RANGE_LOW); | |
my $e = $self->padname_sv($o->targ)->COP_SEQ_RANGE_HIGH; | |
$scope_st = $s if !defined($scope_st) || $s < $scope_st; | |
$scope_en = $e if !defined($scope_en) || $e > $scope_en; | |
return ($scope_st, $scope_en); | |
} | |
elsif (is_state($o)) { | |
my $c = $o->cop_seq; | |
$scope_st = $c if !defined($scope_st) || $c < $scope_st; | |
$scope_en = $c if !defined($scope_en) || $c > $scope_en; | |
return ($scope_st, $scope_en); | |
} | |
elsif ($o->flags & OPf_KIDS) { | |
unshift (@queue, $o); | |
} | |
} | |
} | |
return ($scope_st, $scope_en); | |
} | |
# Returns a list of subs which should be inserted before the COP | |
sub cop_subs { | |
my ($self, $op, $out_seq) = @_; | |
my $seq = $op->cop_seq; | |
$seq = $out_seq if defined($out_seq) && $out_seq < $seq; | |
return $self->seq_subs($seq); | |
} | |
sub seq_subs { | |
my ($self, $seq) = @_; | |
my @text; | |
#push @text, "# ($seq)\n"; | |
return "" if !defined $seq; | |
my @pending; | |
while (scalar(@{$self->{'subs_todo'}}) | |
and $seq > $self->{'subs_todo'}[0][0]) { | |
my $cv = $self->{'subs_todo'}[0][1]; | |
# Skip the OUTSIDE check for lexical subs. We may be deparsing a | |
# cloned anon sub with lexical subs declared in it, in which case | |
# the OUTSIDE pointer points to the anon protosub. | |
my $lexical = ref $self->{'subs_todo'}[0][3]; | |
my $outside = !$lexical && $cv && $cv->OUTSIDE; | |
if (!$lexical and $cv | |
and ${$cv->OUTSIDE || \0} != ${$self->{'curcv'}}) | |
{ | |
push @pending, shift @{$self->{'subs_todo'}}; | |
next; | |
} | |
push @text, $self->next_todo; | |
} | |
unshift @{$self->{'subs_todo'}}, @pending; | |
return @text; | |
} | |
sub _features_from_bundle { | |
my ($hints, $hh) = @_; | |
foreach (@{$feature::feature_bundle{@feature::hint_bundles[$hints >> $feature::hint_shift]}}) { | |
$hh->{$feature::feature{$_}} = 1; | |
} | |
return $hh; | |
} | |
# generate any pragmas, 'package foo' etc needed to synchronise | |
# with the given cop | |
sub pragmata { | |
my $self = shift; | |
my($op) = @_; | |
my @text; | |
my $stash = $op->stashpv; | |
if ($stash ne $self->{'curstash'}) { | |
push @text, $self->keyword("package") . " $stash;\n"; | |
$self->{'curstash'} = $stash; | |
} | |
my $warnings = $op->warnings; | |
my $warning_bits; | |
if ($warnings->isa("B::SPECIAL") && $$warnings == 4) { | |
$warning_bits = $warnings::Bits{"all"} & WARN_MASK; | |
} | |
elsif ($warnings->isa("B::SPECIAL") && $$warnings == 5) { | |
$warning_bits = $warnings::NONE; | |
} | |
elsif ($warnings->isa("B::SPECIAL")) { | |
$warning_bits = undef; | |
} | |
else { | |
$warning_bits = $warnings->PV & WARN_MASK; | |
} | |
if (defined ($warning_bits) and | |
!defined($self->{warnings}) || $self->{'warnings'} ne $warning_bits) { | |
push @text, | |
$self->declare_warnings($self->{'warnings'}, $warning_bits); | |
$self->{'warnings'} = $warning_bits; | |
} | |
my $hints = $op->hints; | |
my $old_hints = $self->{'hints'}; | |
if ($self->{'hints'} != $hints) { | |
push @text, $self->declare_hints($self->{'hints'}, $hints); | |
$self->{'hints'} = $hints; | |
} | |
my $newhh; | |
$newhh = $op->hints_hash->HASH; | |
{ | |
# feature bundle hints | |
my $from = $old_hints & $feature::hint_mask; | |
my $to = $ hints & $feature::hint_mask; | |
if ($from != $to) { | |
if ($to == $feature::hint_mask) { | |
if ($self->{'hinthash'}) { | |
delete $self->{'hinthash'}{$_} | |
for grep /^feature_/, keys %{$self->{'hinthash'}}; | |
} | |
else { $self->{'hinthash'} = {} } | |
$self->{'hinthash'} | |
= _features_from_bundle($from, $self->{'hinthash'}); | |
} | |
else { | |
my $bundle = | |
$feature::hint_bundles[$to >> $feature::hint_shift]; | |
$bundle =~ s/(\d[13579])\z/$1+1/e; # 5.11 => 5.12 | |
push @text, | |
$self->keyword("no") . " feature ':all';\n", | |
$self->keyword("use") . " feature ':$bundle';\n"; | |
} | |
} | |
} | |
{ | |
push @text, $self->declare_hinthash( | |
$self->{'hinthash'}, $newhh, | |
$self->{indent_size}, $self->{hints}, | |
); | |
$self->{'hinthash'} = $newhh; | |
} | |
return join("", @text); | |
} | |
# Notice how subs and formats are inserted between statements here; | |
# also $[ assignments and pragmas. | |
sub pp_nextstate { | |
my $self = shift; | |
my($op, $cx) = @_; | |
$self->{'curcop'} = $op; | |
my @text; | |
my @subs = $self->cop_subs($op); | |
if (@subs) { | |
# Special marker to swallow up the semicolon | |
push @subs, "\cK"; | |
} | |
push @text, @subs; | |
push @text, $self->pragmata($op); | |
# This should go after of any branches that add statements, to | |
# increase the chances that it refers to the same line it did in | |
# the original program. | |
if ($self->{'linenums'} && $cx != .5) { # $cx == .5 means in a format | |
push @text, "\f#line " . $op->line . | |
' "' . $op->file, qq'"\n'; | |
} | |
push @text, $op->label . ": " if $op->label; | |
return join("", @text); | |
} | |
sub declare_warnings { | |
my ($self, $from, $to) = @_; | |
$from //= ''; | |
my $all = (warnings::bits("all") & WARN_MASK); | |
unless ((($from & WARN_MASK) & ~$all) =~ /[^\0]/) { | |
# no FATAL bits need turning off | |
if ( ($to & WARN_MASK) eq $all) { | |
return $self->keyword("use") . " warnings;\n"; | |
} | |
elsif (($to & WARN_MASK) eq ("\0"x length($to) & WARN_MASK)) { | |
return $self->keyword("no") . " warnings;\n"; | |
} | |
} | |
return "BEGIN {\${^WARNING_BITS} = \"" | |
. join("", map { sprintf("\\x%02x", ord $_) } split "", $to) | |
. "\"}\n\cK"; | |
} | |
sub declare_hints { | |
my ($self, $from, $to) = @_; | |
my $use = $to & ~$from; | |
my $no = $from & ~$to; | |
my $decls = ""; | |
for my $pragma (hint_pragmas($use)) { | |
$decls .= $self->keyword("use") . " $pragma;\n"; | |
} | |
for my $pragma (hint_pragmas($no)) { | |
$decls .= $self->keyword("no") . " $pragma;\n"; | |
} | |
return $decls; | |
} | |
# Internal implementation hints that the core sets automatically, so don't need | |
# (or want) to be passed back to the user | |
my %ignored_hints = ( | |
'open<' => 1, | |
'open>' => 1, | |
':' => 1, | |
'strict/refs' => 1, | |
'strict/subs' => 1, | |
'strict/vars' => 1, | |
'feature/bits' => 1, | |
); | |
my %rev_feature; | |
sub declare_hinthash { | |
my ($self, $from, $to, $indent, $hints) = @_; | |
my $doing_features = | |
($hints & $feature::hint_mask) == $feature::hint_mask; | |
my @decls; | |
my @features; | |
my @unfeatures; # bugs? | |
for my $key (sort keys %$to) { | |
next if $ignored_hints{$key}; | |
my $is_feature = $key =~ /^feature_/; | |
next if $is_feature and not $doing_features; | |
if (!exists $from->{$key} or $from->{$key} ne $to->{$key}) { | |
push(@features, $key), next if $is_feature; | |
push @decls, | |
qq(\$^H{) . single_delim("q", "'", $key, $self) . qq(} = ) | |
. ( | |
defined $to->{$key} | |
? single_delim("q", "'", $to->{$key}, $self) | |
: 'undef' | |
) | |
. qq(;); | |
} | |
} | |
for my $key (sort keys %$from) { | |
next if $ignored_hints{$key}; | |
my $is_feature = $key =~ /^feature_/; | |
next if $is_feature and not $doing_features; | |
if (!exists $to->{$key}) { | |
push(@unfeatures, $key), next if $is_feature; | |
push @decls, qq(delete \$^H{'$key'};); | |
} | |
} | |
my @ret; | |
if (@features || @unfeatures) { | |
if (!%rev_feature) { %rev_feature = reverse %feature::feature } | |
} | |
if (@features) { | |
push @ret, $self->keyword("use") . " feature " | |
. join(", ", map "'$rev_feature{$_}'", @features) . ";\n"; | |
} | |
if (@unfeatures) { | |
push @ret, $self->keyword("no") . " feature " | |
. join(", ", map "'$rev_feature{$_}'", @unfeatures) | |
. ";\n"; | |
} | |
@decls and | |
push @ret, | |
join("\n" . (" " x $indent), "BEGIN {", @decls) . "\n}\n\cK"; | |
return @ret; | |
} | |
sub hint_pragmas { | |
my ($bits) = @_; | |
my (@pragmas, @strict); | |
push @pragmas, "integer" if $bits & 0x1; | |
for (sort keys %strict_bits) { | |
push @strict, "'$_'" if $bits & $strict_bits{$_}; | |
} | |
if (@strict == keys %strict_bits) { | |
push @pragmas, "strict"; | |
} | |
elsif (@strict) { | |
push @pragmas, "strict " . join ', ', @strict; | |
} | |
push @pragmas, "bytes" if $bits & 0x8; | |
return @pragmas; | |
} | |
sub pp_dbstate { pp_nextstate(@_) } | |
sub pp_setstate { pp_nextstate(@_) } | |
sub pp_unstack { return "" } # see also leaveloop | |
my %feature_keywords = ( | |
# keyword => 'feature', | |
state => 'state', | |
say => 'say', | |
given => 'switch', | |
when => 'switch', | |
default => 'switch', | |
break => 'switch', | |
evalbytes=>'evalbytes', | |
__SUB__ => '__SUB__', | |
fc => 'fc', | |
try => 'try', | |
catch => 'try', | |
); | |
# keywords that are strong and also have a prototype | |
# | |
my %strong_proto_keywords = map { $_ => 1 } qw( | |
pos | |
prototype | |
scalar | |
study | |
undef | |
); | |
sub feature_enabled { | |
my($self,$name) = @_; | |
my $hh; | |
my $hints = $self->{hints} & $feature::hint_mask; | |
if ($hints && $hints != $feature::hint_mask) { | |
$hh = _features_from_bundle($hints); | |
} | |
elsif ($hints) { $hh = $self->{'hinthash'} } | |
return $hh && $hh->{"feature_$feature_keywords{$name}"} | |
} | |
sub keyword { | |
my $self = shift; | |
my $name = shift; | |
return $name if $name =~ /^CORE::/; # just in case | |
if (exists $feature_keywords{$name}) { | |
return "CORE::$name" if not $self->feature_enabled($name); | |
} | |
# This sub may be called for a program that has no nextstate ops. In | |
# that case we may have a lexical sub named no/use/sub in scope but | |
# $self->lex_in_scope will return false because it depends on the | |
# current nextstate op. So we need this alternate method if there is | |
# no current cop. | |
if (!$self->{'curcop'}) { | |
$self->populate_curcvlex() if !defined $self->{'curcvlex'}; | |
return "CORE::$name" if exists $self->{'curcvlex'}{"m&$name"} | |
|| exists $self->{'curcvlex'}{"o&$name"}; | |
} elsif ($self->lex_in_scope("&$name") | |
|| $self->lex_in_scope("&$name", 1)) { | |
return "CORE::$name"; | |
} | |
if ($strong_proto_keywords{$name} | |
|| ($name !~ /^(?:chom?p|do|exec|glob|s(?:elect|ystem))\z/ | |
&& !defined eval{prototype "CORE::$name"}) | |
) { return $name } | |
if ( | |
exists $self->{subs_declared}{$name} | |
or | |
exists &{"$self->{curstash}::$name"} | |
) { | |
return "CORE::$name" | |
} | |
return $name; | |
} | |
sub baseop { | |
my $self = shift; | |
my($op, $cx, $name) = @_; | |
return $self->keyword($name); | |
} | |
sub pp_stub { "()" } | |
sub pp_wantarray { baseop(@_, "wantarray") } | |
sub pp_fork { baseop(@_, "fork") } | |
sub pp_wait { maybe_targmy(@_, \&baseop, "wait") } | |
sub pp_getppid { maybe_targmy(@_, \&baseop, "getppid") } | |
sub pp_time { maybe_targmy(@_, \&baseop, "time") } | |
sub pp_tms { baseop(@_, "times") } | |
sub pp_ghostent { baseop(@_, "gethostent") } | |
sub pp_gnetent { baseop(@_, "getnetent") } | |
sub pp_gprotoent { baseop(@_, "getprotoent") } | |
sub pp_gservent { baseop(@_, "getservent") } | |
sub pp_ehostent { baseop(@_, "endhostent") } | |
sub pp_enetent { baseop(@_, "endnetent") } | |
sub pp_eprotoent { baseop(@_, "endprotoent") } | |
sub pp_eservent { baseop(@_, "endservent") } | |
sub pp_gpwent { baseop(@_, "getpwent") } | |
sub pp_spwent { baseop(@_, "setpwent") } | |
sub pp_epwent { baseop(@_, "endpwent") } | |
sub pp_ggrent { baseop(@_, "getgrent") } | |
sub pp_sgrent { baseop(@_, "setgrent") } | |
sub pp_egrent { baseop(@_, "endgrent") } | |
sub pp_getlogin { baseop(@_, "getlogin") } | |
sub POSTFIX () { 1 } | |
# I couldn't think of a good short name, but this is the category of | |
# symbolic unary operators with interesting precedence | |
sub pfixop { | |
my $self = shift; | |
my($op, $cx, $name, $prec, $flags) = (@_, 0); | |
my $kid = $op->first; | |
$kid = $self->deparse($kid, $prec); | |
return $self->maybe_parens(($flags & POSTFIX) | |
? "$kid$name" | |
# avoid confusion with filetests | |
: $name eq '-' | |
&& $kid =~ /^[a-zA-Z](?!\w)/ | |
? "$name($kid)" | |
: "$name$kid", | |
$cx, $prec); | |
} | |
sub pp_preinc { pfixop(@_, "++", 23) } | |
sub pp_predec { pfixop(@_, "--", 23) } | |
sub pp_postinc { maybe_targmy(@_, \&pfixop, "++", 23, POSTFIX) } | |
sub pp_postdec { maybe_targmy(@_, \&pfixop, "--", 23, POSTFIX) } | |
sub pp_i_preinc { pfixop(@_, "++", 23) } | |
sub pp_i_predec { pfixop(@_, "--", 23) } | |
sub pp_i_postinc { maybe_targmy(@_, \&pfixop, "++", 23, POSTFIX) } | |
sub pp_i_postdec { maybe_targmy(@_, \&pfixop, "--", 23, POSTFIX) } | |
sub pp_complement { maybe_targmy(@_, \&pfixop, "~", 21) } | |
*pp_ncomplement = *pp_complement; | |
sub pp_scomplement { maybe_targmy(@_, \&pfixop, "~.", 21) } | |
sub pp_negate { maybe_targmy(@_, \&real_negate) } | |
sub real_negate { | |
my $self = shift; | |
my($op, $cx) = @_; | |
if ($op->first->name =~ /^(i_)?negate$/) { | |
# avoid --$x | |
$self->pfixop($op, $cx, "-", 21.5); | |
} else { | |
$self->pfixop($op, $cx, "-", 21); | |
} | |
} | |
sub pp_i_negate { pp_negate(@_) } | |
sub pp_not { | |
my $self = shift; | |
my($op, $cx) = @_; | |
if ($cx <= 4) { | |
$self->listop($op, $cx, "not", $op->first); | |
} else { | |
$self->pfixop($op, $cx, "!", 21); | |
} | |
} | |
sub unop { | |
my $self = shift; | |
my($op, $cx, $name, $nollafr) = @_; | |
my $kid; | |
if ($op->flags & OPf_KIDS) { | |
$kid = $op->first; | |
if (not $name) { | |
# this deals with 'boolkeys' right now | |
return $self->deparse($kid,$cx); | |
} | |
my $builtinname = $name; | |
$builtinname =~ /^CORE::/ or $builtinname = "CORE::$name"; | |
if (defined prototype($builtinname) | |
&& $builtinname ne 'CORE::readline' | |
&& prototype($builtinname) =~ /^;?\*/ | |
&& $kid->name eq "rv2gv") { | |
$kid = $kid->first; | |
} | |
if ($nollafr) { | |
if (($kid = $self->deparse($kid, 16)) !~ s/^\cS//) { | |
# require foo() is a syntax error. | |
$kid =~ /^(?!\d)\w/ and $kid = "($kid)"; | |
} | |
return $self->maybe_parens( | |
$self->keyword($name) . " $kid", $cx, 16 | |
); | |
} | |
return $self->maybe_parens_unop($name, $kid, $cx); | |
} else { | |
return $self->maybe_parens( | |
$self->keyword($name) . ($op->flags & OPf_SPECIAL ? "()" : ""), | |
$cx, 16, | |
); | |
} | |
} | |
sub pp_chop { maybe_targmy(@_, \&unop, "chop") } | |
sub pp_chomp { maybe_targmy(@_, \&unop, "chomp") } | |
sub pp_schop { maybe_targmy(@_, \&unop, "chop") } | |
sub pp_schomp { maybe_targmy(@_, \&unop, "chomp") } | |
sub pp_defined { unop(@_, "defined") } | |
sub pp_undef { unop(@_, "undef") } | |
sub pp_study { unop(@_, "study") } | |
sub pp_ref { unop(@_, "ref") } | |
sub pp_pos { maybe_local(@_, unop(@_, "pos")) } | |
sub pp_sin { maybe_targmy(@_, \&unop, "sin") } | |
sub pp_cos { maybe_targmy(@_, \&unop, "cos") } | |
sub pp_rand { maybe_targmy(@_, \&unop, "rand") } | |
sub pp_srand { unop(@_, "srand") } | |
sub pp_exp { maybe_targmy(@_, \&unop, "exp") } | |
sub pp_log { maybe_targmy(@_, \&unop, "log") } | |
sub pp_sqrt { maybe_targmy(@_, \&unop, "sqrt") } | |
sub pp_int { maybe_targmy(@_, \&unop, "int") } | |
sub pp_hex { maybe_targmy(@_, \&unop, "hex") } | |
sub pp_oct { maybe_targmy(@_, \&unop, "oct") } | |
sub pp_abs { maybe_targmy(@_, \&unop, "abs") } | |
sub pp_length { maybe_targmy(@_, \&unop, "length") } | |
sub pp_ord { maybe_targmy(@_, \&unop, "ord") } | |
sub pp_chr { maybe_targmy(@_, \&unop, "chr") } | |
sub pp_each { unop(@_, "each") } | |
sub pp_values { unop(@_, "values") } | |
sub pp_keys { unop(@_, "keys") } | |
{ no strict 'refs'; *{"pp_r$_"} = *{"pp_$_"} for qw< keys each values >; } | |
sub pp_boolkeys { | |
# no name because its an optimisation op that has no keyword | |
unop(@_,""); | |
} | |
sub pp_aeach { unop(@_, "each") } | |
sub pp_avalues { unop(@_, "values") } | |
sub pp_akeys { unop(@_, "keys") } | |
sub pp_pop { unop(@_, "pop") } | |
sub pp_shift { unop(@_, "shift") } | |
sub pp_caller { unop(@_, "caller") } | |
sub pp_reset { unop(@_, "reset") } | |
sub pp_exit { unop(@_, "exit") } | |
sub pp_prototype { unop(@_, "prototype") } | |
sub pp_close { unop(@_, "close") } | |
sub pp_fileno { unop(@_, "fileno") } | |
sub pp_umask { unop(@_, "umask") } | |
sub pp_untie { unop(@_, "untie") } | |
sub pp_tied { unop(@_, "tied") } | |
sub pp_dbmclose { unop(@_, "dbmclose") } | |
sub pp_getc { unop(@_, "getc") } | |
sub pp_eof { unop(@_, "eof") } | |
sub pp_tell { unop(@_, "tell") } | |
sub pp_getsockname { unop(@_, "getsockname") } | |
sub pp_getpeername { unop(@_, "getpeername") } | |
sub pp_chdir { | |
my ($self, $op, $cx) = @_; | |
if (($op->flags & (OPf_SPECIAL|OPf_KIDS)) == (OPf_SPECIAL|OPf_KIDS)) { | |
my $kw = $self->keyword("chdir"); | |
my $kid = $self->const_sv($op->first)->PV; | |
my $code = $kw | |
. ($cx >= 16 || $self->{'parens'} ? "($kid)" : " $kid"); | |
maybe_targmy(@_, sub { $_[3] }, $code); | |
} else { | |
maybe_targmy(@_, \&unop, "chdir") | |
} | |
} | |
sub pp_chroot { maybe_targmy(@_, \&unop, "chroot") } | |
sub pp_readlink { unop(@_, "readlink") } | |
sub pp_rmdir { maybe_targmy(@_, \&unop, "rmdir") } | |
sub pp_readdir { unop(@_, "readdir") } | |
sub pp_telldir { unop(@_, "telldir") } | |
sub pp_rewinddir { unop(@_, "rewinddir") } | |
sub pp_closedir { unop(@_, "closedir") } | |
sub pp_getpgrp { maybe_targmy(@_, \&unop, "getpgrp") } | |
sub pp_localtime { unop(@_, "localtime") } | |
sub pp_gmtime { unop(@_, "gmtime") } | |
sub pp_alarm { unop(@_, "alarm") } | |
sub pp_sleep { maybe_targmy(@_, \&unop, "sleep") } | |
sub pp_dofile { | |
my $code = unop(@_, "do", 1); # llafr does not apply | |
if ($code =~ s/^((?:CORE::)?do) \{/$1({/) { $code .= ')' } | |
$code; | |
} | |
sub pp_entereval { | |
unop( | |
@_, | |
$_[1]->private & OPpEVAL_BYTES ? 'evalbytes' : "eval" | |
) | |
} | |
sub pp_ghbyname { unop(@_, "gethostbyname") } | |
sub pp_gnbyname { unop(@_, "getnetbyname") } | |
sub pp_gpbyname { unop(@_, "getprotobyname") } | |
sub pp_shostent { unop(@_, "sethostent") } | |
sub pp_snetent { unop(@_, "setnetent") } | |
sub pp_sprotoent { unop(@_, "setprotoent") } | |
sub pp_sservent { unop(@_, "setservent") } | |
sub pp_gpwnam { unop(@_, "getpwnam") } | |
sub pp_gpwuid { unop(@_, "getpwuid") } | |
sub pp_ggrnam { unop(@_, "getgrnam") } | |
sub pp_ggrgid { unop(@_, "getgrgid") } | |
sub pp_lock { unop(@_, "lock") } | |
sub pp_continue { unop(@_, "continue"); } | |
sub pp_break { unop(@_, "break"); } | |
sub givwhen { | |
my $self = shift; | |
my($op, $cx, $givwhen) = @_; | |
my $enterop = $op->first; | |
my ($head, $block); | |
if ($enterop->flags & OPf_SPECIAL) { | |
$head = $self->keyword("default"); | |
$block = $self->deparse($enterop->first, 0); | |
} | |
else { | |
my $cond = $enterop->first; | |
my $cond_str = $self->deparse($cond, 1); | |
$head = "$givwhen ($cond_str)"; | |
$block = $self->deparse($cond->sibling, 0); | |
} | |
return "$head {\n". | |
"\t$block\n". | |
"\b}\cK"; | |
} | |
sub pp_leavegiven { givwhen(@_, $_[0]->keyword("given")); } | |
sub pp_leavewhen { givwhen(@_, $_[0]->keyword("when")); } | |
sub pp_exists { | |
my $self = shift; | |
my($op, $cx) = @_; | |
my $arg; | |
my $name = $self->keyword("exists"); | |
if ($op->private & OPpEXISTS_SUB) { | |
# Checking for the existence of a subroutine | |
return $self->maybe_parens_func($name, | |
$self->pp_rv2cv($op->first, 16), $cx, 16); | |
} | |
if ($op->flags & OPf_SPECIAL) { | |
# Array element, not hash element | |
return $self->maybe_parens_func($name, | |
$self->pp_aelem($op->first, 16), $cx, 16); | |
} | |
return $self->maybe_parens_func($name, $self->pp_helem($op->first, 16), | |
$cx, 16); | |
} | |
sub pp_delete { | |
my $self = shift; | |
my($op, $cx) = @_; | |
my $arg; | |
my $name = $self->keyword("delete"); | |
if ($op->private & (OPpSLICE|OPpKVSLICE)) { | |
if ($op->flags & OPf_SPECIAL) { | |
# Deleting from an array, not a hash | |
return $self->maybe_parens_func($name, | |
$self->pp_aslice($op->first, 16), | |
$cx, 16); | |
} | |
return $self->maybe_parens_func($name, | |
$self->pp_hslice($op->first, 16), | |
$cx, 16); | |
} else { | |
if ($op->flags & OPf_SPECIAL) { | |
# Deleting from an array, not a hash | |
return $self->maybe_parens_func($name, | |
$self->pp_aelem($op->first, 16), | |
$cx, 16); | |
} | |
return $self->maybe_parens_func($name, | |
$self->pp_helem($op->first, 16), | |
$cx, 16); | |
} | |
} | |
sub pp_require { | |
my $self = shift; | |
my($op, $cx) = @_; | |
my $opname = $op->flags & OPf_SPECIAL ? 'CORE::require' : 'require'; | |
my $kid = $op->first; | |
if ($kid->name eq 'const') { | |
my $priv = $kid->private; | |
my $sv = $self->const_sv($kid); | |
my $arg; | |
if ($priv & OPpCONST_BARE) { | |
$arg = $sv->PV; | |
$arg =~ s[/][::]g; | |
$arg =~ s/\.pm//g; | |
} elsif ($priv & OPpCONST_NOVER) { | |
$opname = $self->keyword('no'); | |
$arg = $self->const($sv, 16); | |
} elsif ((my $tmp = $self->const($sv, 16)) =~ /^v/) { | |
$arg = $tmp; | |
} | |
if ($arg) { | |
return $self->maybe_parens("$opname $arg", $cx, 16); | |
} | |
} | |
$self->unop( | |
$op, $cx, | |
$opname, | |
1, # llafr does not apply | |
); | |
} | |
sub pp_scalar { | |
my $self = shift; | |
my($op, $cx) = @_; | |
my $kid = $op->first; | |
if (not null $kid->sibling) { | |
# XXX Was a here-doc | |
return $self->dquote($op); | |
} | |
$self->unop(@_, "scalar"); | |
} | |
sub padval { | |
my $self = shift; | |
my $targ = shift; | |
return $self->{'curcv'}->PADLIST->ARRAYelt(1)->ARRAYelt($targ); | |
} | |
sub anon_hash_or_list { | |
my $self = shift; | |
my($op, $cx) = @_; | |
my($pre, $post) = @{{"anonlist" => ["[","]"], | |
"anonhash" => ["{","}"]}->{$op->name}}; | |
my($expr, @exprs); | |
$op = $op->first->sibling; # skip pushmark | |
for (; !null($op); $op = $op->sibling) { | |
$expr = $self->deparse($op, 6); | |
push @exprs, $expr; | |
} | |
if ($pre eq "{" and $cx < 1) { | |
# Disambiguate that it's not a block | |
$pre = "+{"; | |
} | |
return $pre . join(", ", @exprs) . $post; | |
} | |
sub pp_anonlist { | |
my $self = shift; | |
my ($op, $cx) = @_; | |
if ($op->flags & OPf_SPECIAL) { | |
return $self->anon_hash_or_list($op, $cx); | |
} | |
warn "Unexpected op pp_" . $op->name() . " without OPf_SPECIAL"; | |
return 'XXX'; | |
} | |
*pp_anonhash = \&pp_anonlist; | |
sub pp_refgen { | |
my $self = shift; | |
my($op, $cx) = @_; | |
my $kid = $op->first; | |
if ($kid->name eq "null") { | |
my $anoncode = $kid = $kid->first; | |
if ($anoncode->name eq "anonconst") { | |
$anoncode = $anoncode->first->first->sibling; | |
} | |
if ($anoncode->name eq "anoncode" | |
or !null($anoncode = $kid->sibling) and | |
$anoncode->name eq "anoncode") { | |
return $self->e_anoncode({ code => $self->padval($anoncode->targ) }); | |
} elsif ($kid->name eq "pushmark") { | |
my $sib_name = $kid->sibling->name; | |
if ($sib_name eq 'entersub') { | |
my $text = $self->deparse($kid->sibling, 1); | |
# Always show parens for \(&func()), but only with -p otherwise | |
$text = "($text)" if $self->{'parens'} | |
or $kid->sibling->private & OPpENTERSUB_AMPER; | |
return "\\$text"; | |
} | |
} | |
} | |
local $self->{'in_refgen'} = 1; | |
$self->pfixop($op, $cx, "\\", 20); | |
} | |
sub e_anoncode { | |
my ($self, $info) = @_; | |
my $text = $self->deparse_sub($info->{code}); | |
return $self->keyword("sub") . " $text"; | |
} | |
sub pp_srefgen { pp_refgen(@_) } | |
sub pp_readline { | |
my $self = shift; | |
my($op, $cx) = @_; | |
my $kid = $op->first; | |
if (is_scalar($kid) | |
and $op->flags & OPf_SPECIAL | |
and $self->deparse($kid, 1) eq 'ARGV') | |
{ | |
return '<<>>'; | |
} | |
return $self->unop($op, $cx, "readline"); | |
} | |
sub pp_rcatline { | |
my $self = shift; | |
my($op) = @_; | |
return "<" . $self->gv_name($self->gv_or_padgv($op)) . ">"; | |
} | |
# Unary operators that can occur as pseudo-listops inside double quotes | |
sub dq_unop { | |
my $self = shift; | |
my($op, $cx, $name, $prec, $flags) = (@_, 0, 0); | |
my $kid; | |
if ($op->flags & OPf_KIDS) { | |
$kid = $op->first; | |
# If there's more than one kid, the first is an ex-pushmark. | |
$kid = $kid->sibling if not null $kid->sibling; | |
return $self->maybe_parens_unop($name, $kid, $cx); | |
} else { | |
return $name . ($op->flags & OPf_SPECIAL ? "()" : ""); | |
} | |
} | |
sub pp_ucfirst { dq_unop(@_, "ucfirst") } | |
sub pp_lcfirst { dq_unop(@_, "lcfirst") } | |
sub pp_uc { dq_unop(@_, "uc") } | |
sub pp_lc { dq_unop(@_, "lc") } | |
sub pp_quotemeta { maybe_targmy(@_, \&dq_unop, "quotemeta") } | |
sub pp_fc { dq_unop(@_, "fc") } | |
sub loopex { | |
my $self = shift; | |
my ($op, $cx, $name) = @_; | |
if (class($op) eq "PVOP") { | |
$name .= " " . $op->pv; | |
} elsif (class($op) eq "OP") { | |
# no-op | |
} elsif (class($op) eq "UNOP") { | |
(my $kid = $self->deparse($op->first, 7)) =~ s/^\cS//; | |
# last foo() is a syntax error. | |
$kid =~ /^(?!\d)\w/ and $kid = "($kid)"; | |
$name .= " $kid"; | |
} | |
return $self->maybe_parens($name, $cx, 7); | |
} | |
sub pp_last { loopex(@_, "last") } | |
sub pp_next { loopex(@_, "next") } | |
sub pp_redo { loopex(@_, "redo") } | |
sub pp_goto { loopex(@_, "goto") } | |
sub pp_dump { loopex(@_, "CORE::dump") } | |
sub ftst { | |
my $self = shift; | |
my($op, $cx, $name) = @_; | |
if (class($op) eq "UNOP") { | |
# Genuine '-X' filetests are exempt from the LLAFR, but not | |
# l?stat() | |
if ($name =~ /^-/) { | |
(my $kid = $self->deparse($op->first, 16)) =~ s/^\cS//; | |
return $self->maybe_parens("$name $kid", $cx, 16); | |
} | |
return $self->maybe_parens_unop($name, $op->first, $cx); | |
} elsif (class($op) =~ /^(SV|PAD)OP$/) { | |
return $self->maybe_parens_func($name, $self->pp_gv($op, 1), $cx, 16); | |
} else { # I don't think baseop filetests ever survive ck_ftst, but... | |
return $name; | |
} | |
} | |
sub pp_lstat { ftst(@_, "lstat") } | |
sub pp_stat { ftst(@_, "stat") } | |
sub pp_ftrread { ftst(@_, "-R") } | |
sub pp_ftrwrite { ftst(@_, "-W") } | |
sub pp_ftrexec { ftst(@_, "-X") } | |
sub pp_fteread { ftst(@_, "-r") } | |
sub pp_ftewrite { ftst(@_, "-w") } | |
sub pp_fteexec { ftst(@_, "-x") } | |
sub pp_ftis { ftst(@_, "-e") } | |
sub pp_fteowned { ftst(@_, "-O") } | |
sub pp_ftrowned { ftst(@_, "-o") } | |
sub pp_ftzero { ftst(@_, "-z") } | |
sub pp_ftsize { ftst(@_, "-s") } | |
sub pp_ftmtime { ftst(@_, "-M") } | |
sub pp_ftatime { ftst(@_, "-A") } | |
sub pp_ftctime { ftst(@_, "-C") } | |
sub pp_ftsock { ftst(@_, "-S") } | |
sub pp_ftchr { ftst(@_, "-c") } | |
sub pp_ftblk { ftst(@_, "-b") } | |
sub pp_ftfile { ftst(@_, "-f") } | |
sub pp_ftdir { ftst(@_, "-d") } | |
sub pp_ftpipe { ftst(@_, "-p") } | |
sub pp_ftlink { ftst(@_, "-l") } | |
sub pp_ftsuid { ftst(@_, "-u") } | |
sub pp_ftsgid { ftst(@_, "-g") } | |
sub pp_ftsvtx { ftst(@_, "-k") } | |
sub pp_fttty { ftst(@_, "-t") } | |
sub pp_fttext { ftst(@_, "-T") } | |
sub pp_ftbinary { ftst(@_, "-B") } | |
sub SWAP_CHILDREN () { 1 } | |
sub ASSIGN () { 2 } # has OP= variant | |
sub LIST_CONTEXT () { 4 } # Assignment is in list context | |
my(%left, %right); | |
sub assoc_class { | |
my $op = shift; | |
my $name = $op->name; | |
if ($name eq "concat" and $op->first->name eq "concat") { | |
# avoid spurious '=' -- see comment in pp_concat | |
return "concat"; | |
} | |
if ($name eq "null" and class($op) eq "UNOP" | |
and $op->first->name =~ /^(and|x?or)$/ | |
and null $op->first->sibling) | |
{ | |
# Like all conditional constructs, OP_ANDs and OP_ORs are topped | |
# with a null that's used as the common end point of the two | |
# flows of control. For precedence purposes, ignore it. | |
# (COND_EXPRs have these too, but we don't bother with | |
# their associativity). | |
return assoc_class($op->first); | |
} | |
return $name . ($op->flags & OPf_STACKED ? "=" : ""); | |
} | |
# Left associative operators, like '+', for which | |
# $a + $b + $c is equivalent to ($a + $b) + $c | |
BEGIN { | |
%left = ('multiply' => 19, 'i_multiply' => 19, | |
'divide' => 19, 'i_divide' => 19, | |
'modulo' => 19, 'i_modulo' => 19, | |
'repeat' => 19, | |
'add' => 18, 'i_add' => 18, | |
'subtract' => 18, 'i_subtract' => 18, | |
'concat' => 18, | |
'left_shift' => 17, 'right_shift' => 17, | |
'bit_and' => 13, 'nbit_and' => 13, 'sbit_and' => 13, | |
'bit_or' => 12, 'bit_xor' => 12, | |
'sbit_or' => 12, 'sbit_xor' => 12, | |
'nbit_or' => 12, 'nbit_xor' => 12, | |
'and' => 3, | |
'or' => 2, 'xor' => 2, | |
); | |
} | |
sub deparse_binop_left { | |
my $self = shift; | |
my($op, $left, $prec) = @_; | |
if ($left{assoc_class($op)} && $left{assoc_class($left)} | |
and $left{assoc_class($op)} == $left{assoc_class($left)}) | |
{ | |
return $self->deparse($left, $prec - .00001); | |
} else { | |
return $self->deparse($left, $prec); | |
} | |
} | |
# Right associative operators, like '=', for which | |
# $a = $b = $c is equivalent to $a = ($b = $c) | |
BEGIN { | |
%right = ('pow' => 22, | |
'sassign=' => 7, 'aassign=' => 7, | |
'multiply=' => 7, 'i_multiply=' => 7, | |
'divide=' => 7, 'i_divide=' => 7, | |
'modulo=' => 7, 'i_modulo=' => 7, | |
'repeat=' => 7, 'refassign' => 7, 'refassign=' => 7, | |
'add=' => 7, 'i_add=' => 7, | |
'subtract=' => 7, 'i_subtract=' => 7, | |
'concat=' => 7, | |
'left_shift=' => 7, 'right_shift=' => 7, | |
'bit_and=' => 7, 'sbit_and=' => 7, 'nbit_and=' => 7, | |
'nbit_or=' => 7, 'nbit_xor=' => 7, | |
'sbit_or=' => 7, 'sbit_xor=' => 7, | |
'andassign' => 7, | |
'orassign' => 7, | |
); | |
} | |
sub deparse_binop_right { | |
my $self = shift; | |
my($op, $right, $prec) = @_; | |
if ($right{assoc_class($op)} && $right{assoc_class($right)} | |
and $right{assoc_class($op)} == $right{assoc_class($right)}) | |
{ | |
return $self->deparse($right, $prec - .00001); | |
} else { | |
return $self->deparse($right, $prec); | |
} | |
} | |
sub binop { | |
my $self = shift; | |
my ($op, $cx, $opname, $prec, $flags) = (@_, 0); | |
my $left = $op->first; | |
my $right = $op->last; | |
my $eq = ""; | |
if ($op->flags & OPf_STACKED && $flags & ASSIGN) { | |
$eq = "="; | |
$prec = 7; | |
} | |
if ($flags & SWAP_CHILDREN) { | |
($left, $right) = ($right, $left); | |
} | |
my $leftop = $left; | |
$left = $self->deparse_binop_left($op, $left, $prec); | |
$left = "($left)" if $flags & LIST_CONTEXT | |
and $left !~ /^(my|our|local|state|)\s*[\@%\(]/ | |
|| do { | |
# Parenthesize if the left argument is a | |
# lone repeat op. | |
my $left = $leftop->first->sibling; | |
$left->name eq 'repeat' | |
&& null($left->sibling); | |
}; | |
$right = $self->deparse_binop_right($op, $right, $prec); | |
return $self->maybe_parens("$left $opname$eq $right", $cx, $prec); | |
} | |
sub pp_add { maybe_targmy(@_, \&binop, "+", 18, ASSIGN) } | |
sub pp_multiply { maybe_targmy(@_, \&binop, "*", 19, ASSIGN) } | |
sub pp_subtract { maybe_targmy(@_, \&binop, "-",18, ASSIGN) } | |
sub pp_divide { maybe_targmy(@_, \&binop, "/", 19, ASSIGN) } | |
sub pp_modulo { maybe_targmy(@_, \&binop, "%", 19, ASSIGN) } | |
sub pp_i_add { maybe_targmy(@_, \&binop, "+", 18, ASSIGN) } | |
sub pp_i_multiply { maybe_targmy(@_, \&binop, "*", 19, ASSIGN) } | |
sub pp_i_subtract { maybe_targmy(@_, \&binop, "-", 18, ASSIGN) } | |
sub pp_i_divide { maybe_targmy(@_, \&binop, "/", 19, ASSIGN) } | |
sub pp_i_modulo { maybe_targmy(@_, \&binop, "%", 19, ASSIGN) } | |
sub pp_pow { maybe_targmy(@_, \&binop, "**", 22, ASSIGN) } | |
sub pp_left_shift { maybe_targmy(@_, \&binop, "<<", 17, ASSIGN) } | |
sub pp_right_shift { maybe_targmy(@_, \&binop, ">>", 17, ASSIGN) } | |
sub pp_bit_and { maybe_targmy(@_, \&binop, "&", 13, ASSIGN) } | |
sub pp_bit_or { maybe_targmy(@_, \&binop, "|", 12, ASSIGN) } | |
sub pp_bit_xor { maybe_targmy(@_, \&binop, "^", 12, ASSIGN) } | |
*pp_nbit_and = *pp_bit_and; | |
*pp_nbit_or = *pp_bit_or; | |
*pp_nbit_xor = *pp_bit_xor; | |
sub pp_sbit_and { maybe_targmy(@_, \&binop, "&.", 13, ASSIGN) } | |
sub pp_sbit_or { maybe_targmy(@_, \&binop, "|.", 12, ASSIGN) } | |
sub pp_sbit_xor { maybe_targmy(@_, \&binop, "^.", 12, ASSIGN) } | |
sub pp_eq { binop(@_, "==", 14) } | |
sub pp_ne { binop(@_, "!=", 14) } | |
sub pp_lt { binop(@_, "<", 15) } | |
sub pp_gt { binop(@_, ">", 15) } | |
sub pp_ge { binop(@_, ">=", 15) } | |
sub pp_le { binop(@_, "<=", 15) } | |
sub pp_ncmp { binop(@_, "<=>", 14) } | |
sub pp_i_eq { binop(@_, "==", 14) } | |
sub pp_i_ne { binop(@_, "!=", 14) } | |
sub pp_i_lt { binop(@_, "<", 15) } | |
sub pp_i_gt { binop(@_, ">", 15) } | |
sub pp_i_ge { binop(@_, ">=", 15) } | |
sub pp_i_le { binop(@_, "<=", 15) } | |
sub pp_i_ncmp { maybe_targmy(@_, \&binop, "<=>", 14) } | |
sub pp_seq { binop(@_, "eq", 14) } | |
sub pp_sne { binop(@_, "ne", 14) } | |
sub pp_slt { binop(@_, "lt", 15) } | |
sub pp_sgt { binop(@_, "gt", 15) } | |
sub pp_sge { binop(@_, "ge", 15) } | |
sub pp_sle { binop(@_, "le", 15) } | |
sub pp_scmp { maybe_targmy(@_, \&binop, "cmp", 14) } | |
sub pp_isa { binop(@_, "isa", 15) } | |
sub pp_sassign { binop(@_, "=", 7, SWAP_CHILDREN) } | |
sub pp_aassign { binop(@_, "=", 7, SWAP_CHILDREN | LIST_CONTEXT) } | |
sub pp_smartmatch { | |
my ($self, $op, $cx) = @_; | |
if (($op->flags & OPf_SPECIAL) && $self->{expand} < 2) { | |
return $self->deparse($op->last, $cx); | |
} | |
else { | |
binop(@_, "~~", 14); | |
} | |
} | |
# '.' is special because concats-of-concats are optimized to save copying | |
# by making all but the first concat stacked. The effect is as if the | |
# programmer had written '($a . $b) .= $c', except legal. | |
sub pp_concat { maybe_targmy(@_, \&real_concat) } | |
sub real_concat { | |
my $self = shift; | |
my($op, $cx) = @_; | |
my $left = $op->first; | |
my $right = $op->last; | |
my $eq = ""; | |
my $prec = 18; | |
if (($op->flags & OPf_STACKED) and !($op->private & OPpCONCAT_NESTED)) { | |
# '.=' rather than optimised '.' | |
$eq = "="; | |
$prec = 7; | |
} | |
$left = $self->deparse_binop_left($op, $left, $prec); | |
$right = $self->deparse_binop_right($op, $right, $prec); | |
return $self->maybe_parens("$left .$eq $right", $cx, $prec); | |
} | |
sub pp_repeat { maybe_targmy(@_, \&repeat) } | |
# 'x' is weird when the left arg is a list | |
sub repeat { | |
my $self = shift; | |
my($op, $cx) = @_; | |
my $left = $op->first; | |
my $right = $op->last; | |
my $eq = ""; | |
my $prec = 19; | |
if ($op->flags & OPf_STACKED) { | |
$eq = "="; | |
$prec = 7; | |
} | |
if (null($right)) { # list repeat; count is inside left-side ex-list | |
# in 5.21.5 and earlier | |
my $kid = $left->first->sibling; # skip pushmark | |
my @exprs; | |
for (; !null($kid->sibling); $kid = $kid->sibling) { | |
push @exprs, $self->deparse($kid, 6); | |
} | |
$right = $kid; | |
$left = "(" . join(", ", @exprs). ")"; | |
} else { | |
my $dolist = $op->private & OPpREPEAT_DOLIST; | |
$left = $self->deparse_binop_left($op, $left, $dolist ? 1 : $prec); | |
if ($dolist) { | |
$left = "($left)"; | |
} | |
} | |
$right = $self->deparse_binop_right($op, $right, $prec); | |
return $self->maybe_parens("$left x$eq $right", $cx, $prec); | |
} | |
sub range { | |
my $self = shift; | |
my ($op, $cx, $type) = @_; | |
my $left = $op->first; | |
my $right = $left->sibling; | |
$left = $self->deparse($left, 9); | |
$right = $self->deparse($right, 9); | |
return $self->maybe_parens("$left $type $right", $cx, 9); | |
} | |
sub pp_flop { | |
my $self = shift; | |
my($op, $cx) = @_; | |
my $flip = $op->first; | |
my $type = ($flip->flags & OPf_SPECIAL) ? "..." : ".."; | |
return $self->range($flip->first, $cx, $type); | |
} | |
# one-line while/until is handled in pp_leave | |
sub logop { | |
my $self = shift; | |
my ($op, $cx, $lowop, $lowprec, $highop, $highprec, $blockname) = @_; | |
my $left = $op->first; | |
my $right = $op->first->sibling; | |
$blockname &&= $self->keyword($blockname); | |
if ($cx < 1 and is_scope($right) and $blockname | |
and $self->{'expand'} < 7) | |
{ # if ($a) {$b} | |
$left = $self->deparse($left, 1); | |
$right = $self->deparse($right, 0); | |
return "$blockname ($left) {\n\t$right\n\b}\cK"; | |
} elsif ($cx < 1 and $blockname and not $self->{'parens'} | |
and $self->{'expand'} < 7) { # $b if $a | |
$right = $self->deparse($right, 1); | |
$left = $self->deparse($left, 1); | |
return "$right $blockname $left"; | |
} elsif ($cx > $lowprec and $highop) { # $a && $b | |
$left = $self->deparse_binop_left($op, $left, $highprec); | |
$right = $self->deparse_binop_right($op, $right, $highprec); | |
return $self->maybe_parens("$left $highop $right", $cx, $highprec); | |
} else { # $a and $b | |
$left = $self->deparse_binop_left($op, $left, $lowprec); | |
$right = $self->deparse_binop_right($op, $right, $lowprec); | |
return $self->maybe_parens("$left $lowop $right", $cx, $lowprec); | |
} | |
} | |
sub pp_and { logop(@_, "and", 3, "&&", 11, "if") } | |
sub pp_or { logop(@_, "or", 2, "||", 10, "unless") } | |
sub pp_dor { logop(@_, "//", 10) } | |
# xor is syntactically a logop, but it's really a binop (contrary to | |
# old versions of opcode.pl). Syntax is what matters here. | |
sub pp_xor { logop(@_, "xor", 2, "", 0, "") } | |
sub logassignop { | |
my $self = shift; | |
my ($op, $cx, $opname) = @_; | |
my $left = $op->first; | |
my $right = $op->first->sibling->first; # skip sassign | |
$left = $self->deparse($left, 7); | |
$right = $self->deparse($right, 7); | |
return $self->maybe_parens("$left $opname $right", $cx, 7); | |
} | |
sub pp_andassign { logassignop(@_, "&&=") } | |
sub pp_orassign { logassignop(@_, "||=") } | |
sub pp_dorassign { logassignop(@_, "//=") } | |
my %cmpchain_cmpops = ( | |
eq => ["==", 14], | |
i_eq => ["==", 14], | |
ne => ["!=", 14], | |
i_ne => ["!=", 14], | |
seq => ["eq", 14], | |
sne => ["ne", 14], | |
lt => ["<", 15], | |
i_lt => ["<", 15], | |
gt => [">", 15], | |
i_gt => [">", 15], | |
le => ["<=", 15], | |
i_le => ["<=", 15], | |
ge => [">=", 15], | |
i_ge => [">=", 15], | |
slt => ["lt", 15], | |
sgt => ["gt", 15], | |
sle => ["le", 15], | |
sge => ["ge", 15], | |
); | |
sub pp_cmpchain_and { | |
my($self, $op, $cx) = @_; | |
my($prec, $dep); | |
while(1) { | |
my($thiscmp, $rightcond); | |
if($op->name eq "cmpchain_and") { | |
$thiscmp = $op->first; | |
$rightcond = $thiscmp->sibling; | |
} else { | |
$thiscmp = $op; | |
} | |
my $thiscmptype = $cmpchain_cmpops{$thiscmp->name} // (return "XXX"); | |
if(defined $prec) { | |
$thiscmptype->[1] == $prec or return "XXX"; | |
$thiscmp->first->name eq "null" && | |
!($thiscmp->first->flags & OPf_KIDS) | |
or return "XXX"; | |
} else { | |
$prec = $thiscmptype->[1]; | |
$dep = $self->deparse($thiscmp->first, $prec); | |
} | |
$dep .= " ".$thiscmptype->[0]." "; | |
my $operand = $thiscmp->last; | |
if(defined $rightcond) { | |
$operand->name eq "cmpchain_dup" or return "XXX"; | |
$operand = $operand->first; | |
} | |
$dep .= $self->deparse($operand, $prec); | |
last unless defined $rightcond; | |
if($rightcond->name eq "null" && ($rightcond->flags & OPf_KIDS) && | |
$rightcond->first->name eq "cmpchain_and") { | |
$rightcond = $rightcond->first; | |
} | |
$op = $rightcond; | |
} | |
return $self->maybe_parens($dep, $cx, $prec); | |
} | |
sub rv2gv_or_string { | |
my($self,$op) = @_; | |
if ($op->name eq "gv") { # could be open("open") or open("###") | |
my($name,$quoted) = | |
$self->stash_variable_name("", $self->gv_or_padgv($op)); | |
$quoted ? $name : "*$name"; | |
} | |
else { | |
$self->deparse($op, 6); | |
} | |
} | |
sub listop { | |
my $self = shift; | |
my($op, $cx, $name, $kid, $nollafr) = @_; | |
my(@exprs); | |
my $parens = ($cx >= 5) || $self->{'parens'}; | |
$kid ||= $op->first->sibling; | |
# If there are no arguments, add final parentheses (or parenthesize the | |
# whole thing if the llafr does not apply) to account for cases like | |
# (return)+1 or setpgrp()+1. When the llafr does not apply, we use a | |
# precedence of 6 (< comma), as "return, 1" does not need parentheses. | |
if (null $kid) { | |
return $nollafr | |
? $self->maybe_parens($self->keyword($name), $cx, 7) | |
: $self->keyword($name) . '()' x (7 < $cx); | |
} | |
my $first; | |
my $fullname = $self->keyword($name); | |
my $proto = prototype("CORE::$name"); | |
if ( | |
( (defined $proto && $proto =~ /^;?\*/) | |
|| $name eq 'select' # select(F) doesn't have a proto | |
) | |
&& $kid->name eq "rv2gv" | |
&& !($kid->private & OPpLVAL_INTRO) | |
) { | |
$first = $self->rv2gv_or_string($kid->first); | |
} | |
else { | |
$first = $self->deparse($kid, 6); | |
} | |
if ($name eq "chmod" && $first =~ /^\d+$/) { | |
$first = sprintf("%#o", $first); | |
} | |
$first = "+$first" | |
if not $parens and not $nollafr and substr($first, 0, 1) eq "("; | |
push @exprs, $first; | |
$kid = $kid->sibling; | |
if (defined $proto && $proto =~ /^\*\*/ && $kid->name eq "rv2gv" | |
&& !($kid->private & OPpLVAL_INTRO)) { | |
push @exprs, $first = $self->rv2gv_or_string($kid->first); | |
$kid = $kid->sibling; | |
} | |
for (; !null($kid); $kid = $kid->sibling) { | |
push @exprs, $self->deparse($kid, 6); | |
} | |
if ($name eq "reverse" && ($op->private & OPpREVERSE_INPLACE)) { | |
return "$exprs[0] = $fullname" | |
. ($parens ? "($exprs[0])" : " $exprs[0]"); | |
} | |
if ($parens && $nollafr) { | |
return "($fullname " . join(", ", @exprs) . ")"; | |
} elsif ($parens) { | |
return "$fullname(" . join(", ", @exprs) . ")"; | |
} else { | |
return "$fullname " . join(", ", @exprs); | |
} | |
} | |
sub pp_bless { listop(@_, "bless") } | |
sub pp_atan2 { maybe_targmy(@_, \&listop, "atan2") } | |
sub pp_substr { | |
my ($self,$op,$cx) = @_; | |
if ($op->private & OPpSUBSTR_REPL_FIRST) { | |
return | |
listop($self, $op, 7, "substr", $op->first->sibling->sibling) | |
. " = " | |
. $self->deparse($op->first->sibling, 7); | |
} | |
maybe_local(@_, listop(@_, "substr")) | |
} | |
sub pp_index { | |
# Also handles pp_rindex. | |
# | |
# The body of this function includes an unrolled maybe_targmy(), | |
# since the two parts of that sub's actions need to have have the | |
# '== -1' bit in between | |
my($self, $op, $cx) = @_; | |
my $lex = ($op->private & OPpTARGET_MY); | |
my $bool = ($op->private & OPpTRUEBOOL); | |
my $val = $self->listop($op, ($bool ? 14 : $lex ? 7 : $cx), $op->name); | |
# (index() == -1) has op_eq and op_const optimised away | |
if ($bool) { | |
$val .= ($op->private & OPpINDEX_BOOLNEG) ? " == -1" : " != -1"; | |
$val = "($val)" if ($op->flags & OPf_PARENS); | |
} | |
if ($lex) { | |
my $var = $self->padname($op->targ); | |
$val = $self->maybe_parens("$var = $val", $cx, 7); | |
} | |
$val; | |
} | |
sub pp_rindex { pp_index(@_); } | |
sub pp_vec { maybe_targmy(@_, \&maybe_local, listop(@_, "vec")) } | |
sub pp_sprintf { maybe_targmy(@_, \&listop, "sprintf") } | |
sub pp_formline { listop(@_, "formline") } # see also deparse_format | |
sub pp_crypt { maybe_targmy(@_, \&listop, "crypt") } | |
sub pp_unpack { listop(@_, "unpack") } | |
sub pp_pack { listop(@_, "pack") } | |
sub pp_join { maybe_targmy(@_, \&listop, "join") } | |
sub pp_splice { listop(@_, "splice") } | |
sub pp_push { maybe_targmy(@_, \&listop, "push") } | |
sub pp_unshift { maybe_targmy(@_, \&listop, "unshift") } | |
sub pp_reverse { listop(@_, "reverse") } | |
sub pp_warn { listop(@_, "warn") } | |
sub pp_die { listop(@_, "die") } | |
sub pp_return { listop(@_, "return", undef, 1) } # llafr does not apply | |
sub pp_open { listop(@_, "open") } | |
sub pp_pipe_op { listop(@_, "pipe") } | |
sub pp_tie { listop(@_, "tie") } | |
sub pp_binmode { listop(@_, "binmode") } | |
sub pp_dbmopen { listop(@_, "dbmopen") } | |
sub pp_sselect { listop(@_, "select") } | |
sub pp_select { listop(@_, "select") } | |
sub pp_read { listop(@_, "read") } | |
sub pp_sysopen { listop(@_, "sysopen") } | |
sub pp_sysseek { listop(@_, "sysseek") } | |
sub pp_sysread { listop(@_, "sysread") } | |
sub pp_syswrite { listop(@_, "syswrite") } | |
sub pp_send { listop(@_, "send") } | |
sub pp_recv { listop(@_, "recv") } | |
sub pp_seek { listop(@_, "seek") } | |
sub pp_fcntl { listop(@_, "fcntl") } | |
sub pp_ioctl { listop(@_, "ioctl") } | |
sub pp_flock { maybe_targmy(@_, \&listop, "flock") } | |
sub pp_socket { listop(@_, "socket") } | |
sub pp_sockpair { listop(@_, "socketpair") } | |
sub pp_bind { listop(@_, "bind") } | |
sub pp_connect { listop(@_, "connect") } | |
sub pp_listen { listop(@_, "listen") } | |
sub pp_accept { listop(@_, "accept") } | |
sub pp_shutdown { listop(@_, "shutdown") } | |
sub pp_gsockopt { listop(@_, "getsockopt") } | |
sub pp_ssockopt { listop(@_, "setsockopt") } | |
sub pp_chown { maybe_targmy(@_, \&listop, "chown") } | |
sub pp_unlink { maybe_targmy(@_, \&listop, "unlink") } | |
sub pp_chmod { maybe_targmy(@_, \&listop, "chmod") } | |
sub pp_utime { maybe_targmy(@_, \&listop, "utime") } | |
sub pp_rename { maybe_targmy(@_, \&listop, "rename") } | |
sub pp_link { maybe_targmy(@_, \&listop, "link") } | |
sub pp_symlink { maybe_targmy(@_, \&listop, "symlink") } | |
sub pp_mkdir { maybe_targmy(@_, \&listop, "mkdir") } | |
sub pp_open_dir { listop(@_, "opendir") } | |
sub pp_seekdir { listop(@_, "seekdir") } | |
sub pp_waitpid { maybe_targmy(@_, \&listop, "waitpid") } | |
sub pp_system { maybe_targmy(@_, \&indirop, "system") } | |
sub pp_exec { maybe_targmy(@_, \&indirop, "exec") } | |
sub pp_kill { maybe_targmy(@_, \&listop, "kill") } | |
sub pp_setpgrp { maybe_targmy(@_, \&listop, "setpgrp") } | |
sub pp_getpriority { maybe_targmy(@_, \&listop, "getpriority") } | |
sub pp_setpriority { maybe_targmy(@_, \&listop, "setpriority") } | |
sub pp_shmget { listop(@_, "shmget") } | |
sub pp_shmctl { listop(@_, "shmctl") } | |
sub pp_shmread { listop(@_, "shmread") } | |
sub pp_shmwrite { listop(@_, "shmwrite") } | |
sub pp_msgget { listop(@_, "msgget") } | |
sub pp_msgctl { listop(@_, "msgctl") } | |
sub pp_msgsnd { listop(@_, "msgsnd") } | |
sub pp_msgrcv { listop(@_, "msgrcv") } | |
sub pp_semget { listop(@_, "semget") } | |
sub pp_semctl { listop(@_, "semctl") } | |
sub pp_semop { listop(@_, "semop") } | |
sub pp_ghbyaddr { listop(@_, "gethostbyaddr") } | |
sub pp_gnbyaddr { listop(@_, "getnetbyaddr") } | |
sub pp_gpbynumber { listop(@_, "getprotobynumber") } | |
sub pp_gsbyname { listop(@_, "getservbyname") } | |
sub pp_gsbyport { listop(@_, "getservbyport") } | |
sub pp_syscall { listop(@_, "syscall") } | |
sub pp_glob { | |
my $self = shift; | |
my($op, $cx) = @_; | |
my $kid = $op->first->sibling; # skip pushmark | |
my $keyword = | |
$op->flags & OPf_SPECIAL ? 'glob' : $self->keyword('glob'); | |
my $text = $self->deparse($kid, $cx); | |
return $cx >= 5 || $self->{'parens'} | |
? "$keyword($text)" | |
: "$keyword $text"; | |
} | |
# Truncate is special because OPf_SPECIAL makes a bareword first arg | |
# be a filehandle. This could probably be better fixed in the core | |
# by moving the GV lookup into ck_truc. | |
sub pp_truncate { | |
my $self = shift; | |
my($op, $cx) = @_; | |
my(@exprs); | |
my $parens = ($cx >= 5) || $self->{'parens'}; | |
my $kid = $op->first->sibling; | |
my $fh; | |
if ($op->flags & OPf_SPECIAL) { | |
# $kid is an OP_CONST | |
$fh = $self->const_sv($kid)->PV; | |
} else { | |
$fh = $self->deparse($kid, 6); | |
$fh = "+$fh" if not $parens and substr($fh, 0, 1) eq "("; | |
} | |
my $len = $self->deparse($kid->sibling, 6); | |
my $name = $self->keyword('truncate'); | |
if ($parens) { | |
return "$name($fh, $len)"; | |
} else { | |
return "$name $fh, $len"; | |
} | |
} | |
sub indirop { | |
my $self = shift; | |
my($op, $cx, $name) = @_; | |
my($expr, @exprs); | |
my $firstkid = my $kid = $op->first->sibling; | |
my $indir = ""; | |
if ($op->flags & OPf_STACKED) { | |
$indir = $kid; | |
$indir = $indir->first; # skip rv2gv | |
if (is_scope($indir)) { | |
$indir = "{" . $self->deparse($indir, 0) . "}"; | |
$indir = "{;}" if $indir eq "{}"; | |
} elsif ($indir->name eq "const" && $indir->private & OPpCONST_BARE) { | |
$indir = $self->const_sv($indir)->PV; | |
} else { | |
$indir = $self->deparse($indir, 24); | |
} | |
$indir = $indir . " "; | |
$kid = $kid->sibling; | |
} | |
if ($name eq "sort" && $op->private & (OPpSORT_NUMERIC | OPpSORT_INTEGER)) { | |
$indir = ($op->private & OPpSORT_DESCEND) ? '{$b <=> $a} ' | |
: '{$a <=> $b} '; | |
} | |
elsif ($name eq "sort" && $op->private & OPpSORT_DESCEND) { | |
$indir = '{$b cmp $a} '; | |
} | |
for (; !null($kid); $kid = $kid->sibling) { | |
$expr = $self->deparse($kid, !$indir && $kid == $firstkid && $name eq "sort" && $firstkid->name eq "entersub" ? 16 : 6); | |
push @exprs, $expr; | |
} | |
my $name2; | |
if ($name eq "sort" && $op->private & OPpSORT_REVERSE) { | |
$name2 = $self->keyword('reverse') . ' ' . $self->keyword('sort'); | |
} | |
else { $name2 = $self->keyword($name) } | |
if ($name eq "sort" && ($op->private & OPpSORT_INPLACE)) { | |
return "$exprs[0] = $name2 $indir $exprs[0]"; | |
} | |
my $args = $indir . join(", ", @exprs); | |
if ($indir ne "" && $name eq "sort") { | |
# We don't want to say "sort(f 1, 2, 3)", since perl -w will | |
# give bareword warnings in that case. Therefore if context | |
# requires, we'll put parens around the outside "(sort f 1, 2, | |
# 3)". Unfortunately, we'll currently think the parens are | |
# necessary more often that they really are, because we don't | |
# distinguish which side of an assignment we're on. | |
if ($cx >= 5) { | |
return "($name2 $args)"; | |
} else { | |
return "$name2 $args"; | |
} | |
} elsif ( | |
!$indir && $name eq "sort" | |
&& !null($op->first->sibling) | |
&& $op->first->sibling->name eq 'entersub' | |
) { | |
# We cannot say sort foo(bar), as foo will be interpreted as a | |
# comparison routine. We have to say sort(...) in that case. | |
return "$name2($args)"; | |
} else { | |
return length $args | |
? $self->maybe_parens_func($name2, $args, $cx, 5) | |
: $name2 . '()' x (7 < $cx); | |
} | |
} | |
sub pp_prtf { indirop(@_, "printf") } | |
sub pp_print { indirop(@_, "print") } | |
sub pp_say { indirop(@_, "say") } | |
sub pp_sort { indirop(@_, "sort") } | |
sub mapop { | |
my $self = shift; | |
my($op, $cx, $name) = @_; | |
my($expr, @exprs); | |
my $kid = $op->first; # this is the (map|grep)start | |
$kid = $kid->first->sibling; # skip a pushmark | |
my $code = $kid->first; # skip a null | |
if (is_scope $code) { | |
$code = "{" . $self->deparse($code, 0) . "} "; | |
} else { | |
$code = $self->deparse($code, 24); | |
$code .= ", " if !null($kid->sibling); | |
} | |
$kid = $kid->sibling; | |
for (; !null($kid); $kid = $kid->sibling) { | |
$expr = $self->deparse($kid, 6); | |
push @exprs, $expr if defined $expr; | |
} | |
return $self->maybe_parens_func($self->keyword($name), | |
$code . join(", ", @exprs), $cx, 5); | |
} | |
sub pp_mapwhile { mapop(@_, "map") } | |
sub pp_grepwhile { mapop(@_, "grep") } | |
sub pp_mapstart { baseop(@_, "map") } | |
sub pp_grepstart { baseop(@_, "grep") } | |
my %uses_intro; | |
BEGIN { | |
@uses_intro{ | |
eval { require B::Op_private } | |
? @{$B::Op_private::ops_using{OPpLVAL_INTRO}} | |
: qw(gvsv rv2sv rv2hv rv2gv rv2av aelem helem aslice | |
hslice delete padsv padav padhv enteriter entersub padrange | |
pushmark cond_expr refassign list) | |
} = (); | |
delete @uses_intro{qw( lvref lvrefslice lvavref entersub )}; | |
} | |
# Look for a my/state attribute declaration in a list or ex-list. | |
# Returns undef if not found, 'my($x, @a) :Foo(bar)' etc otherwise. | |
# | |
# There are three basic tree structs that are expected: | |
# | |
# my $x :foo; | |
# <1> ex-list vK/LVINTRO ->c | |
# <0> ex-pushmark v ->3 | |
# <1> entersub[t2] vKRS*/TARG ->b | |
# .... | |
# <0> padsv[$x:64,65] vM/LVINTRO ->c | |
# | |
# my @a :foo; | |
# my %h :foo; | |
# | |
# <1> ex-list vK ->c | |
# <0> ex-pushmark v ->3 | |
# <0> padav[@a:64,65] vM/LVINTRO ->4 | |
# <1> entersub[t2] vKRS*/TARG ->c | |
# .... | |
# | |
# my ($x,@a,%h) :foo; | |
# | |
# <;> nextstate(main 64 -e:1) v:{ ->3 | |
# <@> list vKP ->w | |
# <0> pushmark vM/LVINTRO ->4 | |
# <0> padsv[$x:64,65] vM/LVINTRO ->5 | |
# <0> padav[@a:64,65] vM/LVINTRO ->6 | |
# <0> padhv[%h:64,65] vM/LVINTRO ->7 | |
# <1> entersub[t4] vKRS*/TARG ->f | |
# .... | |
# <1> entersub[t5] vKRS*/TARG ->n | |
# .... | |
# <1> entersub[t6] vKRS*/TARG ->v | |
# .... | |
# where the entersub in all cases looks like | |
# <1> entersub[t2] vKRS*/TARG ->c | |
# <0> pushmark s ->5 | |
# <$> const[PV "attributes"] sM ->6 | |
# <$> const[PV "main"] sM ->7 | |
# <1> srefgen sKM/1 ->9 | |
# <1> ex-list lKRM ->8 | |
# <0> padsv[@a:64,65] sRM ->8 | |
# <$> const[PV "foo"] sM ->a | |
# <.> method_named[PV "import"] ->b | |
sub maybe_var_attr { | |
my ($self, $op, $cx) = @_; | |
my $kid = $op->first->sibling; # skip pushmark | |
return if class($kid) eq 'NULL'; | |
my $lop; | |
my $type; | |
# Extract out all the pad ops and entersub ops into | |
# @padops and @entersubops. Return if anything else seen. | |
# Also determine what class (if any) all the pad vars belong to | |
my $class; | |
my $decl; # 'my' or 'state' | |
my (@padops, @entersubops); | |
for ($lop = $kid; !null($lop); $lop = $lop->sibling) { | |
my $lopname = $lop->name; | |
my $loppriv = $lop->private; | |
if ($lopname =~ /^pad[sah]v$/) { | |
return unless $loppriv & OPpLVAL_INTRO; | |
my $padname = $self->padname_sv($lop->targ); | |
my $thisclass = ($padname->FLAGS & SVpad_TYPED) | |
? $padname->SvSTASH->NAME : 'main'; | |
# all pad vars must be in the same class | |
$class //= $thisclass; | |
return unless $thisclass eq $class; | |
# all pad vars must be the same sort of declaration | |
# (all my, all state, etc) | |
my $this = ($loppriv & OPpPAD_STATE) ? 'state' : 'my'; | |
if (defined $decl) { | |
return unless $this eq $decl; | |
} | |
$decl = $this; | |
push @padops, $lop; | |
} | |
elsif ($lopname eq 'entersub') { | |
push @entersubops, $lop; | |
} | |
else { | |
return; | |
} | |
} | |
return unless @padops && @padops == @entersubops; | |
# there should be a balance: each padop has a corresponding | |
# 'attributes'->import() method call, in the same order. | |
my @varnames; | |
my $attr_text; | |
for my $i (0..$#padops) { | |
my $padop = $padops[$i]; | |
my $esop = $entersubops[$i]; | |
push @varnames, $self->padname($padop->targ); | |
return unless ($esop->flags & OPf_KIDS); | |
my $kid = $esop->first; | |
return unless $kid->type == OP_PUSHMARK; | |
$kid = $kid->sibling; | |
return unless $$kid && $kid->type == OP_CONST; | |
return unless $self->const_sv($kid)->PV eq 'attributes'; | |
$kid = $kid->sibling; | |
return unless $$kid && $kid->type == OP_CONST; # __PACKAGE__ | |
$kid = $kid->sibling; | |
return unless $$kid | |
&& $kid->name eq "srefgen" | |
&& ($kid->flags & OPf_KIDS) | |
&& ($kid->first->flags & OPf_KIDS) | |
&& $kid->first->first->name =~ /^pad[sah]v$/ | |
&& $kid->first->first->targ == $padop->targ; | |
$kid = $kid->sibling; | |
my @attr; | |
while ($$kid) { | |
last if ($kid->type != OP_CONST); | |
push @attr, $self->const_sv($kid)->PV; | |
$kid = $kid->sibling; | |
} | |
return unless @attr; | |
my $thisattr = ":" . join(' ', @attr); | |
$attr_text //= $thisattr; | |
# all import calls must have the same list of attributes | |
return unless $attr_text eq $thisattr; | |
return unless $kid->name eq 'method_named'; | |
return unless $self->meth_sv($kid)->PV eq 'import'; | |
$kid = $kid->sibling; | |
return if $$kid; | |
} | |
my $res = $decl; | |
$res .= " $class " if $class ne 'main'; | |
$res .= | |
(@varnames > 1) | |
? "(" . join(', ', @varnames) . ')' | |
: " $varnames[0]"; | |
return "$res $attr_text"; | |
} | |
sub pp_list { | |
my $self = shift; | |
my($op, $cx) = @_; | |
{ | |
# might be my ($s,@a,%h) :Foo(bar); | |
my $my_attr = maybe_var_attr($self, $op, $cx); | |
return $my_attr if defined $my_attr; | |
} | |
my($expr, @exprs); | |
my $kid = $op->first->sibling; # skip pushmark | |
return '' if class($kid) eq 'NULL'; | |
my $lop; | |
my $local = "either"; # could be local(...), my(...), state(...) or our(...) | |
my $type; | |
for ($lop = $kid; !null($lop); $lop = $lop->sibling) { | |
my $lopname = $lop->name; | |
my $loppriv = $lop->private; | |
my $newtype; | |
if ($lopname =~ /^pad[ash]v$/ && $loppriv & OPpLVAL_INTRO) { | |
if ($loppriv & OPpPAD_STATE) { # state() | |
($local = "", last) if $local !~ /^(?:either|state)$/; | |
$local = "state"; | |
} else { # my() | |
($local = "", last) if $local !~ /^(?:either|my)$/; | |
$local = "my"; | |
} | |
my $padname = $self->padname_sv($lop->targ); | |
if ($padname->FLAGS & SVpad_TYPED) { | |
$newtype = $padname->SvSTASH->NAME; | |
} | |
} elsif ($lopname =~ /^(?:gv|rv2)([ash])v$/ | |
&& $loppriv & OPpOUR_INTRO | |
or $lopname eq "null" && class($lop) eq 'UNOP' | |
&& $lop->first->name eq "gvsv" | |
&& $lop->first->private & OPpOUR_INTRO) { # our() | |
my $newlocal = "local " x !!($loppriv & OPpLVAL_INTRO) . "our"; | |
($local = "", last) | |
if $local ne 'either' && $local ne $newlocal; | |
$local = $newlocal; | |
my $funny = !$1 || $1 eq 's' ? '$' : $1 eq 'a' ? '@' : '%'; | |
if (my $t = $self->find_our_type( | |
$funny . $self->gv_or_padgv($lop->first)->NAME | |
)) { | |
$newtype = $t; | |
} | |
} elsif ($lopname ne 'undef' | |
and !($loppriv & OPpLVAL_INTRO) | |
|| !exists $uses_intro{$lopname eq 'null' | |
? substr B::ppname($lop->targ), 3 | |
: $lopname}) | |
{ | |
$local = ""; # or not | |
last; | |
} elsif ($lopname ne "undef") | |
{ | |
# local() | |
($local = "", last) if $local !~ /^(?:either|local)$/; | |
$local = "local"; | |
} | |
if (defined $type && defined $newtype && $newtype ne $type) { | |
$local = ''; | |
last; | |
} | |
$type = $newtype; | |
} | |
$local = "" if $local eq "either"; # no point if it's all undefs | |
$local &&= join ' ', map $self->keyword($_), split / /, $local; | |
$local .= " $type " if $local && length $type; | |
return $self->deparse($kid, $cx) if null $kid->sibling and not $local; | |
for (; !null($kid); $kid = $kid->sibling) { | |
if ($local) { | |
if (class($kid) eq "UNOP" and $kid->first->name eq "gvsv") { | |
$lop = $kid->first; | |
} else { | |
$lop = $kid; | |
} | |
$self->{'avoid_local'}{$$lop}++; | |
$expr = $self->deparse($kid, 6); | |
delete $self->{'avoid_local'}{$$lop}; | |
} else { | |
$expr = $self->deparse($kid, 6); | |
} | |
push @exprs, $expr; | |
} | |
if ($local) { | |
if (@exprs == 1 && ($local eq 'state' || $local eq 'CORE::state')) { | |
# 'state @a = ...' is legal, while 'state(@a) = ...' currently isn't | |
return "$local $exprs[0]"; | |
} | |
return "$local(" . join(", ", @exprs) . ")"; | |
} else { | |
return $self->maybe_parens( join(", ", @exprs), $cx, 6); | |
} | |
} | |
sub is_ifelse_cont { | |
my $op = shift; | |
return ($op->name eq "null" and class($op) eq "UNOP" | |
and $op->first->name =~ /^(and|cond_expr)$/ | |
and is_scope($op->first->first->sibling)); | |
} | |
sub pp_cond_expr { | |
my $self = shift; | |
my($op, $cx) = @_; | |
my $cond = $op->first; | |
my $true = $cond->sibling; | |
my $false = $true->sibling; | |
my $cuddle = $self->{'cuddle'}; | |
unless ($cx < 1 and (is_scope($true) and $true->name ne "null") and | |
(is_scope($false) || is_ifelse_cont($false)) | |
and $self->{'expand'} < 7) { | |
$cond = $self->deparse($cond, 8); | |
$true = $self->deparse($true, 6); | |
$false = $self->deparse($false, 8); | |
return $self->maybe_parens("$cond ? $true : $false", $cx, 8); | |
} | |
$cond = $self->deparse($cond, 1); | |
$true = $self->deparse($true, 0); | |
my $head = $self->keyword("if") . " ($cond) {\n\t$true\n\b}"; | |
my @elsifs; | |
my $elsif; | |
while (!null($false) and is_ifelse_cont($false)) { | |
my $newop = $false->first; | |
my $newcond = $newop->first; | |
my $newtrue = $newcond->sibling; | |
$false = $newtrue->sibling; # last in chain is OP_AND => no else | |
if ($newcond->name eq "lineseq") | |
{ | |
# lineseq to ensure correct line numbers in elsif() | |
# Bug #37302 fixed by change #33710. | |
$newcond = $newcond->first->sibling; | |
} | |
$newcond = $self->deparse($newcond, 1); | |
$newtrue = $self->deparse($newtrue, 0); | |
$elsif ||= $self->keyword("elsif"); | |
push @elsifs, "$elsif ($newcond) {\n\t$newtrue\n\b}"; | |
} | |
if (!null($false)) { | |
$false = $cuddle . $self->keyword("else") . " {\n\t" . | |
$self->deparse($false, 0) . "\n\b}\cK"; | |
} else { | |
$false = "\cK"; | |
} | |
return $head . join($cuddle, "", @elsifs) . $false; | |
} | |
sub pp_once { | |
my ($self, $op, $cx) = @_; | |
my $cond = $op->first; | |
my $true = $cond->sibling; | |
my $ret = $self->deparse($true, $cx); | |
$ret =~ s/^(\(?)\$/$1 . $self->keyword("state") . ' $'/e; | |
$ret; | |
} | |
sub loop_common { | |
my $self = shift; | |
my($op, $cx, $init) = @_; | |
my $enter = $op->first; | |
my $kid = $enter->sibling; | |
local(@$self{qw'curstash warnings hints hinthash'}) | |
= @$self{qw'curstash warnings hints hinthash'}; | |
my $head = ""; | |
my $bare = 0; | |
my $body; | |
my $cond = undef; | |
my $name; | |
if ($kid->name eq "lineseq") { # bare or infinite loop | |
if ($kid->last->name eq "unstack") { # infinite | |
$head = "while (1) "; # Can't use for(;;) if there's a continue | |
$cond = ""; | |
} else { | |
$bare = 1; | |
} | |
$body = $kid; | |
} elsif ($enter->name eq "enteriter") { # foreach | |
my $ary = $enter->first->sibling; # first was pushmark | |
my $var = $ary->sibling; | |
if ($ary->name eq 'null' and $enter->private & OPpITER_REVERSED) { | |
# "reverse" was optimised away | |
$ary = listop($self, $ary->first->sibling, 1, 'reverse'); | |
} elsif ($enter->flags & OPf_STACKED | |
and not null $ary->first->sibling->sibling) | |
{ | |
$ary = $self->deparse($ary->first->sibling, 9) . " .. " . | |
$self->deparse($ary->first->sibling->sibling, 9); | |
} else { | |
$ary = $self->deparse($ary, 1); | |
} | |
if (null $var) { | |
$var = $self->pp_padsv($enter, 1, 1); | |
} elsif ($var->name eq "rv2gv") { | |
$var = $self->pp_rv2sv($var, 1); | |
if ($enter->private & OPpOUR_INTRO) { | |
# our declarations don't have package names | |
$var =~ s/^(.).*::/$1/; | |
$var = "our $var"; | |
} | |
} elsif ($var->name eq "gv") { | |
$var = "\$" . $self->deparse($var, 1); | |
} else { | |
$var = $self->deparse($var, 1); | |
} | |
$body = $kid->first->first->sibling; # skip OP_AND and OP_ITER | |
if (!is_state $body->first and $body->first->name !~ /^(?:stub|leave|scope)$/) { | |
confess unless $var eq '$_'; | |
$body = $body->first; | |
return $self->deparse($body, 2) . " " | |
. $self->keyword("foreach") . " ($ary)"; | |
} | |
$head = "foreach $var ($ary) "; | |
} elsif ($kid->name eq "null") { # while/until | |
$kid = $kid->first; | |
$name = {"and" => "while", "or" => "until"}->{$kid->name}; | |
$cond = $kid->first; | |
$body = $kid->first->sibling; | |
} elsif ($kid->name eq "stub") { # bare and empty | |
return "{;}"; # {} could be a hashref | |
} | |
# If there isn't a continue block, then the next pointer for the loop | |
# will point to the unstack, which is kid's last child, except | |
# in a bare loop, when it will point to the leaveloop. When neither of | |
# these conditions hold, then the second-to-last child is the continue | |
# block (or the last in a bare loop). | |
my $cont_start = $enter->nextop; | |
my $cont; | |
my $precond; | |
my $postcond; | |
if ($$cont_start != $$op && ${$cont_start} != ${$body->last}) { | |
if ($bare) { | |
$cont = $body->last; | |
} else { | |
$cont = $body->first; | |
while (!null($cont->sibling->sibling)) { | |
$cont = $cont->sibling; | |
} | |
} | |
my $state = $body->first; | |
my $cuddle = $self->{'cuddle'}; | |
my @states; | |
for (; $$state != $$cont; $state = $state->sibling) { | |
push @states, $state; | |
} | |
$body = $self->lineseq(undef, 0, @states); | |
if (defined $cond and not is_scope $cont and $self->{'expand'} < 3) { | |
$precond = "for ($init; "; | |
$postcond = "; " . $self->deparse($cont, 1) .") "; | |
$cont = "\cK"; | |
} else { | |
$cont = $cuddle . "continue {\n\t" . | |
$self->deparse($cont, 0) . "\n\b}\cK"; | |
} | |
} else { | |
return "" if !defined $body; | |
if (length $init) { | |
$precond = "for ($init; "; | |
$postcond = ";) "; | |
} | |
$cont = "\cK"; | |
$body = $self->deparse($body, 0); | |
} | |
if ($precond) { # for(;;) | |
$cond &&= $name eq 'until' | |
? listop($self, undef, 1, "not", $cond->first) | |
: $self->deparse($cond, 1); | |
$head = "$precond$cond$postcond"; | |
} | |
if ($name && !$head) { | |
ref $cond and $cond = $self->deparse($cond, 1); | |
$head = "$name ($cond) "; | |
} | |
$head =~ s/^(for(?:each)?|while|until)/$self->keyword($1)/e; | |
$body =~ s/;?$/;\n/; | |
return $head . "{\n\t" . $body . "\b}" . $cont; | |
} | |
sub pp_leaveloop { shift->loop_common(@_, "") } | |
sub for_loop { | |
my $self = shift; | |
my($op, $cx) = @_; | |
my $init = $self->deparse($op, 1); | |
my $s = $op->sibling; | |
my $ll = $s->name eq "unstack" ? $s->sibling : $s->first->sibling; | |
return $self->loop_common($ll, $cx, $init); | |
} | |
sub pp_leavetry { | |
my $self = shift; | |
return "eval {\n\t" . $self->pp_leave(@_) . "\n\b}"; | |
} | |
sub pp_leavetrycatch { | |
my $self = shift; | |
my ($op) = @_; | |
# Expect that the first three kids should be (entertrycatch, poptry, catch) | |
my $entertrycatch = $op->first; | |
$entertrycatch->name eq "entertrycatch" or die "Expected entertrycatch as first child of leavetrycatch"; | |
my $tryblock = $entertrycatch->sibling; | |
$tryblock->name eq "poptry" or die "Expected poptry as second child of leavetrycatch"; | |
my $catch = $tryblock->sibling; | |
$catch->name eq "catch" or die "Expected catch as third child of leavetrycatch"; | |
my $catchblock = $catch->first->sibling; | |
$catchblock->name eq "scope" or die "Expected scope as second child of catch"; | |
my $trycode = scopeop(0, $self, $tryblock); | |
my $catchvar = $self->padname($catch->targ); | |
my $catchcode = scopeop(0, $self, $catchblock); | |
return "try {\n\t$trycode\n\b}\n" . | |
"catch($catchvar) {\n\t$catchcode\n\b}\cK"; | |
} | |
sub _op_is_or_was { | |
my ($op, $expect_type) = @_; | |
my $type = $op->type; | |
return($type == $expect_type | |
|| ($type == OP_NULL && $op->targ == $expect_type)); | |
} | |
sub pp_null { | |
my($self, $op, $cx) = @_; | |
# might be 'my $s :Foo(bar);' | |
if ($op->targ == OP_LIST) { | |
my $my_attr = maybe_var_attr($self, $op, $cx); | |
return $my_attr if defined $my_attr; | |
} | |
if (class($op) eq "OP") { | |
# old value is lost | |
return $self->{'ex_const'} if $op->targ == OP_CONST; | |
} elsif (class ($op) eq "COP") { | |
return &pp_nextstate; | |
} elsif ($op->first->name eq 'pushmark' | |
or $op->first->name eq 'null' | |
&& $op->first->targ == OP_PUSHMARK | |
&& _op_is_or_was($op, OP_LIST)) { | |
return $self->pp_list($op, $cx); | |
} elsif ($op->first->name eq "enter") { | |
return $self->pp_leave($op, $cx); | |
} elsif ($op->first->name eq "leave") { | |
return $self->pp_leave($op->first, $cx); | |
} elsif ($op->first->name eq "scope") { | |
return $self->pp_scope($op->first, $cx); | |
} elsif ($op->targ == OP_STRINGIFY) { | |
return $self->dquote($op, $cx); | |
} elsif ($op->targ == OP_GLOB) { | |
return $self->pp_glob( | |
$op->first # entersub | |
->first # ex-list | |
->first # pushmark | |
->sibling, # glob | |
$cx | |
); | |
} elsif (!null($op->first->sibling) and | |
$op->first->sibling->name eq "readline" and | |
$op->first->sibling->flags & OPf_STACKED) { | |
return $self->maybe_parens($self->deparse($op->first, 7) . " = " | |
. $self->deparse($op->first->sibling, 7), | |
$cx, 7); | |
} elsif (!null($op->first->sibling) and | |
$op->first->sibling->name =~ /^transr?\z/ and | |
$op->first->sibling->flags & OPf_STACKED) { | |
return $self->maybe_parens($self->deparse($op->first, 20) . " =~ " | |
. $self->deparse($op->first->sibling, 20), | |
$cx, 20); | |
} elsif ($op->flags & OPf_SPECIAL && $cx < 1 && !$op->targ) { | |
return ($self->lex_in_scope("&do") ? "CORE::do" : "do") | |
. " {\n\t". $self->deparse($op->first, $cx) ."\n\b};"; | |
} elsif (!null($op->first->sibling) and | |
$op->first->sibling->name eq "null" and | |
class($op->first->sibling) eq "UNOP" and | |
$op->first->sibling->first->flags & OPf_STACKED and | |
$op->first->sibling->first->name eq "rcatline") { | |
return $self->maybe_parens($self->deparse($op->first, 18) . " .= " | |
. $self->deparse($op->first->sibling, 18), | |
$cx, 18); | |
} else { | |
return $self->deparse($op->first, $cx); | |
} | |
} | |
sub padname { | |
my $self = shift; | |
my $targ = shift; | |
return $self->padname_sv($targ)->PVX; | |
} | |
sub padany { | |
my $self = shift; | |
my $op = shift; | |
return substr($self->padname($op->targ), 1); # skip $/@/% | |
} | |
sub pp_padsv { | |
my $self = shift; | |
my($op, $cx, $forbid_parens) = @_; | |
my $targ = $op->targ; | |
return $self->maybe_my($op, $cx, $self->padname($targ), | |
$self->padname_sv($targ), | |
$forbid_parens); | |
} | |
sub pp_padav { pp_padsv(@_) } | |
# prepend 'keys' where its been optimised away, with suitable handling | |
# of CORE:: and parens | |
sub add_keys_keyword { | |
my ($self, $str, $cx) = @_; | |
$str = $self->maybe_parens($str, $cx, 16); | |
# 'keys %h' versus 'keys(%h)' | |
$str = " $str" unless $str =~ /^\(/; | |
return $self->keyword("keys") . $str; | |
} | |
sub pp_padhv { | |
my ($self, $op, $cx) = @_; | |
my $str = pp_padsv(@_); | |
# with OPpPADHV_ISKEYS the keys op is optimised away, except | |
# in scalar context the old op is kept (but not executed) so its targ | |
# can be used. | |
if ( ($op->private & OPpPADHV_ISKEYS) | |
&& !(($op->flags & OPf_WANT) == OPf_WANT_SCALAR)) | |
{ | |
$str = $self->add_keys_keyword($str, $cx); | |
} | |
$str; | |
} | |
sub gv_or_padgv { | |
my $self = shift; | |
my $op = shift; | |
if (class($op) eq "PADOP") { | |
return $self->padval($op->padix); | |
} else { # class($op) eq "SVOP" | |
return $op->gv; | |
} | |
} | |
sub pp_gvsv { | |
my $self = shift; | |
my($op, $cx) = @_; | |
my $gv = $self->gv_or_padgv($op); | |
return $self->maybe_local($op, $cx, $self->stash_variable("\$", | |
$self->gv_name($gv), $cx)); | |
} | |
sub pp_gv { | |
my $self = shift; | |
my($op, $cx) = @_; | |
my $gv = $self->gv_or_padgv($op); | |
return $self->maybe_qualify("", $self->gv_name($gv)); | |
} | |
sub pp_aelemfast_lex { | |
my $self = shift; | |
my($op, $cx) = @_; | |
my $name = $self->padname($op->targ); | |
$name =~ s/^@/\$/; | |
my $i = $op->private; | |
$i -= 256 if $i > 127; | |
return $name . "[$i]"; | |
} | |
sub pp_aelemfast { | |
my $self = shift; | |
my($op, $cx) = @_; | |
# optimised PADAV, pre 5.15 | |
return $self->pp_aelemfast_lex(@_) if ($op->flags & OPf_SPECIAL); | |
my $gv = $self->gv_or_padgv($op); | |
my($name,$quoted) = $self->stash_variable_name('@',$gv); | |
$name = $quoted ? "$name->" : '$' . $name; | |
my $i = $op->private; | |
$i -= 256 if $i > 127; | |
return $name . "[$i]"; | |
} | |
sub rv2x { | |
my $self = shift; | |
my($op, $cx, $type) = @_; | |
if (class($op) eq 'NULL' || !$op->can("first")) { | |
carp("Unexpected op in pp_rv2x"); | |
return 'XXX'; | |
} | |
my $kid = $op->first; | |
if ($kid->name eq "gv") { | |
return $self->stash_variable($type, | |
$self->gv_name($self->gv_or_padgv($kid)), $cx); | |
} elsif (is_scalar $kid) { | |
my $str = $self->deparse($kid, 0); | |
if ($str =~ /^\$([^\w\d])\z/) { | |
# "$$+" isn't a legal way to write the scalar dereference | |
# of $+, since the lexer can't tell you aren't trying to | |
# do something like "$$ + 1" to get one more than your | |
# PID. Either "${$+}" or "$${+}" are workable | |
# disambiguations, but if the programmer did the former, | |
# they'd be in the "else" clause below rather than here. | |
# It's not clear if this should somehow be unified with | |
# the code in dq and re_dq that also adds lexer | |
# disambiguation braces. | |
$str = '$' . "{$1}"; #' | |
} | |
return $type . $str; | |
} else { | |
return $type . "{" . $self->deparse($kid, 0) . "}"; | |
} | |
} | |
sub pp_rv2sv { maybe_local(@_, rv2x(@_, "\$")) } | |
sub pp_rv2gv { maybe_local(@_, rv2x(@_, "*")) } | |
sub pp_rv2hv { | |
my ($self, $op, $cx) = @_; | |
my $str = rv2x(@_, "%"); | |
if ($op->private & OPpRV2HV_ISKEYS) { | |
$str = $self->add_keys_keyword($str, $cx); | |
} | |
return maybe_local(@_, $str); | |
} | |
# skip rv2av | |
sub pp_av2arylen { | |
my $self = shift; | |
my($op, $cx) = @_; | |
my $kid = $op->first; | |
if ($kid->name eq "padav") { | |
return $self->maybe_local($op, $cx, '$#' . $self->padany($kid)); | |
} else { | |
my $kkid; | |
if ( $kid->name eq "rv2av" | |
&& ($kkid = $kid->first) | |
&& $kkid->name !~ /^(scope|leave|gv)$/) | |
{ | |
# handle (expr)->$#* postfix form | |
my $expr; | |
$expr = $self->deparse($kkid, 24); # 24 is '->' | |
$expr = "$expr->\$#*"; | |
# XXX maybe_local is probably wrong here: local($#-expression) | |
# doesn't "do" local (the is no INTRO flag set) | |
return $self->maybe_local($op, $cx, $expr); | |
} | |
else { | |
# handle $#{expr} form | |
# XXX see maybe_local comment above | |
return $self->maybe_local($op, $cx, $self->rv2x($kid, $cx, '$#')); | |
} | |
} | |
} | |
# skip down to the old, ex-rv2cv | |
sub pp_rv2cv { | |
my ($self, $op, $cx) = @_; | |
if (!null($op->first) && $op->first->name eq 'null' && | |
$op->first->targ == OP_LIST) | |
{ | |
return $self->rv2x($op->first->first->sibling, $cx, "&") | |
} | |
else { | |
return $self->rv2x($op, $cx, "") | |
} | |
} | |
sub list_const { | |
my $self = shift; | |
my($cx, @list) = @_; | |
my @a = map $self->const($_, 6), @list; | |
if (@a == 0) { | |
return "()"; | |
} elsif (@a == 1) { | |
return $a[0]; | |
} elsif ( @a > 2 and !grep(!/^-?\d+$/, @a)) { | |
# collapse (-1,0,1,2) into (-1..2) | |
my ($s, $e) = @a[0,-1]; | |
my $i = $s; | |
return $self->maybe_parens("$s..$e", $cx, 9) | |
unless grep $i++ != $_, @a; | |
} | |
return $self->maybe_parens(join(", ", @a), $cx, 6); | |
} | |
sub pp_rv2av { | |
my $self = shift; | |
my($op, $cx) = @_; | |
my $kid = $op->first; | |
if ($kid->name eq "const") { # constant list | |
my $av = $self->const_sv($kid); | |
return $self->list_const($cx, $av->ARRAY); | |
} else { | |
return $self->maybe_local($op, $cx, $self->rv2x($op, $cx, "\@")); | |
} | |
} | |
sub is_subscriptable { | |
my $op = shift; | |
if ($op->name =~ /^([ahg]elem|multideref$)/) { | |
return 1; | |
} elsif ($op->name eq "entersub") { | |
my $kid = $op->first; | |
return 0 unless null $kid->sibling; | |
$kid = $kid->first; | |
$kid = $kid->sibling until null $kid->sibling; | |
return 0 if is_scope($kid); | |
$kid = $kid->first; | |
return 0 if $kid->name eq "gv" || $kid->name eq "padcv"; | |
return 0 if is_scalar($kid); | |
return is_subscriptable($kid); | |
} else { | |
return 0; | |
} | |
} | |
sub elem_or_slice_array_name | |
{ | |
my $self = shift; | |
my ($array, $left, $padname, $allow_arrow) = @_; | |
if ($array->name eq $padname) { | |
return $self->padany($array); | |
} elsif (is_scope($array)) { # ${expr}[0] | |
return "{" . $self->deparse($array, 0) . "}"; | |
} elsif ($array->name eq "gv") { | |
($array, my $quoted) = | |
$self->stash_variable_name( | |
$left eq '[' ? '@' : '%', $self->gv_or_padgv($array) | |
); | |
if (!$allow_arrow && $quoted) { | |
# This cannot happen. | |
die "Invalid variable name $array for slice"; | |
} | |
return $quoted ? "$array->" : $array; | |
} elsif (!$allow_arrow || is_scalar $array) { # $x[0], $$x[0], ... | |
return $self->deparse($array, 24); | |
} else { | |
return undef; | |
} | |
} | |
sub elem_or_slice_single_index | |
{ | |
my $self = shift; | |
my ($idx) = @_; | |
$idx = $self->deparse($idx, 1); | |
# Outer parens in an array index will confuse perl | |
# if we're interpolating in a regular expression, i.e. | |
# /$x$foo[(-1)]/ is *not* the same as /$x$foo[-1]/ | |
# | |
# If $self->{parens}, then an initial '(' will | |
# definitely be paired with a final ')'. If | |
# !$self->{parens}, the misleading parens won't | |
# have been added in the first place. | |
# | |
# [You might think that we could get "(...)...(...)" | |
# where the initial and final parens do not match | |
# each other. But we can't, because the above would | |
# only happen if there's an infix binop between the | |
# two pairs of parens, and *that* means that the whole | |
# expression would be parenthesized as well.] | |
# | |
$idx =~ s/^\((.*)\)$/$1/ if $self->{'parens'}; | |
# Hash-element braces will autoquote a bareword inside themselves. | |
# We need to make sure that C<$hash{warn()}> doesn't come out as | |
# C<$hash{warn}>, which has a quite different meaning. Currently | |
# B::Deparse will always quote strings, even if the string was a | |
# bareword in the original (i.e. the OPpCONST_BARE flag is ignored | |
# for constant strings.) So we can cheat slightly here - if we see | |
# a bareword, we know that it is supposed to be a function call. | |
# | |
$idx =~ s/^([A-Za-z_]\w*)$/$1()/; | |
return $idx; | |
} | |
sub elem { | |
my $self = shift; | |
my ($op, $cx, $left, $right, $padname) = @_; | |
my($array, $idx) = ($op->first, $op->first->sibling); | |
$idx = $self->elem_or_slice_single_index($idx); | |
unless ($array->name eq $padname) { # Maybe this has been fixed | |
$array = $array->first; # skip rv2av (or ex-rv2av in _53+) | |
} | |
if (my $array_name=$self->elem_or_slice_array_name | |
($array, $left, $padname, 1)) { | |
return ($array_name =~ /->\z/ | |
? $array_name | |
: $array_name eq '#' ? '${#}' : "\$" . $array_name) | |
. $left . $idx . $right; | |
} else { | |
# $x[20][3]{hi} or expr->[20] | |
my $arrow = is_subscriptable($array) ? "" : "->"; | |
return $self->deparse($array, 24) . $arrow . $left . $idx . $right; | |
} | |
} | |
# a simplified version of elem_or_slice_array_name() | |
# for the use of pp_multideref | |
sub multideref_var_name { | |
my $self = shift; | |
my ($gv, $is_hash) = @_; | |
my ($name, $quoted) = | |
$self->stash_variable_name( $is_hash ? '%' : '@', $gv); | |
return $quoted ? "$name->" | |
: $name eq '#' | |
? '${#}' # avoid ${#}[1] => $#[1] | |
: '$' . $name; | |
} | |
# deparse an OP_MULTICONCAT. If $in_dq is 1, we're within | |
# a double-quoted string, so for example. | |
# "abc\Qdef$x\Ebar" | |
# might get compiled as | |
# multiconcat("abc", metaquote(multiconcat("def", $x)), "bar") | |
# and the inner multiconcat should be deparsed as C<def$x> rather than | |
# the normal C<def . $x> | |
# Ditto if $in_dq is 2, handle qr/...\Qdef$x\E.../. | |
sub do_multiconcat { | |
my $self = shift; | |
my($op, $cx, $in_dq) = @_; | |
my $kid; | |
my @kids; | |
my $assign; | |
my $append; | |
my $lhs = ""; | |
for ($kid = $op->first; !null $kid; $kid = $kid->sibling) { | |
# skip the consts and/or padsv we've optimised away | |
push @kids, $kid | |
unless $kid->type == OP_NULL | |
&& ( $kid->targ == OP_PADSV | |
|| $kid->targ == OP_CONST | |
|| $kid->targ == OP_PUSHMARK); | |
} | |
$append = ($op->private & OPpMULTICONCAT_APPEND); | |
if ($op->private & OPpTARGET_MY) { | |
# '$lex = ...' or '$lex .= ....' or 'my $lex = ' | |
$lhs = $self->padname($op->targ); | |
$lhs = "my $lhs" if ($op->private & OPpLVAL_INTRO); | |
$assign = 1; | |
} | |
elsif ($op->flags & OPf_STACKED) { | |
# 'expr = ...' or 'expr .= ....' | |
my $expr = $append ? shift(@kids) : pop(@kids); | |
$lhs = $self->deparse($expr, 7); | |
$assign = 1; | |
} | |
if ($assign) { | |
$lhs .= $append ? ' .= ' : ' = '; | |
} | |
my ($nargs, $const_str, @const_lens) = $op->aux_list($self->{curcv}); | |
my @consts; | |
my $i = 0; | |
for (@const_lens) { | |
if ($_ == -1) { | |
push @consts, undef; | |
} | |
else { | |
push @consts, substr($const_str, $i, $_); | |
my @args; | |
$i += $_; | |
} | |
} | |
my $rhs = ""; | |
if ( $in_dq | |
|| (($op->private & OPpMULTICONCAT_STRINGIFY) && !$self->{'unquote'})) | |
{ | |
# "foo=$foo bar=$bar " | |
my $not_first; | |
while (@consts) { | |
if ($not_first) { | |
my $s = $self->dq(shift(@kids), 18); | |
# don't deparse "a${$}b" as "a$$b" | |
$s = '${$}' if $s eq '$$'; | |
$rhs = dq_disambiguate($rhs, $s); | |
} | |
$not_first = 1; | |
my $c = shift @consts; | |
if (defined $c) { | |
if ($in_dq == 2) { | |
# in pattern: don't convert newline to '\n' etc etc | |
my $s = re_uninterp(escape_re(re_unback($c))); | |
$rhs = re_dq_disambiguate($rhs, $s) | |
} | |
else { | |
my $s = uninterp(escape_str(unback($c))); | |
$rhs = dq_disambiguate($rhs, $s) | |
} | |
} | |
} | |
return $rhs if $in_dq; | |
$rhs = single_delim("qq", '"', $rhs, $self); | |
} | |
elsif ($op->private & OPpMULTICONCAT_FAKE) { | |
# sprintf("foo=%s bar=%s ", $foo, $bar) | |
my @all; | |
@consts = map { $_ //= ''; s/%/%%/g; $_ } @consts; | |
my $fmt = join '%s', @consts; | |
push @all, $self->quoted_const_str($fmt); | |
# the following is a stripped down copy of sub listop {} | |
my $parens = $assign || ($cx >= 5) || $self->{'parens'}; | |
my $fullname = $self->keyword('sprintf'); | |
push @all, map $self->deparse($_, 6), @kids; | |
$rhs = $parens | |
? "$fullname(" . join(", ", @all) . ")" | |
: "$fullname " . join(", ", @all); | |
} | |
else { | |
# "foo=" . $foo . " bar=" . $bar | |
my @all; | |
my $not_first; | |
while (@consts) { | |
push @all, $self->deparse(shift(@kids), 18) if $not_first; | |
$not_first = 1; | |
my $c = shift @consts; | |
if (defined $c) { | |
push @all, $self->quoted_const_str($c); | |
} | |
} | |
$rhs .= join ' . ', @all; | |
} | |
my $text = $lhs . $rhs; | |
$text = "($text)" if ($cx >= (($assign) ? 7 : 18+1)) | |
|| $self->{'parens'}; | |
return $text; | |
} | |
sub pp_multiconcat { | |
my $self = shift; | |
$self->do_multiconcat(@_, 0); | |
} | |
sub pp_multideref { | |
my $self = shift; | |
my($op, $cx) = @_; | |
my $text = ""; | |
if ($op->private & OPpMULTIDEREF_EXISTS) { | |
$text = $self->keyword("exists"). " "; | |
} | |
elsif ($op->private & OPpMULTIDEREF_DELETE) { | |
$text = $self->keyword("delete"). " "; | |
} | |
elsif ($op->private & OPpLVAL_INTRO) { | |
$text = $self->keyword("local"). " "; | |
} | |
if ($op->first && ($op->first->flags & OPf_KIDS)) { | |
# arbitrary initial expression, e.g. f(1,2,3)->[...] | |
my $expr = $self->deparse($op->first, 24); | |
# stop "exists (expr)->{...}" being interpreted as | |
#"(exists (expr))->{...}" | |
$expr = "+$expr" if $expr =~ /^\(/; | |
$text .= $expr; | |
} | |
my @items = $op->aux_list($self->{curcv}); | |
my $actions = shift @items; | |
my $is_hash; | |
my $derefs = 0; | |
while (1) { | |
if (($actions & MDEREF_ACTION_MASK) == MDEREF_reload) { | |
$actions = shift @items; | |
next; | |
} | |
$is_hash = ( | |
($actions & MDEREF_ACTION_MASK) == MDEREF_HV_pop_rv2hv_helem | |
|| ($actions & MDEREF_ACTION_MASK) == MDEREF_HV_gvsv_vivify_rv2hv_helem | |
|| ($actions & MDEREF_ACTION_MASK) == MDEREF_HV_padsv_vivify_rv2hv_helem | |
|| ($actions & MDEREF_ACTION_MASK) == MDEREF_HV_vivify_rv2hv_helem | |
|| ($actions & MDEREF_ACTION_MASK) == MDEREF_HV_padhv_helem | |
|| ($actions & MDEREF_ACTION_MASK) == MDEREF_HV_gvhv_helem | |
); | |
if ( ($actions & MDEREF_ACTION_MASK) == MDEREF_AV_padav_aelem | |
|| ($actions & MDEREF_ACTION_MASK) == MDEREF_HV_padhv_helem) | |
{ | |
$derefs = 1; | |
$text .= '$' . substr($self->padname(shift @items), 1); | |
} | |
elsif ( ($actions & MDEREF_ACTION_MASK) == MDEREF_AV_gvav_aelem | |
|| ($actions & MDEREF_ACTION_MASK) == MDEREF_HV_gvhv_helem) | |
{ | |
$derefs = 1; | |
$text .= $self->multideref_var_name(shift @items, $is_hash); | |
} | |
else { | |
if ( ($actions & MDEREF_ACTION_MASK) == | |
MDEREF_AV_padsv_vivify_rv2av_aelem | |
|| ($actions & MDEREF_ACTION_MASK) == | |
MDEREF_HV_padsv_vivify_rv2hv_helem) | |
{ | |
$text .= $self->padname(shift @items); | |
} | |
elsif ( ($actions & MDEREF_ACTION_MASK) == | |
MDEREF_AV_gvsv_vivify_rv2av_aelem | |
|| ($actions & MDEREF_ACTION_MASK) == | |
MDEREF_HV_gvsv_vivify_rv2hv_helem) | |
{ | |
$text .= $self->multideref_var_name(shift @items, $is_hash); | |
} | |
elsif ( ($actions & MDEREF_ACTION_MASK) == | |
MDEREF_AV_pop_rv2av_aelem | |
|| ($actions & MDEREF_ACTION_MASK) == | |
MDEREF_HV_pop_rv2hv_helem) | |
{ | |
if ( ($op->flags & OPf_KIDS) | |
&& ( _op_is_or_was($op->first, OP_RV2AV) | |
|| _op_is_or_was($op->first, OP_RV2HV)) | |
&& ($op->first->flags & OPf_KIDS) | |
&& ( _op_is_or_was($op->first->first, OP_AELEM) | |
|| _op_is_or_was($op->first->first, OP_HELEM)) | |
) | |
{ | |
$derefs++; | |
} | |
} | |
$text .= '->' if !$derefs++; | |
} | |
if (($actions & MDEREF_INDEX_MASK) == MDEREF_INDEX_none) { | |
last; | |
} | |
$text .= $is_hash ? '{' : '['; | |
if (($actions & MDEREF_INDEX_MASK) == MDEREF_INDEX_const) { | |
my $key = shift @items; | |
if ($is_hash) { | |
$text .= $self->const($key, $cx); | |
} | |
else { | |
$text .= $key; | |
} | |
} | |
elsif (($actions & MDEREF_INDEX_MASK) == MDEREF_INDEX_padsv) { | |
$text .= $self->padname(shift @items); | |
} | |
elsif (($actions & MDEREF_INDEX_MASK) == MDEREF_INDEX_gvsv) { | |
$text .= '$' . ($self->stash_variable_name('$', shift @items))[0]; | |
} | |
$text .= $is_hash ? '}' : ']'; | |
if ($actions & MDEREF_FLAG_last) { | |
last; | |
} | |
$actions >>= MDEREF_SHIFT; | |
} | |
return $text; | |
} | |
sub pp_aelem { maybe_local(@_, elem(@_, "[", "]", "padav")) } | |
sub pp_helem { maybe_local(@_, elem(@_, "{", "}", "padhv")) } | |
sub pp_gelem { | |
my $self = shift; | |
my($op, $cx) = @_; | |
my($glob, $part) = ($op->first, $op->last); | |
$glob = $glob->first; # skip rv2gv | |
$glob = $glob->first if $glob->name eq "rv2gv"; # this one's a bug | |
my $scope = is_scope($glob); | |
$glob = $self->deparse($glob, 0); | |
$part = $self->deparse($part, 1); | |
$glob =~ s/::\z// unless $scope; | |
return "*" . ($scope ? "{$glob}" : $glob) . "{$part}"; | |
} | |
sub slice { | |
my $self = shift; | |
my ($op, $cx, $left, $right, $regname, $padname) = @_; | |
my $last; | |
my(@elems, $kid, $array, $list); | |
if (class($op) eq "LISTOP") { | |
$last = $op->last; | |
} else { # ex-hslice inside delete() | |
for ($kid = $op->first; !null $kid->sibling; $kid = $kid->sibling) {} | |
$last = $kid; | |
} | |
$array = $last; | |
$array = $array->first | |
if $array->name eq $regname or $array->name eq "null"; | |
$array = $self->elem_or_slice_array_name($array,$left,$padname,0); | |
$kid = $op->first->sibling; # skip pushmark | |
if ($kid->name eq "list") { | |
$kid = $kid->first->sibling; # skip list, pushmark | |
for (; !null $kid; $kid = $kid->sibling) { | |
push @elems, $self->deparse($kid, 6); | |
} | |
$list = join(", ", @elems); | |
} else { | |
$list = $self->elem_or_slice_single_index($kid); | |
} | |
my $lead = ( _op_is_or_was($op, OP_KVHSLICE) | |
|| _op_is_or_was($op, OP_KVASLICE)) | |
? '%' : '@'; | |
return $lead . $array . $left . $list . $right; | |
} | |
sub pp_aslice { maybe_local(@_, slice(@_, "[", "]", "rv2av", "padav")) } | |
sub pp_kvaslice { slice(@_, "[", "]", "rv2av", "padav") } | |
sub pp_hslice { maybe_local(@_, slice(@_, "{", "}", "rv2hv", "padhv")) } | |
sub pp_kvhslice { slice(@_, "{", "}", "rv2hv", "padhv") } | |
sub pp_lslice { | |
my $self = shift; | |
my($op, $cx) = @_; | |
my $idx = $op->first; | |
my $list = $op->last; | |
my(@elems, $kid); | |
$list = $self->deparse($list, 1); | |
$idx = $self->deparse($idx, 1); | |
return "($list)" . "[$idx]"; | |
} | |
sub want_scalar { | |
my $op = shift; | |
return ($op->flags & OPf_WANT) == OPf_WANT_SCALAR; | |
} | |
sub want_list { | |
my $op = shift; | |
return ($op->flags & OPf_WANT) == OPf_WANT_LIST; | |
} | |
sub _method { | |
my $self = shift; | |
my($op, $cx) = @_; | |
my $kid = $op->first->sibling; # skip pushmark | |
my($meth, $obj, @exprs); | |
if ($kid->name eq "list" and want_list $kid) { | |
# When an indirect object isn't a bareword but the args are in | |
# parens, the parens aren't part of the method syntax (the LLAFR | |
# doesn't apply), but they make a list with OPf_PARENS set that | |
# doesn't get flattened by the append_elem that adds the method, | |
# making a (object, arg1, arg2, ...) list where the object | |
# usually is. This can be distinguished from | |
# '($obj, $arg1, $arg2)->meth()' (which is legal if $arg2 is an | |
# object) because in the later the list is in scalar context | |
# as the left side of -> always is, while in the former | |
# the list is in list context as method arguments always are. | |
# (Good thing there aren't method prototypes!) | |
$meth = $kid->sibling; | |
$kid = $kid->first->sibling; # skip pushmark | |
$obj = $kid; | |
$kid = $kid->sibling; | |
for (; not null $kid; $kid = $kid->sibling) { | |
push @exprs, $kid; | |
} | |
} else { | |
$obj = $kid; | |
$kid = $kid->sibling; | |
for (; !null ($kid->sibling) && $kid->name!~/^method(?:_named)?\z/; | |
$kid = $kid->sibling) { | |
push @exprs, $kid | |
} | |
$meth = $kid; | |
} | |
if ($meth->name eq "method_named") { | |
$meth = $self->meth_sv($meth)->PV; | |
} elsif ($meth->name eq "method_super") { | |
$meth = "SUPER::".$self->meth_sv($meth)->PV; | |
} elsif ($meth->name eq "method_redir") { | |
$meth = $self->meth_rclass_sv($meth)->PV.'::'.$self->meth_sv($meth)->PV; | |
} elsif ($meth->name eq "method_redir_super") { | |
$meth = $self->meth_rclass_sv($meth)->PV.'::SUPER::'. | |
$self->meth_sv($meth)->PV; | |
} else { | |
$meth = $meth->first; | |
if ($meth->name eq "const") { | |
# As of 5.005_58, this case is probably obsoleted by the | |
# method_named case above | |
$meth = $self->const_sv($meth)->PV; # needs to be bare | |
} | |
} | |
return { method => $meth, variable_method => ref($meth), | |
object => $obj, args => \@exprs }, | |
$cx; | |
} | |
# compat function only | |
sub method { | |
my $self = shift; | |
my $info = $self->_method(@_); | |
return $self->e_method( $self->_method(@_) ); | |
} | |
sub e_method { | |
my ($self, $info, $cx) = @_; | |
my $obj = $self->deparse($info->{object}, 24); | |
my $meth = $info->{method}; | |
$meth = $self->deparse($meth, 1) if $info->{variable_method}; | |
my $args = join(", ", map { $self->deparse($_, 6) } @{$info->{args}} ); | |
if ($info->{object}->name eq 'scope' && want_list $info->{object}) { | |
# method { $object } | |
# This must be deparsed this way to preserve list context | |
# of $object. | |
my $need_paren = $cx >= 6; | |
return '(' x $need_paren | |
. $meth . substr($obj,2) # chop off the "do" | |
. " $args" | |
. ')' x $need_paren; | |
} | |
my $kid = $obj . "->" . $meth; | |
if (length $args) { | |
return $kid . "(" . $args . ")"; # parens mandatory | |
} else { | |
return $kid; | |
} | |
} | |
# returns "&" if the prototype doesn't match the args, | |
# or ("", $args_after_prototype_demunging) if it does. | |
sub check_proto { | |
my $self = shift; | |
return "&" if $self->{'noproto'}; | |
my($proto, @args) = @_; | |
my($arg, $real); | |
my $doneok = 0; | |
my @reals; | |
# An unbackslashed @ or % gobbles up the rest of the args | |
1 while $proto =~ s/(?<!\\)([@%])[^\]]+$/$1/; | |
$proto =~ s/^\s*//; | |
while ($proto) { | |
$proto =~ s/^(\\?[\$\@&%*_]|\\\[[\$\@&%*]+\]|;|)\s*//; | |
my $chr = $1; | |
if ($chr eq "") { | |
return "&" if @args; | |
} elsif ($chr eq ";") { | |
$doneok = 1; | |
} elsif ($chr eq "@" or $chr eq "%") { | |
push @reals, map($self->deparse($_, 6), @args); | |
@args = (); | |
} else { | |
$arg = shift @args; | |
last unless $arg; | |
if ($chr eq "\$" || $chr eq "_") { | |
if (want_scalar $arg) { | |
push @reals, $self->deparse($arg, 6); | |
} else { | |
return "&"; | |
} | |
} elsif ($chr eq "&") { | |
if ($arg->name =~ /^(s?refgen|undef)$/) { | |
push @reals, $self->deparse($arg, 6); | |
} else { | |
return "&"; | |
} | |
} elsif ($chr eq "*") { | |
if ($arg->name =~ /^s?refgen$/ | |
and $arg->first->first->name eq "rv2gv") | |
{ | |
$real = $arg->first->first; # skip refgen, null | |
if ($real->first->name eq "gv") { | |
push @reals, $self->deparse($real, 6); | |
} else { | |
push @reals, $self->deparse($real->first, 6); | |
} | |
} else { | |
return "&"; | |
} | |
} elsif (substr($chr, 0, 1) eq "\\") { | |
$chr =~ tr/\\[]//d; | |
if ($arg->name =~ /^s?refgen$/ and | |
!null($real = $arg->first) and | |
($chr =~ /\$/ && is_scalar($real->first) | |
or ($chr =~ /@/ | |
&& class($real->first->sibling) ne 'NULL' | |
&& $real->first->sibling->name | |
=~ /^(rv2|pad)av$/) | |
or ($chr =~ /%/ | |
&& class($real->first->sibling) ne 'NULL' | |
&& $real->first->sibling->name | |
=~ /^(rv2|pad)hv$/) | |
#or ($chr =~ /&/ # This doesn't work | |
# && $real->first->name eq "rv2cv") | |
or ($chr =~ /\*/ | |
&& $real->first->name eq "rv2gv"))) | |
{ | |
push @reals, $self->deparse($real, 6); | |
} else { | |
return "&"; | |
} | |
} | |
} | |
} | |
return "&" if $proto and !$doneok; # too few args and no ';' | |
return "&" if @args; # too many args | |
return ("", join ", ", @reals); | |
} | |
sub retscalar { | |
my $name = $_[0]->name; | |
# XXX There has to be a better way of doing this scalar-op check. | |
# Currently PL_opargs is not exposed. | |
if ($name eq 'null') { | |
$name = substr B::ppname($_[0]->targ), 3 | |
} | |
$name =~ /^(?:scalar|pushmark|wantarray|const|gvsv|gv|padsv|rv2gv | |
|rv2sv|av2arylen|anoncode|prototype|srefgen|ref|bless | |
|regcmaybe|regcreset|regcomp|qr|subst|substcont|trans | |
|transr|sassign|chop|schop|chomp|schomp|defined|undef | |
|study|pos|preinc|i_preinc|predec|i_predec|postinc | |
|i_postinc|postdec|i_postdec|pow|multiply|i_multiply | |
|divide|i_divide|modulo|i_modulo|add|i_add|subtract | |
|i_subtract|concat|multiconcat|stringify|left_shift|right_shift|lt | |
|i_lt|gt|i_gt|le|i_le|ge|i_ge|eq|i_eq|ne|i_ne|ncmp|i_ncmp | |
|slt|sgt|sle|sge|seq|sne|scmp|[sn]?bit_(?:and|x?or)|negate | |
|i_negate|not|[sn]?complement|smartmatch|atan2|sin|cos | |
|rand|srand|exp|log|sqrt|int|hex|oct|abs|length|substr | |
|vec|index|rindex|sprintf|formline|ord|chr|crypt|ucfirst | |
|lcfirst|uc|lc|quotemeta|aelemfast|aelem|exists|helem | |
|pack|join|anonlist|anonhash|push|pop|shift|unshift|xor | |
|andassign|orassign|dorassign|warn|die|reset|nextstate | |
|dbstate|unstack|last|next|redo|dump|goto|exit|open|close | |
|pipe_op|fileno|umask|binmode|tie|untie|tied|dbmopen | |
|dbmclose|select|getc|read|enterwrite|prtf|print|say | |
|sysopen|sysseek|sysread|syswrite|eof|tell|seek|truncate | |
|fcntl|ioctl|flock|send|recv|socket|sockpair|bind|connect | |
|listen|accept|shutdown|gsockopt|ssockopt|getsockname | |
|getpeername|ftrread|ftrwrite|ftrexec|fteread|ftewrite | |
|fteexec|ftis|ftsize|ftmtime|ftatime|ftctime|ftrowned | |
|fteowned|ftzero|ftsock|ftchr|ftblk|ftfile|ftdir|ftpipe | |
|ftsuid|ftsgid|ftsvtx|ftlink|fttty|fttext|ftbinary|chdir | |
|chown|chroot|unlink|chmod|utime|rename|link|symlink | |
|readlink|mkdir|rmdir|open_dir|telldir|seekdir|rewinddir | |
|closedir|fork|wait|waitpid|system|exec|kill|getppid | |
|getpgrp|setpgrp|getpriority|setpriority|time|alarm|sleep | |
|shmget|shmctl|shmread|shmwrite|msgget|msgctl|msgsnd | |
|msgrcv|semop|semget|semctl|hintseval|shostent|snetent | |
|sprotoent|sservent|ehostent|enetent|eprotoent|eservent | |
|spwent|epwent|sgrent|egrent|getlogin|syscall|lock|runcv | |
|fc)\z/x | |
} | |
sub pp_entersub { | |
my $self = shift; | |
my($op, $cx) = @_; | |
return $self->e_method($self->_method($op, $cx)) | |
unless null $op->first->sibling; | |
my $prefix = ""; | |
my $amper = ""; | |
my($kid, @exprs); | |
if ($op->flags & OPf_SPECIAL && !($op->flags & OPf_MOD)) { | |
$prefix = "do "; | |
} elsif ($op->private & OPpENTERSUB_AMPER) { | |
$amper = "&"; | |
} | |
$kid = $op->first; | |
$kid = $kid->first->sibling; # skip ex-list, pushmark | |
for (; not null $kid->sibling; $kid = $kid->sibling) { | |
push @exprs, $kid; | |
} | |
my $simple = 0; | |
my $proto = undef; | |
my $lexical; | |
if (is_scope($kid)) { | |
$amper = "&"; | |
$kid = "{" . $self->deparse($kid, 0) . "}"; | |
} elsif ($kid->first->name eq "gv") { | |
my $gv = $self->gv_or_padgv($kid->first); | |
my $cv; | |
if (class($gv) eq 'GV' && class($cv = $gv->CV) ne "SPECIAL" | |
|| $gv->FLAGS & SVf_ROK && class($cv = $gv->RV) eq 'CV') { | |
$proto = $cv->PV if $cv->FLAGS & SVf_POK; | |
} | |
$simple = 1; # only calls of named functions can be prototyped | |
$kid = $self->maybe_qualify("!", $self->gv_name($gv)); | |
my $fq; | |
# Fully qualify any sub name that conflicts with a lexical. | |
if ($self->lex_in_scope("&$kid") | |
|| $self->lex_in_scope("&$kid", 1)) | |
{ | |
$fq++; | |
} elsif (!$amper) { | |
if ($kid eq 'main::') { | |
$kid = '::'; | |
} | |
else { | |
if ($kid !~ /::/ && $kid ne 'x') { | |
# Fully qualify any sub name that is also a keyword. While | |
# we could check the import flag, we cannot guarantee that | |
# the code deparsed so far would set that flag, so we qual- | |
# ify the names regardless of importation. | |
if (exists $feature_keywords{$kid}) { | |
$fq++ if $self->feature_enabled($kid); | |
} elsif (do { local $@; local $SIG{__DIE__}; | |
eval { () = prototype "CORE::$kid"; 1 } }) { | |
$fq++ | |
} | |
} | |
if ($kid !~ /^(?:\w|::)(?:[\w\d]|::(?!\z))*\z/) { | |
$kid = single_delim("q", "'", $kid, $self) . '->'; | |
} | |
} | |
} | |
$fq and substr $kid, 0, 0, = $self->{'curstash'}.'::'; | |
} elsif (is_scalar ($kid->first) && $kid->first->name ne 'rv2cv') { | |
$amper = "&"; | |
$kid = $self->deparse($kid, 24); | |
} else { | |
$prefix = ""; | |
my $grandkid = $kid->first; | |
my $arrow = ($lexical = $grandkid->name eq "padcv") | |
|| is_subscriptable($grandkid) | |
? "" | |
: "->"; | |
$kid = $self->deparse($kid, 24) . $arrow; | |
if ($lexical) { | |
my $padlist = $self->{'curcv'}->PADLIST; | |
my $padoff = $grandkid->targ; | |
my $padname = $padlist->ARRAYelt(0)->ARRAYelt($padoff); | |
my $protocv = $padname->FLAGS & SVpad_STATE | |
? $padlist->ARRAYelt(1)->ARRAYelt($padoff) | |
: $padname->PROTOCV; | |
if ($protocv->FLAGS & SVf_POK) { | |
$proto = $protocv->PV | |
} | |
$simple = 1; | |
} | |
} | |
# Doesn't matter how many prototypes there are, if | |
# they haven't happened yet! | |
my $declared = $lexical || exists $self->{'subs_declared'}{$kid}; | |
if (not $declared and $self->{'in_coderef2text'}) { | |
no strict 'refs'; | |
no warnings 'uninitialized'; | |
$declared = | |
( | |
defined &{ ${$self->{'curstash'}."::"}{$kid} } | |
&& !exists | |
$self->{'subs_deparsed'}{$self->{'curstash'}."::".$kid} | |
&& defined prototype $self->{'curstash'}."::".$kid | |
); | |
} | |
if (!$declared && defined($proto)) { | |
# Avoid "too early to check prototype" warning | |
($amper, $proto) = ('&'); | |
} | |
my $args; | |
my $listargs = 1; | |
if ($declared and defined $proto and not $amper) { | |
($amper, $args) = $self->check_proto($proto, @exprs); | |
$listargs = $amper; | |
} | |
if ($listargs) { | |
$args = join(", ", map( | |
($_->flags & OPf_WANT) == OPf_WANT_SCALAR | |
&& !retscalar($_) | |
? $self->maybe_parens_unop('scalar', $_, 6) | |
: $self->deparse($_, 6), | |
@exprs | |
)); | |
} | |
if ($prefix or $amper) { | |
if ($kid eq '&') { $kid = "{$kid}" } # &{&} cannot be written as && | |
if ($op->flags & OPf_STACKED) { | |
return $prefix . $amper . $kid . "(" . $args . ")"; | |
} else { | |
return $prefix . $amper. $kid; | |
} | |
} else { | |
# It's a syntax error to call CORE::GLOBAL::foo with a prefix, | |
# so it must have been translated from a keyword call. Translate | |
# it back. | |
$kid =~ s/^CORE::GLOBAL:://; | |
my $dproto = defined($proto) ? $proto : "undefined"; | |
my $scalar_proto = $dproto =~ /^;*(?:[\$*_+]|\\.|\\\[[^]]\])\z/; | |
if (!$declared) { | |
return "$kid(" . $args . ")"; | |
} elsif ($dproto =~ /^\s*\z/) { | |
return $kid; | |
} elsif ($scalar_proto and is_scalar($exprs[0])) { | |
# is_scalar is an excessively conservative test here: | |
# really, we should be comparing to the precedence of the | |
# top operator of $exprs[0] (ala unop()), but that would | |
# take some major code restructuring to do right. | |
return $self->maybe_parens_func($kid, $args, $cx, 16); | |
} elsif (not $scalar_proto and defined($proto) || $simple) { #' | |
return $self->maybe_parens_func($kid, $args, $cx, 5); | |
} else { | |
return "$kid(" . $args . ")"; | |
} | |
} | |
} | |
sub pp_enterwrite { unop(@_, "write") } | |
# escape things that cause interpolation in double quotes, | |
# but not character escapes | |
sub uninterp { | |
my($str) = @_; | |
$str =~ s/(^|\G|[^\\])((?:\\\\)*)([\$\@]|\\[uUlLQE])/$1$2\\$3/g; | |
return $str; | |
} | |
{ | |
my $bal; | |
BEGIN { | |
use re "eval"; | |
# Matches any string which is balanced with respect to {braces} | |
$bal = qr( | |
(?: | |
[^\\{}] | |
| \\\\ | |
| \\[{}] | |
| \{(??{$bal})\} | |
)* | |
)x; | |
} | |
# the same, but treat $|, $), $( and $ at the end of the string differently | |
# and leave comments unmangled for the sake of /x and (?x). | |
sub re_uninterp { | |
my($str) = @_; | |
$str =~ s/ | |
( ^|\G # $1 | |
| [^\\] | |
) | |
( # $2 | |
(?:\\\\)* | |
) | |
( # $3 | |
( \(\?\??\{$bal\}\) # $4 (skip over (?{}) and (??{}) blocks) | |
| \#[^\n]* # (skip over comments) | |
) | |
| [\$\@] | |
(?!\||\)|\(|$|\s) | |
| \\[uUlLQE] | |
) | |
/defined($4) && length($4) ? "$1$2$4" : "$1$2\\$3"/xeg; | |
return $str; | |
} | |
} | |
# character escapes, but not delimiters that might need to be escaped | |
sub escape_str { # ASCII, UTF8 | |
my($str) = @_; | |
$str =~ s/(.)/ord($1) > 255 ? sprintf("\\x{%x}", ord($1)) : $1/eg; | |
$str =~ s/\a/\\a/g; | |
# $str =~ s/\cH/\\b/g; # \b means something different in a regex; and \cH | |
# isn't a backspace in EBCDIC | |
$str =~ s/\t/\\t/g; | |
$str =~ s/\n/\\n/g; | |
$str =~ s/\e/\\e/g; | |
$str =~ s/\f/\\f/g; | |
$str =~ s/\r/\\r/g; | |
$str =~ s/([\cA-\cZ])/'\\c' . $unctrl{$1}/ge; | |
$str =~ s/([[:^print:]])/sprintf("\\%03o", ord($1))/age; | |
return $str; | |
} | |
# For regexes. Leave whitespace unmangled in case of /x or (?x). | |
sub escape_re { | |
my($str) = @_; | |
$str =~ s/(.)/ord($1) > 255 ? sprintf("\\x{%x}", ord($1)) : $1/eg; | |
$str =~ s/([[:^print:]])/ | |
($1 =~ y! \t\n!!) ? $1 : sprintf("\\%03o", ord($1))/age; | |
$str =~ s/\n/\n\f/g; | |
return $str; | |
} | |
# Don't do this for regexen | |
sub unback { | |
my($str) = @_; | |
$str =~ s/\\/\\\\/g; | |
return $str; | |
} | |
# Remove backslashes which precede literal control characters, | |
# to avoid creating ambiguity when we escape the latter. | |
# | |
# Don't remove a backslash from escaped whitespace: where the T represents | |
# a literal tab character, /T/x is not equivalent to /\T/x | |
sub re_unback { | |
my($str) = @_; | |
# the insane complexity here is due to the behaviour of "\c\" | |
$str =~ s/ | |
# these two lines ensure that the backslash we're about to | |
# remove isn't preceeded by something which makes it part | |
# of a \c | |
(^ | [^\\] | \\c\\) # $1 | |
(?<!\\c) | |
# the backslash to remove | |
\\ | |
# keep pairs of backslashes | |
(\\\\)* # $2 | |
# only remove if the thing following is a control char | |
(?=[[:^print:]]) | |
# and not whitespace | |
(?=\S) | |
/$1$2/xg; | |
return $str; | |
} | |
sub balanced_delim { | |
my($str) = @_; | |
my @str = split //, $str; | |
my($ar, $open, $close, $fail, $c, $cnt, $last_bs); | |
for $ar (['[',']'], ['(',')'], ['<','>'], ['{','}']) { | |
($open, $close) = @$ar; | |
$fail = 0; $cnt = 0; $last_bs = 0; | |
for $c (@str) { | |
if ($c eq $open) { | |
$fail = 1 if $last_bs; | |
$cnt++; | |
} elsif ($c eq $close) { | |
$fail = 1 if $last_bs; | |
$cnt--; | |
if ($cnt < 0) { | |
# qq()() isn't ")(" | |
$fail = 1; | |
last; | |
} | |
} | |
$last_bs = $c eq '\\'; | |
} | |
$fail = 1 if $cnt != 0; | |
return ($open, "$open$str$close") if not $fail; | |
} | |
return ("", $str); | |
} | |
sub single_delim { | |
my($q, $default, $str, $self) = @_; | |
return "$default$str$default" if $default and index($str, $default) == -1; | |
my $coreq = $self->keyword($q); # maybe CORE::q | |
if ($q ne 'qr') { | |
(my $succeed, $str) = balanced_delim($str); | |
return "$coreq$str" if $succeed; | |
} | |
for my $delim ('/', '"', '#') { | |
return "$coreq$delim" . $str . $delim if index($str, $delim) == -1; | |
} | |
if ($default) { | |
$str =~ s/$default/\\$default/g; | |
return "$default$str$default"; | |
} else { | |
$str =~ s[/][\\/]g; | |
return "$coreq/$str/"; | |
} | |
} | |
my $max_prec; | |
BEGIN { $max_prec = int(0.999 + 8*length(pack("F", 42))*log(2)/log(10)); } | |
# Split a floating point number into an integer mantissa and a binary | |
# exponent. Assumes you've already made sure the number isn't zero or | |
# some weird infinity or NaN. | |
sub split_float { | |
my($f) = @_; | |
my $exponent = 0; | |
if ($f == int($f)) { | |
while ($f % 2 == 0) { | |
$f /= 2; | |
$exponent++; | |
} | |
} else { | |
while ($f != int($f)) { | |
$f *= 2; | |
$exponent--; | |
} | |
} | |
my $mantissa = sprintf("%.0f", $f); | |
return ($mantissa, $exponent); | |
} | |
# suitably single- or double-quote a literal constant string | |
sub quoted_const_str { | |
my ($self, $str) =@_; | |
if ($str =~ /[[:^print:]]/a) { | |
return single_delim("qq", '"', | |
uninterp(escape_str unback $str), $self); | |
} else { | |
return single_delim("q", "'", unback($str), $self); | |
} | |
} | |
sub const { | |
my $self = shift; | |
my($sv, $cx) = @_; | |
if ($self->{'use_dumper'}) { | |
return $self->const_dumper($sv, $cx); | |
} | |
if (class($sv) eq "SPECIAL") { | |
# sv_undef, sv_yes, sv_no | |
return $$sv == 3 ? $self->maybe_parens("!1", $cx, 21) | |
: ('undef', '1')[$$sv-1]; | |
} | |
if (class($sv) eq "NULL") { | |
return 'undef'; | |
} | |
# convert a version object into the "v1.2.3" string in its V magic | |
if ($sv->FLAGS & SVs_RMG) { | |
for (my $mg = $sv->MAGIC; $mg; $mg = $mg->MOREMAGIC) { | |
return $mg->PTR if $mg->TYPE eq 'V'; | |
} | |
} | |
if ($sv->FLAGS & SVf_IOK) { | |
my $str = $sv->int_value; | |
$str = $self->maybe_parens($str, $cx, 21) if $str < 0; | |
return $str; | |
} elsif ($sv->FLAGS & SVf_NOK) { | |
my $nv = $sv->NV; | |
if ($nv == 0) { | |
if (pack("F", $nv) eq pack("F", 0)) { | |
# positive zero | |
return "0"; | |
} else { | |
# negative zero | |
return $self->maybe_parens("-.0", $cx, 21); | |
} | |
} elsif (1/$nv == 0) { | |
if ($nv > 0) { | |
# positive infinity | |
return $self->maybe_parens("9**9**9", $cx, 22); | |
} else { | |
# negative infinity | |
return $self->maybe_parens("-9**9**9", $cx, 21); | |
} | |
} elsif ($nv != $nv) { | |
# NaN | |
if (pack("F", $nv) eq pack("F", sin(9**9**9))) { | |
# the normal kind | |
return "sin(9**9**9)"; | |
} elsif (pack("F", $nv) eq pack("F", -sin(9**9**9))) { | |
# the inverted kind | |
return $self->maybe_parens("-sin(9**9**9)", $cx, 21); | |
} else { | |
# some other kind | |
my $hex = unpack("h*", pack("F", $nv)); | |
return qq'unpack("F", pack("h*", "$hex"))'; | |
} | |
} | |
# first, try the default stringification | |
my $str = "$nv"; | |
if ($str != $nv) { | |
# failing that, try using more precision | |
$str = sprintf("%.${max_prec}g", $nv); | |
# if (pack("F", $str) ne pack("F", $nv)) { | |
if ($str != $nv) { | |
# not representable in decimal with whatever sprintf() | |
# and atof() Perl is using here. | |
my($mant, $exp) = split_float($nv); | |
return $self->maybe_parens("$mant * 2**$exp", $cx, 19); | |
} | |
} | |
$str = $self->maybe_parens($str, $cx, 21) if $nv < 0; | |
return $str; | |
} elsif ($sv->FLAGS & SVf_ROK && $sv->can("RV")) { | |
my $ref = $sv->RV; | |
my $class = class($ref); | |
if ($class eq "AV") { | |
return "[" . $self->list_const(2, $ref->ARRAY) . "]"; | |
} elsif ($class eq "HV") { | |
my %hash = $ref->ARRAY; | |
my @elts; | |
for my $k (sort keys %hash) { | |
push @elts, "$k => " . $self->const($hash{$k}, 6); | |
} | |
return "{" . join(", ", @elts) . "}"; | |
} elsif ($class eq "CV") { | |
no overloading; | |
if ($self->{curcv} && | |
$self->{curcv}->object_2svref == $ref->object_2svref) { | |
return $self->keyword("__SUB__"); | |
} | |
return "sub " . $self->deparse_sub($ref); | |
} | |
if ($class ne 'SPECIAL' and $ref->FLAGS & SVs_SMG) { | |
for (my $mg = $ref->MAGIC; $mg; $mg = $mg->MOREMAGIC) { | |
if ($mg->TYPE eq 'r') { | |
my $re = re_uninterp(escape_re(re_unback($mg->precomp))); | |
return single_delim("qr", "", $re, $self); | |
} | |
} | |
} | |
my $const = $self->const($ref, 20); | |
if ($self->{in_subst_repl} && $const =~ /^[0-9]/) { | |
$const = "($const)"; | |
} | |
return $self->maybe_parens("\\$const", $cx, 20); | |
} elsif ($sv->FLAGS & SVf_POK) { | |
my $str = $sv->PV; | |
return $self->quoted_const_str($str); | |
} else { | |
return "undef"; | |
} | |
} | |
sub const_dumper { | |
my $self = shift; | |
my($sv, $cx) = @_; | |
my $ref = $sv->object_2svref(); | |
my $dumper = Data::Dumper->new([$$ref], ['$v']); | |
$dumper->Purity(1)->Terse(1)->Deparse(1)->Indent(0)->Useqq(1)->Sortkeys(1); | |
my $str = $dumper->Dump(); | |
if ($str =~ /^\$v/) { | |
return '${my ' . $str . ' \$v}'; | |
} else { | |
return $str; | |
} | |
} | |
sub const_sv { | |
my $self = shift; | |
my $op = shift; | |
my $sv = $op->sv; | |
# the constant could be in the pad (under useithreads) | |
$sv = $self->padval($op->targ) unless $$sv; | |
return $sv; | |
} | |
sub meth_sv { | |
my $self = shift; | |
my $op = shift; | |
my $sv = $op->meth_sv; | |
# the constant could be in the pad (under useithreads) | |
$sv = $self->padval($op->targ) unless $$sv; | |
return $sv; | |
} | |
sub meth_rclass_sv { | |
my $self = shift; | |
my $op = shift; | |
my $sv = $op->rclass; | |
# the constant could be in the pad (under useithreads) | |
$sv = $self->padval($sv) unless ref $sv; | |
return $sv; | |
} | |
sub pp_const { | |
my $self = shift; | |
my($op, $cx) = @_; | |
# if ($op->private & OPpCONST_BARE) { # trouble with '=>' autoquoting | |
# return $self->const_sv($op)->PV; | |
# } | |
my $sv = $self->const_sv($op); | |
return $self->const($sv, $cx); | |
} | |
# Join two components of a double-quoted string, disambiguating | |
# "${foo}bar", "${foo}{bar}", "${foo}[1]", "$foo\::bar" | |
sub dq_disambiguate { | |
my ($first, $last) = @_; | |
($last =~ /^[A-Z\\\^\[\]_?]/ && | |
$first =~ s/([\$@])\^$/${1}{^}/) # "${^}W" etc | |
|| ($last =~ /^[:'{\[\w_]/ && #' | |
$first =~ s/([\$@])([A-Za-z_]\w*)$/${1}{$2}/); | |
return $first . $last; | |
} | |
# Deparse a double-quoted optree. For example, "$a[0]\Q$b\Efo\"o" gets | |
# compiled to concat(concat($[0],quotemeta($b)),const("fo\"o")), and this | |
# sub deparses it back to $a[0]\Q$b\Efo"o | |
# (It does not add delimiters) | |
sub dq { | |
my $self = shift; | |
my $op = shift; | |
my $type = $op->name; | |
if ($type eq "const") { | |
return uninterp(escape_str(unback($self->const_sv($op)->as_string))); | |
} elsif ($type eq "concat") { | |
return dq_disambiguate($self->dq($op->first), $self->dq($op->last)); | |
} elsif ($type eq "multiconcat") { | |
return $self->do_multiconcat($op, 26, 1); | |
} elsif ($type eq "uc") { | |
return '\U' . $self->dq($op->first->sibling) . '\E'; | |
} elsif ($type eq "lc") { | |
return '\L' . $self->dq($op->first->sibling) . '\E'; | |
} elsif ($type eq "ucfirst") { | |
return '\u' . $self->dq($op->first->sibling); | |
} elsif ($type eq "lcfirst") { | |
return '\l' . $self->dq($op->first->sibling); | |
} elsif ($type eq "quotemeta") { | |
return '\Q' . $self->dq($op->first->sibling) . '\E'; | |
} elsif ($type eq "fc") { | |
return '\F' . $self->dq($op->first->sibling) . '\E'; | |
} elsif ($type eq "join") { | |
return $self->deparse($op->last, 26); # was join($", @ary) | |
} else { | |
return $self->deparse($op, 26); | |
} | |
} | |
sub pp_backtick { | |
my $self = shift; | |
my($op, $cx) = @_; | |
# skip pushmark if it exists (readpipe() vs ``) | |
my $child = $op->first->sibling->isa('B::NULL') | |
? $op->first : $op->first->sibling; | |
if ($self->pure_string($child)) { | |
return single_delim("qx", '`', $self->dq($child, 1), $self); | |
} | |
unop($self, @_, "readpipe"); | |
} | |
sub dquote { | |
my $self = shift; | |
my($op, $cx) = @_; | |
my $kid = $op->first->sibling; # skip ex-stringify, pushmark | |
return $self->deparse($kid, $cx) if $self->{'unquote'}; | |
$self->maybe_targmy($kid, $cx, | |
sub {single_delim("qq", '"', $self->dq($_[1]), | |
$self)}); | |
} | |
# OP_STRINGIFY is a listop, but it only ever has one arg | |
sub pp_stringify { | |
my ($self, $op, $cx) = @_; | |
my $kid = $op->first->sibling; | |
while ($kid->name eq 'null' && !null($kid->first)) { | |
$kid = $kid->first; | |
} | |
if ($kid->name =~ /^(?:const|padsv|rv2sv|av2arylen|gvsv|multideref | |
|aelemfast(?:_lex)?|[ah]elem|join|concat)\z/x) { | |
maybe_targmy(@_, \&dquote); | |
} | |
else { | |
# Actually an optimised join. | |
my $result = listop(@_,"join"); | |
$result =~ s/join([( ])/join$1$self->{'ex_const'}, /; | |
$result; | |
} | |
} | |
# tr/// and s/// (and tr[][], tr[]//, tr###, etc) | |
# note that tr(from)/to/ is OK, but not tr/from/(to) | |
sub double_delim { | |
my($from, $to) = @_; | |
my($succeed, $delim); | |
if ($from !~ m[/] and $to !~ m[/]) { | |
return "/$from/$to/"; | |
} elsif (($succeed, $from) = balanced_delim($from) and $succeed) { | |
if (($succeed, $to) = balanced_delim($to) and $succeed) { | |
return "$from$to"; | |
} else { | |
for $delim ('/', '"', '#') { # note no "'" -- s''' is special | |
return "$from$delim$to$delim" if index($to, $delim) == -1; | |
} | |
$to =~ s[/][\\/]g; | |
return "$from/$to/"; | |
} | |
} else { | |
for $delim ('/', '"', '#') { # note no ' | |
return "$delim$from$delim$to$delim" | |
if index($to . $from, $delim) == -1; | |
} | |
$from =~ s[/][\\/]g; | |
$to =~ s[/][\\/]g; | |
return "/$from/$to/"; | |
} | |
} | |
# Escape a characrter. | |
# Only used by tr///, so backslashes hyphens | |
sub pchr { | |
my($n) = @_; | |
return sprintf("\\x{%X}", $n) if $n > 255; | |
return '\\\\' if $n == ord '\\'; | |
return "\\-" if $n == ord "-"; | |
# I'm presuming a regex is not ok here, otherwise we could have used | |
# /[[:print:]]/a to get here | |
return chr($n) if ( utf8::native_to_unicode($n) | |
>= utf8::native_to_unicode(ord(' ')) | |
and utf8::native_to_unicode($n) | |
<= utf8::native_to_unicode(ord('~'))); | |
my $mnemonic_pos = index("\a\b\e\f\n\r\t", chr($n)); | |
return "\\" . substr("abefnrt", $mnemonic_pos, 1) if $mnemonic_pos >= 0; | |
return '\\c' . $unctrl{chr $n} if $n >= ord("\cA") and $n <= ord("\cZ"); | |
# return '\x' . sprintf("%02x", $n); | |
return '\\' . sprintf("%03o", $n); | |
} | |
# Convert a list of characters into a string suitable for tr/// search or | |
# replacement, with suitable escaping and collapsing of ranges | |
sub collapse { | |
my(@chars) = @_; | |
my($str, $c, $tr) = (""); | |
for ($c = 0; $c < @chars; $c++) { | |
$tr = $chars[$c]; | |
$str .= pchr($tr); | |
if ($c <= $#chars - 2 and $chars[$c + 1] == $tr + 1 and | |
$chars[$c + 2] == $tr + 2) | |
{ | |
for (; $c <= $#chars-1 and $chars[$c + 1] == $chars[$c] + 1; $c++) | |
{} | |
$str .= "-"; | |
$str .= pchr($chars[$c]); | |
} | |
} | |
return $str; | |
} | |
sub tr_decode_byte { | |
my($table, $flags) = @_; | |
my $ssize_t = $Config{ptrsize} == 8 ? 'q' : 'l'; | |
my ($size, @table) = unpack("${ssize_t}s*", $table); | |
pop @table; # remove the wildcard final entry | |
my($c, $tr, @from, @to, @delfrom, $delhyphen); | |
if ($table[ord "-"] != -1 and | |
$table[ord("-") - 1] == -1 || $table[ord("-") + 1] == -1) | |
{ | |
$tr = $table[ord "-"]; | |
$table[ord "-"] = -1; | |
if ($tr >= 0) { | |
@from = ord("-"); | |
@to = $tr; | |
} else { # -2 ==> delete | |
$delhyphen = 1; | |
} | |
} | |
for ($c = 0; $c < @table; $c++) { | |
$tr = $table[$c]; | |
if ($tr >= 0) { | |
push @from, $c; push @to, $tr; | |
} elsif ($tr == -2) { | |
push @delfrom, $c; | |
} | |
} | |
@from = (@from, @delfrom); | |
if ($flags & OPpTRANS_COMPLEMENT) { | |
unless ($flags & OPpTRANS_DELETE) { | |
@to = () if ("@from" eq "@to"); | |
} | |
my @newfrom = (); | |
my %from; | |
@from{@from} = (1) x @from; | |
for ($c = 0; $c < 256; $c++) { | |
push @newfrom, $c unless $from{$c}; | |
} | |
@from = @newfrom; | |
} | |
unless ($flags & OPpTRANS_DELETE || !@to) { | |
pop @to while $#to and $to[$#to] == $to[$#to -1]; | |
} | |
my($from, $to); | |
$from = collapse(@from); | |
$to = collapse(@to); | |
$from .= "-" if $delhyphen; | |
return ($from, $to); | |
} | |
my $infinity = ~0 >> 1; # IV_MAX | |
sub tr_append_to_invlist { | |
my ($list_ref, $current, $next) = @_; | |
# Appends the range $current..$next-1 to the inversion list $list_ref | |
printf STDERR "%d: %d..%d %s", __LINE__, $current, $next, Dumper $list_ref if DEBUG; | |
if (@$list_ref && $list_ref->[-1] == $current) { | |
# The new range extends the current final one. If it is a finite | |
# rane, replace the current final by the new ending. | |
if (defined $next) { | |
$list_ref->[-1] = $next; | |
} | |
else { | |
# The new range extends to infinity, which means the current end | |
# of the inversion list is dangling. Removing it causes things to | |
# work. | |
pop @$list_ref; | |
} | |
} | |
else { # The new range starts after the current final one; add it as a | |
# new range | |
push @$list_ref, $current; | |
push @$list_ref, $next if defined $next; | |
} | |
print STDERR __LINE__, ": ", Dumper $list_ref if DEBUG; | |
} | |
sub tr_invlist_to_string { | |
my ($list_ref, $to_complement) = @_; | |
# Stringify the inversion list $list_ref, possibly complementing it first. | |
# CAUTION: this can modify $list_ref. | |
print STDERR __LINE__, ": ", Dumper $list_ref if DEBUG; | |
if ($to_complement) { | |
# Complementing an inversion list is done by prepending a 0 if it | |
# doesn't have one there already; otherwise removing the leading 0. | |
if ($list_ref->[0] == 0) { | |
shift @$list_ref; | |
} | |
else { | |
unshift @$list_ref, 0; | |
} | |
print STDERR __LINE__, ": ", Dumper $list_ref if DEBUG; | |
} | |
my $output = ""; | |
# Every other element is in the list. | |
for (my $i = 0; $i < @$list_ref; $i += 2) { | |
my $base = $list_ref->[$i]; | |
$output .= pchr($base); | |
last unless defined $list_ref->[$i+1]; | |
# The beginning of the next element starts the range of items not in | |
# the list. | |
my $upper = $list_ref->[$i+1] - 1; | |
my $range = $upper - $base; | |
$output .= '-' if $range > 1; # Adjacent characters don't have a | |
# minus, though it would be legal to do | |
# so | |
$output .= pchr($upper) if $range > 0; | |
} | |
print STDERR __LINE__, ": tr_invlist_to_string() returning '$output'\n" | |
if DEBUG; | |
return $output; | |
} | |
my $unmapped = ~0; | |
my $special_handling = ~0 - 1; | |
sub dump_invmap { | |
my ($invlist_ref, $map_ref) = @_; | |
for my $i (0 .. @$invlist_ref - 1) { | |
printf STDERR "[%d]\t%x\t", $i, $invlist_ref->[$i]; | |
my $map = $map_ref->[$i]; | |
if ($map == $unmapped) { | |
print STDERR "TR_UNMAPPED\n"; | |
} | |
elsif ($map == $special_handling) { | |
print STDERR "TR_SPECIAL\n"; | |
} | |
else { | |
printf STDERR "%x\n", $map; | |
} | |
} | |
} | |
sub tr_decode_utf8 { | |
my($tr_av, $flags) = @_; | |
printf STDERR "\n%s: %d: flags=0x%x\n", __FILE__, __LINE__, $flags if DEBUG; | |
my $invlist = $tr_av->ARRAYelt(0); | |
my @invlist = unpack("J*", $invlist->PV); | |
my @map = unpack("J*", $tr_av->ARRAYelt(1)->PV); | |
dump_invmap(\@invlist, \@map) if DEBUG; | |
my @from; | |
my @to; | |
# Go through the whole map | |
for (my $i = 0; $i < @invlist; $i++) { | |
my $map = $map[$i]; | |
printf STDERR "%d: i=%d, source=%x, map=%x\n", | |
__LINE__, $i, $invlist[$i], $map if DEBUG; | |
# Ignore any lines that are unmapped | |
next if $map == $unmapped; | |
# Calculate this component of the mapping; First the lhs | |
my $this_from = $invlist[$i]; | |
my $next_from = $invlist[$i+1] if $i < @invlist - 1; | |
# The length of the rhs is the same as the lhs, except when special | |
my $next_map = $map - $this_from + $next_from | |
if $map != $special_handling && defined $next_from; | |
if (DEBUG) { | |
printf STDERR "%d: i=%d, from=%x, to=%x", | |
__LINE__, $i, $this_from, $map; | |
printf STDERR ", next_from=%x,", $next_from if defined $next_from; | |
printf STDERR ", next_map=%x", $next_map if defined $next_map; | |
print STDERR "\n"; | |
} | |
# Add the lhs. | |
tr_append_to_invlist(\@from, $this_from, $next_from); | |
# And, the rhs; special handling doesn't get output as it really is an | |
# unmatched rhs | |
tr_append_to_invlist(\@to, $map, $next_map) if $map != $special_handling; | |
} | |
# Done with the input. | |
my $to; | |
if (join("", @from) eq join("", @to)) { | |
# the rhs is suppressed if identical to the left. That's because | |
# tr/ABC/ABC/ can be written as tr/ABC//. (Do this comparison before | |
# any complementing) | |
$to = ""; | |
} | |
else { | |
$to = tr_invlist_to_string(\@to, 0); # rhs not complemented | |
} | |
my $from = tr_invlist_to_string(\@from, | |
($flags & OPpTRANS_COMPLEMENT) != 0); | |
print STDERR "Returning ", escape_str($from), "/", | |
escape_str($to), "\n" if DEBUG; | |
return (escape_str($from), escape_str($to)); | |
} | |
sub pp_trans { | |
my $self = shift; | |
my($op, $cx, $morflags) = @_; | |
my($from, $to); | |
my $class = class($op); | |
my $priv_flags = $op->private; | |
if ($class eq "PVOP") { | |
($from, $to) = tr_decode_byte($op->pv, $priv_flags); | |
} elsif ($class eq "PADOP") { | |
($from, $to) | |
= tr_decode_utf8($self->padval($op->padix), $priv_flags); | |
} else { # class($op) eq "SVOP" | |
($from, $to) = tr_decode_utf8($op->sv, $priv_flags); | |
} | |
my $flags = ""; | |
$flags .= "c" if $priv_flags & OPpTRANS_COMPLEMENT; | |
$flags .= "d" if $priv_flags & OPpTRANS_DELETE; | |
$to = "" if $from eq $to and $flags eq ""; | |
$flags .= "s" if $priv_flags & OPpTRANS_SQUASH; | |
$flags .= $morflags if defined $morflags; | |
my $ret = $self->keyword("tr") . double_delim($from, $to) . $flags; | |
if (my $targ = $op->targ) { | |
return $self->maybe_parens($self->padname($targ) . " =~ $ret", | |
$cx, 20); | |
} | |
return $ret; | |
} | |
sub pp_transr { push @_, 'r'; goto &pp_trans } | |
# Join two components of a double-quoted re, disambiguating | |
# "${foo}bar", "${foo}{bar}", "${foo}[1]". | |
sub re_dq_disambiguate { | |
my ($first, $last) = @_; | |
($last =~ /^[A-Z\\\^\[\]_?]/ && | |
$first =~ s/([\$@])\^$/${1}{^}/) # "${^}W" etc | |
|| ($last =~ /^[{\[\w_]/ && | |
$first =~ s/([\$@])([A-Za-z_]\w*)$/${1}{$2}/); | |
return $first . $last; | |
} | |
# Like dq(), but different | |
sub re_dq { | |
my $self = shift; | |
my ($op) = @_; | |
my $type = $op->name; | |
if ($type eq "const") { | |
my $unbacked = re_unback($self->const_sv($op)->as_string); | |
return re_uninterp(escape_re($unbacked)); | |
} elsif ($type eq "concat") { | |
my $first = $self->re_dq($op->first); | |
my $last = $self->re_dq($op->last); | |
return re_dq_disambiguate($first, $last); | |
} elsif ($type eq "multiconcat") { | |
return $self->do_multiconcat($op, 26, 2); | |
} elsif ($type eq "uc") { | |
return '\U' . $self->re_dq($op->first->sibling) . '\E'; | |
} elsif ($type eq "lc") { | |
return '\L' . $self->re_dq($op->first->sibling) . '\E'; | |
} elsif ($type eq "ucfirst") { | |
return '\u' . $self->re_dq($op->first->sibling); | |
} elsif ($type eq "lcfirst") { | |
return '\l' . $self->re_dq($op->first->sibling); | |
} elsif ($type eq "quotemeta") { | |
return '\Q' . $self->re_dq($op->first->sibling) . '\E'; | |
} elsif ($type eq "fc") { | |
return '\F' . $self->re_dq($op->first->sibling) . '\E'; | |
} elsif ($type eq "join") { | |
return $self->deparse($op->last, 26); # was join($", @ary) | |
} else { | |
my $ret = $self->deparse($op, 26); | |
$ret =~ s/^\$([(|)])\z/\${$1}/ # $( $| $) need braces | |
or $ret =~ s/^\@([-+])\z/\@{$1}/; # @- @+ need braces | |
return $ret; | |
} | |
} | |
sub pure_string { | |
my ($self, $op) = @_; | |
return 0 if null $op; | |
my $type = $op->name; | |
if ($type eq 'const' || $type eq 'av2arylen') { | |
return 1; | |
} | |
elsif ($type =~ /^(?:[ul]c(first)?|fc)$/ || $type eq 'quotemeta') { | |
return $self->pure_string($op->first->sibling); | |
} | |
elsif ($type eq 'join') { | |
my $join_op = $op->first->sibling; # Skip pushmark | |
return 0 unless $join_op->name eq 'null' && $join_op->targ == OP_RV2SV; | |
my $gvop = $join_op->first; | |
return 0 unless $gvop->name eq 'gvsv'; | |
return 0 unless '"' eq $self->gv_name($self->gv_or_padgv($gvop)); | |
return 0 unless ${$join_op->sibling} eq ${$op->last}; | |
return 0 unless $op->last->name =~ /^(?:[ah]slice|(?:rv2|pad)av)$/; | |
} | |
elsif ($type eq 'concat') { | |
return $self->pure_string($op->first) | |
&& $self->pure_string($op->last); | |
} | |
elsif ($type eq 'multiconcat') { | |
my ($kid, @kids); | |
for ($kid = $op->first; !null $kid; $kid = $kid->sibling) { | |
# skip the consts and/or padsv we've optimised away | |
push @kids, $kid | |
unless $kid->type == OP_NULL | |
&& ( $kid->targ == OP_PADSV | |
|| $kid->targ == OP_CONST | |
|| $kid->targ == OP_PUSHMARK); | |
} | |
if ($op->flags & OPf_STACKED) { | |
# remove expr from @kids where 'expr = ...' or 'expr .= ....' | |
if ($op->private & OPpMULTICONCAT_APPEND) { | |
shift(@kids); | |
} | |
else { | |
pop(@kids); | |
} | |
} | |
for (@kids) { | |
return 0 unless $self->pure_string($_); | |
} | |
return 1; | |
} | |
elsif (is_scalar($op) || $type =~ /^[ah]elem$/) { | |
return 1; | |
} | |
elsif ($type eq "null" and $op->can('first') and not null $op->first) { | |
my $first = $op->first; | |
return 1 if $first->name eq "multideref"; | |
return 1 if $first->name eq "aelemfast_lex"; | |
if ( $first->name eq "null" | |
and $first->can('first') | |
and not null $first->first | |
and $first->first->name eq "aelemfast" | |
) | |
{ | |
return 1; | |
} | |
} | |
return 0; | |
} | |
sub code_list { | |
my ($self,$op,$cv) = @_; | |
# localise stuff relating to the current sub | |
$cv and | |
local($self->{'curcv'}) = $cv, | |
local($self->{'curcvlex'}), | |
local(@$self{qw'curstash warnings hints hinthash curcop'}) | |
= @$self{qw'curstash warnings hints hinthash curcop'}; | |
my $re; | |
for ($op = $op->first->sibling; !null($op); $op = $op->sibling) { | |
if ($op->name eq 'null' and $op->flags & OPf_SPECIAL) { | |
my $scope = $op->first; | |
# 0 context (last arg to scopeop) means statement context, so | |
# the contents of the block will not be wrapped in do{...}. | |
my $block = scopeop($scope->first->name eq "enter", $self, | |
$scope, 0); | |
# next op is the source code of the block | |
$op = $op->sibling; | |
$re .= ($self->const_sv($op)->PV =~ m|^(\(\?\??\{)|)[0]; | |
my $multiline = $block =~ /\n/; | |
$re .= $multiline ? "\n\t" : ' '; | |
$re .= $block; | |
$re .= $multiline ? "\n\b})" : " })"; | |
} else { | |
$re = re_dq_disambiguate($re, $self->re_dq($op)); | |
} | |
} | |
$re; | |
} | |
sub regcomp { | |
my $self = shift; | |
my($op, $cx) = @_; | |
my $kid = $op->first; | |
$kid = $kid->first if $kid->name eq "regcmaybe"; | |
$kid = $kid->first if $kid->name eq "regcreset"; | |
my $kname = $kid->name; | |
if ($kname eq "null" and !null($kid->first) | |
and $kid->first->name eq 'pushmark') | |
{ | |
my $str = ''; | |
$kid = $kid->first->sibling; | |
while (!null($kid)) { | |
my $first = $str; | |
my $last = $self->re_dq($kid); | |
$str = re_dq_disambiguate($first, $last); | |
$kid = $kid->sibling; | |
} | |
return $str, 1; | |
} | |
return ($self->re_dq($kid), 1) | |
if $kname =~ /^(?:rv2|pad)av/ or $self->pure_string($kid); | |
return ($self->deparse($kid, $cx), 0); | |
} | |
sub pp_regcomp { | |
my ($self, $op, $cx) = @_; | |
return (($self->regcomp($op, $cx, 0))[0]); | |
} | |
sub re_flags { | |
my ($self, $op) = @_; | |
my $flags = ''; | |
my $pmflags = $op->pmflags; | |
if (!$pmflags) { | |
my $re = $op->pmregexp; | |
if ($$re) { | |
$pmflags = $re->compflags; | |
} | |
} | |
$flags .= "g" if $pmflags & PMf_GLOBAL; | |
$flags .= "i" if $pmflags & PMf_FOLD; | |
$flags .= "m" if $pmflags & PMf_MULTILINE; | |
$flags .= "o" if $pmflags & PMf_KEEP; | |
$flags .= "s" if $pmflags & PMf_SINGLELINE; | |
$flags .= "x" if $pmflags & PMf_EXTENDED; | |
$flags .= "x" if $pmflags & PMf_EXTENDED_MORE; | |
$flags .= "p" if $pmflags & PMf_KEEPCOPY; | |
$flags .= "n" if $pmflags & PMf_NOCAPTURE; | |
if (my $charset = $pmflags & PMf_CHARSET) { | |
# Hardcoding this is fragile, but B does not yet export the | |
# constants we need. | |
$flags .= qw(d l u a aa)[$charset >> 7] | |
} | |
# The /d flag is indicated by 0; only show it if necessary. | |
elsif ($self->{hinthash} and | |
$self->{hinthash}{reflags_charset} | |
|| $self->{hinthash}{feature_unicode} | |
or $self->{hints} & $feature::hint_mask | |
&& ($self->{hints} & $feature::hint_mask) | |
!= $feature::hint_mask | |
&& $self->{hints} & $feature::hint_uni8bit | |
) { | |
$flags .= 'd'; | |
} | |
$flags; | |
} | |
# osmic acid -- see osmium tetroxide | |
my %matchwords; | |
map($matchwords{join "", sort split //, $_} = $_, 'cig', 'cog', 'cos', 'cogs', | |
'cox', 'go', 'is', 'ism', 'iso', 'mig', 'mix', 'osmic', 'ox', 'sic', | |
'sig', 'six', 'smog', 'so', 'soc', 'sog', 'xi', 'soup', 'soupmix'); | |
# When deparsing a regular expression with code blocks, we have to look in | |
# various places to find the blocks. | |
# | |
# For qr/(?{...})/ without interpolation, the CV is under $qr->qr_anoncv | |
# and the code list (list of blocks and constants, maybe vars) is under | |
# $cv->ROOT->first->code_list: | |
# ./perl -Ilib -MB -e 'use O "Concise", B::svref_2object(sub {qr/(?{die})/})->ROOT->first->first->sibling->pmregexp->qr_anoncv->object_2svref' | |
# | |
# For qr/$a(?{...})/ with interpolation, the code list is more accessible, | |
# under $pmop->code_list, but the $cv is something you have to dig for in | |
# the regcomp op’s kids: | |
# ./perl -Ilib -mO=Concise -e 'qr/$a(?{die})/' | |
# | |
# For m// and split //, things are much simpler. There is no CV. The code | |
# list is under $pmop->code_list. | |
sub matchop { | |
my $self = shift; | |
my($op, $cx, $name, $delim) = @_; | |
my $kid = $op->first; | |
my ($binop, $var, $re) = ("", "", ""); | |
if ($op->name ne 'split' && $op->flags & OPf_STACKED) { | |
$binop = 1; | |
$var = $self->deparse($kid, 20); | |
$kid = $kid->sibling; | |
} | |
# not $name; $name will be 'm' for both match and split | |
elsif ($op->name eq 'match' and my $targ = $op->targ) { | |
$binop = 1; | |
$var = $self->padname($targ); | |
} | |
my $quote = 1; | |
my $pmflags = $op->pmflags; | |
my $rhs_bound_to_defsv; | |
my ($cv, $bregexp); | |
my $have_kid = !null $kid; | |
# Check for code blocks first | |
if (not null my $code_list = $op->code_list) { | |
$re = $self->code_list($code_list, | |
$op->name eq 'qr' | |
? $self->padval( | |
$kid->first # ex-list | |
->first # pushmark | |
->sibling # entersub | |
->first # ex-list | |
->first # pushmark | |
->sibling # srefgen | |
->first # ex-list | |
->first # anoncode | |
->targ | |
) | |
: undef); | |
} elsif (${$bregexp = $op->pmregexp} && ${$cv = $bregexp->qr_anoncv}) { | |
my $patop = $cv->ROOT # leavesub | |
->first # qr | |
->code_list;# list | |
$re = $self->code_list($patop, $cv); | |
} elsif (!$have_kid) { | |
$re = re_uninterp(escape_re(re_unback($op->precomp))); | |
} elsif ($kid->name ne 'regcomp') { | |
if ($op->name eq 'split') { | |
# split has other kids, not just regcomp | |
$re = re_uninterp(escape_re(re_unback($op->precomp))); | |
} | |
else { | |
carp("found ".$kid->name." where regcomp expected"); | |
} | |
} else { | |
($re, $quote) = $self->regcomp($kid, 21); | |
} | |
if ($have_kid and $kid->name eq 'regcomp') { | |
my $matchop = $kid->first; | |
if ($matchop->name eq 'regcreset') { | |
$matchop = $matchop->first; | |
} | |
if ($matchop->name =~ /^(?:match|transr?|subst)\z/ | |
&& $matchop->flags & OPf_SPECIAL) { | |
$rhs_bound_to_defsv = 1; | |
} | |
} | |
my $flags = ""; | |
$flags .= "c" if $pmflags & PMf_CONTINUE; | |
$flags .= $self->re_flags($op); | |
$flags = join '', sort split //, $flags; | |
$flags = $matchwords{$flags} if $matchwords{$flags}; | |
if ($pmflags & PMf_ONCE) { # only one kind of delimiter works here | |
$re =~ s/\?/\\?/g; | |
$re = $self->keyword("m") . "?$re?"; # explicit 'm' is required | |
} elsif ($quote) { | |
$re = single_delim($name, $delim, $re, $self); | |
} | |
$re = $re . $flags if $quote; | |
if ($binop) { | |
return | |
$self->maybe_parens( | |
$rhs_bound_to_defsv | |
? "$var =~ (\$_ =~ $re)" | |
: "$var =~ $re", | |
$cx, 20 | |
); | |
} else { | |
return $re; | |
} | |
} | |
sub pp_match { matchop(@_, "m", "/") } | |
sub pp_qr { matchop(@_, "qr", "") } | |
sub pp_runcv { unop(@_, "__SUB__"); } | |
sub pp_split { | |
my $self = shift; | |
my($op, $cx) = @_; | |
my($kid, @exprs, $ary, $expr); | |
my $stacked = $op->flags & OPf_STACKED; | |
$kid = $op->first; | |
$kid = $kid->sibling if $kid->name eq 'regcomp'; | |
for (; !null($kid); $kid = $kid->sibling) { | |
push @exprs, $self->deparse($kid, 6); | |
} | |
unshift @exprs, $self->matchop($op, $cx, "m", "/"); | |
if ($op->private & OPpSPLIT_ASSIGN) { | |
# With C<@array = split(/pat/, str);>, | |
# array is stored in split's pmreplroot; either | |
# as an integer index into the pad (for a lexical array) | |
# or as GV for a package array (which will be a pad index | |
# on threaded builds) | |
# With my/our @array = split(/pat/, str), the array is instead | |
# accessed via an extra padav/rv2av op at the end of the | |
# split's kid ops. | |
if ($stacked) { | |
$ary = pop @exprs; | |
} | |
else { | |
if ($op->private & OPpSPLIT_LEX) { | |
$ary = $self->padname($op->pmreplroot); | |
} | |
else { | |
# union with op_pmtargetoff, op_pmtargetgv | |
my $gv = $op->pmreplroot; | |
$gv = $self->padval($gv) if !ref($gv); | |
$ary = $self->maybe_local(@_, | |
$self->stash_variable('@', | |
$self->gv_name($gv), | |
$cx)) | |
} | |
if ($op->private & OPpLVAL_INTRO) { | |
$ary = $op->private & OPpSPLIT_LEX ? "my $ary" : "local $ary"; | |
} | |
} | |
} | |
# handle special case of split(), and split(' ') that compiles to /\s+/ | |
$exprs[0] = q{' '} if ($op->reflags // 0) & RXf_SKIPWHITE(); | |
$expr = "split(" . join(", ", @exprs) . ")"; | |
if ($ary) { | |
return $self->maybe_parens("$ary = $expr", $cx, 7); | |
} else { | |
return $expr; | |
} | |
} | |
# oxime -- any of various compounds obtained chiefly by the action of | |
# hydroxylamine on aldehydes and ketones and characterized by the | |
# bivalent grouping C=NOH [Webster's Tenth] | |
my %substwords; | |
map($substwords{join "", sort split //, $_} = $_, 'ego', 'egoism', 'em', | |
'es', 'ex', 'exes', 'gee', 'go', 'goes', 'ie', 'ism', 'iso', 'me', | |
'meese', 'meso', 'mig', 'mix', 'os', 'ox', 'oxime', 'see', 'seem', | |
'seg', 'sex', 'sig', 'six', 'smog', 'sog', 'some', 'xi', 'rogue', | |
'sir', 'rise', 'smore', 'more', 'seer', 'rome', 'gore', 'grim', 'grime', | |
'or', 'rose', 'rosie'); | |
sub pp_subst { | |
my $self = shift; | |
my($op, $cx) = @_; | |
my $kid = $op->first; | |
my($binop, $var, $re, $repl) = ("", "", "", ""); | |
if ($op->flags & OPf_STACKED) { | |
$binop = 1; | |
$var = $self->deparse($kid, 20); | |
$kid = $kid->sibling; | |
} | |
elsif (my $targ = $op->targ) { | |
$binop = 1; | |
$var = $self->padname($targ); | |
} | |
my $flags = ""; | |
my $pmflags = $op->pmflags; | |
if (null($op->pmreplroot)) { | |
$repl = $kid; | |
$kid = $kid->sibling; | |
} else { | |
$repl = $op->pmreplroot->first; # skip substcont | |
} | |
while ($repl->name eq "entereval") { | |
$repl = $repl->first; | |
$flags .= "e"; | |
} | |
{ | |
local $self->{in_subst_repl} = 1; | |
if ($pmflags & PMf_EVAL) { | |
$repl = $self->deparse($repl->first, 0); | |
} else { | |
$repl = $self->dq($repl); | |
} | |
} | |
if (not null my $code_list = $op->code_list) { | |
$re = $self->code_list($code_list); | |
} elsif (null $kid) { | |
$re = re_uninterp(escape_re(re_unback($op->precomp))); | |
} else { | |
($re) = $self->regcomp($kid, 1); | |
} | |
$flags .= "r" if $pmflags & PMf_NONDESTRUCT; | |
$flags .= "e" if $pmflags & PMf_EVAL; | |
$flags .= $self->re_flags($op); | |
$flags = join '', sort split //, $flags; | |
$flags = $substwords{$flags} if $substwords{$flags}; | |
my $core_s = $self->keyword("s"); # maybe CORE::s | |
if ($binop) { | |
return $self->maybe_parens("$var =~ $core_s" | |
. double_delim($re, $repl) . $flags, | |
$cx, 20); | |
} else { | |
return "$core_s". double_delim($re, $repl) . $flags; | |
} | |
} | |
sub is_lexical_subs { | |
my (@ops) = shift; | |
for my $op (@ops) { | |
return 0 if $op->name !~ /\A(?:introcv|clonecv)\z/; | |
} | |
return 1; | |
} | |
# Pretend these two ops do not exist. The perl parser adds them to the | |
# beginning of any block containing my-sub declarations, whereas we handle | |
# the subs in pad_subs and next_todo. | |
*pp_clonecv = *pp_introcv; | |
sub pp_introcv { | |
my $self = shift; | |
my($op, $cx) = @_; | |
# For now, deparsing doesn't worry about the distinction between introcv | |
# and clonecv, so pretend this op doesn't exist: | |
return ''; | |
} | |
sub pp_padcv { | |
my $self = shift; | |
my($op, $cx) = @_; | |
return $self->padany($op); | |
} | |
my %lvref_funnies = ( | |
OPpLVREF_SV, => '$', | |
OPpLVREF_AV, => '@', | |
OPpLVREF_HV, => '%', | |
OPpLVREF_CV, => '&', | |
); | |
sub pp_refassign { | |
my ($self, $op, $cx) = @_; | |
my $left; | |
if ($op->private & OPpLVREF_ELEM) { | |
$left = $op->first->sibling; | |
$left = maybe_local(@_, elem($self, $left, undef, | |
$left->targ == OP_AELEM | |
? qw([ ] padav) | |
: qw({ } padhv))); | |
} elsif ($op->flags & OPf_STACKED) { | |
$left = maybe_local(@_, | |
$lvref_funnies{$op->private & OPpLVREF_TYPE} | |
. $self->deparse($op->first->sibling)); | |
} else { | |
$left = &pp_padsv; | |
} | |
my $right = $self->deparse_binop_right($op, $op->first, 7); | |
return $self->maybe_parens("\\$left = $right", $cx, 7); | |
} | |
sub pp_lvref { | |
my ($self, $op, $cx) = @_; | |
my $code; | |
if ($op->private & OPpLVREF_ELEM) { | |
$code = $op->first->name =~ /av\z/ ? &pp_aelem : &pp_helem; | |
} elsif ($op->flags & OPf_STACKED) { | |
$code = maybe_local(@_, | |
$lvref_funnies{$op->private & OPpLVREF_TYPE} | |
. $self->deparse($op->first)); | |
} else { | |
$code = &pp_padsv; | |
} | |
"\\$code"; | |
} | |
sub pp_lvrefslice { | |
my ($self, $op, $cx) = @_; | |
'\\' . ($op->last->name =~ /av\z/ ? &pp_aslice : &pp_hslice); | |
} | |
sub pp_lvavref { | |
my ($self, $op, $cx) = @_; | |
'\\(' . ($op->flags & OPf_STACKED | |
? maybe_local(@_, rv2x(@_, "\@")) | |
: &pp_padsv) . ')' | |
} | |
sub pp_argcheck { | |
my $self = shift; | |
my($op, $cx) = @_; | |
my ($params, $opt_params, $slurpy) = $op->aux_list($self->{curcv}); | |
my $mandatory = $params - $opt_params; | |
my $check = ''; | |
$check .= <<EOF if !$slurpy; | |
die sprintf("Too many arguments for subroutine at %s line %d.\\n", (caller)[1, 2]) unless \@_ <= $params; | |
EOF | |
$check .= <<EOF if $mandatory > 0; | |
die sprintf("Too few arguments for subroutine at %s line %d.\\n", (caller)[1, 2]) unless \@_ >= $mandatory; | |
EOF | |
my $cond = ($params & 1) ? 'unless' : 'if'; | |
$check .= <<EOF if $slurpy eq '%'; | |
die sprintf("Odd name/value argument for subroutine at %s line %d.\\n", (caller)[1, 2]) if \@_ > $params && ((\@_ - $params) & 1); | |
EOF | |
$check =~ s/;\n\z//; | |
return $check; | |
} | |
sub pp_argelem { | |
my $self = shift; | |
my($op, $cx) = @_; | |
my $var = $self->padname($op->targ); | |
my $ix = $op->string($self->{curcv}); | |
my $expr; | |
if ($op->flags & OPf_KIDS) { | |
$expr = $self->deparse($op->first, 7); | |
} | |
elsif ($var =~ /^[@%]/) { | |
$expr = $ix ? "\@_[$ix .. \$#_]" : '@_'; | |
} | |
else { | |
$expr = "\$_[$ix]"; | |
} | |
return "my $var = $expr"; | |
} | |
sub pp_argdefelem { | |
my $self = shift; | |
my($op, $cx) = @_; | |
my $ix = $op->targ; | |
my $expr = "\@_ >= " . ($ix+1) . " ? \$_[$ix] : "; | |
my $def = $self->deparse($op->first, 7); | |
$def = "($def)" if $op->first->flags & OPf_PARENS; | |
$expr .= $self->deparse($op->first, $cx); | |
return $expr; | |
} | |
1; | |
__END__ | |
=head1 NAME | |
B::Deparse - Perl compiler backend to produce perl code | |
=head1 SYNOPSIS | |
B<perl> B<-MO=Deparse>[B<,-d>][B<,-f>I<FILE>][B<,-p>][B<,-q>][B<,-l>] | |
[B<,-s>I<LETTERS>][B<,-x>I<LEVEL>] I<prog.pl> | |
=head1 DESCRIPTION | |
B::Deparse is a backend module for the Perl compiler that generates | |
perl source code, based on the internal compiled structure that perl | |
itself creates after parsing a program. The output of B::Deparse won't | |
be exactly the same as the original source, since perl doesn't keep | |
track of comments or whitespace, and there isn't a one-to-one | |
correspondence between perl's syntactical constructions and their | |
compiled form, but it will often be close. When you use the B<-p> | |
option, the output also includes parentheses even when they are not | |
required by precedence, which can make it easy to see if perl is | |
parsing your expressions the way you intended. | |
While B::Deparse goes to some lengths to try to figure out what your | |
original program was doing, some parts of the language can still trip | |
it up; it still fails even on some parts of Perl's own test suite. If | |
you encounter a failure other than the most common ones described in | |
the BUGS section below, you can help contribute to B::Deparse's | |
ongoing development by submitting a bug report with a small | |
example. | |
=head1 OPTIONS | |
As with all compiler backend options, these must follow directly after | |
the '-MO=Deparse', separated by a comma but not any white space. | |
=over 4 | |
=item B<-d> | |
Output data values (when they appear as constants) using Data::Dumper. | |
Without this option, B::Deparse will use some simple routines of its | |
own for the same purpose. Currently, Data::Dumper is better for some | |
kinds of data (such as complex structures with sharing and | |
self-reference) while the built-in routines are better for others | |
(such as odd floating-point values). | |
=item B<-f>I<FILE> | |
Normally, B::Deparse deparses the main code of a program, and all the subs | |
defined in the same file. To include subs defined in | |
other files, pass the B<-f> option with the filename. | |
You can pass the B<-f> option several times, to | |
include more than one secondary file. (Most of the time you don't want to | |
use it at all.) You can also use this option to include subs which are | |
defined in the scope of a B<#line> directive with two parameters. | |
=item B<-l> | |
Add '#line' declarations to the output based on the line and file | |
locations of the original code. | |
=item B<-p> | |
Print extra parentheses. Without this option, B::Deparse includes | |
parentheses in its output only when they are needed, based on the | |
structure of your program. With B<-p>, it uses parentheses (almost) | |
whenever they would be legal. This can be useful if you are used to | |
LISP, or if you want to see how perl parses your input. If you say | |
if ($var & 0x7f == 65) {print "Gimme an A!"} | |
print ($which ? $a : $b), "\n"; | |
$name = $ENV{USER} or "Bob"; | |
C<B::Deparse,-p> will print | |
if (($var & 0)) { | |
print('Gimme an A!') | |
}; | |
(print(($which ? $a : $b)), '???'); | |
(($name = $ENV{'USER'}) or '???') | |
which probably isn't what you intended (the C<'???'> is a sign that | |
perl optimized away a constant value). | |
=item B<-P> | |
Disable prototype checking. With this option, all function calls are | |
deparsed as if no prototype was defined for them. In other words, | |
perl -MO=Deparse,-P -e 'sub foo (\@) { 1 } foo @x' | |
will print | |
sub foo (\@) { | |
1; | |
} | |
&foo(\@x); | |
making clear how the parameters are actually passed to C<foo>. | |
=item B<-q> | |
Expand double-quoted strings into the corresponding combinations of | |
concatenation, uc, ucfirst, lc, lcfirst, quotemeta, and join. For | |
instance, print | |
print "Hello, $world, @ladies, \u$gentlemen\E, \u\L$me!"; | |
as | |
print 'Hello, ' . $world . ', ' . join($", @ladies) . ', ' | |
. ucfirst($gentlemen) . ', ' . ucfirst(lc $me . '!'); | |
Note that the expanded form represents the way perl handles such | |
constructions internally -- this option actually turns off the reverse | |
translation that B::Deparse usually does. On the other hand, note that | |
C<$x = "$y"> is not the same as C<$x = $y>: the former makes the value | |
of $y into a string before doing the assignment. | |
=item B<-s>I<LETTERS> | |
Tweak the style of B::Deparse's output. The letters should follow | |
directly after the 's', with no space or punctuation. The following | |
options are available: | |
=over 4 | |
=item B<C> | |
Cuddle C<elsif>, C<else>, and C<continue> blocks. For example, print | |
if (...) { | |
... | |
} else { | |
... | |
} | |
instead of | |
if (...) { | |
... | |
} | |
else { | |
... | |
} | |
The default is not to cuddle. | |
=item B<i>I<NUMBER> | |
Indent lines by multiples of I<NUMBER> columns. The default is 4 columns. | |
=item B<T> | |
Use tabs for each 8 columns of indent. The default is to use only spaces. | |
For instance, if the style options are B<-si4T>, a line that's indented | |
3 times will be preceded by one tab and four spaces; if the options were | |
B<-si8T>, the same line would be preceded by three tabs. | |
=item B<v>I<STRING>B<.> | |
Print I<STRING> for the value of a constant that can't be determined | |
because it was optimized away (mnemonic: this happens when a constant | |
is used in B<v>oid context). The end of the string is marked by a period. | |
The string should be a valid perl expression, generally a constant. | |
Note that unless it's a number, it probably needs to be quoted, and on | |
a command line quotes need to be protected from the shell. Some | |
conventional values include 0, 1, 42, '', 'foo', and | |
'Useless use of constant omitted' (which may need to be | |
B<-sv"'Useless use of constant omitted'."> | |
or something similar depending on your shell). The default is '???'. | |
If you're using B::Deparse on a module or other file that's require'd, | |
you shouldn't use a value that evaluates to false, since the customary | |
true constant at the end of a module will be in void context when the | |
file is compiled as a main program. | |
=back | |
=item B<-x>I<LEVEL> | |
Expand conventional syntax constructions into equivalent ones that expose | |
their internal operation. I<LEVEL> should be a digit, with higher values | |
meaning more expansion. As with B<-q>, this actually involves turning off | |
special cases in B::Deparse's normal operations. | |
If I<LEVEL> is at least 3, C<for> loops will be translated into equivalent | |
while loops with continue blocks; for instance | |
for ($i = 0; $i < 10; ++$i) { | |
print $i; | |
} | |
turns into | |
$i = 0; | |
while ($i < 10) { | |
print $i; | |
} continue { | |
++$i | |
} | |
Note that in a few cases this translation can't be perfectly carried back | |
into the source code -- if the loop's initializer declares a my variable, | |
for instance, it won't have the correct scope outside of the loop. | |
If I<LEVEL> is at least 5, C<use> declarations will be translated into | |
C<BEGIN> blocks containing calls to C<require> and C<import>; for | |
instance, | |
use strict 'refs'; | |
turns into | |
sub BEGIN { | |
require strict; | |
do { | |
'strict'->import('refs') | |
}; | |
} | |
If I<LEVEL> is at least 7, C<if> statements will be translated into | |
equivalent expressions using C<&&>, C<?:> and C<do {}>; for instance | |
print 'hi' if $nice; | |
if ($nice) { | |
print 'hi'; | |
} | |
if ($nice) { | |
print 'hi'; | |
} else { | |
print 'bye'; | |
} | |
turns into | |
$nice and print 'hi'; | |
$nice and do { print 'hi' }; | |
$nice ? do { print 'hi' } : do { print 'bye' }; | |
Long sequences of elsifs will turn into nested ternary operators, which | |
B::Deparse doesn't know how to indent nicely. | |
=back | |
=head1 USING B::Deparse AS A MODULE | |
=head2 Synopsis | |
use B::Deparse; | |
$deparse = B::Deparse->new("-p", "-sC"); | |
$body = $deparse->coderef2text(\&func); | |
eval "sub func $body"; # the inverse operation | |
=head2 Description | |
B::Deparse can also be used on a sub-by-sub basis from other perl | |
programs. | |
=head2 new | |
$deparse = B::Deparse->new(OPTIONS) | |
Create an object to store the state of a deparsing operation and any | |
options. The options are the same as those that can be given on the | |
command line (see L</OPTIONS>); options that are separated by commas | |
after B<-MO=Deparse> should be given as separate strings. | |
=head2 ambient_pragmas | |
$deparse->ambient_pragmas(strict => 'all', '$[' => $[); | |
The compilation of a subroutine can be affected by a few compiler | |
directives, B<pragmas>. These are: | |
=over 4 | |
=item * | |
use strict; | |
=item * | |
use warnings; | |
=item * | |
Assigning to the special variable $[ | |
=item * | |
use integer; | |
=item * | |
use bytes; | |
=item * | |
use utf8; | |
=item * | |
use re; | |
=back | |
Ordinarily, if you use B::Deparse on a subroutine which has | |
been compiled in the presence of one or more of these pragmas, | |
the output will include statements to turn on the appropriate | |
directives. So if you then compile the code returned by coderef2text, | |
it will behave the same way as the subroutine which you deparsed. | |
However, you may know that you intend to use the results in a | |
particular context, where some pragmas are already in scope. In | |
this case, you use the B<ambient_pragmas> method to describe the | |
assumptions you wish to make. | |
Not all of the options currently have any useful effect. See | |
L</BUGS> for more details. | |
The parameters it accepts are: | |
=over 4 | |
=item strict | |
Takes a string, possibly containing several values separated | |
by whitespace. The special values "all" and "none" mean what you'd | |
expect. | |
$deparse->ambient_pragmas(strict => 'subs refs'); | |
=item $[ | |
Takes a number, the value of the array base $[. | |
Obsolete: cannot be non-zero. | |
=item bytes | |
=item utf8 | |
=item integer | |
If the value is true, then the appropriate pragma is assumed to | |
be in the ambient scope, otherwise not. | |
=item re | |
Takes a string, possibly containing a whitespace-separated list of | |
values. The values "all" and "none" are special. It's also permissible | |
to pass an array reference here. | |
$deparser->ambient_pragmas(re => 'eval'); | |
=item warnings | |
Takes a string, possibly containing a whitespace-separated list of | |
values. The values "all" and "none" are special, again. It's also | |
permissible to pass an array reference here. | |
$deparser->ambient_pragmas(warnings => [qw[void io]]); | |
If one of the values is the string "FATAL", then all the warnings | |
in that list will be considered fatal, just as with the B<warnings> | |
pragma itself. Should you need to specify that some warnings are | |
fatal, and others are merely enabled, you can pass the B<warnings> | |
parameter twice: | |
$deparser->ambient_pragmas( | |
warnings => 'all', | |
warnings => [FATAL => qw/void io/], | |
); | |
See L<warnings> for more information about lexical warnings. | |
=item hint_bits | |
=item warning_bits | |
These two parameters are used to specify the ambient pragmas in | |
the format used by the special variables $^H and ${^WARNING_BITS}. | |
They exist principally so that you can write code like: | |
{ my ($hint_bits, $warning_bits); | |
BEGIN {($hint_bits, $warning_bits) = ($^H, ${^WARNING_BITS})} | |
$deparser->ambient_pragmas ( | |
hint_bits => $hint_bits, | |
warning_bits => $warning_bits, | |
'$[' => 0 + $[ | |
); } | |
which specifies that the ambient pragmas are exactly those which | |
are in scope at the point of calling. | |
=item %^H | |
This parameter is used to specify the ambient pragmas which are | |
stored in the special hash %^H. | |
=back | |
=head2 coderef2text | |
$body = $deparse->coderef2text(\&func) | |
$body = $deparse->coderef2text(sub ($$) { ... }) | |
Return source code for the body of a subroutine (a block, optionally | |
preceded by a prototype in parens), given a reference to the | |
sub. Because a subroutine can have no names, or more than one name, | |
this method doesn't return a complete subroutine definition -- if you | |
want to eval the result, you should prepend "sub subname ", or "sub " | |
for an anonymous function constructor. Unless the sub was defined in | |
the main:: package, the code will include a package declaration. | |
=head1 BUGS | |
=over 4 | |
=item * | |
The only pragmas to | |
be completely supported are: C<use warnings>, | |
C<use strict>, C<use bytes>, C<use integer> | |
and C<use feature>. | |
Excepting those listed above, we're currently unable to guarantee that | |
B::Deparse will produce a pragma at the correct point in the program. | |
(Specifically, pragmas at the beginning of a block often appear right | |
before the start of the block instead.) | |
Since the effects of pragmas are often lexically scoped, this can mean | |
that the pragma holds sway over a different portion of the program | |
than in the input file. | |
=item * | |
In fact, the above is a specific instance of a more general problem: | |
we can't guarantee to produce BEGIN blocks or C<use> declarations in | |
exactly the right place. So if you use a module which affects compilation | |
(such as by over-riding keywords, overloading constants or whatever) | |
then the output code might not work as intended. | |
=item * | |
Some constants don't print correctly either with or without B<-d>. | |
For instance, neither B::Deparse nor Data::Dumper know how to print | |
dual-valued scalars correctly, as in: | |
use constant E2BIG => ($!=7); $y = E2BIG; print $y, 0+$y; | |
use constant H => { "#" => 1 }; H->{"#"}; | |
=item * | |
An input file that uses source filtering probably won't be deparsed into | |
runnable code, because it will still include the B<use> declaration | |
for the source filtering module, even though the code that is | |
produced is already ordinary Perl which shouldn't be filtered again. | |
=item * | |
Optimized-away statements are rendered as | |
'???'. This includes statements that | |
have a compile-time side-effect, such as the obscure | |
my $x if 0; | |
which is not, consequently, deparsed correctly. | |
foreach my $i (@_) { 0 } | |
=> | |
foreach my $i (@_) { '???' } | |
=item * | |
Lexical (my) variables declared in scopes external to a subroutine | |
appear in coderef2text output text as package variables. This is a tricky | |
problem, as perl has no native facility for referring to a lexical variable | |
defined within a different scope, although L<PadWalker> is a good start. | |
See also L<Data::Dump::Streamer>, which combines B::Deparse and | |
L<PadWalker> to serialize closures properly. | |
=item * | |
There are probably many more bugs on non-ASCII platforms (EBCDIC). | |
=back | |
=head1 AUTHOR | |
Stephen McCamant <[email protected]>, based on an earlier version | |
by Malcolm Beattie <[email protected]>, with contributions from | |
Gisle Aas, James Duncan, Albert Dvornik, Robin Houston, Dave Mitchell, | |
Hugo van der Sanden, Gurusamy Sarathy, Nick Ing-Simmons, and Rafael | |
Garcia-Suarez. | |
=cut | |