Re: Named-capture regex syntax
[p5sagit/p5-mst-13.2.git] / lib / SelfLoader.pm
CommitLineData
package SelfLoader;

# Exporter provides the export() method used to install AUTOLOAD into
# client packages.
require Exporter;
@ISA    = ('Exporter');
@EXPORT = ('AUTOLOAD');

$VERSION = "1.10";
$DEBUG   = 0;       # set to a true value to get diagnostics on STDERR

# Return the version string of this module.
sub Version { return $VERSION }
8
# Private cache shared by all of SelfLoader's client packages.  It holds the
# source text of each sub still waiting to be compiled, plus a
# "<package>::<DATA" marker for every package whose data has been scanned.
my %Cache;

# Patterns used to check for a valid ': attrlist' attachment on a sub.
# (These are 'our' variables rather than 'my' ones, due to the rather complex
# and buggy behaviour of lexicals with qr// and (??{$lex}).)
our ($nested, $one_attr, $attr_list);

# A balanced, possibly nested, parenthesised group.
$nested = qr{ \( (?: (?> [^()]+ ) | (??{ $nested }) )* \) }x;

# One attribute (optionally with a parenthesised argument) and the separator
# that follows it.
$one_attr = qr{ (?> (?! \d) \w+ (?:$nested)? ) (?:\s*\:\s*|\s+(?!\:)) }x;

# A colon followed by any number of attributes.
$attr_list = qr{ \s* : \s* (?: $one_attr )* }x;
09bef843 18
# croak and carp load Carp on first use.  The "require Carp;" runs inside a
# block with a localized $@ so that the caller's $@ is protected (RT #40216).
# Control then passes to the real Carp routine via goto, keeping @_ intact.

sub croak {
    {
        local $@;
        require Carp;
    }
    goto &Carp::croak;
}

sub carp {
    {
        local $@;
        require Carp;
    }
    goto &Carp::carp;
}
e3d0cac0 23
# Called by perl for any sub that is not yet defined in a package that has
# this AUTOLOAD.  Looks up the cached source for $AUTOLOAD, compiles it, and
# jumps to the freshly defined sub with the original arguments.
#
# The source is compiled with a string eval inside this sub, so it can see
# the lexicals declared here; $SL_code and $save therefore keep their
# original names.
sub AUTOLOAD {
    print STDERR "SelfLoader::AUTOLOAD for $AUTOLOAD\n" if $DEBUG;

    my $SL_code = $Cache{$AUTOLOAD};
    my $save = $@; # evals in both AUTOLOAD and _load_stubs can corrupt $@

    if (!$SL_code) {
        # Maybe this pack had stubs before __DATA__, and never initialized.
        # Or, this may be an automatic DESTROY method call when none exists.
        $AUTOLOAD =~ m/^(.*)::/;
        if (!exists $Cache{"${1}::<DATA"}) {
            SelfLoader->_load_stubs($1);
        }
        $SL_code = $Cache{$AUTOLOAD};

        # An implicit DESTROY with no definition gets an empty body.
        if (!$SL_code and $AUTOLOAD =~ m/::DESTROY$/) {
            $SL_code = "sub $AUTOLOAD { }";
        }
        if (!$SL_code) {
            croak "Undefined subroutine $AUTOLOAD";
        }
    }
    print STDERR "SelfLoader::AUTOLOAD eval: $SL_code\n" if $DEBUG;

    eval $SL_code;
    if ($@) {
        # Drop the " at ... line N" suffix before re-reporting via croak.
        $@ =~ s/ at .*\n//;
        croak $@;
    }
    $@ = $save;

    die "SelfLoader inconsistency error" unless defined(&$AUTOLOAD);

    # The sub is compiled now, so its source text is no longer needed.
    delete $Cache{$AUTOLOAD};
    goto &$AUTOLOAD;
}
50
# Public entry point: load the stubs for the package that called us.
sub load_stubs {
    my $self = shift;
    return $self->_load_stubs((caller)[0]);
}
52
# Scan the __DATA__ section of $callpack: cache the source of every sub
# declared there and forward-declare each one, so that AUTOLOAD can compile
# the real body the first time the sub is called.
#
# Arguments:
#   $self     - invocant; _add_to_cache, _package_defined and export are
#               called as methods on it
#   $callpack - name of the package whose DATA filehandle is read
#   $endlines - optional array ref; when given, and the section is ended by an
#               __END__ that is not followed by DATA, it receives all the
#               remaining lines (used by Devel::SelfStubber)
#
# Croaks if the package has no open DATA handle or the handle cannot be
# duplicated.  Dies if closing a handle fails, or if the section names a
# package that already has an AUTOLOAD other than SelfLoader's.
sub _load_stubs {
    # $endlines is used by Devel::SelfStubber to capture lines after __END__
    my($self, $callpack, $endlines) = @_;
    my $fh = \*{"${callpack}::DATA"};
    my $currpack = $callpack;
    my($line, $name, @lines, @stubs, $prototype);

    print STDERR "SelfLoader::load_stubs($callpack)\n" if $DEBUG;
    croak("$callpack doesn't contain an __DATA__ token")
        unless defined fileno($fh);
    # Protect: fork() shares the file pointer between the parent and the kid
    open my $nfh, '<&', $fh or croak "reopen: $!";  # dup() the fd
    close $fh or die "close: $!";                   # autocloses, but be paranoid
    open $fh, '<&', $nfh or croak "reopen2: $!";    # dup() the fd "back"
    close $nfh or die "close after reopen: $!";     # autocloses, but be paranoid
    $Cache{"${currpack}::<DATA"} = 1;   # indicate package is cached

    local($/) = "\n";
    while(defined($line = <$fh>) and $line !~ m/^__END__/) {
        if ($line =~ m/^sub\s+([\w:]+)\s*((?:\([\\\$\@\%\&\*\;]*\))?(?:$attr_list)?)/) {
            # A new sub starts here: hand over the lines collected for the
            # previous one before starting a fresh collection.
            push(@stubs, $self->_add_to_cache($name, $currpack, \@lines, $prototype));
            $prototype = $2;
            @lines = ($line);
            if (index($1,'::') == -1) {         # simple sub name
                $name = "${currpack}::$1";
            } else {                            # sub name with package
                $name = $1;
                $name =~ m/^(.*)::/;
                if (defined(&{"${1}::AUTOLOAD"})) {
                    \&{"${1}::AUTOLOAD"} == \&SelfLoader::AUTOLOAD ||
                        die 'SelfLoader Error: attempt to specify Selfloading',
                            " sub $name in non-selfloading module $1";
                } else {
                    $self->export($1,'AUTOLOAD');
                }
            }
        } elsif ($line =~ m/^package\s+([\w:]+)/) { # A package declared
            push(@stubs, $self->_add_to_cache($name, $currpack, \@lines, $prototype));
            $self->_package_defined($line);
            $name = '';
            @lines = ();
            $currpack = $1;
            $Cache{"${currpack}::<DATA"} = 1;   # indicate package is cached
            if (defined(&{"${1}::AUTOLOAD"})) {
                \&{"${1}::AUTOLOAD"} == \&SelfLoader::AUTOLOAD ||
                    die 'SelfLoader Error: attempt to specify Selfloading',
                        " package $currpack which already has AUTOLOAD";
            } else {
                $self->export($currpack,'AUTOLOAD');
            }
        } else {
            # Any other line belongs to the sub currently being collected.
            push(@lines,$line);
        }
    }
    if (defined($line) && $line =~ /^__END__/) { # __END__
        # "__END__ DATA" leaves the handle open for the client's own use;
        # a plain __END__ closes it.
        unless ($line =~ /^__END__\s*DATA/) {
            if ($endlines) {
                # Devel::SelfStubber would like us to capture the lines after
                # __END__ so it can write out the entire file
                @$endlines = <$fh>;
            }
            close($fh);
        }
    }
    # Hand over the last sub collected, then declare all the stubs.
    push(@stubs, $self->_add_to_cache($name, $currpack, \@lines, $prototype));
    eval join('', @stubs) if @stubs;
}
120
121
# Store the source of one sub in the cache and return its forward
# declaration.
#
# Arguments:
#   $self     - invocant (not used here)
#   $fullname - fully qualified sub name; when false nothing is cached
#   $pack     - package the source is to be compiled in
#   $lines    - array ref of source lines making up the sub
#   $proto    - text to follow the name in the stub, or undef for none
#
# Returns the stub declaration string to be eval'd, or an empty list when
# $fullname is false.  Warns via carp if the sub was already cached.
sub _add_to_cache {
    my ($self, $fullname, $pack, $lines, $proto) = @_;

    return () unless $fullname;

    if (exists $Cache{$fullname}) {
        carp("Redefining sub $fullname");
    }

    $Cache{$fullname} = join('', "package $pack; ", @$lines);
    print STDERR "SelfLoader cached $fullname: $Cache{$fullname}" if $DEBUG;

    # return stub to be eval'd
    return "sub $fullname $proto;" if defined($proto);
    return "sub $fullname;";
}
132
# Called by _load_stubs with each "package ..." line it reads.  Does nothing
# here.  NOTE(review): presumably a hook for subclasses to override -- confirm.
sub _package_defined {
    return;
}
134
1351;
136__END__
cb1a09d0 137
f8881bd9 138=head1 NAME
139
140SelfLoader - load functions only on demand
141
142=head1 SYNOPSIS
143
144 package FOOBAR;
145 use SelfLoader;
3cb6de81 146
f8881bd9 147 ... (initializing code)
3cb6de81 148
f8881bd9 149 __DATA__
150 sub {....
151
152
153=head1 DESCRIPTION
154
155This module tells its users that functions in the FOOBAR package are to be
463e8aa9 156autoloaded from after the C<__DATA__> token. See also
157L<perlsub/"Autoloading">.
f8881bd9 158
159=head2 The __DATA__ token
160
463e8aa9 161The C<__DATA__> token tells the perl compiler that the perl code
162for compilation is finished. Everything after the C<__DATA__> token
f8881bd9 163is available for reading via the filehandle FOOBAR::DATA,
463e8aa9 164where FOOBAR is the name of the current package when the C<__DATA__>
165token is reached. This works just the same as C<__END__> does in
166package 'main', but for other modules data after C<__END__> is not
f610777f 167automatically retrievable, whereas data after C<__DATA__> is.
463e8aa9 168The C<__DATA__> token is not recognized in versions of perl prior to
f8881bd9 1695.001m.
170
463e8aa9 171Note that it is possible to have C<__DATA__> tokens in the same package
172in multiple files, and that the last C<__DATA__> token in a given
f8881bd9 173package that is encountered by the compiler is the one accessible
463e8aa9 174by the filehandle. This also applies to C<__END__> and main, i.e. if
175the 'main' program has an C<__END__>, but a module 'require'd (_not_ 'use'd)
176by that program has a 'package main;' declaration followed by an 'C<__DATA__>',
177then the C<DATA> filehandle is set to access the data after the C<__DATA__>
178in the module, _not_ the data after the C<__END__> token in the 'main'
f8881bd9 179program, since the compiler encounters the 'require'd file later.
180
181=head2 SelfLoader autoloading
182
463e8aa9 183The B<SelfLoader> works by the user placing the C<__DATA__>
184token I<after> perl code which needs to be compiled and
185run at 'require' time, but I<before> subroutine declarations
f8881bd9 186that can be loaded in later - usually because they may never
187be called.
188
463e8aa9 189The B<SelfLoader> will read from the FOOBAR::DATA filehandle to
190load in the data after C<__DATA__>, and load in any subroutine
f8881bd9 191when it is called. The costs are the one-time parsing of the
463e8aa9 192data after C<__DATA__>, and a load delay for the _first_
call of any autoloaded function. The benefits (hopefully)
are a faster compilation phase, with no need to load
functions which are never used.
196
463e8aa9 197The B<SelfLoader> will stop reading from C<__DATA__> if
198it encounters the C<__END__> token - just as you would expect.
199If the C<__END__> token is present, and is followed by the
200token DATA, then the B<SelfLoader> leaves the FOOBAR::DATA
f8881bd9 201filehandle open on the line after that token.
202
463e8aa9 203The B<SelfLoader> exports the C<AUTOLOAD> subroutine to the
204package using the B<SelfLoader>, and this loads the called
f8881bd9 205subroutine when it is first called.
206
There is no advantage in putting subroutines after the C<__DATA__> token
if they will _always_ be called.
f8881bd9 209
210=head2 Autoloading and package lexicals
211
212A 'my $pack_lexical' statement makes the variable $pack_lexical
463e8aa9 213local _only_ to the file up to the C<__DATA__> token. Subroutines
declared elsewhere _cannot_ see these types of variables,
just as subroutines declared in the same package but in another
file cannot see them.
217
218So specifically, autoloaded functions cannot see package
463e8aa9 219lexicals (this applies to both the B<SelfLoader> and the Autoloader).
220The C<vars> pragma provides an alternative to defining package-level
221globals that will be visible to autoloaded routines. See the documentation
222on B<vars> in the pragma section of L<perlmod>.
f8881bd9 223
224=head2 SelfLoader and AutoLoader
225
463e8aa9 226The B<SelfLoader> can replace the AutoLoader - just change 'use AutoLoader'
227to 'use SelfLoader' (though note that the B<SelfLoader> exports
f8881bd9 228the AUTOLOAD function - but if you have your own AUTOLOAD and
229are using the AutoLoader too, you probably know what you're doing),
463e8aa9 230and the C<__END__> token to C<__DATA__>. You will need perl version 5.001m
f8881bd9 231or later to use this (version 5.001 with all patches up to patch m).
232
463e8aa9 233There is no need to inherit from the B<SelfLoader>.
f8881bd9 234
463e8aa9 235The B<SelfLoader> works similarly to the AutoLoader, but picks up the
236subs from after the C<__DATA__> instead of in the 'lib/auto' directory.
f610777f 237There is a maintenance gain in not needing to run AutoSplit on the module
f8881bd9 238at installation, and a runtime gain in not needing to keep opening and
239closing files to load subs. There is a runtime loss in needing
463e8aa9 240to parse the code after the C<__DATA__>. Details of the B<AutoLoader> and
241another view of these distinctions can be found in that module's
242documentation.
f8881bd9 243
244=head2 __DATA__, __END__, and the FOOBAR::DATA filehandle.
245
This section is only relevant if you want to use
the C<FOOBAR::DATA> filehandle together with the B<SelfLoader>.
248
249Data after the C<__DATA__> token in a module is read using the
250FOOBAR::DATA filehandle. C<__END__> can still be used to denote the end
251of the C<__DATA__> section if followed by the token DATA - this is supported
252by the B<SelfLoader>. The C<FOOBAR::DATA> filehandle is left open if an
253C<__END__> followed by a DATA is found, with the filehandle positioned at
254the start of the line after the C<__END__> token. If no C<__END__> token is
255present, or an C<__END__> token with no DATA token on the same line, then
256the filehandle is closed.
257
258The B<SelfLoader> reads from wherever the current
259position of the C<FOOBAR::DATA> filehandle is, until the
260EOF or C<__END__>. This means that if you want to use
f8881bd9 261that filehandle (and ONLY if you want to), you should either
262
2631. Put all your subroutine declarations immediately after
463e8aa9 264the C<__DATA__> token and put your own data after those
265declarations, using the C<__END__> token to mark the end
266of subroutine declarations. You must also ensure that the B<SelfLoader>
1fef88e7 267reads first by calling 'SelfLoader-E<gt>load_stubs();', or by using a
f8881bd9 268function which is selfloaded;
269
270or
271
463e8aa9 2722. You should read the C<FOOBAR::DATA> filehandle first, leaving
f8881bd9 273the handle open and positioned at the first line of subroutine
274declarations.
275
276You could conceivably do both.
277
278=head2 Classes and inherited methods.
279
280For modules which are not classes, this section is not relevant.
281This section is only relevant if you have methods which could
282be inherited.
283
284A subroutine stub (or forward declaration) looks like
285
286 sub stub;
287
288i.e. it is a subroutine declaration without the body of the
289subroutine. For modules which are not classes, there is no real
290need for stubs as far as autoloading is concerned.
291
292For modules which ARE classes, and need to handle inherited methods,
293stubs are needed to ensure that the method inheritance mechanism works
294properly. You can load the stubs into the module at 'require' time, by
1fef88e7 295adding the statement 'SelfLoader-E<gt>load_stubs();' to the module to do
f8881bd9 296this.
297
463e8aa9 298The alternative is to put the stubs in before the C<__DATA__> token BEFORE
299releasing the module, and for this purpose the C<Devel::SelfStubber>
f8881bd9 300module is available. However this does require the extra step of ensuring
301that the stubs are in the module. If this is done I strongly recommend
302that this is done BEFORE releasing the module - it should NOT be done
303at install time in general.
304
305=head1 Multiple packages and fully qualified subroutine names
306
307Subroutines in multiple packages within the same file are supported - but you
463e8aa9 308should note that this requires exporting the C<SelfLoader::AUTOLOAD> to
f8881bd9 309every package which requires it. This is done automatically by the
463e8aa9 310B<SelfLoader> when it first loads the subs into the cache, but you should
311really specify it in the initialization before the C<__DATA__> by putting
f8881bd9 312a 'use SelfLoader' statement in each package.
313
314Fully qualified subroutine names are also supported. For example,
315
316 __DATA__
317 sub foo::bar {23}
318 package baz;
319 sub dob {32}
320
463e8aa9 321will all be loaded correctly by the B<SelfLoader>, and the B<SelfLoader>
f8881bd9 322will ensure that the packages 'foo' and 'baz' correctly have the
463e8aa9 323B<SelfLoader> C<AUTOLOAD> method when the data after C<__DATA__> is first
324parsed.
f8881bd9 325
326=cut