Zero entries were skipped, fix from Adrian Goalby
[p5sagit/p5-mst-13.2.git] / lib / AutoSplit.pm
CommitLineData
a0d0e21e 1package AutoSplit;
2
17f410f9 3use 5.005_64;
4e6ea2c3 4use Exporter ();
5use Config qw(%Config);
6use Carp qw(carp);
7use File::Basename ();
68dc0745 8use File::Path qw(mkpath);
0eb04855 9use File::Spec::Functions qw(curdir catfile);
4e6ea2c3 10use strict;
# Package metadata and Exporter configuration.
our $VERSION   = "1.0305";
our @ISA       = qw(Exporter);
our @EXPORT    = qw(&autosplit &autosplit_lib_modules);
our @EXPORT_OK = qw($Verbose $Keep $Maxlen $CheckForAutoloader $CheckModTime);

# Tunable settings that callers may import on request (see @EXPORT_OK).
our($Verbose, $Keep, $Maxlen, $CheckForAutoloader, $CheckModTime);

a0d0e21e 18
f06db76b 19=head1 NAME
20
21AutoSplit - split a package for autoloading
22
cb1a09d0 23=head1 SYNOPSIS
24
4e6ea2c3 25 autosplit($file, $dir, $keep, $check, $modtime);
84dc3c4d 26
4e6ea2c3 27 autosplit_lib_modules(@modules);
cb1a09d0 28
f06db76b 29=head1 DESCRIPTION
30
31This function will split up your program into files that the AutoLoader
21c92a1d 32module can handle. It is used by both the standard perl libraries and by
33the MakeMaker utility, to automatically configure libraries for autoloading.
34
35The C<autosplit> interface splits the specified file into a hierarchy
36rooted at the directory C<$dir>. It creates directories as needed to reflect
37class hierarchy, and creates the file F<autosplit.ix>. This file acts as
38both forward declaration of all package routines, and as timestamp for the
39last update of the hierarchy.
40
4e6ea2c3 41The remaining three arguments to C<autosplit> govern other options to
42the autosplitter.
43
44=over 2
45
46=item $keep
47
48If the third argument, I<$keep>, is false, then any
49pre-existing C<*.al> files in the autoload directory are removed if
50they are no longer part of the module (obsoleted functions).
51$keep defaults to 0.
52
53=item $check
54
55The
56fourth argument, I<$check>, instructs C<autosplit> to check the module
57currently being split to ensure that it does include a C<use>
58specification for the AutoLoader module, and skips the module if
59AutoLoader is not detected.
60$check defaults to 1.
61
62=item $modtime
63
64Lastly, the I<$modtime> argument specifies
65that C<autosplit> is to check the modification time of the module
66against that of the C<autosplit.ix> file, and only split the module if
67it is newer.
68$modtime defaults to 1.
69
70=back
21c92a1d 71
72Typical use of AutoSplit in the perl MakeMaker utility is via the command-line
73with:
74
75 perl -e 'use AutoSplit; autosplit($ARGV[0], $ARGV[1], 0, 1, 1)'
76
77Defined as a Make macro, it is invoked with file and directory arguments;
78C<autosplit> will split the specified file into the specified directory and
79delete obsolete C<.al> files, after checking first that the module does use
80the AutoLoader, and ensuring that the module is not already currently split
81in its current form (the modtime test).
82
83The C<autosplit_lib_modules> form is used in the building of perl. It takes
84as input a list of files (modules) that are assumed to reside in a directory
85B<lib> relative to the current directory. Each file is sent to the
86autosplitter one at a time, to be split into the directory B<lib/auto>.
87
88In both usages of the autosplitter, only subroutines defined following the
4e6ea2c3 89perl I<__END__> token are split out into separate files. Some
21c92a1d 90routines may be placed prior to this marker to force their immediate loading
91and parsing.
92
4e6ea2c3 93=head2 Multiple packages
94
95As of version 1.01 of the AutoSplit module it is possible to have
96multiple packages within a single file. Both of the following cases
97are supported:
98
99 package NAME;
100 __END__
101 sub AAA { ... }
102 package NAME::option1;
103 sub BBB { ... }
104 package NAME::option2;
105 sub BBB { ... }
21c92a1d 106
4e6ea2c3 107 package NAME;
108 __END__
109 sub AAA { ... }
110 sub NAME::option1::BBB { ... }
111 sub NAME::option2::BBB { ... }
21c92a1d 112
113=head1 DIAGNOSTICS
114
4e6ea2c3 115C<AutoSplit> will inform the user if it is necessary to create the
116top-level directory specified in the invocation. It is preferred that
117the script or installation process that invokes C<AutoSplit> have
118created the full directory path ahead of time. This warning may
119indicate that the module is being split into an incorrect path.
21c92a1d 120
C<AutoSplit> will warn the user of all subroutines whose names cause
potential file naming conflicts on machines with drastically limited
(8 characters or fewer) file name length. Since the subroutine name is
used as the file name, these warnings can aid in portability to such
systems.
21c92a1d 126
4e6ea2c3 127Warnings are issued and the file skipped if C<AutoSplit> cannot locate
128either the I<__END__> marker or a "package Name;"-style specification.
21c92a1d 129
4e6ea2c3 130C<AutoSplit> will also emit general diagnostics for inability to
131create directories or files.
f06db76b 132
133=cut
134
# Default values for the tunable package variables.
$Verbose            = 1;   # 0=none, 1=minimal, 2=list .al files
$Keep               = 0;
$CheckForAutoloader = 1;
$CheckModTime       = 1;
# for portability warn about names longer than $Maxlen
$Maxlen             = 8;   # 8 for dos, 11 (14-".al") for SYSVR3

my $Is_VMS    = ($^O eq 'VMS');
my $IndexFile = "autosplit.ix";   # file also serves as timestamp

# Longest file name we may create: 255 when the platform reports flexible
# file names, otherwise 14; a loaded Dos::UseLFN overrides both.
my $maxflen = ($Config{'d_flexfnam'} ne 'define') ? 14 : 255;
$maxflen = (Dos::UseLFN() ? 255 : 11) if defined (&Dos::UseLFN);

# allow checking for valid ': attrlist' attachments
# $nested must be declared before the qr// so the deferred (??{ ... })
# sub-pattern can refer to it recursively (balanced parentheses).
my $nested;
$nested = qr{ \( (?: (?> [^()]+ ) | (??{ $nested }) )* \) }x;
# One attribute: an identifier with an optional parenthesised argument,
# followed by either a ':' separator or trailing whitespace.
my $one_attr = qr{ (?> (?! \d) \w+ (?:$nested)? ) (?:\s*\:\s*|\s+(?!\:)) }x;
# A leading ':' followed by any number of attributes.
my $attr_list = qr{ \s* : \s* (?: $one_attr )* }x;
155
156
3edbfbe5 157
# autosplit($file, $autodir, $keep, $ckal, $ckmt)
#
# Public entry point: split one module file.
#   $file    - the perl source file to be split (after __END__)
#   $autodir - the ".../auto" dir below which to write split subs
#   $keep, $ckal, $ckmt - optional flags; any that is undefined falls back
#       to $Keep, $CheckForAutoloader and $CheckModTime respectively.
# Returns whatever autosplit_file() returns.
sub autosplit{
    my($file, $autodir, $keep, $ckal, $ckmt) = @_;

    # Fill in defaults for the optional flags.
    defined $keep or $keep = $Keep;
    defined $ckal or $ckal = $CheckForAutoloader;
    defined $ckmt or $ckmt = $CheckModTime;

    return autosplit_file($file, $autodir, $keep, $ckal, $ckmt);
}
168
169
# This function is used during perl building/installation
# ./miniperl -e 'use AutoSplit; autosplit_lib_modules(@ARGV)' ...
#
# autosplit_lib_modules(@modules)
#
# Each entry of @modules may be given as a package name (ABC::XYZ) or as a
# path, optionally prefixed with "lib/" or "./lib/".  Every entry is
# normalised to a path relative to ./lib and handed to autosplit_file(),
# splitting into ./lib/auto with the package-level $Keep,
# $CheckForAutoloader and $CheckModTime settings.  Always returns 0.

sub autosplit_lib_modules{
    my(@modules) = @_; # list of Module names
    local $_;          # the loop below works in $_; don't clobber the caller's

    # Test with defined(), not truth, so that an entry which is false as a
    # string (e.g. "0") does not end the loop early.
    while (defined($_ = shift @modules)) {
        while (m#(.*?[^:])::([^:].*)#) { # in case specified as ABC::XYZ
            $_ = catfile($1, $2);
        }
        s|\\|/|g;       # bug in ksh OS/2
        s#^lib/##s;     # in case specified as lib/*.pm
        my($lib) = catfile(curdir(), "lib");
        if ($Is_VMS) {  # may need to convert VMS-style filespecs
            $lib =~ s#^\[\]#.\/#;
        }
        # $lib is a literal path prefix, so quote it: otherwise the "." in
        # "./lib" would match any character.
        s#^\Q$lib\E\W+##s;  # in case specified as ./lib/*.pm
        if ($Is_VMS && /[:>\]]/) { # may need to convert VMS-style filespecs
            my ($dir,$name) = (/(.*])(.*)/s);
            $dir =~ s/.*lib[\.\]]//s;
            $dir =~ s#[\.\]]#/#g;
            $_ = $dir . $name;
        }
        autosplit_file(catfile($lib, $_), catfile($lib, "auto"),
                       $Keep, $CheckForAutoloader, $CheckModTime);
    }
    0;
}
198
199
200# private functions
201
# autosplit_file($filename, $autodir, $keep, $check_for_autoloader,
#                $check_mod_time)
#
# Does the actual work of splitting one module.
#   $filename  - module source; ".pm" is appended if missing
#   $autodir   - root of the output tree (defaults to ./lib/auto)
#   $keep      - if false, *.al files in the output directories that were
#                not written by this run are deleted
#   $check_for_autoloader - if true, skip files that never mention AutoLoader
#   $check_mod_time       - if true, skip files not newer than their index
#
# Every "sub NAME" line found after __END__ starts a new NAME.al file below
# $autodir/<package path>/; an index file ($IndexFile) with forward
# declarations is written for the module's default package.
#
# Returns 0 if the file was skipped because AutoLoader is not used, undef
# if the index file is already up to date, otherwise the list of .al paths
# written.  Dies if the source cannot be opened, has no __END__ or package
# statement, does not match its package name, or an output file cannot be
# created.
sub autosplit_file {
    my($filename, $autodir, $keep, $check_for_autoloader, $check_mod_time)
        = @_;
    my(@outfiles);
    local($_);
    local($/) = "\n";

    # where to write output files
    $autodir ||= catfile(curdir(), "lib", "auto");
    if ($Is_VMS) {
        ($autodir = VMS::Filespec::unixpath($autodir)) =~ s|/\z||;
        $filename = VMS::Filespec::unixify($filename); # may have dirs
    }
    unless (-d $autodir){
        mkpath($autodir,0,0755);
        # We should never need to create the auto dir
        # here. installperl (or similar) should have done
        # it. Expecting it to exist is a valuable sanity check against
        # autosplitting into some random directory by mistake.
        print "Warning: AutoSplit had to create top-level " .
            "$autodir unexpectedly.\n";
    }

    # allow just a package name to be used
    $filename .= ".pm" unless ($filename =~ m/\.pm\z/);

    # Three-argument open: the file name is never interpreted as a mode.
    open(IN, '<', $filename) or die "AutoSplit: Can't open $filename: $!\n";
    my($pm_mod_time) = (stat($filename))[9];
    my($autoloader_seen) = 0;
    my($in_pod) = 0;
    my($def_package,$last_package,$this_package,$fnr);

    # Pass 1: scan the part before __END__ for the package name and for
    # any sign that the module uses AutoLoader.
    while (<IN>) {
        # Skip pod text.
        $fnr++;
        $in_pod = 1 if /^=\w/;
        $in_pod = 0 if /^=cut/;
        next if ($in_pod || /^=cut/);

        # record last package name seen
        $def_package = $1 if (m/^\s*package\s+([\w:]+)\s*;/);
        ++$autoloader_seen if m/^\s*(use|require)\s+AutoLoader\b/;
        ++$autoloader_seen if m/\bISA\s*=.*\bAutoLoader\b/;
        last if /^__END__/;
    }
    if ($check_for_autoloader && !$autoloader_seen){
        print "AutoSplit skipped $filename: no AutoLoader used\n"
            if ($Verbose>=2);
        close(IN);
        return 0;
    }
    # $_ is undef here if the loop ran off the end of the file.
    $_ or die "Can't find __END__ in $filename\n";

    $def_package or die "Can't find 'package Name;' in $filename\n";

    my($modpname) = _modpname($def_package);
    if ($Is_VMS) {
        $modpname = VMS::Filespec::unixify($modpname); # may have dirs
    }

    # this _has_ to match so we have a reasonable timestamp file
    die "Package $def_package ($modpname.pm) does not ".
        "match filename $filename"
            unless ($filename =~ m/\Q$modpname.pm\E$/ or
                    ($^O eq 'dos') or ($^O eq 'MSWin32') or
                    $Is_VMS && $filename =~ m/\Q$modpname.pm\E/i);

    my($al_idx_file) = "$autodir/$modpname/$IndexFile";

    if ($check_mod_time){
        # A missing index file counts as very old (time 1).
        my($al_ts_time) = (stat("$al_idx_file"))[9] || 1;
        if ($al_ts_time >= $pm_mod_time){
            print "AutoSplit skipped ($al_idx_file newer than $filename)\n"
                if ($Verbose >= 2);
            close(IN);
            return undef;   # one undef, not a list
        }
    }

    my($modnamedir) = catfile($autodir, $modpname);
    print "AutoSplitting $filename ($modnamedir)\n"
        if $Verbose;

    unless (-d "$modnamedir"){
        mkpath("$modnamedir",0,0777);
    }

    # We must try to deal with some SVR3 systems with a limit of 14
    # characters for file names. Sadly we *cannot* simply truncate all
    # file names to 14 characters on these systems because we *must*
    # create filenames which exactly match the names used by AutoLoader.pm.
    # This is a problem because some systems silently truncate the file
    # names while others treat long file names as an error.

    my $Is83 = $maxflen==11;  # plain, case INSENSITIVE dos filenames

    # Pass 2: everything after __END__.  Lines seen while $caching is true
    # (before the first sub, or after a line starting with "}") are held in
    # @cache and written at the top of the next sub's file, after its
    # header.
    my(@subnames, $subname, %proto, %package);
    my @cache = ();
    my $caching = 1;
    $last_package = '';
    while (<IN>) {
        $fnr++;
        $in_pod = 1 if /^=\w/;
        $in_pod = 0 if /^=cut/;
        next if ($in_pod || /^=cut/);
        # the following (tempting) old coding gives big troubles if a
        # cut is forgotten at EOF:
        # next if /^=\w/ .. /^=cut/;
        if (/^package\s+([\w:]+)\s*;/) {
            $this_package = $def_package = $1;
        }
        if (/^sub\s+([\w:]+)(\s*(?:\(.*?\))?(?:$attr_list)?)/) {
            # Finish the previous sub's file before starting a new one.
            print OUT "# end of $last_package\::$subname\n1;\n"
                if $last_package;
            $subname = $1;
            my $proto = $2 || '';
            # A fully qualified sub name carries its own package.
            if ($subname =~ s/(.*):://){
                $this_package = $1;
            } else {
                $this_package = $def_package;
            }
            my $fq_subname = "$this_package\::$subname";
            $package{$fq_subname} = $this_package;
            $proto{$fq_subname} = $proto;
            push(@subnames, $fq_subname);
            my($lname, $sname) = ($subname, substr($subname,0,$maxflen-3));
            $modpname = _modpname($this_package);
            my($modnamedir) = catfile($autodir, $modpname);
            mkpath("$modnamedir",0,0777);
            my($lpath) = catfile($modnamedir, "$lname.al");
            my($spath) = catfile($modnamedir, "$sname.al");
            my $path;
            # Prefer the full name; fall back to the truncated one on 8.3
            # systems or when the long name cannot be created.
            if (!$Is83 and open(OUT, '>', $lpath)){
                $path=$lpath;
                print " writing $lpath\n" if ($Verbose>=2);
            } else {
                open(OUT, '>', $spath) or die "Can't create $spath: $!\n";
                $path=$spath;
                print " writing $spath (with truncated name)\n"
                    if ($Verbose>=1);
            }
            push(@outfiles, $path);
            print OUT <<EOT;
# NOTE: Derived from $filename.
# Changes made here will be lost when autosplit again.
# See AutoSplit.pm.
package $this_package;

#line $fnr "$filename (autosplit into $path)"
EOT
            print OUT @cache;
            @cache = ();
            $caching = 0;
        }
        if($caching) {
            # Drop blank lines until the first non-blank one is cached.
            push(@cache, $_) if @cache || /\S/;
        } else {
            print OUT $_;
        }
        if(/^\}/) {
            if($caching) {
                print OUT @cache;
                @cache = ();
            }
            print OUT "\n";
            $caching = 1;
        }
        $last_package = $this_package if defined $this_package;
    }
    if ($subname) {
        print OUT @cache,"1;\n# end of $last_package\::$subname\n";
        close(OUT);
    }
    close(IN);

    if (!$keep){ # don't keep any obsolete *.al files in the directory
        my(%outfiles);
        # perl downcases all filenames on VMS (which upcases all filenames) so
        # we'd better downcase the sub name list too, or subs with upper case
        # letters in them will get their .al files deleted right after they're
        # created. (The mixed case sub name won't match the all-lowercase
        # filename, and so be cleaned up as a scrap file)
        if ($Is_VMS or $Is83) {
            %outfiles = map { my $lower = lc($_); ($lower, $lower) } @outfiles;
        } else {
            @outfiles{@outfiles} = @outfiles;
        }
        my(%outdirs);
        for my $written (@outfiles) {
            $outdirs{File::Basename::dirname($written)}||=1;
        }
        for my $dir (keys %outdirs) {
            unless (opendir(OUTDIR,$dir)) {
                carp "AutoSplit: unable to read directory $dir: $!";
                next;
            }
            foreach my $entry (sort readdir(OUTDIR)){
                next unless $entry =~ /\.al\z/;
                my($file) = catfile($dir, $entry);
                $file = lc $file if $Is83 or $Is_VMS;
                next if $outfiles{$file};
                print " deleting $file\n" if ($Verbose>=2);
                my($deleted,$thistime);  # catch all versions on VMS
                do { $deleted += ($thistime = unlink $file) } while ($thistime);
                carp "Unable to delete $file: $!" unless $deleted;
            }
            closedir(OUTDIR);
        }
    }

    # Write the index: forward declarations for every sub that was split
    # out, grouped under "package" lines.  Only write if the open worked.
    if (open(TS, '>', $al_idx_file)) {
        print TS "# Index created by AutoSplit for $filename\n";
        print TS "# (file acts as timestamp)\n";
        $last_package = '';
        for my $fqs (@subnames) {
            my($subname) = $fqs;
            $subname =~ s/.*:://;
            print TS "package $package{$fqs};\n"
                unless $last_package eq $package{$fqs};
            print TS "sub $subname $proto{$fqs};\n";
            $last_package = $package{$fqs};
        }
        print TS "1;\n";
        close(TS);
    } else {
        carp "AutoSplit: unable to create timestamp file ($al_idx_file): $!";
    }

    _check_unique($filename, $Maxlen, 1, @outfiles);

    return @outfiles;
}
427
# _modpname($package)
#
# Convert a package name (Foo::Bar::Baz) into the relative path of its
# module, without the ".pm" suffix.  On MSWin32 each "::" simply becomes a
# backslash; elsewhere the name is split at "::" and joined with catfile().
sub _modpname ($) {
    my($package) = @_;
    my $modpname = $package;
    if ($^O eq 'MSWin32') {
        $modpname =~ s#::#\\#g;
    } else {
        # Collect the components first and call catfile() once.  Feeding
        # catfile()'s result back through the "::" match is only safe when
        # catfile() leaves the not-yet-split remainder untouched.
        my @parts;
        while ($modpname =~ m#(.*?[^:])::([^:].*)#) {
            push @parts, $1;
            $modpname = $2;
        }
        # A name with no "::" is returned unchanged.
        $modpname = catfile(@parts, $modpname) if @parts;
    }
    $modpname;
}
a0d0e21e 440
# _check_unique($filename, $maxlen, $warn, @outfiles)
#
# Looks at every path in @outfiles whose base name is longer than $maxlen
# characters and works out which of them would share a name, within the
# same directory, once cut down to $maxlen characters.  If any do and
# $warn is true, a report naming $filename is printed to STDOUT.
sub _check_unique {
    my($filename, $maxlen, $warn, @outfiles) = @_;
    my %clash;      # dir => { truncated name => 1 } for names seen twice
    my %members;    # dir => { truncated name => "file, file, ..." }

    for my $path (@outfiles) {
        my $base = File::Basename::basename($path);
        next unless length($base) > $maxlen;

        my $where = File::Basename::dirname($path);
        my $stub  = substr($base, 0, $maxlen);
        if ($members{$where}{$stub}) {
            # Second or later file mapping to this truncated name.
            $clash{$where}{$stub}   = 1;
            $members{$where}{$stub} = "$members{$where}{$stub}, $base";
        } else {
            $members{$where}{$stub} = $base;
        }
    }

    if (%clash && $warn){
        print "$filename: some names are not unique when " .
            "truncated to $maxlen characters:\n";
        for my $where (sort keys %clash) {
            print " directory $where:\n";
            for my $stub (sort keys %{$clash{$where}}) {
                print " $members{$where}{$stub} truncate to $stub\n";
            }
        }
    }
}
470
4711;
472__END__
473
474# test functions so AutoSplit.pm can be applied to itself:
4e6ea2c3 475sub test1 ($) { "test 1\n"; }
476sub test2 ($$) { "test 2\n"; }
477sub test3 ($$$) { "test 3\n"; }
478sub testtesttesttest4_1 { "test 4\n"; }
479sub testtesttesttest4_2 { "duplicate test 4\n"; }
480sub Just::Another::test5 { "another test 5\n"; }
481sub test6 { return join ":", __FILE__,__LINE__; }
482package Yet::Another::AutoSplit;
483sub testtesttesttest4_1 ($) { "another test 4\n"; }
484sub testtesttesttest4_2 ($$) { "another duplicate test 4\n"; }
09bef843 485package Yet::More::Attributes;
0120eecf 486sub test_a1 ($) : locked :locked { 1; }
09bef843 487sub test_a2 : locked { 1; }