Integrate mainline
[p5sagit/p5-mst-13.2.git] / lib / File / Basename.pm
CommitLineData
a0d0e21e 1package File::Basename;
2
f06db76b 3=head1 NAME
4
f06db76b 5fileparse - split a pathname into pieces
6
7basename - extract just the filename from a path
8
9dirname - extract just the directory from a path
10
11=head1 SYNOPSIS
12
13 use File::Basename;
14
15 ($name,$path,$suffix) = fileparse($fullname,@suffixlist)
16 fileparse_set_fstype($os_string);
17 $basename = basename($fullname,@suffixlist);
18 $dirname = dirname($fullname);
19
20 ($name,$path,$suffix) = fileparse("lib/File/Basename.pm",'\.pm');
21 fileparse_set_fstype("VMS");
22 $basename = basename("lib/File/Basename.pm",".pm");
23 $dirname = dirname("lib/File/Basename.pm");
24
25=head1 DESCRIPTION
26
27These routines allow you to parse file specifications into useful
28pieces using the syntax of different operating systems.
29
30=over 4
31
32=item fileparse_set_fstype
33
34You select the syntax via the routine fileparse_set_fstype().
ee2ff9ea 35
f06db76b 36If the argument passed to it contains one of the substrings
68dc0745 37"VMS", "MSDOS", "MacOS", "AmigaOS" or "MSWin32", the file specification
55497cff 38syntax of that operating system is used in future calls to
39fileparse(), basename(), and dirname(). If it contains none of
c7b9dd21 40these substrings, Unix syntax is used. This pattern matching is
f06db76b 41case-insensitive. If you've selected VMS syntax, and the file
42specification you pass to one of these routines contains a "/",
c7b9dd21 43they assume you are using Unix emulation and apply the Unix syntax
f06db76b 44rules instead, for that function call only.
45
ee2ff9ea 46If the argument passed to it contains one of the substrings "VMS",
68dc0745 47"MSDOS", "MacOS", "AmigaOS", "os2", "MSWin32" or "RISCOS", then the pattern
ee2ff9ea 48matching for suffix removal is performed without regard for case,
49since those systems are not case-sensitive when opening existing files
50(though some of them preserve case on file creation).
51
f06db76b 52If you haven't called fileparse_set_fstype(), the syntax is chosen
f0c6ccdf 53by examining the builtin variable C<$^O> according to these rules.
f06db76b 54
55=item fileparse
56
57The fileparse() routine divides a file specification into three
58parts: a leading B<path>, a file B<name>, and a B<suffix>. The
59B<path> contains everything up to and including the last directory
60separator in the input file specification. The remainder of the input
61file specification is then divided into B<name> and B<suffix> based on
62the optional patterns you specify in C<@suffixlist>. Each element of
63this list is interpreted as a regular expression, and is matched
64against the end of B<name>. If this succeeds, the matching portion of
65B<name> is removed and prepended to B<suffix>. By proper use of
66C<@suffixlist>, you can remove file types or versions for examination.
67
68You are guaranteed that if you concatenate B<path>, B<name>, and
7e2183d3 69B<suffix> together in that order, the result will denote the same
70file as the input file specification.
f06db76b 71
72=back
73
74=head1 EXAMPLES
75
c7b9dd21 76Using Unix file syntax:
f06db76b 77
7e2183d3 78 ($base,$path,$type) = fileparse('/virgil/aeneid/draft.book7',
f06db76b 79 '\.book\d+');
80
81would yield
82
83 $base eq 'draft'
7e2183d3 84 $path eq '/virgil/aeneid/',
f0542300 85 $type eq '.book7'
f06db76b 86
87Similarly, using VMS syntax:
88
89 ($name,$dir,$type) = fileparse('Doc_Root:[Help]Rhetoric.Rnh',
90 '\..*');
91
92would yield
93
94 $name eq 'Rhetoric'
95 $dir eq 'Doc_Root:[Help]'
96 $type eq '.Rnh'
97
2ae324a7 98=over
99
f06db76b 100=item C<basename>
101
102The basename() routine returns the first element of the list produced
44a8e56a 103by calling fileparse() with the same arguments, except that it always
104quotes metacharacters in the given suffixes. It is provided for
c7b9dd21 105programmer compatibility with the Unix shell command basename(1).
f06db76b 106
107=item C<dirname>
108
109The dirname() routine returns the directory portion of the input file
110specification. When using VMS or MacOS syntax, this is identical to the
111second element of the list produced by calling fileparse() with the same
7e2183d3 112input file specification. (Under VMS, if there is no directory information
113in the input file specification, then the current default device and
c7b9dd21 114directory are returned.) When using Unix or MSDOS syntax, the return
115value conforms to the behavior of the Unix shell command dirname(1). This
f06db76b 116is usually the same as the behavior of fileparse(), but differs in some
117cases. For example, for the input file specification F<lib/>, fileparse()
118considers the directory name to be F<lib/>, while dirname() considers the
119directory name to be F<.>.
120
2ae324a7 121=back
122
f06db76b 123=cut
124
b3eb6a9b 125
126## use strict;
1f47e8e2 127# A bit of juggling to insure that C<use re 'taint';> always works, since
918c0b2d 128# File::Basename is used during the Perl build, when the re extension may
129# not be available.
BEGIN {
    # Try to load the real 're' pragma.  If that fails (per the note above,
    # the re extension may not be available while Perl itself is being
    # built), install a minimal stand-in re::import that just sets a bit in
    # the compile-time hints variable $^H -- presumably the same bit the
    # real pragma sets for 'taint'; confirm against re.pm before changing.
    if (!eval { require re; }) {
        eval ' sub re::import { $^H |= 0x00100000; } ';
    }

    # Equivalent to "use re 'taint'", but usable with the fallback above.
    re->import('taint');
}
135
136
137
use 5.005_64;
require Exporter;

# Package state shared by the routines below: the currently selected
# filesystem syntax and whether suffix matching ignores case.
our ($Fileparse_fstype, $Fileparse_igncase);

our $VERSION = "2.6";
our @ISA     = ('Exporter');
our @EXPORT  = ('fileparse', 'fileparse_set_fstype', 'basename', 'dirname');
7e2183d3 144
a0d0e21e 145
146# fileparse_set_fstype() - specify OS-based rules used in future
147# calls to routines in this package
148#
ee2ff9ea 149# Currently recognized values: VMS, MSDOS, MSWin32, MacOS, AmigaOS, os2, RISCOS
150# Any other name uses Unix-style rules and is case-sensitive
a0d0e21e 151
sub fileparse_set_fstype {
    # Remember the settings in force before this call; they are the
    # return value whether or not a new type is supplied.
    my ($prev_fstype, $prev_igncase) = ($Fileparse_fstype, $Fileparse_igncase);

    if (@_) {
        my $os_name = $_[0];
        $Fileparse_fstype = $os_name;

        # Suffix matching ignores case when the name starts with one of
        # the listed OS names.
        $Fileparse_igncase = ($os_name =~ /^(?:MacOS|VMS|AmigaOS|os2|RISCOS|MSWin32|MSDOS)/i);
    }

    # List context: (old fstype, old igncase); otherwise just the old fstype.
    return ($prev_fstype, $prev_igncase) if wantarray;
    return $prev_fstype;
}
160
161# fileparse() - parse file specification
162#
f0542300 163# Version 2.4 27-Sep-1996 Charles Bailey bailey@genetics.upenn.edu
a0d0e21e 164
165
sub fileparse {
    # Split $fullname into (name, path, suffix) using the syntax selected
    # in $Fileparse_fstype.
    #
    # Arguments:
    #   $fullname  - the file specification to split
    #   @suffices  - optional regex source strings; each is tried in turn
    #                against the end of the name, and whatever it matches
    #                is moved from the name onto the front of the suffix
    # Returns:
    #   list context   - (name, path, suffix); suffix is undef when no
    #                    suffix patterns were supplied
    #   scalar context - the name only
    my ($fullname, @suffices) = @_;
    my ($fstype, $igncase) = ($Fileparse_fstype, $Fileparse_igncase);
    my ($dirpath, $tail, $basename);

    # Zero-length substring of the input, appended to every result below
    # so the results carry the input's taintedness.
    my ($taint) = substr($fullname, 0, 0);    # Is $fullname tainted?

    # An unset type behaves like Unix; make that explicit so the pattern
    # matches below never see undef.
    $fstype = '' unless defined $fstype;

    if ($fstype =~ /^VMS/i) {
        if ($fullname =~ m#/#) { $fstype = '' }    # We're doing Unix emulation
        else {
            ($dirpath, $basename) = ($fullname =~ /^(.*[:>\]])?(.*)/s);
        }
    }
    if ($fstype =~ /^MS(DOS|Win32)|epoc/i) {
        ($dirpath, $basename) = ($fullname =~ /^((?:.*[:\\\/])?)(.*)/s);
        # No directory part, or only a drive ("C:"): refer to the current
        # directory explicitly.
        $dirpath .= '.\\' unless $dirpath =~ /[\\\/]\z/;
    }
    elsif ($fstype =~ /^MacOS/si) {
        ($dirpath, $basename) = ($fullname =~ /^(.*:)?(.*)/s);
    }
    elsif ($fstype =~ /^AmigaOS/i) {
        ($dirpath, $basename) = ($fullname =~ /(.*[:\/])?(.*)/s);
        $dirpath = './' unless $dirpath;
    }
    elsif ($fstype !~ /^VMS/i) {    # default to Unix
        ($dirpath, $basename) = ($fullname =~ m#^(.*/)?(.*)#s);
        if ($^O eq 'VMS' and $fullname =~ m:^(/[^/]+/000000(/|$))(.*):) {
            # dev:[000000] is top of VMS tree, similar to Unix '/'
            # so strip it off and treat the rest as "normal"
            my $devspec   = $1;
            my $remainder = $3;
            ($dirpath, $basename) = ($remainder =~ m#^(.*/)?(.*)#s);
            # The remainder may have no directory part at all.
            $dirpath = $devspec . (defined $dirpath ? $dirpath : '');
        }
        $dirpath = './' unless $dirpath;
    }

    # The optional directory capture is undef when the spec has no
    # directory part (VMS, MacOS); the path should always be defined.
    $dirpath = '' unless defined $dirpath;

    if (@suffices) {
        $tail = '';
        foreach my $suffix (@suffices) {
            # Anchor with \z rather than $: "$" also matches just before a
            # trailing newline, which would strip a suffix out of the
            # middle of a name such as "b.pm\n" and break the guarantee
            # that path . name . suffix reproduces the input.
            my $pat = ($igncase ? '(?i)' : '') . "($suffix)\\z";
            if ($basename =~ s/$pat//s) {
                $taint .= substr($suffix, 0, 0);
                $tail = $1 . $tail;
            }
        }
    }

    $tail .= $taint if defined $tail;    # avoid warning if $tail == undef
    wantarray ? ($basename . $taint, $dirpath . $taint, $tail)
              : $basename . $taint;
}
218
219
220# basename() - returns first element of list returned by fileparse()
221
sub basename {
    # First argument is the file specification; the rest are literal
    # suffixes to strip.
    my ($path, @suffixes) = @_;

    # fileparse() treats suffixes as regexes, so escape every
    # metacharacter to make each suffix match literally.
    my @literal = map { quotemeta } @suffixes;

    # Call fileparse() in list context and keep only the name.
    my ($name) = fileparse($path, @literal);
    return $name;
}
7e2183d3 226
a0d0e21e 227
228# dirname() - returns device and directory portion of file specification
229# Behavior matches that of Unix dirname(1) exactly for Unix and MSDOS
748a9306 230# filespecs except for names ending with a separator, e.g., "/xx/yy/".
231# This differs from the second element of the list returned
a0d0e21e 232# by fileparse() in that the trailing '/' (Unix) or '\' (MSDOS) (and
233# the last directory name if the filespec ends in a '/' or '\'), is lost.
234
sub dirname {
    # Start from fileparse()'s view of the input, then trim the path
    # according to the selected filesystem syntax.
    my ($leaf, $dir) = fileparse($_[0]);
    my $syntax = $Fileparse_fstype;

    if ($syntax =~ /VMS/i) {
        # Without a "/" this is a native VMS spec: return its directory,
        # falling back to $ENV{DEFAULT} when there is none.
        return $dir || $ENV{DEFAULT} unless $_[0] =~ m#/#;

        # A "/" means Unix emulation; use the default rules below.
        $syntax = '';
    }

    if ($syntax =~ /MacOS/i) {
        if (!length($leaf) && $dir !~ /^[^:]+:\z/) {
            # Input ended in ":", so drop that separator and split again
            # to step up one level.
            $dir =~ s/([^:]):\z/$1/s;
            ($leaf, $dir) = fileparse($dir);
        }
        $dir .= ":" unless $dir =~ /:\z/;
    }
    elsif ($syntax =~ /MSDOS/i or $syntax =~ /MSWin32/i) {
        # Strip trailing separators, but never right after a ":".
        $dir =~ s/([^:])[\\\/]*\z/$1/;
        if (!length($leaf)) {
            # Input ended in a separator: the last component is the
            # "file", so split once more.
            ($leaf, $dir) = fileparse($dir);
            $dir =~ s/([^:])[\\\/]*\z/$1/;
        }
    }
    elsif ($syntax =~ /AmigaOS/i) {
        return $dir if $dir =~ /:\z/;
        chop $dir;
        $dir =~ s#[^:/]+\z## unless length($leaf);
    }
    else {
        $dir =~ s:(.)/*\z:$1:s;
        if (!length($leaf)) {
            # Re-parse under the syntax chosen above; it can differ from
            # the global setting after the VMS Unix-emulation switch.
            local($File::Basename::Fileparse_fstype) = $syntax;
            ($leaf, $dir) = fileparse($dir);
            $dir =~ s:(.)/*\z:$1:s;
        }
    }

    return $dir;
}
280
# Select the default syntax from the name of the operating system Perl is
# running on.
fileparse_set_fstype($^O);

# A module file must end with a true value.
1;