manual integration of all outstanding ansi branch stuff into mainline
[p5sagit/p5-mst-13.2.git] / lib / File / Basename.pm
CommitLineData
a0d0e21e 1package File::Basename;
2
f06db76b 3=head1 NAME
4
f06db76b 5fileparse - split a pathname into pieces
6
7basename - extract just the filename from a path
8
9dirname - extract just the directory from a path
10
11=head1 SYNOPSIS
12
13 use File::Basename;
14
15 ($name,$path,$suffix) = fileparse($fullname,@suffixlist)
16 fileparse_set_fstype($os_string);
17 $basename = basename($fullname,@suffixlist);
18 $dirname = dirname($fullname);
19
 ($name,$path,$suffix) = fileparse("lib/File/Basename.pm",'\.pm');
21 fileparse_set_fstype("VMS");
22 $basename = basename("lib/File/Basename.pm",".pm");
23 $dirname = dirname("lib/File/Basename.pm");
24
25=head1 DESCRIPTION
26
27These routines allow you to parse file specifications into useful
28pieces using the syntax of different operating systems.
29
30=over 4
31
32=item fileparse_set_fstype
33
34You select the syntax via the routine fileparse_set_fstype().
ee2ff9ea 35
f06db76b 36If the argument passed to it contains one of the substrings
68dc0745 37"VMS", "MSDOS", "MacOS", "AmigaOS" or "MSWin32", the file specification
55497cff 38syntax of that operating system is used in future calls to
39fileparse(), basename(), and dirname(). If it contains none of
40these substrings, UNIX syntax is used. This pattern matching is
f06db76b 41case-insensitive. If you've selected VMS syntax, and the file
42specification you pass to one of these routines contains a "/",
43they assume you are using UNIX emulation and apply the UNIX syntax
44rules instead, for that function call only.
45
If the argument passed to it begins with one of the strings "VMS",
"MSDOS", "MacOS", "AmigaOS", "os2", "MSWin32" or "RISCOS" (compared
without regard for case), then the pattern matching for suffix removal
is performed without regard for case, since those systems are not
case-sensitive when opening existing files (though some of them
preserve case on file creation).
51
f06db76b 52If you haven't called fileparse_set_fstype(), the syntax is chosen
f0c6ccdf 53by examining the builtin variable C<$^O> according to these rules.
f06db76b 54
55=item fileparse
56
57The fileparse() routine divides a file specification into three
58parts: a leading B<path>, a file B<name>, and a B<suffix>. The
59B<path> contains everything up to and including the last directory
60separator in the input file specification. The remainder of the input
61file specification is then divided into B<name> and B<suffix> based on
62the optional patterns you specify in C<@suffixlist>. Each element of
63this list is interpreted as a regular expression, and is matched
64against the end of B<name>. If this succeeds, the matching portion of
65B<name> is removed and prepended to B<suffix>. By proper use of
66C<@suffixlist>, you can remove file types or versions for examination.
67
68You are guaranteed that if you concatenate B<path>, B<name>, and
7e2183d3 69B<suffix> together in that order, the result will denote the same
70file as the input file specification.
f06db76b 71
72=back
73
74=head1 EXAMPLES
75
76Using UNIX file syntax:
77
7e2183d3 78 ($base,$path,$type) = fileparse('/virgil/aeneid/draft.book7',
f06db76b 79 '\.book\d+');
80
81would yield
82
 $base eq 'draft'
 $path eq '/virgil/aeneid/'
 $type eq '.book7'
f06db76b 86
87Similarly, using VMS syntax:
88
89 ($name,$dir,$type) = fileparse('Doc_Root:[Help]Rhetoric.Rnh',
90 '\..*');
91
92would yield
93
94 $name eq 'Rhetoric'
95 $dir eq 'Doc_Root:[Help]'
96 $type eq '.Rnh'
97
2ae324a7 98=over
99
f06db76b 100=item C<basename>
101
102The basename() routine returns the first element of the list produced
44a8e56a 103by calling fileparse() with the same arguments, except that it always
104quotes metacharacters in the given suffixes. It is provided for
105programmer compatibility with the UNIX shell command basename(1).
f06db76b 106
107=item C<dirname>
108
The dirname() routine returns the directory portion of the input file
specification.  When using VMS or MacOS syntax, this is identical to the
second element of the list produced by calling fileparse() with the same
input file specification.  (Under VMS, if there is no directory information
in the input file specification, then the current default device and
directory are returned.)  When using UNIX or MSDOS syntax, the return
value conforms to the behavior of the UNIX shell command dirname(1).  This
is usually the same as the behavior of fileparse(), but differs in some
cases.  For example, for the input file specification F<lib/>, fileparse()
considers the directory name to be F<lib/>, while dirname() considers the
directory name to be F<.>.
120
2ae324a7 121=back
122
f06db76b 123=cut
124
f0c6ccdf 125require 5.002;
a0d0e21e 126require Exporter;
127@ISA = qw(Exporter);
748a9306 128@EXPORT = qw(fileparse fileparse_set_fstype basename dirname);
7e2183d3 129#use strict;
12cbd720 130use vars qw($VERSION $Fileparse_fstype $Fileparse_igncase);
131$VERSION = "2.6";
7e2183d3 132
a0d0e21e 133
# fileparse_set_fstype() - choose the OS-specific rules applied by later
#                          calls to the routines in this package
#
# With an argument, that argument is stored as the current syntax name and
# the ignore-case flag is recomputed: it is true when the name starts
# (case-insensitively) with MacOS, VMS, AmigaOS, os2, RISCOS, MSWin32 or
# MSDOS, and false for anything else.  With no argument nothing is changed.
#
# Returns the settings that were in force before the call: the pair
# (fstype, igncase) in list context, only the fstype otherwise.

sub fileparse_set_fstype {
    my($prev_fstype, $prev_igncase) = ($Fileparse_fstype, $Fileparse_igncase);

    if (scalar @_) {
        my $new_type = $_[0];
        $Fileparse_fstype  = $new_type;
        $Fileparse_igncase =
            ($new_type =~ /^(?:MacOS|VMS|AmigaOS|os2|RISCOS|MSWin32|MSDOS)/i);
    }

    return ($prev_fstype, $prev_igncase) if wantarray;
    return $prev_fstype;
}
148
# fileparse() - parse file specification
#
# Version 2.4  27-Sep-1996  Charles Bailey  bailey@genetics.upenn.edu
#
# Arguments: the file specification, followed by an optional list of
# suffix patterns (each is interpolated into a regular expression and
# matched against the end of the name).
#
# Returns (name, path, suffix) in list context and just the name in
# scalar context.  The suffix element is undef when no suffix patterns
# were supplied.  The rules used to split path from name are selected by
# $Fileparse_fstype; a VMS setting falls back to Unix rules when the
# specification contains a "/".
#
# All patterns use /s so that "." also matches a newline embedded in a
# file name; without it the split stops at the newline and part of the
# input is lost.

sub fileparse {
    my($fullname,@suffices) = @_;
    my($fstype,$igncase) = ($Fileparse_fstype, $Fileparse_igncase);
    my($dirpath,$tail,$suffix,$basename);

    # Zero-length slice of the input: empty, but carries the taintedness of
    # $fullname so it can be re-attached to values extracted by the regexes.
    my($taint) = substr($fullname,0,0);

    # No syntax selected yet: behave as for any unrecognised name (Unix).
    $fstype = '' unless defined $fstype;

    if ($fstype =~ /^VMS/i) {
        if ($fullname =~ m#/#) { $fstype = '' }  # We're doing Unix emulation
        else {
            ($dirpath,$basename) = ($fullname =~ /^(.*[:>\]])?(.*)/s);
            $dirpath ||= '';  # should always be defined
        }
    }
    if ($fstype =~ /^MS(DOS|Win32)/i) {
        ($dirpath,$basename) = ($fullname =~ /^((?:.*[:\\\/])?)(.*)/s);
        # A bare name or a drive-relative one ("C:foo") gets an explicit
        # current-directory component.
        $dirpath .= '.\\' unless $dirpath =~ /[\\\/]$/;
    }
    elsif ($fstype =~ /^MacOS/i) {
        ($dirpath,$basename) = ($fullname =~ /^(.*:)?(.*)/s);
    }
    elsif ($fstype =~ /^AmigaOS/i) {
        ($dirpath,$basename) = ($fullname =~ /(.*[:\/])?(.*)/s);
        $dirpath = './' unless $dirpath;
    }
    elsif ($fstype !~ /^VMS/i) {  # default to Unix
        ($dirpath,$basename) = ($fullname =~ m#^(.*/)?(.*)#s);
        if ($^O eq 'VMS' and $fullname =~ m:/[^/]+/000000/?:) {
            # dev:[000000] is top of VMS tree, similar to Unix '/'
            ($basename,$dirpath) = ('',$fullname);
        }
        $dirpath = './' unless $dirpath;
    }

    if (@suffices) {
        $tail = '';
        foreach $suffix (@suffices) {
            my $pat = ($igncase ? '(?i)' : '') . "($suffix)\$";
            if ($basename =~ s/$pat//s) {
                # The pattern took part in the result, so its taintedness
                # must be reflected in what is returned.
                $taint .= substr($suffix,0,0);
                # Later matches lie to the left of earlier ones.
                $tail = $1 . $tail;
            }
        }
    }

    $tail .= $taint if defined $tail; # avoid warning if $tail == undef
    wantarray ? ($basename . $taint, $dirpath . $taint, $tail)
              : $basename . $taint;
}
202
203
# basename() - file name portion of a file specification
#
# Takes the specification followed by an optional list of suffixes.  Each
# suffix is escaped so that it is matched literally rather than as a
# pattern, and the work is handed to fileparse(); only the first element
# of the list fileparse() returns is passed back.

sub basename {
    my $fullname = shift;
    my @literal_suffixes = map { quotemeta($_) } @_;
    my($base) = fileparse($fullname, @literal_suffixes);
    return $base;
}
7e2183d3 210
a0d0e21e 211
# dirname() - returns device and directory portion of file specification
#        Behavior matches that of Unix dirname(1) exactly for Unix and MSDOS
#        filespecs except for names ending with a separator, e.g., "/xx/yy/".
#        This differs from the second element of the list returned
#        by fileparse() in that the trailing '/' (Unix) or '\' (MSDOS) (and
#        the last directory name if the filespec ends in a '/' or '\'), is lost.
#
# The syntax name is tested with the same start-anchored patterns that
# fileparse() uses, so both routines always agree on which rules apply.
# For VMS syntax without a "/" in the argument, the path from fileparse()
# is returned, or $ENV{DEFAULT} when that path is empty.  For MacOS syntax
# the path from fileparse() is returned unchanged.

sub dirname {
    my($basename,$dirname) = fileparse($_[0]);
    my($fstype) = $Fileparse_fstype;

    if ($fstype =~ /^VMS/i) {
        if ($_[0] =~ m#/#) { $fstype = '' }  # Unix emulation, as in fileparse()
        else { return $dirname || $ENV{DEFAULT} }
    }
    if ($fstype =~ /^MacOS/i) { return $dirname }
    elsif ($fstype =~ /^MS(?:DOS|Win32)/i) {
        # Drop trailing separators, but keep one that directly follows a
        # drive colon ("C:\").
        $dirname =~ s/([^:])[\\\/]*$/$1/;
        unless( length($basename) ) {
            # Input ended with a separator: step up one more level.
            ($basename,$dirname) = fileparse($dirname);
            $dirname =~ s/([^:])[\\\/]*$/$1/;
        }
    }
    elsif ($fstype =~ /^AmigaOS/i) {
        if ( $dirname =~ /:$/) { return $dirname }
        chop $dirname;
        $dirname =~ s#[^:/]+$## unless length($basename);
    }
    else {
        # Strip trailing slashes while always leaving at least one
        # character, so that "/" stays "/".
        $dirname =~ s:(.)/*$:$1:s;
        unless( length($basename) ) {
            # Make the nested fileparse() use the same rules chosen above
            # (matters when VMS syntax was switched to Unix emulation).
            local($File::Basename::Fileparse_fstype) = $fstype;
            ($basename,$dirname) = fileparse($dirname);
            $dirname =~ s:(.)/*$:$1:s;
        }
    }

    $dirname;
}
258
44a8e56a 259fileparse_set_fstype $^O;
a0d0e21e 260
2611;