source: for-distributions/trunk/bin/windows/perl/lib/File/Basename.pm@ 14489

Last change on this file since 14489 was 14489, checked in by oranfry, 17 years ago

upgrading to perl 5.8

File size: 11.0 KB
Line 
1=head1 NAME
2
3File::Basename - Parse file paths into directory, filename and suffix.
4
5=head1 SYNOPSIS
6
7 use File::Basename;
8
9 ($name,$path,$suffix) = fileparse($fullname,@suffixlist);
10 $name = fileparse($fullname,@suffixlist);
11
12 $basename = basename($fullname,@suffixlist);
13 $dirname = dirname($fullname);
14
15
16=head1 DESCRIPTION
17
18These routines allow you to parse file paths into their directory, filename
19and suffix.
20
21B<NOTE>: C<dirname()> and C<basename()> emulate the behaviours, and
22quirks, of the shell and C functions of the same name. See each
23function's documentation for details. If your concern is just parsing
24paths it is safer to use L<File::Spec>'s C<splitpath()> and
25C<splitdir()> methods.
26
27It is guaranteed that
28
29 # Where $path_separator is / for Unix, \ for Windows, etc...
30 dirname($path) . $path_separator . basename($path);
31
32is equivalent to the original path for all systems but VMS.
33
34
35=cut
36
37
38package File::Basename;
39
40# A bit of juggling to insure that C<use re 'taint';> always works, since
41# File::Basename is used during the Perl build, when the re extension may
42# not be available.
43BEGIN {
44 unless (eval { require re; })
45 { eval ' sub re::import { $^H |= 0x00100000; } ' } # HINT_RE_TAINT
46 import re 'taint';
47}
48
49
50use strict;
51use 5.006;
52use warnings;
53our(@ISA, @EXPORT, $VERSION, $Fileparse_fstype, $Fileparse_igncase);
54require Exporter;
55@ISA = qw(Exporter);
56@EXPORT = qw(fileparse fileparse_set_fstype basename dirname);
57$VERSION = "2.74";
58
59fileparse_set_fstype($^O);
60
61
62=over 4
63
64=item C<fileparse>
65
66 my($filename, $directories, $suffix) = fileparse($path);
67 my($filename, $directories, $suffix) = fileparse($path, @suffixes);
68 my $filename = fileparse($path, @suffixes);
69
70The C<fileparse()> routine divides a file path into its $directories, $filename
71and (optionally) the filename $suffix.
72
73$directories contains everything up to and including the last
74directory separator in the $path including the volume (if applicable).
75The remainder of the $path is the $filename.
76
77 # On Unix returns ("baz", "/foo/bar/", "")
78 fileparse("/foo/bar/baz");
79
80 # On Windows returns ("baz", "C:\foo\bar\", "")
81 fileparse("C:\foo\bar\baz");
82
83 # On Unix returns ("", "/foo/bar/baz/", "")
84 fileparse("/foo/bar/baz/");
85
86If @suffixes are given each element is a pattern (either a string or a
87C<qr//>) matched against the end of the $filename. The matching
88portion is removed and becomes the $suffix.
89
90 # On Unix returns ("baz", "/foo/bar", ".txt")
91 fileparse("/foo/bar/baz", qr/\.[^.]*/);
92
93If type is non-Unix (see C<fileparse_set_fstype()>) then the pattern
94matching for suffix removal is performed case-insensitively, since
95those systems are not case-sensitive when opening existing files.
96
97You are guaranteed that C<$directories . $filename . $suffix> will
98denote the same location as the original $path.
99
100=cut
101
102
103sub fileparse {
104 my($fullname,@suffices) = @_;
105
106 unless (defined $fullname) {
107 require Carp;
108 Carp::croak("fileparse(): need a valid pathname");
109 }
110
111 my $orig_type = '';
112 my($type,$igncase) = ($Fileparse_fstype, $Fileparse_igncase);
113
114 my($taint) = substr($fullname,0,0); # Is $fullname tainted?
115
116 if ($type eq "VMS" and $fullname =~ m{/} ) {
117 # We're doing Unix emulation
118 $orig_type = $type;
119 $type = 'Unix';
120 }
121
122 my($dirpath, $basename);
123
124 if (grep { $type eq $_ } qw(MSDOS DOS MSWin32 Epoc)) {
125 ($dirpath,$basename) = ($fullname =~ /^((?:.*[:\\\/])?)(.*)/s);
126 $dirpath .= '.\\' unless $dirpath =~ /[\\\/]\z/;
127 }
128 elsif ($type eq "OS2") {
129 ($dirpath,$basename) = ($fullname =~ m#^((?:.*[:\\/])?)(.*)#s);
130 $dirpath = './' unless $dirpath; # Can't be 0
131 $dirpath .= '/' unless $dirpath =~ m#[\\/]\z#;
132 }
133 elsif ($type eq "MacOS") {
134 ($dirpath,$basename) = ($fullname =~ /^(.*:)?(.*)/s);
135 $dirpath = ':' unless $dirpath;
136 }
137 elsif ($type eq "AmigaOS") {
138 ($dirpath,$basename) = ($fullname =~ /(.*[:\/])?(.*)/s);
139 $dirpath = './' unless $dirpath;
140 }
141 elsif ($type eq 'VMS' ) {
142 ($dirpath,$basename) = ($fullname =~ /^(.*[:>\]])?(.*)/s);
143 $dirpath ||= ''; # should always be defined
144 }
145 else { # Default to Unix semantics.
146 ($dirpath,$basename) = ($fullname =~ m#^(.*/)?(.*)#s);
147 if ($orig_type eq 'VMS' and $fullname =~ m:^(/[^/]+/000000(/|$))(.*):) {
148 # dev:[000000] is top of VMS tree, similar to Unix '/'
149 # so strip it off and treat the rest as "normal"
150 my $devspec = $1;
151 my $remainder = $3;
152 ($dirpath,$basename) = ($remainder =~ m#^(.*/)?(.*)#s);
153 $dirpath ||= ''; # should always be defined
154 $dirpath = $devspec.$dirpath;
155 }
156 $dirpath = './' unless $dirpath;
157 }
158
159
160 my $tail = '';
161 my $suffix = '';
162 if (@suffices) {
163 foreach $suffix (@suffices) {
164 my $pat = ($igncase ? '(?i)' : '') . "($suffix)\$";
165 if ($basename =~ s/$pat//s) {
166 $taint .= substr($suffix,0,0);
167 $tail = $1 . $tail;
168 }
169 }
170 }
171
172 # Ensure taint is propgated from the path to its pieces.
173 $tail .= $taint;
174 wantarray ? ($basename .= $taint, $dirpath .= $taint, $tail)
175 : ($basename .= $taint);
176}
177
178
179
180=item C<basename>
181
182 my $filename = basename($path);
183 my $filename = basename($path, @suffixes);
184
185This function is provided for compatibility with the Unix shell command
186C<basename(1)>. It does B<NOT> always return the file name portion of a
187path as you might expect. To be safe, if you want the file name portion of
188a path use C<fileparse()>.
189
190C<basename()> returns the last level of a filepath even if the last
191level is clearly directory. In effect, it is acting like C<pop()> for
192paths. This differs from C<fileparse()>'s behaviour.
193
194 # Both return "bar"
195 basename("/foo/bar");
196 basename("/foo/bar/");
197
198@suffixes work as in C<fileparse()> except all regex metacharacters are
199quoted.
200
201 # These two function calls are equivalent.
202 my $filename = basename("/foo/bar/baz.txt", ".txt");
203 my $filename = fileparse("/foo/bar/baz.txt", qr/\Q.txt\E/);
204
205Also note that in order to be compatible with the shell command,
206C<basename()> does not strip off a suffix if it is identical to the
207remaining characters in the filename.
208
209=cut
210
211
212sub basename {
213 my($path) = shift;
214
215 # From BSD basename(1)
216 # The basename utility deletes any prefix ending with the last slash `/'
217 # character present in string (after first stripping trailing slashes)
218 _strip_trailing_sep($path);
219
220 my($basename, $dirname, $suffix) = fileparse( $path, map("\Q$_\E",@_) );
221
222 # From BSD basename(1)
223 # The suffix is not stripped if it is identical to the remaining
224 # characters in string.
225 if( length $suffix and !length $basename ) {
226 $basename = $suffix;
227 }
228
229 # Ensure that basename '/' == '/'
230 if( !length $basename ) {
231 $basename = $dirname;
232 }
233
234 return $basename;
235}
236
237
238
239=item C<dirname>
240
241This function is provided for compatibility with the Unix shell
242command C<dirname(1)> and has inherited some of its quirks. In spite of
243its name it does B<NOT> always return the directory name as you might
244expect. To be safe, if you want the directory name of a path use
245C<fileparse()>.
246
247Only on VMS (where there is no ambiguity between the file and directory
248portions of a path) and AmigaOS (possibly due to an implementation quirk in
249this module) does C<dirname()> work like C<fileparse($path)>, returning just the
250$directories.
251
252 # On VMS and AmigaOS
253 my $directories = dirname($path);
254
255When using Unix or MSDOS syntax this emulates the C<dirname(1)> shell function
256which is subtly different from how C<fileparse()> works. It returns all but
257the last level of a file path even if the last level is clearly a directory.
258In effect, it is not returning the directory portion but simply the path one
259level up acting like C<chop()> for file paths.
260
261Also unlike C<fileparse()>, C<dirname()> does not include a trailing slash on
262its returned path.
263
264 # returns /foo/bar. fileparse() would return /foo/bar/
265 dirname("/foo/bar/baz");
266
267 # also returns /foo/bar despite the fact that baz is clearly a
268 # directory. fileparse() would return /foo/bar/baz/
269 dirname("/foo/bar/baz/");
270
271 # returns '.'. fileparse() would return 'foo/'
272 dirname("foo/");
273
274Under VMS, if there is no directory information in the $path, then the
275current default device and directory is used.
276
277=cut
278
279
280sub dirname {
281 my $path = shift;
282
283 my($type) = $Fileparse_fstype;
284
285 if( $type eq 'VMS' and $path =~ m{/} ) {
286 # Parse as Unix
287 local($File::Basename::Fileparse_fstype) = '';
288 return dirname($path);
289 }
290
291 my($basename, $dirname) = fileparse($path);
292
293 if ($type eq 'VMS') {
294 $dirname ||= $ENV{DEFAULT};
295 }
296 elsif ($type eq 'MacOS') {
297 if( !length($basename) && $dirname !~ /^[^:]+:\z/) {
298 _strip_trailing_sep($dirname);
299 ($basename,$dirname) = fileparse $dirname;
300 }
301 $dirname .= ":" unless $dirname =~ /:\z/;
302 }
303 elsif (grep { $type eq $_ } qw(MSDOS DOS MSWin32 OS2)) {
304 _strip_trailing_sep($dirname);
305 unless( length($basename) ) {
306 ($basename,$dirname) = fileparse $dirname;
307 _strip_trailing_sep($dirname);
308 }
309 }
310 elsif ($type eq 'AmigaOS') {
311 if ( $dirname =~ /:\z/) { return $dirname }
312 chop $dirname;
313 $dirname =~ s#[^:/]+\z## unless length($basename);
314 }
315 else {
316 _strip_trailing_sep($dirname);
317 unless( length($basename) ) {
318 ($basename,$dirname) = fileparse $dirname;
319 _strip_trailing_sep($dirname);
320 }
321 }
322
323 $dirname;
324}
325
326
327# Strip the trailing path separator.
328sub _strip_trailing_sep {
329 my $type = $Fileparse_fstype;
330
331 if ($type eq 'MacOS') {
332 $_[0] =~ s/([^:]):\z/$1/s;
333 }
334 elsif (grep { $type eq $_ } qw(MSDOS DOS MSWin32 OS2)) {
335 $_[0] =~ s/([^:])[\\\/]*\z/$1/;
336 }
337 else {
338 $_[0] =~ s{(.)/*\z}{$1}s;
339 }
340}
341
342
343=item C<fileparse_set_fstype>
344
345 my $type = fileparse_set_fstype();
346 my $previous_type = fileparse_set_fstype($type);
347
348Normally File::Basename will assume a file path type native to your current
349operating system (ie. /foo/bar style on Unix, \foo\bar on Windows, etc...).
350With this function you can override that assumption.
351
352Valid $types are "MacOS", "VMS", "AmigaOS", "OS2", "RISCOS",
353"MSWin32", "DOS" (also "MSDOS" for backwards bug compatibility),
354"Epoc" and "Unix" (all case-insensitive). If an unrecognized $type is
355given "Unix" will be assumed.
356
357If you've selected VMS syntax, and the file specification you pass to
358one of these routines contains a "/", they assume you are using Unix
359emulation and apply the Unix syntax rules instead, for that function
360call only.
361
362=back
363
364=cut
365
366
367BEGIN {
368
369my @Ignore_Case = qw(MacOS VMS AmigaOS OS2 RISCOS MSWin32 MSDOS DOS Epoc);
370my @Types = (@Ignore_Case, qw(Unix));
371
372sub fileparse_set_fstype {
373 my $old = $Fileparse_fstype;
374
375 if (@_) {
376 my $new_type = shift;
377
378 $Fileparse_fstype = 'Unix'; # default
379 foreach my $type (@Types) {
380 $Fileparse_fstype = $type if $new_type =~ /^$type/i;
381 }
382
383 $Fileparse_igncase =
384 (grep $Fileparse_fstype eq $_, @Ignore_Case) ? 1 : 0;
385 }
386
387 return $old;
388}
389
390}
391
392
3931;
394
395
396=head1 SEE ALSO
397
398L<dirname(1)>, L<basename(1)>, L<File::Spec>
Note: See TracBrowser for help on using the repository browser.