231 lines
5.6 KiB
Perl
231 lines
5.6 KiB
Perl
|
package File::Find;
|
||
|
require 5.000;
|
||
|
require Exporter;
|
||
|
require Cwd;
|
||
|
|
||
|
=head1 NAME
|
||
|
|
||
|
find - traverse a file tree
|
||
|
|
||
|
finddepth - traverse a directory structure depth-first
|
||
|
|
||
|
=head1 SYNOPSIS
|
||
|
|
||
|
use File::Find;
|
||
|
find(\&wanted, '/foo','/bar');
|
||
|
sub wanted { ... }
|
||
|
|
||
|
use File::Find;
|
||
|
finddepth(\&wanted, '/foo','/bar');
|
||
|
sub wanted { ... }
|
||
|
|
||
|
=head1 DESCRIPTION
|
||
|
|
||
|
The first argument to find() is either a hash reference describing the
|
||
|
operations to be performed for each file, or a code reference. If it
|
||
|
is a hash reference, then the value for the key C<wanted> should be a
|
||
|
code reference. This code reference is called I<the wanted()
|
||
|
function> below.
|
||
|
|
||
|
Currently the only other supported key for the above hash is
|
||
|
C<bydepth>, in presence of which the walk over directories is
|
||
|
performed depth-first. Entry point finddepth() is a shortcut for
|
||
|
specifying C<{ bydepth => 1}> in the first argument of find().
|
||
|
|
||
|
The wanted() function does whatever verifications you want.
|
||
|
$File::Find::dir contains the current directory name, and $_ the
|
||
|
current filename within that directory. $File::Find::name contains
|
||
|
C<"$File::Find::dir/$_">. You are chdir()'d to $File::Find::dir when
|
||
|
the function is called. The function may set $File::Find::prune to
|
||
|
prune the tree.
|
||
|
|
||
|
File::Find assumes that you don't alter the $_ variable. If you do then
|
||
|
make sure you return it to its original value before exiting your function.
|
||
|
|
||
|
This library is useful for the C<find2perl> tool, which when fed,
|
||
|
|
||
|
find2perl / -name .nfs\* -mtime +7 \
|
||
|
-exec rm -f {} \; -o -fstype nfs -prune
|
||
|
|
||
|
produces something like:
|
||
|
|
||
|
sub wanted {
|
||
|
/^\.nfs.*$/ &&
|
||
|
(($dev,$ino,$mode,$nlink,$uid,$gid) = lstat($_)) &&
|
||
|
int(-M _) > 7 &&
|
||
|
unlink($_)
|
||
|
||
|
||
|
($nlink || (($dev,$ino,$mode,$nlink,$uid,$gid) = lstat($_))) &&
|
||
|
$dev < 0 &&
|
||
|
($File::Find::prune = 1);
|
||
|
}
|
||
|
|
||
|
Set the variable $File::Find::dont_use_nlink if you're using AFS,
|
||
|
since AFS cheats.
|
||
|
|
||
|
C<finddepth> is just like C<find>, except that it does a depth-first
|
||
|
search.
|
||
|
|
||
|
Here's another interesting wanted function. It will find all symlinks
|
||
|
that don't resolve:
|
||
|
|
||
|
sub wanted {
|
||
|
-l && !-e && print "bogus link: $File::Find::name\n";
|
||
|
}
|
||
|
|
||
|
=head1 BUGS
|
||
|
|
||
|
There is no way to make find or finddepth follow symlinks.
|
||
|
|
||
|
=cut
|
||
|
|
||
|
# Inherit import() from Exporter and export both entry points by default.
@ISA    = ('Exporter');
@EXPORT = ('find', 'finddepth');
|
||
|
|
||
|
|
||
|
# find_opt(\%options, @top_paths)
#
# Shared driver behind find() and finddepth().
#
#   \%options   hash reference; the code reference stored under the key
#               'wanted' is called for every entry, and a true value under
#               'bydepth' makes a directory's contents be reported before
#               the directory itself.
#   @top_paths  starting points of the walk (files or directories).
#
# Before each call of the wanted code the package variables $dir and $name
# and the global $_ are set, and the process is chdir()'d into $dir.
# Problems (stat, chdir) are reported with warn() and the walk goes on with
# the next starting point.
#
# The working directory that was current on entry is restored after every
# starting point, including one whose top directory was pruned by the
# wanted code, so relative starting points are always resolved from the
# same place.
sub find_opt {
    my $wanted  = shift;
    my $bydepth = $wanted->{bydepth};
    my $cwd     = $bydepth ? Cwd::fastcwd() : Cwd::cwd();

    # Localize these rather than lexicalizing them for backwards
    # compatibility.
    local($topdir,$topdev,$topino,$topmode,$topnlink);

    foreach $topdir (@_) {
        (($topdev,$topino,$topmode,$topnlink) =
            ($Is_VMS ? stat($topdir) : lstat($topdir)))
            || (warn("Can't stat $topdir: $!\n"), next);

        # "_" reuses the stat buffer filled in just above.
        if (-d _) {
            if (chdir($topdir)) {
                $prune = 0;
                unless ($bydepth) {
                    # Pre-order: report the top directory itself first.
                    ($dir,$_) = ($topdir,'.');
                    $name = $topdir;
                    $wanted->{wanted}->();
                }

                # The wanted code may have asked to prune the top directory.
                # Skip the descent, but still fall through to the chdir()
                # at the bottom of the loop.
                unless ($prune) {
                    my $fixtopdir = $topdir;
                    $fixtopdir =~ s,/$,, ;
                    $fixtopdir =~ s/\.dir$// if $Is_VMS;
                    finddir($wanted,$fixtopdir,$topnlink,$bydepth);
                    if ($bydepth) {
                        # Post-order: report the top directory last.
                        ($dir,$_) = ($fixtopdir,'.');
                        $name = $fixtopdir;
                        $wanted->{wanted}->();
                    }
                }
            }
            else {
                warn "Can't cd to $topdir: $!\n";
            }
        }
        else {
            # The starting point is not a directory: report it once, from
            # inside its containing directory.
            require File::Basename;
            unless (($_,$dir) = File::Basename::fileparse($topdir)) {
                # Defensive fallback in case fileparse() returns nothing.
                ($dir,$_) = ('.', $topdir);
            }
            if (chdir($dir)) {
                $name = $topdir;
                $wanted->{wanted}->();
            }
            else {
                warn "Can't cd to $dir: $!\n";
            }
        }

        # Always return to where we started before the next starting point.
        chdir($cwd) || warn("Can't cd to $cwd: $!\n");
    }
}
|
||
|
|
||
|
# finddir(\%options, $dir_name, $nlink, $bydepth)
#
# Recursive worker: walks the directory the process is currently chdir()'d
# into and calls the code reference stored in $options->{wanted} for every
# entry except '.' and '..'.
#
#   $dir_name  name used for $dir and as the prefix of $name
#   $nlink     link count of this directory as reported by stat/lstat
#   $bydepth   true: call wanted for an entry after its subtree was walked;
#              false: call it before, and honour $prune
#
# $dir and $name are localized, so the values seen by the caller are
# restored on return. Failures are reported with warn().
#
# The link count is used as a shortcut: a count of exactly 2 is taken to
# mean "no subdirectories", and otherwise entries are only stat'ed until
# ($nlink - 2) directories have been found. A count below 2 cannot follow
# that convention, so in that case (as when $dont_use_nlink is set) every
# entry is stat'ed instead of silently skipping all subdirectories.
sub finddir {
    my($wanted, $nlink, $bydepth);
    local($dir, $name);
    ($wanted, $dir, $nlink, $bydepth) = @_;

    # Get the list of files in the current directory.
    unless (opendir(DIR,'.')) {
        warn("Can't open $dir: $!\n");
        return;
    }
    my(@filenames) = readdir(DIR);
    closedir(DIR);

    # True when the link count must not be trusted for this directory.
    my $no_nlink = ($dont_use_nlink || $nlink < 2);

    if ($nlink == 2 && !$no_nlink) {    # This dir has no subdirectories.
        for (@filenames) {
            next if $_ eq '.';
            next if $_ eq '..';
            $name = "$dir/$_";
            $wanted->{wanted}->();
        }
    }
    else {                              # This dir has subdirectories.
        my $subcount = $nlink - 2;
        for (@filenames) {
            next if $_ eq '.';
            next if $_ eq '..';
            $prune = 0 unless $bydepth;
            $name = "$dir/$_";
            $wanted->{wanted}->() unless $bydepth;

            if ($subcount > 0 || $no_nlink) {    # Seen all the subdirs?

                # Get link count and check for directoriness.
                my $entry_nlink =
                    ($Is_VMS ? stat($_) : lstat($_))[3];

                if (-d _) {

                    # It really is a directory, so do it recursively.
                    --$subcount;
                    next if $prune;
                    if (chdir $_) {
                        $name =~ s/\.dir$// if $Is_VMS;
                        finddir($wanted,$name,$entry_nlink,$bydepth);
                        chdir '..';
                    }
                    else {
                        warn "Can't cd to $_: $!\n";
                    }
                }
            }
            $wanted->{wanted}->() if $bydepth;
        }
    }
}
|
||
|
|
||
|
# wrap_wanted($wanted)
#
# Normalizes the first argument of find()/finddepth() into an options
# hash reference. A hash reference is returned as is; anything else
# (normally a code reference) is returned wrapped as { wanted => $wanted }.
#
# The argument is classified with ref() rather than by probing it with
# "defined &$wanted", which is not a valid operation on a hash reference.
sub wrap_wanted {
    my $wanted = shift;
    return ref($wanted) eq 'HASH' ? $wanted : { wanted => $wanted };
}
|
||
|
|
||
|
# find(\&wanted, @directories)
# find(\%options, @directories)
#
# Public entry point: normalizes the first argument with wrap_wanted()
# and hands it, together with the remaining arguments, to find_opt().
sub find {
    my $options = wrap_wanted(shift);
    return find_opt($options, @_);
}
|
||
|
|
||
|
# finddepth(\&wanted, @directories)
# finddepth(\%options, @directories)
#
# Public entry point: same as find(), but with the 'bydepth' option forced
# on, so the contents of a directory are reported before the directory.
#
# The option is set on a shallow copy of the options hash. A hash supplied
# by the caller is therefore left untouched and can be reused with find()
# without becoming depth-first.
sub finddepth {
    my $wanted  = wrap_wanted(shift);
    my %options = (%$wanted, bydepth => 1);
    find_opt(\%options, @_);
}
|
||
|
|
||
|
# Per-platform defaults.  These are hard-coded for now, but may move to
# hint files.
if ($^O eq 'VMS') {
    $Is_VMS = 1;
    $dont_use_nlink = 1;
}

# Operating systems on which the link-count shortcut is switched off.
$dont_use_nlink = 1
    if grep { $^O eq $_ } ('os2', 'dos', 'amigaos', 'MSWin32');

# Set dont_use_nlink in your hint file if your system's stat doesn't
# report the number of links in a directory as an indication
# of the number of files.
# See, e.g. hints/machten.sh for MachTen 2.2.
if (!$dont_use_nlink) {
    require Config;
    if ($Config::Config{'dont_use_nlink'}) {
        $dont_use_nlink = 1;
    }
}
|
||
|
|
||
|
1;
|
||
|
|