source: trunk/gsdl/perllib/plugins/RecPlug.pm@ 1482

Last change on this file since 1482 was 1424, checked in by sjboddie, 24 years ago

Added a -out option to most of the perl building scripts to allow output
debug information to be directed to a file.

  • Property svn:executable set to *
  • Property svn:keywords set to Author Date Id Revision
File size: 2.8 KB
Line 
1###########################################################################
2#
3# RecPlug.pm --
4# A component of the Greenstone digital library software
5# from the New Zealand Digital Library Project at the
6# University of Waikato, New Zealand.
7#
8# Copyright (C) 1999 New Zealand Digital Library Project
9#
10# This program is free software; you can redistribute it and/or modify
11# it under the terms of the GNU General Public License as published by
12# the Free Software Foundation; either version 2 of the License, or
13# (at your option) any later version.
14#
15# This program is distributed in the hope that it will be useful,
16# but WITHOUT ANY WARRANTY; without even the implied warranty of
17# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
18# GNU General Public License for more details.
19#
20# You should have received a copy of the GNU General Public License
21# along with this program; if not, write to the Free Software
22# Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
23#
24###########################################################################
25
26# plugin which recurses through directories processing
27# each file it finds
28
29package RecPlug;
30
31use BasPlug;
32use plugin;
33use util;
34
35
36BEGIN {
37 @ISA = ('BasPlug');
38}
39
40sub new {
41 my ($class) = @_;
42 my $self = new BasPlug ("RecPlug", @_);
43
44 $self->{'exclude_tail_dirs'} = []; # empty by default
45
46 return bless $self, $class;
47}
48
49# return 1 if this class might recurse using $pluginfo
50sub is_recursive {
51 my $self = shift (@_);
52
53 return 1;
54}
55
56
57# return number of files processed, undef if can't process
58# Note that $base_dir might be "" and that $file might
59# include directories
60sub read {
61 my $self = shift (@_);
62 my ($pluginfo, $base_dir, $file, $metadata, $processor, $maxdocs) = @_;
63 my $outhandle = $self->{'outhandle'};
64
65 foreach my $etd ( @{$self->{'exclude_tail_dirs'}} )
66 {
67 return 0 if ($file =~ m/$etd/);
68 }
69
70 my (@dir, $subfile);
71
72 my $count = 0;
73
74 # see if this is a directory
75 my $dirname = &util::filename_cat ($base_dir, $file);
76 if (-d $dirname) {
77
78 # read all the files in the directory
79 if (!opendir (DIR, $dirname))
80 {
81 print $outhandle "RecPlug: WARNING - couldn't read directory $dirname\n";
82 return;
83 }
84
85 @dir = readdir (DIR);
86 closedir (DIR);
87
88 print $outhandle "RecPlug: getting directory $dirname\n";
89
90 # process each file
91 foreach $subfile (@dir) {
92 last if ($maxdocs != -1 && $count >= $maxdocs);
93
94 if ($subfile !~ /^\.\.?$/) {
95 # note: metadata is not carried on to the next level
96 $count += &plugin::read ($pluginfo, $base_dir, &util::filename_cat($file, $subfile),
97 {}, $processor, $maxdocs);
98 }
99 }
100 return $count;
101 }
102
103 # wasn't a directory, someone else will have to process it
104 return undef;
105}
106
107
1081;
Note: See TracBrowser for help on using the repository browser.