source: trunk/gsdl/perllib/plugins/ArcPlug.pm@ 10168

Last change on this file since 10168 was 10156, checked in by davidb, 19 years ago

Extra functionality introduced to support incremental building.

  • Property svn:executable set to *
  • Property svn:keywords set to Author Date Id Revision
File size: 4.1 KB
Line 
1###########################################################################
2#
3# ArcPlug.pm --
4# A component of the Greenstone digital library software
5# from the New Zealand Digital Library Project at the
6# University of Waikato, New Zealand.
7#
8# Copyright (C) 1999 New Zealand Digital Library Project
9#
10# This program is free software; you can redistribute it and/or modify
11# it under the terms of the GNU General Public License as published by
12# the Free Software Foundation; either version 2 of the License, or
13# (at your option) any later version.
14#
15# This program is distributed in the hope that it will be useful,
16# but WITHOUT ANY WARRANTY; without even the implied warranty of
17# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
18# GNU General Public License for more details.
19#
20# You should have received a copy of the GNU General Public License
21# along with this program; if not, write to the Free Software
22# Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
23#
24###########################################################################
25
26# plugin which recurses through an archives.inf file
27# (i.e. the file generated in the archives directory
28# when an import is done), processing each file it finds
29
30# 12-05-02 Added usage datastructure - John Thompson
31
32package ArcPlug;
33
34use util;
35use BasPlug;
36use plugin;
37use arcinfo;
38use gsprintf;
39
40BEGIN {
41 @ArcPlug::ISA = ('BasPlug');
42}
43
44my $options = { 'name' => "ArcPlug",
45 'desc' => "{ArcPlug.desc}",
46 'abstract' => "no",
47 'inherits' => "yes" };
48
49sub gsprintf
50{
51 return &gsprintf::gsprintf(@_);
52}
53
54sub new {
55 my ($class) = @_;
56 my $self = new BasPlug ("ArcPlug", @_);
57
58 # 14-05-02 To allow for proper inheritance of arguments - John Thompson
59 my $option_list = $self->{'option_list'};
60 push( @{$option_list}, $options );
61
62 return bless $self, $class;
63}
64
65sub deinit {
66 my ($self) = @_;
67
68 my $archive_info = $self->{'archive_info'};
69
70 if (defined $archive_info) {
71 my $archive_info_filename = $self->{'archive_info_filename'};
72
73 my $file_list = $archive_info->get_file_list();
74
75 # change each file to "Been Indexed"
76
77 foreach my $subfile (@$file_list) {
78 my $doc_oid = $subfile->[1];
79 $index_status = $archive_info->get_status_info($doc_oid);
80 $archive_info->set_status_info($doc_oid,"B");
81 }
82
83 $archive_info->save_info($archive_info_filename);
84 }
85}
86
87# return 1 if this class might recurse using $pluginfo
88sub is_recursive {
89 my $self = shift (@_);
90
91 return 1;
92}
93
94
95
96
97# return number of files processed, undef if can't process
98# Note that $base_dir might be "" and that $file might
99# include directories
100sub read {
101 my $self = shift (@_);
102 my ($pluginfo, $base_dir, $file, $metadata, $processor, $maxdocs,$total_count, $gli) = @_;
103 my $outhandle = $self->{'outhandle'};
104
105 my $count = 0;
106
107 # see if this has a archives information file within it
108 my $archive_info_filename = &util::filename_cat($base_dir,$file,"archives.inf");
109 $self->{'archive_info_filename'} = $archive_info_filename;
110
111 if (-e $archive_info_filename) {
112
113 # found an archives.inf file
114 &gsprintf($outhandle, "ArcPlug: {common.processing} $archive_info_filename\n") if $self->{'verbosity'} > 1;
115
116 # read in the archives information file
117 my $archive_info = new arcinfo ();
118 $self->{'archive_info'} = $archive_info;
119
120 $archive_info->load_info ($archive_info_filename);
121
122 my $file_list = $archive_info->get_file_list();
123
124 # process each file
125 foreach my $subfile (@$file_list) {
126 last if ($maxdocs != -1 && ($total_count + $count) >= $maxdocs);
127
128 my $tmp = &util::filename_cat ($file, $subfile->[0]);
129 next if $tmp eq $file;
130
131 my $doc_oid = $subfile->[1];
132
133 $index_status = $archive_info->get_status_info($doc_oid);
134
135 my $processor_mode = $processor->get_mode();
136
137 if (($processor_mode eq "infodb") || ($index_status eq "I")) {
138
139 # note: metadata is not carried on to the next level
140 $count += &plugin::read ($pluginfo, $base_dir, $tmp, {}, $processor, $maxdocs, ($total_count+$count), $gli);
141 }
142
143 }
144
145 return $count;
146 }
147
148 # wasn't an archives directory, someone else will have to process it
149 return undef;
150}
151
1521;
Note: See TracBrowser for help on using the repository browser.