###########################################################################
#
# plugin.pm -- functions to handle using plugins
# A component of the Greenstone digital library software
# from the New Zealand Digital Library Project at the
# University of Waikato, New Zealand.
#
# Copyright (C) 1999 New Zealand Digital Library Project
#
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; either version 2 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program; if not, write to the Free Software
# Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
#
###########################################################################
[4] | 25 |
|
---|
| 26 | package plugin;
|
---|
| 27 |
|
---|
[21307] | 28 |
|
---|
[7829] | 29 | use strict; # to pick up typos and undeclared variables...
|
---|
| 30 | no strict 'refs'; # ...but allow filehandles to be variables and vice versa
|
---|
[10579] | 31 | no strict 'subs';
|
---|
[7829] | 32 |
|
---|
[134] | 33 | require util;
|
---|
[27303] | 34 | use FileUtils;
|
---|
[7829] | 35 | use gsprintf 'gsprintf';
|
---|
[4] | 36 |
|
---|
# Backwards-compatibility table: legacy "xxPlug" plugin names that may still
# appear in a collection's config file, keyed to the name of the plugin that
# replaced them.  It can be removed at some time in the future, once the old
# names no longer need to be supported.
my $plugin_name_map = {
    'ArcPlug'      => 'ArchivesInfPlugin',
    'DBPlug'       => 'DatabasePlugin',
    'EMAILPlug'    => 'EmailPlugin',
    'GAPlug'       => 'GreenstoneXMLPlugin',
    'METSPlug'     => 'GreenstoneMETSPlugin',
    'NULPlug'      => 'NulPlugin',
    'PPTPlug'      => 'PowerPointPlugin',
    'PSPlug'       => 'PostScriptPlugin',
    'PagedImgPlug' => 'PagedImagePlugin',
    'RecPlug'      => 'DirectoryPlugin',
    'SRCPlug'      => 'SourceCodePlugin',
    'TEXTPlug'     => 'TextPlugin',
    'W3ImgPlug'    => 'HTMLImagePlugin',
    'XMLPlug'      => 'ReadXMLFile',
};
| 55 |
|
---|
# global variables

# Counters for the current run.  read() increments the two failure counters,
# and write_stats() hands the whole hash to each plugin's compile_stats()
# before reporting the totals.
my $stats = {
    map { $_ => 0 } qw(
        num_processed
        num_blocked
        num_not_processed
        num_not_recognised
        num_archives
    )
};

# These are (re)assigned by every call to load_plugins().
# $globaloptions contains any options that should be passed to all plugins.
my ($verbosity, $outhandle, $failhandle, $globaloptions);
[5682] | 66 |
|
---|
# Translate a plugin name as written in a config file into the name of the
# plugin module that should actually be loaded.
#
#   - a name listed in $plugin_name_map is replaced by its mapped value;
#   - any other name ending in "Plug" has that suffix turned into "Plugin";
#   - every other name is returned unchanged.
#
# Parameter: $pluginname - the (possibly legacy) plugin name.
# Returns:   the name to load.
sub get_valid_pluginname {
    my ($pluginname) = @_;

    if (defined $plugin_name_map->{$pluginname}) {
        return $plugin_name_map->{$pluginname};
    }

    my $valid_name = $pluginname;
    # The substitution is anchored so that only the trailing "Plug" is
    # rewritten.  Unanchored, it would hit the first "Plug" in the name and
    # turn e.g. "PlugTestPlug" into "PluginTestPlug".
    $valid_name =~ s/Plug$/Plugin/;

    return $valid_name;
}
[21290] | 78 |
|
---|
# Find the module file for $pluginname and load it with require().
#
# Candidate files are tried in this order; the first one that exists is used:
#   1. <GSDLCOLLECTDIR>/custom/<GSDLCOLLECTION>/perllib/plugins/
#      (only when GSDLCOLLECTION is set)
#   2. <GSDLCOLLECTDIR>/perllib/plugins/
#   3. <GSDLHOME>/ext/<name>/perllib/plugins/ for every name in the
#      colon-separated GSDLEXTS (only when GSDLEXTS is set)
#   4. <GSDL3SRCHOME>/ext/<name>/perllib/plugins/ for every name in the
#      colon-separated GSDL3EXTS (only when GSDL3EXTS is set)
#   5. <GSDLHOME>/perllib/plugins/
#
# Before the require, the perllib folder that contains the chosen file is
# put at the front of @INC, provided it exists and is not already listed.
#
# If no candidate exists, the problem is reported through gsprintf on STDERR
# and the sub dies with "\n".
sub load_plugin_require
{
    my ($pluginname) = @_;

    # pp_plugname is shorthand for 'perllib' 'plugins' '$pluginname.pm'
    my $pp_plugname
        = &FileUtils::filenameConcatenate('perllib', 'plugins', "${pluginname}.pm");
    my $collectdir = $ENV{'GSDLCOLLECTDIR'};

    my @check_list = ();

    # collection-specific locations come first
    if (defined($ENV{'GSDLCOLLECTION'})) {
        my $customplugname
            = &FileUtils::filenameConcatenate($collectdir, "custom", $ENV{'GSDLCOLLECTION'},
                                              $pp_plugname);
        push(@check_list, $customplugname);
    }
    my $colplugname = &FileUtils::filenameConcatenate($collectdir, $pp_plugname);
    push(@check_list, $colplugname);

    # then the extensions: each pair is (variable listing the extension
    # names, variable naming the install that holds their "ext" folder)
    foreach my $ext_source (['GSDLEXTS', 'GSDLHOME'], ['GSDL3EXTS', 'GSDL3SRCHOME']) {
        my ($list_var, $home_var) = @$ext_source;
        next unless defined $ENV{$list_var};

        my $ext_prefix = &FileUtils::filenameConcatenate($ENV{$home_var}, "ext");
        foreach my $ext_name (split(/:/, $ENV{$list_var})) {
            my $extplugname
                = &FileUtils::filenameConcatenate($ext_prefix, $ext_name, $pp_plugname);
            push(@check_list, $extplugname);
        }
    }

    # and finally the main installation
    my $mainplugname = &FileUtils::filenameConcatenate($ENV{'GSDLHOME'}, $pp_plugname);
    push(@check_list, $mainplugname);

    my $success = 0;
    foreach my $plugname (@check_list) {
        next unless &FileUtils::fileExists($plugname);

        # add the plugin's perllib folder to INC, unless it is already there
        my ($perllibfolder) = $plugname =~ /^(.*[\/\\]perllib)[\/\\]plugins/;
        if (&FileUtils::directoryExists($perllibfolder)) {
            my $already_listed = grep { $_ eq $perllibfolder } @INC;
            unshift(@INC, $perllibfolder) unless $already_listed;
        }

        require $plugname;
        $success = 1;
        last;
    }

    if (!$success) {
        &gsprintf(STDERR, "{plugin.could_not_find_plugin}\n",
                  $pluginname);
        die "\n";
    }
}
[10579] | 163 |
|
---|
# Load a plugin and construct it in "info" mode.
#
# Parameters:
#   $pluginname - plugin name; legacy names are translated by
#                 get_valid_pluginname()
#   $gs_version - value passed to the plugin after "-gs_version"
#
# Returns the object produced by the plugin's constructor, which is called
# as new([], ['-gsdlinfo', '-gs_version', $gs_version]).
# Dies if the plugin cannot be found (see load_plugin_require) or if the
# constructor dies.
sub load_plugin_for_info {
    my ($pluginname, $gs_version) = @_;

    $pluginname = &get_valid_pluginname($pluginname);
    load_plugin_require($pluginname);

    # The options are handed over as a real list.  Splicing $gs_version into
    # source text for a string eval would re-parse it as Perl: a value such
    # as "3.0.1" becomes a v-string, and other values may not compile at all.
    my @options = ('-gsdlinfo', '-gs_version');
    # An undefined or empty version adds no element, so "-gs_version" is
    # then the last option.
    push(@options, $gs_version) if (defined $gs_version && $gs_version ne '');

    # create a plugin object
    my $plugobj = eval { $pluginname->new([], \@options) };
    die "$@" if $@;

    return $plugobj;
}
| 178 |
|
---|
# Load and construct every plugin named in $plugin_list.
#
# Parameters:
#   $plugin_list      - ref to a list of array refs, each holding a plugin
#                       name followed by that plugin's options.  The name is
#                       shifted off and the options are quoted in place, so
#                       the caller's arrays are modified.
#   $verbosity        - stored in the module-level variable (default 2)
#   $outhandle        - stored in the module-level variable (default 'STDERR')
#   $failhandle       - stored in the module-level variable (default 'STDERR')
#   $globaloptions    - ref to a list of options appended to every plugin's
#                       own options; left unmodified
#   $incremental_mode - handed to each plugin's set_incremental()
#   $gs_version       - passed to each plugin after "-gs_version"
#   $site             - if true, passed to each plugin after "-site_name"
#
# Returns a ref to the list of plugin objects, in config order.  Each object
# has had init() and set_incremental() called on it.
# Dies if a plugin cannot be found or its constructor fails.
sub load_plugins {
    my ($plugin_list) = shift @_;
    my ($incremental_mode, $gs_version, $site);
    ($verbosity, $outhandle, $failhandle, $globaloptions, $incremental_mode, $gs_version, $site) = @_; # globals
    my @plugin_objects = ();
    $verbosity = 2 unless defined $verbosity;
    $outhandle = 'STDERR' unless defined $outhandle;
    $failhandle = 'STDERR' unless defined $failhandle;

    # before pushing collection perl and plugin directories onto INC, test that
    # they aren't already there [jmt12]
    &util::augmentINC(&FileUtils::filenameConcatenate($ENV{'GSDLCOLLECTDIR'},'perllib'));
    &util::augmentINC(&FileUtils::filenameConcatenate($ENV{'GSDLCOLLECTDIR'},'perllib','plugins'));

    # Quote copies of the global options.  Quoting the caller's array in
    # place would add another layer of quotes on every call that reuses it.
    my $globals = join (",", map { "\"$_\"" } @{ $globaloptions || [] });

    foreach my $pluginoptions (@$plugin_list) {
        my $pluginname = shift @$pluginoptions;
        next unless defined $pluginname;
        $pluginname = &get_valid_pluginname($pluginname);
        load_plugin_require($pluginname);

        # create a plugin object
        my ($plugobj);
        # put quotes around each option to the plugin, unless the option is already quoted
        foreach my $option (@$pluginoptions) {
            $option = "\"$option\"" unless ($option =~ m/^\s*\".*\"\s*$/);
        }
        my $site_option = $site ? "\"-site_name\",\"$site\"," : "";
        my $options = "$site_option"."-gs_version,$gs_version,".join (",", @$pluginoptions);
        if ($globals) {
            if (@$pluginoptions) {
                $options .= ",";
            }
            $options .= "$globals";
        }
        # need to escape backslash before putting in to the eval
        # but watch out for any \" (which shouldn't be further escaped)
        $options =~ s/\\([^"])/\\\\$1/g; #"
        $options =~ s/\$/\\\$/g;
        # '@' interpolates inside the double-quoted strings too, so an option
        # such as an e-mail address has to be protected just like '$'
        $options =~ s/\@/\\\@/g;

        # NOTE(review): the option list is still compiled as Perl source by
        # this string eval, so it must only ever come from trusted
        # configuration.
        eval ("\$plugobj = new \$pluginname([],[$options])");
        die "$@" if $@;

        # initialize plugin
        $plugobj->init($verbosity, $outhandle, $failhandle);

        $plugobj->set_incremental($incremental_mode);

        # add this object to the list
        push (@plugin_objects, $plugobj);
    }

    return \@plugin_objects;
}
| 233 |
|
---|
[835] | 234 |
|
---|
# Record the GLI flag on every plugin object, then call begin() on each
# plugin in list order.
#
# Parameters: $pluginfo (ref to the list of plugin objects), $base_dir,
# $processor and $maxdocs are passed on to each plugin's begin(); $gli is
# stored under the 'gli' key of each plugin object.
# Returns whatever the plugins' begin() methods returned, as one list.
sub begin {
    my ($pluginfo, $base_dir, $processor, $maxdocs, $gli) = @_;

    # every plugin is flagged before the first begin() runs
    foreach my $plugobj (@$pluginfo) {
        $plugobj->{'gli'} = $gli;
    }

    return map { $_->begin($pluginfo, $base_dir, $processor, $maxdocs) } @$pluginfo;
}
| 241 |
|
---|
# Call remove_all() on every plugin, in list order, passing on the plugin
# list, $base_dir, $processor and $maxdocs.
# Returns whatever the plugins' remove_all() methods returned, as one list.
sub remove_all {
    my ($pluginfo, $base_dir, $processor, $maxdocs) = @_;

    return map { $_->remove_all($pluginfo, $base_dir, $processor, $maxdocs) } @$pluginfo;
}
| 247 |
|
---|
# Ask the plugins to remove each file in @$deleted_files.
#
# Parameters:
#   $pluginfo      - ref to the list of plugin objects
#   $infodbtype    - info database type ("gdbm-txtgz" is treated as "gdbm")
#   $archivedir    - archives directory, passed to the database lookup and
#                    to each plugin's remove_one()
#   $deleted_files - ref to the list of deleted file paths
#
# For every file the 'archiveinf-src' info database is used to look up all
# the OIDs that the file is used in (in most cases just one).  The plugins
# are then tried in order until one returns a defined value other than -1
# from remove_one().
#
# Returns:
#   nothing (undef / empty list) when @$deleted_files is empty;
#   0 as soon as no plugin could process one of the files (a warning is
#     printed to STDERR and the remaining files are not attempted);
#   1 when every file was processed by some plugin.
sub remove_some {
    my ($pluginfo, $infodbtype, $archivedir, $deleted_files) = @_;
    return if (scalar(@$deleted_files)==0);
    $infodbtype = "gdbm" if $infodbtype eq "gdbm-txtgz";
    my $arcinfo_src_filename = &dbutil::get_infodb_file_path($infodbtype, "archiveinf-src", $archivedir);

    foreach my $file (@$deleted_files) {
        my $file_with_placeholders = &util::abspath_to_placeholders($file);
        my $src_rec = &dbutil::read_infodb_entry($infodbtype, $arcinfo_src_filename, $file_with_placeholders);
        my $oids = $src_rec->{'oid'};

        my $processed_file = 0; # set to 1 if a plugin could process the file and did so successfully
        foreach my $plugobj (@$pluginfo) {
            my $rv = $plugobj->remove_one($file, $oids, $archivedir);
            if (defined $rv && $rv != -1) {
                $processed_file = 1;
                last; # continue with the next deleted file
            } # else undefined (was not recognised by the plugin) or there was an error, try the next one
        }

        if (!$processed_file) { # no plugin could recognise file.
            # presumably 'oid' holds an array ref of OIDs (TODO confirm
            # against dbutil); expand it so the OIDs themselves are listed
            # rather than "ARRAY(0x...)", and tolerate a scalar or undef
            my @oid_list = (ref($oids) eq 'ARRAY') ? @$oids
                         : defined($oids)          ? ($oids)
                         :                           ();
            print STDERR "WARNING: plugin::remove_some() failed to process $file with oid(s) ". join(",", @oid_list) . "\n";
            return 0;
        } # else some plugin processed the current deleted file
    }

    return 1; # if we got here, all deleted files got processed successfully
}
[21307] | 285 |
|
---|
# Give every plugin a chance to look at $file via its file_block_read()
# method.  All plugins are called, in list order; the loop does not stop
# early.
#
# Parameters: $pluginfo (ref to the list of plugin objects), $base_dir,
# $file, $block_hash and $metadata are passed on to each plugin; $gli
# (default 0) additionally makes this sub announce the file on STDERR.
#
# Dies with "\n" if a ".kill" file exists in GSDLCOLLECTDIR.
sub file_block_read {
    my ($pluginfo, $base_dir, $file, $block_hash, $metadata, $gli) = @_;

    $gli = 0 unless defined $gli;

    # file sometimes starts with a / so get rid of it
    (my $glifile = $file) =~ s/^[\/\\]+//;

    # Announce to GLI that we are handling a file
    if ($gli) {
        print STDERR "<File n='$glifile'>\n";
    }

    # the .kill file is a handy (if not very elegant) way of aborting
    # an import.pl or buildcol.pl process
    if (&FileUtils::fileExists(&FileUtils::filenameConcatenate($ENV{'GSDLCOLLECTDIR'}, ".kill"))) {
        gsprintf($outhandle, "{plugin.kill_file}\n");
        die "\n";
    }

    my $rv = 0;
    foreach my $plugobj (@$pluginfo) {
        $rv = $plugobj->file_block_read($pluginfo, $base_dir, $file, $block_hash, $metadata, $gli);
    }
}
| 314 |
|
---|
| 315 |
|
---|
# Pass $file by each of the plugins in turn, via their metadata_read()
# method, until one of them handles it.
#
# A plugin's metadata_read() must return:
#   undef         - could not recognise the file
#   -1            - tried but hit an error
#   0             - blocked
#   anything else - successful processing
#
# The first defined result other than -1 is returned to the caller straight
# away.  A -1 is reported to the GLI (when $gli is set) and the next plugin
# is tried.  If no plugin produces such a result, 0 is returned.
#
# Dies with "\n" if a ".kill" file exists in GSDLCOLLECTDIR.
sub metadata_read {
    my ($pluginfo, $base_dir, $file, $block_hash,
        $extrametakeys, $extrametadata, $extrametafile,
        $processor, $gli, $aux) = @_;

    $gli = 0 unless defined $gli;

    # file sometimes starts with a / so get rid of it
    (my $glifile = $file) =~ s/^[\/\\]+//;

    # Announce to GLI that we are handling a file
    if ($gli) {
        print STDERR "<File n='$glifile'>\n";
    }

    # the .kill file is a handy (if not very elegant) way of aborting
    # an import.pl or buildcol.pl process
    if (&FileUtils::fileExists(&FileUtils::filenameConcatenate($ENV{'GSDLCOLLECTDIR'}, ".kill"))) {
        gsprintf($outhandle, "{plugin.kill_file}\n");
        die "\n";
    }

    foreach my $plugobj (@$pluginfo) {
        my $rv = $plugobj->metadata_read($pluginfo, $base_dir, $file, $block_hash,
                                         $extrametakeys, $extrametadata, $extrametafile,
                                         $processor, $gli, $aux);

        # undefined - was not recognised by the plugin
        next unless defined $rv;

        # blocked or processed: this plugin has dealt with the file
        return $rv if $rv != -1;

        # an error has occurred
        print STDERR "<ProcessingError n='$glifile'>\n" if $gli;
    }

    return 0;
}
| 366 |
|
---|
# Pass $file by each of the plugins in turn, via their read() method, until
# one of them processes it.
#
# A plugin's read() must return:
#   undef         - could not recognise the file
#   -1            - tried but hit an error
#   0             - blocked
#   anything else - successful processing
#
# The first defined result other than -1 is returned straight away.
# Otherwise the failure is reported (to $outhandle when the verbosity is 2
# or more, to the GLI when $gli is set, and always to $failhandle), the
# matching counter in $stats is incremented, and 0 is returned.  The file
# counts as "not processed" if any plugin returned -1 and as "not
# recognised" if every plugin returned undef.
#
# $maxdocs defaults to -1 and $total_count to 0 when they are undefined or
# contain no digit; $gli defaults to 0.
#
# Dies with "\n" if a ".kill" file exists in GSDLCOLLECTDIR.
sub read {
    my ($pluginfo, $base_dir, $file, $block_hash, $metadata, $processor, $maxdocs, $total_count, $gli, $aux) = @_;

    $maxdocs = -1 unless defined $maxdocs && $maxdocs =~ /\d/;
    $total_count = 0 unless defined $total_count && $total_count =~ /\d/;
    $gli = 0 unless defined $gli;

    # file sometimes starts with a / so get rid of it
    (my $glifile = $file) =~ s/^[\/\\]+//;

    # Announce to GLI that we are handling a file
    if ($gli) {
        print STDERR "<File n='$glifile'>\n";
    }

    # the .kill file is a handy (if not very elegant) way of aborting
    # an import.pl or buildcol.pl process
    if (&FileUtils::fileExists(&FileUtils::filenameConcatenate($ENV{'GSDLCOLLECTDIR'}, ".kill"))) {
        gsprintf($outhandle, "{plugin.kill_file}\n");
        die "\n";
    }

    my $had_error = 0;
    foreach my $plugobj (@$pluginfo) {
        my $rv = $plugobj->read($pluginfo, $base_dir, $file,
                                $block_hash, $metadata, $processor, $maxdocs,
                                $total_count, $gli, $aux);

        # undefined - was not recognised by the plugin
        next unless defined $rv;

        # blocked or processed: this plugin has dealt with the file
        return $rv unless $rv == -1;

        # an error has occurred
        $had_error = 1;
    }

    # Nothing handled the file.  Choose the wording and the counter:
    # recognised but couldn't be processed, or not recognised at all.
    my ($console_message, $gli_message, $faillog_message, $counter) = $had_error
        ? ("{plugin.no_plugin_could_process}\n",
           "<NonProcessedFile n='$glifile'>\n",
           "$file: {plugin.no_plugin_could_process_this_file}\n",
           'num_not_processed')
        : ("{plugin.no_plugin_could_recognise}\n",
           "<NonRecognisedFile n='$glifile'>\n",
           "$file: {plugin.no_plugin_could_recognise_this_file}\n",
           'num_not_recognised');

    if ($verbosity >= 2) {
        gsprintf($outhandle, $console_message, $file);
    }
    # tell the GLI that it was not processed
    print STDERR $gli_message if $gli;

    gsprintf($failhandle, $faillog_message);
    $stats->{$counter} ++;

    return 0;
}
| 437 |
|
---|
# Write out some general statistics that the plugins have compiled.  Note
# that the buildcol.pl process doesn't currently call this sub, so the
# statistics are only output after import.pl.
#
# Parameters:
#   $pluginfo    - ref to the list of plugin objects; each one's
#                  compile_stats() is called with the shared $stats hash
#   $statshandle - handle the summary is written to through gsprintf
#   $faillog     - passed along with the "see fail log" message
#   $gli         - if true, an <ImportComplete ...> line is also printed to
#                  STDERR (default 0)
sub write_stats {
    my ($pluginfo, $statshandle, $faillog, $gli) = @_;

    $gli = 0 unless defined $gli;

    foreach my $plugobj (@$pluginfo) {
        $plugobj->compile_stats($stats);
    }

    # the counters are read only after every plugin has contributed
    my ($processed, $blocked, $rejected, $unrecognised, $archives)
        = @{$stats}{'num_processed', 'num_blocked', 'num_not_processed',
                    'num_not_recognised', 'num_archives'};
    my $total = $processed + $blocked + $rejected + $unrecognised;

    if ($gli) {
        print STDERR "<ImportComplete considered='$total' processed='$processed' blocked='$blocked' ignored='$unrecognised' failed='$rejected'>\n";
    }

    # Emit the singular message for a count of exactly one; otherwise emit
    # the plural message with the count as its argument.
    my $report = sub {
        my ($count, $one_message, $many_message) = @_;
        if ($count == 1) {
            gsprintf($statshandle, $one_message);
        }
        else {
            gsprintf($statshandle, $many_message, $count);
        }
        return;
    };

    $report->($total, "* {plugin.one_considered}\n", "* {plugin.n_considered}\n");
    if ($archives) {
        $report->($archives, " ({plugin.including_archive})\n", " ({plugin.including_archives})\n");
    }
    $report->($processed, "* {plugin.one_included}\n", "* {plugin.n_included}\n");
    if ($unrecognised) {
        $report->($unrecognised, "* {plugin.one_unrecognised}\n", "* {plugin.n_unrecognised}\n");
    }
    if ($rejected) {
        $report->($rejected, "* {plugin.one_rejected}\n", "* {plugin.n_rejected}\n");
    }

    if ($rejected || $unrecognised) {
        gsprintf($statshandle, " {plugin.see_faillog}\n", $faillog);
    }
}
| 495 |
|
---|
# Call end() on every plugin, in list order, passing $processor.
# Returns whatever the plugins' end() methods returned, as one list.
sub end {
    my ($pluginfo, $processor) = @_;

    return map { $_->end($processor) } @$pluginfo;
}
[4] | 500 |
|
---|
# Call deinit() on every plugin, in list order, passing $processor.
# Returns whatever the plugins' deinit() methods returned, as one list.
sub deinit {
    my ($pluginfo, $processor) = @_;

    return map { $_->deinit($processor) } @$pluginfo;
}
| 507 |
|
---|
[4] | 508 | 1;
|
---|