Changeset 6407
- Timestamp:
- 2004-01-09T15:33:33+13:00 (20 years ago)
- Location:
- trunk/gsdl
- Files:
-
- 5 edited
Legend:
- Unmodified
- Added
- Removed
-
trunk/gsdl/bin/script/buildcol.pl
r6331 r6407 57 57 58 58 my $arguments = 59 [ { 'name' => "archivedir", 59 [ { 'name' => "allclassifications", 60 'desc' => "{buildcol.allclassifications}", 61 'type' => "flag", 62 'reqd' => "no", 63 'modegli' => "2" }, 64 { 'name' => "archivedir", 60 65 'desc' => "{buildcol.archivedir}", 61 66 'type' => "string", 62 'reqd' => "no" }, 63 { 'name' => "verbosity", 64 'desc' => "{buildcol.verbosity}", 65 'type' => "int", 66 'deft' => "2", 67 'reqd' => "no" }, 67 'reqd' => "no", 68 'hiddengli' => "yes" }, 68 69 { 'name' => "builddir", 69 70 'desc' => "{buildcol.builddir}", 70 71 'type' => "string", 71 'reqd' => "no" }, 72 'reqd' => "no", 73 'hiddengli' => "yes" }, 72 74 # { 'name' => "cachedir", 73 75 # 'desc' => "{buildcol.cachedir}", 74 76 # 'type' => "string", 75 77 # 'reqd' => "no" }, 78 { 'name' => "collectdir", 79 'desc' => "{buildcol.collectdir}", 80 'type' => "string", 81 'deft' => &util::filename_cat ($ENV{'GSDLHOME'}, "collect"), 82 'reqd' => "no", 83 'hiddengli' => "yes" }, 84 { 'name' => "create_images", 85 'desc' => "{buildcol.create_images}", 86 'type' => "flag", 87 'reqd' => "no", 88 'modegli' => "4" }, 89 { 'name' => "debug", 90 'desc' => "{buildcol.debug}", 91 'type' => "flag", 92 'reqd' => "no", 93 'hiddengli' => "yes" }, 94 { 'name' => "faillog", 95 'desc' => "{buildcol.faillog}", 96 'type' => "string", 97 'deft' => &util::filename_cat("<collectdir>", "colname", "etc", "fail.log"), 98 'reqd' => "no", 99 'modegli' => "4" }, 100 { 'name' => "index", 101 'desc' => "{buildcol.index}", 102 'type' => "string", 103 'reqd' => "no", 104 'modegli' => "3" }, 105 { 'name' => "keepold", 106 'desc' => "{buildcol.keepold}", 107 'type' => "flag", 108 'reqd' => "no", 109 'hiddengli' => "yes" }, 110 { 'name' => "language", 111 'desc' => "{scripts.language}", 112 'type' => "string", 113 'reqd' => "no", 114 'modegli' => "4" }, 76 115 { 'name' => "maxdocs", 77 116 'desc' => "{buildcol.maxdocs}", 78 117 'type' => "int", 79 'reqd' => "no" }, 80 { 'name' => "debug", 81 'desc' => "{buildcol.debug}", 82 'type' => "flag", 83 'reqd' => "no" }, 118 'reqd' => "no", 119 'hiddengli' => "yes" }, 84 120 { 'name' => "mode", 85 121 'desc' => "{buildcol.mode}", … … 87 123 'list' => $mode_list, 88 124 'deft' => "all", 89 'reqd' => "no" }, 90 { 'name' => "index", 91 'desc' => "{buildcol.index}", 92 'type' => "string", 93 'reqd' => "no" }, 94 { 'name' => "keepold", 95 'desc' => "{buildcol.keepold}", 125 'reqd' => "no", 126 'modegli' => "4" }, 127 { 'name' => "no_strip_html", 128 'desc' => "{buildcol.no_strip_html}", 96 129 'type' => "flag", 97 'reqd' => "no" }, 130 'reqd' => "no", 131 'modegli' => "4" }, 98 132 { 'name' => "no_text", 99 133 'desc' => "{buildcol.no_text}", 100 134 'type' => "flag", 101 'reqd' => "no" }, 102 { 'name' => "allclassifications", 103 'desc' => "{buildcol.allclassifications}", 104 'type' => "flag", 105 'reqd' => "no" }, 106 { 'name' => "create_images", 107 'desc' => "{buildcol.create_images}", 108 'type' => "flag", 109 'reqd' => "no" }, 110 { 'name' => "collectdir", 111 'desc' => "{buildcol.collectdir}", 112 'type' => "string", 113 'deft' => &util::filename_cat ($ENV{'GSDLHOME'}, "collect"), 114 'reqd' => "no" }, 135 'reqd' => "no", 136 'modegli' => "3" }, 115 137 { 'name' => "out", 116 138 'desc' => "{buildcol.out}", 117 139 'type' => "string", 118 140 'deft' => "STDERR", 119 'reqd' => "no" }, 120 { 'name' => "no_strip_html", 121 'desc' => "{buildcol.no_strip_html}", 122 'type' => "flag", 123 'reqd' => "no" }, 124 { 'name' => "faillog", 125 'desc' => "{buildcol.faillog}", 126 'type' => "string", 127 'deft' => &util::filename_cat("<collectdir>", "colname", "etc", "fail.log"), 128 'reqd' => "no" }, 129 { 'name' => "language", 130 'desc' => "{scripts.language}", 131 'type' => "string", 132 'reqd' => "no" } ]; 141 'reqd' => "no", 142 'hiddengli' => "yes" }, 143 { 'name' => "verbosity", 144 'desc' => "{buildcol.verbosity}", 145 'type' => "int", 146 'deft' => "2", 147 'reqd' => "no", 148 'modegli' => "4" } ]; 133 149 134 150 my $options = { 'name' => "buildcol.pl", … … 490 506 close OUT if $close_out; 491 507 close FAILLOG; 508 509 print STDERR "</Build>\n" if $gli; 492 510 } 493 511 -
trunk/gsdl/bin/script/import.pl
r6330 r6407 56 56 'desc' => "{import.OIDtype.incremental}" } ]; 57 57 58 # Possible attributes for each argument 59 # name: The name of the argument 60 # desc: A description (or more likely a reference to a description) for this argument 61 # type: The type of control used to represent the argument. Options include: string, int, flag, regexp, metadata, metadatum, language, enum etc 62 # reqd: Is this argument required? 63 # hiddengli: Is this argument hidden in GLI? 64 # modegli: The lowest detail mode this argument is visible at in GLI 65 58 66 my $arguments = 59 67 [ { 'name' => "archivedir", 60 68 'desc' => "{import.achivedir}", 61 69 'type' => "string", 62 'reqd' => "no" }, 70 'reqd' => "no", 71 'hiddengli' => "yes" }, 63 72 { 'name' => "collectdir", 64 73 'desc' => "{import.collectdir}", 65 74 'type' => "string", 66 75 'deft' => &util::filename_cat ($ENV{'GSDLHOME'}, "collect"), 67 'reqd' => "no" }, 76 'reqd' => "no", 77 'hiddengli' => "yes" }, 68 78 { 'name' => "debug", 69 79 'desc' => "{import.debug}", 70 80 'type' => "flag", 71 'reqd' => "no" }, 81 'reqd' => "no", 82 'hiddengli' => "yes" }, 72 83 { 'name' => "faillog", 73 84 'desc' => "{import.faillog}", 74 85 'type' => "string", 75 86 'deft' => &util::filename_cat("<collectdir>", "colname", "etc", "fail.log"), 76 'reqd' => "no" }, 87 'reqd' => "no", 88 'modegli' => "4" }, 77 89 { 'name' => "groupsize", 78 90 'desc' => "{import.groupsize}", 79 91 'type' => "int", 80 92 'deft' => "1", 81 'reqd' => "no" }, 93 'reqd' => "no", 94 'modegli' => "3" }, 82 95 { 'name' => "gzip", 83 96 'desc' => "{import.gzip}", 84 97 'type' => "flag", 85 'reqd' => "no" }, 98 'reqd' => "no", 99 'modegli' => "4" }, 86 100 { 'name' => "importdir", 87 101 'desc' => "{import.importdir}", 88 102 'type' => "string", 89 'reqd' => "no" }, 103 'reqd' => "no", 104 'hiddengli' => "yes" }, 90 105 { 'name' => "keepold", 91 106 'desc' => "{import.keepold}", 92 107 'type' => "flag", 93 'reqd' => "no" }, 108 'reqd' => "no", 109 'hiddengli' => "yes" }, 110 { 'name' => "language", 111 'desc' => "{scripts.language}", 112 'type' => "string", 113 'reqd' => "no", 114 'modegli' => "4" }, 94 115 { 'name' => "maxdocs", 95 116 'desc' => "{import.maxdocs}", 96 117 'type' => "int", 97 'reqd' => "no" }, 118 'reqd' => "no", 119 'modegli' => "1" }, 98 120 { 'name' => "OIDtype", 99 121 'desc' => "{import.OIDtype}", … … 101 123 'list' => $oidtype_list, 102 124 'deft' => "hash", 103 'reqd' => "no" }, 125 'reqd' => "no", 126 'modegli' => "3" }, 104 127 { 'name' => "out", 105 128 'desc' => "{import.out}", 106 129 'type' => "string", 107 130 'deft' => "STDERR", 108 'reqd' => "no" }, 131 'reqd' => "no", 132 'hiddengli' => "yes" }, 109 133 { 'name' => "removeold", 110 134 'desc' => "{import.removeold}", 111 135 'type' => "flag", 112 'reqd' => "no" }, 136 'reqd' => "no", 137 'modegli' => "3" }, 113 138 { 'name' => "sortmeta", 114 139 'desc' => "{import.sortmeta}", 115 'type' => "string", 116 'reqd' => "no" }, 140 'type' => "metadata", 141 'reqd' => "no", 142 'modegli' => "2" }, 117 143 { 'name' => "statsfile", 118 144 'desc' => "{import.statsfile}", 119 145 'type' => "string", 120 146 'deft' => "STDERR", 121 'reqd' => "no" }, 147 'reqd' => "no", 148 'hiddengli' => "yes" }, 122 149 { 'name' => "verbosity", 123 150 'desc' => "{import.verbosity}", … … 125 152 'range' => "0,3", 126 153 'deft' => "2", 127 'reqd' => "no" }, 128 { 'name' => "language", 129 'desc' => "{scripts.language}", 130 'type' => "string", 131 'reqd' => "no" } ]; 154 'reqd' => "no", 155 'modegli' => "4" } ]; 132 156 133 157 my $options = { 'name' => "import.pl", -
trunk/gsdl/perllib/mgbuilder.pm
r6332 r6407 240 240 # -b $maxdocsize sets the maximum document size to be 12 meg 241 241 print $outhandle "\n collecting text statistics\n" if ($self->{'verbosity'} >= 1); 242 print STDERR "<Phase name='CollectTextStats' >\n" if $self->{'gli'};242 print STDERR "<Phase name='CollectTextStats'/>\n" if $self->{'gli'}; 243 243 244 244 my ($handle); … … 248 248 if (!-e "$mg_passes_exe" || 249 249 !open (PIPEOUT, "| mg_passes$exe -f \"$fulltextprefix\" -b $maxdocsize -T1 -M $maxnumeric $osextra")) { 250 print STDERR "<FatalError name='NoRunMGPasses'>\n</Stage>\n" if $self->{'gli'}; 250 251 die "mgbuilder::compress_text - couldn't run $mg_passes_exe\n"; 251 252 } … … 280 281 if (!$self->{'debug'}) { 281 282 print $outhandle "\n creating the compression dictionary\n" if ($self->{'verbosity'} >= 1); 282 print STDERR "<Phase name='CreatingCompress' >\n" if $self->{'gli'};283 print STDERR "<Phase name='CreatingCompress'/>\n" if $self->{'gli'}; 283 284 if (!-e "$mg_compression_dict_exe") { 284 285 die "mgbuilder::compress_text - couldn't run $mg_compression_dict_exe\n"; … … 289 290 if (!-e "$mg_passes_exe" || 290 291 !open ($handle, "| mg_passes$exe -f \"$fulltextprefix\" -b $maxdocsize -T2 -M $maxnumeric $osextra")) { 292 print STDERR "<FatalError name='NoRunMGPasses'/>\n</Stage>\n" if $self->{'gli'}; 291 293 die "mgbuilder::compress_text - couldn't run $mg_passes_exe\n"; 292 294 } 293 295 } 294 296 else { 295 print STDERR "<Phase name='SkipCreatingComp' >\n" if $self->{'gli'};297 print STDERR "<Phase name='SkipCreatingComp'/>\n" if $self->{'gli'}; 296 298 } 297 299 … … 299 301 # compress the text 300 302 print $outhandle "\n compressing the text\n" if ($self->{'verbosity'} >= 1); 301 print STDERR "<Phase name='CompressingText' >\n" if $self->{'gli'};303 print STDERR "<Phase name='CompressingText'/>\n" if $self->{'gli'}; 302 304 303 305 &plugin::read ($self->{'pluginfo'}, $self->{'source_dir'}, … … 306 308 307 309 $self->print_stats(); 310 print STDERR "</Stage>\n" if $self->{'gli'}; 308 311 } 309 312 … … 346 349 print $outhandle "\n*** building index $index in subdirectory " . 347 350 "$self->{'index_mapping'}->{$index}\n" if ($self->{'verbosity'} >= 1); 348 print STDERR "< Phase name='Index' source='$index'>\n" if $self->{'gli'};351 print STDERR "<Stage name='Index' source='$index'>\n" if $self->{'gli'}; 349 352 $self->build_index($index); 350 353 } else { … … 569 572 # Build index dictionary. Uses verbatim stem method 570 573 print $outhandle "\n creating index dictionary\n" if ($self->{'verbosity'} >= 1); 571 print STDERR "< Stage name='CreatingIndexDic'>\n" if $self->{'gli'};574 print STDERR "<Phase name='CreatingIndexDic'/>\n" if $self->{'gli'}; 572 575 my ($handle); 573 576 if ($self->{'debug'}) { … … 577 580 !open (PIPEOUT, "| mg_passes$exe -f \"$fullindexprefix\" -b $maxdocsize " . 578 581 "-$index_level -m 32 -s 0 -G -t 10 -N1 -M $maxnumeric $osextra")) { 582 print STDERR "<FatalError name='NoRunMGPasses'/>\n</Stage>\n" if $self->{'gli'}; 579 583 die "mgbuilder::build_index - couldn't run $mg_passes_exe\n"; 580 584 } … … 607 611 # create the perfect hash function 608 612 if (!-e "$mg_perf_hash_build_exe") { 613 print STDERR "<FatalError name='NoRunMGHash'/>\n</Stage>\n" if $self->{'gli'}; 609 614 die "mgbuilder::build_index - couldn't run $mg_perf_hash_build_exe\n"; 610 615 } … … 614 619 !open ($handle, "| mg_passes$exe -f \"$fullindexprefix\" -b $maxdocsize " . 615 620 "-$index_level -c 3 -G -t 10 -N2 -M $maxnumeric $osextra")) { 621 print STDERR "<FatalError name='NoRunMGPasses'/>\n</Stage>\n" if $self->{'gli'}; 616 622 die "mgbuilder::build_index - couldn't run $mg_passes_exe\n"; 617 623 } … … 620 626 # invert the text 621 627 print $outhandle "\n inverting the text\n" if ($self->{'verbosity'} >= 1); 622 print STDERR "< Stage name='InvertingText'>\n" if $self->{'gli'};628 print STDERR "<Phase name='InvertingText'/>\n" if $self->{'gli'}; 623 629 $self->{'buildproc'}->reset(); 624 630 &plugin::read ($self->{'pluginfo'}, $self->{'source_dir'}, … … 633 639 # create the weights file 634 640 print $outhandle "\n create the weights file\n" if ($self->{'verbosity'} >= 1); 635 print STDERR "< Stage name='CreateTheWeights'>\n" if $self->{'gli'};641 print STDERR "<Phase name='CreateTheWeights'/>\n" if $self->{'gli'}; 636 642 if (!-e "$mg_weights_build_exe") { 643 print STDERR "<FatalError name='NoRunMGWeights'/>\n</Stage>\n" if $self->{'gli'}; 637 644 die "mgbuilder::build_index - couldn't run $mg_weights_build_exe\n"; 638 645 } … … 641 648 # create 'on-disk' stemmed dictionary 642 649 print $outhandle "\n creating 'on-disk' stemmed dictionary\n" if ($self->{'verbosity'} >= 1); 643 print STDERR "< Stage name='CreateStemmedDic'>\n" if $self->{'gli'};650 print STDERR "<Phase name='CreateStemmedDic'/>\n" if $self->{'gli'}; 644 651 if (!-e "$mg_invf_dict_exe") { 652 print STDERR "<FatalError name='NoRunMGInvf'/>\n</Stage>\n" if $self->{'gli'}; 645 653 die "mgbuilder::build_index - couldn't run $mg_invf_dict_exe\n"; 646 654 } … … 650 658 # creates stem index files for the various stemming methods 651 659 print $outhandle "\n creating stem indexes\n" if ($self->{'verbosity'} >= 1); 652 print STDERR "< Stage name='CreatingStemIndx'>\n" if $self->{'gli'};660 print STDERR "<Phase name='CreatingStemIndx'/>\n" if $self->{'gli'}; 653 661 if (!-e "$mg_stem_idx_exe") { 662 print STDERR "<FatalError name='NoRunMGStem'/>\n</Stage>\n" if $self->{'gli'}; 654 663 die "mgbuilder::build_index - couldn't run $mg_stem_idx_exe\n"; 655 664 } … … 673 682 closedir (DIR); 674 683 } 684 print STDERR "</Stage>\n" if $self->{'gli'}; 675 685 } 676 686 … … 696 706 print $outhandle "\n*** creating the info database and processing associated files\n" 697 707 if ($self->{'verbosity'} >= 1); 698 print STDERR "< Phase name='CreateInfoData'>\n" if $self->{'gli'};708 print STDERR "<Stage name='CreateInfoData'>\n" if $self->{'gli'}; 699 709 700 710 # init all the classifiers 701 711 &classify::init_classifiers ($self->{'classifiers'}); 702 712 703 704 713 # set up the document processor 705 714 my ($handle); … … 708 717 } else { 709 718 if (!-e "$txt2db_exe" || !open (PIPEOUT, "| txt2db$exe \"$fulldbname\"")) { 719 print STDERR "<FatalError name='NoRunText2DB'/>\n</Stage>\n" if $self->{'gli'}; 710 720 die "mgbuilder::make_infodatabase - couldn't run $txt2db_exe\n"; 711 721 } … … 781 791 782 792 print $handle "\n" . ('-' x 70) . "\n"; 783 784 } 785 793 } 786 794 787 795 &plugin::read ($self->{'pluginfo'}, $self->{'source_dir'}, … … 806 814 807 815 close ($handle) if !$self->{'debug'}; 816 817 print STDERR "</Stage>\n" if $self->{'gli'}; 808 818 } 809 819 … … 819 829 820 830 print $outhandle "\n*** creating auxiliary files \n" if ($self->{'verbosity'} >= 1); 821 print STDERR "< Phase name='CreatingAuxilary'>\n" if $self->{'gli'};831 print STDERR "<Stage name='CreatingAuxilary'>\n" if $self->{'gli'}; 822 832 823 833 # get the text directory … … 891 901 '^(indexmap|subcollectionmap|languagemap|notbuilt)$'); 892 902 903 print STDERR "</Stage>\n" if $self->{'gli'}; 893 904 } 894 905 … … 923 934 print $outhandle " Was this your intention?\n"; 924 935 print $outhandle "***************\n"; 936 print STDERR "<Warning name='LittleOrNoText'>\n" if $self->{'gli'}; 925 937 } 926 938 } -
trunk/gsdl/perllib/mgppbuilder.pm
r5935 r6407 110 110 my ($class, $collection, $source_dir, $build_dir, $verbosity, 111 111 $maxdocs, $debug, $keepold, $allclassifications, 112 $outhandle, $no_text ) = @_;112 $outhandle, $no_text, $gli) = @_; 113 113 114 114 $outhandle = STDERR unless defined $outhandle; … … 127 127 'no_text'=>$no_text, 128 128 'notbuilt'=>{}, # indexes not built 129 'indexfieldmap'=>\%static_indexfield_map 129 'indexfieldmap'=>\%static_indexfield_map, 130 'gli'=>$gli 130 131 }, $class; 131 132 133 $self->{'gli'} = 0 unless defined $self->{'gli'}; 132 134 133 135 # read in the collection configuration file … … 318 320 319 321 print $outhandle "\n*** creating the compressed text\n" if ($self->{'verbosity'} >= 1); 322 print STDERR "<Stage name='CompressText'>\n" if $self->{'gli'}; 320 323 321 324 # collect the statistics for the text 322 325 # -b $maxdocsize sets the maximum document size to be 12 meg 323 326 print $outhandle "\n collecting text statistics (mgpp_passes -T1)\n" if ($self->{'verbosity'} >= 1); 327 print STDERR "<Phase name='CollectTextStats'/>\n" if $self->{'gli'}; 324 328 325 329 my ($handle); … … 330 334 if (!-e "$mgpp_passes_exe" || 331 335 !open (PIPEOUT, "| mgpp_passes$exe $mgpp_passes_sections -f \"$fulltextprefix\" -T1 $osextra")) { 336 print STDERR "<FatalError name='NoRunMGPasses'>\n</Stage>\n" if $self->{'gli'}; 332 337 die "mgppbuilder::compress_text - couldn't run $mgpp_passes_exe\n"; 333 338 } … … 365 370 if (!$self->{'debug'}) { 366 371 print $outhandle "\n creating the compression dictionary\n" if ($self->{'verbosity'} >= 1); 372 print STDERR "<Phase name='CreatingCompress'/>\n" if $self->{'gli'}; 367 373 if (!-e "$mgpp_compression_dict_exe") { 374 print STDERR "<FatalError name='NoRunMGCompress'/>\n</Stage>\n" if $self->{'gli'}; 368 375 die "mgppbuilder::compress_text - couldn't run $mgpp_compression_dict_exe\n"; 369 376 } … … 374 381 if (!-e "$mgpp_passes_exe" || 375 382 !open ($handle, "| mgpp_passes$exe $mgpp_passes_sections -f \"$fulltextprefix\" -T2 $osextra")) { 383 print STDERR "<FatalError name='NoRunMGPasses'/>\n</Stage>\n" if $self->{'gli'}; 376 384 die "mgppbuilder::compress_text - couldn't run $mgpp_passes_exe\n"; 377 385 } 378 386 } 387 } 388 else { 389 print STDERR "<Phase name='SkipCreatingComp'/>\n" if $self->{'gli'}; 379 390 } 380 391 … … 382 393 # compress the text 383 394 print $outhandle "\n compressing the text (mgpp_passes -T2)\n" if ($self->{'verbosity'} >= 1); 395 print STDERR "<Phase name='CompressingText'/>\n" if $self->{'gli'}; 396 384 397 &plugin::read ($self->{'pluginfo'}, $self->{'source_dir'}, 385 398 "", {}, $self->{'buildproc'}, $self->{'maxdocs'}); … … 387 400 388 401 $self->print_stats(); 402 print STDERR "</Stage>\n" if $self->{'gli'}; 389 403 } 390 404 … … 427 441 print $outhandle "\n*** building index $index in subdirectory " . 428 442 "$self->{'index_mapping'}->{$index}\n" if ($self->{'verbosity'} >= 1); 443 print STDERR "<Stage name='Index' source='$index'>\n" if $self->{'gli'}; 429 444 $self->build_index($index); 430 445 } else { … … 656 671 # Build index dictionary. Uses verbatim stem method 657 672 print $outhandle "\n creating index dictionary (mgpp_passes -I1)\n" if ($self->{'verbosity'} >= 1); 673 print STDERR "<Phase name='CreatingIndexDic'/>\n" if $self->{'gli'}; 658 674 my ($handle); 659 675 if ($self->{'debug'}) { … … 662 678 if (!-e "$mgpp_passes_exe" || 663 679 !open (PIPEOUT, "| mgpp_passes$exe $mgpp_passes_sections -f \"$fullindexprefix\" -I1 $osextra")) { 680 print STDERR "<FatalError name='NoRunMGPasses'/>\n</Stage>\n" if $self->{'gli'}; 664 681 die "mgppbuilder::build_index - couldn't run $mgpp_passes_exe\n"; 665 682 } … … 687 704 if (!-e $dict_file) { 688 705 print $outhandle "mgppbuilder::build_index - Couldn't create index $index\n"; 706 print STDERR "<Warning name='NoIndex'/>\n</Stage>\n" if $self->{'gli'}; 689 707 $self->{'notbuilt'}->{$index}=1; 690 708 return; … … 694 712 # create the perfect hash function 695 713 if (!-e "$mgpp_perf_hash_build_exe") { 714 print STDERR "<FatalError name='NoRunMGHash'/>\n</Stage>\n" if $self->{'gli'}; 696 715 die "mgppbuilder::build_index - couldn't run $mgpp_perf_hash_build_exe\n"; 697 716 } … … 700 719 if (!-e "$mgpp_passes_exe" || 701 720 !open ($handle, "| mgpp_passes$exe $mgpp_passes_sections -f \"$fullindexprefix\" -I2 $osextra")) { 721 print STDERR "<FatalError name='NoRunMGPasses'/>\n</Stage>\n" if $self->{'gli'}; 702 722 die "mgppbuilder::build_index - couldn't run $mgpp_passes_exe\n"; 703 723 } … … 706 726 # invert the text 707 727 print $outhandle "\n inverting the text (mgpp_passes -I2)\n" if ($self->{'verbosity'} >= 1); 708 728 print STDERR "<Phase name='InvertingText'/>\n" if $self->{'gli'}; 709 729 $self->{'buildproc'}->reset(); 710 730 &plugin::read ($self->{'pluginfo'}, $self->{'source_dir'}, … … 719 739 # create the weights file 720 740 print $outhandle "\n create the weights file\n" if ($self->{'verbosity'} >= 1); 741 print STDERR "<Phase name='CreateTheWeights'/>\n" if $self->{'gli'}; 721 742 if (!-e "$mgpp_weights_build_exe") { 743 print STDERR "<FatalError name='NoRunMGWeights'/>\n</Stage>\n" if $self->{'gli'}; 722 744 die "mgppbuilder::build_index - couldn't run $mgpp_weights_build_exe\n"; 723 745 } … … 727 749 print $outhandle "\n creating 'on-disk' stemmed dictionary\n" if ($self->{'verbosity'} >= 1); 728 750 if (!-e "$mgpp_invf_dict_exe") { 751 print STDERR "<FatalError name='NoRunMGInvf'/>\n</Stage>\n" if $self->{'gli'}; 729 752 die "mgppbuilder::build_index - couldn't run $mgpp_invf_dict_exe\n"; 730 753 } … … 734 757 # creates stem index files for the various stemming methods 735 758 print $outhandle "\n creating stem indexes\n" if ($self->{'verbosity'} >= 1); 759 print STDERR "<Phase name='CreatingStemIndx'/>\n" if $self->{'gli'}; 736 760 if (!-e "$mgpp_stem_idx_exe") { 761 print STDERR "<FatalError name='NoRunMGStem'/>\n</Stage>\n" if $self->{'gli'}; 737 762 die "mgppbuilder::build_index - couldn't run $mgpp_stem_idx_exe\n"; 738 763 } … … 756 781 closedir (DIR); 757 782 } 783 print STDERR "</Stage>\n" if $self->{'gli'}; 758 784 } 759 785 … … 784 810 print $outhandle "\n*** creating the info database and processing associated files\n" 785 811 if ($self->{'verbosity'} >= 1); 812 print STDERR "<Stage name='CreateInfoData'>\n" if $self->{'gli'}; 786 813 787 814 # init all the classifiers … … 794 821 } else { 795 822 if (!-e "$txt2db_exe" || !open (PIPEOUT, "| txt2db$exe \"$fulldbname\"")) { 823 print STDERR "<FatalError name='NoRunText2DB'/>\n</Stage>\n" if $self->{'gli'}; 796 824 die "mgppbuilder::make_infodatabase - couldn't run $txt2db_exe\n"; 797 825 } … … 889 917 # output classification information 890 918 &classify::output_classify_info ($self->{'classifiers'}, $handle, 891 $self->{'allclassifications'}); 919 $self->{'allclassifications'}, 920 $self->{'gli'}); 892 921 893 922 #output doclist … … 903 932 close ($handle) if !$self->{'debug'}; 904 933 934 print STDERR "</Stage>\n" if $self->{'gli'}; 905 935 } 906 936 … … 1055 1085 my $outhandle = $self->{'outhandle'}; 1056 1086 print $outhandle "\n*** creating auxiliary files \n" if ($self->{'verbosity'} >= 1); 1087 print STDERR "<Stage name='CreatingAuxilary'>\n" if $self->{'gli'}; 1057 1088 1058 1089 # get the text directory … … 1113 1144 '^(builddate|buildtype|numdocs|numbytes|textlevel)$', 1114 1145 '^(indexmap|subcollectionmap|languagemap|indexfieldmap|notbuilt|indexfields|indexlevels)$'); 1115 1146 1147 print STDERR "</Stage>\n" if $self->{'gli'}; 1116 1148 } 1117 1149 -
trunk/gsdl/perllib/plugin.pm
r6332 r6407 146 146 $stats->{'num_not_processed'}; 147 147 148 print STDERR "<ImportComplete c ='$stats->{'num_processed'}' p='$stats->{'num_processed'}'>\n" if $gli;148 print STDERR "<ImportComplete considered='$total' processed='$stats->{'num_processed'}' blocked='$stats->{'num_blocked'}' ignored='$stats->{'num_not_processed'}'>\n" if $gli; 149 149 150 150 if ($total == 1) {
Note:
See TracChangeset
for help on using the changeset viewer.