source: main/trunk/greenstone2/perllib/buildConfigxml.pm@ 28876

Last change on this file since 28876 was 28876, checked in by kjdon, 10 years ago

earliestDatestamp should have a capital D

  • Property svn:keywords set to Author Date Id Revision
File size: 24.1 KB
Line 
1###########################################################################
2#
3# buildConfigxml.pm --
4# A component of the Greenstone digital library software
5# from the New Zealand Digital Library Project at the
6# University of Waikato, New Zealand.
7#
8# Copyright (C) 1999 New Zealand Digital Library Project
9#
10# This program is free software; you can redistribute it and/or modify
11# it under the terms of the GNU General Public License as published by
12# the Free Software Foundation; either version 2 of the License, or
13# (at your option) any later version.
14#
15# This program is distributed in the hope that it will be useful,
16# but WITHOUT ANY WARRANTY; without even the implied warranty of
17# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
18# GNU General Public License for more details.
19#
20# You should have received a copy of the GNU General Public License
21# along with this program; if not, write to the Free Software
22# Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
23#
24###########################################################################
25
26# reads in buildConfig.xml
27# Note, only implemented the bits that are currently used, eg by incremental
28# build code.
29# The resulting data is not a full representation of buildConfig.xml.
30
31package buildConfigxml;
32
33use strict;
34no strict 'refs';
35no strict 'subs';
36
37use XMLParser;
38
39
# Translation table from the metadata names found in buildConfig.xml (gs3
# spelling) to the lower-case keys stored in the returned hash (gs2 spelling).
my $nameMap = {
    "numDocs"              => "numdocs",
    "buildType"            => "buildtype",
    "orthogonalBuildTypes" => "orthogonalbuildtypes",
};


# The hash that read_cfg_file fills in and returns.
my $data = {};

# Name of the metadata entry whose text is expected next: StartTag sets it,
# Text consumes it.
my $currentLocation = "";
# Metadata names that hold a single value ...
my $stringexp = q/^(buildType|numDocs)$/;
# ... and metadata names whose values are collected in an array.
my $arrayexp = q/^(orthogonalBuildTypes)$/;

# Key of $data that index entries are appended to ("indexmap" or
# "indexfieldmap"); chosen when the indexList element is seen.
my $indexmap_name = "";
# True when index names must additionally be recorded under "indexfields".
my $haveindexfields = 0;
57
# Reads a buildConfig.xml file into a hash whose key names follow the gs2
# conventions (i.e. the ones used by &cfgread::read_cfg_file).
#
# Only the parts that are currently needed are extracted: numdocs, buildtype,
# orthogonalbuildtypes and the index map(s).
#
#   $filename - path of the file to read; the name must end in
#               "buildConfig.xml".
#
# Returns undef when the name does not match or the file does not exist.
# Otherwise returns a reference to the hash, which stays empty when the file
# cannot be opened for reading. Errors raised while parsing are not caught.
sub read_cfg_file {
    my ($filename) = @_;

    # Start every call from a clean slate so that nothing left over from a
    # previously parsed file can leak into this result.
    $data            = {};
    $currentLocation = "";
    $indexmap_name   = "";
    $haveindexfields = 0;

    if ($filename !~ /buildConfig\.xml$/ || !-f $filename) {
        return undef;
    }

    # Removed ProtocolEncoding (see MetadataXMLPlugin for details)

    # create XML::Parser object for parsing buildConfig.xml
    my $parser = XML::Parser->new('Style'    => 'Stream',
                                  'Pkg'      => 'buildConfigxml',
                                  'Handlers' => {'Char'    => \&Char,
                                                 'Doctype' => \&Doctype
                                  });

    # The file is only opened here to check that it is readable; the parser
    # opens it again by name. A lexical handle is used so that the global
    # COLCFG handle, which the write_* subs print to, is left untouched.
    my $probe;
    if (!open($probe, '<', $filename)) {
        print STDERR "buildConfigxml::read_cfg_file couldn't read the cfg file $filename\n";
    }
    else {
        close($probe);
        $parser->parsefile($filename);
    }

    #&Display;
    return $data;
}
88
# Start-tag handler for the Stream-style parser created in read_cfg_file.
#
#   $expat   - the parser object (unused here)
#   $element - name of the element being opened
#
# The element's "name" and "shortname" attributes are read from %_.
#
# Three cases are handled, and at most one applies to any given element:
#   * an element whose name attribute is one of the tracked metadata names:
#     remember the name so that Text can store the value that follows;
#   * indexList: decide which map the following index elements belong to and
#     make sure the corresponding arrays exist;
#   * index: append "name->shortname" to the current map.
sub StartTag {
    my ($expat, $element) = @_;

    my $name      = $_{'name'};
    my $shortname = $_{'shortname'};

    # handling block metadataList
    if (defined $name && (($name =~ m/$stringexp/) || ($name =~ m/$arrayexp/))) {
        # the value will be retrieved later in Text sub
        $currentLocation = $name;
    }

    # handle indexes - store indexmap (mg) or indexfields and indexfieldmap
    # (mgpp/lucene/solr)
    elsif ($element eq 'indexList') {
        # this assumes that the build type has been read already, which is
        # currently the order we save the file in.
        if (defined $data->{'buildtype'} && $data->{'buildtype'} eq "mg") {
            $indexmap_name   = "indexmap";
            # mg keeps no separate field list; clear the flag in case an
            # earlier indexList (or an earlier file) had switched it on
            $haveindexfields = 0;
            if (!defined $data->{"indexmap"}) {
                $data->{"indexmap"} = [];
            }
        }
        else {
            # mgpp, lucene or solr
            $indexmap_name   = "indexfieldmap";
            $haveindexfields = 1;
            if (!defined $data->{"indexfieldmap"}) {
                $data->{"indexfieldmap"} = [];
            }
            if (!defined $data->{"indexfields"}) {
                $data->{"indexfields"} = [];
            }
        }
    }

    # Exact comparison on purpose: a substring test would also pick up
    # elements such as indexLanguage and indexSubcollection, which carry name
    # and shortname attributes too and would end up in the index map.
    elsif ($element eq 'index') {
        # store each index in the map; entries seen before any indexList are
        # ignored because there is no map to put them in yet
        if ($indexmap_name ne "" && defined $name && defined $shortname) {
            push @{$data->{$indexmap_name}}, "$name->$shortname";
            if ($haveindexfields) {
                push @{$data->{'indexfields'}}, $name;
            }
        }
    }
}
142
# End-tag handler for the Stream-style parser: nothing needs to be done when
# an element closes, the arguments are merely unpacked.
sub EndTag {
    my ($parser, $tag_name) = @_;
}
146
# Text handler for the Stream-style parser; the text itself is read from $_.
#
# When StartTag has flagged a tracked metadata entry, the text is stored under
# the gs2 key name: single-valued entries (numDocs, buildType) overwrite the
# slot, multi-valued ones (orthogonalBuildTypes) are appended to an array.
# The flag is cleared once the value has been stored.
sub Text {
    return unless defined $currentLocation;

    my $single_valued = ($currentLocation =~ /$stringexp/);
    if ($single_valued || $currentLocation =~ /$arrayexp/) {
        my $key = $nameMap->{$currentLocation};
        if ($single_valued) {
            $data->{$key} = $_;
        }
        else {
            push(@{$data->{$key}}, $_);
        }
        undef $currentLocation;
    }
}
165
# Debugging aid: prints every entry of the parsed data that is defined, one
# per line, to the currently selected output handle.
sub Display {

    # entries holding a single value
    foreach my $entry (["NumDocs = ",   'numdocs'],
                       ["BuildType = ", 'buildtype']) {
        my ($label, $key) = @$entry;
        next unless defined $data->{$key};
        print $label . $data->{$key} . "\n";
    }

    # entries holding an array, each with the separator used to join it
    foreach my $entry (["OrthogonalBuildTypes = ", 'orthogonalbuildtypes', ","],
                       ["IndexMap = ",             'indexmap',             " "],
                       ["IndexFieldMap = ",        'indexfieldmap',        " "],
                       ["IndexFields = ",          'indexfields',          " "]) {
        my ($label, $key, $separator) = @$entry;
        next unless defined $data->{$key};
        print $label . join($separator, @{$data->{$key}}) . "\n";
    }

}
177
# Doctype handler registered with the parser in read_cfg_file. It is only
# invoked for documents that contain a DOCTYPE declaration; the files produced
# by write_cfg_file do not write one.
#
#   $name - the document type name from the declaration
#
# Dies, naming the offending type, unless the document type is "buildConfig".
sub Doctype {
    my ($expat, $name, $sysid, $pubid, $internal) = @_;

    if ($name !~ /^buildConfig$/) {
        die "buildConfigxml::Doctype: unexpected document type '$name', expected 'buildConfig'";
    }
}
184
# Character-data handler that replaces the one in XML::Parser::Stream. The
# stock handler has a problem where $expat->{Text} is treated as the return
# value, which slows things down significantly in some cases; this version
# appends the new data and explicitly returns undef instead.
#
#   $_[0] - the parser object whose 'Text' buffer is extended
#   $_[1] - the chunk of character data to append
#
# The arguments are used straight from @_ rather than copied.
sub Char {
    if ($] < 5.008) {
        # Necessary to prevent encoding issues with XML::Parser 2.31+ and Perl 5.6
        # NOTE(review): the pragma is lexically scoped, so as written it only
        # covers this if-block and not the append below - confirm intent.
        use bytes;
    }
    $_[0]{'Text'} .= $_[1];
    return undef;
}
195
196
197
# Writes one line to a file handle.
#
#   $filehandle - the handle to print to (the callers in this file pass the
#                 handle's name as a string)
#   $line       - reference to an array of fragments; they are concatenated
#                 without a separator and followed by a newline
sub write_line {
    my ($filehandle, $line) = @_;

    my $text = join("", @$line);
    print {$filehandle} $text, "\n";
}
202
# Works out, from the build configuration and the collection configuration,
# the values shared by the search and retrieve serviceRack writers.
#
#   $buildcfg   - hash reference with the build options
#   $collectcfg - hash reference with the collection configuration
#
# Returns a hash reference with these keys:
#   buildtype, orthogonalbuildtypes, numdocs, service_type, infodbtype,
#   num_indexes, defaultindex, indexmap, indexlist,
#   default_lang, default_lang_short, default_subcol,
#   indexstem (only when the build configuration defines it),
#   levelmap, levellist, default_search_level (only when it is a true value),
#   default_retrieve_level, default_db_level,
#   sortlist, sortmap, facetlist, facetmap.
#
# Map entries in the build configuration have the form "name->shortname".
# A note is printed to STDERR when the index map for the build type is
# missing.
sub search_and_retrieve_settings
{
    my ($buildcfg, $collectcfg) = @_;

    my $settings = {};

    # build type; mgpp when the build configuration does not name one
    my $buildtype = (defined $buildcfg->{"buildtype"}) ? $buildcfg->{"buildtype"} : "mgpp";
    $settings->{'buildtype'} = $buildtype;

    # Note the use of collectcfg, not buildcfg
    if (defined $collectcfg->{"orthogonalbuildtypes"}) {
        $settings->{'orthogonalbuildtypes'} = $collectcfg->{"orthogonalbuildtypes"};
    }
    else {
        # the key must be spelt exactly like the one above, so that callers
        # always find an array reference under it
        $settings->{'orthogonalbuildtypes'} = [];
    }

    $settings->{'numdocs'} = (defined $buildcfg->{"numdocs"}) ? $buildcfg->{"numdocs"} : 0;

    # name fragment used in the serviceRack names; MGPP for anything unknown
    my %service_type_for = ("mg" => "MG", "lucene" => "Lucene", "solr" => "Solr");
    $settings->{'service_type'} =
        (exists $service_type_for{$buildtype}) ? $service_type_for{$buildtype} : "MGPP";

    $settings->{'infodbtype'} =
        (defined $buildcfg->{"infodbtype"}) ? $buildcfg->{'infodbtype'} : "gdbm";


    #--
    # indexes
    #--

    my $indexmap = {};      # maps index name to shortname
    my $indexlist = [];     # keeps the order for indexes
    my $defaultindex = "";
    my $maptype = ($buildtype eq "mg") ? "indexmap" : "indexfieldmap";

    if (defined $buildcfg->{$maptype}) {
        my $first = 1;
        foreach my $entry (@{$buildcfg->{$maptype}}) {
            my ($k, $v) = $entry =~ /^(.*)\-\>(.*)$/;
            $indexmap->{$k} = $v;
            push @$indexlist, $k;
            if ($first) {
                # the first index is the default unless the user says otherwise
                $defaultindex = $v;
                $first = 0;
            }
        }
        # now if the user has assigned a default index, we use it
        # (this yields undef when that index is not in the map)
        if (defined $collectcfg->{"defaultindex"}) {
            $defaultindex = $indexmap->{$collectcfg->{"defaultindex"}};
        }
    }
    else {
        print STDERR "$maptype not defined\n";
    }

    $settings->{'num_indexes'}  = $buildcfg->{'num_indexes'};
    $settings->{'defaultindex'} = $defaultindex;
    $settings->{'indexmap'}     = $indexmap;
    $settings->{'indexlist'}    = $indexlist;

    #--
    # default lang
    #--
    $settings->{'default_lang'} = "";
    $settings->{'default_lang_short'} = "";

    if (defined $buildcfg->{"languagemap"}) {
        my $langmap_t = $buildcfg->{"languagemap"};
        if (scalar(@$langmap_t) >= 1) {
            my ($k, $v) = $langmap_t->[0] =~ m/^(.*)\-\>(.*)$/;
            $settings->{'default_lang'} = $k;       #name
            $settings->{'default_lang_short'} = $v; #short name
        }

        # now if the user has assigned a default language (as "en", "ru" etc.)
        if (defined $collectcfg->{"defaultlanguage"}) {
            $settings->{'default_lang'} = $collectcfg->{"defaultlanguage"};
            # what about default_lang_short ?? ####
        }
    }

    # default subcol: the short name of the first subcollection
    $settings->{'default_subcol'} = "";
    if (defined $buildcfg->{'subcollectionmap'}) {
        my $subcolmap_t = $buildcfg->{'subcollectionmap'};
        if (scalar(@$subcolmap_t) >= 1) {
            my ($k, $v) = $subcolmap_t->[0] =~ m/^(.*)\-\>(.*)$/;
            $settings->{'default_subcol'} = $v;
        }
    }


    #--
    # indexstem
    #--
    if (defined $buildcfg->{'indexstem'}) {
        $settings->{'indexstem'} = $buildcfg->{'indexstem'};
    }

    #--
    # levelList
    #--

    my $levelmap = {};
    my $levellist = [];
    my $default_search_level = "Doc";
    my $default_retrieve_level = "Doc";
    my $default_db_level = "Doc";

    if ($buildtype eq "mgpp" || $buildtype eq "lucene" || $buildtype eq "solr") {
        if (defined $buildcfg->{'levelmap'}) {
            my $first = 1;
            foreach my $entry (@{$buildcfg->{'levelmap'}}) {
                my ($key, $val) = $entry =~ /^(.*)\-\>(.*)$/;
                $levelmap->{$key} = $val;
                push @$levellist, $key;
                if ($first) {
                    # let default search level follow the first level in the level list
                    $default_search_level = $val;
                    # retrieve/database levels may get modified later if text level is defined
                    $default_retrieve_level = $val;
                    $default_db_level = $val;
                    $first = 0;
                }
            }
        }
        # the default level assigned by the user is no longer ignored [Shaoqun],
        # but the retrieve level stays the same.
        if (defined $collectcfg->{"defaultlevel"}) {
            $default_search_level = $levelmap->{$collectcfg->{"defaultlevel"}};
            # $default_retrieve_level = $default_search_level;
        }

        if (defined $buildcfg->{'textlevel'}) {
            # let the retrieve/database levels always follow the textlevel
            $default_retrieve_level = $buildcfg->{'textlevel'};
            $default_db_level = $buildcfg->{'textlevel'};
        }
    }
    $settings->{'levelmap'} = $levelmap;
    $settings->{'levellist'} = $levellist;
    $settings->{'default_search_level'} = $default_search_level if $default_search_level;
    $settings->{'default_retrieve_level'} = $default_retrieve_level;
    $settings->{'default_db_level'} = $default_db_level;

    # sort field list
    ######

    my $sortmap = {};       # maps shortname back to the field name
    my $sortlist = [];      # keeps the order of the sort fields

    if (defined ($buildcfg->{"indexsortfieldmap"})) {
        foreach my $entry (@{$buildcfg->{"indexsortfieldmap"}}) {
            my ($k, $v) = $entry =~ /^(.*)\-\>(.*)$/;
            $sortmap->{$v} = $k;
        }
    }
    if (defined ($buildcfg->{"indexsortfields"})) {
        $sortlist = $buildcfg->{"indexsortfields"};
    }

    $settings->{'sortlist'} = $sortlist;
    $settings->{'sortmap'} = $sortmap;

    # facet field list
    ######

    my $facetmap = {};      # maps shortname back to the field name
    my $facetlist = [];     # keeps the order of the facet fields

    if (defined ($buildcfg->{"indexfacetfieldmap"})) {
        foreach my $entry (@{$buildcfg->{"indexfacetfieldmap"}}) {
            my ($k, $v) = $entry =~ /^(.*)\-\>(.*)$/;
            $facetmap->{$v} = $k;
        }
    }
    if (defined ($buildcfg->{"indexfacetfields"})) {
        $facetlist = $buildcfg->{"indexfacetfields"};
    }

    $settings->{'facetlist'} = $facetlist;
    $settings->{'facetmap'} = $facetmap;


    return $settings;
}
416
417
# Writes the search serviceRack element (GS2<service type>Search) to the
# COLCFG handle.
#
#   $buildcfg - hash reference with the build options
#   $settings - hash reference as returned by search_and_retrieve_settings
#
# Nothing at all is written when $settings->{'num_indexes'} is not above zero.
sub write_search_servicerack
{
    my ($buildcfg, $settings) = @_;

    my $buildtype    = $settings->{'buildtype'};
    my $infodbtype   = $settings->{'infodbtype'};
    my $service_type = $settings->{'service_type'};

    # there's no searching and therefore no search services if there are no indexes
    return if ($settings->{'num_indexes'} <= 0);

    # every line goes to COLCFG; the fragments are joined by write_line
    my $emit = sub { &write_line('COLCFG', [@_]); };

    # build types that work with levels
    my $uses_levels = ($buildtype eq "mgpp" || $buildtype eq "lucene" || $buildtype eq "solr");

    # open the search service
    $emit->("<serviceRack name=\"GS2", $service_type, "Search\">");
    if (defined $buildcfg->{'indexstem'}) {
        $emit->("<indexStem name=\"", $buildcfg->{'indexstem'}, "\" />");
    }
    if (defined $buildcfg->{'infodbtype'}) {
        $emit->("<databaseType name=\"", $infodbtype, "\" />");
    }

    # indexList: one entry per index, in their original order
    my $indexmap = $settings->{'indexmap'};
    $emit->("<indexList>");
    foreach my $index_name (@{$settings->{'indexlist'}}) {
        my $index_short = $indexmap->{$index_name};
        $emit->("<index name=\"", $index_name, "\" ", "shortname=\"", $index_short, "\" />");
    }
    $emit->("</indexList>");

    # the default index is only mentioned when there is one
    my $defaultindex = $settings->{'defaultindex'};
    if ($defaultindex) {
        $emit->("<defaultIndex shortname=\"", $defaultindex, "\" />");
    }

    # indexOptionList
    if ($buildtype eq "mg" || $buildtype eq "mgpp") {
        # default is stem and casefold
        my $stemindexes = 3;
        if (defined $buildcfg->{'stemindexes'} && $buildcfg->{'stemindexes'} =~ /^\d+$/) {
            $stemindexes = $buildcfg->{'stemindexes'};
        }
        my $maxnumeric = 4;
        if (defined $buildcfg->{'maxnumeric'} && $buildcfg->{'maxnumeric'} =~ /^\d+$/) {
            $maxnumeric = $buildcfg->{'maxnumeric'};
        }

        $emit->("<indexOptionList>");
        $emit->("<indexOption name=\"stemIndexes\" value=\"", $stemindexes, "\" />");
        $emit->("<indexOption name=\"maxnumeric\" value=\"", $maxnumeric, "\" />");
        $emit->("</indexOptionList>");
    }

    # levelList: one entry per level
    if ($buildtype ne "mg") {
        my $levelmap = $settings->{'levelmap'};
        $emit->("<levelList>");
        foreach my $level_name (@{$settings->{'levellist'}}) {
            my $level_short = $levelmap->{$level_name};
            $emit->("<level name=\"", $level_name, "\" shortname=\"", $level_short, "\" />");
        }
        $emit->("</levelList>");
    }
    # the default levels sit at the same depth as the level list, making the
    # reading job easier
    if ($uses_levels) {
        $emit->("<defaultLevel shortname=\"", $settings->{'default_search_level'}, "\" />");
        $emit->("<defaultDBLevel shortname=\"", $settings->{'default_db_level'}, "\" />");
    }

    # sortList
    if ($buildtype eq "lucene" || $buildtype eq "solr") {
        my $sortmap = $settings->{'sortmap'};
        $emit->("<sortList>");
        foreach my $sort_short (@{$settings->{'sortlist'}}) {
            # "rank" and "none" stand for themselves, anything else is looked up
            my $sort_name = ($sort_short eq "rank" || $sort_short eq "none")
                ? $sort_short
                : $sortmap->{$sort_short};
            $emit->("<sort name=\"", $sort_name, "\" shortname=\"", $sort_short, "\" />");
        }
        $emit->("</sortList>");
    }

    # facetList
    if ($buildtype eq "solr") {
        my $facetmap = $settings->{'facetmap'};
        $emit->("<facetList>");
        foreach my $facet_short (@{$settings->{'facetlist'}}) {
            my $facet_name = $facetmap->{$facet_short};
            $emit->("<facet name=\"", $facet_name, "\" shortname=\"", $facet_short, "\" />");
        }
        $emit->("</facetList>");
    }

    # searchTypeList: the configured types, or plain and form when none are given
    if ($uses_levels) {
        $emit->("<searchTypeList>");
        if (defined $buildcfg->{"searchtype"}) {
            foreach my $search_type (@{$buildcfg->{"searchtype"}}) {
                $emit->("<searchType name=\"", $search_type, "\" />");
            }
        }
        else {
            $emit->("<searchType name=\"plain\" />");
            $emit->("<searchType name=\"form\" />");
        }
        $emit->("</searchTypeList>");
    }

    # indexLanguageList [in collect.cfg: languages; in build.cfg: languagemap]
    if (defined $buildcfg->{"languagemap"}) {
        $emit->("<indexLanguageList>");
        foreach my $entry (@{$buildcfg->{"languagemap"}}) {
            my ($lang_name, $lang_short) = $entry =~ /^(.*)\-\>(.*)$/;
            $emit->("<indexLanguage name=\"", $lang_name, "\" shortname=\"", $lang_short, "\" />");
        }
        $emit->("</indexLanguageList>");

        $emit->("<defaultIndexLanguage name=\"", $settings->{'default_lang'},
                "\" shortname=\"", $settings->{'default_lang_short'}, "\" />");
    }

    # indexSubcollectionList
    if (defined $buildcfg->{'subcollectionmap'}) {
        $emit->("<indexSubcollectionList>");

        # collect all entries first; the short names are looked up in the
        # finished map when the lines are written
        my %short_for = ();
        my @subcol_names = ();
        foreach my $entry (@{$buildcfg->{'subcollectionmap'}}) {
            my ($subcol_name, $subcol_short) = $entry =~ /^(.*)\-\>(.*)$/;
            $short_for{$subcol_name} = $subcol_short;
            push @subcol_names, $subcol_name;
        }
        foreach my $subcol_name (@subcol_names) {
            $emit->("<indexSubcollection name=\"", $subcol_name,
                    "\" shortname=\"", $short_for{$subcol_name}, "\" />");
        }

        $emit->("</indexSubcollectionList>");
        $emit->("<defaultIndexSubcollection shortname=\"", $settings->{'default_subcol'}, "\" />");
    }

    # close off search service
    $emit->("</serviceRack>");

}
593
594
# Writes one search serviceRack element per orthogonal build type to the
# COLCFG handle.
#
#   $buildcfg - hash reference with the build options (not used here)
#   $settings - hash reference as returned by search_and_retrieve_settings
#
# The rack name is derived from the build type by capitalising its first
# letter and turning every "-x" into "X". The list held in $settings is left
# as it is.
sub write_orthogonalsearch_serviceracks
{
    my ($buildcfg, $settings) = @_;

    #return if($settings->{'num_indexes'} <= 0); # no search if no indexes

    my $infodbtype = $settings->{'infodbtype'};

    my $orthogonalbuildtypes = $settings->{'orthogonalbuildtypes'};
    return unless defined $orthogonalbuildtypes;

    foreach my $obt (@$orthogonalbuildtypes) {
        # Work on a copy: the loop variable is an alias for the array
        # element, and that array may be the very one stored in the
        # collection configuration.
        my $rack_name = $obt;
        $rack_name =~ s/^(.)/\u$1/;    # capitalise initial letter
        $rack_name =~ s/-(.)/\u$1/g;   # change any hyphenated words to cap next letter

        &write_line('COLCFG', ["<serviceRack name=\"GS2", $rack_name, "Search\">"]);

        &write_line('COLCFG', ["<databaseType name=\"", $infodbtype, "\" />"]);
        &write_line('COLCFG', ["</serviceRack>"]);
    }
}
615
616
617
# Writes the retrieve serviceRack element (GS2<service type>Retrieve) to the
# COLCFG handle.
#
#   $buildcfg - hash reference with the build options
#   $settings - hash reference as returned by search_and_retrieve_settings
sub write_retrieve_servicerack
{
    my ($buildcfg, $settings) = @_;

    my $buildtype    = $settings->{'buildtype'};
    my $infodbtype   = $settings->{'infodbtype'};
    my $service_type = $settings->{'service_type'};

    # every line goes to COLCFG; the fragments are joined by write_line
    my $emit = sub { &write_line('COLCFG', [@_]); };

    # open the retrieve service
    $emit->("<serviceRack name=\"GS2", $service_type, "Retrieve\">");

    # the defaults, each one only when it applies
    if (defined $buildcfg->{"languagemap"}) {
        $emit->("<defaultIndexLanguage shortname=\"", $settings->{'default_lang'}, "\" />");
    }
    if (defined $buildcfg->{'subcollectionmap'}) {
        $emit->("<defaultIndexSubcollection shortname=\"", $settings->{'default_subcol'}, "\" />");
    }
    if ($buildtype eq "mg") {
        $emit->("<defaultIndex shortname=\"", $settings->{'defaultindex'}, "\" />");
    }

    if (defined $buildcfg->{'indexstem'}) {
        $emit->("<indexStem name=\"", $buildcfg->{'indexstem'}, "\" />");
    }
    if ($buildtype eq "mgpp" || $buildtype eq "lucene" || $buildtype eq "solr") {
        $emit->("<defaultLevel shortname=\"", $settings->{'default_retrieve_level'}, "\" />");
    }
    if (defined $buildcfg->{'infodbtype'}) {
        $emit->("<databaseType name=\"", $infodbtype, "\" />");
    }

    $emit->("</serviceRack>");

}
659
660
# Create the buildConfig.xml file for a specific collection.
#
# this sub is called in make_auxiliary_files() in basebuilder.pm
#
#   $buildoutfile - destination file: buildConfig.xml
#   $buildcfg     - all build options
#   $collectcfg   - contents of collectionConfig.xml
#                   (NOTE(review): the original comment says it is read in by
#                   read_cfg_file in buildConfigxml.pm, but that sub only reads
#                   buildConfig.xml - confirm which module supplies it)
#
# Dies, after printing a message to STDERR, when the destination cannot be
# opened for writing. A failure while closing the file is reported on STDERR.
#
# The file is written through the package-level COLCFG handle because the
# write_* helpers print to that handle by name.
sub write_cfg_file {
    my ($buildoutfile, $buildcfg, $collectcfg) = @_;

    # three-argument open: the file name is never interpreted as a mode
    if (!open(COLCFG, '>', $buildoutfile)) {
        print STDERR "buildConfigxml::write_cfg_file couldn't write the build config file $buildoutfile\n";
        die;
    }

    my $settings = search_and_retrieve_settings($buildcfg, $collectcfg);

    my $buildtype = $settings->{'buildtype'};
    my $orthogonalbuildtypes = $settings->{'orthogonalbuildtypes'};
    my $numdocs = $settings->{'numdocs'};

    &write_line('COLCFG', ["<buildConfig xmlns:gsf=\"http://www.greenstone.org/greenstone3/schema/ConfigFormat\">"]);

    # output building metadata to build config file
    &write_line('COLCFG', ["<metadataList>"]);
    &write_line('COLCFG', ["<metadata name=\"numDocs\">", $numdocs, "</metadata>"]);
    &write_line('COLCFG', ["<metadata name=\"buildType\">", $buildtype, "</metadata>"]);
    foreach my $obt (@$orthogonalbuildtypes) {
        &write_line('COLCFG', ["<metadata name=\"orthogonalBuildTypes\">", $obt, "</metadata>"]);
    }

    if (defined $buildcfg->{'indexstem'}) {
        &write_line('COLCFG', ["<metadata name=\"indexStem\">", $buildcfg->{"indexstem"}, "</metadata>"]);
    }
    if (defined $buildcfg->{'infodbtype'}) {
        &write_line('COLCFG', ["<metadata name=\"infodbType\">", $buildcfg->{"infodbtype"}, "</metadata>"]);
    }
    if (defined $buildcfg->{'earliestdatestamp'}) {
        &write_line('COLCFG', ["<metadata name=\"earliestDatestamp\">", $buildcfg->{"earliestdatestamp"}, "</metadata>"]);
    }

    &write_line('COLCFG', ["</metadataList>"]);

    # output serviceRackList
    &write_line('COLCFG', ["<serviceRackList>"]);

    write_search_servicerack($buildcfg, $settings);

    # add in orthogonalbuildtypes
    write_orthogonalsearch_serviceracks($buildcfg, $settings);

    write_retrieve_servicerack($buildcfg, $settings);

    # do the browse service
    my $count = 1;
    my $phind = 0;
    my $started_classifiers = 0;

    my $classifiers = $collectcfg->{"classify"};
    foreach my $cl (@$classifiers) {
        # every classifier uses up a number, the phind one included
        my $name = "CL$count";
        $count++;
        my $classname = $cl->[0];
        if ($classname =~ /^phind$/i) {
            $phind = 1;
            #should add it into coll config classifiers
            next;
        }

        # the Browse rack is only opened once there is a classifier to put in it
        if (not $started_classifiers) {
            &write_line('COLCFG', ["<serviceRack name=\"GS2Browse\">"]);
            if (defined $buildcfg->{'indexstem'}) {
                my $indexstem = $buildcfg->{'indexstem'};
                &write_line('COLCFG', ["<indexStem name=\"", $indexstem, "\" />"]);
            }
            if (defined $buildcfg->{'infodbtype'}) {
                my $infodbtype = $buildcfg->{'infodbtype'};
                &write_line('COLCFG', ["<databaseType name=\"", $infodbtype, "\" />"]);
            }
            &write_line('COLCFG', ["<classifierList>"]);
            $started_classifiers = 1;
        }

        my $content = ''; #use buttonname first, then metadata
        if ($classname eq "DateList") {
            $content = "Date";
        }
        else {
            for (my $j = 0; $j < scalar(@$cl); $j++) {
                my $arg = $cl->[$j];
                if ($arg eq "-buttonname") {
                    # a button name wins over any metadata name: stop looking
                    $content = $cl->[$j+1];
                    last;
                }
                elsif ($arg eq "-metadata") {
                    $content = $cl->[$j+1];
                }
            }
        }
        &write_line('COLCFG', ["<classifier name=\"", $name, "\" content=\"", $content, "\" />"]);
    }
    if ($started_classifiers) {
        # end the classifiers
        &write_line('COLCFG', ["</classifierList>"]);
        # close off the Browse service
        &write_line('COLCFG', ["</serviceRack>"]);
    }

    # the phind classifier is a separate service
    if ($phind) {
        # if phind classifier
        &write_line('COLCFG', ["<serviceRack name=\"PhindPhraseBrowse\" />"]);
    }


    &write_line('COLCFG', ["</serviceRackList>"]);
    &write_line('COLCFG', ["</buildConfig>"]);

    # buffered write errors only show up when the handle is closed
    if (!close(COLCFG)) {
        print STDERR "buildConfigxml::write_cfg_file couldn't finish writing the build config file $buildoutfile: $!\n";
    }
}
778
779
780#########################################################
781
7821;
Note: See TracBrowser for help on using the repository browser.