source: trunk/gsdl/src/recpt/collectoraction.cpp@ 11166

Last change on this file since 11166 was 11166, checked in by kjdon, 18 years ago

collector buttons now use css. left them in a table, but used background colors instead of images

  • Property svn:keywords set to Author Date Id Revision
File size: 66.9 KB
Line 
1/**********************************************************************
2 *
3 * collectoraction.cpp --
4 * Copyright (C) 2000 The New Zealand Digital Library Project
5 *
6 * A component of the Greenstone digital library software
7 * from the New Zealand Digital Library Project at the
8 * University of Waikato, New Zealand.
9 *
10 * This program is free software; you can redistribute it and/or modify
11 * it under the terms of the GNU General Public License as published by
12 * the Free Software Foundation; either version 2 of the License, or
13 * (at your option) any later version.
14 *
15 * This program is distributed in the hope that it will be useful,
16 * but WITHOUT ANY WARRANTY; without even the implied warranty of
17 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
18 * GNU General Public License for more details.
19 *
20 * You should have received a copy of the GNU General Public License
21 * along with this program; if not, write to the Free Software
22 * Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
23 *
24 *********************************************************************/
25
26#include "gsdl_modules_cfg.h"
27#ifdef GSDL_USE_COLLECTOR_ACTION
28
29// note that the collectoraction relies on having direct access to a
30// collections configuration file. this breaks the separation between
31// receptionist and collection server and so is not suitable (at least
32// in its current form) for use when collection servers are separate
33// from the receptionist (e.g. when using the CORBA protocol).
34
35// following line required to get fstream.filedesc() on darwin (Mac OS X)
36#define _STREAM_COMPAT 1
37// required for utsname on solaris???
38#define _XOPEN_SOURCE 1
39#define _XOPEN_SOURCE_EXTENDED 1
40
41#include "collectoraction.h"
42#include "OIDtools.h"
43#include "fileutil.h"
44#include "cfgread.h"
45#include "gsdltools.h"
46#include "gsdltimes.h"
47#include "nullproto.h"
48#include "argdb.h"
49#include "cgiutils.h"
50#include <stdio.h>
51#include <fcntl.h>
52
53#if !defined (__WIN32__)
54#include <sys/utsname.h>
55#include <unistd.h>
56#endif
57
58collectoraction::collectoraction () {
59
60 recpt = NULL;
61 disabled = true;
62 do_mkcol = false;
63 badsources = false;
64 failedsources.erase(failedsources.begin(), failedsources.end());
65 gsdlosc = NULL;
66 gsdlhomec = NULL;
67 pathc = NULL;
68
69 cgiarginfo arg_ainfo;
70 arg_ainfo.shortname = "a";
71 arg_ainfo.longname = "action";
72 arg_ainfo.multiplechar = true;
73 arg_ainfo.defaultstatus = cgiarginfo::weak;
74 arg_ainfo.argdefault = "collector";
75 arg_ainfo.savedarginfo = cgiarginfo::must;
76 argsinfo.addarginfo (NULL, arg_ainfo);
77
78 arg_ainfo.shortname = "p";
79 arg_ainfo.longname = "page";
80 arg_ainfo.multiplechar = true;
81 arg_ainfo.defaultstatus = cgiarginfo::weak;
82 arg_ainfo.argdefault = "intro";
83 arg_ainfo.savedarginfo = cgiarginfo::must;
84 argsinfo.addarginfo (NULL, arg_ainfo);
85
86 // temporary directory name for this collector
87 // session
88 arg_ainfo.shortname = "bc1tmp";
89 arg_ainfo.longname = "collector specific";
90 arg_ainfo.multiplechar = true;
91 arg_ainfo.defaultstatus = cgiarginfo::weak;
92 arg_ainfo.argdefault = g_EmptyText;
93 arg_ainfo.savedarginfo = cgiarginfo::must;
94 argsinfo.addarginfo (NULL, arg_ainfo);
95
96 arg_ainfo.shortname = "bc1fullname";
97 arg_ainfo.longname = "collector specific";
98 arg_ainfo.multiplechar = true;
99 arg_ainfo.defaultstatus = cgiarginfo::weak;
100 arg_ainfo.argdefault = g_EmptyText;
101 arg_ainfo.savedarginfo = cgiarginfo::mustnot; // saved on disk
102 argsinfo.addarginfo (NULL, arg_ainfo);
103
104 arg_ainfo.shortname = "bc1dirname";
105 arg_ainfo.longname = "collector specific";
106 arg_ainfo.multiplechar = true;
107 arg_ainfo.defaultstatus = cgiarginfo::weak;
108 arg_ainfo.argdefault = g_EmptyText;
109 arg_ainfo.savedarginfo = cgiarginfo::must;
110 argsinfo.addarginfo (NULL, arg_ainfo);
111
112 arg_ainfo.shortname = "bc1contactemail";
113 arg_ainfo.longname = "collector specific";
114 arg_ainfo.multiplechar = true;
115 arg_ainfo.defaultstatus = cgiarginfo::weak;
116 arg_ainfo.argdefault = g_EmptyText;
117 arg_ainfo.savedarginfo = cgiarginfo::mustnot; // saved on disk
118 argsinfo.addarginfo (NULL, arg_ainfo);
119
120 arg_ainfo.shortname = "bc1aboutdesc";
121 arg_ainfo.longname = "collector specific";
122 arg_ainfo.multiplechar = true;
123 arg_ainfo.defaultstatus = cgiarginfo::weak;
124 arg_ainfo.argdefault = g_EmptyText;
125 arg_ainfo.savedarginfo = cgiarginfo::mustnot; // saved on disk
126 argsinfo.addarginfo (NULL, arg_ainfo);
127
128 arg_ainfo.shortname = "bc1clone";
129 arg_ainfo.longname = "collector specific";
130 arg_ainfo.multiplechar = false;
131 arg_ainfo.defaultstatus = cgiarginfo::weak;
132 arg_ainfo.argdefault = "0";
133 arg_ainfo.savedarginfo = cgiarginfo::mustnot; // saved on disk
134 argsinfo.addarginfo (NULL, arg_ainfo);
135
136 arg_ainfo.shortname = "bc1clonecol";
137 arg_ainfo.longname = "collector specific";
138 arg_ainfo.multiplechar = true;
139 arg_ainfo.defaultstatus = cgiarginfo::weak;
140 arg_ainfo.argdefault = g_EmptyText;
141 arg_ainfo.savedarginfo = cgiarginfo::mustnot; // saved on disk
142 argsinfo.addarginfo (NULL, arg_ainfo);
143
144 // set when cloning option has changed
145 arg_ainfo.shortname = "bc1clonechanged";
146 arg_ainfo.longname = "collector specific";
147 arg_ainfo.multiplechar = false;
148 arg_ainfo.defaultstatus = cgiarginfo::weak;
149 arg_ainfo.argdefault = "0";
150 arg_ainfo.savedarginfo = cgiarginfo::mustnot;
151 argsinfo.addarginfo (NULL, arg_ainfo);
152
153 // only set when one of the fields was changed in
154 // the "collection info" page
155 arg_ainfo.shortname = "bc1infochanged";
156 arg_ainfo.longname = "collector specific";
157 arg_ainfo.multiplechar = false;
158 arg_ainfo.defaultstatus = cgiarginfo::weak;
159 arg_ainfo.argdefault = "0";
160 arg_ainfo.savedarginfo = cgiarginfo::mustnot;
161 argsinfo.addarginfo (NULL, arg_ainfo);
162
163 // only set when cfg file is altered from within
164 // "configure collection" page
165 arg_ainfo.shortname = "bc1cfgchanged";
166 arg_ainfo.longname = "collector specific";
167 arg_ainfo.multiplechar = false;
168 arg_ainfo.defaultstatus = cgiarginfo::weak;
169 arg_ainfo.argdefault = "0";
170 arg_ainfo.savedarginfo = cgiarginfo::mustnot;
171 argsinfo.addarginfo (NULL, arg_ainfo);
172
173 arg_ainfo.shortname = "cfgfile";
174 arg_ainfo.longname = "configuration file contents";
175 arg_ainfo.multiplechar = true;
176 arg_ainfo.defaultstatus = cgiarginfo::weak;
177 arg_ainfo.argdefault = g_EmptyText;
178 arg_ainfo.savedarginfo = cgiarginfo::mustnot;
179 argsinfo.addarginfo (NULL, arg_ainfo);
180
181 arg_ainfo.shortname = "bc1dodelete";
182 arg_ainfo.longname = "collector specific";
183 arg_ainfo.multiplechar = false;
184 arg_ainfo.defaultstatus = cgiarginfo::weak;
185 arg_ainfo.argdefault = "0";
186 arg_ainfo.savedarginfo = cgiarginfo::mustnot;
187 argsinfo.addarginfo (NULL, arg_ainfo);
188
189 // will be set if we arrived at the "configure collection" page
190 // via the "changing an existing collection" page
191 arg_ainfo.shortname = "bc1econf";
192 arg_ainfo.longname = "collector specific";
193 arg_ainfo.multiplechar = false;
194 arg_ainfo.defaultstatus = cgiarginfo::weak;
195 arg_ainfo.argdefault = "0";
196 arg_ainfo.savedarginfo = cgiarginfo::must;
197 argsinfo.addarginfo (NULL, arg_ainfo);
198
199 // will be set if we arrived at the "source data" page
200 // via the "changing an existing collection" page
201 arg_ainfo.shortname = "bc1esrce";
202 arg_ainfo.longname = "collector specific";
203 arg_ainfo.multiplechar = false;
204 arg_ainfo.defaultstatus = cgiarginfo::weak;
205 arg_ainfo.argdefault = "0";
206 arg_ainfo.savedarginfo = cgiarginfo::must;
207 argsinfo.addarginfo (NULL, arg_ainfo);
208
209 arg_ainfo.shortname = "bc1inputnum";
210 arg_ainfo.longname = "collector specific";
211 arg_ainfo.multiplechar = true;
212 arg_ainfo.defaultstatus = cgiarginfo::weak;
213 arg_ainfo.argdefault = "3";
214 arg_ainfo.savedarginfo = cgiarginfo::mustnot; // saved on disk
215 argsinfo.addarginfo (NULL, arg_ainfo);
216
217 arg_ainfo.shortname = "bc1input";
218 arg_ainfo.longname = "collector specific";
219 arg_ainfo.multiplechar = true;
220 arg_ainfo.multiplevalue = true;
221 arg_ainfo.defaultstatus = cgiarginfo::weak;
222 arg_ainfo.argdefault = g_EmptyText;
223 arg_ainfo.savedarginfo = cgiarginfo::mustnot; // saved on disk
224 argsinfo.addarginfo (NULL, arg_ainfo);
225
226 arg_ainfo.shortname = "bc1inputtype";
227 arg_ainfo.longname = "collector specific";
228 arg_ainfo.multiplechar = true;
229 arg_ainfo.multiplevalue = true;
230 arg_ainfo.defaultstatus = cgiarginfo::weak;
231 arg_ainfo.argdefault = g_EmptyText;
232 arg_ainfo.savedarginfo = cgiarginfo::mustnot; // saved on disk
233 argsinfo.addarginfo (NULL, arg_ainfo);
234
235 // will be set when we've just come from the "source data" page
236 arg_ainfo.shortname = "bc1fromsrce";
237 arg_ainfo.longname = "collector specific";
238 arg_ainfo.multiplechar = false;
239 arg_ainfo.multiplevalue = false;
240 arg_ainfo.defaultstatus = cgiarginfo::weak;
241 arg_ainfo.argdefault = "0";
242 arg_ainfo.savedarginfo = cgiarginfo::mustnot;
243 argsinfo.addarginfo (NULL, arg_ainfo);
244}
245
246collectoraction::~collectoraction () {
247 if (gsdlosc != NULL) delete []gsdlosc;
248 if (gsdlhomec != NULL) delete []gsdlhomec;
249 if (pathc != NULL) delete []pathc;
250}
251
252
253void collectoraction::configure (const text_t &key, const text_tarray &cfgline) {
254 if ((key == "collector") && (cfgline.size() == 1) &&
255 (cfgline[0] == "true" || cfgline[0] == "on" || cfgline[0] == "enabled")) {
256 disabled = false;
257 } else {
258 // call the parent class to deal with the things which
259 // are not dealt with here
260 action::configure (key, cfgline);
261 }
262}
263
264
265bool collectoraction::init (ostream & /*logout*/) {
266
267 // set up GSDLOS, GSDLHOME and PATH environment variables
268 text_t gsdlos, path;
269 unsigned int path_separator = ':';
270#if defined (__WIN32__)
271 gsdlos = "windows";
272 path_separator = ';';
273
274 path = filename_cat (gsdlhome, "bin", "windows", "perl", "bin;");
275
276#else
277 struct utsname *buf = new struct utsname();
278 int i = uname (buf);
279 if (i == -1) gsdlos = "linux"; // uname failed
280 else gsdlos.setcstr (buf->sysname);
281 delete buf;
282 lc (gsdlos);
283#endif
284
285 pathc = getenv ("PATH");
286 path += filename_cat (gsdlhome, "bin", gsdlos);
287 path.push_back (path_separator);
288 path += filename_cat (gsdlhome, "bin", "script");
289 if (pathc != NULL) {
290 path.push_back (path_separator);
291 path += pathc;
292 }
293 path = "PATH=" + path;
294
295 gsdlos = "GSDLOS=" + gsdlos;
296 text_t setgsdlhome = "GSDLHOME=" + gsdlhome;
297
298 // these will be cleaned up in the destructor
299 gsdlosc = gsdlos.getcstr();
300 gsdlhomec = setgsdlhome.getcstr();
301 pathc = path.getcstr();
302
303 putenv (gsdlosc);
304 putenv (gsdlhomec);
305 putenv (pathc);
306
307 return true;
308}
309
310bool collectoraction::check_cgiargs (cgiargsinfoclass &argsinfo, cgiargsclass &args,
311 recptprotolistclass * /*protos*/, ostream &logout) {
312
313 text_t &current_page = args["p"];
314
315 // note that the "bildstatus" and "bildframe1" pages don't actually do anything
316 // functional so we don't need to worry about authenticating them (it's the
317 // underlying "bild" page that does the building (and creates the frameset))
318 // This helps us overcome a bit of a problem we have with multiple pages trying
319 // to read from the key.db database at the same time.
320 if (current_page != "intro" && current_page != "bildstatus" && current_page != "bildframe1") {
321 // authenticate the user if authentication is available
322 args["uan"] = 1;
323 args["ug"] = "colbuilder";
324 }
325
326 if (current_page == "new" || current_page == "existing") {
327
328 // assign (and create) a temporary directory
329 if (assign_tmpname (args, logout)==false) {
330 // there was an error creating the tmp dir
331 message="tmpfail";
332 return true; // true because we could still parse the arguments
333 }
334
335 // clean up any old builds left laying about in the tmp directory
336 // (note that it's possible this could take some time if there's a huge
337 // partially built collection laying about so we'll make it an asynchronous
338 // system call)
339 gsdl_system ("perl -S cleantmp.pl", false, logout);
340 }
341
342 if (current_page != "intro" && current_page != "bildstatus" &&
343 current_page != "bildframe1" && current_page != "new") {
344 // update arguments that were saved to the harddrive
345 text_tmap saved_args;
346 saved_args["bc1fullname"] = g_EmptyText;
347 saved_args["bc1contactemail"] = g_EmptyText;
348 saved_args["bc1aboutdesc"] = g_EmptyText;
349 saved_args["bc1clone"] = g_EmptyText;
350 saved_args["bc1clonecol"] = g_EmptyText;
351 saved_args["bc1inputnum"] = g_EmptyText;
352 saved_args["bc1input"] = g_EmptyText;
353 saved_args["bc1inputtype"] = g_EmptyText;
354
355 // update the argdb database with any arguments that were set
356 // by previous page
357 text_tmap::iterator here = saved_args.begin();
358 text_tmap::iterator end = saved_args.end();
359 while (here != end) {
360 if (args.lookupcgiarg((*here).first).source != cgiarg_t::default_arg) {
361 (*here).second = args[(*here).first];
362 }
363 ++here;
364 }
365
366 text_t argfile = filename_cat(gsdlhome, "tmp", args["bc1tmp"], "argdb.db");
367 argdb *args_on_disk = new argdb(argfile);
368 if (!args_on_disk->update_args(saved_args)) {
369 // error
370 logout << "collectoraction: argdb::update_args failed (" << argfile << ")\n";
371 }
372
373 // update args from argdb
374 saved_args.erase(saved_args.begin(), saved_args.end());
375 if (!args_on_disk->get_args(saved_args)) {
376 // error
377 logout << "collectoraction: argdb::get_args failed (" << argfile << ")\n";
378 }
379 delete args_on_disk;
380 here = saved_args.begin();
381 end = saved_args.end();
382 while (here != end) {
383 if (!(*here).second.empty()) {
384 args[(*here).first] = (*here).second;
385 }
386 ++here;
387 }
388 }
389
390 if (args["bc1infochanged"] == "1") {
391
392 if (args["bc1dirname"].empty()) {
393 // we've just come from the "collection information" page for the
394 // first time so we'll need to create the collection with mkcol.pl
395 // and set up bc1dirname - we do this part here instead of in do_action
396 // because the bc1dirname argument must be set to its new value before
397 // the compressedoptions macros are set.
398 args["bc1dirname"] = get_directory_name (args["bc1fullname"]);
399
400 text_t createfile = filename_cat (gsdlhome, "tmp", args["bc1tmp"], ".create");
401 if (!file_exists (createfile)) {
402 // we could do the mkcol.pl here but I guess it's nicer to do it in do_action()
403 do_mkcol = true;
404 } else {
405 // .create file already exists but bc1dirname wasn't set ... this should only be
406 // able to occur when the "reload" (and possibly the "back" and "forward" buttons)
407 // have been used to get us here.
408 // we'll check that the bc1dirname directory exists (in case of the unlikely
409 // possibility that get_directory_name returned a different value this time
410 // than it did originally).
411 text_t coldir = filename_cat (get_collectdir(args), args["bc1dirname"]);
412 if (!directory_exists (coldir)) {
413 message = "reloaderror";
414 return true;
415 }
416 }
417 } else {
418 // "collection information" has been changed after collection already exists
419 // so we'll need to update the cfg file.
420 update_cfgfile_partial (args, false, logout);
421 }
422 }
423
424 if (args["bc1cfgchanged"] == "1") {
425 // configuration file has been changed from the "configure collection"
426 // page. we need to update the file on disk and catch bc1 arguments up
427 // with changes.
428 update_cfgfile_complete (args, logout);
429 }
430
431 if (args["bc1clonechanged"] == "1") {
432 // cloning option has been changed on "source data" page. if it was turned
433 // on we want to create a new collect.cfg file using the bc1clonecol cfg file
434 // as a model (we'll save the old file as collect.cfg.org). if cloning was
435 // turned off we'll revert to using the collect.cfg.org file (which will need
436 // updating in case the bc1 arguments have been altered since cloning was
437 // turned on).
438 update_cfgfile_clone (args, logout);
439
440 // if cloning has just been turned on we'll also copy the rest of the files
441 // (excluding collect.cfg which we've already done) from the cloned collections
442 // etc directory to the new collection.
443 if (args["bc1clone"] == "1") {
444 text_t clone_etc = filename_cat(gsdlhome, "collect", args["bc1clonecol"], "etc");
445 text_t new_etc = filename_cat(get_collectdir(args), args["bc1dirname"], "etc");
446 text_tarray files;
447
448 if (read_dir (clone_etc, files)) {
449 text_tarray::const_iterator here = files.begin();
450 text_tarray::const_iterator end = files.end();
451 while (here != end) {
452 if (*here != "collect.cfg" && *here != "collect.cfg.org") {
453 file_copy (filename_cat(clone_etc, *here), filename_cat(new_etc, *here));
454 }
455 ++here;
456 }
457 } else {
458 outconvertclass text_t2ascii;
459 logout <<text_t2ascii << "collectoraction::check_cgiargs couldn't read from "
460 << clone_etc << " directory\n";
461 }
462 }
463 }
464
465 if (current_page == "bildstatus" || current_page == "bildcancel") {
466 // if .final file exists then build has finished
467 text_t fbld = filename_cat (gsdlhome, "tmp", args["bc1tmp"], args["bc1dirname"] + ".bld.final");
468 if (file_exists (fbld)) {
469 char *fbldc = fbld.getcstr();
470 ifstream fbld_in (fbldc);
471 if (fbld_in) {
472 failcode = fbld_in.get();
473 fbld_in.close();
474 if (failcode == '0') {
475 // success - we need to create and configure a collection server for the
476 // newly built collection (for fastcgi and local library where
477 // initialization isn't going to be redone when the user clicks the
478 // "view your new collection" button
479 create_colserver (args["bc1dirname"], logout);
480 current_page = "bilddone";
481 }
482 else current_page = "bildfail";
483 } else {
484 // assume build failed (we shouldn't get here though ... right?)
485 current_page = "bildfail";
486 }
487 delete []fbldc;
488 }
489 }
490
491 if (args["bc1fromsrce"] == "1") {
492
493 // we've just come from the "source data" page so we need to check that
494 // input sources are valid
495 if (!check_sources(args, logout)) {
496 args["p"] = "srce";
497 }
498 }
499
500 return true;
501}
502
503void collectoraction::update_cfgfile_clone (cgiargsclass &args, ostream &logout) {
504
505 text_t tmpdir = filename_cat(gsdlhome, "tmp", args["bc1tmp"]);
506 text_t cfgfile = filename_cat(tmpdir, args["bc1dirname"], "etc", "collect.cfg");
507 if (!file_exists (cfgfile)) {
508 message = "tmpfail";
509 return;
510 }
511
512 text_t cfgfile_org = filename_cat (tmpdir, "collect.cfg.org");
513
514 if (args["bc1clone"] == "1") {
515 // cloning was turned on
516
517 text_t cfgfile_clone = filename_cat(gsdlhome, "collect", args["bc1clonecol"], "etc", "collect.cfg");
518 if (file_exists (cfgfile_clone)) {
519 // if .org file doesn't exist already create it
520 if (!file_exists (cfgfile_org)) {
521 if (!file_copy (cfgfile, cfgfile_org)) {
522 message = "tmpfail";
523 return;
524 }
525 }
526 // copy clone collections cfg file to new collection
527 if (!file_copy (cfgfile_clone, cfgfile)) {
528 message = "tmpfail";
529 return;
530 }
531 // update the new cfg file
532 update_cfgfile_partial (args, true, logout);
533
534 } else {
535 // can't clone non-existant or read-protected collection
536 message = "clonefail";
537 }
538
539 } else {
540 // cloning has been turned off having been on at some point. the .org file
541 // should exist, if it doesn't we'll bail out and leave the user with the
542 // cloned copy
543 if (file_exists (cfgfile_org)) {
544 // copy original back again and update it with any recent changes
545 if (file_copy (cfgfile_org, cfgfile)) {
546 update_cfgfile_partial (args, false, logout);
547 } else {
548 message = "tmpfail";
549 }
550 }
551 }
552}
553
554// update configuration file on disk to match bc1 arguments
555// there's a special case if the clone option is true as certain parts of a
556// config file should not be cloned (e.g. the iconcollection stuff)
557void collectoraction::update_cfgfile_partial (cgiargsclass &args, bool clone, ostream &logout) {
558
559 text_t cfgfile = filename_cat(get_collectdir(args), args["bc1dirname"], "etc", "collect.cfg");
560 char *cfgfilec = cfgfile.getcstr();
561
562#if defined (__WIN32__)
563 // make sure collect.cfg isn't read-only
564 _chmod (cfgfilec, _S_IREAD | _S_IWRITE);
565#endif
566
567 vector<text_tarray> cfgarray;
568
569 // read in cfg file
570 ifstream cfg_in (cfgfilec);
571 if (cfg_in) {
572 text_tarray cfgline;
573 while (read_cfg_line(cfg_in, cfgline) >= 0) {
574 if (cfgline.size () >= 2) {
575 if (cfgline[0] == "creator" || cfgline[0] == "maintainer") {
576 cfgline[1] = args["bc1contactemail"];
577 } else if (cfgline[0] == "collectionmeta") {
578 if (cfgline[1] == "collectionname") {
579 cfgline[2] = args["bc1fullname"];
580 } else if (cfgline[1] == "collectionextra") {
581 cfgline[2] = carriage_replace (args["bc1aboutdesc"], 0);
582 } else if (clone && (cfgline[1] == "iconcollection" ||
583 cfgline[1] == "iconcollectionsmall")) {
584 cfgline[2] = g_EmptyText;
585 }
586 }
587 }
588 cfgarray.push_back (cfgline);
589 }
590 cfg_in.close();
591
592 // now write cfg file back out
593 int fd=open(cfgfilec, O_WRONLY | O_CREAT | O_TRUNC
594#if defined(__WIN32__)
595 | O_BINARY
596#endif
597 );
598
599 if (fd != -1) {
600 // lock the file
601 int lock_val = 1;
602 GSDL_LOCK_FILE (fd);
603 if (lock_val != 0) {
604 logout << "Error: Couldn't lock file " << cfgfilec << "\n";
605 close(fd);
606 message = "tmpfail";
607
608 } else {
609
610 vector<text_tarray>::const_iterator this_line = cfgarray.begin();
611 vector<text_tarray>::const_iterator end_line = cfgarray.end();
612 while (this_line != end_line) {
613 write_cfg_line (fd, *this_line);
614 ++this_line;
615 }
616 GSDL_UNLOCK_FILE (fd);
617 close(fd);
618 }
619
620 } else {
621 logout << "collectoraction::update_cfgfile_partial: unable to open "
622 << cfgfilec << " for output\n";
623 message = "tmpfail";
624 }
625
626 } else {
627 logout << "collectoraction::update_cfgfile_partial: unable to open "
628 << cfgfilec << " for input\n";
629 message = "tmpfail";
630 }
631
632 delete []cfgfilec;
633}
634
635// replace configuration file on disk with that in the cfgfile argument and
636// catch other bc1 arguments up with those the new cfgfile contains
637void collectoraction::update_cfgfile_complete (cgiargsclass &args, ostream &logout) {
638
639 text_t cfgfile = filename_cat(get_collectdir(args), args["bc1dirname"], "etc", "collect.cfg");
640 char *cfgfilec = cfgfile.getcstr();
641
642#ifdef __WIN32__
643 // make sure collect.cfg isn't read-only
644 _chmod (cfgfilec, _S_IREAD | _S_IWRITE);
645#endif
646
647 int fd=open(cfgfilec, O_WRONLY | O_CREAT | O_TRUNC
648#if defined(__WIN32__)
649 | O_BINARY
650#endif
651 );
652
653 if (fd) {
654 // lock the file
655 int lock_val = 1;
656 GSDL_LOCK_FILE (fd);
657 if (lock_val != 0) {
658 logout << "Error: Couldn't lock file " << cfgfilec << "\n";
659 close(fd);
660 message = "tmpfail";
661
662 } else {
663
664 outconvertclass text_t2ascii;
665 text_t2ascii.setinput(&args["cfgfile"]);
666 size_t buffersize=args["cfgfile"].size();
667 char *buffer=new char[buffersize];
668 buffer[0]='\n'; // just in case something goes wrong...
669 size_t num_chars;
670 convertclass::status_t status;
671 text_t2ascii.convert(buffer, buffersize, num_chars, status);
672 // ignore status - assume it is "finished" as buffer is big enough
673 write(fd, buffer, num_chars);
674 GSDL_UNLOCK_FILE (fd);
675 close(fd);
676 delete []buffer;
677
678 // now that we've written the file we'll read it back again and
679 // update our bc1 arguments
680 ifstream cfg_in (cfgfilec);
681 if (cfg_in) {
682 text_tarray cfgline;
683 while (read_cfg_line(cfg_in, cfgline) >= 0) {
684 if (cfgline.size () >= 2) {
685 if (cfgline[0] == "creator") {
686 args["bc1contactemail"] = cfgline[1];
687 } else if (cfgline[0] == "collectionmeta") {
688 if (cfgline[1] == "collectionname") {
689 args["bc1fullname"] = cfgline[2];
690 } else if (cfgline[1] == "collectionextra") {
691 args["bc1aboutdesc"] = carriage_replace (cfgline[2], 1);
692 }
693 }
694 }
695 }
696 cfg_in.close();
697 } else {
698 logout << "collectoraction::update_cfgfile_complete: unable to open "
699 << cfgfilec << " for input\n";
700 message = "tmpfail";
701 }
702 }
703 } else {
704 logout << "collectoraction::update_cfgfile_complete: unable to open "
705 << cfgfilec << " for output\n";
706 message = "tmpfail";
707 }
708
709 delete []cfgfilec;
710}
711
712void collectoraction::get_cgihead_info (cgiargsclass &/*args*/, recptprotolistclass * /*protos*/,
713 response_t &response,text_t &response_data,
714 ostream &/*logout*/) {
715 response = content;
716 response_data = "text/html";
717}
718
719// return html for buttons used in collector bar
720// color may be "green", "grey", or "yellow"
721// type may be:
722// "info" --> "collection information" button
723// "srce" --> "source data" button
724// "conf" --> "configure collection" button
725// "bild" --> "build collection" button
726// "view" --> "view collection" button
727// if enabled is true button will be flashy rollover type and
728// will be hyperlinked
729
730text_t collectoraction::get_button(const text_t &thispage, const text_t &color,
731 const text_t &type, bool enabled) {
732
733 if ((color != "green" && color != "grey" && color != "yellow") ||
734 (type != "info" && type != "srce" && type != "conf" && type != "bild" && type != "view"))
735 return g_EmptyText;
736
737 text_t href = "_http"+type+"_";
738 text_t target = "";
739 if (thispage == "info" || thispage == "srce" || thispage == "conf" ||
740 thispage == "bildcancel" || thispage == "bildfail") {
741 // call the check submit macro instead of linking directly to the page
742 href="\"javascript:check_submit('"+type+"');\"";
743 } else if (type == "view") {
744 // view button is special case as it needs a target=_top
745 target = " target=_top";
746 }
747
748 text_t tdclass = "collectorbar"+color;
749 if (enabled) {
750 // link to the appropriate page
751 return "<td class="+tdclass+"><a href="+href+target+">_text"+type+"_</a></td>";
752 }
753 else {
754 // just display the text
755 return "<td class="+tdclass+">_text"+type+"_</td>";
756 }
757}
758
759
760// set the _fullnamemenu_ macro (and _warnindex_ and _selectedindex_ if
761// we're on the "srce" page)
762void collectoraction::set_fullnamemenu (displayclass &disp, cgiargsclass &args,
763 recptprotolistclass *protos, ostream &logout) {
764
765 if (recpt == NULL) {
766 logout << "ERROR (collectoraction::set_fullnamemenu): This action does not contain\n"
767 << " information about any receptionists. The method set_receptionist was\n"
768 << " probably not called from the module which instantiated this action.\n";
769 return;
770 }
771
772 text_t &current_page = args["p"];
773 text_t currentname = args["bc1dirname"];
774 if (current_page == "srce") currentname = args["bc1clonecol"];
775
776 text_tarray dirnames;
777 text_tarray fullnames;
778 vector<bool> write_protected;
779 bool is_selected = false;
780 int selected_index = 0;
781 int index = 0;
782
783 recptprotolistclass::iterator rprotolist_here = protos->begin();
784 recptprotolistclass::iterator rprotolist_end = protos->end();
785 while (rprotolist_here != rprotolist_end) {
786 if ((*rprotolist_here).p != NULL) {
787
788 // don't include z39.50 collections
789 comerror_t err = noError;
790 if ((*rprotolist_here).p->get_protocol_name (err) == "z3950proto") {
791 ++rprotolist_here;
792 continue;
793 }
794
795 text_tarray collist;
796 (*rprotolist_here).p->get_collection_list (collist, err, logout);
797 if (err == noError) {
798 text_tarray::iterator collist_here = collist.begin();
799 text_tarray::iterator collist_end = collist.end();
800 while (collist_here != collist_end) {
801 ColInfoResponse_t *cinfo = recpt->get_collectinfo_ptr ((*rprotolist_here).p, *collist_here, logout);
802 if (cinfo != NULL) {
803 text_t collectionname = cinfo->get_collectionmeta("collectionname", args["l"]);
804 if (collectionname.empty()) {
805 collectionname = *collist_here;
806 }
807 dirnames.push_back(*collist_here);
808 fullnames.push_back(collectionname);
809 // check to see if the collection is writable
810 if (collection_protected (*collist_here)) write_protected.push_back(true);
811 else write_protected.push_back(false);
812
813 if (*collist_here == currentname) {
814 is_selected = true;
815 selected_index = index;
816 }
817 ++index;
818 }
819 ++collist_here;
820 }
821 }
822 }
823 ++rprotolist_here;
824 }
825
826 bool first = true;
827 text_t warnindex;
828 text_t fullnamemenu = "<select name=\"bc1dirname\">\n";
829 if (current_page == "srce") {
830 fullnamemenu = "<select name=\"bc1clonecol\" onChange=\"menuchange();\">\n";
831 fullnamemenu += "<option value=defaultstructure";
832 if (!is_selected) fullnamemenu += " selected>";
833 else fullnamemenu.push_back('>');
834 fullnamemenu += "_collector:textdefaultstructure_\n";
835 }
836 for (int i = 0; i < index; ++i) {
837 // don't want write protected collections in list on "change existing
838 // collection" page
839 if (write_protected[i] && current_page == "existing") continue;
840 fullnamemenu += "<option value=\"" + dirnames[i] + "\"";
841 if ((i == 0 && !is_selected && current_page != "srce") ||
842 (is_selected && i == selected_index)) {
843 fullnamemenu += " selected";
844 ++selected_index;
845 is_selected = false;
846 }
847 fullnamemenu.push_back ('>');
848 fullnamemenu += fullnames[i];
849 fullnamemenu.push_back ('\n');
850
851 // add to Warnindex if collection uses any dubious plugins
852 // (if creating clone collection list)
853 if (current_page == "srce") {
854 if (first) warnindex += "0,";
855 else warnindex.push_back(',');
856 if (uses_weird_plugin (dirnames[i])) {
857 warnindex += text_t (1);
858 } else {
859 warnindex += text_t (0);
860 }
861 }
862 first = false;
863 }
864 fullnamemenu += "</select>\n";
865
866 disp.setmacro ("fullnamemenu", "collector", fullnamemenu);
867 if (current_page == "srce") {
868 disp.setmacro ("warnindex", "collector", warnindex);
869 disp.setmacro ("selectedindex", "collector", text_t(selected_index));
870 }
871}
872
873// set _sourcelist_ and _badsources_ macros
874void collectoraction::set_inputsourceboxes (displayclass &disp, cgiargsclass &args,
875 ostream &logout) {
876
877 if (badsources) disp.setmacro ("badsources", "collector", "1");
878
879 text_t sourcelist = get_source_box(args["bc1input"], args["bc1inputnum"].getint(),
880 args["bc1inputtype"]);
881
882 disp.setmacro("sourcelist", "collector", sourcelist);
883
884 // reset badsources and failedsources variables
885 badsources = false;
886 failedsources.erase(failedsources.begin(), failedsources.end());
887}
888
889text_t collectoraction::get_source_box (text_t inputarglist, int numboxes,
890 text_t inputtypelist) {
891
892 text_tarray inputvalues;
893 splitchar (inputarglist.begin(), inputarglist.end(), ',', inputvalues);
894 // remove any empty values from the end of the array
895 if (inputvalues.size()) {
896 text_tarray::iterator l = inputvalues.end() - 1;
897 text_tarray::iterator b = inputvalues.begin();
898 while ((*l).empty() && l >= b) {
899 --l;
900 }
901 inputvalues.erase(l+1, inputvalues.end());
902 }
903
904 text_tarray inputtypes;
905 splitchar (inputtypelist.begin(), inputtypelist.end(), ',', inputtypes);
906
907 int numvalues = inputvalues.size();
908 int numtypes = inputtypes.size();
909
910 text_t last = "file://";
911 text_t rv;
912 for (int i = 0; i < numboxes; ++i) {
913 rv += "<nobr><select name=\"bc1inputtype\">\n";
914 rv += "<option value=\"file://\"";
915 if ((i < numtypes && inputtypes[i] == "file://") ||
916 (numboxes == 3 && i == 0 && numvalues == 0) ||
917 (i >= 3 && i >= numvalues && last == "file://")) {
918 rv += " selected";
919 last = "file://";
920 }
921 rv += ">file://\n";
922 rv += "<option value=\"http://\"";
923 if ((i < numtypes && inputtypes[i] == "http://") ||
924 (numboxes == 3 && i == 1 && numvalues == 0) ||
925 (i >= 3 && i >= numvalues && last == "http://")) {
926 rv += " selected";
927 last = "http://";
928 }
929 rv += ">http://\n";
930 rv += "<option value=\"ftp://\"";
931 if ((i < numtypes && inputtypes[i] == "ftp://") ||
932 (numboxes == 3 && i == 2 && numvalues == 0) ||
933 (i >= 3 && i >= numvalues && last == "ftp://")) {
934 rv += " selected";
935 last = "ftp://";
936 }
937 rv += ">ftp://\n";
938 rv += "</select>\n";
939 rv += "<input type=text name=\"bc1input\" value=\"";
940 if (i < numvalues) {
941 rv += dm_safe(decode_commas(inputvalues[i]));
942 }
943 rv += "\" size=50>";
944 if (badsources) {
945 if ((i < numvalues) && (!inputvalues[i].empty())) {
946 if (failedsources[decode_commas(inputvalues[i])] == "1") {
947 rv += "_iconcross_";
948 } else {
949 rv += "_icontick_";
950 }
951 } else {
952 rv += "_iconblank_";
953 }
954 }
955 if (i+1 == numboxes) {
956 if (!badsources) rv += "_iconblank_";
957 rv += "_imagemore_</nobr><br>";
958 } else {
959 rv += "</nobr><br>\n";
960 }
961 }
962
963 return rv;
964}
965
966// set the _cfgfile_ macro
967void collectoraction::set_cfgfile (displayclass &disp, cgiargsclass &args, ostream &logout) {
968
969 text_t &collection = args["bc1dirname"];
970 if (collection.empty()) {
971 message = "nocollection";
972 return;
973 }
974
975 // read in collect.cfg
976 text_t cfgfile = filename_cat(get_collectdir(args), collection, "etc", "collect.cfg");
977 char *cfgfilec = cfgfile.getcstr();
978
979#ifdef GSDL_USE_IOS_H
980 ifstream cfg_ifs (cfgfilec, ios::in | ios::nocreate);
981#else
982 ifstream cfg_ifs (cfgfilec, ios::in);
983#endif
984
985 if (cfg_ifs) {
986 // read in collect.cfg
987 text_t cfgtext;
988 char c;
989 cfg_ifs.get(c);
990 while (!cfg_ifs.eof ()) {
991 cfgtext.push_back(c);
992 cfg_ifs.get(c);
993 }
994 cfg_ifs.close();
995
996 // define it as a macro
997 disp.setmacro("cfgfile", "collector", dm_safe(cfgtext));
998
999 } else {
1000 logout << "collectoraction::set_cfgfile: couldn't open configuration file ("
1001 << cfgfilec << ") for reading\n";
1002 message = "tmpfail";
1003 }
1004 delete []cfgfilec;
1005}
1006
1007// set the _statusline_ macro
1008void collectoraction::set_statusline (displayclass &disp, cgiargsclass &args, ostream & /*logout*/) {
1009
1010 // the build command creates .bld.download, .bld.import, and .bld.build files (in that
1011 // order) and deletes them (also in that order) when each stage is complete. the .bld
1012 // file is the concatenation of all these files.
1013 text_t bld_file = filename_cat (gsdlhome, "tmp", args["bc1tmp"], args["bc1dirname"] + ".bld");
1014 text_t statusline;
1015
1016 if (file_exists (bld_file + ".download")) {
1017 statusline = "_collector:textdownloadingfiles_<br>\n";
1018 statusline += dm_safe(file_tail(bld_file + ".download", 1, 0));
1019 } else if (file_exists (bld_file + ".import")) {
1020 statusline = "_collector:textimportingcollection_<br>\n";
1021 statusline += dm_safe(file_tail(bld_file + ".import", 1, 0));
1022 } else if (file_exists (bld_file + ".build")) {
1023 statusline = "_collector:textbuildingcollection_<br>\n";
1024 statusline += dm_safe(file_tail(bld_file + ".build", 1, 0));
1025 } else {
1026 statusline += "_collector:textcreatingcollection_<br>\n";
1027 statusline += dm_safe(file_tail(bld_file, 1, 0));
1028 }
1029
1030 disp.setmacro ("statusline", "collector", statusline);
1031
1032}
1033
1034void collectoraction::define_internal_macros (displayclass &disp, cgiargsclass &args,
1035 recptprotolistclass *protos, ostream &logout) {
1036
1037 // define_internal_macros sets the following macros:
1038 // _collectorbar_
1039 // _pagescriptextra_
1040 // _fullnamemenu_ -- if displaying the "source data" page or the "changing existing
1041 // collection" page
1042 // _cfgfile_ -- if displaying the "configure collection" page
1043 // _statusline_ -- if displaying the bildstatus page
1044 // _header_ -- may be set for pages that require it
1045 // _textfailmsg_ -- set to different messages depending on failcode returned
1046 // by build script (if build fails)
1047 // _faillog_ - set to last 6 lines of .bld file if build failed
1048 // _gsdlhome_ - the gsdlhome path (dm_safe)
1049 // _sourcelist_ -- "input source" text boxes
1050 // _badsources_ -- will be set to "1" if we've come from the
1051 // "source data" page and there's a problem
1052 // with the input sources
1053
1054 text_t &collector_page = args["p"];
1055 int esrce = args["bc1esrce"].getint();
1056 int econf = args["bc1econf"].getint();
1057
1058 // set _pagescriptextra_ macro to _cpagescriptextra_
1059 disp.setmacro ("pagescriptextra", "collector", "_" + collector_page + "scriptextra_");
1060
1061 if (collector_page == "bildstatus" || collector_page == "bilddone" ||
1062 collector_page == "bildfail" || collector_page == "bildframe1") {
1063 disp.setmacro ("header", "collector", "_" + collector_page + "header_");
1064 }
1065
1066 // set the collectorbar macro
1067 text_t collectorbar = "<table class=collectorbar border=0 cellspacing=4 cellpadding=0><tr>\n";
1068
1069 if (collector_page == "new") {
1070 collectorbar += "<td>_icongreyarrow_</td>\n";
1071 collectorbar += get_button (collector_page, "green", "info", true);
1072 collectorbar += "<td>_icongreyarrow_</td>\n";
1073 collectorbar += get_button (collector_page, "grey", "srce", false);
1074 collectorbar += "<td>_icongreyarrow_</td>\n";
1075 collectorbar += get_button (collector_page, "grey", "conf", false);
1076 collectorbar += "<td>_icongreyarrow_</td>\n";
1077 collectorbar += get_button (collector_page, "grey", "bild", false);
1078 collectorbar += "<td>_icongreyarrow_</td>\n";
1079 collectorbar += get_button (collector_page, "grey", "view", false);
1080
1081 } else if (collector_page == "info") {
1082 collectorbar += "<td>_icongreyarrow_</td>\n";
1083 collectorbar += get_button (collector_page, "yellow", "info", false);
1084 collectorbar += "<td>_icongreyarrow_</td>\n";
1085 collectorbar += get_button (collector_page, "green", "srce", true);
1086 collectorbar += "<td>_icongreyarrow_</td>\n";
1087 collectorbar += get_button (collector_page, "grey", "conf", false);
1088 collectorbar += "<td>_icongreyarrow_</td>\n";
1089 collectorbar += get_button (collector_page, "grey", "bild", false);
1090 collectorbar += "<td>_icongreyarrow_</td>\n";
1091 collectorbar += get_button (collector_page, "grey", "view", false);
1092 collectorbar += "</tr><tr><td></td><td align=center>_icongreyuparrow_</td><td colspan=8></td>\n";
1093
1094 } else if (collector_page == "srce") {
1095 collectorbar += "<td>_icongreyarrow_</td>\n";
1096 if (esrce == 1) {
1097 // if we came from the "change an existing collection" page previous button(s)
1098 // are disabled
1099 collectorbar += get_button (collector_page, "grey", "info", false);
1100 } else {
1101 collectorbar += get_button (collector_page, "yellow", "info", true);
1102 }
1103 collectorbar += "<td>_icongreyarrow_</td>\n";
1104 collectorbar += get_button (collector_page, "yellow", "srce", false);
1105 collectorbar += "<td>_icongreyarrow_</td>\n";
1106 collectorbar += get_button (collector_page, "green", "conf", true);
1107 collectorbar += "<td>_icongreyarrow_</td>\n";
1108 collectorbar += get_button (collector_page, "green", "bild", true);
1109 collectorbar += "<td>_icongreyarrow_</td>\n";
1110 collectorbar += get_button (collector_page, "grey", "view", false);
1111 collectorbar += "</tr><tr><td colspan=3></td><td align=center>_icongreyuparrow_</td><td colspan=6></td>\n";
1112
1113 } else if (collector_page == "conf") {
1114 collectorbar += "<td>_icongreyarrow_</td>\n";
1115 // disable appropriate buttons if we came from "change an existing collection"
1116 // page
1117 if (esrce == 1 || econf == 1) {
1118 collectorbar += get_button (collector_page, "grey", "info", false);
1119 } else {
1120 collectorbar += get_button (collector_page, "yellow", "info", true);
1121 }
1122 collectorbar += "<td>_icongreyarrow_</td>\n";
1123 if (econf == 1) {
1124 collectorbar += get_button (collector_page, "grey", "srce", false);
1125 } else {
1126 collectorbar += get_button (collector_page, "yellow", "srce", true);
1127 }
1128 collectorbar += "<td>_icongreyarrow_</td>\n";
1129 collectorbar += get_button (collector_page, "yellow", "conf", false);
1130 collectorbar += "<td>_icongreyarrow_</td>\n";
1131 collectorbar += get_button (collector_page, "green", "bild", true);
1132 collectorbar += "<td>_icongreyarrow_</td>\n";
1133 collectorbar += get_button (collector_page, "grey", "view", false);
1134 collectorbar += "</tr><tr><td colspan=5></td><td align=center>_icongreyuparrow_</td><td colspan=4></td>\n";
1135
1136 } else if (collector_page == "bilddone") {
1137 collectorbar += "<td>_icongreyarrow_</td>\n";
1138 // all previous buttons grey after build was completed
1139 collectorbar += get_button (collector_page, "grey", "info", false);
1140 collectorbar += "<td>_icongreyarrow_</td>\n";
1141 collectorbar += get_button (collector_page, "grey", "srce", false);
1142 collectorbar += "<td>_icongreyarrow_</td>\n";
1143 collectorbar += get_button (collector_page, "grey", "conf", false);
1144 collectorbar += "<td>_icongreyarrow_</td>\n";
1145 collectorbar += get_button (collector_page, "yellow", "bild", false);
1146 collectorbar += "<td>_icongreyarrow_</td>\n";
1147 collectorbar += get_button (collector_page, "green", "view", true);
1148 collectorbar += "</tr><tr><td colspan=7></td><td align=center>_icongreyuparrow_</td><td colspan=2></td>\n";
1149
1150 } else if (collector_page == "bildcancel" || collector_page == "bildfail") {
1151 collectorbar += "<td>_icongreyarrow_</td>\n";
1152 // disable appropriate buttons if we came from "change an existing collection"
1153 // page
1154 if (esrce == 1 || econf == 1) {
1155 collectorbar += get_button (collector_page, "grey", "info", false);
1156 } else {
1157 collectorbar += get_button (collector_page, "yellow", "info", true);
1158 }
1159 collectorbar += "<td>_icongreyarrow_</td>\n";
1160 if (econf == 1) {
1161 collectorbar += get_button (collector_page, "grey", "srce", false);
1162 } else {
1163 collectorbar += get_button (collector_page, "yellow", "srce", true);
1164 }
1165 collectorbar += "<td>_icongreyarrow_</td>\n";
1166 collectorbar += get_button (collector_page, "yellow", "conf", true);
1167 collectorbar += "<td>_icongreyarrow_</td>\n";
1168 collectorbar += get_button (collector_page, "yellow", "bild", true);
1169 collectorbar += "<td>_icongreyarrow_</td>\n";
1170 collectorbar += get_button (collector_page, "grey", "view", false);
1171 }
1172
1173 collectorbar += "</tr></table>\n";
1174 disp.setmacro ("collectorbar", "collector", collectorbar);
1175
1176 if (collector_page == "bildfail") {
1177
1178 text_t textfailmsg = "_textfailmsg";
1179 textfailmsg.push_back(failcode);
1180 textfailmsg.push_back('_');
1181 disp.setmacro("textfailmsg", "collector", textfailmsg);
1182
1183 text_t bldlog = filename_cat(gsdlhome, "tmp", args["bc1tmp"], args["bc1dirname"] + ".bld");
1184 text_t rawlog = file_tail (bldlog, 6, 0);
1185 // we'll shove in some <br> tags where \n's occur
1186 text_t faillog;
1187 text_t::const_iterator here = rawlog.begin();
1188 text_t::const_iterator end = rawlog.end();
1189 while (here != end) {
1190 if (*here == '\n') faillog += "<br>";
1191 faillog.push_back (*here);
1192 ++here;
1193 }
1194 disp.setmacro ("faillog", "collector", dm_safe(faillog));
1195 }
1196
1197 if (collector_page == "srce" || collector_page == "existing")
1198 set_fullnamemenu (disp, args, protos, logout);
1199 if (collector_page == "conf")
1200 set_cfgfile (disp, args, logout);
1201 if (collector_page == "bildstatus")
1202 set_statusline (disp, args, logout);
1203 if (collector_page == "srce") {
1204 set_inputsourceboxes (disp, args, logout);
1205 }
1206
1207 disp.setmacro ("gsdlhome", "collector", dm_safe(gsdlhome));
1208}
1209
1210bool collectoraction::do_action (cgiargsclass &args, recptprotolistclass * /*protos*/,
1211 browsermapclass * /*browsers*/, displayclass &disp,
1212 outconvertclass &outconvert, ostream &textout,
1213 ostream &logout) {
1214
1215 // make sure the collector is enabled
1216 if (disabled) {
1217 textout << outconvert
1218 << "<html>\n"
1219 << "<head>\n"
1220 << "<title>Collector disabled</title>\n"
1221 << "</head>\n"
1222 << "<body bgcolor=\"#ffffff\" text=\"#000000\" link=\"#006666\" "
1223 << "alink=\"#cc9900\" vlink=\"#666633\">\n"
1224 << "<h2>Facility disabled</h2>\n"
1225 << "Sorry, the Collector end-user collection building facility is currently disabled\n"
1226 << "\n</body>\n"
1227 << "</html>\n";
1228 return true;
1229 }
1230
1231 text_t &collector_page = args["p"];
1232 text_t &collection = args["bc1dirname"];
1233
1234 // make sure we have perl (we won't bother with this check for the
1235 // building status pages to avoid slowing things down unneccessarily)
1236 if (collector_page != "bildstatus" && collector_page != "bildframe1" && !perl_ok(logout)) {
1237 textout << outconvert
1238 << "<html>\n"
1239 << "<head>\n"
1240 << "<title>Perl not found</title>\n"
1241 << "</head>\n"
1242 << "<body bgcolor=\"#ffffff\" text=\"#000000\" link=\"#006666\" "
1243 << "alink=\"#cc9900\" vlink=\"#666633\">\n"
1244 << "<h2>Perl not found</h2>\n"
1245 << "Greenstone could not detect perl on this system. It is therefore not\n"
1246 << "possible to build a Greenstone collection, either from the Collector or the \n"
1247 << "command-line tools, or to use the Collector for any other task.\n"
1248 << "<p>Please refer to the Greenstone Installer's Guide for details on\n"
1249 << "installing perl on your system.\n"
1250 << "\n</body>\n"
1251 << "</html>\n";
1252 return true;
1253
1254 }
1255
1256 if (collector_page == "bild") {
1257 // do the work (download, import, build)
1258 gsdl_build (args, logout);
1259
1260 if (message.empty()) {
1261 // bild page is a frameset so we don't want headers and stuff
1262 textout << outconvert << disp << ("_collector:bildcontent_\n");
1263 }
1264 }
1265
1266 if (do_mkcol == true) {
1267 // execute mkcol.pl (do_mkcol is set from within check_cgiargs)
1268 gsdl_mkcol (args, logout);
1269 do_mkcol = false; // reset for fast-cgi
1270 }
1271
1272 if (args["bc1dodelete"] == "1") {
1273 // delete bcidirname collection
1274 if (collection_protected (collection)) {
1275 message = "delinvalid";
1276
1277 } else {
1278
1279 const recptconf &rcinfo = recpt->get_configinfo ();
1280 bool emailuserevents = rcinfo.EmailUserEvents;
1281
1282 // get collection maintainer email from collect.cfg before we
1283 // delete it
1284 text_t colmaintainer;
1285 text_t cfgfile = filename_cat(gsdlhome, "collect", collection, "etc", "collect.cfg");
1286 char *cfgfilec = cfgfile.getcstr();
1287 ifstream cfg_in (cfgfilec);
1288 delete []cfgfilec;
1289 if (cfg_in) {
1290 text_tarray cfgline;
1291 while (read_cfg_line(cfg_in, cfgline) >= 0) {
1292 if (cfgline.size () == 2 && cfgline[0] == "maintainer") {
1293 colmaintainer = cfgline[1];
1294 break;
1295 }
1296 }
1297 cfg_in.close();
1298 }
1299 if (colmaintainer.empty()) {
1300 logout << outconvert
1301 << "collectoraction::do_action WARNING: Collection being deleted ("
1302 << collection << ") has no maintainer address. EmailUserEvents "
1303 << "disabled\n";
1304 emailuserevents = false;
1305 }
1306
1307 // first we need to free up the collection's collection server
1308 // we must do this for the local library (and I guess when using
1309 // fastcgi too) as you can't delete the gdbm file while it's
1310 // being kept open by the collection server
1311 remove_colservr (collection, logout);
1312
1313 text_t delete_cmd = "perl -S delcol.pl -f " + collection;
1314 int rv = gsdl_system (delete_cmd, true, logout);
1315 if (rv != 0) {
1316 // deletion failed -- permissions?
1317 message = "delpermission";
1318 } else {
1319 message = "delsuccess";
1320 }
1321
1322 // log the event
1323 if (rcinfo.LogEvents == CollectorEvents || rcinfo.LogEvents == AllEvents) {
1324
1325 text_t eventlog = filename_cat (gsdlhome, "etc", "events.txt");
1326 char *eventlogt = eventlog.getcstr();
1327 ofstream eventl (eventlogt, ios::app);
1328 delete []eventlogt;
1329
1330 if (eventl) {
1331 eventl << outconvert << "[Collector Event]\n"
1332 << "Date: " << get_date (true) << "\n"
1333 << "Greenstone Username: " << args["un"] << "\n"
1334 << "Collection: " << collection << "\n"
1335 << "Collection Maintainer: " << colmaintainer << "\n"
1336 << "GSDLHOME: " << gsdlhome << "\n";
1337
1338 if (message == "delsuccess") {
1339 eventl << outconvert
1340 << "The " << collection << " collection was successfully deleted\n\n";
1341 } else {
1342 eventl << outconvert
1343 << "Attempt to delete the " << collection << " collection failed\n\n";
1344 }
1345 eventl.close();
1346
1347 } else {
1348 logout << outconvert << "collectoraction::do_action ERROR: Couldn't open "
1349 << "event log file " << eventlog << " for appending during collection "
1350 << "deletion. LogEvents disabled\n";
1351 }
1352 }
1353
1354 if (rcinfo.EmailEvents == CollectorEvents || rcinfo.EmailEvents == AllEvents || emailuserevents) {
1355 // use sendmail.pl perl script to send email events
1356 text_t tmpmailfile = filename_cat (gsdlhome, "tmp", args["bc1tmp"], "event.txt");
1357 char *tmpmailfilec = tmpmailfile.getcstr();
1358 ofstream tmpfile (tmpmailfilec);
1359 delete []tmpmailfilec;
1360 if (tmpfile) {
1361 tmpfile << outconvert << "[Collector Event]\n"
1362 << "Date: " << get_date (true) << "\n"
1363 << "Greenstone Username: " << args["un"] << "\n"
1364 << "Collection: " << collection << "\n"
1365 << "Collection Maintainer: " << colmaintainer << "\n"
1366 << "GSDLHOME: " << gsdlhome << "\n";
1367 if (message == "delsuccess") {
1368 tmpfile << outconvert
1369 << "The " << collection << " collection was successfully deleted\n\n";
1370 } else {
1371 tmpfile << outconvert
1372 << "Attempt to delete the " << collection << " collection failed\n\n";
1373 }
1374 tmpfile.close();
1375 text_t to;
1376 if (rcinfo.EmailEvents == CollectorEvents || rcinfo.EmailEvents == AllEvents) to += rcinfo.maintainer;
1377 if (emailuserevents) {
1378 if (!to.empty()) to.push_back (',');
1379 to += colmaintainer;
1380 }
1381 text_t sendmail_cmd = "perl -S sendmail.pl -to \"" + to + "\" -from \"" + rcinfo.maintainer;
1382 sendmail_cmd += "\" -smtp \"" + rcinfo.MailServer + "\" -subject \"Greenstone Collector Event\"";
1383 sendmail_cmd += " -msgfile \"" + tmpmailfile + "\"";
1384
1385 gsdl_system (sendmail_cmd, false, logout);
1386
1387 } else {
1388 logout << outconvert << "collectoraction::do_action ERROR: Couldn't open "
1389 << "temporary event log file " << tmpmailfile << " during collection "
1390 << "deletion. EmailEvents and EmailUserEvents disabled\n";
1391 }
1392 }
1393 }
1394 }
1395
1396 if (collector_page == "bildcancel" || collector_page == "bildfail") {
1397 // cancel the build (we'll also use the cancel_build script to tidy
1398 // up if the build failed)
1399 gsdl_cancel_build (args, logout);
1400 }
1401
1402 if (collector_page == "expt") {
1403
1404 // export the collection - we'll do a synchronous system call to
1405 // exportcol.pl as that's the easiest way to do it. if it becomes a
1406 // problem that it's taking too long to export a large collection then
1407 // we may have to revisit this.
1408 text_t tmpfile = filename_cat (gsdlhome, "tmp", collection + "_export.txt");
1409 text_t export_cmd = "perl -S exportcol.pl -out \"" + tmpfile + "\" " + collection;
1410 gsdl_system (export_cmd, true, logout);
1411 if (file_exists (tmpfile)) {
1412 text_t returnline = file_tail (tmpfile, 1, 0);
1413 if (returnline.size() > 23 && (substr(returnline.begin(), returnline.begin()+23) == "exportcol.pl succeeded:")) {
1414 // success
1415 message = "exptsuccess";
1416 } else {
1417 message = "exptfail";
1418 }
1419 } else {
1420 message = "exptfail";
1421 }
1422 }
1423
1424 if (message.empty()) {
1425 if (collector_page != "bild") {
1426 // output page ("bild" page was already output above)
1427 textout << outconvert << disp << ("_collector:header_\n")
1428 << ("_collector:" + collector_page + "content_\n")
1429 << ("_collector:footer_\n");
1430 }
1431 } else {
1432 // message was set somewhere (probably an error), output message page
1433 textout << outconvert << disp << ("_collector:header_\n")
1434 << ("_collector:" + message + "content_\n")
1435 << ("_collector:footer_\n");
1436 message.clear();
1437 }
1438 return true;
1439}
1440
1441// if sw = 0 replace all carriage returns in intext with the string "\n"
1442// else replace all occurances of "\n" with a carriage return
1443text_t collectoraction::carriage_replace (const text_t &intext, int sw) {
1444
1445 text_t outtext;
1446 text_t::const_iterator here = intext.begin();
1447 text_t::const_iterator end = intext.end();
1448 while (here != end) {
1449 if (sw == 0) {
1450 if (*here == '\n') {
1451 if ((here+1) != end && *(here+1) == '\r') ++here;
1452 outtext += "\\n";
1453 } else if (*here == '\r') {
1454 if ((here+1) != end && *(here+1) == '\n') ++here;
1455 outtext += "\\n";
1456 } else {
1457 outtext.push_back (*here);
1458 }
1459 } else if (*here == '\\' && (here+1) != end && *(here+1) == 'n') {
1460 outtext.push_back ('\n');
1461 ++here;
1462 } else {
1463 outtext.push_back (*here);
1464 }
1465 ++here;
1466 }
1467 return outtext;
1468}
1469
1470// create a short directory name from fullname
1471text_t collectoraction::get_directory_name (const text_t &fullname) {
1472
1473 text_t shortname;
1474 if (fullname.empty()) {
1475 shortname = "coll";
1476
1477 } else {
1478
1479 // first make all lowercase and remove any dodgy characters
1480 // (i.e. anything not [a-z]
1481 text_t::const_iterator here = fullname.begin();
1482 text_t::const_iterator end = fullname.end();
1483 while (here != end) {
1484 if ((*here >= 'A' && *here <= 'Z') || (*here >= 'a' && *here <= 'z') ||
1485 (*here == ' ')) {
1486 if (*here >= 'A' && *here <= 'Z') shortname.push_back (*here+32);
1487 else if (*here == ' ') {
1488 while ((*(here+1)) == ' ') ++here;
1489 shortname.push_back (*here);
1490 } else shortname.push_back (*here);
1491 }
1492 ++here;
1493 }
1494
1495 text_tarray words;
1496 splitchar (shortname.begin(), shortname.end(), ' ', words);
1497 int num_words = words.size();
1498
1499 if (num_words == 0) {
1500 shortname = "coll";
1501
1502 } else {
1503
1504 shortname.clear();
1505 int use_words = (num_words <= 6) ? num_words : 6;
1506 unsigned int substr_len = 6 / use_words;
1507
1508 for (int i = 0; i < use_words; ++i) {
1509 if (words[i].size() < substr_len) shortname += words[i];
1510 else shortname += substr (words[i].begin(), words[i].begin()+substr_len);
1511 }
1512 }
1513 }
1514
1515 // check to see if shortname is unique
1516 text_t fulldirname = filename_cat (gsdlhome, "collect", shortname);
1517 if (directory_exists (fulldirname)) {
1518 int version = 0;
1519 text_t newname;
1520 do {
1521 ++version;
1522 newname = shortname;
1523 newname.push_back ('v');
1524 newname.appendint (version);
1525 fulldirname = filename_cat (gsdlhome, "collect", newname);
1526 } while (directory_exists (fulldirname));
1527
1528 shortname = newname;
1529 }
1530
1531 return shortname;
1532}
1533
1534// tests if collection is write protected (currently just checks if
1535// collect.cfg file is writable
1536bool collectoraction::collection_protected (const text_t &collection) {
1537 text_t cfgfile = filename_cat(gsdlhome, "collect", collection, "etc", "collect.cfg");
1538 if (file_writable(cfgfile)) return false;
1539 return true;
1540}
1541
1542// assigns a temporary directory name for this collector session
1543// and creates temporary directory
1544// returns false if it couldn't create the directory
1545bool collectoraction::assign_tmpname (cgiargsclass &args, ostream &logout) {
1546
1547 int i = 0;
1548 text_t tmpname = "tbuild";
1549 while (directory_exists (filename_cat (gsdlhome, "tmp", tmpname + text_t(i)))) {
1550 ++i;
1551 }
1552 tmpname.appendint (i);
1553
1554 text_t fulltmpdir = filename_cat (gsdlhome, "tmp", tmpname);
1555 if (!mk_dir (fulltmpdir)) {
1556 outconvertclass text_t2ascii;
1557 logout << text_t2ascii << "collectoraction::assign_tmpname unable to create directory ("
1558 << fulltmpdir << ")\n";
1559 return false;
1560 }
1561
1562 args["bc1tmp"] = tmpname;
1563 return true;
1564}
1565
1566void collectoraction::gsdl_mkcol (cgiargsclass &args, ostream &logout) {
1567
1568 text_t tmpdir = filename_cat (gsdlhome, "tmp", args["bc1tmp"]);
1569 if (!directory_exists (tmpdir)) {
1570 message = "tmpfail";
1571 return;
1572 }
1573
1574 text_t &collection = args["bc1dirname"];
1575 if (collection.empty()) {
1576 message = "nocollection";
1577 return;
1578 }
1579
1580 // check for a .create file - if it exists then we've already created the collection
1581 text_t createfile = filename_cat (tmpdir, ".create");
1582 if (file_exists (createfile)) {
1583 return;
1584 }
1585
1586 // set up options
1587 text_t options = "-quiet -creator \"" + args["bc1contactemail"] + "\"";
1588 options += " -title \"" + args["bc1fullname"] + "\"";
1589 options += " -about \"" + carriage_replace (args["bc1aboutdesc"] + "_collectorextra_", 0) + "\"";
1590 options += " -collectdir \"" + remove_trailing_slashes(tmpdir) + "\" ";
1591
1592 text_t optionfile = filename_cat (tmpdir, "mkcol.opt");
1593 char *optionfilec = optionfile.getcstr();
1594 ofstream ofile_out (optionfilec);
1595 delete []optionfilec;
1596 if (!ofile_out) {
1597 message = "tmpfail";
1598 return;
1599 }
1600 outconvertclass text_t2ascii;
1601 ofile_out << text_t2ascii << options << "\n";
1602 ofile_out.close();
1603
1604 // run mkcol.pl
1605 text_t mkcol_cmd = "perl -S mkcol.pl -optionfile \"" + optionfile;
1606 mkcol_cmd += "\" " + collection;
1607 gsdl_system (mkcol_cmd, true, logout);
1608
1609 // make sure it went ok
1610 text_t cfgfile = filename_cat (tmpdir, collection, "etc", "collect.cfg");
1611 if (!file_writable (cfgfile)) {
1612 message = "mkcolfail";
1613 } else {
1614 // create the .create file (this file is just a place holder to let any future
1615 // pages know that the collection already exists).
1616 char *createfilec = createfile.getcstr();
1617 ofstream cfile_out (createfilec);
1618 delete []createfilec;
1619 if (cfile_out) {
1620 cfile_out << "collection created\n";
1621 cfile_out.close();
1622 } else {
1623 message = "tmpfail";
1624 return;
1625 }
1626 }
1627}
1628
1629void collectoraction::gsdl_build (cgiargsclass &args, ostream &logout) {
1630
1631 outconvertclass text_t2ascii;
1632
1633 text_t tmpdir = filename_cat (gsdlhome, "tmp", args["bc1tmp"]);
1634 if (!directory_exists (tmpdir)) {
1635 message = "tmpfail";
1636 return;
1637 }
1638
1639 text_t &collection = args["bc1dirname"];
1640 if (collection.empty()) {
1641 message = "nocollection";
1642 return;
1643 }
1644
1645 // check for a .build file - if it exists then we've already built
1646 // the collection (or are in the process of building it)
1647 text_t buildfile = filename_cat (tmpdir, ".build");
1648 if (file_exists (buildfile)) {
1649 return;
1650 } else {
1651 // create the .build file (this file is just a place holder to let any future
1652 // pages know that we've already been here)
1653 char *buildfilec = buildfile.getcstr();
1654 ofstream bfile_out (buildfilec);
1655 delete []buildfilec;
1656 if (bfile_out) {
1657 bfile_out << "collection building\n";
1658 bfile_out.close();
1659 } else {
1660 message = "tmpfail";
1661 return;
1662 }
1663 }
1664
1665 const recptconf &rcinfo = recpt->get_configinfo ();
1666
1667 // create the event header file if LogEvents, EmailEvents or
1668 // EmailUserEvents options are turned on.
1669 bool logevents =
1670 (rcinfo.LogEvents == CollectorEvents || rcinfo.LogEvents == AllEvents ||
1671 rcinfo.EmailEvents == CollectorEvents || rcinfo.EmailEvents == AllEvents ||
1672 rcinfo.EmailUserEvents);
1673 text_t ehead_file = filename_cat (tmpdir, "ehead.txt");
1674 if (logevents) {
1675 if (!create_event_header_file (ehead_file, args, logout)) {
1676 logevents = false;
1677 }
1678 }
1679
1680 text_t collectdir = get_collectdir (args);
1681
1682 // set up build options
1683 text_t options = "-make_writable -remove_import -out \"";
1684 options += filename_cat (tmpdir, collection + ".bld");
1685 options += "\" -collectdir \"" + collectdir + "\" -statsfile \"";
1686 options += filename_cat(collectdir, collection, "etc", "import.log") + "\"";
1687
1688 if (args["bc1esrce"] == 1) {
1689 // we're adding data to an existing collection
1690 options += " -save_archives -append";
1691 }
1692
1693 text_tarray inputvalues, inputtypes;
1694 splitchar (args["bc1input"].begin(), args["bc1input"].end(), ',', inputvalues);
1695 splitchar (args["bc1inputtype"].begin(), args["bc1inputtype"].end(), ',', inputtypes);
1696 int numvalues = inputvalues.size();
1697 int numtypes = inputtypes.size();
1698 for (int i = 0; i < numvalues; ++i) {
1699 if (!inputvalues[i].empty()) {
1700 text_t type = "file://"; // default
1701 if (i < numtypes) type = inputtypes[i];
1702 options += " -download \"" +
1703 remove_trailing_slashes(type + format_url(decode_commas(inputvalues[i]))) + "\"";
1704 }
1705 }
1706
1707 if (logevents) {
1708 if (rcinfo.LogEvents == CollectorEvents || rcinfo.LogEvents == AllEvents)
1709 options += " -log_events";
1710 if (rcinfo.EmailEvents == CollectorEvents || rcinfo.EmailEvents == AllEvents) {
1711 options += " -mail_server " + rcinfo.MailServer;
1712 options += " -email_events " + rcinfo.maintainer;
1713 if (rcinfo.EmailUserEvents) options += "," + args["bc1contactemail"];
1714 } else if (rcinfo.EmailUserEvents) {
1715 options += " -mail_server " + rcinfo.MailServer;
1716 options += " -email_events " + args["bc1contactemail"];
1717 }
1718 options += " -event_header " + ehead_file;
1719 }
1720
1721 text_t optionfile = filename_cat (tmpdir, "build.opt");
1722 char *optionfilec = optionfile.getcstr();
1723 ofstream ofile_out (optionfilec);
1724 delete []optionfilec;
1725 if (!ofile_out) {
1726 message = "tmpfail";
1727 return;
1728 }
1729 ofile_out << text_t2ascii << options << "\n";
1730 ofile_out.close();
1731
1732 // if we're altering an existing collection we need to kill off
1733 // the existing collection server - we do this for the local library
1734 // (and any other persistent version of the library) as the existing
1735 // gdbm file can't be deleted while the collection server holds it open
1736 if ((args["bc1econf"] == 1) || (args["bc1esrce"] == 1)) {
1737 remove_colservr (collection, logout);
1738 }
1739
1740 // set up the build command - build.bat has some issues with quoting
1741 // on win2k when gsdlhome contains spaces so we'll avoid using
1742 // "perl -S" here in favor of calling the "build" perl script explicitly
1743 text_t build_cmd = "perl \"" + filename_cat (gsdlhome, "bin", "script", "build");
1744 build_cmd += "\" -optionfile \"" + optionfile + "\" " + collection;
1745 // run build command in background (i.e. asynchronously)
1746 gsdl_system (build_cmd, false, logout);
1747}
1748
1749void collectoraction::gsdl_cancel_build (cgiargsclass &args, ostream &logout) {
1750 // I really wanted to do what this perl script does from within the library
1751 // c++ code. I ran into some problems though (like how do you write a portable
1752 // "rm -r" in c++?). One day I'll spend some time sorting it out ... maybe.
1753 text_t cancel_cmd = "perl -S cancel_build.pl -collectdir \"";
1754 cancel_cmd += filename_cat (gsdlhome, "tmp", args["bc1tmp"]) + "\" ";
1755 cancel_cmd += args["bc1dirname"];
1756 // To be on the safe side we'll make this a synchronous call
1757 // so that all tidying up is done before the user has a chance
1758 // to do anything else (like start rebuilding their collection).
1759 // This means that for a big collection where there's lots of
1760 // stuff to delete etc. it might take a while before the "build
1761 // cancelled" page appears.
1762 gsdl_system (cancel_cmd, true, logout);
1763}
1764
1765text_t collectoraction::get_collectdir (cgiargsclass &args)
1766{
1767 if ((args["bc1econf"] == 1) || (args["bc1esrce"] == 1)) {
1768 // we're adding to a collection in place
1769 return filename_cat(gsdlhome, "collect");
1770 }
1771 else {
1772 return filename_cat (gsdlhome, "tmp", args["bc1tmp"]);
1773 }
1774}
1775
1776// checks to see if any of the plugins in pluginset occur in
1777// collections configuration file
1778bool collectoraction::uses_weird_plugin (const text_t &collection) {
1779
1780 text_tset pluginset;
1781 pluginset.insert ("HBPlug");
1782
1783 text_t cfgfile_content;
1784 text_t cfgfile_name = filename_cat (gsdlhome, "collect", collection, "etc", "collect.cfg");
1785 text_t pluginstr, pluginname;
1786
1787 if (read_file (cfgfile_name, cfgfile_content)) {
1788 text_t::const_iterator here = cfgfile_content.begin();
1789 text_t::const_iterator end = cfgfile_content.end();
1790 while (here != end) {
1791 here = findchar (here, end, 'p');
1792 if (here == end) break;
1793 if ((here+6 < end) && (substr (here, here+6) == "plugin")) {
1794 getdelimitstr (here+6, end, '\n', pluginstr);
1795 text_t::const_iterator hp = pluginstr.begin();
1796 text_t::const_iterator ep = pluginstr.end();
1797 bool found = false;
1798 // remove any leading whitespace, trailing options etc.
1799 while (hp != ep) {
1800 if (*hp == '\t' || *hp == ' ' || *hp == '\n') {
1801 if (found) break;
1802 } else {
1803 pluginname.push_back (*hp);
1804 found = true;
1805 }
1806 ++hp;
1807 }
1808 text_tset::const_iterator it = pluginset.find (pluginname);
1809 if (it != pluginset.end()) return true; // found matching plugin
1810 pluginname.clear();
1811 }
1812 ++here;
1813 }
1814 }
1815 return false;
1816}
1817
1818// create and initialize a new collection server and
1819// add it to the null protocol.
1820void collectoraction::create_colserver (const text_t &collection, ostream &logout) {
1821
1822 recptprotolistclass *protos = recpt->get_recptprotolist_ptr();
1823 recptprotolistclass::iterator rprotolist_here = protos->begin();
1824 recptprotolistclass::iterator rprotolist_end = protos->end();
1825 while (rprotolist_here != rprotolist_end) {
1826 comerror_t err = noError;
1827 if ((*rprotolist_here).p != NULL) {
1828 if ((*rprotolist_here).p->get_protocol_name (err) == "nullproto") {
1829 // create collection server and add it to nullproto
1830 (*rprotolist_here).p->add_collection (collection, recpt, gsdlhome, gsdlhome);
1831 // make sure gsdlhome is configured
1832 text_tarray tmp;
1833 tmp.push_back (gsdlhome);
1834 (*rprotolist_here).p->configure ("gsdlhome", tmp, err);
1835 // re-initialize the null protocol
1836 if (!(*rprotolist_here).p->init (err, logout)) {
1837 logout << "collectoraction::create_colserver: nullproto init failed\n";
1838 }
1839 return;
1840 }
1841 }
1842 ++rprotolist_here;
1843 }
1844
1845 logout << "collectoraction::create_colserver: no valid nullproto found\n";
1846}
1847
1848// delete a collection server from the null protocol
1849void collectoraction::remove_colservr (const text_t &collection, ostream &logout) {
1850
1851 recpt->uncache_collection (collection);
1852
1853 recptprotolistclass *protos = recpt->get_recptprotolist_ptr();
1854 recptprotolistclass::iterator rprotolist_here = protos->begin();
1855 recptprotolistclass::iterator rprotolist_end = protos->end();
1856 while (rprotolist_here != rprotolist_end) {
1857 comerror_t err = noError;
1858 if ((*rprotolist_here).p != NULL) {
1859 if ((*rprotolist_here).p->get_protocol_name (err) == "nullproto") {
1860 (*rprotolist_here).p->remove_collection (collection, logout);
1861 return;
1862 }
1863 }
1864 ++rprotolist_here;
1865 }
1866
1867 logout << "collectoraction::create_colserver: no valid nullproto found\n";
1868}
1869
1870bool collectoraction::create_event_header_file (const text_t &filename, cgiargsclass &args,
1871 ostream &logout) {
1872
1873 outconvertclass text_t2ascii;
1874 char *filenamec = filename.getcstr();
1875 ofstream eheadfile (filenamec);
1876 delete []filenamec;
1877
1878 if (eheadfile) {
1879 eheadfile << text_t2ascii << get_event_header (args);
1880 eheadfile.close();
1881 return true;
1882 }
1883
1884 logout << text_t2ascii << "collectoraction::create_event_header ERROR: Couldn't create "
1885 << "Event Header file " << filename << ". Event logging disabled\n";
1886 return false;
1887}
1888
1889text_t collectoraction::get_event_header (cgiargsclass &args) {
1890 text_t header = "Greenstone Username: " + args["un"] + "\n";
1891 header += "Collection: " + args["bc1dirname"] + "\n";
1892 header += "Collection Creator: " + args["bc1contactemail"] + "\n";
1893 header += "GSDLHOME: " + gsdlhome + "\n";
1894 header += "Build Location: " + get_collectdir(args) + "\n";
1895
1896 return header;
1897}
1898
1899bool collectoraction::check_sources (cgiargsclass &args, ostream &logout) {
1900
1901 bool found = false;
1902
1903 text_tarray inputvalues;
1904 splitchar (args["bc1input"].begin(), args["bc1input"].end(), ',', inputvalues);
1905
1906 text_tarray inputtypes;
1907 splitchar (args["bc1inputtype"].begin(), args["bc1inputtype"].end(), ',', inputtypes);
1908
1909 int numvalues = inputvalues.size();
1910 int numtypes = inputtypes.size();
1911
1912 for (int i = 0; i < numvalues; ++i) {
1913 text_t value = format_url(decode_commas(inputvalues[i]));
1914 text_t type = "file://"; // default
1915 if (!value.empty()) {
1916 found = true;
1917 if (i >= numtypes || inputtypes[i].empty()) {
1918 logout << "collectoraction::check_sources: WARNING type not set\n";
1919 } else {
1920 type = inputtypes[i];
1921 }
1922 if (type == "file://") {
1923 if (!file_exists(value) && !directory_exists(value)) {
1924 failedsources[decode_commas(inputvalues[i])] = "1";
1925 badsources = true;
1926 }
1927 } else if (type == "http://") {
1928 if (gsdl_system ("perl -S ping.pl -quiet http://" + value, true, logout)) {
1929 failedsources[decode_commas(inputvalues[i])] = "1";
1930 badsources = true;
1931 }
1932 } else if (type == "ftp://") {
1933 if (gsdl_system ("perl -S ping.pl -quiet ftp://" + value, true, logout)) {
1934 failedsources[decode_commas(inputvalues[i])] = "1";
1935 badsources = true;
1936 }
1937 }
1938 }
1939 }
1940
1941 // set badsources if there weren't any sources at all
1942 if (!found) badsources = true;
1943
1944 if (badsources) return false;
1945 return true;
1946}
1947
1948// format_url simply strips "http://", "ftp://", or "file://" off the
1949// beginning of url if they're there
1950text_t collectoraction::format_url (const text_t &url) {
1951 text_t::const_iterator begin = url.begin();
1952 text_t::const_iterator end = url.end();
1953
1954 if (url.size() >= 7) {
1955 text_t prefix = substr(begin, begin+7);
1956 if (prefix == "http://" || prefix == "file://") {
1957 return substr(begin+7, end);
1958 }
1959 }
1960 if (url.size() >= 6) {
1961 if (substr(begin, begin+6) == "ftp://") {
1962 return substr(begin+6, end);
1963 }
1964 }
1965 return url;
1966}
1967
1968text_t collectoraction::remove_trailing_slashes (text_t str) {
1969
1970 while (*(str.end()-1) == '\\') {
1971 str.pop_back();
1972 }
1973 return str;
1974}
1975
1976#endif //GSDL_USE_COLLECTOR_ACTION
Note: See TracBrowser for help on using the repository browser.