source: trunk/gsdl/src/recpt/collectoraction.cpp@ 5017

Last change on this file since 5017 was 3546, checked in by sjboddie, 22 years ago

Added protos to argument list of action::check_cgiargs() as I always seem to want it to
be there.

  • Property svn:keywords set to Author Date Id Revision
File size: 66.8 KB
Line 
1/**********************************************************************
2 *
3 * collectoraction.cpp --
4 * Copyright (C) 2000 The New Zealand Digital Library Project
5 *
6 * A component of the Greenstone digital library software
7 * from the New Zealand Digital Library Project at the
8 * University of Waikato, New Zealand.
9 *
10 * This program is free software; you can redistribute it and/or modify
11 * it under the terms of the GNU General Public License as published by
12 * the Free Software Foundation; either version 2 of the License, or
13 * (at your option) any later version.
14 *
15 * This program is distributed in the hope that it will be useful,
16 * but WITHOUT ANY WARRANTY; without even the implied warranty of
17 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
18 * GNU General Public License for more details.
19 *
20 * You should have received a copy of the GNU General Public License
21 * along with this program; if not, write to the Free Software
22 * Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
23 *
24 *********************************************************************/
25
26// note that the collectoraction relies on having direct access to a
27// collections configuration file. this breaks the separation between
28// receptionist and collection server and so is not suitable (at least
29// in its current form) for use when collection servers are separate
30// from the receptionist (e.g. when using the CORBA protocol).
31
32// following line required to get fstream.filedesc() on darwin (Mac OS X)
33#define _STREAM_COMPAT 1
34// required for utsname on solaris???
35#define _XOPEN_SOURCE 1
36#define _XOPEN_SOURCE_EXTENDED 1
37
38#include "collectoraction.h"
39#include "OIDtools.h"
40#include "fileutil.h"
41#include "cfgread.h"
42#include "gsdltools.h"
43#include "gsdltimes.h"
44#include "nullproto.h"
45#include "argdb.h"
46#include "cgiutils.h"
47#include <stdio.h>
48#include <fcntl.h>
49
50#if !defined (__WIN32__)
51#include <sys/utsname.h>
52#include <unistd.h>
53#endif
54
55collectoraction::collectoraction () {
56
57 recpt = NULL;
58 disabled = true;
59 do_mkcol = false;
60 badsources = false;
61 failedsources.erase(failedsources.begin(), failedsources.end());
62 gsdlosc = NULL;
63 gsdlhomec = NULL;
64 pathc = NULL;
65
66 cgiarginfo arg_ainfo;
67 arg_ainfo.shortname = "a";
68 arg_ainfo.longname = "action";
69 arg_ainfo.multiplechar = true;
70 arg_ainfo.defaultstatus = cgiarginfo::weak;
71 arg_ainfo.argdefault = "collector";
72 arg_ainfo.savedarginfo = cgiarginfo::must;
73 argsinfo.addarginfo (NULL, arg_ainfo);
74
75 arg_ainfo.shortname = "p";
76 arg_ainfo.longname = "page";
77 arg_ainfo.multiplechar = true;
78 arg_ainfo.defaultstatus = cgiarginfo::weak;
79 arg_ainfo.argdefault = "intro";
80 arg_ainfo.savedarginfo = cgiarginfo::must;
81 argsinfo.addarginfo (NULL, arg_ainfo);
82
83 // temporary directory name for this collector
84 // session
85 arg_ainfo.shortname = "bc1tmp";
86 arg_ainfo.longname = "collector specific";
87 arg_ainfo.multiplechar = true;
88 arg_ainfo.defaultstatus = cgiarginfo::weak;
89 arg_ainfo.argdefault = "";
90 arg_ainfo.savedarginfo = cgiarginfo::must;
91 argsinfo.addarginfo (NULL, arg_ainfo);
92
93 arg_ainfo.shortname = "bc1fullname";
94 arg_ainfo.longname = "collector specific";
95 arg_ainfo.multiplechar = true;
96 arg_ainfo.defaultstatus = cgiarginfo::weak;
97 arg_ainfo.argdefault = "";
98 arg_ainfo.savedarginfo = cgiarginfo::mustnot; // saved on disk
99 argsinfo.addarginfo (NULL, arg_ainfo);
100
101 arg_ainfo.shortname = "bc1dirname";
102 arg_ainfo.longname = "collector specific";
103 arg_ainfo.multiplechar = true;
104 arg_ainfo.defaultstatus = cgiarginfo::weak;
105 arg_ainfo.argdefault = "";
106 arg_ainfo.savedarginfo = cgiarginfo::must;
107 argsinfo.addarginfo (NULL, arg_ainfo);
108
109 arg_ainfo.shortname = "bc1contactemail";
110 arg_ainfo.longname = "collector specific";
111 arg_ainfo.multiplechar = true;
112 arg_ainfo.defaultstatus = cgiarginfo::weak;
113 arg_ainfo.argdefault = "";
114 arg_ainfo.savedarginfo = cgiarginfo::mustnot; // saved on disk
115 argsinfo.addarginfo (NULL, arg_ainfo);
116
117 arg_ainfo.shortname = "bc1aboutdesc";
118 arg_ainfo.longname = "collector specific";
119 arg_ainfo.multiplechar = true;
120 arg_ainfo.defaultstatus = cgiarginfo::weak;
121 arg_ainfo.argdefault = "";
122 arg_ainfo.savedarginfo = cgiarginfo::mustnot; // saved on disk
123 argsinfo.addarginfo (NULL, arg_ainfo);
124
125 arg_ainfo.shortname = "bc1clone";
126 arg_ainfo.longname = "collector specific";
127 arg_ainfo.multiplechar = false;
128 arg_ainfo.defaultstatus = cgiarginfo::weak;
129 arg_ainfo.argdefault = "0";
130 arg_ainfo.savedarginfo = cgiarginfo::mustnot; // saved on disk
131 argsinfo.addarginfo (NULL, arg_ainfo);
132
133 arg_ainfo.shortname = "bc1clonecol";
134 arg_ainfo.longname = "collector specific";
135 arg_ainfo.multiplechar = true;
136 arg_ainfo.defaultstatus = cgiarginfo::weak;
137 arg_ainfo.argdefault = "";
138 arg_ainfo.savedarginfo = cgiarginfo::mustnot; // saved on disk
139 argsinfo.addarginfo (NULL, arg_ainfo);
140
141 // set when cloning option has changed
142 arg_ainfo.shortname = "bc1clonechanged";
143 arg_ainfo.longname = "collector specific";
144 arg_ainfo.multiplechar = false;
145 arg_ainfo.defaultstatus = cgiarginfo::weak;
146 arg_ainfo.argdefault = "0";
147 arg_ainfo.savedarginfo = cgiarginfo::mustnot;
148 argsinfo.addarginfo (NULL, arg_ainfo);
149
150 // only set when one of the fields was changed in
151 // the "collection info" page
152 arg_ainfo.shortname = "bc1infochanged";
153 arg_ainfo.longname = "collector specific";
154 arg_ainfo.multiplechar = false;
155 arg_ainfo.defaultstatus = cgiarginfo::weak;
156 arg_ainfo.argdefault = "0";
157 arg_ainfo.savedarginfo = cgiarginfo::mustnot;
158 argsinfo.addarginfo (NULL, arg_ainfo);
159
160 // only set when cfg file is altered from within
161 // "configure collection" page
162 arg_ainfo.shortname = "bc1cfgchanged";
163 arg_ainfo.longname = "collector specific";
164 arg_ainfo.multiplechar = false;
165 arg_ainfo.defaultstatus = cgiarginfo::weak;
166 arg_ainfo.argdefault = "0";
167 arg_ainfo.savedarginfo = cgiarginfo::mustnot;
168 argsinfo.addarginfo (NULL, arg_ainfo);
169
170 arg_ainfo.shortname = "cfgfile";
171 arg_ainfo.longname = "configuration file contents";
172 arg_ainfo.multiplechar = true;
173 arg_ainfo.defaultstatus = cgiarginfo::weak;
174 arg_ainfo.argdefault = "";
175 arg_ainfo.savedarginfo = cgiarginfo::mustnot;
176 argsinfo.addarginfo (NULL, arg_ainfo);
177
178 arg_ainfo.shortname = "bc1dodelete";
179 arg_ainfo.longname = "collector specific";
180 arg_ainfo.multiplechar = false;
181 arg_ainfo.defaultstatus = cgiarginfo::weak;
182 arg_ainfo.argdefault = "0";
183 arg_ainfo.savedarginfo = cgiarginfo::mustnot;
184 argsinfo.addarginfo (NULL, arg_ainfo);
185
186 // will be set if we arrived at the "configure collection" page
187 // via the "changing an existing collection" page
188 arg_ainfo.shortname = "bc1econf";
189 arg_ainfo.longname = "collector specific";
190 arg_ainfo.multiplechar = false;
191 arg_ainfo.defaultstatus = cgiarginfo::weak;
192 arg_ainfo.argdefault = "0";
193 arg_ainfo.savedarginfo = cgiarginfo::must;
194 argsinfo.addarginfo (NULL, arg_ainfo);
195
196 // will be set if we arrived at the "source data" page
197 // via the "changing an existing collection" page
198 arg_ainfo.shortname = "bc1esrce";
199 arg_ainfo.longname = "collector specific";
200 arg_ainfo.multiplechar = false;
201 arg_ainfo.defaultstatus = cgiarginfo::weak;
202 arg_ainfo.argdefault = "0";
203 arg_ainfo.savedarginfo = cgiarginfo::must;
204 argsinfo.addarginfo (NULL, arg_ainfo);
205
206 arg_ainfo.shortname = "bc1inputnum";
207 arg_ainfo.longname = "collector specific";
208 arg_ainfo.multiplechar = true;
209 arg_ainfo.defaultstatus = cgiarginfo::weak;
210 arg_ainfo.argdefault = "3";
211 arg_ainfo.savedarginfo = cgiarginfo::mustnot; // saved on disk
212 argsinfo.addarginfo (NULL, arg_ainfo);
213
214 arg_ainfo.shortname = "bc1input";
215 arg_ainfo.longname = "collector specific";
216 arg_ainfo.multiplechar = true;
217 arg_ainfo.multiplevalue = true;
218 arg_ainfo.defaultstatus = cgiarginfo::weak;
219 arg_ainfo.argdefault = "";
220 arg_ainfo.savedarginfo = cgiarginfo::mustnot; // saved on disk
221 argsinfo.addarginfo (NULL, arg_ainfo);
222
223 arg_ainfo.shortname = "bc1inputtype";
224 arg_ainfo.longname = "collector specific";
225 arg_ainfo.multiplechar = true;
226 arg_ainfo.multiplevalue = true;
227 arg_ainfo.defaultstatus = cgiarginfo::weak;
228 arg_ainfo.argdefault = "";
229 arg_ainfo.savedarginfo = cgiarginfo::mustnot; // saved on disk
230 argsinfo.addarginfo (NULL, arg_ainfo);
231
232 // will be set when we've just come from the "source data" page
233 arg_ainfo.shortname = "bc1fromsrce";
234 arg_ainfo.longname = "collector specific";
235 arg_ainfo.multiplechar = false;
236 arg_ainfo.multiplevalue = false;
237 arg_ainfo.defaultstatus = cgiarginfo::weak;
238 arg_ainfo.argdefault = "0";
239 arg_ainfo.savedarginfo = cgiarginfo::mustnot;
240 argsinfo.addarginfo (NULL, arg_ainfo);
241}
242
243collectoraction::~collectoraction () {
244 if (gsdlosc != NULL) delete gsdlosc;
245 if (gsdlhomec != NULL) delete gsdlhomec;
246 if (pathc != NULL) delete pathc;
247}
248
249
250void collectoraction::configure (const text_t &key, const text_tarray &cfgline) {
251 if ((key == "collector") && (cfgline.size() == 1) &&
252 (cfgline[0] == "true" || cfgline[0] == "on" || cfgline[0] == "enabled")) {
253 disabled = false;
254 } else {
255 // call the parent class to deal with the things which
256 // are not dealt with here
257 action::configure (key, cfgline);
258 }
259}
260
261
262bool collectoraction::init (ostream & /*logout*/) {
263
264 // set up GSDLOS, GSDLHOME and PATH environment variables
265 text_t gsdlos, path;
266 unsigned int path_separator = ':';
267#if defined (__WIN32__)
268 gsdlos = "windows";
269 path_separator = ';';
270
271 path = filename_cat (gsdlhome, "bin", "windows", "perl", "bin;");
272
273#else
274 struct utsname *buf = new struct utsname();
275 int i = uname (buf);
276 if (i == -1) gsdlos = "linux"; // uname failed
277 else gsdlos.setcstr (buf->sysname);
278 delete buf;
279 lc (gsdlos);
280#endif
281
282 pathc = getenv ("PATH");
283 path += filename_cat (gsdlhome, "bin", gsdlos);
284 path.push_back (path_separator);
285 path += filename_cat (gsdlhome, "bin", "script");
286 if (pathc != NULL) {
287 path.push_back (path_separator);
288 path += pathc;
289 }
290 path = "PATH=" + path;
291
292 gsdlos = "GSDLOS=" + gsdlos;
293 text_t setgsdlhome = "GSDLHOME=" + gsdlhome;
294
295 // these will be cleaned up in the destructor
296 gsdlosc = gsdlos.getcstr();
297 gsdlhomec = setgsdlhome.getcstr();
298 pathc = path.getcstr();
299
300 putenv (gsdlosc);
301 putenv (gsdlhomec);
302 putenv (pathc);
303
304 return true;
305}
306
307bool collectoraction::check_cgiargs (cgiargsinfoclass &argsinfo, cgiargsclass &args,
308 recptprotolistclass * /*protos*/, ostream &logout) {
309
310 text_t &current_page = args["p"];
311
312 // note that the "bildstatus" and "bildframe1" pages don't actually do anything
313 // functional so we don't need to worry about authenticating them (it's the
314 // underlying "bild" page that does the building (and creates the frameset))
315 // This helps us overcome a bit of a problem we have with multiple pages trying
316 // to read from the key.db database at the same time.
317 if (current_page != "intro" && current_page != "bildstatus" && current_page != "bildframe1") {
318 // authenticate the user if authentication is available
319 args["uan"] = 1;
320 args["ug"] = "colbuilder";
321 }
322
323 if (current_page == "new" || current_page == "existing") {
324
325 // assign (and create) a temporary directory
326 assign_tmpname (args, logout);
327
328 // clean up any old builds left laying about in the tmp directory
329 // (note that it's possible this could take some time if there's a huge
330 // partially built collection laying about so we'll make it an asynchronous
331 // system call)
332 gsdl_system ("perl -S cleantmp.pl", false, logout);
333 }
334
335 if (current_page != "intro" && current_page != "bildstatus" &&
336 current_page != "bildframe1" && current_page != "new") {
337 // update arguments that were saved to the harddrive
338 text_tmap saved_args;
339 saved_args["bc1fullname"] = "";
340 saved_args["bc1contactemail"] = "";
341 saved_args["bc1aboutdesc"] = "";
342 saved_args["bc1clone"] = "";
343 saved_args["bc1clonecol"] = "";
344 saved_args["bc1inputnum"] = "";
345 saved_args["bc1input"] = "";
346 saved_args["bc1inputtype"] = "";
347
348 // update the argdb database with any arguments that were set
349 // by previous page
350 text_tmap::iterator here = saved_args.begin();
351 text_tmap::iterator end = saved_args.end();
352 while (here != end) {
353 if (args.lookupcgiarg((*here).first).source != cgiarg_t::default_arg) {
354 (*here).second = args[(*here).first];
355 }
356 here++;
357 }
358
359 text_t argfile = filename_cat(gsdlhome, "tmp", args["bc1tmp"], "argdb.db");
360 argdb *args_on_disk = new argdb(argfile);
361 if (!args_on_disk->update_args(saved_args)) {
362 // error
363 logout << "collectoraction: argdb::update_args failed (" << argfile << ")\n";
364 }
365
366 // update args from argdb
367 saved_args.erase(saved_args.begin(), saved_args.end());
368 if (!args_on_disk->get_args(saved_args)) {
369 // error
370 logout << "collectoraction: argdb::get_args failed (" << argfile << ")\n";
371 }
372 delete args_on_disk;
373 here = saved_args.begin();
374 end = saved_args.end();
375 while (here != end) {
376 if (!(*here).second.empty()) {
377 args[(*here).first] = (*here).second;
378 }
379 here ++;
380 }
381 }
382
383 if (args["bc1infochanged"] == "1") {
384
385 if (args["bc1dirname"].empty()) {
386 // we've just come from the "collection information" page for the
387 // first time so we'll need to create the collection with mkcol.pl
388 // and set up bc1dirname - we do this part here instead of in do_action
389 // because the bc1dirname argument must be set to its new value before
390 // the compressedoptions macros are set.
391 args["bc1dirname"] = get_directory_name (args["bc1fullname"]);
392
393 text_t createfile = filename_cat (gsdlhome, "tmp", args["bc1tmp"], ".create");
394 if (!file_exists (createfile)) {
395 // we could do the mkcol.pl here but I guess it's nicer to do it in do_action()
396 do_mkcol = true;
397 } else {
398 // .create file already exists but bc1dirname wasn't set ... this should only be
399 // able to occur when the "reload" (and possibly the "back" and "forward" buttons)
400 // have been used to get us here.
401 // we'll check that the bc1dirname directory exists (in case of the unlikely
402 // possibility that get_directory_name returned a different value this time
403 // than it did originally).
404 text_t coldir = filename_cat (get_collectdir(args), args["bc1dirname"]);
405 if (!directory_exists (coldir)) {
406 message = "reloaderror";
407 return true;
408 }
409 }
410 } else {
411 // "collection information" has been changed after collection already exists
412 // so we'll need to update the cfg file.
413 update_cfgfile_partial (args, false, logout);
414 }
415 }
416
417 if (args["bc1cfgchanged"] == "1") {
418 // configuration file has been changed from the "configure collection"
419 // page. we need to update the file on disk and catch bc1 arguments up
420 // with changes.
421 update_cfgfile_complete (args, logout);
422 }
423
424 if (args["bc1clonechanged"] == "1") {
425 // cloning option has been changed on "source data" page. if it was turned
426 // on we want to create a new collect.cfg file using the bc1clonecol cfg file
427 // as a model (we'll save the old file as collect.cfg.org). if cloning was
428 // turned off we'll revert to using the collect.cfg.org file (which will need
429 // updating in case the bc1 arguments have been altered since cloning was
430 // turned on).
431 update_cfgfile_clone (args, logout);
432
433 // if cloning has just been turned on we'll also copy the rest of the files
434 // (excluding collect.cfg which we've already done) from the cloned collections
435 // etc directory to the new collection.
436 if (args["bc1clone"] == "1") {
437 text_t clone_etc = filename_cat(gsdlhome, "collect", args["bc1clonecol"], "etc");
438 text_t new_etc = filename_cat(get_collectdir(args), args["bc1dirname"], "etc");
439 text_tarray files;
440
441 if (read_dir (clone_etc, files)) {
442 text_tarray::const_iterator here = files.begin();
443 text_tarray::const_iterator end = files.end();
444 while (here != end) {
445 if (*here != "collect.cfg" && *here != "collect.cfg.org") {
446 file_copy (filename_cat(clone_etc, *here), filename_cat(new_etc, *here));
447 }
448 here ++;
449 }
450 } else {
451 outconvertclass text_t2ascii;
452 logout <<text_t2ascii << "collectoraction::check_cgiargs couldn't read from "
453 << clone_etc << " directory\n";
454 }
455 }
456 }
457
458 if (current_page == "bildstatus" || current_page == "bildcancel") {
459 // if .final file exists then build has finished
460 text_t fbld = filename_cat (gsdlhome, "tmp", args["bc1tmp"], args["bc1dirname"] + ".bld.final");
461 if (file_exists (fbld)) {
462 char *fbldc = fbld.getcstr();
463 ifstream fbld_in (fbldc);
464 if (fbld_in) {
465 failcode = fbld_in.get();
466 fbld_in.close();
467 if (failcode == '0') {
468 // success - we need to create and configure a collection server for the
469 // newly built collection (for fastcgi and local library where
470 // initialization isn't going to be redone when the user clicks the
471 // "view your new collection" button
472 create_colserver (args["bc1dirname"], logout);
473 current_page = "bilddone";
474 }
475 else current_page = "bildfail";
476 } else {
477 // assume build failed (we shouldn't get here though ... right?)
478 current_page = "bildfail";
479 }
480 delete fbldc;
481 }
482 }
483
484 if (args["bc1fromsrce"] == "1") {
485
486 // we've just come from the "source data" page so we need to check that
487 // input sources are valid
488 if (!check_sources(args, logout)) {
489 args["p"] = "srce";
490 }
491 }
492
493 return true;
494}
495
496void collectoraction::update_cfgfile_clone (cgiargsclass &args, ostream &logout) {
497
498 text_t tmpdir = filename_cat(gsdlhome, "tmp", args["bc1tmp"]);
499 text_t cfgfile = filename_cat(tmpdir, args["bc1dirname"], "etc", "collect.cfg");
500 if (!file_exists (cfgfile)) {
501 message = "tmpfail";
502 return;
503 }
504
505 text_t cfgfile_org = filename_cat (tmpdir, "collect.cfg.org");
506
507 if (args["bc1clone"] == "1") {
508 // cloning was turned on
509
510 text_t cfgfile_clone = filename_cat(gsdlhome, "collect", args["bc1clonecol"], "etc", "collect.cfg");
511 if (file_exists (cfgfile_clone)) {
512 // if .org file doesn't exist already create it
513 if (!file_exists (cfgfile_org)) {
514 if (!file_copy (cfgfile, cfgfile_org)) {
515 message = "tmpfail";
516 return;
517 }
518 }
519 // copy clone collections cfg file to new collection
520 if (!file_copy (cfgfile_clone, cfgfile)) {
521 message = "tmpfail";
522 return;
523 }
524 // update the new cfg file
525 update_cfgfile_partial (args, true, logout);
526
527 } else {
528 // can't clone non-existant or read-protected collection
529 message = "clonefail";
530 }
531
532 } else {
533 // cloning has been turned off having been on at some point. the .org file
534 // should exist, if it doesn't we'll bail out and leave the user with the
535 // cloned copy
536 if (file_exists (cfgfile_org)) {
537 // copy original back again and update it with any recent changes
538 if (file_copy (cfgfile_org, cfgfile)) {
539 update_cfgfile_partial (args, false, logout);
540 } else {
541 message = "tmpfail";
542 }
543 }
544 }
545}
546
547// update configuration file on disk to match bc1 arguments
548// there's a special case if the clone option is true as certain parts of a
549// config file should not be cloned (e.g. the iconcollection stuff)
550void collectoraction::update_cfgfile_partial (cgiargsclass &args, bool clone, ostream &logout) {
551
552 text_t cfgfile = filename_cat(get_collectdir(args), args["bc1dirname"], "etc", "collect.cfg");
553 char *cfgfilec = cfgfile.getcstr();
554
555#if defined (__WIN32__)
556 // make sure collect.cfg isn't read-only
557 _chmod (cfgfilec, _S_IREAD | _S_IWRITE);
558#endif
559
560 vector<text_tarray> cfgarray;
561
562 // read in cfg file
563 ifstream cfg_in (cfgfilec);
564 if (cfg_in) {
565 text_tarray cfgline;
566 while (read_cfg_line(cfg_in, cfgline) >= 0) {
567 if (cfgline.size () >= 2) {
568 if (cfgline[0] == "creator" || cfgline[0] == "maintainer") {
569 cfgline[1] = args["bc1contactemail"];
570 } else if (cfgline[0] == "collectionmeta") {
571 if (cfgline[1] == "collectionname") {
572 cfgline[2] = args["bc1fullname"];
573 } else if (cfgline[1] == "collectionextra") {
574 cfgline[2] = carriage_replace (args["bc1aboutdesc"], 0);
575 } else if (clone && (cfgline[1] == "iconcollection" ||
576 cfgline[1] == "iconcollectionsmall")) {
577 cfgline[2] = "";
578 }
579 }
580 }
581 cfgarray.push_back (cfgline);
582 }
583 cfg_in.close();
584
585 // now write cfg file back out
586 int fd=open(cfgfilec, O_WRONLY | O_CREAT | O_TRUNC
587#if defined(__WIN32__)
588 | O_BINARY
589#endif
590 );
591
592 if (fd != -1) {
593 // lock the file
594 int lock_val = 1;
595 GSDL_LOCK_FILE (fd);
596 if (lock_val != 0) {
597 logout << "Error: Couldn't lock file " << cfgfilec << "\n";
598 close(fd);
599 message = "tmpfail";
600
601 } else {
602
603 vector<text_tarray>::const_iterator this_line = cfgarray.begin();
604 vector<text_tarray>::const_iterator end_line = cfgarray.end();
605 while (this_line != end_line) {
606 write_cfg_line (fd, *this_line);
607 this_line ++;
608 }
609 GSDL_UNLOCK_FILE (fd);
610 close(fd);
611 }
612
613 } else {
614 logout << "collectoraction::update_cfgfile_partial: unable to open "
615 << cfgfilec << " for output\n";
616 message = "tmpfail";
617 }
618
619 } else {
620 logout << "collectoraction::update_cfgfile_partial: unable to open "
621 << cfgfilec << " for input\n";
622 message = "tmpfail";
623 }
624
625 delete cfgfilec;
626}
627
628// replace configuration file on disk with that in the cfgfile argument and
629// catch other bc1 arguments up with those the new cfgfile contains
630void collectoraction::update_cfgfile_complete (cgiargsclass &args, ostream &logout) {
631
632 text_t cfgfile = filename_cat(get_collectdir(args), args["bc1dirname"], "etc", "collect.cfg");
633 char *cfgfilec = cfgfile.getcstr();
634
635#ifdef __WIN32__
636 // make sure collect.cfg isn't read-only
637 _chmod (cfgfilec, _S_IREAD | _S_IWRITE);
638#endif
639
640 int fd=open(cfgfilec, O_WRONLY | O_CREAT | O_TRUNC
641#if defined(__WIN32__)
642 | O_BINARY
643#endif
644 );
645
646 if (fd) {
647 // lock the file
648 int lock_val = 1;
649 GSDL_LOCK_FILE (fd);
650 if (lock_val != 0) {
651 logout << "Error: Couldn't lock file " << cfgfilec << "\n";
652 close(fd);
653 message = "tmpfail";
654
655 } else {
656
657 outconvertclass text_t2ascii;
658 text_t2ascii.setinput(&args["cfgfile"]);
659 size_t buffersize=args["cfgfile"].size();
660 char *buffer=new char[buffersize];
661 buffer[0]='\n'; // just in case something goes wrong...
662 size_t num_chars;
663 convertclass::status_t status;
664 text_t2ascii.convert(buffer, buffersize, num_chars, status);
665 // ignore status - assume it is "finished" as buffer is big enough
666 write(fd, buffer, num_chars);
667 GSDL_UNLOCK_FILE (fd);
668 close(fd);
669 delete buffer;
670
671 // now that we've written the file we'll read it back again and
672 // update our bc1 arguments
673 ifstream cfg_in (cfgfilec);
674 if (cfg_in) {
675 text_tarray cfgline;
676 while (read_cfg_line(cfg_in, cfgline) >= 0) {
677 if (cfgline.size () >= 2) {
678 if (cfgline[0] == "creator") {
679 args["bc1contactemail"] = cfgline[1];
680 } else if (cfgline[0] == "collectionmeta") {
681 if (cfgline[1] == "collectionname") {
682 args["bc1fullname"] = cfgline[2];
683 } else if (cfgline[1] == "collectionextra") {
684 args["bc1aboutdesc"] = carriage_replace (cfgline[2], 1);
685 }
686 }
687 }
688 }
689 cfg_in.close();
690 } else {
691 logout << "collectoraction::update_cfgfile_complete: unable to open "
692 << cfgfilec << " for input\n";
693 message = "tmpfail";
694 }
695 }
696 } else {
697 logout << "collectoraction::update_cfgfile_complete: unable to open "
698 << cfgfilec << " for output\n";
699 message = "tmpfail";
700 }
701
702 delete cfgfilec;
703}
704
705void collectoraction::get_cgihead_info (cgiargsclass &/*args*/, recptprotolistclass * /*protos*/,
706 response_t &response,text_t &response_data,
707 ostream &/*logout*/) {
708 response = content;
709 response_data = "text/html";
710}
711
712// return html for buttons used in collector bar
713// color may be "green", "grey", or "yellow"
714// type may be:
715// "info" --> "collection information" button
716// "srce" --> "source data" button
717// "conf" --> "configure collection" button
718// "bild" --> "build collection" button
719// "view" --> "view collection" button
720// if enabled is true button will be flashy rollover type and
721// will be hyperlinked
722
723text_t collectoraction::get_button (const text_t &thispage, const text_t &color,
724 const text_t &type, bool enabled) {
725
726 if ((color != "green" && color != "grey" && color != "yellow") ||
727 (type != "info" && type != "srce" && type != "conf" && type != "bild" && type != "view"))
728 return "";
729
730 text_t prefix = "gc";
731 if (color == "grey") prefix = "nc";
732 else if (color == "yellow") prefix = "yc";
733
734 text_t httpicon = "httpicon" + prefix + type;
735
736 if (enabled) {
737 text_t gsmacro = "_gsimage_";
738 if (thispage == "info" || thispage == "srce" || thispage == "conf" ||
739 thispage == "bildcancel" || thispage == "bildfail") {
740 gsmacro = "_gsjimage_";
741 } else if (type == "view") {
742 // view button is special case as it needs a target=_top
743 gsmacro = "_gstimage_";
744 }
745 return "<td>" + gsmacro + "(_collector:http" + type + "_,_collector:" + httpicon +
746 "of_,_collector:" + httpicon + "on_," + type + ",_collector:text" + type + "_)</td>\n";
747 } else {
748 return "<td>_icon" + prefix + type + "of_</td>\n";
749 }
750}
751
752// set the _fullnamemenu_ macro (and _warnindex_ and _selectedindex_ if
753// we're on the "srce" page)
754void collectoraction::set_fullnamemenu (displayclass &disp, cgiargsclass &args,
755 recptprotolistclass *protos, ostream &logout) {
756
757 if (recpt == NULL) {
758 logout << "ERROR (collectoraction::set_fullnamemenu): This action does not contain\n"
759 << " information about any receptionists. The method set_receptionist was\n"
760 << " probably not called from the module which instantiated this action.\n";
761 return;
762 }
763
764 text_t &current_page = args["p"];
765 text_t currentname = args["bc1dirname"];
766 if (current_page == "srce") currentname = args["bc1clonecol"];
767
768 text_tarray dirnames;
769 text_tarray fullnames;
770 vector<bool> write_protected;
771 bool is_selected = false;
772 int selected_index = 0;
773 int index = 0;
774
775 recptprotolistclass::iterator rprotolist_here = protos->begin();
776 recptprotolistclass::iterator rprotolist_end = protos->end();
777 while (rprotolist_here != rprotolist_end) {
778 if ((*rprotolist_here).p != NULL) {
779
780 // don't include z39.50 collections
781 comerror_t err = noError;
782 if ((*rprotolist_here).p->get_protocol_name (err) == "z3950proto") {
783 rprotolist_here ++;
784 continue;
785 }
786
787 text_tarray collist;
788 (*rprotolist_here).p->get_collection_list (collist, err, logout);
789 if (err == noError) {
790 text_tarray::iterator collist_here = collist.begin();
791 text_tarray::iterator collist_end = collist.end();
792 FilterResponse_t response;
793 text_tset metadata;
794 metadata.insert ("collectionname");
795 while (collist_here != collist_end) {
796 ColInfoResponse_t *cinfo = recpt->get_collectinfo_ptr ((*rprotolist_here).p, *collist_here, logout);
797 if (cinfo != NULL) {
798 text_t collectionname = *collist_here;
799 if (!cinfo->collectionmeta["collectionname"].empty()) {
800 // get collection name from the collection cfg file
801 collectionname = cinfo->collectionmeta["collectionname"];
802 } else if (get_info ("collection", *collist_here, metadata, false,
803 (*rprotolist_here).p, response, logout)) {
804 // get collection name from gdbm file
805 collectionname = response.docInfo[0].metadata["collectionname"].values[0];
806 }
807 dirnames.push_back(*collist_here);
808 fullnames.push_back(collectionname);
809 // check to see if the collection is writable
810 if (collection_protected (*collist_here)) write_protected.push_back(true);
811 else write_protected.push_back(false);
812
813 if (*collist_here == currentname) {
814 is_selected = true;
815 selected_index = index;
816 }
817 index ++;
818 }
819 collist_here ++;
820 }
821 }
822 }
823 rprotolist_here ++;
824 }
825
826 bool first = true;
827 text_t warnindex;
828 text_t fullnamemenu = "<select name=\"bc1dirname\">\n";
829 if (current_page == "srce") {
830 fullnamemenu = "<select name=\"bc1clonecol\" onChange=\"menuchange();\">\n";
831 fullnamemenu += "<option value=defaultstructure";
832 if (!is_selected) fullnamemenu += " selected>";
833 else fullnamemenu.push_back('>');
834 fullnamemenu += "_collector:textdefaultstructure_\n";
835 }
836 for (int i = 0; i < index; i ++) {
837 // don't want write protected collections in list on "change existing
838 // collection" page
839 if (write_protected[i] && current_page == "existing") continue;
840 fullnamemenu += "<option value=\"" + dirnames[i] + "\"";
841 if ((i == 0 && !is_selected && current_page != "srce") ||
842 (is_selected && i == selected_index)) {
843 fullnamemenu += " selected";
844 selected_index++;
845 is_selected = false;
846 }
847 fullnamemenu.push_back ('>');
848 fullnamemenu += fullnames[i];
849 fullnamemenu.push_back ('\n');
850
851 // add to Warnindex if collection uses any dubious plugins
852 // (if creating clone collection list)
853 if (current_page == "srce") {
854 if (first) warnindex += "0,";
855 else warnindex.push_back(',');
856 if (uses_weird_plugin (dirnames[i])) {
857 warnindex += text_t (1);
858 } else {
859 warnindex += text_t (0);
860 }
861 }
862 first = false;
863 }
864 fullnamemenu += "</select>\n";
865
866 disp.setmacro ("fullnamemenu", "collector", fullnamemenu);
867 if (current_page == "srce") {
868 disp.setmacro ("warnindex", "collector", warnindex);
869 disp.setmacro ("selectedindex", "collector", text_t(selected_index));
870 }
871}
872
873// set _sourcelist_ and _badsources_ macros
874void collectoraction::set_inputsourceboxes (displayclass &disp, cgiargsclass &args,
875 ostream &logout) {
876
877 if (badsources) disp.setmacro ("badsources", "collector", "1");
878
879 text_t sourcelist = get_source_box(args["bc1input"], args["bc1inputnum"].getint(),
880 args["bc1inputtype"]);
881
882 disp.setmacro("sourcelist", "collector", sourcelist);
883
884 // reset badsources and failedsources variables
885 badsources = false;
886 failedsources.erase(failedsources.begin(), failedsources.end());
887}
888
889text_t collectoraction::get_source_box (text_t inputarglist, int numboxes,
890 text_t inputtypelist) {
891
892 text_tarray inputvalues;
893 splitchar (inputarglist.begin(), inputarglist.end(), ',', inputvalues);
894 // remove any empty values from the end of the array
895 if (inputvalues.size()) {
896 text_tarray::iterator l = inputvalues.end() - 1;
897 text_tarray::iterator b = inputvalues.begin();
898 while ((*l).empty() && l >= b) {
899 l--;
900 }
901 inputvalues.erase(l+1, inputvalues.end());
902 }
903
904 text_tarray inputtypes;
905 splitchar (inputtypelist.begin(), inputtypelist.end(), ',', inputtypes);
906
907 int numvalues = inputvalues.size();
908 int numtypes = inputtypes.size();
909
910 text_t last = "file://";
911 text_t rv;
912 for (int i = 0; i < numboxes; i++) {
913 rv += "<nobr><select name=\"bc1inputtype\">\n";
914 rv += "<option value=\"file://\"";
915 if ((i < numtypes && inputtypes[i] == "file://") ||
916 (numboxes == 3 && i == 0 && numvalues == 0) ||
917 (i >= 3 && i >= numvalues && last == "file://")) {
918 rv += " selected";
919 last = "file://";
920 }
921 rv += ">file://\n";
922 rv += "<option value=\"http://\"";
923 if ((i < numtypes && inputtypes[i] == "http://") ||
924 (numboxes == 3 && i == 1 && numvalues == 0) ||
925 (i >= 3 && i >= numvalues && last == "http://")) {
926 rv += " selected";
927 last = "http://";
928 }
929 rv += ">http://\n";
930 rv += "<option value=\"ftp://\"";
931 if ((i < numtypes && inputtypes[i] == "ftp://") ||
932 (numboxes == 3 && i == 2 && numvalues == 0) ||
933 (i >= 3 && i >= numvalues && last == "ftp://")) {
934 rv += " selected";
935 last = "ftp://";
936 }
937 rv += ">ftp://\n";
938 rv += "</select>\n";
939 rv += "<input type=text name=\"bc1input\" value=\"";
940 if (i < numvalues) {
941 rv += dm_safe(decode_commas(inputvalues[i]));
942 }
943 rv += "\" size=50>";
944 if (badsources) {
945 if ((i < numvalues) && (!inputvalues[i].empty())) {
946 if (failedsources[decode_commas(inputvalues[i])] == "1") {
947 rv += "_iconcross_";
948 } else {
949 rv += "_icontick_";
950 }
951 } else {
952 rv += "_iconblank_";
953 }
954 }
955 if (i+1 == numboxes) {
956 if (!badsources) rv += "_iconblank_";
957 rv += "_imagemore_</nobr><br>";
958 } else {
959 rv += "</nobr><br>\n";
960 }
961 }
962
963 return rv;
964}
965
966// set the _cfgfile_ macro
967void collectoraction::set_cfgfile (displayclass &disp, cgiargsclass &args, ostream &logout) {
968
969 text_t &collection = args["bc1dirname"];
970 if (collection.empty()) {
971 message = "nocollection";
972 return;
973 }
974
975 // read in collect.cfg
976 text_t cfgfile = filename_cat(get_collectdir(args), collection, "etc", "collect.cfg");
977 char *cfgfilec = cfgfile.getcstr();
978
979#ifdef GSDL_USE_IOS_H
980 ifstream cfg_ifs (cfgfilec, ios::in | ios::nocreate);
981#else
982 ifstream cfg_ifs (cfgfilec, ios::in);
983#endif
984
985 if (cfg_ifs) {
986 // read in collect.cfg
987 text_t cfgtext;
988 char c;
989 cfg_ifs.get(c);
990 while (!cfg_ifs.eof ()) {
991 cfgtext.push_back(c);
992 cfg_ifs.get(c);
993 }
994 cfg_ifs.close();
995
996 // define it as a macro
997 disp.setmacro("cfgfile", "collector", dm_safe(cfgtext));
998
999 } else {
1000 logout << "collectoraction::set_cfgfile: couldn't open configuration file ("
1001 << cfgfilec << ") for reading\n";
1002 message = "tmpfail";
1003 }
1004 delete cfgfilec;
1005}
1006
1007// set the _statusline_ macro
1008void collectoraction::set_statusline (displayclass &disp, cgiargsclass &args, ostream & /*logout*/) {
1009
1010 // the build command creates .bld.download, .bld.import, and .bld.build files (in that
1011 // order) and deletes them (also in that order) when each stage is complete. the .bld
1012 // file is the concatenation of all these files.
1013 text_t bld_file = filename_cat (gsdlhome, "tmp", args["bc1tmp"], args["bc1dirname"] + ".bld");
1014 text_t statusline;
1015
1016 if (file_exists (bld_file + ".download")) {
1017 statusline = "_collector:textdownloadingfiles_<br>\n";
1018 statusline += dm_safe(file_tail(bld_file + ".download", 1, 0));
1019 } else if (file_exists (bld_file + ".import")) {
1020 statusline = "_collector:textimportingcollection_<br>\n";
1021 statusline += dm_safe(file_tail(bld_file + ".import", 1, 0));
1022 } else if (file_exists (bld_file + ".build")) {
1023 statusline = "_collector:textbuildingcollection_<br>\n";
1024 statusline += dm_safe(file_tail(bld_file + ".build", 1, 0));
1025 } else {
1026 statusline += "_collector:textcreatingcollection_<br>\n";
1027 statusline += dm_safe(file_tail(bld_file, 1, 0));
1028 }
1029
1030 disp.setmacro ("statusline", "collector", statusline);
1031
1032}
1033
1034void collectoraction::define_internal_macros (displayclass &disp, cgiargsclass &args,
1035 recptprotolistclass *protos, ostream &logout) {
1036
1037 // define_internal_macros sets the following macros:
1038 // _collectorbar_
1039 // _pagescriptextra_
1040 // _fullnamemenu_ -- if displaying the "source data" page or the "changing existing
1041 // collection" page
1042 // _cfgfile_ -- if displaying the "configure collection" page
1043 // _statusline_ -- if displaying the bildstatus page
1044 // _header_ -- may be set for pages that require it
1045 // _textfailmsg_ -- set to different messages depending on failcode returned
1046 // by build script (if build fails)
1047 // _faillog_ - set to last 6 lines of .bld file if build failed
1048 // _gsdlhome_ - the gsdlhome path (dm_safe)
1049 // _sourcelist_ -- "input source" text boxes
1050 // _badsources_ -- will be set to "1" if we've come from the
1051 // "source data" page and there's a problem
1052 // with the input sources
1053
1054 text_t &collector_page = args["p"];
1055 int esrce = args["bc1esrce"].getint();
1056 int econf = args["bc1econf"].getint();
1057
1058 // set _pagescriptextra_ macro to _cpagescriptextra_
1059 disp.setmacro ("pagescriptextra", "collector", "_" + collector_page + "scriptextra_");
1060
1061 if (collector_page == "bildstatus" || collector_page == "bilddone" ||
1062 collector_page == "bildfail" || collector_page == "bildframe1") {
1063 disp.setmacro ("header", "collector", "_" + collector_page + "header_");
1064 }
1065
1066 // set the collectorbar macro
1067 text_t collectorbar = "<table border=0 cellspacing=4 cellpadding=0><tr>\n";
1068
1069 if (collector_page == "new") {
1070 collectorbar += "<td>_icongreyarrow_</td>\n";
1071 collectorbar += get_button (collector_page, "green", "info", true);
1072 collectorbar += "<td>_icongreyarrow_</td>\n";
1073 collectorbar += get_button (collector_page, "grey", "srce", false);
1074 collectorbar += "<td>_icongreyarrow_</td>\n";
1075 collectorbar += get_button (collector_page, "grey", "conf", false);
1076 collectorbar += "<td>_icongreyarrow_</td>\n";
1077 collectorbar += get_button (collector_page, "grey", "bild", false);
1078 collectorbar += "<td>_icongreyarrow_</td>\n";
1079 collectorbar += get_button (collector_page, "grey", "view", false);
1080
1081 } else if (collector_page == "info") {
1082 collectorbar += "<td>_icongreyarrow_</td>\n";
1083 collectorbar += get_button (collector_page, "yellow", "info", false);
1084 collectorbar += "<td>_icongreyarrow_</td>\n";
1085 collectorbar += get_button (collector_page, "green", "srce", true);
1086 collectorbar += "<td>_icongreyarrow_</td>\n";
1087 collectorbar += get_button (collector_page, "grey", "conf", false);
1088 collectorbar += "<td>_icongreyarrow_</td>\n";
1089 collectorbar += get_button (collector_page, "grey", "bild", false);
1090 collectorbar += "<td>_icongreyarrow_</td>\n";
1091 collectorbar += get_button (collector_page, "grey", "view", false);
1092 collectorbar += "</tr><tr><td></td><td align=center>_icongreyuparrow_</td><td colspan=8></td>\n";
1093
1094 } else if (collector_page == "srce") {
1095 collectorbar += "<td>_icongreyarrow_</td>\n";
1096 if (esrce == 1) {
1097 // if we came from the "change an existing collection" page previous button(s)
1098 // are disabled
1099 collectorbar += get_button (collector_page, "grey", "info", false);
1100 } else {
1101 collectorbar += get_button (collector_page, "yellow", "info", true);
1102 }
1103 collectorbar += "<td>_icongreyarrow_</td>\n";
1104 collectorbar += get_button (collector_page, "yellow", "srce", false);
1105 collectorbar += "<td>_icongreyarrow_</td>\n";
1106 collectorbar += get_button (collector_page, "green", "conf", true);
1107 collectorbar += "<td>_icongreyarrow_</td>\n";
1108 collectorbar += get_button (collector_page, "green", "bild", true);
1109 collectorbar += "<td>_icongreyarrow_</td>\n";
1110 collectorbar += get_button (collector_page, "grey", "view", false);
1111 collectorbar += "</tr><tr><td colspan=3></td><td align=center>_icongreyuparrow_</td><td colspan=6></td>\n";
1112
1113 } else if (collector_page == "conf") {
1114 collectorbar += "<td>_icongreyarrow_</td>\n";
1115 // disable appropriate buttons if we came from "change an existing collection"
1116 // page
1117 if (esrce == 1 || econf == 1) {
1118 collectorbar += get_button (collector_page, "grey", "info", false);
1119 } else {
1120 collectorbar += get_button (collector_page, "yellow", "info", true);
1121 }
1122 collectorbar += "<td>_icongreyarrow_</td>\n";
1123 if (econf == 1) {
1124 collectorbar += get_button (collector_page, "grey", "srce", false);
1125 } else {
1126 collectorbar += get_button (collector_page, "yellow", "srce", true);
1127 }
1128 collectorbar += "<td>_icongreyarrow_</td>\n";
1129 collectorbar += get_button (collector_page, "yellow", "conf", false);
1130 collectorbar += "<td>_icongreyarrow_</td>\n";
1131 collectorbar += get_button (collector_page, "green", "bild", true);
1132 collectorbar += "<td>_icongreyarrow_</td>\n";
1133 collectorbar += get_button (collector_page, "grey", "view", false);
1134 collectorbar += "</tr><tr><td colspan=5></td><td align=center>_icongreyuparrow_</td><td colspan=4></td>\n";
1135
1136 } else if (collector_page == "bilddone") {
1137 collectorbar += "<td>_icongreyarrow_</td>\n";
1138 // all previous buttons grey after build was completed
1139 collectorbar += get_button (collector_page, "grey", "info", false);
1140 collectorbar += "<td>_icongreyarrow_</td>\n";
1141 collectorbar += get_button (collector_page, "grey", "srce", false);
1142 collectorbar += "<td>_icongreyarrow_</td>\n";
1143 collectorbar += get_button (collector_page, "grey", "conf", false);
1144 collectorbar += "<td>_icongreyarrow_</td>\n";
1145 collectorbar += get_button (collector_page, "yellow", "bild", false);
1146 collectorbar += "<td>_icongreyarrow_</td>\n";
1147 collectorbar += get_button (collector_page, "green", "view", true);
1148 collectorbar += "</tr><tr><td colspan=7></td><td align=center>_icongreyuparrow_</td><td colspan=2></td>\n";
1149
1150 } else if (collector_page == "bildcancel" || collector_page == "bildfail") {
1151 collectorbar += "<td>_icongreyarrow_</td>\n";
1152 // disable appropriate buttons if we came from "change an existing collection"
1153 // page
1154 if (esrce == 1 || econf == 1) {
1155 collectorbar += get_button (collector_page, "grey", "info", false);
1156 } else {
1157 collectorbar += get_button (collector_page, "yellow", "info", true);
1158 }
1159 collectorbar += "<td>_icongreyarrow_</td>\n";
1160 if (econf == 1) {
1161 collectorbar += get_button (collector_page, "grey", "srce", false);
1162 } else {
1163 collectorbar += get_button (collector_page, "yellow", "srce", true);
1164 }
1165 collectorbar += "<td>_icongreyarrow_</td>\n";
1166 collectorbar += get_button (collector_page, "yellow", "conf", true);
1167 collectorbar += "<td>_icongreyarrow_</td>\n";
1168 collectorbar += get_button (collector_page, "yellow", "bild", true);
1169 collectorbar += "<td>_icongreyarrow_</td>\n";
1170 collectorbar += get_button (collector_page, "grey", "view", false);
1171 }
1172
1173 collectorbar += "</tr></table>\n";
1174 disp.setmacro ("collectorbar", "collector", collectorbar);
1175
1176 if (collector_page == "bildfail") {
1177
1178 text_t textfailmsg = "_textfailmsg";
1179 textfailmsg.push_back(failcode);
1180 textfailmsg.push_back('_');
1181 disp.setmacro("textfailmsg", "collector", textfailmsg);
1182
1183 text_t bldlog = filename_cat(gsdlhome, "tmp", args["bc1tmp"], args["bc1dirname"] + ".bld");
1184 text_t rawlog = file_tail (bldlog, 6, 0);
1185 // we'll shove in some <br> tags where \n's occur
1186 text_t faillog;
1187 text_t::const_iterator here = rawlog.begin();
1188 text_t::const_iterator end = rawlog.end();
1189 while (here != end) {
1190 if (*here == '\n') faillog += "<br>";
1191 faillog.push_back (*here);
1192 here ++;
1193 }
1194 disp.setmacro ("faillog", "collector", dm_safe(faillog));
1195 }
1196
1197 if (collector_page == "srce" || collector_page == "existing")
1198 set_fullnamemenu (disp, args, protos, logout);
1199 if (collector_page == "conf")
1200 set_cfgfile (disp, args, logout);
1201 if (collector_page == "bildstatus")
1202 set_statusline (disp, args, logout);
1203 if (collector_page == "srce") {
1204 set_inputsourceboxes (disp, args, logout);
1205 }
1206
1207 disp.setmacro ("gsdlhome", "collector", dm_safe(gsdlhome));
1208}
1209
1210bool collectoraction::do_action (cgiargsclass &args, recptprotolistclass * /*protos*/,
1211 browsermapclass * /*browsers*/, displayclass &disp,
1212 outconvertclass &outconvert, ostream &textout,
1213 ostream &logout) {
1214
1215 // make sure the collector is enabled
1216 if (disabled) {
1217 textout << outconvert
1218 << "<html>\n"
1219 << "<head>\n"
1220 << "<title>Collector disabled</title>\n"
1221 << "</head>\n"
1222 << "<body bgcolor=\"#ffffff\" text=\"#000000\" link=\"#006666\" "
1223 << "alink=\"#cc9900\" vlink=\"#666633\">\n"
1224 << "<h2>Facility disabled</h2>\n"
1225 << "Sorry, the Collector end-user collection building facility is currently disabled\n"
1226 << "\n</body>\n"
1227 << "</html>\n";
1228 return true;
1229 }
1230
1231 text_t &collector_page = args["p"];
1232 text_t &collection = args["bc1dirname"];
1233
1234 // make sure we have perl (we won't bother with this check for the
1235 // building status pages to avoid slowing things down unneccessarily)
1236 if (collector_page != "bildstatus" && collector_page != "bildframe1" && !perl_ok(logout)) {
1237 textout << outconvert
1238 << "<html>\n"
1239 << "<head>\n"
1240 << "<title>Perl not found</title>\n"
1241 << "</head>\n"
1242 << "<body bgcolor=\"#ffffff\" text=\"#000000\" link=\"#006666\" "
1243 << "alink=\"#cc9900\" vlink=\"#666633\">\n"
1244 << "<h2>Perl not found</h2>\n"
1245 << "Greenstone could not detect perl on this system. It is therefore not\n"
1246 << "possible to build a Greenstone collection, either from the Collector or the \n"
1247 << "command-line tools, or to use the Collector for any other task.\n"
1248 << "<p>Please refer to the Greenstone Installer's Guide for details on\n"
1249 << "installing perl on your system.\n"
1250 << "\n</body>\n"
1251 << "</html>\n";
1252 return true;
1253
1254 }
1255
1256 if (collector_page == "bild") {
1257 // do the work (download, import, build)
1258 gsdl_build (args, logout);
1259
1260 if (message.empty()) {
1261 // bild page is a frameset so we don't want headers and stuff
1262 textout << outconvert << disp << ("_collector:bildcontent_\n");
1263 }
1264 }
1265
1266 if (do_mkcol == true) {
1267 // execute mkcol.pl (do_mkcol is set from within check_cgiargs)
1268 gsdl_mkcol (args, logout);
1269 do_mkcol = false; // reset for fast-cgi
1270 }
1271
1272 if (args["bc1dodelete"] == "1") {
1273 // delete bcidirname collection
1274 if (collection_protected (collection)) {
1275 message = "delinvalid";
1276
1277 } else {
1278
1279 const recptconf &rcinfo = recpt->get_configinfo ();
1280 bool emailuserevents = rcinfo.EmailUserEvents;
1281
1282 // get collection maintainer email from collect.cfg before we
1283 // delete it
1284 text_t colmaintainer;
1285 text_t cfgfile = filename_cat(gsdlhome, "collect", collection, "etc", "collect.cfg");
1286 char *cfgfilec = cfgfile.getcstr();
1287 ifstream cfg_in (cfgfilec);
1288 delete cfgfilec;
1289 if (cfg_in) {
1290 text_tarray cfgline;
1291 while (read_cfg_line(cfg_in, cfgline) >= 0) {
1292 if (cfgline.size () == 2 && cfgline[0] == "maintainer") {
1293 colmaintainer = cfgline[1];
1294 break;
1295 }
1296 }
1297 cfg_in.close();
1298 }
1299 if (colmaintainer.empty()) {
1300 logout << outconvert
1301 << "collectoraction::do_action WARNING: Collection being deleted ("
1302 << collection << ") has no maintainer address. EmailUserEvents "
1303 << "disabled\n";
1304 emailuserevents = false;
1305 }
1306
1307 // first we need to free up the collection's collection server
1308 // we must do this for the local library (and I guess when using
1309 // fastcgi too) as you can't delete the gdbm file while it's
1310 // being kept open by the collection server
1311 remove_colservr (collection, logout);
1312
1313 text_t delete_cmd = "perl -S delcol.pl -f " + collection;
1314 int rv = gsdl_system (delete_cmd, true, logout);
1315 if (rv != 0) {
1316 // deletion failed -- permissions?
1317 message = "delpermission";
1318 } else {
1319 message = "delsuccess";
1320 }
1321
1322 // log the event
1323 if (rcinfo.LogEvents == CollectorEvents || rcinfo.LogEvents == AllEvents) {
1324
1325 text_t eventlog = filename_cat (gsdlhome, "etc", "events.txt");
1326 char *eventlogt = eventlog.getcstr();
1327 ofstream eventl (eventlogt, ios::app);
1328 delete eventlogt;
1329
1330 if (eventl) {
1331 eventl << outconvert << "[Collector Event]\n"
1332 << "Date: " << get_date (true) << "\n"
1333 << "Greenstone Username: " << args["un"] << "\n"
1334 << "Collection: " << collection << "\n"
1335 << "Collection Maintainer: " << colmaintainer << "\n"
1336 << "GSDLHOME: " << gsdlhome << "\n";
1337
1338 if (message == "delsuccess") {
1339 eventl << outconvert
1340 << "The " << collection << " collection was successfully deleted\n\n";
1341 } else {
1342 eventl << outconvert
1343 << "Attempt to delete the " << collection << " collection failed\n\n";
1344 }
1345 eventl.close();
1346
1347 } else {
1348 logout << outconvert << "collectoraction::do_action ERROR: Couldn't open "
1349 << "event log file " << eventlog << " for appending during collection "
1350 << "deletion. LogEvents disabled\n";
1351 }
1352 }
1353
1354 if (rcinfo.EmailEvents == CollectorEvents || rcinfo.EmailEvents == AllEvents || emailuserevents) {
1355 // use sendmail.pl perl script to send email events
1356 text_t tmpmailfile = filename_cat (gsdlhome, "tmp", args["bc1tmp"], "event.txt");
1357 char *tmpmailfilec = tmpmailfile.getcstr();
1358 ofstream tmpfile (tmpmailfilec);
1359 delete tmpmailfilec;
1360 if (tmpfile) {
1361 tmpfile << outconvert << "[Collector Event]\n"
1362 << "Date: " << get_date (true) << "\n"
1363 << "Greenstone Username: " << args["un"] << "\n"
1364 << "Collection: " << collection << "\n"
1365 << "Collection Maintainer: " << colmaintainer << "\n"
1366 << "GSDLHOME: " << gsdlhome << "\n";
1367 if (message == "delsuccess") {
1368 tmpfile << outconvert
1369 << "The " << collection << " collection was successfully deleted\n\n";
1370 } else {
1371 tmpfile << outconvert
1372 << "Attempt to delete the " << collection << " collection failed\n\n";
1373 }
1374 tmpfile.close();
1375 text_t to;
1376 if (rcinfo.EmailEvents == CollectorEvents || rcinfo.EmailEvents == AllEvents) to += rcinfo.maintainer;
1377 if (emailuserevents) {
1378 if (!to.empty()) to.push_back (',');
1379 to += colmaintainer;
1380 }
1381 text_t sendmail_cmd = "perl -S sendmail.pl -to \"" + to + "\" -from \"" + rcinfo.maintainer;
1382 sendmail_cmd += "\" -smtp \"" + rcinfo.MailServer + "\" -subject \"Greenstone Collector Event\"";
1383 sendmail_cmd += " -msgfile \"" + tmpmailfile + "\"";
1384
1385 gsdl_system (sendmail_cmd, false, logout);
1386
1387 } else {
1388 logout << outconvert << "collectoraction::do_action ERROR: Couldn't open "
1389 << "temporary event log file " << tmpmailfile << " during collection "
1390 << "deletion. EmailEvents and EmailUserEvents disabled\n";
1391 }
1392 }
1393 }
1394 }
1395
1396 if (collector_page == "bildcancel" || collector_page == "bildfail") {
1397 // cancel the build (we'll also use the cancel_build script to tidy
1398 // up if the build failed)
1399 gsdl_cancel_build (args, logout);
1400 }
1401
1402 if (collector_page == "expt") {
1403
1404 // export the collection - we'll do a synchronous system call to
1405 // exportcol.pl as that's the easiest way to do it. if it becomes a
1406 // problem that it's taking too long to export a large collection then
1407 // we may have to revisit this.
1408 text_t tmpfile = filename_cat (gsdlhome, "tmp", collection + "_export.txt");
1409 text_t export_cmd = "perl -S exportcol.pl -out \"" + tmpfile + "\" " + collection;
1410 gsdl_system (export_cmd, true, logout);
1411 if (file_exists (tmpfile)) {
1412 text_t returnline = file_tail (tmpfile, 1, 0);
1413 if (returnline.size() > 23 && (substr(returnline.begin(), returnline.begin()+23) == "exportcol.pl succeeded:")) {
1414 // success
1415 message = "exptsuccess";
1416 } else {
1417 message = "exptfail";
1418 }
1419 } else {
1420 message = "exptfail";
1421 }
1422 }
1423
1424 if (message.empty()) {
1425 if (collector_page != "bild") {
1426 // output page ("bild" page was already output above)
1427 textout << outconvert << disp << ("_collector:header_\n")
1428 << ("_collector:" + collector_page + "content_\n")
1429 << ("_collector:footer_\n");
1430 }
1431 } else {
1432 // message was set somewhere (probably an error), output message page
1433 textout << outconvert << disp << ("_collector:header_\n")
1434 << ("_collector:" + message + "content_\n")
1435 << ("_collector:footer_\n");
1436 message.clear();
1437 }
1438 return true;
1439}
1440
1441// if sw = 0 replace all carriage returns in intext with the string "\n"
1442// else replace all occurances of "\n" with a carriage return
1443text_t collectoraction::carriage_replace (const text_t &intext, int sw) {
1444
1445 text_t outtext;
1446 text_t::const_iterator here = intext.begin();
1447 text_t::const_iterator end = intext.end();
1448 while (here != end) {
1449 if (sw == 0) {
1450 if (*here == '\n') {
1451 if ((here+1) != end && *(here+1) == '\r') here ++;
1452 outtext += "\\n";
1453 } else if (*here == '\r') {
1454 if ((here+1) != end && *(here+1) == '\n') here ++;
1455 outtext += "\\n";
1456 } else {
1457 outtext.push_back (*here);
1458 }
1459 } else if (*here == '\\' && (here+1) != end && *(here+1) == 'n') {
1460 outtext.push_back ('\n');
1461 here ++;
1462 } else {
1463 outtext.push_back (*here);
1464 }
1465 here ++;
1466 }
1467 return outtext;
1468}
1469
1470// create a short directory name from fullname
1471text_t collectoraction::get_directory_name (const text_t &fullname) {
1472
1473 text_t shortname;
1474 if (fullname.empty()) {
1475 shortname = "coll";
1476
1477 } else {
1478
1479 // first make all lowercase and remove any dodgy characters
1480 // (i.e. anything not [a-z]
1481 text_t::const_iterator here = fullname.begin();
1482 text_t::const_iterator end = fullname.end();
1483 while (here != end) {
1484 if ((*here >= 'A' && *here <= 'Z') || (*here >= 'a' && *here <= 'z') ||
1485 (*here == ' ')) {
1486 if (*here >= 'A' && *here <= 'Z') shortname.push_back (*here+32);
1487 else if (*here == ' ') {
1488 while ((*(here+1)) == ' ') here ++;
1489 shortname.push_back (*here);
1490 } else shortname.push_back (*here);
1491 }
1492 here ++;
1493 }
1494
1495 text_tarray words;
1496 splitchar (shortname.begin(), shortname.end(), ' ', words);
1497 int num_words = words.size();
1498
1499 if (num_words == 0) {
1500 shortname = "coll";
1501
1502 } else {
1503
1504 shortname.clear();
1505 int use_words = (num_words <= 6) ? num_words : 6;
1506 unsigned int substr_len = 6 / use_words;
1507
1508 for (int i = 0; i < use_words; i++) {
1509 if (words[i].size() < substr_len) shortname += words[i];
1510 else shortname += substr (words[i].begin(), words[i].begin()+substr_len);
1511 }
1512 }
1513 }
1514
1515 // check to see if shortname is unique
1516 text_t fulldirname = filename_cat (gsdlhome, "collect", shortname);
1517 if (directory_exists (fulldirname)) {
1518 int version = 0;
1519 text_t newname;
1520 do {
1521 version ++;
1522 newname = shortname;
1523 newname.push_back ('v');
1524 newname.appendint (version);
1525 fulldirname = filename_cat (gsdlhome, "collect", newname);
1526 } while (directory_exists (fulldirname));
1527
1528 shortname = newname;
1529 }
1530
1531 return shortname;
1532}
1533
1534// tests if collection is write protected (currently just checks if
1535// collect.cfg file is writable
1536bool collectoraction::collection_protected (const text_t &collection) {
1537 text_t cfgfile = filename_cat(gsdlhome, "collect", collection, "etc", "collect.cfg");
1538 if (file_writable(cfgfile)) return false;
1539 return true;
1540}
1541
1542// assigns a temporary directory name for this collector session
1543// and creates temporary directory
1544void collectoraction::assign_tmpname (cgiargsclass &args, ostream &logout) {
1545
1546 int i = 0;
1547 text_t tmpname = "tbuild";
1548 while (directory_exists (filename_cat (gsdlhome, "tmp", tmpname + text_t(i)))) {
1549 i++;
1550 }
1551 tmpname.appendint (i);
1552
1553 text_t fulltmpdir = filename_cat (gsdlhome, "tmp", tmpname);
1554 if (!mk_dir (fulltmpdir)) {
1555 outconvertclass text_t2ascii;
1556 logout << text_t2ascii << "collectoraction::assign_tmpname unable to create directory ("
1557 << fulltmpdir << ")\n";
1558 }
1559
1560 args["bc1tmp"] = tmpname;
1561}
1562
1563void collectoraction::gsdl_mkcol (cgiargsclass &args, ostream &logout) {
1564
1565 text_t tmpdir = filename_cat (gsdlhome, "tmp", args["bc1tmp"]);
1566 if (!directory_exists (tmpdir)) {
1567 message = "tmpfail";
1568 return;
1569 }
1570
1571 text_t &collection = args["bc1dirname"];
1572 if (collection.empty()) {
1573 message = "nocollection";
1574 return;
1575 }
1576
1577 // check for a .create file - if it exists then we've already created the collection
1578 text_t createfile = filename_cat (tmpdir, ".create");
1579 if (file_exists (createfile)) {
1580 return;
1581 }
1582
1583 // set up options
1584 text_t options = "-quiet -creator \"" + args["bc1contactemail"] + "\"";
1585 options += " -title \"" + args["bc1fullname"] + "\"";
1586 options += " -about \"" + carriage_replace (args["bc1aboutdesc"] + "_collectorextra_", 0) + "\"";
1587 options += " -collectdir \"" + remove_trailing_slashes(tmpdir) + "\" ";
1588
1589 text_t optionfile = filename_cat (tmpdir, "mkcol.opt");
1590 char *optionfilec = optionfile.getcstr();
1591 ofstream ofile_out (optionfilec);
1592 delete optionfilec;
1593 if (!ofile_out) {
1594 message = "tmpfail";
1595 return;
1596 }
1597 outconvertclass text_t2ascii;
1598 ofile_out << text_t2ascii << options << "\n";
1599 ofile_out.close();
1600
1601 // run mkcol.pl
1602 text_t mkcol_cmd = "perl -S mkcol.pl -optionfile \"" + optionfile;
1603 mkcol_cmd += "\" " + collection;
1604 gsdl_system (mkcol_cmd, true, logout);
1605
1606 // make sure it went ok
1607 text_t cfgfile = filename_cat (tmpdir, collection, "etc", "collect.cfg");
1608 if (!file_writable (cfgfile)) {
1609 message = "mkcolfail";
1610 } else {
1611 // create the .create file (this file is just a place holder to let any future
1612 // pages know that the collection already exists).
1613 char *createfilec = createfile.getcstr();
1614 ofstream cfile_out (createfilec);
1615 delete createfilec;
1616 if (cfile_out) {
1617 cfile_out << "collection created\n";
1618 cfile_out.close();
1619 } else {
1620 message = "tmpfail";
1621 return;
1622 }
1623 }
1624}
1625
1626void collectoraction::gsdl_build (cgiargsclass &args, ostream &logout) {
1627
1628 outconvertclass text_t2ascii;
1629
1630 text_t tmpdir = filename_cat (gsdlhome, "tmp", args["bc1tmp"]);
1631 if (!directory_exists (tmpdir)) {
1632 message = "tmpfail";
1633 return;
1634 }
1635
1636 text_t &collection = args["bc1dirname"];
1637 if (collection.empty()) {
1638 message = "nocollection";
1639 return;
1640 }
1641
1642 // check for a .build file - if it exists then we've already built
1643 // the collection (or are in the process of building it)
1644 text_t buildfile = filename_cat (tmpdir, ".build");
1645 if (file_exists (buildfile)) {
1646 return;
1647 } else {
1648 // create the .build file (this file is just a place holder to let any future
1649 // pages know that we've already been here)
1650 char *buildfilec = buildfile.getcstr();
1651 ofstream bfile_out (buildfilec);
1652 delete buildfilec;
1653 if (bfile_out) {
1654 bfile_out << "collection building\n";
1655 bfile_out.close();
1656 } else {
1657 message = "tmpfail";
1658 return;
1659 }
1660 }
1661
1662 const recptconf &rcinfo = recpt->get_configinfo ();
1663
1664 // create the event header file if LogEvents, EmailEvents or
1665 // EmailUserEvents options are turned on.
1666 bool logevents =
1667 (rcinfo.LogEvents == CollectorEvents || rcinfo.LogEvents == AllEvents ||
1668 rcinfo.EmailEvents == CollectorEvents || rcinfo.EmailEvents == AllEvents ||
1669 rcinfo.EmailUserEvents);
1670 text_t ehead_file = filename_cat (tmpdir, "ehead.txt");
1671 if (logevents) {
1672 if (!create_event_header_file (ehead_file, args, logout)) {
1673 logevents = false;
1674 }
1675 }
1676
1677 text_t collectdir = get_collectdir (args);
1678
1679 // set up build options
1680 text_t options = "-make_writable -remove_import -out \"";
1681 options += filename_cat (tmpdir, collection + ".bld");
1682 options += "\" -collectdir \"" + collectdir + "\" -statsfile \"";
1683 options += filename_cat(collectdir, collection, "etc", "import.log") + "\"";
1684
1685 if (args["bc1esrce"] == 1) {
1686 // we're adding data to an existing collection
1687 options += " -save_archives -append";
1688 }
1689
1690 text_tarray inputvalues, inputtypes;
1691 splitchar (args["bc1input"].begin(), args["bc1input"].end(), ',', inputvalues);
1692 splitchar (args["bc1inputtype"].begin(), args["bc1inputtype"].end(), ',', inputtypes);
1693 int numvalues = inputvalues.size();
1694 int numtypes = inputtypes.size();
1695 for (int i = 0; i < numvalues; i++) {
1696 if (!inputvalues[i].empty()) {
1697 text_t type = "file://"; // default
1698 if (i < numtypes) type = inputtypes[i];
1699 options += " -download \"" +
1700 remove_trailing_slashes(type + format_url(decode_commas(inputvalues[i]))) + "\"";
1701 }
1702 }
1703
1704 if (logevents) {
1705 if (rcinfo.LogEvents == CollectorEvents || rcinfo.LogEvents == AllEvents)
1706 options += " -log_events";
1707 if (rcinfo.EmailEvents == CollectorEvents || rcinfo.EmailEvents == AllEvents) {
1708 options += " -mail_server " + rcinfo.MailServer;
1709 options += " -email_events " + rcinfo.maintainer;
1710 if (rcinfo.EmailUserEvents) options += "," + args["bc1contactemail"];
1711 } else if (rcinfo.EmailUserEvents) {
1712 options += " -mail_server " + rcinfo.MailServer;
1713 options += " -email_events " + args["bc1contactemail"];
1714 }
1715 options += " -event_header " + ehead_file;
1716 }
1717
1718 text_t optionfile = filename_cat (tmpdir, "build.opt");
1719 char *optionfilec = optionfile.getcstr();
1720 ofstream ofile_out (optionfilec);
1721 delete optionfilec;
1722 if (!ofile_out) {
1723 message = "tmpfail";
1724 return;
1725 }
1726 ofile_out << text_t2ascii << options << "\n";
1727 ofile_out.close();
1728
1729 // if we're altering an existing collection we need to kill off
1730 // the existing collection server - we do this for the local library
1731 // (and any other persistent version of the library) as the existing
1732 // gdbm file can't be deleted while the collection server holds it open
1733 if ((args["bc1econf"] == 1) || (args["bc1esrce"] == 1)) {
1734 remove_colservr (collection, logout);
1735 }
1736
1737 // set up the build command - build.bat has some issues with quoting
1738 // on win2k when gsdlhome contains spaces so we'll avoid using
1739 // "perl -S" here in favor of calling the "build" perl script explicitly
1740 text_t build_cmd = "perl \"" + filename_cat (gsdlhome, "bin", "script", "build");
1741 build_cmd += "\" -optionfile \"" + optionfile + "\" " + collection;
1742 // run build command in background (i.e. asynchronously)
1743 gsdl_system (build_cmd, false, logout);
1744}
1745
1746void collectoraction::gsdl_cancel_build (cgiargsclass &args, ostream &logout) {
1747 // I really wanted to do what this perl script does from within the library
1748 // c++ code. I ran into some problems though (like how do you write a portable
1749 // "rm -r" in c++?). One day I'll spend some time sorting it out ... maybe.
1750 text_t cancel_cmd = "perl -S cancel_build.pl -collectdir \"";
1751 cancel_cmd += filename_cat (gsdlhome, "tmp", args["bc1tmp"]) + "\" ";
1752 cancel_cmd += args["bc1dirname"];
1753 // To be on the safe side we'll make this a synchronous call
1754 // so that all tidying up is done before the user has a chance
1755 // to do anything else (like start rebuilding their collection).
1756 // This means that for a big collection where there's lots of
1757 // stuff to delete etc. it might take a while before the "build
1758 // cancelled" page appears.
1759 gsdl_system (cancel_cmd, true, logout);
1760}
1761
1762text_t collectoraction::get_collectdir (cgiargsclass &args) {
1763
1764 if ((args["bc1econf"] == 1) || (args["bc1esrce"] == 1)) {
1765 // we're adding to a collection in place
1766 return filename_cat(gsdlhome, "collect");
1767
1768 } else {
1769 return filename_cat (gsdlhome, "tmp", args["bc1tmp"]);
1770 }
1771}
1772
1773// checks to see if any of the plugins in pluginset occur in
1774// collections configuration file
1775bool collectoraction::uses_weird_plugin (const text_t &collection) {
1776
1777 text_tset pluginset;
1778 pluginset.insert ("HBPlug");
1779
1780 text_t cfgfile_content;
1781 text_t cfgfile_name = filename_cat (gsdlhome, "collect", collection, "etc", "collect.cfg");
1782 text_t pluginstr, pluginname;
1783
1784 if (read_file (cfgfile_name, cfgfile_content)) {
1785 text_t::const_iterator here = cfgfile_content.begin();
1786 text_t::const_iterator end = cfgfile_content.end();
1787 while (here != end) {
1788 here = findchar (here, end, 'p');
1789 if (here == end) break;
1790 if ((here+6 < end) && (substr (here, here+6) == "plugin")) {
1791 getdelimitstr (here+6, end, '\n', pluginstr);
1792 text_t::const_iterator hp = pluginstr.begin();
1793 text_t::const_iterator ep = pluginstr.end();
1794 bool found = false;
1795 // remove any leading whitespace, trailing options etc.
1796 while (hp != ep) {
1797 if (*hp == '\t' || *hp == ' ' || *hp == '\n') {
1798 if (found) break;
1799 } else {
1800 pluginname.push_back (*hp);
1801 found = true;
1802 }
1803 hp ++;
1804 }
1805 text_tset::const_iterator it = pluginset.find (pluginname);
1806 if (it != pluginset.end()) return true; // found matching plugin
1807 pluginname.clear();
1808 }
1809 here ++;
1810 }
1811 }
1812 return false;
1813}
1814
1815// create and initialize a new collection server and
1816// add it to the null protocol.
1817void collectoraction::create_colserver (const text_t &collection, ostream &logout) {
1818
1819 recptprotolistclass *protos = recpt->get_recptprotolist_ptr();
1820 recptprotolistclass::iterator rprotolist_here = protos->begin();
1821 recptprotolistclass::iterator rprotolist_end = protos->end();
1822 while (rprotolist_here != rprotolist_end) {
1823 comerror_t err = noError;
1824 if ((*rprotolist_here).p != NULL) {
1825 if ((*rprotolist_here).p->get_protocol_name (err) == "nullproto") {
1826 // create collection server and add it to nullproto
1827 (*rprotolist_here).p->add_collection (collection, recpt, gsdlhome, gsdlhome);
1828 // make sure gsdlhome is configured
1829 text_tarray tmp;
1830 tmp.push_back (gsdlhome);
1831 (*rprotolist_here).p->configure ("gsdlhome", tmp, err);
1832 // re-initialize the null protocol
1833 if (!(*rprotolist_here).p->init (err, logout)) {
1834 logout << "collectoraction::create_colserver: nullproto init failed\n";
1835 }
1836 return;
1837 }
1838 }
1839 rprotolist_here ++;
1840 }
1841
1842 logout << "collectoraction::create_colserver: no valid nullproto found\n";
1843}
1844
1845// delete a collection server from the null protocol
1846void collectoraction::remove_colservr (const text_t &collection, ostream &logout) {
1847
1848 recpt->uncache_collection (collection);
1849
1850 recptprotolistclass *protos = recpt->get_recptprotolist_ptr();
1851 recptprotolistclass::iterator rprotolist_here = protos->begin();
1852 recptprotolistclass::iterator rprotolist_end = protos->end();
1853 while (rprotolist_here != rprotolist_end) {
1854 comerror_t err = noError;
1855 if ((*rprotolist_here).p != NULL) {
1856 if ((*rprotolist_here).p->get_protocol_name (err) == "nullproto") {
1857 (*rprotolist_here).p->remove_collection (collection, logout);
1858 return;
1859 }
1860 }
1861 rprotolist_here ++;
1862 }
1863
1864 logout << "collectoraction::create_colserver: no valid nullproto found\n";
1865}
1866
1867bool collectoraction::create_event_header_file (const text_t &filename, cgiargsclass &args,
1868 ostream &logout) {
1869
1870 outconvertclass text_t2ascii;
1871 char *filenamec = filename.getcstr();
1872 ofstream eheadfile (filenamec);
1873 delete filenamec;
1874
1875 if (eheadfile) {
1876 eheadfile << text_t2ascii << get_event_header (args);
1877 eheadfile.close();
1878 return true;
1879 }
1880
1881 logout << text_t2ascii << "collectoraction::create_event_header ERROR: Couldn't create "
1882 << "Event Header file " << filename << ". Event logging disabled\n";
1883 return false;
1884}
1885
1886text_t collectoraction::get_event_header (cgiargsclass &args) {
1887 text_t header = "Greenstone Username: " + args["un"] + "\n";
1888 header += "Collection: " + args["bc1dirname"] + "\n";
1889 header += "Collection Creator: " + args["bc1contactemail"] + "\n";
1890 header += "GSDLHOME: " + gsdlhome + "\n";
1891 header += "Build Location: " + get_collectdir(args) + "\n";
1892
1893 return header;
1894}
1895
1896bool collectoraction::check_sources (cgiargsclass &args, ostream &logout) {
1897
1898 bool found = false;
1899
1900 text_tarray inputvalues;
1901 splitchar (args["bc1input"].begin(), args["bc1input"].end(), ',', inputvalues);
1902
1903 text_tarray inputtypes;
1904 splitchar (args["bc1inputtype"].begin(), args["bc1inputtype"].end(), ',', inputtypes);
1905
1906 int numvalues = inputvalues.size();
1907 int numtypes = inputtypes.size();
1908
1909 for (int i = 0; i < numvalues; i++) {
1910 text_t value = format_url(decode_commas(inputvalues[i]));
1911 text_t type = "file://"; // default
1912 if (!value.empty()) {
1913 found = true;
1914 if (i >= numtypes || inputtypes[i].empty()) {
1915 logout << "collectoraction::check_sources: WARNING type not set\n";
1916 } else {
1917 type = inputtypes[i];
1918 }
1919 if (type == "file://") {
1920 if (!file_exists(value) && !directory_exists(value)) {
1921 failedsources[decode_commas(inputvalues[i])] = "1";
1922 badsources = true;
1923 }
1924 } else if (type == "http://") {
1925 if (gsdl_system ("perl -S ping.pl -quiet http://" + value, true, logout)) {
1926 failedsources[decode_commas(inputvalues[i])] = "1";
1927 badsources = true;
1928 }
1929 } else if (type == "ftp://") {
1930 if (gsdl_system ("perl -S ping.pl -quiet ftp://" + value, true, logout)) {
1931 failedsources[decode_commas(inputvalues[i])] = "1";
1932 badsources = true;
1933 }
1934 }
1935 }
1936 }
1937
1938 // set badsources if there weren't any sources at all
1939 if (!found) badsources = true;
1940
1941 if (badsources) return false;
1942 return true;
1943}
1944
1945// format_url simply strips "http://", "ftp://", or "file://" off the
1946// beginning of url if they're there
1947text_t collectoraction::format_url (const text_t &url) {
1948 text_t::const_iterator begin = url.begin();
1949 text_t::const_iterator end = url.end();
1950
1951 if (url.size() >= 7) {
1952 text_t prefix = substr(begin, begin+7);
1953 if (prefix == "http://" || prefix == "file://") {
1954 return substr(begin+7, end);
1955 }
1956 }
1957 if (url.size() >= 6) {
1958 if (substr(begin, begin+6) == "ftp://") {
1959 return substr(begin+6, end);
1960 }
1961 }
1962 return url;
1963}
1964
1965text_t collectoraction::remove_trailing_slashes (text_t str) {
1966
1967 while (*(str.end()-1) == '\\') {
1968 str.pop_back();
1969 }
1970 return str;
1971}
Note: See TracBrowser for help on using the repository browser.