[23138] | 1 | #!/usr/bin/perl -w
|
---|
[23091] | 2 |
|
---|
| 3 | use strict;
|
---|
| 4 |
|
---|
| 5 | use LWP::UserAgent;
|
---|
| 6 | use HTTP::Request::Common;
|
---|
| 7 |
|
---|
| 8 | use CGI::Carp qw(fatalsToBrowser);
|
---|
| 9 | use CGI;
|
---|
| 10 |
|
---|
[23147] | 11 | use File::Basename;
|
---|
| 12 |
|
---|
[23146] | 13 | BEGIN {
|
---|
| 14 | eval('require "./gsdlCGI.pm"');
|
---|
| 15 | if ($@)
|
---|
| 16 | {
|
---|
| 17 | print STDOUT "Content-type:text/plain\n\n";
|
---|
| 18 | print STDOUT "ERROR: $@\n";
|
---|
| 19 | exit 0;
|
---|
| 20 | }
|
---|
| 21 |
|
---|
| 22 | # Line to stop annoying child DOS CMD windows from appearing
|
---|
| 23 | Win32::SetChildShowWindow(0)
|
---|
| 24 | if defined &Win32::SetChildShowWindow;
|
---|
[23091] | 25 | }
|
---|
| 26 |
|
---|
| 27 |
|
---|
[23146] | 28 |
|
---|
| 29 |
|
---|
[23138] | 30 | sub get_infodb_type
|
---|
| 31 | {
|
---|
[23144] | 32 | my ($opt_site,$collect_home,$collect) = @_;
|
---|
[23138] | 33 |
|
---|
[23144] | 34 | my $out = "STDERR";
|
---|
| 35 |
|
---|
| 36 | $collect = &colcfg::use_collection($opt_site, $collect, $collect_home);
|
---|
| 37 |
|
---|
| 38 | if ($collect eq "") {
|
---|
| 39 | print STDERR "Error: failed to find collection $collect in $collect_home\n";
|
---|
| 40 | print STDOUT "Content-type:text/plain\n\n";
|
---|
| 41 | print STDOUT "ERROR: Failed to find collection $collect\n";
|
---|
| 42 | exit 0;
|
---|
| 43 |
|
---|
| 44 | }
|
---|
| 45 |
|
---|
| 46 | # Read in the collection configuration file.
|
---|
| 47 | my ($config_filename, $gs_mode) = &colcfg::get_collect_cfg_name($out);
|
---|
| 48 | my $collectcfg = &colcfg::read_collection_cfg ($config_filename, $gs_mode);
|
---|
| 49 |
|
---|
| 50 | return $collectcfg->{'infodbtype'};
|
---|
[23138] | 51 | }
|
---|
| 52 |
|
---|
| 53 |
|
---|
| 54 | sub oid_to_docxml_filename
|
---|
| 55 | {
|
---|
[23144] | 56 | my ($opt_site,$collect_home,$collect,$docid) = @_;
|
---|
[23138] | 57 |
|
---|
[23144] | 58 | my $infodb_type = get_infodb_type($opt_site,$collect_home,$collect);
|
---|
[23138] | 59 |
|
---|
[23147] | 60 | # Derive the archives dir
|
---|
| 61 | my $archive_dir = &util::filename_cat($collect_home,$collect,"archives");
|
---|
[23138] | 62 |
|
---|
| 63 | # Obtain the doc.xml path for the specified docID
|
---|
| 64 | my $arcinfo_doc_filename
|
---|
| 65 | = &dbutil::get_infodb_file_path($infodb_type, "archiveinf-doc",
|
---|
[23147] | 66 | $archive_dir);
|
---|
[23138] | 67 | my $doc_rec_string
|
---|
| 68 | = &dbutil::read_infodb_entry($infodb_type, $arcinfo_doc_filename,
|
---|
| 69 | $docid);
|
---|
| 70 | my $doc_rec = &dbutil::convert_infodb_string_to_hash($doc_rec_string);
|
---|
| 71 | my $doc_xml_file = $doc_rec->{'doc-file'}->[0];
|
---|
[23147] | 72 | my $assoc_path = dirname($doc_xml_file);
|
---|
| 73 |
|
---|
[23138] | 74 | # The $doc_xml_file is relative to the archives, so now let's get the
|
---|
| 75 | # full path
|
---|
[23147] | 76 | my $doc_xml_filename = &util::filename_cat($archive_dir,$doc_xml_file);
|
---|
[23138] | 77 |
|
---|
[23147] | 78 | return ($doc_xml_filename,$assoc_path);
|
---|
[23138] | 79 | }
|
---|
| 80 |
|
---|
[23147] | 81 | sub zip_up_archives_doc
|
---|
| 82 | {
|
---|
| 83 | my ($gsdl_cgi,$collect_home,$collect,$doc_xml_filename,$assoc_path) = @_;
|
---|
| 84 |
|
---|
| 85 | my $timestamp = time();
|
---|
| 86 | my $lang_env = $gsdl_cgi->clean_param("lr") || "";
|
---|
| 87 |
|
---|
| 88 | my $archive_dir = &util::filename_cat($collect_home,$collect,"archives");
|
---|
| 89 |
|
---|
| 90 | # Zip up the doc_xml file and all the files associated with it
|
---|
| 91 | my $java = $gsdl_cgi->get_java_path();
|
---|
| 92 | my $jar_dir= &util::filename_cat($ENV{'GSDLHOME'}, "bin", "java");
|
---|
| 93 | my $java_classpath = &util::filename_cat($jar_dir,"GLIServer.jar");
|
---|
| 94 |
|
---|
| 95 | my $zip_file = "$collect-$timestamp.zip";
|
---|
| 96 | my $zip_file_path = &util::filename_cat($archive_dir,$zip_file);
|
---|
| 97 |
|
---|
| 98 | my $java_args = "\"$zip_file_path\" \"$archive_dir\" \"$assoc_path\"";
|
---|
| 99 |
|
---|
| 100 | $ENV{'LANG'} = $lang_env;
|
---|
[23161] | 101 | my $java_command = "\"$java\" -classpath \"$java_classpath\" org.greenstone.gatherer.remote.ZipFiles $java_args";
|
---|
[23147] | 102 |
|
---|
| 103 | my $java_output = `$java_command`;
|
---|
| 104 | my $java_status = $?;
|
---|
| 105 | if ($java_status > 0) {
|
---|
| 106 | $gsdl_cgi->generate_error("Java failed: $java_command\n--\n$java_output\nExit status: " . ($java_status / 256) . "\n" . $gsdl_cgi->check_java_home());
|
---|
| 107 | }
|
---|
| 108 |
|
---|
| 109 | # Check that the zip file was created successfully
|
---|
| 110 | if (!-e $zip_file_path || -z $zip_file_path) {
|
---|
| 111 | $gsdl_cgi->generate_error("Collection zip file $zip_file_path could not be created.");
|
---|
| 112 | }
|
---|
| 113 |
|
---|
| 114 | return $zip_file_path;
|
---|
| 115 |
|
---|
| 116 | }
|
---|
| 117 |
|
---|
[23091] | 118 | sub main
|
---|
| 119 | {
|
---|
| 120 | # Setup greenstone Perl include paths so additional packages can be found
|
---|
| 121 | my $gsdl_cgi = gsdlCGI->new();
|
---|
| 122 | $gsdl_cgi->setup_gsdl();
|
---|
| 123 |
|
---|
[23138] | 124 | my $gsdl_home = $gsdl_cgi->get_gsdl_home();
|
---|
| 125 | my $collect_home = &util::filename_cat($gsdl_home,"collect");
|
---|
| 126 |
|
---|
| 127 | require dbutil;
|
---|
[23091] | 128 | require talkback;
|
---|
[23145] | 129 | require colcfg;
|
---|
[23091] | 130 |
|
---|
[23142] | 131 | my $oid = $gsdl_cgi->param('oid');
|
---|
[23177] | 132 | my $collect = $gsdl_cgi->param('fromCollect');
|
---|
| 133 | my $toCollect = $gsdl_cgi->param('toCollect');
|
---|
[23144] | 134 | my $site = $gsdl_cgi->param('site');
|
---|
[23091] | 135 |
|
---|
[23138] | 136 | # sanity check
|
---|
| 137 | if (!defined $oid || !defined $collect) {
|
---|
| 138 | print STDOUT "Content-type:text/plain\n\n";
|
---|
[23142] | 139 | print STDOUT "ERROR: Malformed CGI argments. Need to specify 'oid' and 'collect'\n";
|
---|
[23138] | 140 | exit 0;
|
---|
[23091] | 141 | }
|
---|
| 142 |
|
---|
[23138] | 143 | my $uniq_prefix = "$collect-$oid";
|
---|
[23091] | 144 |
|
---|
[23147] | 145 | my ($docxml_filename,$assoc_path)
|
---|
| 146 | = oid_to_docxml_filename($site,$collect_home,$collect,$oid);
|
---|
[23138] | 147 |
|
---|
[23147] | 148 | my $zip_filename
|
---|
| 149 | = zip_up_archives_doc($gsdl_cgi,$collect_home,$collect,
|
---|
| 150 | $docxml_filename,$assoc_path);
|
---|
| 151 |
|
---|
[23138] | 152 | my $talktoUploadURL = $gsdl_cgi->param('talktoUpload');
|
---|
| 153 |
|
---|
[23091] | 154 | my $browser = LWP::UserAgent->new(agent => 'Perl File Upload');
|
---|
| 155 |
|
---|
| 156 | my $response = $browser->post(
|
---|
| 157 | $talktoUploadURL,
|
---|
| 158 | [ 'yes_upload' => '1',
|
---|
| 159 | 'process' => '1',
|
---|
[23142] | 160 | 'oid' => $oid,
|
---|
[23177] | 161 | 'toCollect' => $toCollect,
|
---|
[23162] | 162 | 'uploadedfile' => [$zip_filename, "$uniq_prefix-doc.zip"]
|
---|
[23091] | 163 | ],
|
---|
| 164 | 'Content_Type' => 'form-data'
|
---|
| 165 | );
|
---|
| 166 |
|
---|
| 167 | if ($response->is_success) {
|
---|
| 168 | print "Content-type:text/html\n\n";
|
---|
| 169 | print $response->content;
|
---|
| 170 | }
|
---|
| 171 | else {
|
---|
| 172 | print $response->error_as_HTML;
|
---|
| 173 | }
|
---|
| 174 |
|
---|
| 175 | }
|
---|
| 176 |
|
---|
| 177 | main();
|
---|
| 178 |
|
---|