Changeset 2614 for trunk/niupepa
- Timestamp: 2001-06-29T16:30:26+12:00 (23 years ago)
- Location: trunk/niupepa/perllib
- Files:
  - 1 added
  - 2 edited
Legend:
- Unmodified
- Added
- Removed
trunk/niupepa/perllib/plugins/AbstractPlug.pm
r1554 r2614 23 23 # 24 24 ########################################################################### 25 26 27 #*************** 28 29 # don't bother using this anymore - simply split up abstracts manually with 30 # the help of the format_abstract.pl script 31 32 #*************** 33 25 34 26 35 # AbstractPlug processes the abstracts created for the Niupepa collection -
trunk/niupepa/perllib/plugins/NPPlug.pm
r1569 r2614 199 199 my $topsection = $doc_obj->get_top_section(); 200 200 $self->associate_cover_images ($doc_obj, $dir, $issuekey); 201 $doc_obj->set_ metadata_element ($topsection, 'Title', $self->get_title_string($file));202 $doc_obj->set_ metadata_element ($topsection, 'abstract', $abstract) if defined $abstract;201 $doc_obj->set_utf8_metadata_element ($topsection, 'Title', $self->get_title_string($file)); 202 $doc_obj->set_utf8_metadata_element ($topsection, 'abstract', $abstract) if defined $abstract; 203 203 $self->set_main_metadata ($doc_obj, $dir); 204 204 … … 209 209 chomp $line; 210 210 if ($line =~ /^<([^>]*)>(.*?)\s*$/) { 211 $doc_obj->set_ metadata_element ($topsection, $1, $2);211 $doc_obj->set_utf8_metadata_element ($topsection, $1, $2); 212 212 $meta->{$1} = $2; 213 213 } else { … … 215 215 $line =~ s/^\s+//; 216 216 $line =~ s/\s+$//; 217 my ($pagenum) = $line =~ /(\d+)$/; 218 $doc_obj->create_named_section($pagenum); 219 $doc_obj->set_metadata_element($pagenum, 'Title', $pagenum); 220 $self->process_text ($dir, $line, $doc_obj, $pagenum); 221 $self->process_images ($dir, $line, $doc_obj, $pagenum); 217 my ($pagenum) = $line =~ /([^_]*)$/; 218 # $doc_obj->create_named_section($pagenum); <-- can't do this anymore as pagenum may 219 # be something like "cover" 220 my $cursection = $doc_obj->insert_section($doc_obj->get_end_child($topsection)); 221 222 # $doc_obj->set_utf8_metadata_element($pagenum, 'Title', $pagenum); 223 $doc_obj->set_utf8_metadata_element($cursection, 'Title', $pagenum); 224 # $self->process_text ($dir, $line, $doc_obj, $pagenum); 225 $self->process_text ($dir, $line, $doc_obj, $cursection); 226 # $self->process_images ($dir, $line, $doc_obj, $pagenum); 227 $self->process_images ($dir, $line, $doc_obj, $cursection); 222 228 } 223 229 } … … 236 242 if (-e "$filename.gif") { 237 243 $self->{'num_image_pages'} ++; 238 $doc_obj->set_ metadata_element ($cursection, "hasimg", "1");239 $doc_obj->set_ metadata_element ($cursection, 
"Source", $page);244 $doc_obj->set_utf8_metadata_element ($cursection, "hasimg", "1"); 245 $doc_obj->set_utf8_metadata_element ($cursection, "Source", $page); 240 246 $doc_obj->associate_file("$filename.gif", "$page.gif", "image/gif"); 241 247 } elsif ($self->{'create_log'}) { 242 $doc_obj->set_ metadata_element ($cursection, "hasimg", "0");248 $doc_obj->set_utf8_metadata_element ($cursection, "hasimg", "0"); 243 249 print LOGFILE "no fullsize image file for $page\n"; 244 250 } 245 251 246 252 if (-e "${filename}_p.gif") { 247 $doc_obj->set_ metadata_element ($cursection, "hasprevimg", "1");248 $doc_obj->set_ metadata_element ($cursection, "Source", $page);253 $doc_obj->set_utf8_metadata_element ($cursection, "hasprevimg", "1"); 254 $doc_obj->set_utf8_metadata_element ($cursection, "Source", $page); 249 255 $doc_obj->associate_file("${filename}_p.gif", "${page}_p.gif", "image/gif"); 250 256 } elsif ($self->{'create_log'}) { 251 $doc_obj->set_ metadata_element ($cursection, "hasprevimg", "0");257 $doc_obj->set_utf8_metadata_element ($cursection, "hasprevimg", "0"); 252 258 print LOGFILE "no preview image file for $page\n"; 253 259 } … … 268 274 if (defined $text) { 269 275 $self->{'num_text_pages'} ++; 270 $doc_obj->add_ text ($cursection, $text);276 $doc_obj->add_utf8_text ($cursection, $text); 271 277 } elsif ($self->{'create_log'}) { 272 278 print LOGFILE "no txt or htm file for $page\n"; … … 284 290 my $cursection = $doc_obj->get_top_section(); 285 291 $self->associate_cover_images ($doc_obj, $dir, $issuekey); 286 $doc_obj->set_ metadata_element ($cursection, 'Title', $self->get_title_string($file));292 $doc_obj->set_utf8_metadata_element ($cursection, 'Title', $self->get_title_string($file)); 287 293 $self->set_main_metadata ($doc_obj, $dir); 288 map { $doc_obj->set_ metadata_element ($cursection, $_, $meta->{$_}); } keys %$meta;289 $doc_obj->set_ metadata_element ($cursection, "doctype", "Description");290 $doc_obj->add_ text ($cursection, $text);294 map { 
$doc_obj->set_utf8_metadata_element ($cursection, $_, $meta->{$_}); } keys %$meta; 295 $doc_obj->set_utf8_metadata_element ($cursection, "doctype", "Description"); 296 $doc_obj->add_utf8_text ($cursection, $text); 291 297 $file =~ s/\.abstract//i; 292 298 $doc_obj->set_OID ($file . "abstract"); … … 313 319 my $cursection = $doc_obj->get_top_section(); 314 320 $self->associate_cover_images ($doc_obj, $dir, $issuekey); 315 $doc_obj->set_ metadata_element ($cursection, 'Title', "_commentary_");321 $doc_obj->set_utf8_metadata_element ($cursection, 'Title', "_commentary_"); 316 322 $self->set_main_metadata ($doc_obj, $dir); 317 $doc_obj->set_ metadata_element ($cursection, "doctype", "Commentary");318 $doc_obj->add_ text ($cursection, $text);323 $doc_obj->set_utf8_metadata_element ($cursection, "doctype", "Commentary"); 324 $doc_obj->add_utf8_text ($cursection, $text); 319 325 $doc_obj->set_OID ($issuekey . "commentary"); 320 326 $processor->process ($doc_obj); … … 352 358 # note we're using set_metadata_element (not add_metadata_element) 353 359 # this will override any previously set metadata of the same name 354 $doc_obj->set_ metadata_element ($cursection, $1, $2);360 $doc_obj->set_utf8_metadata_element ($cursection, $1, $2); 355 361 } elsif ($self->{'verbosity'}) { 356 362 print STDERR "NPPlug: Badly formatted line in $metafile\n";
Note: See TracChangeset for help on using the changeset viewer.