- Timestamp:
- 2018-06-11T17:54:08+12:00 (6 years ago)
- File:
-
- 1 edited
Legend:
- Unmodified
- Added
- Removed
-
gs2-extensions/pdf-box/trunk/java/perllib/plugins/PDFBoxConverter.pm
r32193 r32197
131 131     $self->{'pdfbox_launch_cmd'} = $launch_cmd;
132 132     #$self->{'pdfbox_img_launch_cmd'} = "java -cp \"$pbajar\" org.apache.pdfbox.tools.PDFToImage"; # pdfbox 2.09 cmd for converting each PDF page to an image (gif, jpg, png)
133     -   # Now: use this cmd to launch our new custom PDFBox class ( GS_PDFToImagesAndText.java) to convert each PDF page into an image (gif, jpg, png)
    133 +   # Now: use this cmd to launch our new custom PDFBox class (PDFBoxToImagesAndText.java) to convert each PDF page into an image (gif, jpg, png)
134 134     # AND its extracted text. An item file is still generated, but this time referring to txtfiles too, not just the images. Result: searchable paged output.
135     -   $self->{'pdfbox_img_launch_cmd'} = "java -cp \"$pbajar\" org.apache.pdfbox.tools.GS_PDFToImagesAndText";
    135 +   # Our new custom class PDFBoxToImagesAndText.java lives in the new build folder, so add that to the classpath for the launch cmd
    136 +   my $pdfbox_build = &FileUtils::filenameConcatenate($gextpb_home,"build");
    137 +   my $classpath = &util::pathname_cat($pbajar,$pdfbox_build);
    138 +   $self->{'pdfbox_img_launch_cmd'} = "java -cp \"$classpath\" org.greenstone.pdfbox.PDFBoxToImagesAndText";
136 139     }
137 140     else {
Note: See TracChangeset for help on using the changeset viewer.