Changeset 10451


Ignore:
Timestamp:
2005-08-10T12:51:42+12:00 (19 years ago)
Author:
kjdon
Message:

Added pdf_allow_images_only option for conversion to HTML when there is no text that can be extracted (thanks to Doug Carter).

File:
1 edited

Legend:

Unmodified
Added
Removed
  • trunk/gsdl/bin/script/gsConvert.pl

    r10445 r10451  
     63  63 my $pdf_zoom;
     64  64 my $pdf_ignore_images;
         65 my $pdf_allow_images_only;
     65  66 my $windows_scripting;
     66  67
     
     81  82     print STDERR "\t-pdf_ignore_images\tdon't attempt to extract images when\n";
     82  83     print STDERR "\t\tconverting PDF to HTML\n";
         84     print STDERR "\t-pdf_allow_images_only\tallow images only (continue even if no text is present when converting to HTML)\n";
     83  85     print STDERR "\t-pdf_zoom\tfactor by which to zoom PDF (only useful if\n";
     84  86     print STDERR "\t\t-pdf_complex is set\n";
     
    105 107              'pdf_complex', \$pdf_complex,
    106 108              'pdf_ignore_images', \$pdf_ignore_images,
        109              'pdf_allow_images_only', \$pdf_allow_images_only,
    107 110              'pdf_nohidden', \$pdf_nohidden,
    108 111              'pdf_zoom/\d+/2', \$pdf_zoom
     
    760 763     $cmd .= " -c" if ($pdf_complex);
    761 764     $cmd .= " -i" if ($pdf_ignore_images);
        765     $cmd .= " -a" if ($pdf_allow_images_only);
    762 766     $cmd .= " -hidden" unless ($pdf_nohidden);
    763 767     $cmd .= " \"$input_filename\" \"$output_filestem\"";
Note: See TracChangeset for help on using the changeset viewer.