Changeset 7018


Ignore:
Timestamp:
2004-03-11T12:25:02+13:00 (20 years ago)
Author:
jrm21
Message:

Oops... fixed up removal of the Unicode byte-order marker (BOM) from the first line.

File:
1 edited

Legend:

Unmodified
Added
Removed
  • trunk/gsdl/bin/script/pdftohtml.pl

    r6362 r7018  
    147147    my $line;
    148148    my $seen_textual_content=$allow_no_text;
    149     while ($line=<INFILE>) {
     149    # check for unicode byte-order marker at the start of the file
     150    $line = <INFILE>;
     151    $line =~ s#\376\377##g;
     152    while ($line) {
    150153    $line =~ s#</b><b>##g;
    151154    $line =~ s#</i><i>##g;
    152155    $line =~ s#\\#\\\\#g; # until macro language parsing is fixed...
    153     $line =~ s#\376\377##g;
    154156# check for any extracted text
    155157    if ($seen_textual_content == 0) {
     
    186188
    187189    print OUTFILE $line;
     190    $line = <INFILE>;
    188191    }
    189192    close INFILE;
Note: See TracChangeset for help on using the changeset viewer.