Changeset 22842
- Timestamp:
- 2010-09-02T14:20:43+12:00 (14 years ago)
- File:
-
- 1 edited
Legend:
- Unmodified
- Added
- Removed
-
main/trunk/greenstone2/perllib/plugins/HTMLPlugin.pm
r22689 r22842
   35    35
   36    36   package HTMLPlugin;
         37 +
         38 + use Encode;
   37    39
   38    40   use ReadTextFile;
    …     …
 1230  1232   # Convert entities to their UTF8 equivalents
 1231  1233   $$textref =~ s/&(lt|gt|amp|quot|nbsp);/&z$1;/go;
 1232       - $$textref =~ s/&([^;]+);/& ghtml::getcharequiv($1,1)/gseo;
       1234 + $$textref =~ s/&([^;]+);/&Encode::decode("utf8",ghtml::getcharequiv($1,1))/gseo;
 1233  1235   $$textref =~ s/&z(lt|gt|amp|quot|nbsp);/&$1;/go;
       1236 +
 1234  1237   }
 1235  1238
    …     …
 1586  1589   close (PROD) || die("Error Closing File: $tmp_filename $!");
 1587  1590
 1588       -
 1589       - ### my ($language, $encoding) = $self->textcat_get_language_encoding ($input_filename);
 1590       - ### #print STDERR "*** encoding = $encoding\n";
 1591       -
 1592  1591   # run html-tidy on the tmp file to make it a proper XML file
 1593  1592
    …     …
 1597  1596   my $tidy_cmd = "tidy";
 1598  1597   $tidy_cmd .= " -q" if ($self->{'verbosity'} <= 2);
 1599       - ## $tidy_cmd .= " -utf8 -wrap 0 -asxml \"$tmp_filename\"";
 1600  1598   $tidy_cmd .= " -raw -wrap 0 -asxml \"$tmp_filename\"";
 1601  1599   if ($self->{'verbosity'} <= 2) {
Note:
See TracChangeset
for help on using the changeset viewer.