Changeset 25155 for gs2-extensions/ngramj/perllib/plugins/ReadTextFile.pm
- Timestamp:
- 2012-02-28T16:40:01+13:00 (12 years ago)
- File:
-
- 1 edited
Legend:
- Unmodified
- Added
- Removed
-
gs2-extensions/ngramj/perllib/plugins/ReadTextFile.pm
r25141  r25155
120     120     my ($pluginfo, $base_dir, $file, $block_hash, $metadata, $processor, $maxdocs, $total_count, $gli) = @_;
121     121
122             print STDERR "**** In Pei Jones Local version of ReadTextFile\n";
        122     my $verbosity = $self->{'verbosity'};
        123     if ($verbosity>=2) {
        124         my $outhandle = $self->{'outhandle'};
        125         print $outhandle "++ Using Ngram-Java version of ReadTextFile.pm ++\n";
        126     }
123     127
124     128     my $outhandle = $self->{'outhandle'};
…       …
329     333     my ($filename) = @_;
330     334
331             $self->{'textcat'} = new ngramj( ) if (!defined($self->{'textcat'}));
        335     $self->{'textcat'} = new ngramj($self->{'verbosity'},$self->{'outhandle'}) if (!defined($self->{'textcat'}));
        336
333     337     my ($language, $encoding, $extracted_encoding);
…       …
629     633
630     634     else { # need to use textcat to get either the language, or get both language and encoding
631             $self->{'ngramj'} = new ngramj( ) if (!defined($self->{'ngramj'}));
        635     $self->{'ngramj'} = new ngramj($self->{'verbosity'},$self->{'outhandle'}) if (!defined($self->{'ngramj'}));
        636
633     637     if($found_html_encoding) { # know encoding, find language by limiting search to known encoding
Note: See TracChangeset for help on using the changeset viewer.