Changeset 1949 for trunk/gsdl


Ignore:
Timestamp:
2001-02-12T18:31:48+13:00 (23 years ago)
Author:
paynter
Message:

Fixed a bug that prevented the tokeniser from distinguishing between languages.

File:
1 edited

Legend:

Unmodified
Added
Removed
  • trunk/gsdl/perllib/classify/phind.pm

    r1897 r1949  
    281 281        $section = $doc_obj->get_next_section($section);
    282 282        }
    283         $text .= convert_gml_to_tokens($data) . "\n";
     283        $text .= convert_gml_to_tokens($phrlanguage, $data) . "\n";
    284 284    }
    285 285   
     
    289 289        $dataref = $doc_obj->get_metadata($doc_obj->get_top_section(), $field);
    290 290        foreach $data ($$dataref) {
    291         $text .= convert_gml_to_tokens($data) . "\n";
     291        $text .= convert_gml_to_tokens($phrlanguage, $data) . "\n";
    292 292        }
    293 293    }
     
    302 302        $section = $doc_obj->get_next_section($section);
    303 303        }
    304         $text .= convert_gml_to_tokens($data) . "\n";
     304        $text .= convert_gml_to_tokens($phrlanguage, $data) . "\n";
    305 305    }
    306 306   
     
    430 430 sub convert_gml_to_tokens {
    431 431   
    432     my ($text) = @_;
    433     my $language_exp = $self->{'language_exp'};
     432    my ($language_exp, $text) = @_;
    434 433
    435 434    if ($language_exp =~ /en/) {
    436     return convert_gml_to_tokens_EN($text);
     435    return &convert_gml_to_tokens_EN($text);
    437 436    }
    438 437
Note: See TracChangeset for help on using the changeset viewer.