Changeset 1646 for trunk/gsdl
- Timestamp:
- 2000-11-02T15:40:58+13:00 (24 years ago)
- File:
-
- 1 edited
Legend:
- Unmodified
- Added
- Removed
-
trunk/gsdl/perllib/classify/phind.pm
--- trunk/gsdl/perllib/classify/phind.pm (r1645)
+++ trunk/gsdl/perllib/classify/phind.pm (r1646)
@@ -32,7 +32,9 @@
 # title=Title The title field for this classification
 # text=fields The text used to build the phrase hierarchy
-# untidy=true Do not clean up intermediate files
 # phindexdir=directory Location of phind index files
 # verbosity=num Control amount of output
+# untidy=true Do not clean up intermediate files
+# suffixmode=num Mode of suffix program (0 = all phrases, 1 = stopword)
+# suffixsize=num Number of symbols available to suffix program
 
 
@@ -144,4 +146,7 @@
 my $indexes = "section:Title,section:text";
 
+my $suffixmode = 1;
+my $suffixsize = 40000000;
+
 my $verbosity = 2;
 my $untidy = 0;
@@ -156,4 +161,8 @@
 } elsif ($option =~ /^phindexdir=(.*)$/i) {
 $phindexdir = $1;
+} elsif ($option =~ /^suffixsize=(.*)$/i) {
+$suffixsize = $1;
+} elsif ($option =~ /^suffixmode=(.*)$/i) {
+$suffixmode = $1;
 } elsif ($option =~ /^verbosity=(.*)$/i) {
 $verbosity = $1;
@@ -167,4 +176,8 @@
 $self->{'title'} = $title;
 $self->{'indexes'} = $indexes;
+
+$self->{'suffixmode'} = $suffixmode;
+$self->{'suffixsize'} = $suffixsize;
+
 $self->{'verbosity'} = $verbosity;
 $self->{'untidy'} = $untidy;
@@ -320,6 +333,6 @@
 
 # Construct phind indexes
-my $mode = 1;
-my $symbol_limit = 40000000;
+my $suffixmode = $self->{'suffixmode'};
+my $suffixsize = $self->{'suffixsize'};
 my ($command, $status);
 
@@ -331,5 +344,5 @@
 # Use the suffix program to generate the phindex/phrases file
 print "\nExtracting phrases from processed text (with suffix)\n" if $verbosity;
-&execute("suffix $phindexdir $symbol_limit $mode", $verbosity);
+&execute("suffix $phindexdir $suffixsize $suffixmode", $verbosity);
 
 # Create the phrase file and put phrase numbers in phindex/phrases
Note:
See TracChangeset
for help on using the changeset viewer.