Ignore:
Timestamp:
2016-12-21T00:12:10+13:00 (7 years ago)
Author:
davidb
Message:

Language counting

File:
1 edited

Legend:

Unmodified
Added
Removed
  • other-projects/hathitrust/wcsa/extracted-features-solr/trunk/solr-ingest/src/main/java/org/hathitrust/extractedfeatures/ProcessForPOSCount.java

    r31259 r31260  
    45 45       protected String generateSparkAppName(String exec_mode)
    46 46       {
    47    -         String spark_app_name = "[" + exec_mode + "] Extracted Features: Process for POS";
       47 +         String spark_app_name = "[" + exec_mode + "] Extracted Features: Process for POS Count";
    48 48           spark_app_name += " [" + _json_list_filename + "]";
    49 49
     
    79 79           //boolean icu_tokenize = Boolean.getBoolean("wcsa-ef-ingest.icu-tokenize");
    80 80
    81    -         PerVolumePOSStreamFlatmap paged_solr_wordfreq_flatmap
       81 +         PerVolumePOSStreamFlatmap paged_solr_posfreq_flatmap
    82 82               = new PerVolumePOSStreamFlatmap(_input_dir,_verbosity,
    83 83                                        per_vol_progress_accum,per_vol,
    84 84                                        strict_file_io);
    85    -         JavaRDD<String> pos_list = json_list_data.flatMap(paged_solr_wordfreq_flatmap);
       85 +         JavaRDD<String> pos_list = json_list_data.flatMap(paged_solr_posfreq_flatmap);
    86 86           pos_list.setName("pos-stream");
    87 87
Note: See TracChangeset for help on using the changeset viewer.