Changeset 32109
- Timestamp:
- 2018-01-18T23:28:54+13:00 (5 years ago)
- Location:
- other-projects/hathitrust/wcsa/extracted-features-solr/trunk/solr-ingest
- Files:
-
- 1 added
- 3 edited
Legend:
- Unmodified
- Added
- Removed
-
other-projects/hathitrust/wcsa/extracted-features-solr/trunk/solr-ingest/JSONLIST-YARN-INGEST.sh
r32107 r32109
     1      1     #!/bin/bash
     2      2
     3          - nohup ./scripts/JSONLIST-RUN-YARN-SPARK.sh TMP-faceted-htrc-fictsample-ef20 &
            3   + nohup ./scripts/JSONLIST-RUN-YARN-SPARK.sh \
            4   + pair-tree-annika-1k-fiction-vol-ids.txt TMP-faceted-htrc-fictsample-ef20 &
-
other-projects/hathitrust/wcsa/extracted-features-solr/trunk/solr-ingest/scripts/_RUN.sh
r32107 r32109
    27     27
    28     28     if [ "x$input_dir" != "x" ] ; then
    29          - if [ $show_usage = "json" ] ; then
           29   + if [ $class_mode = "json" ] ; then
    30     30     show_usage=0
    31     31     fi
     …      …
   130    130     #cmd="$cmd --properties /homea/dbbridge/extracted-features-solr/solr-ingest/ef-solr.properties $seq_file $*"
   131    131     else
   132          - cmd="$cmd --properties ef-solr.properties $json_filelist $input_dir$*"
   133          - #cmd="$cmd --properties /homea/dbbridge/extracted-features-solr/solr-ingest/ef-solr.properties $json_filelist $input_dir$*"
          132   + cmd="$cmd --properties ef-solr.properties $input_dir $json_filelist $*"
          133   + #cmd="$cmd --properties /homea/dbbridge/extracted-features-solr/solr-ingest/ef-solr.properties $input_dir $json_filelist $*"
   134    134
   135    135     fi
-
other-projects/hathitrust/wcsa/extracted-features-solr/trunk/solr-ingest/src/main/java/org/hathitrust/extractedfeatures/PerVolumeUtil.java
r32106 r32109
     2      2
     3      3     import java.io.IOException;
            4   + import java.io.Serializable;
     4      5     import java.util.ArrayList;
     5      6     import java.util.HashMap;
     6      7     import java.util.Iterator;
     7      8
     8      9     import org.apache.hadoop.io.Text;
     9     10     import org.apache.spark.api.java.function.FlatMapFunction;
     …      …
    14     15     import org.json.JSONObject;
    15     16
    16          - /*
    17          - class PagedJSON implements Function<String, Boolean> {
    18          -
           17   + public class PerVolumeUtil implements Serializable
           18   + {
    19     19     private static final long serialVersionUID = 1L;
    20          -
    21          - public Boolean call(String s) { return s.contains("a"); }
    22          - }
    23          - */
    24          -
    25          -
    26          - //public class PerVolumeJSON implements VoidFunction<String>
    27          - public class PerVolumeUtil
    28          - {
    29          - //private static final long serialVersionUID = 1L;
    30     20     protected String _input_dir;
    31     21     protected String _whitelist_filename;
Note: See TracChangeset for help on using the changeset viewer.