Changeset 30929
- Timestamp:
- 2016-10-26T09:47:36+13:00 (6 years ago)
- Location:
- other-projects/hathitrust/solr-extracted-features/trunk
- Files:
- 2 edited
Legend:
- Unmodified
- Added
- Removed
other-projects/hathitrust/solr-extracted-features/trunk/RUN-PD-CLUSTER.bash
r30928 r30929
   2    2
   3    3    json_filelist=${1:-pd-file-listing-step10000.txt}
        4  + shift
   4    5
   5    6    input_dir="hdfs://master:9000/user/htrc/pd-ef-json-files"
   …    …
  11   12    master_opt="--master spark://10.10.0.52:7077"
  12   13
  13       - . /_RUN.bash
       14  + . ./_RUN.bash
other-projects/hathitrust/solr-extracted-features/trunk/_RUN.bash
r30927 r30929
  24   24    fi
  25   25
       26  + echo
       27  + echo "****"
       28  + echo "* Checking for Spark and Hadoop daemons"
       29  + echo "****"
       30  + jps | sed 's/^/* /g'
       31  + echo "****"
       32  + echo "* Done"
       33  + echo "****"
       34  + echo
       35  +
  26   36    self_contained_jar=target/htrc-ef-ingest-0.9-jar-with-dependencies.jar
  27   37    base_cmd="spark-submit --class org.hathitrust.PrepareForIngest $master_opt $self_contained_jar"
  28   38
  29       - $base_cmd --json-filelist="$json_filelist" "$input_dir" "$output_dir" $*
       39  + cmd="$base_cmd --json-filelist=\"$json_filelist\" $input_dir $output_dir $*"
       40  +
       41  + echo "****"
       42  + echo "* Lauching:"
       43  + echo "* $cmd"
       44  + echo "****"
       45  + echo "* Monitor progress through:"
       46  + echo "* http://10.10.0.52:8080/"
       47  + echo "****"
       48  + echo
       49  +
       50  + $cmd
  30   51
  31   52    # spark-submit --class org.hathitrust.PrepareForIngest --master local[4] target/htrc-ef-ingest-0.9-jar-with-dependencies.jar --json-filelist=pd-file-listing-step10000.txt pd-ef-json-files pd-solr-json-files $*
Note: See TracChangeset for help on using the changeset viewer.
for help on using the changeset viewer.