Ignore:
Timestamp:
2016-10-26T11:05:28+13:00 (7 years ago)
Author:
davidb
Message:

Providing json-filelist is now a compulsory argument, rather than an option

File:
1 edited

Legend:

Unmodified
Added
Removed
  • other-projects/hathitrust/solr-extracted-features/trunk/_RUN.bash

    r30929 r30934  
    2424fi
    2525
    26 echo
    27 echo "****"
    28 echo "* Checking for Spark and Hadoop daemons"
    29 echo "****"
    30 jps | sed 's/^/* /g'
    31 echo "****"
    32 echo "* Done"
    33 echo "****"
    34 echo
     26run_jps=0
     27run_jps_daemons=""
     28run_jps_daemons_suffix="daemon"
     29
     30if [ "x${input_dir##hdfs://*}" = "x" ] || [ "x${output_dir##hdfs://*}" = "x" ] ; then
     31    # Evidence of running command over HDFS
     32    run_jps=1
     33    run_jps_daemons="Spark"
     34fi
     35
     36if [ "x${master_op##--master spark://*}" = "x" ] ; then
     37    # Evidence of running command submitted to Spark cluster
     38    run_jps=1
     39    if [ "x$run_jps_daemons" != "x" ] ; then
     40        run_jps_daemons="$run_jps_daemons and Hadoop"
     41    run_jps_daemons_suffix="daemons"
     42    else
     43        run_jps_daemons="Hadoop"
     44    fi
     45fi
     46
     47if [ "$run_jps" = "1" ] ; then
     48  echo
     49  echo "****"
     50  echo "* Checking for $run_jps_daemons $run_jps_daemons_suffix"
     51  echo "****"
     52  jps | sed 's/^/* /g'
     53  echo "****"
     54  echo "* Done"
     55  echo "****"
     56  echo
     57
     58fi
    3559
    3660self_contained_jar=target/htrc-ef-ingest-0.9-jar-with-dependencies.jar
    3761base_cmd="spark-submit --class org.hathitrust.PrepareForIngest $master_opt $self_contained_jar"
    3862
    39 cmd="$base_cmd --json-filelist=\"$json_filelist\" $input_dir $output_dir $*"
     63cmd="$base_cmd --verbosity 1 $json_filelist $input_dir $output_dir $*"
    4064
    4165echo "****"
Note: See TracChangeset for help on using the changeset viewer.