Changeset 30988 for other-projects
- Timestamp: 2016-10-30T11:32:57+13:00 (7 years ago)
- Location: other-projects/hathitrust/solr-extracted-features/trunk/src/main/java/org/hathitrust
- Files: 2 edited
Legend:
- Unmodified
- Added
- Removed
other-projects/hathitrust/solr-extracted-features/trunk/src/main/java/org/hathitrust/PagedJSON.java
r30985 r30988
  119 119  solr_doc_json.put("id", page_id);
  120 120  solr_doc_json.put("volumeid_s", volume_id);
- 121      solr_doc_json.put(" _text_", text);
+     121  solr_doc_json.put("eftext_txt", text);
  122 122
  123 123  solr_add_json.put("commitWithin", 5000);
other-projects/hathitrust/solr-extracted-features/trunk/src/main/java/org/hathitrust/PrepareForIngest.java
r30986 r30988
  58  58
  59  59
- 60
+     60   /*
  61  61   System.out.println("");
  62  62   System.out.println("############");
  …   …
  64  64   System.out.println("############");
  65  65   System.out.println("");
- 66
+     66   */
  67  67
  68  68   //long num_ids = json_ids.count();
  …   …
  114 114  options.addOption(solr_url_opt);
  115 115
- 116      Option dry_run_opt = new Option("r", "dry-run", false,
- 117      "Used to initiate a 'dry-run'where the files are all read in, but nothing is ingested/saved");
- 118      dry_run_opt.setRequired(false);
- 119      options.addOption( dry_run_opt);
+     116  Option read_only_opt = new Option("r", "read-only", false,
+     117  "Used to initiate a run where the files are all read in, but nothing is ingested/saved");
+     118  read_only_opt.setRequired(false);
+     119  options.addOption(read_only_opt);
  120 120
- 121      // need to work with CLI v1.2 as this is the JAR that is bundled with Hadoop/Spark
+     121  // Need to work with CLI v1.2 as this is the JAR that is bundled with Hadoop/Spark
  122 122  CommandLineParser parser = new GnuParser();
  123 123  //CommandLineParser parser = new DefaultParser(); // if working with CLI v1.3 and above
Note: See TracChangeset for help on using the changeset viewer.