Changeset 33031 for other-projects/is-sheet-music-encore/trunk/java-gen-corpus/TabProcMetaListGen.java
- Timestamp: 2019-04-22T14:58:53+12:00 (5 years ago)
- Files: 1 edited
Legend:
- Unmodified
- Added
- Removed
-
other-projects/is-sheet-music-encore/trunk/java-gen-corpus/TabProcMetaListGen.java
--- TabProcMetaListGen.java (r33017)
+++ TabProcMetaListGen.java (r33031)
@@ -13,37 +13,45 @@
 
 
-            if (args.length != 1) {
-                System.out.println("Usage: TabProcMetaListGen <inputFilename> < outputFilename>");
+            if (args.length != 2) {
+                System.out.println("Usage: TabProcMetaListGen <inputFilename> <listFilename>");
             }
             else {
+                //Variables
                 String inputFilename = args[0];
-                //String outputFilename = args[1];
-
+                String listFilename = args[1];
+                FileReader fileReader = new FileReader(inputFilename);
+                BufferedReader buf = new BufferedReader(fileReader);
+                FileWriter listWriter = new FileWriter(listFilename, true);
+                String line = null;
+                String[] item;
+
+                String idLine = null;
+                String id = null;
+                String numpages = null;
+
                 System.out.println("Processing: " + inputFilename);
 
-                FileReader fileReader = new FileReader(inputFilename);
-                BufferedReader buf = new BufferedReader(fileReader);
-                //FileWriter fw = new FileWriter(outputFilename);
-                String line = null;
-                String[] item;
-
                 //Splits into each record
-                while ((line = buf.readLine()) != null) {
-
-                    //Splits by tab, leaves "" for every blank entry
-                    //Check items to be equal
-                    //System.out.println(line);
+                while ((line = buf.readLine()) != null) {
+                    if(line.contains("<id>")){
+                        //Isoclate and store the id from the line
+                        idLine = line.substring(line.indexOf(">")+1, line.indexOf("</"));
+                        id = idLine.substring(idLine.lastIndexOf("meta/")+5);
+
+                    }
                     if(line.contains("<htd:numpages>")){
-                        String result = line.substring(line.indexOf(">")+1, line.indexOf(">")+2);
-                        System.out.println(result);
-                    }
-                    if(line.contains("<id>")){
-                        String result = line.substring(line.indexOf(">")+1, line.indexOf("</"));
-                        System.out.println(result);
-                    }
-
-                }
+                        //Iscolate and store the page number
+                        numpages = line.substring(line.indexOf(">")+1, line.lastIndexOf("<"));
+
+                    }
+                }
+
+                //Check if there are more than 10 pages
+                if(Integer.parseInt(numpages) >= 10){
+                    //Add extracted metadata to output list
+                    listWriter.write(id + '\t' + numpages + '\n');
+                }
                 buf.close();
-                //fw.close();
+                listWriter.close();
             }
         }catch(Exception e){
Note: See TracChangeset for help on using the changeset viewer.