Changeset 33031 for other-projects/is-sheet-music-encore/trunk
- Timestamp: 2019-04-22T14:58:53+12:00 (5 years ago)
- Location: other-projects/is-sheet-music-encore/trunk
- Files: 3 added, 5 edited
Legend:
- Unmodified
- Added
- Removed
other-projects/is-sheet-music-encore/trunk/-COMPX520-README.txt
r33017 r33031 1 1 INSTRUCTIONS 2 3 The RUN scripts, think that some IDs are directories. Correct this 4 2 5 TEST CORPUS GENERATION 3 6 (java-gen-corpus/..): … … 14 17 (COMPX520-DOWNLOADER-PNG.txt , COMPX520-RUN-PNG.sh , ddapiclient2-extended.pl 15 18 "source ./SETUP.bash" 16 "./COMPX520-DOWNLOADER-PNG.txt <java-gen-corpus/filename> <page_num>" 17 18 19 "./COMPX520-DOWNLOADER-PNG.sh <java-gen-corpus/filename> <page_num>" 19 20 20 21 … … 22 23 (COMPX520-DOWNLOADER-ZIP.txt , COMPX520-RUN-XIP.sh , ddapiclient2-extended-ZIP.pl): 23 24 24 "./COMPX520-DOWNLOADER-ZIP. txt<java-gen-corpus/filename>"25 "./COMPX520-DOWNLOADER-ZIP.sh <java-gen-corpus/filename>" 25 26 26 27 -
other-projects/is-sheet-music-encore/trunk/java-gen-corpus/TabProcMetaListGen.java
r33017 r33031 13 13 14 14 15 if (args.length != 1) {16 System.out.println("Usage: TabProcMetaListGen <inputFilename> < outputFilename>");15 if (args.length != 2) { 16 System.out.println("Usage: TabProcMetaListGen <inputFilename> <listFilename>"); 17 17 } 18 18 else { 19 //Variables 19 20 String inputFilename = args[0]; 20 //String outputFilename = args[1]; 21 21 String listFilename = args[1]; 22 FileReader fileReader = new FileReader(inputFilename); 23 BufferedReader buf = new BufferedReader(fileReader); 24 FileWriter listWriter = new FileWriter(listFilename, true); 25 String line = null; 26 String[] item; 27 28 String idLine = null; 29 String id = null; 30 String numpages = null; 31 22 32 System.out.println("Processing: " + inputFilename); 23 33 24 FileReader fileReader = new FileReader(inputFilename);25 BufferedReader buf = new BufferedReader(fileReader);26 //FileWriter fw = new FileWriter(outputFilename);27 String line = null;28 String[] item;29 30 34 //Splits into each record 31 while ((line = buf.readLine()) != null) { 32 33 //Splits by tab, leaves "" for every blank entry 34 //Check items to be equal 35 //System.out.println(line); 35 while ((line = buf.readLine()) != null) { 36 if(line.contains("<id>")){ 37 //Isoclate and store the id from the line 38 idLine = line.substring(line.indexOf(">")+1, line.indexOf("</")); 39 id = idLine.substring(idLine.lastIndexOf("meta/")+5); 40 41 } 36 42 if(line.contains("<htd:numpages>")){ 37 String result = line.substring(line.indexOf(">")+1, line.indexOf(">")+2); 38 System.out.println(result); 39 } 40 if(line.contains("<id>")){ 41 String result = line.substring(line.indexOf(">")+1, line.indexOf("</")); 42 System.out.println(result); 43 } 44 45 } 43 //Iscolate and store the page number 44 numpages = line.substring(line.indexOf(">")+1, line.lastIndexOf("<")); 45 46 } 47 } 48 49 //Check if there are more than 10 pages 50 if(Integer.parseInt(numpages) >= 10){ 51 //Add extracted metadata to output list 52 listWriter.write(id + 
'\t' + numpages + '\n'); 53 } 46 54 buf.close(); 47 //fw.close();55 listWriter.close(); 48 56 } 49 57 }catch(Exception e){ -
other-projects/is-sheet-music-encore/trunk/java-gen-corpus/TabProcTextGen.java
r33009 r33031 60 60 } 61 61 62 //REFERNECES 62 //REFERNECES 63 63 //https://www.javatpoint.com/java-filewriter-class 64 64 //https://docs.oracle.com/javase/8/docs/api/index.html?java/io/FileWriter.html -
other-projects/is-sheet-music-encore/trunk/java-gen-corpus/TabRndListGen.java
r33007 r33031 12 12 try{ 13 13 if (args.length != 3){ 14 System.out.println("Usage: RandomItemSelecta<inputFilename> <outputCount> <outputFilename>");14 System.out.println("Usage: TabRndListGen <inputFilename> <outputCount> <outputFilename>"); 15 15 } 16 16 else{ … … 27 27 ArrayList<String> subList; 28 28 String line = null; 29 String[] item; 29 30 30 31 //Add items to Array 31 32 while ((line = buf.readLine()) != null) { 32 list.add(line); 33 //Split line by tab 34 item = line.split("\t", -1); 35 //Add first element (ID) 36 list.add(item[0]); 33 37 } 34 38 //randomize list
Note: See TracChangeset for help on using the changeset viewer.