Changeset 28923

Show
Ignore:
Timestamp:
19.03.2014 10:57:48 (5 years ago)
Author:
ak19
Message:

Tidy up and changes resulting from UTF8 encoding issues

Files:
1 modified

Legend:

Unmodified
Added
Removed
  • main/trunk/model-sites-dev/von-sparql/collect/nz-natlib-cat/pre-import/RUN_NZ.sh

    --- RUN_NZ.sh (r28795)
    +++ RUN_NZ.sh (r28923)
    @@ -2,8 +2,9 @@
     
     full_filename=NZDataFull.xml
    +full_filename_utf8=NZDataFull-UTF8.xml
     
     if [ ! -f $full_filename ] ; then
       echo "Did not detect uncompressed MARC-XML file '$full_filename'"
    -  echo " => Including ISO-8859-1 character encoding XML processing instruction at start"
    +  echo " => Including UTF-8 character encoding XML processing instruction at start"
       echo "<?xml version=\"1.0\" encoding=\"utf-8\"?>" > $full_filename
       echo "<collection xmlns=\"http://www.loc.gov/MARC21/slim\">" >> $full_filename
    @@ -13,4 +14,11 @@
       echo "</collection>" >> $full_filename
       echo " => ... Done"
    +fi
    +
    +if [ ! -f $full_filename_utf8 ] ; then
    +
    +  echo "Fixing 'alien' character encodings issues within a UTF-8 file"
    +
    +  java -cp UTF8_Fix/bin UTF8Fix "$full_filename" "$full_filename_utf8"
     
     fi