Changeset 28923 for main/trunk


Ignore:
Timestamp:
2014-03-19T10:57:48+13:00 (10 years ago)
Author:
ak19
Message:

Tidy up and changes resulting from UTF8 encoding issues

File:
1 edited

Legend:

Unmodified
Added
Removed
  • main/trunk/model-sites-dev/von-sparql/collect/nz-natlib-cat/pre-import/RUN_NZ.sh

    r28795  r28923
         2       2
         3       3    full_filename=NZDataFull.xml
                 4  + full_filename_utf8=NZDataFull-UTF8.xml
         4       5
         5       6    if [ ! -f $full_filename ] ; then
         6       7      echo "Did not detect uncompressed MARC-XML file '$full_filename'"
         7          -   echo " => Including ISO-8859-1 character encoding XML processing instruction at start" 
                 8  +   echo " => Including UTF-8 character encoding XML processing instruction at start" 
         8       9      echo "<?xml version=\"1.0\" encoding=\"utf-8\"?>" > $full_filename
         9      10      echo "<collection xmlns=\"http://www.loc.gov/MARC21/slim\">" >> $full_filename
         …       …
        13      14      echo "</collection>" >> $full_filename
        14      15      echo " => ... Done" 
                16  + fi
                17  +
                18  + if [ ! -f $full_filename_utf8 ] ; then
                19  +
                20  +   echo "Fixing 'alien' character encodings issues within a UTF-8 file"
                21  +
                22  +   java -cp UTF8_Fix/bin UTF8Fix "$full_filename" "$full_filename_utf8"
        15      23
        16      24    fi
Note: See TracChangeset for help on using the changeset viewer.