Ignore:
Timestamp:
2019-06-26T15:52:27+12:00 (5 years ago)
Author:
davidb
Message:

More careful working with unicode/utf8

File:
1 edited

Legend:

Unmodified
Added
Removed
  • main/trunk/model-sites-dev/heritage-nz/collect/pdf-reports/prepare/xlsutil.py

    r33204 r33222  
    6 6## worksheet_name = "Archaeological reports"
    7 7
    8 sanitized_headers = [ "Report Identifier", "Author", "Title", "Produced By", "Date", "HNZPT Region", "File No",
    9                       "Authority No", "Site No", "Relevant TLA's", "Record Type", "Date Entered" ]
     8sanitized_headers = [ u"Report Identifier", u"Author", u"Title", u"Produced By", u"Date", u"HNZPT Region", u"File No",
     9                      u"Authority No", u"Site No", u"Relevant TLA's", u"Record Type", u"Date Entered" ]
     10
     11def make_unicode(value):
     12    value_unicode = value
     13
     14    if type(value) != unicode:
     15        value_str = value
     16        if type(value_str) != str:
     17            value_str = str(value)
     18       
     19        value_unicode =  value_str.decode('utf-8')
     20
     21    return value_unicode
     22
     23
     24def cell_value_tidy_unicode(worksheet,row_i,col_j):
     25    value= worksheet.cell_value(row_i,col_j)
     26
     27    value_unicode = make_unicode(value)
     28    value_unicode_stripped = value_unicode.strip()
     29
     30    return value_unicode_stripped
     31
    10 32
    11 33def format_if_int(cell_value):
     
    36 58    found_header = False
    37 59    for col_j in range(num_header_cols):
    38         header_cell_value = worksheet.cell_value(header_row_pos,col_j)
    39         if header_cell_value == "Report Identifier":
     60        header_cell_value = cell_value_tidy_unicode(worksheet,header_row_pos,col_j)
     61        if header_cell_value == u"Report Identifier":
    40 62            found_header = True
    41 63
Note: See TracChangeset for help on using the changeset viewer.