Ignore:
Timestamp:
2001-01-29T14:54:58+13:00 (23 years ago)
Author:
sjboddie
Message:

Tidied up language support stuff.

File:
1 edited

Legend:

Unmodified
Added
Removed
  • trunk/gsdl/etc/main.cfg

    r1868 r1870  
    7878# Define the interface languages and encodings supported by this receptionist
    7979
    80 # An "Encoding" line defines an encoding to be used by the receptionist
    81 # options are:
    82 # shortname -- Identifier for the given encoding. The shortname option is
    83 #              mandatory and must be unique for each "Encoding" line.
     80# An "Encoding" line defines an encoding to be used by the receptionist.
     81# Uncomment "Encoding" lines to include an encoding on your "preferences" page.
     82# Encoding line options are:
     83# shortname -- The standard charset label for the given encoding. The
     84#              shortname option is mandatory.
    8485# longname  -- The display name of the given encoding. If longname isn't set
    8586#              it will default to using shortname instead.
    86 # type      -- The type of encoding. Note that for most encodings this
    87 #              value is the directory name under which the map file for
    88 #              this encoding resides in the Greenstone unicode/MAPPINGS
    89 #              directory (e.g. 'WINDOWS', 'ISO_8859' etc.). It may also
    90 #              take the values 'CJK' and 'UTF8'.
    91 # mapfile   -- The name of the map file for use when converting between
    92 #              utf8 and the given encoding. The mapfile option is mandatory
    93 #              for all encoding types with the exception of UTF8. If type
    94 #              is CJK, mapfile is the abbreviated name of the encoding as
    95 #              used by the binary mapping files (.ump files). i.e. if the
    96 #              encoding uses the map files gbku.ump and ugbk.ump, mapfile
    97 #              will be set to "gbk".
    98 # label     -- The standard label to which you must set the value of
    99 #              "charset" within http headers or html meta tags to get a web
    100 #              browser to use the given encoding. The label option is
    101 #              mandatory.
    102 Encoding shortname=utf8 "longname=Unicode (UTF-8)" type=UTF8 label=UTF-8
    103 Encoding shortname=iso1 "longname=Western (ISO-8859-1)" type=ISO_8859 mapfile=1.TXT label=ISO-8859-1
    104 Encoding shortname=w1251 "longname=Cyrillic (Windows-1251)" type=WINDOWS mapfile=1251.TXT label=windows-1251
    105 Encoding shortname=w1256 "longname=Arabic (Windows-1256)" type=WINDOWS mapfile=1256.TXT label=windows-1256
    106 Encoding shortname=w1256 "longname=Central European (Windows-1250)" type=WINDOWS mapfile=1250.TXT label=windows-1250
    107 Encoding shortname=gb "longname=Chinese Simplified (GBK)" type=CJK label=GBK mapfile=gbk
    108 Encoding shortname=sjis "longname=Japanese (Shift-JIS)" type=CJK label=shift_jis mapfile=sjis
    109 Encoding shortname=koi8r "longname=Cyrillic (KOI8-R)" type=CYRILLIC mapfile=koi8_r.txt label=koi8-r
     87# map       -- The name of the map file (i.e. the .ump file) for use when
     88#              converting between unicode and the given encoding. The map
     89#              option is mandatory for all encoding lines except the
     90#              special case for utf8.
    11091
    111 # The following encoding is not currently supported
    112 # Encoding shortname=eucjp "longname=Japanese (EUC)" type=CJK label=euc-jp mapfile=jis
     92# The utf8 encoding is handled internally and doesn't require a map file.
     93# As a rule the utf8 encoding should always be enabled, especially if you
     94# have collections of documents that may not all be in the same
     95# language/encoding.
     96Encoding shortname=utf-8 "longname=Unicode (UTF-8)"
     97
     98# The ISO-8859 series
     99Encoding shortname=iso-8859-1 "longname=Western (ISO-8859-1)" map=8859_1.ump
     100#Encoding shortname=iso-8859-2 "longname=Central European (ISO-8859-2)" map=8859_2.ump
     101#Encoding shortname=iso-8859-3 "longname=Latin 3 (ISO-8859-3)" map=8859_3.ump
     102#Encoding shortname=iso-8859-4 "longname=Latin 4 (ISO-8859-4)" map=8859_4.ump
     103#Encoding shortname=iso-8859-5 "longname=Cyrillic (ISO-8859-5)" map=8859_5.ump
     104#Encoding shortname=iso-8859-6 "longname=Arabic (ISO-8859-6)" map=8859_6.ump
     105#Encoding shortname=iso-8859-7 "longname=Greek (ISO-8859-7)" map=8859_7.ump
     106#Encoding shortname=iso-8859-8 "longname=Hebrew (ISO-8859-8)" map=8859_8.ump
     107#Encoding shortname=iso-8859-9 "longname=Turkish (ISO-8859-9)" map=8859_9.ump
     108
     109# Windows codepages
     110#Encoding shortname=windows-1250 "longname=Central European (Windows-1250)" map=win1250.ump
     111#Encoding shortname=windows-1251 "longname=Cyrillic (Windows-1251)" map=win1251.ump
     112#Encoding shortname=windows-1252 "longname=Western (Windows-1252)" map=win1252.ump
     113#Encoding shortname=windows-1253 "longname=Greek (Windows-1253)" map=win1253.ump
     114#Encoding shortname=windows-1254 "longname=Turkish (Windows-1254)" map=win1254.ump
     115#Encoding shortname=windows-1255 "longname=Hebrew (Windows-1255)" map=win1255.ump
     116Encoding shortname=windows-1256 "longname=Arabic (Windows-1256)" map=win1256.ump
     117#Encoding shortname=windows-1257 "longname=Baltic (Windows-1257)" map=win1257.ump
     118#Encoding shortname=windows-1258 "longname=Vietnamese (Windows-1258)" map=win1258.ump
     119#Encoding shortname=windows-874 "longname=Thai (Windows-874)" map=win874.ump
     120
     121# KOI8 Cyrillic encodings
     122#Encoding shortname=koi8-r "longname=Cyrillic (KOI8-R)" map=koi8_r.ump
     123#Encoding shortname=koi8-u "longname=Cyrillic (KOI8-U)" map=koi8_u.ump
     124
     125# CJK encodings (note that Shift-JIS Japanese isn't currently supported)
     126Encoding shortname=gbk "longname=Chinese Simplified (GBK)" map=gbk.ump
     127Encoding shortname=big5 "longname=Chinese Traditional (Big5)" map=big5.ump
     128Encoding shortname=euc-jp "longname=Japanese (EUC)" map=euc_jp.ump
     129Encoding shortname=euc-kr "longname=Korean (UHC)" map=uhc.ump
    113130
    114131
     
    126143#                     interface language. This should be set to the
    127144#                     "shortname" of a valid "Encoding" line
    128 Language shortname=en longname=English default_encoding=iso1
    129 Language shortname=fr longname=French default_encoding=iso1
    130 Language shortname=zh longname=Chinese default_encoding=gb
    131 Language shortname=de longname=German default_encoding=iso1
    132 Language shortname=es longname=Spanish default_encoding=iso1
    133 Language shortname=mi longname=Maori default_encoding=iso1
    134 Language shortname=ar longname=Arabic default_encoding=w1256
    135 Language shortname=pt longname=Portuguese default_encoding=iso1
    136 Language shortname=nl longname=Dutch default_encoding=iso1
     145Language shortname=en longname=English default_encoding=iso-8859-1
     146Language shortname=fr longname=French default_encoding=iso-8859-1
     147Language shortname=zh longname=Chinese default_encoding=gbk
     148Language shortname=de longname=German default_encoding=iso-8859-1
     149Language shortname=es longname=Spanish default_encoding=iso-8859-1
     150Language shortname=mi longname=Maori default_encoding=iso-8859-1
     151Language shortname=ar longname=Arabic default_encoding=windows-1256
     152Language shortname=pt longname=Portuguese default_encoding=iso-8859-1
     153Language shortname=nl longname=Dutch default_encoding=iso-8859-1
    137154
    138155
Note: See TracChangeset for help on using the changeset viewer.