source: main/trunk/greenstone2/perllib/encodings.pm@ 21411

Last change on this file since 21411 was 15894, checked in by mdewsnip, 16 years ago

Added "use strict" to the files missing it.

  • Property svn:keywords set to Author Date Id Revision
File size: 4.5 KB
Line 
1###########################################################################
2#
3# encodings.pm --
4# A component of the Greenstone digital library software
5# from the New Zealand Digital Library Project at the
6# University of Waikato, New Zealand.
7#
8# Copyright (C) 2001 New Zealand Digital Library Project
9#
10# This program is free software; you can redistribute it and/or modify
11# it under the terms of the GNU General Public License as published by
12# the Free Software Foundation; either version 2 of the License, or
13# (at your option) any later version.
14#
15# This program is distributed in the hope that it will be useful,
16# but WITHOUT ANY WARRANTY; without even the implied warranty of
17# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
18# GNU General Public License for more details.
19#
20# You should have received a copy of the GNU General Public License
21# along with this program; if not, write to the Free Software
22# Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
23#
24###########################################################################
25
26# Each encoding supported by the Greenstone build-time software should be
27# specified in the following hash table ($encodings).
28
29package encodings;
30
31use strict;
32
# $encodings::encodings is a reference to a hash keyed by encoding
# identifier.  Each value is itself a hash reference of the form:
#
#   identifier --> name      --> The full display name of the encoding.
#              --> mapfile   --> The ump file associated with the encoding.
#              --> double    --> 1 if it's a double byte encoding.
#              --> converter --> If the encoding needs a specialized
#                                conversion routine this is the name of
#                                that routine.
#
# Every entry in the table below supplies 'name' and 'mapfile'.  Only
# 'shift_jis' names a 'converter', and no entry in this table sets
# 'double'.
#
# The variable is written with its full package name so that it is
# accepted under "use strict" without a separate declaration.

$encodings::encodings = {

    # ISO 8859 family
    'iso_8859_1'  => {'name'    => 'Latin1 (western languages)',
                      'mapfile' => '8859_1.ump'},

    'iso_8859_2'  => {'name'    => 'Latin2 (central and eastern european languages)',
                      'mapfile' => '8859_2.ump'},

    'iso_8859_3'  => {'name' => 'Latin3', 'mapfile' => '8859_3.ump'},

    'iso_8859_4'  => {'name' => 'Latin4', 'mapfile' => '8859_4.ump'},

    'iso_8859_5'  => {'name' => 'Cyrillic', 'mapfile' => '8859_5.ump'},

    'iso_8859_6'  => {'name' => 'Arabic', 'mapfile' => '8859_6.ump'},

    'iso_8859_7'  => {'name' => 'Greek', 'mapfile' => '8859_7.ump'},

    'iso_8859_8'  => {'name' => 'Hebrew', 'mapfile' => '8859_8.ump'},

    'iso_8859_9'  => {'name' => 'Turkish', 'mapfile' => '8859_9.ump'},

    'iso_8859_15' => {'name'    => 'Latin15 (revised western)',
                      'mapfile' => '8859_15.ump'},

    # Windows codepages
    'windows_1250' => {'name'    => 'Windows codepage 1250 (WinLatin2)',
                       'mapfile' => 'win1250.ump'},

    'windows_1251' => {'name'    => 'Windows codepage 1251 (WinCyrillic)',
                       'mapfile' => 'win1251.ump'},

    'windows_1252' => {'name'    => 'Windows codepage 1252 (WinLatin1)',
                       'mapfile' => 'win1252.ump'},

    'windows_1253' => {'name'    => 'Windows codepage 1253 (WinGreek)',
                       'mapfile' => 'win1253.ump'},

    'windows_1254' => {'name'    => 'Windows codepage 1254 (WinTurkish)',
                       'mapfile' => 'win1254.ump'},

    'windows_1255' => {'name'    => 'Windows codepage 1255 (WinHebrew)',
                       'mapfile' => 'win1255.ump'},

    'windows_1256' => {'name'    => 'Windows codepage 1256 (WinArabic)',
                       'mapfile' => 'win1256.ump'},

    'windows_1257' => {'name'    => 'Windows codepage 1257 (WinBaltic)',
                       'mapfile' => 'win1257.ump'},

    'windows_1258' => {'name'    => 'Windows codepage 1258 (Vietnamese)',
                       'mapfile' => 'win1258.ump'},

    'windows_874'  => {'name'    => 'Windows codepage 874 (Thai)',
                       'mapfile' => 'win874.ump'},

    # DOS codepages
    'dos_437' => {'name'    => 'DOS codepage 437 (US English)',
                  'mapfile' => 'dos437.ump'},

    'dos_850' => {'name'    => 'DOS codepage 850 (Latin 1)',
                  'mapfile' => 'dos850.ump'},

    'dos_852' => {'name'    => 'DOS codepage 852 (Central European)',
                  'mapfile' => 'dos852.ump'},

    'dos_866' => {'name'    => 'DOS codepage 866 (Cyrillic)',
                  'mapfile' => 'dos866.ump'},

    # KOI8 and ISCII
    'koi8_r'   => {'name' => 'Cyrillic', 'mapfile' => 'koi8_r.ump'},

    'koi8_u'   => {'name' => 'Cyrillic (Ukrainian)', 'mapfile' => 'koi8_u.ump'},

    'iscii_de' => {'name' => 'ISCII Devanagari', 'mapfile' => 'iscii_de.ump'},

    # Japanese, Korean and Chinese encodings
    'shift_jis' => {'name'      => 'Japanese (Shift-JIS)',
                    'mapfile'   => 'shiftjis.ump',
                    'converter' => 'shiftjis2unicode'},

    'euc_jp'    => {'name' => 'Japanese (EUC)', 'mapfile' => 'euc_jp.ump'},

    'korean'    => {'name'    => 'Korean (Unified Hangul Code - i.e. a superset of EUC-KR)',
                    'mapfile' => 'uhc.ump'},

    'gb'        => {'name' => 'Chinese Simplified (GB)', 'mapfile' => 'gbk.ump'},

    'big5'      => {'name' => 'Chinese Traditional (Big5)', 'mapfile' => 'big5.ump'}

};

# Return an explicit true value so that loading this module does not
# depend on the hash assignment above being the last statement.
1;
Note: See TracBrowser for help on using the repository browser.