root/gs3-extensions/html-to-expeditee/trunk/src/perllib/CssStyleToExpAttr.pm @ 26727

Revision 26727, 11.5 KB (checked in by davidb, 7 years ago)

Working on obtaining the correct font information for text elements on an html page.

Line 
1###########################################################################
2#
3# CssStyleToExpAttr.pm --
4# A component of the Greenstone digital library software
5# from the New Zealand Digital Library Project at the
6# University of Waikato, New Zealand.
7#
8# Copyright (C) 2009 New Zealand Digital Library Project
9#
10# This program is free software; you can redistr   te it and/or modify
11# it under the terms of the GNU General Public License as published by
12# the Free Software Foundation; either version 2 of the License, or
13# (at your option) any later version.
14#
15# This program is distributed in the hope that it will be useful,
16# but WITHOUT ANY WARRANTY; without even the implied warranty of
17# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
18# GNU General Public License for more details.
19#
20# You should have received a copy of the GNU General Public License
21# along with this program; if not, write to the Free Software
22# Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
23#
24###########################################################################
25
26package CssStyleToExpAttr;
27
28my $font_generic_family_lookup = {
29    'serif'      => "t", # (e.g., Times)
30    'sans-serif' => "s", # (e.g., Helvetica)
31    'cursive',   => "s", # (e.g., Zapf-Chancery)
32    'fantasy'    => "s", # (e.g., Western)
33    'monospace'  => "m"  # (e.g., Courier)
34};
35
36
37my $font_specific_family_lookup = {
38  "arial"           => "sans-serif",
39  "arial black"     => "sans-serif",
40  "gadget"          => "sans-serif",
41  "comic sans ms"       => "cursive",
42  "comic sans"      => "cursive",
43  "courier"         => "monospace",
44  "courier new"     => "monospace",
45  "georgia"         => "serif",
46  "impact"          => "sans-serif",
47  "charcoal"        => "sans-serif",
48  "lucida console"      => "monospace",
49  "monaco"          => "monospace",
50  "lucida sans unicode" => "sans-serif",
51  "lucida grande"       => "sans-serif",
52  "palatino linotype"   => "serif",
53  "book antiqua"        => "serif",
54  "palatino"        => "serif",
55  "tahoma"          => "sans-serif",
56  "geneva"          => "sans-serif",
57  "georgia"         => "serif",
58  "times"           => "serif",
59  "times new roman"     => "serif",
60  "trebuchet ms"        => "sans-serif",
61  "trebuchet"       => "sans-serif",
62  "verdana"         => "sans-serif",
63  "geneva"          => "sans-serif",
64  #symbol       => "symbol",
65  #webdings         => "symbol",
66  #wingdings        => "symbol",
67  #zapf dingbats    => "symbol",
68  "ms sans serif"       => "sans-serif",
69  "sans serif       => sans-serif,
70  geneva"           => "sans-serif",
71  "ms serif"        => "serif",
72  "new york"        => "serif"
73};
74
75my $UNUSED_font_specific_family_mapping = {
76    'serif'      => [
77             "Times New Roman",
78             "Bodoni",
79             "Garamond",
80             "Minion Web",
81             "ITC Stone Serif",
82             "MS Georgia",
83             "Bitstream Cyberbit",
84             "Adobe Minion Cyrillic",
85             "Excelsior Cyrillic Upright",
86             "Monotype Albion 70",
87             "ER Bukinist",
88             "New Peninim",
89             "Raanana",
90             "Ryumin Light-KL",
91             "Kyokasho ICA",
92             "Futo Min A101",
93             "Lo Cicero Cherokee"
94    ],
95
96    'sans-serif' => [
97             "MS Trebuchet",
98             "ITC Avant Garde Gothic",
99             "MS Arial",
100             "MS Verdana",
101             "Univers",
102             "Futura",
103             "ITC Stone Sans",
104             "Gill Sans",
105             "Akzidenz Grotesk",
106             "Helvetica",
107             "Attika",
108             "Typiko New Era",
109             "MS Tahoma",
110             "Monotype Gill Sans 571",
111             "Helvetica Greek",
112             "Helvetica Cyrillic",
113             "ER Univers",
114             "Lucida Sans Unicode",
115             "Bastion",
116             "Arial Hebrew",
117             "Shin Go",
118             "Heisei Kaku Gothic W5"
119    ],
120    'cursive'    => [
121             "Caflisch Script",
122             "Adobe Poetica",
123             "Sanvito",
124             "Ex Ponto",
125             "Snell Roundhand",
126             "Zapf-Chancery",
127             "ER Architekt",
128             "Corsiva",
129             "DecoType Naskh",
130             "Monotype Urdu 507"
131    ],
132 
133   'fantasy'    => [
134             "Alpha Geometrique",
135             "Critter",
136             "Cottonwood",
137             "FB Reactor",
138             "Studz"
139    ],
140
141    'monospace'  => [
142             "Courier",
143             "MS Courier New",
144             "Prestige",
145             "Everson Mono",
146             "ER Kurier",
147             "Osaka Monospaced",
148    ]
149};
150
151
152                 
153my $font_style_lookup = {
154    'normal'  => "n",
155    'italic'  => "i",
156    'oblique' => 'i'
157};
158
159# Nothing that can currently be done for small-caps
160my $font_varient_lookup = {
161    'normal' => "",
162    'small-caps' => ""
163};
164
165
166my $font_weight_lookup = {
167    'normal'  => "n",
168    'bold'    => "n",
169    'bolder'  => "b", # filler for now
170    'lighter' => "n", # filler for now
171    '100'     => "n",
172    '200'     => "n",
173    '300'     => "b",
174    '400'     => "b",
175    '500'     => "b",
176    '600'     => "b",
177    '700'     => "b",
178    '800'     => "b",
179    '900'     => "b"
180};
181
182
183my $font_size_absolute = {
184    'xx-small' => 8,
185    'x-small'  =>10,
186    'small'    =>12,
187    'medium'   =>14,
188    'large'    =>16,
189    'x-large'  =>18,
190    'xx-large' =>20
191};
192
193# px, em, percentage, and relative, such as larger
194
195## color, background-color
196
197my $color_name_lookup = {
198    "aliceblue" =>  [240,248,255],
199    "antiquewhite" =>   [250,235,215],
200    "aqua" =>       [0,255,255],
201    "aquamarine" =>     [127,255,212],
202    "azure" =>      [240,255,255],
203    "beige" =>      [245,245,220],
204    "bisque" =>     [255,228,196],
205    "black" =>      [0,0,0],
206    "blanchedalmond" => [255,235,205],
207    "blue" =>       [0,0,255],
208    "blueviolet" =>     [138,43,226],
209    "brown" =>      [165,42,42],
210    "burlywood" =>  [222,184,135],
211    "cadetblue" =>  [95,158,160],
212    "chartreuse" =>     [127,255,0],
213    "chocolate" =>  [210,105,30],
214    "coral" =>      [255,127,80],
215    "cornflowerblue" => [100,149,237],
216    "cornsilk" =>   [255,248,220],
217    "crimson" =>    [220,20,60],
218    "cyan" =>       [0,255,255],
219    "darkblue" =>   [0,0,139],
220    "darkcyan" =>   [0,139,139],
221    "darkgoldenrod" =>  [184,134,11],
222    "darkgray" =>   [169,169,169],
223    "darkgreen" =>  [0,100,0],
224    "darkgrey" =>   [169,169,169],
225    "darkkhaki" =>  [189,183,107],
226    "darkmagenta" =>    [139,0,139],
227    "darkolivegreen" => [85,107,47],
228    "darkorange" =>     [255,140,0],
229    "darkorchid" =>     [153,50,204],
230    "darkred" =>    [139,0,0],
231    "darksalmon" =>     [233,150,122],
232    "darkseagreen" =>   [143,188,143],
233    "darkslateblue" =>  [72,61,139],
234    "darkslategray" =>  [47,79,79],
235    "darkslategrey" =>  [47,79,79],
236    "darkturquoise" =>  [0,206,209],
237    "darkviolet" =>     [148,0,211],
238    "deeppink" =>   [255,20,147],
239    "deepskyblue" =>    [0,191,255],
240    "dimgray" =>    [105,105,105],
241    "dimgrey" =>    [105,105,105],
242    "dodgerblue" =>     [30,144,255],
243    "firebrick" =>  [178,34,34],
244    "floralwhite" =>    [255,250,240],
245    "forestgreen" =>    [34,139,34],
246    "fuchsia" =>    [255,0,255],
247    "gainsboro" =>  [220,220,220],
248    "ghostwhite" =>     [248,248,255],
249    "gold" =>       [255,215,0],
250    "goldenrod" =>  [218,165,32],
251    "gray" =>       [128,128,128],
252    "green" =>      [0,128,0],
253    "greenyellow" =>    [173,255,47],
254    "grey" =>       [128,128,128],
255    "honeydew" =>   [240,255,240],
256    "hotpink" =>    [255,105,180],
257    "indianred" =>  [205,92,92],
258    "indigo" =>     [75,0,130],
259    "ivory" =>      [255,255,240],
260    "khaki" =>      [240,230,140],
261    "lavender" =>   [230,230,250],
262    "lavenderblush" =>  [255,240,245],
263    "lawngreen" =>  [124,252,0],
264    "lemonchiffon" =>   [255,250,205],
265    "lightblue" =>  [173,216,230],
266    "lightcoral" =>     [240,128,128],
267    "lightcyan" =>  [224,255,255],
268    "lightgoldenrodyellow" =>   [250,250,210],
269    "lightgray" =>  [211,211,211],
270    "lightgreen" =>     [144,238,144],
271    "lightgrey" =>  [211,211,211],
272    "lightpink" =>  [255,182,193],
273    "lightsalmon" =>    [255,160,122],
274    "lightseagreen" =>  [32,178,170],
275    "lightskyblue" =>   [135,206,250],
276    "lightslategray" => [119,136,153],
277    "lightslategrey" => [119,136,153],
278    "lightsteelblue" => [176,196,222],
279    "lightyellow" =>    [255,255,224],
280    "lime" =>       [0,255,0],
281    "limegreen" =>  [50,205,50],
282    "linen" =>      [250,240,230],
283    "magenta" =>    [255,0,255],
284    "maroon" =>     [128,0,0],
285    "mediumaquamarine" =>   [102,205,170],
286    "mediumblue" =>     [0,0,205],
287    "mediumorchid" =>   [186,85,211],
288    "mediumpurple" =>   [147,112,219],
289    "mediumseagreen" =>     [60,179,113],
290    "mediumslateblue" =>    [123,104,238],
291    "mediumspringgreen" =>  [0,250,154],
292    "mediumturquoise" =>    [72,209,204],
293    "mediumvioletred" =>    [199,21,133],
294    "midnightblue" =>   [25,25,112],
295    "mintcream" =>  [245,255,250],
296    "mistyrose" =>  [255,228,225],
297    "moccasin" =>   [255,228,181],
298    "navajowhite" =>    [255,222,173],
299    "navy" =>       [0,0,128],
300    "oldlace" =>    [253,245,230],
301    "olive" =>      [128,128,0],
302    "olivedrab" =>  [107,142,35],
303    "orange" =>     [255,165,0],
304    "orangered" =>  [255,69,0],
305    "orchid" =>     [218,112,214],
306    "palegoldenrod" =>  [238,232,170],
307    "palegreen" =>  [152,251,152],
308    "paleturquoise" =>  [175,238,238],
309    "palevioletred" =>  [219,112,147],
310    "papayawhip" =>     [255,239,213],
311    "peachpuff" =>  [255,218,185],
312    "peru" =>       [205,133,63],
313    "pink" =>       [255,192,203],
314    "plum" =>       [221,160,221],
315    "powderblue" =>     [176,224,230],
316    "purple" =>     [128,0,128],
317    "red" =>        [255,0,0],
318    "rosybrown" =>  [188,143,143],
319    "royalblue" =>  [65,105,225],
320    "saddlebrown" =>    [139,69,19],
321    "salmon" =>     [250,128,114],
322    "sandybrown" =>     [244,164,96],
323    "seagreen" =>   [46,139,87],
324    "seashell" =>   [255,245,238],
325    "sienna" =>     [160,82,45],
326    "silver" =>     [192,192,192],
327    "skyblue" =>    [135,206,235],
328    "slateblue" =>  [106,90,205],
329    "slategray" =>  [112,128,144],
330    "slategrey" =>  [112,128,144],
331    "snow" =>       [255,250,250],
332    "springgreen" =>    [0,255,127],
333    "steelblue" =>  [70,130,180],
334    "tan" =>        [210,180,140],
335    "teal" =>       [0,128,128],
336    "thistle" =>    [216,191,216],
337    "tomato" =>     [255,99,71],
338    "turquoise" =>  [64,224,208],
339    "violet" =>     [238,130,238],
340    "wheat" =>      [245,222,179],
341    "white" =>      [255,255,255],
342    "whitesmoke" =>     [245,245,245],
343    "yellow" =>     [255,255,0],
344    "yellowgreen" =>    [154,205,50 ]
345};
346
347
348sub convert_font_size
349{
350    my ($css_font_size) = @_;
351
352    my $exp_font_size = undef;
353
354   
355    #if ($css_font_size =~ m/^(\d+(?:\.\d*))px$/) {
356    #   $exp_font_size = int($1);
357    #}
358   
359    $css_font_size =~ s/[^0-9]//g;
360   
361    if(defined $css_font_size){
362        $exp_font_size = $css_font_size;
363    }
364
365    return $exp_font_size;
366}
367
368
369sub convert_color
370{
371    my ($css_color) = @_;
372
373    my $exp_color;
374
375    if ($css_color =~ m/^rgb\((\d+),\s*(\d+),\s*(\d+)\)$/) {
376
377    my $r = int(100*$1/255);
378    my $g = int(100*$2/255);
379    my $b = int(100*$3/255);
380
381    print STDERR "*** r = $r, g = $g, b = $b\n";
382
383    $exp_color = "$r $g $b";
384
385    print STDERR "*** exp color = $exp_color\n";
386
387    }
388    elsif ($css_color =~ m/^transparent/i) {
389    $exp_color = undef;
390    }
391
392    return $exp_color;
393}
394
395sub convert_font_family
396{
397    my ($css_font_family) = @_;
398       
399    print STDERR "*** PASSING PARAMETER css font family: ".$css_font_family."\n";
400   
401    my $exp_font_family;
402   
403    #use $font_specific_family_lookup and $font_generic_family_lookup
404    #to find the appropriate font family tag to output to expeditee.
405    if(defined $font_specific_family_lookup->{lc($css_font_family)}){
406        $exp_font_family = $css_font_family."_";
407    }
408   
409    print STDERR "**** TESTING TESTING ".$font_specific_family_lookup->{"georgia"}."\n";
410    print STDERR "**** TESTING TESTING ".$font_specific_family_lookup->{lc($css_font_family)}."\n";
411    print STDERR "**** TESTING TESTING ".$font_specific_family_lookup->{$css_font_family}."\n";
412    print STDERR "In CssStyleToExpAttr: font family attribute: $exp_font_family ******* \n";
413   
414    return $exp_font_family;
415}
416
417sub convert_font_style
418{
419    my ($css_font_style) = @_;
420
421    my $exp_font_style;
422   
423    return $exp_font_style;
424}
425   
4261;
Note: See TracBrowser for help on using the browser.