root/other-projects/nightly-tasks/diffcol/trunk/model-collect/Associated-Files/archives/HASH0a87.dir/doc.xml @ 29717

Revision 29717, 141.6 KB (checked in by ak19, 5 years ago)

Updating after a change to the wvWare config file wvHtml.xml so that justified text in input Word documents is converted to justified text in the output HTML, instead of being output as left-aligned HTML. Still need to check whether the nightly tests on this collection succeed before regenerating the other affected model collections.

Line 
1<?xml version="1.0" encoding="utf-8" standalone="no"?>
2<!DOCTYPE Archive SYSTEM "http://greenstone.org/dtd/Archive/1.0/Archive.dtd">
3<Archive>
4<Section>
5  <Description>
6    <Metadata name="gsdldoctype">indexed_doc</Metadata>
7    <Metadata name="Language">en</Metadata>
8    <Metadata name="Encoding">utf8</Metadata>
9    <Metadata name="GENERATOR">wvWare/wvWare version 1.2.4</Metadata>
10    <Metadata name="Title">Greenstone: A Comprehensive Open-Source</Metadata>
11    <Metadata name="URL">http://Scratch/ak19/gs2-svn-22Oct2014/collect/Associated-Files/tmp/1423106799/greenstone01.html</Metadata>
12    <Metadata name="UTF8URL">http://Scratch/ak19/gs2-svn-22Oct2014/collect/Associated-Files/tmp/1423106799/greenstone01.html</Metadata>
13    <Metadata name="gsdlsourcefilename">import/greenstone01.doc</Metadata>
14    <Metadata name="gsdlconvertedfilename">tmp/1423106799/greenstone01.html</Metadata>
15    <Metadata name="OrigSource">greenstone01.html</Metadata>
16    <Metadata name="Source">greenstone01.doc</Metadata>
17    <Metadata name="SourceFile">greenstone01.doc</Metadata>
18    <Metadata name="Plugin">WordPlugin</Metadata>
19    <Metadata name="FileSize">414720</Metadata>
20    <Metadata name="FilenameRoot">greenstone01</Metadata>
21    <Metadata name="FileFormat">Word</Metadata>
22    <Metadata name="srcicon">_icondoc_</Metadata>
23    <Metadata name="srclink_file">doc.doc</Metadata>
24    <Metadata name="srclinkFile">doc.doc</Metadata>
25    <Metadata name="dc.Creator">Ian H. Witten</Metadata>
26    <Metadata name="dc.Creator">Rodger J. McNab</Metadata>
27    <Metadata name="dc.Creator">Stefan J. Boddie</Metadata>
28    <Metadata name="dc.Creator">David Bainbridge</Metadata>
29    <Metadata name="dc.Title">Greenstone: A Comprehensive Open-Source Digital Library Software System</Metadata>
30    <Metadata name="pdf.assoclink">&lt;a href=&quot;_httpprefix_/collect/[collection]/index/assoc/{Or}{[parent(Top):assocfilepath],[assocfilepath]}/greenstone01.pdf&quot;&gt;{If}{_iconpdf_,_iconpdf_,pdf}&lt;/a&gt;</Metadata>
31    <Metadata name="equivDocLink">&lt;a href='_httpprefix_/collect/[collection]/index/assoc/[assocfilepath]/greenstone01.pdf'&gt;</Metadata>
32    <Metadata name="equivDocIcon">_iconpdf_</Metadata>
33    <Metadata name="/equivDocLink">&lt;/a&gt;</Metadata>
34    <Metadata name="equivlink"> &lt;a href=&quot;_httpprefix_/collect/[collection]/index/assoc/{Or}{[parent(Top):assocfilepath],[assocfilepath]}/greenstone01.pdf&quot;&gt;{If}{_iconpdf_,_iconpdf_,pdf}&lt;/a&gt;</Metadata>
35    <Metadata name="Identifier">HASH0a87f402e5d107f0d73a2a</Metadata>
36    <Metadata name="lastmodified">1423106757</Metadata>
37    <Metadata name="lastmodifieddate">20150205</Metadata>
38    <Metadata name="oailastmodified">1423106799</Metadata>
39    <Metadata name="oailastmodifieddate">20150205</Metadata>
40    <Metadata name="assocfilepath">HASH0a87.dir</Metadata>
41    <Metadata name="gsdlassocfile">greenstone010.png:image/png:</Metadata>
42    <Metadata name="gsdlassocfile">greenstone011.png:image/png:</Metadata>
43    <Metadata name="gsdlassocfile">greenstone012.png:image/png:</Metadata>
44    <Metadata name="gsdlassocfile">greenstone013.png:image/png:</Metadata>
45    <Metadata name="gsdlassocfile">greenstone014.png:image/png:</Metadata>
46    <Metadata name="gsdlassocfile">greenstone015.png:image/png:</Metadata>
47    <Metadata name="gsdlassocfile">doc.doc:application/msword:</Metadata>
48    <Metadata name="gsdlassocfile">greenstone01.pdf::</Metadata>
49  </Description>
50  <Content>
51
52&lt;!--Section Begins--&gt;&lt;br&gt;
53
54
55
56&lt;p&gt;&lt;div name=&quot;Heading 1&quot; align=&quot;center&quot; style=&quot;margin: 4.17mm 0.50mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
57
58&lt;p style=&quot;text-indent: 0.00mm; text-align: center; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
59&lt;b&gt;&lt;span style=&quot;text-transform:uppercase&quot;&gt;Greenstone:  A Comprehensive Open-Source Digital Library Software System&lt;/span&gt;&lt;/b&gt;
60&lt;/p&gt;&lt;/div&gt;
61
62
63
64&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;center&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
65
66&lt;p style=&quot;text-indent: 0.00mm; text-align: center; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
67&lt;b&gt;&lt;/b&gt;
68&lt;/p&gt;&lt;/div&gt;
69
70
71
72&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;center&quot; style=&quot;margin: 1.74mm 0.00mm 1.39mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
73
74&lt;p style=&quot;text-indent: 0.00mm; text-align: center; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
75&lt;i&gt;Ian H. Witten,&lt;/i&gt;&lt;i&gt;&lt;sup&gt;*&lt;/sup&gt;&lt;/i&gt;&lt;i&gt; Rodger J. McNab,&lt;/i&gt;&lt;i&gt;&lt;sup&gt;&amp;dagger;&lt;/sup&gt;&lt;/i&gt;&lt;i&gt; Stefan J. Boddie,&lt;/i&gt;&lt;i&gt;&lt;sup&gt;*&lt;/sup&gt;&lt;/i&gt;&lt;i&gt; David Bainbridge&lt;/i&gt;&lt;i&gt;&lt;sup&gt;*&lt;/sup&gt;&lt;/i&gt;&lt;i&gt; &lt;/i&gt;&lt;i&gt;&lt;sup&gt;&lt;/sup&gt;&lt;/i&gt;
76&lt;/p&gt;&lt;/div&gt;
77
78
79&lt;table width=&quot;98.51%&quot; border=&quot;1&quot; cols=&quot;2&quot; rows=&quot;1&quot;&gt;
80&lt;tr&gt;&lt;td bgcolor=&quot;White&quot; width=&quot;46.57%&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;center&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
81
82&lt;p style=&quot;text-indent: 0.00mm; text-align: center; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
83&lt;sup&gt;*&lt;/sup&gt; Dept of Computer Science
84&lt;/p&gt;&lt;/div&gt;
85
86
87
88&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;center&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
89
90&lt;p style=&quot;text-indent: 0.00mm; text-align: center; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
91University of Waikato, New Zealand
92&lt;/p&gt;&lt;/div&gt;
93
94
95
96&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;center&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
97
98&lt;p style=&quot;text-indent: 0.00mm; text-align: center; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
99E-mail:  {ihw, sjboddie, davidb}@cs.waikato.ac.nz
100&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
101
102
103
104&lt;td bgcolor=&quot;White&quot; width=&quot;53.43%&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;center&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
105
106&lt;p style=&quot;text-indent: 0.00mm; text-align: center; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
107&lt;sup&gt;&amp;dagger; &lt;/sup&gt;Digilib Systems
108&lt;/p&gt;&lt;/div&gt;
109
110
111
112&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;center&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
113
114&lt;p style=&quot;text-indent: 0.00mm; text-align: center; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
115Hamilton, New Zealand
116&lt;/p&gt;&lt;/div&gt;
117
118
119
120&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;center&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
121
122&lt;p style=&quot;text-indent: 0.00mm; text-align: center; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
123E-mail:  rodger@digilibs.com
124&lt;/p&gt;&lt;/div&gt;
125
126
127
128&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;center&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
129
130&lt;p style=&quot;text-indent: 0.00mm; text-align: center; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
131&lt;sup&gt;&lt;/sup&gt;
132&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
133
134&lt;/tr&gt;
135
136&lt;/table&gt;
137
138&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
139
140&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
141&lt;b&gt;&lt;/b&gt;
142&lt;/p&gt;&lt;/div&gt;
143
144
145
146&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
147
148&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
149&lt;b&gt;&lt;/b&gt;
150&lt;/p&gt;&lt;/div&gt;
151
152&lt;!--Section Ends--&gt;
153
154&lt;!--Section Begins--&gt;&lt;br&gt;
155
156
157
158&lt;p&gt;&lt;div name=&quot;Heading 1&quot; align=&quot;left&quot; style=&quot;margin: 0.00mm 0.49mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
159
160&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
161&lt;b&gt;&lt;span style=&quot;text-transform:uppercase&quot;&gt;Abstract&lt;/span&gt;&lt;/b&gt;
162&lt;/p&gt;&lt;/div&gt;
163
164
165
166&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
167
168&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
169This paper describes the Greenstone digital library software, a comprehensive, open-source system for the construction and presentation of information collections. Collections built with Greenstone offer effective full-text searching and metadata-based browsing facilities that are attractive and easy to use. Moreover, they are easily maintainable and can be augmented and rebuilt entirely automatically. The system is extensible: software &amp;ldquo;plugins&amp;rdquo; accommodate different document and metadata types.
170&lt;/p&gt;&lt;/div&gt;
171
172
173
174&lt;p&gt;&lt;div name=&quot;Heading 1&quot; align=&quot;left&quot; style=&quot;margin: 4.17mm 0.50mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
175
176&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
177&lt;b&gt;&lt;span style=&quot;text-transform:uppercase&quot;&gt;Introduction&lt;/span&gt;&lt;/b&gt;
178&lt;/p&gt;&lt;/div&gt;
179
180
181
182&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
183
184&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
185Notwithstanding intense research activity in the digital library field during the second half of the 1990s, comprehensive software systems for creating digital libraries are not widely available. In fact, the usual solution when creating a digital library is also the most obvious&amp;mdash;just put it on the Web. But consider how much effort is involved in constructing a Web site for a digital library. To be effective it needs to be visually attractive and ergonomically easy to use, incorporate convenient and powerful searching capabilities, and offer rich and natural browsing facilities. Above all it must be easy to maintain and augment, which presents a significant challenge if any manual organization is involved.
186&lt;/p&gt;&lt;/div&gt;
187
188
189
190&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
191
192&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
193The alternative is to automate these activities through software tools. But the broad scope of digital library requirements makes this a daunting prospect. Ideally the software should incorporate facilities ranging from multilingual information retrieval to distributed computing protocols, from interoperability to search engine technology, from metadata standards to multiformat document parsing, from multimedia to multiple operating systems, from Web browsers to plug-and-play DVDs.
194&lt;/p&gt;&lt;/div&gt;
195
196
197
198&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
199
200&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
201The Greenstone Digital Library Software from the New Zealand Digital Library (NZDL) project tackles this issue by providing a new way of organizing information and making it available over the Internet. A &lt;i&gt;collection&lt;/i&gt; of information comprises several (typically several thousand, or several million) &lt;i&gt;documents&lt;/i&gt;, and a uniform interface is provided to all documents in a collection. A library may include many different collections, each organized differently&amp;mdash;though there is a strong family resemblance in how collections are presented.
202&lt;/p&gt;&lt;/div&gt;
203
204
205
206&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
207
208&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
209Making information available using this system is far more than &amp;ldquo;just putting it on the Web.&amp;rdquo; The collection becomes maintainable, searchable, and browsable. Each collection, prior to presentation, undergoes a &amp;ldquo;building&amp;rdquo; process that, once established, is completely automatic. This process creates all the structures that are used at run-time for accessing the collection. Searching is based on various indexes, while browsing is based on various metadata; support structures for both are created during the building operation. When new material appears it can be fully incorporated into the collection by rebuilding.
210&lt;/p&gt;&lt;/div&gt;
211
212
213
214&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
215
216&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
217To address the exceptionally broad demands of digital libraries, the system is public and extensible. It is issued under the GNU General Public License and, in the spirit of open-source software, users are invited to contribute modifications and enhancements. Only through an international cooperative effort will digital library software become sufficiently comprehensive to meet the world's needs. Currently the Greenstone software is used at sites in Canada, Germany, New Zealand, Romania, UK, and the US, and collections range from newspaper articles to technical documents, from educational journals to oral history, from visual art to folksongs. The software has been used for collections in many different languages, and for CD-ROMs that have been published by the United Nations and other humanitarian agencies in Belgium, France, Japan, and the US for distribution in developing countries (Humanity Libraries, 1998; PAHO, 1999; UNESCO, 1999; UNU, 1998). Further details can be obtained from &lt;i&gt;www.nzdl.org&lt;/i&gt;.
218&lt;/p&gt;&lt;/div&gt;
219
220
221
222&lt;p&gt;&lt;div name=&quot;Caption&quot; align=&quot;center&quot; style=&quot;margin: 2.08mm 2.74mm 0.00mm 17.26mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
223
224&lt;p style=&quot;text-indent: -17.26mm; text-align: center; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
225&lt;img width=&quot;740&quot; height=&quot;658&quot; alt=&quot;0x01 graphic&quot; src=&quot;_httpdocimg_/greenstone010.png&quot;&gt;&lt;br&gt;
226&lt;/p&gt;&lt;/div&gt;
227
228
229
230&lt;p&gt;&lt;div name=&quot;Caption&quot; align=&quot;center&quot; style=&quot;margin: 2.08mm 2.74mm 0.00mm 17.26mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
231
232&lt;p style=&quot;text-indent: -17.26mm; text-align: center; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
233&lt;b&gt;Figure &lt;/b&gt;&lt;b&gt;&lt;/b&gt;&lt;b&gt;&lt;/b&gt;&lt;b&gt;&lt;/b&gt;&lt;b&gt;1&lt;/b&gt;&lt;b&gt;&lt;/b&gt;&lt;b&gt;: Searching the HDL collection&lt;/b&gt;
234&lt;/p&gt;&lt;/div&gt;
235
236
237
238&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
239
240&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
241This paper sets the scene with a brief discussion of what a digital library is. We then give an overview of the facilities offered by Greenstone and show how end users find information in collections. Next we describe the files and directories involved in a collection, and then discuss the processes of updating existing collections and creating new ones, including extending the software to provide new facilities. We conclude with an overview of related work.
242&lt;/p&gt;&lt;/div&gt;
243
244
245
246&lt;p&gt;&lt;div name=&quot;Heading 1&quot; align=&quot;left&quot; style=&quot;margin: 4.17mm 0.50mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
247
248&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
249&lt;b&gt;&lt;span style=&quot;text-transform:uppercase&quot;&gt;What is a digital library?&lt;/span&gt;&lt;/b&gt;
250&lt;/p&gt;&lt;/div&gt;
251
252
253
254&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
255
256&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
257Ten definitions of the term &amp;ldquo;digital library&amp;rdquo; have been culled from the literature by Fox (1998), and their spirit is captured in the following brief characterization:
258&lt;/p&gt;&lt;/div&gt;
259
260
261
262&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;left&quot; style=&quot;margin: 2.08mm 7.55mm 0.00mm 7.81mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
263
264&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
265&lt;i&gt;A collection of digital objects, including text, video, and audio, along with methods for access and retrieval, and for selection, organization and maintenance of the collection&lt;/i&gt;
266&lt;/p&gt;&lt;/div&gt;
267
268
269
270&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
271
272&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
273(Akscyn and Witten, 1998). Lesk (1998) views digital libraries as &amp;ldquo;organized collections of digital information,&amp;rdquo; and wisely recommends that they articulate the principles governing what is included and how the collection is organized.
274&lt;/p&gt;&lt;/div&gt;
275
276
277
278&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
279
280&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
281Digital libraries are generally distinguished from the World-Wide Web, the essential difference being in selection and organization. But they are not generally distinguished from a web &lt;i&gt;site&lt;/i&gt;: indeed, virtually all extant digital libraries manifest themselves as a web site. Hence the obvious question: to make a digital library, why not just put the information on the Web?
282&lt;/p&gt;&lt;/div&gt;
283
284
285
286&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
287
288&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
289But we make a distinction between a digital library and a web site that lies at the heart of our software design: one should easily be able to add new material to a library without having to integrate it manually or edit its content in any way. Once added, new material should immediately become a first-class component of the library. And what permits it to be integrated into existing searching and browsing structures without any manual intervention is &lt;i&gt;metadata&lt;/i&gt;. This provides sufficient focus to the concept of &amp;ldquo;digital library&amp;rdquo; to support the development of a construction kit.
290&lt;/p&gt;&lt;/div&gt;
291
292
293
294&lt;p&gt;&lt;div name=&quot;Heading 1&quot; align=&quot;left&quot; style=&quot;margin: 4.17mm 0.50mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
295
296&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
297&lt;b&gt;&lt;span style=&quot;text-transform:uppercase&quot;&gt;Overview of Greenstone&lt;/span&gt;&lt;/b&gt;
298&lt;/p&gt;&lt;/div&gt;
299
300
301
302&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
303
304&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
305Information collections built by Greenstone combine extensive full-text search facilities with browsing indexes based on different metadata types. There are several ways for users to find information, although they differ between collections depending on the metadata available and the collection design. Typically you can &lt;i&gt;search for particular words&lt;/i&gt; that appear in the text, or within a section of a document, or within a title or section heading. You can &lt;i&gt;browse documents by title&lt;/i&gt;: just click on the displayed book icon to read it. You can &lt;i&gt;browse documents by subject&lt;/i&gt;. Subjects are represented by bookshelves: just click on a shelf to see the books. Where appropriate, documents come complete with a table of contents (constructed automatically): you can click on a chapter or subsection to open it, expand the full table of contents, or expand the full document.
306&lt;/p&gt;&lt;/div&gt;
307
308
309
310&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
311
312&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
313An example of searching is shown in Figure 1 where documents in the Global Help Project's Humanity Development Library (HDL) are being searched for chapters matching the word &lt;i&gt;butterfly&lt;/i&gt;. In Figure 2 the same collection is being browsed by subject: by clicking on the bookshelf icons the user has discovered an item under Section 16, Animal Husbandry. Pursuing an interest in butterfly farming, the user selects a book by clicking on its book icon. In Figure 3 the front cover of the book is displayed as a graphic on the left, and the automatically constructed table of contents appears at the start of the document. The current focus, &lt;i&gt;Introduction and Summary&lt;/i&gt;, is shown in bold in the table of contents with its text starting further down the page.
314&lt;/p&gt;&lt;/div&gt;
315
316
317
318&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
319
320&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
321In accordance with Lesk's advice, a statement of purpose and coverage accompanies each collection, along with an explanation of how it is organized (Figure 1 shows the start of this). A distinction is made between &lt;i&gt;searching&lt;/i&gt; and &lt;i&gt;browsing&lt;/i&gt;. Searching is full-text, and&amp;mdash;depending on the collection's design&amp;mdash;the user can choose between indexes built from different parts of the documents, or from different metadata. Some collections have an index of full documents, an index of sections, an index of paragraphs, an index of titles, and an index of section headings, each of which can be searched for particular words or phrases. Browsing involves data structures created from metadata that the user can examine: lists of authors, lists of titles, lists of dates, hierarchical classification structures, and so on. Data structures for both browsing and searching are built according to instructions in a configuration file, which controls both building and serving the collection. Sample configuration files are discussed below.
322&lt;/p&gt;&lt;/div&gt;
323
324
325
326&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
327
328&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
329
330&lt;/p&gt;&lt;/div&gt;
331
332
333
334&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;center&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
335
336&lt;p style=&quot;text-indent: 0.00mm; text-align: center; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
337&lt;img width=&quot;740&quot; height=&quot;658&quot; alt=&quot;0x01 graphic&quot; src=&quot;_httpdocimg_/greenstone011.png&quot;&gt;&lt;br&gt;&lt;b&gt;&lt;/b&gt;
338&lt;/p&gt;&lt;/div&gt;
339
340
341
342&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;center&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
343
344&lt;p style=&quot;text-indent: 0.00mm; text-align: center; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
345&lt;b&gt;Figure &lt;/b&gt;&lt;b&gt;&lt;/b&gt;&lt;b&gt;&lt;/b&gt;&lt;b&gt;&lt;/b&gt;&lt;b&gt;2&lt;/b&gt;&lt;b&gt;&lt;/b&gt;&lt;b&gt;: Browsing the HDL collection by subject&lt;/b&gt;&lt;b&gt;&lt;/b&gt;
346&lt;/p&gt;&lt;/div&gt;
347
348
349
350&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
351
352&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
353Rich browsing facilities can be provided by manually linking parts of documents together and building explicit indexes and tables of contents. However, manually-created linking becomes difficult to maintain, and often falls into disrepair when a collection expands. The Greenstone software takes a different tack: it facilitates &lt;i&gt;maintainability&lt;/i&gt; by creating all searching and browsing structures automatically from the documents themselves. No links are inserted by hand. This means that when new documents in the same format become available, they can be added automatically. Indeed, for some collections this is done by processes that wake up regularly, scout for new material, and rebuild the indexes&amp;mdash;all without manual intervention.
354&lt;/p&gt;&lt;/div&gt;
355
356
357
358&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
359
360&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
361Collections comprise many documents: thousands, tens of thousands, or even millions. Each document may be hierarchically organized into &lt;i&gt;sections&lt;/i&gt; (subsections, sub-subsections, and so on). Each section comprises one or more &lt;i&gt;paragraphs&lt;/i&gt;. Metadata such as author, title, date, keywords, and so on, may be associated with documents, or with individual sections of documents. This is the raw material for indexes. It must either be provided explicitly for each document and section (for example, in an accompanying spreadsheet) or be derivable automatically from the source documents. Metadata is converted to Dublin Core and stored with the document for internal use.
362&lt;/p&gt;&lt;/div&gt;
363
364
365
366&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
367
368&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
369In order to accommodate different kinds of source documents, the software is organized so that &amp;ldquo;plugins&amp;rdquo; can be written for new document types. Plugins exist for plain text documents, HTML documents, email documents, and bibliographic formats. Word documents are handled by saving them as HTML; PostScript ones by applying a preprocessor (Nevill-Manning &lt;i&gt;et al&lt;/i&gt;., 1998). Specially written plugins also exist for proprietary formats such as that used by the BBC archives department. A collection may have source documents in different forms: it is just a matter of specifying all the necessary plugins. In order to build browsing indexes from metadata, an analogous scheme of &amp;ldquo;classifiers&amp;rdquo; is used: classifiers create indexes of various kinds based on metadata. Source documents are brought into the Greenstone system through a process called &lt;i&gt;importing&lt;/i&gt;, which uses the plugins and classifiers specified in the collection configuration file.
370&lt;/p&gt;&lt;/div&gt;
371
372
373
374&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
375
376&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
377The international Unicode character set is used throughout, so documents&amp;mdash;and interfaces&amp;mdash;can be written in any language. Collections have so far been produced in English, French, Spanish, German, Maori, Chinese, and Arabic. The NZDL Web site provides numerous examples. Collections can contain text, pictures, and even audio and video clips; a text-only version of the interface is also provided to accommodate visually impaired users. Compression technology is used to ensure best use of storage (Witten &lt;i&gt;et al&lt;/i&gt;., 1999). Most non-textual material is either linked to textual documents or accompanied by textual descriptions (such as photo captions) to allow full-text searching and browsing. However, the architecture permits the implementation of plugins and classifiers even for non-textual data.
378&lt;/p&gt;&lt;/div&gt;
379
380
381
382&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
383
384&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
385The system includes an &amp;ldquo;administrative&amp;rdquo; function whereby specified users can examine the composition of all collections, protect documents so that they can only be accessed by registered users on presentation of a password, and so on. Logs of user activity are kept that record all queries made to every Greenstone collection (though this facility can be disabled).
386&lt;/p&gt;&lt;/div&gt;
387
388
389
390&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
391
392&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
393Although primarily designed for Internet access over the World-Wide Web, collections can be made available, in precisely the same form, on CD-ROM. In either case they are accessed through any Web browser. Greenstone CD-ROMs operate on a standalone PC under Windows 3.X, 95, 98, and NT, and the interaction is identical to accessing the collection on the Web&amp;mdash;except that response is faster and more predictable. The requirement to operate on early Windows systems is one that plagues the software design, but is crucial for many users&amp;mdash;particularly those in underdeveloped countries seeking access to humanitarian aid collections. If the PC is connected to a network (intranet or Internet), a custom-built Web server provided on each CD makes exactly the same information available to others through their standard Web browser. The use of compression ensures that the greatest possible volume of information can be packed on to a CD-ROM.
394&lt;/p&gt;&lt;/div&gt;
395
396
397
398&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
399
400&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
401The collection-serving software operates under Unix and Windows NT, and works with standard Web servers. A flexible process structure allows different collections to be served by different computers, yet be presented to the user in the same way, on the same Web page, as part of the same digital library, even as part of the same collection (McNab and Witten, 1998). Existing collections can be updated and new ones brought on-line at any time, without bringing the system down; the process responsible for the user interface will notice (through periodic polling) when new collections appear and add them to the list presented to the user.
402&lt;/p&gt;&lt;/div&gt;
403
404
405
406&lt;p&gt;&lt;div name=&quot;Heading 1&quot; align=&quot;center&quot; style=&quot;margin: 4.17mm 0.50mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
407
408&lt;p style=&quot;text-indent: 0.00mm; text-align: center; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
409&lt;b&gt;&lt;span style=&quot;text-transform:uppercase&quot;&gt;&lt;img width=&quot;760&quot; height=&quot;662&quot; alt=&quot;0x01 graphic&quot; src=&quot;_httpdocimg_/greenstone012.png&quot;&gt;&lt;br&gt;&lt;/span&gt;&lt;/b&gt;&lt;b&gt;&lt;span style=&quot;text-transform:uppercase&quot;&gt;&lt;/span&gt;&lt;/b&gt;
410&lt;/p&gt;&lt;/div&gt;
411
412
413
414&lt;p&gt;&lt;div name=&quot;Caption&quot; align=&quot;center&quot; style=&quot;margin: 2.08mm 2.74mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
415
416&lt;p style=&quot;text-indent: 0.00mm; text-align: center; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
417&lt;b&gt;Figure &lt;/b&gt;&lt;b&gt;&lt;/b&gt;&lt;b&gt;&lt;/b&gt;&lt;b&gt;&lt;/b&gt;&lt;b&gt;3&lt;/b&gt;&lt;b&gt;&lt;/b&gt;&lt;b&gt;: Reading a book in the HDL&lt;/b&gt;&lt;b&gt;&lt;/b&gt;
418&lt;/p&gt;&lt;/div&gt;
419
420
421
422&lt;p&gt;&lt;div name=&quot;Heading 1&quot; align=&quot;left&quot; style=&quot;margin: 4.17mm 0.50mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
423
424&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
425&lt;b&gt;&lt;span style=&quot;text-transform:uppercase&quot;&gt;Finding information &lt;/span&gt;&lt;/b&gt;
426&lt;/p&gt;&lt;/div&gt;
427
428
429
430&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
431
432&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
433Greenstone digital library systems generally include several separate collections. A home page allows you to select a collection; in addition, each collection has its own &amp;ldquo;about&amp;rdquo; page that gives you information about how the collection is organized and the principles governing what is included.
434&lt;/p&gt;&lt;/div&gt;
435
436
437
438&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
439
440&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
441All icons in the screenshots of Figures 1-4 are clickable. Those icons at the top of the page return to the home page, provide help text, and allow you to set user interface and searching preferences. The navigation bar underneath gives access to the searching and browsing facilities, which differ from one collection to another.
442&lt;/p&gt;&lt;/div&gt;
443
444
445
446&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
447
448&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
449Each of the five buttons provides a different way to find information. You can &lt;i&gt;search for particular words&lt;/i&gt; that appear in the text from the &amp;ldquo;search&amp;rdquo; page (or from the &amp;ldquo;about&amp;rdquo; page of Figure 1). This collection contains indexes of chapters, section titles, and entire books. The default search interface is a simple one, suitable for casual users; advanced searching&amp;mdash;which allows full Boolean expressions, phrase searching, case and stemming control&amp;mdash;can be enabled from the &lt;i&gt;Preferences&lt;/i&gt; page.
450&lt;/p&gt;&lt;/div&gt;
451
452
453
454&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
455
456&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
457This collection has four browsable metadata indexes. You can &lt;i&gt;access publications by subject&lt;/i&gt; by clicking the &lt;i&gt;subjects&lt;/i&gt; button, which brings up a list of subjects, represented by bookshelves (Figure 2). You can &lt;i&gt;access publications by title&lt;/i&gt; by clicking &lt;i&gt;titles a-z&lt;/i&gt; (Figure 4), which brings up a list of books in alphabetic order. You can &lt;i&gt;access publications by organization&lt;/i&gt; (i.e. Dublin Core &amp;ldquo;publisher&amp;rdquo;), bringing up a list of organizations. You can &lt;i&gt;access publications by &amp;ldquo;how to&amp;rdquo; listing&lt;/i&gt;, yielding a list of hints defined by the collection's editors. We use the Dublin Core as a base and extend it in an &lt;i&gt;ad hoc&lt;/i&gt; manner to accommodate the individual requirements of collection designers.
458&lt;/p&gt;&lt;/div&gt;
459
460
461
462&lt;p&gt;&lt;div name=&quot;Heading 1&quot; align=&quot;left&quot; style=&quot;margin: 4.17mm 0.50mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
463
464&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
465&lt;b&gt;&lt;span style=&quot;text-transform:uppercase&quot;&gt;Files in a collection&lt;/span&gt;&lt;/b&gt;
466&lt;/p&gt;&lt;/div&gt;
467
468
469
470&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
471
472&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
473When a new collection is created or material is added to an existing one, the original source documents are first brought into the system through a process known as &amp;ldquo;importing.&amp;rdquo; This involves converting documents into a simple HTML-like format known as GML (for &amp;ldquo;Greenstone Markup Language&amp;rdquo;), which includes any metadata associated with the document. Documents are assumed to be in the Unicode UTF-8 code (of which the ASCII characters form a subset).
474&lt;/p&gt;&lt;/div&gt;
475
476
477
478&lt;p&gt;&lt;div name=&quot;Heading 2&quot; align=&quot;left&quot; style=&quot;margin: 6.94mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
479
480&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
481&lt;b&gt;Files and directories&lt;/b&gt;
482&lt;/p&gt;&lt;/div&gt;
483
484
485
486&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
487
488&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
489There is a separate directory for each collection, which contains five subdirectories: the original raw material (&lt;i&gt;import&lt;/i&gt;), the GML files created from this (&lt;i&gt;archives&lt;/i&gt;), the final collection as it is served to users (&lt;i&gt;index&lt;/i&gt;), a directory for use during the building process (&lt;i&gt;building&lt;/i&gt;), and one for any supporting files (&lt;i&gt;etc&lt;/i&gt;)&amp;mdash;including the configuration file that controls the collection creation procedure. Additional files might be required: for example, building a hierarchy of classifications requires a data file of sub-classifications.
490&lt;/p&gt;&lt;/div&gt;
491
492
493
494&lt;p&gt;&lt;div name=&quot;Heading 2&quot; align=&quot;left&quot; style=&quot;margin: 6.94mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
495
496&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
497&lt;b&gt;The imported documents&lt;/b&gt;
498&lt;/p&gt;&lt;/div&gt;
499
500
501
502&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
503
504&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
505In order to identify documents internally, a unique object identifier or OID is assigned to each original source document when it is imported (formed by hashing the content, to overcome file duplication effects caused by mirroring) and stored as metadata within that document. It is important that OIDs persist throughout the index-building process&amp;mdash;so that a user's search history is unaffected by rebuilding the collection. Because OIDs are assigned by hashing the contents of the original source document, an unchanged document keeps the same OID each time the collection is rebuilt.
506&lt;/p&gt;&lt;/div&gt;
507
508
509
510&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
511
512&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
513Once imported, each document is stored in its own subdirectory of &lt;i&gt;archives&lt;/i&gt;, along with any associated files&amp;mdash;for example, images. To ensure compatibility with Windows 3.0, only eight characters are used in directory and file names, which causes annoying but essentially trivial complications.
514&lt;/p&gt;&lt;/div&gt;
515
516
517
518&lt;p&gt;&lt;div name=&quot;Heading 2&quot; align=&quot;left&quot; style=&quot;margin: 6.94mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
519
520&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
521&lt;b&gt;Inside the documents&lt;/b&gt;
522&lt;/p&gt;&lt;/div&gt;
523
524
525
526&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
527
528&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
529The GML format imposes a limited amount of structure on documents. Documents are divided into paragraphs. They can be split hierarchically into sections and subsections. OIDs are extended to identify these components by appending numbers, separated by periods, to a document's OID. When a book is read, its section hierarchy is visible as the table of contents (Figure 3). Chapters, sections, subsections, and pages are all implemented simply as &amp;ldquo;sections&amp;rdquo; within the document. In some collections documents do not have a hierarchical subsection structure, but are split into pages to permit browsing within a retrieved document.
530&lt;/p&gt;&lt;/div&gt;
531
532
533
534&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
535
536&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
537The document structure is used for searchable indexes. There are three levels of index: &lt;i&gt;documents&lt;/i&gt;, &lt;i&gt;sections&lt;/i&gt;, and &lt;i&gt;paragraphs&lt;/i&gt;, corresponding to the distinctions that GML makes&amp;mdash;the hierarchical structure is flattened for the purposes of creating these indexes. Indexes can be of text, or metadata, or any combination. Thus you can create a searchable index of section titles, and/or authors, and/or document descriptions, as well as the document text.
538&lt;/p&gt;&lt;/div&gt;
539
540
541
542&lt;p&gt;&lt;div name=&quot;Caption&quot; align=&quot;center&quot; style=&quot;margin: 2.08mm 2.74mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
543
544&lt;p style=&quot;text-indent: 0.00mm; text-align: center; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
545&lt;img width=&quot;698&quot; height=&quot;698&quot; alt=&quot;0x01 graphic&quot; src=&quot;_httpdocimg_/greenstone013.png&quot;&gt;&lt;br&gt;
546&lt;/p&gt;&lt;/div&gt;
547
548
549
550&lt;p&gt;&lt;div name=&quot;Caption&quot; align=&quot;center&quot; style=&quot;margin: 2.08mm 2.74mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
551
552&lt;p style=&quot;text-indent: 0.00mm; text-align: center; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
553&lt;b&gt;Figure 4&lt;/b&gt;&lt;b&gt;: Browsing titles in the HDL&lt;/b&gt;&lt;b&gt;&lt;/b&gt;
554&lt;/p&gt;&lt;/div&gt;
555
556
557
558&lt;p&gt;&lt;div name=&quot;Heading 1&quot; align=&quot;left&quot; style=&quot;margin: 4.17mm 0.50mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
559
560&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
561&lt;b&gt;&lt;span style=&quot;text-transform:uppercase&quot;&gt;Updating existing collections&lt;/span&gt;&lt;/b&gt;
562&lt;/p&gt;&lt;/div&gt;
563
564
565
566&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
567
568&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
569Updating an existing collection with new files in the same format is easy. For example, the raw material for the HDL is supplied in the form of HTML files marked up with &amp;lt;&amp;lt;TOC&amp;gt;&amp;gt; tags to split books into sections and subsections, and &amp;lt;&amp;lt;I&amp;gt;&amp;gt; tags to indicate where an image is to be inserted. For each book in the library there is a directory that contains a single HTML file representing the book, and separate files containing the associated images. An accompanying spreadsheet file contains the classification hierarchy; this is converted to a simple file format (using Excel's &lt;i&gt;Save As&lt;/i&gt; command).
570&lt;/p&gt;&lt;/div&gt;
571
572
573
574&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
575
576&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
577Since the collection exists, its directory is already set up with subdirectories &lt;i&gt;import&lt;/i&gt;, &lt;i&gt;archives&lt;/i&gt;, &lt;i&gt;building&lt;/i&gt;, &lt;i&gt;index&lt;/i&gt;, and &lt;i&gt;etc&lt;/i&gt;, and the &lt;i&gt;etc&lt;/i&gt; directory will contain a suitable collection configuration file.
578&lt;/p&gt;&lt;/div&gt;
579
580
581
582&lt;p&gt;&lt;div name=&quot;Heading 2&quot; align=&quot;left&quot; style=&quot;margin: 6.94mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
583
584&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
585&lt;b&gt;The updating procedure&lt;/b&gt;
586&lt;/p&gt;&lt;/div&gt;
587
588
589
590&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
591
592&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
593To update a collection, the new raw material is placed in the &lt;i&gt;import&lt;/i&gt; directory, in whatever form it is available. Then the &lt;i&gt;import&lt;/i&gt; process is invoked, which converts the files into GML using the specified plugins. Old material for which GML files have previously been created is not re-imported. Then the &lt;i&gt;build&lt;/i&gt; process is invoked to build the requisite indexes for the collection. Finally, the contents of the &lt;i&gt;building&lt;/i&gt; directory are moved into the &lt;i&gt;index&lt;/i&gt; directory, and the new version of the collection automatically becomes live.
594&lt;/p&gt;&lt;/div&gt;
595
596
597
598&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
599
600&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
601This procedure may seem cumbersome. But all the steps are necessary for efficient operation with large collections. The &lt;i&gt;import&lt;/i&gt; process could be performed on the fly during the building operation&amp;mdash;but because building indexes is a multipass operation, the often lengthy importing would be repeated several times. The &lt;i&gt;build&lt;/i&gt; process can take considerable time&amp;mdash;a day or two, for very large collections. Consequently, the results are placed in the &lt;i&gt;building&lt;/i&gt; directory so that, if the collection already exists, it will continue to be served to users in its old form throughout the building operation.
602&lt;/p&gt;&lt;/div&gt;
603
604
605
606&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
607
608&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
609Active users of the collection will not be disturbed when the new version becomes live&amp;mdash;they will probably not even notice. The persistent OIDs ensure that interactions remain coherent&amp;mdash;users who are examining the results of a query or browse operation will still retrieve the expected documents&amp;mdash;and if a search is actually in progress when the change takes place, the program detects the resulting file-structure inconsistency and automatically and transparently re-executes the query, this time on the new version of the collection.
610&lt;/p&gt;&lt;/div&gt;
611
612
613
614&lt;p&gt;&lt;div name=&quot;Heading 2&quot; align=&quot;left&quot; style=&quot;margin: 6.94mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
615
616&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
617&lt;b&gt;How it works&lt;/b&gt;
618&lt;/p&gt;&lt;/div&gt;
619
620
621
622&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
623
624&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
625The original material in the &lt;i&gt;import&lt;/i&gt; directory may be in any format, and plugins are required to process each format type. The plugins that a collection uses must be specified in the collection configuration file. The &lt;i&gt;import&lt;/i&gt; program reads the list of plugins and passes each document to each plugin in order until it finds one that can process it. When updating an existing collection, all plugins necessary to process new material should already have been specified in the configuration file.
626&lt;/p&gt;&lt;/div&gt;
627
628
629
630&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
631
632&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
633The building step creates the indexes for both searching and browsing. The MG software is generally used to do the searching (Witten &lt;i&gt;et al.&lt;/i&gt;, 1999), and the &lt;i&gt;mgbuild&lt;/i&gt; module is automatically invoked to create each of the indexes that is required. For example, the Humanity Development Library has three indexes, one for entire books, one for chapters, and one for section titles. Subdirectories of the &lt;i&gt;index&lt;/i&gt; directory are created for each of these indexes.
634&lt;/p&gt;&lt;/div&gt;
635
636
637&lt;table width=&quot;92.93%25&quot; border=&quot;1&quot; cols=&quot;4&quot; rows=&quot;12&quot;&gt;
638&lt;tr&gt;&lt;td bgcolor=&quot;White&quot; width=&quot;6.36%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
639
640&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
641
642&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
643
644
645
646&lt;td bgcolor=&quot;White&quot; width=&quot;19.69%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
647
648&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
649creator
650&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
651
652
653
654&lt;td bgcolor=&quot;White&quot; width=&quot;64.87%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
655
656&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
657davidb@cs.waikato.ac.nz
658&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
659
660
661
662&lt;td bgcolor=&quot;White&quot; width=&quot;9.08%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
663
664&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
6651
666&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
667
668&lt;/tr&gt;
669
670
671
672&lt;tr&gt;&lt;td bgcolor=&quot;White&quot; width=&quot;6.36%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
673
674&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
675
676&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
677
678
679
680&lt;td bgcolor=&quot;White&quot; width=&quot;19.69%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
681
682&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
683maintainer
684&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
685
686
687
688&lt;td bgcolor=&quot;White&quot; width=&quot;64.87%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
689
690&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
691davidb@cs.waikato.ac.nz
692&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
693
694
695
696&lt;td bgcolor=&quot;White&quot; width=&quot;9.08%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
697
698&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
6992
700&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
701
702&lt;/tr&gt;
703
704
705
706&lt;tr&gt;&lt;td bgcolor=&quot;White&quot; width=&quot;6.36%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
707
708&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
709
710&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
711
712
713
714&lt;td bgcolor=&quot;White&quot; width=&quot;19.69%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
715
716&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
717public
718&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
719
720
721
722&lt;td bgcolor=&quot;White&quot; width=&quot;64.87%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
723
724&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
725True
726&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
727
728
729
730&lt;td bgcolor=&quot;White&quot; width=&quot;9.08%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
731
732&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
7333
734&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
735
736&lt;/tr&gt;
737
738
739
740&lt;tr&gt;&lt;td bgcolor=&quot;White&quot; width=&quot;6.36%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
741
742&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
743
744&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
745
746
747
748&lt;td bgcolor=&quot;White&quot; width=&quot;19.69%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
749
750&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
751
752&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
753
754
755
756&lt;td bgcolor=&quot;White&quot; width=&quot;64.87%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
757
758&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
759
760&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
761
762
763
764&lt;td bgcolor=&quot;White&quot; width=&quot;9.08%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
765
766&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
7674
768&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
769
770&lt;/tr&gt;
771
772
773
774&lt;tr&gt;&lt;td bgcolor=&quot;White&quot; width=&quot;6.36%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
775
776&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
777
778&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
779
780
781
782&lt;td bgcolor=&quot;White&quot; width=&quot;19.69%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
783
784&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
785indexes
786&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
787
788
789
790&lt;td bgcolor=&quot;White&quot; width=&quot;64.87%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
791
792&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
793document:text
794&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
795
796
797
798&lt;td bgcolor=&quot;White&quot; width=&quot;9.08%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
799
800&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
8015
802&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
803
804&lt;/tr&gt;
805
806
807
808&lt;tr&gt;&lt;td bgcolor=&quot;White&quot; width=&quot;6.36%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
809
810&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
811
812&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
813
814
815
816&lt;td bgcolor=&quot;White&quot; width=&quot;19.69%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
817
818&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
819defaultindex
820&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
821
822
823
824&lt;td bgcolor=&quot;White&quot; width=&quot;64.87%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
825
826&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
827document:text
828&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
829
830
831
832&lt;td bgcolor=&quot;White&quot; width=&quot;9.08%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
833
834&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
8356
836&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
837
838&lt;/tr&gt;
839
840
841
842&lt;tr&gt;&lt;td bgcolor=&quot;White&quot; width=&quot;6.36%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
843
844&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
845
846&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
847
848
849
850&lt;td bgcolor=&quot;White&quot; width=&quot;19.69%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
851
852&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
853plugins
854&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
855
856
857
858&lt;td bgcolor=&quot;White&quot; width=&quot;64.87%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
859
860&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
861GMLPlug TEXTPlug ArcPlug RecPlug
862&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
863
864
865
866&lt;td bgcolor=&quot;White&quot; width=&quot;9.08%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
867
868&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
8697
870&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
871
872&lt;/tr&gt;
873
874
875
876&lt;tr&gt;&lt;td bgcolor=&quot;White&quot; width=&quot;6.36%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
877
878&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
879
880&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
881
882
883
884&lt;td bgcolor=&quot;White&quot; width=&quot;19.69%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
885
886&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
887
888&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
889
890
891
892&lt;td bgcolor=&quot;White&quot; width=&quot;64.87%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
893
894&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
895
896&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
897
898
899
900&lt;td bgcolor=&quot;White&quot; width=&quot;9.08%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
901
902&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
9038
904&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
905
906&lt;/tr&gt;
907
908
909
910&lt;tr&gt;&lt;td bgcolor=&quot;White&quot; width=&quot;6.36%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
911
912&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
913
914&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
915
916
917
918&lt;td bgcolor=&quot;White&quot; width=&quot;19.69%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
919
920&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
921classify
922&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
923
924
925
926&lt;td bgcolor=&quot;White&quot; width=&quot;64.87%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
927
928&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
929AZList metadata=Title
930&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
931
932
933
934&lt;td bgcolor=&quot;White&quot; width=&quot;9.08%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
935
936&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
9379
938&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
939
940&lt;/tr&gt;
941
942
943
944&lt;tr&gt;&lt;td bgcolor=&quot;White&quot; width=&quot;6.36%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
945
946&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
947
948&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
949
950
951
952&lt;td bgcolor=&quot;White&quot; width=&quot;19.69%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
953
954&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
955
956&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
957
958
959
960&lt;td bgcolor=&quot;White&quot; width=&quot;64.87%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
961
962&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
963
964&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
965
966
967
968&lt;td bgcolor=&quot;White&quot; width=&quot;9.08%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
969
970&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
97110
972&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
973
974&lt;/tr&gt;
975
976
977
978&lt;tr&gt;&lt;td bgcolor=&quot;White&quot; width=&quot;6.36%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
979
980&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
981
982&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
983
984
985
986&lt;td bgcolor=&quot;White&quot; width=&quot;19.69%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
987
988&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
989collectionmeta
990&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
991
992
993
994&lt;td bgcolor=&quot;White&quot; width=&quot;64.87%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
995
996&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
997collectionname    &amp;quot;generic text collection&amp;quot;
998&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
999
1000
1001
1002&lt;td bgcolor=&quot;White&quot; width=&quot;9.08%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1003
1004&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
100511
1006&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1007
1008&lt;/tr&gt;
1009
1010
1011
1012&lt;tr&gt;&lt;td bgcolor=&quot;White&quot; width=&quot;6.36%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1013
1014&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1015(a)
1016&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1017
1018
1019
1020&lt;td bgcolor=&quot;White&quot; width=&quot;19.69%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1021
1022&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1023collectionmeta
1024&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1025
1026
1027
1028&lt;td bgcolor=&quot;White&quot; width=&quot;64.87%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1029
1030&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1031.document:text    &amp;quot;documents&amp;quot;
1032&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1033
1034
1035
1036&lt;td bgcolor=&quot;White&quot; width=&quot;9.08%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1037
1038&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
103912
1040&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1041
1042&lt;/tr&gt;
1043
1044&lt;/table&gt;
1045
1046&lt;p&gt;&lt;div name=&quot;label&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1047
1048&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1049
1050&lt;/p&gt;&lt;/div&gt;
1051
1052
1053&lt;table width=&quot;92.93%25&quot; border=&quot;1&quot; cols=&quot;4&quot; rows=&quot;17&quot;&gt;
1054&lt;tr&gt;&lt;td bgcolor=&quot;White&quot; width=&quot;6.36%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1055
1056&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1057
1058&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1059
1060
1061
1062&lt;td bgcolor=&quot;White&quot; width=&quot;19.69%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1063
1064&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1065creator
1066&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1067
1068
1069
1070&lt;td bgcolor=&quot;White&quot; width=&quot;64.87%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1071
1072&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1073davidb@cs.waikato.ac.nz
1074&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1075
1076
1077
1078&lt;td bgcolor=&quot;White&quot; width=&quot;9.08%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1079
1080&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
10811
1082&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1083
1084&lt;/tr&gt;
1085
1086
1087
1088&lt;tr&gt;&lt;td bgcolor=&quot;White&quot; width=&quot;6.36%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1089
1090&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1091
1092&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1093
1094
1095
1096&lt;td bgcolor=&quot;White&quot; width=&quot;19.69%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1097
1098&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1099maintainer
1100&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1101
1102
1103
1104&lt;td bgcolor=&quot;White&quot; width=&quot;64.87%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1105
1106&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1107davidb@cs.waikato.ac.nz
1108&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1109
1110
1111
1112&lt;td bgcolor=&quot;White&quot; width=&quot;9.08%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1113
1114&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
11152
1116&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1117
1118&lt;/tr&gt;
1119
1120
1121
1122&lt;tr&gt;&lt;td bgcolor=&quot;White&quot; width=&quot;6.36%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1123
1124&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1125
1126&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1127
1128
1129
1130&lt;td bgcolor=&quot;White&quot; width=&quot;19.69%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1131
1132&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1133public
1134&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1135
1136
1137
1138&lt;td bgcolor=&quot;White&quot; width=&quot;64.87%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1139
1140&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1141True
1142&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1143
1144
1145
1146&lt;td bgcolor=&quot;White&quot; width=&quot;9.08%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1147
1148&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
11493
1150&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1151
1152&lt;/tr&gt;
1153
1154
1155
1156&lt;tr&gt;&lt;td bgcolor=&quot;White&quot; width=&quot;6.36%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1157
1158&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1159
1160&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1161
1162
1163
1164&lt;td bgcolor=&quot;White&quot; width=&quot;19.69%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1165
1166&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1167
1168&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1169
1170
1171
1172&lt;td bgcolor=&quot;White&quot; width=&quot;64.87%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1173
1174&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1175
1176&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1177
1178
1179
1180&lt;td bgcolor=&quot;White&quot; width=&quot;9.08%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1181
1182&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
11834
1184&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1185
1186&lt;/tr&gt;
1187
1188
1189
1190&lt;tr&gt;&lt;td bgcolor=&quot;White&quot; width=&quot;6.36%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1191
1192&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1193
1194&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1195
1196
1197
1198&lt;td bgcolor=&quot;White&quot; width=&quot;19.69%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1199
1200&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1201indexes
1202&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1203
1204
1205
1206&lt;td bgcolor=&quot;White&quot; width=&quot;64.87%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1207
1208&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1209document:text document:From
1210&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1211
1212
1213
1214&lt;td bgcolor=&quot;White&quot; width=&quot;9.08%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1215
1216&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
12175
1218&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1219
1220&lt;/tr&gt;
1221
1222
1223
1224&lt;tr&gt;&lt;td bgcolor=&quot;White&quot; width=&quot;6.36%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1225
1226&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1227
1228&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1229
1230
1231
1232&lt;td bgcolor=&quot;White&quot; width=&quot;19.69%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1233
1234&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1235defaultindex
1236&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1237
1238
1239
1240&lt;td bgcolor=&quot;White&quot; width=&quot;64.87%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1241
1242&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1243document:text
1244&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1245
1246
1247
1248&lt;td bgcolor=&quot;White&quot; width=&quot;9.08%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1249
1250&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
12516
1252&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1253
1254&lt;/tr&gt;
1255
1256
1257
1258&lt;tr&gt;&lt;td bgcolor=&quot;White&quot; width=&quot;6.36%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1259
1260&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1261
1262&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1263
1264
1265
1266&lt;td bgcolor=&quot;White&quot; width=&quot;19.69%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1267
1268&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1269plugins
1270&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1271
1272
1273
1274&lt;td bgcolor=&quot;White&quot; width=&quot;64.87%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1275
1276&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1277GMLPlug EMAILPlug ArcPlug RecPlug
1278&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1279
1280
1281
1282&lt;td bgcolor=&quot;White&quot; width=&quot;9.08%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1283
1284&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
12857
1286&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1287
1288&lt;/tr&gt;
1289
1290
1291
1292&lt;tr&gt;&lt;td bgcolor=&quot;White&quot; width=&quot;6.36%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1293
1294&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1295
1296&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1297
1298
1299
1300&lt;td bgcolor=&quot;White&quot; width=&quot;19.69%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1301
1302&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1303
1304&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1305
1306
1307
1308&lt;td bgcolor=&quot;White&quot; width=&quot;64.87%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1309
1310&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1311
1312&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1313
1314
1315
1316&lt;td bgcolor=&quot;White&quot; width=&quot;9.08%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1317
1318&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
13198
1320&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1321
1322&lt;/tr&gt;
1323
1324
1325
1326&lt;tr&gt;&lt;td bgcolor=&quot;White&quot; width=&quot;6.36%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1327
1328&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1329
1330&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1331
1332
1333
1334&lt;td bgcolor=&quot;White&quot; width=&quot;19.69%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1335
1336&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1337classify
1338&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1339
1340
1341
1342&lt;td bgcolor=&quot;White&quot; width=&quot;64.87%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1343
1344&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1345AZList metadata=Title
1346&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1347
1348
1349
1350&lt;td bgcolor=&quot;White&quot; width=&quot;9.08%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1351
1352&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
13539
1354&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1355
1356&lt;/tr&gt;
1357
1358
1359
1360&lt;tr&gt;&lt;td bgcolor=&quot;White&quot; width=&quot;6.36%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1361
1362&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1363
1364&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1365
1366
1367
1368&lt;td bgcolor=&quot;White&quot; width=&quot;19.69%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1369
1370&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1371classify
1372&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1373
1374
1375
1376&lt;td bgcolor=&quot;White&quot; width=&quot;64.87%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1377
1378&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1379DateList
1380&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1381
1382
1383
1384&lt;td bgcolor=&quot;White&quot; width=&quot;9.08%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1385
1386&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
138710
1388&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1389
1390&lt;/tr&gt;
1391
1392
1393
1394&lt;tr&gt;&lt;td bgcolor=&quot;White&quot; width=&quot;6.36%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1395
1396&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1397
1398&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1399
1400
1401
1402&lt;td bgcolor=&quot;White&quot; width=&quot;19.69%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1403
1404&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1405
1406&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1407
1408
1409
1410&lt;td bgcolor=&quot;White&quot; width=&quot;64.87%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1411
1412&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1413
1414&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1415
1416
1417
1418&lt;td bgcolor=&quot;White&quot; width=&quot;9.08%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1419
1420&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
142111
1422&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1423
1424&lt;/tr&gt;
1425
1426
1427
1428&lt;tr&gt;&lt;td bgcolor=&quot;White&quot; width=&quot;6.36%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1429
1430&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1431
1432&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1433
1434
1435
1436&lt;td bgcolor=&quot;White&quot; width=&quot;19.69%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1437
1438&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1439collectionmeta
1440&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1441
1442
1443
1444&lt;td bgcolor=&quot;White&quot; width=&quot;64.87%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1445
1446&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1447collectionname    &amp;quot;Email messages&amp;quot;
1448&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1449
1450
1451
1452&lt;td bgcolor=&quot;White&quot; width=&quot;9.08%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1453
1454&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
145512
1456&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1457
1458&lt;/tr&gt;
1459
1460
1461
1462&lt;tr&gt;&lt;td bgcolor=&quot;White&quot; width=&quot;6.36%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1463
1464&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1465
1466&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1467
1468
1469
1470&lt;td bgcolor=&quot;White&quot; width=&quot;19.69%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1471
1472&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1473collectionmeta
1474&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1475
1476
1477
1478&lt;td bgcolor=&quot;White&quot; width=&quot;64.87%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1479
1480&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1481.document:text    &amp;quot;documents&amp;quot;
1482&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1483
1484
1485
1486&lt;td bgcolor=&quot;White&quot; width=&quot;9.08%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1487
1488&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
148913
1490&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1491
1492&lt;/tr&gt;
1493
1494
1495
1496&lt;tr&gt;&lt;td bgcolor=&quot;White&quot; width=&quot;6.36%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1497
1498&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1499
1500&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1501
1502
1503
1504&lt;td bgcolor=&quot;White&quot; width=&quot;19.69%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1505
1506&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1507collectionmeta
1508&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1509
1510
1511
1512&lt;td bgcolor=&quot;White&quot; width=&quot;64.87%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1513
1514&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1515.document:From    &amp;quot;email senders&amp;quot;
1516&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1517
1518
1519
1520&lt;td bgcolor=&quot;White&quot; width=&quot;9.08%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1521
1522&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
152314
1524&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1525
1526&lt;/tr&gt;
1527
1528
1529
1530&lt;tr&gt;&lt;td bgcolor=&quot;White&quot; width=&quot;6.36%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1531
1532&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1533
1534&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1535
1536
1537
1538&lt;td bgcolor=&quot;White&quot; width=&quot;19.69%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1539
1540&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1541
1542&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1543
1544
1545
1546&lt;td bgcolor=&quot;White&quot; width=&quot;64.87%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1547
1548&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1549
1550&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1551
1552
1553
1554&lt;td bgcolor=&quot;White&quot; width=&quot;9.08%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1555
1556&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
155715
1558&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1559
1560&lt;/tr&gt;
1561
1562
1563
1564&lt;tr&gt;&lt;td bgcolor=&quot;White&quot; width=&quot;6.36%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1565
1566&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1567
1568&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1569
1570
1571
1572&lt;td bgcolor=&quot;White&quot; width=&quot;19.69%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1573
1574&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1575format
1576&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1577
1578
1579
1580&lt;td bgcolor=&quot;White&quot; width=&quot;64.87%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1581
1582&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1583QueryResults /
1584&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1585
1586
1587
1588&lt;td bgcolor=&quot;White&quot; width=&quot;9.08%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1589
1590&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
159116
1592&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1593
1594&lt;/tr&gt;
1595
1596
1597
1598&lt;tr&gt;&lt;td bgcolor=&quot;White&quot; width=&quot;6.36%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1599
1600&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1601(b)
1602&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1603
1604
1605
1606&lt;td bgcolor=&quot;White&quot; width=&quot;19.69%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1607
1608&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1609
1610&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1611
1612
1613
1614&lt;td bgcolor=&quot;White&quot; width=&quot;64.87%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1615
1616&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1617&amp;lt;td&amp;gt;[link][icon][/link]&amp;lt;/td&amp;gt;&amp;lt;td&amp;gt;[Title]&amp;lt;/td&amp;gt;&amp;lt;td&amp;gt;[Author]&amp;lt;/td&amp;gt;
1618&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1619
1620
1621
1622&lt;td bgcolor=&quot;White&quot; width=&quot;9.08%25&quot; rowspan=&quot;1&quot; colspan=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1623
1624&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
162517
1626&lt;/p&gt;&lt;/div&gt;&lt;/td&gt;
1627
1628&lt;/tr&gt;
1629
1630&lt;/table&gt;
1631
1632&lt;p&gt;&lt;div name=&quot;label&quot; align=&quot;center&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1633
1634&lt;p style=&quot;text-indent: 0.00mm; text-align: center; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1635&lt;b&gt;Figure 5: Collection configuration files (a) generic, (b) for an email collection&lt;/b&gt;
1636&lt;/p&gt;&lt;/div&gt;
1637
1638
1639
1640&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1641
1642&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
1643MG also compresses the text of the collection; and the image files are linked into the &lt;i&gt;index&lt;/i&gt; subdirectory. Now none of the material in the &lt;i&gt;import&lt;/i&gt; and &lt;i&gt;archives&lt;/i&gt; directories is needed to run the collection and can be removed from the file system (though they would be needed if the collection were rebuilt).
1644&lt;/p&gt;&lt;/div&gt;
1645
1646
1647
1648&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1649
1650&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
1651Associated with each collection is a database stored in GDBM (Gnu database manager) format. This contains an entry for each document, giving its OID, its internal MG document number, and metadata such as title. Information for each of the browsing indexes, which appear as buttons on the Greenstone search/browse bar, is also extracted during the building process and stored in the database. A &amp;ldquo;classifier&amp;rdquo; program is required for each browsing index to extract the appropriate information from GML documents. Like plugins, classifiers are written on an &lt;i&gt;ad hoc&lt;/i&gt; basis for the particular information required, and where possible reused from one collection to another.
1652&lt;/p&gt;&lt;/div&gt;
1653
1654
1655
1656&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1657
1658&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
1659The building program creates the indexes based on whatever appears in the &lt;i&gt;archives&lt;/i&gt; directory. The first plugin specified by all collections is one that processes GML files, and so if &lt;i&gt;archives&lt;/i&gt; contains imported files they will be processed correctly. If it contains material in the original format, that will be converted using the appropriate plugin. Thus the import process is optional.
1660&lt;/p&gt;&lt;/div&gt;
1661
1662
1663
1664&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1665
1666&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
1667GML is designed to be fast and easy to parse, an important requirement when millions of documents are to be processed. Something as simple as requiring tags to be lower-case, for example, yields a substantial speed-up. In certain circumstances, however, it might be preferable to use a standardized format such as XML. This is straightforward to implement&amp;mdash;just write an XML plugin&amp;mdash;although we have not done so ourselves. Given the transitory nature of the imported data, to date, we have found GML a satisfactory and beneficial format.
1668&lt;/p&gt;&lt;/div&gt;
1669
1670
1671
1672&lt;p&gt;&lt;div name=&quot;Heading 1&quot; align=&quot;left&quot; style=&quot;margin: 4.17mm 0.50mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1673
1674&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1675&lt;b&gt;&lt;span style=&quot;text-transform:uppercase&quot;&gt;Creating new collections&lt;/span&gt;&lt;/b&gt;
1676&lt;/p&gt;&lt;/div&gt;
1677
1678
1679
1680&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1681
1682&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
1683Building new collections from scratch is only slightly different from updating an existing collection. The key new requirement is creating a collection configuration file, and a software utility is provided to help. Two pieces of information are required for this: the name of the directory that the collection will use (into which the source data and other files will eventually be placed), and a contact e-mail address for use if any problems are encountered by the software once the collection is up and running. The utility creates files and directories within the newly-named directory to support a generic collection of plain text documents. With suitable data placed in the &lt;i&gt;import&lt;/i&gt; directory, building the collection at this point will yield a document-level searchable index of all the text and a browsable list of &amp;ldquo;titles&amp;rdquo; (defined in this case to be the document filenames).
1684&lt;/p&gt;&lt;/div&gt;
1685
1686
1687
1688&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1689
1690&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
1691To enhance the functionality and presentation&amp;mdash;something anything but the most trivial collection will require&amp;mdash;the configuration file must be edited. For a collection sourced from documents in an already supported data format, presented in a similar fashion to an existing collection, the amount of editing is minimal. Importing new data formats and browsing metadata in ways not currently supported are more complex activities that require programming skills.
1692&lt;/p&gt;&lt;/div&gt;
1693
1694
1695
1696&lt;p&gt;&lt;div name=&quot;Caption&quot; align=&quot;center&quot; style=&quot;margin: 2.08mm 2.74mm 0.00mm 17.26mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1697
1698&lt;p style=&quot;text-indent: -17.26mm; text-align: center; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1699&lt;img width=&quot;698&quot; height=&quot;698&quot; alt=&quot;0x01 graphic&quot; src=&quot;_httpdocimg_/greenstone014.png&quot;&gt;&lt;br&gt;
1700&lt;/p&gt;&lt;/div&gt;
1701
1702
1703
1704&lt;p&gt;&lt;div name=&quot;Caption&quot; align=&quot;center&quot; style=&quot;margin: 2.08mm 2.74mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1705
1706&lt;p style=&quot;text-indent: 0.00mm; text-align: center; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1707&lt;b&gt;Figure 6&lt;/b&gt;&lt;b&gt;: Searching bookmarked Web pages&lt;/b&gt;&lt;b&gt;&lt;i&gt;&lt;/i&gt;&lt;/b&gt;
1708&lt;/p&gt;&lt;/div&gt;
1709
1710
1711
1712&lt;p&gt;&lt;div name=&quot;Heading 2&quot; align=&quot;left&quot; style=&quot;margin: 6.94mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1713
1714&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1715&lt;b&gt;Modifying the configuration file&lt;/b&gt;
1716&lt;/p&gt;&lt;/div&gt;
1717
1718
1719
1720&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1721
1722&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
1723Figure 5b shows simple alterations to the generic configuration file in Figure 5a that was generated by the new-collection utility. &lt;i&gt;TEXTPlug&lt;/i&gt; is replaced with &lt;i&gt;EMAILPlug&lt;/i&gt; (line 7) which reads email files and extracts metadata (&lt;i&gt;From&lt;/i&gt;, &lt;i&gt;To&lt;/i&gt;, &lt;i&gt;Date&lt;/i&gt;, &lt;i&gt;Subject&lt;/i&gt;) from them. A classifier for dates is added (line 10) to make the collection browsable chronologically. The default presentation of search results is overridden (line 17) to display both the title of the message (i.e. Dublin Core &lt;i&gt;Title&lt;/i&gt;) and its sender (i.e. Dublin Core &lt;i&gt;Author&lt;/i&gt;). Elements in square brackets, such as &lt;i&gt;[Title]&lt;/i&gt;, are replaced by the metadata associated with a particular document. The built-in term &lt;i&gt;[icon]&lt;/i&gt; produces a suitable image that represents the document (such as a book icon or page icon), and the &lt;i&gt;[link]&amp;hellip;[/link]&lt;/i&gt; construct forms a hyperlink to the complete document. Anything else in the format statement, which in this case is solely table-cell tags in HTML, is passed through to the page being displayed.
1724&lt;/p&gt;&lt;/div&gt;
1725
1726
1727
1728&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1729
1730&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
1731As this example shows, creating a new collection that stays within the bounds of the library's established capabilities falls within the capability of many computer users&amp;mdash;for instance, computer-trained librarians. Extending Greenstone to handle new document formats and browse metadata in new ways is more challenging.
1732&lt;/p&gt;&lt;/div&gt;
1733
1734
1735
1736&lt;p&gt;&lt;div name=&quot;Heading 2&quot; align=&quot;left&quot; style=&quot;margin: 6.94mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1737
1738&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1739&lt;b&gt;Writing new plugins and classifiers&lt;/b&gt;
1740&lt;/p&gt;&lt;/div&gt;
1741
1742
1743
1744&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1745
1746&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
1747Extensibility is obtained through plugins and classifiers.
1748&lt;/p&gt;&lt;/div&gt;
1749
1750
1751
1752&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1753
1754&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
1755These are modules of code that can be slotted into the system to enhance its capabilities. Plugins parse documents, extracting the text and metadata to be indexed. Classifiers control how metadata is brought together to form browsable data structures. Both are specified in an object-oriented framework using inheritance to minimize the amount of code written.
1756&lt;/p&gt;&lt;/div&gt;
1757
1758
1759
1760&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1761
1762&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
1763A plugin must specify three things: what file formats it can handle, how they should be parsed, and whether the plugin is recursive. File formats are normally determined using regular expression matching on the filename. For example, the HTML plugin accepts all files that end in &lt;i&gt;.htm&lt;/i&gt;, &lt;i&gt;.html&lt;/i&gt;, &lt;i&gt;.HTM&lt;/i&gt;, or &lt;i&gt;.HTML&lt;/i&gt;. (It is quite possible, however, to write plugins that &amp;ldquo;look inside&amp;rdquo; the file as well.) For other files, the plugin returns &lt;i&gt;undefined&lt;/i&gt; and the file is passed to the next plugin in the collection's configuration file (e.g. Figure 5 line 7). If it can, the plugin parses the file and returns the number of documents processed. This involves extracting text and metadata and adding it to the library's content through calls to &lt;i&gt;add text&lt;/i&gt; and &lt;i&gt;add metadata&lt;/i&gt;.
1764&lt;/p&gt;&lt;/div&gt;
1765
1766
1767
1768&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1769
1770&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
1771Some plugins (&amp;ldquo;recursive&amp;rdquo; ones) add extra files into the stream of data processed during the building phase by artificially reactivating the list of plugins. This is how directory hierarchies are traversed.
1772&lt;/p&gt;&lt;/div&gt;
1773
1774
1775
1776&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1777
1778&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
1779Plugins are small modules of code that are easy to write. We monitored the time it took to develop a new one that was different to any we had produced so far. We chose to make as an example a collection of HTML bookmark files, the motivation being to produce a convenient way of searching and browsing one's bookmarked Web pages. Figure 6 shows a user searching for bookmarked pages about &lt;i&gt;music&lt;/i&gt;. The new plugin took under an hour to write, and was 160 lines long (ignoring blank lines and comments)&amp;mdash;about the average length of existing plugins.
1780&lt;/p&gt;&lt;/div&gt;
1781
1782
1783
1784&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1785
1786&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
1787Classifiers are more general than plugins because they work on GML-format data. For example, any plugin that generates date metadata in accordance with the Dublin Core can request the collection to be browsable chronologically by specifying the &lt;i&gt;DateList&lt;/i&gt; classifier in the collection's configuration file (Figure 7). Classifiers are more elaborate than most plugins, but new ones are seldom required. The average length of existing classifiers is 230 lines.
1788&lt;/p&gt;&lt;/div&gt;
1789
1790
1791
1792&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1793
1794&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
1795Classifiers must specify three things: an initialization routine, how individual documents are classified, and the final browsable data structure. Initialization takes care of any options specified in the configuration file (such as &lt;i&gt;metadata=Title &lt;/i&gt;on line 9 of Figure 5b). Classifying individual documents is an iterative process: for each one, a call to &lt;i&gt;document-classify&lt;/i&gt; is made. On presentation of the document's OID, the necessary metadata is located and used to control where the document is added to the browsable data structure being constructed.
1796&lt;/p&gt;&lt;/div&gt;
1797
1798
1799
1800&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1801
1802&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
1803Once all documents have been added, a request is made for the completed data structure. Some classifiers return the data structure directly; others transform the data structure before it is returned. For example, the &lt;i&gt;AZList&lt;/i&gt; classifier divides the alphabetically sorted list of metadata into separate pages of about the same size and returns the alphabetic ranges for each one (Figure 4).
1804&lt;/p&gt;&lt;/div&gt;
1805
1806
1807
1808&lt;p&gt;&lt;div name=&quot;Caption&quot; align=&quot;center&quot; style=&quot;margin: 2.08mm 2.74mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1809
1810&lt;p style=&quot;text-indent: 0.00mm; text-align: center; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1811&lt;img width=&quot;698&quot; height=&quot;698&quot; alt=&quot;0x01 graphic&quot; src=&quot;_httpdocimg_/greenstone015.png&quot;&gt;&lt;br&gt;
1812&lt;/p&gt;&lt;/div&gt;
1813
1814
1815
1816&lt;p&gt;&lt;div name=&quot;Caption&quot; align=&quot;center&quot; style=&quot;margin: 2.08mm 2.74mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1817
1818&lt;p style=&quot;text-indent: 0.00mm; text-align: center; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1819&lt;b&gt;Figure 7&lt;/b&gt;&lt;b&gt;: Browsing a newspaper collection by date&lt;/b&gt;&lt;b&gt;&lt;/b&gt;
1820&lt;/p&gt;&lt;/div&gt;
1821
1822
1823
1824&lt;p&gt;&lt;div name=&quot;Heading 1&quot; align=&quot;left&quot; style=&quot;margin: 4.17mm 0.50mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1825
1826&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1827&lt;b&gt;&lt;span style=&quot;text-transform:uppercase&quot;&gt;Overview of related work&lt;/span&gt;&lt;/b&gt;
1828&lt;/p&gt;&lt;/div&gt;
1829
1830
1831
1832&lt;p&gt;&lt;div name=&quot;Plain Text&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.24mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1833
1834&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1835Two projects that provide substantial open source digital library software are Dienst (Lagoze and Fielding, 1998) and Harvest (Bowman &lt;i&gt;et al.&lt;/i&gt;, 1994). The origins of Dienst (&lt;i&gt;www.cs.cornell.edu/cdlrg&lt;/i&gt;) stretch back to 1992. The term has come to represent three entities: a conceptual architecture for distributed digital libraries; an open protocol for service communication; and a software system that implements the protocol. To date, five sample digital libraries have been built using this technology. They manifest themselves in two forms: technical reports and primary source documents.
1836&lt;/p&gt;&lt;/div&gt;
1837
1838
1839
1840&lt;p&gt;&lt;div name=&quot;Plain Text&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.24mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1841
1842&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1843Best known is NCSTRL, the Networked Computer Science Technical Reference Library project (&lt;i&gt;www.ncstrl.org&lt;/i&gt;). This collection facilitates searching by title, author and abstract, and browsing by year and author, across a distributed network of document repositories. Documents can (where supported) be delivered in various formats such as PostScript, a thumbnail overview of the pages, and a GIF image of a particular page.
1844&lt;/p&gt;&lt;/div&gt;
1845
1846
1847
1848&lt;p&gt;&lt;div name=&quot;Plain Text&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.24mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1849
1850&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1851The &lt;i&gt;Making of America&lt;/i&gt; resource is an example of a collection based around primary sources&amp;mdash;in this case American social history, 1830−1900. It has a different &amp;ldquo;look and feel&amp;rdquo; to NCSTRL, being strongly oriented toward browsing rather than searching. A user navigates their way through a hierarchical structure of hyperlinks to reach a book of interest. The book itself is a series of scanned images: delivery options include going directly to a page number, next and previous page buttons, and displaying a particular page at different resolutions. A text version of the page is also available upon which a searching option is also provided.
1852&lt;/p&gt;&lt;/div&gt;
1853
1854
1855
1856&lt;p&gt;&lt;div name=&quot;Plain Text&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1857
1858&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1859Started in 1994, Harvest is also a long-running research project. It provides an efficient means of gathering source data from the Internet and distributing indexing information over the Internet. This is accomplished through five components: &lt;i&gt;gatherer&lt;/i&gt;, &lt;i&gt;broker&lt;/i&gt;, &lt;i&gt;indexer&lt;/i&gt;, &lt;i&gt;replicator&lt;/i&gt; and &lt;i&gt;cache&lt;/i&gt;. The first three are central to creating, updating and searching a collection; the last two help to improve performance over the Internet through transparent mirroring and caching techniques.
1860&lt;/p&gt;&lt;/div&gt;
1861
1862
1863
1864&lt;p&gt;&lt;div name=&quot;Plain Text&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.24mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1865
1866&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1867The system is configurable and customizable. While searching is most commonly implemented using Glimpse (&lt;i&gt;glimpse.cs.arizona.edu&lt;/i&gt;), in principle any search engine that supports incremental updates and Boolean combinations of attribute-based queries can be used. It is possible to control what type of documents are gathered during creation and updating, and how the query interface looks and is laid out.
1868&lt;/p&gt;&lt;/div&gt;
1869
1870
1871
1872&lt;p&gt;&lt;div name=&quot;Plain Text&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.24mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1873
1874&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1875Sample collections cited by the developers include 21,000 computer science technical reports and 7,000 home pages. Other examples include a sizable collection of agriculture-related electronic journals and magazines called &amp;ldquo;tomato-juice&amp;rdquo; (accessed through &lt;i&gt;hegel.lib.ncsu.edu&lt;/i&gt;) and a full-text index of library-related electronic serials (&lt;i&gt;sunsite.berkeley.edu/IndexMorganagus&lt;/i&gt;). Harvest is also often used to index Web sites (for example &lt;i&gt;www.middlebury.edu&lt;/i&gt;).
1876&lt;/p&gt;&lt;/div&gt;
1877
1878
1879
1880&lt;p&gt;&lt;div name=&quot;Plain Text&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.24mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1881
1882&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1883Comparing Greenstone with Dienst and Harvest, there are both similarities and differences. All provide substantial digital library systems, hence common themes recur, but they are driven by projects with different aims. Harvest, for instance, was not conceived as a digital library project at all, but by virtue of its selective document gathering process it can be classed (and is used) as one. While it provides sophisticated search options, it lacks the complementary service of browsing. Furthermore it adds no structure or order to the documents collected, relying on whatever structures are present in the site that they were gathered from. A proven strength of the design is its flexibility through configuration and customization&amp;mdash;an element also present in Greenstone.
1884&lt;/p&gt;&lt;/div&gt;
1885
1886
1887
1888&lt;p&gt;&lt;div name=&quot;Plain Text&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.24mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1889
1890&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1891Dienst&amp;mdash;best exemplified through the NCSTRL work&amp;mdash;supports searching and browsing, like Greenstone. Both use open protocols. Differences include a high reliance in Dienst on user-supplied information when a document is added, and a smaller range of document types supported&amp;mdash;although Dienst does include a document model that should, over time, allow this to expand with relative ease.
1892&lt;/p&gt;&lt;/div&gt;
1893
1894
1895
1896&lt;p&gt;&lt;div name=&quot;Plain Text&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.24mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1897
1898&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1899There are also commercial systems that provide similar digital library services to those described. However, since corporate culture instills proprietary attitudes there is little opportunity for advancement through a shared collaborative effort. Consequently they are not reviewed here.
1900&lt;/p&gt;&lt;/div&gt;
1901
1902
1903
1904&lt;p&gt;&lt;div name=&quot;Heading 1&quot; align=&quot;left&quot; style=&quot;margin: 4.17mm 0.50mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1905
1906&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1907&lt;b&gt;&lt;span style=&quot;text-transform:uppercase&quot;&gt;Conclusions&lt;/span&gt;&lt;/b&gt;
1908&lt;/p&gt;&lt;/div&gt;
1909
1910
1911
1912&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1913
1914&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
1915Greenstone is a comprehensive software system for creating digital library collections. It builds data structures for searching and browsing from the material provided, rather than relying on any hand-crafting. The process is controlled by a configuration file, and once a collection exists new material can be added completely automatically. Browsing is based on Dublin Core metadata.
1916&lt;/p&gt;&lt;/div&gt;
1917
1918
1919
1920&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1921
1922&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
1923New collections can be developed easily, particularly if they resemble existing ones. Extensibility is achieved through software &amp;ldquo;plugins&amp;rdquo; that can be written to accommodate documents, and metadata, in different formats. Standard plugins exist for many document types; new ones are easily written. Browsing is controlled by &amp;ldquo;classifiers&amp;rdquo; that process metadata into browsing structures (by date, alphabetical, hierarchical, etc).
1924&lt;/p&gt;&lt;/div&gt;
1925
1926
1927
1928&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1929
1930&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
1931However, the most powerful support for extensibility is achieved not by technical means but by making the source code freely available under the Gnu public license. Only through an international cooperative effort will digital library software become sufficiently comprehensive to meet the world's needs with the richness and flexibility that users deserve.
1932&lt;/p&gt;&lt;/div&gt;
1933
1934
1935
1936&lt;p&gt;&lt;div name=&quot;Heading 1&quot; align=&quot;left&quot; style=&quot;margin: 4.17mm 0.50mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1937
1938&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1939&lt;b&gt;&lt;span style=&quot;text-transform:uppercase&quot;&gt;Acknowledgments&lt;/span&gt;&lt;/b&gt;
1940&lt;/p&gt;&lt;/div&gt;
1941
1942
1943
1944&lt;p&gt;&lt;div name=&quot;paragraph&quot; align=&quot;justify&quot; style=&quot;margin: 2.08mm 0.00mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1945
1946&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 3.819444mm; color: Black; background-color: White; &quot;&gt;
1947We gratefully acknowledge all those who have worked on the Greenstone software, and all members of the New Zealand Digital Library project for their enthusiasm and ideas.
1948&lt;/p&gt;&lt;/div&gt;
1949
1950
1951
1952&lt;p&gt;&lt;div name=&quot;Heading 1&quot; align=&quot;left&quot; style=&quot;margin: 0.00mm 0.49mm 0.00mm 0.00mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1953
1954&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1955&lt;b&gt;&lt;span style=&quot;text-transform:uppercase&quot;&gt;References&lt;/span&gt;&lt;/b&gt;
1956&lt;/p&gt;&lt;/div&gt;
1957
1958
1959
1960&lt;ol type=&quot;1&quot;&gt;
1961&lt;li value=&quot;1&quot;&gt;&lt;p&gt;&lt;div name=&quot;References&quot; align=&quot;justify&quot; style=&quot;margin: 1.04mm 0.00mm 0.00mm 6.25mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1962
1963&lt;p style=&quot;text-indent: -6.25mm; text-align: justify; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1964Akscyn, R.M. and Witten, I.H. (1998) &amp;ldquo;Report on First Summit on International Cooperation on Digital Libraries.&amp;rdquo; ks.com/idla-wp-oct98.
1965&lt;/p&gt;&lt;/div&gt;&lt;/li&gt;
1966
1967
1968
1969&lt;li value=&quot;2&quot;&gt;&lt;p&gt;&lt;div name=&quot;References&quot; align=&quot;justify&quot; style=&quot;margin: 1.04mm 0.00mm 0.00mm 6.25mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1970
1971&lt;p style=&quot;text-indent: -6.25mm; text-align: justify; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1972Bowman, C.M., Danzig, P.B., Manber, U., and Schwartz, M.F. &amp;ldquo;Scalable Internet resource discovery: Research problems and approaches&amp;rdquo; &lt;i&gt;Communications of the ACM,&lt;/i&gt; Vol. 37, No. 8, pp. 98−107, 1994.
1973&lt;/p&gt;&lt;/div&gt;&lt;/li&gt;
1974
1975
1976
1977&lt;li value=&quot;3&quot;&gt;&lt;p&gt;&lt;div name=&quot;References&quot; align=&quot;left&quot; style=&quot;margin: 1.04mm 0.00mm 0.00mm 6.25mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1978
1979&lt;p style=&quot;text-indent: -6.25mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1980Fox, E. (1998) &amp;ldquo;Digital library definitions.&amp;rdquo; ei.cs.vt.edu/~fox/dlib/def.html.
1981&lt;/p&gt;&lt;/div&gt;&lt;/li&gt;
1982
1983
1984
1985&lt;li value=&quot;4&quot;&gt;&lt;p&gt;&lt;div name=&quot;References&quot; align=&quot;left&quot; style=&quot;margin: 1.04mm 0.00mm 0.00mm 6.25mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1986
1987&lt;p style=&quot;text-indent: -6.25mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1988Humanity Libraries (1998) &lt;i&gt;Humanity Development Library&lt;/i&gt;. CD-ROM produced by the Global Help Project, Antwerp, Belgium.
1989&lt;/p&gt;&lt;/div&gt;&lt;/li&gt;
1990
1991
1992
1993&lt;li value=&quot;5&quot;&gt;&lt;p&gt;&lt;div name=&quot;References&quot; align=&quot;left&quot; style=&quot;margin: 1.04mm 0.00mm 0.00mm 6.25mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
1994
1995&lt;p style=&quot;text-indent: -6.25mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
1996Lagoze, C. and Fielding, D. &amp;ldquo;Defining Collections in Distributed Digital Libraries&amp;rdquo; &lt;i&gt;D-Lib Magazine&lt;/i&gt;, Nov. 1998.
1997&lt;/p&gt;&lt;/div&gt;&lt;/li&gt;
1998
1999
2000
2001&lt;li value=&quot;6&quot;&gt;&lt;p&gt;&lt;div name=&quot;References&quot; align=&quot;left&quot; style=&quot;margin: 1.04mm 0.00mm 0.00mm 6.25mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
2002
2003&lt;p style=&quot;text-indent: -6.25mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
2004PAHO (1999) &lt;i&gt;Virtual Disaster Library&lt;/i&gt;. CD-ROM produced by the Pan-American Health Organization, Washington DC, USA.
2005&lt;/p&gt;&lt;/div&gt;&lt;/li&gt;
2006
2007
2008
2009&lt;li value=&quot;7&quot;&gt;&lt;p&gt;&lt;div name=&quot;References&quot; align=&quot;left&quot; style=&quot;margin: 1.04mm 0.00mm 0.00mm 6.25mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
2010
2011&lt;p style=&quot;text-indent: -6.25mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
2012McNab, R.J., Witten, I.H. and Boddie, S.J. (1998) &amp;ldquo;A distributed digital library architecture incorporating different index styles.&amp;rdquo; &lt;i&gt;Proc IEEE Advances in Digital Libraries&lt;/i&gt;, Santa Barbara, CA, pp. 36-45.
2013&lt;/p&gt;&lt;/div&gt;&lt;/li&gt;
2014
2015
2016
2017&lt;li value=&quot;8&quot;&gt;&lt;p&gt;&lt;div name=&quot;References&quot; align=&quot;left&quot; style=&quot;margin: 1.04mm 0.00mm 0.00mm 6.25mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
2018
2019&lt;p style=&quot;text-indent: -6.25mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
2020Nevill-Manning, C.G., Reed, T., and Witten, I.H. (1998) &amp;ldquo;Extracting text from PostScript&amp;rdquo; &lt;i&gt;Software&amp;mdash;Practice and Experience&lt;/i&gt;, Vol. 28, No. 5, pp. 481-491; April.
2021&lt;/p&gt;&lt;/div&gt;&lt;/li&gt;
2022
2023
2024
2025&lt;li value=&quot;9&quot;&gt;&lt;p&gt;&lt;div name=&quot;References&quot; align=&quot;left&quot; style=&quot;margin: 1.04mm 0.00mm 0.00mm 6.25mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
2026
2027&lt;p style=&quot;text-indent: -6.25mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
2028UNESCO (1999) &lt;i&gt;SAHEL point DOC: Anthologie du développement au Sahel&lt;/i&gt;. CD-ROM produced by UNESCO, Paris, France.
2029&lt;/p&gt;&lt;/div&gt;&lt;/li&gt;
2030
2031
2032
2033&lt;li value=&quot;10&quot;&gt;&lt;p&gt;&lt;div name=&quot;References&quot; align=&quot;left&quot; style=&quot;margin: 1.04mm 0.00mm 0.00mm 6.25mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
2034
2035&lt;p style=&quot;text-indent: -6.25mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
2036UNU (1998) &lt;i&gt;Collection on critical global issues.&lt;/i&gt; CD-ROM produced by the United Nations University Press, Tokyo, Japan.
2037&lt;/p&gt;&lt;/div&gt;&lt;/li&gt;
2038
2039
2040
2041&lt;li value=&quot;11&quot;&gt;&lt;p&gt;&lt;div name=&quot;References&quot; align=&quot;left&quot; style=&quot;margin: 1.04mm 0.00mm 0.00mm 6.25mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
2042
2043&lt;p style=&quot;text-indent: -6.25mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
2044Witten, I.H., Moffat, A. and Bell, T. (1999) &lt;i&gt;Managing Gigabytes: compressing and indexing documents and images&lt;/i&gt;, Morgan Kaufmann, second edition.
2045&lt;/p&gt;&lt;/div&gt;&lt;/li&gt;
2046
2047
2048
2049&lt;/ol&gt;&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
2050
2051&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
2052
2053&lt;/p&gt;&lt;/div&gt;
2054
2055
2056
2057&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
2058
2059&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
2060
2061&lt;/p&gt;&lt;/div&gt;
2062
2063
2064
2065&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
2066
2067&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
2068
2069&lt;/p&gt;&lt;/div&gt;
2070
2071
2072
2073&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
2074
2075&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
2076
2077&lt;/p&gt;&lt;/div&gt;
2078
2079
2080
2081&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
2082
2083&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
2084
2085&lt;/p&gt;&lt;/div&gt;
2086
2087
2088
2089&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
2090
2091&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
2092
2093&lt;/p&gt;&lt;/div&gt;
2094
2095
2096
2097&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
2098
2099&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
2100
2101&lt;/p&gt;&lt;/div&gt;
2102
2103
2104
2105&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
2106
2107&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
2108
2109&lt;/p&gt;&lt;/div&gt;
2110
2111
2112
2113&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
2114
2115&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
2116
2117&lt;/p&gt;&lt;/div&gt;
2118
2119
2120
2121&lt;p&gt;&lt;div name=&quot;Header&quot; align=&quot;justify&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
2122
2123&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
2124&lt;span style=&quot;text-transform:lowercase&quot;&gt;&lt;/span&gt;
2125&lt;/p&gt;&lt;/div&gt;
2126
2127
2128
2129&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
2130
2131&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
2132
2133&lt;/p&gt;&lt;/div&gt;
2134
2135
2136
2137&lt;p&gt;&lt;div name=&quot;Footer&quot; align=&quot;justify&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
2138
2139&lt;p style=&quot;text-indent: 0.00mm; text-align: justify; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
2140&lt;span style=&quot;text-transform:lowercase&quot;&gt;&lt;/span&gt;
2141&lt;/p&gt;&lt;/div&gt;
2142
2143
2144
2145&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
2146
2147&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
2148
2149&lt;/p&gt;&lt;/div&gt;
2150
2151
2152
2153&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
2154
2155&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
2156
2157&lt;/p&gt;&lt;/div&gt;
2158
2159
2160
2161&lt;p&gt;&lt;div name=&quot;Caption&quot; align=&quot;center&quot; style=&quot;margin: 2.08mm 2.74mm 0.00mm 17.26mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
2162
2163&lt;p style=&quot;text-indent: -17.26mm; text-align: center; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
2164
2165&lt;/p&gt;&lt;/div&gt;
2166
2167
2168
2169&lt;p&gt;&lt;div name=&quot;Caption&quot; align=&quot;center&quot; style=&quot;margin: 2.08mm 2.74mm 0.00mm 17.26mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
2170
2171&lt;p style=&quot;text-indent: -17.26mm; text-align: center; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
2172
2173&lt;/p&gt;&lt;/div&gt;
2174
2175
2176
2177&lt;p&gt;&lt;div name=&quot;Caption&quot; align=&quot;center&quot; style=&quot;margin: 2.08mm 2.74mm 0.00mm 17.26mm;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
2178
2179&lt;p style=&quot;text-indent: -17.26mm; text-align: center; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
2180
2181&lt;/p&gt;&lt;/div&gt;
2182
2183
2184
2185&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
2186
2187&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
2188
2189&lt;/p&gt;&lt;/div&gt;
2190
2191
2192
2193&lt;p&gt;&lt;div name=&quot;Normal&quot; align=&quot;left&quot; style=&quot;  padding: 0.00mm 0.00mm 0.00mm 0.00mm; &quot;&gt;
2194
2195&lt;p style=&quot;text-indent: 0.00mm; text-align: left; line-height: 4.166667mm; color: Black; background-color: White; &quot;&gt;
2196
2197&lt;/p&gt;&lt;/div&gt;
2198
2199&lt;!--Section Ends--&gt;
2200
2201
2202
2203&lt;!--
2204&lt;hr&gt;
2205&lt;address&gt;
2206&lt;a href=&quot;_httpextlink_&amp;amp;rl=0&amp;amp;href=http:%2f%2fwvware.sourceforge.net&quot;&gt;&lt;img
2207src=&quot;_httpdocimg_/wvSmall.gif&quot; height=31 width=47
2208align=left border=0 alt=&quot;wvWare&quot;&gt;&lt;/a&gt;
2209&lt;a href=&quot;_httpextlink_&amp;amp;rl=0&amp;amp;href=http:%2f%2fvalidator.w3.org%2fcheck%2freferer&quot;&gt;&lt;img
2210src=&quot;_httpdocimg_/vh40.gif&quot; height=31 width=88
2211align=right border=0 alt=&quot;Valid HTML 4.0!&quot;&gt;&lt;/a&gt;
2212Document created with &lt;a href=&quot;_httpextlink_&amp;amp;rl=0&amp;amp;href=http:%2f%2fwvware.sourceforge.net&quot;&gt;wvWare/wvWare version 1.2.4&lt;/a&gt;&lt;br&gt;
2213&lt;/address&gt;
2214--&gt;
2215
2216
2217</Content>
2218</Section>
2219</Archive>
Note: See TracBrowser for help on using the browser.