1 | <?xml version="1.0" encoding="utf-8" standalone="no"?>
|
---|
2 | <!DOCTYPE Archive SYSTEM "https://greenstone.org/dtd/Archive/1.0/Archive.dtd">
|
---|
3 | <Archive>
|
---|
4 | <Section>
|
---|
5 | <Description>
|
---|
6 | <Metadata name="gsdldoctype">indexed_doc</Metadata>
|
---|
7 | <Metadata name="SourceDirectory">/Scratch/ak19/gs3-svn-02May2024/web/sites/localsite/collect/Enhanced-PDF/tmp/1714975883</Metadata>
|
---|
8 | <Metadata name="Language">en</Metadata>
|
---|
9 | <Metadata name="Encoding">utf8</Metadata>
|
---|
10 | <Metadata name="URL">http://Scratch/ak19/gs3-svn-02May2024/web/sites/localsite/collect/Enhanced-PDF/tmp/1714975883/pdf03.html</Metadata>
|
---|
11 | <Metadata name="UTF8URL">http://Scratch/ak19/gs3-svn-02May2024/web/sites/localsite/collect/Enhanced-PDF/tmp/1714975883/pdf03.html</Metadata>
|
---|
12 | <Metadata name="Title">pdf03</Metadata>
|
---|
13 | <Metadata name="gsdlsourcefilename">import/pdf03.pdf</Metadata>
|
---|
14 | <Metadata name="gsdlsourcefilerenamemethod">url</Metadata>
|
---|
15 | <Metadata name="gsdlconvertedfilename">tmp/1714975883/pdf03.html</Metadata>
|
---|
16 | <Metadata name="OrigSource">pdf03.html</Metadata>
|
---|
17 | <Metadata name="Source">pdf03.pdf</Metadata>
|
---|
18 | <Metadata name="SourceFile">pdf03.pdf</Metadata>
|
---|
19 | <Metadata name="Plugin">PDFv2Plugin</Metadata>
|
---|
20 | <Metadata name="FileSize">35935</Metadata>
|
---|
21 | <Metadata name="SourceDirectory">.</Metadata>
|
---|
22 | <Metadata name="FilenameRoot">pdf03</Metadata>
|
---|
23 | <Metadata name="FileFormat">PDF</Metadata>
|
---|
24 | <Metadata name="srcicon">_iconpdf_</Metadata>
|
---|
25 | <Metadata name="srclink_file">doc.pdf</Metadata>
|
---|
26 | <Metadata name="srclinkFile">doc.pdf</Metadata>
|
---|
27 | <Metadata name="Identifier">HASH019c5dca7f5bb781460a6b9c</Metadata>
|
---|
28 | <Metadata name="lastmodified">1714975828</Metadata>
|
---|
29 | <Metadata name="lastmodifieddate">20240506</Metadata>
|
---|
30 | <Metadata name="oailastmodified">1714975885</Metadata>
|
---|
31 | <Metadata name="oailastmodifieddate">20240506</Metadata>
|
---|
32 | <Metadata name="assocfilepath">HASH019c.dir</Metadata>
|
---|
33 | <Metadata name="gsdlassocfile">page1.png:image/png:</Metadata>
|
---|
34 | <Metadata name="gsdlassocfile">page2.png:image/png:</Metadata>
|
---|
35 | <Metadata name="gsdlassocfile">page3.png:image/png:</Metadata>
|
---|
36 | <Metadata name="gsdlassocfile">page4.png:image/png:</Metadata>
|
---|
37 | <Metadata name="gsdlassocfile">page5.png:image/png:</Metadata>
|
---|
38 | <Metadata name="gsdlassocfile">page6.png:image/png:</Metadata>
|
---|
39 | <Metadata name="gsdlassocfile">page7.png:image/png:</Metadata>
|
---|
40 | <Metadata name="gsdlassocfile">page8.png:image/png:</Metadata>
|
---|
41 | <Metadata name="gsdlassocfile">page9.png:image/png:</Metadata>
|
---|
42 | <Metadata name="gsdlassocfile">page10.png:image/png:</Metadata>
|
---|
43 | <Metadata name="gsdlassocfile">page11.png:image/png:</Metadata>
|
---|
44 | <Metadata name="gsdlassocfile">page12.png:image/png:</Metadata>
|
---|
45 | <Metadata name="gsdlassocfile">page13.png:image/png:</Metadata>
|
---|
46 | <Metadata name="gsdlassocfile">page14.png:image/png:</Metadata>
|
---|
47 | <Metadata name="gsdlassocfile">page15.png:image/png:</Metadata>
|
---|
48 | <Metadata name="gsdlassocfile">page16.png:image/png:</Metadata>
|
---|
49 | <Metadata name="gsdlassocfile">page17.png:image/png:</Metadata>
|
---|
50 | <Metadata name="gsdlassocfile">doc.pdf:application/pdf:</Metadata>
|
---|
51 | </Description>
|
---|
52 | <Content>
|
---|
53 |
|
---|
54 |
|
---|
55 |
|
---|
56 | </Content>
|
---|
57 | <Section>
|
---|
58 | <Description>
|
---|
59 | <Metadata name="Title">Pages 1-10</Metadata>
|
---|
60 | </Description>
|
---|
61 | <Content>
|
---|
62 | </Content>
|
---|
63 | <Section>
|
---|
64 | <Description>
|
---|
65 | <Metadata name="Title">Page 1</Metadata>
|
---|
66 | </Description>
|
---|
67 | <Content>
|
---|
68 | <div id="page1">
|
---|
69 | <div style="position: relative; height: 842px; width: 595px;"><style type="text/css">
|
---|
70 | .txt { white-space:nowrap; }
|
---|
71 | .p1f0 { font-family:sans-serif; font-weight:normal; font-style:normal; }
|
---|
72 | .p1f1 { font-family:serif; font-weight:bold; font-style:normal; }
|
---|
73 | .p1f2 { font-family:serif; font-weight:normal; font-style:normal; }
|
---|
74 | .p1f3 { font-family:sans-serif; font-weight:normal; font-style:normal; }
|
---|
75 | </style>
|
---|
76 | <img class="background" height="842" id="background1" src="_httpdocimg_/page1.png" style="position:absolute; left:0px; top:0px;" width="595">
|
---|
77 | <div class="txt" style="position:absolute; left:166px; top:74px;"><span class="p1f1" style="font-size:14px;vertical-align:baseline;color:rgba(0,0,0,1);">Applications for Bibliometric Research</span></div>
|
---|
78 | <div class="txt" style="position:absolute; left:184px; top:98px;"><span class="p1f1" style="font-size:14px;vertical-align:baseline;color:rgba(0,0,0,1);">in the Emerging Digital Libraries</span></div>
|
---|
79 | <div class="txt" style="position:absolute; left:246px; top:147px;"><span class="p1f2" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">Sally Jo Cunningham</span></div>
|
---|
80 | <div class="txt" style="position:absolute; left:219px; top:171px;"><span class="p1f2" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">Department of Computer Science</span></div>
|
---|
81 | <div class="txt" style="position:absolute; left:245px; top:195px;"><span class="p1f2" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">University of Waikato</span></div>
|
---|
82 | <div class="txt" style="position:absolute; left:240px; top:219px;"><span class="p1f2" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">Hamilton, New Zealand</span></div>
|
---|
83 | <div class="txt" style="position:absolute; left:226px; top:243px;"><span class="p1f2" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">email: [email protected]</span></div>
|
---|
84 | <div class="txt" style="position:absolute; left:90px; top:291px;"><span class="p1f1" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">Abstract: </span><span class="p1f2" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">Large numbers of research documents have recently become available on</span></div>
|
---|
85 | <div class="txt" style="position:absolute; left:90px; top:315px;"><span class="p1f2" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">the Internet through “digital libraries”, and these collections are seeing high levels of</span></div>
|
---|
86 | <div class="txt" style="position:absolute; left:90px; top:339px;"><span class="p1f2" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">use by their related research communities. A secondary use for these document</span></div>
|
---|
87 | <div class="txt" style="position:absolute; left:90px; top:363px;"><span class="p1f2" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">repositories and indexes is as a platform for bibliometric research. We examine the</span></div>
|
---|
88 | <div class="txt" style="position:absolute; left:90px; top:387px;"><span class="p1f2" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">extent to which the new digital libraries support conventional bibliometric analysis, and</span></div>
|
---|
89 | <div class="txt" style="position:absolute; left:90px; top:411px;"><span class="p1f2" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">discuss shortcomings in their current forms. Interestingly, these electronic text</span></div>
|
---|
90 | <div class="txt" style="position:absolute; left:90px; top:435px;"><span class="p1f2" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">archives also provide opportunities for new types of studies: generally the full text of</span></div>
|
---|
91 | <div class="txt" style="position:absolute; left:90px; top:459px;"><span class="p1f2" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">documents are available for analysis, giving a finer grain of insight than abstract-only</span></div>
|
---|
92 | <div class="txt" style="position:absolute; left:90px; top:483px;"><span class="p1f2" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">online databases; these repositories often contain technical reports or pre-prints, the</span></div>
|
---|
93 | <div class="txt" style="position:absolute; left:90px; top:507px;"><span class="p1f2" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">“grey literature” that has been previously unavailable for analysis; and document</span></div>
|
---|
94 | <div class="txt" style="position:absolute; left:90px; top:531px;"><span class="p1f2" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">“usage” can be measured directly by recording user accesses, rather than studied</span></div>
|
---|
95 | <div class="txt" style="position:absolute; left:90px; top:555px;"><span class="p1f2" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">indirectly through document references.</span></div>
|
---|
96 | <div class="txt" style="position:absolute; left:90px; top:603px;"><span class="p1f1" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">1. Introduction</span></div>
|
---|
97 | <div class="txt" style="position:absolute; left:126px; top:639px;"><span class="p1f2" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">In recent years a number of &quot;digital libraries&quot; have become available through the</span></div>
|
---|
98 | <div class="txt" style="position:absolute; left:90px; top:663px;"><span class="p1f2" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">Internet. While the technology promises in the future to support large, heterogenous</span></div>
|
---|
99 | <div class="txt" style="position:absolute; left:90px; top:687px;"><span class="p1f2" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">collections, at present the most widely used of the academically-focussed digital</span></div>
|
---|
100 | <div class="txt" style="position:absolute; left:90px; top:711px;"><span class="p1f2" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">libraries are generally repositories of one or two types of document (typically technical</span></div>
|
---|
101 | <div class="txt" style="position:absolute; left:90px; top:735px;"><span class="p1f2" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">reports, journal articles, pre-prints, or conference proceedings), grouped by discipline.</span></div>
|
---|
102 | </div>
|
---|
103 | </div>
|
---|
104 |
|
---|
105 | </Content>
|
---|
106 | </Section>
|
---|
107 | <Section>
|
---|
108 | <Description>
|
---|
109 | <Metadata name="Title">Page 2</Metadata>
|
---|
110 | </Description>
|
---|
111 | <Content>
|
---|
112 | <div id="page2">
|
---|
113 | <div style="position: relative; height: 842px; width: 595px;"><style type="text/css">
|
---|
114 | .txt { white-space:nowrap; }
|
---|
115 | .p2f0 { font-family:sans-serif; font-weight:normal; font-style:normal; }
|
---|
116 | .p2f1 { font-family:serif; font-weight:normal; font-style:normal; }
|
---|
117 | .p2f2 { font-family:sans-serif; font-weight:normal; font-style:normal; }
|
---|
118 | </style>
|
---|
119 | <img class="background" height="842" id="background2" src="_httpdocimg_/page2.png" style="position:absolute; left:0px; top:0px;" width="595">
|
---|
120 | <div class="txt" style="position:absolute; left:90px; top:72px;"><span class="p2f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">A distinguishing characteristic of these digital libraries is that the full text of documents</span></div>
|
---|
121 | <div class="txt" style="position:absolute; left:90px; top:96px;"><span class="p2f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">are often available for retrieval, as well as bibliographic records.The sciences are</span></div>
|
---|
122 | <div class="txt" style="position:absolute; left:90px; top:120px;"><span class="p2f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">represented much more heavily in the present crop of digital libraries than the social</span></div>
|
---|
123 | <div class="txt" style="position:absolute; left:90px; top:144px;"><span class="p2f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">sciences, arts, or humanities. They are maintained by professional societies,</span></div>
|
---|
124 | <div class="txt" style="position:absolute; left:90px; top:168px;"><span class="p2f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">universities, research laboratories, and even private individuals. Access is generally</span></div>
|
---|
125 | <div class="txt" style="position:absolute; left:90px; top:192px;"><span class="p2f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">free, both to search and to download documents.</span></div>
|
---|
126 | <div class="txt" style="position:absolute; left:126px; top:216px;"><span class="p2f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">The emergence of these subject-specific digital libraries is particularly important</span></div>
|
---|
127 | <div class="txt" style="position:absolute; left:90px; top:240px;"><span class="p2f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">given the pattern of access to materials presently employed by research scientists.</span></div>
|
---|
128 | <div class="txt" style="position:absolute; left:90px; top:264px;"><span class="p2f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">Informal exchanges of preprints, reprints, and photocopies of papers passed on by</span></div>
|
---|
129 | <div class="txt" style="position:absolute; left:90px; top:288px;"><span class="p2f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">colleagues currently are major venues for the transmission of scientific information</span></div>
|
---|
130 | <div class="txt" style="position:absolute; left:90px; top:312px;"><span class="p2f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">between researchers in the sciences. In one study, the dependence on these sources</span></div>
|
---|
131 | <div class="txt" style="position:absolute; left:90px; top:336px;"><span class="p2f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">ranges from 12% (for chemistry) to 39% (for mathematics) of all papers cited in</span></div>
|
---|
132 | <div class="txt" style="position:absolute; left:90px; top:360px;"><span class="p2f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">researchers' own publications [11]. A qualitative study of study of how computer</span></div>
|
---|
133 | <div class="txt" style="position:absolute; left:90px; top:384px;"><span class="p2f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">scientists locate and retrieve documents (computing is one of the domains considered</span></div>
|
---|
134 | <div class="txt" style="position:absolute; left:90px; top:408px;"><span class="p2f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">later in this paper) indicates that for that field, technical reports and research documents</span></div>
|
---|
135 | <div class="txt" style="position:absolute; left:90px; top:432px;"><span class="p2f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">found in various locations on the Internet are a preferred source of information [6].</span></div>
|
---|
136 | <div class="txt" style="position:absolute; left:90px; top:456px;"><span class="p2f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">Many of the digital library systems discussed in this paper are repositories for just this</span></div>
|
---|
137 | <div class="txt" style="position:absolute; left:90px; top:480px;"><span class="p2f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">type of literature. The documents tend to be of high quality: primarily technical</span></div>
|
---|
138 | <div class="txt" style="position:absolute; left:90px; top:504px;"><span class="p2f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">reports or working papers from research institutions (both academic and commercial),</span></div>
|
---|
139 | <div class="txt" style="position:absolute; left:90px; top:528px;"><span class="p2f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">as well as advance copies of work accepted for publication in conventional paper</span></div>
|
---|
140 | <div class="txt" style="position:absolute; left:90px; top:552px;"><span class="p2f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">journals. Moreover, these digital libraries are also coming to include refereed work</span></div>
|
---|
141 | <div class="txt" style="position:absolute; left:90px; top:576px;"><span class="p2f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">published digitally (in electronic journals). Anecdotal evidence suggests that in their</span></div>
|
---|
142 | <div class="txt" style="position:absolute; left:90px; top:600px;"><span class="p2f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">fields, these digital libraries are coming to be the resource of choice for locating cutting</span></div>
|
---|
143 | <div class="txt" style="position:absolute; left:90px; top:624px;"><span class="p2f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">edge work.</span></div>
|
---|
144 | <div class="txt" style="position:absolute; left:126px; top:648px;"><span class="p2f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">For specialized subjects such as high energy physics, this dependence on</span></div>
|
---|
145 | <div class="txt" style="position:absolute; left:90px; top:672px;"><span class="p2f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">informal or extra-library dissemination can be much higher. Ginsparg ([9], [10])</span></div>
|
---|
146 | <div class="txt" style="position:absolute; left:90px; top:696px;"><span class="p2f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">reports that fields in physics have traditionally relied heavily on preprint exchanges, and</span></div>
|
---|
147 | <div class="txt" style="position:absolute; left:90px; top:720px;"><span class="p2f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">the digital repositories of physics preprints begun in 1991 (the </span><span class="p2f1" style="font-size:9px;vertical-align:baseline;color:rgba(0,0,0,1);">PHYSICS E</span><span class="p2f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">-</span><span class="p2f1" style="font-size:9px;vertical-align:baseline;color:rgba(0,0,0,1);">PRINT</span></div>
|
---|
148 | <div class="txt" style="position:absolute; left:90px; top:744px;"><span class="p2f1" style="font-size:9px;vertical-align:baseline;color:rgba(0,0,0,1);">ARCHIVES</span><span class="p2f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">) have to a large extent supplanted conventional publishing and physical</span></div>
|
---|
149 | </div>
|
---|
150 | </div>
|
---|
151 |
|
---|
152 | </Content>
|
---|
153 | </Section>
|
---|
154 | <Section>
|
---|
155 | <Description>
|
---|
156 | <Metadata name="Title">Page 3</Metadata>
|
---|
157 | </Description>
|
---|
158 | <Content>
|
---|
159 | <div id="page3">
|
---|
160 | <div style="position: relative; height: 842px; width: 595px;"><style type="text/css">
|
---|
161 | .txt { white-space:nowrap; }
|
---|
162 | .p3f0 { font-family:sans-serif; font-weight:normal; font-style:normal; }
|
---|
163 | .p3f1 { font-family:serif; font-weight:normal; font-style:normal; }
|
---|
164 | .p3f2 { font-family:serif; font-weight:normal; font-style:italic; }
|
---|
165 | .p3f3 { font-family:sans-serif; font-weight:normal; font-style:normal; }
|
---|
166 | </style>
|
---|
167 | <img class="background" height="842" id="background3" src="_httpdocimg_/page3.png" style="position:absolute; left:0px; top:0px;" width="595">
|
---|
168 | <div class="txt" style="position:absolute; left:90px; top:72px;"><span class="p3f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">paper mailing of technical reports. By providing ready access to information sources</span></div>
|
---|
169 | <div class="txt" style="position:absolute; left:90px; top:96px;"><span class="p3f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">that are already preferentially utilized by scientists, the digital libraries show potential to</span></div>
|
---|
170 | <div class="txt" style="position:absolute; left:90px; top:120px;"><span class="p3f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">increase access to information that until recently was expensive or difficult to acquire in</span></div>
|
---|
171 | <div class="txt" style="position:absolute; left:90px; top:144px;"><span class="p3f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">paper form. Indeed, in some fields (most notably physics) this process has already</span></div>
|
---|
172 | <div class="txt" style="position:absolute; left:90px; top:168px;"><span class="p3f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">begun, as researchers in less developed countries report access to ongoing research</span></div>
|
---|
173 | <div class="txt" style="position:absolute; left:90px; top:192px;"><span class="p3f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">through the Internet repositories that their local libraries could not afford to acquire</span></div>
|
---|
174 | <div class="txt" style="position:absolute; left:90px; top:216px;"><span class="p3f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">through conventional journal subscriptions ([9], [10]).</span></div>
|
---|
175 | <div class="txt" style="position:absolute; left:126px; top:240px;"><span class="p3f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">The primary use for new bibliographic resources is, of course, for the contents</span></div>
|
---|
176 | <div class="txt" style="position:absolute; left:90px; top:264px;"><span class="p3f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">of the documents involved. A secondary use for emerging resources is as a basis for</span></div>
|
---|
177 | <div class="txt" style="position:absolute; left:90px; top:288px;"><span class="p3f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">bibliometric analysis of the subject field. With the conventionally published scientific</span></div>
|
---|
178 | <div class="txt" style="position:absolute; left:90px; top:312px;"><span class="p3f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">literature, the sheer difficulty of accumulating statistics discouraged bibliometric</span></div>
|
---|
179 | <div class="txt" style="position:absolute; left:90px; top:336px;"><span class="p3f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">research until the advent of large bibliographic databases in the 1960's. Computerized</span></div>
|
---|
180 | <div class="txt" style="position:absolute; left:90px; top:360px;"><span class="p3f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">bibliographic databases sparked a significant increase in the number of large-scale</span></div>
|
---|
181 | <div class="txt" style="position:absolute; left:90px; top:384px;"><span class="p3f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">bibliographic studies, as significant portions of the collection and analysis of data could</span></div>
|
---|
182 | <div class="txt" style="position:absolute; left:90px; top:408px;"><span class="p3f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">be automated ([12], [13]). The availability of CD-ROM versions of bibliographic</span></div>
|
---|
183 | <div class="txt" style="position:absolute; left:90px; top:432px;"><span class="p3f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">databases has been of particular importance, since they provide a cheaper alternative to</span></div>
|
---|
184 | <div class="txt" style="position:absolute; left:90px; top:456px;"><span class="p3f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">the online commercial databases [3].</span></div>
|
---|
185 | <div class="txt" style="position:absolute; left:126px; top:480px;"><span class="p3f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">These computerized bibliographic resources have drawbacks, however. The</span></div>
|
---|
186 | <div class="txt" style="position:absolute; left:90px; top:504px;"><span class="p3f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">greatest is that the full text of documents are rarely available, and even abstracts are not</span></div>
|
---|
187 | <div class="txt" style="position:absolute; left:90px; top:528px;"><span class="p3f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">always present. This obviously limits the types of bibliometric research that can be</span></div>
|
---|
188 | <div class="txt" style="position:absolute; left:90px; top:552px;"><span class="p3f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">conducted </span><span class="p3f2" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">solely </span><span class="p3f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">through these databases. In addition, these databases are generally</span></div>
|
---|
189 | <div class="txt" style="position:absolute; left:90px; top:576px;"><span class="p3f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">limited to formally published documents (those appearing in selected books, journals,</span></div>
|
---|
190 | <div class="txt" style="position:absolute; left:90px; top:600px;"><span class="p3f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">and conference proceedings). The &quot;grey literature&quot; of technical reports, pre-prints, and</span></div>
|
---|
191 | <div class="txt" style="position:absolute; left:90px; top:624px;"><span class="p3f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">other works not formally published are largely ignored, and it is this absence of easy</span></div>
|
---|
192 | <div class="txt" style="position:absolute; left:90px; top:648px;"><span class="p3f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">access to these documents that has hampered the analysis of these important forms of</span></div>
|
---|
193 | <div class="txt" style="position:absolute; left:90px; top:672px;"><span class="p3f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">scientific communication.</span></div>
|
---|
194 | <div class="txt" style="position:absolute; left:126px; top:696px;"><span class="p3f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">The digital libraries currently in existence complement the online and CD-ROM</span></div>
|
---|
195 | <div class="txt" style="position:absolute; left:90px; top:720px;"><span class="p3f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">bibliographic databases. They are best suited for examinations of the &quot;physical&quot;</span></div>
|
---|
196 | <div class="txt" style="position:absolute; left:90px; top:744px;"><span class="p3f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">characteristics of documents (for example, document length), analysis based on</span></div>
|
---|
197 | </div>
|
---|
198 | </div>
|
---|
199 |
|
---|
200 | </Content>
|
---|
201 | </Section>
|
---|
202 | <Section>
|
---|
203 | <Description>
|
---|
204 | <Metadata name="Title">Page 4</Metadata>
|
---|
205 | </Description>
|
---|
206 | <Content>
|
---|
207 | <div id="page4">
|
---|
208 | <div style="position: relative; height: 842px; width: 595px;"><style type="text/css">
|
---|
209 | .txt { white-space:nowrap; }
|
---|
210 | .p4f0 { font-family:sans-serif; font-weight:normal; font-style:normal; }
|
---|
211 | .p4f1 { font-family:serif; font-weight:normal; font-style:normal; }
|
---|
212 | .p4f2 { font-family:serif; font-weight:bold; font-style:normal; }
|
---|
213 | .p4f3 { font-family:sans-serif; font-weight:normal; font-style:normal; }
|
---|
214 | </style>
|
---|
215 | <img class="background" height="842" id="background4" src="_httpdocimg_/page4.png" style="position:absolute; left:0px; top:0px;" width="595">
|
---|
216 | <div class="txt" style="position:absolute; left:90px; top:72px;"><span class="p4f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">bibliographic information that can be automatically extracted from the document text or</span></div>
|
---|
217 | <div class="txt" style="position:absolute; left:90px; top:96px;"><span class="p4f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">the sometimes unevenly formatted bibliographic records (such as obsolescence</span></div>
|
---|
218 | <div class="txt" style="position:absolute; left:90px; top:120px;"><span class="p4f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">studies), and usage studies (geographic or institutional origin of users, date/time of</span></div>
|
---|
219 | <div class="txt" style="position:absolute; left:90px; top:144px;"><span class="p4f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">access, individual patterns of document retrieval, etc.). Because references are present</span></div>
|
---|
220 | <div class="txt" style="position:absolute; left:90px; top:168px;"><span class="p4f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">in the document file but not identified by field, co-citation and bibliographic coupling</span></div>
|
---|
221 | <div class="txt" style="position:absolute; left:90px; top:192px;"><span class="p4f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">research is not well-supported, and conducting these studies requires considerable</span></div>
|
---|
222 | <div class="txt" style="position:absolute; left:90px; top:216px;"><span class="p4f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">effort on the part of the researcher.</span></div>
|
---|
223 | <div class="txt" style="position:absolute; left:126px; top:240px;"><span class="p4f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">The variety of bibliographic repositories in the available digital libraries in itself</span></div>
|
---|
224 | <div class="txt" style="position:absolute; left:90px; top:264px;"><span class="p4f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">has great potential in conducting bibliometric research. Sigogneau et al [15] present a</span></div>
|
---|
225 | <div class="txt" style="position:absolute; left:90px; top:288px;"><span class="p4f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">case study illustrating the ways in which the strengths of different databases can be</span></div>
|
---|
226 | <div class="txt" style="position:absolute; left:90px; top:312px;"><span class="p4f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">played off each other; they conduct a fine-grained analysis of the emergence of research</span></div>
|
---|
227 | <div class="txt" style="position:absolute; left:90px; top:336px;"><span class="p4f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">fronts in molecular and cellular biology, and demonstrate that the observations gleaned</span></div>
|
---|
228 | <div class="txt" style="position:absolute; left:90px; top:360px;"><span class="p4f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">from two complementary bibliographic databases provide greater insight into their</span></div>
|
---|
229 | <div class="txt" style="position:absolute; left:90px; top:384px;"><span class="p4f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">problem. Similarly, it appears that the types of bibliographic data that can be gleaned</span></div>
|
---|
230 | <div class="txt" style="position:absolute; left:90px; top:408px;"><span class="p4f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">from the relatively unstructured digital libraries can be profitably combined with data</span></div>
|
---|
231 | <div class="txt" style="position:absolute; left:90px; top:432px;"><span class="p4f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">from online databases, CD-ROMS, and other more conventional bibliographic</span></div>
|
---|
232 | <div class="txt" style="position:absolute; left:90px; top:456px;"><span class="p4f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">resources.</span></div>
|
---|
233 | <div class="txt" style="position:absolute; left:126px; top:480px;"><span class="p4f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">This paper is organized as follows: Section 2 discusses the types of indexing</span></div>
|
---|
234 | <div class="txt" style="position:absolute; left:90px; top:504px;"><span class="p4f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">and searching available with current digital libraries; Section 3 gives examples of</span></div>
|
---|
235 | <div class="txt" style="position:absolute; left:90px; top:528px;"><span class="p4f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">conventional bibliometric techniques applied to Internet-accessible archives; Section 4</span></div>
|
---|
236 | <div class="txt" style="position:absolute; left:90px; top:552px;"><span class="p4f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">discusses opportunities to directly measure usage of documents and to detect</span></div>
|
---|
237 | <div class="txt" style="position:absolute; left:90px; top:576px;"><span class="p4f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">information-seeking patterns in researchers; and Section 5 presents our conclusions.</span></div>
|
---|
238 | <div class="txt" style="position:absolute; left:90px; top:636px;"><span class="p4f2" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">2. Indexing and searching in current digital libraries</span></div>
|
---|
239 | <div class="txt" style="position:absolute; left:126px; top:684px;"><span class="p4f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">At present, the types of indexing fields for most academically-oriented digital</span></div>
|
---|
240 | <div class="txt" style="position:absolute; left:90px; top:708px;"><span class="p4f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">library systems are limited. Many schemes index on user-supplied document</span></div>
|
---|
241 | <div class="txt" style="position:absolute; left:90px; top:732px;"><span class="p4f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">descriptions, abstracts, or similar document surrogates (for example, the </span><span class="p4f1" style="font-size:9px;vertical-align:baseline;color:rgba(0,0,0,1);">PHYSICS E</span><span class="p4f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">-</span></div>
|
---|
242 | <div class="txt" style="position:absolute; left:90px; top:756px;"><span class="p4f1" style="font-size:9px;vertical-align:baseline;color:rgba(0,0,0,1);">PRINT ARCHIVE </span><span class="p4f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">[10], a collection of physics pre-prints and technical reports). As will</span></div>
|
---|
243 | </div>
|
---|
244 | </div>
|
---|
245 |
|
---|
246 | </Content>
|
---|
247 | </Section>
|
---|
248 | <Section>
|
---|
249 | <Description>
|
---|
250 | <Metadata name="Title">Page 5</Metadata>
|
---|
251 | </Description>
|
---|
252 | <Content>
|
---|
253 | <div id="page5">
|
---|
254 | <div style="position: relative; height: 842px; width: 595px;"><style type="text/css">
|
---|
255 | .txt { white-space:nowrap; }
|
---|
256 | .p5f0 { font-family:sans-serif; font-weight:normal; font-style:normal; }
|
---|
257 | .p5f1 { font-family:serif; font-weight:normal; font-style:normal; }
|
---|
258 | .p5f2 { font-family:monospace; font-weight:normal; font-style:normal; }
|
---|
259 | .p5f3 { font-family:serif; font-weight:normal; font-style:italic; }
|
---|
260 | .p5f4 { font-family:sans-serif; font-weight:normal; font-style:normal; }
|
---|
261 | </style>
|
---|
262 | <img class="background" height="842" id="background5" src="_httpdocimg_/page5.png" style="position:absolute; left:0px; top:0px;" width="595">
|
---|
263 | <div class="txt" style="position:absolute; left:90px; top:72px;"><span class="p5f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">be discussed below, the quality of this user-provided data can be highly variable, and</span></div>
|
---|
264 | <div class="txt" style="position:absolute; left:90px; top:96px;"><span class="p5f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">may unfavorably impact the usefulness of the index for searching. Alternatively, a</span></div>
|
---|
265 | <div class="txt" style="position:absolute; left:90px; top:120px;"><span class="p5f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">designated site librarian may maintain a catalog (eg, the </span><span class="p5f1" style="font-size:9px;vertical-align:baseline;color:rgba(0,0,0,1);">WATERS </span><span class="p5f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">[14] system, now</span></div>
|
---|
266 | <div class="txt" style="position:absolute; left:90px; top:144px;"><span class="p5f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">subsumed by </span><span class="p5f1" style="font-size:9px;vertical-align:baseline;color:rgba(0,0,0,1);">NCSTRL </span><span class="p5f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">(</span><span class="p5f2" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">http://www.ncstrl.org/</span><span class="p5f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">), both primarily collections of</span></div>
|
---|
267 | <div class="txt" style="position:absolute; left:90px; top:168px;"><span class="p5f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">computer science technical reports); in this case the quality of the bibliographic</span></div>
|
---|
268 | <div class="txt" style="position:absolute; left:90px; top:192px;"><span class="p5f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">information may be expected to be higher, but fewer sites will be likely to support</span></div>
|
---|
269 | <div class="txt" style="position:absolute; left:90px; top:216px;"><span class="p5f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">such a librarian and therefore fewer documents are likely to be included in the digital</span></div>
|
---|
270 | <div class="txt" style="position:absolute; left:90px; top:240px;"><span class="p5f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">library. In a “harvesting” system such as the computer science technical report</span></div>
|
---|
271 | <div class="txt" style="position:absolute; left:90px; top:264px;"><span class="p5f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">collections supported by </span><span class="p5f1" style="font-size:9px;vertical-align:baseline;color:rgba(0,0,0,1);">HARVEST </span><span class="p5f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">[2] or the </span><span class="p5f1" style="font-size:9px;vertical-align:baseline;color:rgba(0,0,0,1);">NEW ZEALAND DIGITAL LIBRARY</span></div>
|
---|
272 | <div class="txt" style="position:absolute; left:90px; top:288px;"><span class="p5f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">computer science technical report collection ([16], [17]), documents are indexed from</span></div>
|
---|
273 | <div class="txt" style="position:absolute; left:90px; top:312px;"><span class="p5f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">passive repositories (that may not even be aware that their documents are being</span></div>
|
---|
274 | <div class="txt" style="position:absolute; left:90px; top:336px;"><span class="p5f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">included in the digital library). Harvesting systems therefore cannot rely on the</span></div>
|
---|
275 | <div class="txt" style="position:absolute; left:90px; top:360px;"><span class="p5f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">presence of bibliographic data of any sort.</span></div>
|
---|
276 | <div class="txt" style="position:absolute; left:126px; top:384px;"><span class="p5f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">Because of the relative paucity of high-quality bibliographic data available to</span></div>
|
---|
277 | <div class="txt" style="position:absolute; left:90px; top:408px;"><span class="p5f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">many of the current academically- or research-focussed digital library collections, their</span></div>
|
---|
278 | <div class="txt" style="position:absolute; left:90px; top:432px;"><span class="p5f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">search interfaces tend to be more primitive than those ordinarily found in online</span></div>
|
---|
279 | <div class="txt" style="position:absolute; left:90px; top:456px;"><span class="p5f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">bibliographic databases or library catalogs. Systems such as </span><span class="p5f1" style="font-size:9px;vertical-align:baseline;color:rgba(0,0,0,1);">NCSTRL </span><span class="p5f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">can support</span></div>
|
---|
280 | <div class="txt" style="position:absolute; left:90px; top:480px;"><span class="p5f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">author, title, and subject searching, but this more sophisticated search functionality</span></div>
|
---|
281 | <div class="txt" style="position:absolute; left:90px; top:504px;"><span class="p5f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">comes at the expense of requiring participating repositories to use specific software. As</span></div>
|
---|
282 | <div class="txt" style="position:absolute; left:90px; top:528px;"><span class="p5f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">a consequence, these latter systems may provide access to a smaller number of sites than</span></div>
|
---|
283 | <div class="txt" style="position:absolute; left:90px; top:552px;"><span class="p5f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">harvesting systems. Harvesters may access a broader range of providers, but at the</span></div>
|
---|
284 | <div class="txt" style="position:absolute; left:90px; top:576px;"><span class="p5f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">penalty of being limited to unfielded, keyword searches over the raw text of the</span></div>
|
---|
285 | <div class="txt" style="position:absolute; left:90px; top:600px;"><span class="p5f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">document or document surrogate.</span></div>
|
---|
286 | <div class="txt" style="position:absolute; left:90px; top:648px;"><span class="p5f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">Specifically, the indexing in existing digital libraries has a variety of shortcomings for</span></div>
|
---|
287 | <div class="txt" style="position:absolute; left:90px; top:672px;"><span class="p5f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">bibliometric applications:</span></div>
|
---|
288 | <div class="txt" style="position:absolute; left:90px; top:696px;"><span class="p5f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">•</span></div>
|
---|
289 | <div class="txt" style="position:absolute; left:125px; top:696px;"><span class="p5f3" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">lack of fielded indexing: </span><span class="p5f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">As noted above, some large and widely used digital</span></div>
|
---|
290 | <div class="txt" style="position:absolute; left:125px; top:720px;"><span class="p5f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">libraries (such as the computer science technical report collection of the </span><span class="p5f1" style="font-size:9px;vertical-align:baseline;color:rgba(0,0,0,1);">NEW</span></div>
|
---|
291 | <div class="txt" style="position:absolute; left:125px; top:744px;"><span class="p5f1" style="font-size:9px;vertical-align:baseline;color:rgba(0,0,0,1);">ZEALAND DIGITAL LIBRARY</span><span class="p5f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">) may lack formal cataloging entirely, and rely on</span></div>
|
---|
292 | </div>
|
---|
293 | </div>
|
---|
294 |
|
---|
295 | </Content>
|
---|
296 | </Section>
|
---|
297 | <Section>
|
---|
298 | <Description>
|
---|
299 | <Metadata name="Title">Page 6</Metadata>
|
---|
300 | </Description>
|
---|
301 | <Content>
|
---|
302 | <div id="page6">
|
---|
303 | <div style="position: relative; height: 842px; width: 595px;"><style type="text/css">
|
---|
304 | .txt { white-space:nowrap; }
|
---|
305 | .p6f0 { font-family:sans-serif; font-weight:normal; font-style:normal; }
|
---|
306 | .p6f1 { font-family:serif; font-weight:normal; font-style:normal; }
|
---|
307 | .p6f2 { font-family:serif; font-weight:normal; font-style:italic; }
|
---|
308 | .p6f3 { font-family:sans-serif; font-weight:normal; font-style:normal; }
|
---|
309 | </style>
|
---|
310 | <img class="background" height="842" id="background6" src="_httpdocimg_/page6.png" style="position:absolute; left:0px; top:0px;" width="595">
|
---|
311 | <div class="txt" style="position:absolute; left:125px; top:72px;"><span class="p6f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">keyword searching over the raw document text. Obviously this makes field-</span></div>
|
---|
312 | <div class="txt" style="position:absolute; left:125px; top:96px;"><span class="p6f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">dependent analysis more difficult (for example, locating documents produced by</span></div>
|
---|
313 | <div class="txt" style="position:absolute; left:125px; top:120px;"><span class="p6f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">specific authors), and in the worst case may require a manual examination of all</span></div>
|
---|
314 | <div class="txt" style="position:absolute; left:125px; top:144px;"><span class="p6f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">files in the collection in order to reliably identify a desired document subset.</span></div>
|
---|
315 | <div class="txt" style="position:absolute; left:125px; top:168px;"><span class="p6f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">However, keyword search techniques that approximate fielded searching results</span></div>
|
---|
316 | <div class="txt" style="position:absolute; left:125px; top:192px;"><span class="p6f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">may suffice: for example in the </span><span class="p6f1" style="font-size:9px;vertical-align:baseline;color:rgba(0,0,0,1);">NEW ZEALAND DIGITAL LIBRARY </span><span class="p6f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">computer</span></div>
|
---|
317 | <div class="txt" style="position:absolute; left:125px; top:216px;"><span class="p6f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">science technical report collection, limiting the keyword search for “Johnson”</span></div>
|
---|
318 | <div class="txt" style="position:absolute; left:125px; top:240px;"><span class="p6f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">to a search of first pages only is likely to retrieve documents written by Johnson</span></div>
|
---|
319 | <div class="txt" style="position:absolute; left:125px; top:264px;"><span class="p6f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">(since for the majority of computer science technical reports, the first page</span></div>
|
---|
320 | <div class="txt" style="position:absolute; left:125px; top:288px;"><span class="p6f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">contains little more than author, title, date, and institution details).</span></div>
|
---|
321 | <div class="txt" style="position:absolute; left:125px; top:336px;"><span class="p6f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">A more principled approach to extracting bibliographic information is embodied</span></div>
|
---|
322 | <div class="txt" style="position:absolute; left:125px; top:360px;"><span class="p6f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">in the CiteSeer tool [1]. This software parses raw, unfielded academic</span></div>
|
---|
323 | <div class="txt" style="position:absolute; left:125px; top:384px;"><span class="p6f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">documents and attempts to identify such indexing information as author, title,</span></div>
|
---|
324 | <div class="txt" style="position:absolute; left:125px; top:408px;"><span class="p6f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">reference list, etc. Obviously such a tool cannot attain 100% accuracy over a</span></div>
|
---|
325 | <div class="txt" style="position:absolute; left:125px; top:432px;"><span class="p6f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">heterogenous document collection, but in practice it appears useful in that it can</span></div>
|
---|
326 | <div class="txt" style="position:absolute; left:125px; top:456px;"><span class="p6f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">make a good first pass in processing a set of documents, providing an initial set</span></div>
|
---|
327 | <div class="txt" style="position:absolute; left:125px; top:480px;"><span class="p6f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">of parsed documents for analysis. The remaining (presumably much smaller) set</span></div>
|
---|
328 | <div class="txt" style="position:absolute; left:125px; top:504px;"><span class="p6f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">of unparsable documents can then be dealt with manually.</span></div>
|
---|
329 | <div class="txt" style="position:absolute; left:90px; top:552px;"><span class="p6f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">•</span></div>
|
---|
330 | <div class="txt" style="position:absolute; left:126px; top:552px;"><span class="p6f2" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">lack of consistency in field formatting: </span><span class="p6f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">Current digital libraries usually acquire</span></div>
|
---|
331 | <div class="txt" style="position:absolute; left:126px; top:576px;"><span class="p6f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">bibliographic information from either the authors of submitted articles or</span></div>
|
---|
332 | <div class="txt" style="position:absolute; left:126px; top:600px;"><span class="p6f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">automatic extraction routines (retrieving bibliographic details from catalog files</span></div>
|
---|
333 | <div class="txt" style="position:absolute; left:126px; top:624px;"><span class="p6f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">that may or may not be in a given document site, and that may or may not be in</span></div>
|
---|
334 | <div class="txt" style="position:absolute; left:126px; top:648px;"><span class="p6f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">an easily parsable form). Neither of these methods produce records with</span></div>
|
---|
335 | <div class="txt" style="position:absolute; left:126px; top:672px;"><span class="p6f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">standard formatting, which causes problems with automated bibliometric</span></div>
|
---|
336 | <div class="txt" style="position:absolute; left:126px; top:696px;"><span class="p6f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">analysis. Consider the following examples selected from entries in the hep-th</span></div>
|
---|
337 | <div class="txt" style="position:absolute; left:126px; top:720px;"><span class="p6f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">(high energy physics) collection of the </span><span class="p6f1" style="font-size:9px;vertical-align:baseline;color:rgba(0,0,0,1);">PHYSICS E</span><span class="p6f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">-</span><span class="p6f1" style="font-size:9px;vertical-align:baseline;color:rgba(0,0,0,1);">PRINT ARCHIVES</span><span class="p6f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">:</span></div>
|
---|
338 | </div>
|
---|
339 | </div>
|
---|
340 |
|
---|
341 | </Content>
|
---|
342 | </Section>
|
---|
343 | <Section>
|
---|
344 | <Description>
|
---|
345 | <Metadata name="Title">Page 7</Metadata>
|
---|
346 | </Description>
|
---|
347 | <Content>
|
---|
348 | <div id="page7">
|
---|
349 | <div style="position: relative; height: 842px; width: 595px;"><style type="text/css">
|
---|
350 | .txt { white-space:nowrap; }
|
---|
351 | .p7f0 { font-family:sans-serif; font-weight:normal; font-style:normal; }
|
---|
352 | .p7f1 { font-family:serif; font-weight:normal; font-style:normal; }
|
---|
353 | .p7f2 { font-family:serif; font-weight:normal; font-style:italic; }
|
---|
354 | .p7f3 { font-family:sans-serif; font-weight:normal; font-style:normal; }
|
---|
355 | </style>
|
---|
356 | <img class="background" height="842" id="background7" src="_httpdocimg_/page7.png" style="position:absolute; left:0px; top:0px;" width="595">
|
---|
357 | <div class="txt" style="position:absolute; left:125px; top:72px;"><span class="p7f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">(i) Authors: A. Yu. Alekseev, V. Schomerus</span></div>
|
---|
358 | <div class="txt" style="position:absolute; left:125px; top:96px;"><span class="p7f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">(ii) Authors: Adel Bilal and Ian. I. Kogan</span></div>
|
---|
359 | <div class="txt" style="position:absolute; left:125px; top:120px;"><span class="p7f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">(iii) Authors: Paul S. Aspinwall and David R. Morrison (with an appendix</span></div>
|
---|
360 | <div class="txt" style="position:absolute; left:162px; top:144px;"><span class="p7f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">by Mark Gross)</span></div>
|
---|
361 | <div class="txt" style="position:absolute; left:125px; top:168px;"><span class="p7f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">(iv) Authors: A. H. Chamseddine and Herbi Dreiner (ETH-Zurich)</span></div>
|
---|
362 | <div class="txt" style="position:absolute; left:125px; top:216px;"><span class="p7f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">In this case, typical for existing digital libraries, there is no standardized format</span></div>
|
---|
363 | <div class="txt" style="position:absolute; left:125px; top:240px;"><span class="p7f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">for authors' names (here, appearing with full names, initials plus last name, and</span></div>
|
---|
364 | <div class="txt" style="position:absolute; left:125px; top:264px;"><span class="p7f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">a mixture of the two); no standard convention for separating author names</span></div>
|
---|
365 | <div class="txt" style="position:absolute; left:125px; top:288px;"><span class="p7f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">(here, either a comma or &quot;and&quot; are used); and parenthetical information can</span></div>
|
---|
366 | <div class="txt" style="position:absolute; left:125px; top:312px;"><span class="p7f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">include a variety of information such as the name of an associate author or the</span></div>
|
---|
367 | <div class="txt" style="position:absolute; left:125px; top:336px;"><span class="p7f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">institutional affiliations of an author. Manual processing or specially crafted</span></div>
|
---|
368 | <div class="txt" style="position:absolute; left:125px; top:360px;"><span class="p7f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">software would be required to reformat these fields for analysis.</span></div>
|
---|
369 | <div class="txt" style="position:absolute; left:90px; top:408px;"><span class="p7f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">•</span></div>
|
---|
370 | <div class="txt" style="position:absolute; left:125px; top:408px;"><span class="p7f2" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">duplicate entries: </span><span class="p7f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">Digital libraries that draw documents from a variety of sources</span></div>
|
---|
371 | <div class="txt" style="position:absolute; left:125px; top:432px;"><span class="p7f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">may inadvertently contain duplicate items. Unfortunately, the irregular</span></div>
|
---|
372 | <div class="txt" style="position:absolute; left:125px; top:456px;"><span class="p7f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">formatting of the bibliographic information makes it difficult to automatically</span></div>
|
---|
373 | <div class="txt" style="position:absolute; left:125px; top:480px;"><span class="p7f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">detect these duplicates.</span></div>
|
---|
374 | <div class="txt" style="position:absolute; left:90px; top:528px;"><span class="p7f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">•</span></div>
|
---|
375 | <div class="txt" style="position:absolute; left:125px; top:528px;"><span class="p7f2" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">implicit field tagging: </span><span class="p7f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">In some repositories, items are not explicitly tagged with</span></div>
|
---|
376 | <div class="txt" style="position:absolute; left:125px; top:552px;"><span class="p7f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">certain types of information – most commonly the document's date of</span></div>
|
---|
377 | <div class="txt" style="position:absolute; left:125px; top:576px;"><span class="p7f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">publication or production. Instead, the date is implicit in the document's title</span></div>
|
---|
378 | <div class="txt" style="position:absolute; left:125px; top:600px;"><span class="p7f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">(eg, its numeration in a technical report series) or in the location of the document</span></div>
|
---|
379 | <div class="txt" style="position:absolute; left:125px; top:624px;"><span class="p7f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">in the file structure of the repository (eg, separate directories exist for each</span></div>
|
---|
380 | <div class="txt" style="position:absolute; left:125px; top:648px;"><span class="p7f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">year). A second common piece of implicit data is the authors’ institutional</span></div>
|
---|
381 | <div class="txt" style="position:absolute; left:125px; top:672px;"><span class="p7f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">affiliations. This may be contained in the document itself (typically on a cover</span></div>
|
---|
382 | <div class="txt" style="position:absolute; left:125px; top:696px;"><span class="p7f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">page), or may be implicit in the document’s location (for example, a</span></div>
|
---|
383 | <div class="txt" style="position:absolute; left:125px; top:720px;"><span class="p7f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">corporation’s technical reports are stored in its ftp repository). Again, in these</span></div>
|
---|
384 | </div>
|
---|
385 | </div>
|
---|
386 |
|
---|
387 | </Content>
|
---|
388 | </Section>
|
---|
389 | <Section>
|
---|
390 | <Description>
|
---|
391 | <Metadata name="Title">Page 8</Metadata>
|
---|
392 | </Description>
|
---|
393 | <Content>
|
---|
394 | <div id="page8">
|
---|
395 | <div style="position: relative; height: 842px; width: 595px;"><style type="text/css">
|
---|
396 | .txt { white-space:nowrap; }
|
---|
397 | .p8f0 { font-family:sans-serif; font-weight:normal; font-style:normal; }
|
---|
398 | .p8f1 { font-family:serif; font-weight:normal; font-style:normal; }
|
---|
399 | .p8f2 { font-family:serif; font-weight:normal; font-style:italic; }
|
---|
400 | .p8f3 { font-family:serif; font-weight:bold; font-style:normal; }
|
---|
401 | .p8f4 { font-family:sans-serif; font-weight:normal; font-style:normal; }
|
---|
402 | </style>
|
---|
403 | <img class="background" height="842" id="background8" src="_httpdocimg_/page8.png" style="position:absolute; left:0px; top:0px;" width="595">
|
---|
404 | <div class="txt" style="position:absolute; left:125px; top:72px;"><span class="p8f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">cases special processing is required to append this field information to a</span></div>
|
---|
405 | <div class="txt" style="position:absolute; left:125px; top:96px;"><span class="p8f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">document record for bibliometric analysis.</span></div>
|
---|
406 | <div class="txt" style="position:absolute; left:90px; top:144px;"><span class="p8f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">•</span></div>
|
---|
407 | <div class="txt" style="position:absolute; left:126px; top:144px;"><span class="p8f2" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">extraction of document text: </span><span class="p8f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">Few of the documents stored in the research-</span></div>
|
---|
408 | <div class="txt" style="position:absolute; left:126px; top:168px;"><span class="p8f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">oriented digital libraries discussed in this paper are straight ascii text; instead,</span></div>
|
---|
409 | <div class="txt" style="position:absolute; left:126px; top:192px;"><span class="p8f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">documents may appear in a variety of file formats, such as LaTeX, PostScript,</span></div>
|
---|
410 | <div class="txt" style="position:absolute; left:126px; top:216px;"><span class="p8f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">PDF, etc. If the contents of the documents are to be automatically processed</span></div>
|
---|
411 | <div class="txt" style="position:absolute; left:126px; top:240px;"><span class="p8f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">(for example, to count the words in a document, or to extract reference</span></div>
|
---|
412 | <div class="txt" style="position:absolute; left:126px; top:264px;"><span class="p8f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">publication dates for an obsolescence study), then the text must be extracted.</span></div>
|
---|
413 | <div class="txt" style="position:absolute; left:126px; top:288px;"><span class="p8f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">Utilities are available to convert most common document formats to ascii.</span></div>
|
---|
414 | <div class="txt" style="position:absolute; left:126px; top:336px;"><span class="p8f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">It is likely that many of these problems will be addressed as the Internet-based</span></div>
|
---|
415 | <div class="txt" style="position:absolute; left:90px; top:360px;"><span class="p8f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">document indexing systems mature. Even minor changes can greatly increase the</span></div>
|
---|
416 | <div class="txt" style="position:absolute; left:90px; top:384px;"><span class="p8f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">useability of a bibliographic database for bibliometric research. For example, the</span></div>
|
---|
417 | <div class="txt" style="position:absolute; left:90px; top:408px;"><span class="p8f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">addition of an explicit date tag to many online databases in 1975 sparked new</span></div>
|
---|
418 | <div class="txt" style="position:absolute; left:90px; top:432px;"><span class="p8f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">applications in time series research [3].</span></div>
|
---|
419 | <div class="txt" style="position:absolute; left:90px; top:480px;"><span class="p8f3" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">3. Opportunities for applications of bibliometric techniques</span></div>
|
---|
420 | <div class="txt" style="position:absolute; left:126px; top:528px;"><span class="p8f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">One type of bibliometric research concentrates on quantifying fundamental,</span></div>
|
---|
421 | <div class="txt" style="position:absolute; left:90px; top:552px;"><span class="p8f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">structural details about a subject literature: how many items are published, how many</span></div>
|
---|
422 | <div class="txt" style="position:absolute; left:90px; top:576px;"><span class="p8f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">authors are publishing, over what time period documents are likely to be used, etc.</span></div>
|
---|
423 | <div class="txt" style="position:absolute; left:90px; top:600px;"><span class="p8f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">More complex studies analyze the relationships between documents, such as how</span></div>
|
---|
424 | <div class="txt" style="position:absolute; left:90px; top:624px;"><span class="p8f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">documents cluster into subjects. The following examples give a flavour of the</span></div>
|
---|
425 | <div class="txt" style="position:absolute; left:90px; top:648px;"><span class="p8f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">bibliometric research that is possible using the emerging digital libraries:</span></div>
|
---|
426 | <div class="txt" style="position:absolute; left:90px; top:696px;"><span class="p8f2" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">examining the “physical” characteristics of archived documents</span></div>
|
---|
427 | <div class="txt" style="position:absolute; left:126px; top:720px;"><span class="p8f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">One relatively straightforward type of bibliometric study characterizes the</span></div>
|
---|
428 | <div class="txt" style="position:absolute; left:90px; top:744px;"><span class="p8f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">formats of different literatures. For example, Figure 1 presents the range of the size</span></div>
|
---|
429 | </div>
|
---|
430 | </div>
|
---|
431 |
|
---|
432 | </Content>
|
---|
433 | </Section>
|
---|
434 | <Section>
|
---|
435 | <Description>
|
---|
436 | <Metadata name="Title">Page 9</Metadata>
|
---|
437 | </Description>
|
---|
438 | <Content>
|
---|
439 | <div id="page9">
|
---|
440 | <div style="position: relative; height: 842px; width: 595px;"><style type="text/css">
|
---|
441 | .txt { white-space:nowrap; }
|
---|
442 | .p9f0 { font-family:sans-serif; font-weight:normal; font-style:normal; }
|
---|
443 | .p9f1 { font-family:serif; font-weight:normal; font-style:normal; }
|
---|
444 | .p9f2 { font-family:serif; font-weight:normal; font-style:italic; }
|
---|
445 | .p9f3 { font-family:sans-serif; font-weight:normal; font-style:normal; }
|
---|
446 | </style>
|
---|
447 | <img class="background" height="842" id="background9" src="_httpdocimg_/page9.png" style="position:absolute; left:0px; top:0px;" width="595">
|
---|
448 | <div class="txt" style="position:absolute; left:90px; top:72px;"><span class="p9f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">of computer science technical reports as measured by their length in pages. Of the</span></div>
|
---|
449 | <div class="txt" style="position:absolute; left:90px; top:96px;"><span class="p9f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">45,720 documents in the CSTR collection as of April 1998, nearly 1600 did not contain</span></div>
|
---|
450 | <div class="txt" style="position:absolute; left:90px; top:120px;"><span class="p9f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">page divisions in their files (and hence are excluded from analysis). Note that the</span></div>
|
---|
451 | <div class="txt" style="position:absolute; left:90px; top:144px;"><span class="p9f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">number of pages in the shorter documents (&lt;50 pages) falls into an approximately</span></div>
|
---|
452 | <div class="txt" style="position:absolute; left:90px; top:168px;"><span class="p9f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">normal distribution (slightly skewed to the left), while presumably the longer</span></div>
|
---|
453 | <div class="txt" style="position:absolute; left:90px; top:192px;"><span class="p9f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">documents represent Masters’ and Doctoral theses. A surprising number of documents</span></div>
|
---|
454 | <div class="txt" style="position:absolute; left:90px; top:216px;"><span class="p9f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">are very short (between one and 5 pages); these may represent the type of condensed</span></div>
|
---|
455 | <div class="txt" style="position:absolute; left:90px; top:240px;"><span class="p9f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">results frequently found in the “technical notes”, “short papers”, and “poster sessions”</span></div>
|
---|
456 | <div class="txt" style="position:absolute; left:90px; top:264px;"><span class="p9f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">of computing conferences and journals. The average number of pages per document,</span></div>
|
---|
457 | <div class="txt" style="position:absolute; left:90px; top:288px;"><span class="p9f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">27.5, appears to be slightly longer than the common upper bound for a computing</span></div>
|
---|
458 | <div class="txt" style="position:absolute; left:90px; top:312px;"><span class="p9f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">journal article, although this observation must be confirmed by a similar study of the</span></div>
|
---|
459 | <div class="txt" style="position:absolute; left:90px; top:336px;"><span class="p9f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">lengths of formally published computing articles.</span></div>
|
---|
460 | <div class="txt" style="position:absolute; left:126px; top:360px;"><span class="p9f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">This type of analysis is of particular interest for technical reports, since they</span></div>
|
---|
461 | <div class="txt" style="position:absolute; left:90px; top:384px;"><span class="p9f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">have not been studied in the same detail as formally published papers. A comparison of</span></div>
|
---|
462 | <div class="txt" style="position:absolute; left:90px; top:408px;"><span class="p9f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">the physical characteristics of the formal and informal literature could provide</span></div>
|
---|
463 | <div class="txt" style="position:absolute; left:90px; top:432px;"><span class="p9f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">supporting evidence for common beliefs about the relationship between the two types</span></div>
|
---|
464 | <div class="txt" style="position:absolute; left:90px; top:456px;"><span class="p9f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">of documents. For example, do publishing constraints force journal and proceedings</span></div>
|
---|
465 | <div class="txt" style="position:absolute; left:90px; top:480px;"><span class="p9f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">articles to be shorter than technical reports, and therefore presumably omit technical</span></div>
|
---|
466 | <div class="txt" style="position:absolute; left:90px; top:504px;"><span class="p9f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">details of findings? Do technical reports contain more/less extensive reference sections?</span></div>
|
---|
467 | <div class="txt" style="position:absolute; left:90px; top:528px;"><span class="p9f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">If reference sections of technical reports are longer than those of published articles, then</span></div>
|
---|
468 | <div class="txt" style="position:absolute; left:90px; top:552px;"><span class="p9f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">citation links are being omitted in published works; if technical reports contain fewer</span></div>
|
---|
469 | <div class="txt" style="position:absolute; left:90px; top:576px;"><span class="p9f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">references, then this may confirm earlier indications that computer scientists tend to</span></div>
|
---|
470 | <div class="txt" style="position:absolute; left:90px; top:600px;"><span class="p9f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">“research first” and do literature surveys later [6].</span></div>
|
---|
471 | <div class="txt" style="position:absolute; left:90px; top:648px;"><span class="p9f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">Figure 1. Range of sizes of CS technical reports, measured by number of pages</span></div>
|
---|
472 | <div class="txt" style="position:absolute; left:90px; top:696px;"><span class="p9f2" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">obsolescence studies.</span></div>
|
---|
473 | <div class="txt" style="position:absolute; left:126px; top:720px;"><span class="p9f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">A document is considered obsolete when it is no longer referenced by the</span></div>
|
---|
474 | <div class="txt" style="position:absolute; left:90px; top:744px;"><span class="p9f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">current literature. Typically, documents receive their greatest number and frequency of</span></div>
|
---|
475 | </div>
|
---|
476 | </div>
|
---|
477 |
|
---|
478 | </Content>
|
---|
479 | </Section>
|
---|
480 | <Section>
|
---|
481 | <Description>
|
---|
482 | <Metadata name="Title">Page 10</Metadata>
|
---|
483 | </Description>
|
---|
484 | <Content>
|
---|
485 | <div id="page10">
|
---|
486 | <div style="position: relative; height: 842px; width: 595px;"><style type="text/css">
|
---|
487 | .txt { white-space:nowrap; }
|
---|
488 | .p10f0 { font-family:sans-serif; font-weight:normal; font-style:normal; }
|
---|
489 | .p10f1 { font-family:serif; font-weight:normal; font-style:normal; }
|
---|
490 | .p10f2 { font-family:serif; font-weight:normal; font-style:italic; }
|
---|
491 | .p10f3 { font-family:sans-serif; font-weight:normal; font-style:normal; }
|
---|
492 | </style>
|
---|
493 | <img class="background" height="842" id="background10" src="_httpdocimg_/page10.png" style="position:absolute; left:0px; top:0px;" width="595">
|
---|
494 | <div class="txt" style="position:absolute; left:90px; top:72px;"><span class="p10f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">citations immediately after publication, and the frequency of citation falls rapidly as time</span></div>
|
---|
495 | <div class="txt" style="position:absolute; left:90px; top:96px;"><span class="p10f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">passes. One technique for estimating the obsolescence rate of a body of literature— the</span></div>
|
---|
496 | <div class="txt" style="position:absolute; left:90px; top:120px;"><span class="p10f2" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">synchronous </span><span class="p10f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">method — is to find the median date in the references of the documents.</span></div>
|
---|
497 | <div class="txt" style="position:absolute; left:90px; top:144px;"><span class="p10f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">This median date is subtracted from the year of publication for the documents, yielding</span></div>
|
---|
498 | <div class="txt" style="position:absolute; left:90px; top:168px;"><span class="p10f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">the </span><span class="p10f2" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">median citation age</span><span class="p10f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">. As would be expected, this median varies between the</span></div>
|
---|
499 | <div class="txt" style="position:absolute; left:90px; top:192px;"><span class="p10f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">disciplines. Typically the social sciences and arts have a higher median citation age</span></div>
|
---|
500 | <div class="txt" style="position:absolute; left:90px; top:216px;"><span class="p10f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">than the “hard” sciences and engineering, indicating that documents obsolesce more</span></div>
|
---|
501 | <div class="txt" style="position:absolute; left:90px; top:240px;"><span class="p10f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">quickly for the latter fields.</span></div>
|
---|
502 | <div class="txt" style="position:absolute; left:126px; top:264px;"><span class="p10f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">As noted in Section 2, references are not generally explicitly tagged in existing</span></div>
|
---|
503 | <div class="txt" style="position:absolute; left:90px; top:288px;"><span class="p10f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">digital repositories. However, reference dates can usually be extracted from the</span></div>
|
---|
504 | <div class="txt" style="position:absolute; left:90px; top:312px;"><span class="p10f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">document text by first locating the reference section (usually delimited by a &quot;references&quot;</span></div>
|
---|
505 | <div class="txt" style="position:absolute; left:90px; top:336px;"><span class="p10f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">or &quot;bibliography&quot; section heading), and then extracting all numbers in the appropriate</span></div>
|
---|
506 | <div class="txt" style="position:absolute; left:90px; top:360px;"><span class="p10f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">ranges for dates for the field under study.</span></div>
|
---|
507 | <div class="txt" style="position:absolute; left:126px; top:384px;"><span class="p10f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">To illustrate this process, 188 technical reports were sampled from Internet-</span></div>
|
---|
508 | <div class="txt" style="position:absolute; left:90px; top:407px;"><span class="p10f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">accessible repositories</span><span class="p10f1" style="font-size:6px;vertical-align:super;color:rgba(0,0,0,1);">1 </span><span class="p10f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">and used as source documents for a synchronous obsolescence</span></div>
|
---|
509 | <div class="txt" style="position:absolute; left:90px; top:432px;"><span class="p10f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">study. Conveniently, the repositories chosen organize technical reports into sub-</span></div>
|
---|
510 | <div class="txt" style="position:absolute; left:90px; top:456px;"><span class="p10f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">directories by their date of publication. The reference dates for each technical report</span></div>
|
---|
511 | <div class="txt" style="position:absolute; left:90px; top:480px;"><span class="p10f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">were automatically extracted by software that scanned the document’s file for numbers</span></div>
|
---|
512 | <div class="txt" style="position:absolute; left:90px; top:504px;"><span class="p10f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">of the form 19XX, since previous studies indicate that few if any computing reports</span></div>
|
---|
513 | <div class="txt" style="position:absolute; left:90px; top:528px;"><span class="p10f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">reference documents published in previous centuries [5]. Table 1 presents the median</span></div>
|
---|
514 | <div class="txt" style="position:absolute; left:90px; top:552px;"><span class="p10f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">citation age calculated for these documents, broken down by repository and the year of</span></div>
|
---|
515 | <div class="txt" style="position:absolute; left:90px; top:576px;"><span class="p10f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">publication for the source documents from which the reference dates were extracted:</span></div>
|
---|
516 | <div class="txt" style="position:absolute; left:90px; top:624px;"><span class="p10f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">Table 1. Median citation ages for technical report repositories</span></div>
|
---|
517 | <div class="txt" style="position:absolute; left:126px; top:672px;"><span class="p10f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">The median citation age ranges between 2 and 4 years, which is consistent with</span></div>
|
---|
518 | <div class="txt" style="position:absolute; left:90px; top:696px;"><span class="p10f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">previous examinations of computing and information systems literature ([5], [4]).</span></div>
|
---|
519 | <div class="txt" style="position:absolute; left:90px; top:720px;"><span class="p10f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">When graphed, the distribution of reference dates show the exponential curve typically</span></div>
|
---|
520 | <div class="txt" style="position:absolute; left:90px; top:744px;"><span class="p10f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">found in obsolescence studies, including the final droop due to an “immediacy effect”</span></div>
|
---|
521 | </div>
|
---|
522 | </div>
|
---|
523 |
|
---|
524 | </Content>
|
---|
525 | </Section>
|
---|
526 | </Section>
|
---|
527 | <Section>
|
---|
528 | <Description>
|
---|
529 | <Metadata name="Title">Pages 11-20</Metadata>
|
---|
530 | </Description>
|
---|
531 | <Content>
|
---|
532 | </Content>
|
---|
533 | <Section>
|
---|
534 | <Description>
|
---|
535 | <Metadata name="Title">Page 11</Metadata>
|
---|
536 | </Description>
|
---|
537 | <Content>
|
---|
538 | <div id="page11">
|
---|
539 | <div style="position: relative; height: 842px; width: 595px;"><style type="text/css">
|
---|
540 | .txt { white-space:nowrap; }
|
---|
541 | .p11f0 { font-family:sans-serif; font-weight:normal; font-style:normal; }
|
---|
542 | .p11f1 { font-family:serif; font-weight:normal; font-style:normal; }
|
---|
543 | .p11f2 { font-family:serif; font-weight:normal; font-style:italic; }
|
---|
544 | .p11f3 { font-family:sans-serif; font-weight:normal; font-style:normal; }
|
---|
545 | </style>
|
---|
546 | <img class="background" height="842" id="background11" src="_httpdocimg_/page11.png" style="position:absolute; left:0px; top:0px;" width="595">
|
---|
547 | <div class="txt" style="position:absolute; left:90px; top:72px;"><span class="p11f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">as fewer very new documents are available for citation [7]. These types of results</span></div>
|
---|
548 | <div class="txt" style="position:absolute; left:90px; top:96px;"><span class="p11f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">provide confirmation that references used in computer science technical reports (the pre-</span></div>
|
---|
549 | <div class="txt" style="position:absolute; left:90px; top:120px;"><span class="p11f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">eminent “grey literature” of the computing field) conforms to the same patterns as</span></div>
|
---|
550 | <div class="txt" style="position:absolute; left:90px; top:144px;"><span class="p11f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">references found in the formally published literature.</span></div>
|
---|
551 | <div class="txt" style="position:absolute; left:90px; top:192px;"><span class="p11f2" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">co-citation and bibliographic coupling studies</span></div>
|
---|
552 | <div class="txt" style="position:absolute; left:126px; top:216px;"><span class="p11f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">The rate at which documents cite each other (co-citation) or cite the same</span></div>
|
---|
553 | <div class="txt" style="position:absolute; left:90px; top:240px;"><span class="p11f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">documents (bibliographic coupling) can be used to produce &quot;maps&quot; of a subject</span></div>
|
---|
554 | <div class="txt" style="position:absolute; left:90px; top:264px;"><span class="p11f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">literature. These techniques rely on analysis of the references of documents, and these</span></div>
|
---|
555 | <div class="txt" style="position:absolute; left:90px; top:288px;"><span class="p11f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">references must be in a common format. While digital libraries contain full text of</span></div>
|
---|
556 | <div class="txt" style="position:absolute; left:90px; top:312px;"><span class="p11f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">documents, their references are not standardized, and indeed are not even tagged as</span></div>
|
---|
557 | <div class="txt" style="position:absolute; left:90px; top:336px;"><span class="p11f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">such. To perform these studies the references must be manually extracted and</span></div>
|
---|
558 | <div class="txt" style="position:absolute; left:90px; top:360px;"><span class="p11f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">processed—a tedious process that is only worthwhile for documents (such as technical</span></div>
|
---|
559 | <div class="txt" style="position:absolute; left:90px; top:384px;"><span class="p11f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">reports) that are not included in existing citation databases such as the Science Citation</span></div>
|
---|
560 | <div class="txt" style="position:absolute; left:90px; top:408px;"><span class="p11f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">Index and Social Science Citation Index.</span></div>
|
---|
561 | <div class="txt" style="position:absolute; left:90px; top:456px;"><span class="p11f2" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">detecting cycles or regularities in the rate of production of research</span></div>
|
---|
562 | <div class="txt" style="position:absolute; left:126px; top:480px;"><span class="p11f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">Analysis of trends in the production of technical reports can give indications</span></div>
|
---|
563 | <div class="txt" style="position:absolute; left:90px; top:504px;"><span class="p11f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">about working conditions that affect research; for example, is more research produced</span></div>
|
---|
564 | <div class="txt" style="position:absolute; left:90px; top:528px;"><span class="p11f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">over the summer, when the teaching load is lighter? or is research steadily produced</span></div>
|
---|
565 | <div class="txt" style="position:absolute; left:90px; top:552px;"><span class="p11f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">throughout the year?</span></div>
|
---|
566 | <div class="txt" style="position:absolute; left:90px; top:600px;"><span class="p11f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">Figure 2. Distribution of the number of documents submitted to hep-th, 1992-1994</span></div>
|
---|
567 | <div class="txt" style="position:absolute; left:126px; top:648px;"><span class="p11f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">Figures 2 and 3 present statistics on document accumulation in the hep-th (high</span></div>
|
---|
568 | <div class="txt" style="position:absolute; left:90px; top:672px;"><span class="p11f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">energy physics) e-print server, a part of the </span><span class="p11f1" style="font-size:9px;vertical-align:baseline;color:rgba(0,0,0,1);">PHYSICS E</span><span class="p11f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">-</span><span class="p11f1" style="font-size:9px;vertical-align:baseline;color:rgba(0,0,0,1);">PRINT ARCHIVE</span><span class="p11f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">. This system</span></div>
|
---|
569 | <div class="txt" style="position:absolute; left:90px; top:696px;"><span class="p11f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">is one of the oldest formal pre-print archives, and has become the primary means for</span></div>
|
---|
570 | <div class="txt" style="position:absolute; left:90px; top:720px;"><span class="p11f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">information dissemination in its field. Examination of these figures reveals several</span></div>
|
---|
571 | <div class="txt" style="position:absolute; left:90px; top:744px;"><span class="p11f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">trends. Clearly the absolute number of documents deposited in the repository has</span></div>
|
---|
572 | </div>
|
---|
573 | </div>
|
---|
574 |
|
---|
575 | </Content>
|
---|
576 | </Section>
|
---|
577 | <Section>
|
---|
578 | <Description>
|
---|
579 | <Metadata name="Title">Page 12</Metadata>
|
---|
580 | </Description>
|
---|
581 | <Content>
|
---|
582 | <div id="page12">
|
---|
583 | <div style="position: relative; height: 842px; width: 595px;"><style type="text/css">
|
---|
584 | .txt { white-space:nowrap; }
|
---|
585 | .p12f0 { font-family:sans-serif; font-weight:normal; font-style:normal; }
|
---|
586 | .p12f1 { font-family:serif; font-weight:normal; font-style:normal; }
|
---|
587 | .p12f2 { font-family:serif; font-weight:bold; font-style:normal; }
|
---|
588 | .p12f3 { font-family:serif; font-weight:normal; font-style:italic; }
|
---|
589 | .p12f4 { font-family:sans-serif; font-weight:normal; font-style:normal; }
|
---|
590 | </style>
|
---|
591 | <img class="background" height="842" id="background12" src="_httpdocimg_/page12.png" style="position:absolute; left:0px; top:0px;" width="595">
|
---|
592 | <div class="txt" style="position:absolute; left:90px; top:72px;"><span class="p12f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">tended to increase over the time period. For all three years, research production has its</span></div>
|
---|
593 | <div class="txt" style="position:absolute; left:90px; top:96px;"><span class="p12f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">lowest point in January and February, increases through May and June, then decreases</span></div>
|
---|
594 | <div class="txt" style="position:absolute; left:90px; top:120px;"><span class="p12f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">until August and September. At that point the rate of production steps up, reaching a</span></div>
|
---|
595 | <div class="txt" style="position:absolute; left:90px; top:144px;"><span class="p12f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">yearly peak in November and December. This pattern is less clear for 1992, which</span></div>
|
---|
596 | <div class="txt" style="position:absolute; left:90px; top:168px;"><span class="p12f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">might be expected as the archive was established in mid-1991.</span></div>
|
---|
597 | <div class="txt" style="position:absolute; left:93px; top:216px;"><span class="p12f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">Figure 3. Distribution of the percentage of documents submitted to hep-th, 1992-1994</span></div>
|
---|
598 | <div class="txt" style="position:absolute; left:90px; top:264px;"><span class="p12f2" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">4. Analysis of usage data</span></div>
|
---|
599 | <div class="txt" style="position:absolute; left:126px; top:312px;"><span class="p12f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">The emerging Internet-based digital libraries will permit research on scientific</span></div>
|
---|
600 | <div class="txt" style="position:absolute; left:90px; top:336px;"><span class="p12f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">information collection and use at a much finer grain than is possible with current paper</span></div>
|
---|
601 | <div class="txt" style="position:absolute; left:90px; top:360px;"><span class="p12f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">libraries or online bibliographic databases. Current bibliometric or scientometric</span></div>
|
---|
602 | <div class="txt" style="position:absolute; left:90px; top:384px;"><span class="p12f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">research of this type must measure information use indirectly – for example, through</span></div>
|
---|
603 | <div class="txt" style="position:absolute; left:90px; top:408px;"><span class="p12f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">examination of the list of references appended to published articles. However, it is well</span></div>
|
---|
604 | <div class="txt" style="position:absolute; left:90px; top:432px;"><span class="p12f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">known that authors do not necessarily include in the reference list all documents that</span></div>
|
---|
605 | <div class="txt" style="position:absolute; left:90px; top:456px;"><span class="p12f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">could have been cited, and conversely that not all references listed may have been</span></div>
|
---|
606 | <div class="txt" style="position:absolute; left:90px; top:480px;"><span class="p12f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">actually “used” in performing the research; citation behavior can be affected by a</span></div>
|
---|
607 | <div class="txt" style="position:absolute; left:90px; top:504px;"><span class="p12f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">number of motivating factors (Garfield lists </span><span class="p12f3" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">15 </span><span class="p12f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">possible reasons in [8]).</span></div>
|
---|
608 | <div class="txt" style="position:absolute; left:126px; top:528px;"><span class="p12f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">Digital library transaction logs provide a powerful tool for direct analysis of</span></div>
|
---|
609 | <div class="txt" style="position:absolute; left:90px; top:552px;"><span class="p12f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">document “usage”: since digital libraries contain the actual document (rather than only a</span></div>
|
---|
610 | <div class="txt" style="position:absolute; left:90px; top:576px;"><span class="p12f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">document surrogate), the relative amount of “use” that a digital library’s clients make of</span></div>
|
---|
611 | <div class="txt" style="position:absolute; left:90px; top:600px;"><span class="p12f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">a given document sees can be estimated from the number of times the document file is</span></div>
|
---|
612 | <div class="txt" style="position:absolute; left:90px; top:624px;"><span class="p12f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">downloaded (and, presumably, the document is read). Note that file downloading is a</span></div>
|
---|
613 | <div class="txt" style="position:absolute; left:90px; top:648px;"><span class="p12f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">much stronger statement on the part of the user than, for example, having a</span></div>
|
---|
614 | <div class="txt" style="position:absolute; left:90px; top:672px;"><span class="p12f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">bibliographic record appear in the query result set for a conventional bibliographic</span></div>
|
---|
615 | <div class="txt" style="position:absolute; left:90px; top:696px;"><span class="p12f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">system; the user downloads only </span><span class="p12f3" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">after </span><span class="p12f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">the document has been found potentially relevant</span></div>
|
---|
616 | <div class="txt" style="position:absolute; left:90px; top:720px;"><span class="p12f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">through examination of its document surrogate. Additionally, downloading is</span></div>
|
---|
617 | <div class="txt" style="position:absolute; left:90px; top:744px;"><span class="p12f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">frequently time-consuming and sometimes costly (depending on local pricing for</span></div>
|
---|
618 | </div>
|
---|
619 | </div>
|
---|
620 |
|
---|
621 | </Content>
|
---|
622 | </Section>
|
---|
623 | <Section>
|
---|
624 | <Description>
|
---|
625 | <Metadata name="Title">Page 13</Metadata>
|
---|
626 | </Description>
|
---|
627 | <Content>
|
---|
628 | <div id="page13">
|
---|
629 | <div style="position: relative; height: 842px; width: 595px;"><style type="text/css">
|
---|
630 | .txt { white-space:nowrap; }
|
---|
631 | .p13f0 { font-family:sans-serif; font-weight:normal; font-style:normal; }
|
---|
632 | .p13f1 { font-family:serif; font-weight:normal; font-style:normal; }
|
---|
633 | .p13f2 { font-family:sans-serif; font-weight:normal; font-style:normal; }
|
---|
634 | </style>
|
---|
635 | <img class="background" height="842" id="background13" src="_httpdocimg_/page13.png" style="position:absolute; left:0px; top:0px;" width="595">
|
---|
636 | <div class="txt" style="position:absolute; left:90px; top:72px;"><span class="p13f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">Internet access). Downloaded documents are therefore highly likely at least to be</span></div>
|
---|
637 | <div class="txt" style="position:absolute; left:90px; top:96px;"><span class="p13f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">scanned, if not read closely. The transaction logs for a digital library can provide a</span></div>
|
---|
638 | <div class="txt" style="position:absolute; left:90px; top:120px;"><span class="p13f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">global picture of the use of documents in the collection, since all user interactions with</span></div>
|
---|
639 | <div class="txt" style="position:absolute; left:90px; top:144px;"><span class="p13f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">the library can be automatically logged for analysis. By contrast, it is of course</span></div>
|
---|
640 | <div class="txt" style="position:absolute; left:90px; top:168px;"><span class="p13f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">impossible to track usage of print bibliographies, and very difficult to monitor usage of</span></div>
|
---|
641 | <div class="txt" style="position:absolute; left:90px; top:192px;"><span class="p13f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">bibliographic data available on CD-ROM across more than one or two sites.</span></div>
|
---|
642 | <div class="txt" style="position:absolute; left:126px; top:216px;"><span class="p13f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">Furthermore, analysis of search requests by geographic location, institution,</span></div>
|
---|
643 | <div class="txt" style="position:absolute; left:90px; top:240px;"><span class="p13f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">and sometimes even individual user are also possible. As an example, Table 2 presents</span></div>
|
---|
644 | <div class="txt" style="position:absolute; left:90px; top:264px;"><span class="p13f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">a portion of the summary of usage statistics (broken down by domain code) for queries</span></div>
|
---|
645 | <div class="txt" style="position:absolute; left:90px; top:288px;"><span class="p13f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">to the computer science technical collection of the </span><span class="p13f1" style="font-size:9px;vertical-align:baseline;color:rgba(0,0,0,1);">NEW ZEALAND DIGITAL LIBRARY</span><span class="p13f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">.</span></div>
|
---|
646 | <div class="txt" style="position:absolute; left:90px; top:312px;"><span class="p13f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">Examination of the data indicates that the heaviest use of the collection comes from</span></div>
|
---|
647 | <div class="txt" style="position:absolute; left:90px; top:336px;"><span class="p13f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">North America, Europe (particularly Germany and Finland), as well as the local New</span></div>
|
---|
648 | <div class="txt" style="position:absolute; left:90px; top:360px;"><span class="p13f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">Zealand community and nearby Australia. As expected for such a collection, a large</span></div>
|
---|
649 | <div class="txt" style="position:absolute; left:90px; top:384px;"><span class="p13f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">proportion of users are from educational (.edu) institutions; surprisingly, however, a</span></div>
|
---|
650 | <div class="txt" style="position:absolute; left:90px; top:408px;"><span class="p13f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">similar number of queries come from commercial (.com) organizations, indicating</span></div>
|
---|
651 | <div class="txt" style="position:absolute; left:90px; top:432px;"><span class="p13f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">perhaps that the documents are seeing use in commercial research and development</span></div>
|
---|
652 | <div class="txt" style="position:absolute; left:90px; top:456px;"><span class="p13f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">units.</span></div>
|
---|
653 | <div class="txt" style="position:absolute; left:90px; top:492px;"><span class="p13f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">Table 2. Accesses to the </span><span class="p13f1" style="font-size:9px;vertical-align:baseline;color:rgba(0,0,0,1);">NEW ZEALAND DIGITAL LIBRARY </span><span class="p13f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">CS collection by Domain</span></div>
|
---|
654 | <div class="txt" style="position:absolute; left:90px; top:504px;"><span class="p13f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">Code</span></div>
|
---|
655 | <div class="txt" style="position:absolute; left:126px; top:555px;"><span class="p13f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">Of course, usage levels can also be further broken down by IP number</span></div>
|
---|
656 | <div class="txt" style="position:absolute; left:90px; top:579px;"><span class="p13f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">(indicating institutions), and systems requiring users to register may also be able to</span></div>
|
---|
657 | <div class="txt" style="position:absolute; left:90px; top:603px;"><span class="p13f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">analyze usage on an individual basis. Since the query strings themselves are also</span></div>
|
---|
658 | <div class="txt" style="position:absolute; left:90px; top:627px;"><span class="p13f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">recorded in the transaction logs, this domain/institution/individual activity could also be</span></div>
|
---|
659 | <div class="txt" style="position:absolute; left:90px; top:651px;"><span class="p13f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">linked to specific subjects through the query terms. Summaries of this type could be</span></div>
|
---|
660 | <div class="txt" style="position:absolute; left:90px; top:675px;"><span class="p13f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">invaluable for studies of geographic diffusion and distribution of research topics.</span></div>
|
---|
661 | <div class="txt" style="position:absolute; left:126px; top:699px;"><span class="p13f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">Transaction log analysis can also indicate time-related patterns in the</span></div>
|
---|
662 | <div class="txt" style="position:absolute; left:90px; top:723px;"><span class="p13f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">information seeking behavior of digital library users. As a sample of this type of</span></div>
|
---|
663 | <div class="txt" style="position:absolute; left:90px; top:747px;"><span class="p13f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">analysis, Paul Ginsparg notes a seven day periodicity in the number of search requests</span></div>
|
---|
664 | </div>
|
---|
665 | </div>
|
---|
666 |
|
---|
667 | </Content>
|
---|
668 | </Section>
|
---|
669 | <Section>
|
---|
670 | <Description>
|
---|
671 | <Metadata name="Title">Page 14</Metadata>
|
---|
672 | </Description>
|
---|
673 | <Content>
|
---|
674 | <div id="page14">
|
---|
675 | <div style="position: relative; height: 842px; width: 595px;"><style type="text/css">
|
---|
676 | .txt { white-space:nowrap; }
|
---|
677 | .p14f0 { font-family:sans-serif; font-weight:normal; font-style:normal; }
|
---|
678 | .p14f1 { font-family:serif; font-weight:normal; font-style:normal; }
|
---|
679 | .p14f2 { font-family:serif; font-weight:bold; font-style:normal; }
|
---|
680 | .p14f3 { font-family:sans-serif; font-weight:normal; font-style:normal; }
|
---|
681 | </style>
|
---|
682 | <img class="background" height="842" id="background14" src="_httpdocimg_/page14.png" style="position:absolute; left:0px; top:0px;" width="595">
|
---|
683 | <div class="txt" style="position:absolute; left:90px; top:72px;"><span class="p14f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">made to the </span><span class="p14f1" style="font-size:9px;vertical-align:baseline;color:rgba(0,0,0,1);">PHYSICS E</span><span class="p14f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">-</span><span class="p14f1" style="font-size:9px;vertical-align:baseline;color:rgba(0,0,0,1);">PRINT </span><span class="p14f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">archives (Figure 4, reproduced from [9]). From this he</span></div>
|
---|
684 | <div class="txt" style="position:absolute; left:90px; top:96px;"><span class="p14f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">adduces that many physicists do not yet have weekend access to the Internet (an</span></div>
|
---|
685 | <div class="txt" style="position:absolute; left:90px; top:120px;"><span class="p14f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">alternative, slightly more cynical hypothesis is that even high energy theoretical</span></div>
|
---|
686 | <div class="txt" style="position:absolute; left:90px; top:144px;"><span class="p14f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">physicists take the weekend off).</span></div>
|
---|
687 | <div class="txt" style="position:absolute; left:128px; top:192px;"><span class="p14f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">Figure 4. Summary of search requests to the physics pre-print archives</span></div>
|
---|
688 | <div class="txt" style="position:absolute; left:90px; top:240px;"><span class="p14f2" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">5. Conclusion</span></div>
|
---|
689 | <div class="txt" style="position:absolute; left:126px; top:288px;"><span class="p14f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">This study suggests opportunities for conducting bibliometric research on the</span></div>
|
---|
690 | <div class="txt" style="position:absolute; left:90px; top:312px;"><span class="p14f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">evolving digital libraries. These repositories are suitable platforms for conventional</span></div>
|
---|
691 | <div class="txt" style="position:absolute; left:90px; top:336px;"><span class="p14f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">bibliometric techniques (such as obsolescence studies, quantification of physical</span></div>
|
---|
692 | <div class="txt" style="position:absolute; left:90px; top:360px;"><span class="p14f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">characteristics of documents comprising a subject literature, time analysis, etc.). The</span></div>
|
---|
693 | <div class="txt" style="position:absolute; left:90px; top:384px;"><span class="p14f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">ability to directly monitor access to documents in digital libraries also enables</span></div>
|
---|
694 | <div class="txt" style="position:absolute; left:90px; top:408px;"><span class="p14f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">researchers to explicitly quantify document usage, as well as to implicitly measure</span></div>
|
---|
695 | <div class="txt" style="position:absolute; left:90px; top:432px;"><span class="p14f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">usage through citations. Additional facilities could aid in the performance of</span></div>
|
---|
696 | <div class="txt" style="position:absolute; left:90px; top:456px;"><span class="p14f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">bibliographic experiments, such as: improved tagging of document fields; provision of</span></div>
|
---|
697 | <div class="txt" style="position:absolute; left:90px; top:480px;"><span class="p14f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">utilities to strip out titles, authors, etc. from common document formats; and the ability</span></div>
|
---|
698 | <div class="txt" style="position:absolute; left:90px; top:504px;"><span class="p14f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">to easily eliminate duplicate entries from downloaded library subsets. Unfortunately,</span></div>
|
---|
699 | <div class="txt" style="position:absolute; left:90px; top:528px;"><span class="p14f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">the most useful of these additional facilities – those associated with a higher degree of</span></div>
|
---|
700 | <div class="txt" style="position:absolute; left:90px; top:552px;"><span class="p14f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">cataloging – run counter to the underlying philosophy of many digital libraries: to</span></div>
|
---|
701 | <div class="txt" style="position:absolute; left:90px; top:576px;"><span class="p14f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">avoid, if possible, manual processing and formal cataloging of documents. While</span></div>
|
---|
702 | <div class="txt" style="position:absolute; left:90px; top:600px;"><span class="p14f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">adherence to this principle can limit the accuracy of fielded searching (or indeed,</span></div>
|
---|
703 | <div class="txt" style="position:absolute; left:90px; top:624px;"><span class="p14f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">preclude it altogether), it can also avoid the cataloging bottleneck and permit digital</span></div>
|
---|
704 | <div class="txt" style="position:absolute; left:90px; top:648px;"><span class="p14f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">libraries to provide access to larger numbers of documents.</span></div>
|
---|
705 | <div class="txt" style="position:absolute; left:126px; top:672px;"><span class="p14f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">The digital libraries complement the information currently available through</span></div>
|
---|
706 | <div class="txt" style="position:absolute; left:90px; top:696px;"><span class="p14f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">paper, online, and CD-ROM bibliographic resources. While these latter databases</span></div>
|
---|
707 | <div class="txt" style="position:absolute; left:90px; top:720px;"><span class="p14f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">generally have the advantage of standardized formatting of bibliographic fields, the</span></div>
|
---|
708 | <div class="txt" style="position:absolute; left:90px; top:744px;"><span class="p14f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">digital libraries are freely accessible, often contain &quot;grey literature&quot; that is otherwise</span></div>
|
---|
709 | </div>
|
---|
710 | </div>
|
---|
711 |
|
---|
712 | </Content>
|
---|
713 | </Section>
|
---|
714 | <Section>
|
---|
715 | <Description>
|
---|
716 | <Metadata name="Title">Page 15</Metadata>
|
---|
717 | </Description>
|
---|
718 | <Content>
|
---|
719 | <div id="page15">
|
---|
720 | <div style="position: relative; height: 842px; width: 595px;"><style type="text/css">
|
---|
721 | .txt { white-space:nowrap; }
|
---|
722 | .p15f0 { font-family:sans-serif; font-weight:normal; font-style:normal; }
|
---|
723 | .p15f1 { font-family:serif; font-weight:normal; font-style:normal; }
|
---|
724 | .p15f2 { font-family:serif; font-weight:bold; font-style:normal; }
|
---|
725 | .p15f3 { font-family:serif; font-weight:normal; font-style:italic; }
|
---|
726 | .p15f4 { font-family:sans-serif; font-weight:normal; font-style:normal; }
|
---|
727 | </style>
|
---|
728 | <img class="background" height="842" id="background15" src="_httpdocimg_/page15.png" style="position:absolute; left:0px; top:0px;" width="595">
|
---|
729 | <div class="txt" style="position:absolute; left:90px; top:72px;"><span class="p15f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">unavailable for analysis, and generally make the full text of documents available. The</span></div>
|
---|
730 | <div class="txt" style="position:absolute; left:90px; top:96px;"><span class="p15f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">insights gained from analysis of digital libraries will add to the store of &quot;information</span></div>
|
---|
731 | <div class="txt" style="position:absolute; left:90px; top:120px;"><span class="p15f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">about information&quot; that we have gained from older types of bibliographic repositories.</span></div>
|
---|
732 | <div class="txt" style="position:absolute; left:90px; top:168px;"><span class="p15f2" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">References</span></div>
|
---|
733 | <div class="txt" style="position:absolute; left:94px; top:204px;"><span class="p15f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">[1] Bollacker, K.D., S. Lawrence, and C.L.Giles, CiteSeer: An Autonomous Web</span></div>
|
---|
734 | <div class="txt" style="position:absolute; left:126px; top:228px;"><span class="p15f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">Agent for Automatic Retrieval and Identification of Interesting Publications,</span></div>
|
---|
735 | <div class="txt" style="position:absolute; left:126px; top:252px;"><span class="p15f3" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">Proceedings of the Second International Conference on Autonomous Agents</span></div>
|
---|
736 | <div class="txt" style="position:absolute; left:126px; top:276px;"><span class="p15f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">(Minneapolis/St. Paul, May 9-13), 1998.</span></div>
|
---|
737 | <div class="txt" style="position:absolute; left:94px; top:300px;"><span class="p15f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">[2] Bowman, C.M., P.B. Danzig, U. Manber, and M.F. Schwartz, Scalable Internet</span></div>
|
---|
738 | <div class="txt" style="position:absolute; left:126px; top:324px;"><span class="p15f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">resource discovery: Research problems and approaches, </span><span class="p15f3" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">Communications of</span></div>
|
---|
739 | <div class="txt" style="position:absolute; left:126px; top:348px;"><span class="p15f3" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">the ACM 37(8) </span><span class="p15f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">(1994) 98-107.</span></div>
|
---|
740 | <div class="txt" style="position:absolute; left:95px; top:372px;"><span class="p15f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">[3] Burton, Hilary D. , Use of a virtual information system for bibliometric analysis,</span></div>
|
---|
741 | <div class="txt" style="position:absolute; left:126px; top:396px;"><span class="p15f3" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">Information Processing &amp; Management 24(1) </span><span class="p15f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">(1988) 39-44.</span></div>
|
---|
742 | <div class="txt" style="position:absolute; left:94px; top:420px;"><span class="p15f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">[4] Cunningham, S.J., An empirical investigation of the obsolescence rate for</span></div>
|
---|
743 | <div class="txt" style="position:absolute; left:126px; top:444px;"><span class="p15f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">information systems literature, </span><span class="p15f3" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">Library and Information Science</span></div>
|
---|
744 | <div class="txt" style="position:absolute; left:126px; top:468px;"><span class="p15f3" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">Research</span><span class="p15f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">., 1996, http://library.fgcu.edu/iclc/lisrissu.htm</span></div>
|
---|
745 | <div class="txt" style="position:absolute; left:97px; top:492px;"><span class="p15f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">[5] Cunningham, S.J., and D. Bocock, Obsolescence of computing literature.</span></div>
|
---|
746 | <div class="txt" style="position:absolute; left:126px; top:516px;"><span class="p15f3" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">Scientometrics 34(2) </span><span class="p15f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">(1995), pp. 255-262.</span></div>
|
---|
747 | <div class="txt" style="position:absolute; left:97px; top:540px;"><span class="p15f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">[6] Cunningham, S.J. and Lynn Silipigni Connaway, Information searching</span></div>
|
---|
748 | <div class="txt" style="position:absolute; left:126px; top:564px;"><span class="p15f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">preferences and practices of computer science researchers, </span><span class="p15f3" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">Proceedings of</span></div>
|
---|
749 | <div class="txt" style="position:absolute; left:126px; top:588px;"><span class="p15f3" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">OZCHI '96 </span><span class="p15f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">(1996) 294-299.</span></div>
|
---|
750 | <div class="txt" style="position:absolute; left:94px; top:612px;"><span class="p15f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">[7] de Solla Price, D.J., Citation measures of hard science, soft science, technology,</span></div>
|
---|
751 | <div class="txt" style="position:absolute; left:126px; top:636px;"><span class="p15f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">and nonscience. In: C.E. Nelson and D.K. Pollock (eds), </span><span class="p15f3" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">Communication</span></div>
|
---|
752 | <div class="txt" style="position:absolute; left:126px; top:660px;"><span class="p15f3" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">among scientists and engineers </span><span class="p15f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">(Heath Lexington, 1970).</span></div>
|
---|
753 | <div class="txt" style="position:absolute; left:95px; top:696px;"><span class="p15f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">[8] Garfield, E., </span><span class="p15f3" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">Citation Indexing: Its theory and application in Science, Technology</span></div>
|
---|
754 | <div class="txt" style="position:absolute; left:126px; top:720px;"><span class="p15f3" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">and Humanities (</span><span class="p15f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">Wiley, 1979).</span></div>
|
---|
755 | </div>
|
---|
756 | </div>
|
---|
757 |
|
---|
758 | </Content>
|
---|
759 | </Section>
|
---|
760 | <Section>
|
---|
761 | <Description>
|
---|
762 | <Metadata name="Title">Page 16</Metadata>
|
---|
763 | </Description>
|
---|
764 | <Content>
|
---|
765 | <div id="page16">
|
---|
766 | <div style="position: relative; height: 842px; width: 595px;"><style type="text/css">
|
---|
767 | .txt { white-space:nowrap; }
|
---|
768 | .p16f0 { font-family:sans-serif; font-weight:normal; font-style:normal; }
|
---|
769 | .p16f1 { font-family:serif; font-weight:normal; font-style:normal; }
|
---|
770 | .p16f2 { font-family:serif; font-weight:normal; font-style:italic; }
|
---|
771 | .p16f3 { font-family:sans-serif; font-weight:normal; font-style:normal; }
|
---|
772 | </style>
|
---|
773 | <img class="background" height="842" id="background16" src="_httpdocimg_/page16.png" style="position:absolute; left:0px; top:0px;" width="595">
|
---|
774 | <div class="txt" style="position:absolute; left:95px; top:72px;"><span class="p16f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">[9] Ginsparg, P. After dinner remarks: 14 Oct ’94 APS meeting at LANL, 1994</span></div>
|
---|
775 | <div class="txt" style="position:absolute; left:126px; top:96px;"><span class="p16f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">(&lt;URL: http://xxx.lanl.gov/blurb&gt; ).</span></div>
|
---|
776 | <div class="txt" style="position:absolute; left:95px; top:120px;"><span class="p16f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">[10] Ginsparg, P., First steps towards electronic research communication, </span><span class="p16f2" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">Computers</span></div>
|
---|
777 | <div class="txt" style="position:absolute; left:126px; top:144px;"><span class="p16f2" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">in Physics 8(4) </span><span class="p16f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">(1994) 390-401.</span></div>
|
---|
778 | <div class="txt" style="position:absolute; left:95px; top:168px;"><span class="p16f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">[11] Hallmark, J., Scientists' access and retrieval of references cited in their recent</span></div>
|
---|
779 | <div class="txt" style="position:absolute; left:126px; top:192px;"><span class="p16f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">journal articles, </span><span class="p16f2" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">College and Research Libraries 55(3) </span><span class="p16f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">(1994) 199-210.</span></div>
|
---|
780 | <div class="txt" style="position:absolute; left:95px; top:216px;"><span class="p16f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">[12] Hawkins, D.T. , Unconventional uses of on-line information retrieval systems:</span></div>
|
---|
781 | <div class="txt" style="position:absolute; left:126px; top:240px;"><span class="p16f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">on-line bibliometric studies, </span><span class="p16f2" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">Journal of the American Society for Information</span></div>
|
---|
782 | <div class="txt" style="position:absolute; left:126px; top:264px;"><span class="p16f2" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">Science 28 </span><span class="p16f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">(1977) 13-18.</span></div>
|
---|
783 | <div class="txt" style="position:absolute; left:95px; top:288px;"><span class="p16f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">[13] McGhee, P.E. , P.R. Skinner, K. Roberto, N.J. Ridenour, and S.M. Larson,</span></div>
|
---|
784 | <div class="txt" style="position:absolute; left:126px; top:312px;"><span class="p16f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">Using online databases to study current research trends: an online bibliometric</span></div>
|
---|
785 | <div class="txt" style="position:absolute; left:126px; top:336px;"><span class="p16f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">study, </span><span class="p16f2" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">Library and Information Science Research 9 </span><span class="p16f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">(1987) 285-291.</span></div>
|
---|
786 | <div class="txt" style="position:absolute; left:95px; top:360px;"><span class="p16f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">[14] Maly, K., E.A. Fox, J.C. French, and A.L. Selman, Wide area technical report</span></div>
|
---|
787 | <div class="txt" style="position:absolute; left:126px; top:384px;"><span class="p16f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">server (</span><span class="p16f2" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">Technical Report , </span><span class="p16f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">Dept. of Computer Science, Old Dominion</span></div>
|
---|
788 | <div class="txt" style="position:absolute; left:126px; top:408px;"><span class="p16f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">University, 1994. Also available at</span></div>
|
---|
789 | <div class="txt" style="position:absolute; left:471px; top:408px;"><span class="p16f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">&lt;URL:</span></div>
|
---|
790 | <div class="txt" style="position:absolute; left:126px; top:432px;"><span class="p16f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">http://www.cs.odu.edu/WATERS/WATERS-paper.ps&gt; ).</span></div>
|
---|
791 | <div class="txt" style="position:absolute; left:95px; top:456px;"><span class="p16f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">[15] Sigogneau, M.J. , S. Bain, J.P. Courtial, and H. Feillet, Scientific innovation in</span></div>
|
---|
792 | <div class="txt" style="position:absolute; left:126px; top:480px;"><span class="p16f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">bibliographical databases: a comparative study of the Science Citation Index</span></div>
|
---|
793 | <div class="txt" style="position:absolute; left:126px; top:504px;"><span class="p16f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">and the Pascal database, </span><span class="p16f2" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">Scientometrics 22(1) </span><span class="p16f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">(1991) 65-82.</span></div>
|
---|
794 | <div class="txt" style="position:absolute; left:95px; top:528px;"><span class="p16f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">[16] Witten, I.H., S.J. Cunningham, M. Vallabh, and T.C. Bell, A New Zealand</span></div>
|
---|
795 | <div class="txt" style="position:absolute; left:126px; top:552px;"><span class="p16f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">digital library for computer science research, </span><span class="p16f2" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">Proceedings of Digital Libraries</span></div>
|
---|
796 | <div class="txt" style="position:absolute; left:126px; top:576px;"><span class="p16f2" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">'95 </span><span class="p16f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">(1995) 25-30.</span></div>
|
---|
797 | <div class="txt" style="position:absolute; left:95px; top:600px;"><span class="p16f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">[17] Witten, I.H., C. Nevill-Manning, and S.J. Cunningham, A public library based</span></div>
|
---|
798 | <div class="txt" style="position:absolute; left:126px; top:624px;"><span class="p16f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">on full-text retrieval, </span><span class="p16f2" style="font-size:12px;vertical-align:baseline;color:rgba(0,0,0,1);">Communications of the ACM </span><span class="p16f1" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">41(4), 1998, p. 71</span></div>
|
---|
799 | </div>
|
---|
800 | </div>
|
---|
801 |
|
---|
802 | </Content>
|
---|
803 | </Section>
|
---|
804 | <Section>
|
---|
805 | <Description>
|
---|
806 | <Metadata name="Title">Page 17</Metadata>
|
---|
807 | </Description>
|
---|
808 | <Content>
|
---|
809 | <div id="page17">
|
---|
810 | <div style="position: relative; height: 842px; width: 595px;"><style type="text/css">
|
---|
811 | .txt { white-space:nowrap; }
|
---|
812 | .p17f0 { font-family:sans-serif; font-weight:normal; font-style:normal; }
|
---|
813 | .p17f1 { font-family:serif; font-weight:normal; font-style:normal; }
|
---|
814 | .p17f2 { font-family:serif; font-weight:normal; font-style:normal; }
|
---|
815 | .p17f3 { font-family:sans-serif; font-weight:normal; font-style:normal; }
|
---|
816 | </style>
|
---|
817 | <img class="background" height="842" id="background17" src="_httpdocimg_/page17.png" style="position:absolute; left:0px; top:0px;" width="595">
|
---|
818 | <div class="txt" style="position:absolute; left:90px; top:111px;"><span class="p17f1" style="font-size:6px;vertical-align:baseline;color:rgba(0,0,0,1);">1</span><span class="p17f2" style="font-size:11px;vertical-align:sub;color:rgba(0,0,0,1);">Documents were randomly sampled from the DEC</span></div>
|
---|
819 | <div class="txt" style="position:absolute; left:90px; top:135px;"><span class="p17f2" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">(ftp://crl.dec.com/pub/DEC/CRL/tech-reports/), Sony</span></div>
|
---|
820 | <div class="txt" style="position:absolute; left:90px; top:159px;"><span class="p17f2" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">(ftp://ftp.csl.sony.co.jp/CSL/CSL-Papers), and Ohio (ftp://archive.cis.ohio-</span></div>
|
---|
821 | <div class="txt" style="position:absolute; left:90px; top:183px;"><span class="p17f2" style="font-size:11px;vertical-align:baseline;color:rgba(0,0,0,1);">state.edu/pub/tech-report/) technical report repositories</span></div>
|
---|
822 | </div>
|
---|
823 | </div>
|
---|
824 |
|
---|
825 | </Content>
|
---|
826 | </Section>
|
---|
827 | </Section>
|
---|
828 | </Section>
|
---|
829 | </Archive>
|
---|