source: trunk/gsdl/src/recpt/comtypes.h@ 13017

Last change on this file since 13017 was 12863, checked in by kjdon, 18 years ago

added in stemIndexes to colinfo_t, plus some #defines. stemIndexes tells us whether we have casefold/stem/accentfold indexes

  • Property svn:executable set to *
  • Property svn:keywords set to Author Date Id Revision
File size: 11.3 KB
Line 
1/**********************************************************************
2 *
3 * comtypes.h --
4 * Copyright (C) 1999,2004 The New Zealand Digital Library Project
5 *
6 * A component of the Greenstone digital library software
7 * from the New Zealand Digital Library Project at the
8 * University of Waikato, New Zealand.
9 *
10 * This program is free software; you can redistribute it and/or modify
11 * it under the terms of the GNU General Public License as published by
12 * the Free Software Foundation; either version 2 of the License, or
13 * (at your option) any later version.
14 *
15 * This program is distributed in the hope that it will be useful,
16 * but WITHOUT ANY WARRANTY; without even the implied warranty of
17 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
18 * GNU General Public License for more details.
19 *
20 * You should have received a copy of the GNU General Public License
21 * along with this program; if not, write to the Free Software
22 * Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
23 *
24 *********************************************************************/
25
26
27#ifndef COMTYPES_H
28#define COMTYPES_H
29
30#include "gsdlconf.h"
31#include "text_t.h"
32
33#if defined(GSDL_USE_OBJECTSPACE)
34# include <ospace\std\vector>
35# include <ospace\std\list>
36# include <ospace\std\memory> // for pair
37# include <ospace\std\map>
38#elif defined(GSDL_USE_STL_H)
39# include <vector.h>
40# include <list.h>
41# include <memory.h> // for pair
42# include <map.h>
43#else
44# include <vector>
45# include <list>
46# include <memory> // for pair
47# include <map>
48#endif
49
50
// Enumerated error codes. noError is the first enumerator, so it has the
// value 0; the remaining codes follow in declaration order (1..5).
51enum comerror_t {noError, authenticationFailure, protocolError,
52 configurationError, systemProblem, syntaxError};
// Maps a comerror_t to a text_t. Only declared here; the definition is not in
// this header. Presumably the result is a human-readable message -- confirm.
53text_t get_comerror_string (comerror_t err);
54
55
56// ShortColInfo ::= SEQUENCE {
57// name GeneralString,
58// host GeneralString,
59// port INTEGER
60// }
// Name/host/port triple; the members mirror the ShortColInfo SEQUENCE
// sketched in the comment directly above.
61struct ShortColInfo_t {
62 void clear (); // declared only; defined outside this header
63 ShortColInfo_t () {clear();} // construction delegates all initialisation to clear()
64
65 text_t name;
66 text_t host;
67 int port; // plain int with no initialiser here; its starting value is whatever clear() assigns
68};
69
70// for collection metadata: metadata name -> lang -> value
71// for collection macros: macro name -> params -> value
// Two-level lookup: the outer map is keyed by text_t and ordered by lttext_t;
// each mapped value is itself a text_tmap.
72typedef map<text_t, text_tmap, lttext_t> collectionmeta_map;
73
// Flag value for ColInfoResponse_t::ccsOptions.
74#define CCSUniformSearchResultsFormatting 1
75
// Flag values for ColInfoResponse_t::stemIndexes. The values are distinct
// powers of two, so they can be combined with bitwise OR.
76#define SIcasefold 1
77#define SIstem 2
78#define SIaccentfold 4
79
// Collection-level information record. The constructor only calls clear(),
// so the starting value of every member is whatever clear() establishes
// (clear() is defined outside this header).
80struct ColInfoResponse_t {
81 void clear (); // declared only; defined outside this header
82 ColInfoResponse_t () {clear();}
83 text_t get_collectionmeta(text_t name, text_t lang); // arguments are taken by value; presumably looks up collectionmeta by name then lang -- confirm in the implementation
84
85 ShortColInfo_t shortInfo;
86 bool isPublic;
87 bool isBeta;
88 bool isSegmented;
89 unsigned long buildDate;
90 text_tarray ccsCols; // empty if collection does not use cross-collection searching
91 int ccsOptions; // uses the CCS #defines from above
92 int stemIndexes; // uses the SI #defines from above (casefold/stem/accentfold flags)
93 text_tarray languages;
94 unsigned long numDocs; // 0 if not known
95 unsigned long numSections; // 0 if not known
96 unsigned long numWords; // 0 if not known
97 unsigned long numBytes; // 0 if not known
98 collectionmeta_map collectionmeta; // metadata name -> lang -> value
99 text_tmap format;
100 collectionmeta_map collection_macros; // for collectionmacro config directive (> gsdl 2.53); macro name -> params -> value
101 text_tmap building;
102 text_t httpdomain; // GRB: do these two http items (httpdomain, httpprefix) need removing?
103 text_t httpprefix;
104 text_t receptionist;
105 text_t buildType; // 'mg' or 'mgpp' or 'lucene'
106 text_t authenticate; // 'document' or 'collection'
107 text_t auth_group; // 'mygroup' 'yourgroup'
108 text_tmap public_documents; // the acl to allow access to listed documents
109 text_tmap private_documents; // the acl to disallow access to listed documents
110};
111
112
113// -- filter options which might be supported for the QueryFilter
114// --
115// -- onePerQuery StartResults integer
116// -- onePerQuery EndResults integer
117// -- onePerQuery QueryType enumerated (boolean, ranked)
118// -- onePerTerm Term string ???
119// -- onePerTerm Casefold boolean
120// -- onePerTerm Stem boolean
121// -- onePerTerm Index enumerated
122// -- onePerTerm Subcollection enumerated
123// --
124// -- filter options which might be supported for the BrowseFilter
125// --
126// -- onePerQuery StartResults integer
127// -- onePerQuery EndResults integer
128// -- onePerQuery ParentNode string ("" will return the browsing available)
129// --
130// -- The NullFilter always returns the set it was given, it doesn't have
131// -- any options
132
133// InfoFiltersResponse ::= SEQUENCE {
134// filterNames StringSet
135// }
// Holds the set of filter names (the filterNames field of the
// InfoFiltersResponse SEQUENCE sketched above).
// NOTE(review): no constructor is declared here, so clear() is not invoked
// automatically on construction, unlike several other structs in this header.
136struct InfoFiltersResponse_t {
137 void clear (); // declared only; defined outside this header
138
139 text_tset filterNames;
140};
141
142// InfoFilterOptionsRequest ::= SEQUENCE {
143// filterName GeneralString
144// }
// Carries a single filter name (the filterName field of the
// InfoFilterOptionsRequest SEQUENCE sketched above).
// NOTE(review): no constructor is declared here, so clear() is not invoked
// automatically on construction.
145struct InfoFilterOptionsRequest_t {
146 void clear (); // declared only; defined outside this header
147
148 text_t filterName;
149};
150
151// FilterOption ::= SEQUENCE {
152// name GeneralString,
153// type ENUMERATED {booleant(0), integert(1), enumeratedt(2), stringt(3)},
154// repeatable ENUMERATED {onePerQuery(0), onePerTerm(1), nPerTerm(2)},
155// defaultValue GeneralString,
156// -- the interpretation of the validValues depends on the type
157// -- for boolean: the first value is the false value, the second is true value
158// -- for integer: the first value is the minimum, the second the maximum
159// -- for enumerated: all values are listed
160// -- for string: this value is ignored
161// validValues StringSequence
162// }
// Description of one filter option. The members and the numeric values of
// both nested enums match the FilterOption SEQUENCE sketched above.
163struct FilterOption_t {
164 void clear (); // declared only; defined outside this header
165 void check_defaultValue (); // declared only; presumably validates defaultValue against validValues -- confirm in the implementation
166 FilterOption_t () {clear();} // construction delegates all initialisation to clear()
167
168 text_t name;
169
170 enum type_t {booleant=0, integert=1, enumeratedt=2, stringt=3};
171 type_t type; // decides how validValues is to be interpreted (see the comment above)
172
173 enum repeatable_t {onePerQuery=0, onePerTerm=1, nPerTerm=2};
174 repeatable_t repeatable;
175
176 text_t defaultValue;
177 text_tarray validValues; // boolean: {false, true}; integer: {min, max}; enumerated: every value; string: ignored
178};
179
// Equality and ordering for FilterOption_t. Only declared here; which members
// take part in the comparison is decided by the definitions, which are not
// in this header.
180bool operator==(const FilterOption_t &x, const FilterOption_t &y);
181bool operator<(const FilterOption_t &x, const FilterOption_t &y);
182
183
// FilterOption_t values keyed by text_t and ordered by lttext_t.
// Presumably the key is the option name -- confirm against the code that fills it.
184typedef map<text_t, FilterOption_t, lttext_t> FilterOption_tmap;
185
186
187// InfoFilterOptionsResponse ::= SEQUENCE {
188// filterOptions SET OF FilterOption
189// }
// Holds the options of a filter as a FilterOption_tmap (the ASN.1 sketch above
// describes this as a SET OF FilterOption).
// NOTE(review): no constructor is declared here, so clear() is not invoked
// automatically on construction.
190struct InfoFilterOptionsResponse_t {
191 void clear (); // declared only; defined outside this header
192
193 FilterOption_tmap filterOptions;
194};
195
196
197// OptionValue ::= SEQUENCE {
198// name GeneralString,
199// value GeneralString
200// }
// One name/value pair, both held as text_t (see the OptionValue SEQUENCE above).
// NOTE(review): no constructor is declared here, so clear() is not invoked
// automatically on construction.
201struct OptionValue_t {
202 void clear (); // declared only; defined outside this header
203
204 text_t name;
205 text_t value;
206};
207
// Ordered sequence of option values; used for FilterRequest_t::filterOptions.
208typedef vector<OptionValue_t> OptionValue_tarray;
209
210
211// -- Terms are presented in the same order that they are requested,
212// -- any information relating to the terms is in reference to the
213// -- index specified for that term.
214//
215// FilterRequest ::= SEQUENCE {
216// filterName [0] GeneralString,
217// filterOptions [1] IMPLICIT SEQUENCE OF OptionValue,
218// docSet [2] IMPLICIT StringSequence, -- the OID "" represents everything
219// filterResultOptions [3] IMPLICIT BIT STRING {termFreq(0), matchTerms(1), OID(2),
220// subCol(3), ranking(4), docFreq(5),
221// metadata(6)},
222//
223// -- the next set of options are for the metadata request,
224// -- they can be left blank if metadata is not wanted
225// requestParams [4] IMPLICIT GeneralString, -- used to negotiate the metadata content
226// refParams [5] IMPLICIT GeneralString, -- used to decide whether to return a
227// -- reference to the data or the actual data
228// fields [6] IMPLICIT StringSet,
229// getParents [7] IMPLICIT BOOLEAN -- gets metadata of all parents too
230// }
// Flag values for FilterRequest_t::filterResultOptions. Each value is a
// distinct power of two, so flags can be combined with bitwise OR.
// FRtermFreq .. FRmetadata equal 1 << n for the bit positions 0..6 named in
// the filterResultOptions BIT STRING of the ASN.1 sketch above.
231#define FRtermFreq 1
232#define FRmatchTerms 2
233#define FROID 4
234#define FRsubCol 8
235#define FRranking 16
236#define FRdocFreq 32
237#define FRmetadata 64
238// used to indicate a full text browse query for mgpp (has no counterpart in the ASN.1 sketch above)
239#define FRfullTextBrowse 128
240
// A filter request: which filter to run, its option values, the documents to
// consider and which pieces of result information are wanted. Field meanings
// follow the FilterRequest SEQUENCE sketched above; filterLang does not
// appear in that sketch.
241struct FilterRequest_t {
242 void clear (); // declared only; defined outside this header
243 FilterRequest_t () {clear();} // construction delegates all initialisation to clear()
244
245 text_t filterName;
246 text_t filterLang; // non-empty if the information should be retrieved in a specific language
247 OptionValue_tarray filterOptions;
248 text_tarray docSet; // empty if not used
249 int filterResultOptions; // use the FR* defines above
250
251 text_t requestParams; // empty if not used
252 text_t refParams; // empty if not used
253 text_tset fields; // empty if not used
254 bool getParents; // defaults to false
255};
256
257
258// TermInfo ::= SEQUENCE {
259// term [0] GeneralString,
260// freq [1] IMPLICIT INTEGER, -- 0 if not requested
261// matchTerms [2] IMPLICIT StringSequence -- empty if not requested
262// }
// Per-term result information; members mirror the TermInfo SEQUENCE above.
263struct TermInfo_t {
264 void clear (); // declared only; defined outside this header
265 TermInfo_t () {clear();} // construction delegates all initialisation to clear()
266
267 text_t term;
268 int freq; // 0 if not requested
269 text_tarray matchTerms; // empty if not requested
270};
271
// Ordered sequence of TermInfo_t; used for FilterResponse_t::termInfo.
272typedef vector<TermInfo_t> TermInfo_tarray;
273
274
275// MetadataInfo ::= SEQUENCE {
276// params [0] IMPLICIT GeneralString,
277// isRef [1] IMPLICIT BOOLEAN,
278// values [3] IMPLICIT SEQUENCE OF GeneralString,
279// name [4] IMPLICIT GeneralString
280// }
// Values of one piece of metadata, plus a pointer to a further
// MetadataInfo_t called `parent`.
// Differences from the MetadataInfo SEQUENCE sketched above: there is no
// `name` member here, and `parent` has no counterpart in the sketch.
281struct MetadataInfo_t {
282 text_t params;
283 bool isRef;
284 text_tarray values;
285 MetadataInfo_t *parent; // NOTE(review): raw pointer; ownership is not visible in this header -- check the copy constructor, destructor and operator= definitions
286
287 void clear (); // declared only; defined outside this header
288 MetadataInfo_t (); // declared only, so whether it calls clear() cannot be seen here
289 MetadataInfo_t (const MetadataInfo_t &x); // copy constructor
290 ~MetadataInfo_t ();
291 MetadataInfo_t &operator=(const MetadataInfo_t &x);
292};
293
// MetadataInfo_t values keyed by text_t and ordered by lttext_t.
// Presumably the key is the metadata name -- confirm against the code that fills it.
294typedef map<text_t, MetadataInfo_t, lttext_t> MetadataInfo_tmap;
295
296// ResultDocInfo ::= SEQUENCE {
297// OID [0] IMPLICIT GeneralString,
298// ranking [1] IMPLICIT INTEGER, -- 0 if not requested, range 0-10000
299// docFreq [2] IMPLICIT SEQUENCE OF INTEGER, -- empty if not requested
300// metadata [3] IMPLICIT SEQUENCE OF MetadataInfo, -- no longer a SEQUENCE (SET maybe??)
301// classifier_metadata_type [4] IMPLICIT GeneralString, -- empty if not requested
302// classifier_metadata_offset [5] IMPLICIT INTEGER, -- 0 if not requested
303// }
// Result information for one document. Compared with the ResultDocInfo
// SEQUENCE sketched above, this struct additionally carries result_num,
// num_terms_matched and num_phrase_match.
304struct ResultDocInfo_t {
305 void clear (); // declared only; defined outside this header
306 ResultDocInfo_t () {clear();} // construction delegates all initialisation to clear()
307
308 text_t OID;
309 int result_num; // place in results list
310 int ranking; // 0 if not requested (real ranking*10000)
311 int num_terms_matched; // not available on all versions of mg
312 int num_phrase_match; // not available on all versions of mg
313 vector<int> docFreq; // empty if not requested
314 MetadataInfo_tmap metadata; // empty if not requested
315 text_t classifier_metadata_type; // empty if not requested
316 int classifier_metadata_offset; // 0 if not requested
317 ResultDocInfo_t &operator=(const ResultDocInfo_t &x); // user-declared assignment, defined outside this header; no copy constructor is declared alongside it
318};
319
// Ordered sequence of ResultDocInfo_t; used for FilterResponse_t::docInfo.
320typedef vector<ResultDocInfo_t> ResultDocInfo_tarray;
321
322
323// FilterResponse ::= SEQUENCE {
324// numDocs [0] IMPLICIT INTEGER,
325// isApprox [1] ENUMERATED {Exact(0), Approximate(1), MoreThan(2)}, -- whether numDocs is approximate
326// termInfo [2] IMPLICIT SEQUENCE OF TermInfo, -- empty if not required
327// docInfo [3] IMPLICIT SEQUENCE OF ResultDocInfo -- empty if not required
328// }
329
// Says how FilterResponse_t::numDocs is to be read; the values match the
// isApprox ENUMERATED in the FilterResponse sketch above.
330enum isapprox {Exact=0, Approximate=1, MoreThan=2};
331
// Result of a filter request. Compared with the FilterResponse SEQUENCE
// sketched above, this struct additionally carries error_message and stopwords.
332struct FilterResponse_t {
333 void clear (); // declared only; defined outside this header
334 FilterResponse_t () {clear();} // construction delegates all initialisation to clear()
335
336 text_t error_message; // Currently only used by Lucene
337 int numDocs;
338 isapprox isApprox; // whether numDocs is exact, approximate or a lower bound ("MoreThan")
339 TermInfo_tarray termInfo; // empty if not requested
340 ResultDocInfo_tarray docInfo; // empty if not requested
341 text_tset stopwords;
342
343 FilterResponse_t &operator=(const FilterResponse_t &x); // user-declared assignment, defined outside this header
344};
345
346
347// DocumentRequest ::= SEQUENCE {
348// OID GeneralString,
349// docType GeneralString,
350// docFormat GeneralString
351// }
// Request for a document: its OID plus the wanted type and format, all held
// as text_t (see the DocumentRequest SEQUENCE above).
352struct DocumentRequest_t {
353 void clear (); // declared only; defined outside this header
354 DocumentRequest_t () {clear();} // construction delegates all initialisation to clear()
355
356 text_t OID;
357 text_t docType;
358 text_t docFormat;
359};
360
361
362// DocumentResponse ::= SEQUENCE {
363// doc OCTET STRING
364// }
365
// Response carrying a document. The sketch above describes `doc` as an
// OCTET STRING; here it is stored as a text_t.
366struct DocumentResponse_t {
367 void clear (); // declared only; defined outside this header
368 DocumentResponse_t () {clear();} // construction delegates all initialisation to clear()
369
370 text_t doc;
371};
372
373
374#endif
375
Note: See TracBrowser for help on using the repository browser.