source: gsdl/trunk/src/colservr/sqlbrowsefilter.cpp@ 16180

Last change on this file since 16180 was 16180, checked in by mdewsnip, 16 years ago

Modifying get_metadata_values() and get_documents_with_metadata_value() to take an array of metadata elements, rather than just one metadata element. This allows building a dynamic classifier on multiple metadata elements.

File size: 6.9 KB
Line 
1/**********************************************************************
2 *
3 * sqlbrowsefilter.cpp --
4 * Copyright (C) 2008 DL Consulting Ltd
5 *
6 * A component of the Greenstone digital library software
7 * from the New Zealand Digital Library Project at the
8 * University of Waikato, New Zealand.
9 *
10 * This program is free software; you can redistribute it and/or modify
11 * it under the terms of the GNU General Public License as published by
12 * the Free Software Foundation; either version 2 of the License, or
13 * (at your option) any later version.
14 *
15 * This program is distributed in the hope that it will be useful,
16 * but WITHOUT ANY WARRANTY; without even the implied warranty of
17 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
18 * GNU General Public License for more details.
19 *
20 * You should have received a copy of the GNU General Public License
21 * along with this program; if not, write to the Free Software
22 * Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
23 *
24 *********************************************************************/
25
26#include "sqlbrowsefilter.h"
27#include "fileutil.h"
28
29
30sqlbrowsefilterclass::sqlbrowsefilterclass ()
31{
32 sql_db_ptr = NULL;
33}
34
35
36sqlbrowsefilterclass::~sqlbrowsefilterclass ()
37{
38}
39
40
41void sqlbrowsefilterclass::configure (const text_t &key, const text_tarray &cfgline)
42{
43 filterclass::configure (key, cfgline);
44
45 if (key == "indexstem")
46 {
47 indexstem = cfgline[0];
48 }
49}
50
51
52bool sqlbrowsefilterclass::init (ostream &logout)
53{
54 outconvertclass text_t2ascii;
55
56 if (!filterclass::init(logout)) return false;
57
58 if (sql_db_ptr == NULL)
59 {
60 // most likely a configuration problem
61 logout << text_t2ascii << "configuration error: sqlbrowsefilter contains a null sqldbclass\n\n";
62 return false;
63 }
64
65 if (indexstem.empty())
66 {
67 indexstem = collection;
68 }
69
70 // get the filename for the database and make sure it exists
71 sql_db_filename = filename_cat(dbhome, "collect", collection, "index", "text", indexstem);
72 sql_db_filename += sql_db_ptr->getfileextension();
73 if (!file_exists(sql_db_filename))
74 {
75 logout << text_t2ascii << "warning: database \"" << sql_db_filename << "\" does not exist\n\n";
76 return false;
77 }
78
79 return true;
80}
81
82
83void sqlbrowsefilterclass::filter (const FilterRequest_t &request,
84 FilterResponse_t &response,
85 comerror_t &err, ostream &logout)
86{
87 outconvertclass text_t2ascii;
88
89 response.clear();
90 err = noError;
91
92 if (sql_db_ptr == NULL) {
93 // most likely a configuration problem
94 logout << text_t2ascii << "configuration error: sqlbrowsefilter contains a null sqldbclass\n\n";
95 err = configurationError;
96 return;
97 }
98
99 // open the database
100 sql_db_ptr->setlogout (&logout);
101 if (!sql_db_ptr->opendatabase (sql_db_filename, DB_READER, 100, false)) {
102 // most likely a system problem (we have already checked that the database exists)
103 logout << text_t2ascii << "system problem: open on database \"" << sql_db_filename << "\" failed\n\n";
104 err = systemProblem;
105 return;
106 }
107
108 // Request for the metadata values assigned to an element
109 if (request.requestParams == "GetMetadataValues")
110 {
111 text_tarray metadata_element_names;
112 text_t metadata_value_filter = "";
113 text_t metadata_value_grouping_expression = "";
114 OptionValue_tarray::const_iterator options_iterator = request.filterOptions.begin();
115 while (options_iterator != request.filterOptions.end())
116 {
117 if ((*options_iterator).name == "MetadataElements")
118 {
119 splitchar ((*options_iterator).value.begin(), (*options_iterator).value.end(), ',', metadata_element_names);
120 }
121 if ((*options_iterator).name == "MetadataValueFilter")
122 {
123 metadata_value_filter = (*options_iterator).value;
124 }
125 if ((*options_iterator).name == "MetadataValueGroupingExpression")
126 {
127 metadata_value_grouping_expression = (*options_iterator).value;
128 }
129 options_iterator++;
130 }
131
132 text_tarray metadata_values = sql_db_ptr->get_metadata_values (metadata_element_names, metadata_value_filter, metadata_value_grouping_expression);
133
134 // Create a map from metadata value to ResultDocInfo_t, to remove duplicate values and obtain occurrence counts
135 map<text_t, ResultDocInfo_t> unique_metadata_values_map;
136 text_tarray::iterator metadata_value_iterator = metadata_values.begin();
137 while (metadata_value_iterator != metadata_values.end())
138 {
139 text_t metadata_value = *metadata_value_iterator;
140
141 // If no ResultDocInfo_t has already been created for this metadata value, create one now
142 if (unique_metadata_values_map.find(metadata_value) == unique_metadata_values_map.end())
143 {
144 ResultDocInfo_t metadata_value_result_doc;
145 metadata_value_result_doc.OID = metadata_value;
146 metadata_value_result_doc.result_num = 1;
147 unique_metadata_values_map[metadata_value] = metadata_value_result_doc;
148 }
149 // Otherwise we've seen this value before, so just update the occurrence count
150 else
151 {
152 unique_metadata_values_map[metadata_value].result_num++;
153 }
154
155 metadata_value_iterator++;
156 }
157
158 // Fill in response.docInfo with the ResultDocInfo_t objects we've created above
159 map<text_t, ResultDocInfo_t>::iterator unique_metadata_values_iterator = unique_metadata_values_map.begin();
160 while (unique_metadata_values_iterator != unique_metadata_values_map.end())
161 {
162 response.docInfo.push_back ((*unique_metadata_values_iterator).second);
163 unique_metadata_values_iterator++;
164 }
165 }
166
167 // Request for the documents with a certain metadata value assigned
168 else if (request.requestParams == "GetDocumentsWithMetadataValue")
169 {
170 text_tarray metadata_element_names;
171 text_t metadata_value = "";
172 text_t sort_by_metadata_element_name = "";
173 OptionValue_tarray::const_iterator options_iterator = request.filterOptions.begin();
174 while (options_iterator != request.filterOptions.end())
175 {
176 if ((*options_iterator).name == "MetadataElements")
177 {
178 splitchar ((*options_iterator).value.begin(), (*options_iterator).value.end(), ',', metadata_element_names);
179 }
180 if ((*options_iterator).name == "MetadataValue")
181 {
182 metadata_value = (*options_iterator).value;
183 }
184 if ((*options_iterator).name == "SortByMetadataElement")
185 {
186 sort_by_metadata_element_name = (*options_iterator).value;
187 }
188 options_iterator++;
189 }
190
191 text_tarray document_OIDs = sql_db_ptr->get_documents_with_metadata_value (metadata_element_names, metadata_value, sort_by_metadata_element_name);
192
193 // Fill in response.docInfo with the document OIDs
194 text_tarray::iterator document_OID_iterator = document_OIDs.begin();
195 while (document_OID_iterator != document_OIDs.end())
196 {
197 ResultDocInfo_t document_result_doc;
198 document_result_doc.OID = *document_OID_iterator;
199 response.docInfo.push_back (document_result_doc);
200 document_OID_iterator++;
201 }
202 }
203
204 sql_db_ptr->closedatabase(); // Important that local library doesn't leave any files open
205}
Note: See TracBrowser for help on using the repository browser.