source: gsdl/trunk/src/recpt/dynamicclassifieraction.cpp@ 16112

Last change on this file since 16112 was 16112, checked in by mdewsnip, 16 years ago

Removed some duplicate code by calling display_classifier_nodes() from output_grouping_nodes().

  • Property svn:executable set to *
File size: 22.0 KB
Line 
1/**********************************************************************
2 *
3 * dynamicclassifieraction.cpp --
4 * Copyright (C) 2008 DL Consulting Ltd
5 *
6 * A component of the Greenstone digital library software
7 * from the New Zealand Digital Library Project at the
8 * University of Waikato, New Zealand.
9 *
10 * This program is free software; you can redistribute it and/or modify
11 * it under the terms of the GNU General Public License as published by
12 * the Free Software Foundation; either version 2 of the License, or
13 * (at your option) any later version.
14 *
15 * This program is distributed in the hope that it will be useful,
16 * but WITHOUT ANY WARRANTY; without even the implied warranty of
17 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
18 * GNU General Public License for more details.
19 *
20 * You should have received a copy of the GNU General Public License
21 * along with this program; if not, write to the Free Software
22 * Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
23 *
24 *********************************************************************/
25
26#include "dynamicclassifieraction.h"
27#include "recptprototools.h"
28
29
30dynamicclassifieraction::dynamicclassifieraction ()
31{
32 recpt = NULL;
33
34 cgiarginfo arg_ainfo;
35 arg_ainfo.shortname = "dcl";
36 arg_ainfo.longname = "dynamic classifier ID";
37 arg_ainfo.multiplechar = true;
38 arg_ainfo.defaultstatus = cgiarginfo::weak;
39 arg_ainfo.argdefault = "";
40 arg_ainfo.savedarginfo = cgiarginfo::must;
41 argsinfo.addarginfo (NULL, arg_ainfo);
42
43 arg_ainfo.shortname = "dcn";
44 arg_ainfo.longname = "dynamic classifier node";
45 arg_ainfo.multiplechar = true;
46 arg_ainfo.defaultstatus = cgiarginfo::weak;
47 arg_ainfo.argdefault = "";
48 arg_ainfo.savedarginfo = cgiarginfo::must;
49 argsinfo.addarginfo (NULL, arg_ainfo);
50}
51
52
53dynamicclassifieraction::~dynamicclassifieraction()
54{
55}
56
57
58bool dynamicclassifieraction::check_cgiargs (cgiargsinfoclass &argsinfo, cgiargsclass &args,
59 recptprotolistclass *protos, ostream &logout)
60{
61 return true;
62}
63
64
65void dynamicclassifieraction::get_cgihead_info (cgiargsclass &args, recptprotolistclass *protos,
66 response_t &response,text_t &response_data,
67 ostream &logout)
68{
69 response = content;
70 response_data = "text/html";
71}
72
73
74// define all the macros which might be used by other actions to produce pages.
75void dynamicclassifieraction::define_external_macros (displayclass &disp, cgiargsclass &args,
76 recptprotolistclass *protos, ostream &logout)
77{
78 // A valid collection server is vital
79 recptproto *collectproto = protos->getrecptproto (args["c"], logout);
80 if (collectproto == NULL)
81 {
82 logout << "dynamicclassifieraction::define_external_macros called with NULL collectproto\n";
83 return;
84 }
85
86 // Define _dynamicclassifiernavbarentries_ to add buttons to the navigation bar for the dynamic classifiers
87 text_t navigation_bar_entries = "";
88 ColInfoResponse_t *cinfo = recpt->get_collectinfo_ptr (collectproto, args["c"], logout);
89 text_tmap::iterator dynamic_classifier_iterator = cinfo->dynamic_classifiers.begin();
90 while (dynamic_classifier_iterator != cinfo->dynamic_classifiers.end())
91 {
92 text_t dynamic_classifier_id = (*dynamic_classifier_iterator).first;
93 navigation_bar_entries += "_navbarspacer_";
94 navigation_bar_entries += "_navtab_(_gwcgi_?c=" + args["c"] + "&amp;a=dc&amp;dcl=" + dynamic_classifier_id + "," + dynamic_classifier_id;
95 if (args["a"] == "dc" && args["dcl"] == dynamic_classifier_id)
96 {
97 navigation_bar_entries += ",selected";
98 }
99 navigation_bar_entries += ")";
100 dynamic_classifier_iterator++;
101 }
102
103 disp.setmacro("dynamicclassifiernavbarentries", displayclass::defaultpackage, navigation_bar_entries);
104}
105
106
107// define all the macros which are related to pages generated
108// by this action. we also load up the formatinfo structure
109// here (it's used in do_action as well as here)
110void dynamicclassifieraction::define_internal_macros (displayclass &disp, cgiargsclass &args,
111 recptprotolistclass *protos, ostream &logout)
112{
113 // define_internal_macros sets the following macros:
114}
115
116
117bool dynamicclassifieraction::do_action(cgiargsclass &args, recptprotolistclass *protos,
118 browsermapclass *browsers, displayclass &disp,
119 outconvertclass &outconvert, ostream &textout,
120 ostream &logout)
121{
122 // A valid collection server is vital
123 recptproto *collectproto = protos->getrecptproto (args["c"], logout);
124 if (collectproto == NULL)
125 {
126 logout << "dynamicclassifieraction::do_action called with NULL collectproto\n";
127 return false;
128 }
129
130 textout << outconvert << disp << "_dynamicclassifier:header_\n";
131 textout << outconvert << disp << "_dynamicclassifier:content_\n";
132
133 // Check a dynamic classifier ID has been specified
134 text_t arg_dcl = args["dcl"];
135 if (arg_dcl.empty())
136 {
137 textout << outconvert << disp << "Error: Missing dcl argument.\n";
138 textout << outconvert << disp << "_dynamicclassifier:footer_\n";
139 return true;
140 }
141
142 // Check the dynamic classifier ID is valid (ie. there is an entry in the collect.cfg file for it)
143 ColInfoResponse_t *cinfo = recpt->get_collectinfo_ptr (collectproto, args["c"], logout);
144 if (cinfo->dynamic_classifiers.find(arg_dcl) == cinfo->dynamic_classifiers.end())
145 {
146 textout << outconvert << disp << "Error: Invalid dcl value \"" << arg_dcl << "\".\n";
147 textout << outconvert << disp << "_dynamicclassifier:footer_\n";
148 return true;
149 }
150
151 // Parse the classifier options from the specification
152 text_t classifier_specification = cinfo->dynamic_classifiers[arg_dcl];
153 text_tmap classifier_options = parse_classifier_options (classifier_specification, args);
154
155 // Output the "<ID>Header" format statement if there is one
156 text_t classifier_header_format_statement = "";
157 get_formatstring (arg_dcl + "Header", cinfo->format, classifier_header_format_statement);
158 textout << outconvert << disp << classifier_header_format_statement << "\n";
159
160 // Resolve any ".pr" bits at the end of the "dcn" argument
161 if (ends_with (args["dcn"], ".pr"))
162 {
163 // Change the "dcn" argument to be the OID of the parent of the specified classifier node
164 text_t::iterator parent_classifier_node_OID_end = findlastchar (args["dcn"].begin(), args["dcn"].end(), '|');
165 if (parent_classifier_node_OID_end != args["dcn"].end())
166 {
167 args["dcn"] = substr (args["dcn"].begin(), parent_classifier_node_OID_end);
168 }
169 else
170 {
171 args["dcn"] = "";
172 }
173 }
174
175 // Output the dynamic classifier, beginning with the (optional) grouping nodes
176 text_t selected_grouping_node_OID = "";
177 if (!classifier_options["-group_using"].empty())
178 {
179 selected_grouping_node_OID = output_grouping_nodes (classifier_options, args, collectproto, browsers, disp, outconvert, textout, logout);
180 }
181 text_t classifier_node_OID = args["dcn"]; // args["dcn"] may have been modified by output_grouping_nodes()
182 int classifier_node_indent = 0;
183
184 // Simple case at the top level: just output the child classifier nodes
185 if (classifier_node_OID == selected_grouping_node_OID)
186 {
187 text_t metadata_value_filter = selected_grouping_node_OID + "*";
188 output_child_classifier_nodes (classifier_node_OID, "", metadata_value_filter, classifier_node_indent, classifier_options, args, collectproto, browsers, disp, outconvert, textout, logout);
189 }
190
191 // More complex case below the top level
192 else
193 {
194 // This is the classifier node OID without any grouping information
195 text_t classifier_node_OID_sans_grouping = classifier_node_OID;
196 if (starts_with (classifier_node_OID, selected_grouping_node_OID + "|"))
197 {
198 classifier_node_OID_sans_grouping = substr (classifier_node_OID.begin() + (selected_grouping_node_OID + "|").size(), classifier_node_OID.end());
199 }
200
201 // Determine the parent classifier node labels
202 text_tlist parent_classifier_node_labels;
203 splitchar(classifier_node_OID_sans_grouping.begin(), classifier_node_OID_sans_grouping.end(), '|', parent_classifier_node_labels);
204
205 // Output the parent classifier nodes and the current classifier node
206 output_upper_classifier_nodes (selected_grouping_node_OID, parent_classifier_node_labels, classifier_node_indent, classifier_options, args, collectproto, browsers, disp, outconvert, textout, logout);
207
208 // Output the child classifier nodes
209 text_t classifier_node_metadata_value = classifier_node_OID_sans_grouping;
210 text_t metadata_value_filter = classifier_node_OID_sans_grouping + "|*";
211 output_child_classifier_nodes (classifier_node_OID, classifier_node_metadata_value, metadata_value_filter, classifier_node_indent, classifier_options, args, collectproto, browsers, disp, outconvert, textout, logout);
212
213 // Get the document nodes at this level
214 text_t metadata_element_name = classifier_options["metadata_element_name"];
215 text_t sort_documents_by = classifier_options["-sort_documents_by"];
216 FilterResponse_t documents_response;
217 get_documents_with_metadata_value (metadata_element_name, classifier_node_metadata_value, sort_documents_by, args["c"], collectproto, documents_response, logout);
218
219 // Display the document nodes
220 display_document_nodes (documents_response, classifier_node_indent, args, collectproto, browsers, disp, outconvert, textout, logout);
221 }
222
223 // Output the "<ID>Footer" format statement if there is one
224 text_t classifier_footer_format_statement = "";
225 get_formatstring (arg_dcl + "Footer", cinfo->format, classifier_footer_format_statement);
226 textout << outconvert << disp << classifier_footer_format_statement << "\n";
227
228 textout << outconvert << disp << "_dynamicclassifier:footer_\n";
229 return true;
230}
231
232
233text_tmap dynamicclassifieraction::parse_classifier_options (text_t classifier_specification, cgiargsclass &args)
234{
235 text_tmap classifier_options;
236
237 // Split the classifier specification string by spaces
238 text_tlist classifier_specification_parts;
239 splitchar (classifier_specification.begin(), classifier_specification.end(), ' ', classifier_specification_parts);
240
241 // The metadata element to classify by should be the first value
242 classifier_options["metadata_element_name"] = classifier_specification_parts.front();
243 classifier_specification_parts.pop_front();
244
245 // Parse options from the remainder of the classifier specification
246 while (!classifier_specification_parts.empty())
247 {
248 // Parse the option name
249 text_t classifier_option_name = classifier_specification_parts.front();
250 classifier_specification_parts.pop_front();
251
252 // Check if the option has a value (it may just be a flag, in which case we use "1" as the value)
253 text_t classifier_option_value = "1";
254 if (!classifier_specification_parts.empty() && !starts_with(classifier_specification_parts.front(), "-"))
255 {
256 classifier_option_value = classifier_specification_parts.front();
257 classifier_specification_parts.pop_front();
258 }
259
260 // Record the option
261 classifier_options[classifier_option_name] = classifier_option_value;
262 }
263
264 return classifier_options;
265}
266
267
268text_t dynamicclassifieraction::output_grouping_nodes (text_tmap classifier_options, cgiargsclass &args,
269 recptproto *collectproto, browsermapclass *browsers,
270 displayclass &disp, outconvertclass &outconvert,
271 ostream &textout, ostream &logout)
272{
273 // Get all the metadata values for the specified element, and group them according to the "-group_using" value
274 text_t metadata_element_name = classifier_options["metadata_element_name"];
275 text_t metadata_value_grouping_expression = classifier_options["-group_using"];
276 FilterResponse_t grouping_nodes_response;
277 bool request_success = get_metadata_values (metadata_element_name, "", metadata_value_grouping_expression, args["c"], collectproto, grouping_nodes_response, logout);
278
279 // If the request failed then it's probably because the collection isn't using an SQL infodbtype
280 if (request_success == false)
281 {
282 textout << outconvert << disp << "Error: Dynamic classifier functionality is not available. Please check you are using an SQL infodbtype and the collection has been rebuilt.\n";
283 return "";
284 }
285
286 // Check some grouping nodes were returned
287 if (grouping_nodes_response.docInfo.empty())
288 {
289 return "";
290 }
291
292 // If no classifier node has been specified automatically go to the first grouping node
293 if (args["dcn"] == "")
294 {
295 args["dcn"] = grouping_nodes_response.docInfo.front().OID;
296 }
297
298 // Add the necessary metadata to the grouping nodes
299 text_t selected_grouping_node_OID = "";
300 ResultDocInfo_tarray::iterator grouping_node_iterator = grouping_nodes_response.docInfo.begin();
301 while (grouping_node_iterator != grouping_nodes_response.docInfo.end())
302 {
303 // Is this the grouping node that is currently selected?
304 if (starts_with (args["dcn"], (*grouping_node_iterator).OID))
305 {
306 selected_grouping_node_OID = (*grouping_node_iterator).OID;
307 }
308
309 // Add the necessary metadata required to display the grouping nodes correctly
310 (*grouping_node_iterator).metadata["doctype"].values.push_back ("classify");
311 (*grouping_node_iterator).metadata["haschildren"].values.push_back ("1");
312 (*grouping_node_iterator).metadata["numleafdocs"].values.push_back ("?"); // We can't determine this without more database requests
313 (*grouping_node_iterator).metadata["Title"].values.push_back ((*grouping_node_iterator).OID);
314 grouping_node_iterator++;
315 }
316
317 // Display the grouping nodes
318 display_classifier_nodes (grouping_nodes_response, "HList", 0, args, collectproto, browsers, disp, outconvert, textout, logout);
319
320 return selected_grouping_node_OID;
321}
322
323
324void dynamicclassifieraction::output_upper_classifier_nodes (text_t root_classifier_node_OID,
325 text_tlist upper_classifier_node_labels,
326 int& classifier_node_indent,
327 text_tmap classifier_options, cgiargsclass &args,
328 recptproto *collectproto, browsermapclass *browsers,
329 displayclass &disp, outconvertclass &outconvert,
330 ostream &textout, ostream &logout)
331{
332 // Display the upper classifier nodes
333 text_t upper_classifier_node_OID = root_classifier_node_OID;
334 text_tlist::iterator upper_classifier_node_labels_iterator = upper_classifier_node_labels.begin();
335 while (upper_classifier_node_labels_iterator != upper_classifier_node_labels.end())
336 {
337 upper_classifier_node_OID += (upper_classifier_node_OID != "" ? "|" : "");
338 upper_classifier_node_OID += *upper_classifier_node_labels_iterator;
339
340 ResultDocInfo_t upper_classifier_node;
341 upper_classifier_node.OID = upper_classifier_node_OID;
342 upper_classifier_node.metadata["doctype"].values.push_back ("classify");
343 upper_classifier_node.metadata["haschildren"].values.push_back ("1");
344 upper_classifier_node.metadata["numleafdocs"].values.push_back ("?"); // We can't determine this without more database requests
345 upper_classifier_node.metadata["Title"].values.push_back (*upper_classifier_node_labels_iterator);
346
347 FilterResponse_t upper_classifier_node_response;
348 upper_classifier_node_response.docInfo.push_back(upper_classifier_node);
349 display_classifier_nodes (upper_classifier_node_response, "VList", classifier_node_indent, args, collectproto, browsers, disp, outconvert, textout, logout);
350 classifier_node_indent++;
351
352 upper_classifier_node_labels_iterator++;
353 }
354}
355
356
357void dynamicclassifieraction::output_child_classifier_nodes (text_t classifier_node_OID,
358 text_t classifier_node_metadata_value,
359 text_t metadata_value_filter,
360 int& classifier_node_indent,
361 text_tmap classifier_options, cgiargsclass &args,
362 recptproto *collectproto, browsermapclass *browsers,
363 displayclass &disp, outconvertclass &outconvert,
364 ostream &textout, ostream &logout)
365{
366 // Get all the metadata values for the specified element that match the filter
367 text_t metadata_element_name = classifier_options["metadata_element_name"];
368 FilterResponse_t metadata_values_response;
369 bool request_success = get_metadata_values (metadata_element_name, metadata_value_filter, "", args["c"], collectproto, metadata_values_response, logout);
370
371 // If the request failed then it's probably because the collection isn't using an SQL infodbtype
372 if (request_success == false)
373 {
374 textout << outconvert << disp << "Error: Dynamic classifier functionality is not available. Please check you are using an SQL infodbtype and the collection has been rebuilt.\n";
375 return;
376 }
377
378 // After processing any hierarchical metadata values we're left with the child classifer nodes
379 map<text_t, int, lttext_t> child_classifier_nodes;
380 ResultDocInfo_tarray::iterator metadata_value_iterator = metadata_values_response.docInfo.begin();
381 while (metadata_value_iterator != metadata_values_response.docInfo.end())
382 {
383 text_t metadata_value = (*metadata_value_iterator).OID;
384
385 // If we're not at the top-level we need to remove the current position from the metadata values
386 if (starts_with(metadata_value, classifier_node_metadata_value + "|"))
387 {
388 metadata_value = substr(metadata_value.begin() + (classifier_node_metadata_value + "|").size(), metadata_value.end());
389 }
390
391 // Is this metadata value hierarchical?
392 text_t::iterator hierarchy_split_position = findchar(metadata_value.begin(), metadata_value.end(), '|');
393 if (hierarchy_split_position != metadata_value.end())
394 {
395 // Yes, so use the first part of the hierarchy only
396 metadata_value = substr(metadata_value.begin(), hierarchy_split_position);
397 }
398
399 // Create a node for this metadata value if we haven't seen it before
400 if (child_classifier_nodes.find(metadata_value) == child_classifier_nodes.end())
401 {
402 child_classifier_nodes[metadata_value] = 0;
403 }
404
405 // Increment the occurrence count
406 child_classifier_nodes[metadata_value] += (*metadata_value_iterator).result_num;
407
408 metadata_value_iterator++;
409 }
410
411 // Add the necessary metadata to the child classifier nodes
412 FilterResponse_t child_classifier_nodes_response;
413 map<text_t, int, lttext_t>::iterator child_classifier_nodes_iterator = child_classifier_nodes.begin();
414 while (child_classifier_nodes_iterator != child_classifier_nodes.end())
415 {
416 text_t child_classifier_node_OID = (*child_classifier_nodes_iterator).first;
417 if (classifier_node_OID != "")
418 {
419 child_classifier_node_OID = classifier_node_OID + "|" + child_classifier_node_OID;
420 }
421
422 ResultDocInfo_t child_classifier_node;
423 child_classifier_node.OID = child_classifier_node_OID;
424 child_classifier_node.metadata["doctype"].values.push_back ("classify");
425 child_classifier_node.metadata["haschildren"].values.push_back ("1");
426 child_classifier_node.metadata["numleafdocs"].values.push_back ((*child_classifier_nodes_iterator).second);
427 child_classifier_node.metadata["Title"].values.push_back ((*child_classifier_nodes_iterator).first);
428 child_classifier_nodes_response.docInfo.push_back (child_classifier_node);
429
430 child_classifier_nodes_iterator++;
431 }
432
433 // Display the child classifier nodes
434 display_classifier_nodes (child_classifier_nodes_response, "VList", classifier_node_indent, args, collectproto, browsers, disp, outconvert, textout, logout);
435}
436
437
438void dynamicclassifieraction::display_classifier_nodes (FilterResponse_t classifier_nodes_response,
439 text_t classifier_nodes_type,
440 int classifier_nodes_indent,
441 cgiargsclass &args, recptproto *collectproto,
442 browsermapclass *browsers, displayclass &disp,
443 outconvertclass &outconvert, ostream &textout,
444 ostream &logout)
445{
446 // Check there are some classifier nodes to display
447 if (classifier_nodes_response.docInfo.empty()) return;
448
449 // Get the format statement for this classifier if there is one, or use the browser's default otherwise
450 text_t formatstring;
451 browserclass *bptr = browsers->getbrowser (classifier_nodes_type);
452 ColInfoResponse_t *cinfo = recpt->get_collectinfo_ptr (collectproto, args["c"], logout);
453 if (!get_formatstring (args["dcl"], classifier_nodes_type, cinfo->format, formatstring))
454 {
455 formatstring = bptr->get_default_formatstring();
456 }
457 format_t *formatlistptr = new format_t();
458 text_tset metadata;
459 bool getParents = false;
460 parse_formatstring (formatstring, formatlistptr, metadata, getParents);
461 bool use_table = is_table_content (formatlistptr);
462
463 // Display the classifier nodes
464 bptr->output_section_group (classifier_nodes_response, args, args["c"], classifier_nodes_indent, formatlistptr, use_table, metadata, getParents, collectproto, disp, outconvert, textout, logout);
465}
466
467
468void dynamicclassifieraction::display_document_nodes (FilterResponse_t documents_response,
469 int document_nodes_indent,
470 cgiargsclass &args, recptproto *collectproto,
471 browsermapclass *browsers, displayclass &disp,
472 outconvertclass &outconvert, ostream &textout,
473 ostream &logout)
474{
475 // Check there are some documents to display
476 if (documents_response.docInfo.empty()) return;
477
478 // Get the format statement for the document nodes if there is one, or use the browser's default otherwise
479 text_t formatstring;
480 browserclass *bptr = browsers->getbrowser ("VList");
481 ColInfoResponse_t *cinfo = recpt->get_collectinfo_ptr (collectproto, args["c"], logout);
482 if (!get_formatstring (args["dcl"], "DocumentNodes", cinfo->format, formatstring))
483 {
484 formatstring = bptr->get_default_formatstring();
485 }
486 format_t *formatlistptr = new format_t();
487 text_tset metadata;
488 bool getParents = false;
489 parse_formatstring (formatstring, formatlistptr, metadata, getParents);
490 bool use_table = is_table_content (formatlistptr);
491
492 // Request the necessary metadata for displaying the documents
493 text_tarray document_OIDs;
494 ResultDocInfo_tarray::iterator document_iterator = documents_response.docInfo.begin();
495 while (document_iterator != documents_response.docInfo.end())
496 {
497 document_OIDs.push_back ((*document_iterator).OID);
498 document_iterator++;
499 }
500 FilterResponse_t document_nodes_response;
501 get_info (document_OIDs, args["c"], args["l"], metadata, getParents, collectproto, document_nodes_response, logout);
502
503 // Display the document nodes
504 bptr->output_section_group (document_nodes_response, args, args["c"], document_nodes_indent, formatlistptr, use_table, metadata, getParents, collectproto, disp, outconvert, textout, logout);
505}
Note: See TracBrowser for help on using the repository browser.