[4855] | 1 | package org.greenstone.gsdl3.action;
|
---|
| 2 |
|
---|
| 3 | import org.greenstone.gsdl3.core.ModuleInterface;
|
---|
| 4 | import org.greenstone.gsdl3.util.*;
|
---|
| 5 | // XML classes
|
---|
| 6 | import org.w3c.dom.Node;
|
---|
| 7 | import org.w3c.dom.NodeList;
|
---|
| 8 | import org.w3c.dom.Document;
|
---|
| 9 | import org.w3c.dom.Element;
|
---|
| 10 |
|
---|
| 11 | import java.util.HashMap;
|
---|
| 12 | import java.util.HashSet;
|
---|
| 13 | import java.util.Vector;
|
---|
| 14 | import java.io.File;
|
---|
| 15 |
|
---|
[13124] | 16 | import org.apache.log4j.*;
|
---|
| 17 |
|
---|
[4855] | 18 | /** action for GS2 style classifier browsing */
|
---|
| 19 | public class GS2BrowseAction extends Action {
|
---|
| 20 |
|
---|
| 21 | public static final String CLASSIFIER_ARG = "cl";
|
---|
[13124] | 22 |
|
---|
[13270] | 23 | static Logger logger = Logger.getLogger(org.greenstone.gsdl3.action.GS2BrowseAction.class.getName());
|
---|
[13124] | 24 |
|
---|
[4855] | 25 | /** process the request */
|
---|
[16688] | 26 | public Node process (Node message_node) {
|
---|
[4855] | 27 |
|
---|
[16688] | 28 | Element message = this.converter.nodeToElement(message_node);
|
---|
| 29 |
|
---|
[4855] | 30 | // get the request - assume only one
|
---|
| 31 | Element request = (Element)GSXML.getChildByTagName(message, GSXML.REQUEST_ELEM);
|
---|
| 32 |
|
---|
| 33 | // the result
|
---|
[5155] | 34 | Element result = this.doc.createElement(GSXML.MESSAGE_ELEM);
|
---|
[4855] | 35 | Element response = classifierBrowse(request);
|
---|
| 36 | result.appendChild(response);
|
---|
| 37 | return result;
|
---|
| 38 | }
|
---|
| 39 |
|
---|
| 40 |
|
---|
| 41 | protected Element classifierBrowse(Element request) {
|
---|
| 42 |
|
---|
[5155] | 43 | Element page_response = this.doc.createElement(GSXML.RESPONSE_ELEM);
|
---|
[4855] | 44 |
|
---|
| 45 | // extract the params from the cgi-request, and check that we have a coll specified
|
---|
| 46 | Element cgi_paramList = (Element)GSXML.getChildByTagName(request, GSXML.PARAM_ELEM+GSXML.LIST_MODIFIER);
|
---|
| 47 | HashMap params = GSXML.extractParams(cgi_paramList, false);
|
---|
| 48 |
|
---|
[5147] | 49 | String service_name = (String)params.get(GSParams.SERVICE);
|
---|
| 50 | String collection = (String)params.get(GSParams.COLLECTION);
|
---|
[4855] | 51 | if (collection == null || collection.equals("")) {
|
---|
[13124] | 52 | logger.error("classifierBrowse, need to specify a collection!");
|
---|
[4855] | 53 | return page_response;
|
---|
| 54 |
|
---|
| 55 | }
|
---|
| 56 |
|
---|
| 57 | String lang = request.getAttribute(GSXML.LANG_ATT);
|
---|
[6300] | 58 | String uid = request.getAttribute(GSXML.USER_ID_ATT);
|
---|
[4855] | 59 | String to = GSPath.appendLink(collection, service_name);
|
---|
| 60 |
|
---|
| 61 | // the first part of the response is the service description
|
---|
| 62 | // for now get this again from the service.
|
---|
| 63 | // this should be cached somehow later on.
|
---|
| 64 |
|
---|
[5155] | 65 | Element info_message = this.doc.createElement(GSXML.MESSAGE_ELEM);
|
---|
[6300] | 66 | Element info_request = GSXML.createBasicRequest(this.doc, GSXML.REQUEST_TYPE_DESCRIBE, to, lang, uid);
|
---|
[4855] | 67 | info_message.appendChild(info_request);
|
---|
| 68 |
|
---|
| 69 | // also get the format stuff now if there is some
|
---|
[6300] | 70 | Element format_request = GSXML.createBasicRequest(this.doc, GSXML.REQUEST_TYPE_FORMAT, to, lang, uid);
|
---|
[4855] | 71 | info_message.appendChild(format_request);
|
---|
| 72 | // process the requests
|
---|
| 73 |
|
---|
[5155] | 74 | Element info_response = (Element) this.mr.process(info_message);
|
---|
[4855] | 75 |
|
---|
| 76 | // the two responses
|
---|
| 77 | NodeList responses = info_response.getElementsByTagName(GSXML.RESPONSE_ELEM);
|
---|
| 78 | Element service_response = (Element)responses.item(0);
|
---|
| 79 | Element format_response = (Element)responses.item(1);
|
---|
| 80 |
|
---|
| 81 | Element service_description = (Element)GSXML.getChildByTagName(service_response, GSXML.SERVICE_ELEM);
|
---|
[5155] | 82 | page_response.appendChild(this.doc.importNode(service_description, true));
|
---|
[4855] | 83 |
|
---|
[19984] | 84 | //append site metadata
|
---|
| 85 | addSiteMetadata( page_response, lang, uid);
|
---|
| 86 |
|
---|
[4855] | 87 | // if rt=d, then we are just displaying the service
|
---|
[5147] | 88 | String request_type = (String)params.get(GSParams.REQUEST_TYPE);
|
---|
[4855] | 89 | if (request_type.equals("d")) {
|
---|
| 90 | //return the page that we have so far
|
---|
| 91 | return page_response;
|
---|
| 92 | }
|
---|
| 93 |
|
---|
| 94 | // get the node that the user has clicked on
|
---|
| 95 | String classifier_node = (String)params.get(CLASSIFIER_ARG);
|
---|
| 96 |
|
---|
| 97 | // if the node is not defined, return the page that we have so far
|
---|
| 98 | if (classifier_node ==null || classifier_node.equals("")) {
|
---|
| 99 | return page_response;
|
---|
| 100 | }
|
---|
| 101 |
|
---|
| 102 | // the id of the classifier is the top id of the selected node
|
---|
| 103 | String top_id = OID.getTop(classifier_node);
|
---|
| 104 | HashSet doc_meta_names = new HashSet();
|
---|
| 105 | HashSet class_meta_names = new HashSet();
|
---|
| 106 | // add in the defaults
|
---|
| 107 | doc_meta_names.add("Title");
|
---|
| 108 | class_meta_names.add("Title");
|
---|
| 109 |
|
---|
| 110 | // add the format info into the response
|
---|
| 111 | Element format_elem = (Element)GSXML.getChildByTagName(format_response, GSXML.FORMAT_ELEM);
|
---|
| 112 | if (format_elem != null) {
|
---|
| 113 |
|
---|
| 114 | // find the one for the classifier we are in
|
---|
| 115 | Element this_format = GSXML.getNamedElement(format_elem, GSXML.CLASSIFIER_ELEM, GSXML.NAME_ATT, top_id);
|
---|
[6165] | 116 | if (this_format == null) {
|
---|
| 117 | this_format = (Element)GSXML.getChildByTagName(format_elem, GSXML.DEFAULT_ELEM);
|
---|
| 118 | }
|
---|
| 119 |
|
---|
[4855] | 120 | if (this_format != null) {
|
---|
[5155] | 121 | Element new_format = GSXML.duplicateWithNewName(this.doc, this_format, GSXML.FORMAT_ELEM, false);
|
---|
[4855] | 122 | extractMetadataNames(new_format, doc_meta_names, class_meta_names);
|
---|
[5401] | 123 | // set the format type
|
---|
[4855] | 124 | new_format.setAttribute(GSXML.TYPE_ATT, "browse");
|
---|
| 125 |
|
---|
| 126 | page_response.appendChild(new_format);
|
---|
| 127 | }
|
---|
| 128 | }
|
---|
| 129 |
|
---|
| 130 | // find out if this classifier is horizontal at top
|
---|
| 131 | Element class_list = (Element)GSXML.getChildByTagName(service_description, GSXML.CLASSIFIER_ELEM+GSXML.LIST_MODIFIER);
|
---|
| 132 | Element this_classifier = GSXML.getNamedElement(class_list, GSXML.CLASSIFIER_ELEM, GSXML.NAME_ATT, top_id);
|
---|
| 133 | boolean horizontal_at_top = false;
|
---|
| 134 | if (!this_classifier.getAttribute("horizontalAtTop").equals("")) {
|
---|
| 135 | horizontal_at_top = true;
|
---|
| 136 | }
|
---|
[9900] | 137 | if (top_id.equals(classifier_node) && horizontal_at_top) {
|
---|
[8575] | 138 | // we have asked for a top node - if the first list is horizontal, we will select the first element of that list
|
---|
[9874] | 139 | // this is a hack. also it craps out if the classifier really isn't horizontalAtTop. -
|
---|
[9900] | 140 | classifier_node = classifier_node+".1";
|
---|
[8575] | 141 |
|
---|
[9900] | 142 | }
|
---|
[8575] | 143 |
|
---|
[4855] | 144 | // get the browse structure for the selected node
|
---|
[5155] | 145 | Element classify_message = this.doc.createElement(GSXML.MESSAGE_ELEM);
|
---|
[6695] | 146 | Element classify_request = GSXML.createBasicRequest(this.doc, GSXML.REQUEST_TYPE_PROCESS, to, lang, uid);
|
---|
[4855] | 147 | classify_message.appendChild(classify_request);
|
---|
| 148 |
|
---|
| 149 | //Create a parameter list to specify the required structure information
|
---|
| 150 | // for now, always get ancestors and children
|
---|
[5155] | 151 | Element param_list = this.doc.createElement(GSXML.PARAM_ELEM+GSXML.LIST_MODIFIER);
|
---|
[4855] | 152 | classify_request.appendChild(param_list);
|
---|
[5155] | 153 | Element param = this.doc.createElement(GSXML.PARAM_ELEM);
|
---|
[4855] | 154 | param_list.appendChild(param);
|
---|
| 155 | param.setAttribute(GSXML.NAME_ATT, "structure");
|
---|
| 156 | param.setAttribute(GSXML.VALUE_ATT, "ancestors");
|
---|
[5155] | 157 | param = this.doc.createElement(GSXML.PARAM_ELEM);
|
---|
[4855] | 158 | param_list.appendChild(param);
|
---|
| 159 | param.setAttribute(GSXML.NAME_ATT, "structure");
|
---|
| 160 | param.setAttribute(GSXML.VALUE_ATT, "children");
|
---|
| 161 |
|
---|
| 162 | // put the classifier node into a classifier node list
|
---|
[5155] | 163 | Element classifier_list = this.doc.createElement(GSXML.CLASS_NODE_ELEM+GSXML.LIST_MODIFIER);
|
---|
| 164 | Element classifier = this.doc.createElement(GSXML.CLASS_NODE_ELEM);
|
---|
[4855] | 165 | classifier.setAttribute(GSXML.NODE_ID_ATT, classifier_node);
|
---|
| 166 | classifier_list.appendChild(classifier);
|
---|
| 167 | classify_request.appendChild(classifier_list);
|
---|
| 168 |
|
---|
| 169 | if (horizontal_at_top && !classifier_node.equals(top_id)) {
|
---|
[5401] | 170 | // also put the top id in, to get the persistant horizontal info
|
---|
[5155] | 171 | classifier = this.doc.createElement(GSXML.CLASS_NODE_ELEM);
|
---|
[4855] | 172 | classifier.setAttribute(GSXML.NODE_ID_ATT, top_id);
|
---|
| 173 | classifier_list.appendChild(classifier);
|
---|
| 174 | }
|
---|
| 175 | // process the request
|
---|
[5155] | 176 | Element classify_response = (Element)this.mr.process(classify_message);
|
---|
[4855] | 177 | String path = GSPath.appendLink(GSXML.RESPONSE_ELEM, GSXML.CLASS_NODE_ELEM+GSXML.LIST_MODIFIER);
|
---|
| 178 | Element class_node_list = (Element)GSXML.getNodeByPath(classify_response, path);
|
---|
| 179 |
|
---|
| 180 | path = GSPath.appendLink(GSXML.CLASS_NODE_ELEM, GSXML.NODE_STRUCTURE_ELEM);
|
---|
| 181 | // assume that we always get back the top level CL1 node - this becomes the page_classifier node
|
---|
| 182 | path = GSPath.appendLink(path, GSXML.CLASS_NODE_ELEM);
|
---|
| 183 | Element cl_structure = (Element)GSXML.getNodeByPath(class_node_list,
|
---|
| 184 | path);
|
---|
| 185 | if (cl_structure ==null) {
|
---|
[13124] | 186 | logger.error("classifier structure request returned no structure");
|
---|
[4855] | 187 | return page_response;
|
---|
| 188 | }
|
---|
| 189 |
|
---|
| 190 | Element page_classifier = null;
|
---|
| 191 | if (horizontal_at_top && !classifier_node.equals(top_id)) {
|
---|
| 192 | // get the info for the top node
|
---|
| 193 | Element top_node = GSXML.getNamedElement(class_node_list, GSXML.CLASS_NODE_ELEM, GSXML.NODE_ID_ATT, top_id);
|
---|
| 194 | if (top_node !=null) {
|
---|
| 195 | path = GSPath.appendLink(GSXML.NODE_STRUCTURE_ELEM, GSXML.CLASS_NODE_ELEM);
|
---|
| 196 | Element top_structure = (Element)GSXML.getNodeByPath(top_node, path);
|
---|
| 197 | // add this as the classifier elem
|
---|
[5155] | 198 | page_classifier = GSXML.duplicateWithNewName(this.doc, top_structure, GSXML.CLASSIFIER_ELEM, true);
|
---|
[4855] | 199 | page_response.appendChild(page_classifier);
|
---|
| 200 | // now replace the child with the structure from the other request
|
---|
| 201 | Element new_classifier = (Element)GSXML.getChildByTagName(cl_structure, GSXML.CLASS_NODE_ELEM);
|
---|
| 202 | String replace_name = new_classifier.getAttribute(GSXML.NODE_ID_ATT);
|
---|
| 203 |
|
---|
| 204 | // find the appropriate child
|
---|
| 205 | Element old_classifier = GSXML.getNamedElement(page_classifier, GSXML.CLASS_NODE_ELEM, GSXML.NODE_ID_ATT, replace_name);
|
---|
[5155] | 206 | page_classifier.replaceChild(this.doc.importNode(new_classifier, true), old_classifier);
|
---|
[4855] | 207 | page_classifier.setAttribute(GSXML.NAME_ATT, top_id);
|
---|
| 208 | } else {
|
---|
| 209 | // add the single classifier node as the page classifier
|
---|
[5155] | 210 | page_classifier = GSXML.duplicateWithNewName(this.doc, cl_structure, GSXML.CLASSIFIER_ELEM, true);
|
---|
[4855] | 211 | page_response.appendChild(page_classifier);
|
---|
| 212 | page_classifier.setAttribute(GSXML.NAME_ATT, top_id);
|
---|
| 213 | }
|
---|
| 214 |
|
---|
| 215 | } else {
|
---|
| 216 | // add the single classifier node as the page classifier
|
---|
[5155] | 217 | page_classifier = GSXML.duplicateWithNewName(this.doc, cl_structure, GSXML.CLASSIFIER_ELEM, true);
|
---|
[4855] | 218 | page_response.appendChild(page_classifier);
|
---|
| 219 | page_classifier.setAttribute(GSXML.NAME_ATT, top_id);
|
---|
| 220 | }
|
---|
| 221 | // get the metadata for each classifier node,
|
---|
| 222 | // then for each document node
|
---|
| 223 |
|
---|
[5155] | 224 | Element metadata_message = this.doc.createElement(GSXML.MESSAGE_ELEM);
|
---|
[4855] | 225 |
|
---|
| 226 | boolean did_classifier = false;
|
---|
| 227 | boolean did_documents = false;
|
---|
| 228 |
|
---|
| 229 |
|
---|
| 230 | // if there are classifier nodes
|
---|
| 231 | // create a metadata request for the classifier, and add it to
|
---|
| 232 | // the the message
|
---|
| 233 | NodeList cl_nodes = page_classifier.getElementsByTagName(GSXML.CLASS_NODE_ELEM);
|
---|
| 234 |
|
---|
| 235 | if (cl_nodes.getLength() > 0) {
|
---|
| 236 | did_classifier = true;
|
---|
[6695] | 237 | Element cl_meta_request = GSXML.createBasicRequest(this.doc, GSXML.REQUEST_TYPE_PROCESS, to+"MetadataRetrieve", lang, uid);
|
---|
[4855] | 238 | metadata_message.appendChild(cl_meta_request);
|
---|
| 239 |
|
---|
[5155] | 240 | Element new_cl_nodes_list = this.doc.createElement(GSXML.CLASS_NODE_ELEM+GSXML.LIST_MODIFIER);
|
---|
[4855] | 241 | cl_meta_request.appendChild(new_cl_nodes_list);
|
---|
| 242 |
|
---|
| 243 | for (int c=0; c<cl_nodes.getLength(); c++) {
|
---|
| 244 |
|
---|
[5155] | 245 | Element cl = this.doc.createElement(GSXML.CLASS_NODE_ELEM);
|
---|
[4855] | 246 | cl.setAttribute(GSXML.NODE_ID_ATT, ((Element)cl_nodes.item(c)).getAttribute(GSXML.NODE_ID_ATT));
|
---|
| 247 | new_cl_nodes_list.appendChild(cl);
|
---|
| 248 | }
|
---|
| 249 |
|
---|
| 250 | // create and add in the param list - for now get all the metadata
|
---|
| 251 | // should be based on info sent in from the recept, and the
|
---|
| 252 | // format stuff
|
---|
| 253 | Element cl_param_list = createMetadataParamList(class_meta_names);
|
---|
| 254 | cl_meta_request.appendChild(cl_param_list);
|
---|
| 255 |
|
---|
| 256 | }
|
---|
| 257 |
|
---|
| 258 | // if there are document nodes in the classification (happens
|
---|
| 259 | // sometimes), create a second request for document metadata and
|
---|
| 260 | // append to the message
|
---|
| 261 | NodeList doc_nodes = page_classifier.getElementsByTagName(GSXML.DOC_NODE_ELEM);
|
---|
| 262 | if (doc_nodes.getLength() > 0) {
|
---|
| 263 | did_documents = true;
|
---|
[6695] | 264 | Element doc_meta_request = GSXML.createBasicRequest(this.doc, GSXML.REQUEST_TYPE_PROCESS, GSPath.appendLink(collection, "DocumentMetadataRetrieve"), lang, uid);
|
---|
[4855] | 265 | metadata_message.appendChild(doc_meta_request);
|
---|
| 266 |
|
---|
[5155] | 267 | Element doc_list = this.doc.createElement(GSXML.DOC_NODE_ELEM+GSXML.LIST_MODIFIER);
|
---|
[4855] | 268 | doc_meta_request.appendChild(doc_list);
|
---|
| 269 |
|
---|
| 270 | for (int c=0; c<doc_nodes.getLength(); c++) {
|
---|
| 271 |
|
---|
[5155] | 272 | Element d = this.doc.createElement(GSXML.DOC_NODE_ELEM);
|
---|
[4855] | 273 | d.setAttribute(GSXML.NODE_ID_ATT, ((Element)doc_nodes.item(c)).getAttribute(GSXML.NODE_ID_ATT));
|
---|
| 274 | doc_list.appendChild(d);
|
---|
| 275 | }
|
---|
| 276 |
|
---|
| 277 | // create and add in the param list - add all for now
|
---|
| 278 | Element doc_param_list = createMetadataParamList(doc_meta_names);
|
---|
| 279 | doc_meta_request.appendChild(doc_param_list);
|
---|
| 280 |
|
---|
| 281 | }
|
---|
| 282 |
|
---|
| 283 | // process the metadata requests
|
---|
[5155] | 284 | Element metadata_response = (Element)this.mr.process(metadata_message);
|
---|
[21928] | 285 | if (did_classifier) {
|
---|
[4855] | 286 | // the classifier one will be the first response
|
---|
| 287 | // add the metadata lists for each node back into the
|
---|
| 288 | // page_classifier nodes
|
---|
| 289 | path = GSPath.appendLink(GSXML.RESPONSE_ELEM,
|
---|
| 290 | GSXML.CLASS_NODE_ELEM+GSXML.LIST_MODIFIER);
|
---|
[13568] | 291 | Node pathNode = GSXML.getNodeByPath(metadata_response, path);
|
---|
| 292 | if (pathNode ==null){
|
---|
| 293 | return page_response;
|
---|
| 294 | }
|
---|
[21928] | 295 | //NodeList meta_response_cls = (Element)pathNode.getChildNodes(); // can't handle empty elements from converting formatted strings (with empty newlines) into XML
|
---|
| 296 | NodeList meta_response_cls = ((Element)pathNode).getElementsByTagName(GSXML.CLASS_NODE_ELEM);
|
---|
[4855] | 297 | for (int i = 0; i < cl_nodes.getLength(); i++) {
|
---|
| 298 | GSXML.mergeMetadataLists(cl_nodes.item(i), meta_response_cls.item(i));
|
---|
| 299 | }
|
---|
| 300 | }
|
---|
[13568] | 301 |
|
---|
[4855] | 302 | if (did_documents) {
|
---|
| 303 | NodeList meta_response_docs = null;
|
---|
| 304 | if (!did_classifier) {
|
---|
| 305 | // its the first response
|
---|
| 306 | path = GSPath.appendLink(GSXML.RESPONSE_ELEM,
|
---|
| 307 | GSXML.DOC_NODE_ELEM+GSXML.LIST_MODIFIER);
|
---|
[13568] | 308 | Node pathNode = GSXML.getNodeByPath(metadata_response, path);
|
---|
| 309 | if (pathNode ==null){
|
---|
| 310 | return page_response;
|
---|
| 311 | }
|
---|
| 312 |
|
---|
| 313 | meta_response_docs = pathNode.getChildNodes();
|
---|
| 314 |
|
---|
| 315 |
|
---|
[4855] | 316 | } else { // its the second response
|
---|
[13568] | 317 | Node nodes = GSXML.getChildByTagName(metadata_response.getElementsByTagName(GSXML.RESPONSE_ELEM).item(1), GSXML.DOC_NODE_ELEM+GSXML.LIST_MODIFIER);
|
---|
| 318 | if (nodes ==null){
|
---|
| 319 | return page_response;
|
---|
| 320 | }
|
---|
| 321 | meta_response_docs = nodes.getChildNodes();
|
---|
[4855] | 322 | }
|
---|
| 323 |
|
---|
| 324 | for (int i = 0; i < doc_nodes.getLength(); i++) {
|
---|
| 325 | GSXML.mergeMetadataLists(doc_nodes.item(i), meta_response_docs.item(i));
|
---|
| 326 | }
|
---|
| 327 | }
|
---|
| 328 |
|
---|
| 329 |
|
---|
[13124] | 330 | logger.debug("(GS2BrowseAction) Page:\n" + this.converter.getPrettyString(page_response));
|
---|
[4855] | 331 | return page_response;
|
---|
| 332 | }
|
---|
| 333 |
|
---|
[8575] | 334 |
|
---|
[4855] | 335 | protected void extractMetadataNames(Element new_format, HashSet doc_meta_names, HashSet class_meta_names) {
|
---|
| 336 |
|
---|
| 337 | NodeList templates = new_format.getElementsByTagName("gsf:template");
|
---|
| 338 | for (int i=0; i<templates.getLength(); i++) {
|
---|
| 339 | Element template = (Element)templates.item(i);
|
---|
| 340 | String match = template.getAttribute("match");
|
---|
| 341 | if (match.equals("documentNode")) {
|
---|
| 342 | extractMetadataNames(template, doc_meta_names);
|
---|
| 343 | } else if (match.equals("classifierNode")) {
|
---|
| 344 | extractMetadataNames(template, class_meta_names);
|
---|
| 345 | }
|
---|
| 346 | }
|
---|
| 347 | }
|
---|
| 348 |
|
---|
| 349 | }
|
---|
| 350 |
|
---|
| 351 |
|
---|