/********************************************************************** * * basequeryaction.cpp -- * Copyright (C) 1999 The New Zealand Digital Library Project * * A component of the Greenstone digital library software * from the New Zealand Digital Library Project at the * University of Waikato, New Zealand. * * This program is free software; you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation; either version 2 of the License, or * (at your option) any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with this program; if not, write to the Free Software * Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. * *********************************************************************/ #include "basequeryaction.h" #include "querytools.h" #include "formattools.h" #include "cgiutils.h" #include "OIDtools.h" #include "fileutil.h" #include "text_t.h" #include "historydb.h" #include "htmlutils.h" // for html_safe in do_action #include "gsdltools.h" #include "phrases.h" // for get_phrases #include // for strtol #include void colinfo_t::clear () { formatlistptr = NULL; browserptr = NULL; } void QueryResult_t::clear() { doc.clear(); collection.clear(); } basequeryaction::basequeryaction () { recpt = NULL; cgiarginfo arg_ainfo; // "q" arg_ainfo.shortname = "q"; arg_ainfo.longname = "query string"; arg_ainfo.multiplechar = true; arg_ainfo.defaultstatus = cgiarginfo::weak; arg_ainfo.argdefault = g_EmptyText; arg_ainfo.savedarginfo = cgiarginfo::must; argsinfo.addarginfo (NULL, arg_ainfo); // "q2" arg_ainfo.shortname = "q2"; arg_ainfo.longname = "query string for second query"; arg_ainfo.multiplechar = true; arg_ainfo.defaultstatus = cgiarginfo::weak; arg_ainfo.argdefault = g_EmptyText; arg_ainfo.savedarginfo = cgiarginfo::must; argsinfo.addarginfo (NULL, arg_ainfo); // "cq2" ""=don't combine, "and", "or", "not" arg_ainfo.shortname = "cq2"; arg_ainfo.longname = "combine queries"; arg_ainfo.multiplechar = true; arg_ainfo.defaultstatus = cgiarginfo::weak; arg_ainfo.argdefault = g_EmptyText; arg_ainfo.savedarginfo = cgiarginfo::must; argsinfo.addarginfo (NULL, arg_ainfo); // "m" arg_ainfo.shortname = "m"; arg_ainfo.longname = "maximum number of documents"; arg_ainfo.multiplechar = true; arg_ainfo.defaultstatus = cgiarginfo::weak; arg_ainfo.argdefault = "50"; arg_ainfo.savedarginfo = cgiarginfo::must; argsinfo.addarginfo (NULL, arg_ainfo); // "o" arg_ainfo.shortname = "o"; arg_ainfo.longname = "hits per page"; arg_ainfo.multiplechar = true; arg_ainfo.defaultstatus = cgiarginfo::weak; arg_ainfo.argdefault = "20"; arg_ainfo.savedarginfo = cgiarginfo::must; argsinfo.addarginfo (NULL, arg_ainfo); // "r" arg_ainfo.shortname = "r"; arg_ainfo.longname = "start results from"; arg_ainfo.multiplechar = true; arg_ainfo.defaultstatus = cgiarginfo::weak; arg_ainfo.argdefault = "1"; arg_ainfo.savedarginfo = cgiarginfo::must; argsinfo.addarginfo (NULL, arg_ainfo); // "ifl" - I'm feeling lucky! (Go directly to a matching document) arg_ainfo.shortname = "ifl"; arg_ainfo.longname = "i'm feeling lucky"; arg_ainfo.multiplechar = false; arg_ainfo.defaultstatus = cgiarginfo::weak; arg_ainfo.argdefault = g_EmptyText; arg_ainfo.savedarginfo = cgiarginfo::mustnot; argsinfo.addarginfo (NULL, arg_ainfo); // "ifln" - I'm feeling lucky number (Go directly to the nth matching document) arg_ainfo.shortname = "ifln"; arg_ainfo.longname = "i'm feeling lucky number"; arg_ainfo.multiplechar = true; arg_ainfo.defaultstatus = cgiarginfo::weak; arg_ainfo.argdefault = "1"; arg_ainfo.savedarginfo = cgiarginfo::mustnot; argsinfo.addarginfo (NULL, arg_ainfo); // "srn" - the next search result arg_ainfo.shortname = "srn"; arg_ainfo.longname = "the next search result number"; arg_ainfo.multiplechar = true; arg_ainfo.defaultstatus = cgiarginfo::weak; arg_ainfo.argdefault = "0"; arg_ainfo.savedarginfo = cgiarginfo::must; argsinfo.addarginfo (NULL, arg_ainfo); // "srp" - the previous search result arg_ainfo.shortname = "srp"; arg_ainfo.longname = "the previous search result number"; arg_ainfo.multiplechar = true; arg_ainfo.defaultstatus = cgiarginfo::weak; arg_ainfo.argdefault = "0"; arg_ainfo.savedarginfo = cgiarginfo::must; argsinfo.addarginfo (NULL, arg_ainfo); // "sf" - Sort field. Set to field to be used for sorting search reult // set (only implemented for lucene collections at present). arg_ainfo.shortname = "sf"; arg_ainfo.longname = "sort field"; arg_ainfo.multiplechar = true; arg_ainfo.defaultstatus = cgiarginfo::weak; arg_ainfo.argdefault = g_EmptyText; arg_ainfo.savedarginfo = cgiarginfo::must; argsinfo.addarginfo (NULL, arg_ainfo); // "fqn" - number of fields in the query form arg_ainfo.shortname = "fqn"; arg_ainfo.longname = "form query num fields"; arg_ainfo.multiplechar = true; arg_ainfo.defaultstatus = cgiarginfo::weak; arg_ainfo.argdefault = "4"; arg_ainfo.savedarginfo = cgiarginfo::must; argsinfo.addarginfo (NULL, arg_ainfo); // "fqf" - the list of field names in the form query // - a comma separated list arg_ainfo.shortname = "fqf"; arg_ainfo.longname = "form query fields"; arg_ainfo.multiplechar = true; arg_ainfo.defaultstatus = cgiarginfo::weak; arg_ainfo.argdefault = g_EmptyText; arg_ainfo.savedarginfo = cgiarginfo::must; argsinfo.addarginfo (NULL, arg_ainfo); // "fqv" - the list of values in the form query // - a comma separated list arg_ainfo.shortname = "fqv"; arg_ainfo.longname = "form query values"; arg_ainfo.multiplechar = true; arg_ainfo.defaultstatus = cgiarginfo::weak; arg_ainfo.argdefault = g_EmptyText; arg_ainfo.savedarginfo = cgiarginfo::must; argsinfo.addarginfo (NULL, arg_ainfo); // "fqc" - the list of boolean operators in the form query // - a comma separated list arg_ainfo.shortname = "fqc"; arg_ainfo.longname = "form query combines"; arg_ainfo.multiplechar = true; arg_ainfo.defaultstatus = cgiarginfo::weak; arg_ainfo.argdefault = g_EmptyText; arg_ainfo.savedarginfo = cgiarginfo::must; argsinfo.addarginfo (NULL, arg_ainfo); // "fqa" - form query advanced - for "run query" arg_ainfo.shortname = "fqa"; arg_ainfo.longname = "form query advanced query"; arg_ainfo.multiplechar = false; arg_ainfo.defaultstatus = cgiarginfo::weak; arg_ainfo.argdefault = "0"; arg_ainfo.savedarginfo = cgiarginfo::must; argsinfo.addarginfo (NULL, arg_ainfo); // "fuzziness" controls how closely the search terms must match // 100 = exact match, 0 = very inexact match (only implemented for Lucene) arg_ainfo.shortname = "fuzziness"; arg_ainfo.longname = "Lucene fuzziness value"; arg_ainfo.multiplechar = true; arg_ainfo.defaultstatus = cgiarginfo::weak; arg_ainfo.argdefault = g_EmptyText; arg_ainfo.savedarginfo = cgiarginfo::must; argsinfo.addarginfo (NULL, arg_ainfo); // "hd" history display - search history only displayed when // this var set to something other than 0 // this number of records is displayed arg_ainfo.shortname = "hd"; arg_ainfo.longname = "history display"; arg_ainfo.multiplechar = true; arg_ainfo.multiplevalue = false; arg_ainfo.defaultstatus = cgiarginfo::weak; arg_ainfo.argdefault = "0"; arg_ainfo.savedarginfo = cgiarginfo::must; argsinfo.addarginfo (NULL, arg_ainfo); // "hs" save - set to 1 in query form, so only save when submit // query // 0 = no save 1 = save arg_ainfo.shortname = "hs"; arg_ainfo.longname = "history save"; arg_ainfo.multiplechar = false; arg_ainfo.defaultstatus = cgiarginfo::weak; arg_ainfo.argdefault = "0"; arg_ainfo.savedarginfo = cgiarginfo::mustnot; argsinfo.addarginfo (NULL, arg_ainfo); } void basequeryaction::configure (const text_t &key, const text_tarray &cfgline) { action::configure (key, cfgline); } bool basequeryaction::init (ostream &logout) { return action::init (logout); } bool basequeryaction::check_cgiargs (cgiargsinfoclass &argsinfo, cgiargsclass &args, recptprotolistclass * /*protos*/, ostream &logout) { // check m argument int arg_m = args.getintarg("m"); if (arg_m < -1) { logout << "Warning: \"m\" argument less than -1 (" << arg_m << ")\n"; cgiarginfo *minfo = argsinfo.getarginfo ("m"); if (minfo != NULL) args["m"] = minfo->argdefault; } // check o argument int arg_o = args.getintarg("o"); if (arg_o < -1) { logout << "Warning: \"o\" argument less than -1 (" << arg_o << ")\n"; cgiarginfo *oinfo = argsinfo.getarginfo ("o"); if (oinfo != NULL) args["o"] = oinfo->argdefault; } // check r argument int arg_r = args.getintarg("r"); if (arg_r < 1) { logout << "Warning: \"r\" argument less than 1 (" << arg_r << ")\n"; cgiarginfo *rinfo = argsinfo.getarginfo ("r"); if (rinfo != NULL) args["r"] = rinfo->argdefault; } //check hd argument int arg_hd = args.getintarg("hd"); if (arg_hd <0 ) { logout << "Warning: \"hd\" argument less than 0 (" << arg_hd << ")\n"; cgiarginfo *hdinfo = argsinfo.getarginfo ("hd"); if (hdinfo != NULL) args["hd"] = hdinfo->argdefault; } //check hs argument int arg_hs = args.getintarg("hs"); if (arg_hs !=0 && arg_hs !=1) { logout << "Warning: \"hs\" argument out of range (" << arg_hs << ")\n"; cgiarginfo *hsinfo = argsinfo.getarginfo ("hs"); if (hsinfo != NULL) args["hs"] = hsinfo->argdefault; } return true; } void basequeryaction::get_cgihead_info (cgiargsclass &args, recptprotolistclass * /*protos*/, response_t &response, text_t &response_data, ostream &/*logout*/) { // If this is an "I'm feeling lucky" request, we don't know the target location until later if (!args["ifl"].empty()) { response = undecided_location; return; } response = content; response_data = "text/html"; } void basequeryaction::define_internal_macros (displayclass &disp, cgiargsclass &args, recptprotolistclass * protos, ostream &logout) { // The following macros are set later (in define_query_macros) as they can't be set until // the query has been done. // _quotedquery_ the part of the query string that was quoted for post-processing // _freqmsg_ the term frequency string // _resultline_ the "x documents matched the query" string // _prevfirst_ these are used when setting up the links to previous/next // _prevlast_ pages of results (_thisfirst_ and _thislast_ are used to set // _nextfirst_ the 'results x-x for query: xxxx' string in the title bar) // _nextlast_ // _thisfirst_ // _thislast_ define_form_macros(disp, args, protos, logout); } // define_query_macros sets the macros that couldn't be set until the // query had been done. Those macros are // _resultline_, _nextfirst_, _nextlast_, _prevfirst_, _prevlast_, // _thisfirst_, and _thislast_ and _quotedquery_ // this has been simplified so it can be used with both search_single_coll // and search_multiple_coll void basequeryaction::define_query_macros (cgiargsclass &args, displayclass &disp, int numdocs, isapprox isApprox) { // set up _resultline_ macro text_t resline; int maxdocs = args.getintarg("m"); if (maxdocs == -1) maxdocs = numdocs; else if (numdocs > maxdocs) { numdocs = maxdocs; isApprox = MoreThan; } if (isApprox == Approximate) resline = "_textapprox_"; else if (isApprox == MoreThan) resline = "_textmorethan_"; if (numdocs == 0) resline = "_textnodocs_"; else if (numdocs == 1) resline += "_text1doc_"; else resline += text_t(numdocs) + " _textlotsdocs_"; disp.setmacro("resultline", "query", resline); int firstdoc = args.getintarg("r"); int hitsperpage = args.getintarg("o"); if (hitsperpage == -1) hitsperpage = numdocs; // set up _thisfirst_ and _thislast_ macros disp.setmacro ("thisfirst", "query", firstdoc); int thislast = firstdoc + (hitsperpage - 1); if (thislast > numdocs) thislast = numdocs; disp.setmacro ("thislast", "query", thislast); // set up _prevfirst_ and _prevlast_ macros if (firstdoc > 1) { disp.setmacro ("prevlast", "query", firstdoc - 1); int prevfirst = firstdoc - hitsperpage; if (prevfirst < 1) prevfirst = 1; disp.setmacro ("prevfirst", "query", prevfirst); } // set up _nextfirst_ and _nextlast_ macros if (thislast < numdocs) { disp.setmacro ("nextfirst", "query", thislast + 1); int nextlast = thislast + hitsperpage; if (nextlast > numdocs) nextlast = numdocs; disp.setmacro ("nextlast", "query", nextlast); } } // sets the selection box macros such as: // _hselection_, _jselection_, _nselection_ _gselection_, _fqfselection_ void basequeryaction::set_option_macro (const text_t ¯oname, text_t current_value, bool display_single, bool add_js_update, const FilterOption_t &option, displayclass &disp) { if (option.validValues.empty()) return; if (option.validValues.size() == 1) { if (display_single) { disp.setmacro (macroname + "selection", displayclass::defaultpackage, "_" + option.defaultValue + "_"); } return; } if (option.validValues.size() < 2) return; text_t macrovalue = "