10.000.000)"
 *   "(is_a::city or is_a::country) and population < 10.000.000"
 *
 * Subqueries, with variables bound to the matching pagename, with (for ...):
 *   "works_at::_organization
 *     and (for _organization located_in::_city
 *          and (for _city population>1000000))"
 *
 *   "works_at::_organization
 *     and (for _organization
 *            (located_in::_city
 *              and (for _city is_a::City
 *                    and population>1000000))
 *            or (located_in::_country
 *              and (for _country is_a::Country and population>5000000)))"
 *
 * Relation links may contain wildcards. For relation and attribute names I'm not sure yet.
 *
 * @author: Reini Urban
 */
class WikiPlugin_SemanticSearchAdvanced
    extends WikiPlugin_SemanticSearch
{
    /** @var array Comparison operators recognised in query expressions; filled in by run(). */
    public $_supported_operators;

    /**
     * One-line, translated description of the plugin.
     *
     * @return string
     */
    function getDescription()
    {
        return _("Parse and execute a full query expression.");
    }

    /**
     * Default plugin arguments: everything PageList supports, plus the
     * query-specific arguments of this plugin.
     *
     * @return array argument name => default value
     */
    function getDefaultArguments()
    {
        return array_merge
        (
            PageList::supportedArgs(), // paging and more.
            array(
                's' => "", // query expression
                'page' => "*", // which pages (glob allowed), default: all
                'case_exact' => false,
                'regex' => 'auto', // hmm
                'noform' => false, // don't show form with results.
                'noheader' => false // no caption
            ));
    }

    /**
     * Build the search form: a page filter input, a help button, the query
     * textarea (with autocompletion fed from the known relation names) and
     * the submit button.
     *
     * @param WikiDB $dbi          not used by this method
     * @param WikiRequest $request supplies the post URL and the current args
     * @param array $args          plugin arguments; 'page' and 's' prefill the form
     * @param array $allrelations  known relation names offered for autocompletion
     * @return mixed the form element built by HTML::form()
     */
    function showForm(&$dbi, &$request, $args, $allrelations)
    {
        $action = $request->getPostURL();
        // Carry over every current request argument except the ones the form sets itself.
        $hiddenfield = HiddenInputs($request->getArgs(), '',
            array('action', 'page', 's'));
        $pagefilter = HTML::input(array('name' => 'page',
                'value' => $args['page'],
                'title' => _("Search only in these pages. With autocompletion."),
                'class' => 'dropdown',
                'acdropdown' => 'true',
                'autocomplete_complete' => 'true',
                'autocomplete_matchsubstring' => 'false',
                'autocomplete_list' => 'xmlrpc:wiki.titleSearch ^[S] 4'
            ), '');
        $help = Button('submit:semsearch[help]', "?", false);
        // NOTE(review): relation names are concatenated unescaped into a
        // JavaScript string literal; a name containing a single quote would
        // break the generated script. Confirm what listRelations() can return.
        $svalues = empty($allrelations) ? "" : join("','", $allrelations);
        $reldef = JavaScript("var semsearch_relations = new Array('" . $svalues . "')");
        $querybox = HTML::textarea(array('name' => 's',
                'title' => _("Enter a valid query expression"),
                'rows' => 4,
                'acdropdown' => 'true',
                'autocomplete_complete' => 'true',
                'autocomplete_assoc' => 'false',
                'autocomplete_matchsubstring' => 'true',
                'autocomplete_list' => 'array:semsearch_relations'
            ), $args['s']);
        // NOTE(review): this title text describes the help button, not the
        // search button; left unchanged because it is user-visible output.
        $submit = Button('submit:semsearch[relations]', _("Search"),
            false,
            array('title' => 'Move to help page. No separate window'));
        $instructions = _("Search in all specified pages for the expression.");
        $form = HTML::form(array('action' => $action,
                'method' => 'post',
                'accept-charset' => 'UTF-8'),
            $reldef,
            $hiddenfield, HiddenInputs(array('attribute' => '')),
            $instructions, HTML::br(),
            HTML::table(array('class' => 'fullwidth'),
                HTML::tr(HTML::td(_("Page Name")._(': '), $pagefilter),
                    HTML::td(array('class' => 'align-right'),
                        $help)),
                HTML::tr(HTML::td(array('colspan' => 2),
                    $querybox))),
            HTML::br(),
            HTML::div(array('class' => 'align-center'), $submit));
        return $form;
    }

    /**
     * Execute the plugin: show the form, and if a query expression was given,
     * search the link table for the relations named in it.
     *
     * @param WikiDB $dbi
     * @param string $argstr
     * @param WikiRequest $request
     * @param string $basepage
     * @return mixed the bare form (no query), the result of $this->error()
     *               (query names no relation), or a PageList
     */
    function run($dbi, $argstr, &$request, $basepage)
    {
        $this->_supported_operators = array(':=', '<', '<=', '>', '>=', '!=', '==', '=~');
        $args = $this->getArgs($argstr, $request);
        $posted = $request->getArg('semsearch');
        $request->setArg('semsearch', false);
        if ($request->isPost() and isset($posted['help'])) {
            $request->redirect(WikiURL(__("Help")."/".__("SemanticSearchAdvancedPlugin"),
                array('redirectfrom' => $basepage), true));
        }
        $allrelations = $dbi->listRelations();
        $form = $this->showForm($dbi, $request, $args, $allrelations);
        if (isset($this->_norelations_warning))
            $form->pushContent(HTML::div(array('class' => 'warning'),
                _("Warning:") . $this->_norelations_warning));

        // Pull out only the arguments used below. A blanket extract($args)
        // could silently overwrite locals such as $form or $allrelations.
        $s = $args['s'];
        $page = $args['page'];
        $noform = $args['noform'];
        $noheader = $args['noheader'];

        // For convenience, peace and harmony we allow GET requests also.
        if (!$s) // check for good GET request
            return $form; // nobody called us, so just display our form

        // In reality we have to iterate over all found pages.
        // To makes things shorter extract the next AND required expr and
        // iterate only over this, then recurse into the next AND expr.
        // => Split into an AND and OR expression tree.

        $parsed_relations = $this->detectRelationsAndAttributes($s);
        if (!$parsed_relations) {
            // Hand the error back to the caller instead of discarding it and
            // searching with an empty relation list.
            return $this->error("Invalid query: No relations or attributes in the query $s found");
        }
        // Relation names containing glob wildcards cannot be checked for
        // existence by a plain array comparison.
        $regex = preg_grep("/[\*\?]/", $parsed_relations);

        $pagelist = new PageList($args['info'], $args['exclude'], $args);
        if (!$noheader) {
            $pagelist->setCaption
            (HTML($noform ? '' : HTML($form, HTML::hr()),
                fmt("Semantic %s Search Result for \"%s\" in pages \"%s\"",
                    '', $s, $page)));
        }

        // Without wildcards every named relation must exist; otherwise the
        // result is necessarily empty.
        if (!$regex and array_diff($parsed_relations, $allrelations))
            return $pagelist;
        $relquery = new TextSearchQuery(join(" ", $parsed_relations));
        if (!$relquery->match(join(" ", $allrelations)))
            return $pagelist;
        $pagequery = new TextSearchQuery($page, $args['case_exact'], $args['regex']);
        // if we have only numeric or text ops we can optimize.
        //$parsed_attr_ops = $this->detectAttrOps($args['s']);

        //TODO: writeme
        $linkquery = new TextSearchQuery($s, $args['case_exact'], $args['regex']);
        $links = $dbi->linkSearch($pagequery, $linkquery, 'relation', $relquery);
        $pagelist->_links = array();
        while ($link = $links->next()) {
            $pagelist->addPage($link['pagename']);
            $pagelist->_links[] = $link;
        }
        $pagelist->addColumnObject
        (new _PageList_Column_SemanticSearch_relation('relation', _("Relation"), $pagelist));
        $pagelist->addColumnObject
        (new _PageList_Column_SemanticSearch_link('link', _("Link"), $pagelist));

        return $pagelist;
    }

    // ... (for _variable subquery) ...
    /**
     * Placeholder for binding "(for _variable subquery)" expressions.
     * Not implemented yet; returns nothing.
     *
     * @param string $query
     */
    function bindSubquery($query)
    {
    }

    /**
     * Collect the relation names used in a query expression.
     *
     * Example:
     *   is_a::city* and (population < 1.000.000 or population > 10.000.000)
     *   => array('is_a')
     * Relation names may contain the wildcards * and ? (e.g. is_*::city).
     * A token may be preceded by opening parentheses, as in "(is_a::city".
     * Attribute names (e.g. "population") are not detected yet.
     *
     * @param string $subquery query expression or part of one
     * @return array relation names in order of appearance (may contain duplicates)
     */
    function detectRelationsAndAttributes($subquery)
    {
        $relations = array();
        // relations are easy: every whitespace-separated token "name::target"
        foreach (preg_split('/\s+/', (string)$subquery) as $whitetok) {
            // Skip leading "(" so grouped expressions are recognised too.
            if (preg_match('/^\(*([\w\*\?]+)::/', $whitetok, $m))
                $relations[] = $m[1];
        }
        return $relations;
        // for attributes we might use the tokenizer. All non-numerics excl. units and non-ops
    }
}

// Local Variables:
// mode: php
// tab-width: 8
// c-basic-offset: 4
// c-hanging-comment-ender-p: nil
// indent-tabs-mode: nil
// End: