2007-07-30 08:09:15 +00:00
|
|
|
<?php
|
2010-02-24 14:45:19 +00:00
|
|
|
/**
|
2010-12-22 20:52:06 +00:00
|
|
|
*
|
2007-07-30 08:09:15 +00:00
|
|
|
*
|
2010-08-07 19:59:42 +00:00
|
|
|
* Created on July 30, 2007
|
|
|
|
|
*
|
2012-07-15 20:13:02 +00:00
|
|
|
* Copyright © 2007 Yuri Astrakhan "<Firstname><Lastname>@gmail.com"
|
2007-07-30 08:09:15 +00:00
|
|
|
*
|
|
|
|
|
* This program is free software; you can redistribute it and/or modify
|
|
|
|
|
* it under the terms of the GNU General Public License as published by
|
|
|
|
|
* the Free Software Foundation; either version 2 of the License, or
|
|
|
|
|
* (at your option) any later version.
|
|
|
|
|
*
|
|
|
|
|
* This program is distributed in the hope that it will be useful,
|
|
|
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
|
* GNU General Public License for more details.
|
|
|
|
|
*
|
|
|
|
|
* You should have received a copy of the GNU General Public License along
|
|
|
|
|
* with this program; if not, write to the Free Software Foundation, Inc.,
|
2010-06-21 13:13:32 +00:00
|
|
|
* 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
|
2007-07-30 08:09:15 +00:00
|
|
|
* http://www.gnu.org/copyleft/gpl.html
|
2010-08-07 19:59:42 +00:00
|
|
|
*
|
|
|
|
|
* @file
|
2007-07-30 08:09:15 +00:00
|
|
|
*/
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Query module to perform full text search within wiki titles and content
|
2008-04-14 07:45:50 +00:00
|
|
|
*
|
WARNING: HUGE COMMIT
Doxygen documentation update:
* Changed all @addtogroup to @ingroup. @addtogroup adds the comment to the group description, but doesn't add the file, class, function, ... to the group like @ingroup does. See for example http://svn.wikimedia.org/doc/group__SpecialPage.html where it's impossible to see related files, classes, ... that should belong to that group.
* Added @file to file descriptions; it seems that it must be explicitly declared for file descriptions, otherwise doxygen will think that the comment documents the first class, variable, function, ... that is in that file.
* Removed some empty comments
* Removed some ?>
Added following groups:
* ExternalStorage
* JobQueue
* MaintenanceLanguage
One more thing: there are still a lot of warnings when generating the doc.
2008-05-20 17:13:28 +00:00
|
|
|
* @ingroup API
|
2007-07-30 08:09:15 +00:00
|
|
|
*/
|
|
|
|
|
class ApiQuerySearch extends ApiQueryGeneratorBase {
|
|
|
|
|
|
2013-07-31 18:33:57 +00:00
|
|
|
/**
 * Placeholder name offered for the 'backend' parameter when the first
 * configured search type is null (i.e. $wgSearchType is null, which makes
 * $wgSearchAlternatives[0] null as well).
 *
 * A PARAM_TYPE array cannot contain null, so this made-up label -- which
 * cannot collide with a real class name and hints at what the null
 * behaviour does -- is listed instead.
 */
const BACKEND_NULL_PARAM = 'database-backed';
|
|
|
|
|
|
2009-08-25 20:18:12 +00:00
|
|
|
/**
 * Set up the module with the 'sr' parameter prefix.
 *
 * @param mixed $query Passed through unchanged to the parent constructor
 * @param string $moduleName Passed through unchanged to the parent constructor
 */
public function __construct( $query, $moduleName ) {
	$paramPrefix = 'sr';
	parent::__construct( $query, $moduleName, $paramPrefix );
}
|
|
|
|
|
|
|
|
|
|
/**
 * Entry point for list mode: run the search without a page set, so the
 * results are written to the API result.
 */
public function execute() {
	$this->run( null );
}
|
|
|
|
|
|
2009-08-25 20:18:12 +00:00
|
|
|
/**
 * Entry point for generator mode: run the search and hand the matching
 * titles to the supplied page set.
 *
 * @param ApiPageSet $resultPageSet Page set that receives the found titles
 */
public function executeGenerator( $resultPageSet ) {
	$pageSet = $resultPageSet;
	$this->run( $pageSet );
}
|
|
|
|
|
|
2011-02-19 00:30:18 +00:00
|
|
|
/**
 * Run the search and output what was found.
 *
 * In list mode ($resultPageSet is null) every hit is added to the API
 * result together with the properties requested through 'prop', search
 * metadata requested through 'info' is added under 'searchinfo', and, if
 * 'interwiki' is set and the backend has them, interwiki hits are added
 * as well. In generator mode only the titles of the hits are collected
 * and passed to the page set.
 *
 * Dies with a usage error when the requested kind of search is disabled
 * (the backend returned null) or when the backend returned a Status that
 * is not good.
 *
 * @param ApiPageSet $resultPageSet Page set to populate in generator mode,
 *   or null in list mode
 * @return void
 */
private function run( $resultPageSet = null ) {
	global $wgContLang;
	$params = $this->extractRequestParams();

	// Extract parameters
	$limit = $params['limit'];
	$query = $params['search'];
	$what = $params['what'];
	$interwiki = $params['interwiki'];
	// Flipped so that membership can be tested with isset()
	$searchInfo = array_flip( $params['info'] );
	$prop = array_flip( $params['prop'] );

	// Create search engine instance and set options
	$useNamedBackend = isset( $params['backend'] )
		&& $params['backend'] !== self::BACKEND_NULL_PARAM;
	$search = $useNamedBackend
		? SearchEngine::create( $params['backend'] )
		: SearchEngine::create();
	// Request one result more than the limit; the extra one only signals
	// that a continuation is available
	$search->setLimitOffset( $limit + 1, $params['offset'] );
	$search->setNamespaces( $params['namespace'] );

	$query = $search->transformSearchTerm( $query );
	$query = $search->replacePrefixes( $query );

	// Perform the actual search
	if ( $what === 'text' ) {
		$matches = $search->searchText( $query );
	} elseif ( $what === 'title' ) {
		$matches = $search->searchTitle( $query );
	} elseif ( $what === 'nearmatch' ) {
		$matches = SearchEngine::getNearMatchResultSet( $query );
	} else {
		// We default to title searches; this is a terrible legacy
		// of the way we initially set up the MySQL fulltext-based
		// search engine with separate title and text fields.
		// In the future, the default should be for a combined index.
		$what = 'title';
		$matches = $search->searchTitle( $query );

		// Not all search engines support a separate title search,
		// for instance the Lucene-based engine we use on Wikipedia.
		// In this case, fall back to full-text search (which will
		// include titles in it!)
		if ( $matches === null ) {
			$what = 'text';
			$matches = $search->searchText( $query );
		}
	}
	if ( $matches === null ) {
		$this->dieUsage( "{$what} search is disabled", "search-{$what}-disabled" );
	} elseif ( $matches instanceof Status && !$matches->isGood() ) {
		$this->dieUsage( $matches->getWikiText(), 'search-error' );
	}

	$apiResult = $this->getResult();
	// Add search meta data to result
	if ( isset( $searchInfo['totalhits'] ) ) {
		$totalhits = $matches->getTotalHits();
		if ( $totalhits !== null ) {
			$apiResult->addValue( array( 'query', 'searchinfo' ),
				'totalhits', $totalhits );
		}
	}
	if ( isset( $searchInfo['suggestion'] ) && $matches->hasSuggestion() ) {
		$apiResult->addValue( array( 'query', 'searchinfo' ),
			'suggestion', $matches->getSuggestionQuery() );
	}

	// Add the search results to the result
	$terms = $wgContLang->convertForSearchResult( $matches->termMatches() );
	$titles = array();
	$count = 0;
	$result = $matches->next();

	while ( $result ) {
		if ( ++$count > $limit ) {
			// We've reached the one extra which shows that there are
			// additional items to be had. Stop here...
			$this->setContinueEnumParameter( 'offset', $params['offset'] + $params['limit'] );
			break;
		}

		// Silently skip broken and missing titles. They have already been
		// counted above, so they still use up one slot of the limit.
		if ( $result->isBrokenTitle() || $result->isMissingRevision() ) {
			$result = $matches->next();
			continue;
		}

		$title = $result->getTitle();
		if ( $resultPageSet === null ) {
			$vals = array();
			ApiQueryBase::addTitleInfo( $vals, $title );

			if ( isset( $prop['snippet'] ) ) {
				$vals['snippet'] = $result->getTextSnippet( $terms );
			}
			if ( isset( $prop['size'] ) ) {
				$vals['size'] = $result->getByteSize();
			}
			if ( isset( $prop['wordcount'] ) ) {
				$vals['wordcount'] = $result->getWordCount();
			}
			if ( isset( $prop['timestamp'] ) ) {
				$vals['timestamp'] = wfTimestamp( TS_ISO_8601, $result->getTimestamp() );
			}
			if ( isset( $prop['score'] ) ) {
				// Only emitted when the backend actually supplies a score
				$score = $result->getScore();
				if ( $score !== null ) {
					$vals['score'] = $score;
				}
			}
			if ( isset( $prop['titlesnippet'] ) ) {
				$vals['titlesnippet'] = $result->getTitleSnippet( $terms );
			}

			$redirectTitle = $result->getRedirectTitle();
			if ( $redirectTitle !== null ) {
				if ( isset( $prop['redirecttitle'] ) ) {
					// NOTE(review): stored exactly as returned, whereas
					// sectiontitle below is reduced with getFragment();
					// confirm this value serializes as the intended string.
					$vals['redirecttitle'] = $redirectTitle;
				}
				if ( isset( $prop['redirectsnippet'] ) ) {
					$vals['redirectsnippet'] = $result->getRedirectSnippet( $terms );
				}
			}

			$sectionTitle = $result->getSectionTitle();
			if ( $sectionTitle !== null ) {
				if ( isset( $prop['sectiontitle'] ) ) {
					$vals['sectiontitle'] = $sectionTitle->getFragment();
				}
				if ( isset( $prop['sectionsnippet'] ) ) {
					$vals['sectionsnippet'] = $result->getSectionSnippet();
				}
			}

			if ( isset( $prop['hasrelated'] ) && $result->hasRelated() ) {
				$vals['hasrelated'] = '';
			}

			// Add item to results and see whether it fits
			$fit = $apiResult->addValue( array( 'query', $this->getModuleName() ),
				null, $vals );
			if ( !$fit ) {
				// The current item was not added, so continue from it:
				// $count - 1 items of this batch have been consumed.
				$this->setContinueEnumParameter( 'offset', $params['offset'] + $count - 1 );
				break;
			}
		} else {
			$titles[] = $title;
		}

		$result = $matches->next();
	}

	$hasInterwikiResults = false;
	if ( $interwiki && $resultPageSet === null && $matches->hasInterwikiResults() ) {
		// From here on $matches refers to the interwiki result set
		$matches = $matches->getInterwikiResults();
		$hasInterwikiResults = true;

		// Include number of results if requested
		if ( isset( $searchInfo['totalhits'] ) ) {
			$totalhits = $matches->getTotalHits();
			if ( $totalhits !== null ) {
				$apiResult->addValue( array( 'query', 'interwikisearchinfo' ),
					'totalhits', $totalhits );
			}
		}

		$result = $matches->next();
		while ( $result ) {
			$title = $result->getTitle();
			$vals = array(
				'namespace' => $result->getInterwikiNamespaceText(),
				'title' => $title->getText(),
				'url' => $title->getFullUrl(),
			);

			// Add item to results and see whether it fits
			$fit = $apiResult->addValue(
				array( 'query', 'interwiki' . $this->getModuleName(), $result->getInterwikiPrefix() ),
				null,
				$vals
			);

			if ( !$fit ) {
				// We hit the limit. We can't really provide any meaningful
				// pagination info so just bail out
				break;
			}

			$result = $matches->next();
		}
	}

	if ( $resultPageSet === null ) {
		$apiResult->setIndexedTagName_internal( array(
			'query', $this->getModuleName()
		), 'p' );
		if ( $hasInterwikiResults ) {
			$apiResult->setIndexedTagName_internal( array(
				'query', 'interwiki' . $this->getModuleName()
			), 'p' );
		}
	} else {
		$resultPageSet->populateFromTitles( $titles );
	}
}
|
|
|
|
|
|
2010-07-23 07:17:56 +00:00
|
|
|
/**
 * Report the cache mode of this module.
 *
 * @param array $params Request parameters; not consulted
 * @return string Always 'public'
 */
public function getCacheMode( $params ) {
	$mode = 'public';

	return $mode;
}
|
|
|
|
|
|
2008-01-28 19:05:26 +00:00
|
|
|
/**
 * Describe the parameters this module accepts.
 *
 * The 'backend' parameter is only offered when
 * SearchEngine::getSearchTypes() reports more than one search type; a
 * null first entry in that list is presented as self::BACKEND_NULL_PARAM.
 *
 * @return array Parameter definitions keyed by parameter name
 */
public function getAllowedParams() {
	global $wgSearchType;

	// Allowed values of the enumerated parameters
	$whatValues = array(
		'title',
		'text',
		'nearmatch',
	);
	$infoValues = array(
		'totalhits',
		'suggestion',
	);
	$propValues = array(
		'size',
		'wordcount',
		'timestamp',
		'score',
		'snippet',
		'titlesnippet',
		'redirecttitle',
		'redirectsnippet',
		'sectiontitle',
		'sectionsnippet',
		'hasrelated',
	);

	$allowed = array(
		'search' => array(
			ApiBase::PARAM_TYPE => 'string',
			ApiBase::PARAM_REQUIRED => true
		),
		'namespace' => array(
			ApiBase::PARAM_DFLT => NS_MAIN,
			ApiBase::PARAM_TYPE => 'namespace',
			ApiBase::PARAM_ISMULTI => true,
		),
		'what' => array(
			ApiBase::PARAM_DFLT => null,
			ApiBase::PARAM_TYPE => $whatValues
		),
		'info' => array(
			ApiBase::PARAM_DFLT => 'totalhits|suggestion',
			ApiBase::PARAM_TYPE => $infoValues,
			ApiBase::PARAM_ISMULTI => true,
		),
		'prop' => array(
			ApiBase::PARAM_DFLT => 'size|wordcount|timestamp|snippet',
			ApiBase::PARAM_TYPE => $propValues,
			ApiBase::PARAM_ISMULTI => true,
		),
		'offset' => 0,
		'limit' => array(
			ApiBase::PARAM_DFLT => 10,
			ApiBase::PARAM_TYPE => 'limit',
			ApiBase::PARAM_MIN => 1,
			ApiBase::PARAM_MAX => ApiBase::LIMIT_SML1,
			ApiBase::PARAM_MAX2 => ApiBase::LIMIT_SML2
		),
		'interwiki' => false,
	);

	$backends = SearchEngine::getSearchTypes();
	if ( count( $backends ) <= 1 ) {
		// Nothing to choose between, so no 'backend' parameter
		return $allowed;
	}

	if ( $backends[0] === null ) {
		// null is not a valid PARAM_TYPE entry; show the placeholder instead
		$backends[0] = self::BACKEND_NULL_PARAM;
	}
	$allowed['backend'] = array(
		ApiBase::PARAM_DFLT => $wgSearchType,
		ApiBase::PARAM_TYPE => $backends,
	);

	return $allowed;
}
|
|
|
|
|
|
2008-01-28 19:05:26 +00:00
|
|
|
/**
 * Provide the help text for each parameter.
 *
 * The 'backend' entry is only included when
 * SearchEngine::getSearchTypes() reports more than one search type.
 *
 * @return array Help text (string or list of lines) keyed by parameter name
 */
public function getParamDescription() {
	// One line per value accepted by 'prop'
	$propHelp = array(
		'What properties to return',
		' size - Adds the size of the page in bytes',
		' wordcount - Adds the word count of the page',
		' timestamp - Adds the timestamp of when the page was last edited',
		' score - Adds the score (if any) from the search engine',
		' snippet - Adds a parsed snippet of the page',
		' titlesnippet - Adds a parsed snippet of the page title',
		' redirectsnippet - Adds a parsed snippet of the redirect title',
		' redirecttitle - Adds the title of the matching redirect',
		' sectionsnippet - Adds a parsed snippet of the matching section title',
		' sectiontitle - Adds the title of the matching section',
		' hasrelated - Indicates whether a related search is available',
	);

	$help = array(
		'search' => 'Search for all page titles (or content) that has this value',
		'namespace' => 'The namespace(s) to enumerate',
		'what' => 'Search inside the text or titles',
		'info' => 'What metadata to return',
		'prop' => $propHelp,
		'offset' => 'Use this value to continue paging (return by query)',
		'limit' => 'How many total pages to return',
		'interwiki' => 'Include interwiki results in the search, if available'
	);

	$backendCount = count( SearchEngine::getSearchTypes() );
	if ( $backendCount > 1 ) {
		$help['backend'] = 'Which search backend to use, if not the default';
	}

	return $help;
}
|
|
|
|
|
|
Added result properties to action=paraminfo
Added information about the properties of the results of API calls
to action=paraminfo, including information about "property groups":
what should the prop parameter be set to to get that property.
Uses the same format for types as parameters already do.
The output format of some modules doesn't fit this, so the result
properties for them weren't added, or only partially.
Partially implemented modules:
* expandtemplates:
parsetree is in its own tag
* protect, allusers, backlinks, deletedrevs, info, imageinfo,
logevents, querypage, recentchanges, revisions, searchinfo,
usercontribs, userinfo, users, watchlist, upload:
response with partially complex structure
Not implemented modules:
* feedcontributions, feedwatchlist, opensearch, rds:
non-standard response
* help:
error is normal response; not very useful for automated tools anyway
* paraminfo, parse, pageprops, siteinfo, userrights:
response with complex structure
Change-Id: Iff2a9bef79f994e73eef3062b4dd5461bff968ab
2012-05-02 15:00:30 +00:00
|
|
|
/**
 * Describe the properties of a single search result, grouped by the
 * 'prop' value that enables them. The group with the empty key lists
 * the properties declared without a 'prop' value.
 *
 * @return array Property type descriptions keyed by property group
 */
public function getResultProperties() {
	// Descriptor shared by every string property that may be absent
	$nullableString = array(
		ApiBase::PROP_TYPE => 'string',
		ApiBase::PROP_NULLABLE => true
	);

	$properties = array();
	$properties[''] = array(
		'ns' => 'namespace',
		'title' => 'string'
	);
	$properties['snippet'] = array( 'snippet' => 'string' );
	$properties['size'] = array( 'size' => 'integer' );
	$properties['wordcount'] = array( 'wordcount' => 'integer' );
	$properties['timestamp'] = array( 'timestamp' => 'timestamp' );
	$properties['score'] = array( 'score' => $nullableString );
	$properties['titlesnippet'] = array( 'titlesnippet' => 'string' );
	$properties['redirecttitle'] = array( 'redirecttitle' => $nullableString );
	$properties['redirectsnippet'] = array( 'redirectsnippet' => $nullableString );
	$properties['sectiontitle'] = array( 'sectiontitle' => $nullableString );
	$properties['sectionsnippet'] = array( 'sectionsnippet' => $nullableString );
	$properties['hasrelated'] = array( 'hasrelated' => 'boolean' );

	return $properties;
}
|
|
|
|
|
|
2008-01-28 19:05:26 +00:00
|
|
|
/**
 * Give the one-line summary of this module.
 *
 * @return string
 */
public function getDescription() {
	$summary = 'Perform a full text search.';

	return $summary;
}
|
2010-02-24 14:45:19 +00:00
|
|
|
|
2010-02-13 01:28:26 +00:00
|
|
|
/**
 * List the errors this module can raise: those reported by the parent
 * class followed by the search-specific ones.
 *
 * @return array List of arrays with 'code' and 'info' entries
 */
public function getPossibleErrors() {
	$searchErrors = array(
		array( 'code' => 'search-text-disabled', 'info' => 'text search is disabled' ),
		array( 'code' => 'search-title-disabled', 'info' => 'title search is disabled' ),
		array( 'code' => 'search-error', 'info' => 'search error has occurred' ),
	);
	$inherited = parent::getPossibleErrors();

	return array_merge( $inherited, $searchErrors );
}
|
2007-07-30 08:09:15 +00:00
|
|
|
|
2011-08-17 22:24:21 +00:00
|
|
|
/**
 * Give sample requests: a default search, an explicit text search, and
 * use of the module as a generator.
 *
 * @return array List of example request URLs
 */
public function getExamples() {
	$examples = array();
	$examples[] = 'api.php?action=query&list=search&srsearch=meaning';
	$examples[] = 'api.php?action=query&list=search&srwhat=text&srsearch=meaning';
	$examples[] = 'api.php?action=query&generator=search&gsrsearch=meaning&prop=info';

	return $examples;
}
|
|
|
|
|
|
2011-07-17 17:02:06 +00:00
|
|
|
/**
 * Point to the online documentation of this module.
 *
 * @return string Documentation URL
 */
public function getHelpUrls() {
	$docUrl = 'https://www.mediawiki.org/wiki/API:Search';

	return $docUrl;
}
|
2009-08-26 21:13:06 +00:00
|
|
|
}
|