Bug: T231636 Depends-On: I2cd24e73726394e3200a570c45d5e86b6849bfa9 Depends-On: I4fa3e6aad872434ca397325ed7a83f94973661d0 Change-Id: Ie6233561de78457cae5e4e44e220feec2d1272d8
386 lines
11 KiB
PHP
386 lines
11 KiB
PHP
<?php
|
||
/**
 * Copyright © 2006 Yuri Astrakhan "<Firstname><Lastname>@gmail.com"
 * Copyright © 2008 Brion Vibber <brion@wikimedia.org>
 * Copyright © 2014 Wikimedia Foundation and contributors
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License along
 * with this program; if not, write to the Free Software Foundation, Inc.,
 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
 * http://www.gnu.org/copyleft/gpl.html
 *
 * @file
 */
|
||
|
||
use MediaWiki\MediaWikiServices;
|
||
|
||
/**
|
||
* @ingroup API
|
||
*/
|
||
class ApiOpenSearch extends ApiBase {
|
||
use SearchApi;
|
||
|
||
/** @var string|null Output format without any 'fm' suffix; null until getFormat() has run */
private $format;

/** @var string|null 'fm' for a pretty-printed format, '' otherwise; null until getFormat() has run */
private $fm;

/** @var array|null Cached list of allowed API params; null until getAllowedParams() has run */
private $allowedParams;
|
||
|
||
/**
 * Get the output format.
 *
 * The requested 'format' value is checked against the values this module
 * allows and replaced by the module default when it is not among them.
 * A trailing 'fm' is split off and remembered in $this->fm. The outcome is
 * memoised, so the request parameters are only inspected on the first call.
 *
 * @return string Format name with any 'fm' suffix removed
 */
protected function getFormat() {
	if ( $this->format !== null ) {
		return $this->format;
	}

	$requested = $this->extractRequestParams()['format'];

	$formatSpec = $this->getAllowedParams()['format'];
	if ( !in_array( $requested, $formatSpec[ApiBase::PARAM_TYPE] ) ) {
		$requested = $formatSpec[ApiBase::PARAM_DFLT];
	}

	$isPretty = substr( $requested, -2 ) === 'fm';
	$this->format = $isPretty ? substr( $requested, 0, -2 ) : $requested;
	$this->fm = $isPretty ? 'fm' : '';

	return $this->format;
}
|
||
|
||
/**
 * Create the printer that matches the requested output format.
 *
 * 'json' gets the OpenSearch specific JSON printer; 'xml' gets the main
 * module's XML printer with its root element renamed to 'SearchSuggestion'.
 * Any other format is reported through ApiBase::dieDebug().
 *
 * @return ApiOpenSearchFormatJson|ApiFormatXML
 */
public function getCustomPrinter() {
	$format = $this->getFormat();

	if ( $format === 'json' ) {
		return new ApiOpenSearchFormatJson(
			$this->getMain(),
			$this->fm,
			$this->getParameter( 'warningsaserror' )
		);
	}

	if ( $format === 'xml' ) {
		$printer = $this->getMain()->createPrinterByName( 'xml' . $this->fm );
		'@phan-var ApiFormatXML $printer';
		$printer->setRootElement( 'SearchSuggestion' );

		return $printer;
	}

	ApiBase::dieDebug( __METHOD__, "Unsupported format '{$this->getFormat()}'" );
}
|
||
|
||
/**
 * Run the search and write its results into the API result.
 *
 * The search is skipped, leaving the result list empty, when the request
 * sets 'suggest' while the EnableOpenSearchSuggest setting is off.
 * Otherwise the response is marked publicly cacheable, the
 * ApiOpenSearchSuggest hook gets a chance to fill in extracts and images,
 * and untrimmed string extracts are shortened.
 */
public function execute() {
	$params = $this->extractRequestParams();
	$search = $params['search'];
	$suggest = $params['suggest'];
	$results = [];
	if ( !$suggest || $this->getConfig()->get( 'EnableOpenSearchSuggest' ) ) {
		// Open search results may be stored for a very long time
		$this->getMain()->setCacheMaxAge( $this->getConfig()->get( 'SearchSuggestCacheExpiry' ) );
		$this->getMain()->setCacheMode( 'public' );
		$results = $this->search( $search, $params );

		// Allow hooks to populate extracts and images
		Hooks::run( 'ApiOpenSearchSuggest', [ &$results ] );

		// Trim extracts, if necessary
		$length = $this->getConfig()->get( 'OpenSearchDescriptionLength' );
		foreach ( $results as &$r ) {
			// @phan-suppress-next-line PhanTypeInvalidDimOffset
			if ( is_string( $r['extract'] ) && !$r['extract trimmed'] ) {
				$r['extract'] = self::trimExtract( $r['extract'], $length );
			}
		}
		// A by-reference foreach leaves $r aliased to the last element of
		// $results. Break that alias before the array is passed on, so no
		// later write to $r can silently modify the final result row.
		unset( $r );
	}

	// Populate result object
	$this->populateResult( $search, $results );
}
|
||
|
||
/**
 * Perform the search
 *
 * Titles returned by the completion search are turned into result rows.
 * When redirects are resolved, each redirect is replaced by its target and
 * every target is listed only once.
 *
 * @param string $search the search query
 * @param array $params api request params
 * @return array search results. Keys are integers.
 * @phan-return array<array{title:Title,redirect_from:?Title,extract:false,extract_trimmed:false,image:false,url:string}>
 * Note that phan annotations don't support keys containing a space.
 */
private function search( $search, array $params ) {
	$engine = $this->buildSearchEngine( $params );
	$titles = $engine->extractTitles( $engine->completionSearchWithVariants( $search ) );
	$results = [];

	if ( !$titles ) {
		return $results;
	}

	// Titles without an article id (such as special pages) still need a
	// unique integer key in the result list. They are numbered downwards
	// from -1, which cannot clash with the always positive article ids.
	$nextSpecialPageId = -1;

	// Backwards compatibility: when 'redirects' was not given, resolve
	// redirects for every format except JSON.
	$redirectMode = $params['redirects'];
	$resolveRedir = $redirectMode === null
		? $this->getFormat() !== 'json'
		: $redirectMode === 'resolve';

	if ( !$resolveRedir ) {
		foreach ( $titles as $title ) {
			$resultId = $title->getArticleID();
			if ( $resultId === 0 ) {
				$resultId = $nextSpecialPageId--;
			}
			$results[$resultId] = [
				'title' => $title,
				'redirect from' => null,
				'extract' => false,
				'extract trimmed' => false,
				'image' => false,
				'url' => wfExpandUrl( $title->getFullURL(), PROTO_CURRENT ),
			];
		}

		return $results;
	}

	// Query for redirects: map namespace => dbkey => [ target ns, target dbkey ]
	$redirects = [];
	$batch = new LinkBatch( $titles );
	if ( !$batch->isEmpty() ) {
		$db = $this->getDB();
		$conds = [
			'rd_from = page_id',
			'rd_interwiki IS NULL OR rd_interwiki = ' . $db->addQuotes( '' ),
			$batch->constructSet( 'page', $db ),
		];
		$rows = $db->select(
			[ 'page', 'redirect' ],
			[ 'page_namespace', 'page_title', 'rd_namespace', 'rd_title' ],
			$conds,
			__METHOD__
		);
		foreach ( $rows as $row ) {
			$redirects[$row->page_namespace][$row->page_title] =
				[ $row->rd_namespace, $row->rd_title ];
		}
	}

	// Bypass any redirects
	$seen = [];
	foreach ( $titles as $title ) {
		$ns = $title->getNamespace();
		$dbkey = $title->getDBkey();
		$from = null;
		if ( isset( $redirects[$ns][$dbkey] ) ) {
			list( $ns, $dbkey ) = $redirects[$ns][$dbkey];
			$from = $title;
			$title = Title::makeTitle( $ns, $dbkey );
		}

		// Each target is reported once, for the first title that led to it
		if ( isset( $seen[$ns][$dbkey] ) ) {
			continue;
		}
		$seen[$ns][$dbkey] = true;

		$resultId = $title->getArticleID();
		if ( $resultId === 0 ) {
			$resultId = $nextSpecialPageId--;
		}
		$results[$resultId] = [
			'title' => $title,
			'redirect from' => $from,
			'extract' => false,
			'extract trimmed' => false,
			'image' => false,
			'url' => wfExpandUrl( $title->getFullURL(), PROTO_CURRENT ),
		];
	}

	return $results;
}
|
||
|
||
/**
 * Write the search outcome into the API result, laid out for the active
 * output format.
 *
 * JSON output is a four element list: the query, the titles, the
 * descriptions and the URLs. XML output carries one 'Item' per result
 * inside a 'Section' element. Any other format is reported through
 * ApiBase::dieDebug().
 *
 * @param string $search
 * @param array &$results
 */
protected function populateResult( $search, &$results ) {
	$apiResult = $this->getResult();
	$format = $this->getFormat();

	if ( $format === 'json' ) {
		// http://www.opensearch.org/Specifications/OpenSearch/Extensions/Suggestions/1.1
		$apiResult->addArrayType( null, 'array' );
		$apiResult->addValue( null, 0, strval( $search ) );

		$terms = [];
		$descriptions = [];
		$urls = [];
		foreach ( $results as $row ) {
			$terms[] = $row['title']->getPrefixedText();
			$descriptions[] = strval( $row['extract'] );
			$urls[] = $row['url'];
		}

		$apiResult->addValue( null, 1, $terms );
		$apiResult->addValue( null, 2, $descriptions );
		$apiResult->addValue( null, 3, $urls );

		return;
	}

	if ( $format === 'xml' ) {
		// https://msdn.microsoft.com/en-us/library/cc891508(v=vs.85).aspx
		// Only these image attributes are copied into the output
		$imageKeys = array_fill_keys( [ 'source', 'alt', 'width', 'height', 'align' ], true );

		$items = [];
		foreach ( $results as $row ) {
			$item = [
				'Text' => $row['title']->getPrefixedText(),
				'Url' => $row['url'],
			];

			$extract = $row['extract'];
			if ( is_string( $extract ) && $extract !== '' ) {
				$item['Description'] = $extract;
			}

			// @phan-suppress-next-line PhanTypeArraySuspiciousNullable
			if ( is_array( $row['image'] ) && isset( $row['image']['source'] ) ) {
				$item['Image'] = array_intersect_key( $row['image'], $imageKeys );
			}

			ApiResult::setSubelementsList( $item, array_keys( $item ) );
			$items[] = $item;
		}
		ApiResult::setIndexedTagName( $items, 'Item' );

		$apiResult->addValue( null, 'version', '2.0' );
		$apiResult->addValue( null, 'xmlns', 'http://opensearch.org/searchsuggest2' );
		$apiResult->addValue( null, 'Query', strval( $search ) );
		$apiResult->addSubelementsList( null, 'Query' );
		$apiResult->addValue( null, 'Section', $items );

		return;
	}

	ApiBase::dieDebug( __METHOD__, "Unsupported format '{$this->getFormat()}'" );
}
|
||
|
||
/**
 * Get the parameters this module accepts.
 *
 * The list is built on the first call and cached. It is the set returned
 * by buildCommonApiParams() extended with the opensearch specific
 * parameters, with the default of 'limit' taken from the
 * OpenSearchDefaultLimit setting.
 *
 * @return array
 */
public function getAllowedParams() {
	if ( $this->allowedParams === null ) {
		$moduleParams = [
			'suggest' => false,
			'redirects' => [
				ApiBase::PARAM_TYPE => [ 'return', 'resolve' ],
			],
			'format' => [
				ApiBase::PARAM_DFLT => 'json',
				ApiBase::PARAM_TYPE => [ 'json', 'jsonfm', 'xml', 'xmlfm' ],
			],
			'warningsaserror' => false,
		];
		// Array union: entries from the common params win over same-named ones here
		$this->allowedParams = $this->buildCommonApiParams( false ) + $moduleParams;

		// Use open search specific default limit
		$this->allowedParams['limit'][ApiBase::PARAM_DFLT] =
			$this->getConfig()->get( 'OpenSearchDefaultLimit' );
	}

	return $this->allowedParams;
}
|
||
|
||
/**
 * Describe the search profile parameter of this module: a 'profile'
 * parameter of the completion profile type, using the help message of
 * the prefixsearch module.
 *
 * NOTE(review): presumably consumed by the SearchApi trait when it builds
 * the common parameters; confirm against the trait.
 *
 * @return array
 */
public function getSearchProfileParams() {
	$profile = [
		'profile-type' => SearchEngine::COMPLETION_PROFILE_TYPE,
		'help-message' => 'apihelp-query+prefixsearch-param-profile',
	];

	return [ 'profile' => $profile ];
}
|
||
|
||
/**
 * Get the usage examples for this module.
 *
 * @return string[] Example query string => message key describing it
 */
protected function getExamplesMessages() {
	$examples = [];
	$examples['action=opensearch&search=Te'] = 'apihelp-opensearch-example-te';

	return $examples;
}
|
||
|
||
/**
 * Get the URL of the on-wiki documentation for this module.
 *
 * @return string
 */
public function getHelpUrls() {
	$helpUrl = 'https://www.mediawiki.org/wiki/Special:MyLanguage/API:Opensearch';

	return $helpUrl;
}
|
||
|
||
/**
 * Trim an extract to a sensible length.
 *
 * Adapted from Extension:OpenSearchXml, which adapted it from
 * Extension:ActiveAbstract.
 *
 * The text is cut after the first sentence terminator found at or beyond
 * $length characters. When no such terminator exists on the first line
 * (for instance because the text is shorter than $length), the whole first
 * line is returned instead.
 *
 * @param string $text
 * @param int $length Target length; actual result will continue to the end of a sentence.
 * @return string
 */
public static function trimExtract( $text, $length ) {
	// Only the sentence terminator group is independent of $length, so it
	// is the only part that may be cached between calls. Caching the whole
	// pattern would make later calls reuse the first call's length.
	static $end = null;

	if ( $end === null ) {
		// The non-ASCII terminators are spelled as code point escapes so
		// the pattern does not depend on how this file is encoded or
		// normalised. A bare '.', '!' or '?' must not be used here:
		// '.' matches any character and a lone '?' does not compile.
		$endchars = [
			'([^\d])\.\s', '\!\s', '\?\s', // regular ASCII
			'\x{3002}', // full-width ideographic full-stop
			'\x{FF0E}', '\x{FF01}', '\x{FF1F}', // double-width roman forms of . ! ?
			'\x{FF61}', // half-width ideographic full stop
		];
		$end = '(?:' . implode( '|', $endchars ) . ')';
	}

	// A negative or non-numeric length would produce an invalid quantifier
	$minLength = max( 0, (int)$length );
	$regex = '/^(.{' . $minLength . ',}?' . $end . '+)/u';

	$matches = [];
	if ( preg_match( $regex, $text, $matches ) ) {
		return trim( $matches[1] );
	}

	// Just return the first line
	return trim( explode( "\n", $text )[0] );
}
|
||
|
||
/**
 * Fetch the template for a type.
 *
 * A configured OpenSearchTemplate is used as is for the JSON suggestions
 * type. Otherwise the template points at this wiki's api entry point and
 * restricts the search to the default search namespaces (or namespace 0
 * when that list is empty).
 *
 * @param string $type MIME type
 * @return string
 * @throws MWException When $type is not a known suggestions MIME type
 */
public static function getOpenSearchTemplate( $type ) {
	$searchConfig = MediaWikiServices::getInstance()->getSearchEngineConfig();

	$template = $searchConfig->getConfig()->get( 'OpenSearchTemplate' );
	$isJson = $type === 'application/x-suggestions+json';
	if ( $template && $isJson ) {
		return $template;
	}

	// An empty namespace list (and the lone namespace '0') both end up as '0'
	$ns = implode( '|', $searchConfig->defaultNamespaces() ) ?: '0';

	switch ( $type ) {
		case 'application/x-suggestions+json':
			$query = '?action=opensearch&search={searchTerms}&namespace=';
			break;

		case 'application/x-suggestions+xml':
			$query = '?action=opensearch&format=xml&search={searchTerms}&namespace=';
			break;

		default:
			throw new MWException( __METHOD__ . ": Unknown type '$type'" );
	}

	return $searchConfig->getConfig()->get( 'CanonicalServer' ) . wfScript( 'api' )
		. $query . $ns;
}
|
||
}
|