wiki.techinc.nl/includes/api/ApiQueryExtLinksUsage.php
Aryeh Gregor 7b4b0135b9 Use str_starts_with/str_ends_with
All the other ways of doing it were ridiculous and much harder to read,
and usually required repeating the needle expression (to get its
length). I found these occurrences by grepping for various expressions,
but I undoubtedly missed some.

I didn't try replacing the many instances of strpos(...) === 0 with
str_starts_with(...), because I think they're readable enough as-is
(although less efficient). Likewise I didn't try porting strpos(...) !==
false to str_contains(...). For case-insensitive comparisons, Tim
Starling requested that we stick with substr_compare() because it's more
efficient than calling strtolower().

On PHP < 8 these functions will be included with a polyfill via
vendor/autoload.php. This is included at the beginning of
includes/AutoLoader.php, so if our autoloader has been included the
polyfill will be available. This means it should be safe to call these
functions from any code that would not be usable without our autoloader.

Three uses that Tim Starling identified as being performance-sensitive
have been split out to a separate commit for porting after the switch to
PHP 8.

Change-Id: I113a8d052b6845852c15969a2f0e6fbbe3e9f8d9
2022-05-02 10:59:58 +03:00

296 lines
7.8 KiB
PHP

<?php
/**
* Copyright © 2006 Yuri Astrakhan "<Firstname><Lastname>@gmail.com"
*
* This program is free software; you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation; either version 2 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License along
* with this program; if not, write to the Free Software Foundation, Inc.,
* 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
* http://www.gnu.org/copyleft/gpl.html
*
* @file
*/
use MediaWiki\MainConfigNames;
use MediaWiki\MediaWikiServices;
/**
* @ingroup API
*/
class ApiQueryExtLinksUsage extends ApiQueryGeneratorBase {
/**
* Set up the module, passing 'eu' to the parent constructor as its third
* argument (the example request in getExamplesMessages() uses the
* matching 'euquery' parameter name).
*
* @param ApiQuery $query
* @param string $moduleName
*/
public function __construct( ApiQuery $query, $moduleName ) {
parent::__construct( $query, $moduleName, 'eu' );
}
/**
* Run the module without a page set, so that run() adds the matching rows
* directly to the API result.
*/
public function execute() {
$this->run();
}
/**
* Report the cache mode for this module.
*
* @param mixed $params Not used by this implementation
* @return string Always 'public'
*/
public function getCacheMode( $params ) {
return 'public';
}
/**
* Run the module as a generator: run() hands each matching row to the
* given page set instead of adding it to the API result.
*
* @param ApiPageSet $resultPageSet Page set that receives the rows
*/
public function executeGenerator( $resultPageSet ) {
$this->run( $resultPageSet );
}
/**
* Build and run the externallinks query shared by list mode and generator mode.
*
* When $resultPageSet is null, each matching row is added to the API result
* under [ 'query', <module name> ]; otherwise each row is handed to the page
* set via processDbRow(). One row more than the requested limit is fetched so
* that a continuation value can be set when more results exist.
*
* @param ApiPageSet|null $resultPageSet Page set to fill in generator mode, or
* null to output the results directly
* @return void
*/
private function run( $resultPageSet = null ) {
$params = $this->extractRequestParams();
$db = $this->getDB();
$query = $params['query'];
// May be null; see getProtocolPrefix() for the cases where no prefix is returned
$protocol = self::getProtocolPrefix( $params['protocol'] );
$this->addTables( [ 'externallinks', 'page' ] );
$this->addJoinConds( [ 'page' => [ 'JOIN', 'page_id=el_from' ] ] );
// In miser mode the namespace filter is not added to the SQL; rows are
// filtered in PHP inside the result loop below instead. Skipped rows still
// count towards the limit, so fewer than 'limit' results may be returned.
$miser_ns = [];
if ( $this->getConfig()->get( MainConfigNames::MiserMode ) ) {
$miser_ns = $params['namespace'] ?: [];
} else {
$this->addWhereFld( 'page_namespace', $params['namespace'] );
}
// Fields to sort by; the same list defines the layout of the continue value
$orderBy = [];
if ( $query !== null && $query !== '' ) {
// A search string was given: default to http:// when no protocol was resolved
if ( $protocol === null ) {
$protocol = 'http://';
}
// Normalize query to match the normalization applied for the externallinks table
$query = Parser::normalizeLinkUrl( $protocol . $query );
$conds = LinkFilter::getQueryConditions( $query, [
'protocol' => '',
'oneWildcard' => true,
'db' => $db
] );
if ( !$conds ) {
$this->dieWithError( 'apierror-badquery' );
}
$this->addWhere( $conds );
// NOTE(review): presumably the 'el_index_60' key is only set when the
// conditions pin that column to a single value, making it redundant as a
// sort key — confirm against LinkFilter::getQueryConditions()
if ( !isset( $conds['el_index_60'] ) ) {
$orderBy[] = 'el_index_60';
}
} else {
// No search string: list links, optionally restricted to one protocol prefix
$orderBy[] = 'el_index_60';
if ( $protocol !== null ) {
$this->addWhere( 'el_index_60' . $db->buildLike( "$protocol", $db->anyString() ) );
} else {
// We're querying all protocols, filter out duplicate protocol-relative links
$this->addWhere( $db->makeList( [
'el_to NOT' . $db->buildLike( '//', $db->anyString() ),
'el_index_60 ' . $db->buildLike( 'http://', $db->anyString() ),
], LIST_OR ) );
}
}
// el_id is always the last sort key
$orderBy[] = 'el_id';
$this->addOption( 'ORDER BY', $orderBy );
$this->addFields( $orderBy ); // Make sure the sort fields are selected; setContinue() reads them from the row
// Turn the requested properties into a lookup map
$prop = array_fill_keys( $params['prop'], true );
$fld_ids = isset( $prop['ids'] );
$fld_title = isset( $prop['title'] );
$fld_url = isset( $prop['url'] );
if ( $resultPageSet === null ) {
$this->addFields( [
'page_id',
'page_namespace',
'page_title'
] );
$this->addFieldsIf( 'el_to', $fld_url );
} else {
// Generator mode: select whatever fields the page set asks for
$this->addFields( $resultPageSet->getPageTableFields() );
}
$limit = $params['limit'];
// Fetch one extra row to detect whether there are more results
$this->addOption( 'LIMIT', $limit + 1 );
// T244254: Avoid MariaDB deciding to scan all of `page`.
$this->addOption( 'STRAIGHT_JOIN' );
if ( $params['continue'] !== null ) {
// The continue value holds one '|'-separated component per ORDER BY
// field, in the same order (it is produced by setContinue())
$cont = explode( '|', $params['continue'] );
$this->dieContinueUsageIf( count( $cont ) !== count( $orderBy ) );
// Build the "resume at or after this row" condition starting from the
// last sort field (>=) and wrapping it with each earlier field:
// (f > v OR (f = v AND <inner condition>))
$i = count( $cont ) - 1;
$cond = $orderBy[$i] . ' >= ' . $db->addQuotes( rawurldecode( $cont[$i] ) );
while ( $i-- > 0 ) {
$field = $orderBy[$i];
$v = $db->addQuotes( rawurldecode( $cont[$i] ) );
$cond = "($field > $v OR ($field = $v AND $cond))";
}
$this->addWhere( $cond );
}
$res = $this->select( __METHOD__ );
$result = $this->getResult();
if ( $resultPageSet === null ) {
$this->executeGenderCacheFromResultWrapper( $res, __METHOD__ );
}
$count = 0;
foreach ( $res as $row ) {
if ( ++$count > $limit ) {
// We've reached the one extra which shows that there are
// additional pages to be had. Stop here...
$this->setContinue( $orderBy, $row );
break;
}
// Miser-mode namespace filter (empty $miser_ns means no filtering)
if ( count( $miser_ns ) && !in_array( $row->page_namespace, $miser_ns ) ) {
continue;
}
if ( $resultPageSet === null ) {
$vals = [
ApiResult::META_TYPE => 'assoc',
];
if ( $fld_ids ) {
$vals['pageid'] = (int)$row->page_id;
}
if ( $fld_title ) {
$title = Title::makeTitle( $row->page_namespace, $row->page_title );
ApiQueryBase::addTitleInfo( $vals, $title );
}
if ( $fld_url ) {
$to = $row->el_to;
// expand protocol-relative urls
if ( $params['expandurl'] ) {
$to = wfExpandUrl( $to, PROTO_CANONICAL );
}
$vals['url'] = $to;
}
$fit = $result->addValue( [ 'query', $this->getModuleName() ], null, $vals );
if ( !$fit ) {
// The value could not be added: continue from this row next time and stop
$this->setContinue( $orderBy, $row );
break;
}
} else {
$resultPageSet->processDbRow( $row );
}
}
if ( $resultPageSet === null ) {
$result->addIndexedTagName( [ 'query', $this->getModuleName() ],
$this->getModulePrefix() );
}
}
/**
 * Set the 'continue' parameter from the sort-key values of a result row.
 *
 * The value of each ORDER BY field is read from the row, '%' and '|' are
 * percent-escaped so that the values can be joined with '|', and the
 * joined string is stored as the continuation value.
 *
 * @param string[] $orderBy Names of the ORDER BY fields, in sort order
 * @param stdClass $row Result row that the next request should resume from
 */
private function setContinue( $orderBy, $row ) {
	// '|' is the separator, and '%' must be escaped so decoding is unambiguous
	$escapes = [ '%' => '%25', '|' => '%7C' ];
	$parts = array_map(
		static function ( $column ) use ( $row, $escapes ) {
			return strtr( $row->$column, $escapes );
		},
		$orderBy
	);
	$this->setContinueEnumParameter( 'continue', implode( '|', $parts ) );
}
/**
 * Describe the parameters accepted by this module.
 *
 * In miser mode an extra help message is appended to the 'namespace'
 * parameter description.
 *
 * @return array Parameter definitions keyed by parameter name
 */
public function getAllowedParams() {
	$namespaceParam = [
		ApiBase::PARAM_ISMULTI => true,
		ApiBase::PARAM_TYPE => 'namespace'
	];
	if ( $this->getConfig()->get( MainConfigNames::MiserMode ) ) {
		$namespaceParam[ApiBase::PARAM_HELP_MSG_APPEND] = [
			'api-help-param-limited-in-miser-mode',
		];
	}

	$propParam = [
		ApiBase::PARAM_ISMULTI => true,
		ApiBase::PARAM_DFLT => 'ids|title|url',
		ApiBase::PARAM_TYPE => [ 'ids', 'title', 'url' ],
		ApiBase::PARAM_HELP_MSG_PER_VALUE => [],
	];

	$limitParam = [
		ApiBase::PARAM_DFLT => 10,
		ApiBase::PARAM_TYPE => 'limit',
		ApiBase::PARAM_MIN => 1,
		ApiBase::PARAM_MAX => ApiBase::LIMIT_BIG1,
		ApiBase::PARAM_MAX2 => ApiBase::LIMIT_BIG2
	];

	// The key order below is the order in which the parameters are declared
	return [
		'prop' => $propParam,
		'continue' => [
			ApiBase::PARAM_HELP_MSG => 'api-help-param-continue',
		],
		'protocol' => [
			ApiBase::PARAM_TYPE => self::prepareProtocols(),
			ApiBase::PARAM_DFLT => '',
		],
		'query' => null,
		'namespace' => $namespaceParam,
		'limit' => $limitParam,
		'expandurl' => false,
	];
}
/**
 * Build the list of values offered for the 'protocol' parameter.
 *
 * The list starts with the empty string, followed by the part before the
 * first ':' of every configured URL protocol except the
 * protocol-relative '//'.
 *
 * @return string[]
 */
public static function prepareProtocols() {
	$config = MediaWikiServices::getInstance()->getMainConfig();
	$configured = $config->get( MainConfigNames::UrlProtocols );

	$names = [ '' ];
	foreach ( $configured as $prefix ) {
		if ( $prefix === '//' ) {
			// Protocol-relative links have no protocol name to offer
			continue;
		}
		$colonPos = strpos( $prefix, ':' );
		$names[] = substr( $prefix, 0, $colonPos );
	}
	return $names;
}
/**
 * Resolve a bare protocol name (as offered by prepareProtocols()) to the
 * matching entry of the UrlProtocols configuration, e.g. 'http' to
 * 'http://' when that prefix is configured.
 *
 * An entry whose scheme is exactly the given name (i.e. the entry starts
 * with "$protocol:") is preferred, so that the result does not depend on
 * the order of the configured protocols: 'http' must not resolve to
 * 'https://' merely because the latter happens to be listed first. If no
 * such entry exists, the first entry starting with the given string is
 * used, as before.
 *
 * @param string|null $protocol Protocol name, or an empty value for none
 * @return string|null The configured prefix; the input unchanged if no
 *  configured protocol starts with it; or null if the input is empty or is
 *  itself one of the configured protocol strings
 */
public static function getProtocolPrefix( $protocol ) {
	// Find the right prefix
	$urlProtocols = MediaWikiServices::getInstance()->getMainConfig()
		->get( MainConfigNames::UrlProtocols );
	if ( !$protocol || in_array( $protocol, $urlProtocols ) ) {
		return null;
	}

	// First pass: exact scheme match, independent of configuration order
	$scheme = $protocol . ':';
	foreach ( $urlProtocols as $p ) {
		if ( str_starts_with( $p, $scheme ) ) {
			return $p;
		}
	}

	// Second pass: plain prefix match, kept for backward compatibility
	foreach ( $urlProtocols as $p ) {
		if ( str_starts_with( $p, $protocol ) ) {
			return $p;
		}
	}

	// Nothing matched; hand the value back unchanged
	return $protocol;
}
/**
* Provide the usage example for this module.
*
* @return string[] Map of example request query string to the key of the
* message describing it (presumably an i18n message key — confirm against ApiBase)
*/
protected function getExamplesMessages() {
return [
'action=query&list=exturlusage&euquery=www.mediawiki.org'
=> 'apihelp-query+exturlusage-example-simple',
];
}
/**
* Provide the URL of the on-wiki documentation page for this module.
*
* @return string
*/
public function getHelpUrls() {
return 'https://www.mediawiki.org/wiki/Special:MyLanguage/API:Exturlusage';
}
}