One of the big ones, so doing this alone. Bug: T166010 Change-Id: Ic2d59eb6764b1a273ed7162ecabf641f638b8f66
468 lines
14 KiB
PHP
468 lines
14 KiB
PHP
<?php
|
|
/**
|
|
* This program is free software; you can redistribute it and/or modify
|
|
* it under the terms of the GNU General Public License as published by
|
|
* the Free Software Foundation; either version 2 of the License, or
|
|
* (at your option) any later version.
|
|
*
|
|
* This program is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
* GNU General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU General Public License along
|
|
* with this program; if not, write to the Free Software Foundation, Inc.,
|
|
* 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
|
|
* http://www.gnu.org/copyleft/gpl.html
|
|
*
|
|
* @file
|
|
*/
|
|
namespace MediaWiki\Page;
|
|
|
|
use IBufferingStatsdDataFactory;
|
|
use InvalidArgumentException;
|
|
use MediaWiki\Logger\Spi as LoggerSpi;
|
|
use MediaWiki\Parser\ParserCacheFactory;
|
|
use MediaWiki\Parser\RevisionOutputCache;
|
|
use MediaWiki\Revision\RevisionLookup;
|
|
use MediaWiki\Revision\RevisionRecord;
|
|
use MediaWiki\Revision\RevisionRenderer;
|
|
use MediaWiki\Status\Status;
|
|
use MediaWiki\Title\TitleFormatter;
|
|
use ParserCache;
|
|
use ParserOptions;
|
|
use ParserOutput;
|
|
use PoolCounterWork;
|
|
use PoolWorkArticleView;
|
|
use PoolWorkArticleViewCurrent;
|
|
use PoolWorkArticleViewOld;
|
|
use Wikimedia\Assert\Assert;
|
|
use Wikimedia\Rdbms\ChronologyProtector;
|
|
use Wikimedia\Rdbms\ILBFactory;
|
|
|
|
/**
|
|
* Service for getting rendered output of a given page.
|
|
*
|
|
* This is a high level service, encapsulating concerns like caching
|
|
* and stampede protection via PoolCounter.
|
|
*
|
|
* @since 1.36
|
|
* @ingroup Page
|
|
*/
|
|
class ParserOutputAccess {
|
|
|
|
/**
|
|
* @var int Do not check the cache before parsing (force parse)
|
|
*/
|
|
public const OPT_NO_CHECK_CACHE = 1;
|
|
|
|
/** @var int Alias for NO_CHECK_CACHE */
|
|
public const OPT_FORCE_PARSE = self::OPT_NO_CHECK_CACHE;
|
|
|
|
/**
|
|
* @var int Do not update the cache after parsing.
|
|
*/
|
|
public const OPT_NO_UPDATE_CACHE = 2;
|
|
|
|
/**
|
|
* @var int Bypass audience check for deleted/suppressed revisions.
|
|
* The caller is responsible for ensuring that unauthorized access is prevented.
|
|
* If not set, output generation will fail if the revision is not public.
|
|
*/
|
|
public const OPT_NO_AUDIENCE_CHECK = 4;
|
|
|
|
/**
|
|
* @var int Do not check the cache before parsing,
|
|
* and do not update the cache after parsing (not cacheable).
|
|
*/
|
|
public const OPT_NO_CACHE = self::OPT_NO_UPDATE_CACHE | self::OPT_NO_CHECK_CACHE;
|
|
|
|
/**
|
|
* @var int Do perform an opportunistic LinksUpdate on cache miss
|
|
* @since 1.41
|
|
*/
|
|
public const OPT_LINKS_UPDATE = 8;
|
|
|
|
/** @var string Do not read or write any cache */
|
|
private const CACHE_NONE = 'none';
|
|
|
|
/** @var string Use primary cache */
|
|
private const CACHE_PRIMARY = 'primary';
|
|
|
|
/** @var string Use secondary cache */
|
|
private const CACHE_SECONDARY = 'secondary';
|
|
|
|
private ParserCacheFactory $parserCacheFactory;
|
|
|
|
/**
|
|
* In cases that an extension tries to get the same ParserOutput of
|
|
* the page right after it was parsed (T301310).
|
|
* @var ParserOutput[]
|
|
*/
|
|
private $localCache = [];
|
|
|
|
/** @var RevisionLookup */
|
|
private $revisionLookup;
|
|
|
|
/** @var RevisionRenderer */
|
|
private $revisionRenderer;
|
|
|
|
/** @var IBufferingStatsdDataFactory */
|
|
private $statsDataFactory;
|
|
|
|
/** @var ILBFactory */
|
|
private $lbFactory;
|
|
private ChronologyProtector $chronologyProtector;
|
|
|
|
/** @var LoggerSpi */
|
|
private $loggerSpi;
|
|
|
|
/** @var WikiPageFactory */
|
|
private $wikiPageFactory;
|
|
|
|
/** @var TitleFormatter */
|
|
private $titleFormatter;
|
|
|
|
/**
|
|
* @param ParserCacheFactory $parserCacheFactory
|
|
* @param RevisionLookup $revisionLookup
|
|
* @param RevisionRenderer $revisionRenderer
|
|
* @param IBufferingStatsdDataFactory $statsDataFactory
|
|
* @param ILBFactory $lbFactory
|
|
* @param ChronologyProtector $chronologyProtector
|
|
* @param LoggerSpi $loggerSpi
|
|
* @param WikiPageFactory $wikiPageFactory
|
|
* @param TitleFormatter $titleFormatter
|
|
*/
|
|
public function __construct(
|
|
ParserCacheFactory $parserCacheFactory,
|
|
RevisionLookup $revisionLookup,
|
|
RevisionRenderer $revisionRenderer,
|
|
IBufferingStatsdDataFactory $statsDataFactory,
|
|
ILBFactory $lbFactory,
|
|
ChronologyProtector $chronologyProtector,
|
|
LoggerSpi $loggerSpi,
|
|
WikiPageFactory $wikiPageFactory,
|
|
TitleFormatter $titleFormatter
|
|
) {
|
|
$this->parserCacheFactory = $parserCacheFactory;
|
|
$this->revisionLookup = $revisionLookup;
|
|
$this->revisionRenderer = $revisionRenderer;
|
|
$this->statsDataFactory = $statsDataFactory;
|
|
$this->lbFactory = $lbFactory;
|
|
$this->chronologyProtector = $chronologyProtector;
|
|
$this->loggerSpi = $loggerSpi;
|
|
$this->wikiPageFactory = $wikiPageFactory;
|
|
$this->titleFormatter = $titleFormatter;
|
|
}
|
|
|
|
/**
|
|
* Use a cache?
|
|
*
|
|
* @param PageRecord $page
|
|
* @param RevisionRecord|null $rev
|
|
*
|
|
* @return string One of the CACHE_XXX constants.
|
|
*/
|
|
private function shouldUseCache(
|
|
PageRecord $page,
|
|
?RevisionRecord $rev
|
|
) {
|
|
if ( $rev && !$rev->getId() ) {
|
|
// The revision isn't from the database, so the output can't safely be cached.
|
|
return self::CACHE_NONE;
|
|
}
|
|
|
|
// NOTE: Keep in sync with ParserWikiPage::shouldCheckParserCache().
|
|
// NOTE: when we allow caching of old revisions in the future,
|
|
// we must not allow caching of deleted revisions.
|
|
|
|
$wikiPage = $this->wikiPageFactory->newFromTitle( $page );
|
|
if ( !$page->exists() || !$wikiPage->getContentHandler()->isParserCacheSupported() ) {
|
|
return self::CACHE_NONE;
|
|
}
|
|
|
|
$isOld = $rev && $rev->getId() !== $page->getLatest();
|
|
if ( !$isOld ) {
|
|
return self::CACHE_PRIMARY;
|
|
}
|
|
|
|
if ( !$rev->audienceCan( RevisionRecord::DELETED_TEXT, RevisionRecord::FOR_PUBLIC ) ) {
|
|
// deleted/suppressed revision
|
|
return self::CACHE_NONE;
|
|
}
|
|
|
|
return self::CACHE_SECONDARY;
|
|
}
|
|
|
|
/**
|
|
* Returns the rendered output for the given page if it is present in the cache.
|
|
*
|
|
* @param PageRecord $page
|
|
* @param ParserOptions $parserOptions
|
|
* @param RevisionRecord|null $revision
|
|
* @param int $options Bitfield using the OPT_XXX constants
|
|
*
|
|
* @return ParserOutput|null
|
|
*/
|
|
public function getCachedParserOutput(
|
|
PageRecord $page,
|
|
ParserOptions $parserOptions,
|
|
?RevisionRecord $revision = null,
|
|
int $options = 0
|
|
): ?ParserOutput {
|
|
$isOld = $revision && $revision->getId() !== $page->getLatest();
|
|
$useCache = $this->shouldUseCache( $page, $revision );
|
|
$primaryCache = $this->getPrimaryCache( $parserOptions );
|
|
$classCacheKey = $primaryCache->makeParserOutputKey( $page, $parserOptions );
|
|
|
|
if ( $useCache === self::CACHE_PRIMARY ) {
|
|
if ( isset( $this->localCache[$classCacheKey] ) && !$isOld ) {
|
|
return $this->localCache[$classCacheKey];
|
|
}
|
|
$output = $primaryCache->get( $page, $parserOptions );
|
|
} elseif ( $useCache === self::CACHE_SECONDARY && $revision ) {
|
|
$secondaryCache = $this->getSecondaryCache( $parserOptions );
|
|
$output = $secondaryCache->get( $revision, $parserOptions );
|
|
} else {
|
|
$output = null;
|
|
}
|
|
|
|
if ( $output && !$isOld ) {
|
|
$this->localCache[$classCacheKey] = $output;
|
|
}
|
|
|
|
if ( $output ) {
|
|
$this->statsDataFactory->increment( "ParserOutputAccess.Cache.$useCache.hit" );
|
|
} else {
|
|
$this->statsDataFactory->increment( "ParserOutputAccess.Cache.$useCache.miss" );
|
|
}
|
|
|
|
return $output ?: null; // convert false to null
|
|
}
|
|
|
|
/**
|
|
* Returns the rendered output for the given page.
|
|
* Caching and concurrency control is applied.
|
|
*
|
|
* @param PageRecord $page
|
|
* @param ParserOptions $parserOptions
|
|
* @param RevisionRecord|null $revision
|
|
* @param int $options Bitfield using the OPT_XXX constants
|
|
*
|
|
* @return Status containing a ParserOutput if no error occurred.
|
|
* Well known errors and warnings include the following messages:
|
|
* - 'view-pool-dirty-output' (warning) The output is dirty (from a stale cache entry).
|
|
* - 'view-pool-contention' (warning) Dirty output was returned immediately instead of
|
|
* waiting to acquire a work lock (when "fast stale" mode is enabled in PoolCounter).
|
|
* - 'view-pool-timeout' (warning) Dirty output was returned after failing to acquire
|
|
* a work lock (got QUEUE_FULL or TIMEOUT from PoolCounter).
|
|
* - 'pool-queuefull' (error) unable to acquire work lock, and no cached content found.
|
|
* - 'pool-timeout' (error) unable to acquire work lock, and no cached content found.
|
|
* - 'pool-servererror' (error) PoolCounterWork failed due to a lock service error.
|
|
* - 'pool-unknownerror' (error) PoolCounterWork failed for an unknown reason.
|
|
* - 'nopagetext' (error) The page does not exist
|
|
*/
|
|
public function getParserOutput(
|
|
PageRecord $page,
|
|
ParserOptions $parserOptions,
|
|
?RevisionRecord $revision = null,
|
|
int $options = 0
|
|
): Status {
|
|
$error = $this->checkPreconditions( $page, $revision, $options );
|
|
if ( $error ) {
|
|
$this->statsDataFactory->increment( "ParserOutputAccess.Case.error" );
|
|
return $error;
|
|
}
|
|
|
|
$isOld = $revision && $revision->getId() !== $page->getLatest();
|
|
if ( $isOld ) {
|
|
$this->statsDataFactory->increment( 'ParserOutputAccess.Case.old' );
|
|
} else {
|
|
$this->statsDataFactory->increment( 'ParserOutputAccess.Case.current' );
|
|
}
|
|
|
|
if ( !( $options & self::OPT_NO_CHECK_CACHE ) ) {
|
|
$output = $this->getCachedParserOutput( $page, $parserOptions, $revision );
|
|
if ( $output ) {
|
|
return Status::newGood( $output );
|
|
}
|
|
}
|
|
|
|
if ( !$revision ) {
|
|
$revId = $page->getLatest();
|
|
$revision = $revId ? $this->revisionLookup->getRevisionById( $revId ) : null;
|
|
|
|
if ( !$revision ) {
|
|
$this->statsDataFactory->increment( "ParserOutputAccess.Status.norev" );
|
|
return Status::newFatal( 'missing-revision', $revId );
|
|
}
|
|
}
|
|
|
|
$work = $this->newPoolWorkArticleView( $page, $parserOptions, $revision, $options );
|
|
/** @var Status $status */
|
|
$status = $work->execute();
|
|
$output = $status->getValue();
|
|
Assert::postcondition( $output || !$status->isOK(), 'Worker returned invalid status' );
|
|
|
|
if ( $output && !$isOld ) {
|
|
$primaryCache = $this->getPrimaryCache( $parserOptions );
|
|
$classCacheKey = $primaryCache->makeParserOutputKey( $page, $parserOptions );
|
|
$this->localCache[$classCacheKey] = $output;
|
|
}
|
|
|
|
if ( $status->isGood() ) {
|
|
$this->statsDataFactory->increment( 'ParserOutputAccess.Status.good' );
|
|
} elseif ( $status->isOK() ) {
|
|
$this->statsDataFactory->increment( 'ParserOutputAccess.Status.ok' );
|
|
} else {
|
|
$this->statsDataFactory->increment( 'ParserOutputAccess.Status.error' );
|
|
}
|
|
|
|
return $status;
|
|
}
|
|
|
|
/**
|
|
* @param PageRecord $page
|
|
* @param RevisionRecord|null $revision
|
|
* @param int $options
|
|
*
|
|
* @return Status|null
|
|
*/
|
|
private function checkPreconditions(
|
|
PageRecord $page,
|
|
?RevisionRecord $revision = null,
|
|
int $options = 0
|
|
): ?Status {
|
|
if ( !$page->exists() ) {
|
|
return Status::newFatal( 'nopagetext' );
|
|
}
|
|
|
|
if ( !( $options & self::OPT_NO_UPDATE_CACHE ) && $revision && !$revision->getId() ) {
|
|
throw new InvalidArgumentException(
|
|
'The revision does not have a known ID. Use OPT_NO_CACHE.'
|
|
);
|
|
}
|
|
|
|
if ( $revision && $revision->getPageId() !== $page->getId() ) {
|
|
throw new InvalidArgumentException(
|
|
'The revision does not belong to the given page.'
|
|
);
|
|
}
|
|
|
|
if ( $revision && !( $options & self::OPT_NO_AUDIENCE_CHECK ) ) {
|
|
// NOTE: If per-user checks are desired, the caller should perform them and
|
|
// then set OPT_NO_AUDIENCE_CHECK if they passed.
|
|
if ( !$revision->audienceCan( RevisionRecord::DELETED_TEXT, RevisionRecord::FOR_PUBLIC ) ) {
|
|
return Status::newFatal(
|
|
'missing-revision-permission',
|
|
$revision->getId(),
|
|
$revision->getTimestamp(),
|
|
$this->titleFormatter->getPrefixedDBkey( $page )
|
|
);
|
|
}
|
|
}
|
|
|
|
return null;
|
|
}
|
|
|
|
/**
|
|
* @param PageRecord $page
|
|
* @param ParserOptions $parserOptions
|
|
* @param RevisionRecord $revision
|
|
* @param int $options
|
|
*
|
|
* @return PoolCounterWork
|
|
*/
|
|
private function newPoolWorkArticleView(
|
|
PageRecord $page,
|
|
ParserOptions $parserOptions,
|
|
RevisionRecord $revision,
|
|
int $options
|
|
): PoolCounterWork {
|
|
$useCache = $this->shouldUseCache( $page, $revision );
|
|
|
|
switch ( $useCache ) {
|
|
case self::CACHE_PRIMARY:
|
|
$this->statsDataFactory->increment( 'ParserOutputAccess.PoolWork.Current' );
|
|
$primaryCache = $this->getPrimaryCache( $parserOptions );
|
|
$parserCacheMetadata = $primaryCache->getMetadata( $page );
|
|
$cacheKey = $primaryCache->makeParserOutputKey( $page, $parserOptions,
|
|
$parserCacheMetadata ? $parserCacheMetadata->getUsedOptions() : null
|
|
);
|
|
|
|
$workKey = $cacheKey . ':revid:' . $revision->getId();
|
|
|
|
return new PoolWorkArticleViewCurrent(
|
|
$workKey,
|
|
$page,
|
|
$revision,
|
|
$parserOptions,
|
|
$this->revisionRenderer,
|
|
$primaryCache,
|
|
$this->lbFactory,
|
|
$this->chronologyProtector,
|
|
$this->loggerSpi,
|
|
$this->wikiPageFactory,
|
|
!( $options & self::OPT_NO_UPDATE_CACHE ),
|
|
(bool)( $options & self::OPT_LINKS_UPDATE )
|
|
);
|
|
|
|
case self::CACHE_SECONDARY:
|
|
$this->statsDataFactory->increment( 'ParserOutputAccess.PoolWork.Old' );
|
|
$secondaryCache = $this->getSecondaryCache( $parserOptions );
|
|
$workKey = $secondaryCache->makeParserOutputKey( $revision, $parserOptions );
|
|
return new PoolWorkArticleViewOld(
|
|
$workKey,
|
|
$secondaryCache,
|
|
$revision,
|
|
$parserOptions,
|
|
$this->revisionRenderer,
|
|
$this->loggerSpi
|
|
);
|
|
|
|
default:
|
|
$this->statsDataFactory->increment( 'ParserOutputAccess.PoolWork.Uncached' );
|
|
$secondaryCache = $this->getSecondaryCache( $parserOptions );
|
|
$workKey = $secondaryCache->makeParserOutputKeyOptionalRevId( $revision, $parserOptions );
|
|
return new PoolWorkArticleView(
|
|
$workKey,
|
|
$revision,
|
|
$parserOptions,
|
|
$this->revisionRenderer,
|
|
$this->loggerSpi
|
|
);
|
|
}
|
|
|
|
// unreachable
|
|
}
|
|
|
|
private function getPrimaryCache( ParserOptions $pOpts ): ParserCache {
|
|
if ( $pOpts->getUseParsoid() ) {
|
|
// T331148: This is different from
|
|
// ParsoidOutputAccess::PARSOID_PARSER_CACHE_NAME; will be
|
|
// renamed once the contents cached on the read-views and
|
|
// the REST path are identical.
|
|
return $this->parserCacheFactory->getParserCache(
|
|
'parsoid-' . ParserCacheFactory::DEFAULT_NAME
|
|
);
|
|
}
|
|
|
|
return $this->parserCacheFactory->getParserCache(
|
|
ParserCacheFactory::DEFAULT_NAME
|
|
);
|
|
}
|
|
|
|
private function getSecondaryCache( ParserOptions $pOpts ): RevisionOutputCache {
|
|
if ( $pOpts->getUseParsoid() ) {
|
|
return $this->parserCacheFactory->getRevisionOutputCache(
|
|
'parsoid-' . ParserCacheFactory::DEFAULT_RCACHE_NAME
|
|
);
|
|
}
|
|
|
|
return $this->parserCacheFactory->getRevisionOutputCache(
|
|
ParserCacheFactory::DEFAULT_RCACHE_NAME
|
|
);
|
|
}
|
|
|
|
}
|