This patch introduces a ParsoidOutputAccess service for retrieving Parsoid output and warms the cache with pregenerated output. It also adds a configuration variable to ParsoidCacheConfig that controls the cache warming and is turned off by default. Bug: T301371 Change-Id: I6152c42ea765d94093d8d62598b1b4278314adec
148 lines
4.1 KiB
PHP
148 lines
4.1 KiB
PHP
<?php
|
|
|
|
namespace MediaWiki\Rest\Handler;
|
|
|
|
use Config;
|
|
use IBufferingStatsdDataFactory;
|
|
use LogicException;
|
|
use MediaWiki\Edit\ParsoidOutputStash;
|
|
use MediaWiki\MediaWikiServices;
|
|
use MediaWiki\Page\PageLookup;
|
|
use MediaWiki\Parser\Parsoid\ParsoidOutputAccess;
|
|
use MediaWiki\Rest\LocalizedHttpException;
|
|
use MediaWiki\Rest\Response;
|
|
use MediaWiki\Rest\SimpleHandler;
|
|
use MediaWiki\Rest\StringStream;
|
|
use MediaWiki\Revision\RevisionLookup;
|
|
use TitleFormatter;
|
|
use Wikimedia\Assert\Assert;
|
|
|
|
/**
 * REST handler that serves Parsoid HTML for a page. It backs the following routes:
 * - /page/{title}/html,
 * - /page/{title}/with_html
 *
 * The 'format' entry of the handler configuration returned by getConfig()
 * selects which of the two output modes ('html' or 'with_html') run() produces.
 *
 * @package MediaWiki\Rest\Handler
 */
class PageHTMLHandler extends SimpleHandler {

	/** @var ParsoidHTMLHelper Supplies the HTML, ETag and last-modified value */
	private $htmlHelper;

	/** @var PageContentHelper Supplies the page, access checks, metadata and cache control */
	private $contentHelper;

	/**
	 * Builds the two helpers this handler delegates to.
	 *
	 * @param Config $config
	 * @param RevisionLookup $revisionLookup
	 * @param TitleFormatter $titleFormatter
	 * @param PageLookup $pageLookup
	 * @param ParsoidOutputStash $parsoidOutputStash
	 * @param IBufferingStatsdDataFactory $statsDataFactory
	 * @param ParsoidOutputAccess $parsoidOutputAccess
	 */
	public function __construct(
		Config $config,
		RevisionLookup $revisionLookup,
		TitleFormatter $titleFormatter,
		PageLookup $pageLookup,
		ParsoidOutputStash $parsoidOutputStash,
		IBufferingStatsdDataFactory $statsDataFactory,
		ParsoidOutputAccess $parsoidOutputAccess
	) {
		$this->contentHelper = new PageContentHelper(
			$config, $revisionLookup, $titleFormatter, $pageLookup
		);
		$this->htmlHelper = new ParsoidHTMLHelper(
			$parsoidOutputStash, $statsDataFactory, $parsoidOutputAccess
		);
	}

	/**
	 * Initializes both helpers with the validated request parameters.
	 *
	 * The HTML helper is only initialized when the content helper reports a
	 * page; otherwise it is left untouched.
	 */
	protected function postValidationSetup() {
		// TODO: Once Authority supports rate limit (T310476), just inject the Authority.
		$userFactory = MediaWikiServices::getInstance()->getUserFactory();
		$user = $userFactory->newFromUserIdentity( $this->getAuthority()->getUser() );
		$params = $this->getValidatedParams();

		$this->contentHelper->init( $user, $params );

		$page = $this->contentHelper->getPage();
		if ( !$page ) {
			return;
		}

		$this->htmlHelper->init( $page, $params, $user );
	}

	/**
	 * Produces the response for the configured output mode:
	 * - 'html': a text/html response whose body is the Parsoid HTML;
	 * - 'with_html': a JSON response holding the page metadata plus an 'html' field.
	 *
	 * In both modes the cache control is derived from the parser output's cache expiry.
	 *
	 * @return Response
	 * @throws LocalizedHttpException
	 * @throws LogicException If the configured output mode is neither 'html' nor 'with_html'
	 */
	public function run(): Response {
		$this->contentHelper->checkAccess();

		// Since checkAccess() did not throw, getPage() should not return null here.
		$page = $this->contentHelper->getPage();
		Assert::invariant( $page !== null, 'Page should be known' );

		$parserOutput = $this->htmlHelper->getHtml();
		// Do not de-duplicate styles, Parsoid already does it in a slightly different way (T300325)
		$html = $parserOutput->getText( [ 'deduplicateStyles' => false ] );

		$outputMode = $this->getOutputMode();
		if ( $outputMode === 'html' ) {
			$response = $this->getResponseFactory()->create();
			// TODO: need to respect content-type returned by Parsoid.
			$response->setHeader( 'Content-Type', 'text/html' );
			$response->setBody( new StringStream( $html ) );
		} elseif ( $outputMode === 'with_html' ) {
			$body = $this->contentHelper->constructMetadata();
			$body['html'] = $html;
			$response = $this->getResponseFactory()->createJson( $body );
		} else {
			throw new LogicException( "Unknown HTML type $outputMode" );
		}

		// Shared by both output modes.
		$this->contentHelper->setCacheControl( $response, $parserOutput->getCacheExpiry() );

		return $response;
	}

	/**
	 * Returns an ETag representing a page's source, or null when the content
	 * helper reports the page as not accessible.
	 *
	 * The ETag assumes a page's source has changed if the latest revision of
	 * the page has been made private, is un-readable for another reason, or a
	 * newer revision exists.
	 *
	 * @return string|null
	 */
	protected function getETag(): ?string {
		if ( $this->contentHelper->isAccessible() ) {
			// Vary eTag based on output mode
			return $this->htmlHelper->getETag( $this->getOutputMode() );
		}

		return null;
	}

	/**
	 * Returns the HTML helper's last-modified value, or null when the content
	 * helper reports the page as not accessible.
	 *
	 * @return string|null
	 */
	protected function getLastModified(): ?string {
		return $this->contentHelper->isAccessible()
			? $this->htmlHelper->getLastModified()
			: null;
	}

	/**
	 * Reads the output mode from the 'format' entry of the handler configuration.
	 *
	 * @return string
	 */
	private function getOutputMode(): string {
		$handlerConfig = $this->getConfig();

		return $handlerConfig['format'];
	}

	/**
	 * This handler declares that it does not need write access.
	 *
	 * @return bool Always false
	 */
	public function needsWriteAccess(): bool {
		return false;
	}

	/**
	 * Combines the parameter settings declared by both helpers.
	 *
	 * @return array
	 */
	public function getParamSettings(): array {
		$contentSettings = $this->contentHelper->getParamSettings();
		$htmlSettings = $this->htmlHelper->getParamSettings();

		// For duplicate string keys, array_merge() keeps the later (HTML helper) entry.
		return array_merge( $contentSettings, $htmlSettings );
	}
}
|