mirror of
https://gerrit.wikimedia.org/r/mediawiki/extensions/VisualEditor
synced 2025-01-22 10:34:26 +00:00
10cb01cdd1
We're trying to avoid passing raw strings around, since they can be ambiguous specifiers of language. This patch makes VE compatible with I982e0df706a633b05dcc02b5220b737c19adc401, with a backward compatibility workaround which can be removed after I982e0df706a633b05dcc02b5220b737c19adc401 merges. The new code also uses slightly more methods of the Language object, which need to be mocked in a unit test. Change-Id: I830867d58f8962d6a57be16ce3735e8384f9ac1c
300 lines
7.9 KiB
PHP
300 lines
7.9 KiB
PHP
<?php
|
|
/**
|
|
* Helper functions for using the REST interface to Parsoid.
|
|
*
|
|
* @file
|
|
* @ingroup Extensions
|
|
* @copyright 2022 VisualEditor Team and others; see AUTHORS.txt
|
|
* @license MIT
|
|
*/
|
|
|
|
namespace MediaWiki\Extension\VisualEditor;
|
|
|
|
use Exception;
|
|
use Language;
|
|
use LocalizedException;
|
|
use MediaWiki\Page\PageIdentity;
|
|
use MediaWiki\Parser\Parsoid\ParsoidRenderID;
|
|
use MediaWiki\Permissions\Authority;
|
|
use MediaWiki\Rest\Handler\Helper\HtmlInputTransformHelper;
|
|
use MediaWiki\Rest\Handler\Helper\HtmlOutputRendererHelper;
|
|
use MediaWiki\Rest\Handler\Helper\PageRestHelperFactory;
|
|
use MediaWiki\Rest\HttpException;
|
|
use MediaWiki\Rest\LocalizedHttpException;
|
|
use MediaWiki\Revision\MutableRevisionRecord;
|
|
use MediaWiki\Revision\RevisionRecord;
|
|
use MediaWiki\Revision\SlotRecord;
|
|
use RawMessage;
|
|
use User;
|
|
use Wikimedia\Bcp47Code\Bcp47CodeValue;
|
|
use WikitextContent;
|
|
|
|
class DirectParsoidClient implements ParsoidClient {
|
|
|
|
/**
|
|
* Requested Parsoid HTML version.
|
|
* Keep this in sync with the Accept: header in
|
|
* ve.init.mw.ArticleTargetLoader.js
|
|
*/
|
|
public const PARSOID_VERSION = '2.6.0';
|
|
|
|
private const FLAVOR_DEFAULT = 'view';
|
|
|
|
/** @var PageRestHelperFactory */
|
|
private $helperFactory;
|
|
|
|
/** @var Authority */
|
|
private $performer;
|
|
|
|
/**
|
|
* @param PageRestHelperFactory $helperFactory
|
|
* @param Authority $performer
|
|
*/
|
|
public function __construct(
|
|
PageRestHelperFactory $helperFactory,
|
|
Authority $performer
|
|
) {
|
|
$this->performer = $performer;
|
|
$this->helperFactory = $helperFactory;
|
|
}
|
|
|
|
/**
|
|
* @param PageIdentity $page
|
|
* @param RevisionRecord|null $revision
|
|
* @param Language|null $pageLanguage
|
|
* @param bool $stash
|
|
* @param string $flavor
|
|
*
|
|
* @return HtmlOutputRendererHelper
|
|
*/
|
|
private function getHtmlOutputRendererHelper(
|
|
PageIdentity $page,
|
|
?RevisionRecord $revision = null,
|
|
Language $pageLanguage = null,
|
|
bool $stash = false,
|
|
string $flavor = self::FLAVOR_DEFAULT
|
|
): HtmlOutputRendererHelper {
|
|
$helper = $this->helperFactory->newHtmlOutputRendererHelper();
|
|
|
|
// TODO: remove this once we no longer need a User object for rate limiting (T310476).
|
|
if ( $this->performer instanceof User ) {
|
|
$user = $this->performer;
|
|
} else {
|
|
$user = User::newFromIdentity( $this->performer->getUser() );
|
|
}
|
|
|
|
$helper->init( $page, [], $user, $revision );
|
|
|
|
$helper->setStashingEnabled( $stash );
|
|
$helper->setFlavor( $flavor );
|
|
|
|
if ( $revision ) {
|
|
$helper->setRevision( $revision );
|
|
}
|
|
|
|
if ( $pageLanguage ) {
|
|
$helper->setPageLanguage( $pageLanguage );
|
|
}
|
|
|
|
return $helper;
|
|
}
|
|
|
|
/**
|
|
* @param PageIdentity $page
|
|
* @param string $html
|
|
* @param int|null $oldid
|
|
* @param string|null $etag
|
|
* @param Language|null $pageLanguage
|
|
*
|
|
* @return HtmlInputTransformHelper
|
|
*/
|
|
private function getHtmlInputTransformHelper(
|
|
PageIdentity $page,
|
|
string $html,
|
|
int $oldid = null,
|
|
string $etag = null,
|
|
Language $pageLanguage = null
|
|
): HtmlInputTransformHelper {
|
|
$helper = $this->helperFactory->newHtmlInputTransformHelper();
|
|
|
|
// Fake REST body
|
|
$body = [
|
|
'html' => [
|
|
'body' => $html,
|
|
]
|
|
];
|
|
|
|
$renderId = $etag ? ParsoidRenderID::newFromETag( $etag ) : null;
|
|
|
|
$helper->init( $page, $body, [], null, $pageLanguage );
|
|
|
|
if ( $oldid || $renderId ) {
|
|
$helper->setOriginal( $oldid, $renderId );
|
|
}
|
|
|
|
return $helper;
|
|
}
|
|
|
|
/**
|
|
* Request page HTML from Parsoid.
|
|
*
|
|
* @param RevisionRecord $revision Page revision
|
|
* @param ?Language $targetLanguage Page language (default: `null`)
|
|
*
|
|
* @return array An array mimicking a RESTbase server's response,
|
|
* with keys: 'error', 'headers' and 'body'
|
|
*/
|
|
public function getPageHtml( RevisionRecord $revision, ?Language $targetLanguage = null ): array {
|
|
// In the VE client, we always want to stash.
|
|
$page = $revision->getPage();
|
|
|
|
try {
|
|
$helper = $this->getHtmlOutputRendererHelper( $page, $revision, $targetLanguage, true );
|
|
$parserOutput = $helper->getHtml();
|
|
|
|
return $this->fakeRESTbaseHTMLResponse( $parserOutput->getRawText(), $helper );
|
|
} catch ( HttpException $ex ) {
|
|
return $this->fakeRESTbaseError( $ex );
|
|
}
|
|
}
|
|
|
|
/**
|
|
* @param PageIdentity $page
|
|
* @param string $wikitext
|
|
*
|
|
* @return RevisionRecord
|
|
*/
|
|
private function makeFakeRevision(
|
|
PageIdentity $page,
|
|
string $wikitext
|
|
): RevisionRecord {
|
|
$rev = new MutableRevisionRecord( $page );
|
|
$rev->setId( 0 );
|
|
$rev->setPageId( $page->getId() );
|
|
|
|
$rev->setContent( SlotRecord::MAIN, new WikitextContent( $wikitext ) );
|
|
|
|
return $rev;
|
|
}
|
|
|
|
/**
|
|
* Transform wikitext to HTML with Parsoid. Wrapper for ::postData().
|
|
*
|
|
* @param PageIdentity $page The page the content belongs to use as the parsing context
|
|
* @param Language $targetLanguage Page language
|
|
* @param string $wikitext The wikitext fragment to parse
|
|
* @param bool $bodyOnly Whether to provide only the contents of the `<body>` tag
|
|
* @param int|null $oldid What oldid revision, if any, to base the request from (default: `null`)
|
|
* @param bool $stash Whether to stash the result in the server-side cache (default: `false`)
|
|
*
|
|
* @return array An array mimicking a RESTbase server's response,
|
|
* with keys 'code', 'reason', 'headers' and 'body'
|
|
*/
|
|
public function transformWikitext(
|
|
PageIdentity $page,
|
|
Language $targetLanguage,
|
|
string $wikitext,
|
|
bool $bodyOnly,
|
|
?int $oldid,
|
|
bool $stash
|
|
): array {
|
|
$revision = $this->makeFakeRevision( $page, $wikitext );
|
|
|
|
try {
|
|
$helper = $this->getHtmlOutputRendererHelper( $page, $revision, $targetLanguage, $stash );
|
|
|
|
if ( $bodyOnly ) {
|
|
$helper->setFlavor( 'fragment' );
|
|
}
|
|
|
|
$parserOutput = $helper->getHtml();
|
|
$html = $parserOutput->getRawText();
|
|
|
|
return $this->fakeRESTbaseHTMLResponse( $html, $helper );
|
|
} catch ( HttpException $ex ) {
|
|
return $this->fakeRESTbaseError( $ex );
|
|
}
|
|
}
|
|
|
|
/**
|
|
* Transform HTML to wikitext with Parsoid
|
|
*
|
|
* @param PageIdentity $page The page the content belongs to
|
|
* @param Language $targetLanguage The desired output language
|
|
* @param string $html The HTML of the page to be transformed
|
|
* @param ?int $oldid What oldid revision, if any, to base the request from (default: `null`)
|
|
* @param ?string $etag The ETag to set in the HTTP request header
|
|
*
|
|
* @return array The response, 'code', 'reason', 'headers' and 'body'
|
|
*/
|
|
public function transformHTML(
|
|
PageIdentity $page, Language $targetLanguage, string $html, ?int $oldid, ?string $etag
|
|
): array {
|
|
try {
|
|
$helper = $this->getHtmlInputTransformHelper( $page, $html, $oldid, $etag, $targetLanguage );
|
|
|
|
$content = $helper->getContent();
|
|
$format = $content->getDefaultFormat();
|
|
|
|
return [
|
|
'code' => 200,
|
|
'headers' => [
|
|
'Content-Type' => $format,
|
|
],
|
|
'body' => $content->serialize( $format ),
|
|
];
|
|
} catch ( HttpException $ex ) {
|
|
return $this->fakeRESTbaseError( $ex );
|
|
}
|
|
}
|
|
|
|
/**
|
|
* @param mixed $data
|
|
* @param HtmlOutputRendererHelper $helper
|
|
*
|
|
* @return array
|
|
*/
|
|
private function fakeRESTbaseHTMLResponse( $data, HtmlOutputRendererHelper $helper ): array {
|
|
$contentLanguage = $helper->getHtmlOutputContentLanguage();
|
|
// @phan-suppress-next-line PhanRedundantCondition
|
|
if ( is_string( $contentLanguage ) ) {
|
|
// Backwards-compatibility; remove after
|
|
// I982e0df706a633b05dcc02b5220b737c19adc401 is deployed
|
|
$contentLanguage = new Bcp47CodeValue( $contentLanguage );
|
|
}
|
|
return [
|
|
'code' => 200,
|
|
'headers' => [
|
|
'content-language' => $contentLanguage->toBcp47Code(),
|
|
'etag' => $helper->getETag()
|
|
],
|
|
'body' => $data,
|
|
];
|
|
}
|
|
|
|
/**
|
|
* @param Exception $ex
|
|
*
|
|
* @return array
|
|
*/
|
|
private function fakeRESTbaseError( Exception $ex ): array {
|
|
if ( $ex instanceof LocalizedHttpException ) {
|
|
$msg = $ex->getMessageValue();
|
|
} elseif ( $ex instanceof LocalizedException ) {
|
|
$msg = $ex->getMessageObject();
|
|
} else {
|
|
$msg = new RawMessage( $ex->getMessage() );
|
|
}
|
|
|
|
return [
|
|
'error' => [
|
|
'message' => $msg->getKey() ?? '',
|
|
'params' => $msg->getParams() ?? []
|
|
],
|
|
'headers' => [],
|
|
'body' => $ex->getMessage(),
|
|
];
|
|
}
|
|
|
|
}
|