mediawiki-extensions-SpamBl.../includes/SpamBlacklistHooks.php
Amir Sarabadani 3cb265f12e Give priority to PreparedUpdate
StashedEdit is slower than the PreparedUpdate

Bug: T288639
Change-Id: Ibeb934050c6b24720da4b69dba6273c8b3e15acc
2022-01-10 09:10:18 +01:00

265 lines
6.8 KiB
PHP

<?php
use MediaWiki\MediaWikiServices;
use MediaWiki\Revision\RevisionRecord;
use MediaWiki\Storage\EditResult;
use MediaWiki\User\UserIdentity;
use Wikimedia\Assert\PreconditionException;
/**
 * Hooks for the spam blacklist extension
 *
 * Wires the spam and e-mail blacklists into page edits, edit stashing,
 * uploads and user e-mail, and validates/invalidates local blacklist pages
 * when they are edited.
 */
class SpamBlacklistHooks implements
	\MediaWiki\Hook\EditFilterHook,
	\MediaWiki\Hook\EditFilterMergedContentHook,
	\MediaWiki\Hook\UploadVerifyUploadHook,
	\MediaWiki\Storage\Hook\PageSaveCompleteHook,
	\MediaWiki\Storage\Hook\ParserOutputStashForEditHook,
	\MediaWiki\User\Hook\UserCanSendEmailHook
{

	/**
	 * Check whether free text (an edit summary or upload comment) contains
	 * anything that looks like it could be a URL or e-mail address.
	 *
	 * @param string $text
	 * @return bool
	 */
	private static function looksLikeLink( $text ) {
		return (bool)preg_match( '/\S(\.[^\s\d]{2,}|[\/@]\S)/', $text );
	}

	/**
	 * Build the error message reported when links hit the spam blacklist.
	 *
	 * @param string[] $matches Matches as returned by the spam blacklist filter
	 * @return ApiMessage
	 */
	private static function newSpamError( array $matches ) {
		return new ApiMessage(
			wfMessage( 'spam-blacklisted-link', Message::listParam( $matches ) ),
			'spamblacklist',
			[
				'spamblacklist' => [ 'matches' => $matches ],
			]
		);
	}

	/**
	 * Hook function for EditFilterMergedContent
	 *
	 * Collects the external links of the content being saved (plus the edit
	 * summary, if it looks like a link) and makes the status fatal when the
	 * spam blacklist filter reports matches.
	 *
	 * @param IContextSource $context
	 * @param Content $content
	 * @param Status $status
	 * @param string $summary
	 * @param User $user
	 * @param bool $minoredit
	 *
	 * @return bool False if the edit matched the spam blacklist, true otherwise
	 */
	public function onEditFilterMergedContent(
		IContextSource $context,
		Content $content,
		Status $status,
		$summary,
		User $user,
		$minoredit
	) {
		$title = $context->getTitle();
		try {
			// Try getting the update directly
			$updater = $context->getWikiPage()->getCurrentUpdate();
			$pout = $updater->getParserOutputForMetaData();
		} catch ( PreconditionException $exception ) {
			// No usable current update: fall back to the edit stash, then to parsing
			$services = MediaWikiServices::getInstance();
			$stashedEdit = $services->getPageEditStash()->checkCache(
				$title,
				$content,
				$user
			);
			if ( $stashedEdit ) {
				// Try getting the value from edit stash
				/** @var ParserOutput $pout */
				$pout = $stashedEdit->output;
			} else {
				// Last resort, parse the page.
				$contentRenderer = $services->getContentRenderer();
				$pout = $contentRenderer->getParserOutput(
					$content,
					$title,
					null,
					null,
					false
				);
			}
		}
		$links = array_keys( $pout->getExternalLinks() );
		// HACK: treat the edit summary as a link if it contains anything
		// that looks like it could be a URL or e-mail address.
		if ( self::looksLikeLink( $summary ) ) {
			$links[] = $summary;
		}
		$spamObj = BaseBlacklist::getSpamBlacklist();
		$matches = $spamObj->filter( $links, $title, $user );
		if ( $matches !== false ) {
			$status->fatal( self::newSpamError( $matches ) );
			// @todo Remove this line once this extension no longer supports MediaWiki 1.36 and earlier
			$status->value = EditPage::AS_HOOK_ERROR_EXPECTED;
			return false;
		}
		return true;
	}

	/**
	 * Hook function for ParserOutputStashForEdit
	 * Warm the spam blacklist caches with the external links of a stashed edit.
	 *
	 * @param WikiPage $page
	 * @param Content $content
	 * @param ParserOutput $output
	 * @param string $summary
	 * @param User $user
	 */
	public function onParserOutputStashForEdit(
		$page,
		$content,
		$output,
		$summary,
		$user
	) {
		$links = array_keys( $output->getExternalLinks() );
		$spamObj = BaseBlacklist::getSpamBlacklist();
		$spamObj->warmCachesForFilter( $page->getTitle(), $links, $user );
	}

	/**
	 * Verify that the user can send emails
	 *
	 * @param User $user
	 * @param array &$hookErr Set to the error message keys when the e-mail
	 *  blacklist check fails
	 * @return bool
	 */
	public function onUserCanSendEmail( $user, &$hookErr ) {
		$blacklist = BaseBlacklist::getEmailBlacklist();
		if ( $blacklist->checkUser( $user ) ) {
			return true;
		}
		$hookErr = [ 'spam-blacklisted-email', 'spam-blacklisted-email-text', null ];
		// No other hook handler should run
		return false;
	}

	/**
	 * Hook function for EditFilter
	 * Confirm that a local blacklist page being saved is valid,
	 * and toss back a warning to the user if it isn't.
	 *
	 * @param EditPage $editPage
	 * @param string $text
	 * @param string $section
	 * @param string &$hookError Set to an error box listing the invalid lines
	 * @param string $summary
	 */
	public function onEditFilter( $editPage, $text, $section, &$hookError, $summary ) {
		$title = $editPage->getTitle();
		$thisPageName = $title->getPrefixedDBkey();
		if ( !BaseBlacklist::isLocalSource( $title ) ) {
			wfDebugLog( 'SpamBlacklist',
				"Spam blacklist validator: [[$thisPageName]] not a local blacklist\n"
			);
			return;
		}
		$type = BaseBlacklist::getTypeFromTitle( $title );
		if ( $type === false ) {
			return;
		}
		$lines = explode( "\n", $text );
		$badLines = SpamRegexBatch::getBadLines( $lines, BaseBlacklist::getInstance( $type ) );
		if ( $badLines ) {
			wfDebugLog( 'SpamBlacklist',
				"Spam blacklist validator: [[$thisPageName]] given invalid input lines: " .
					implode( ', ', $badLines ) . "\n"
			);
			$badList = "*<code>" .
				implode( "</code>\n*<code>",
					array_map( 'wfEscapeWikiText', $badLines ) ) .
				"</code>\n";
			// The numeric message parameter is the number of bad lines; passing
			// the array itself would feed the lines in as "numbers".
			$hookError =
				"<div class='errorbox'>" .
					wfMessage( 'spam-invalid-lines' )->numParams( count( $badLines ) )->text() . "<br />" .
					$badList .
				"</div>\n" .
				"<br clear='all' />\n";
		} else {
			wfDebugLog( 'SpamBlacklist',
				"Spam blacklist validator: [[$thisPageName]] ok or empty blacklist\n"
			);
		}
	}

	/**
	 * Hook function for PageSaveComplete
	 * Clear local spam blacklist caches on page save.
	 *
	 * @param WikiPage $wikiPage
	 * @param UserIdentity $userIdentity
	 * @param string $summary
	 * @param int $flags
	 * @param RevisionRecord $revisionRecord
	 * @param EditResult $editResult
	 */
	public function onPageSaveComplete(
		$wikiPage,
		$userIdentity,
		$summary,
		$flags,
		$revisionRecord,
		$editResult
	) {
		if ( !BaseBlacklist::isLocalSource( $wikiPage->getTitle() ) ) {
			return;
		}
		// This sucks because every Blacklist needs to be cleared
		foreach ( array_keys( BaseBlacklist::getBlacklistTypes() ) as $type ) {
			BaseBlacklist::getInstance( $type )->clearCache();
		}
	}

	/**
	 * Hook function for UploadVerifyUpload
	 * Check the external links of the upload's page text (plus the upload
	 * comment, if it looks like a link) against the spam blacklist.
	 *
	 * @param UploadBase $upload
	 * @param User $user
	 * @param array|null $props
	 * @param string $comment
	 * @param string $pageText
	 * @param array|MessageSpecifier &$error Set to the spam error on a match
	 */
	public function onUploadVerifyUpload(
		UploadBase $upload,
		User $user,
		?array $props,
		$comment,
		$pageText,
		&$error
	) {
		$title = $upload->getTitle();
		// get the link from the not-yet-saved page content.
		$content = ContentHandler::makeContent( $pageText, $title );
		$parserOptions = ParserOptions::newFromAnon();
		$contentRenderer = MediaWikiServices::getInstance()->getContentRenderer();
		$output = $contentRenderer->getParserOutput( $content, $title, null, $parserOptions );
		$links = array_keys( $output->getExternalLinks() );
		// HACK: treat comment as a link if it contains anything
		// that looks like it could be a URL or e-mail address.
		if ( self::looksLikeLink( $comment ) ) {
			$links[] = $comment;
		}
		if ( !$links ) {
			return;
		}
		$spamObj = BaseBlacklist::getSpamBlacklist();
		$matches = $spamObj->filter( $links, $title, $user );
		if ( $matches !== false ) {
			$error = self::newSpamError( $matches );
		}
	}
}