mirror of
https://gerrit.wikimedia.org/r/mediawiki/extensions/SpamBlacklist
synced 2024-11-24 15:13:44 +00:00
3cb265f12e
StashedEdit is slower than the PreparedUpdate Bug: T288639 Change-Id: Ibeb934050c6b24720da4b69dba6273c8b3e15acc
265 lines
6.8 KiB
PHP
265 lines
6.8 KiB
PHP
<?php
|
|
|
|
use MediaWiki\MediaWikiServices;
|
|
use MediaWiki\Revision\RevisionRecord;
|
|
use MediaWiki\Storage\EditResult;
|
|
use MediaWiki\User\UserIdentity;
|
|
use Wikimedia\Assert\PreconditionException;
|
|
|
|
/**
|
|
* Hooks for the spam blacklist extension
|
|
*/
|
|
class SpamBlacklistHooks implements
|
|
\MediaWiki\Hook\EditFilterHook,
|
|
\MediaWiki\Hook\EditFilterMergedContentHook,
|
|
\MediaWiki\Hook\UploadVerifyUploadHook,
|
|
\MediaWiki\Storage\Hook\PageSaveCompleteHook,
|
|
\MediaWiki\Storage\Hook\ParserOutputStashForEditHook,
|
|
\MediaWiki\User\Hook\UserCanSendEmailHook
|
|
{
|
|
|
|
/**
 * Hook function for EditFilterMergedContent
 *
 * Gathers the external links of the content being saved (plus the edit
 * summary, when it looks like it could contain a URL or e-mail address)
 * and runs them through the spam blacklist filter. On a match, a fatal
 * error is added to $status and the hook returns false.
 *
 * @param IContextSource $context
 * @param Content $content
 * @param Status $status
 * @param string $summary
 * @param User $user
 * @param bool $minoredit
 *
 * @return bool False if the filter reported matches, true otherwise
 */
public function onEditFilterMergedContent(
	IContextSource $context,
	Content $content,
	Status $status,
	$summary,
	User $user,
	$minoredit
) {
	$title = $context->getTitle();
	try {
		// Try getting the update directly
		$updater = $context->getWikiPage()->getCurrentUpdate();
		$pout = $updater->getParserOutputForMetaData();
	} catch ( PreconditionException | LogicException $exception ) {
		// The current update is not available or not usable. LogicException
		// is caught alongside PreconditionException so that an updater in an
		// unexpected stage falls back to the paths below instead of
		// aborting the save.
		$services = MediaWikiServices::getInstance();
		$stashedEdit = $services->getPageEditStash()->checkCache(
			$title,
			$content,
			$user
		);
		if ( $stashedEdit ) {
			// Try getting the value from edit stash
			/** @var ParserOutput $pout */
			$pout = $stashedEdit->output;
		} else {
			// Last resort, parse the page.
			$contentRenderer = $services->getContentRenderer();
			$pout = $contentRenderer->getParserOutput(
				$content,
				$title,
				null,
				null,
				false
			);
		}
	}
	$links = array_keys( $pout->getExternalLinks() );
	// HACK: treat the edit summary as a link if it contains anything
	// that looks like it could be a URL or e-mail address.
	if ( preg_match( '/\S(\.[^\s\d]{2,}|[\/@]\S)/', $summary ) ) {
		$links[] = $summary;
	}

	$spamObj = BaseBlacklist::getSpamBlacklist();
	$matches = $spamObj->filter( $links, $title, $user );

	if ( $matches !== false ) {
		$error = new ApiMessage(
			wfMessage( 'spam-blacklisted-link', Message::listParam( $matches ) ),
			'spamblacklist',
			[
				'spamblacklist' => [ 'matches' => $matches ],
			]
		);
		$status->fatal( $error );
		// @todo Remove this line once this extension no longer supports MediaWiki 1.36 and earlier
		$status->value = EditPage::AS_HOOK_ERROR_EXPECTED;
		return false;
	}

	return true;
}
|
|
|
|
/**
 * Hook function for ParserOutputStashForEdit
 *
 * Hands the external links of the stashed parser output to the spam
 * blacklist so it can warm its caches for the later filter run.
 *
 * @param WikiPage $page
 * @param Content $content
 * @param ParserOutput $output
 * @param string $summary
 * @param User $user
 */
public function onParserOutputStashForEdit(
	$page,
	$content,
	$output,
	$summary,
	$user
) {
	$externalLinks = array_keys( $output->getExternalLinks() );
	BaseBlacklist::getSpamBlacklist()->warmCachesForFilter(
		$page->getTitle(),
		$externalLinks,
		$user
	);
}
|
|
|
|
/**
 * Hook function for UserCanSendEmail
 *
 * Asks the e-mail blacklist whether the user passes its check; if not,
 * fills $hookErr with the blacklist error message keys.
 *
 * @param User $user
 * @param array &$hookErr
 * @return bool True when the blacklist check passes, false otherwise
 */
public function onUserCanSendEmail( $user, &$hookErr ) {
	$passesCheck = BaseBlacklist::getEmailBlacklist()->checkUser( $user );

	if ( !$passesCheck ) {
		$hookErr = [ 'spam-blacklisted-email', 'spam-blacklisted-email-text', null ];

		// Returning false stops any other hook handler from running
		return false;
	}

	return true;
}
|
|
|
|
/**
 * Hook function for EditFilter
 * Confirm that a local blacklist page being saved is valid,
 * and toss back a warning to the user if it isn't.
 *
 * Pages that are not a local blacklist source, or whose blacklist type
 * cannot be determined, are left alone. Otherwise every line of the
 * submitted text is validated and $hookError is set to an error box
 * listing the invalid lines.
 *
 * @param EditPage $editPage
 * @param string $text
 * @param string $section
 * @param string &$hookError
 * @param string $summary
 */
public function onEditFilter( $editPage, $text, $section, &$hookError, $summary ) {
	$title = $editPage->getTitle();
	$thisPageName = $title->getPrefixedDBkey();

	if ( !BaseBlacklist::isLocalSource( $title ) ) {
		wfDebugLog( 'SpamBlacklist',
			"Spam blacklist validator: [[$thisPageName]] not a local blacklist\n"
		);
		return;
	}

	$type = BaseBlacklist::getTypeFromTitle( $title );
	if ( $type === false ) {
		return;
	}

	$lines = explode( "\n", $text );

	$badLines = SpamRegexBatch::getBadLines( $lines, BaseBlacklist::getInstance( $type ) );
	if ( $badLines ) {
		wfDebugLog( 'SpamBlacklist',
			"Spam blacklist validator: [[$thisPageName]] given invalid input lines: " .
				implode( ', ', $badLines ) . "\n"
		);

		$badList = "*<code>" .
			implode( "</code>\n*<code>",
				array_map( 'wfEscapeWikiText', $badLines ) ) .
			"</code>\n";
		// The message takes the NUMBER of bad lines as its numeric parameter.
		// Passing the array itself would feed each bad line in as a separate
		// parameter instead of the count.
		$hookError =
			"<div class='errorbox'>" .
				wfMessage( 'spam-invalid-lines' )->numParams( count( $badLines ) )->text() . "<br />" .
				$badList .
				"</div>\n" .
				"<br clear='all' />\n";
	} else {
		wfDebugLog( 'SpamBlacklist',
			"Spam blacklist validator: [[$thisPageName]] ok or empty blacklist\n"
		);
	}
}
|
|
|
|
/**
 * Hook function for PageSaveComplete
 * Clear local spam blacklist caches on page save.
 *
 * Nothing happens unless the saved page is a local blacklist source.
 *
 * @param WikiPage $wikiPage
 * @param UserIdentity $userIdentity
 * @param string $summary
 * @param int $flags
 * @param RevisionRecord $revisionRecord
 * @param EditResult $editResult
 */
public function onPageSaveComplete(
	$wikiPage,
	$userIdentity,
	$summary,
	$flags,
	$revisionRecord,
	$editResult
) {
	$isBlacklistSource = BaseBlacklist::isLocalSource( $wikiPage->getTitle() );

	if ( $isBlacklistSource ) {
		// Unfortunately the cache of every blacklist type has to be cleared
		foreach ( array_keys( BaseBlacklist::getBlacklistTypes() ) as $type ) {
			BaseBlacklist::getInstance( $type )->clearCache();
		}
	}
}
|
|
|
|
/**
 * Hook function for UploadVerifyUpload
 *
 * Parses the not-yet-saved description page text, collects its external
 * links (plus the upload comment, when it looks like it could contain a
 * URL or e-mail address) and runs them through the spam blacklist filter.
 * On a match, $error is set to an ApiMessage describing the matches.
 *
 * @param UploadBase $upload
 * @param User $user
 * @param array|null $props
 * @param string $comment
 * @param string $pageText
 * @param array|MessageSpecifier &$error
 */
public function onUploadVerifyUpload(
	UploadBase $upload,
	User $user,
	?array $props,
	$comment,
	$pageText,
	&$error
) {
	$title = $upload->getTitle();

	// The description page is not saved yet, so render the submitted text
	// to find out which external links it would contain.
	$descriptionContent = ContentHandler::makeContent( $pageText, $title );
	$anonOptions = ParserOptions::newFromAnon();
	$parserOutput = MediaWikiServices::getInstance()
		->getContentRenderer()
		->getParserOutput( $descriptionContent, $title, null, $anonOptions );
	$candidates = array_keys( $parserOutput->getExternalLinks() );

	// HACK: the comment is checked as if it were a link whenever it holds
	// something resembling a URL or an e-mail address.
	$commentLooksLikeLink = preg_match( '/\S(\.[^\s\d]{2,}|[\/@]\S)/', $comment );
	if ( $commentLooksLikeLink ) {
		$candidates[] = $comment;
	}

	// Nothing to check
	if ( count( $candidates ) === 0 ) {
		return;
	}

	$matches = BaseBlacklist::getSpamBlacklist()->filter( $candidates, $title, $user );
	if ( $matches === false ) {
		return;
	}

	$error = new ApiMessage(
		wfMessage( 'spam-blacklisted-link', Message::listParam( $matches ) ),
		'spamblacklist',
		[
			'spamblacklist' => [ 'matches' => $matches ],
		]
	);
}
|
|
}
|