2019-10-28 12:28:17 +00:00
|
|
|
<?php
|
|
|
|
/**
|
2022-02-19 04:03:09 +00:00
|
|
|
* Generates language-specific data used by DiscussionTools.
|
2019-10-28 12:28:17 +00:00
|
|
|
*
|
|
|
|
* @file
|
|
|
|
* @ingroup Extensions
|
|
|
|
* @license MIT
|
|
|
|
*/
|
|
|
|
|
2020-05-14 22:44:49 +00:00
|
|
|
namespace MediaWiki\Extension\DiscussionTools;
|
|
|
|
|
|
|
|
use Config;
|
2020-05-19 18:40:05 +00:00
|
|
|
use DateTimeZone;
|
2020-09-03 20:59:33 +00:00
|
|
|
use ILanguageConverter;
|
2020-05-14 22:44:49 +00:00
|
|
|
use Language;
|
2019-10-28 12:28:17 +00:00
|
|
|
use MediaWiki\MediaWikiServices;
|
|
|
|
|
2022-02-19 04:03:09 +00:00
|
|
|
class LanguageData {
	/**
	 * Compute data we need to parse discussion threads on pages.
	 *
	 * The returned array has the following keys, in this order:
	 *  - 'dateFormat': map of language variant => 'both' (date and time) format string
	 *  - 'digits': map of language variant => list of the ten digits (index 0 to 9)
	 *  - 'localTimezone': value of the 'Localtimezone' config setting
	 *  - 'specialContributionsName': local name of Special:Contributions
	 *  - 'specialNewSectionName': local name of Special:NewSection
	 *  - 'timezones': map of language variant => ( displayed abbreviation => uppercase abbreviation )
	 *  - 'contLangMessages': map of language variant => ( message key => message text )
	 *  - 'signatureScanLimit': how far backwards to look for a signature
	 *
	 * @param Config $config
	 * @param Language $lang
	 * @return array
	 */
	public static function getLocalData( Config $config, Language $lang ): array {
		$services = MediaWikiServices::getInstance();
		$langConv = $services->getLanguageConverterFactory()
			->getLanguageConverter( $lang );
		// The variant list is reused by every per-variant section below.
		$variants = $langConv->getVariants();

		$data = [];

		$data['dateFormat'] = [];
		$dateFormat = $lang->getDateFormatString( 'both', $lang->dateFormat( false ) );
		foreach ( $variants as $variant ) {
			$data['dateFormat'][$variant] = self::convertDateFormat( $dateFormat, $langConv, $variant );
		}

		// The localised form of each digit does not depend on the variant, so build it once.
		$translateNumerals = $config->get( 'TranslateNumerals' );
		$localDigits = [];
		foreach ( str_split( '0123456789' ) as $digit ) {
			$localDigits[] = $translateNumerals ? $lang->formatNumNoSeparators( $digit ) : $digit;
		}
		$data['digits'] = [];
		foreach ( $variants as $variant ) {
			$data['digits'][$variant] = [];
			foreach ( $localDigits as $localDigit ) {
				$data['digits'][$variant][] = $langConv->translate( $localDigit, $variant );
			}
		}

		// ApiQuerySiteinfo
		$localTimezone = $config->get( 'Localtimezone' );
		$data['localTimezone'] = $localTimezone;

		$specialPageFactory = $services->getSpecialPageFactory();
		$data['specialContributionsName'] = $specialPageFactory->getLocalNameFor( 'Contributions' );
		$data['specialNewSectionName'] = $specialPageFactory->getLocalNameFor( 'NewSection' );

		// Return all timezone abbreviations for the local timezone (there will often be two, for
		// non-DST and DST timestamps, and sometimes more due to historical data, but that's okay).
		// Avoid DateTimeZone::listAbbreviations(), it returns some half-baked list that is different
		// from the timezone data used by everything else in PHP.
		$timezoneAbbrs = array_values( array_unique(
			array_map( static function ( $transition ) {
				return $transition['abbr'];
			}, ( new DateTimeZone( $localTimezone ) )->getTransitions() )
		) );

		// Resolve the displayed text of every abbreviation once, rather than once per variant:
		// the message lookup below does not depend on the variant.
		$timezoneTexts = array_map( static function ( string $tzMsg ) use ( $lang ) {
			// MWTimestamp::getTimezoneMessage()
			// Parser::pstPass2()
			// Messages used here: 'timezone-utc' and so on
			$key = 'timezone-' . strtolower( trim( $tzMsg ) );
			$msg = wfMessage( $key )->inLanguage( $lang );
			// TODO: This probably causes a similar issue to https://phabricator.wikimedia.org/T221294,
			// but we *must* check the message existence in the database, because the messages are not
			// actually defined by MediaWiki core for any timezone other than UTC...
			if ( $msg->exists() ) {
				return $msg->text();
			}
			return strtoupper( $tzMsg );
		}, $timezoneAbbrs );
		$timezoneValues = array_map( 'strtoupper', $timezoneAbbrs );

		$data['timezones'] = [];
		foreach ( $variants as $variant ) {
			$data['timezones'][$variant] = array_combine(
				array_map( static function ( string $text ) use ( $langConv, $variant ) {
					return $langConv->translate( $text, $variant );
				}, $timezoneTexts ),
				$timezoneValues
			);
		}

		// Messages in content language
		$messagesKeys = array_merge(
			Language::WEEKDAY_MESSAGES,
			Language::WEEKDAY_ABBREVIATED_MESSAGES,
			Language::MONTH_MESSAGES,
			Language::MONTH_GENITIVE_MESSAGES,
			Language::MONTH_ABBREVIATED_MESSAGES
		);
		// As above, fetch the message texts once and only repeat the variant conversion.
		$messagesTexts = array_map( static function ( $key ) use ( $lang ) {
			return wfMessage( $key )->inLanguage( $lang )->text();
		}, $messagesKeys );

		$data['contLangMessages'] = [];
		foreach ( $variants as $variant ) {
			$data['contLangMessages'][$variant] = array_combine(
				$messagesKeys,
				array_map( static function ( $text ) use ( $langConv, $variant ) {
					return $langConv->translate( $text, $variant );
				}, $messagesTexts )
			);
		}

		// How far backwards we look for a signature associated with a timestamp before giving up.
		// Note that this is not a hard limit on the length of signatures we detect.
		$data['signatureScanLimit'] = 100;

		return $data;
	}

	/**
	 * Convert a date format string to a different language variant, leaving all special characters
	 * unchanged and applying language conversion to the plain text fragments.
	 *
	 * Plain text is converted one whole UTF-8 character at a time (never one byte at a time), so
	 * that multi-byte characters reach the language converter intact.
	 *
	 * @param string $format
	 * @param ILanguageConverter $langConv
	 * @param string $variant
	 * @return string
	 */
	private static function convertDateFormat(
		string $format,
		ILanguageConverter $langConv,
		string $variant
	): string {
		$formatLength = strlen( $format );
		$s = '';
		// The supported codes must match CommentParser::getTimestampRegexp()
		for ( $p = 0; $p < $formatLength; $p++ ) {
			$code = $format[ $p ];
			if ( $code === 'x' && $p < $formatLength - 1 ) {
				$code .= $format[++$p];
			}
			if ( $code === 'xk' && $p < $formatLength - 1 ) {
				$code .= $format[++$p];
			}

			// LAZY SHORTCUTS that might cause bugs:
			// * We assume that result of $langConv->translate() doesn't produce any special codes/characters
			// * We assume that calling $langConv->translate() separately for each character is correct
			switch ( $code ) {
				case 'xx':
				case 'xg':
				case 'd':
				case 'D':
				case 'j':
				case 'l':
				case 'F':
				case 'M':
				case 'n':
				case 'Y':
				case 'xkY':
				case 'G':
				case 'H':
				case 'i':
					// Special code - pass through unchanged
					$s .= $code;
					break;
				case '\\':
					// Plain text (backslash escaping) - convert to language variant
					if ( $p < $formatLength - 1 ) {
						$char = self::getCharAt( $format, $p + 1 );
						$s .= '\\' . $langConv->translate( $char, $variant );
						// Skip over every byte of the escaped character
						$p += strlen( $char );
					} else {
						$s .= $code;
					}
					break;
				case '"':
					// Plain text (quoted literal) - convert to language variant
					if ( $p < $formatLength - 1 ) {
						$endQuote = strpos( $format, '"', $p + 1 );
						if ( $endQuote === false ) {
							// No terminating quote, assume literal "
							$s .= $code;
						} else {
							$s .= '"' .
								$langConv->translate( substr( $format, $p + 1, $endQuote - $p - 1 ), $variant ) .
								'"';
							$p = $endQuote;
						}
					} else {
						// Quote at end of string, assume literal "
						$s .= $code;
					}
					break;
				default:
					// Plain text - convert to language variant
					$char = self::getCharAt( $format, $p );
					$s .= $langConv->translate( $char, $variant );
					// The loop increment accounts for the first byte, skip the remaining ones
					$p += strlen( $char ) - 1;
			}
		}

		return $s;
	}

	/**
	 * Get the complete UTF-8 character that starts at the given byte offset.
	 *
	 * Falls back to returning the single byte at that offset when the string is not valid UTF-8
	 * or the offset is not at the start of a character.
	 *
	 * @param string $text
	 * @param int $offset Byte offset, must be less than the length of $text
	 * @return string
	 */
	private static function getCharAt( string $text, int $offset ): string {
		$byte = $text[$offset];
		if ( $byte < "\x80" ) {
			// ASCII, always a complete character
			return $byte;
		}
		if ( preg_match( '/\G./us', $text, $match, 0, $offset ) === 1 ) {
			return $match[0];
		}
		return $byte;
	}
}
|