2019-10-28 12:28:17 +00:00
|
|
|
<?php
|
|
|
|
/**
|
2022-02-19 04:03:09 +00:00
|
|
|
* Generates language-specific data used by DiscussionTools.
|
2019-10-28 12:28:17 +00:00
|
|
|
*
|
|
|
|
* @file
|
|
|
|
* @ingroup Extensions
|
|
|
|
* @license MIT
|
|
|
|
*/
|
|
|
|
|
2020-05-14 22:44:49 +00:00
|
|
|
namespace MediaWiki\Extension\DiscussionTools;
|
|
|
|
|
2020-05-19 18:40:05 +00:00
|
|
|
use DateTimeZone;
|
2020-09-03 20:59:33 +00:00
|
|
|
use ILanguageConverter;
|
2020-05-14 22:44:49 +00:00
|
|
|
use Language;
|
2023-12-11 15:38:02 +00:00
|
|
|
use MediaWiki\Config\Config;
|
Change CommentParser into a service
Goal:
-----
To have a method like CommentParser::parse(), which just takes a node
to parse and a title and returns plain data, so that we don't need to
keep track of the config to construct a CommentParser object (the
required config like content language is provided by services) and
we don't need to keep that object around after parsing.
Changes:
--------
CommentParser.php:
* …is now a service. Constructor only takes services as arguments.
The node and title are passed to a new parse() method.
* parse() should return plain data, but I split this part to a separate
patch for ease of review: I49bfe019aa460651447fd383f73eafa9d7180a92.
* CommentParser still cheats and accesses global state in a few places,
e.g. calling Title::makeTitleSafe or CommentUtils::getTitleFromUrl,
so we can't turn its tests into true unit tests. This work is left
for future commits.
LanguageData.php:
* …is now a service, instead of a static class.
Parser.js:
* …is not a real service, but it's changed to behave in a similar way.
Constructor takes only the required config as argument,
and node and title are instead passed to a new parse() method.
CommentParserTest.php:
parser.test.js:
* Can be simplified, now that we don't need a useless node and title
to test internal methods that don't use them.
testUtils.js:
* Can be simplified, now that we don't need to override internal
ResourceLoader stuff just to change the parser config.
Change-Id: Iadb7757debe000025e52770ca51ebcf24ca8ee66
2022-02-19 02:43:21 +00:00
|
|
|
use MediaWiki\Languages\LanguageConverterFactory;
|
2023-05-19 07:36:50 +00:00
|
|
|
use MediaWiki\MainConfigNames;
|
Change CommentParser into a service
Goal:
-----
To have a method like CommentParser::parse(), which just takes a node
to parse and a title and returns plain data, so that we don't need to
keep track of the config to construct a CommentParser object (the
required config like content language is provided by services) and
we don't need to keep that object around after parsing.
Changes:
--------
CommentParser.php:
* …is now a service. Constructor only takes services as arguments.
The node and title are passed to a new parse() method.
* parse() should return plain data, but I split this part to a separate
patch for ease of review: I49bfe019aa460651447fd383f73eafa9d7180a92.
* CommentParser still cheats and accesses global state in a few places,
e.g. calling Title::makeTitleSafe or CommentUtils::getTitleFromUrl,
so we can't turn its tests into true unit tests. This work is left
for future commits.
LanguageData.php:
* …is now a service, instead of a static class.
Parser.js:
* …is not a real service, but it's changed to behave in a similar way.
Constructor takes only the required config as argument,
and node and title are instead passed to a new parse() method.
CommentParserTest.php:
parser.test.js:
* Can be simplified, now that we don't need a useless node and title
to test internal methods that don't use them.
testUtils.js:
* Can be simplified, now that we don't need to override internal
ResourceLoader stuff just to change the parser config.
Change-Id: Iadb7757debe000025e52770ca51ebcf24ca8ee66
2022-02-19 02:43:21 +00:00
|
|
|
use MediaWiki\SpecialPage\SpecialPageFactory;
|
2019-10-28 12:28:17 +00:00
|
|
|
|
2022-02-19 04:03:09 +00:00
|
|
|
class LanguageData {
|
2022-10-21 19:34:18 +00:00
|
|
|
|
|
|
|
private Config $config;
|
|
|
|
private Language $language;
|
|
|
|
private LanguageConverterFactory $languageConverterFactory;
|
|
|
|
private SpecialPageFactory $specialPageFactory;
|
Change CommentParser into a service
Goal:
-----
To have a method like CommentParser::parse(), which just takes a node
to parse and a title and returns plain data, so that we don't need to
keep track of the config to construct a CommentParser object (the
required config like content language is provided by services) and
we don't need to keep that object around after parsing.
Changes:
--------
CommentParser.php:
* …is now a service. Constructor only takes services as arguments.
The node and title are passed to a new parse() method.
* parse() should return plain data, but I split this part to a separate
patch for ease of review: I49bfe019aa460651447fd383f73eafa9d7180a92.
* CommentParser still cheats and accesses global state in a few places,
e.g. calling Title::makeTitleSafe or CommentUtils::getTitleFromUrl,
so we can't turn its tests into true unit tests. This work is left
for future commits.
LanguageData.php:
* …is now a service, instead of a static class.
Parser.js:
* …is not a real service, but it's changed to behave in a similar way.
Constructor takes only the required config as argument,
and node and title are instead passed to a new parse() method.
CommentParserTest.php:
parser.test.js:
* Can be simplified, now that we don't need a useless node and title
to test internal methods that don't use them.
testUtils.js:
* Can be simplified, now that we don't need to override internal
ResourceLoader stuff just to change the parser config.
Change-Id: Iadb7757debe000025e52770ca51ebcf24ca8ee66
2022-02-19 02:43:21 +00:00
|
|
|
|
|
|
|
public function __construct(
|
|
|
|
Config $config,
|
|
|
|
Language $language,
|
|
|
|
LanguageConverterFactory $languageConverterFactory,
|
|
|
|
SpecialPageFactory $specialPageFactory
|
|
|
|
) {
|
|
|
|
$this->config = $config;
|
|
|
|
$this->language = $language;
|
|
|
|
$this->languageConverterFactory = $languageConverterFactory;
|
|
|
|
$this->specialPageFactory = $specialPageFactory;
|
|
|
|
}
|
|
|
|
|
2019-10-28 12:28:17 +00:00
|
|
|
/**
|
2022-02-19 04:03:09 +00:00
|
|
|
* Compute data we need to parse discussion threads on pages.
|
2019-10-28 12:28:17 +00:00
|
|
|
*/
|
Change CommentParser into a service
Goal:
-----
To have a method like CommentParser::parse(), which just takes a node
to parse and a title and returns plain data, so that we don't need to
keep track of the config to construct a CommentParser object (the
required config like content language is provided by services) and
we don't need to keep that object around after parsing.
Changes:
--------
CommentParser.php:
* …is now a service. Constructor only takes services as arguments.
The node and title are passed to a new parse() method.
* parse() should return plain data, but I split this part to a separate
patch for ease of review: I49bfe019aa460651447fd383f73eafa9d7180a92.
* CommentParser still cheats and accesses global state in a few places,
e.g. calling Title::makeTitleSafe or CommentUtils::getTitleFromUrl,
so we can't turn its tests into true unit tests. This work is left
for future commits.
LanguageData.php:
* …is now a service, instead of a static class.
Parser.js:
* …is not a real service, but it's changed to behave in a similar way.
Constructor takes only the required config as argument,
and node and title are instead passed to a new parse() method.
CommentParserTest.php:
parser.test.js:
* Can be simplified, now that we don't need a useless node and title
to test internal methods that don't use them.
testUtils.js:
* Can be simplified, now that we don't need to override internal
ResourceLoader stuff just to change the parser config.
Change-Id: Iadb7757debe000025e52770ca51ebcf24ca8ee66
2022-02-19 02:43:21 +00:00
|
|
|
public function getLocalData(): array {
|
|
|
|
$config = $this->config;
|
|
|
|
$lang = $this->language;
|
|
|
|
$langConv = $this->languageConverterFactory->getLanguageConverter( $lang );
|
2020-09-03 20:59:33 +00:00
|
|
|
|
2019-10-28 12:28:17 +00:00
|
|
|
$data = [];
|
|
|
|
|
2020-09-03 20:59:33 +00:00
|
|
|
$data['dateFormat'] = [];
|
|
|
|
$dateFormat = $lang->getDateFormatString( 'both', $lang->dateFormat( false ) );
|
2021-02-27 14:46:23 +00:00
|
|
|
foreach ( $langConv->getVariants() as $variant ) {
|
Change CommentParser into a service
Goal:
-----
To have a method like CommentParser::parse(), which just takes a node
to parse and a title and returns plain data, so that we don't need to
keep track of the config to construct a CommentParser object (the
required config like content language is provided by services) and
we don't need to keep that object around after parsing.
Changes:
--------
CommentParser.php:
* …is now a service. Constructor only takes services as arguments.
The node and title are passed to a new parse() method.
* parse() should return plain data, but I split this part to a separate
patch for ease of review: I49bfe019aa460651447fd383f73eafa9d7180a92.
* CommentParser still cheats and accesses global state in a few places,
e.g. calling Title::makeTitleSafe or CommentUtils::getTitleFromUrl,
so we can't turn its tests into true unit tests. This work is left
for future commits.
LanguageData.php:
* …is now a service, instead of a static class.
Parser.js:
* …is not a real service, but it's changed to behave in a similar way.
Constructor takes only the required config as argument,
and node and title are instead passed to a new parse() method.
CommentParserTest.php:
parser.test.js:
* Can be simplified, now that we don't need a useless node and title
to test internal methods that don't use them.
testUtils.js:
* Can be simplified, now that we don't need to override internal
ResourceLoader stuff just to change the parser config.
Change-Id: Iadb7757debe000025e52770ca51ebcf24ca8ee66
2022-02-19 02:43:21 +00:00
|
|
|
$convDateFormat = $this->convertDateFormat( $dateFormat, $langConv, $variant );
|
2020-09-03 20:59:33 +00:00
|
|
|
$data['dateFormat'][$variant] = $convDateFormat;
|
|
|
|
}
|
2019-10-28 12:28:17 +00:00
|
|
|
|
2020-09-03 20:59:33 +00:00
|
|
|
$data['digits'] = [];
|
2021-02-27 14:46:23 +00:00
|
|
|
foreach ( $langConv->getVariants() as $variant ) {
|
2020-09-03 20:59:33 +00:00
|
|
|
$data['digits'][$variant] = [];
|
|
|
|
foreach ( str_split( '0123456789' ) as $digit ) {
|
2023-05-19 07:36:50 +00:00
|
|
|
if ( $config->get( MainConfigNames::TranslateNumerals ) ) {
|
2020-09-03 20:59:33 +00:00
|
|
|
$localDigit = $lang->formatNumNoSeparators( $digit );
|
|
|
|
} else {
|
|
|
|
$localDigit = $digit;
|
|
|
|
}
|
|
|
|
$convLocalDigit = $langConv->translate( $localDigit, $variant );
|
|
|
|
$data['digits'][$variant][] = $convLocalDigit;
|
|
|
|
}
|
|
|
|
}
|
2019-10-28 12:28:17 +00:00
|
|
|
|
|
|
|
// ApiQuerySiteinfo
|
2023-05-19 07:36:50 +00:00
|
|
|
$data['localTimezone'] = $config->get( MainConfigNames::Localtimezone );
|
2019-10-28 12:28:17 +00:00
|
|
|
|
2023-01-16 19:53:39 +00:00
|
|
|
// special page names compared against Title::getText, which contains space
|
|
|
|
// But aliases are stored with underscores (db key) in the alias files
|
|
|
|
$data['specialContributionsName'] = str_replace( '_', ' ', $this->specialPageFactory
|
|
|
|
->getLocalNameFor( 'Contributions' ) );
|
|
|
|
$data['specialNewSectionName'] = str_replace( '_', ' ', $this->specialPageFactory
|
|
|
|
->getLocalNameFor( 'NewSection' ) );
|
2019-10-28 12:28:17 +00:00
|
|
|
|
2023-05-19 07:36:50 +00:00
|
|
|
$localTimezone = $config->get( MainConfigNames::Localtimezone );
|
2020-10-14 19:53:00 +00:00
|
|
|
// Return all timezone abbreviations for the local timezone (there will often be two, for
|
2019-10-28 12:28:17 +00:00
|
|
|
// non-DST and DST timestamps, and sometimes more due to historical data, but that's okay).
|
2020-10-14 19:53:00 +00:00
|
|
|
// Avoid DateTimeZone::listAbbreviations(), it returns some half-baked list that is different
|
|
|
|
// from the timezone data used by everything else in PHP.
|
2022-07-07 01:56:21 +00:00
|
|
|
$timezoneTransitions = ( new DateTimeZone( $localTimezone ) )->getTransitions();
|
|
|
|
if ( !is_array( $timezoneTransitions ) ) {
|
|
|
|
// Handle (arguably invalid) config where $wgLocaltimezone is an abbreviation like "CST"
|
|
|
|
// instead of a real IANA timezone name like "America/Chicago". (T312310)
|
|
|
|
// "DateTimeZone objects wrapping type 1 (UTC offsets) and type 2 (abbreviations) do not
|
|
|
|
// contain any transitions, and calling this method on them will return false."
|
|
|
|
// https://www.php.net/manual/en/datetimezone.gettransitions.php
|
|
|
|
$timezoneAbbrs = [ $localTimezone ];
|
|
|
|
} else {
|
|
|
|
$timezoneAbbrs = array_values( array_unique(
|
|
|
|
array_map( static function ( $transition ) {
|
|
|
|
return $transition['abbr'];
|
|
|
|
}, $timezoneTransitions )
|
|
|
|
) );
|
|
|
|
}
|
2020-09-03 20:59:33 +00:00
|
|
|
|
|
|
|
$data['timezones'] = [];
|
2021-02-27 14:46:23 +00:00
|
|
|
foreach ( $langConv->getVariants() as $variant ) {
|
2020-09-03 20:59:33 +00:00
|
|
|
$data['timezones'][$variant] = array_combine(
|
2021-05-05 06:59:38 +00:00
|
|
|
array_map( static function ( string $tzMsg ) use ( $lang, $langConv, $variant ) {
|
2020-09-03 20:59:33 +00:00
|
|
|
// MWTimestamp::getTimezoneMessage()
|
|
|
|
// Parser::pstPass2()
|
|
|
|
// Messages used here: 'timezone-utc' and so on
|
|
|
|
$key = 'timezone-' . strtolower( trim( $tzMsg ) );
|
|
|
|
$msg = wfMessage( $key )->inLanguage( $lang );
|
|
|
|
// TODO: This probably causes a similar issue to https://phabricator.wikimedia.org/T221294,
|
|
|
|
// but we *must* check the message existence in the database, because the messages are not
|
|
|
|
// actually defined by MediaWiki core for any timezone other than UTC...
|
|
|
|
if ( $msg->exists() ) {
|
|
|
|
$text = $msg->text();
|
|
|
|
} else {
|
|
|
|
$text = strtoupper( $tzMsg );
|
|
|
|
}
|
|
|
|
$convText = $langConv->translate( $text, $variant );
|
|
|
|
return $convText;
|
|
|
|
}, $timezoneAbbrs ),
|
|
|
|
array_map( 'strtoupper', $timezoneAbbrs )
|
|
|
|
);
|
|
|
|
}
|
2019-10-28 12:28:17 +00:00
|
|
|
|
|
|
|
// Messages in content language
|
|
|
|
$messagesKeys = array_merge(
|
2020-02-28 08:18:16 +00:00
|
|
|
Language::WEEKDAY_MESSAGES,
|
|
|
|
Language::WEEKDAY_ABBREVIATED_MESSAGES,
|
|
|
|
Language::MONTH_MESSAGES,
|
|
|
|
Language::MONTH_GENITIVE_MESSAGES,
|
|
|
|
Language::MONTH_ABBREVIATED_MESSAGES
|
2019-10-28 12:28:17 +00:00
|
|
|
);
|
2020-09-03 20:59:33 +00:00
|
|
|
$data['contLangMessages'] = [];
|
2021-02-27 14:46:23 +00:00
|
|
|
foreach ( $langConv->getVariants() as $variant ) {
|
2020-09-03 20:59:33 +00:00
|
|
|
$data['contLangMessages'][$variant] = array_combine(
|
|
|
|
$messagesKeys,
|
2021-05-05 06:59:38 +00:00
|
|
|
array_map( static function ( $key ) use ( $lang, $langConv, $variant ) {
|
2020-09-03 20:59:33 +00:00
|
|
|
$text = wfMessage( $key )->inLanguage( $lang )->text();
|
|
|
|
return $langConv->translate( $text, $variant );
|
|
|
|
}, $messagesKeys )
|
|
|
|
);
|
|
|
|
}
|
2019-10-28 12:28:17 +00:00
|
|
|
|
|
|
|
return $data;
|
|
|
|
}
|
2020-03-10 13:03:45 +00:00
|
|
|
|
2020-09-03 20:59:33 +00:00
|
|
|
/**
|
|
|
|
* Convert a date format string to a different language variant, leaving all special characters
|
|
|
|
* unchanged and applying language conversion to the plain text fragments.
|
|
|
|
*/
|
Change CommentParser into a service
Goal:
-----
To have a method like CommentParser::parse(), which just takes a node
to parse and a title and returns plain data, so that we don't need to
keep track of the config to construct a CommentParser object (the
required config like content language is provided by services) and
we don't need to keep that object around after parsing.
Changes:
--------
CommentParser.php:
* …is now a service. Constructor only takes services as arguments.
The node and title are passed to a new parse() method.
* parse() should return plain data, but I split this part to a separate
patch for ease of review: I49bfe019aa460651447fd383f73eafa9d7180a92.
* CommentParser still cheats and accesses global state in a few places,
e.g. calling Title::makeTitleSafe or CommentUtils::getTitleFromUrl,
so we can't turn its tests into true unit tests. This work is left
for future commits.
LanguageData.php:
* …is now a service, instead of a static class.
Parser.js:
* …is not a real service, but it's changed to behave in a similar way.
Constructor takes only the required config as argument,
and node and title are instead passed to a new parse() method.
CommentParserTest.php:
parser.test.js:
* Can be simplified, now that we don't need a useless node and title
to test internal methods that don't use them.
testUtils.js:
* Can be simplified, now that we don't need to override internal
ResourceLoader stuff just to change the parser config.
Change-Id: Iadb7757debe000025e52770ca51ebcf24ca8ee66
2022-02-19 02:43:21 +00:00
|
|
|
private function convertDateFormat(
|
2020-09-03 20:59:33 +00:00
|
|
|
string $format,
|
|
|
|
ILanguageConverter $langConv,
|
|
|
|
string $variant
|
2021-07-22 07:25:13 +00:00
|
|
|
): string {
|
2020-09-03 20:59:33 +00:00
|
|
|
$formatLength = strlen( $format );
|
|
|
|
$s = '';
|
|
|
|
// The supported codes must match CommentParser::getTimestampRegexp()
|
|
|
|
for ( $p = 0; $p < $formatLength; $p++ ) {
|
|
|
|
$num = false;
|
|
|
|
$code = $format[ $p ];
|
|
|
|
if ( $code === 'x' && $p < $formatLength - 1 ) {
|
|
|
|
$code .= $format[++$p];
|
|
|
|
}
|
|
|
|
if ( $code === 'xk' && $p < $formatLength - 1 ) {
|
|
|
|
$code .= $format[++$p];
|
|
|
|
}
|
|
|
|
|
|
|
|
// LAZY SHORTCUTS that might cause bugs:
|
|
|
|
// * We assume that result of $langConv->translate() doesn't produce any special codes/characters
|
|
|
|
// * We assume that calling $langConv->translate() separately for each character is correct
|
|
|
|
switch ( $code ) {
|
2020-10-29 10:52:56 +00:00
|
|
|
case 'xx':
|
2020-09-03 20:59:33 +00:00
|
|
|
case 'xg':
|
2023-06-04 18:16:56 +00:00
|
|
|
case 'xn':
|
2020-09-03 20:59:33 +00:00
|
|
|
case 'd':
|
|
|
|
case 'D':
|
|
|
|
case 'j':
|
|
|
|
case 'l':
|
|
|
|
case 'F':
|
|
|
|
case 'M':
|
2023-06-04 18:16:56 +00:00
|
|
|
case 'm':
|
2020-09-03 20:59:33 +00:00
|
|
|
case 'n':
|
|
|
|
case 'Y':
|
|
|
|
case 'xkY':
|
|
|
|
case 'G':
|
|
|
|
case 'H':
|
|
|
|
case 'i':
|
2023-06-04 18:16:56 +00:00
|
|
|
case 's':
|
2020-09-03 20:59:33 +00:00
|
|
|
// Special code - pass through unchanged
|
|
|
|
$s .= $code;
|
|
|
|
break;
|
|
|
|
case '\\':
|
|
|
|
// Plain text (backslash escaping) - convert to language variant
|
|
|
|
if ( $p < $formatLength - 1 ) {
|
|
|
|
$s .= '\\' . $langConv->translate( $format[++$p], $variant );
|
|
|
|
} else {
|
|
|
|
$s .= $code;
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
case '"':
|
|
|
|
// Plain text (quoted literal) - convert to language variant
|
|
|
|
if ( $p < $formatLength - 1 ) {
|
|
|
|
$endQuote = strpos( $format, '"', $p + 1 );
|
|
|
|
if ( $endQuote === false ) {
|
|
|
|
// No terminating quote, assume literal "
|
|
|
|
$s .= $code;
|
|
|
|
} else {
|
|
|
|
$s .= '"' .
|
|
|
|
$langConv->translate( substr( $format, $p + 1, $endQuote - $p - 1 ), $variant ) .
|
|
|
|
'"';
|
|
|
|
$p = $endQuote;
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
// Quote at end of string, assume literal "
|
|
|
|
$s .= $code;
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
// Plain text - convert to language variant
|
|
|
|
$s .= $langConv->translate( $format[$p], $variant );
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return $s;
|
|
|
|
}
|
2019-10-28 12:28:17 +00:00
|
|
|
}
|