2021-06-30 12:51:04 +00:00
|
|
|
<?php
|
|
|
|
|
2022-05-23 07:32:40 +00:00
|
|
|
namespace MediaWiki\Skins\Vector\Services;
|
2021-06-30 12:51:04 +00:00
|
|
|
|
|
|
|
class LanguageService {
|
|
|
|
/**
|
|
|
|
* The list of language codes for those languages that the search autocomplete widget cannot
|
|
|
|
* split a word on a Unicode code point followed by one or many combining marks (also code
|
|
|
|
* points).
|
|
|
|
*
|
|
|
|
* This list was compiled by [@TJones](https://phabricator.wikimedia.org/p/TJones/) as part
|
|
|
|
* of [T281797](https://phabricator.wikimedia.org/T281797).
|
|
|
|
*
|
|
|
|
* @var string[]
|
|
|
|
*/
|
|
|
|
private $splittableLanguages;
|
|
|
|
|
|
|
|
public function __construct() {
|
|
|
|
$this->splittableLanguages = [
|
|
|
|
'ar', 'ary', 'arz', 'ckb', 'fa', 'glk', 'ks', 'mzn', 'pnb', 'ps', 'sd', 'skr', 'ug', 'ur',
|
|
|
|
'as', 'bn', 'bpy',
|
|
|
|
'awa', 'bh', 'dty', 'gom', 'hi', 'ks', 'mai', 'mr', 'ne', 'new', 'pi', 'sa',
|
|
|
|
'gu',
|
|
|
|
'pa',
|
|
|
|
'kn', 'tcy',
|
|
|
|
'km',
|
|
|
|
'ml',
|
|
|
|
'or',
|
|
|
|
'si',
|
|
|
|
'ta',
|
|
|
|
'te',
|
|
|
|
];
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Gets whether or not we can split words arbitrarily, for example when highlighting the user's query in the search
|
|
|
|
* autocomplete widget.
|
|
|
|
*
|
|
|
|
* @param string $code
|
|
|
|
* @return bool
|
|
|
|
*/
|
|
|
|
public function canWordsBeSplitSafely( string $code ): bool {
|
|
|
|
return !in_array( $code, $this->splittableLanguages );
|
|
|
|
}
|
|
|
|
}
|