Code Coverage for /workspace/src/includes/language/Language.php

	Code Coverage
	Lines			Functions and Methods				Classes and Traits
Total	74.78% covered (warning)	74.78%	1257 / 1681	35.33% covered (danger)	35.33%	53 / 150	CRAP	0.00% covered (danger)	0.00%	0 / 1
Language	74.82% covered (warning)	74.82%	1257 / 1680	35.33% covered (danger)	35.33%	53 / 150	7902.75	0.00% covered (danger)	0.00%	0 / 1
__construct	60.47% covered (warning)	60.47%	26 / 43	0.00% covered (danger)	0.00%	0 / 1	3.56
getFallbackLanguages	0.00% covered (danger)	0.00%	0 / 1	0.00% covered (danger)	0.00%	0 / 1	2
getBookstoreList	0.00% covered (danger)	0.00%	0 / 1	0.00% covered (danger)	0.00%	0 / 1	2
getNamespaces	95.00% covered (success)	95.00%	19 / 20	0.00% covered (danger)	0.00%	0 / 1	5
setNamespaces	0.00% covered (danger)	0.00%	0 / 2	0.00% covered (danger)	0.00%	0 / 1	2
resetNamespaces	0.00% covered (danger)	0.00%	0 / 3	0.00% covered (danger)	0.00%	0 / 1	2
getFormattedNamespaces	0.00% covered (danger)	0.00%	0 / 4	0.00% covered (danger)	0.00%	0 / 1	6
getNsText	100.00% covered (success)	100.00%	2 / 2	100.00% covered (success)	100.00%	1 / 1	1
getFormattedNsText	100.00% covered (success)	100.00%	2 / 2	100.00% covered (success)	100.00%	1 / 1	2
getGenderNsText	0.00% covered (danger)	0.00%	0 / 4	0.00% covered (danger)	0.00%	0 / 1	2
needsGenderDistinction	75.00% covered (warning)	75.00%	6 / 8	0.00% covered (danger)	0.00%	0 / 1	4.25
getLocalNsIndex	0.00% covered (danger)	0.00%	0 / 3	0.00% covered (danger)	0.00%	0 / 1	2
getNamespaceAliases	90.00% covered (success)	90.00%	27 / 30	0.00% covered (danger)	0.00%	0 / 1	10.10
getNamespaceIds	0.00% covered (danger)	0.00%	0 / 7	0.00% covered (danger)	0.00%	0 / 1	20
getNsIndex	0.00% covered (danger)	0.00%	0 / 6	0.00% covered (danger)	0.00%	0 / 1	6
getVariantname	0.00% covered (danger)	0.00%	0 / 8	0.00% covered (danger)	0.00%	0 / 1	20
getDatePreferences	0.00% covered (danger)	0.00%	0 / 1	0.00% covered (danger)	0.00%	0 / 1	2
getDateFormats	0.00% covered (danger)	0.00%	0 / 1	0.00% covered (danger)	0.00%	0 / 1	2
getDefaultDateFormat	75.00% covered (warning)	75.00%	3 / 4	0.00% covered (danger)	0.00%	0 / 1	3.14
getDatePreferenceMigrationMap	100.00% covered (success)	100.00%	1 / 1	100.00% covered (success)	100.00%	1 / 1	1
getMessageFromDB	100.00% covered (success)	100.00%	1 / 1	100.00% covered (success)	100.00%	1 / 1	1
msg	100.00% covered (success)	100.00%	1 / 1	100.00% covered (success)	100.00%	1 / 1	1
getMonthName	100.00% covered (success)	100.00%	1 / 1	100.00% covered (success)	100.00%	1 / 1	1
getMonthNamesArray	0.00% covered (danger)	0.00%	0 / 4	0.00% covered (danger)	0.00%	0 / 1	6
getMonthNameGen	100.00% covered (success)	100.00%	1 / 1	100.00% covered (success)	100.00%	1 / 1	1
getMonthAbbreviation	100.00% covered (success)	100.00%	1 / 1	100.00% covered (success)	100.00%	1 / 1	1
getMonthAbbreviationsArray	0.00% covered (danger)	0.00%	0 / 4	0.00% covered (danger)	0.00%	0 / 1	6
getWeekdayName	100.00% covered (success)	100.00%	1 / 1	100.00% covered (success)	100.00%	1 / 1	1
getWeekdayAbbreviation	100.00% covered (success)	100.00%	1 / 1	100.00% covered (success)	100.00%	1 / 1	1
dateTimeObjFormat	100.00% covered (success)	100.00%	5 / 5	100.00% covered (success)	100.00%	1 / 1	3
sprintfDate	93.57% covered (success)	93.57%	364 / 389	0.00% covered (danger)	0.00%	0 / 1	138.77
tsToIranian	96.15% covered (success)	96.15%	25 / 26	0.00% covered (danger)	0.00%	0 / 1	9
tsToHijri	92.31% covered (success)	92.31%	24 / 26	0.00% covered (danger)	0.00%	0 / 1	7.02
tsToHebrew	59.65% covered (warning)	59.65%	34 / 57	0.00% covered (danger)	0.00%	0 / 1	79.51
hebrewYearStart	77.78% covered (warning)	77.78%	14 / 18	0.00% covered (danger)	0.00%	0 / 1	13.58
tsToYear	76.92% covered (warning)	76.92%	10 / 13	0.00% covered (danger)	0.00%	0 / 1	7.60
tsToJapaneseGengo	100.00% covered (success)	100.00%	13 / 13	100.00% covered (success)	100.00%	1 / 1	10
tsToJapaneseGengoCalculate	100.00% covered (success)	100.00%	4 / 4	100.00% covered (success)	100.00%	1 / 1	2
strongDirFromContent	100.00% covered (success)	100.00%	5 / 5	100.00% covered (success)	100.00%	1 / 1	3
romanNumeral	93.75% covered (success)	93.75%	15 / 16	0.00% covered (danger)	0.00%	0 / 1	5.01
hebrewNumeral	100.00% covered (success)	100.00%	50 / 50	100.00% covered (success)	100.00%	1 / 1	13
userAdjust	73.68% covered (warning)	73.68%	14 / 19	0.00% covered (danger)	0.00%	0 / 1	4.29
makeMediaWikiTimestamp	0.00% covered (danger)	0.00%	0 / 2	0.00% covered (danger)	0.00%	0 / 1	6
dateFormat	72.73% covered (warning)	72.73%	8 / 11	0.00% covered (danger)	0.00%	0 / 1	4.32
getDateFormatString	73.33% covered (warning)	73.33%	11 / 15	0.00% covered (danger)	0.00%	0 / 1	7.93
date	0.00% covered (danger)	0.00%	0 / 5	0.00% covered (danger)	0.00%	0 / 1	6
time	0.00% covered (danger)	0.00%	0 / 5	0.00% covered (danger)	0.00%	0 / 1	6
timeanddate	80.00% covered (warning)	80.00%	4 / 5	0.00% covered (danger)	0.00%	0 / 1	2.03
formatDuration	100.00% covered (success)	100.00%	6 / 6	100.00% covered (success)	100.00%	1 / 1	2
formatDurationBetweenTimestamps	100.00% covered (success)	100.00%	34 / 34	100.00% covered (success)	100.00%	1 / 1	11
getDurationIntervals	100.00% covered (success)	100.00%	22 / 22	100.00% covered (success)	100.00%	1 / 1	6
internalUserTimeAndDate	0.00% covered (danger)	0.00%	0 / 17	0.00% covered (danger)	0.00%	0 / 1	20
userDate	0.00% covered (danger)	0.00%	0 / 1	0.00% covered (danger)	0.00%	0 / 1	2
userTime	0.00% covered (danger)	0.00%	0 / 1	0.00% covered (danger)	0.00%	0 / 1	2
userTimeAndDate	0.00% covered (danger)	0.00%	0 / 1	0.00% covered (danger)	0.00%	0 / 1	2
getHumanTimestamp	0.00% covered (danger)	0.00%	0 / 14	0.00% covered (danger)	0.00%	0 / 1	12
getHumanTimestampInternal	0.00% covered (danger)	0.00%	0 / 38	0.00% covered (danger)	0.00%	0 / 1	420
getGroupName	100.00% covered (success)	100.00%	2 / 2	100.00% covered (success)	100.00%	1 / 1	2
getGroupMemberName	100.00% covered (success)	100.00%	4 / 4	100.00% covered (success)	100.00%	1 / 1	3
getMessage	0.00% covered (danger)	0.00%	0 / 1	0.00% covered (danger)	0.00%	0 / 1	2
getAllMessages	0.00% covered (danger)	0.00%	0 / 1	0.00% covered (danger)	0.00%	0 / 1	2
iconv	0.00% covered (danger)	0.00%	0 / 4	0.00% covered (danger)	0.00%	0 / 1	2
ucfirst	92.86% covered (success)	92.86%	13 / 14	0.00% covered (danger)	0.00%	0 / 1	5.01
uc	0.00% covered (danger)	0.00%	0 / 3	0.00% covered (danger)	0.00%	0 / 1	12
lcfirst	90.00% covered (success)	90.00%	9 / 10	0.00% covered (danger)	0.00%	0 / 1	4.02
lc	66.67% covered (warning)	66.67%	2 / 3	0.00% covered (danger)	0.00%	0 / 1	3.33
isMultibyte	100.00% covered (success)	100.00%	1 / 1	100.00% covered (success)	100.00%	1 / 1	1
ucwords	100.00% covered (success)	100.00%	11 / 11	100.00% covered (success)	100.00%	1 / 1	2
ucwordbreaks	100.00% covered (success)	100.00%	19 / 19	100.00% covered (success)	100.00%	1 / 1	2
caseFold	0.00% covered (danger)	0.00%	0 / 1	0.00% covered (danger)	0.00%	0 / 1	2
checkTitleEncoding	66.67% covered (warning)	66.67%	2 / 3	0.00% covered (danger)	0.00%	0 / 1	2.15
fallback8bitEncoding	0.00% covered (danger)	0.00%	0 / 1	0.00% covered (danger)	0.00%	0 / 1	2
hasWordBreaks	0.00% covered (danger)	0.00%	0 / 1	0.00% covered (danger)	0.00%	0 / 1	2
segmentByWord	0.00% covered (danger)	0.00%	0 / 1	0.00% covered (danger)	0.00%	0 / 1	2
getSearchIndexVariant	100.00% covered (success)	100.00%	1 / 1	100.00% covered (success)	100.00%	1 / 1	1
normalizeForSearch	75.00% covered (warning)	75.00%	3 / 4	0.00% covered (danger)	0.00%	0 / 1	2.06
convertDoubleWidth	100.00% covered (success)	100.00%	6 / 6	100.00% covered (success)	100.00%	1 / 1	1
insertSpace	0.00% covered (danger)	0.00%	0 / 2	0.00% covered (danger)	0.00%	0 / 1	2
convertForSearchResult	0.00% covered (danger)	0.00%	0 / 1	0.00% covered (danger)	0.00%	0 / 1	2
firstChar	42.42% covered (danger)	42.42%	14 / 33	0.00% covered (danger)	0.00%	0 / 1	79.84
normalize	66.67% covered (warning)	66.67%	4 / 6	0.00% covered (danger)	0.00%	0 / 1	2.15
transformUsingPairFile	0.00% covered (danger)	0.00%	0 / 3	0.00% covered (danger)	0.00%	0 / 1	6
isRTL	0.00% covered (danger)	0.00%	0 / 1	0.00% covered (danger)	0.00%	0 / 1	2
getDir	0.00% covered (danger)	0.00%	0 / 1	0.00% covered (danger)	0.00%	0 / 1	6
alignStart	0.00% covered (danger)	0.00%	0 / 1	0.00% covered (danger)	0.00%	0 / 1	6
alignEnd	0.00% covered (danger)	0.00%	0 / 1	0.00% covered (danger)	0.00%	0 / 1	6
getDirMarkEntity	0.00% covered (danger)	0.00%	0 / 4	0.00% covered (danger)	0.00%	0 / 1	20
getDirMark	0.00% covered (danger)	0.00%	0 / 3	0.00% covered (danger)	0.00%	0 / 1	20
getArrow	0.00% covered (danger)	0.00%	0 / 12	0.00% covered (danger)	0.00%	0 / 1	90
linkPrefixExtension	0.00% covered (danger)	0.00%	0 / 1	0.00% covered (danger)	0.00%	0 / 1	2
getMagicWords	0.00% covered (danger)	0.00%	0 / 1	0.00% covered (danger)	0.00%	0 / 1	2
getMagic	83.33% covered (warning)	83.33%	5 / 6	0.00% covered (danger)	0.00%	0 / 1	2.02
getSpecialPageAliases	0.00% covered (danger)	0.00%	0 / 3	0.00% covered (danger)	0.00%	0 / 1	2
emphasize	0.00% covered (danger)	0.00%	0 / 1	0.00% covered (danger)	0.00%	0 / 1	2
formatNum	100.00% covered (success)	100.00%	1 / 1	100.00% covered (success)	100.00%	1 / 1	1
formatNumInternal	86.30% covered (warning)	86.30%	63 / 73	0.00% covered (danger)	0.00%	0 / 1	25.48
formatNumNoSeparators	100.00% covered (success)	100.00%	1 / 1	100.00% covered (success)	100.00%	1 / 1	1
parseFormattedNumber	100.00% covered (success)	100.00%	16 / 16	100.00% covered (success)	100.00%	1 / 1	6
digitGroupingPattern	100.00% covered (success)	100.00%	1 / 1	100.00% covered (success)	100.00%	1 / 1	1
digitTransformTable	100.00% covered (success)	100.00%	1 / 1	100.00% covered (success)	100.00%	1 / 1	1
separatorTransformTable	100.00% covered (success)	100.00%	1 / 1	100.00% covered (success)	100.00%	1 / 1	1
minimumGroupingDigits	100.00% covered (success)	100.00%	1 / 1	100.00% covered (success)	100.00%	1 / 1	1
listToText	100.00% covered (success)	100.00%	12 / 12	100.00% covered (success)	100.00%	1 / 1	4
commaList	0.00% covered (danger)	0.00%	0 / 4	0.00% covered (danger)	0.00%	0 / 1	2
semicolonList	0.00% covered (danger)	0.00%	0 / 4	0.00% covered (danger)	0.00%	0 / 1	2
pipeList	0.00% covered (danger)	0.00%	0 / 4	0.00% covered (danger)	0.00%	0 / 1	2
truncateForDatabase	100.00% covered (success)	100.00%	3 / 3	100.00% covered (success)	100.00%	1 / 1	1
truncateForVisual	100.00% covered (success)	100.00%	3 / 3	100.00% covered (success)	100.00%	1 / 1	1
truncateInternal	95.00% covered (success)	95.00%	19 / 20	0.00% covered (danger)	0.00%	0 / 1	9
removeBadCharLast	80.00% covered (warning)	80.00%	8 / 10	0.00% covered (danger)	0.00%	0 / 1	5.20
truncateHtml	97.06% covered (success)	97.06%	66 / 68	0.00% covered (danger)	0.00%	0 / 1	29
truncate_skip	100.00% covered (success)	100.00%	9 / 9	100.00% covered (success)	100.00%	1 / 1	4
truncate_endBracket	100.00% covered (success)	100.00%	8 / 8	100.00% covered (success)	100.00%	1 / 1	7
convertGrammar	79.17% covered (warning)	79.17%	19 / 24	0.00% covered (danger)	0.00%	0 / 1	8.58
getGrammarForms	0.00% covered (danger)	0.00%	0 / 5	0.00% covered (danger)	0.00%	0 / 1	12
getGrammarTransformations	88.89% covered (warning)	88.89%	8 / 9	0.00% covered (danger)	0.00%	0 / 1	4.02
gender	0.00% covered (danger)	0.00%	0 / 8	0.00% covered (danger)	0.00%	0 / 1	20
convertPlural	100.00% covered (success)	100.00%	8 / 8	100.00% covered (success)	100.00%	1 / 1	3
handleExplicitPluralForms	100.00% covered (success)	100.00%	7 / 7	100.00% covered (success)	100.00%	1 / 1	4
preConvertPlural	0.00% covered (danger)	0.00%	0 / 1	0.00% covered (danger)	0.00%	0 / 1	2
getFormalityIndex	0.00% covered (danger)	0.00%	0 / 1	0.00% covered (danger)	0.00%	0 / 1	2
embedBidi	100.00% covered (success)	100.00%	6 / 6	100.00% covered (success)	100.00%	1 / 1	3
getBlockDurations	85.71% covered (warning)	85.71%	6 / 7	0.00% covered (danger)	0.00%	0 / 1	4.05
translateBlockExpiry	94.44% covered (success)	94.44%	17 / 18	0.00% covered (danger)	0.00%	0 / 1	9.01
segmentForDiff	0.00% covered (danger)	0.00%	0 / 1	0.00% covered (danger)	0.00%	0 / 1	2
unsegmentForDiff	0.00% covered (danger)	0.00%	0 / 1	0.00% covered (danger)	0.00%	0 / 1	2
linkTrail	0.00% covered (danger)	0.00%	0 / 1	0.00% covered (danger)	0.00%	0 / 1	2
linkPrefixCharset	0.00% covered (danger)	0.00%	0 / 1	0.00% covered (danger)	0.00%	0 / 1	2
equals	100.00% covered (success)	100.00%	1 / 1	100.00% covered (success)	100.00%	1 / 1	2
getCode	100.00% covered (success)	100.00%	1 / 1	100.00% covered (success)	100.00%	1 / 1	1
getHtmlCode	100.00% covered (success)	100.00%	2 / 2	100.00% covered (success)	100.00%	1 / 1	1
toBcp47Code	100.00% covered (success)	100.00%	1 / 1	100.00% covered (success)	100.00%	1 / 1	1
isSameCodeAs	60.00% covered (warning)	60.00%	3 / 5	0.00% covered (danger)	0.00%	0 / 1	3.58
getCodeFromFileName	0.00% covered (danger)	0.00%	0 / 6	0.00% covered (danger)	0.00%	0 / 1	6
fixVariableInNamespace	100.00% covered (success)	100.00%	11 / 11	100.00% covered (success)	100.00%	1 / 1	2
formatExpiry	0.00% covered (danger)	0.00%	0 / 13	0.00% covered (danger)	0.00%	0 / 1	56
formatTimePeriod	100.00% covered (success)	100.00%	73 / 73	100.00% covered (success)	100.00%	1 / 1	23
formatBitrate	100.00% covered (success)	100.00%	1 / 1	100.00% covered (success)	100.00%	1 / 1	1
formatComputingNumbers	100.00% covered (success)	100.00%	17 / 17	100.00% covered (success)	100.00%	1 / 1	5
formatSize	100.00% covered (success)	100.00%	1 / 1	100.00% covered (success)	100.00%	1 / 1	1
specialList	0.00% covered (danger)	0.00%	0 / 5	0.00% covered (danger)	0.00%	0 / 1	6
getCompiledPluralRules	40.00% covered (danger)	40.00%	4 / 10	0.00% covered (danger)	0.00%	0 / 1	7.46
getPluralRules	0.00% covered (danger)	0.00%	0 / 10	0.00% covered (danger)	0.00%	0 / 1	20
getPluralRuleTypes	0.00% covered (danger)	0.00%	0 / 10	0.00% covered (danger)	0.00%	0 / 1	20
getPluralRuleIndexNumber	100.00% covered (success)	100.00%	2 / 2	100.00% covered (success)	100.00%	1 / 1	1
getPluralRuleType	100.00% covered (success)	100.00%	3 / 3	100.00% covered (success)	100.00%	1 / 1	1
getConverterInternal	100.00% covered (success)	100.00%	1 / 1	100.00% covered (success)	100.00%	1 / 1	1
getHookContainer	0.00% covered (danger)	0.00%	0 / 1	0.00% covered (danger)	0.00%	0 / 1	2
getHookRunner	100.00% covered (success)	100.00%	1 / 1	100.00% covered (success)	100.00%	1 / 1	1
getJsData	0.00% covered (danger)	0.00%	0 / 12	0.00% covered (danger)	0.00%	0 / 1	2

1	<?php
2	/**
3	* This program is free software; you can redistribute it and/or modify
4	* it under the terms of the GNU General Public License as published by
5	* the Free Software Foundation; either version 2 of the License, or
6	* (at your option) any later version.
7	*
8	* This program is distributed in the hope that it will be useful,
9	* but WITHOUT ANY WARRANTY; without even the implied warranty of
10	* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
11	* GNU General Public License for more details.
12	*
13	* You should have received a copy of the GNU General Public License along
14	* with this program; if not, write to the Free Software Foundation, Inc.,
15	* 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
16	* http://www.gnu.org/copyleft/gpl.html
17	*
18	* @file
19	*/
20
21	/**
22	* @defgroup Language Internationalisation
23	*
24	* See https://www.mediawiki.org/wiki/Special:MyLanguage/Localisation for more information.
25	*/
26
27	/**
28	* @defgroup Languages Languages
29	* @ingroup Language
30	*/
31
32	namespace MediaWiki\Language;
33
34	use CLDRPluralRuleParser\Evaluator;
35	use DateTime;
36	use DateTimeImmutable;
37	use DateTimeZone;
38	use InvalidArgumentException;
39	use LocalisationCache;
40	use MediaWiki\Config\Config;
41	use MediaWiki\Context\RequestContext;
42	use MediaWiki\HookContainer\HookContainer;
43	use MediaWiki\HookContainer\HookRunner;
44	use MediaWiki\Html\Html;
45	use MediaWiki\Json\FormatJson;
46	use MediaWiki\Languages\Data\NormalizeAr;
47	use MediaWiki\Languages\Data\NormalizeMl;
48	use MediaWiki\Languages\LanguageConverterFactory;
49	use MediaWiki\Languages\LanguageFallback;
50	use MediaWiki\Languages\LanguageNameUtils;
51	use MediaWiki\Logger\LoggerFactory;
52	use MediaWiki\MainConfigNames;
53	use MediaWiki\MediaWikiServices;
54	use MediaWiki\Message\Message;
55	use MediaWiki\Parser\MagicWord;
56	use MediaWiki\Title\NamespaceInfo;
57	use MediaWiki\User\User;
58	use MediaWiki\User\UserIdentity;
59	use MediaWiki\User\UserTimeCorrection;
60	use MediaWiki\Utils\MWTimestamp;
61	use MediaWiki\Xml\XmlSelect;
62	use NumberFormatter;
63	use RuntimeException;
64	use StringUtils;
65	use UtfNormal\Validator as UtfNormalValidator;
66	use Wikimedia\Assert\Assert;
67	use Wikimedia\AtEase\AtEase;
68	use Wikimedia\Bcp47Code\Bcp47Code;
69	use Wikimedia\DebugInfo\DebugInfoTrait;
70	use Wikimedia\Message\MessageParam;
71	use Wikimedia\Message\MessageSpecifier;
72
73	/**
74	* Base class for language-specific code.
75	*
76	* See https://www.mediawiki.org/wiki/Special:MyLanguage/Localisation for more information.
77	*
78	* @ingroup Language
79	*/
80	class Language implements Bcp47Code {
81	use DebugInfoTrait;
82
83	/** @var string */
84	public $mCode;
85
86	/**
87	* @deprecated since 1.35, use LocalisationCache with custom language config
88	*/
89	public $mMagicExtensions = [];
90
91	/** @var string|null */
92	private $mHtmlCode = null;
93
94	/**
95	* memoize
96	* @var string[][]
97	* @deprecated since 1.35, must be private
98	*/
99	public $dateFormatStrings = [];
100
101	/**
102	* memoize
103	* @var string[][]|null
104	* @deprecated since 1.35, must be protected
105	*/
106	public $mExtendedSpecialPageAliases;
107
108	/** @var array<int,string>|null Indexed by numeric namespace ID */
109	protected $namespaceNames;
110	/** @var array<string,int>|null Indexed by localized lower-cased namespace name */
111	protected $mNamespaceIds;
112	/** @var array<string,int>|null Map from alias to namespace ID */
113	protected $namespaceAliases;
114
115	/**
116	* @var ReplacementArray[]
117	* @noVarDump
118	*/
119	private $transformData = [];
120
121	/**
122	* @var NamespaceInfo
123	* @noVarDump
124	*/
125	private $namespaceInfo;
126
127	/**
128	* @var LocalisationCache
129	* @noVarDump
130	*/
131	private $localisationCache;
132
133	/**
134	* @var LanguageNameUtils
135	* @noVarDump
136	*/
137	private $langNameUtils;
138
139	/**
140	* @var LanguageFallback
141	* @noVarDump
142	*/
143	private $langFallback;
144
145	/**
146	* @var array[]|null
147	* @noVarDump
148	*/
149	private $grammarTransformCache;
150
151	/**
152	* @var LanguageConverterFactory
153	* @noVarDump
154	*/
155	private $converterFactory;
156
157	/**
158	* @var HookContainer
159	* @noVarDump
160	*/
161	private $hookContainer;
162
163	/**
164	* @var HookRunner
165	* @noVarDump
166	*/
167	private $hookRunner;
168
169	/**
170	* @var Config
171	* @noVarDump
172	*/
173	private $config;
174
175	/**
176	* @var array|null
177	*/
178	private $overrideUcfirstCharacters;
179
180	/**
181	* @since 1.35
182	*/
183	public const WEEKDAY_MESSAGES = [
184	'sunday', 'monday', 'tuesday', 'wednesday', 'thursday',
185	'friday', 'saturday'
186	];
187
188	/**
189	* @since 1.35
190	*/
191	public const WEEKDAY_ABBREVIATED_MESSAGES = [
192	'sun', 'mon', 'tue', 'wed', 'thu', 'fri', 'sat'
193	];
194
195	/**
196	* @since 1.35
197	*/
198	public const MONTH_MESSAGES = [
199	'january', 'february', 'march', 'april', 'may_long', 'june',
200	'july', 'august', 'september', 'october', 'november',
201	'december'
202	];
203
204	/**
205	* @deprecated since 1.35, use the MONTH_MESSAGES constant
206	*/
207	public static $mMonthMsgs = self::MONTH_MESSAGES;
208
209	/**
210	* @since 1.35
211	*/
212	public const MONTH_GENITIVE_MESSAGES = [
213	'january-gen', 'february-gen', 'march-gen', 'april-gen', 'may-gen', 'june-gen',
214	'july-gen', 'august-gen', 'september-gen', 'october-gen', 'november-gen',
215	'december-gen'
216	];
217
218	/**
219	* @since 1.35
220	*/
221	public const MONTH_ABBREVIATED_MESSAGES = [
222	'jan', 'feb', 'mar', 'apr', 'may', 'jun', 'jul', 'aug',
223	'sep', 'oct', 'nov', 'dec'
224	];
225
226	/**
227	* @deprecated since 1.35, use the MONTH_ABBREVIATED_MESSAGES constant
228	*/
229	public static $mMonthAbbrevMsgs = self::MONTH_ABBREVIATED_MESSAGES;
230
231	/**
232	* @since 1.35
233	*/
234	public const IRANIAN_CALENDAR_MONTHS_MESSAGES = [
235	'iranian-calendar-m1', 'iranian-calendar-m2', 'iranian-calendar-m3',
236	'iranian-calendar-m4', 'iranian-calendar-m5', 'iranian-calendar-m6',
237	'iranian-calendar-m7', 'iranian-calendar-m8', 'iranian-calendar-m9',
238	'iranian-calendar-m10', 'iranian-calendar-m11', 'iranian-calendar-m12'
239	];
240
241	/**
242	* @since 1.35
243	*/
244	public const HEBREW_CALENDAR_MONTHS_MESSAGES = [
245	'hebrew-calendar-m1', 'hebrew-calendar-m2', 'hebrew-calendar-m3',
246	'hebrew-calendar-m4', 'hebrew-calendar-m5', 'hebrew-calendar-m6',
247	'hebrew-calendar-m7', 'hebrew-calendar-m8', 'hebrew-calendar-m9',
248	'hebrew-calendar-m10', 'hebrew-calendar-m11', 'hebrew-calendar-m12',
249	'hebrew-calendar-m6a', 'hebrew-calendar-m6b'
250	];
251
252	/**
253	* @since 1.35
254	*/
255	public const HEBREW_CALENDAR_MONTH_GENITIVE_MESSAGES = [
256	'hebrew-calendar-m1-gen', 'hebrew-calendar-m2-gen', 'hebrew-calendar-m3-gen',
257	'hebrew-calendar-m4-gen', 'hebrew-calendar-m5-gen', 'hebrew-calendar-m6-gen',
258	'hebrew-calendar-m7-gen', 'hebrew-calendar-m8-gen', 'hebrew-calendar-m9-gen',
259	'hebrew-calendar-m10-gen', 'hebrew-calendar-m11-gen', 'hebrew-calendar-m12-gen',
260	'hebrew-calendar-m6a-gen', 'hebrew-calendar-m6b-gen'
261	];
262
263	/**
264	* @since 1.35
265	*/
266	public const HIJRI_CALENDAR_MONTH_MESSAGES = [
267	'hijri-calendar-m1', 'hijri-calendar-m2', 'hijri-calendar-m3',
268	'hijri-calendar-m4', 'hijri-calendar-m5', 'hijri-calendar-m6',
269	'hijri-calendar-m7', 'hijri-calendar-m8', 'hijri-calendar-m9',
270	'hijri-calendar-m10', 'hijri-calendar-m11', 'hijri-calendar-m12'
271	];
272
273	/**
274	* @since 1.35
275	*/
276	protected const DURATION_INTERVALS = [
277	'millennia' => 1000 * 31_556_952,
278	'centuries' => 100 * 31_556_952,
279	'decades' => 10 * 31_556_952,
280	// The average year is 365.2425 days (365 + (24 * 3 + 25) / 400)
281	'years' => 31_556_952, // 365.2425 * 24 * 3600
282	// To simplify, we consider a month to be 1/12 of a year
283	'months' => 365.2425 * 24 * 3600 / 12,
284	'days' => 24 * 3600,
285	'hours' => 3600,
286	'minutes' => 60,
287	'seconds' => 1,
288	];
289
290	/**
291	* @deprecated since 1.35, use the DURATION_INTERVALS constant
292	* @since 1.20
293	* @var int[]
294	*/
295	public static $durationIntervals = self::DURATION_INTERVALS;
296
297	/**
298	* Unicode directional formatting characters
299	*/
300	private const LRM = "\u{200E}"; // U+200E LEFT-TO-RIGHT MARK
301	private const RLM = "\u{200F}"; // U+200F RIGHT-TO-LEFT MARK
302	private const LRE = "\u{202A}"; // U+202A LEFT-TO-RIGHT EMBEDDING
303	private const RLE = "\u{202B}"; // U+202B RIGHT-TO-LEFT EMBEDDING
304	private const PDF = "\u{202C}"; // U+202C POP DIRECTIONAL FORMATTING
305	// https://en.wikipedia.org/wiki/Arabic_letter_mark (Unicode 6.3.0)
306	private const ALM = "\u{061C}"; // U+061C ARABIC LETTER MARK
307
308	/**
309	* Directionality test regex for embedBidi(). Matches the first strong directionality codepoint:
310	* - in group 1 if it is LTR
311	* - in group 2 if it is RTL
312	* Does not match if there is no strong directionality codepoint.
313	*
314	* The form is '/(?:([strong ltr codepoint])|([strong rtl codepoint]))/u'.
315	*
316	* Generated by UnicodeJS (see tools/strongDir) from the UCD; see
317	* https://gerrit.wikimedia.org/g/unicodejs .
318	* @var string
319	*/
320	// @codeCoverageIgnoreStart
321	// phpcs:ignore Generic.Files.LineLength,MediaWiki.Commenting.PropertyDocumentation.MissingDocumentationPrivate
322	private static $strongDirRegex = '/(?:([\x{41}-\x{5a}\x{61}-\x{7a}\x{aa}\x{b5}\x{ba}\x{c0}-\x{d6}\x{d8}-\x{f6}\x{f8}-\x{2b8}\x{2bb}-\x{2c1}\x{2d0}\x{2d1}\x{2e0}-\x{2e4}\x{2ee}\x{370}-\x{373}\x{376}\x{377}\x{37a}-\x{37d}\x{37f}\x{386}\x{388}-\x{38a}\x{38c}\x{38e}-\x{3a1}\x{3a3}-\x{3f5}\x{3f7}-\x{482}\x{48a}-\x{52f}\x{531}-\x{556}\x{559}-\x{55f}\x{561}-\x{587}\x{589}\x{903}-\x{939}\x{93b}\x{93d}-\x{940}\x{949}-\x{94c}\x{94e}-\x{950}\x{958}-\x{961}\x{964}-\x{980}\x{982}\x{983}\x{985}-\x{98c}\x{98f}\x{990}\x{993}-\x{9a8}\x{9aa}-\x{9b0}\x{9b2}\x{9b6}-\x{9b9}\x{9bd}-\x{9c0}\x{9c7}\x{9c8}\x{9cb}\x{9cc}\x{9ce}\x{9d7}\x{9dc}\x{9dd}\x{9df}-\x{9e1}\x{9e6}-\x{9f1}\x{9f4}-\x{9fa}\x{a03}\x{a05}-\x{a0a}\x{a0f}\x{a10}\x{a13}-\x{a28}\x{a2a}-\x{a30}\x{a32}\x{a33}\x{a35}\x{a36}\x{a38}\x{a39}\x{a3e}-\x{a40}\x{a59}-\x{a5c}\x{a5e}\x{a66}-\x{a6f}\x{a72}-\x{a74}\x{a83}\x{a85}-\x{a8d}\x{a8f}-\x{a91}\x{a93}-\x{aa8}\x{aaa}-\x{ab0}\x{ab2}\x{ab3}\x{ab5}-\x{ab9}\x{abd}-\x{ac0}\x{ac9}\x{acb}\x{acc}\x{ad0}\x{ae0}\x{ae1}\x{ae6}-\x{af0}\x{af9}\x{b02}\x{b03}\x{b05}-\x{b0c}\x{b0f}\x{b10}\x{b13}-\x{b28}\x{b2a}-\x{b30}\x{b32}\x{b33}\x{b35}-\x{b39}\x{b3d}\x{b3e}\x{b40}\x{b47}\x{b48}\x{b4b}\x{b4c}\x{b57}\x{b5c}\x{b5d}\x{b5f}-\x{b61}\x{b66}-\x{b77}\x{b83}\x{b85}-\x{b8a}\x{b8e}-\x{b90}\x{b92}-\x{b95}\x{b99}\x{b9a}\x{b9c}\x{b9e}\x{b9f}\x{ba3}\x{ba4}\x{ba8}-\x{baa}\x{bae}-\x{bb9}\x{bbe}\x{bbf}\x{bc1}\x{bc2}\x{bc6}-\x{bc8}\x{bca}-\x{bcc}\x{bd0}\x{bd7}\x{be6}-\x{bf2}\x{c01}-\x{c03}\x{c05}-\x{c0c}\x{c0e}-\x{c10}\x{c12}-\x{c28}\x{c2a}-\x{c39}\x{c3d}\x{c41}-\x{c44}\x{c58}-\x{c5a}\x{c60}\x{c61}\x{c66}-\x{c6f}\x{c7f}\x{c82}\x{c83}\x{c85}-\x{c8c}\x{c8e}-\x{c90}\x{c92}-\x{ca8}\x{caa}-\x{cb3}\x{cb5}-\x{cb9}\x{cbd}-\x{cc4}\x{cc6}-\x{cc8}\x{cca}\x{ccb}\x{cd5}\x{cd6}\x{cde}\x{ce0}\x{ce1}\x{ce6}-\x{cef}\x{cf1}\x{cf2}\x{d02}\x{d03}\x{d05}-\x{d0c}\x{d0e}-\x{d10}\x{d12}-\x{d3a}\x{d3d}-\x{d40}\x{d46}-\x{d48}\x{d4a}-\x{d4c}\x{d4e}\x{d57}\x{d5f}-\x{d61}\x{d66}-\x{d75}\x{d79}-\x{d7f}\x{d82}\x{d83}\x{d85}-\x{d96}\x{d9a}-\x{db1
}\x{db3}-\x{dbb}\x{dbd}\x{dc0}-\x{dc6}\x{dcf}-\x{dd1}\x{dd8}-\x{ddf}\x{de6}-\x{def}\x{df2}-\x{df4}\x{e01}-\x{e30}\x{e32}\x{e33}\x{e40}-\x{e46}\x{e4f}-\x{e5b}\x{e81}\x{e82}\x{e84}\x{e87}\x{e88}\x{e8a}\x{e8d}\x{e94}-\x{e97}\x{e99}-\x{e9f}\x{ea1}-\x{ea3}\x{ea5}\x{ea7}\x{eaa}\x{eab}\x{ead}-\x{eb0}\x{eb2}\x{eb3}\x{ebd}\x{ec0}-\x{ec4}\x{ec6}\x{ed0}-\x{ed9}\x{edc}-\x{edf}\x{f00}-\x{f17}\x{f1a}-\x{f34}\x{f36}\x{f38}\x{f3e}-\x{f47}\x{f49}-\x{f6c}\x{f7f}\x{f85}\x{f88}-\x{f8c}\x{fbe}-\x{fc5}\x{fc7}-\x{fcc}\x{fce}-\x{fda}\x{1000}-\x{102c}\x{1031}\x{1038}\x{103b}\x{103c}\x{103f}-\x{1057}\x{105a}-\x{105d}\x{1061}-\x{1070}\x{1075}-\x{1081}\x{1083}\x{1084}\x{1087}-\x{108c}\x{108e}-\x{109c}\x{109e}-\x{10c5}\x{10c7}\x{10cd}\x{10d0}-\x{1248}\x{124a}-\x{124d}\x{1250}-\x{1256}\x{1258}\x{125a}-\x{125d}\x{1260}-\x{1288}\x{128a}-\x{128d}\x{1290}-\x{12b0}\x{12b2}-\x{12b5}\x{12b8}-\x{12be}\x{12c0}\x{12c2}-\x{12c5}\x{12c8}-\x{12d6}\x{12d8}-\x{1310}\x{1312}-\x{1315}\x{1318}-\x{135a}\x{1360}-\x{137c}\x{1380}-\x{138f}\x{13a0}-\x{13f5}\x{13f8}-\x{13fd}\x{1401}-\x{167f}\x{1681}-\x{169a}\x{16a0}-\x{16f8}\x{1700}-\x{170c}\x{170e}-\x{1711}\x{1720}-\x{1731}\x{1735}\x{1736}\x{1740}-\x{1751}\x{1760}-\x{176c}\x{176e}-\x{1770}\x{1780}-\x{17b3}\x{17b6}\x{17be}-\x{17c5}\x{17c7}\x{17c8}\x{17d4}-\x{17da}\x{17dc}\x{17e0}-\x{17e9}\x{1810}-\x{1819}\x{1820}-\x{1877}\x{1880}-\x{18a8}\x{18aa}\x{18b0}-\x{18f5}\x{1900}-\x{191e}\x{1923}-\x{1926}\x{1929}-\x{192b}\x{1930}\x{1931}\x{1933}-\x{1938}\x{1946}-\x{196d}\x{1970}-\x{1974}\x{1980}-\x{19ab}\x{19b0}-\x{19c9}\x{19d0}-\x{19da}\x{1a00}-\x{1a16}\x{1a19}\x{1a1a}\x{1a1e}-\x{1a55}\x{1a57}\x{1a61}\x{1a63}\x{1a64}\x{1a6d}-\x{1a72}\x{1a80}-\x{1a89}\x{1a90}-\x{1a99}\x{1aa0}-\x{1aad}\x{1b04}-\x{1b33}\x{1b35}\x{1b3b}\x{1b3d}-\x{1b41}\x{1b43}-\x{1b4b}\x{1b50}-\x{1b6a}\x{1b74}-\x{1b7c}\x{1b82}-\x{1ba1}\x{1ba6}\x{1ba7}\x{1baa}\x{1bae}-\x{1be5}\x{1be7}\x{1bea}-\x{1bec}\x{1bee}\x{1bf2}\x{1bf3}\x{1bfc}-\x{1c2b}\x{1c34}\x{1c35}\x{1c3b}-\x{1c49}\x{1c4d}-\x{1c7f}\x{1cc0}-\x{1cc7}\x{1cd3
}\x{1ce1}\x{1ce9}-\x{1cec}\x{1cee}-\x{1cf3}\x{1cf5}\x{1cf6}\x{1d00}-\x{1dbf}\x{1e00}-\x{1f15}\x{1f18}-\x{1f1d}\x{1f20}-\x{1f45}\x{1f48}-\x{1f4d}\x{1f50}-\x{1f57}\x{1f59}\x{1f5b}\x{1f5d}\x{1f5f}-\x{1f7d}\x{1f80}-\x{1fb4}\x{1fb6}-\x{1fbc}\x{1fbe}\x{1fc2}-\x{1fc4}\x{1fc6}-\x{1fcc}\x{1fd0}-\x{1fd3}\x{1fd6}-\x{1fdb}\x{1fe0}-\x{1fec}\x{1ff2}-\x{1ff4}\x{1ff6}-\x{1ffc}\x{200e}\x{2071}\x{207f}\x{2090}-\x{209c}\x{2102}\x{2107}\x{210a}-\x{2113}\x{2115}\x{2119}-\x{211d}\x{2124}\x{2126}\x{2128}\x{212a}-\x{212d}\x{212f}-\x{2139}\x{213c}-\x{213f}\x{2145}-\x{2149}\x{214e}\x{214f}\x{2160}-\x{2188}\x{2336}-\x{237a}\x{2395}\x{249c}-\x{24e9}\x{26ac}\x{2800}-\x{28ff}\x{2c00}-\x{2c2e}\x{2c30}-\x{2c5e}\x{2c60}-\x{2ce4}\x{2ceb}-\x{2cee}\x{2cf2}\x{2cf3}\x{2d00}-\x{2d25}\x{2d27}\x{2d2d}\x{2d30}-\x{2d67}\x{2d6f}\x{2d70}\x{2d80}-\x{2d96}\x{2da0}-\x{2da6}\x{2da8}-\x{2dae}\x{2db0}-\x{2db6}\x{2db8}-\x{2dbe}\x{2dc0}-\x{2dc6}\x{2dc8}-\x{2dce}\x{2dd0}-\x{2dd6}\x{2dd8}-\x{2dde}\x{3005}-\x{3007}\x{3021}-\x{3029}\x{302e}\x{302f}\x{3031}-\x{3035}\x{3038}-\x{303c}\x{3041}-\x{3096}\x{309d}-\x{309f}\x{30a1}-\x{30fa}\x{30fc}-\x{30ff}\x{3105}-\x{312d}\x{3131}-\x{318e}\x{3190}-\x{31ba}\x{31f0}-\x{321c}\x{3220}-\x{324f}\x{3260}-\x{327b}\x{327f}-\x{32b0}\x{32c0}-\x{32cb}\x{32d0}-\x{32fe}\x{3300}-\x{3376}\x{337b}-\x{33dd}\x{33e0}-\x{33fe}\x{3400}-\x{4db5}\x{4e00}-\x{9fd5}\x{a000}-\x{a48c}\x{a4d0}-\x{a60c}\x{a610}-\x{a62b}\x{a640}-\x{a66e}\x{a680}-\x{a69d}\x{a6a0}-\x{a6ef}\x{a6f2}-\x{a6f7}\x{a722}-\x{a787}\x{a789}-\x{a7ad}\x{a7b0}-\x{a7b7}\x{a7f7}-\x{a801}\x{a803}-\x{a805}\x{a807}-\x{a80a}\x{a80c}-\x{a824}\x{a827}\x{a830}-\x{a837}\x{a840}-\x{a873}\x{a880}-\x{a8c3}\x{a8ce}-\x{a8d9}\x{a8f2}-\x{a8fd}\x{a900}-\x{a925}\x{a92e}-\x{a946}\x{a952}\x{a953}\x{a95f}-\x{a97c}\x{a983}-\x{a9b2}\x{a9b4}\x{a9b5}\x{a9ba}\x{a9bb}\x{a9bd}-\x{a9cd}\x{a9cf}-\x{a9d9}\x{a9de}-\x{a9e4}\x{a9e6}-\x{a9fe}\x{aa00}-\x{aa28}\x{aa2f}\x{aa30}\x{aa33}\x{aa34}\x{aa40}-\x{aa42}\x{aa44}-\x{aa4b}\x{aa4d}\x{aa50}-\x{aa59}\x{aa5c}-\x{aa7b}\x{aa7d}-\x{a
aaf}\x{aab1}\x{aab5}\x{aab6}\x{aab9}-\x{aabd}\x{aac0}\x{aac2}\x{aadb}-\x{aaeb}\x{aaee}-\x{aaf5}\x{ab01}-\x{ab06}\x{ab09}-\x{ab0e}\x{ab11}-\x{ab16}\x{ab20}-\x{ab26}\x{ab28}-\x{ab2e}\x{ab30}-\x{ab65}\x{ab70}-\x{abe4}\x{abe6}\x{abe7}\x{abe9}-\x{abec}\x{abf0}-\x{abf9}\x{ac00}-\x{d7a3}\x{d7b0}-\x{d7c6}\x{d7cb}-\x{d7fb}\x{e000}-\x{fa6d}\x{fa70}-\x{fad9}\x{fb00}-\x{fb06}\x{fb13}-\x{fb17}\x{ff21}-\x{ff3a}\x{ff41}-\x{ff5a}\x{ff66}-\x{ffbe}\x{ffc2}-\x{ffc7}\x{ffca}-\x{ffcf}\x{ffd2}-\x{ffd7}\x{ffda}-\x{ffdc}\x{10000}-\x{1000b}\x{1000d}-\x{10026}\x{10028}-\x{1003a}\x{1003c}\x{1003d}\x{1003f}-\x{1004d}\x{10050}-\x{1005d}\x{10080}-\x{100fa}\x{10100}\x{10102}\x{10107}-\x{10133}\x{10137}-\x{1013f}\x{101d0}-\x{101fc}\x{10280}-\x{1029c}\x{102a0}-\x{102d0}\x{10300}-\x{10323}\x{10330}-\x{1034a}\x{10350}-\x{10375}\x{10380}-\x{1039d}\x{1039f}-\x{103c3}\x{103c8}-\x{103d5}\x{10400}-\x{1049d}\x{104a0}-\x{104a9}\x{10500}-\x{10527}\x{10530}-\x{10563}\x{1056f}\x{10600}-\x{10736}\x{10740}-\x{10755}\x{10760}-\x{10767}\x{11000}\x{11002}-\x{11037}\x{11047}-\x{1104d}\x{11066}-\x{1106f}\x{11082}-\x{110b2}\x{110b7}\x{110b8}\x{110bb}-\x{110c1}\x{110d0}-\x{110e8}\x{110f0}-\x{110f9}\x{11103}-\x{11126}\x{1112c}\x{11136}-\x{11143}\x{11150}-\x{11172}\x{11174}-\x{11176}\x{11182}-\x{111b5}\x{111bf}-\x{111c9}\x{111cd}\x{111d0}-\x{111df}\x{111e1}-\x{111f4}\x{11200}-\x{11211}\x{11213}-\x{1122e}\x{11232}\x{11233}\x{11235}\x{11238}-\x{1123d}\x{11280}-\x{11286}\x{11288}\x{1128a}-\x{1128d}\x{1128f}-\x{1129d}\x{1129f}-\x{112a9}\x{112b0}-\x{112de}\x{112e0}-\x{112e2}\x{112f0}-\x{112f9}\x{11302}\x{11303}\x{11305}-\x{1130c}\x{1130f}\x{11310}\x{11313}-\x{11328}\x{1132a}-\x{11330}\x{11332}\x{11333}\x{11335}-\x{11339}\x{1133d}-\x{1133f}\x{11341}-\x{11344}\x{11347}\x{11348}\x{1134b}-\x{1134d}\x{11350}\x{11357}\x{1135d}-\x{11363}\x{11480}-\x{114b2}\x{114b9}\x{114bb}-\x{114be}\x{114c1}\x{114c4}-\x{114c7}\x{114d0}-\x{114d9}\x{11580}-\x{115b1}\x{115b8}-\x{115bb}\x{115be}\x{115c1}-\x{115db}\x{11600}-\x{11632}\x{1163b}\x{1163c}\x
{1163e}\x{11641}-\x{11644}\x{11650}-\x{11659}\x{11680}-\x{116aa}\x{116ac}\x{116ae}\x{116af}\x{116b6}\x{116c0}-\x{116c9}\x{11700}-\x{11719}\x{11720}\x{11721}\x{11726}\x{11730}-\x{1173f}\x{118a0}-\x{118f2}\x{118ff}\x{11ac0}-\x{11af8}\x{12000}-\x{12399}\x{12400}-\x{1246e}\x{12470}-\x{12474}\x{12480}-\x{12543}\x{13000}-\x{1342e}\x{14400}-\x{14646}\x{16800}-\x{16a38}\x{16a40}-\x{16a5e}\x{16a60}-\x{16a69}\x{16a6e}\x{16a6f}\x{16ad0}-\x{16aed}\x{16af5}\x{16b00}-\x{16b2f}\x{16b37}-\x{16b45}\x{16b50}-\x{16b59}\x{16b5b}-\x{16b61}\x{16b63}-\x{16b77}\x{16b7d}-\x{16b8f}\x{16f00}-\x{16f44}\x{16f50}-\x{16f7e}\x{16f93}-\x{16f9f}\x{1b000}\x{1b001}\x{1bc00}-\x{1bc6a}\x{1bc70}-\x{1bc7c}\x{1bc80}-\x{1bc88}\x{1bc90}-\x{1bc99}\x{1bc9c}\x{1bc9f}\x{1d000}-\x{1d0f5}\x{1d100}-\x{1d126}\x{1d129}-\x{1d166}\x{1d16a}-\x{1d172}\x{1d183}\x{1d184}\x{1d18c}-\x{1d1a9}\x{1d1ae}-\x{1d1e8}\x{1d360}-\x{1d371}\x{1d400}-\x{1d454}\x{1d456}-\x{1d49c}\x{1d49e}\x{1d49f}\x{1d4a2}\x{1d4a5}\x{1d4a6}\x{1d4a9}-\x{1d4ac}\x{1d4ae}-\x{1d4b9}\x{1d4bb}\x{1d4bd}-\x{1d4c3}\x{1d4c5}-\x{1d505}\x{1d507}-\x{1d50a}\x{1d50d}-\x{1d514}\x{1d516}-\x{1d51c}\x{1d51e}-\x{1d539}\x{1d53b}-\x{1d53e}\x{1d540}-\x{1d544}\x{1d546}\x{1d54a}-\x{1d550}\x{1d552}-\x{1d6a5}\x{1d6a8}-\x{1d6da}\x{1d6dc}-\x{1d714}\x{1d716}-\x{1d74e}\x{1d750}-\x{1d788}\x{1d78a}-\x{1d7c2}\x{1d7c4}-\x{1d7cb}\x{1d800}-\x{1d9ff}\x{1da37}-\x{1da3a}\x{1da6d}-\x{1da74}\x{1da76}-\x{1da83}\x{1da85}-\x{1da8b}\x{1f110}-\x{1f12e}\x{1f130}-\x{1f169}\x{1f170}-\x{1f19a}\x{1f1e6}-\x{1f202}\x{1f210}-\x{1f23a}\x{1f240}-\x{1f248}\x{1f250}\x{1f251}\x{20000}-\x{2a6d6}\x{2a700}-\x{2b734}\x{2b740}-\x{2b81d}\x{2b820}-\x{2cea1}\x{2f800}-\x{2fa1d}\x{f0000}-\x{ffffd}\x{100000}-\x{10fffd}])\|([\x{590}\x{5be}\x{5c0}\x{5c3}\x{5c6}\x{5c8}-\x{5ff}\x{7c0}-\x{7ea}\x{7f4}\x{7f5}\x{7fa}-\x{815}\x{81a}\x{824}\x{828}\x{82e}-\x{858}\x{85c}-\x{89f}\x{200f}\x{fb1d}\x{fb1f}-\x{fb28}\x{fb2a}-\x{fb4f}\x{10800}-\x{1091e}\x{10920}-\x{10a00}\x{10a04}\x{10a07}-\x{10a0b}\x{10a10}-\x{10a37}\x{10a3b}-\x{10a3e}\x{10a40
}-\x{10ae4}\x{10ae7}-\x{10b38}\x{10b40}-\x{10e5f}\x{10e7f}-\x{10fff}\x{1e800}-\x{1e8cf}\x{1e8d7}-\x{1edff}\x{1ef00}-\x{1efff}\x{608}\x{60b}\x{60d}\x{61b}-\x{64a}\x{66d}-\x{66f}\x{671}-\x{6d5}\x{6e5}\x{6e6}\x{6ee}\x{6ef}\x{6fa}-\x{710}\x{712}-\x{72f}\x{74b}-\x{7a5}\x{7b1}-\x{7bf}\x{8a0}-\x{8e2}\x{fb50}-\x{fd3d}\x{fd40}-\x{fdcf}\x{fdf0}-\x{fdfc}\x{fdfe}\x{fdff}\x{fe70}-\x{fefe}\x{1ee00}-\x{1eeef}\x{1eef2}-\x{1eeff}]))/u';
323	// @codeCoverageIgnoreEnd
324
/**
 * Create a language object for the given code, wiring in the services it needs.
 *
 * When called with no arguments at all (old, deprecated convention) the language
 * code is derived from the class name and every service is pulled from
 * MediaWikiServices. Otherwise every argument must be non-null.
 *
 * @internal Calling this directly is deprecated. Use LanguageFactory instead.
 *
 * @param string|null $code Which code to use. Passing null is deprecated in 1.35, hard-deprecated since 1.43.
 * @param NamespaceInfo|null $namespaceInfo
 * @param LocalisationCache|null $localisationCache
 * @param LanguageNameUtils|null $langNameUtils
 * @param LanguageFallback|null $langFallback
 * @param LanguageConverterFactory|null $converterFactory
 * @param HookContainer|null $hookContainer
 * @param Config|null $config
 */
public function __construct(
	$code = null,
	?NamespaceInfo $namespaceInfo = null,
	?LocalisationCache $localisationCache = null,
	?LanguageNameUtils $langNameUtils = null,
	?LanguageFallback $langFallback = null,
	?LanguageConverterFactory $converterFactory = null,
	?HookContainer $hookContainer = null,
	?Config $config = null
) {
	if ( func_num_args() === 0 ) {
		// Old calling convention, deprecated
		wfDeprecatedMsg(
			__METHOD__ . ' without providing all services is deprecated',
			'1.35'
		);

		// For any other class name, drop its first 8 characters (the length of
		// 'Language') and normalise what remains into a lower-case, dash-separated code.
		$className = static::class;
		$this->mCode = $className === 'Language'
			? 'en'
			: str_replace( '_', '-', strtolower( substr( $className, 8 ) ) );

		$services = MediaWikiServices::getInstance();
		$this->namespaceInfo = $services->getNamespaceInfo();
		$this->localisationCache = $services->getLocalisationCache();
		$this->langNameUtils = $services->getLanguageNameUtils();
		$this->langFallback = $services->getLanguageFallback();
		$this->converterFactory = $services->getLanguageConverterFactory();
		$this->hookContainer = $services->getHookContainer();
		$this->hookRunner = new HookRunner( $this->hookContainer );
		$this->config = $services->getMainConfig();
		return;
	}

	// Checked in declaration order, so the first missing argument is the one reported.
	$required = [
		'$code' => $code,
		'$namespaceInfo' => $namespaceInfo,
		'$localisationCache' => $localisationCache,
		'$langNameUtils' => $langNameUtils,
		'$langFallback' => $langFallback,
		'$converterFactory' => $converterFactory,
		'$hookContainer' => $hookContainer,
		'$config' => $config,
	];
	foreach ( $required as $paramName => $value ) {
		Assert::parameter( $value !== null, $paramName,
			'Parameters cannot be null unless all are omitted' );
	}

	$this->mCode = $code;
	$this->namespaceInfo = $namespaceInfo;
	$this->localisationCache = $localisationCache;
	$this->langNameUtils = $langNameUtils;
	$this->langFallback = $langFallback;
	$this->converterFactory = $converterFactory;
	$this->hookContainer = $hookContainer;
	$this->hookRunner = new HookRunner( $hookContainer );
	$this->config = $config;
}
398
/**
 * Get the fallback languages registered for this language's code, as reported
 * by the LanguageFallback service.
 *
 * @return array
 * @since 1.19
 */
public function getFallbackLanguages() {
	$fallbacks = $this->langFallback->getAll( $this->mCode );

	return $fallbacks;
}
406
/**
 * Exports $wgBookstoreListEn
 *
 * Reads the 'bookstoreList' item for this language from the localisation cache.
 *
 * @return array
 */
public function getBookstoreList() {
	$bookstores = $this->localisationCache->getItem( $this->mCode, 'bookstoreList' );

	return $bookstores;
}
414
/**
 * Returns an array of localised namespaces indexed by their numbers. If the namespace is not
 * available in localised form, it will be included in English.
 *
 * The list is built once and cached on the object; later calls return the cached value.
 *
 * @return array<int,string> List of localized namespace names, indexed by numeric namespace ID.
 */
public function getNamespaces() {
	if ( $this->namespaceNames !== null ) {
		return $this->namespaceNames;
	}

	$projectName = $this->config->get( MainConfigNames::MetaNamespace );
	$projectTalkName = $this->config->get( MainConfigNames::MetaNamespaceTalk );
	$configuredExtras = $this->config->get( MainConfigNames::ExtraNamespaces );
	$canonical = $this->namespaceInfo->getCanonicalNamespaces();

	// Precedence (array union keeps the left-hand value): configured extra
	// namespaces, then localised names, then canonical names.
	// @phan-suppress-next-line PhanTypeMismatchProperty
	$this->namespaceNames = $configuredExtras +
		$this->localisationCache->getItem( $this->mCode, 'namespaceNames' );
	// @phan-suppress-next-line PhanTypeInvalidLeftOperand
	$this->namespaceNames += $canonical;

	$this->namespaceNames[NS_PROJECT] = $projectName;
	$this->namespaceNames[NS_PROJECT_TALK] = $projectTalkName
		?: $this->fixVariableInNamespace( $this->namespaceNames[NS_PROJECT_TALK] );

	# Sometimes a language will be localised but not actually exist on this wiki.
	$this->namespaceNames = array_filter(
		$this->namespaceNames,
		static function ( $id ) use ( $canonical ) {
			return isset( $canonical[$id] );
		},
		ARRAY_FILTER_USE_KEY
	);

	# The above mixing may leave namespaces out of canonical order.
	# Re-order by namespace ID number...
	ksort( $this->namespaceNames );

	$this->getHookRunner()->onLanguageGetNamespaces( $this->namespaceNames );

	return $this->namespaceNames;
}
459
/**
 * Arbitrarily set all the namespace names at once. Mainly used for testing
 *
 * Also clears the cached name-to-ID map so it is rebuilt on next use.
 *
 * @param string[] $namespaces Array of namespaces (id => name)
 */
public function setNamespaces( array $namespaces ) {
	// Drop the derived lookup table first; it is rebuilt lazily by getNamespaceIds().
	$this->mNamespaceIds = null;
	$this->namespaceNames = $namespaces;
}
468
/**
 * Resets all the namespace caches (names, aliases and the name-to-ID map).
 * Mainly used for testing
 *
 * @deprecated since 1.39 Use MediaWikiServices::resetServiceForTesting() instead.
 */
public function resetNamespaces() {
	$this->namespaceAliases = null;
	$this->mNamespaceIds = null;
	$this->namespaceNames = null;
}
478
/**
 * A convenience function that returns getNamespaces() with spaces instead of underscores
 * in values. Useful for producing output to be displayed e.g. in `<select>` forms.
 *
 * Keys (namespace IDs) are preserved.
 *
 * @return string[]
 */
public function getFormattedNamespaces() {
	return array_map(
		static function ( $name ) {
			return strtr( $name, '_', ' ' );
		},
		$this->getNamespaces()
	);
}
492
/**
 * Get a namespace value by key
 *
 * Namespace name uses underscores (not spaces), e.g. 'MediaWiki_talk'.
 *
 * <code>
 * $mw_ns = $lang->getNsText( NS_MEDIAWIKI_TALK );
 * echo $mw_ns; // prints 'MediaWiki_talk'
 * </code>
 *
 * @param int $index The array key of the namespace to return
 * @return string|false String if the namespace value exists, otherwise false
 */
public function getNsText( $index ) {
	$names = $this->getNamespaces();
	if ( isset( $names[$index] ) ) {
		return $names[$index];
	}

	return false;
}
510
/**
 * A convenience function that returns the same thing as
 * getNsText() except with '_' changed to ' ', useful for
 * producing output.
 *
 * <code>
 * $mw_ns = $lang->getFormattedNsText( NS_MEDIAWIKI_TALK );
 * echo $mw_ns; // prints 'MediaWiki talk'
 * </code>
 *
 * @param int $index The array key of the namespace to return
 * @return string Namespace name without underscores (empty string if namespace does not exist)
 */
public function getFormattedNsText( $index ) {
	$text = $this->getNsText( $index );
	if ( $text === false ) {
		// Unknown namespace
		return '';
	}

	return strtr( $text, '_', ' ' );
}
528
/**
 * Returns gender-dependent namespace alias if available.
 * See https://www.mediawiki.org/wiki/Manual:$wgExtraGenderNamespaces
 *
 * Falls back to getNsText() when no alias exists for the namespace/gender pair.
 *
 * @param int $index Namespace index
 * @param string $gender Gender key (male, female... )
 * @return string|false
 * @since 1.18
 */
public function getGenderNsText( $index, $gender ) {
	// Site configuration wins over the i18n data (array union keeps the left-hand value).
	$genderNames = $this->config->get( MainConfigNames::ExtraGenderNamespaces ) +
		(array)$this->localisationCache->getItem( $this->mCode, 'namespaceGenderAliases' );

	if ( isset( $genderNames[$index][$gender] ) ) {
		return $genderNames[$index][$gender];
	}

	return $this->getNsText( $index );
}
545
/**
 * Whether this language uses gender-dependent namespace aliases.
 * See https://www.mediawiki.org/wiki/Manual:$wgExtraGenderNamespaces
 *
 * Decision order:
 *  1. Any entry in $wgExtraGenderNamespaces => true.
 *  2. Both NS_USER and NS_USER_TALK overridden via $wgExtraNamespaces => false.
 *  3. Otherwise, true if the i18n data defines any 'namespaceGenderAliases'.
 *
 * @return bool
 * @since 1.18
 */
public function needsGenderDistinction() {
	$extraGenderNamespaces = $this->config->get( MainConfigNames::ExtraGenderNamespaces );
	$extraNamespaces = $this->config->get( MainConfigNames::ExtraNamespaces );

	if ( count( $extraGenderNamespaces ) > 0 ) {
		// $wgExtraGenderNamespaces overrides everything
		return true;
	}

	if ( isset( $extraNamespaces[NS_USER] ) && isset( $extraNamespaces[NS_USER_TALK] ) ) {
		// @todo There may be other gender namespace than NS_USER & NS_USER_TALK in the future
		// $wgExtraNamespaces overrides any gender aliases specified in i18n files
		return false;
	}

	// Check what is in i18n files. Cast to array, as getGenderNsText() and
	// getNamespaceAliases() do for the same item, so that a missing (null)
	// item counts as "no aliases" instead of making count() throw.
	$aliases = (array)$this->localisationCache->getItem( $this->mCode, 'namespaceGenderAliases' );

	return count( $aliases ) > 0;
}
568
/**
 * Get a namespace key by case-insensitive value.
 * Only matches namespace names for the current language, not the
 * canonical ones defined in Namespace.php.
 *
 * @param string $text
 * @return int|false An integer if $text is a valid value otherwise false
 */
public function getLocalNsIndex( $text ) {
	// The lookup table is keyed by lower-cased names, so normalise the input the same way.
	$needle = $this->lc( $text );
	$localIds = $this->getNamespaceIds();
	if ( isset( $localIds[$needle] ) ) {
		return $localIds[$needle];
	}

	return false;
}
582
/**
 * Build (once) and return the namespace alias map for this language.
 *
 * Sources, from highest to lowest precedence on conflicting names:
 * $wgNamespaceAliases, localised aliases plus gender aliases, and namespace
 * names converted into the other language variants.
 *
 * @return array<string,int> Map from names to namespace IDs. Note that each
 *  namespace ID can have multiple alias.
 */
public function getNamespaceAliases() {
	if ( $this->namespaceAliases !== null ) {
		return $this->namespaceAliases;
	}

	$aliasMap = $this->localisationCache->getItem( $this->mCode, 'namespaceAliases' ) ?: [];
	foreach ( $aliasMap as $aliasName => $nsId ) {
		if ( $nsId !== NS_PROJECT_TALK ) {
			continue;
		}
		// Project-talk aliases are re-keyed under the name produced by fixVariableInNamespace().
		unset( $aliasMap[$aliasName] );
		$aliasMap[$this->fixVariableInNamespace( $aliasName )] = $nsId;
	}

	$genderAliases = $this->config->get( MainConfigNames::ExtraGenderNamespaces ) +
		(array)$this->localisationCache->getItem( $this->mCode, 'namespaceGenderAliases' );
	foreach ( $genderAliases as $nsId => $forms ) {
		foreach ( $forms as $form ) {
			$aliasMap[$form] = $nsId;
		}
	}

	# Also add converted namespace names as aliases, to avoid confusion.
	$converter = $this->getConverterInternal();
	$variantNames = [];
	foreach ( $converter->getVariants() as $variant ) {
		if ( $variant !== $this->mCode ) {
			foreach ( array_keys( $this->getNamespaces() ) as $nsId ) {
				$variantNames[$converter->convertNamespace( $nsId, $variant )] = $nsId;
			}
		}
	}

	$this->namespaceAliases = $aliasMap + $variantNames;

	// In the case of conflicts between $wgNamespaceAliases and other sources
	// of aliasing, $wgNamespaceAliases wins.
	$this->namespaceAliases = $this->config->get( MainConfigNames::NamespaceAliases ) +
		$this->namespaceAliases;

	# Filter out aliases to namespaces that don't exist, e.g. from extensions
	# that aren't loaded here but are included in the l10n cache.
	# (array_intersect preserves keys from its first argument)
	$existingIds = array_keys( $this->getNamespaces() );
	$this->namespaceAliases = array_intersect( $this->namespaceAliases, $existingIds );

	return $this->namespaceAliases;
}
641
/**
 * Build (once) and return the lookup table from lower-cased namespace names
 * and aliases to namespace IDs. Aliases are added after names, so an alias
 * overwrites a name with the same lower-cased key.
 *
 * @return array<string,int> indexed by localized lower-cased namespace name
 */
public function getNamespaceIds() {
	if ( $this->mNamespaceIds !== null ) {
		return $this->mNamespaceIds;
	}

	# Put namespace names and aliases into a hashtable.
	# If this is too slow, then we should arrange it so that it is done
	# before caching. The catch is that at pre-cache time, the above
	# class-specific fixup hasn't been done.
	$this->mNamespaceIds = [];
	foreach ( $this->getNamespaces() as $nsId => $nsName ) {
		$this->mNamespaceIds[$this->lc( $nsName )] = $nsId;
	}
	foreach ( $this->getNamespaceAliases() as $aliasName => $nsId ) {
		$this->mNamespaceIds[$this->lc( $aliasName )] = $nsId;
	}

	return $this->mNamespaceIds;
}
661
/**
 * Get a namespace key by case-insensitive value. Canonical namespace
 * names override custom ones defined for the current language.
 *
 * @param string $text
 * @return int|false An integer if $text is a valid value otherwise false
 */
public function getNsIndex( $text ) {
	$needle = $this->lc( $text );

	$canonicalId = $this->namespaceInfo->getCanonicalIndex( $needle );
	if ( $canonicalId === null ) {
		// Not a canonical name: fall back to this language's names and aliases.
		$localIds = $this->getNamespaceIds();
		return $localIds[$needle] ?? false;
	}

	return $canonicalId;
}
678
/**
 * Short names for language variants used for language conversion links.
 *
 * Resolution order: the "variantname-$code" message (when $usemsg is set and
 * the message exists), then the language name known for $code, then $code itself.
 *
 * @param string $code
 * @param bool $usemsg Use the "variantname-xyz" message if it exists
 * @return string
 */
public function getVariantname( $code, $usemsg = true ) {
	if ( $usemsg ) {
		$variantMsg = $this->msg( "variantname-$code" );
		if ( $variantMsg->exists() ) {
			return $variantMsg->text();
		}
	}

	# if it's defined as a language name, show that;
	# otherwise, output the language code
	return $this->langNameUtils->getLanguageName( $code ) ?: $code;
}
701
/**
 * Read the 'datePreferences' item for this language from the localisation cache.
 *
 * @return string[]|false List of date format preference keys, or false if disabled.
 */
public function getDatePreferences() {
	$preferences = $this->localisationCache->getItem( $this->mCode, 'datePreferences' );

	return $preferences;
}
708
/**
 * Read the 'dateFormats' item for this language from the localisation cache.
 *
 * @return string[]
 */
public function getDateFormats() {
	$formats = $this->localisationCache->getItem( $this->mCode, 'dateFormats' );

	return $formats;
}
715
/**
 * Get this language's default date format key. The special value
 * 'dmy or mdy' is resolved to 'mdy' or 'dmy' according to $wgAmericanDates.
 *
 * @return string
 */
public function getDefaultDateFormat() {
	$format = $this->localisationCache->getItem( $this->mCode, 'defaultDateFormat' );
	if ( $format !== 'dmy or mdy' ) {
		return $format;
	}

	return $this->config->get( MainConfigNames::AmericanDates ) ? 'mdy' : 'dmy';
}
727
/**
 * Read the 'datePreferenceMigrationMap' item for this language from the localisation cache.
 *
 * @return string[]
 */
public function getDatePreferenceMigrationMap() {
	$migrationMap = $this->localisationCache->getItem( $this->mCode, 'datePreferenceMigrationMap' );

	return $migrationMap;
}
734
/**
 * Get a message from the MediaWiki namespace.
 *
 * Returns the text() form of the message in this language.
 *
 * @param string $msg Message name
 * @return string
 */
public function getMessageFromDB( $msg ) {
	$message = $this->msg( $msg );

	return $message->text();
}
744
/**
 * Gets the Message object from this language. Only for use inside this class.
 *
 * @param string $msg Message name
 * @phpcs:ignore Generic.Files.LineLength
 * @param MessageParam|MessageSpecifier|string|int|float|list<MessageParam|MessageSpecifier|string|int|float> ...$params
 *   See Message::params()
 * @return Message
 */
protected function msg( $msg, ...$params ) {
	$message = wfMessage( $msg, ...$params );

	// Bind the message to this language object.
	return $message->inLanguage( $this );
}
757
/**
 * Get the localised full name of a month.
 *
 * @param int $key Number from 1 to 12
 * @return string
 */
public function getMonthName( $key ) {
	// The message list is 0-based, month numbers are 1-based.
	$messageKey = self::MONTH_MESSAGES[$key - 1];

	return $this->getMessageFromDB( $messageKey );
}
765
/**
 * Get the full month names, keyed by month number.
 *
 * @return string[] 13 entries: index 0 is an empty-string placeholder and
 *  indexes 1 to 12 hold the month names as returned by getMonthName().
 */
public function getMonthNamesArray() {
	// Index 0 is a placeholder so that the array key equals the month number.
	$monthNames = [ '' ];
	for ( $month = 1; $month <= 12; $month++ ) {
		$monthNames[] = $this->getMonthName( $month );
	}

	return $monthNames;
}
776
/**
 * Get the localised genitive form of a month name.
 *
 * @param int $key Number from 1 to 12
 * @return string
 */
public function getMonthNameGen( $key ) {
	// The message list is 0-based, month numbers are 1-based.
	$messageKey = self::MONTH_GENITIVE_MESSAGES[$key - 1];

	return $this->getMessageFromDB( $messageKey );
}
784
/**
 * Get the localised abbreviated name of a month.
 *
 * @param int $key Number from 1 to 12
 * @return string
 */
public function getMonthAbbreviation( $key ) {
	// The message list is 0-based, month numbers are 1-based.
	$messageKey = self::MONTH_ABBREVIATED_MESSAGES[$key - 1];

	return $this->getMessageFromDB( $messageKey );
}
792
/**
 * Get the abbreviated month names, keyed by month number.
 *
 * @return string[] 13 entries: index 0 is an empty-string placeholder and
 *  indexes 1 to 12 hold the abbreviations as returned by getMonthAbbreviation().
 */
public function getMonthAbbreviationsArray() {
	// Index 0 is a placeholder so that the array key equals the month number.
	$abbreviations = [ '' ];
	for ( $month = 1; $month <= 12; $month++ ) {
		$abbreviations[] = $this->getMonthAbbreviation( $month );
	}

	return $abbreviations;
}
803
/**
 * Get the localised full name of a weekday.
 *
 * @param int $key Number from 1 to 7
 * @return string
 */
public function getWeekdayName( $key ) {
	// The message list is 0-based, weekday numbers are 1-based.
	$messageKey = self::WEEKDAY_MESSAGES[$key - 1];

	return $this->getMessageFromDB( $messageKey );
}
811
/**
 * Get the localised abbreviated name of a weekday.
 *
 * @param int $key Number from 1 to 7
 * @return string
 */
public function getWeekdayAbbreviation( $key ) {
	// The message list is 0-based, weekday numbers are 1-based.
	$messageKey = self::WEEKDAY_ABBREVIATED_MESSAGES[$key - 1];

	return $this->getMessageFromDB( $messageKey );
}
819
/**
 * Pass through the result from $dateTimeObj->format()
 *
 * The DateTime object is created from $ts on first use and stored back into
 * $dateTimeObj (passed by reference) so that later calls can reuse it.
 *
 * @param DateTime|false|null &$dateTimeObj
 * @param string $ts
 * @param DateTimeZone|false|null $zone Zone used when creating the object; UTC if falsy
 * @param string $code
 * @return string
 */
private static function dateTimeObjFormat( &$dateTimeObj, $ts, $zone, $code ) {
	if ( $dateTimeObj ) {
		return $dateTimeObj->format( $code );
	}

	$timezone = $zone ?: new DateTimeZone( 'UTC' );
	$dateTimeObj = DateTime::createFromFormat( 'YmdHis', $ts, $timezone );

	return $dateTimeObj->format( $code );
}
837
/**
 * This is a workalike of PHP's date() function, but with better
 * internationalisation, a reduced set of format characters, and a better
 * escaping format.
 *
 * Supported format characters are dDjlNwzWFmMntLoYyaAgGhHiscrUeIOPTZ. See
 * the PHP manual for definitions. There are a number of extensions, which
 * start with "x":
 *
 *    xn   Do not translate digits of the next numeric format character
 *    xN   Toggle raw digit (xn) flag, stays set until explicitly unset
 *    xr   Use roman numerals for the next numeric format character
 *    xh   Use hebrew numerals for the next numeric format character
 *    xx   Literal x
 *    xg   Genitive month name
 *
 *    xij  j (day number) in Iranian calendar
 *    xiF  F (month name) in Iranian calendar
 *    xin  n (month number) in Iranian calendar
 *    xiy  y (two digit year) in Iranian calendar
 *    xiY  Y (full year) in Iranian calendar
 *    xit  t (days in month) in Iranian calendar
 *    xiz  z (day of the year) in Iranian calendar
 *
 *    xjj  j (day number) in Hebrew calendar
 *    xjF  F (month name) in Hebrew calendar
 *    xjt  t (days in month) in Hebrew calendar
 *    xjx  xg (genitive month name) in Hebrew calendar
 *    xjn  n (month number) in Hebrew calendar
 *    xjY  Y (full year) in Hebrew calendar
 *
 *    xmj  j (day number) in Hijri calendar
 *    xmF  F (month name) in Hijri calendar
 *    xmn  n (month number) in Hijri calendar
 *    xmY  Y (full year) in Hijri calendar
 *
 *    xkY  Y (full year) in Thai solar calendar. Months and days are
 *                       identical to the Gregorian calendar
 *    xoY  Y (full year) in Minguo calendar or Juche year.
 *                       Months and days are identical to the
 *                       Gregorian calendar
 *    xtY  Y (full year) in Japanese nengo. Months and days are
 *                       identical to the Gregorian calendar
 *
 * Characters enclosed in double quotes will be considered literal (with
 * the quotes themselves removed). Unmatched quotes will be considered
 * literal quotes. Example:
 *
 * "The month is" F       => The month is January
 * i's"                   => 20'11"
 *
 * Backslash escaping is also supported.
 *
 * Input timestamp is assumed to be pre-normalized to the desired local
 * time zone, if any. Note that the format characters crUeIOPTZ will assume
 * $ts is UTC if $zone is not given.
 *
 * When the caller passes $ttl, it is set to the number of seconds until the
 * smallest time unit used by $format rolls over (1 for seconds, time left in
 * the minute/hour/half-day/day/week/month/year otherwise). It is left
 * untouched if the format uses no time-dependent character.
 *
 * @param string $format
 * @param string $ts 14-character timestamp
 *      YYYYMMDDHHMMSS
 *      01234567890123
 * @param DateTimeZone|null $zone Timezone of $ts
 * @param int|null &$ttl The amount of time (in seconds) the output may be cached for.
 * Only makes sense if $ts is the current time.
 * @todo handling of "o" format character for Iranian, Hebrew, Hijri & Thai?
 *
 * @throws InvalidArgumentException If $ts is not exactly 14 digits
 * @return string
 * @return-taint tainted
 */
public function sprintfDate( $format, $ts, ?DateTimeZone $zone = null, &$ttl = 'unused' ) {
	// @phan-suppress-previous-line PhanTypeMismatchDefault Type mismatch on pass-by-ref args
	$s = '';
	// One-shot modifiers, consumed by the next numeric format character
	$raw = false;
	$roman = false;
	$hebrewNum = false;
	// Lazily created DateTime for $ts, shared by all dateTimeObjFormat() calls
	$dateTimeObj = false;
	$rawToggle = false;
	// Lazily computed calendar conversions of $ts
	$iranian = false;
	$hebrew = false;
	$hijri = false;
	$thai = false;
	$minguo = false;
	$tenno = false;

	// Which time units the format depends on; drives the TTL calculation below
	$usedSecond = false;
	$usedMinute = false;
	$usedHour = false;
	$usedAMPM = false;
	$usedDay = false;
	$usedWeek = false;
	$usedMonth = false;
	$usedYear = false;
	$usedISOYear = false;
	$usedIsLeapYear = false;

	$usedHebrewMonth = false;
	$usedIranianMonth = false;
	$usedHijriMonth = false;
	$usedHebrewYear = false;
	$usedIranianYear = false;
	$usedHijriYear = false;
	$usedTennoYear = false;

	if ( strlen( $ts ) !== 14 ) {
		throw new InvalidArgumentException( __METHOD__ . ": The timestamp $ts should have 14 characters" );
	}

	if ( !ctype_digit( $ts ) ) {
		throw new InvalidArgumentException( __METHOD__ . ": The timestamp $ts should be a number" );
	}

	$formatLength = strlen( $format );
	for ( $p = 0; $p < $formatLength; $p++ ) {
		// Set by numeric format characters; rendered after the switch
		$num = false;
		$code = $format[$p];
		// "x" introduces a two-character extension code...
		if ( $code === 'x' && $p < $formatLength - 1 ) {
			$code .= $format[++$p];
		}

		// ...and the calendar prefixes take a third character.
		if ( ( $code === 'xi'
				|| $code === 'xj'
				|| $code === 'xk'
				|| $code === 'xm'
				|| $code === 'xo'
				|| $code === 'xt' )
			&& $p < $formatLength - 1
		) {
			$code .= $format[++$p];
		}

		switch ( $code ) {
			case 'xx':
				$s .= 'x';
				break;

			case 'xn':
				$raw = true;
				break;

			case 'xN':
				$rawToggle = !$rawToggle;
				break;

			case 'xr':
				$roman = true;
				break;

			case 'xh':
				$hebrewNum = true;
				break;

			case 'xg':
				$usedMonth = true;
				$s .= $this->getMonthNameGen( (int)substr( $ts, 4, 2 ) );
				break;

			case 'xjx':
				$usedHebrewMonth = true;
				if ( !$hebrew ) {
					$hebrew = self::tsToHebrew( $ts );
				}
				$s .= $this->getMessageFromDB( self::HEBREW_CALENDAR_MONTH_GENITIVE_MESSAGES[$hebrew[1] - 1] );
				break;

			case 'd':
				$usedDay = true;
				$num = substr( $ts, 6, 2 );
				break;

			case 'D':
				$usedDay = true;
				$s .= $this->getWeekdayAbbreviation(
					(int)self::dateTimeObjFormat( $dateTimeObj, $ts, $zone, 'w' ) + 1
				);
				break;

			case 'j':
				$usedDay = true;
				$num = intval( substr( $ts, 6, 2 ) );
				break;

			case 'xij':
				$usedDay = true;
				if ( !$iranian ) {
					$iranian = self::tsToIranian( $ts );
				}
				$num = $iranian[2];
				break;

			case 'xmj':
				$usedDay = true;
				if ( !$hijri ) {
					$hijri = self::tsToHijri( $ts );
				}
				$num = $hijri[2];
				break;

			case 'xjj':
				$usedDay = true;
				if ( !$hebrew ) {
					$hebrew = self::tsToHebrew( $ts );
				}
				$num = $hebrew[2];
				break;

			case 'l':
				$usedDay = true;
				$s .= $this->getWeekdayName(
					(int)self::dateTimeObjFormat( $dateTimeObj, $ts, $zone, 'w' ) + 1
				);
				break;

			case 'F':
				$usedMonth = true;
				$s .= $this->getMonthName( (int)substr( $ts, 4, 2 ) );
				break;

			case 'xiF':
				$usedIranianMonth = true;
				if ( !$iranian ) {
					$iranian = self::tsToIranian( $ts );
				}
				$s .= $this->getMessageFromDB( self::IRANIAN_CALENDAR_MONTHS_MESSAGES[$iranian[1] - 1] );
				break;

			case 'xmF':
				$usedHijriMonth = true;
				if ( !$hijri ) {
					$hijri = self::tsToHijri( $ts );
				}
				$s .= $this->getMessageFromDB( self::HIJRI_CALENDAR_MONTH_MESSAGES[$hijri[1] - 1] );
				break;

			case 'xjF':
				$usedHebrewMonth = true;
				if ( !$hebrew ) {
					$hebrew = self::tsToHebrew( $ts );
				}
				$s .= $this->getMessageFromDB( self::HEBREW_CALENDAR_MONTHS_MESSAGES[$hebrew[1] - 1] );
				break;

			case 'm':
				$usedMonth = true;
				$num = substr( $ts, 4, 2 );
				break;

			case 'M':
				$usedMonth = true;
				$s .= $this->getMonthAbbreviation( (int)substr( $ts, 4, 2 ) );
				break;

			case 'n':
				$usedMonth = true;
				$num = intval( substr( $ts, 4, 2 ) );
				break;

			case 'xin':
				$usedIranianMonth = true;
				if ( !$iranian ) {
					$iranian = self::tsToIranian( $ts );
				}
				$num = $iranian[1];
				break;

			case 'xmn':
				$usedHijriMonth = true;
				if ( !$hijri ) {
					$hijri = self::tsToHijri( $ts );
				}
				$num = $hijri[1];
				break;

			case 'xjn':
				$usedHebrewMonth = true;
				if ( !$hebrew ) {
					$hebrew = self::tsToHebrew( $ts );
				}
				$num = $hebrew[1];
				break;

			case 'xjt':
				$usedHebrewMonth = true;
				if ( !$hebrew ) {
					$hebrew = self::tsToHebrew( $ts );
				}
				$num = $hebrew[3];
				break;

			case 'Y':
				$usedYear = true;
				$num = substr( $ts, 0, 4 );
				break;

			case 'xiY':
				$usedIranianYear = true;
				if ( !$iranian ) {
					$iranian = self::tsToIranian( $ts );
				}
				$num = $iranian[0];
				break;

			case 'xmY':
				$usedHijriYear = true;
				if ( !$hijri ) {
					$hijri = self::tsToHijri( $ts );
				}
				$num = $hijri[0];
				break;

			case 'xjY':
				$usedHebrewYear = true;
				if ( !$hebrew ) {
					$hebrew = self::tsToHebrew( $ts );
				}
				$num = $hebrew[0];
				break;

			case 'xkY':
				$usedYear = true;
				if ( !$thai ) {
					$thai = self::tsToYear( $ts, 'thai' );
				}
				$num = $thai[0];
				break;

			case 'xoY':
				$usedYear = true;
				if ( !$minguo ) {
					$minguo = self::tsToYear( $ts, 'minguo' );
				}
				$num = $minguo[0];
				break;

			case 'xtY':
				$usedTennoYear = true;
				if ( !$tenno ) {
					$tenno = self::tsToJapaneseGengo( $ts );
				}
				$num = $tenno;
				break;

			case 'y':
				$usedYear = true;
				$num = substr( $ts, 2, 2 );
				break;

			case 'xiy':
				$usedIranianYear = true;
				if ( !$iranian ) {
					$iranian = self::tsToIranian( $ts );
				}
				$num = substr( (string)$iranian[0], -2 );
				break;

			case 'xit':
				$usedIranianYear = true;
				if ( !$iranian ) {
					$iranian = self::tsToIranian( $ts );
				}
				$num = self::IRANIAN_DAYS[$iranian[1] - 1];
				break;

			case 'xiz':
				$usedIranianYear = true;
				if ( !$iranian ) {
					$iranian = self::tsToIranian( $ts );
				}
				$num = $iranian[3];
				break;

			case 'a':
				$usedAMPM = true;
				$s .= intval( substr( $ts, 8, 2 ) ) < 12 ? 'am' : 'pm';
				break;

			case 'A':
				$usedAMPM = true;
				$s .= intval( substr( $ts, 8, 2 ) ) < 12 ? 'AM' : 'PM';
				break;

			case 'g':
				$usedHour = true;
				$h = (int)substr( $ts, 8, 2 );
				// 12-hour clock: 0 and 12 both display as 12
				$num = $h % 12 ?: 12;
				break;

			case 'G':
				$usedHour = true;
				$num = intval( substr( $ts, 8, 2 ) );
				break;

			case 'h':
				$usedHour = true;
				$h = (int)substr( $ts, 8, 2 );
				$num = sprintf( '%02d', $h % 12 ?: 12 );
				break;

			case 'H':
				$usedHour = true;
				$num = substr( $ts, 8, 2 );
				break;

			case 'i':
				$usedMinute = true;
				$num = substr( $ts, 10, 2 );
				break;

			case 's':
				$usedSecond = true;
				$num = substr( $ts, 12, 2 );
				break;

			case 'c':
			case 'r':
				$usedSecond = true;
				// fall through
			case 'e':
			case 'O':
			case 'P':
			case 'T':
				$s .= self::dateTimeObjFormat( $dateTimeObj, $ts, $zone, $code );
				break;

			case 'w':
			case 'N':
			case 'z':
				$usedDay = true;
				$num = self::dateTimeObjFormat( $dateTimeObj, $ts, $zone, $code );
				break;

			case 'W':
				$usedWeek = true;
				$num = self::dateTimeObjFormat( $dateTimeObj, $ts, $zone, $code );
				break;

			case 't':
				$usedMonth = true;
				$num = self::dateTimeObjFormat( $dateTimeObj, $ts, $zone, $code );
				break;

			case 'L':
				$usedIsLeapYear = true;
				$num = self::dateTimeObjFormat( $dateTimeObj, $ts, $zone, $code );
				break;

			case 'o':
				$usedISOYear = true;
				$num = self::dateTimeObjFormat( $dateTimeObj, $ts, $zone, $code );
				break;

			case 'U':
				$usedSecond = true;
				// fall through
			case 'I':
			case 'Z':
				$num = self::dateTimeObjFormat( $dateTimeObj, $ts, $zone, $code );
				break;

			case '\\':
				# Backslash escaping
				if ( $p < $formatLength - 1 ) {
					$s .= $format[++$p];
				} else {
					$s .= '\\';
				}
				break;

			case '"':
				# Quoted literal
				if ( $p < $formatLength - 1 ) {
					$endQuote = strpos( $format, '"', $p + 1 );
					if ( $endQuote === false ) {
						# No terminating quote, assume literal "
						$s .= '"';
					} else {
						$s .= substr( $format, $p + 1, $endQuote - $p - 1 );
						$p = $endQuote;
					}
				} else {
					# Quote at the end of the string, assume literal "
					$s .= '"';
				}
				break;

			default:
				// Anything else is copied verbatim. For an unrecognised "x" sequence
				// $p has already advanced, so only its last character is emitted.
				$s .= $format[$p];
		}
		if ( $num !== false ) {
			if ( $rawToggle || $raw ) {
				$s .= $num;
				$raw = false;
			} elseif ( $roman ) {
				$s .= self::romanNumeral( $num );
				$roman = false;
			} elseif ( $hebrewNum ) {
				$s .= self::hebrewNumeral( $num );
				$hebrewNum = false;
			} elseif ( preg_match( '/^[\d.]+$/', $num ) ) {
				$s .= $this->formatNumNoSeparators( $num );
			} else {
				$s .= $num;
			}
		}
	}

	if ( $ttl === 'unused' ) {
		// No need to calculate the TTL, the caller won't use it anyway.
	} elseif ( $usedSecond ) {
		$ttl = 1;
	} elseif ( $usedMinute ) {
		$ttl = 60 - (int)substr( $ts, 12, 2 );
	} elseif ( $usedHour ) {
		$ttl = 3600 - (int)substr( $ts, 10, 2 ) * 60 - (int)substr( $ts, 12, 2 );
	} elseif ( $usedAMPM ) {
		$ttl = 43200 - ( (int)substr( $ts, 8, 2 ) % 12 ) * 3600 -
			(int)substr( $ts, 10, 2 ) * 60 - (int)substr( $ts, 12, 2 );
	} elseif (
		$usedDay ||
		$usedHebrewMonth ||
		$usedIranianMonth ||
		$usedHijriMonth ||
		$usedHebrewYear ||
		$usedIranianYear ||
		$usedHijriYear ||
		$usedTennoYear
	) {
		// @todo Someone who understands the non-Gregorian calendars
		// should write proper logic for them so that they don't need purged every day.
		$ttl = 86400 - (int)substr( $ts, 8, 2 ) * 3600 -
			(int)substr( $ts, 10, 2 ) * 60 - (int)substr( $ts, 12, 2 );
	} else {
		$possibleTtls = [];
		$timeRemainingInDay = 86400 - (int)substr( $ts, 8, 2 ) * 3600 -
			(int)substr( $ts, 10, 2 ) * 60 - (int)substr( $ts, 12, 2 );
		if ( $usedWeek ) {
			$possibleTtls[] =
				( 7 - (int)self::dateTimeObjFormat( $dateTimeObj, $ts, $zone, 'N' ) ) * 86400 +
				$timeRemainingInDay;
		} elseif ( $usedISOYear ) {
			// December 28th falls on the last ISO week of the year, every year.
			// The last ISO week of a year can be 52 or 53.
			// The reference date must be taken in the ISO week-numbering year ("o"),
			// not the calendar year of $ts: around New Year the two differ (e.g.
			// 2021-01-01 belongs to ISO year 2020, week 53), and mixing them could
			// yield a negative or too-short TTL.
			$isoYear = (int)self::dateTimeObjFormat( $dateTimeObj, $ts, $zone, 'o' );
			// $dateTimeObj is guaranteed to be set after the call above; clone it so
			// that the shared object keeps pointing at $ts.
			$lastWeekOfISOYear = (int)( clone $dateTimeObj )
				->setDate( $isoYear, 12, 28 )
				->format( 'W' );
			$currentISOWeek = (int)self::dateTimeObjFormat( $dateTimeObj, $ts, $zone, 'W' );
			$weeksRemaining = $lastWeekOfISOYear - $currentISOWeek;
			$timeRemainingInWeek =
				( 7 - (int)self::dateTimeObjFormat( $dateTimeObj, $ts, $zone, 'N' ) ) * 86400
				+ $timeRemainingInDay;
			$possibleTtls[] = $weeksRemaining * 604800 + $timeRemainingInWeek;
		}

		if ( $usedMonth ) {
			$possibleTtls[] =
				( (int)self::dateTimeObjFormat( $dateTimeObj, $ts, $zone, 't' ) -
					(int)substr( $ts, 6, 2 ) ) * 86400
				+ $timeRemainingInDay;
		} elseif ( $usedYear ) {
			// "L" is 1 in leap years and "z" is the 0-based day of the year, so
			// L + 364 - z is the number of whole days left after today.
			$possibleTtls[] =
				( (int)self::dateTimeObjFormat( $dateTimeObj, $ts, $zone, 'L' ) + 364 -
					(int)self::dateTimeObjFormat( $dateTimeObj, $ts, $zone, 'z' ) ) * 86400
				+ $timeRemainingInDay;
		} elseif ( $usedIsLeapYear ) {
			$year = (int)substr( $ts, 0, 4 );
			$timeRemainingInYear =
				( (int)self::dateTimeObjFormat( $dateTimeObj, $ts, $zone, 'L' ) + 364 -
					(int)self::dateTimeObjFormat( $dateTimeObj, $ts, $zone, 'z' ) ) * 86400
				+ $timeRemainingInDay;
			$mod = $year % 4;
			if ( $mod || ( !( $year % 100 ) && $year % 400 ) ) {
				// this isn't a leap year. see when the next one starts
				$nextCandidate = $year - $mod + 4;
				if ( $nextCandidate % 100 || !( $nextCandidate % 400 ) ) {
					$possibleTtls[] = ( $nextCandidate - $year - 1 ) * 365 * 86400 +
						$timeRemainingInYear;
				} else {
					// The candidate is a non-leap century year; the next leap year
					// is four years after it.
					$possibleTtls[] = ( $nextCandidate - $year + 3 ) * 365 * 86400 +
						$timeRemainingInYear;
				}
			} else {
				// this is a leap year, so the next year isn't
				$possibleTtls[] = $timeRemainingInYear;
			}
		}

		if ( $possibleTtls ) {
			$ttl = min( $possibleTtls );
		}
	}

	return $s;
}
1432
1433	/**
1434	* Number of days in each month of the Gregorian calendar
1435	*/
1436	private const GREG_DAYS = [ 31, 28, 31, 30, 31, 30, 31, 31, 30, 31, 30, 31 ];
1437
1438	/**
1439	* Number of days in each month of the Iranian calendar
1440	*/
1441	private const IRANIAN_DAYS = [ 31, 31, 31, 31, 31, 31, 30, 30, 30, 30, 30, 29 ];
1442
/**
 * Convert a Gregorian timestamp to a date in the Iranian calendar.
 *
 * Uses the algorithm by Roozbeh Pournader and Mohammad Toossi, which was
 * originally written in C and is released under the terms of the GNU Lesser
 * General Public License. The PHP port was made by Niklas Laxström.
 *
 * Link: http://www.farsiweb.info/jalali/jalali.c
 *
 * @param string $ts Timestamp whose first eight characters are YYYYMMDD
 *
 * @return int[] Iranian year, month (1-based), day of the month (1-based)
 *  and zero-based day of the Iranian year, in that order
 */
private static function tsToIranian( $ts ) {
	// Gregorian year counted from 1600, with zero-based month and day
	$yearsSince1600 = (int)substr( $ts, 0, 4 ) - 1600;
	$monthIndex = (int)substr( $ts, 4, 2 ) - 1;
	$dayIndex = (int)substr( $ts, 6, 2 ) - 1;

	// Days in the whole years that have passed, leap days included
	$leapDays = floor( ( $yearsSince1600 + 3 ) / 4 )
		- floor( ( $yearsSince1600 + 99 ) / 100 )
		+ floor( ( $yearsSince1600 + 399 ) / 400 );
	$gregorianDayNo = 365 * $yearsSince1600 + $leapDays;

	// Months of the current year that are already complete
	for ( $m = 0; $m < $monthIndex; $m++ ) {
		$gregorianDayNo += self::GREG_DAYS[$m];
	}

	// Count 29 February of the current year once March has begun.
	// The offset year can be tested directly because 1600 is a multiple of 400.
	$isLeapYear = ( $yearsSince1600 % 4 === 0 && $yearsSince1600 % 100 !== 0 )
		|| $yearsSince1600 % 400 == 0;
	if ( $monthIndex > 1 && $isLeapYear ) {
		$gregorianDayNo++;
	}

	// Days that have passed in the current month
	$gregorianDayNo += $dayIndex;

	// Re-base the day count for the Iranian calendar
	$remaining = $gregorianDayNo - 79;

	// Peel off blocks of 12053 days (33 years each), then blocks of 1461 days (4 years each)
	$cycles33 = (int)floor( $remaining / 12053 );
	$remaining %= 12053;

	$iranianYear = 979 + 33 * $cycles33 + 4 * (int)floor( $remaining / 1461 );
	$remaining %= 1461;

	if ( $remaining >= 366 ) {
		$iranianYear += (int)floor( ( $remaining - 1 ) / 365 );
		$remaining = ( $remaining - 1 ) % 365;
	}

	$dayOfYear = $remaining;

	// Walk through the first eleven months; whatever is left falls in the month reached
	$monthsPassed = 0;
	while ( $monthsPassed < 11 && $remaining >= self::IRANIAN_DAYS[$monthsPassed] ) {
		$remaining -= self::IRANIAN_DAYS[$monthsPassed];
		$monthsPassed++;
	}

	return [ $iranianYear, $monthsPassed + 1, $remaining + 1, $dayOfYear ];
}
1503
/**
 * Convert a Gregorian timestamp to a Hijri date.
 *
 * Based on a PHP-Nuke block by Sharjeel which is released under GNU/GPL license
 *
 * @see https://phpnuke.org/modules.php?name=News&file=article&sid=8234&mode=thread&order=0&thold=0
 *
 * @param string $ts Timestamp whose first eight characters are YYYYMMDD
 *
 * @return int[] Hijri year, month and day, in that order
 */
private static function tsToHijri( $ts ) {
	$gYear = (int)substr( $ts, 0, 4 );
	$gMonth = (int)substr( $ts, 4, 2 );
	$gDay = (int)substr( $ts, 6, 2 );

	// Dates after 14 October 1582 use the first day-number formula, earlier ones the second
	$afterSwitch = $gYear > 1582
		|| ( $gYear == 1582 && ( $gMonth > 10 || ( $gMonth == 10 && $gDay > 14 ) ) );

	// All divisions below truncate towards zero
	if ( $afterSwitch ) {
		$monthShift = intdiv( $gMonth - 14, 12 );
		$dayNumber = intdiv( 1461 * ( $gYear + 4800 + $monthShift ), 4 )
			+ intdiv( 367 * ( $gMonth - 2 - 12 * $monthShift ), 12 )
			- intdiv( 3 * intdiv( $gYear + 4900 + $monthShift, 100 ), 4 )
			+ $gDay - 32075;
	} else {
		$dayNumber = 367 * $gYear
			- intdiv( 7 * ( $gYear + 5001 + intdiv( $gMonth - 9, 7 ) ), 4 )
			+ intdiv( 275 * $gMonth, 9 )
			+ $gDay + 1729777;
	}

	// Split the day count into blocks of 10631 days (30 Hijri years each),
	// then into a year inside the block, a month and a day
	$rest = $dayNumber - 1948440 + 10632;
	$cycles = intdiv( $rest - 1, 10631 );
	$rest = $rest - 10631 * $cycles + 354;
	$yearInCycle = intdiv( 10985 - $rest, 5316 ) * intdiv( 50 * $rest, 17719 )
		+ intdiv( $rest, 5670 ) * intdiv( 43 * $rest, 15238 );
	$rest = $rest
		- intdiv( 30 - $yearInCycle, 15 ) * intdiv( 17719 * $yearInCycle, 50 )
		- intdiv( $yearInCycle, 16 ) * intdiv( 15238 * $yearInCycle, 43 )
		+ 29;

	$hijriMonth = intdiv( 24 * $rest, 709 );
	$hijriDay = $rest - intdiv( 709 * $hijriMonth, 24 );
	$hijriYear = 30 * $cycles + $yearInCycle - 30;

	return [ $hijriYear, $hijriMonth, $hijriDay ];
}
1551
/**
 * Convert a Gregorian timestamp to a Hebrew date.
 *
 * Based on a JavaScript code by Abu Mami and Yisrael Hersch
 * (abu-mami@kaluach.net, http://www.kaluach.net), who permitted
 * to translate the relevant functions into PHP and release them under
 * GNU GPL.
 *
 * The months are counted from Tishrei = 1. In a leap year, Adar I is 13
 * and Adar II is 14. In a non-leap year, Adar is 6.
 *
 * @param string $ts Timestamp whose first eight characters are YYYYMMDD
 *
 * @return int[] Hebrew year, month, day of the month, and the number of
 *  days in that month, in that order
 */
private static function tsToHebrew( $ts ) {
	// Gregorian leap-year test, used at several points below
	$isGregorianLeap = static function ( $y ) {
		return $y % 400 == 0 || ( $y % 100 != 0 && $y % 4 == 0 );
	};

	$year = (int)substr( $ts, 0, 4 );
	$month = (int)substr( $ts, 4, 2 );
	$day = (int)substr( $ts, 6, 2 );

	$hebrewYear = $year + 3760;

	// Renumber the months so that September = 1 and August = 12.
	// September to December then belong to the following year.
	$month += 4;
	if ( $month > 12 ) {
		$month -= 12;
		$year++;
		$hebrewYear++;
	}

	// Day of the year, counted from 1 September
	$dayOfYear = $day;
	for ( $i = 1; $i < $month; $i++ ) {
		if ( $i == 6 ) {
			// February
			$dayOfYear += $isGregorianLeap( $year ) ? 29 : 28;
		} elseif ( in_array( $i, [ 1, 3, 8, 10 ], true ) ) {
			// September, November, April and June
			$dayOfYear += 30;
		} else {
			$dayOfYear += 31;
		}
	}

	$start = self::hebrewYearStart( $hebrewYear );

	if ( $dayOfYear <= $start ) {
		// The day precedes the start of this Hebrew year, so it belongs to
		// the previous one; what we computed is the start of the next year.
		$nextStart = $start;
		$year--;
		$hebrewYear--;
		// Add the days since the previous year's 1 September
		$dayOfYear += $isGregorianLeap( $year ) ? 366 : 365;
		$start = self::hebrewYearStart( $hebrewYear );
	} else {
		$nextStart = self::hebrewYearStart( $hebrewYear + 1 );
	}

	// Add 12 (or 13 for leap years) days to ignore the difference between
	// Hebrew and Gregorian year (353 at least vs. 365/6) - what remains
	// depends only on the type of the Hebrew year
	$diff = $nextStart - $start + ( $isGregorianLeap( $year ) ? 13 : 12 );

	// 0 means an incomplete year, 1 means a regular year, 2 means a complete year.
	// Taken mod 30 so that it works both for leap years (which add the
	// 30 days of Adar I) and for non-leap years.
	$yearPattern = $diff % 30;
	$isLeap = $diff >= 30;

	// Walk through the months, subtracting their lengths from the day of
	// the Hebrew year until the remainder fits into the current month
	$hebrewDay = $dayOfYear - $start;
	$hebrewMonth = 1;
	$days = 0;
	while ( $hebrewMonth <= 12 ) {
		if ( $isLeap && $hebrewMonth == 6 ) {
			// Leap year: Adar I has 30 days and Adar II has 29 days
			$days = 30;
			if ( $hebrewDay <= $days ) {
				// Day in Adar I
				$hebrewMonth = 13;
			} else {
				// Skip Adar I and try Adar II
				$hebrewDay -= $days;
				$days = 29;
				if ( $hebrewDay <= $days ) {
					// Day in Adar II
					$hebrewMonth = 14;
				}
			}
		} elseif ( $hebrewMonth == 2 && $yearPattern == 2 ) {
			// Cheshvan in a complete year
			$days = 30;
		} elseif ( $hebrewMonth == 3 && $yearPattern == 0 ) {
			// Kislev in an incomplete year
			$days = 29;
		} else {
			// Odd months have 30 days, even months have 29
			$days = $hebrewMonth % 2 === 1 ? 30 : 29;
		}

		if ( $hebrewDay <= $days ) {
			// The day falls in the current month
			break;
		}

		// Not in this month: drop its days and look at the next one
		$hebrewDay -= $days;
		$hebrewMonth++;
	}

	return [ $hebrewYear, $hebrewMonth, $hebrewDay, $days ];
}
1695
/**
 * Calculate the start of a Hebrew year, as days since 1 September.
 * Based on an algorithm by Carl Friedrich Gauss.
 * Used for Hebrew date.
 *
 * @param int $year Hebrew year
 *
 * @return int
 */
private static function hebrewYearStart( $year ) {
	$previous = $year - 1;
	$a = ( 12 * $previous + 17 ) % 19;
	$b = $previous % 4;
	$m = 32.044093161144 + 1.5542417966212 * $a + $b / 4.0 - 0.0031777940220923 * $previous;

	// Split $m into a whole part and a fractional part. A negative $m is
	// shifted down by one before truncation and shifted back afterwards.
	$wasNegative = $m < 0;
	if ( $wasNegative ) {
		$m--;
	}
	$march = (int)$m;
	if ( $wasNegative ) {
		$m++;
	}
	$fraction = $m - $march;

	// Postponements that depend on the weekday-like value $c
	$c = ( $march + 3 * $previous + 5 * $b + 5 ) % 7;
	if ( $c == 0 && $a > 11 && $fraction >= 0.89772376543210 ) {
		$march += 1;
	} elseif ( $c == 1 && $a > 6 && $fraction >= 0.63287037037037 ) {
		$march += 2;
	} elseif ( in_array( $c, [ 2, 4, 6 ], true ) ) {
		$march += 1;
	}

	// Century corrections, with divisions truncated towards zero
	$sinceEpoch = $year - 3761;
	return $march + (int)( $sinceEpoch / 100 ) - (int)( $sinceEpoch / 400 ) - 24;
}
1730
/**
 * Algorithm to convert Gregorian dates to Thai solar dates,
 * Minguo dates or Juche dates.
 *
 * Link: https://en.wikipedia.org/wiki/Thai_solar_calendar
 *       https://en.wikipedia.org/wiki/Minguo_calendar
 *
 * @param string $ts 14-character timestamp
 * @param string $cName Calendar name: 'thai', 'minguo' or 'juche'. Any
 *  other value leaves the Gregorian year unchanged.
 * @return array Converted year, month, day
 */
private static function tsToYear( $ts, $cName ) {
	$gy = (int)substr( $ts, 0, 4 );
	$gm = (int)substr( $ts, 4, 2 );
	$gd = (int)substr( $ts, 6, 2 );

	if ( $cName === 'thai' ) {
		# Thai solar dates
		# Add 543 years to the Gregorian calendar
		$gy_offset = $gy + 543;
		# fix for dates between 1912 and 1941, when the year started on 1 April
		# https://en.wikipedia.org/?oldid=836596673#New_year
		if ( $gy >= 1912 && $gy <= 1940 ) {
			if ( $gm <= 3 ) {
				# January to March still belong to the previous Thai year
				$gy_offset--;
			}
			# Renumber the months so that April = 1 and March = 12. A plain
			# "( $gm - 3 ) % 12" would yield -2, -1 and 0 for January to
			# March, because PHP's % keeps the sign of the dividend.
			$gm = ( $gm + 8 ) % 12 + 1;
		}
	} elseif ( $cName === 'minguo' || $cName === 'juche' ) {
		# Minguo and Juche dates
		# Deduct 1911 years from the Gregorian calendar
		# Months and days are identical
		$gy_offset = $gy - 1911;
	} else {
		$gy_offset = $gy;
	}

	return [ $gy_offset, $gm, $gd ];
}
1771
/**
 * Convert a Gregorian timestamp to a Japanese gengo (era) year.
 *
 * Link: https://en.wikipedia.org/wiki/Japanese_era_name
 *
 * @param string $ts 14-character timestamp
 * @return string Converted year
 */
private static function tsToJapaneseGengo( $ts ) {
	$gy = (int)substr( $ts, 0, 4 );
	$stamp = (int)$ts;

	// First timestamp of each era, the Gregorian year counted as its year 1,
	// and its name; newest era first. The months and days are identical.
	// Meiji is only used from 1873 on (Meiji 6), when the Gregorian year
	// came into use; it is still counted from 1868.
	$eras = [
		// Reiwa period
		[ 20190501000000, 2019, '令和' ],
		// Heisei period
		[ 19890108000000, 1989, '平成' ],
		// Shōwa period
		[ 19261225000000, 1926, '昭和' ],
		// Taishō period
		[ 19120730000000, 1912, '大正' ],
		// Meiji period
		[ 18730101000000, 1868, '明治' ],
	];

	foreach ( $eras as [ $eraStart, $firstYear, $eraName ] ) {
		if ( $stamp >= $eraStart ) {
			return self::tsToJapaneseGengoCalculate( $gy, $firstYear, $eraName );
		}
	}

	// Earlier than all eras handled here: plain Gregorian year with a prefix
	return "西暦$gy";
}
1805
/**
 * Build the Japanese gengo year string for a Gregorian year.
 *
 * Link: https://en.wikipedia.org/wiki/Japanese_era_name
 *
 * @param int $gy 4-digit Gregorian year
 * @param int $startYear 4-digit Gengo start year
 * @param string $gengo Actual Gengo string
 * @return string The gengo followed by the year within the era; the first
 *  year is written as '元' instead of 1
 */
private static function tsToJapaneseGengoCalculate( $gy, $startYear, $gengo ) {
	$yearInEra = $gy - $startYear + 1;
	$label = $yearInEra == 1 ? '元' : $yearInEra;

	return $gengo . $label;
}
1823
/**
 * Gets directionality of the first strongly directional codepoint, for embedBidi()
 *
 * This is the rule the BIDI algorithm uses to determine the directionality of
 * paragraphs ( https://www.unicode.org/reports/tr9/#The_Paragraph_Level ) and
 * FSI isolates ( https://www.unicode.org/reports/tr9/#Explicit_Directional_Isolates ).
 *
 * TODO: Does not handle BIDI control characters inside the text.
 * TODO: Does not handle unallocated characters.
 *
 * @param string $text Text to test
 * @return null|string Directionality ('ltr' or 'rtl') or null when the
 *  text does not match the strong-direction pattern
 */
private static function strongDirFromContent( $text = '' ) {
	$matches = [];
	if ( preg_match( self::$strongDirRegex, $text, $matches ) ) {
		// An empty first capture group means 'rtl', a non-empty one 'ltr'
		return $matches[1] === '' ? 'rtl' : 'ltr';
	}

	return null;
}
1846
/**
 * Format a number as a Roman numeral. Supports 1 to 10000.
 *
 * @param int $num
 *
 * @return string The Roman numeral, or the number in decimal digits when
 *  it is outside the supported range
 */
public static function romanNumeral( $num ) {
	// One row per decimal position (ones, tens, hundreds, thousands),
	// indexed by the digit at that position. The thousands row goes up
	// to 10 so that 10000 can be written.
	$numerals = [
		[ '', 'I', 'II', 'III', 'IV', 'V', 'VI', 'VII', 'VIII', 'IX', 'X' ],
		[ '', 'X', 'XX', 'XXX', 'XL', 'L', 'LX', 'LXX', 'LXXX', 'XC', 'C' ],
		[ '', 'C', 'CC', 'CCC', 'CD', 'D', 'DC', 'DCC', 'DCCC', 'CM', 'M' ],
		[ '', 'M', 'MM', 'MMM', 'MMMM', 'MMMMM', 'MMMMMM', 'MMMMMMM',
			'MMMMMMMM', 'MMMMMMMMM', 'MMMMMMMMMM' ]
	];

	$num = (int)$num;
	if ( $num <= 0 || $num > 10000 ) {
		return (string)$num;
	}

	$roman = '';
	for ( $position = 3; $position >= 0; $position-- ) {
		$unit = 10 ** $position;
		// A zero digit maps to the empty string, so no special case is needed
		$roman .= $numerals[$position][intdiv( $num, $unit )];
		$num %= $unit;
	}

	return $roman;
}
1877
/**
 * Format a number in Hebrew Gematria notation. Supports 1 to 9999.
 *
 * @param int $num
 *
 * @return string The Hebrew numeral, or the number in decimal digits when
 *  it is outside the supported range
 */
public static function hebrewNumeral( $num ) {
	$units = [ '', 'א', 'ב', 'ג', 'ד', 'ה', 'ו', 'ז', 'ח', 'ט', 'י' ];
	// One row per decimal position, indexed by the digit at that position.
	// Hundreds above 400 are written with several letters; thousands reuse
	// the letters of the ones.
	$glyphs = [
		$units,
		[ '', 'י', 'כ', 'ל', 'מ', 'נ', 'ס', 'ע', 'פ', 'צ', 'ק' ],
		[ '',
			[ 'ק' ],
			[ 'ר' ],
			[ 'ש' ],
			[ 'ת' ],
			[ 'ת', 'ק' ],
			[ 'ת', 'ר' ],
			[ 'ת', 'ש' ],
			[ 'ת', 'ת' ],
			[ 'ת', 'ת', 'ק' ],
			[ 'ת', 'ת', 'ר' ],
		],
		$units,
	];

	$num = (int)$num;
	if ( $num <= 0 || $num > 9999 ) {
		return (string)$num;
	}

	// Round thousands have special notations
	if ( $num === 1000 ) {
		return "א' אלף";
	}
	if ( $num % 1000 === 0 ) {
		return $units[intdiv( $num, 1000 )] . "' אלפים";
	}

	$letters = [];
	for ( $position = 3; $position >= 0; $position-- ) {
		$unit = 10 ** $position;
		if ( $num >= $unit ) {
			if ( $num === 15 || $num === 16 ) {
				// 15 and 16 are written as 9+6 and 9+7
				$letters[] = $units[9];
				$letters[] = $units[$num - 9];
				$num = 0;
			} else {
				foreach ( (array)$glyphs[$position][intdiv( $num, $unit )] as $letter ) {
					$letters[] = $letter;
				}
				if ( $position === 3 ) {
					// Separate the thousands from the rest
					$letters[] = "'";
				}
			}
		}
		$num %= $unit;
	}

	$letterCount = count( $letters );
	if ( $letterCount === 1 ) {
		// Add geresh (single quote) to one-letter numbers
		$letters[] = "'";
		return implode( $letters );
	}

	// Use the final form of the last letter where it has one
	$lastIndex = $letterCount - 1;
	$letters[$lastIndex] = strtr(
		$letters[$lastIndex],
		[ 'כ' => 'ך', 'מ' => 'ם', 'נ' => 'ן', 'פ' => 'ף', 'צ' => 'ץ' ]
	);

	// Add gershayim (double quote) to multiple-letter numbers,
	// but exclude numbers with only one letter after the thousands
	// (1001-1009, 1020, 1030, 2001-2009, etc.)
	if ( $letterCount === 3 && $letters[1] === "'" ) {
		$letters[] = "'";
	} else {
		array_splice( $letters, -1, 0, '"' );
	}

	return implode( $letters );
}
1962
/**
 * Used by date() and time() to adjust the time output.
 *
 * The timestamp is always interpreted as UTC, whether the correction
 * resolves to a named time zone or to a fixed offset in minutes.
 *
 * @param string $ts The time in date('YmdHis') format
 * @param string|false $tz Adjust the time by this amount (default false, mean we
 *   get user timecorrection setting)
 * @return string The adjusted time in date('YmdHis') format
 */
public function userAdjust( $ts, $tz = false ) {
	$localTZoffset = $this->config->get( MainConfigNames::LocalTZoffset );
	if ( $tz === false ) {
		$optionsLookup = MediaWikiServices::getInstance()->getUserOptionsLookup();
		$tz = $optionsLookup->getOption(
			RequestContext::getMain()->getUser(),
			'timecorrection'
		);
	}

	$timeCorrection = new UserTimeCorrection( (string)$tz, null, $localTZoffset );
	$utc = new DateTimeZone( 'UTC' );

	$tzObj = $timeCorrection->getTimeZone();
	if ( $tzObj ) {
		$date = new DateTime( $ts, $utc );
		$date->setTimezone( $tzObj );
		return self::makeMediaWikiTimestamp( $ts, $date );
	}
	$minDiff = $timeCorrection->getTimeOffset();

	# No difference? Return the time unchanged
	if ( $minDiff === 0 ) {
		return $ts;
	}

	# Parse as UTC rather than in the process default time zone, so that
	# adding the offset is plain arithmetic and cannot be skewed by a
	# daylight saving transition of the server's zone
	$date = new DateTime( $ts, $utc );
	$date->modify( "{$minDiff} minutes" );
	return self::makeMediaWikiTimestamp( $ts, $date );
}
2000
/**
 * Turn a PHP DateTime object into a 14-character MediaWiki timestamp.
 * If formatting the object does not yield exactly 14 characters, which happens when it
 * holds a too large date (T32148, T277809), the given fallback is returned instead.
 * This is a private utility method as it is only really useful for {@link userAdjust}.
 *
 * @param string $fallback 14-character MW timestamp to fall back to if the DateTime object holds a too large date
 * @param DateTime $date The DateTime object to convert
 * @return string 14-character MW timestamp
 */
private static function makeMediaWikiTimestamp( $fallback, $date ) {
	$formatted = $date->format( 'YmdHis' );
	if ( strlen( $formatted ) !== 14 ) {
		return $fallback;
	}

	return $formatted;
}
2014
/**
 * This is meant to be used by time(), date(), and timeanddate() to get
 * the date preference they're supposed to use. It should be used in
 * all children.
 *
 *     function timeanddate([...], $format = true) {
 *       $datePreference = $this->dateFormat($format);
 *       [...]
 *     }
 *
 * @param int|string|bool $usePrefs If true, the date preference of the user
 *   of the main request context is used
 *   if false, the default value of the 'date' user option is used
 *   if int/string, assumed to be a format.
 * @return string The format name; 'default' when it would otherwise be empty
 */
public function dateFormat( $usePrefs = true ) {
	if ( $usePrefs === true ) {
		$datePreference = RequestContext::getMain()
			->getUser()
			->getDatePreference();
	} elseif ( $usePrefs === false ) {
		$datePreference = (string)MediaWikiServices::getInstance()
			->getUserOptionsLookup()
			->getDefaultOption( 'date' );
	} else {
		$datePreference = (string)$usePrefs;
	}

	return $datePreference == '' ? 'default' : $datePreference;
}
2051
/**
 * Get a format string for a given type and preference
 *
 * Results are remembered in $this->dateFormatStrings. When the requested
 * preference has no format of the given type, the default date format is
 * used instead; a missing 'pretty' format is first replaced by the 'date'
 * format of the same preference.
 *
 * @param string $type One of 'date', 'time', 'both', or 'pretty'.
 * @param string $pref The format name as it appears in Messages*.php under
 *  $datePreferences.
 *
 * @since 1.22 New type 'pretty' that provides a more readable timestamp format
 *
 * @return string
 */
public function getDateFormatString( $type, $pref ) {
	$isDefault = ( $pref == 'default' );
	if ( $isDefault ) {
		$pref = $this->getDefaultDateFormat();
	}

	if ( isset( $this->dateFormatStrings[$type][$pref] ) ) {
		return $this->dateFormatStrings[$type][$pref];
	}

	$df = $this->localisationCache
		->getSubitem( $this->mCode, 'dateFormats', "$pref $type" );

	if ( $df === null && $type === 'pretty' ) {
		$df = $this->getDateFormatString( 'date', $pref );
	}

	if ( $df === null && !$isDefault ) {
		// Unknown preference: fall back to the default format. The result
		// is stored under the default format's name.
		$pref = $this->getDefaultDateFormat();
		$df = $this->localisationCache
			->getSubitem( $this->mCode, 'dateFormats', "$pref $type" );
	}

	$this->dateFormatStrings[$type][$pref] = $df;

	return $df;
}
2087
/**
 * Format the date part of a timestamp.
 *
 * @param string $ts The time format which needs to be turned into a
 *   date('YmdHis') format with wfTimestamp(TS_MW,$ts)
 * @param bool $adj Whether to adjust the time output according to the
 *   user configured offset ($timecorrection)
 * @param mixed $format True to use user's date format preference
 * @param string|false $timecorrection The time offset as returned by
 *   validateTimeZone() in Special:Preferences
 * @return string
 */
public function date( $ts, $adj = false, $format = true, $timecorrection = false ) {
	$mwTs = wfTimestamp( TS_MW, $ts );
	$mwTs = $adj ? $this->userAdjust( $mwTs, $timecorrection ) : $mwTs;

	return $this->sprintfDate(
		$this->getDateFormatString( 'date', $this->dateFormat( $format ) ),
		$mwTs
	);
}
2106
/**
 * Format the time part of a timestamp.
 *
 * @param string $ts The time format which needs to be turned into a
 *   date('YmdHis') format with wfTimestamp(TS_MW,$ts)
 * @param bool $adj Whether to adjust the time output according to the
 *   user configured offset ($timecorrection)
 * @param mixed $format True to use user's date format preference
 * @param string|false $timecorrection The time offset as returned by
 *   validateTimeZone() in Special:Preferences
 * @return string
 */
public function time( $ts, $adj = false, $format = true, $timecorrection = false ) {
	$mwTs = wfTimestamp( TS_MW, $ts );
	$mwTs = $adj ? $this->userAdjust( $mwTs, $timecorrection ) : $mwTs;

	return $this->sprintfDate(
		$this->getDateFormatString( 'time', $this->dateFormat( $format ) ),
		$mwTs
	);
}
2125
/**
 * Format both the date and the time of a timestamp.
 *
 * @param string $ts The time format which needs to be turned into a
 *   date('YmdHis') format with wfTimestamp(TS_MW,$ts)
 * @param bool $adj Whether to adjust the time output according to the
 *   user configured offset ($timecorrection)
 * @param mixed $format What date format to return the result in; if it's false output the
 *   default one (default true)
 * @param string|false $timecorrection The time offset as returned by
 *   validateTimeZone() in Special:Preferences
 * @return string
 */
public function timeanddate( $ts, $adj = false, $format = true, $timecorrection = false ) {
	$mwTs = wfTimestamp( TS_MW, $ts );
	$mwTs = $adj ? $this->userAdjust( $mwTs, $timecorrection ) : $mwTs;

	return $this->sprintfDate(
		$this->getDateFormatString( 'both', $this->dateFormat( $format ) ),
		$mwTs
	);
}
2145
/**
 * Describe a number of seconds in words, using units such as hours and minutes.
 *
 * @since 1.20
 *
 * @param int $seconds The number of seconds.
 * @param array $chosenIntervals The intervals to enable.
 *
 * @return string
 */
public function formatDuration( $seconds, array $chosenIntervals = [] ) {
	$segments = [];

	foreach ( $this->getDurationIntervals( $seconds, $chosenIntervals ) as $unit => $amount ) {
		// Messages: duration-seconds, duration-minutes, duration-hours, duration-days, duration-weeks,
		// duration-years, duration-decades, duration-centuries, duration-millennia
		$segments[] = $this->msg( 'duration-' . $unit )->numParams( $amount )->escaped();
	}

	return $this->listToText( $segments );
}
2170
/**
 * Describe the difference between two timestamps in words, using units such as hours and minutes.
 *
 * The order of the two timestamps does not matter.
 *
 * @param int $timestamp1 The first timestamp.
 * @param int $timestamp2 The second timestamp.
 * @param ?int $precision The number of intervals to show. Defaults to the
 *  number of entries in self::DURATION_INTERVALS.
 *
 * @return string
 */
public function formatDurationBetweenTimestamps(
	int $timestamp1,
	int $timestamp2,
	?int $precision = null
): string {
	$precision ??= count( self::DURATION_INTERVALS );

	$earlier = ( new DateTimeImmutable() )->setTimestamp( min( $timestamp1, $timestamp2 ) );
	$later = ( new DateTimeImmutable() )->setTimestamp( max( $timestamp1, $timestamp2 ) );
	$interval = $earlier->diff( $later );

	$parts = [];

	// Split large year counts into millennia, centuries and decades,
	// leaving the remainder in the interval's year field.
	// Messages: duration-millennia, duration-centuries, duration-decades
	$yearMultiples = [
		'duration-millennia' => 1000,
		'duration-centuries' => 100,
		'duration-decades' => 10,
	];
	foreach ( $yearMultiples as $messageKey => $yearsPerUnit ) {
		if ( $interval->y >= $yearsPerUnit ) {
			$count = floor( $interval->y / $yearsPerUnit );
			$parts[] = $this->msg( $messageKey )->numParams( $count )->text();
			$interval->y -= $count * $yearsPerUnit;
		}
	}

	// The remaining fields of the interval, largest unit first; zero values are left out.
	// Messages: duration-years, duration-months, duration-days, duration-hours,
	// duration-minutes, duration-seconds
	$fields = [
		'y' => 'duration-years',
		'm' => 'duration-months',
		'd' => 'duration-days',
		'h' => 'duration-hours',
		'i' => 'duration-minutes',
		's' => 'duration-seconds',
	];
	foreach ( $fields as $field => $messageKey ) {
		if ( $interval->$field !== 0 ) {
			$parts[] = $this->msg( $messageKey )->numParams( $interval->$field )->text();
		}
	}

	// Keep only as many units as the precision allows, then join them
	$text = $this->listToText( array_slice( $parts, 0, $precision ) );

	// Nothing to show: report zero seconds
	return $text ?: $this->msg( 'duration-seconds' )->numParams( 0 )->text();
}
2237
/**
 * Takes a number of seconds and returns an array with a set of corresponding intervals.
 * For example, 65 will be turned into [ minutes => 1, seconds => 5 ].
 *
 * Intervals with a value of zero are left out, except that the smallest
 * enabled interval is reported when nothing else would be.
 *
 * @since 1.20
 *
 * @param int $seconds The number of seconds.
 * @param array $chosenIntervals The intervals to enable. Names that are not
 *  keys of self::DURATION_INTERVALS are ignored.
 *
 * @return int[] Interval values keyed by interval name, in the order of
 *  self::DURATION_INTERVALS
 */
public function getDurationIntervals( $seconds, array $chosenIntervals = [] ) {
	if ( !$chosenIntervals ) {
		// Default intervals. Do not include `months` as they were not part of the original default implementation
		$chosenIntervals = [
			'millennia',
			'centuries',
			'decades',
			'years',
			'days',
			'hours',
			'minutes',
			'seconds'
		];
	}

	$intervals = array_intersect_key( self::DURATION_INTERVALS,
		array_fill_keys( $chosenIntervals, true ) );
	// Null when none of the chosen names is a known interval
	$smallestInterval = array_key_last( $intervals );

	$segments = [];

	foreach ( $intervals as $name => $length ) {
		// floor() returns a float; cast so that the result really is int[] as documented
		$value = (int)floor( $seconds / $length );

		if ( $value > 0 || ( $name === $smallestInterval && !$segments ) ) {
			$seconds -= $value * $length;
			$segments[$name] = $value;
		}
	}

	return $segments;
}
2282
/**
 * Internal helper function for userDate(), userTime() and userTimeAndDate()
 *
 * @param string $type Can be 'date', 'time' or 'both'
 * @param string $ts The time format which needs to be turned into a
 *   date('YmdHis') format with wfTimestamp(TS_MW,$ts)
 * @param UserIdentity $user User used to get preferences for timezone and format
 * @param array $options Array, can contain the following keys (both default to true):
 *   - 'timecorrection': time correction, can have the following values:
 *     - true: use user's preference
 *     - false: don't use time correction
 *     - int: value of time correction in minutes
 *   - 'format': format to use, can have the following values:
 *     - true: use user's preference
 *     - false: use default preference
 *     - string: format to use
 * @since 1.19
 * @return string
 */
private function internalUserTimeAndDate( $type, $ts, UserIdentity $user, array $options ) {
	$ts = wfTimestamp( TS_MW, $ts );
	$options += [ 'timecorrection' => true, 'format' => true ];

	$correction = $options['timecorrection'];
	if ( $correction !== false ) {
		if ( $correction === true ) {
			// Look up the user's own time correction
			$correction = MediaWikiServices::getInstance()
				->getUserOptionsLookup()
				->getOption( $user, 'timecorrection' );
		}
		$ts = $this->userAdjust( $ts, $correction );
	}

	$format = $options['format'];
	if ( $format === true ) {
		// Look up the user's own date preference
		$format = MediaWikiServices::getInstance()
			->getUserFactory()
			->newFromUserIdentity( $user )
			->getDatePreference();
	}

	return $this->sprintfDate(
		$this->getDateFormatString( $type, $this->dateFormat( $format ) ),
		$ts
	);
}
2326
2327	/**
2328	* Get the formatted date for the given timestamp and formatted for
2329	* the given user.
2330	*
2331	* @param mixed $ts Mixed: the time format which needs to be turned into a
2332	* date('YmdHis') format with wfTimestamp(TS_MW,$ts)
2333	* @param UserIdentity $user User used to get preferences for timezone and format
2334	* @param array $options Array, can contain the following keys:
2335	* - 'timecorrection': time correction, can have the following values:
2336	* - true: use user's preference
2337	* - false: don't use time correction
2338	* - int: value of time correction in minutes
2339	* - 'format': format to use, can have the following values:
2340	* - true: use user's preference
2341	* - false: use default preference
2342	* - string: format to use
2343	* @since 1.19
2344	* @return string
2345	*/
2346	public function userDate( $ts, UserIdentity $user, array $options = [] ) {
	// Thin wrapper: delegate to the shared formatter with the 'date' format type.
2347	return $this->internalUserTimeAndDate( 'date', $ts, $user, $options );
2348	}
2349
2350	/**
2351	* Get the formatted time for the given timestamp and formatted for
2352	* the given user.
2353	*
2354	* @param mixed $ts The time format which needs to be turned into a
2355	* date('YmdHis') format with wfTimestamp(TS_MW,$ts)
2356	* @param UserIdentity $user User used to get preferences for timezone and format
2357	* @param array $options Array, can contain the following keys:
2358	* - 'timecorrection': time correction, can have the following values:
2359	* - true: use user's preference
2360	* - false: don't use time correction
2361	* - int: value of time correction in minutes
2362	* - 'format': format to use, can have the following values:
2363	* - true: use user's preference
2364	* - false: use default preference
2365	* - string: format to use
2366	* @since 1.19
2367	* @return string
2368	*/
2369	public function userTime( $ts, UserIdentity $user, array $options = [] ) {
	// Thin wrapper: delegate to the shared formatter with the 'time' format type.
2370	return $this->internalUserTimeAndDate( 'time', $ts, $user, $options );
2371	}
2372
2373	/**
2374	* Get the formatted date and time for the given timestamp and formatted for
2375	* the given user.
2376	*
2377	* @param mixed $ts The time format which needs to be turned into a
2378	* date('YmdHis') format with wfTimestamp(TS_MW,$ts)
2379	* @param UserIdentity $user User used to get preferences for timezone and format
2380	* @param array $options Array, can contain the following keys:
2381	* - 'timecorrection': time correction, can have the following values:
2382	* - true: use user's preference
2383	* - false: don't use time correction
2384	* - int: value of time correction in minutes
2385	* - 'format': format to use, can have the following values:
2386	* - true: use user's preference
2387	* - false: use default preference
2388	* - string: format to use
2389	* @since 1.19
2390	* @return string
2391	*/
2392	public function userTimeAndDate( $ts, UserIdentity $user, array $options = [] ) {
	// Thin wrapper: delegate to the shared formatter with the 'both' format type.
2393	return $this->internalUserTimeAndDate( 'both', $ts, $user, $options );
2394	}
2395
2396	/**
2397	* Get the timestamp in a human-friendly relative format, e.g., "3 days ago".
2398	*
2399	* Determine the difference between the timestamp and the current time, and
2400	* generate a readable timestamp by returning "<N> <units> ago", where the
2401	* largest possible unit is used.
2402	*
2403	* @since 1.26 (Prior to 1.26, the method existed but was not meant to be used directly)
2404	*
2405	* @param MWTimestamp $time
2406	* @param MWTimestamp\|null $relativeTo The base timestamp to compare to (defaults to now)
2407	* @param UserIdentity\|null $user User the timestamp is being generated for
2408	* (or null to use main context's user)
2409	* @return string Formatted timestamp
2410	*/
public function getHumanTimestamp(
	MWTimestamp $time, ?MWTimestamp $relativeTo = null, ?UserIdentity $user = null
) {
	if ( $relativeTo === null ) {
		// No base supplied: use a freshly constructed MWTimestamp.
		$relativeTo = new MWTimestamp();
	}

	// The hook and self::getHumanTimestampInternal both receive a User object,
	// so a plain UserIdentity is converted first.
	$user = $user === null
		? RequestContext::getMain()->getUser()
		: MediaWikiServices::getInstance()
			->getUserFactory()
			->newFromUserIdentity( $user );

	// Adjust both timestamps for the user's timezone, keeping the offsets
	// so the adjustment can be undone below.
	$timeOffset = $time->offsetForUser( $user );
	$baseOffset = $relativeTo->offsetForUser( $user );

	// The internal formatter only runs when the hook returns a truthy value;
	// otherwise $humanTs is returned as the hook left it
	// (presumably filled in by reference - confirm against the hook interface).
	$humanTs = '';
	$useDefault = $this->getHookRunner()
		->onGetHumanTimestamp( $humanTs, $time, $relativeTo, $user, $this );
	if ( $useDefault ) {
		$humanTs = $this->getHumanTimestampInternal( $time, $relativeTo, $user );
	}

	// Reset the timezone on the objects.
	$time->timestamp->sub( $timeOffset );
	$relativeTo->timestamp->sub( $baseOffset );

	return $humanTs;
}
2439
2440	/**
2441	* Convert an MWTimestamp into a pretty human-readable timestamp using
2442	* the given user preferences and relative base time.
2443	*
2444	* @see Language::getHumanTimestamp
2445	* @param MWTimestamp $ts Timestamp to prettify
2446	* @param MWTimestamp $relativeTo Base timestamp
2447	* @param User $user User preferences to use
2448	* @return string Human timestamp
2449	* @since 1.26
2450	*/
private function getHumanTimestampInternal(
	MWTimestamp $ts, MWTimestamp $relativeTo, User $user
) {
	$diff = $ts->diff( $relativeTo );

	// When the interval reports zero whole days, still count one day if the
	// two timestamps fall on different weekdays.
	$weekdayOfTs = (int)$ts->timestamp->format( 'w' );
	$weekdayOfBase = (int)$relativeTo->timestamp->format( 'w' );
	$days = $diff->days ?: (int)( $weekdayOfTs !== $weekdayOfBase );

	// Formats $ts with the user's date preference for the given format type.
	// Evaluated lazily so the preference is only read by branches that need it.
	$render = fn ( $type ) => $this->sprintfDate(
		$this->getDateFormatString( $type, $user->getDatePreference() ?: 'default' ),
		$ts->getTimestamp( TS_MW )
	);

	if ( $diff->invert ) {
		// Future dates: Use full timestamp
		// @todo FIXME: Add better handling of future timestamps.
		return $render( 'both' );
	}

	if ( $days > 5 ) {
		// More than 5 days apart: full date when the years differ,
		// day and month only when they are in the same year.
		$sameYear = $ts->timestamp->format( 'Y' ) === $relativeTo->timestamp->format( 'Y' );
		return $render( $sameYear ? 'pretty' : 'date' );
	}

	if ( $days > 1 ) {
		// Timestamp within the past 5 days: show the day of the week and time
		$clock = $render( 'time' );
		$weekday = self::WEEKDAY_MESSAGES[$weekdayOfTs];
		// The following messages are used here:
		// * sunday-at, monday-at, tuesday-at, wednesday-at, thursday-at, friday-at, saturday-at
		return $this->msg( "$weekday-at" )->params( $clock )->text();
	}

	if ( $days == 1 ) {
		// Timestamp was yesterday: say 'yesterday' and the time.
		$clock = $render( 'time' );
		return $this->msg( 'yesterday-at' )->params( $clock )->text();
	}

	if ( $diff->h > 1 || ( $diff->h == 1 && $diff->i > 30 ) ) {
		// Timestamp was today, but more than 90 minutes ago: say 'today' and the time.
		$clock = $render( 'time' );
		return $this->msg( 'today-at' )->params( $clock )->text();
	}

	// From here on in, the timestamp was soon enough ago so that we can simply say
	// XX units ago, e.g., "2 hours ago" or "5 minutes ago"
	if ( $diff->h == 1 ) {
		// Less than 90 minutes, but more than an hour ago.
		return $this->msg( 'hours-ago' )->numParams( 1 )->text();
	}

	if ( $diff->i >= 1 ) {
		// A few minutes ago.
		return $this->msg( 'minutes-ago' )->numParams( $diff->i )->text();
	}

	if ( $diff->s >= 30 ) {
		// Less than a minute, but more than 30 sec ago.
		return $this->msg( 'seconds-ago' )->numParams( $diff->s )->text();
	}

	// Less than 30 seconds ago.
	return $this->msg( 'just-now' )->text();
}
2517
2518	/**
2519	* Gets the localized friendly name for a group, if it exists. For example,
2520	* "Administrators" or "Bureaucrats"
2521	*
2522	* @since 1.38
2523	* @param string $group Internal group name
2524	* @return string Localized friendly group name
2525	*/
public function getGroupName( $group ) {
	$label = $this->msg( "group-$group" );
	if ( $label->isBlank() ) {
		// No usable "group-<name>" message: fall back to the internal name.
		return $group;
	}
	return $label->text();
}
2530
2531	/**
2532	* Gets the localized name for a member of a user group if it exists.
2533	* For example, "administrator" or "bureaucrat"
2534	*
2535	* @since 1.38
2536	* @param string $group Internal group name
2537	* @param string\|UserIdentity $member
2538	* @return string Localized name for group member
2539	*/
public function getGroupMemberName( string $group, $member ) {
	// The message parameter is the member's name, so unwrap UserIdentity objects.
	$memberName = $member instanceof UserIdentity ? $member->getName() : $member;

	$label = $this->msg( "group-$group-member", $memberName );
	if ( $label->isBlank() ) {
		// No usable "group-<name>-member" message: fall back to the internal group name.
		return $group;
	}
	return $label->text();
}
2547
2548	/**
2549	* @deprecated since 1.41, use LocalisationCache or MessageCache as appropriate.
2550	* @param string $key
2551	* @return string\|null
2552	*/
2553	public function getMessage( $key ) {
	// Fetch the single entry $key from the 'messages' item cached for this language code.
2554	return $this->localisationCache->getSubitem( $this->mCode, 'messages', $key );
2555	}
2556
2557	/**
2558	* @deprecated since 1.41, use LocalisationCache directly.
2559	* @return string[]
2560	*/
2561	public function getAllMessages() {
	// Fetch the whole 'messages' item cached for this language code.
2562	return $this->localisationCache->getItem( $this->mCode, 'messages' );
2563	}
2564
2565	/**
2566	* @param string $in
2567	* @param string $out
2568	* @param string $string
2569	* @return string
2570	*/
public function iconv( $in, $out, $string ) {
	# Even with //IGNORE iconv can whine about illegal characters in
	# input string. We just ignore those too.
	# REF: https://bugs.php.net/bug.php?id=37166
	# REF: https://phabricator.wikimedia.org/T18885
	AtEase::suppressWarnings();
	try {
		return iconv( $in, $out . '//IGNORE', $string );
	} finally {
		// Always pair the suppressWarnings() call above with a restore, even
		// if iconv() throws (e.g. a TypeError for bad argument types on PHP 8);
		// otherwise warnings would stay suppressed for the rest of the request.
		AtEase::restoreWarnings();
	}
}
2581
2582	/**
2583	* @param string $str
2584	* @return string The string with uppercase conversion applied to the first character
2585	*/
public function ucfirst( $str ) {
	$leadByte = ord( $str );

	// See https://en.wikipedia.org/wiki/ASCII#Printable_characters
	if ( $leadByte < 96 ) {
		// Assume this is an uppercase/uncased ASCII character
		return (string)$str;
	}
	if ( $leadByte < 128 ) {
		// Assume this is a lowercase/uncased ASCII character
		return ucfirst( $str );
	}

	$initial = mb_substr( $str, 0, 1 );
	if ( strlen( $initial ) === 1 ) {
		// A non-ASCII lead byte that forms a one-byte "character": broken UTF-8?
		return ucfirst( $str );
	}

	// Memoize the config table on first use
	$this->overrideUcfirstCharacters ??=
		$this->config->get( MainConfigNames::OverrideUcfirstCharacters );
	$table = $this->overrideUcfirstCharacters;

	// Use the config table and fall back to MB_CASE_TITLE
	$upper = $table[$initial] ?? mb_convert_case( $initial, MB_CASE_TITLE );

	// Hand back the input untouched when the first character does not change.
	return $upper === $initial ? $str : $upper . mb_substr( $str, 1 );
}
2614
2615	/**
2616	* @param string $str
2617	* @param bool $first Whether to uppercase only the first character
2618	* @return string The string with uppercase conversion applied
2619	*/
public function uc( $str, $first = false ) {
	if ( $first ) {
		return $this->ucfirst( $str );
	}
	// Only use the multibyte routine when the string contains multibyte characters.
	if ( $this->isMultibyte( $str ) ) {
		return mb_strtoupper( $str );
	}
	return strtoupper( $str );
}
2627
2628	/**
2629	* @param string $str
2630	* @return string The string with lowercase conversion applied to the first character
2631	*/
public function lcfirst( $str ) {
	$leadByte = ord( $str );

	// See https://en.wikipedia.org/wiki/ASCII#Printable_characters
	if ( $leadByte < 96 ) {
		// Assume this is an uppercase/uncased ASCII character
		return lcfirst( $str );
	}
	if ( $leadByte < 128 ) {
		// Assume this is a lowercase/uncased ASCII character
		return (string)$str;
	}

	if ( !$this->isMultibyte( $str ) ) {
		// Assume this is a non-multibyte character and LC_CASE is appropriate
		return lcfirst( $str );
	}

	// Assume this is a multibyte character and mb_internal_encoding() is appropriate
	return mb_strtolower( mb_substr( $str, 0, 1 ) ) . mb_substr( $str, 1 );
}
2649
2650	/**
2651	* @param string $str
2652	* @param bool $first Whether to lowercase only the first character
2653	* @return string The string with lowercase conversion applied
2654	*/
public function lc( $str, $first = false ) {
	if ( $first ) {
		return $this->lcfirst( $str );
	}
	// Only use the multibyte routine when the string contains multibyte characters.
	if ( $this->isMultibyte( $str ) ) {
		return mb_strtolower( $str );
	}
	return strtolower( $str );
}
2662
2663	/**
2664	* @param string $str
2665	* @return bool
2666	*/
private function isMultibyte( $str ) {
	// The byte count and the character count differ exactly when at least
	// one character takes more than one byte.
	$byteCount = strlen( $str );
	$charCount = mb_strlen( $str );
	return $byteCount !== $charCount;
}
2670
2671	/**
2672	* @param string $str
2673	* @return mixed\|string
2674	*/
public function ucwords( $str ) {
	if ( !$this->isMultibyte( $str ) ) {
		// Single-byte input: the native functions are sufficient.
		return ucwords( strtolower( $str ) );
	}

	$str = $this->lc( $str );

	// regexp to find the first letter in each word (i.e., after each space).
	// A non-ASCII letter is a lead byte followed by ANY number of continuation
	// bytes: the "*" is required so that 3- and 4-byte UTF-8 characters are
	// captured whole. Matching only one continuation byte would hand an
	// incomplete sequence to mb_strtoupper() below.
	$replaceRegexp = "/^([a-z]|[\\xc0-\\xff][\\x80-\\xbf]*)| ([a-z]|[\\xc0-\\xff][\\x80-\\xbf]*)/";

	// $matches[0] is the whole match, including the leading space (if any),
	// which mb_strtoupper() leaves unchanged.
	return preg_replace_callback(
		$replaceRegexp,
		static function ( $matches ) {
			return mb_strtoupper( $matches[0] );
		},
		$str
	);
}
2694
2695	/**
2696	* capitalize words at word breaks
2697	*
2698	* @param string $str
2699	* @return mixed
2700	*/
public function ucwordbreaks( $str ) {
	if ( !$this->isMultibyte( $str ) ) {
		// Single-byte input: \b works, so upper-case the start of every word run.
		return preg_replace_callback(
			'/\b([\w\x80-\xff]+)\b/',
			function ( $word ) {
				return $this->ucfirst( $word[1] );
			},
			$str
		);
	}

	$lowered = $this->lc( $str );

	// since \b doesn't work for UTF-8, we explicitly define word break chars
	$breaks = "[ \-\}\{\.,\?!]";

	// find the first letter at the start of the string or after a word break
	$replaceRegexp = "/^([a-z]|[\\xc0-\\xff][\\x80-\\xbf]*)|" .
		"$breaks([a-z]|[\\xc0-\\xff][\\x80-\\xbf]*)/";

	// The whole match (break character included) is upper-cased.
	return preg_replace_callback(
		$replaceRegexp,
		static function ( $hit ) {
			return mb_strtoupper( $hit[0] );
		},
		$lowered
	);
}
2729
2730	/**
2731	* Return a case-folded representation of $s
2732	*
2733	* This is a representation such that caseFold($s1) == caseFold($s2) if $s1
2734	* and $s2 are the same except for the case of their characters. It is not
2735	* necessary for the value returned to make sense when displayed.
2736	*
2737	* Do not perform any other normalisation in this function. If a caller
2738	* uses this function when it should be using a more general normalisation
2739	* function, then fix the caller.
2740	*
2741	* @param string $s
2742	*
2743	* @return string
2744	*/
2745	public function caseFold( $s ) {
	// Folding is implemented as full upper-casing via uc().
2746	return $this->uc( $s );
2747	}
2748
2749	/**
2750	* @param string $s
2751	* @return string
2752	*/
public function checkTitleEncoding( string $s ) {
	// Valid UTF-8 passes through untouched; anything else is converted to
	// UTF-8 from this language's fallback 8-bit encoding.
	return StringUtils::isUtf8( $s )
		? $s
		: $this->iconv( $this->fallback8bitEncoding(), 'utf-8', $s );
}
2760
2761	/**
2762	* @return string
2763	*/
2764	public function fallback8bitEncoding() {
	// Read the 'fallback8bitEncoding' item cached for this language code.
2765	return $this->localisationCache->getItem( $this->mCode, 'fallback8bitEncoding' );
2766	}
2767
2768	/**
2769	* Most writing systems use whitespace to break up words.
2770	* Some languages such as Chinese don't conventionally do this,
2771	* which requires special handling when breaking up words for
2772	* searching, etc.
2773	*
2774	* @return bool
2775	*/
2776	public function hasWordBreaks() {
	// This implementation always answers true.
2777	return true;
2778	}
2779
2780	/**
2781	* Some languages such as Chinese require word segmentation,
2782	* Specify such segmentation when overridden in derived class.
2783	*
2784	* @param string $string
2785	* @return string
2786	*/
2787	public function segmentByWord( $string ) {
	// No segmentation here: the input is returned unchanged.
2788	return $string;
2789	}
2790
2791	/**
2792	* Specify the language variant that should be used for search indexing.
2793	*
2794	* @return string\|null
2795	*/
2796	protected function getSearchIndexVariant() {
	// No variant here; normalizeForSearch() skips conversion when this is falsy.
2797	return null;
2798	}
2799
2800	/**
2801	* Some languages have special punctuation that needs to be normalized.
2802	* Make such changes here.
2803	*
2804	* Some languages such as Chinese have many-to-one conversions,
2805	* e.g., it should be better to use zh-hans for search, since conversion
2806	* from zh-hant to zh-hans is less ambiguous than the other way around.
2807	*
2808	* @param string $text
2809	* @return string
2810	*/
public function normalizeForSearch( $text ) {
	$normalized = self::convertDoubleWidth( $text );

	if ( !$this->getSearchIndexVariant() ) {
		// No search index variant configured: width folding is all that is done.
		return $normalized;
	}

	// Additionally convert the text into the search index variant.
	return $this->getConverterInternal()->autoConvert(
		$normalized,
		$this->getSearchIndexVariant()
	);
}
2818
2819	/**
2820	* Convert double-width roman characters to single-width.
2821	* range: ff00-ff5f ~= 0020-007f
2822	*
2823	* @param string $string
2824	* @return string
2825	*/
protected static function convertDoubleWidth( $string ) {
	// The translation table is built once and kept in a static local.
	static $wideToNarrow = null;

	if ( $wideToNarrow === null ) {
		// The wide characters are multibyte, hence mb_str_split(); the ASCII
		// targets can be split bytewise.
		$wide = mb_str_split( '０１２３４５６７８９ＡＢＣＤＥＦＧＨＩＪＫＬＭＮＯＰＱＲＳＴＵＶＷＸＹＺａｂｃｄｅｆｇｈｉｊｋｌｍｎｏｐｑｒｓｔｕｖｗｘｙｚ' );
		$narrow = str_split( '0123456789ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz' );
		$wideToNarrow = array_combine( $wide, $narrow );
	}

	return strtr( $string, $wideToNarrow );
}
2835
2836	/**
2837	* @param string $string
2838	* @param string $pattern
2839	* @return string
2840	*/
protected static function insertSpace( $string, $pattern ) {
	// Surround the first capture group of every match with spaces ...
	$padded = preg_replace( $pattern, " $1 ", $string );
	// ... then collapse any run of spaces into a single space.
	$collapsed = preg_replace( '/ +/', ' ', $padded );
	return $collapsed;
}
2845
2846	/**
2847	* @param string[] $termsArray
2848	* @return string[]
2849	*/
2850	public function convertForSearchResult( $termsArray ) {
2851	# some languages, e.g., Chinese, need to do a conversion
2852	# in order for search results to be displayed correctly
	# This implementation performs no conversion and returns the terms unchanged.
2853	return $termsArray;
2854	}
2855
2856	/**
2857	* Get the first character of a string.
2858	*
2859	* @param string $s
2860	* @return string
2861	*/
public function firstChar( $s ) {
	$firstChar = mb_substr( $s, 0, 1 );

	// Hangul syllables are encoded in three bytes; anything else (including
	// the empty string) is returned as-is.
	if ( $firstChar === '' || strlen( $firstChar ) != 3 ) {
		return $firstChar;
	}

	// Break down Hangul syllables to grab the first jamo
	$code = mb_ord( $firstChar );
	if ( $code < 0xac00 || $code >= 0xd7a4 ) {
		// Outside the range handled here.
		return $firstChar;
	}

	// Exclusive upper code point bound of each group => jamo returned for it.
	// Entries are in ascending order, so the first bound above $code wins.
	$jamoByUpperBound = [
		0xb098 => "\u{3131}",
		0xb2e4 => "\u{3134}",
		0xb77c => "\u{3137}",
		0xb9c8 => "\u{3139}",
		0xbc14 => "\u{3141}",
		0xc0ac => "\u{3142}",
		0xc544 => "\u{3145}",
		0xc790 => "\u{3147}",
		0xcc28 => "\u{3148}",
		0xce74 => "\u{314A}",
		0xd0c0 => "\u{314B}",
		0xd30c => "\u{314C}",
		0xd558 => "\u{314D}",
	];
	foreach ( $jamoByUpperBound as $upperBound => $jamo ) {
		if ( $code < $upperBound ) {
			return $jamo;
		}
	}

	// Remaining syllables (0xd558 up to 0xd7a3).
	return "\u{314E}";
}
2903
2904	/**
2905	* Convert a UTF-8 string to normal form C. In Malayalam and Arabic, this
2906	* also cleans up certain backwards-compatible sequences, converting them
2907	* to the modern Unicode equivalent.
2908	*
2909	* @internal
2910	* @param string $s
2911	* @return string
2912	*/
public function normalize( $s ) {
	$applyAllFixes = $this->config->get( MainConfigNames::AllUnicodeFixes );

	$cleaned = UtfNormalValidator::cleanUp( $s );

	// Optimization: This is disabled by default to avoid negative performance impact.
	if ( !$applyAllFixes ) {
		return $cleaned;
	}

	// Apply the Arabic pair table first, then the Malayalam one.
	$cleaned = $this->transformUsingPairFile( NormalizeAr::class, $cleaned );
	return $this->transformUsingPairFile( NormalizeMl::class, $cleaned );
}
2925
2926	/**
2927	* Transform a string using serialized data stored in the given file (which
2928	* must be in the serialized subdirectory of $IP). The file contains pairs
2929	* mapping source characters to destination characters.
2930	*
2931	* The data is cached in process memory.
2932	*
2933	* @param string $dataClass Name of a normalized pairs' data class
2934	* @param string $input
2935	* @return string
2936	*/
protected function transformUsingPairFile( string $dataClass, string $input ): string {
	// Build the replacer from the class's PAIRS constant on first use and
	// keep it on the instance for later calls.
	$this->transformData[$dataClass] ??= new ReplacementArray( $dataClass::PAIRS );

	$replacer = $this->transformData[$dataClass];
	return $replacer->replace( $input );
}
2944
2945	/**
2946	* For right-to-left language support
2947	*
2948	* @return bool
2949	*/
2950	public function isRTL() {
	// Read the 'rtl' item cached for this language code.
2951	return $this->localisationCache->getItem( $this->mCode, 'rtl' );
2952	}
2953
2954	/**
2955	* Return the correct HTML 'dir' attribute value for this language.
2956	* @return string
2957	*/
public function getDir() {
	if ( $this->isRTL() ) {
		return 'rtl';
	}
	return 'ltr';
}
2961
2962	/**
2963	* Return 'left' or 'right' as appropriate alignment for line-start
2964	* for this language's text direction.
2965	*
2966	* Should be equivalent to CSS3 'start' text-align value....
2967	*
2968	* @return string
2969	*/
public function alignStart() {
	// Lines start on the right in right-to-left languages.
	if ( $this->isRTL() ) {
		return 'right';
	}
	return 'left';
}
2973
2974	/**
2975	* Return 'right' or 'left' as appropriate alignment for line-end
2976	* for this language's text direction.
2977	*
2978	* Should be equivalent to CSS3 'end' text-align value....
2979	*
2980	* @return string
2981	*/
public function alignEnd() {
	// Lines end on the left in right-to-left languages.
	if ( $this->isRTL() ) {
		return 'left';
	}
	return 'right';
}
2985
2986	/**
2987	* A hidden direction mark (LRM or RLM), depending on the language direction.
2988	* Unlike getDirMark(), this function returns the character as an HTML entity.
2989	* This function should be used when the output is guaranteed to be HTML,
2990	* because it makes the output HTML source code more readable. When
2991	* the output is plain text or can be escaped, getDirMark() should be used.
2992	*
2993	* Use of hidden control characters when the output allows use of HTML markup
2994	* is discouraged and the recommendation is to use bdi HTML tag which doesn't
2995	* have the issue of hidden characters ending up in user clipboard in text
2996	* copy paste, see T375975.
2997	*
2998	* @deprecated hard deprecated since 1.43, use bdi HTML tag in HTML context
2999	* where possible.
3000	* @param bool $opposite Get the direction mark opposite to your language
3001	* @return string
3002	* @since 1.20
3003	*/
public function getDirMarkEntity( $opposite = false ) {
	wfDeprecated( __METHOD__, '1.43' );

	// The RLM entity is wanted when exactly one of "language is RTL" and
	// "opposite requested" holds; otherwise the LRM entity.
	$wantRtlMark = (bool)$this->isRTL() !== (bool)$opposite;

	return $wantRtlMark ? '&rlm;' : '&lrm;';
}
3012
3013	/**
3014	* A hidden direction mark (LRM or RLM), depending on the language direction.
3015	* This function produces them as invisible Unicode characters and
3016	* the output may be hard to read and debug, so it should only be used
3017	* when the output is plain text or can be escaped.
3018	*
3019	* Use of hidden control characters when the output allows use of HTML markup
3020	* is discouraged and the recommendation is to use bdi HTML tag which doesn't
3021	* have the issue of hidden characters ending up in user clipboard in text
3022	* copy paste, see T375975.
3023	*
3024	* @deprecated since 1.43, use bdi HTML tag in HTML context where possible.
3025	* @param bool $opposite Get the direction mark opposite to your language
3026	* @return string
3027	*/
public function getDirMark( $opposite = false ) {
	// RLM is wanted when exactly one of "language is RTL" and
	// "opposite requested" holds; otherwise LRM.
	$wantRtlMark = (bool)$this->isRTL() !== (bool)$opposite;

	return $wantRtlMark ? self::RLM : self::LRM;
}
3034
3035	/**
3036	* An arrow, depending on the language direction.
3037	*
3038	* @param string $direction The direction of the arrow: forwards (default),
3039	* backwards, left, right, up, down.
3040	* @return string
3041	*/
public function getArrow( $direction = 'forwards' ) {
	// Loose comparison (==) is deliberate: it is what a switch statement uses.
	if ( $direction == 'forwards' ) {
		// Reading direction: points left in RTL languages, right otherwise.
		return $this->isRTL() ? '←' : '→';
	}
	if ( $direction == 'backwards' ) {
		// Against the reading direction.
		return $this->isRTL() ? '→' : '←';
	}

	// The remaining directions do not depend on the language.
	if ( $direction == 'left' ) {
		return '←';
	}
	if ( $direction == 'right' ) {
		return '→';
	}
	if ( $direction == 'up' ) {
		return '↑';
	}
	if ( $direction == 'down' ) {
		return '↓';
	}

	// Unrecognised direction: no arrow.
	return null;
}
3058
3059	/**
3060	* To allow "foo[[bar]]" to extend the link over the whole word "foobar"
3061	*
3062	* @return bool
3063	*/
3064	public function linkPrefixExtension() {
	// Read the 'linkPrefixExtension' item cached for this language code.
3065	return $this->localisationCache->getItem( $this->mCode, 'linkPrefixExtension' );
3066	}
3067
3068	/**
3069	* Get all the magic words from the localisation cache.
3070	*
3071	* @return array<string,array> $magicWord => [ int $caseSensitive, string ...$alias ]
3072	*/
3073	public function getMagicWords() {
	// Read the whole 'magicWords' item cached for this language code.
3074	return $this->localisationCache->getItem( $this->mCode, 'magicWords' );
3075	}
3076
3077	/**
3078	* Fill a MagicWord object with data from this instance
3079	*
3080	* @param MagicWord $mw
3081	*/
public function getMagic( $mw ) {
	// An entry in mMagicExtensions takes precedence over the localisation cache.
	$entry = $this->mMagicExtensions[$mw->mId] ??
		$this->localisationCache->getSubitem( $this->mCode, 'magicWords', $mw->mId );

	if ( is_array( $entry ) ) {
		// Element 0 is the case-sensitivity flag, the rest are the synonyms.
		$mw->mCaseSensitive = $entry[0];
		$mw->mSynonyms = array_slice( $entry, 1 );
		return;
	}

	// Not an array: warn and leave $mw untouched.
	wfWarn( "\"$entry\" is not a valid magic word for \"$mw->mId\"" );
}
3093
3094	/**
3095	* Get special page names, as an associative array
3096	* canonical name => array of valid names, including aliases
3097	* @return string[][]
3098	*/
public function getSpecialPageAliases() {
	// Cache aliases because it may be slow to load them
	if ( !isset( $this->mExtendedSpecialPageAliases ) ) {
		$this->mExtendedSpecialPageAliases =
			$this->localisationCache->getItem( $this->mCode, 'specialPageAliases' );
	}

	return $this->mExtendedSpecialPageAliases;
}
3106
3107	/**
3108	* Italic is unsuitable for some languages
3109	*
3110	* @param string $text The text to be emphasized.
3111	* @return string
3112	*/
3113	public function emphasize( $text ) {
	// Wrap the text in an <em> element.
	// NOTE(review): $text is interpolated as-is, with no escaping here;
	// presumably callers pass HTML-safe text - confirm.
3114	return "<em>$text</em>";
3115	}
3116
3117	/**
3118	* Normally we output all numbers in plain en_US style, that is
3119	* 293,291.235 for two hundred ninety-three thousand two hundred ninety-one
3120	* point two hundred thirty-five. However, this is not suitable for all
3121	* languages, some such as Bengali (bn) want ২,৯৩,২৯১.২৩৫ and others such as
3122	* Icelandic just want to use commas instead of dots, and dots instead
3123	* of commas like "293.291,235".
3124	*
3125	* An example of this function being called:
3126	* <code>
3127	* wfMessage( 'message' )->numParams( $num )->text()
3128	* </code>
3129	*
3130	* See $separatorTransformTable in MessagesIs.php for
3131	* the , => . and . => , implementation.
3132	*
3133	* @param string\|int\|float $number Expected to be a pre-formatted (e.g. leading zeros, number
3134	* of decimal places) numeric string. Any non-string will be cast to string.
3135	* @return string
3136	*/
3137	public function formatNum( $number ) {
	// Cast to string, then format with both flags off: digits and separators
	// are translated, and grouping separators are added.
3138	return $this->formatNumInternal( (string)$number, false, false );
3139	}
3140
3141	/**
3142	* Internal implementation function, shared between formatNum and formatNumNoSeparators.
3143	*
3144	* @param string $number The stringification of a valid PHP number
3145	* @param bool $noTranslate Whether to translate digits and separators
3146	* @param bool $noSeparators Whether to add separators
3147	* @return string
3148	*/
private function formatNumInternal(
	string $number, bool $noTranslate, bool $noSeparators
): string {
	$translateNumerals = $this->config->get( MainConfigNames::TranslateNumerals );

	// Special values that never reach the number formatter.
	if ( $number === '' ) {
		return $number;
	}
	if ( $number === (string)NAN ) {
		return $this->msg( 'formatnum-nan' )->text();
	}
	if ( $number === (string)INF ) {
		return "∞";
	}
	if ( $number === (string)-INF ) {
		return "\u{2212}∞";
	}
	if ( !is_numeric( $number ) ) {
		# T267587: downgrade this to level:warn while we chase down the long
		# trail of callers.
		# wfDeprecated( 'Language::formatNum with a non-numeric string', '1.36' );
		LoggerFactory::getInstance( 'formatnum' )->warning(
			'Language::formatNum with non-numeric string',
			[ 'number' => $number ]
		);
		$validNumberRe = '(-(?=[\d\.]))?(\d+|(?=\.\d))(\.\d*)?([Ee][-+]?\d+)?';
		// For backwards-compat, apply formatNum piecewise on the valid
		// numbers in the string. Don't split on NAN/INF in this legacy
		// case as they are likely to be found embedded inside non-numeric
		// text.
		return preg_replace_callback( "/{$validNumberRe}/", function ( $m ) use ( $noTranslate, $noSeparators ) {
			return $this->formatNumInternal( $m[0], $noTranslate, $noSeparators );
		}, $number );
	}

	if ( !$noSeparators ) {
		$separatorTransformTable = $this->separatorTransformTable();
		$digitGroupingPattern = $this->digitGroupingPattern();
		$code = $this->getCode();
		if ( !( $translateNumerals && $this->langNameUtils->isValidCode( $code ) ) ) {
			$code = 'C'; // POSIX system default locale
		}

		if ( $digitGroupingPattern ) {
			$fmt = new NumberFormatter(
				$code, NumberFormatter::PATTERN_DECIMAL, $digitGroupingPattern
			);
		} else {
			/** @suppress PhanParamTooFew Phan thinks this always requires 3 parameters, that's wrong */
			$fmt = new NumberFormatter( $code, NumberFormatter::DECIMAL );
		}

		// minimumGroupingDigits can be used to suppress groupings below a certain value.
		// This is used for languages such as Polish, where one would only write the grouping
		// separator for values above 9999 - numbers with more than 4 digits.
		// NumberFormatter is yet to support minimumGroupingDigits, ICU has it as experimental feature.
		// The attribute value is used by adding it to the grouping separator value. If
		// the input number has fewer integer digits, the grouping separator is suppressed.
		$minimumGroupingDigits = $this->minimumGroupingDigits();
		// Minimum length of a number to do digit grouping on.
		// http://unicode.org/reports/tr35/tr35-numbers.html#Examples_of_minimumGroupingDigits
		$minimumLength = $minimumGroupingDigits + $fmt->getAttribute( NumberFormatter::GROUPING_SIZE );
		if ( $minimumGroupingDigits > 1
			&& !preg_match( '/^\-?\d{' . $minimumLength . '}/', $number )
		) {
			// This number does not need commas inserted (even if
			// NumberFormatter thinks it does) because it's not long
			// enough. We still need to do decimal separator
			// transformation, though. For example, 1234.56 becomes 1234,56
			// in pl with $minimumGroupingDigits = 2.
			if ( !$noTranslate ) {
				$number = strtr( $number, $separatorTransformTable ?: [] );
			}
		} elseif ( $number === '-0' ) {
			// Special case to ensure we don't lose the minus sign by
			// converting to an int.
			if ( !$noTranslate ) {
				$number = strtr( $number, $separatorTransformTable ?: [] );
			}
		} else {
			// NumberFormatter supports separator transformation,
			// but it does not know all languages MW
			// supports. Example: arq. Also, languages like pl have
			// customisation. So manually set it.
			if ( $noTranslate ) {
				$fmt->setSymbol(
					NumberFormatter::DECIMAL_SEPARATOR_SYMBOL,
					'.'
				);
				$fmt->setSymbol(
					NumberFormatter::GROUPING_SEPARATOR_SYMBOL,
					','
				);
			} elseif ( $separatorTransformTable ) {
				$fmt->setSymbol(
					NumberFormatter::DECIMAL_SEPARATOR_SYMBOL,
					$separatorTransformTable[ '.' ] ?? '.'
				);
				$fmt->setSymbol(
					NumberFormatter::GROUPING_SEPARATOR_SYMBOL,
					$separatorTransformTable[ ',' ] ?? ','
				);
			}

			// Maintain # of digits before and after the decimal point
			// (and presence of decimal point).
			// Both digit groups use "\d*" so that integer and fraction parts of
			// any length are captured; with a single "\d" only one-digit parts
			// would match, and e.g. the trailing zero of "12.50" would be lost
			// in the (float) cast below.
			if ( preg_match( '/^-?(\d*)(\.(\d*))?$/', $number, $m ) ) {
				$fmt->setAttribute( NumberFormatter::MIN_INTEGER_DIGITS, strlen( $m[1] ) );
				if ( isset( $m[2] ) ) {
					$fmt->setAttribute( NumberFormatter::DECIMAL_ALWAYS_SHOWN, 1 );
				}
				$fmt->setAttribute( NumberFormatter::FRACTION_DIGITS, strlen( $m[3] ?? '' ) );
			}
			$number = $fmt->format( (float)$number );
		}
	}

	if ( !$noTranslate ) {
		if ( $translateNumerals ) {
			// This is often unnecessary: PHP's NumberFormatter will often
			// do the digit transform itself (T267614)
			$s = $this->digitTransformTable();
			if ( $s ) {
				$number = strtr( $number, $s );
			}
		}
		# T10327: Make our formatted numbers prettier by using a
		# proper Unicode 'minus' character.
		$number = strtr( $number, [ '-' => "\u{2212}" ] );
	}

	// Remove any LRM or RLM characters generated from NumberFormatter,
	// since directionality is handled outside of this context.
	// Similarly remove \u61C (ALM) which is added starting PHP 7.3+
	return strtr( $number, [
		self::LRM => '',
		self::RLM => '',
		self::ALM => '',
	] );
}
3289
/**
 * Format a number without inserting digit-grouping separators.
 *
 * Thin front-end that casts the input to a string and hands it to
 * formatNumInternal() with the flag pair (false, true).
 *
 * @param string|int|float $number The value to format; should be an integer
 *   or a floating point number.
 * @since 1.21
 * @return string
 */
public function formatNumNoSeparators( $number ) {
	$asString = (string)$number;

	return $this->formatNumInternal( $asString, false, true );
}
3301
/**
 * Convert a localized, formatted number back into a plain numeric string.
 *
 * The localized NaN message and the infinity symbols are mapped to the string
 * forms of NAN, INF and -INF. Otherwise localized digits and separators are
 * translated back through the flipped transform tables and any remaining
 * commas are removed.
 *
 * @param string $number
 * @return string
 */
public function parseFormattedNumber( $number ) {
	if ( $number === $this->msg( 'formatnum-nan' )->text() ) {
		return (string)NAN;
	}
	if ( $number === "∞" ) {
		return (string)INF;
	}

	// Accept either the ASCII hyphen-minus or the Unicode minus emitted by
	// ::formatNum()
	$number = str_replace( "\u{2212}", '-', $number );
	if ( $number === "-∞" ) {
		return (string)-INF;
	}

	$digitMap = $this->digitTransformTable();
	if ( $digitMap ) {
		// Drop empty values such as '' before flipping. (T66347)
		$number = strtr( $number, array_flip( array_filter( $digitMap ) ) );
	}

	$separatorMap = $this->separatorTransformTable();
	if ( $separatorMap ) {
		// Drop empty values such as '' before flipping. (T66347)
		$number = strtr( $number, array_flip( array_filter( $separatorMap ) ) );
	}

	// Whatever commas remain are grouping separators; strip them.
	return str_replace( ',', '', $number );
}
3335
/**
 * Read the 'digitGroupingPattern' item for this language from the
 * localisation cache.
 *
 * @return string
 */
public function digitGroupingPattern() {
	$pattern = $this->localisationCache->getItem( $this->mCode, 'digitGroupingPattern' );

	return $pattern;
}
3342
/**
 * Read the 'digitTransformTable' item for this language from the
 * localisation cache.
 *
 * @return string[]
 */
public function digitTransformTable() {
	$table = $this->localisationCache->getItem( $this->mCode, 'digitTransformTable' );

	return $table;
}
3349
/**
 * Read the 'separatorTransformTable' item for this language from the
 * localisation cache.
 *
 * @return string[]
 */
public function separatorTransformTable() {
	$table = $this->localisationCache->getItem( $this->mCode, 'separatorTransformTable' );

	return $table;
}
3356
/**
 * The minimum number of digits a number must have, in addition to the grouping
 * size, before grouping separators are added.
 *
 * For example, Polish has minimumGroupingDigits = 2, which with a grouping
 * size of 3 causes 4-digit numbers to be written like 9999, but 5-digit
 * numbers are written like "10 000".
 *
 * Falls back to 1 when the localisation cache holds no value.
 *
 * @return int
 */
public function minimumGroupingDigits(): int {
	$configured = $this->localisationCache->getItem( $this->mCode, 'minimumGroupingDigits' );

	return $configured ?? 1;
}
3370
/**
 * Join a list of strings into locale-friendly running text.
 *
 * All items but the last are joined with the 'comma-separator' message (only
 * when there are more than two items); the last item is attached using the
 * 'and' and 'word-separator' messages. The messages are escaped, the list
 * items are used as given.
 *
 * @param string[] $list
 * @param-taint $list tainted
 * @return string Empty string for an empty list; the sole item for a
 *   one-item list.
 */
public function listToText( array $list ) {
	$itemCount = count( $list );
	if ( $itemCount < 1 ) {
		return '';
	}

	$last = array_pop( $list );
	if ( $itemCount === 1 ) {
		// @phan-suppress-next-line PhanTypeMismatchReturnNullable False positive
		return $last;
	}

	$and = $this->msg( 'and' )->escaped();
	$space = $this->msg( 'word-separator' )->escaped();
	// With exactly two items there is nothing to put a comma between.
	$comma = $itemCount > 2 ? $this->msg( 'comma-separator' )->escaped() : '';

	return implode( $comma, $list ) . $and . $space . $last;
}
3398
/**
 * Join a list of strings with the escaped 'comma-separator' message.
 *
 * @param string[] $list Array of strings to put in a comma list
 * @param-taint $list tainted
 * @return string
 */
public function commaList( array $list ) {
	$separator = $this->msg( 'comma-separator' )->escaped();

	return implode( $separator, $list );
}
3412
/**
 * Join a list of strings with the escaped 'semicolon-separator' message.
 *
 * @param string[] $list Array of strings to put in a semicolon list
 * @param-taint $list tainted
 * @return string
 */
public function semicolonList( array $list ) {
	$separator = $this->msg( 'semicolon-separator' )->escaped();

	return implode( $separator, $list );
}
3426
/**
 * Join a list of strings with the escaped 'pipe-separator' message.
 * Works like commaList(), only with a different separator message.
 *
 * @param string[] $list Array of strings to put in a pipe list
 * @param-taint $list tainted
 * @return string
 */
public function pipeList( array $list ) {
	$separator = $this->msg( 'pipe-separator' )->escaped();

	return implode( $separator, $list );
}
3439
/**
 * Truncate a string to a specified length in bytes, appending an optional
 * string (e.g., for ellipsis).
 * When an ellipsis isn't needed, using mb_strcut() directly is recommended.
 *
 * If $length is negative, the string will be truncated from the beginning.
 *
 * @since 1.31
 *
 * @param string $string String to truncate
 * @param int $length Maximum length in bytes
 * @param string $ellipsis String to append to the end of truncated text
 * @param bool $adjustLength Subtract length of ellipsis from $length
 *
 * @return string
 */
public function truncateForDatabase( $string, $length, $ellipsis = '...', $adjustLength = true ) {
	// Byte-oriented pair: strlen() measures, mb_strcut() extracts.
	$measure = 'strlen';
	$extract = 'mb_strcut';

	return $this->truncateInternal( $string, $length, $ellipsis, $adjustLength, $measure, $extract );
}
3461
/**
 * Truncate a string to a specified number of characters, appending an optional
 * string (e.g., for ellipsis).
 *
 * This is the multibyte counterpart of truncateForDatabase(): it truncates by
 * number of characters rather than number of bytes.
 *
 * The input should be a raw UTF-8 string, and NOT be HTML escaped. It is not
 * safe to truncate HTML-escaped strings, because an entity can be cut in
 * half. Use ::truncateHtml() if you need a specific number of HTML-encoded
 * bytes, or ::truncateForDatabase() if you need a specific number of PHP
 * bytes.
 *
 * If $length is negative, the string will be truncated from the beginning.
 *
 * @since 1.31
 *
 * @param string $string String to truncate
 * @param int $length Maximum number of characters
 * @param string $ellipsis String to append to the end of truncated text
 * @param bool $adjustLength Subtract length of ellipsis from $length
 *
 * @return string
 */
public function truncateForVisual( $string, $length, $ellipsis = '...', $adjustLength = true ) {
	// No encoding is passed to the mb_* functions: it is optional and defaults
	// to mb_internal_encoding(), which is set to UTF-8 in Setup.php.
	// Both names are callables that truncateInternal() invokes.
	$measure = 'mb_strlen';
	$extract = 'mb_substr';

	return $this->truncateInternal( $string, $length, $ellipsis, $adjustLength, $measure, $extract );
}
3496
/**
 * Shared truncation routine behind truncateForDatabase() and
 * truncateForVisual(). The caller supplies the function that measures length
 * and the function that extracts a substring, so the same logic serves both
 * byte-based and character-based truncation.
 *
 * @param string $string String to truncate
 * @param int $length Maximum length of the final text; a negative value
 *   truncates from the beginning of the string instead of the end
 * @param string $ellipsis String to append to the end of truncated text; the
 *   literal '...' is swapped for the localized 'ellipsis' message
 * @param bool $adjustLength Subtract length of ellipsis from $length
 * @param callable $measureLength Callable function used for determining the length of text
 * @param callable $getSubstring Callable function used for getting the substrings
 *
 * @return string
 */
private function truncateInternal(
	$string, $length, $ellipsis, $adjustLength, callable $measureLength, callable $getSubstring
) {
	$limit = abs( $length );

	# Nothing to do when the text already fits
	if ( $measureLength( $string ) <= $limit ) {
		return $string;
	}

	# Use the localized ellipsis character
	if ( $ellipsis == '...' ) {
		$ellipsis = $this->msg( 'ellipsis' )->text();
	}
	if ( $length == 0 ) {
		return $ellipsis; // convention
	}

	$ellipsisLength = $adjustLength ? $measureLength( $ellipsis ) : 0;

	if ( $adjustLength && $ellipsisLength >= $limit ) {
		# The ellipsis alone fills the budget, so $adjustLength cannot be honoured
		$truncated = $ellipsis; // this can be slightly unexpected
	} elseif ( $length > 0 ) {
		# Keep the head: xyz...
		$head = $getSubstring( $string, 0, $length - $ellipsisLength );
		$truncated = rtrim( $head ) . $ellipsis;
	} else {
		# Keep the tail: ...xyz
		$tail = $getSubstring( $string, $length + $ellipsisLength );
		$truncated = $ellipsis . ltrim( $tail );
	}

	# Do not truncate if the ellipsis makes the string longer/equal (T24181).
	# This check is still needed with $adjustLength, for the single case where
	# LEN($ellipsis) > ABS($length): the result could be longer than the input.
	return $measureLength( $truncated ) < $measureLength( $string ) ? $truncated : $string;
}
3556
/**
 * Remove bytes that represent an incomplete Unicode character
 * at the end of string (e.g. bytes of the char are missing)
 *
 * Two situations are handled:
 *  - the last byte is a lead byte (>= 0xC0) with no continuation bytes;
 *  - the last byte is a continuation byte belonging to a 3- or 4-byte
 *    sequence that is missing at least one trailing byte.
 *
 * @param string $string
 * @return string The input without the trailing partial character
 */
protected function removeBadCharLast( $string ) {
	if ( $string != '' ) {
		$char = ord( $string[strlen( $string ) - 1] );
		$m = [];
		if ( $char >= 0xc0 ) {
			# We got the first byte only of a multibyte char; remove it.
			$string = substr( $string, 0, -1 );
		} elseif ( $char >= 0x80 &&
			// The two alternatives are joined by an unescaped "|": a 3-byte
			// lead followed by one continuation byte, or a 4-byte lead
			// followed by one or two continuation bytes.
			// Use the /s modifier (PCRE_DOTALL) so (.*) also matches newlines
			preg_match( '/^(.*)(?:[\xe0-\xef][\x80-\xbf]|' .
				'[\xf0-\xf7][\x80-\xbf]{1,2})$/s', $string, $m )
		) {
			# We chopped in the middle of a character; remove it
			$string = $m[1];
		}
	}
	return $string;
}
3582
/**
 * Truncate a string of valid HTML to a specified length in bytes,
 * appending an optional string (e.g., for ellipses), and return valid HTML
 *
 * This is only intended for styled/linked text, such as HTML with
 * tags like <span> and <a>, where the tags are self-contained (valid HTML).
 * Also, this will not detect things like "display:none" CSS.
 *
 * The text is walked byte by byte. Bytes inside tags do not count towards the
 * displayed length, an entity counts as one displayed character, and any tags
 * still open at the truncation point are closed in the result.
 *
 * Note: since 1.18 you do not need to leave extra room in $length for ellipses.
 *
 * @param string $text HTML string to truncate
 * @param int $length (zero/positive) Maximum HTML length (including ellipses)
 * @param string $ellipsis String to append to the truncated text; the literal
 *   '...' is swapped for the escaped, localized 'ellipsis' message
 * @return string
 */
public function truncateHtml( $text, $length, $ellipsis = '...' ) {
	# Use the localized ellipsis character
	if ( $ellipsis == '...' ) {
		$ellipsis = $this->msg( 'ellipsis' )->escaped();
	}
	# Check if there is clearly no need to truncate
	if ( $length <= 0 ) {
		return $ellipsis; // no text shown, nothing to format (convention)
	} elseif ( strlen( $text ) <= $length ) {
		return $text; // string short enough even with HTML (short-circuit)
	}

	$dispLen = 0; // innerHTML length so far
	$testingEllipsis = false; // check if ellipses will make the string longer/equal?
	$tagType = 0; // 0-open, 1-close
	$bracketState = 0; // 1-tag start, 2-tag name, 0-neither
	$entityState = 0; // 0-not entity, 1-entity
	$tag = $ret = ''; // accumulated tag name, accumulated result string
	$openTags = []; // open tag stack
	$maybeState = null; // possible truncation state

	$textLen = strlen( $text );
	$neLength = max( 0, $length - strlen( $ellipsis ) ); // non-ellipsis len if truncated
	// The loop deliberately runs one iteration past the end of $text so the
	// truncation checks below also see the state after the final byte.
	for ( $pos = 0; true; ++$pos ) {
		# Consider truncation once the display length has reached the maximum.
		# We check if $dispLen > 0 to grab tags for the $neLength = 0 case.
		# Check that we're not in the middle of a bracket/entity...
		if ( $dispLen && $dispLen >= $neLength && $bracketState == 0 && !$entityState ) {
			if ( !$testingEllipsis ) {
				$testingEllipsis = true;
				# Save where we are; we will truncate here unless there turn out to
				# be so few remaining characters that truncation is not necessary.
				if ( !$maybeState ) { // already saved? ($neLength = 0 case)
					$maybeState = [ $ret, $openTags ]; // save state
				}
			} elseif ( $dispLen > $length && $dispLen > strlen( $ellipsis ) ) {
				# The string in fact does need truncation, the truncation point was OK.
				// @phan-suppress-next-line PhanTypeInvalidExpressionArrayDestructuring
				[ $ret, $openTags ] = $maybeState; // reload state
				$ret = $this->removeBadCharLast( $ret ); // multi-byte char fix
				$ret .= $ellipsis; // add ellipsis
				break;
			}
		}
		if ( $pos >= $textLen ) {
			break; // extra iteration just for the checks above
		}

		# Read the next char...
		$ch = $text[$pos];
		$lastCh = $pos ? $text[$pos - 1] : '';
		$ret .= $ch; // add to result string
		if ( $ch == '<' ) {
			$this->truncate_endBracket( $tag, $tagType, $lastCh, $openTags ); // for bad HTML
			$entityState = 0; // for bad HTML
			$bracketState = 1; // tag started (the next char tells open from close tag)
		} elseif ( $ch == '>' ) {
			$this->truncate_endBracket( $tag, $tagType, $lastCh, $openTags );
			$entityState = 0; // for bad HTML
			$bracketState = 0; // out of brackets
		} elseif ( $bracketState == 1 ) {
			if ( $ch == '/' ) {
				$tagType = 1; // close tag (e.g. "</span>")
			} else {
				$tagType = 0; // open tag (e.g. "<span>")
				$tag .= $ch;
			}
			$bracketState = 2; // building tag name
		} elseif ( $bracketState == 2 ) {
			if ( $ch != ' ' ) {
				$tag .= $ch;
			} else {
				// Name found (e.g. "<a href=..."), add on tag attributes...
				$pos += $this->truncate_skip( $ret, $text, "<>", $pos + 1 );
			}
		} elseif ( $bracketState == 0 ) {
			if ( $entityState ) {
				if ( $ch == ';' ) {
					$entityState = 0;
					$dispLen++; // entity is one displayed char
				}
			} else {
				if ( $neLength == 0 && !$maybeState ) {
					// Save the state without $ch. We want to hit the first
					// display char (to get tags) but not use it if truncating.
					$maybeState = [ substr( $ret, 0, -1 ), $openTags ];
				}
				if ( $ch == '&' ) {
					$entityState = 1; // entity found, (e.g. "&nbsp;")
				} else {
					$dispLen++; // this char is displayed
					// Add the next $max display text chars after this in one swoop...
					$max = ( $testingEllipsis ? $length : $neLength ) - $dispLen;
					$skipped = $this->truncate_skip( $ret, $text, "<>&", $pos + 1, $max );
					$dispLen += $skipped;
					$pos += $skipped;
				}
			}
		}
	}
	// Close the last tag if left unclosed by bad HTML
	$this->truncate_endBracket( $tag, $tagType, $text[$textLen - 1], $openTags );
	while ( count( $openTags ) > 0 ) {
		$ret .= '</' . array_pop( $openTags ) . '>'; // close open tags
	}
	return $ret;
}
3705
/**
 * truncateHtml() helper function
 * like strcspn() but adds the skipped chars to $ret
 *
 * @param string &$ret Result string that the skipped characters are appended to
 * @param string $text Text being scanned
 * @param string $search Characters that stop the scan
 * @param int $start Offset in $text at which to start scanning
 * @param null|int $len Maximum number of characters to skip; null means no
 *   limit, and a negative value is treated as 0
 * @return int Number of characters skipped (and appended to $ret)
 */
private function truncate_skip( &$ret, $text, $search, $start, $len = null ) {
	if ( $start >= strlen( $text ) ) {
		// Nothing left to scan.
		return 0;
	}

	if ( $len === null ) {
		// Omit the length argument to scan to the end of $text. A negative
		// length would not do that: strcspn() reads it as "stop that many
		// characters before the end", so -1 would leave out the final character.
		$skipCount = strcspn( $text, $search, $start );
	} else {
		$skipCount = strcspn( $text, $search, $start, max( 0, $len ) );
	}
	$ret .= substr( $text, $start, $skipCount );

	return $skipCount;
}
3731
/**
 * truncateHtml() helper function
 * (a) push or pop $tag from $openTags as needed
 * (b) clear $tag value
 *
 * Nothing happens when $tag is empty after stripping leading whitespace.
 * A close tag is only popped when it matches the top of the stack.
 *
 * @param string &$tag Current HTML tag name we are looking at
 * @param int $tagType (0-open tag, 1-close tag)
 * @param string $lastCh Character before the '>' that ended this tag
 * @param array &$openTags Open tag stack (not accounting for $tag)
 */
private function truncate_endBracket( &$tag, $tagType, $lastCh, &$openTags ) {
	$tag = ltrim( $tag );
	if ( $tag == '' ) {
		return;
	}

	$selfClosed = ( $lastCh == '/' );
	if ( $tagType == 0 && !$selfClosed ) {
		// tag opened (didn't close itself)
		$openTags[] = $tag;
	} elseif ( $tagType == 1 ) {
		$matchesTop = $openTags && $tag == $openTags[count( $openTags ) - 1];
		if ( $matchesTop ) {
			// tag closed
			array_pop( $openTags );
		}
	}

	$tag = '';
}
3755
/**
 * Grammatical transformations, needed for inflected languages.
 * Invoked by putting {{grammar:case|word}} in a message.
 *
 * Lookup order: an exact entry in the GrammarForms configuration for this
 * language, case and word wins; otherwise the first matching regex rule from
 * getGrammarTransformations() for the case is applied. The word is returned
 * unchanged when neither applies.
 *
 * @param string $word
 * @param string $case
 * @return string
 */
public function convertGrammar( $word, $case ) {
	$grammarForms = $this->config->get( MainConfigNames::GrammarForms );
	if ( isset( $grammarForms[$this->getCode()][$case][$word] ) ) {
		return $grammarForms[$this->getCode()][$case][$word];
	}

	$grammarTransformations = $this->getGrammarTransformations();
	if ( !isset( $grammarTransformations[$case] ) ) {
		return $word;
	}

	$rules = $grammarTransformations[$case];
	// Some names of grammar rules are aliases for other rules.
	// In such cases the value is a string rather than object,
	// so load the actual rules.
	if ( is_string( $rules ) ) {
		$rules = $grammarTransformations[$rules];
	}

	foreach ( $rules as $rule ) {
		$form = $rule[0];
		if ( $form === '@metadata' ) {
			continue;
		}
		$replacement = $rule[1];

		$regex = '/' . addcslashes( $form, '/' ) . '/u';
		$patternMatches = preg_match( $regex, $word );

		if ( $patternMatches === false ) {
			wfLogWarning(
				'An error occurred while processing grammar. ' .
				"Word: '$word'. Regex: /$form/."
			);
			continue;
		}
		if ( $patternMatches === 1 ) {
			// Only the first matching rule is applied.
			return preg_replace( $regex, $replacement, $word );
		}
	}

	return $word;
}
3809
/**
 * Get the grammar forms configured for this language.
 *
 * Reads the GrammarForms configuration and returns the entry keyed by this
 * language's code when that entry is an array.
 *
 * @return array Array of grammar forms, empty when none are configured
 * @since 1.20
 */
public function getGrammarForms() {
	$allForms = $this->config->get( MainConfigNames::GrammarForms );
	$ownForms = $allForms[$this->getCode()] ?? null;

	return is_array( $ownForms ) ? $ownForms : [];
}
3826
/**
 * Get the grammar transformations data for the language.
 * Used like grammar forms, with {{GRAMMAR}} and cases,
 * but uses pairs of regexes and replacements instead of code.
 *
 * The data is loaded from the language's JSON file under
 * languages/data/grammarTransformations/ and then kept on the object.
 * An unreadable file yields an empty array.
 *
 * @return array[] Array of grammar transformations.
 * @throws RuntimeException When the file is readable but decodes to null
 * @since 1.28
 */
public function getGrammarTransformations() {
	global $IP;

	if ( $this->grammarTransformCache !== null ) {
		return $this->grammarTransformCache;
	}

	$grammarDataFile = $IP . "/languages/data/grammarTransformations/{$this->getCode()}.json";
	if ( is_readable( $grammarDataFile ) ) {
		$transformations = FormatJson::decode( file_get_contents( $grammarDataFile ), true );
	} else {
		$transformations = [];
	}

	if ( $transformations === null ) {
		throw new RuntimeException( "Invalid grammar data for \"{$this->getCode()}\"." );
	}

	$this->grammarTransformCache = $transformations;

	return $this->grammarTransformCache;
}
3852
/**
 * Provides an alternative text depending on specified gender.
 * Usage {{gender:username|masculine|feminine|unknown}}.
 * username is optional, in which case the gender of the current user is used,
 * but only in (some) interface messages; otherwise the default gender is used.
 *
 * If no forms are given, an empty string is returned. If only one form is
 * given, it will be returned unconditionally. These details are implied by
 * the caller and cannot be overridden in subclasses.
 *
 * If three forms are given, the default is to use the third (unknown) form.
 * If fewer than three forms are given, the default is to use the first (masculine) form.
 * These details can be overridden in subclasses.
 *
 * @param string $gender
 * @param array $forms
 *
 * @return string
 */
public function gender( $gender, $forms ) {
	if ( count( $forms ) === 0 ) {
		return '';
	}

	// Guarantee at least a masculine and a feminine slot.
	$forms = $this->preConvertPlural( $forms, 2 );

	if ( $gender === 'male' ) {
		$index = 0;
	} elseif ( $gender === 'female' ) {
		$index = 1;
	} else {
		// Unknown gender: third form if present, otherwise the first.
		return $forms[2] ?? $forms[0];
	}

	return $forms[$index];
}
3885
/**
 * Plural form transformations, needed for some languages.
 * For example, there are 3 forms of plural in Russian and Polish,
 * depending on "count mod 10". See [[w:Plural]]
 * For English it is pretty simple.
 *
 * Invoked by putting {{plural:count|wordform1|wordform2}}
 * or {{plural:count|wordform1|wordform2|wordform3}}
 *
 * Example: {{plural:{{NUMBEROFARTICLES}}|article|articles}}
 *
 * @param int $count Non-localized number
 * @param array $forms Different plural forms
 * @return string Correct form of plural for $count in this language
 */
public function convertPlural( $count, $forms ) {
	// Explicit n=pluralform cases take precedence over the plural rules.
	$remaining = $this->handleExplicitPluralForms( $count, $forms );
	if ( is_string( $remaining ) ) {
		return $remaining;
	}

	$available = count( $remaining );
	if ( $available === 0 ) {
		return '';
	}

	// Clamp the rule index so a short list falls back to its last form.
	$index = min( $this->getPluralRuleIndexNumber( $count ), $available - 1 );

	return $remaining[$index];
}
3915
/**
 * Handles explicit plural forms for Language::convertPlural()
 *
 * In {{PLURAL:$1|0=nothing|one|many}}, 0=nothing will be returned if $1 equals zero.
 * If an explicitly defined plural form matches the $count, then the
 * string value is returned. Otherwise the array is returned for further consideration
 * by CLDR rules or overridden convertPlural().
 *
 * Note that the detection pattern is not anchored: any form containing digits
 * followed by '=' is treated as explicit, and is dropped from the returned
 * list when the text before its first '=' does not equal $count.
 *
 * @since 1.23
 *
 * @param int $count Non-localized number
 * @param string[] $forms Different plural forms
 *
 * @return string[]|string
 */
protected function handleExplicitPluralForms( $count, array $forms ) {
	$ordinaryForms = [];

	foreach ( $forms as $form ) {
		if ( !preg_match( '/\d+=/i', $form ) ) {
			$ordinaryForms[] = $form;
			continue;
		}

		$equalsAt = strpos( $form, '=' );
		if ( substr( $form, 0, $equalsAt ) === (string)$count ) {
			return substr( $form, $equalsAt + 1 );
		}
		// Explicit form for a different number: leave it out.
	}

	return $ordinaryForms;
}
3943
/**
 * Pads the list of forms to the requested number of entries by repeating
 * the last one. Lists that are already long enough are returned as they are.
 *
 * @param array $forms
 * @param int $count Minimum number of forms
 * @return array Padded array of forms
 */
protected function preConvertPlural( /* Array */ $forms, $count ) {
	$lastForm = end( $forms );

	return array_pad( $forms, $count, $lastForm );
}
3955
/**
 * Some languages provide translations in different levels of formality (or manner of address),
 * for example using the T-V distinction. Since most translations do not differ by formality,
 * we provide magic word, e.g. `{{#FORMAL:Du|Sie}}` that allows translating only once
 * and defining different forms inline. This only works for languages that have a fallback
 * relation. For example `es` and `es-formal`. The return value indicates which form of
 * the forms given should be used for this language. Zero-based index.
 *
 * Falls back to 0 when the localisation cache holds no 'formalityIndex' value.
 *
 * @since 1.43
 */
public function getFormalityIndex(): int {
	$index = $this->localisationCache->getItem( $this->mCode, 'formalityIndex' );

	return $index ?? 0;
}
3969
/**
 * Wraps argument with unicode control characters for directionality safety
 *
 * This solves the problem where directionality-neutral characters at the edge of
 * the argument string get interpreted with the wrong directionality from the
 * enclosing context, giving renderings that look corrupted like "(Ben_(WMF".
 *
 * The wrapping is LRE...PDF or RLE...PDF, depending on the detected
 * directionality of the argument string, using the BIDI algorithm's own "First
 * strong directional codepoint" rule. Essentially, this works round the fact that
 * there is no embedding equivalent of U+2068 FSI (isolation with heuristic
 * direction inference). The latter is cleaner but still not widely supported.
 *
 * Use of hidden control characters when the output allows use of HTML markup
 * is discouraged and the recommendation is to use bdi HTML tag which doesn't
 * have the issue of hidden characters ending up in user clipboard in text
 * copy paste, see T375975.
 *
 * @deprecated since 1.43, use bdi HTML tag in HTML context where possible.
 * @param string $text Text to wrap
 * @return string Text, wrapped in LRE...PDF or RLE...PDF or nothing
 */
public function embedBidi( $text = '' ) {
	// Opening control character per strong direction; both are closed by
	// POP DIRECTIONAL FORMATTING.
	$openers = [
		'ltr' => self::LRE, // LEFT-TO-RIGHT EMBEDDING
		'rtl' => self::RLE, // RIGHT-TO-LEFT EMBEDDING
	];

	$dir = self::strongDirFromContent( $text );
	if ( is_string( $dir ) && array_key_exists( $dir, $openers ) ) {
		return $openers[$dir] . $text . self::PDF;
	}

	// No strong directionality: do not wrap
	return $text;
}
4005
/**
 * Get an array of suggested block durations from MediaWiki:Ipboptions
 *
 * A message consisting of just '-' yields an empty list. Otherwise the
 * message is parsed with XmlSelect::parseOptionsMessage().
 *
 * @todo FIXME: This uses a rather odd syntax for the options, should it be converted
 *   to the standard "**<duration>|<displayname>" format?
 * @since 1.42
 * @param bool $includeOther Whether to include the 'other' option in the list of
 *   suggestions
 * @return string[]
 */
public function getBlockDurations( $includeOther = true ): array {
	$optionsMessage = $this->msg( 'ipboptions' )->text();
	if ( $optionsMessage == '-' ) {
		return [];
	}

	$durations = XmlSelect::parseOptionsMessage( $optionsMessage );
	if ( !$durations || !$includeOther ) {
		return $durations;
	}

	// If options exist, add other to the end instead of the beginning (which
	// is what happens by default).
	$durations[ $this->msg( 'ipbother' )->text() ] = 'other';

	return $durations;
}
4032
/**
 * @todo Maybe translate block durations. Note that this function is somewhat misnamed: it
 *   deals with translating the duration ("1 week", "4 days", etc.), not the expiry time
 *   (which is an absolute timestamp). Please note: do NOT add this blindly, as it is used
 *   on old expiry lengths recorded in log entries. You'd need to provide the start date to
 *   match up with it.
 *
 * Resolution order: an exact match among the suggested block durations, then
 * the first infinite entry of that list for infinite input, then a parse via
 * strtotime() into either a relative duration or an absolute date.
 *
 * @param string $str The validated block duration in English
 * @param UserIdentity|null $user When given, absolute timestamps are formatted
 *   with userTimeAndDate() for this user; otherwise timeanddate() is used
 * @param int $now Current timestamp, for formatting relative block durations
 * @return string Somehow translated block duration
 * @see LanguageFi.php file for an implementation example
 */
public function translateBlockExpiry( $str, ?UserIdentity $user = null, $now = 0 ) {
	$durations = $this->getBlockDurations();

	$label = array_search( $str, $durations, true );
	if ( $label !== false ) {
		return trim( $label );
	}

	if ( wfIsInfinity( $str ) ) {
		foreach ( $durations as $label => $value ) {
			if ( wfIsInfinity( $value ) ) {
				return trim( $label );
			}
		}
	}

	// If all else fails, return a standard duration or timestamp description.
	$time = strtotime( $str, $now );
	if ( $time === false ) {
		// Unknown format. Return it as-is in case.
		return $str;
	}

	if ( $time !== strtotime( $str, $now + 1 ) ) {
		// It's a relative timestamp: the result differs based on current
		// time, so the difference is a fixed duration length.
		return $this->formatDurationBetweenTimestamps( $time, $now );
	}

	// It's an absolute timestamp.
	if ( $time === 0 ) {
		// wfTimestamp() handles 0 as current time instead of epoch.
		$time = '19700101000000';
	}

	return $user
		? $this->userTimeAndDate( $time, $user )
		: $this->timeanddate( $time );
}
4080
/**
 * Languages like Chinese need to be segmented in order for the diff
 * to be of any use.
 *
 * This implementation performs no segmentation and returns the text as-is.
 *
 * @param string $text
 * @return string
 */
public function segmentForDiff( $text ) {
	return $text;
}
4091
/**
 * Undo segmentForDiff() to show the result.
 *
 * This implementation returns the text as-is.
 *
 * @param string $text
 * @return string
 */
public function unsegmentForDiff( $text ) {
	return $text;
}
4101
/**
 * A regular expression to match legal word-trailing characters
 * which should be merged onto a link of the form [[foo]]bar.
 *
 * Read from the 'linkTrail' item of the localisation cache.
 *
 * @return string
 */
public function linkTrail() {
	$trailRegex = $this->localisationCache->getItem( $this->mCode, 'linkTrail' );

	return $trailRegex;
}
4111
/**
 * A regular expression character set to match legal word-prefixing
 * characters which should be merged onto a link of the form foo[[bar]].
 *
 * Read from the 'linkPrefixCharset' item of the localisation cache.
 *
 * @return string
 */
public function linkPrefixCharset() {
	$charset = $this->localisationCache->getItem( $this->mCode, 'linkPrefixCharset' );

	return $charset;
}
4121
/**
 * Compare with another language object.
 *
 * Two language objects are equal when they are the same instance or when
 * their internal language codes are identical.
 *
 * @since 1.28
 * @param Language $lang
 * @return bool
 */
public function equals( Language $lang ) {
	// Identity check first; it avoids the getCode() call for the same object.
	return $lang === $this || $lang->getCode() === $this->mCode;
}
4132
/**
 * Get the internal language code for this language object.
 *
 * NOTE: The return value of this function is NOT HTML-safe and must be escaped with
 * htmlspecialchars() or similar.
 *
 * @return string
 */
public function getCode() {
	return $this->mCode;
}
4144
/**
 * Get the code in BCP 47 format which we can use
 * inside html lang="" tags.
 *
 * The value is computed with LanguageCode::bcp47() on first use and then
 * kept on the object.
 *
 * NOTE: The return value of this function is NOT HTML-safe and must be escaped with
 * htmlspecialchars() or similar.
 *
 * @since 1.19
 * @return string
 */
public function getHtmlCode() {
	if ( !isset( $this->mHtmlCode ) ) {
		$this->mHtmlCode = LanguageCode::bcp47( $this->getCode() );
	}

	return $this->mHtmlCode;
}
4159
/**
 * Bcp47Code interface method; simply an alias for ::getHtmlCode().
 *
 * @since 1.40
 * @return string The BCP 47 code of this language
 */
public function toBcp47Code(): string {
	$bcp47 = $this->getHtmlCode();
	return $bcp47;
}
4170
/**
 * Bcp47Code interface method: tell whether this Language object and
 * another Bcp47Code denote the same code.
 *
 * @param Bcp47Code $other Code to compare against
 * @return bool
 * @since 1.41
 */
public function isSameCodeAs( Bcp47Code $other ): bool {
	if ( $other === $this ) {
		return true;
	}
	if ( !( $other instanceof Language ) ) {
		// Bcp-47 codes are case insensitive.
		// See Bcp47CodeValue::isSameCode()
		$mine = $this->toBcp47Code();
		$theirs = $other->toBcp47Code();
		return strcasecmp( $mine, $theirs ) === 0;
	}
	// Both are Language objects: compare the mediawiki-internal code
	return $this->equals( $other );
}
4190
/**
 * Extract the language code from a file name. Inverse of getFileName().
 *
 * The code part of the name must be one uppercase ASCII letter followed
 * by one or more lowercase ASCII letters or underscores. It is returned
 * lowercased with underscores turned into hyphens. The pattern is not
 * anchored, so $prefix . code . $suffix may appear anywhere in $filename.
 *
 * @param string $filename $prefix . $languageCode . $suffix
 * @param string $prefix Prefix before the language code
 * @param string $suffix Suffix after the language code
 * @return string|false Language code, or false if $prefix or $suffix isn't found
 */
public static function getCodeFromFileName( $filename, $prefix = 'Language', $suffix = '.php' ) {
	$pattern = '/' . preg_quote( $prefix, '/' ) . '([A-Z][a-z_]+)' . preg_quote( $suffix, '/' ) . '/';
	$matches = [];
	if ( !preg_match( $pattern, $filename, $matches ) ) {
		return false;
	}
	$code = strtolower( $matches[1] );
	return strtr( $code, '_', '-' );
}
4208
/**
 * Expand the variable parts of a namespace name.
 *
 * If the name contains '$1', every '$1' is replaced by the configured
 * MetaNamespace, any {{grammar:case|word}} construct is replaced by the
 * result of convertGrammar( word, case ), and finally spaces are turned
 * into underscores. Names without '$1' are returned untouched.
 *
 * @param string $talk Namespace name, possibly containing '$1'
 * @return string
 */
private function fixVariableInNamespace( $talk ) {
	if ( strpos( $talk, '$1' ) === false ) {
		return $talk;
	}

	$talk = str_replace( '$1', $this->config->get( MainConfigNames::MetaNamespace ), $talk );

	# Allow grammar transformations
	# Allowing full message-style parsing would make simple requests
	# such as action=raw much more expensive than they need to be.
	# This will hopefully cover most cases.
	$talk = preg_replace_callback(
		// Lazy groups: the grammar case up to the first pipe, then the
		// word up to the closing braces. Both may be of any length.
		'/{{grammar:(.*?)\|(.*?)}}/i',
		function ( $m ) {
			return $this->convertGrammar( trim( $m[2] ), trim( $m[1] ) );
		},
		$talk
	);
	return str_replace( ' ', '_', $talk );
}
4233
/**
 * Decode an expiry (block, protection, etc.) which has come from the DB
 *
 * An expiry that is empty, the string 'infinity', or equal to the
 * replica database's own infinity value is treated as infinite.
 *
 * @param string $expiry Database expiry String
 * @param true|int $format True to process using language functions, or TS_ constant
 *   to return the expiry in a given timestamp
 * @param string $infinity If $format is not true, use this string for infinite expiry
 * @param UserIdentity|null $user If $format is true, use this user for date format
 * @return string
 * @since 1.18
 * @since 1.36 $user was added
 */
public function formatExpiry( $expiry, $format = true, $infinity = 'infinity', $user = null ) {
	// The database's infinity value is looked up once per request
	static $dbInfinity;
	$dbInfinity ??= MediaWikiServices::getInstance()->getConnectionProvider()
		->getReplicaDatabase()
		->getInfinity();

	$isInfinite = $expiry == '' || $expiry === 'infinity' || $expiry == $dbInfinity;
	if ( $isInfinite ) {
		return $format === true
			? $this->getMessageFromDB( 'infiniteblock' )
			: $infinity;
	}

	if ( $format !== true ) {
		// Caller asked for a specific TS_* timestamp format
		return wfTimestamp( $format, $expiry );
	}

	return $user
		? $this->userTimeAndDate( $expiry, $user )
		: $this->timeanddate( $expiry, /* User preference timezone */ true );
}
4265
/**
 * Formats a time given in seconds into a string representation of that time.
 *
 * The output granularity depends on the magnitude of $seconds:
 * under 10 s one decimal place is shown, under a minute whole seconds,
 * under an hour minutes and seconds, up to 48 hours hours, minutes and
 * (unless any 'avoid' mode is set) seconds, and above that days plus
 * whatever the 'avoid' mode allows.
 *
 * @param int|float $seconds
 * @param array $format An optional argument that formats the returned string in different ways:
 *   If $format['avoid'] === 'avoidhours': don't show hours, just show days
 *   If $format['avoid'] === 'avoidseconds': don't show seconds if $seconds >= 1 hour,
 *   If $format['avoid'] === 'avoidminutes': don't show seconds/minutes if $seconds > 48 hours,
 *   If $format['noabbrevs'] is true: use 'seconds' and friends instead of 'seconds-abbrev'
 *     and friends.
 * @note For backwards compatibility, $format may also be one of the strings 'avoidseconds'
 *   or 'avoidminutes'.
 * @return string
 */
public function formatTimePeriod( $seconds, $format = [] ) {
	if ( !is_array( $format ) ) {
		$format = [ 'avoid' => $format ]; // For backwards compatibility
	}
	$format['avoid'] ??= false;
	$format['noabbrevs'] ??= false;
	$avoid = $format['avoid'];

	$secondsMsg = $this->msg( $format['noabbrevs'] ? 'seconds' : 'seconds-abbrev' );
	$minutesMsg = $this->msg( $format['noabbrevs'] ? 'minutes' : 'minutes-abbrev' );
	$hoursMsg = $this->msg( $format['noabbrevs'] ? 'hours' : 'hours-abbrev' );
	$daysMsg = $this->msg( $format['noabbrevs'] ? 'days' : 'days-abbrev' );
	$space = $this->msg( 'word-separator' )->text();

	if ( round( $seconds * 10 ) < 100 ) {
		// Less than ten seconds: keep one decimal place
		$s = $this->formatNum( sprintf( "%.1f", round( $seconds * 10 ) / 10 ) );
		$s = $secondsMsg->params( $s )->text();
	} elseif ( round( $seconds ) < 60 ) {
		$s = $this->formatNum( round( $seconds ) );
		$s = $secondsMsg->params( $s )->text();
	} elseif ( round( $seconds ) < 3600 ) {
		$minutes = floor( $seconds / 60 );
		$secondsPart = round( fmod( $seconds, 60 ) );
		if ( $secondsPart == 60 ) {
			// Rounding filled the minute: carry over
			$secondsPart = 0;
			$minutes++;
		}
		$s = $minutesMsg->params( $this->formatNum( $minutes ) )->text();
		$s .= $space;
		$s .= $secondsMsg->params( $this->formatNum( $secondsPart ) )->text();
	} elseif ( round( $seconds ) <= 2 * 86400 ) {
		$hours = floor( $seconds / 3600 );
		$minutes = floor( ( $seconds - $hours * 3600 ) / 60 );
		$secondsPart = round( $seconds - $hours * 3600 - $minutes * 60 );
		if ( $secondsPart == 60 ) {
			$secondsPart = 0;
			$minutes++;
		}
		if ( $minutes == 60 ) {
			$minutes = 0;
			$hours++;
		}
		$s = $hoursMsg->params( $this->formatNum( $hours ) )->text();
		$s .= $space;
		$s .= $minutesMsg->params( $this->formatNum( $minutes ) )->text();
		// Strict comparison: only the documented mode strings suppress the
		// seconds, consistent with the === checks used for longer periods.
		if ( !in_array( $avoid, [ 'avoidseconds', 'avoidminutes', 'avoidhours' ], true ) ) {
			$s .= $space . $secondsMsg->params( $this->formatNum( $secondsPart ) )->text();
		}
	} else {
		$days = floor( $seconds / 86400 );
		if ( $avoid === 'avoidhours' ) {
			$hours = round( ( $seconds - $days * 86400 ) / 3600 );
			if ( $hours == 24 ) {
				$days++;
			}
			$s = $daysMsg->params( $this->formatNum( $days ) )->text();
		} elseif ( $avoid === 'avoidminutes' ) {
			$hours = round( ( $seconds - $days * 86400 ) / 3600 );
			if ( $hours == 24 ) {
				$hours = 0;
				$days++;
			}
			$s = $daysMsg->params( $this->formatNum( $days ) )->text();
			$s .= $space;
			$s .= $hoursMsg->params( $this->formatNum( $hours ) )->text();
		} elseif ( $avoid === 'avoidseconds' ) {
			$hours = floor( ( $seconds - $days * 86400 ) / 3600 );
			$minutes = round( ( $seconds - $days * 86400 - $hours * 3600 ) / 60 );
			if ( $minutes == 60 ) {
				$minutes = 0;
				$hours++;
			}
			if ( $hours == 24 ) {
				$hours = 0;
				$days++;
			}
			$s = $daysMsg->params( $this->formatNum( $days ) )->text();
			$s .= $space;
			$s .= $hoursMsg->params( $this->formatNum( $hours ) )->text();
			$s .= $space;
			$s .= $minutesMsg->params( $this->formatNum( $minutes ) )->text();
		} else {
			// No restriction: days, then format the remainder recursively
			$s = $daysMsg->params( $this->formatNum( $days ) )->text();
			$s .= $space;
			$s .= $this->formatTimePeriod( $seconds - $days * 86400, $format );
		}
	}
	return $s;
}
4371
/**
 * Format a bitrate for output, picking the unit that suits its
 * magnitude (bps, kbps, Mbps, Gbps, Tbps, Pbps, Ebps, Zbps, Ybps, Rbps or Qbps).
 *
 * This uses base 1000. For base 1024 use formatSize(), for another base
 * see formatComputingNumbers().
 *
 * @param int $bps Bitrate in bits per second
 * @return string
 */
public function formatBitrate( $bps ) {
	// messages used: bitrate-bits, bitrate-kilobits, bitrate-megabits, bitrate-gigabits, bitrate-terabits,
	// bitrate-petabits, bitrate-exabits, bitrate-zettabits, bitrate-yottabits, bitrate-ronnabits,
	// bitrate-quettabits
	$keyPattern = "bitrate-$1bits";
	return $this->formatComputingNumbers( $bps, 1000, $keyPattern );
}
4389
/**
 * Format a quantity using the largest unit prefix (none, kilo, mega, ...
 * up to quetta) for which the scaled value stays below $boundary.
 *
 * The '$1' in $messageKey is replaced by the chosen prefix to build the
 * message key; the '$1' in the message text is then replaced by the
 * formatted number. Values are shown without decimals for the base and
 * kilo units and with up to two decimals from mega upwards. Sizes of
 * zero or less are always shown in the base unit.
 *
 * @param int $size Size of the unit
 * @param int $boundary Size boundary (1000, or 1024 in most cases)
 * @param string $messageKey Message key to be used
 * @return string
 */
public function formatComputingNumbers( $size, $boundary, $messageKey ) {
	if ( $size <= 0 ) {
		return str_replace( '$1', $this->formatNum( $size ),
			$this->getMessageFromDB( str_replace( '$1', '', $messageKey ) )
		);
	}
	$sizes = [ '', 'kilo', 'mega', 'giga', 'tera', 'peta', 'exa', 'zetta', 'yotta', 'ronna', 'quetta' ];
	$maxIndex = count( $sizes ) - 1;

	$index = 0;
	while ( $size >= $boundary && $index < $maxIndex ) {
		$index++;
		$size /= $boundary;
	}

	// For small sizes no decimal places necessary; for MB and larger
	// units, two decimal places are smarter
	$size = round( $size, $index > 1 ? 2 : 0 );

	if ( $size >= $boundary && $index < $maxIndex ) {
		// Rounding carried the value up to a full unit of the next prefix
		// (e.g. 1023.6 rounds to 1024), so show it in that unit instead.
		$index++;
		$size = round( $size / $boundary, $index > 1 ? 2 : 0 );
	}

	$msg = str_replace( '$1', $sizes[$index], $messageKey );
	$text = $this->getMessageFromDB( $msg );
	return str_replace( '$1', $this->formatNum( $size ), $text );
}
4423
/**
 * Format a size in bytes for output, picking the unit that suits its
 * magnitude (B, KB, MB, GB, TB, PB, EB, ZB, YB, RB or QB).
 *
 * This method uses base 1024. For base 1000 use formatBitrate(), for
 * another base see formatComputingNumbers().
 *
 * @param int $size Size to format
 * @return string Plain text (not HTML)
 */
public function formatSize( $size ) {
	// messages used: size-bytes, size-kilobytes, size-megabytes, size-gigabytes, size-terabytes,
	// size-petabytes, size-exabytes, size-zettabytes, size-yottabytes, size-ronnabytes, size-quettabytes
	$keyPattern = "size-$1bytes";
	return $this->formatComputingNumbers( $size, 1024, $keyPattern );
}
4439
/**
 * Build a list item as used by various special pages.
 *
 * With details, the page link is wrapped in a <bdi> element carrying
 * this language's direction, followed by the word separator and the
 * details inside the 'parentheses' message. Without details (any falsy
 * value), the page link is returned as given.
 *
 * @param string $page Page link
 * @param string $details HTML safe text between brackets
 * @return string HTML escaped
 */
public function specialList( $page, $details ) {
	if ( $details ) {
		$isolatedPage = Html::rawElement( 'bdi', [ 'dir' => $this->getDir() ], $page );
		$separator = $this->msg( 'word-separator' )->escaped();
		$bracketed = $this->msg( 'parentheses' )->rawParams( $details )->escaped();
		return $isolatedPage . $separator . $bracketed;
	}

	return $page;
}
4456
/**
 * Get the compiled plural rules for the language.
 *
 * The 'compiledPluralRules' item is looked up for this language's
 * lowercased code first; if that yields nothing, the fallback languages
 * are tried in order and the first non-empty result is used.
 *
 * @since 1.20
 * @return array<int,string> Associative array with plural form, and plural rule as key-value pairs
 */
public function getCompiledPluralRules() {
	$cache = $this->localisationCache;
	$rules = $cache->getItem( strtolower( $this->mCode ), 'compiledPluralRules' );
	if ( $rules ) {
		return $rules;
	}
	foreach ( $this->getFallbackLanguages() as $code ) {
		$rules = $cache->getItem( strtolower( $code ), 'compiledPluralRules' );
		if ( $rules ) {
			return $rules;
		}
	}
	// Nothing usable found: hand back whatever the last lookup produced
	return $rules;
}
4478
/**
 * Get the plural rules for the language.
 *
 * The 'pluralRules' item is looked up for this language's lowercased
 * code first; if that yields nothing, the fallback languages are tried
 * in order and the first non-empty result is used.
 *
 * @since 1.20
 * @return array<int,string> Associative array with plural form number and plural rule as key-value pairs
 */
public function getPluralRules() {
	$cache = $this->localisationCache;
	$rules = $cache->getItem( strtolower( $this->mCode ), 'pluralRules' );
	if ( $rules ) {
		return $rules;
	}
	foreach ( $this->getFallbackLanguages() as $code ) {
		$rules = $cache->getItem( strtolower( $code ), 'pluralRules' );
		if ( $rules ) {
			return $rules;
		}
	}
	// Nothing usable found: hand back whatever the last lookup produced
	return $rules;
}
4500
/**
 * Get the plural rule types for the language.
 *
 * The 'pluralRuleTypes' item is looked up for this language's lowercased
 * code first; if that yields nothing, the fallback languages are tried
 * in order and the first non-empty result is used.
 *
 * @since 1.22
 * @return array<int,string> Associative array with plural form number and plural rule type as key-value pairs
 */
public function getPluralRuleTypes() {
	$cache = $this->localisationCache;
	$types = $cache->getItem( strtolower( $this->mCode ), 'pluralRuleTypes' );
	if ( $types ) {
		return $types;
	}
	foreach ( $this->getFallbackLanguages() as $code ) {
		$types = $cache->getItem( strtolower( $code ), 'pluralRuleTypes' );
		if ( $types ) {
			return $types;
		}
	}
	// Nothing usable found: hand back whatever the last lookup produced
	return $types;
}
4522
/**
 * Find the index number of the plural rule appropriate for the given number.
 *
 * The number is evaluated against this language's compiled plural rules.
 *
 * @param int $number
 * @return int The index number of the plural rule
 */
public function getPluralRuleIndexNumber( $number ) {
	return Evaluator::evaluateCompiled( $number, $this->getCompiledPluralRules() );
}
4533
/**
 * Find the plural rule type appropriate for the given number.
 * For example, if the language is set to Arabic, getPluralType(5) should
 * return 'few'.
 *
 * When no type is recorded for the rule index of the number, 'other'
 * is returned.
 *
 * @since 1.22
 * @param int $number
 * @return string The name of the plural rule type, e.g., one, two, few, many
 */
public function getPluralRuleType( $number ) {
	$ruleIndex = $this->getPluralRuleIndexNumber( $number );
	$types = $this->getPluralRuleTypes();
	if ( isset( $types[$ruleIndex] ) ) {
		return $types[$ruleIndex];
	}
	return 'other';
}
4548
/**
 * Obtain the LanguageConverter for this language from the converter
 * factory. Convenience function for use in the language classes only.
 *
 * @return ILanguageConverter
 */
protected function getConverterInternal() {
	$converter = $this->converterFactory->getLanguageConverter( $this );
	return $converter;
}
4558
/**
 * Return the HookContainer held by this object, for hook metadata and
 * for running extension hooks.
 *
 * @since 1.35
 * @return HookContainer
 */
protected function getHookContainer() {
	return $this->hookContainer;
}
4568
/**
 * Return the HookRunner held by this object, for running core hooks.
 *
 * @internal This is for use by core only. Hook interfaces may be removed
 *   without notice.
 * @since 1.35
 * @return HookRunner
 */
protected function getHookRunner() {
	return $this->hookRunner;
}
4580
/**
 * Collect this language's number-formatting, grammar, plural and
 * fallback data, plus the non-standard language code mapping, into
 * one array keyed by data name.
 *
 * @internal Only for use by the 'mediawiki.language' ResourceLoader module and
 *   generateJqueryMsgData.php
 * @return array
 */
public function getJsData() {
	$data = [];
	$data['digitTransformTable'] = $this->digitTransformTable();
	$data['separatorTransformTable'] = $this->separatorTransformTable();
	$data['minimumGroupingDigits'] = $this->minimumGroupingDigits();
	$data['formalityIndex'] = $this->getFormalityIndex();
	$data['grammarForms'] = $this->getGrammarForms();
	$data['grammarTransformations'] = $this->getGrammarTransformations();
	$data['pluralRules'] = $this->getPluralRules();
	$data['digitGroupingPattern'] = $this->digitGroupingPattern();
	$data['fallbackLanguages'] = $this->getFallbackLanguages();
	$data['bcp47Map'] = LanguageCode::getNonstandardLanguageCodeMapping();
	return $data;
}
4600	}
4601
/**
 * Register 'Language' as an alias name for this class.
 *
 * @deprecated class alias since 1.43
 */
class_alias( Language::class, 'Language' );