MediaWiki REL1_37
MediaWiki\Languages\Data\CrhExceptions Class Reference

Public Member Functions

 __construct ()
 
 loadExceptions ( $lcChars, $ucChars)
 

Public Attributes

 $Cyrl2LatnExceptions = []
 
 $Cyrl2LatnPatterns = []
 
 $Latn2CyrlExceptions = []
 
 $Latn2CyrlPatterns = []
 

Private Member Functions

 addMappings ( $mapArray, &$A2B, &$B2A, $exactCase=false, $prePat='', $postPat='')
 
 initLcUc ( $lcChars, $ucChars, $reinit=false)
 
 loadRegs ()
 
 myLc ( $string)
 
 myUc ( $string)
 
 myUcWord ( $string)
 

Private Attributes

 $Cyrl2LatnRegexes = []
 
 $CyrlCleanUpRegexes
 
string[] $exactCaseMappings
 Maps Cyrillic to Latin and back; simple string match only (no regex). No variants: entries are mapped exactly as is.
 
 $Latn2CyrlRegexes = []
 
 $lc2uc
 
string[] $ManyToOneC2LMappings
 Maps Latin to Cyrillic and back; simple string match only (no regex). Variants: all lowercase, all uppercase, first letter capitalized.
 
string[] $multiCaseMappings
 Maps Cyrillic to Latin and back; simple string match only (no regex). Variants: all lowercase, all uppercase, first letter capitalized.
 
string[] $prefixMapping
 Maps Cyrillic to Latin and back; matches at the beginning of a word. Variants: all lowercase, all uppercase, first letter capitalized. Items with capture group refs (e.g., $1) are only mapped from the regex to the reference.
 
string[] $suffixMapping
 Maps Cyrillic to Latin and back; matches at the end of a word. Variants: all lowercase, all uppercase, first letter capitalized (the "first letter capitalized" variant was in the source). Items with capture group refs (e.g., $1) are only mapped from the regex to the reference.
 
 $uc2lc
 
const WB = '\b'
 

Detailed Description

Definition at line 14 of file CrhExceptions.php.

Constructor & Destructor Documentation

◆ __construct()

MediaWiki\Languages\Data\CrhExceptions::__construct ( )

Member Function Documentation

◆ addMappings()

MediaWiki\Languages\Data\CrhExceptions::addMappings (   $mapArray,
& $A2B,
& $B2A,
  $exactCase = false,
  $prePat = '',
  $postPat = '' 
)
private

◆ initLcUc()

MediaWiki\Languages\Data\CrhExceptions::initLcUc (   $lcChars,
  $ucChars,
  $reinit = false 
)
private

◆ loadExceptions()

◆ loadRegs()

◆ myLc()

MediaWiki\Languages\Data\CrhExceptions::myLc (   $string)
private

Definition at line 51 of file CrhExceptions.php.

Referenced by MediaWiki\Languages\Data\CrhExceptions::myUcWord().

◆ myUc()

MediaWiki\Languages\Data\CrhExceptions::myUc (   $string)
private

◆ myUcWord()

MediaWiki\Languages\Data\CrhExceptions::myUcWord (   $string)
private

Member Data Documentation

◆ $Cyrl2LatnExceptions

MediaWiki\Languages\Data\CrhExceptions::$Cyrl2LatnExceptions = []

◆ $Cyrl2LatnPatterns

MediaWiki\Languages\Data\CrhExceptions::$Cyrl2LatnPatterns = []

◆ $Cyrl2LatnRegexes

MediaWiki\Languages\Data\CrhExceptions::$Cyrl2LatnRegexes = []
private

◆ $CyrlCleanUpRegexes

MediaWiki\Languages\Data\CrhExceptions::$CyrlCleanUpRegexes
private

◆ $exactCaseMappings

string [] MediaWiki\Languages\Data\CrhExceptions::$exactCaseMappings
private
Initial value:
= [
# аббревиатуры
# abbreviations
'ОБСЕ' => 'OBSE', 'КъМДж' => 'QMC', 'КъДж' => 'QC', 'КъАЭ' => 'QAE', 'ГъСМК' => 'ĞSMK',
'ШСДжБ' => 'ŞSCB', 'КъМШСДж' => 'QMŞSC', 'КъАССР' => 'QASSR', 'КъДМПУ' => 'QDMPU',
'КъМПУ' => 'QMPU',
]

Maps Cyrillic to Latin and back; simple string match only (no regex). No variants: entries are mapped exactly as is.

Definition at line 355 of file CrhExceptions.php.

◆ $Latn2CyrlExceptions

MediaWiki\Languages\Data\CrhExceptions::$Latn2CyrlExceptions = []

◆ $Latn2CyrlPatterns

MediaWiki\Languages\Data\CrhExceptions::$Latn2CyrlPatterns = []

◆ $Latn2CyrlRegexes

MediaWiki\Languages\Data\CrhExceptions::$Latn2CyrlRegexes = []
private

◆ $lc2uc

MediaWiki\Languages\Data\CrhExceptions::$lc2uc
private

Definition at line 28 of file CrhExceptions.php.

◆ $ManyToOneC2LMappings

string [] MediaWiki\Languages\Data\CrhExceptions::$ManyToOneC2LMappings
private
Initial value:
= [
# Carefully ordered many-to-one mappings
# these are ordered so C2L is correct (the later Latin one)
# see also L2C mappings below
'fevqülade' => 'февкъульаде', 'fevqulade' => 'февкъульаде',
'beyude' => 'бейуде', 'beyüde' => 'бейуде',
'curat' => 'джурьат', 'cürat' => 'джурьат',
'mesul' => 'месуль', 'mesül' => 'месуль',
]

Maps Latin to Cyrillic and back; simple string match only (no regex). Variants: all lowercase, all uppercase, first letter capitalized.

Definition at line 123 of file CrhExceptions.php.

◆ $multiCaseMappings

string [] MediaWiki\Languages\Data\CrhExceptions::$multiCaseMappings
private

Maps Cyrillic to Latin and back; simple string match only (no regex). Variants: all lowercase, all uppercase, first letter capitalized.

Definition at line 137 of file CrhExceptions.php.

◆ $prefixMapping

string [] MediaWiki\Languages\Data\CrhExceptions::$prefixMapping
private
Initial value:
= [
# originally C2L
'буюк([^ъ])' => 'büyük$1', 'бую([гдйлмнпрстчшc])(и)' => 'büyü$1$2',
'буют([^ыа])' => 'büyüt$1', 'джонк([^ъ])' => 'cönk$1', 'коюм' => 'köyüm', 'коюнъ' => 'köyüñ',
'коюн([ди])' => 'köyün$1', 'куе' => 'küye', 'куркке' => 'kürkke', 'куркни' => 'kürkni',
'куркте' => 'kürkte', 'куркчю' => 'kürkçü', 'кою' => 'köyü',
'жизнь' => 'jizn',
# арабизмы на муи- муэ- / Arabic муи- муэ-
'му([иэИЭ])' => 'mü$1',
# originally L2C, here swapped
'роль$1' => 'rol([^ü]|' . self::WB . ')',
'усть$1' => 'üst([^ü]|' . self::WB . ')',
# more prefixes
'ком-кок' => 'köm-kök',
]

Maps Cyrillic to Latin and back; matches at the beginning of a word. Variants: all lowercase, all uppercase, first letter capitalized. Items with capture group refs (e.g., $1) are only mapped from the regex to the reference.

Definition at line 389 of file CrhExceptions.php.

◆ $suffixMapping

string [] MediaWiki\Languages\Data\CrhExceptions::$suffixMapping
private
Initial value:
= [
# originally C2L
'иаль' => 'ial', 'нуль' => 'nul', 'кой' => 'köy', 'койнинъ' => 'köyniñ', 'койни' => 'köyni',
'койге' => 'köyge', 'койде' => 'köyde', 'койдеки' => 'köydeki', 'койден' => 'köyden',
'козь' => 'köz', '-юнджи' => '-ünci', '-юнджиде' => '-üncide', '-юнджиден' => '-ünciden',
# originally L2C, here swapped
'льная' => 'lnaya', 'льное' => 'lnoye', 'льный' => 'lnıy', 'льний' => 'lniy',
'льская' => 'lskaya', 'льский' => 'lskiy', 'льское' => 'lskoye', 'ополь' => 'opol',
'щее' => 'şçeye', 'щий' => 'şçiy', 'щая' => 'şçaya', 'цепс' => 'tseps',
]

Maps Cyrillic to Latin and back; matches at the end of a word. Variants: all lowercase, all uppercase, first letter capitalized (the "first letter capitalized" variant was in the source). Items with capture group refs (e.g., $1) are only mapped from the regex to the reference.

Definition at line 370 of file CrhExceptions.php.

◆ $uc2lc

MediaWiki\Languages\Data\CrhExceptions::$uc2lc
private

Definition at line 29 of file CrhExceptions.php.

◆ WB

const MediaWiki\Languages\Data\CrhExceptions::WB = '\b'
private

Definition at line 16 of file CrhExceptions.php.


The documentation for this class was generated from the following file: