MediaWiki REL1_30
MagicWordArray.php
Go to the documentation of this file.
1<?php
2
26
/** @var array Magic word names held by this array (set by the constructor, extended by add()/addArray()) */
33 public $names = [];
34
/** @var array|null Lazily built lookup table from getHash(); reset to null whenever names change */
36 private $hash;
37
/** @var array|null Lazily built pair of regex alternations from getBaseRegex(); reset to null whenever names change */
38 private $baseRegex;
39
/** @var array|null Lazily built pair of delimited regexes from getRegex(); reset to null whenever names change */
40 private $regex;
41
/**
 * Create a magic word array from an initial list of names.
 *
 * The list is stored as given; no lookup tables or regexes are built
 * until one of the getters is called.
 *
 * @param array $names Magic word names to start with
 */
public function __construct( $names = [] ) {
	$this->names = $names;
}
48
/**
 * Add a magic word by name.
 *
 * Appends the name and throws away every cached structure so that the
 * next getter call rebuilds it with the new word included.
 *
 * @param string $name
 */
public function add( $name ) {
	$this->names[] = $name;

	// Invalidate all lazily built caches.
	$this->regex = null;
	$this->baseRegex = null;
	$this->hash = null;
}
58
/**
 * Add a number of magic words by name.
 *
 * Only the values of $names are used; its keys are discarded before the
 * list is merged into the existing names. All cached structures are reset.
 *
 * @param array $names
 */
public function addArray( $names ) {
	$additions = array_values( $names );
	$this->names = array_merge( $this->names, $additions );

	// Invalidate all lazily built caches.
	$this->regex = null;
	$this->baseRegex = null;
	$this->hash = null;
}
68
/**
 * Get a 2-d hashtable for this array.
 *
 * The result has two buckets: index 1 maps the synonyms of case-sensitive
 * magic words to their name, index 0 maps the content-language lower-cased
 * synonyms of case-insensitive magic words to their name. The table is
 * built on first use and cached until the name list changes.
 *
 * @return array
 */
public function getHash() {
	global $wgContLang;

	if ( $this->hash !== null ) {
		return $this->hash;
	}

	$this->hash = [ 0 => [], 1 => [] ];
	foreach ( $this->names as $id ) {
		$word = MagicWord::get( $id );
		$bucket = (int)$word->isCaseSensitive();
		foreach ( $word->getSynonyms() as $synonym ) {
			// Case-insensitive words are stored under their lower-cased form.
			$key = $bucket ? $synonym : $wgContLang->lc( $synonym );
			$this->hash[$bucket][$key] = $id;
		}
	}
	return $this->hash;
}
90
/**
 * Get the base regex.
 *
 * Returns a two-element array of regex alternations without delimiters or
 * flags: index 0 covers the case-insensitive magic words, index 1 the
 * case-sensitive ones. Every synonym becomes one named group whose name is
 * "<letter-encoded synonym index>_<magic word name>". An element is the
 * empty string when there is no synonym for that case class.
 *
 * The result is cached until the name list changes. The cache is only
 * written once the whole list has been processed, so a failure part-way
 * through cannot leave a truncated regex behind for later callers.
 *
 * @return string[]
 * @throws MWException If two synonyms would produce the same group name
 */
public function getBaseRegex() {
	if ( is_null( $this->baseRegex ) ) {
		$groupsByCase = [ 0 => [], 1 => [] ];
		$seenGroupNames = [];
		foreach ( $this->names as $name ) {
			$magic = MagicWord::get( $name );
			$case = intval( $magic->isCaseSensitive() );
			foreach ( $magic->getSynonyms() as $i => $syn ) {
				// Group name must start with a non-digit in PCRE 8.34+
				$it = strtr( $i, '0123456789', 'abcdefghij' );
				$groupName = $it . '_' . $name;
				// look for same group names to avoid same named subpatterns in the regex
				if ( isset( $seenGroupNames[$groupName] ) ) {
					throw new MWException(
						__METHOD__ . ': duplicate internal name in magic word array: ' . $name
					);
				}
				$seenGroupNames[$groupName] = true;
				$groupsByCase[$case][] = '(?P<' . $groupName . '>' . preg_quote( $syn, '/' ) . ')';
			}
		}
		// Publish the cache only after everything was built successfully.
		$this->baseRegex = [
			0 => implode( '|', $groupsByCase[0] ),
			1 => implode( '|', $groupsByCase[1] ),
		];
	}
	return $this->baseRegex;
}
124
/**
 * Get an unanchored regex that does not match parameters.
 *
 * Wraps each non-empty alternation from getBaseRegex() in delimiters:
 * index 0 gets the flags "iuS" (case-insensitive words), index 1 gets "S"
 * (case-sensitive words). An empty alternation yields an empty string
 * instead of a regex. The result is cached until the name list changes.
 *
 * @return string[]
 */
public function getRegex() {
	if ( is_null( $this->regex ) ) {
		$base = $this->getBaseRegex();
		$this->regex = [ '', '' ];
		// Test the value that was actually returned, the same way
		// getRegexStart() and getVariableStartToEndRegex() do, rather than
		// peeking at the private cache behind getBaseRegex().
		if ( $base[0] !== '' ) {
			$this->regex[0] = "/{$base[0]}/iuS";
		}
		if ( $base[1] !== '' ) {
			$this->regex[1] = "/{$base[1]}/S";
		}
	}
	return $this->regex;
}
142
/**
 * Get a regex for matching variables with parameters.
 *
 * Takes the regexes from getRegex() and turns every escaped "$1"
 * placeholder into a lazy capture group.
 *
 * @return string[]
 */
public function getVariableRegex() {
	$plain = $this->getRegex();
	return str_replace( "\\$1", "(.*?)", $plain );
}
151
/**
 * Get a regex anchored to the start of the string that does not match parameters.
 *
 * Index 0 holds the case-insensitive regex, index 1 the case-sensitive one;
 * an entry is an empty string when the corresponding base alternation is
 * empty. Nothing is cached here, the regexes are assembled on every call.
 *
 * @return string[]
 */
public function getRegexStart() {
	$alt = $this->getBaseRegex();
	return [
		$alt[0] !== '' ? "/^(?:{$alt[0]})/iuS" : '',
		$alt[1] !== '' ? "/^(?:{$alt[1]})/S" : '',
	];
}
168
/**
 * Get an anchored regex for matching variables with parameters.
 *
 * Each non-empty base alternation is anchored at both ends and every
 * escaped "$1" placeholder in it is replaced by a lazy capture group.
 * Index 0 is the case-insensitive regex, index 1 the case-sensitive one;
 * an empty base alternation yields an empty string.
 *
 * @return string[]
 */
public function getVariableStartToEndRegex() {
	$alt = $this->getBaseRegex();
	$anchored = [ '', '' ];
	if ( $alt[0] !== '' ) {
		$template = "/^(?:{$alt[0]})$/iuS";
		$anchored[0] = str_replace( "\\$1", "(.*?)", $template );
	}
	if ( $alt[1] !== '' ) {
		$template = "/^(?:{$alt[1]})$/S";
		$anchored[1] = str_replace( "\\$1", "(.*?)", $template );
	}
	return $anchored;
}
185
/**
 * Get the list of magic word names currently held by this array.
 *
 * @return array
 */
public function getNames() {
	return $this->names;
}
193
/**
 * Parse a match array from preg_match.
 *
 * Finds the first entry, other than the whole-match entry at key 0, whose
 * value is not the empty string. Its key is expected to have the form
 * "<synonym index>_<magic word name>". The returned parameter value is the
 * element two positions after that entry (i.e. the one following the
 * entry's immediate successor), or false when the array ends before that.
 *
 * The array is walked with key()/current()/next() because each() was
 * deprecated in PHP 7.2 and removed in PHP 8.0.
 *
 * @param array $m Match array as filled in by preg_match
 * @return array [ magic word name, parameter value or false ]
 * @throws MWException If no usable entry is found or a key has no "_"
 */
public function parseMatch( $m ) {
	reset( $m );
	while ( ( $key = key( $m ) ) !== null ) {
		$value = current( $m );
		// Advance right away, like each() did, so the next() call below
		// skips the element directly after the matching entry.
		next( $m );
		if ( $key === 0 || $value === '' ) {
			continue;
		}
		$parts = explode( '_', $key, 2 );
		if ( count( $parts ) != 2 ) {
			// This shouldn't happen
			throw new MWException( __METHOD__ . ': bad parameter name' );
		}
		list( /* $synIndex */, $magicName ) = $parts;
		$paramValue = next( $m );
		return [ $magicName, $paramValue ];
	}
	// This shouldn't happen either
	throw new MWException( __METHOD__ . ': parameter not found' );
}
223
/**
 * Match some text, with parameter capture.
 *
 * Tries the anchored variable regexes from getVariableStartToEndRegex()
 * in order and hands the first successful match to parseMatch().
 *
 * @param string $text
 * @return array The result of parseMatch() for the first regex that
 *   matches, or [ false, false ] if none does
 */
public function matchVariableStartToEnd( $text ) {
	// Without this assignment the loop below iterates an undefined
	// variable and the method can never report a match.
	$regexes = $this->getVariableStartToEndRegex();
	foreach ( $regexes as $regex ) {
		if ( $regex !== '' ) {
			$m = [];
			if ( preg_match( $regex, $text, $m ) ) {
				return $this->parseMatch( $m );
			}
		}
	}
	return [ false, false ];
}
246
/**
 * Match some text, without parameter capture.
 *
 * Looks the text up verbatim among the case-sensitive synonyms first; if
 * that fails, the content-language lower-cased text is looked up among the
 * case-insensitive synonyms.
 *
 * @param string $text
 * @return string|bool The magic word name, or false if nothing matched
 */
public function matchStartToEnd( $text ) {
	global $wgContLang;

	$table = $this->getHash();
	if ( isset( $table[1][$text] ) ) {
		return $table[1][$text];
	}

	$folded = $wgContLang->lc( $text );
	return isset( $table[0][$folded] ) ? $table[0][$folded] : false;
}
267
/**
 * Find every magic word of this array in $text and strip the matches.
 *
 * Each non-empty regex from getRegex() is run over the text. Every match
 * is parsed with parseMatch() and recorded in the result (later matches of
 * the same name overwrite earlier ones); afterwards all matches of that
 * regex are removed from $text.
 *
 * PCRE failures are logged to the 'parser' channel. If the removal step
 * fails, $text is left as it was instead of being overwritten with null.
 *
 * @param string &$text Text to search; matched items are removed from it
 * @return array Associative array, magic word name => parameter value
 */
public function matchAndRemove( &$text ) {
	$found = [];
	$regexes = $this->getRegex();
	foreach ( $regexes as $regex ) {
		if ( $regex === '' ) {
			continue;
		}
		$matches = [];
		$res = preg_match_all( $regex, $text, $matches, PREG_SET_ORDER );
		if ( $res === false ) {
			LoggerFactory::getInstance( 'parser' )->warning( 'preg_match_all returned false', [
				'code' => preg_last_error(),
				'regex' => $regex,
				'text' => $text,
			] );
		} elseif ( $res ) {
			foreach ( $matches as $m ) {
				list( $name, $param ) = $this->parseMatch( $m );
				$found[$name] = $param;
			}
		}
		$res = preg_replace( $regex, '', $text );
		if ( $res === null ) {
			LoggerFactory::getInstance( 'parser' )->warning( 'preg_replace returned null', [
				'code' => preg_last_error(),
				'regex' => $regex,
				'text' => $text,
			] );
			// Keep the caller's text intact rather than replacing it with null.
			continue;
		}
		$text = $res;
	}
	return $found;
}
309
/**
 * Return the ID of the magic word at the start of $text, and remove
 * the prefix from $text.
 *
 * The start-anchored regexes from getRegexStart() are tried in order; the
 * first one that matches decides the result. When the match covers the
 * whole text, $text becomes the empty string.
 *
 * @param string &$text Text to inspect; the matched prefix is cut off
 * @return string|bool The magic word name from parseMatch(), or false if
 *   no regex matched (in which case $text is left unchanged)
 */
public function matchStartAndRemove( &$text ) {
	foreach ( $this->getRegexStart() as $pattern ) {
		if ( $pattern === '' || !preg_match( $pattern, $text, $m ) ) {
			continue;
		}
		list( $id, ) = $this->parseMatch( $m );
		$prefixLength = strlen( $m[0] );
		$text = $prefixLength >= strlen( $text ) ? '' : substr( $text, $prefixLength );
		return $id;
	}
	return false;
}
338}
MediaWiki exception.
Class for handling an array of magic words.
matchVariableStartToEnd( $text)
Match some text, with parameter capture. Returns an array with the magic word name in the first element and the parameter in the second element; both elements are false if there was no match.
add( $name)
Add a magic word by name.
getVariableRegex()
Get a regex for matching variables with parameters.
parseMatch( $m)
Parse a match array from preg_match. Returns array(magic word ID, parameter value). If there is no parameter value, that element will be false.
matchStartToEnd( $text)
Match some text, without parameter capture. Returns the magic word name, or false if there was no capture.
getRegexStart()
Get a regex anchored to the start of the string that does not match parameters.
getBaseRegex()
Get the base regex.
matchStartAndRemove(&$text)
Return the ID of the magic word at the start of $text, and remove the prefix from $text.
getRegex()
Get an unanchored regex that does not match parameters.
getVariableStartToEndRegex()
Get an anchored regex for matching variables with parameters.
__construct( $names=[])
getHash()
Get a 2-d hashtable for this array.
matchAndRemove(&$text)
Returns an associative array, ID => param value, for all items that match. Removes the matched items from the input string (passed by reference).
addArray( $names)
Add a number of magic words by name.
static & get( $id)
Factory: creates an object representing an ID.
PSR-3 logger instance factory.
if( $wgSpamBlacklistFiles) $regexes
Definition cleanup.php:88
$res
Definition database.txt:21
deferred txt A few of the database updates required by various functions here can be deferred until after the result page is displayed to the user For updating the view updating the linked to tables after a etc PHP does not yet have any way to tell the server to actually return and disconnect while still running these but it might have such a feature in the future We handle these by creating a deferred update object and putting those objects on a global list
Definition deferred.txt:11
this class mediates it Skin Encapsulates a look and feel for the wiki All of the functions that render HTML and make choices about how to render it are here and are called from various other places when and is meant to be subclassed with other skins that may override some of its functions The User object contains a reference to a and so rather than having a global skin object we just rely on the global User and get the skin with $wgUser and also has some character encoding functions and other locale stuff The current user interface language is instantiated as and the local content language as $wgContLang
Definition design.txt:57
Allows to change the fields on the form that will be generated $name
Definition hooks.txt:302
processing should stop and the error should be shown to the user * false
Definition hooks.txt:187