81 # Flags for Parser::setFunctionHook
85 # Constants needed for external link processing
86 # Everything except bracket, space, or control characters
87 # \p{Zs} is unicode 'separator, space' category. It covers the space 0x20
88 # as well as U+3000 (IDEOGRAPHIC SPACE), see bug 19052
90 # Simplified expression to match an IPv4 or IPv6 address, or
91 # at least one character of a host name (embeds EXT_LINK_URL_CLASS)
92 const EXT_LINK_ADDR =
'(?:[0-9.]+|\\[(?i:[0-9a-f:.]+)\\]|[^][<>"\\x00-\\x20\\x7F\p{Zs}])';
93 # RegExp to make image URLs (embeds IPv6 part of EXT_LINK_ADDR)
95 const EXT_IMAGE_REGEX =
'/^(http:\/\/|https:\/\/)((?:\\[(?i:[0-9a-f:.]+)\\])?[^][<>"\\x00-\\x20\\x7F\p{Zs}]+)
96 \\/([A-Za-z0-9_.,~%\\-+&;#*?!=()@\\x80-\\xFF]+)\\.((?i)gif|png|jpg|jpeg)$/Sxu';
99 # Regular expression for a non-newline space
102 # State constants for the definition list colon extraction
112 # Flags for preprocessToDom
115 # Allowed values for $this->mOutputType
116 # Parameter to startExternalParse().
121 const
OT_PLAIN = 4;
# like extractSections() - portions of the original are returned unchanged.
140 const MARKER_SUFFIX =
"-QINU`\"'\x7f";
143 # Markers used for wrapping the table of contents
161 # Initialised by initialiseVariables()
172 # Initialised in constructor
175 # Initialized in getPreprocessor()
179 # Cleared with clearState():
210 # These are variables reset at least once per parse regardless of $clearState
223 public $mRevisionObject;
# The revision object of the specified revision ID
256 public $mInParse =
false;
265 $this->mConf = $conf;
267 $this->mExtLinkBracketedRegex =
'/\[(((?i)' . $this->mUrlProtocols .
')' .
268 self::EXT_LINK_ADDR .
269 self::EXT_LINK_URL_CLASS .
'*)\p{Zs}*([^\]\\x00-\\x08\\x0a-\\x1F]*?)\]/Su';
270 if ( isset( $conf[
'preprocessorClass'] ) ) {
271 $this->mPreprocessorClass = $conf[
'preprocessorClass'];
272 } elseif ( defined(
'HPHP_VERSION' ) ) {
273 # Preprocessor_Hash is much faster than Preprocessor_DOM under HipHop
274 $this->mPreprocessorClass =
'Preprocessor_Hash';
275 } elseif ( extension_loaded(
'domxml' ) ) {
276 # PECL extension that conflicts with the core DOM extension (bug 13770)
277 wfDebug(
"Warning: you have the obsolete domxml extension for PHP. Please remove it!\n" );
278 $this->mPreprocessorClass =
'Preprocessor_Hash';
279 } elseif ( extension_loaded(
'dom' ) ) {
280 $this->mPreprocessorClass =
'Preprocessor_DOM';
282 $this->mPreprocessorClass =
'Preprocessor_Hash';
284 wfDebug( __CLASS__ .
": using preprocessor: {$this->mPreprocessorClass}\n" );
291 if ( isset( $this->mLinkHolders ) ) {
292 unset( $this->mLinkHolders );
295 unset( $this->
$name );
303 $this->mInParse =
false;
311 foreach ( [
'mStripState',
'mVarCache' ]
as $k ) {
326 if ( !$this->mFirstCall ) {
329 $this->mFirstCall =
false;
335 Hooks::run(
'ParserFirstCallInit', [ &$this ] );
344 if ( $this->mFirstCall ) {
348 $this->mOptions->registerWatcher( [ $this->mOutput,
'recordOption' ] );
349 $this->mAutonumber = 0;
350 $this->mLastSection =
'';
351 $this->mDTopen =
false;
352 $this->mIncludeCount = [];
353 $this->mArgStack =
false;
354 $this->mInPre =
false;
357 $this->mRevisionObject = $this->mRevisionTimestamp =
358 $this->mRevisionId = $this->mRevisionUser = $this->mRevisionSize = null;
359 $this->mVarCache = [];
361 $this->mLangLinkLanguages = [];
362 $this->currentRevisionCache = null;
366 # Clear these on every parse, bug 4549
367 $this->mTplRedirCache = $this->mTplDomCache = [];
369 $this->mShowToc =
true;
370 $this->mForceTocPosition =
false;
371 $this->mIncludeSizes = [
375 $this->mPPNodeCount = 0;
376 $this->mGeneratedPPNodeCount = 0;
377 $this->mHighestExpansionDepth = 0;
378 $this->mDefaultSort =
false;
379 $this->mHeadings = [];
380 $this->mDoubleUnderscores = [];
381 $this->mExpensiveFunctionCount = 0;
384 if ( isset( $this->mPreprocessor ) && $this->mPreprocessor->parser !== $this ) {
385 $this->mPreprocessor = null;
406 $linestart =
true, $clearState =
true, $revid = null
418 $text = strtr( $text,
"\x7f",
"?" );
419 $magicScopeVariable = $this->
lock();
424 $this->currentRevisionCache = null;
425 $this->mInputSize = strlen( $text );
426 if ( $this->mOptions->getEnableLimitReport() ) {
427 $this->mOutput->resetParseStartTime();
435 if ( $revid !== null ) {
436 $this->mRevisionId = $revid;
437 $this->mRevisionObject = null;
438 $this->mRevisionTimestamp = null;
439 $this->mRevisionUser = null;
440 $this->mRevisionSize = null;
443 Hooks::run(
'ParserBeforeStrip', [ &$this, &$text, &$this->mStripState ] );
445 Hooks::run(
'ParserAfterStrip', [ &$this, &$text, &$this->mStripState ] );
447 Hooks::run(
'ParserAfterParse', [ &$this, &$text, &$this->mStripState ] );
459 || isset( $this->mDoubleUnderscores[
'nocontentconvert'] )
460 || isset( $this->mDoubleUnderscores[
'notitleconvert'] )
461 || $this->mOutput->getDisplayTitle() !==
false )
464 if ( $convruletitle ) {
465 $this->mOutput->setTitleText( $convruletitle );
468 $this->mOutput->setTitleText( $titleText );
472 if ( $this->mExpensiveFunctionCount > $this->mOptions->getExpensiveParserFunctionLimit() ) {
474 $this->mExpensiveFunctionCount,
475 $this->mOptions->getExpensiveParserFunctionLimit()
479 # Information on include size limits, for the benefit of users who try to skirt them
480 if ( $this->mOptions->getEnableLimitReport() ) {
481 $max = $this->mOptions->getMaxIncludeSize();
483 $cpuTime = $this->mOutput->getTimeSinceStart(
'cpu' );
484 if ( $cpuTime !== null ) {
485 $this->mOutput->setLimitReportData(
'limitreport-cputime',
486 sprintf(
"%.3f", $cpuTime )
490 $wallTime = $this->mOutput->getTimeSinceStart(
'wall' );
491 $this->mOutput->setLimitReportData(
'limitreport-walltime',
492 sprintf(
"%.3f", $wallTime )
495 $this->mOutput->setLimitReportData(
'limitreport-ppvisitednodes',
496 [ $this->mPPNodeCount, $this->mOptions->getMaxPPNodeCount() ]
498 $this->mOutput->setLimitReportData(
'limitreport-ppgeneratednodes',
499 [ $this->mGeneratedPPNodeCount, $this->mOptions->getMaxGeneratedPPNodeCount() ]
501 $this->mOutput->setLimitReportData(
'limitreport-postexpandincludesize',
502 [ $this->mIncludeSizes[
'post-expand'], $max ]
504 $this->mOutput->setLimitReportData(
'limitreport-templateargumentsize',
505 [ $this->mIncludeSizes[
'arg'], $max ]
507 $this->mOutput->setLimitReportData(
'limitreport-expansiondepth',
508 [ $this->mHighestExpansionDepth, $this->mOptions->getMaxPPExpandDepth() ]
510 $this->mOutput->setLimitReportData(
'limitreport-expensivefunctioncount',
511 [ $this->mExpensiveFunctionCount, $this->mOptions->getExpensiveParserFunctionLimit() ]
513 Hooks::run(
'ParserLimitReportPrepare', [ $this, $this->mOutput ] );
515 $limitReport =
"NewPP limit report\n";
516 if ( $wgShowHostnames ) {
517 $limitReport .=
'Parsed by ' .
wfHostname() .
"\n";
519 $limitReport .=
'Cached time: ' . $this->mOutput->getCacheTime() .
"\n";
520 $limitReport .=
'Cache expiry: ' . $this->mOutput->getCacheExpiry() .
"\n";
521 $limitReport .=
'Dynamic content: ' .
522 ( $this->mOutput->hasDynamicContent() ?
'true' :
'false' ) .
525 foreach ( $this->mOutput->getLimitReportData()
as $key =>
$value ) {
527 [ $key, &
$value, &$limitReport,
false,
false ]
529 $keyMsg =
wfMessage( $key )->inLanguage(
'en' )->useDatabase(
false );
530 $valueMsg =
wfMessage( [
"$key-value-text",
"$key-value" ] )
531 ->inLanguage(
'en' )->useDatabase(
false );
532 if ( !$valueMsg->exists() ) {
535 if ( !$keyMsg->isDisabled() && !$valueMsg->isDisabled() ) {
536 $valueMsg->params(
$value );
537 $limitReport .=
"{$keyMsg->text()}: {$valueMsg->text()}\n";
543 $limitReport = htmlspecialchars_decode( $limitReport );
544 Hooks::run(
'ParserLimitReport', [ $this, &$limitReport ] );
548 $limitReport = str_replace( [
'-',
'&' ], [
'‐',
'&' ], $limitReport );
549 $text .=
"\n<!-- \n$limitReport-->\n";
552 $dataByFunc = $this->mProfiler->getFunctionStats();
553 uasort( $dataByFunc,
function ( $a, $b ) {
554 return $a[
'real'] < $b[
'real'];
556 $profileReport =
"Transclusion expansion time report (%,ms,calls,template)\n";
557 foreach ( array_slice( $dataByFunc, 0, 10 )
as $item ) {
558 $profileReport .= sprintf(
"%6.2f%% %8.3f %6d - %s\n",
559 $item[
'%real'], $item[
'real'], $item[
'calls'],
560 htmlspecialchars( $item[
'name'] ) );
562 $text .=
"\n<!-- \n$profileReport-->\n";
564 if ( $this->mGeneratedPPNodeCount > $this->mOptions->getMaxGeneratedPPNodeCount() / 10 ) {
565 wfDebugLog(
'generated-pp-node-count', $this->mGeneratedPPNodeCount .
' ' .
566 $this->mTitle->getPrefixedDBkey() );
569 $this->mOutput->setText( $text );
571 $this->mRevisionId = $oldRevisionId;
572 $this->mRevisionObject = $oldRevisionObject;
573 $this->mRevisionTimestamp = $oldRevisionTimestamp;
574 $this->mRevisionUser = $oldRevisionUser;
575 $this->mRevisionSize = $oldRevisionSize;
576 $this->mInputSize =
false;
577 $this->currentRevisionCache = null;
605 Hooks::run(
'ParserBeforeStrip', [ &$this, &$text, &$this->mStripState ] );
606 Hooks::run(
'ParserAfterStrip', [ &$this, &$text, &$this->mStripState ] );
648 $magicScopeVariable = $this->
lock();
650 if ( $revid !== null ) {
651 $this->mRevisionId = $revid;
653 Hooks::run(
'ParserBeforeStrip', [ &$this, &$text, &$this->mStripState ] );
654 Hooks::run(
'ParserAfterStrip', [ &$this, &$text, &$this->mStripState ] );
656 $text = $this->mStripState->unstripBoth( $text );
671 $text = $this->mStripState->unstripBoth( $text );
690 $text = $msg->params(
$params )->plain();
692 # Parser (re)initialisation
693 $magicScopeVariable = $this->
lock();
699 $text = $this->mStripState->unstripBoth( $text );
721 $this->mUser =
$user;
732 return self::MARKER_PREFIX;
745 if (
$t->hasFragment() ) {
746 # Strip the fragment to avoid various odd effects
747 $this->mTitle =
$t->createFragmentTarget(
'' );
768 public function Title( $x = null ) {
769 return wfSetVar( $this->mTitle, $x );
778 $this->mOutputType =
$ot;
795 return wfSetVar( $this->mOutputType, $x );
823 return wfSetVar( $this->mOptions, $x );
830 return $this->mLinkID++;
837 $this->mLinkID = $id;
858 $target = $this->mOptions->getTargetLanguage();
860 if ( $target !== null ) {
862 } elseif ( $this->mOptions->getInterfaceMessage() ) {
863 return $this->mOptions->getUserLangObj();
864 } elseif ( is_null( $this->mTitle ) ) {
865 throw new MWException( __METHOD__ .
': $this->mTitle is null' );
868 return $this->mTitle->getPageLanguage();
886 if ( !is_null( $this->mUser ) ) {
889 return $this->mOptions->getUser();
898 if ( !isset( $this->mPreprocessor ) ) {
899 $class = $this->mPreprocessorClass;
900 $this->mPreprocessor =
new $class( $this );
927 if ( $uniq_prefix !== null ) {
928 wfDeprecated( __METHOD__ .
' called with $prefix argument',
'1.26' );
934 $taglist = implode(
'|', $elements );
935 $start =
"/<($taglist)(\\s+[^>]*?|\\s*?)(\/?" .
">)|<(!--)/i";
937 while ( $text !=
'' ) {
938 $p = preg_split( $start, $text, 2, PREG_SPLIT_DELIM_CAPTURE );
940 if ( count( $p ) < 5 ) {
943 if ( count( $p ) > 5 ) {
957 $marker = self::MARKER_PREFIX .
"-$element-" . sprintf(
'%08X', $n++ ) . self::MARKER_SUFFIX;
958 $stripped .= $marker;
960 if ( $close ===
'/>' ) {
961 # Empty element tag, <tag />
966 if ( $element ===
'!--' ) {
969 $end =
"/(<\\/$element\\s*>)/i";
971 $q = preg_split( $end, $inside, 2, PREG_SPLIT_DELIM_CAPTURE );
973 if ( count( $q ) < 3 ) {
974 # No end tag -- let it run out to the end of the text.
986 "<$element$attributes$close$content$tail" ];
1010 $marker = self::MARKER_PREFIX .
"-item-{$this->mMarkerIndex}-" . self::MARKER_SUFFIX;
1011 $this->mMarkerIndex++;
1012 $this->mStripState->addGeneral( $marker, $text );
1027 $td_history = []; # Is currently a td tag
open?
1028 $last_tag_history = []; # Save
history of last tag activated (td, th
or caption)
1029 $tr_history = []; # Is currently a tr tag
open?
1031 $has_opened_tr = []; # Did
this table open a <tr> element?
1032 $indent_level = 0; # indent level
of the table
1035 $line = trim( $outLine );
1037 if (
$line ===
'' ) { # empty
line, go to next line
1038 $out .= $outLine .
"\n";
1042 $first_character =
$line[0];
1043 $first_two = substr(
$line, 0, 2 );
1046 if ( preg_match(
'/^(:*)\s*\{\|(.*)$/',
$line,
$matches ) ) {
1047 # First check if we are starting a new table
1048 $indent_level = strlen(
$matches[1] );
1050 $attributes = $this->mStripState->unstripBoth(
$matches[2] );
1053 $outLine = str_repeat(
'<dl><dd>', $indent_level ) .
"<table{$attributes}>";
1054 array_push( $td_history,
false );
1055 array_push( $last_tag_history,
'' );
1056 array_push( $tr_history,
false );
1057 array_push( $tr_attributes,
'' );
1058 array_push( $has_opened_tr,
false );
1059 } elseif ( count( $td_history ) == 0 ) {
1060 # Don't do any of the following
1061 $out .= $outLine .
"\n";
1063 } elseif ( $first_two ===
'|}' ) {
1064 # We are ending a table
1066 $last_tag = array_pop( $last_tag_history );
1068 if ( !array_pop( $has_opened_tr ) ) {
1069 $line =
"<tr><td></td></tr>{$line}";
1072 if ( array_pop( $tr_history ) ) {
1073 $line =
"</tr>{$line}";
1076 if ( array_pop( $td_history ) ) {
1077 $line =
"</{$last_tag}>{$line}";
1079 array_pop( $tr_attributes );
1080 $outLine =
$line . str_repeat(
'</dd></dl>', $indent_level );
1081 } elseif ( $first_two ===
'|-' ) {
1082 # Now we have a table row
1083 $line = preg_replace(
'#^\|-+#',
'',
$line );
1085 # What's after the tag is now only attributes
1086 $attributes = $this->mStripState->unstripBoth(
$line );
1088 array_pop( $tr_attributes );
1089 array_push( $tr_attributes, $attributes );
1092 $last_tag = array_pop( $last_tag_history );
1093 array_pop( $has_opened_tr );
1094 array_push( $has_opened_tr,
true );
1096 if ( array_pop( $tr_history ) ) {
1100 if ( array_pop( $td_history ) ) {
1101 $line =
"</{$last_tag}>{$line}";
1105 array_push( $tr_history,
false );
1106 array_push( $td_history,
false );
1107 array_push( $last_tag_history,
'' );
1108 } elseif ( $first_character ===
'|'
1109 || $first_character ===
'!'
1110 || $first_two ===
'|+'
1112 # This might be cell elements, td, th or captions
1113 if ( $first_two ===
'|+' ) {
1114 $first_character =
'+';
1121 if ( $first_character ===
'!' ) {
1125 # Split up multiple cells on the same line.
1126 # FIXME : This can result in improper nesting of tags processed
1127 # by earlier parser steps.
1128 $cells = explode(
'||',
$line );
1132 # Loop through each table cell
1133 foreach ( $cells
as $cell ) {
1135 if ( $first_character !==
'+' ) {
1136 $tr_after = array_pop( $tr_attributes );
1137 if ( !array_pop( $tr_history ) ) {
1138 $previous =
"<tr{$tr_after}>\n";
1140 array_push( $tr_history,
true );
1141 array_push( $tr_attributes,
'' );
1142 array_pop( $has_opened_tr );
1143 array_push( $has_opened_tr,
true );
1146 $last_tag = array_pop( $last_tag_history );
1148 if ( array_pop( $td_history ) ) {
1149 $previous =
"</{$last_tag}>\n{$previous}";
1152 if ( $first_character ===
'|' ) {
1154 } elseif ( $first_character ===
'!' ) {
1156 } elseif ( $first_character ===
'+' ) {
1157 $last_tag =
'caption';
1162 array_push( $last_tag_history, $last_tag );
1164 # A cell could contain both parameters and data
1165 $cell_data = explode(
'|', $cell, 2 );
1167 # Bug 553: Note that a '|' inside an invalid link should not
1168 # be mistaken as delimiting cell parameters
1169 if ( strpos( $cell_data[0],
'[[' ) !==
false ) {
1170 $cell =
"{$previous}<{$last_tag}>{$cell}";
1171 } elseif ( count( $cell_data ) == 1 ) {
1172 $cell =
"{$previous}<{$last_tag}>{$cell_data[0]}";
1174 $attributes = $this->mStripState->unstripBoth( $cell_data[0] );
1176 $cell =
"{$previous}<{$last_tag}{$attributes}>{$cell_data[1]}";
1180 array_push( $td_history,
true );
1183 $out .= $outLine .
"\n";
1186 # Closing open td, tr && table
1187 while ( count( $td_history ) > 0 ) {
1188 if ( array_pop( $td_history ) ) {
1191 if ( array_pop( $tr_history ) ) {
1194 if ( !array_pop( $has_opened_tr ) ) {
1195 $out .=
"<tr><td></td></tr>\n";
1198 $out .=
"</table>\n";
1201 # Remove trailing line-ending (b/c)
1202 if ( substr(
$out, -1 ) ===
"\n" ) {
1206 # special case: don't return empty table
1207 if (
$out ===
"<table>\n<tr><td></td></tr>\n</table>" ) {
1230 # Hook to suspend the parser in this state
1231 if ( !
Hooks::run(
'ParserBeforeInternalParse', [ &$this, &$text, &$this->mStripState ] ) ) {
1235 # if $frame is provided, then use $frame for replacing any variables
1237 # use frame depth to infer how include/noinclude tags should be handled
1238 # depth=0 means this is the top-level document; otherwise it's an included document
1239 if ( !$frame->depth ) {
1245 $text = $frame->expand( $dom );
1247 # if $frame is not provided, then use old-style replaceVariables
1251 Hooks::run(
'InternalParseBeforeSanitize', [ &$this, &$text, &$this->mStripState ] );
1254 [ &$this,
'attributeStripCallback' ],
1256 array_keys( $this->mTransparentTagHooks )
1258 Hooks::run(
'InternalParseBeforeLinks', [ &$this, &$text, &$this->mStripState ] );
1260 # Tables need to come after variable replacement for things to work
1261 # properly; putting them before other transformations should keep
1262 # exciting things like link expansions from showing up in surprising
1266 $text = preg_replace(
'/(^|\n)-----*/',
'\\1<hr />', $text );
1275 # replaceInternalLinks may sometimes leave behind
1276 # absolute URLs, which have to be masked to hide them from replaceExternalLinks
1277 $text = str_replace( self::MARKER_PREFIX .
'NOPARSE',
'', $text );
1295 $text = $this->mStripState->unstripGeneral( $text );
1298 Hooks::run(
'ParserAfterUnstrip', [ &$this, &$text ] );
1301 # Clean up special characters, only run once, next-to-last before doBlockLevels
1303 # french spaces, last one Guillemet-left
1304 # only if there is something before the space
1305 '/(.) (?=\\?|:|;|!|%|\\302\\273)/' =>
'\\1 ',
1306 # french spaces, Guillemet-right
1307 '/(\\302\\253) /' =>
'\\1 ',
1308 '/ (!\s*important)/' =>
' \\1', # Beware
of CSS magic word !important, bug #11874.
1310 $text = preg_replace( array_keys( $fixtags ), array_values( $fixtags ), $text );
1323 if ( !( $this->mOptions->getDisableContentConversion()
1324 || isset( $this->mDoubleUnderscores[
'nocontentconvert'] ) )
1326 if ( !$this->mOptions->getInterfaceMessage() ) {
1327 # The position of the convert() call should not be changed. it
1328 # assumes that the links are all replaced and the only thing left
1329 # is the <nowiki> mark.
1334 $text = $this->mStripState->unstripNoWiki( $text );
1337 Hooks::run(
'ParserBeforeTidy', [ &$this, &$text ] );
1341 $text = $this->mStripState->unstripGeneral( $text );
1349 # attempt to sanitize at least some nesting problems
1350 # (bug #2702 and quite a few others)
1352 # ''Something [http://www.cool.com cool''] -->
1353 # <i>Something</i><a href="http://www.cool.com"..><i>cool></i></a>
1354 '/(<([bi])>)(<([bi])>)?([^<]*)(<\/?a[^<]*>)([^<]*)(<\/\\4>)?(<\/\\2>)/' =>
1355 '\\1\\3\\5\\8\\9\\6\\1\\3\\7\\8\\9',
1356 # fix up an anchor inside another anchor, only
1357 # at least for a single single nested link (bug 3695)
1358 '/(<a[^>]+>)([^<]*)(<a[^>]+>[^<]*)<\/a>(.*)<\/a>/' =>
1359 '\\1\\2</a>\\3</a>\\1\\4</a>',
1360 # fix div inside inline elements- doBlockLevels won't wrap a line which
1361 # contains a div, so fix it up here; replace
1362 # div with escaped text
1363 '/(<([aib]) [^>]+>)([^<]*)(<div([^>]*)>)(.*)(<\/div>)([^<]*)(<\/\\2>)/' =>
1364 '\\1\\3<div\\5>\\6</div>\\8\\9',
1365 # remove empty italic or bold tag pairs, some
1366 # introduced by rules above
1367 '/<([bi])><\/\\1>/' =>
'',
1370 $text = preg_replace(
1371 array_keys( $tidyregs ),
1372 array_values( $tidyregs ),
1377 Hooks::run(
'ParserAfterTidy', [ &$this, &$text ] );
1396 $urlChar = self::EXT_LINK_URL_CLASS;
1397 $addr = self::EXT_LINK_ADDR;
1398 $space = self::SPACE_NOT_NL; # non-newline space
1399 $spdash =
"(?:-|$space)"; # a dash
or a non-newline space
1400 $spaces =
"$space++"; # possessive match
of 1
or more spaces
1401 $text = preg_replace_callback(
1403 (<a[ \t\r\n>].*?</a>) | # m[1]: Skip link text
1404 (<.*?>) | # m[2]: Skip stuff inside
1405 # HTML elements' .
"
1406 (\b(?i:$prots)($addr$urlChar*)) | # m[3]: Free external links
1407 # m[4]: Post-protocol path
1408 \b(?:RFC|PMID) $spaces # m[5]: RFC or PMID, capture number
1410 \bISBN $spaces ( # m[6]: ISBN, capture number
1411 (?: 97[89] $spdash? )? # optional 13-digit ISBN prefix
1412 (?: [0-9] $spdash? ){9} # 9 digits with opt. delimiters
1413 [0-9Xx] # check digit
1415 )!xu", [ &$this,
'magicLinkCallback' ], $text );
1425 if ( isset( $m[1] ) && $m[1] !==
'' ) {
1428 } elseif ( isset( $m[2] ) && $m[2] !==
'' ) {
1431 } elseif ( isset( $m[3] ) && $m[3] !==
'' ) {
1432 # Free external link
1434 } elseif ( isset( $m[5] ) && $m[5] !==
'' ) {
1436 if ( substr( $m[0], 0, 3 ) ===
'RFC' ) {
1439 $cssClass =
'mw-magiclink-rfc';
1441 } elseif ( substr( $m[0], 0, 4 ) ===
'PMID' ) {
1443 $urlmsg =
'pubmedurl';
1444 $cssClass =
'mw-magiclink-pmid';
1447 throw new MWException( __METHOD__ .
': unrecognised match type "' .
1448 substr( $m[0], 0, 20 ) .
'"' );
1450 $url =
wfMessage( $urlmsg, $id )->inContentLanguage()->text();
1452 } elseif ( isset( $m[6] ) && $m[6] !==
'' ) {
1455 $space = self::SPACE_NOT_NL; # non-newline space
1456 $isbn = preg_replace(
"/$space/",
' ', $isbn );
1457 $num = strtr( $isbn, [
1463 return '<a href="' .
1464 htmlspecialchars( $titleObj->getLocalURL() ) .
1465 "\" class=\"internal mw-magiclink-isbn\">ISBN $isbn</a>";
1483 # The characters '<' and '>' (which were escaped by
1484 # removeHTMLtags()) should not be included in
1485 # URLs, per RFC 2396.
1486 # Make &nbsp; terminate a URL as well (bug T84937)
1489 '/&(lt|gt|nbsp|#x0*(3[CcEe]|[Aa]0)|#0*(60|62|160));/',
1494 $trail = substr( $url, $m2[0][1] ) . $trail;
1495 $url = substr( $url, 0, $m2[0][1] );
1498 # Move trailing punctuation to $trail
1500 # If there is no left bracket, then consider right brackets fair game too
1501 if ( strpos( $url,
'(' ) ===
false ) {
1505 $urlRev = strrev( $url );
1506 $numSepChars = strspn( $urlRev, $sep );
1507 # Don't break a trailing HTML entity by moving the ; into $trail
1508 # This is in hot code, so use substr_compare to avoid having to
1509 # create a new string object for the comparison
1510 if ( $numSepChars && substr_compare( $url,
";", -$numSepChars, 1 ) === 0 ) {
1511 # more optimization: instead of running preg_match with a $
1512 # anchor, which can be slow, do the match on the reversed
1513 # string starting at the desired offset.
1514 # un-reversed regexp is: /&([a-z]+|#x[\da-f]+|#\d+)$/i
1515 if ( preg_match(
'/\G([a-z]+|[\da-f]+x#|\d+#)&/i', $urlRev, $m2, 0, $numSepChars ) ) {
1519 if ( $numSepChars ) {
1520 $trail = substr( $url, -$numSepChars ) . $trail;
1521 $url = substr( $url, 0, -$numSepChars );
1524 # Verify that we still have a real URL after trail removal, and
1525 # not just lone protocol
1526 if ( strlen( $trail ) >= $numPostProto ) {
1527 return $url . $trail;
1532 # Is this an external image?
1534 if ( $text ===
false ) {
1535 # Not an image, make a link
1540 # Register it in the output object...
1541 $this->mOutput->addExternalLink( $url );
1543 return $text . $trail;
1556 for ( $i = 6; $i >= 1; --$i ) {
1557 $h = str_repeat(
'=', $i );
1558 $text = preg_replace(
"/^$h(.+)$h\\s*$/m",
"<h$i>\\1</h$i>", $text );
1575 $outtext .= $this->
doQuotes( $line ) .
"\n";
1577 $outtext = substr( $outtext, 0, -1 );
1589 $arr = preg_split(
"/(''+)/", $text, -1, PREG_SPLIT_DELIM_CAPTURE );
1590 $countarr = count( $arr );
1591 if ( $countarr == 1 ) {
1600 for ( $i = 1; $i < $countarr; $i += 2 ) {
1601 $thislen = strlen( $arr[$i] );
1605 if ( $thislen == 4 ) {
1606 $arr[$i - 1] .=
"'";
1609 } elseif ( $thislen > 5 ) {
1613 $arr[$i - 1] .= str_repeat(
"'", $thislen - 5 );
1618 if ( $thislen == 2 ) {
1620 } elseif ( $thislen == 3 ) {
1622 } elseif ( $thislen == 5 ) {
1632 if ( ( $numbold % 2 == 1 ) && ( $numitalics % 2 == 1 ) ) {
1633 $firstsingleletterword = -1;
1634 $firstmultiletterword = -1;
1636 for ( $i = 1; $i < $countarr; $i += 2 ) {
1637 if ( strlen( $arr[$i] ) == 3 ) {
1638 $x1 = substr( $arr[$i - 1], -1 );
1639 $x2 = substr( $arr[$i - 1], -2, 1 );
1640 if ( $x1 ===
' ' ) {
1641 if ( $firstspace == -1 ) {
1644 } elseif ( $x2 ===
' ' ) {
1645 $firstsingleletterword = $i;
1650 if ( $firstmultiletterword == -1 ) {
1651 $firstmultiletterword = $i;
1658 if ( $firstsingleletterword > -1 ) {
1659 $arr[$firstsingleletterword] =
"''";
1660 $arr[$firstsingleletterword - 1] .=
"'";
1661 } elseif ( $firstmultiletterword > -1 ) {
1663 $arr[$firstmultiletterword] =
"''";
1664 $arr[$firstmultiletterword - 1] .=
"'";
1665 } elseif ( $firstspace > -1 ) {
1669 $arr[$firstspace] =
"''";
1670 $arr[$firstspace - 1] .=
"'";
1679 foreach ( $arr
as $r ) {
1680 if ( ( $i % 2 ) == 0 ) {
1681 if ( $state ===
'both' ) {
1687 $thislen = strlen( $r );
1688 if ( $thislen == 2 ) {
1689 if ( $state ===
'i' ) {
1692 } elseif ( $state ===
'bi' ) {
1695 } elseif ( $state ===
'ib' ) {
1698 } elseif ( $state ===
'both' ) {
1705 } elseif ( $thislen == 3 ) {
1706 if ( $state ===
'b' ) {
1709 } elseif ( $state ===
'bi' ) {
1712 } elseif ( $state ===
'ib' ) {
1715 } elseif ( $state ===
'both' ) {
1722 } elseif ( $thislen == 5 ) {
1723 if ( $state ===
'b' ) {
1726 } elseif ( $state ===
'i' ) {
1729 } elseif ( $state ===
'bi' ) {
1732 } elseif ( $state ===
'ib' ) {
1735 } elseif ( $state ===
'both' ) {
1747 if ( $state ===
'b' || $state ===
'ib' ) {
1750 if ( $state ===
'i' || $state ===
'bi' || $state ===
'ib' ) {
1753 if ( $state ===
'bi' ) {
1757 if ( $state ===
'both' &&
$buffer ) {
1778 $bits = preg_split( $this->mExtLinkBracketedRegex, $text, -1, PREG_SPLIT_DELIM_CAPTURE );
1779 if ( $bits ===
false ) {
1780 throw new MWException(
"PCRE needs to be compiled with "
1781 .
"--enable-unicode-properties in order for MediaWiki to function" );
1783 $s = array_shift( $bits );
1786 while ( $i < count( $bits ) ) {
1789 $text = $bits[$i++];
1790 $trail = $bits[$i++];
1792 # The characters '<' and '>' (which were escaped by
1793 # removeHTMLtags()) should not be included in
1794 # URLs, per RFC 2396.
1796 if ( preg_match(
'/&(lt|gt);/', $url, $m2, PREG_OFFSET_CAPTURE ) ) {
1797 $text = substr( $url, $m2[0][1] ) .
' ' . $text;
1798 $url = substr( $url, 0, $m2[0][1] );
1801 # If the link text is an image URL, replace it with an <img> tag
1802 # This happened by accident in the original parser, but some people used it extensively
1804 if ( $img !==
false ) {
1810 # Set linktype for CSS - if URL==text, link is essentially free
1811 $linktype = ( $text === $url ) ?
'free' :
'text';
1813 # No link text, e.g. [http://domain.tld/some.link]
1814 if ( $text ==
'' ) {
1817 $text =
'[' . $langObj->formatNum( ++$this->mAutonumber ) .
']';
1818 $linktype =
'autonumber';
1820 # Have link text, e.g. [http://domain.tld/some.link text]s
1829 # Use the encoded URL
1830 # This means that users can paste URLs directly into the text
1831 # Funny characters like ö aren't valid in URLs anyway
1832 # This was changed in August 2004
1836 # Register link in the output object.
1837 $this->mOutput->addExternalLink( $url );
1853 global $wgNoFollowLinks, $wgNoFollowNsExceptions, $wgNoFollowDomainExceptions;
1855 if ( $wgNoFollowLinks && !in_array( $ns, $wgNoFollowNsExceptions )
1875 $rel = self::getExternalLinkRel( $url, $this->mTitle );
1877 $target = $this->mOptions->getExternalLinkTarget();
1880 if ( !in_array( $target, [
'_self',
'_parent',
'_top' ] ) ) {
1884 if ( $rel !==
'' ) {
1887 $rel .=
'noreferrer noopener';
1903 return self::normalizeLinkUrl( $url );
1916 # First, make sure unsafe characters are encoded
1917 $url = preg_replace_callback(
'/[\x00-\x20"<>\[\\\\\]^`{|}\x7F-\xFF]/',
1919 return rawurlencode( $m[0] );
1925 $end = strlen( $url );
1927 # Fragment part - 'fragment'
1928 $start = strpos( $url,
'#' );
1929 if ( $start !==
false && $start < $end ) {
1930 $ret = self::normalizeUrlComponent(
1931 substr( $url, $start, $end - $start ),
'"#%<>[\]^`{|}' ) .
$ret;
1935 # Query part - 'query' minus &=+;
1936 $start = strpos( $url,
'?' );
1937 if ( $start !==
false && $start < $end ) {
1938 $ret = self::normalizeUrlComponent(
1939 substr( $url, $start, $end - $start ),
'"#%<>[\]^`{|}&=+;' ) .
$ret;
1943 # Scheme and path part - 'pchar'
1944 # (we assume no userinfo or encoded colons in the host)
1945 $ret = self::normalizeUrlComponent(
1946 substr( $url, 0, $end ),
'"#%<>[\]^`{|}/?' ) .
$ret;
1952 $callback =
function (
$matches )
use ( $unsafe ) {
1954 $ord = ord( $char );
1955 if ( $ord > 32 && $ord < 127 && strpos( $unsafe, $char ) ===
false ) {
1959 # Leave it escaped, but use uppercase for a-f
1963 return preg_replace_callback(
'/%[0-9A-Fa-f]{2}/', $callback, $component );
1975 $imagesfrom = $this->mOptions->getAllowExternalImagesFrom();
1976 $imagesexception = !empty( $imagesfrom );
1978 # $imagesfrom could be either a single string or an array of strings, parse out the latter
1979 if ( $imagesexception && is_array( $imagesfrom ) ) {
1980 $imagematch =
false;
1981 foreach ( $imagesfrom
as $match ) {
1982 if ( strpos( $url, $match ) === 0 ) {
1987 } elseif ( $imagesexception ) {
1988 $imagematch = ( strpos( $url, $imagesfrom ) === 0 );
1990 $imagematch =
false;
1993 if ( $this->mOptions->getAllowExternalImages()
1994 || ( $imagesexception && $imagematch )
1996 if ( preg_match( self::EXT_IMAGE_REGEX, $url ) ) {
2001 if ( !$text && $this->mOptions->getEnableImageWhitelist()
2002 && preg_match( self::EXT_IMAGE_REGEX, $url )
2004 $whitelist = explode(
2006 wfMessage(
'external_image_whitelist' )->inContentLanguage()->
text()
2009 foreach ( $whitelist
as $entry ) {
2010 # Sanitize the regex fragment, make it case-insensitive, ignore blank entries/comments
2011 if ( strpos( $entry,
'#' ) === 0 || $entry ===
'' ) {
2014 if ( preg_match(
'/' . str_replace(
'/',
'\\/', $entry ) .
'/i', $url ) ) {
2015 # Image matches a whitelist entry
2049 static $tc =
false, $e1, $e1_img;
2050 # the % is needed to support urlencoded titles as well
2053 # Match a link having the form [[namespace:link|alternate]]trail
2054 $e1 =
"/^([{$tc}]+)(?:\\|(.+?))?]](.*)\$/sD";
2055 # Match cases where there is no "]]", which might still be images
2056 $e1_img =
"/^([{$tc}]+)\\|(.*)\$/sD";
2061 # split the entire text string on occurrences of [[
2063 # get the first element (all text up to first [[), and remove the space we added
2066 $line = $a->current(); # Workaround
for broken ArrayIterator::next()
that returns
"void"
2067 $s = substr( $s, 1 );
2071 if ( $useLinkPrefixExtension ) {
2072 # Match the end of a line for a word that's not followed by whitespace,
2073 # e.g. in the case of 'The Arab al[[Razi]]', 'al' will be matched
2075 $charset = $wgContLang->linkPrefixCharset();
2076 $e2 =
"/^((?>.*[^$charset]|))(.+)$/sDu";
2079 if ( is_null( $this->mTitle ) ) {
2080 throw new MWException( __METHOD__ .
": \$this->mTitle is null\n" );
2082 $nottalk = !$this->mTitle->isTalkPage();
2084 if ( $useLinkPrefixExtension ) {
2086 if ( preg_match( $e2, $s, $m ) ) {
2087 $first_prefix = $m[2];
2089 $first_prefix =
false;
2098 # Loop for each link
2099 for ( ;
$line !==
false &&
$line !== null; $a->next(),
$line = $a->current() ) {
2102 # Check for excessive memory usage
2103 if ( $holders->isBig() ) {
2105 # Do the existence check, replace the link holders and clear the array
2106 $holders->replace( $s );
2110 if ( $useLinkPrefixExtension ) {
2111 if ( preg_match( $e2, $s, $m ) ) {
2118 if ( $first_prefix ) {
2119 $prefix = $first_prefix;
2120 $first_prefix =
false;
2124 $might_be_img =
false;
2128 # If we get a ] at the beginning of $m[3] that means we have a link that's something like:
2129 # [[Image:Foo.jpg|[http://example.com desc]]] <- having three ] in a row breaks the match;
2130 # the real problem is with the $e1 regex
2132 # Still some problems for cases where the ] is meant to be outside punctuation,
2133 # and no image is in sight. See bug 2095.
2135 && substr( $m[3], 0, 1 ) ===
']'
2136 && strpos( $text,
'[' ) !==
false
2139 $m[3] = substr( $m[3], 1 );
2141 # fix up urlencoded title texts
2142 if ( strpos( $m[1],
'%' ) !==
false ) {
2143 # Should anchors '#' also be rejected?
2144 $m[1] = str_replace( [
'<',
'>' ], [
'<',
'>' ], rawurldecode( $m[1] ) );
2147 } elseif ( preg_match( $e1_img,
$line, $m ) ) {
2148 # Invalid, but might be an image with a link in its caption
2149 $might_be_img =
true;
2151 if ( strpos( $m[1],
'%' ) !==
false ) {
2152 $m[1] = str_replace( [
'<',
'>' ], [
'<',
'>' ], rawurldecode( $m[1] ) );
2156 $s .= $prefix .
'[[' .
$line;
2162 # Don't allow internal links to pages containing
2163 # PROTO: where PROTO is a valid URL protocol; these
2164 # should be external links.
2165 if ( preg_match(
'/^(?i:' . $this->mUrlProtocols .
')/', $origLink ) ) {
2166 $s .= $prefix .
'[[' .
$line;
2170 # Make subpage if necessary
2171 if ( $useSubpages ) {
2177 $noforce = ( substr( $origLink, 0, 1 ) !==
':' );
2179 # Strip off leading ':'
2183 $unstrip = $this->mStripState->unstripNoWiki(
$link );
2185 if ( $nt === null ) {
2186 $s .= $prefix .
'[[' .
$line;
2190 $ns = $nt->getNamespace();
2191 $iw = $nt->getInterwiki();
2193 if ( $might_be_img ) { #
if this is actually an invalid
link
2194 if ( $ns ==
NS_FILE && $noforce ) { # but might be an image
2197 # look at the next 'line' to see if we can close it there
2199 $next_line = $a->current();
2200 if ( $next_line ===
false || $next_line === null ) {
2203 $m = explode(
']]', $next_line, 3 );
2204 if ( count( $m ) == 3 ) {
2205 # the first ]] closes the inner link, the second the image
2207 $text .=
"[[{$m[0]}]]{$m[1]}";
2210 } elseif ( count( $m ) == 2 ) {
2211 # if there's exactly one ]] that's fine, we'll keep looking
2212 $text .=
"[[{$m[0]}]]{$m[1]}";
2214 # if $next_line is invalid too, we need look no further
2215 $text .=
'[[' . $next_line;
2220 # we couldn't find the end of this imageLink, so output it raw
2221 # but don't ignore what might be perfectly normal links in the text we've examined
2223 $s .=
"{$prefix}[[$link|$text";
2224 # note: no $trail, because without an end, there *is* no trail
2227 }
else { #
it's not an image, so output it raw
2228 $s .= "{$prefix}[[$link|$text";
2229 # note: no $trail, because without an end, there *is* no trail
2234 $wasblank = ( $text == '' );
2238 # Bug 4598 madness. Handle the quotes only if they come from the alternate part
2239 # [[Lista d''e paise d''o munno]] -> <a href="...">Lista d''e paise d''o munno</a>
2240 # [[Criticism of Harry Potter|Criticism of ''Harry Potter'']]
2241 # -> <a href="Criticism of Harry Potter">Criticism of <i>Harry Potter</i></a>
2242 $text = $this->doQuotes( $text );
2245 # Link not escaped by : , create the various objects
2246 if ( $noforce && !$nt->wasLocalInterwiki() ) {
2249 $iw && $this->mOptions->getInterwikiMagic() && $nottalk && (
2250 Language::fetchLanguageName( $iw, null, 'mw
' ) ||
2251 in_array( $iw, $wgExtraInterlanguageLinkPrefixes )
2254 # Bug 24502: filter duplicates
2255 if ( !isset( $this->mLangLinkLanguages[$iw] ) ) {
2256 $this->mLangLinkLanguages[$iw] = true;
2257 $this->mOutput->addLanguageLink( $nt->getFullText() );
2260 $s = rtrim( $s . $prefix );
2261 $s .= trim( $trail, "\n" ) == '' ? '': $prefix . $trail;
2265 if ( $ns == NS_FILE ) {
2266 if ( !wfIsBadImage( $nt->getDBkey(), $this->mTitle ) ) {
2268 # if no parameters were passed, $text
2269 # becomes something like "File:Foo.png",
2270 # which we don't want to pass
on to
the
2274 # recursively parse links inside the image caption
2275 # actually, this will parse them in any other parameters, too,
2276 # but it might be hard to fix that, and it doesn't matter ATM
2280 # cloak any absolute URLs inside the image markup, so replaceExternalLinks() won't touch them
2282 $this->
makeImage( $nt, $text, $holders ) ) . $trail;
2284 $s .= $prefix . $trail;
2290 $s = rtrim( $s .
"\n" ); # bug 87
2298 $sortkey = str_replace(
"\n",
'', $sortkey );
2300 $this->mOutput->addCategory( $nt->getDBkey(), $sortkey );
2305 $s .= trim( $prefix . $trail,
"\n" ) ==
'' ?
'' : $prefix . $trail;
2311 # Self-link checking. For some languages, variants of the title are checked in
2312 # LinkHolderArray::doVariants() to allow batching the existence checks necessary
2313 # for linking to a different variant.
2314 if ( $ns !=
NS_SPECIAL && $nt->equals( $this->mTitle ) && !$nt->hasFragment() ) {
2319 # NS_MEDIA is a pseudo-namespace for linking directly to a file
2320 # @todo FIXME: Should do batch file existence checks, see comment below
2322 # Give extensions a chance to select the file revision for us
2326 [ $this, $nt, &
$options, &$descQuery ] );
2327 # Fetch and register the file (file title may be different via hooks)
2329 # Cloak with NOPARSE to avoid replacement in replaceExternalLinks
2335 # Some titles, such as valid special pages or files in foreign repos, should
2336 # be shown as bluelinks even though they're not included in the page table
2337 # @todo FIXME: isAlwaysKnown() can be expensive for file links; we should really do
2338 # batch file existence checks for NS_FILE and NS_MEDIA
2339 if ( $iw ==
'' && $nt->isAlwaysKnown() ) {
2340 $this->mOutput->addLink( $nt );
2343 # Links will be added to the output link list after checking
2344 $s .= $holders->makeHolder( $nt, $text, [], $trail, $prefix );
2367 if ( is_string(
$query ) ) {
2370 if ( $text ==
'' ) {
2371 $text = htmlspecialchars( $nt->getPrefixedText() );
2376 return $this->armorLinks(
$link ) . $trail;
2390 return preg_replace(
'/\b((?i)' . $this->mUrlProtocols .
')/',
2391 self::MARKER_PREFIX .
"NOPARSE$1", $text );
2399 # Some namespaces don't allow subpages
2423 if ( $this->mLastSection !=
'' ) {
2424 $result =
'</' . $this->mLastSection .
">\n";
2426 $this->mInPre =
false;
2427 $this->mLastSection =
'';
2442 $fl = strlen( $st1 );
2443 $shorter = strlen( $st2 );
2444 if ( $fl < $shorter ) {
2448 for ( $i = 0; $i < $shorter; ++$i ) {
2449 if ( $st1[$i] != $st2[$i] ) {
2466 $result = $this->closeParagraph();
2468 if (
'*' === $char ) {
2470 } elseif (
'#' === $char ) {
2472 } elseif (
':' === $char ) {
2474 } elseif (
';' === $char ) {
2476 $this->mDTopen =
true;
2492 if (
'*' === $char ||
'#' === $char ) {
2493 return "</li>\n<li>";
2494 } elseif (
':' === $char ||
';' === $char ) {
2496 if ( $this->mDTopen ) {
2499 if (
';' === $char ) {
2500 $this->mDTopen =
true;
2501 return $close .
'<dt>';
2503 $this->mDTopen =
false;
2504 return $close .
'<dd>';
2507 return '<!-- ERR 2 -->';
2518 if (
'*' === $char ) {
2519 $text =
"</li></ul>";
2520 } elseif (
'#' === $char ) {
2521 $text =
"</li></ol>";
2522 } elseif (
':' === $char ) {
2523 if ( $this->mDTopen ) {
2524 $this->mDTopen =
false;
2525 $text =
"</dt></dl>";
2527 $text =
"</dd></dl>";
2530 return '<!-- ERR 3 -->';
2546 # Parsing through the text line by line. The main thing
2547 # happening here is handling of block-level elements p, pre,
2548 # and making lists from lines starting with * # : etc.
2552 $this->mDTopen = $inBlockElem =
false;
2554 $paragraphStack =
false;
2555 $inBlockquote =
false;
2557 foreach ( $textLines
as $oLine ) {
2559 if ( !$linestart ) {
2569 $lastPrefixLength = strlen( $lastPrefix );
2570 $preCloseMatch = preg_match(
'/<\\/pre/i', $oLine );
2571 $preOpenMatch = preg_match(
'/<pre/i', $oLine );
2572 # If not in a <pre> element, scan for and figure out what prefixes are there.
2573 if ( !$this->mInPre ) {
2574 # Multiple prefixes may abut each other for nested lists.
2575 $prefixLength = strspn( $oLine,
'*#:;' );
2576 $prefix = substr( $oLine, 0, $prefixLength );
2579 # ; and : are both from definition-lists, so they're equivalent
2580 # for the purposes of determining whether or not we need to open/close
2582 $prefix2 = str_replace(
';',
':', $prefix );
2583 $t = substr( $oLine, $prefixLength );
2584 $this->mInPre = (bool)$preOpenMatch;
2586 # Don't interpret any other prefixes in preformatted text
2588 $prefix = $prefix2 =
'';
2593 if ( $prefixLength && $lastPrefix === $prefix2 ) {
2594 # Same as the last item, so no need to deal with nesting or opening stuff
2595 $output .= $this->nextItem( substr( $prefix, -1 ) );
2596 $paragraphStack =
false;
2598 if ( substr( $prefix, -1 ) ===
';' ) {
2599 # The one nasty exception: definition lists work like this:
2600 # ; title : definition text
2601 # So we check for : in the remainder text to split up the
2602 # title and definition, without breaking links.
2604 if ( $this->findColonNoLinks(
$t,
$term, $t2 ) !==
false ) {
2609 } elseif ( $prefixLength || $lastPrefixLength ) {
2610 # We need to open or close prefixes, or both.
2612 # Either open or close a level...
2613 $commonPrefixLength = $this->getCommon( $prefix, $lastPrefix );
2614 $paragraphStack =
false;
2616 # Close all the prefixes which aren't shared.
2617 while ( $commonPrefixLength < $lastPrefixLength ) {
2618 $output .= $this->closeList( $lastPrefix[$lastPrefixLength - 1] );
2619 --$lastPrefixLength;
2622 # Continue the current prefix if appropriate.
2623 if ( $prefixLength <= $commonPrefixLength && $commonPrefixLength > 0 ) {
2624 $output .= $this->nextItem( $prefix[$commonPrefixLength - 1] );
2627 # Open prefixes where appropriate.
2628 if ( $lastPrefix && $prefixLength > $commonPrefixLength ) {
2631 while ( $prefixLength > $commonPrefixLength ) {
2632 $char = substr( $prefix, $commonPrefixLength, 1 );
2633 $output .= $this->openList( $char );
2635 if (
';' === $char ) {
2636 # @todo FIXME: This is dupe of code above
2637 if ( $this->findColonNoLinks(
$t,
$term, $t2 ) !==
false ) {
2642 ++$commonPrefixLength;
2644 if ( !$prefixLength && $lastPrefix ) {
2647 $lastPrefix = $prefix2;
2650 # If we have no prefixes, go to paragraph mode.
2651 if ( 0 == $prefixLength ) {
2652 # No prefix (not in list)--go to paragraph mode
2653 # XXX: use a stack for nestable elements like span, table and div
2654 $openmatch = preg_match(
2655 '/(?:<table|<h1|<h2|<h3|<h4|<h5|<h6|<pre|<tr|'
2656 .
'<p|<ul|<ol|<dl|<li|<\\/tr|<\\/td|<\\/th)/iS',
2659 $closematch = preg_match(
2660 '/(?:<\\/table|<\\/h1|<\\/h2|<\\/h3|<\\/h4|<\\/h5|<\\/h6|'
2661 .
'<td|<th|<\\/?blockquote|<\\/?div|<hr|<\\/pre|<\\/p|<\\/mw:|'
2662 . self::MARKER_PREFIX
2663 .
'-pre|<\\/li|<\\/ul|<\\/ol|<\\/dl|<\\/?center)/iS',
2667 if ( $openmatch || $closematch ) {
2668 $paragraphStack =
false;
2669 # @todo bug 5718: paragraph closed
2670 $output .= $this->closeParagraph();
2671 if ( $preOpenMatch && !$preCloseMatch ) {
2672 $this->mInPre =
true;
2675 while ( preg_match(
'/<(\\/?)blockquote[\s>]/i',
$t,
2676 $bqMatch, PREG_OFFSET_CAPTURE, $bqOffset )
2678 $inBlockquote = !$bqMatch[1][0];
2679 $bqOffset = $bqMatch[0][1] + strlen( $bqMatch[0][0] );
2681 $inBlockElem = !$closematch;
2682 } elseif ( !$inBlockElem && !$this->mInPre ) {
2683 if (
' ' == substr(
$t, 0, 1 )
2684 && ( $this->mLastSection ===
'pre' || trim(
$t ) !=
'' )
2688 if ( $this->mLastSection !==
'pre' ) {
2689 $paragraphStack =
false;
2690 $output .= $this->closeParagraph() .
'<pre>';
2691 $this->mLastSection =
'pre';
2693 $t = substr(
$t, 1 );
2696 if ( trim(
$t ) ===
'' ) {
2697 if ( $paragraphStack ) {
2698 $output .= $paragraphStack .
'<br />';
2699 $paragraphStack =
false;
2700 $this->mLastSection =
'p';
2702 if ( $this->mLastSection !==
'p' ) {
2703 $output .= $this->closeParagraph();
2704 $this->mLastSection =
'';
2705 $paragraphStack =
'<p>';
2707 $paragraphStack =
'</p><p>';
2711 if ( $paragraphStack ) {
2713 $paragraphStack =
false;
2714 $this->mLastSection =
'p';
2715 } elseif ( $this->mLastSection !==
'p' ) {
2716 $output .= $this->closeParagraph() .
'<p>';
2717 $this->mLastSection =
'p';
2723 # somewhere above we forget to get out of pre block (bug 785)
2724 if ( $preCloseMatch && $this->mInPre ) {
2725 $this->mInPre =
false;
2727 if ( $paragraphStack ===
false ) {
2729 if ( $prefixLength === 0 ) {
2734 while ( $prefixLength ) {
2735 $output .= $this->closeList( $prefix2[$prefixLength - 1] );
2737 if ( !$prefixLength ) {
2741 if ( $this->mLastSection !=
'' ) {
2742 $output .=
'</' . $this->mLastSection .
'>';
2743 $this->mLastSection =
'';
2761 $pos = strpos( $str,
':' );
2762 if ( $pos ===
false ) {
2767 $lt = strpos( $str,
'<' );
2768 if ( $lt ===
false || $lt > $pos ) {
2769 # Easy; no tag nesting to worry about
2770 $before = substr( $str, 0, $pos );
2771 $after = substr( $str, $pos + 1 );
2775 # Ugly state machine to walk through avoiding tags.
2776 $state = self::COLON_STATE_TEXT;
2778 $len = strlen( $str );
2779 for ( $i = 0; $i < $len; $i++ ) {
2783 # (Using the number is a performance hack for common cases)
2784 case 0: # self::COLON_STATE_TEXT:
2787 # Could be either a <start> tag or an </end> tag
2788 $state = self::COLON_STATE_TAGSTART;
2791 if ( $stack == 0 ) {
2793 $before = substr( $str, 0, $i );
2794 $after = substr( $str, $i + 1 );
2797 # Embedded in a tag; don't break it.
2800 # Skip ahead looking for something interesting
2801 $colon = strpos( $str,
':', $i );
2802 if ( $colon ===
false ) {
2803 # Nothing else interesting
2806 $lt = strpos( $str,
'<', $i );
2807 if ( $stack === 0 ) {
2808 if ( $lt ===
false || $colon < $lt ) {
2810 $before = substr( $str, 0, $colon );
2811 $after = substr( $str, $colon + 1 );
2815 if ( $lt ===
false ) {
2816 # Nothing else interesting to find; abort!
2817 # We're nested, but there are no close tags left. Abort!
2820 # Skip ahead to next tag start
2822 $state = self::COLON_STATE_TAGSTART;
2825 case 1: # self::COLON_STATE_TAG:
2830 $state = self::COLON_STATE_TEXT;
2833 # Slash may be followed by >?
2834 $state = self::COLON_STATE_TAGSLASH;
2840 case 2: # self::COLON_STATE_TAGSTART:
2843 $state = self::COLON_STATE_CLOSETAG;
2846 $state = self::COLON_STATE_COMMENT;
2849 # Illegal early close? This shouldn't happen D:
2850 $state = self::COLON_STATE_TEXT;
2853 $state = self::COLON_STATE_TAG;
2856 case 3: # self::COLON_STATE_CLOSETAG:
2861 wfDebug( __METHOD__ .
": Invalid input; too many close tags\n" );
2864 $state = self::COLON_STATE_TEXT;
2867 case self::COLON_STATE_TAGSLASH:
2869 # Yes, a self-closed tag <blah/>
2870 $state = self::COLON_STATE_TEXT;
2872 # Probably we're jumping the gun, and this is an attribute
2873 $state = self::COLON_STATE_TAG;
2876 case 5: # self::COLON_STATE_COMMENT:
2878 $state = self::COLON_STATE_COMMENTDASH;
2881 case self::COLON_STATE_COMMENTDASH:
2883 $state = self::COLON_STATE_COMMENTDASHDASH;
2885 $state = self::COLON_STATE_COMMENT;
2888 case self::COLON_STATE_COMMENTDASHDASH:
2890 $state = self::COLON_STATE_TEXT;
2892 $state = self::COLON_STATE_COMMENT;
2896 throw new MWException(
"State machine error in " . __METHOD__ );
2900 wfDebug( __METHOD__ .
": Invalid input; not enough close tags (stack $stack, state $state)\n" );
2921 if ( is_null( $this->mTitle ) ) {
2926 throw new MWException( __METHOD__ .
' Should only be '
2927 .
' called while parsing (no title set)' );
2934 if (
Hooks::run(
'ParserGetVariableValueVarCache', [ &$this, &$this->mVarCache ] ) ) {
2935 if ( isset( $this->mVarCache[$index] ) ) {
2936 return $this->mVarCache[$index];
2941 Hooks::run(
'ParserGetVariableValueTs', [ &$this, &$ts ] );
2943 $pageLang = $this->getFunctionLang();
2949 case 'currentmonth':
2952 case 'currentmonth1':
2955 case 'currentmonthname':
2958 case 'currentmonthnamegen':
2961 case 'currentmonthabbrev':
2976 case 'localmonthname':
2979 case 'localmonthnamegen':
2982 case 'localmonthabbrev':
2997 case 'fullpagename':
3000 case 'fullpagenamee':
3006 case 'subpagenamee':
3009 case 'rootpagename':
3012 case 'rootpagenamee':
3016 $this->mTitle->getRootText()
3019 case 'basepagename':
3022 case 'basepagenamee':
3026 $this->mTitle->getBaseText()
3029 case 'talkpagename':
3030 if ( $this->mTitle->canTalk() ) {
3031 $talkPage = $this->mTitle->getTalkPage();
3037 case 'talkpagenamee':
3038 if ( $this->mTitle->canTalk() ) {
3039 $talkPage = $this->mTitle->getTalkPage();
3045 case 'subjectpagename':
3046 $subjPage = $this->mTitle->getSubjectPage();
3049 case 'subjectpagenamee':
3050 $subjPage = $this->mTitle->getSubjectPage();
3054 $pageid = $this->getTitle()->getArticleID();
3055 if ( $pageid == 0 ) {
3056 # 0 means the page doesn't exist in the database,
3057 # which means the user is previewing a new page.
3058 # The vary-revision flag must be set, because the magic word
3059 # will have a different value once the page is saved.
3060 $this->mOutput->setFlag(
'vary-revision' );
3061 wfDebug( __METHOD__ .
": {{PAGEID}} used in a new page, setting vary-revision...\n" );
3063 $value = $pageid ? $pageid : null;
3066 # Let the edit saving system know we should parse the page
3067 # *after* a revision ID has been assigned.
3068 $this->mOutput->setFlag(
'vary-revision' );
3069 wfDebug( __METHOD__ .
": {{REVISIONID}} used, setting vary-revision...\n" );
3070 $value = $this->mRevisionId;
3073 # Let the edit saving system know we should parse the page
3074 # *after* a revision ID has been assigned. This is for null edits.
3075 $this->mOutput->setFlag(
'vary-revision' );
3076 wfDebug( __METHOD__ .
": {{REVISIONDAY}} used, setting vary-revision...\n" );
3077 $value = intval( substr( $this->getRevisionTimestamp(), 6, 2 ) );
3079 case 'revisionday2':
3080 # Let the edit saving system know we should parse the page
3081 # *after* a revision ID has been assigned. This is for null edits.
3082 $this->mOutput->setFlag(
'vary-revision' );
3083 wfDebug( __METHOD__ .
": {{REVISIONDAY2}} used, setting vary-revision...\n" );
3084 $value = substr( $this->getRevisionTimestamp(), 6, 2 );
3086 case 'revisionmonth':
3087 # Let the edit saving system know we should parse the page
3088 # *after* a revision ID has been assigned. This is for null edits.
3089 $this->mOutput->setFlag(
'vary-revision' );
3090 wfDebug( __METHOD__ .
": {{REVISIONMONTH}} used, setting vary-revision...\n" );
3091 $value = substr( $this->getRevisionTimestamp(), 4, 2 );
3093 case 'revisionmonth1':
3094 # Let the edit saving system know we should parse the page
3095 # *after* a revision ID has been assigned. This is for null edits.
3096 $this->mOutput->setFlag(
'vary-revision' );
3097 wfDebug( __METHOD__ .
": {{REVISIONMONTH1}} used, setting vary-revision...\n" );
3098 $value = intval( substr( $this->getRevisionTimestamp(), 4, 2 ) );
3100 case 'revisionyear':
3101 # Let the edit saving system know we should parse the page
3102 # *after* a revision ID has been assigned. This is for null edits.
3103 $this->mOutput->setFlag(
'vary-revision' );
3104 wfDebug( __METHOD__ .
": {{REVISIONYEAR}} used, setting vary-revision...\n" );
3105 $value = substr( $this->getRevisionTimestamp(), 0, 4 );
3107 case 'revisiontimestamp':
3108 # Let the edit saving system know we should parse the page
3109 # *after* a revision ID has been assigned. This is for null edits.
3110 $this->mOutput->setFlag(
'vary-revision' );
3111 wfDebug( __METHOD__ .
": {{REVISIONTIMESTAMP}} used, setting vary-revision...\n" );
3112 $value = $this->getRevisionTimestamp();
3114 case 'revisionuser':
3115 # Let the edit saving system know we should parse the page
3116 # *after* a revision ID has been assigned. This is for null edits.
3117 $this->mOutput->setFlag(
'vary-revision' );
3118 wfDebug( __METHOD__ .
": {{REVISIONUSER}} used, setting vary-revision...\n" );
3119 $value = $this->getRevisionUser();
3121 case 'revisionsize':
3122 # Let the edit saving system know we should parse the page
3123 # *after* a revision ID has been assigned. This is for null edits.
3124 $this->mOutput->setFlag(
'vary-revision' );
3125 wfDebug( __METHOD__ .
": {{REVISIONSIZE}} used, setting vary-revision...\n" );
3126 $value = $this->getRevisionSize();
3129 $value = str_replace(
'_',
' ', $wgContLang->getNsText( $this->mTitle->getNamespace() ) );
3132 $value =
wfUrlencode( $wgContLang->getNsText( $this->mTitle->getNamespace() ) );
3134 case 'namespacenumber':
3135 $value = $this->mTitle->getNamespace();
3138 $value = $this->mTitle->canTalk()
3139 ? str_replace(
'_',
' ', $this->mTitle->getTalkNsText() )
3143 $value = $this->mTitle->canTalk() ?
wfUrlencode( $this->mTitle->getTalkNsText() ) :
'';
3145 case 'subjectspace':
3146 $value = str_replace(
'_',
' ', $this->mTitle->getSubjectNsText() );
3148 case 'subjectspacee':
3151 case 'currentdayname':
3164 # @bug 4594 PHP5 has it zero padded, PHP4 does not, cast to
3165 # int to remove the padding
3171 case 'localdayname':
3172 $value = $pageLang->getWeekdayName(
3180 $value = $pageLang->time(
3190 # @bug 4594 PHP5 has it zero padded, PHP4 does not, cast to
3191 # int to remove the padding
3197 case 'numberofarticles':
3200 case 'numberoffiles':
3203 case 'numberofusers':
3206 case 'numberofactiveusers':
3209 case 'numberofpages':
3212 case 'numberofadmins':
3215 case 'numberofedits':
3218 case 'currenttimestamp':
3221 case 'localtimestamp':
3224 case 'currentversion':
3239 case 'directionmark':
3240 return $pageLang->getDirMark();
3241 case 'contentlanguage':
3244 case 'cascadingsources':
3250 'ParserGetVariableValueSwitch',
3251 [ &$this, &$this->mVarCache, &$index, &
$ret, &$frame ]
3258 $this->mVarCache[$index] =
$value;
3300 $dom = $this->getPreprocessor()->preprocessToObj( $text,
$flags );
3312 $ltrimmed = ltrim(
$s );
3313 $w1 = substr(
$s, 0, strlen(
$s ) - strlen( $ltrimmed ) );
3314 $trimmed = rtrim( $ltrimmed );
3315 $diff = strlen( $ltrimmed ) - strlen( $trimmed );
3317 $w2 = substr( $ltrimmed, -$diff );
3321 return [ $w1, $trimmed, $w2 ];
3345 # Is there any text? Also, Prevent too big inclusions!
3346 $textSize = strlen( $text );
3347 if ( $textSize < 1 || $textSize > $this->mOptions->getMaxIncludeSize() ) {
3351 if ( $frame ===
false ) {
3352 $frame = $this->getPreprocessor()->newFrame();
3353 } elseif ( !( $frame instanceof
PPFrame ) ) {
3354 wfDebug( __METHOD__ .
" called using plain parameters instead of "
3355 .
"a PPFrame instance. Creating custom frame.\n" );
3356 $frame = $this->getPreprocessor()->newCustomFrame( $frame );
3359 $dom = $this->preprocessToDom( $text );
3361 $text = $frame->expand( $dom,
$flags );
3377 $eqpos = strpos( $arg,
'=' );
3378 if ( $eqpos ===
false ) {
3379 $assocArgs[$index++] = $arg;
3381 $name = trim( substr( $arg, 0, $eqpos ) );
3382 $value = trim( substr( $arg, $eqpos + 1 ) );
3383 if (
$value ===
false ) {
3386 if (
$name !==
false ) {
3422 # does no harm if $current and $max are present but are unnecessary for the message
3423 # Not doing ->inLanguage( $this->mOptions->getUserLangObj() ), since this is shown
3424 # only during preview, and that would split the parser cache unnecessarily.
3425 $warning =
wfMessage(
"$limitationType-warning" )->numParams( $current, $max )
3427 $this->mOutput->addWarning( $warning );
3428 $this->addTrackingCategory(
"$limitationType-category" );
3454 $forceRawInterwiki =
false;
3456 $isChildObj =
false;
3458 $isLocalObj =
false;
3460 # Title object, where $text came from
3463 # $part1 is the bit before the first |, and must contain only title characters.
3464 # Various prefixes will be stripped from it later.
3465 $titleWithSpaces = $frame->expand( $piece[
'title'] );
3466 $part1 = trim( $titleWithSpaces );
3469 # Original title text preserved for various purposes
3470 $originalTitle = $part1;
3472 # $args is a list of argument nodes, starting from index 0, not including $part1
3473 # @todo FIXME: If piece['parts'] is null then the call to getLength()
3474 # below won't work b/c this $args isn't an object
3475 $args = ( null == $piece[
'parts'] ) ? [] : $piece[
'parts'];
3477 $profileSection = null;
3481 $substMatch = $this->mSubstWords->matchStartAndRemove( $part1 );
3483 # Possibilities for substMatch: "subst", "safesubst" or FALSE
3484 # Decide whether to expand template or keep wikitext as-is.
3485 if ( $this->ot[
'wiki'] ) {
3486 if ( $substMatch ===
false ) {
3487 $literal =
true; # literal when
in PST with no prefix
3489 $literal =
false; # expand when
in PST with subst:
or safesubst:
3492 if ( $substMatch ==
'subst' ) {
3493 $literal =
true; # literal when not
in PST with plain subst:
3495 $literal =
false; # expand when not
in PST with safesubst:
or no prefix
3499 $text = $frame->virtualBracketedImplode(
'{{',
'|',
'}}', $titleWithSpaces,
$args );
3506 if ( !$found &&
$args->getLength() == 0 ) {
3507 $id = $this->mVariables->matchStartToEnd( $part1 );
3508 if ( $id !==
false ) {
3509 $text = $this->getVariableValue( $id, $frame );
3517 # MSG, MSGNW and RAW
3521 if ( $mwMsgnw->matchStartAndRemove( $part1 ) ) {
3524 # Remove obsolete MSG:
3526 $mwMsg->matchStartAndRemove( $part1 );
3531 if ( $mwRaw->matchStartAndRemove( $part1 ) ) {
3532 $forceRawInterwiki =
true;
3538 $colonPos = strpos( $part1,
':' );
3539 if ( $colonPos !==
false ) {
3540 $func = substr( $part1, 0, $colonPos );
3541 $funcArgs = [ trim( substr( $part1, $colonPos + 1 ) ) ];
3542 $argsLength =
$args->getLength();
3543 for ( $i = 0; $i < $argsLength; $i++ ) {
3544 $funcArgs[] =
$args->item( $i );
3547 $result = $this->callParserFunction( $frame, $func, $funcArgs );
3552 # The interface for parser functions allows for extracting
3553 # flags into the local scope. Extract any forwarded flags
3559 # Finish mangling title and then check for loops.
3560 # Set $title to a Title object and $titleText to the PDBK
3563 # Split the title into page and subpage
3565 $relative = $this->maybeDoSubpageLink( $part1, $subpage );
3566 if ( $part1 !== $relative ) {
3568 $ns = $this->mTitle->getNamespace();
3572 $titleText =
$title->getPrefixedText();
3573 # Check for language variants if the template is not found
3574 if ( $this->getConverterLanguage()->hasVariants() &&
$title->getArticleID() == 0 ) {
3575 $this->getConverterLanguage()->findVariantLink( $part1,
$title,
true );
3577 # Do recursion depth check
3578 $limit = $this->mOptions->getMaxTemplateDepth();
3579 if ( $frame->depth >=
$limit ) {
3581 $text =
'<span class="error">'
3582 .
wfMessage(
'parser-template-recursion-depth-warning' )
3583 ->numParams(
$limit )->inContentLanguage()->text()
3589 # Load from database
3590 if ( !$found &&
$title ) {
3591 $profileSection = $this->mProfiler->scopedProfileIn(
$title->getPrefixedDBkey() );
3592 if ( !
$title->isExternal() ) {
3593 if (
$title->isSpecialPage()
3594 && $this->mOptions->getAllowSpecialInclusion()
3595 && $this->ot[
'html']
3601 $argsLength =
$args->getLength();
3602 for ( $i = 0; $i < $argsLength; $i++ ) {
3603 $bits =
$args->item( $i )->splitArg();
3604 if ( strval( $bits[
'index'] ) ===
'' ) {
3606 $value = trim( $frame->expand( $bits[
'value'] ) );
3615 $context->setUser( $this->getUser() );
3616 $context->setLanguage( $this->mOptions->getUserLangObj() );
3619 $text =
$context->getOutput()->getHTML();
3620 $this->mOutput->addOutputPageMetadata(
$context->getOutput() );
3623 $this->disableCache();
3626 $found =
false; # access denied
3627 wfDebug( __METHOD__ .
": template inclusion denied for " .
3628 $title->getPrefixedDBkey() .
"\n" );
3631 if ( $text !==
false ) {
3637 # If the title is valid but undisplayable, make a link to it
3638 if ( !$found && ( $this->ot[
'html'] || $this->ot[
'pre'] ) ) {
3639 $text =
"[[:$titleText]]";
3642 } elseif (
$title->isTrans() ) {
3643 # Interwiki transclusion
3644 if ( $this->ot[
'html'] && !$forceRawInterwiki ) {
3645 $text = $this->interwikiTransclude(
$title,
'render' );
3648 $text = $this->interwikiTransclude(
$title,
'raw' );
3649 # Preprocess it like a template
3650 $text = $this->preprocessToDom( $text, self::PTD_FOR_INCLUSION );
3656 # Do infinite loop check
3657 # This has to be done after redirect resolution to avoid infinite loops via redirects
3658 if ( !$frame->loopCheck(
$title ) ) {
3660 $text =
'<span class="error">'
3661 .
wfMessage(
'parser-template-loop-warning', $titleText )->inContentLanguage()->text()
3663 wfDebug( __METHOD__ .
": template loop broken at '$titleText'\n" );
3667 # If we haven't found text to substitute by now, we're done
3668 # Recover the source wikitext and return it
3670 $text = $frame->virtualBracketedImplode(
'{{',
'|',
'}}', $titleWithSpaces,
$args );
3671 if ( $profileSection ) {
3672 $this->mProfiler->scopedProfileOut( $profileSection );
3674 return [
'object' => $text ];
3677 # Expand DOM-style return values in a child frame
3678 if ( $isChildObj ) {
3679 # Clean up argument array
3684 } elseif ( $titleText !==
false && $newFrame->isEmpty() ) {
3685 # Expansion is eligible for the empty-frame cache
3686 $text = $newFrame->cachedExpand( $titleText, $text );
3688 # Uncached expansion
3689 $text = $newFrame->expand( $text );
3692 if ( $isLocalObj && $nowiki ) {
3694 $isLocalObj =
false;
3697 if ( $profileSection ) {
3698 $this->mProfiler->scopedProfileOut( $profileSection );
3701 # Replace raw HTML by a placeholder
3703 $text = $this->insertStripItem( $text );
3704 } elseif ( $nowiki && ( $this->ot[
'html'] || $this->ot[
'pre'] ) ) {
3705 # Escape nowiki-style return values
3707 } elseif ( is_string( $text )
3708 && !$piece[
'lineStart']
3709 && preg_match(
'/^(?:{\\||:|;|#|\*)/', $text )
3711 # Bug 529: if the template begins with a table or block-level
3712 # element, it should be treated as beginning a new line.
3713 # This behavior is somewhat controversial.
3714 $text =
"\n" . $text;
3717 if ( is_string( $text ) && !$this->incrementIncludeSize(
'post-expand', strlen( $text ) ) ) {
3718 # Error, oversize inclusion
3719 if ( $titleText !==
false ) {
3720 # Make a working, properly escaped link if possible (bug 23588)
3721 $text =
"[[:$titleText]]";
3723 # This will probably not be a working link, but at least it may
3724 # provide some hint of where the problem is
3725 preg_replace(
'/^:/',
'', $originalTitle );
3726 $text =
"[[:$originalTitle]]";
3728 $text .= $this->insertStripItem(
'<!-- WARNING: template omitted, '
3729 .
'post-expand include size too large -->' );
3730 $this->limitationWarn(
'post-expand-template-inclusion' );
3733 if ( $isLocalObj ) {
3734 $ret = [
'object' => $text ];
3736 $ret = [
'text' => $text ];
3764 # Case sensitive functions
3765 if ( isset( $this->mFunctionSynonyms[1][$function] ) ) {
3766 $function = $this->mFunctionSynonyms[1][$function];
3768 # Case insensitive functions
3769 $function = $wgContLang->lc( $function );
3770 if ( isset( $this->mFunctionSynonyms[0][$function] ) ) {
3771 $function = $this->mFunctionSynonyms[0][$function];
3773 return [
'found' =>
false ];
3777 list( $callback,
$flags ) = $this->mFunctionHooks[$function];
3779 # Workaround for PHP bug 35229 and similar
3780 if ( !is_callable( $callback ) ) {
3781 throw new MWException(
"Tag hook for $function is not callable\n" );
3784 $allArgs = [ &$this ];
3786 # Convert arguments to PPNodes and collect for appending to $allArgs
3788 foreach (
$args as $k => $v ) {
3789 if ( $v instanceof
PPNode || $k === 0 ) {
3792 $funcArgs[] = $this->mPreprocessor->newPartNodeArray( [ $k => $v ] )->item( 0 );
3796 # Add a frame parameter, and pass the arguments as an array
3797 $allArgs[] = $frame;
3798 $allArgs[] = $funcArgs;
3800 # Convert arguments to plain text and append to $allArgs
3801 foreach (
$args as $k => $v ) {
3802 if ( $v instanceof
PPNode ) {
3803 $allArgs[] = trim( $frame->expand( $v ) );
3804 } elseif ( is_int( $k ) && $k >= 0 ) {
3805 $allArgs[] = trim( $v );
3807 $allArgs[] = trim(
"$k=$v" );
3812 $result = call_user_func_array( $callback, $allArgs );
3814 # The interface for function hooks allows them to return a wikitext
3815 # string or an array containing the string and any flags. This munges
3816 # things around to match what this method should return.
3833 $preprocessFlags = 0;
3834 if ( isset(
$result[
'noparse'] ) ) {
3835 $noparse =
$result[
'noparse'];
3837 if ( isset(
$result[
'preprocessFlags'] ) ) {
3838 $preprocessFlags =
$result[
'preprocessFlags'];
3842 $result[
'text'] = $this->preprocessToDom(
$result[
'text'], $preprocessFlags );
3859 $titleText =
$title->getPrefixedDBkey();
3861 if ( isset( $this->mTplRedirCache[$titleText] ) ) {
3862 list( $ns, $dbk ) = $this->mTplRedirCache[$titleText];
3864 $titleText =
$title->getPrefixedDBkey();
3866 if ( isset( $this->mTplDomCache[$titleText] ) ) {
3867 return [ $this->mTplDomCache[$titleText],
$title ];
3870 # Cache miss, go to the database
3873 if ( $text ===
false ) {
3874 $this->mTplDomCache[$titleText] =
false;
3875 return [
false,
$title ];
3878 $dom = $this->preprocessToDom( $text, self::PTD_FOR_INCLUSION );
3879 $this->mTplDomCache[$titleText] = $dom;
3881 if ( !
$title->equals( $cacheTitle ) ) {
3882 $this->mTplRedirCache[$cacheTitle->getPrefixedDBkey()] =
3901 $cacheKey =
$title->getPrefixedDBkey();
3902 if ( !$this->currentRevisionCache ) {
3903 $this->currentRevisionCache =
new MapCacheLRU( 100 );
3905 if ( !$this->currentRevisionCache->has( $cacheKey ) ) {
3906 $this->currentRevisionCache->set( $cacheKey,
3908 call_user_func( $this->mOptions->getCurrentRevisionCallback(),
$title, $this )
3911 return $this->currentRevisionCache->get( $cacheKey );
3934 $templateCb = $this->mOptions->getTemplateCallback();
3935 $stuff = call_user_func( $templateCb,
$title, $this );
3937 $text = $stuff[
'text'];
3938 if ( is_string( $stuff[
'text'] ) ) {
3939 $text = strtr( $text,
"\x7f",
"?" );
3941 $finalTitle = isset( $stuff[
'finalTitle'] ) ? $stuff[
'finalTitle'] :
$title;
3942 if ( isset( $stuff[
'deps'] ) ) {
3943 foreach ( $stuff[
'deps']
as $dep ) {
3944 $this->mOutput->addTemplate( $dep[
'title'], $dep[
'page_id'], $dep[
'rev_id'] );
3945 if ( $dep[
'title']->equals( $this->getTitle() ) ) {
3948 $this->mOutput->setFlag(
'vary-revision' );
3952 return [ $text, $finalTitle ];
3961 return $this->fetchTemplateAndTitle(
$title )[0];
3974 $text = $skip =
false;
3978 # Loop to fetch the article, with up to 1 redirect
3980 for ( $i = 0; $i < 2 && is_object(
$title ); $i++ ) {
3982 # Give extensions a chance to select the revision instead
3983 $id =
false; # Assume current
3984 Hooks::run(
'BeforeParserFetchTemplateAndtitle',
3991 'page_id' =>
$title->getArticleID(),
4004 $rev_id =
$rev ?
$rev->getId() : 0;
4005 # If there is no current revision, there is no page
4006 if ( $id ===
false && !
$rev ) {
4008 $linkCache->addBadLinkObj(
$title );
4013 'page_id' =>
$title->getArticleID(),
4014 'rev_id' => $rev_id ];
4016 # We fetched a rev from a different title; register it too...
4018 'title' =>
$rev->getTitle(),
4019 'page_id' =>
$rev->getPage(),
4020 'rev_id' => $rev_id ];
4027 if ( $text ===
false || $text === null ) {
4033 $message =
wfMessage( $wgContLang->lcfirst(
$title->getText() ) )->inContentLanguage();
4034 if ( !$message->exists() ) {
4039 $text = $message->plain();
4052 'finalTitle' => $finalTitle,
4077 $time = $file ? $file->getTimestamp() :
false;
4078 $sha1 = $file ? $file->getSha1() :
false;
4079 # Register the file as a dependency...
4080 $this->mOutput->addImage(
$title->getDBkey(),
$time, $sha1 );
4081 if ( $file && !
$title->equals( $file->getTitle() ) ) {
4082 # Update fetched file title
4083 $title = $file->getTitle();
4084 $this->mOutput->addImage(
$title->getDBkey(),
$time, $sha1 );
4086 return [ $file,
$title ];
4100 if ( isset(
$options[
'broken'] ) ) {
4102 } elseif ( isset(
$options[
'sha1'] ) ) {
4119 global $wgEnableScaryTranscluding;
4121 if ( !$wgEnableScaryTranscluding ) {
4122 return wfMessage(
'scarytranscludedisabled' )->inContentLanguage()->text();
4125 $url =
$title->getFullURL( [
'action' => $action ] );
4127 if ( strlen( $url ) > 255 ) {
4128 return wfMessage(
'scarytranscludetoolong' )->inContentLanguage()->text();
4130 return $this->fetchScaryTemplateMaybeFromCache( $url );
4138 global $wgTranscludeCacheExpiry;
4140 $tsCond =
$dbr->timestamp( time() - $wgTranscludeCacheExpiry );
4141 $obj =
$dbr->selectRow(
'transcache', [
'tc_time',
'tc_contents' ],
4142 [
'tc_url' => $url,
"tc_time >= " .
$dbr->addQuotes( $tsCond ) ] );
4144 return $obj->tc_contents;
4150 $text =
$req->getContent();
4151 } elseif (
$req->getStatus() != 200 ) {
4153 return wfMessage(
'scarytranscludefailed-httpstatus' )
4154 ->params( $url,
$req->getStatus() )->inContentLanguage()->text();
4156 return wfMessage(
'scarytranscludefailed', $url )->inContentLanguage()->text();
4160 $dbw->replace(
'transcache', [
'tc_url' ], [
4162 'tc_time' => $dbw->timestamp( time() ),
4163 'tc_contents' => $text
4180 $parts = $piece[
'parts'];
4181 $nameWithSpaces = $frame->expand( $piece[
'title'] );
4182 $argName = trim( $nameWithSpaces );
4184 $text = $frame->getArgument( $argName );
4185 if ( $text ===
false && $parts->getLength() > 0
4186 && ( $this->ot[
'html']
4188 || ( $this->ot[
'wiki'] && $frame->isTemplate() )
4191 # No match in frame, use the supplied default
4192 $object = $parts->item( 0 )->getChildren();
4194 if ( !$this->incrementIncludeSize(
'arg', strlen( $text ) ) ) {
4195 $error =
'<!-- WARNING: argument omitted, expansion size too large -->';
4196 $this->limitationWarn(
'post-expand-template-argument' );
4199 if ( $text ===
false && $object ===
false ) {
4201 $object = $frame->virtualBracketedImplode(
'{{{',
'|',
'}}}', $nameWithSpaces, $parts );
4203 if ( $error !==
false ) {
4206 if ( $object !==
false ) {
4207 $ret = [
'object' => $object ];
4209 $ret = [
'text' => $text ];
4232 $attrText = !isset(
$params[
'attr'] ) ? null : $frame->expand(
$params[
'attr'] );
4234 $marker = self::MARKER_PREFIX .
"-$name-"
4235 . sprintf(
'%08X', $this->mMarkerIndex++ ) . self::MARKER_SUFFIX;
4237 $isFunctionTag = isset( $this->mFunctionTagHooks[strtolower(
$name )] ) &&
4238 ( $this->ot[
'html'] || $this->ot[
'pre'] );
4239 if ( $isFunctionTag ) {
4240 $markerType =
'none';
4242 $markerType =
'general';
4244 if ( $this->ot[
'html'] || $isFunctionTag ) {
4247 if ( isset(
$params[
'attributes'] ) ) {
4248 $attributes = $attributes +
$params[
'attributes'];
4251 if ( isset( $this->mTagHooks[
$name] ) ) {
4252 # Workaround for PHP bug 35229 and similar
4253 if ( !is_callable( $this->mTagHooks[$name] ) ) {
4254 throw new MWException(
"Tag hook for $name is not callable\n" );
4256 $output = call_user_func_array( $this->mTagHooks[$name],
4257 [
$content, $attributes, $this, $frame ] );
4258 } elseif ( isset( $this->mFunctionTagHooks[$name] ) ) {
4259 list( $callback, ) = $this->mFunctionTagHooks[
$name];
4260 if ( !is_callable( $callback ) ) {
4261 throw new MWException(
"Tag hook for $name is not callable\n" );
4264 $output = call_user_func_array( $callback, [ &$this, $frame,
$content, $attributes ] );
4266 $output =
'<span class="error">Invalid tag extension name: ' .
4267 htmlspecialchars( $name ) .
'</span>';
4271 # Extract flags to local scope (to override $markerType)
4278 if ( is_null( $attrText ) ) {
4281 if ( isset(
$params[
'attributes'] ) ) {
4282 foreach (
$params[
'attributes']
as $attrName => $attrValue ) {
4283 $attrText .=
' ' . htmlspecialchars( $attrName ) .
'="' .
4284 htmlspecialchars( $attrValue ) .
'"';
4288 $output =
"<$name$attrText/>";
4290 $close = is_null(
$params[
'close'] ) ?
'' : $frame->expand(
$params[
'close'] );
4291 $output =
"<$name$attrText>$content$close";
4295 if ( $markerType ===
'none' ) {
4297 } elseif ( $markerType ===
'nowiki' ) {
4298 $this->mStripState->addNoWiki( $marker,
$output );
4299 } elseif ( $markerType ===
'general' ) {
4300 $this->mStripState->addGeneral( $marker,
$output );
4302 throw new MWException( __METHOD__ .
': invalid marker type' );
4315 if ( $this->mIncludeSizes[
$type] + $size > $this->mOptions->getMaxIncludeSize() ) {
4318 $this->mIncludeSizes[
$type] += $size;
4329 $this->mExpensiveFunctionCount++;
4330 return $this->mExpensiveFunctionCount <= $this->mOptions->getExpensiveParserFunctionLimit();
4343 # The position of __TOC__ needs to be recorded
4345 if ( $mw->match( $text ) ) {
4346 $this->mShowToc =
true;
4347 $this->mForceTocPosition =
true;
4349 # Set a placeholder. At the end we'll fill it in with the TOC.
4350 $text = $mw->replace(
'<!--MWTOC-->', $text, 1 );
4352 # Only keep the first one.
4353 $text = $mw->replace(
'', $text );
4356 # Now match and remove the rest of them
4358 $this->mDoubleUnderscores = $mwa->matchAndRemove( $text );
4360 if ( isset( $this->mDoubleUnderscores[
'nogallery'] ) ) {
4361 $this->mOutput->mNoGallery =
true;
4363 if ( isset( $this->mDoubleUnderscores[
'notoc'] ) && !$this->mForceTocPosition ) {
4364 $this->mShowToc =
false;
4366 if ( isset( $this->mDoubleUnderscores[
'hiddencat'] )
4369 $this->addTrackingCategory(
'hidden-category-category' );
4371 # (bug 8068) Allow control over whether robots index a page.
4372 # @todo FIXME: Bug 14899: __INDEX__ always overrides __NOINDEX__ here! This
4373 # is not desirable, the last one on the page should win.
4374 if ( isset( $this->mDoubleUnderscores[
'noindex'] ) && $this->mTitle->canUseNoindex() ) {
4375 $this->mOutput->setIndexPolicy(
'noindex' );
4376 $this->addTrackingCategory(
'noindex-category' );
4378 if ( isset( $this->mDoubleUnderscores[
'index'] ) && $this->mTitle->canUseNoindex() ) {
4379 $this->mOutput->setIndexPolicy(
'index' );
4380 $this->addTrackingCategory(
'index-category' );
4383 # Cache all double underscores in the database
4384 foreach ( $this->mDoubleUnderscores
as $key => $val ) {
4385 $this->mOutput->setProperty(
$key,
'' );
4397 return $this->mOutput->addTrackingCategory( $msg, $this->mTitle );
4419 # Inhibit editsection links if requested in the page
4420 if ( isset( $this->mDoubleUnderscores[
'noeditsection'] ) ) {
4421 $maybeShowEditLink = $showEditLink =
false;
4423 $maybeShowEditLink =
true;
4424 $showEditLink = $this->mOptions->getEditSection();
4426 if ( $showEditLink ) {
4427 $this->mOutput->setEditSectionTokens(
true );
4430 # Get all headlines for numbering them and adding funky stuff like [edit]
4431 # links - this is for later, but we need the number of headlines right now
4433 $numMatches = preg_match_all(
4434 '/<H(?P<level>[1-6])(?P<attrib>.*?>)\s*(?P<header>[\s\S]*?)\s*<\/H[1-6] *>/i',
4439 # if there are fewer than 4 headlines in the article, do not show TOC
4440 # unless it's been explicitly enabled.
4441 $enoughToc = $this->mShowToc &&
4442 ( ( $numMatches >= 4 ) || $this->mForceTocPosition );
4444 # Allow user to stipulate that a page should have a "new section"
4445 # link added via __NEWSECTIONLINK__
4446 if ( isset( $this->mDoubleUnderscores[
'newsectionlink'] ) ) {
4447 $this->mOutput->setNewSection(
true );
4450 # Allow user to remove the "new section"
4451 # link via __NONEWSECTIONLINK__
4452 if ( isset( $this->mDoubleUnderscores[
'nonewsectionlink'] ) ) {
4453 $this->mOutput->hideNewSection(
true );
4456 # if the string __FORCETOC__ (not case-sensitive) occurs in the HTML,
4457 # override above conditions and always show TOC above first header
4458 if ( isset( $this->mDoubleUnderscores[
'forcetoc'] ) ) {
4459 $this->mShowToc =
true;
4467 # Ugh .. the TOC should have neat indentation levels which can be
4468 # passed to the skin functions. These are determined here
4472 $sublevelCount = [];
4478 $markerRegex = self::MARKER_PREFIX .
"-h-(\d+)-" . self::MARKER_SUFFIX;
4479 $baseTitleText = $this->mTitle->getPrefixedDBkey();
4480 $oldType = $this->mOutputType;
4482 $frame = $this->getPreprocessor()->newFrame();
4483 $root = $this->preprocessToDom( $origText );
4484 $node = $root->getFirstChild();
4489 $headlines = $numMatches !==
false ?
$matches[3] : [];
4491 foreach ( $headlines
as $headline ) {
4492 $isTemplate =
false;
4494 $sectionIndex =
false;
4496 $markerMatches = [];
4497 if ( preg_match(
"/^$markerRegex/", $headline, $markerMatches ) ) {
4498 $serial = $markerMatches[1];
4499 list( $titleText, $sectionIndex ) = $this->mHeadings[$serial];
4500 $isTemplate = ( $titleText != $baseTitleText );
4501 $headline = preg_replace(
"/^$markerRegex\\s*/",
"", $headline );
4505 $prevlevel = $level;
4507 $level =
$matches[1][$headlineCount];
4509 if ( $level > $prevlevel ) {
4510 # Increase TOC level
4512 $sublevelCount[$toclevel] = 0;
4513 if ( $toclevel < $wgMaxTocLevel ) {
4514 $prevtoclevel = $toclevel;
4518 } elseif ( $level < $prevlevel && $toclevel > 1 ) {
4519 # Decrease TOC level, find level to jump to
4521 for ( $i = $toclevel; $i > 0; $i-- ) {
4522 if ( $levelCount[$i] == $level ) {
4523 # Found last matching level
4526 } elseif ( $levelCount[$i] < $level ) {
4527 # Found first matching level below current level
4535 if ( $toclevel < $wgMaxTocLevel ) {
4536 if ( $prevtoclevel < $wgMaxTocLevel ) {
4537 # Unindent only if the previous toc level was shown :p
4539 $prevtoclevel = $toclevel;
4545 # No change in level, end TOC line
4546 if ( $toclevel < $wgMaxTocLevel ) {
4551 $levelCount[$toclevel] = $level;
4553 # count number of headlines for each level
4554 $sublevelCount[$toclevel]++;
4556 for ( $i = 1; $i <= $toclevel; $i++ ) {
4557 if ( !empty( $sublevelCount[$i] ) ) {
4561 $numbering .= $this->getTargetLanguage()->formatNum( $sublevelCount[$i] );
4566 # The safe header is a version of the header text safe to use for links
4568 # Replace link placeholders with the link text.
4569 # <!--LINK number-->
4571 # link text with suffix
4572 # Do this before unstrip since link text can contain strip markers
4573 $safeHeadline = $this->replaceLinkHoldersText( $headline );
4575 # Avoid insertion of weird stuff like <math> by expanding the relevant sections
4576 $safeHeadline = $this->mStripState->unstripBoth( $safeHeadline );
4578 # Strip out HTML (first regex removes any tag not allowed)
4580 # * <sup> and <sub> (bug 8393)
4583 # * <bdi> (bug 72884)
4584 # * <span dir="rtl"> and <span dir="ltr"> (bug 35167)
4585 # We strip any parameter from accepted tags (second regex), except dir="rtl|ltr" from <span>,
4586 # to allow setting directionality in toc items.
4587 $tocline = preg_replace(
4589 '#<(?!/?(span|sup|sub|bdi|i|b)(?: [^>]*)?>).*?>#',
4590 '#<(/?(?:span(?: dir="(?:rtl|ltr)")?|sup|sub|bdi|i|b))(?: .*?)?>#'
4596 # Strip '<span></span>', which is the result from the above if
4597 # <span id="foo"></span> is used to produce an additional anchor
4599 $tocline = str_replace(
'<span></span>',
'', $tocline );
4601 $tocline = trim( $tocline );
4603 # For the anchor, strip out HTML-y stuff period
4604 $safeHeadline = preg_replace(
'/<.*?>/',
'', $safeHeadline );
4607 # Save headline for section edit hint before it's escaped
4608 $headlineHint = $safeHeadline;
4610 if ( $wgExperimentalHtmlIds ) {
4611 # For backward compatibility, provide an id that's
4612 # HTML4-compatible, like we used to.
4613 # It may be worth noting, academically, that it's possible for
4614 # the legacy anchor to conflict with a non-legacy headline
4615 # anchor on the page. In this case likely the "correct" thing
4616 # would be to either drop the legacy anchors or make sure
4617 # they're numbered first. However, this would require people
4618 # to type in section names like "abc_.D7.93.D7.90.D7.A4"
4619 # manually, so let's not bother worrying about it.
4621 [
'noninitial',
'legacy' ] );
4624 if ( $legacyHeadline == $safeHeadline ) {
4625 # No reason to have both (in fact, we can't)
4626 $legacyHeadline =
false;
4629 $legacyHeadline =
false;
4634 # HTML names must be case-insensitively unique (bug 10721).
4635 # This does not apply to Unicode characters per
4636 # http://www.w3.org/TR/html5/infrastructure.html#case-sensitivity-and-string-comparison
4637 # @todo FIXME: We may be changing them depending on the current locale.
4638 $arrayKey = strtolower( $safeHeadline );
4639 if ( $legacyHeadline ===
false ) {
4640 $legacyArrayKey =
false;
4642 $legacyArrayKey = strtolower( $legacyHeadline );
4645 # Create the anchor for linking from the TOC to the section
4646 $anchor = $safeHeadline;
4647 $legacyAnchor = $legacyHeadline;
4648 if ( isset( $refers[$arrayKey] ) ) {
4650 for ( $i = 2; isset( $refers[
"${arrayKey}_$i"] ); ++$i );
4653 $refers[
"${arrayKey}_$i"] =
true;
4655 $refers[$arrayKey] =
true;
4657 if ( $legacyHeadline !==
false && isset( $refers[$legacyArrayKey] ) ) {
4659 for ( $i = 2; isset( $refers[
"${legacyArrayKey}_$i"] ); ++$i );
4661 $legacyAnchor .=
"_$i";
4662 $refers[
"${legacyArrayKey}_$i"] =
true;
4664 $refers[$legacyArrayKey] =
true;
4667 # Don't number the heading if it is the only one (looks silly)
4668 if ( count(
$matches[3] ) > 1 && $this->mOptions->getNumberHeadings() ) {
4669 # the two are different if the line contains a link
4672 [
'class' =>
'mw-headline-number' ],
4674 ) .
' ' . $headline;
4677 if ( $enoughToc && ( !isset( $wgMaxTocLevel ) || $toclevel < $wgMaxTocLevel ) ) {
4679 $numbering, $toclevel, ( $isTemplate ?
false : $sectionIndex ) );
4682 # Add the section to the section tree
4683 # Find the DOM node for this header
4684 $noOffset = ( $isTemplate || $sectionIndex ===
false );
4685 while ( $node && !$noOffset ) {
4686 if ( $node->getName() ===
'h' ) {
4687 $bits = $node->splitHeading();
4688 if ( $bits[
'i'] == $sectionIndex ) {
4692 $byteOffset += mb_strlen( $this->mStripState->unstripBoth(
4694 $node = $node->getNextSibling();
4697 'toclevel' => $toclevel,
4700 'number' => $numbering,
4701 'index' => ( $isTemplate ?
'T-' :
'' ) . $sectionIndex,
4702 'fromtitle' => $titleText,
4703 'byteoffset' => ( $noOffset ? null : $byteOffset ),
4704 'anchor' => $anchor,
4707 # give headline the correct <h#> tag
4708 if ( $maybeShowEditLink && $sectionIndex !==
false ) {
4710 if ( $isTemplate ) {
4711 # Put a T flag in the section identifier, to indicate to extractSections()
4712 # that sections inside <includeonly> should be counted.
4713 $editsectionPage = $titleText;
4714 $editsectionSection =
"T-$sectionIndex";
4715 $editsectionContent = null;
4717 $editsectionPage = $this->mTitle->getPrefixedText();
4718 $editsectionSection = $sectionIndex;
4719 $editsectionContent = $headlineHint;
4733 $editlink =
'<mw:editsection page="' . htmlspecialchars( $editsectionPage );
4734 $editlink .=
'" section="' . htmlspecialchars( $editsectionSection ) .
'"';
4735 if ( $editsectionContent !== null ) {
4736 $editlink .=
'>' . $editsectionContent .
'</mw:editsection>';
4744 $matches[
'attrib'][$headlineCount], $anchor, $headline,
4745 $editlink, $legacyAnchor );
4750 $this->setOutputType( $oldType );
4752 # Never ever show TOC if no headers
4753 if ( $numVisible < 1 ) {
4758 if ( $prevtoclevel > 0 && $prevtoclevel < $wgMaxTocLevel ) {
4762 $this->mOutput->setTOCHTML( $toc );
4763 $toc = self::TOC_START . $toc . self::TOC_END;
4764 $this->mOutput->addModules(
'mediawiki.toc' );
4768 $this->mOutput->setSections( $tocraw );
4771 # split up and insert constructed headlines
4772 $blocks = preg_split(
'/<H[1-6].*?>[\s\S]*?<\/H[1-6]>/i', $text );
4777 foreach ( $blocks
as $block ) {
4779 if ( empty( $head[$i - 1] ) ) {
4780 $sections[$i] = $block;
4782 $sections[$i] = $head[$i - 1] . $block;
4795 Hooks::run(
'ParserSectionCreate', [ $this, $i, &$sections[$i], $showEditLink ] );
4800 if ( $enoughToc && $isMain && !$this->mForceTocPosition ) {
4803 $sections[0] = $sections[0] . $toc .
"\n";
4806 $full .= implode(
'', $sections );
4808 if ( $this->mForceTocPosition ) {
4809 return str_replace(
'<!--MWTOC-->', $toc, $full );
4829 if ( $clearState ) {
4830 $magicScopeVariable = $this->lock();
4832 $this->startParse( $title, $options,
self::OT_WIKI, $clearState );
4833 $this->setUser( $user );
4839 $text = str_replace( array_keys( $pairs ), array_values( $pairs ), $text );
4841 $text = $this->pstPass2( $text, $user );
4843 $text = $this->mStripState->unstripBoth( $text );
4845 $this->setUser( null ); # Reset
4861 # Note: This is the timestamp saved as hardcoded wikitext to
4862 # the database, we use $wgContLang here in order to give
4863 # everyone the same signature and use the default one rather
4864 # than the one selected in each user's preferences.
4865 # (see also bug 12815)
4866 $ts = $this->mOptions->getTimestamp();
4869 $tzMsg =
$timestamp->getTimezoneMessage()->inContentLanguage()->text();
4871 $d = $wgContLang->timeanddate( $ts,
false,
false ) .
" ($tzMsg)";
4873 # Variable replacement
4874 # Because mOutputType is OT_WIKI, this will only process {{subst:xxx}} type tags
4875 $text = $this->replaceVariables( $text );
4877 # This works almost by chance, as the replaceVariables are done before the getUserSig(),
4878 # which may corrupt this parser instance via its wfMessage()->text() call-
4881 $sigText = $this->getUserSig(
$user );
4882 $text = strtr( $text, [
4884 '~~~~' =>
"$sigText $d",
4888 # Context links ("pipe tricks"): [[|name]] and [[name (context)|]]
4890 $nc =
'[ _0-9A-Za-z\x80-\xff-]'; # Namespaces can
use non-ascii!
4893 $p1 =
"/\[\[(:?$nc+:|:|)($tc+?)( ?\\($tc+\\))\\|]]/";
4895 $p4 =
"/\[\[(:?$nc+:|:|)($tc+?)( ?($tc+))\\|]]/";
4897 $p3 =
"/\[\[(:?$nc+:|:|)($tc+?)( ?\\($tc+\\)|)((?:, |,)$tc+|)\\|]]/";
4899 $p2 =
"/\[\[\\|($tc+)]]/";
4901 # try $p1 first, to turn "[[A, B (C)|]]" into "[[A, B (C)|A, B]]"
4902 $text = preg_replace( $p1,
'[[\\1\\2\\3|\\2]]', $text );
4903 $text = preg_replace( $p4,
'[[\\1\\2\\3|\\2]]', $text );
4904 $text = preg_replace( $p3,
'[[\\1\\2\\3\\4|\\2]]', $text );
4906 $t = $this->mTitle->getText();
4908 if ( preg_match(
"/^($nc+:|)$tc+?( \\($tc+\\))$/",
$t, $m ) ) {
4909 $text = preg_replace( $p2,
"[[$m[1]\\1$m[2]|\\1]]", $text );
4910 } elseif ( preg_match(
"/^($nc+:|)$tc+?(, $tc+|)$/",
$t, $m ) &&
"$m[1]$m[2]" !=
'' ) {
4911 $text = preg_replace( $p2,
"[[$m[1]\\1$m[2]|\\1]]", $text );
4913 # if there's no context, don't bother duplicating the title
4914 $text = preg_replace( $p2,
'[[\\1]]', $text );
4917 # Trim trailing whitespace
4918 $text = rtrim( $text );
4942 # If not given, retrieve from the user object.
4943 if ( $nickname ===
false ) {
4944 $nickname =
$user->getOption(
'nickname' );
4947 if ( is_null( $fancySig ) ) {
4948 $fancySig =
$user->getBoolOption(
'fancysig' );
4951 $nickname = $nickname == null ?
$username : $nickname;
4953 if ( mb_strlen( $nickname ) > $wgMaxSigChars ) {
4955 wfDebug( __METHOD__ .
": $username has overlong signature.\n" );
4956 } elseif ( $fancySig !==
false ) {
4957 # Sig. might contain markup; validate this
4958 if ( $this->validateSig( $nickname ) !==
false ) {
4959 # Validated; clean up (if needed) and return it
4960 return $this->cleanSig( $nickname,
true );
4962 # Failed to validate; fall back to the default
4964 wfDebug( __METHOD__ .
": $username has bad XML tags in signature.\n" );
4968 # Make sure nickname doesn't get a sig in a sig
4969 $nickname = self::cleanSigInSig( $nickname );
4971 # If we're still here, make it a link to the user page
4974 $msgName =
$user->isAnon() ?
'signature-anon' :
'signature';
4976 return wfMessage( $msgName, $userText, $nickText )->inContentLanguage()
4977 ->title( $this->getTitle() )->text();
5003 $magicScopeVariable = $this->lock();
5007 # Option to disable this feature
5008 if ( !$this->mOptions->getCleanSignatures() ) {
5012 # @todo FIXME: Regex doesn't respect extension tags or nowiki
5013 # => Move this logic to braceSubstitution()
5015 $substRegex =
'/\{\{(?!(?:' . $substWord->getBaseRegex() .
'))/x' . $substWord->getRegexCase();
5016 $substText =
'{{' . $substWord->getSynonym( 0 );
5018 $text = preg_replace( $substRegex, $substText, $text );
5019 $text = self::cleanSigInSig( $text );
5020 $dom = $this->preprocessToDom( $text );
5021 $frame = $this->getPreprocessor()->newFrame();
5022 $text = $frame->expand( $dom );
5025 $text = $this->mStripState->unstripBoth( $text );
5038 $text = preg_replace(
'/~{3,5}/',
'', $text );
5052 $outputType, $clearState =
true
5054 $this->startParse(
$title, $options, $outputType, $clearState );
5064 $outputType, $clearState =
true
5066 $this->setTitle(
$title );
5068 $this->setOutputType( $outputType );
5069 if ( $clearState ) {
5070 $this->clearState();
5083 static $executing =
false;
5085 # Guard against infinite recursion
5128 if ( preg_match(
'/[<>\r\n]/',
$tag, $m ) ) {
5129 throw new MWException(
"Invalid character {$m[0]} in setHook('$tag', ...) call" );
5131 $oldVal = isset( $this->mTagHooks[
$tag] ) ? $this->mTagHooks[
$tag] : null;
5132 $this->mTagHooks[
$tag] = $callback;
5133 if ( !in_array( $tag, $this->mStripList ) ) {
5134 $this->mStripList[] =
$tag;
5159 if ( preg_match(
'/[<>\r\n]/',
$tag, $m ) ) {
5160 throw new MWException(
"Invalid character {$m[0]} in setTransparentHook('$tag', ...) call" );
5162 $oldVal = isset( $this->mTransparentTagHooks[
$tag] ) ? $this->mTransparentTagHooks[
$tag] : null;
5163 $this->mTransparentTagHooks[
$tag] = $callback;
5172 $this->mTagHooks = [];
5173 $this->mFunctionTagHooks = [];
5174 $this->mStripList = $this->mDefaultStripList;
5223 $oldVal = isset( $this->mFunctionHooks[$id] ) ? $this->mFunctionHooks[$id][0] : null;
5224 $this->mFunctionHooks[$id] = [ $callback,
$flags ];
5226 # Add to function cache
5229 throw new MWException( __METHOD__ .
'() expecting a magic word identifier.' );
5232 $synonyms = $mw->getSynonyms();
5233 $sensitive = intval( $mw->isCaseSensitive() );
5235 foreach ( $synonyms
as $syn ) {
5237 if ( !$sensitive ) {
5238 $syn = $wgContLang->lc( $syn );
5244 # Remove trailing colon
5245 if ( substr( $syn, -1, 1 ) ===
':' ) {
5246 $syn = substr( $syn, 0, -1 );
5248 $this->mFunctionSynonyms[$sensitive][$syn] = $id;
5259 return array_keys( $this->mFunctionHooks );
5274 if ( preg_match(
'/[<>\r\n]/',
$tag, $m ) ) {
5275 throw new MWException(
"Invalid character {$m[0]} in setFunctionTagHook('$tag', ...) call" );
5277 $old = isset( $this->mFunctionTagHooks[
$tag] ) ?
5278 $this->mFunctionTagHooks[
$tag] : null;
5279 $this->mFunctionTagHooks[
$tag] = [ $callback,
$flags ];
5281 if ( !in_array( $tag, $this->mStripList ) ) {
5282 $this->mStripList[] =
$tag;
5296 $this->mLinkHolders->replace( $text );
5307 return $this->mLinkHolders->replaceText( $text );
5326 if ( isset(
$params[
'mode'] ) ) {
5337 $ig->setContextTitle( $this->mTitle );
5338 $ig->setShowBytes(
false );
5339 $ig->setShowFilename(
false );
5340 $ig->setParser( $this );
5341 $ig->setHideBadImages();
5344 if ( isset(
$params[
'showfilename'] ) ) {
5345 $ig->setShowFilename(
true );
5347 $ig->setShowFilename(
false );
5349 if ( isset(
$params[
'caption'] ) ) {
5350 $caption =
$params[
'caption'];
5351 $caption = htmlspecialchars( $caption );
5352 $caption = $this->replaceInternalLinks( $caption );
5353 $ig->setCaptionHtml( $caption );
5355 if ( isset(
$params[
'perrow'] ) ) {
5356 $ig->setPerRow(
$params[
'perrow'] );
5358 if ( isset(
$params[
'widths'] ) ) {
5359 $ig->setWidths(
$params[
'widths'] );
5361 if ( isset(
$params[
'heights'] ) ) {
5362 $ig->setHeights(
$params[
'heights'] );
5364 $ig->setAdditionalOptions(
$params );
5366 Hooks::run(
'BeforeParserrenderImageGallery', [ &$this, &$ig ] );
5370 # match lines like these:
5371 # Image:someimage.jpg|This is some image
5373 preg_match(
"/^([^|]+)(\\|(.*))?$/", $line,
$matches );
5379 if ( strpos(
$matches[0],
'%' ) !==
false ) {
5383 if ( is_null(
$title ) ) {
5384 # Bogus title. Ignore these so we don't bomb out later.
5388 # We need to get what handler the file uses, to figure out parameters.
5389 # Note, a hook can override the file name, and choose an entirely different
5390 # file (which potentially could be of a different type and have a different handler).
5395 # Don't register it now, as ImageGallery does that later.
5397 $handler = $file ? $file->getHandler() :
false;
5400 'img_alt' =>
'gallery-internal-alt',
5401 'img_link' =>
'gallery-internal-link',
5404 $paramMap = $paramMap +
$handler->getParamMap();
5407 unset( $paramMap[
'img_width'] );
5415 $handlerOptions = [];
5426 foreach ( $parameterMatches
as $parameterMatch ) {
5427 list( $magicName, $match ) = $mwArray->matchVariableStartToEnd( $parameterMatch );
5429 $paramName = $paramMap[$magicName];
5431 switch ( $paramName ) {
5432 case 'gallery-internal-alt':
5433 $alt = $this->stripAltText( $match,
false );
5435 case 'gallery-internal-link':
5436 $linkValue = strip_tags( $this->replaceLinkHoldersText( $match ) );
5437 $chars = self::EXT_LINK_URL_CLASS;
5438 $addr = self::EXT_LINK_ADDR;
5439 $prots = $this->mUrlProtocols;
5441 if ( preg_match(
"/^($prots)$addr$chars*$/u", $linkValue ) ) {
5443 $this->mOutput->addExternalLink(
$link );
5446 if ( $localLinkTitle !== null ) {
5447 $this->mOutput->addLink( $localLinkTitle );
5454 if (
$handler->validateParam( $paramName, $match ) ) {
5455 $handlerOptions[$paramName] = $match;
5458 wfDebug(
"$parameterMatch failed parameter validation\n" );
5459 $label =
'|' . $parameterMatch;
5465 $label =
'|' . $parameterMatch;
5469 $label = substr( $label, 1 );
5472 $ig->add(
$title, $label, $alt,
$link, $handlerOptions );
5474 $html = $ig->toHTML();
5485 $handlerClass = get_class(
$handler );
5489 if ( !isset( $this->mImageParams[$handlerClass] ) ) {
5490 # Initialise static lists
5491 static $internalParamNames = [
5492 'horizAlign' => [
'left',
'right',
'center',
'none' ],
5493 'vertAlign' => [
'baseline',
'sub',
'super',
'top',
'text-top',
'middle',
5494 'bottom',
'text-bottom' ],
5495 'frame' => [
'thumbnail',
'manualthumb',
'framed',
'frameless',
5496 'upright',
'border',
'link',
'alt',
'class' ],
5498 static $internalParamMap;
5499 if ( !$internalParamMap ) {
5500 $internalParamMap = [];
5501 foreach ( $internalParamNames
as $type => $names ) {
5503 $magicName = str_replace(
'-',
'_',
"img_$name" );
5504 $internalParamMap[$magicName] = [
$type,
$name ];
5509 # Add handler params
5510 $paramMap = $internalParamMap;
5512 $handlerParamMap =
$handler->getParamMap();
5513 foreach ( $handlerParamMap
as $magic => $paramName ) {
5514 $paramMap[$magic] = [
'handler', $paramName ];
5517 $this->mImageParams[$handlerClass] = $paramMap;
5518 $this->mImageParamsMagicArray[$handlerClass] =
new MagicWordArray( array_keys( $paramMap ) );
5520 return [ $this->mImageParams[$handlerClass], $this->mImageParamsMagicArray[$handlerClass] ];
5532 # Check if the options text is of the form "options|alt text"
5534 # * thumbnail make a thumbnail with enlarge-icon and caption, alignment depends on lang
5535 # * left no resizing, just left align. label is used for alt= only
5536 # * right same, but right aligned
5537 # * none same, but not aligned
5538 # * ___px scale to ___ pixels width, no aligning. e.g. use in taxobox
5539 # * center center the image
5540 # * frame Keep original image size, no magnify-button.
5541 # * framed Same as "frame"
5542 # * frameless like 'thumb' but without a frame. Keeps user preferences for width
5543 # * upright reduce width for upright images, rounded to full __0 px
5544 # * border draw a 1px border around the image
5545 # * alt Text for HTML alt attribute (defaults to empty)
5546 # * class Set a class for img node
5547 # * link Set the target of the image link. Can be external, interwiki, or local
5548 # vertical-align values (no % or length right now):
5560 # Give extensions a chance to select the file revision for us
5565 # Fetch and register the file (file title may be different via hooks)
5569 $handler = $file ? $file->getHandler() :
false;
5571 list( $paramMap, $mwArray ) = $this->getImageParams(
$handler );
5574 $this->addTrackingCategory(
'broken-file-category' );
5577 # Process the input parameters
5579 $params = [
'frame' => [],
'handler' => [],
5580 'horizAlign' => [],
'vertAlign' => [] ];
5581 $seenformat =
false;
5582 foreach ( $parts
as $part ) {
5583 $part = trim( $part );
5584 list( $magicName,
$value ) = $mwArray->matchVariableStartToEnd( $part );
5586 if ( isset( $paramMap[$magicName] ) ) {
5587 list(
$type, $paramName ) = $paramMap[$magicName];
5589 # Special case; width and height come in one variable together
5590 if (
$type ===
'handler' && $paramName ===
'width' ) {
5591 $parsedWidthParam = $this->parseWidthParam(
$value );
5592 if ( isset( $parsedWidthParam[
'width'] ) ) {
5593 $width = $parsedWidthParam[
'width'];
5594 if (
$handler->validateParam(
'width', $width ) ) {
5599 if ( isset( $parsedWidthParam[
'height'] ) ) {
5600 $height = $parsedWidthParam[
'height'];
5601 if (
$handler->validateParam(
'height', $height ) ) {
5606 # else no validation -- bug 13436
5608 if (
$type ===
'handler' ) {
5609 # Validate handler parameter
5612 # Validate internal parameters
5613 switch ( $paramName ) {
5617 # @todo FIXME: Possibly check validity here for
5618 # manualthumb? downstream behavior seems odd with
5619 # missing manual thumbs.
5624 $chars = self::EXT_LINK_URL_CLASS;
5625 $addr = self::EXT_LINK_ADDR;
5626 $prots = $this->mUrlProtocols;
5628 $paramName =
'no-link';
5631 } elseif ( preg_match(
"/^((?i)$prots)/",
$value ) ) {
5632 if ( preg_match(
"/^((?i)$prots)$addr$chars*$/u",
$value, $m ) ) {
5633 $paramName =
'link-url';
5634 $this->mOutput->addExternalLink(
$value );
5635 if ( $this->mOptions->getExternalLinkTarget() ) {
5636 $params[
$type][
'link-target'] = $this->mOptions->getExternalLinkTarget();
5643 $paramName =
'link-title';
5645 $this->mOutput->addLink( $linkTitle );
5654 $validated = ! $seenformat;
5658 # Most other things appear to be empty or numeric...
5659 $validated = (
$value ===
false || is_numeric( trim(
$value ) ) );
5668 if ( !$validated ) {
5673 # Process alignment parameters
5674 if (
$params[
'horizAlign'] ) {
5681 $params[
'frame'][
'caption'] = $caption;
5683 # Will the image be presented in a frame, with the caption below?
5684 $imageIsFramed = isset(
$params[
'frame'][
'frame'] )
5685 || isset(
$params[
'frame'][
'framed'] )
5686 || isset(
$params[
'frame'][
'thumbnail'] )
5687 || isset(
$params[
'frame'][
'manualthumb'] );
5689 # In the old days, [[Image:Foo|text...]] would set alt text. Later it
5690 # came to also set the caption, ordinary text after the image -- which
5691 # makes no sense, because that just repeats the text multiple times in
5692 # screen readers. It *also* came to set the title attribute.
5693 # Now that we have an alt attribute, we should not set the alt text to
5694 # equal the caption: that's worse than useless, it just repeats the
5695 # text. This is the framed/thumbnail case. If there's no caption, we
5696 # use the unnamed parameter for alt text as well, just for the time be-
5697 # ing, if the unnamed param is set and the alt param is not.
5698 # For the future, we need to figure out if we want to tweak this more,
5699 # e.g., introducing a title= parameter for the title; ignoring the un-
5700 # named parameter entirely for images without a caption; adding an ex-
5701 # plicit caption= parameter and preserving the old magic unnamed para-
5703 if ( $imageIsFramed ) { # Framed image
5704 if ( $caption ===
'' && !isset(
$params[
'frame'][
'alt'] ) ) {
5705 # No caption or alt text, add the filename as the alt text so
5706 # that screen readers at least get some description of the image
5709 # Do not set $params['frame']['title'] because tooltips don't make sense
5711 }
else { # Inline image
5712 if ( !isset(
$params[
'frame'][
'alt'] ) ) {
5713 # No alt text, use the "caption" for the alt text
5714 if ( $caption !==
'' ) {
5715 $params[
'frame'][
'alt'] = $this->stripAltText( $caption, $holders );
5717 # No caption, fall back to using the filename for the
5722 # Use the "caption" for the tooltip text
5723 $params[
'frame'][
'title'] = $this->stripAltText( $caption, $holders );
5728 # Linker does the rest
5731 $time, $descQuery, $this->mOptions->getThumbSize() );
5733 # Give the handler a chance to modify the parser object
5735 $handler->parserTransformHook( $this, $file );
5747 # Strip bad stuff out of the title (tooltip). We can't just use
5748 # replaceLinkHoldersText() here, because if this function is called
5749 # from replaceInternalLinks2(), mLinkHolders won't be up-to-date.
5751 $tooltip = $holders->replaceText( $caption );
5753 $tooltip = $this->replaceLinkHoldersText( $caption );
5756 # make sure there are no placeholders in thumbnail attributes
5757 # that are later expanded to html- so expand them now and
5759 $tooltip = $this->mStripState->unstripBoth( $tooltip );
5770 wfDebug(
"Parser output marked as uncacheable.\n" );
5771 if ( !$this->mOutput ) {
5773 " can only be called when actually parsing something" );
5775 $this->mOutput->updateCacheExpiry( 0 );
5787 $text = $this->replaceVariables( $text, $frame );
5788 $text = $this->mStripState->unstripBoth( $text );
5799 array_keys( $this->mTransparentTagHooks ),
5800 array_keys( $this->mTagHooks ),
5801 array_keys( $this->mFunctionTagHooks )
5817 $elements = array_keys( $this->mTransparentTagHooks );
5818 $text = self::extractTagsAndParams( $elements, $text,
$matches );
5823 $tagName = strtolower( $element );
5824 if ( isset( $this->mTransparentTagHooks[$tagName] ) ) {
5825 $output = call_user_func_array(
5826 $this->mTransparentTagHooks[$tagName],
5832 $replacements[$marker] =
$output;
5834 return strtr( $text, $replacements );
5869 $magicScopeVariable = $this->lock();
5872 $frame = $this->getPreprocessor()->newFrame();
5874 # Process section extraction flags
5876 $sectionParts = explode(
'-', $sectionId );
5877 $sectionIndex = array_pop( $sectionParts );
5878 foreach ( $sectionParts
as $part ) {
5879 if ( $part ===
'T' ) {
5880 $flags |= self::PTD_FOR_INCLUSION;
5884 # Check for empty input
5885 if ( strval( $text ) ===
'' ) {
5886 # Only sections 0 and T-0 exist in an empty document
5887 if ( $sectionIndex == 0 ) {
5888 if ( $mode ===
'get' ) {
5894 if ( $mode ===
'get' ) {
5902 # Preprocess the text
5903 $root = $this->preprocessToDom( $text,
$flags );
5905 # <h> nodes indicate section breaks
5906 # They can only occur at the top level, so we can find them by iterating the root's children
5907 $node = $root->getFirstChild();
5909 # Find the target section
5910 if ( $sectionIndex == 0 ) {
5911 # Section zero doesn't nest, level=big
5912 $targetLevel = 1000;
5915 if ( $node->getName() ===
'h' ) {
5916 $bits = $node->splitHeading();
5917 if ( $bits[
'i'] == $sectionIndex ) {
5918 $targetLevel = $bits[
'level'];
5922 if ( $mode ===
'replace' ) {
5925 $node = $node->getNextSibling();
5931 if ( $mode ===
'get' ) {
5938 # Find the end of the section, including nested sections
5940 if ( $node->getName() ===
'h' ) {
5941 $bits = $node->splitHeading();
5942 $curLevel = $bits[
'level'];
5943 if ( $bits[
'i'] != $sectionIndex && $curLevel <= $targetLevel ) {
5947 if ( $mode ===
'get' ) {
5950 $node = $node->getNextSibling();
5953 # Write out the remainder (in replace mode only)
5954 if ( $mode ===
'replace' ) {
5955 # Output the replacement text
5956 # Add two newlines on -- trailing whitespace in $newText is conventionally
5957 # stripped by the editor, so we need both newlines to restore the paragraph gap
5958 # Only add trailing whitespace if there is newText
5959 if ( $newText !=
"" ) {
5960 $outText .= $newText .
"\n\n";
5965 $node = $node->getNextSibling();
5969 if ( is_string( $outText ) ) {
5970 # Re-insert stripped tags
5971 $outText = rtrim( $this->mStripState->unstripBoth( $outText ) );
5991 public function getSection( $text, $sectionId, $defaultText =
'' ) {
5992 return $this->extractSections( $text, $sectionId,
'get', $defaultText );
6008 return $this->extractSections( $oldText, $sectionId,
'replace', $newText );
6017 return $this->mRevisionId;
6027 if ( !is_null( $this->mRevisionObject ) ) {
6028 return $this->mRevisionObject;
6030 if ( is_null( $this->mRevisionId ) ) {
6034 $rev = call_user_func(
6035 $this->mOptions->getCurrentRevisionCallback(), $this->getTitle(), $this
6038 # If the parse is for a new revision, then the callback should have
6039 # already been set to force the object and should match mRevisionId.
6040 # If not, try to fetch by mRevisionId for sanity.
6041 if (
$rev &&
$rev->getId() != $this->mRevisionId ) {
6045 $this->mRevisionObject =
$rev;
6047 return $this->mRevisionObject;
6056 if ( is_null( $this->mRevisionTimestamp ) ) {
6059 $revObject = $this->getRevisionObject();
6062 # The cryptic '' timezone parameter tells userAdjust() to use the site-default
6063 # timezone offset instead of the user settings.
6064 # Since this value will be saved into the parser cache, served
6065 # to other users, and potentially even used inside links and such,
6066 # it needs to be consistent for all visitors.
6067 $this->mRevisionTimestamp = $wgContLang->userAdjust(
$timestamp,
'' );
6070 return $this->mRevisionTimestamp;
6079 if ( is_null( $this->mRevisionUser ) ) {
6080 $revObject = $this->getRevisionObject();
6082 # if this template is subst: the revision id will be blank,
6083 # so just use the current user's name
6085 $this->mRevisionUser = $revObject->getUserText();
6086 } elseif ( $this->ot[
'wiki'] || $this->mOptions->getIsPreview() ) {
6087 $this->mRevisionUser = $this->getUser()->getName();
6090 return $this->mRevisionUser;
6099 if ( is_null( $this->mRevisionSize ) ) {
6100 $revObject = $this->getRevisionObject();
6102 # if this variable is subst: the revision id will be blank,
6103 # so just use the parser input size, because the substitution itself
6104 # will change the size.
6106 $this->mRevisionSize = $revObject->getSize();
6107 } elseif ( $this->ot[
'wiki'] || $this->mOptions->getIsPreview() ) {
6108 $this->mRevisionSize = $this->mInputSize;
6111 return $this->mRevisionSize;
6120 $this->mDefaultSort =
$sort;
6121 $this->mOutput->setProperty(
'defaultsort',
$sort );
6135 if ( $this->mDefaultSort !==
false ) {
6136 return $this->mDefaultSort;
6149 return $this->mDefaultSort;
6162 # Strip out wikitext links (they break the anchor)
6163 $text = $this->stripSectionName( $text );
6177 # Strip out wikitext links (they break the anchor)
6178 $text = $this->stripSectionName( $text );
6198 # Strip internal link markup
6199 $text = preg_replace(
'/\[\[:?([^[|]+)\|([^[]+)\]\]/',
'$2', $text );
6200 $text = preg_replace(
'/\[\[:?([^[]+)\|?\]\]/',
'$1', $text );
6202 # Strip external link markup
6203 # @todo FIXME: Not tolerant to blank link text
6204 # I.E. [https://www.mediawiki.org] will render as [1] or something depending
6205 # on how many empty links there are on the page - need to figure that out.
6206 $text = preg_replace(
'/\[(?i:' . $this->mUrlProtocols .
')([^ ]+?) ([^[]+)\]/',
'$2', $text );
6208 # Parse wikitext quotes (italics & bold)
6209 $text = $this->doQuotes( $text );
6229 $magicScopeVariable = $this->lock();
6230 $this->startParse( $title, $options, $outputType,
true );
6232 $text = $this->replaceVariables( $text );
6233 $text = $this->mStripState->unstripBoth( $text );
6245 return $this->preSaveTransform( $text, $title, $options->
getUser(),
$options );
6277 while ( $i < strlen(
$s ) ) {
6278 $markerStart = strpos(
$s, self::MARKER_PREFIX, $i );
6279 if ( $markerStart ===
false ) {
6280 $out .= call_user_func( $callback, substr(
$s, $i ) );
6283 $out .= call_user_func( $callback, substr(
$s, $i, $markerStart - $i ) );
6284 $markerEnd = strpos(
$s, self::MARKER_SUFFIX, $markerStart );
6285 if ( $markerEnd ===
false ) {
6286 $out .= substr(
$s, $markerStart );
6289 $markerEnd += strlen( self::MARKER_SUFFIX );
6290 $out .= substr(
$s, $markerStart, $markerEnd - $markerStart );
6305 return $this->mStripState->killMarkers( $text );
6327 'version' => self::HALF_PARSED_VERSION,
6328 'stripState' => $this->mStripState->getSubState( $text ),
6329 'linkHolders' => $this->mLinkHolders->getSubArray( $text )
6350 if ( !isset( $data[
'version'] ) || $data[
'version'] != self::HALF_PARSED_VERSION ) {
6351 throw new MWException( __METHOD__ .
': invalid version' );
6354 # First, extract the strip state.
6355 $texts = [ $data[
'text'] ];
6356 $texts = $this->mStripState->merge( $data[
'stripState'], $texts );
6358 # Now renumber links
6359 $texts = $this->mLinkHolders->mergeForeign( $data[
'linkHolders'], $texts );
6361 # Should be good to go.
6375 return isset( $data[
'version'] ) && $data[
'version'] == self::HALF_PARSED_VERSION;
6387 $parsedWidthParam = [];
6389 return $parsedWidthParam;
6392 # (bug 13500) In both cases (width/height and width only),
6393 # permit trailing "px" for backward compatibility.
6394 if ( preg_match(
'/^([0-9]*)x([0-9]*)\s*(?:px)?\s*$/',
$value, $m ) ) {
6395 $width = intval( $m[1] );
6396 $height = intval( $m[2] );
6397 $parsedWidthParam[
'width'] = $width;
6398 $parsedWidthParam[
'height'] = $height;
6399 } elseif ( preg_match(
'/^[0-9]*\s*(?:px)?\s*$/',
$value ) ) {
6400 $width = intval(
$value );
6401 $parsedWidthParam[
'width'] = $width;
6403 return $parsedWidthParam;
6416 if ( $this->mInParse ) {
6417 throw new MWException(
"Parser state cleared while parsing. "
6418 .
"Did you call Parser::parse recursively?" );
6420 $this->mInParse =
true;
6423 $this->mInParse =
false;
6426 return $recursiveCheck;
6441 if ( preg_match(
'/^<p>(.*)\n?<\/p>\n?$/sU',
$html, $m ) ) {
6442 if ( strpos( $m[1],
'</p>' ) ===
false ) {
6462 if ( $this->mInParse ) {
6463 return new $wgParserConf[
'class']( $wgParserConf );
6477 $this->mOutput->setEnableOOUI(
true );
getRevisionObject()
Get the revision object for $this->mRevisionId.
setTitle($t)
Set the context title.
markerSkipCallback($s, $callback)
Call a callback function on all regions of the given text that are not inside strip markers...
#define the
table suitable for use with IDatabase::select()
replaceInternalLinks2(&$s)
Process [[ ]] wikilinks (RIL)
static getVariableIDs()
Get an array of parser variable IDs.
you don t have to do a grep find to see where the $wgReverseTitle variable is used
deferred txt A few of the database updates required by various functions here can be deferred until after the result page is displayed to the user For updating the view updating the linked to tables after a etc PHP does not yet have any way to tell the server to actually return and disconnect while still running these but it might have such a feature in the future We handle these by creating a deferred update object and putting those objects on a global then executing the whole list after the page is displayed We don t do anything smart like collating updates to the same table or such because the list is almost always going to have just one item on if that
external whereas SearchGetNearMatch runs after $term
isValidHalfParsedText($data)
Returns true if the given array, presumed to be generated by serializeHalfParsedText(), is compatible with the current version of the parser.
null means default in associative array form
null means default in associative array with keys and values unescaped Should be merged with default with a value of false meaning to suppress the attribute in associative array with keys and values unescaped noclasses just before the function returns a value If you return an< a > element with HTML attributes $attribs and contents $html will be returned If you return $ret will be returned and may include noclasses & $html
static tocLineEnd()
End a Table Of Contents line.
deferred txt A few of the database updates required by various functions here can be deferred until after the result page is displayed to the user For updating the view updating the linked to tables after a etc PHP does not yet have any way to tell the server to actually return and disconnect while still running these but it might have such a feature in the future We handle these by creating a deferred update object and putting those objects on a global list
getSection($text, $sectionId, $defaultText= '')
This function returns the text of a section, specified by a number ($section).
static decodeTagAttributes($text)
Return an associative array of attribute names and values from a partial tag string.
killMarkers($text)
Remove any strip markers found in the given text.
wfGetDB($db, $groups=[], $wiki=false)
Get a Database object.
static tocList($toc, $lang=false)
Wraps the TOC in a table and provides the hide/collapse javascript.
fetchTemplateAndTitle($title)
Fetch the unparsed text of a template and register a reference to it.
this hook is for auditing only or null if authentication failed before getting that far or null if we can t even determine that probably a stub it is not rendered in wiki pages or galleries in category pages allow injecting custom HTML after the section Any uses of the hook need to handle escaping see BaseTemplate::getToolbox and BaseTemplate::makeListItem for details on the format of individual items inside of this array or by returning and letting standard HTTP rendering take place modifiable or by returning false and taking over the output $out
getRevisionUser()
Get the name of the user that edited the last revision.
setFunctionTagHook($tag, $callback, $flags)
Create a tag function, e.g.
the array() calling protocol came about after MediaWiki 1.4rc1.
stripSectionName($text)
Strips a text string of wikitext for use in a section anchor.
null for the local wiki Added should default to null in handler for backwards compatibility add a value to it if you want to add a cookie that have to vary cache options can modify $query
static linkKnown($target, $html=null, $customAttribs=[], $query=[], $options=[ 'known', 'noclasses'])
Identical to link(), except $options defaults to 'known'.
magic word the default is to use $key to get the and $key value or $key value text $key value html to format the value $key
Group all the pieces relevant to the context of a request into one instance.
getPreloadText($text, Title $title, ParserOptions $options, $params=[])
Process the wikitext for the "?preload=" feature.
validateSig($text)
Check that the user's signature contains no bad XML.
MapCacheLRU null $currentRevisionCache
$wgSitename
Name of the site.
renderImageGallery($text, $params)
Renders an image gallery from a text with one line per image.
recursivePreprocess($text, $frame=false)
Recursive parser entry point that can be called from an extension tag hook.
replaceExternalLinks($text)
Replace external links (REL)
static isNonincludable($index)
Is it not possible to use pages from this namespace as a template?
static replaceUnusualEscapes($url)
Replace unusual escape codes in a URL with their equivalent characters.
Apache License January AND DISTRIBUTION Definitions License shall mean the terms and conditions for use
doHeadings($text)
Parse headers and return html.
static getTitleFor($name, $subpage=false, $fragment= '')
Get a localised Title object for a specified special page name.
findColonNoLinks($str, &$before, &$after)
Split up a string on ':', ignoring any occurrences inside tags to prevent illegal overlapping...
static isWellFormedXmlFragment($text)
Check if a string is a well-formed XML fragment.
div flags Integer display flags(NO_ACTION_LINK, NO_EXTRA_USER_LINKS) 'LogException'returning false will NOT prevent logging $e
fetchFileAndTitle($title, $options=[])
Fetch a file and its title and register a reference to it.
We use the convention $dbr for read and $dbw for write to help you keep track of whether the database object is a the world will explode Or to be a subsequent write query which succeeded on the master may fail when replicated to the slave due to a unique key collision Replication on the slave will stop and it may take hours to repair the database and get it back online Setting read_only in my cnf on the slave will avoid this but given the dire we prefer to have as many checks as possible We provide a but the wrapper functions like please read the documentation for except in special pages derived from QueryPage It s a common pitfall for new developers to submit code containing SQL queries which examine huge numbers of rows Remember that COUNT * is(N), counting rows in atable is like counting beans in a bucket.------------------------------------------------------------------------Replication------------------------------------------------------------------------The largest installation of MediaWiki, Wikimedia, uses a large set ofslave MySQL servers replicating writes made to a master MySQL server.Itis important to understand the issues associated with this setup if youwant to write code destined for Wikipedia.It's often the case that the best algorithm to use for a given taskdepends on whether or not replication is in use.Due to our unabashedWikipedia-centrism, we often just use the replication-friendly version, but if you like, you can use wfGetLB() ->getServerCount() > 1 tocheck to see if replication is in use.===Lag===Lag primarily occurs when large write queries are sent to the master.Writes on the master are executed in parallel, but they are executed inserial when they are replicated to the slaves.The master writes thequery to the binlog when the transaction is committed.The slaves pollthe binlog and start executing the query as soon as it appears.They canservice reads while they are performing a write query, but will not readanything more from the binlog and 
thus will perform no more writes.Thismeans that if the write query runs for a long time, the slaves will lagbehind the master for the time it takes for the write query to complete.Lag can be exacerbated by high read load.MediaWiki's load balancer willstop sending reads to a slave when it is lagged by more than 30 seconds.If the load ratios are set incorrectly, or if there is too much loadgenerally, this may lead to a slave permanently hovering around 30seconds lag.If all slaves are lagged by more than 30 seconds, MediaWiki will stopwriting to the database.All edits and other write operations will berefused, with an error returned to the user.This gives the slaves achance to catch up.Before we had this mechanism, the slaves wouldregularly lag by several minutes, making review of recent editsdifficult.In addition to this, MediaWiki attempts to ensure that the user seesevents occurring on the wiki in chronological order.A few seconds of lagcan be tolerated, as long as the user sees a consistent picture fromsubsequent requests.This is done by saving the master binlog positionin the session, and then at the start of each request, waiting for theslave to catch up to that position before doing any reads from it.Ifthis wait times out, reads are allowed anyway, but the request isconsidered to be in"lagged slave mode".Lagged slave mode can bechecked by calling wfGetLB() ->getLaggedSlaveMode().The onlypractical consequence at present is a warning displayed in the pagefooter.===Lag avoidance===To avoid excessive lag, queries which write large numbers of rows shouldbe split up, generally to write one row at a time.Multi-row INSERT...SELECT queries are the worst offenders should be avoided altogether.Instead do the select first and then the insert.===Working with lag===Despite our best efforts, it's not practical to guarantee a low-lagenvironment.Lag will usually be less than one second, but mayoccasionally be up to 30 seconds.For scalability, it's very importantto keep load on 
the master low, so simply sending all your queries tothe master is not the answer.So when you have a genuine need forup-to-date data, the following approach is advised:1) Do a quick query to the master for a sequence number or timestamp 2) Run the full query on the slave and check if it matches the data you gotfrom the master 3) If it doesn't, run the full query on the masterTo avoid swamping the master every time the slaves lag, use of thisapproach should be kept to a minimum.In most cases you should just readfrom the slave and let the user deal with the delay.------------------------------------------------------------------------Lock contention------------------------------------------------------------------------Due to the high write rate on Wikipedia(and some other wikis), MediaWiki developers need to be very careful to structure their writesto avoid long-lasting locks.By default, MediaWiki opens a transactionat the first query, and commits it before the output is sent.Locks willbe held from the time when the query is done until the commit.So youcan reduce lock time by doing as much processing as possible before youdo your write queries.Often this approach is not good enough, and it becomes necessary toenclose small groups of queries in their own transaction.Use thefollowing syntax:$dbw=wfGetDB(DB_MASTER
initialiseVariables()
initialise the magic variables (like CURRENTMONTHNAME) and substitution modifiers ...
null means default in associative array with keys and values unescaped Should be merged with default with a value of false meaning to suppress the attribute in associative array with keys and values unescaped noclasses & $ret
Set options of the Parser.
static tidy($text)
Interface with html tidy.
getFunctionHooks()
Get all registered function hook identifiers.
globals txt Globals are evil The original MediaWiki code relied on globals for processing context far too often MediaWiki development since then has been a story of slowly moving context out of global variables and into objects Storing processing context in object member variables allows those objects to be reused in a much more flexible way Consider the elegance of
database rows
wfHostname()
Fetch server name for use in error reporting etc.
getFunctionLang()
Get a language object for use in parser functions such as {{FORMATNUM:}}.
processing should stop and the error should be shown to the user * false
argSubstitution($piece, $frame)
Triple brace replacement – used for template arguments.
testSrvus($text, Title $title, ParserOptions $options, $outputType=self::OT_HTML)
strip/replaceVariables/unstrip for preprocessor regression testing
uniqPrefix()
Accessor for mUniqPrefix.
Title($x=null)
Accessor/mutator for the Title object.
SectionProfiler $mProfiler
fetchFileNoRegister($title, $options=[])
Helper function for fetchFileAndTitle.
null for the local wiki Added in
There are three types of nodes:
clearTagHooks()
Remove all tag hooks.
const COLON_STATE_TAGSLASH
static makeSelfLinkObj($nt, $html= '', $query= '', $trail= '', $prefix= '')
Make appropriate markup for a link to the current article.
clearState()
Clear Parser state.
interwikiTransclude($title, $action)
Transclude an interwiki link.
pstPass2($text, $user)
Pre-save transform helper function.
guessLegacySectionNameFromWikiText($text)
Same as guessSectionNameFromWikiText(), but produces legacy anchors instead.
wfUrlProtocolsWithoutProtRel()
Like wfUrlProtocols(), but excludes '//' from the protocol list.
Options($x=null)
Accessor/mutator for the ParserOptions object.
it s the revision text itself In either if gzip is the revision text is gzipped $flags
serializeHalfParsedText($text)
Save the parser state required to convert the given half-parsed text to HTML.
replaceLinkHolders(&$text, $options=0)
Replace "<!--LINK-->" link placeholders with actual links, in the buffer. Placeholders created in Link...
doQuotes($text)
Helper function for doAllQuotes()
preprocessToDom($text, $flags=0)
Preprocess some wikitext and return the document tree.
limitationWarn($limitationType, $current= '', $max= '')
Warn the user when a parser limitation is reached. Will warn the user at most once per limitation type...
wfUrlencode($s)
We want some things to be included as literal characters in our title URLs for prettiness, which urlencode encodes by default.
static newFromText($text, $defaultNamespace=NS_MAIN)
Create a new Title from text, such as what one would find in a link.
Represents a title within MediaWiki.
static getRandomString()
Get a random string.
static stripAllTags($text)
Take a fragment of (potentially invalid) HTML and return a version with any tags removed, encoded as plain text.
when a variable name is used in a it is silently declared as a new local masking the global
doBlockLevels($text, $linestart)
#@-
OutputType($x=null)
Accessor/mutator for the output type.
static newFromTitle(LinkTarget $linkTarget, $id=0, $flags=0)
Load either the current, or a specified, revision that's attached to a given link target...
const COLON_STATE_COMMENTDASHDASH
getVariableValue($index, $frame=false)
Return value of a magic variable (like PAGENAME)
recursiveTagParse($text, $frame=false)
Half-parse wikitext to half-parsed HTML.
MagicWordArray $mVariables
static validateTagAttributes($attribs, $element)
Take an array of attribute names and values and normalize or discard illegal values for the given ele...
const COLON_STATE_COMMENTDASH
globals will be eliminated from MediaWiki replaced by an application object which would be passed to constructors Whether that would be an convenient solution remains to be but certainly PHP makes such object oriented programming models easier than they were in previous versions For the time being MediaWiki programmers will have to work in an environment with some global context At the time of globals were initialised on startup by MediaWiki of these were configuration which are documented in DefaultSettings php There is no comprehensive documentation for the remaining however some of the most important ones are listed below They are typically initialised either in index php or in Setup php For a description of the see design txt $wgTitle Title object created from the request URL $wgOut OutputPage object for HTTP response $wgUser User object for the user associated with the current request $wgLang Language object selected by user preferences $wgContLang Language object associated with the wiki being viewed $wgParser Parser object Parser extensions register their hooks here $wgRequest WebRequest object
wfRandomString($length=32)
Get a random string containing a number of pseudo-random hex characters.
preprocess($text, Title $title=null, ParserOptions $options, $revid=null, $frame=false)
Expand templates and variables in the text, producing valid, static wikitext.
static getCacheTTL($id)
Allow external reads of TTL array.
getRevisionId()
Get the ID of the revision we are parsing.
see documentation in includes Linker php for Linker::makeImageLink & $time
maybeDoSubpageLink($target, &$text)
Handle link to subpage if necessary.
If you want to remove the page from your watchlist later
replaceLinkHoldersText($text)
Replace <!--LINK--> link placeholders with plain text of links (not HTML-formatted).
wfDebug($text, $dest= 'all', array $context=[])
Sends a line to the debug log if enabled or, optionally, to a comment in output.
static createAssocArgs($args)
Clean up argument array - refactored in 1.9 so parserfunctions can use it, too.
The index of the header message $result[1]=The index of the body text message $result[2 through n]=Parameters passed to body text message.Please note the header message cannot receive/use parameters. 'ImportHandleLogItemXMLTag':When parsing a XML tag in a log item.Return false to stop further processing of the tag $reader:XMLReader object $logInfo:Array of information 'ImportHandlePageXMLTag':When parsing a XML tag in a page.Return false to stop further processing of the tag $reader:XMLReader object &$pageInfo:Array of information 'ImportHandleRevisionXMLTag':When parsing a XML tag in a page revision.Return false to stop further processing of the tag $reader:XMLReader object $pageInfo:Array of page information $revisionInfo:Array of revision information 'ImportHandleToplevelXMLTag':When parsing a top level XML tag.Return false to stop further processing of the tag $reader:XMLReader object 'ImportHandleUploadXMLTag':When parsing a XML tag in a file upload.Return false to stop further processing of the tag $reader:XMLReader object $revisionInfo:Array of information 'ImportLogInterwikiLink':Hook to change the interwiki link used in log entries and edit summaries for transwiki imports.&$fullInterwikiPrefix:Interwiki prefix, may contain colons.&$pageTitle:String that contains page title. 'ImportSources':Called when reading from the $wgImportSources configuration variable.Can be used to lazy-load the import sources list.&$importSources:The value of $wgImportSources.Modify as necessary.See the comment in DefaultSettings.php for the detail of how to structure this array. 
'InfoAction':When building information to display on the action=info page.$context:IContextSource object &$pageInfo:Array of information 'InitializeArticleMaybeRedirect':MediaWiki check to see if title is a redirect.&$title:Title object for the current page &$request:WebRequest &$ignoreRedirect:boolean to skip redirect check &$target:Title/string of redirect target &$article:Article object 'InternalParseBeforeLinks':during Parser's internalParse method before links but after nowiki/noinclude/includeonly/onlyinclude and other processings.&$parser:Parser object &$text:string containing partially parsed text &$stripState:Parser's internal StripState object 'InternalParseBeforeSanitize':during Parser's internalParse method just before the parser removes unwanted/dangerous HTML tags and after nowiki/noinclude/includeonly/onlyinclude and other processings.Ideal for syntax-extensions after template/parser function execution which respect nowiki and HTML-comments.&$parser:Parser object &$text:string containing partially parsed text &$stripState:Parser's internal StripState object 'InterwikiLoadPrefix':When resolving if a given prefix is an interwiki or not.Return true without providing an interwiki to continue interwiki search.$prefix:interwiki prefix we are looking for.&$iwData:output array describing the interwiki with keys iw_url, iw_local, iw_trans and optionally iw_api and iw_wikiid. 
'InvalidateEmailComplete':Called after a user's email has been invalidated successfully.$user:user(object) whose email is being invalidated 'IRCLineURL':When constructing the URL to use in an IRC notification.Callee may modify $url and $query, URL will be constructed as $url.$query &$url:URL to index.php &$query:Query string $rc:RecentChange object that triggered url generation 'IsFileCacheable':Override the result of Article::isFileCacheable()(if true) &$article:article(object) being checked 'IsTrustedProxy':Override the result of IP::isTrustedProxy() &$ip:IP being check &$result:Change this value to override the result of IP::isTrustedProxy() 'IsUploadAllowedFromUrl':Override the result of UploadFromUrl::isAllowedUrl() $url:URL used to upload from &$allowed:Boolean indicating if uploading is allowed for given URL 'isValidEmailAddr':Override the result of Sanitizer::validateEmail(), for instance to return false if the domain name doesn't match your organization.$addr:The e-mail address entered by the user &$result:Set this and return false to override the internal checks 'isValidPassword':Override the result of User::isValidPassword() $password:The password entered by the user &$result:Set this and return false to override the internal checks $user:User the password is being validated for 'Language::getMessagesFileName':$code:The language code or the language we're looking for a messages file for &$file:The messages file path, you can override this to change the location. 
'LanguageGetMagic':DEPRECATED!Use $magicWords in a file listed in $wgExtensionMessagesFiles instead.Use this to define synonyms of magic words depending of the language &$magicExtensions:associative array of magic words synonyms $lang:language code(string) 'LanguageGetNamespaces':Provide custom ordering for namespaces or remove namespaces.Do not use this hook to add namespaces.Use CanonicalNamespaces for that.&$namespaces:Array of namespaces indexed by their numbers 'LanguageGetSpecialPageAliases':DEPRECATED!Use $specialPageAliases in a file listed in $wgExtensionMessagesFiles instead.Use to define aliases of special pages names depending of the language &$specialPageAliases:associative array of magic words synonyms $lang:language code(string) 'LanguageGetTranslatedLanguageNames':Provide translated language names.&$names:array of language code=> language name $code:language of the preferred translations 'LanguageLinks':Manipulate a page's language links.This is called in various places to allow extensions to define the effective language links for a page.$title:The page's Title.&$links:Associative array mapping language codes to prefixed links of the form"language:title".&$linkFlags:Associative array mapping prefixed links to arrays of flags.Currently unused, but planned to provide support for marking individual language links in the UI, e.g.for featured articles. 'LanguageSelector':Hook to change the language selector available on a page.$out:The output page.$cssClassName:CSS class name of the language selector. 'LinkBegin':Used when generating internal and interwiki links in Linker::link(), before processing starts.Return false to skip default processing and return $ret.See documentation for Linker::link() for details on the expected meanings of parameters.$skin:the Skin object $target:the Title that the link is pointing to &$html:the contents that the< a > tag should have(raw HTML) $result
the value to return A Title object or null for latest to be modified or replaced by the hook handler or if authentication is not possible after cache objects are set for highlighting & $link
static getLocalInstance($ts=false)
Get a timestamp instance in the server local timezone ($wgLocaltimezone)
static getDoubleUnderscoreArray()
Get a MagicWordArray of double-underscore entities.
static splitTrail($trail)
Split a link trail, return the "inside" portion and the remainder of the trail as a two-element array...
getTemplateDom($title)
Get the semi-parsed DOM representation of a template with a given title, and its redirect destination...
static decodeCharReferences($text)
Decode any character references, numeric or named entities, in the text and return a UTF-8 string...
openList($char)
These next three functions open, continue, and close the list element appropriate to the prefix chara...
cleanSig($text, $parsing=false)
Clean up signature text.
wfTimestamp($outputtype=TS_UNIX, $ts=0)
Get a timestamp string in one of various formats.
static factory($mode=false, IContextSource $context=null)
Get a new image gallery.
$wgLanguageCode
Site language code.
Custom PHP profiler for parser/DB type section names that xhprof/xdebug can't handle.
Class for asserting that a callback happens when a dummy object leaves scope.
$wgExtraInterlanguageLinkPrefixes
List of additional interwiki prefixes that should be treated as interlanguage links (i...
startExternalParse(Title $title=null, ParserOptions $options, $outputType, $clearState=true)
Set up some variables which are usually set up in parse() so that an external function can call some ...
wfCgiToArray($query)
This is the logical opposite of wfArrayToCgi(): it accepts a query string as its argument and returns...
wfDebugLog($logGroup, $text, $dest= 'all', array $context=[])
Send a line to a supplementary debug log file, if configured, or main debug log if not...
static capturePath(Title $title, IContextSource $context)
Just like executePath() but will override global variables and execute the page in "inclusion" mode...
addTrackingCategory($msg)
replaceInternalLinks($s)
Process [[ ]] wikilinks.
$wgStylePath
The URL path of the skins directory.
disableCache()
Set a flag in the output object indicating that the content is dynamic and shouldn't be cached...
static normalizeSectionNameWhitespace($section)
Normalizes whitespace in a section name, such as might be returned by Parser::stripSectionName(), for use in the id's that are used for section links.
internalParse($text, $isMain=true, $frame=false)
Helper function for parse() that transforms wiki markup into half-parsed HTML.
static delimiterReplace($startDelim, $endDelim, $replace, $subject, $flags= '')
Perform an operation equivalent to preg_replace() with flags.
__destruct()
Reduce memory usage to reduce the impact of circular references.
wfEscapeWikiText($text)
Escapes the given text so that it may be output using addWikiText() without any linking, formatting, etc.
getRevisionTimestamp()
Get the timestamp associated with the current revision, adjusted for the default server-local timesta...
static stripOuterParagraph($html)
Strip the outer <p></p> paragraph tag from the given HTML.
static singleton()
Get an instance of this class.
design txt This is a brief overview of the new design More thorough and up to date information is available on the documentation wiki at etc Handles the details of getting and saving to the user table of the and dealing with sessions and cookies OutputPage Encapsulates the entire HTML page that will be sent in response to any server request It is used by calling its functions to add in any and then calling but I prefer the flexibility This should also do the output encoding The system allocates a global one in $wgOut Title Represents the title of an and does all the work of translating among various forms such as plain database key
static normalizeSubpageLink($contextTitle, $target, &$text)
parseWidthParam($value)
Parse a width param of an image link, like 300px or 200x300px.
fetchScaryTemplateMaybeFromCache($url)
fetchCurrentRevisionOfTitle($title)
Fetch the current revision of a given title.
stripAltText($caption, $holders)
doAllQuotes($text)
Replace single quotes with HTML markup.
static replaceMarkup($search, $replace, $text)
More or less "markup-safe" str_replace(). Ignores any instances of the separator inside <...
static normalizeUrlComponent($component, $unsafe)
const VERSION
Update this version number when the ParserOutput format changes in an incompatible way...
this hook is for auditing only RecentChangesLinked and Watchlist RecentChangesLinked and Watchlist e g Watchlist removed from all revisions and log entries to which it was applied This gives extensions a chance to take it off their books as the deletion has already been partly carried out by this point or something similar the user will be unable to create the tag set and then return false from the hook function Ensure you consume the ChangeTagAfterDelete hook to carry out custom deletion actions as context called by AbstractContent::getParserOutput May be used to override the normal model specific rendering of page content as context as context $options
setHook($tag, $callback)
Create an HTML-style tag, e.g.
Preprocessor $mPreprocessor
getPreprocessor()
Get a preprocessor object.
This document is intended to provide useful advice for parties seeking to redistribute MediaWiki to end users It s targeted particularly at maintainers for Linux since it s been observed that distribution packages of MediaWiki often break We ve consistently had to recommend that users seeking support use official tarballs instead of their distribution s and this often solves whatever problem the user is having It would be nice if this could such and we might be restricted by PHP settings such as safe mode or open_basedir We cannot assume that the software even has read access anywhere useful Many shared hosts run all users web applications under the same so they can t rely on Unix and must forbid reads to even standard directories like tmp lest users read each others files We cannot assume that the user has the ability to install or run any programs not written as web accessible PHP scripts Since anything that works on cheap shared hosting will work if you have shell or root access MediaWiki s design is based around catering to the lowest common denominator Although we support higher end setups as the way many things work by default is tailored toward shared hosting These defaults are unconventional from the point of view of normal(non-web) applications--they might conflict with distributors'policies
static getInstance($ts=false)
Get a timestamp instance in GMT.
static singleton()
Get a RepoGroup instance.
replaceVariables($text, $frame=false, $argsOnly=false)
Replace magic variables, templates, and template arguments with the appropriate text.
wfMatchesDomainList($url, $domains)
Check whether a given URL has a domain that occurs in a given set of domains.
getUser()
Get a User object either from $this->mUser, if set, or from the ParserOptions object otherwise...
wfTimestampNow()
Convenience function; returns MediaWiki timestamp for the present time.
incrementIncludeSize($type, $size)
Increment an include size counter.
getStripList()
Get a list of strippable XML-like elements.
null means default in associative array with keys and values unescaped Should be merged with default with a value of false meaning to suppress the attribute in associative array with keys and values unescaped noclasses just before the function returns a value If you return an< a > element with HTML attributes $attribs and contents $html will be returned If you return $ret will be returned and may include noclasses after processing after in associative array form externallinks including delete and has completed for all link tables whether this was an auto creation default is conds Array Extra conditions for the No matching items in log is displayed if loglist is empty msgKey Array If you want a nice box with a set this to the key of the message First element is the message additional optional elements are parameters for the key that are processed with wfMessage() -> params() ->parseAsBlock()-offset Set to overwrite offset parameter in $wgRequest set to ''to unsetoffset-wrap String Wrap the message in html(usually something like"<
startParse(Title $title=null, ParserOptions $options, $outputType, $clearState=true)
static makeHeadline($level, $attribs, $anchor, $html, $link, $legacyAnchor=false)
Create a headline for content.
static extractTagsAndParams($elements, $text, &$matches, $uniq_prefix=null)
Replaces all occurrences of HTML-style comments and the given tags in the text with a random marker a...
and(b) You must cause any modified files to carry prominent notices stating that You changed the files
doTableStuff($text)
Parse the wiki syntax used to render tables.
wfDeprecated($function, $version=false, $component=false, $callerOffset=2)
Throws a warning that $function is deprecated.
getRevisionSize()
Get the size of the revision.
LinkHolderArray $mLinkHolders
deferred txt A few of the database updates required by various functions here can be deferred until after the result page is displayed to the user For updating the view updating the linked to tables after a save
Some information about database access in MediaWiki By Tim January Database layout For information about the MediaWiki database such as a description of the tables and their please see
closeParagraph()
#@+ Used by doBlockLevels()
preSaveTransform($text, Title $title, User $user, ParserOptions $options, $clearState=true)
Transform wiki markup when saving a page by doing "\\r\\n" -> "\\n" conversion, substituting signatur...
getTargetLanguage()
Get the target language for the content being parsed.
namespace and then decline to actually register it file or subcat img or subcat $title
static hasSubpages($index)
Does the namespace allow subpages?
formatHeadings($text, $origText, $isMain=true)
This function accomplishes several tasks: 1) Auto-number headings if that option is enabled 2) Add an...
getConverterLanguage()
Get the language object for language conversion.
static tocUnindent($level)
Finish one or more sublevels on the Table of Contents.
nextItem($char)
TODO: document.
static run($event, array $args=[], $deprecatedVersion=null)
Call hook functions defined in Hooks::register and $wgHooks.
static tocLine($anchor, $tocline, $tocnumber, $level, $sectionIndex=false)
parameter level defines if we are on an indentation level
design txt This is a brief overview of the new design More thorough and up to date information is available on the documentation wiki at etc Handles the details of getting and saving to the user table of the and dealing with sessions and cookies OutputPage Encapsulates the entire HTML page that will be sent in response to any server request It is used by calling its functions to add text
getExternalLinkAttribs($url=false)
Get an associative array of additional HTML attributes appropriate for a particular external link...
magicword txt Magic Words are some phrases used in the wikitext They are used for two things
this hook is for auditing only RecentChangesLinked and Watchlist RecentChangesLinked and Watchlist e g Watchlist removed from all revisions and log entries to which it was applied This gives extensions a chance to take it off their books $tag
getUserSig(&$user, $nickname=false, $fancySig=null)
Fetch the user's signature text, if any, and normalize to validated, ready-to-insert wikitext...
const HALF_PARSED_VERSION
Update this version number when the output of serialiseHalfParsedText() changes in an incompatible wa...
firstCallInit()
Do various kinds of initialisation on the first call of the parser.
Handles a simple LRU key/value map with a maximum number of entries.
static makeImageLink(Parser $parser, Title $title, $file, $frameParams=[], $handlerParams=[], $time=false, $query="", $widthOption=null)
Given parameters derived from [[Image:Foo|options...]], generate the HTML that that syntax inserts in...
null means default in associative array with keys and values unescaped Should be merged with default with a value of false meaning to suppress the attribute in associative array with keys and values unescaped broken
armorLinks($text)
Insert a NOPARSE hacky thing into any inline links in a chunk that's going to go through further pars...
presenting them properly to the user as errors is done by the caller return true use this to change the list i e etc $rev
static splitWhitespace($s)
Return a three-element array: leading whitespace, string contents, trailing whitespace.
This document is intended to provide useful advice for parties seeking to redistribute MediaWiki to end users It s targeted particularly at maintainers for Linux since it s been observed that distribution packages of MediaWiki often break We ve consistently had to recommend that users seeking support use official tarballs instead of their distribution s and this often solves whatever problem the user is having It would be nice if this could such as
setOutputType($ot)
Set the output type.
Class for handling an array of magic words.
static & get($id)
Factory: creates an object representing an ID.
static getModuleStyles()
Get CSS modules needed if HTML from the current driver is to be displayed.
enableOOUI()
Sets up the PHP implementation of OOUI for use in this request and instructs OutputPage to enable OO...
please add to it if you re going to add events to the MediaWiki code where normally authentication against an external auth plugin would be creating a local account $user
fetchTemplate($title)
Fetch the unparsed text of a template and register a reference to it.
maybeMakeExternalImage($url)
Make an image if it's allowed, either through the global option, through the exception, or through the on-wiki whitelist.
areSubpagesAllowed()
Return true if subpage links should be expanded on this page.
static escapeId($id, $options=[])
Given a value, escape it so that it can be used in an id attribute and return it. ...
this hook is for auditing only RecentChangesLinked and Watchlist RecentChangesLinked and Watchlist e g Watchlist removed from all revisions and log entries to which it was applied This gives extensions a chance to take it off their books as the deletion has already been partly carried out by this point or something similar the user will be unable to create the tag set and then return false from the hook function Ensure you consume the ChangeTagAfterDelete hook to carry out custom deletion actions as context called by AbstractContent::getParserOutput May be used to override the normal model specific rendering of page content as context as context the output can only depend on parameters provided to this hook not on global state indicating whether full HTML should be generated If generation of HTML may be but other information should still be present in the ParserOutput object & $output
static getSubstIDs()
Get an array of parser substitution modifier IDs.
const TS_MW
MediaWiki concatenated string timestamp (YYYYMMDDHHMMSS)
transformMsg($text, $options, $title=null)
Wrapper for preprocess()
static newFromId($id, $flags=0)
Load a page revision from a given revision ID number.
wfUrlProtocols($includeProtocolRelative=true)
Returns a regular expression of url protocols.
static makeExternalLink($url, $text, $escape=true, $linktype= '', $attribs=[], $title=null)
Make an external link.
__clone()
Allow extensions to clean up when the parser is cloned.
static getExternalLinkRel($url=false, $title=null)
Get the rel attribute for a particular external link.
injection txt This is an overview of how MediaWiki makes use of dependency injection The design described here grew from the discussion of RFC T384 The term dependency this means that anything an object needs to operate should be injected from the the object itself should only know narrow no concrete implementation of the logic it relies on The requirement to inject everything typically results in an architecture that based on two main types of and essentially stateless service objects that use other service objects to operate on the value objects As of the beginning MediaWiki is only starting to use the DI approach Much of the code still relies on global state or direct resulting in a highly cyclical dependency which acts as the top level factory for services in MediaWiki which can be used to gain access to default instances of various services MediaWikiServices however also allows new services to be defined and default services to be redefined Services are defined or redefined by providing a callback the instantiator that will return a new instance of the service When it will create an instance of MediaWikiServices and populate it with the services defined in the files listed by thereby bootstrapping the DI framework Per $wgServiceWiringFiles lists includes ServiceWiring php
wfSetVar(&$dest, $source, $force=false)
Sets dest to source and returns the original value of dest. If source is NULL, it just returns the val...
this hook is for auditing only $req
this hook is for auditing only or null if authentication failed before getting that far $username
presenting them properly to the user as errors is done by the caller return true use this to change the list i e etc next in line in page history
array $mLangLinkLanguages
Array with the language name of each language link (i.e.
replaceTransparentTags($text)
Replace transparent tags in $text with the values given by the callbacks.
This document describes the state of Postgres support in and is fairly well maintained The main code is very well while extensions are very hit and miss it is probably the most supported database after MySQL Much of the work in making MediaWiki database agnostic came about through the work of creating Postgres as and are nearing end of but without copying over all the usage comments General notes on the but these can almost always be programmed around *Although Postgres has a true BOOLEAN type
replaceSection($oldText, $sectionId, $newText)
This function returns $oldtext after the content of the section specified by $section has been replac...
getLinkURL($query= '', $query2=false, $proto=PROTO_RELATIVE)
Get a URL that's the simplest URL that will be valid to link, locally, to the current Title...
doDoubleUnderscore($text)
Strip double-underscore items like NOGALLERY and NOTOC. Fills $this->mDoubleUnderscores, returns the modified text.
testPreprocess($text, Title $title, ParserOptions $options)
deferred txt A few of the database updates required by various functions here can be deferred until after the result page is displayed to the user For updating the view updating the linked to tables after a etc PHP does not yet have any way to tell the server to actually return and disconnect while still running these but it might have such a feature in the future We handle these by creating a deferred update object and putting those objects on a global then executing the whole list after the page is displayed We don t do anything smart like collating updates to the same table or such because the list is almost always going to have just one item on if so it s not worth the trouble Since there is a job queue in the jobs table
MagicWordArray $mSubstWords
static normalizeCharReferences($text)
Ensure that any entities and character references are legal for XML and XHTML specifically.
callParserFunction($frame, $function, array $args=[])
Call a parser function and return an array with text and flags.
$wgScriptPath
The path we should point to.
Variant of the Message class.
getFreshParser()
Return this parser if it is not doing anything, otherwise get a fresh parser.
design txt This is a brief overview of the new design More thorough and up to date information is available on the documentation wiki at etc Handles the details of getting and saving to the user table of the and dealing with sessions and cookies OutputPage Encapsulates the entire HTML page that will be sent in response to any server request It is used by calling its functions to add in any and then calling but I prefer the flexibility This should also do the output encoding The system allocates a global one in $wgOut Title Represents the title of an and does all the work of translating among various forms such as plain database etc For and for historical it also represents a few features of articles that don t involve their such as access rights See also title txt Article Encapsulates access to the page table of the database The object represents a an and maintains state such as etc Revision Encapsulates individual page revision data and access to the revision text blobs storage system Higher level code should never touch text storage directly
this hook is for auditing only RecentChangesLinked and Watchlist RecentChangesLinked and Watchlist e g Watchlist removed from all revisions and log entries to which it was applied This gives extensions a chance to take it off their books as the deletion has already been partly carried out by this point or something similar the user will be unable to create the tag set and then return false from the hook function Ensure you consume the ChangeTagAfterDelete hook to carry out custom deletion actions as context called by AbstractContent::getParserOutput May be used to override the normal model specific rendering of page content $content
const COLON_STATE_TAGSTART
lock()
Lock the current instance of the parser.
const COLON_STATE_COMMENT
static statelessFetchTemplate($title, $parser=false)
Static function to get a template. Can be overridden via ParserOptions::setTemplateCallback().
I won t presume to tell you how to I m just describing the methods I chose to use for myself If you do choose to follow these it will probably be easier for you to collaborate with others on the but if you want to contribute without by all means do which work well I also use K &R brace matching style I know that s a religious issue for so if you want to use a style that puts opening braces on the next line
setFunctionHook($id, $callback, $flags=0)
Create a function, e.g.
static setupOOUI($skinName= '', $dir= 'ltr')
Helper function to setup the PHP implementation of OOUI to use in this request.
static makeMediaLinkFile(Title $title, $file, $html= '')
Create a direct link to a given uploaded file.
usually copyright or history_copyright This message must be in HTML not wikitext if the section is included from a template to be included in the link
this hook is for auditing only RecentChangesLinked and Watchlist RecentChangesLinked and Watchlist e g Watchlist removed from all revisions and log entries to which it was applied This gives extensions a chance to take it off their books as the deletion has already been partly carried out by this point or something similar the user will be unable to create the tag set and then return false from the hook function Ensure you consume the ChangeTagAfterDelete hook to carry out custom deletion actions as context called by AbstractContent::getParserOutput May be used to override the normal model specific rendering of page content as context as context the output can only depend on parameters provided to this hook not on global state indicating whether full HTML should be generated If generation of HTML may be but other information should still be present in the ParserOutput object to manipulate or replace but no entry for that model exists in $wgContentHandlers if desired whether it is OK to use $contentModel on $title Handler functions that modify $ok should generally return false to prevent further hooks from further modifying $ok inclusive $limit
getTitle()
Accessor for the Title object.
this class mediates it Skin Encapsulates a look and feel for the wiki All of the functions that render HTML and make choices about how to render it are here and are called from various other places when and is meant to be subclassed with other skins that may override some of its functions The User object contains a reference to a and so rather than having a global skin object we just rely on the global User and get the skin with $wgUser and also has some character encoding functions and other locale stuff The current user interface language is instantiated as and the local content language as $wgContLang
extractSections($text, $sectionId, $mode, $newText= '')
Break wikitext input into sections, and either pull or replace some particular section's text...
getOutput()
Get the ParserOutput object.
$wgExperimentalHtmlIds
Should we allow a broader set of characters in id attributes, per HTML5? If not, use only HTML 4-comp...
static statelessFetchRevision($title, $parser=false)
Wrapper around Revision::newFromTitle to allow passing additional parameters without passing them on ...
doMagicLinks($text)
Replace special strings like "ISBN xxx" and "RFC xxx" with magic external links.
Apache License January AND DISTRIBUTION Definitions License shall mean the terms and conditions for and distribution as defined by Sections through of this document Licensor shall mean the copyright owner or entity authorized by the copyright owner that is granting the License Legal Entity shall mean the union of the acting entity and all other entities that control are controlled by or are under common control with that entity For the purposes of this definition control direct or to cause the direction or management of such whether by contract or including but not limited to software source documentation and configuration files Object form shall mean any form resulting from mechanical transformation or translation of a Source including but not limited to compiled object generated and conversions to other media types Work shall mean the work of whether in Source or Object made available under the as indicated by a copyright notice that is included in or attached to the whether in Source or Object that is based or other modifications as a an original work of authorship For the purposes of this Derivative Works shall not include works that remain separable or merely the Work and Derivative Works thereof Contribution shall mean any work of including the original version of the Work and any modifications or additions to that Work or Derivative Works that is intentionally submitted to Licensor for inclusion in the Work by the copyright owner or by an individual or Legal Entity authorized to submit on behalf of the copyright owner For the purposes of this submitted means any form of or written communication sent to the Licensor or its including but not limited to communication on electronic mailing source code control and issue tracking systems that are managed or on behalf the Licensor for the purpose of discussing and improving the but excluding communication that is conspicuously marked or otherwise designated in writing by the copyright owner as Not a Contribution 
Contributor shall mean Licensor and any individual or Legal Entity on behalf of whom a Contribution has been received by Licensor and subsequently incorporated within the Work Grant of Copyright License Subject to the terms and conditions of this each Contributor hereby grants to You a non no royalty irrevocable copyright license to prepare Derivative Works publicly display
getCommon($st1, $st2)
getCommon() returns the length of the longest common substring of both arguments, starting at the beg...
!html< table >< tr >< td > broken</td ></tr ></table >!end!test Table cell attributes
this hook is for auditing only RecentChangesLinked and Watchlist RecentChangesLinked and Watchlist e g Watchlist removed from all revisions and log entries to which it was applied This gives extensions a chance to take it off their books as the deletion has already been partly carried out by this point or something similar the user will be unable to create the tag set $status
static cleanSigInSig($text)
Strip 3, 4 or 5 tildes out of signatures.
setDefaultSort($sort)
Mutator for $mDefaultSort.
fetchFile($title, $options=[])
Fetch a file and its title and register a reference to it.
static fixTagAttributes($text, $element)
Take a tag soup fragment listing an HTML element's attributes and normalize it to well-formed XML...
static tocIndent()
Add another level to the Table of Contents.
static legalChars()
Get a regex character class describing the legal characters in a link.
design txt This is a brief overview of the new design More thorough and up to date information is available on the documentation wiki at etc Handles the details of getting and saving to the user table of the and dealing with sessions and cookies OutputPage Encapsulates the entire HTML page that will be sent in response to any server request It is used by calling its functions to add in any and then calling output() to send it all. It could be easily changed to send incrementally if that becomes useful
$wgServer
URL of the server.
We've cleaned up the code here by removing clumps of infrequently used code and moving them off somewhere else It's much easier for someone working with this code to see what's _really_ going on
incrementExpensiveFunctionCount()
Increment the expensive function count.
getDisableTitleConversion()
static normalizeLinkUrl($url)
Replace unusual escape codes in a URL with their equivalent characters.
static removeHTMLtags($text, $processCallback=null, $args=[], $extratags=[], $removetags=[])
Cleans up HTML, removes dangerous tags and attributes, and removes HTML comments. ...
insertStripItem($text)
Add an item to the strip state. Returns the unique tag which must be inserted into the stripped text T...
testPst($text, Title $title, ParserOptions $options)
static factory($url, $options=null, $caller=__METHOD__)
Generate a new request object.
const TS_UNIX
Unix time - the number of seconds since 1970-01-01 00:00:00 UTC.
if(!$wgRequest->checkUrlExtension()) if(!$wgEnableAPI) $wgTitle
static explode($separator, $subject)
Workalike for explode() with limited memory usage.
parse($text, Title $title, ParserOptions $options, $linestart=true, $clearState=true, $revid=null)
Convert wikitext to HTML. Do not call this function recursively.
this hook is for auditing only or null if authentication failed before getting that far or null if we can t even determine that probably a stub it is not rendered in wiki pages or galleries in category pages allow injecting custom HTML after the section Any uses of the hook need to handle escaping see BaseTemplate::getToolbox and BaseTemplate::makeListItem for details on the format of individual items inside of this array or by returning and letting standard HTTP rendering take place modifiable or by returning false and taking over the output modifiable modifiable after all normalizations have been except for the $wgMaxImageArea check set to true or false to override the $wgMaxImageArea check result gives extension the possibility to transform it themselves $handler
static numberingroup($group)
Find the number of users in a given user group.
== Architecture == Two class hierarchies are used to provide the functionality associated with the different content models: * Content interface (and AbstractContent base class) define functionality that acts on the concrete content of a page, and * ContentHandler base class provides functionality specific to a content model, but not acting on concrete content. The most important function of ContentHandler is to act as a factory for the appropriate implementation of Content. These Content objects are to be used by MediaWiki everywhere, instead of passing page content around as text. All manipulation and analysis of page content must be done via the appropriate methods of the Content object. For each content model, a subclass of ContentHandler has to be registered with $wgContentHandlers. The ContentHandler object for a given content model can be obtained using ContentHandler::getForModelID($id). Also Title, WikiPage and Revision now have getContentHandler() methods for convenience. ContentHandler objects are singletons that provide functionality specific to the content type, but not directly acting on the content of some page. ContentHandler::makeEmptyContent() and ContentHandler::unserializeContent() can be used to create a Content object of the appropriate type. However, it is recommended to instead use WikiPage::getContent() resp. Revision::getContent() to get a page's content as a Content object. These two methods should be the ONLY way in which page content is accessed. Another important function of ContentHandler objects is to define custom action handlers for a content model, see ContentHandler::getActionOverrides(). This is similar to what WikiPage::getActionOverrides() was already doing. == Serialization == With the ContentHandler facility, page content no longer has to be text based. Objects implementing the Content interface are used to represent and handle the content internally. For storage and data exchange, each content model supports at least one serialization format via 
ContentHandler::serializeContent($content). The list of supported formats for a given content model can be accessed using ContentHandler::getSupportedFormats(). Content serialization formats are identified using MIME type like strings. The following formats are built in: * text/x-wiki - wikitext * text/javascript - for js pages * text/css - for css pages * text/plain - for future use, e.g. with plain text messages. * text/html - for future use, e.g. with plain html messages. * application/vnd.php.serialized - for future use with the api and for extensions * application/json - for future use with the api, and for use by extensions * application/xml - for future use with the api, and for use by extensions In PHP, use the corresponding CONTENT_FORMAT_XXX constant. Note that when using the API to access page content, especially action=edit, action=parse and action=query&prop=revisions, the model and format of the content should always be handled explicitly. Without that information, interpretation of the provided content is not reliable. The same applies to XML dumps generated via maintenance/dumpBackup.php or Special:Export. Also note that the API will provide encapsulated, serialized content - so if the API was called with format=json, and contentformat is also json (or rather, application/json), the page content is represented as a string containing an escaped json structure. Extensions that use JSON to serialize some types of page content may provide specialized API modules that allow access to that content in a more natural form. == Compatibility == The ContentHandler facility is introduced in a way that should allow all existing code to keep functioning at least for pages that contain wikitext or other text based content. However, a number of functions and hooks have been deprecated in favor of new versions that are aware of the page's content model, and will now generate warnings when used. Most importantly, the following functions have been deprecated: * Revisions::getText() is deprecated in favor of 
Revisions::getContent() * WikiPage::getText() is deprecated in favor of WikiPage::getContent() Also, the old Article::getContent() (which returns text) is superseded by Article::getContentObject(). However, both methods should be avoided since they do not provide clean access to the page's actual content. For instance, they may return a system message for non-existing pages. Use WikiPage::getContent() instead. Code that relies on a textual representation of the page content should eventually be rewritten. However, ContentHandler::getContentText() provides a stop-gap that can be used to get text for a page. Its behavior is controlled by $wgContentHandlerTextFallback it
static getVersion($flags= '', $lang=null)
Return a string of the MediaWiki version with Git revision if available.
braceSubstitution($piece, $frame)
Return the text of a template, after recursively replacing any variables or templates within the temp...
setUser($user)
Set the current user.
makeImage($title, $options, $holders=false)
Parse image options text and use it to make an image.
attributeStripCallback(&$text, $frame=false)
Callback from the Sanitizer for expanding items found in HTML attribute values, so they can be safely...
static cascadingsources($parser, $title= '')
Returns the sources of any cascading protection acting on a specified page.
getCustomDefaultSort()
Accessor for $mDefaultSort. Unlike getDefaultSort(), will return false if none is set.
extensionSubstitution($params, $frame)
Return the text to be used for a given extension tag.
static makeExternalImage($url, $alt= '')
Return the code for images which were added via external links, via Parser::maybeMakeExternalImage()...
recursiveTagParseFully($text, $frame=false)
Fully parse wikitext to fully parsed HTML.
setTransparentTagHook($tag, $callback)
As setHook(), but letting the contents be parsed.
static element($element, $attribs=[], $contents= '')
Identical to rawElement(), but HTML-escapes $contents (like Xml::element()).
wfFindFile($title, $options=[])
Find a file.
do that in ParserLimitReportFormat instead use this to modify the parameters of the image and a DIV can begin in one section and end in another Make sure your code can handle that case gracefully See the EditSectionClearerLink extension for an example zero but section is usually empty its values are the globals values before the output is cached one of or reset my talk page
unserializeHalfParsedText($data)
Load the parser state given in the $data array, which is assumed to have been generated by serializeH...
do that in ParserLimitReportFormat instead use this to modify the parameters of the image and a DIV can begin in one section and end in another Make sure your code can handle that case gracefully See the EditSectionClearerLink extension for an example zero but section is usually empty its values are the globals values before the output is cached one of or reset my talk my contributions etc etc otherwise the built in rate limiting checks are if enabled allows for interception of redirect as a string mapping parameter names to values & $type
guessSectionNameFromWikiText($text)
Try to guess the section anchor name based on a wikitext fragment presumably extracted from a heading...
static & makeTitle($ns, $title, $fragment= '', $interwiki= '')
Create a new Title from a namespace index and a DB key.
$wgServerName
Server name.
internalParseHalfParsed($text, $isMain=true, $linestart=true)
Helper function for parse() that transforms half-parsed HTML into fully parsed HTML.
if the prop value should be in the metadata multi language array format
null means default in associative array with keys and values unescaped Should be merged with default with a value of false meaning to suppress the attribute in associative array with keys and values unescaped noclasses just before the function returns a value If you return an< a > element with HTML attributes $attribs and contents $html will be returned If you return $ret will be returned and may include noclasses after processing & $attribs
controlled by $wgMainCacheType controlled by $wgParserCacheType controlled by $wgMessageCacheType If you set CACHE_NONE to one of the three control variable
getOptions()
Get the ParserOptions object.
makeKnownLinkHolder($nt, $text= '', $query=[], $trail= '', $prefix= '')
Render a forced-blue link inline; protect against double expansion of URLs if we're in a mode that pr...
getDefaultSort()
Accessor for $mDefaultSort. Will use the empty string if none is set.
For a write use something like
makeFreeExternalLink($url, $numPostProto)
Make a free external link, given a user-supplied URL.
const COLON_STATE_CLOSETAG
Allows to change the fields on the form that will be generated $name