Code Coverage for /workspace/src/extensions/LabeledSectionTransclusion/includes/LabeledSectionTransclusion.php

	Code Coverage
	Lines			Functions and Methods				Classes and Traits
Total	0.00% covered (danger)	0.00%	0 / 203	0.00% covered (danger)	0.00%	0 / 12	CRAP	0.00% covered (danger)	0.00%	0 / 1
LabeledSectionTransclusion	0.00% covered (danger)	0.00%	0 / 203	0.00% covered (danger)	0.00%	0 / 12	4830	0.00% covered (danger)	0.00%	0 / 1
open	0.00% covered (danger)	0.00%	0 / 7	0.00% covered (danger)	0.00%	0 / 1	12
parse	0.00% covered (danger)	0.00%	0 / 6	0.00% covered (danger)	0.00%	0 / 1	6
noop	0.00% covered (danger)	0.00%	0 / 2	0.00% covered (danger)	0.00%	0 / 1	2
getAttrPattern	0.00% covered (danger)	0.00%	0 / 8	0.00% covered (danger)	0.00%	0 / 1	6
countHeadings	0.00% covered (danger)	0.00%	0 / 10	0.00% covered (danger)	0.00%	0 / 1	12
getTemplateText	0.00% covered (danger)	0.00%	0 / 9	0.00% covered (danger)	0.00%	0 / 1	20
setupPfunc12	0.00% covered (danger)	0.00%	0 / 40	0.00% covered (danger)	0.00%	0 / 1	110
isSection	0.00% covered (danger)	0.00%	0 / 6	0.00% covered (danger)	0.00%	0 / 1	12
expandSectionNode	0.00% covered (danger)	0.00%	0 / 3	0.00% covered (danger)	0.00%	0 / 1	6
pfuncIncludeObj	0.00% covered (danger)	0.00%	0 / 48	0.00% covered (danger)	0.00%	0 / 1	306
pfuncExcludeObj	0.00% covered (danger)	0.00%	0 / 35	0.00% covered (danger)	0.00%	0 / 1	182
pfuncIncludeHeading	0.00% covered (danger)	0.00%	0 / 29	0.00% covered (danger)	0.00%	0 / 1	90

1	<?php
2
3	namespace MediaWiki\Extension\LabeledSectionTransclusion;
4
5	use MediaWiki\Parser\Parser;
6	use MediaWiki\Parser\PPFrame;
7	use MediaWiki\Parser\PPNode;
8	use MediaWiki\Title\Title;
9
10	class LabeledSectionTransclusion {
11
12	/*
13	* To do transclusion from an extension, we need to interact with the parser
14	* at a low level. This is the general transclusion functionality
15	*/
16
/**
 * Record a transclusion key on the parser so that a second request for the
 * same key can be recognised as a loop.
 *
 * The keys are kept in the parser's mTemplatePath array, which is created
 * here when it is not set yet.
 *
 * @param Parser $parser
 * @param string $part1 Key identifying the transclusion being opened
 * @return bool True if the key was newly registered, false if it was already present
 */
private static function open( $parser, $part1 ) {
	// This property on Parser has been deprecated: T360573
	if ( !isset( $parser->mTemplatePath ) ) {
		$parser->mTemplatePath = [];
	}

	// Infinite loop test: a key that is already registered means we have
	// been asked to transclude the same thing again.
	$alreadyOpen = isset( $parser->mTemplatePath[$part1] );
	if ( $alreadyOpen ) {
		wfDebug( __METHOD__ . ": template loop broken at '$part1'\n" );
		return false;
	}

	$parser->mTemplatePath[$part1] = 1;
	return true;
}
38
/**
 * Wrap transcluded wikitext in the return structure expected from a parser
 * function, breaking cycles along the way.
 *
 * Any literal "</section>" is stripped from the text first. If the cycle
 * key is already registered (see open()), a link to the target page plus an
 * HTML warning comment is returned instead of the text.
 *
 * @param Parser $parser
 * @param Title $title of target page
 * @param string $text
 * @param string $part1 Key for cycle detection
 * @param int $skiphead Number of source string headers to skip for numbering
 * @return mixed string or magic array of bits
 * @todo handle mixed-case </section>
 */
private static function parse( $parser, $title, $text, $part1, $skiphead = 0 ) {
	// if someone tries something like<section begin=blah>lst only</section>
	// text, may as well do the right thing.
	$text = str_replace( '</section>', '', $text );

	if ( !self::open( $parser, $part1 ) ) {
		$link = "[[" . $title->getPrefixedText() . "]]";
		return $link . "<!-- WARNING: LST loop detected -->";
	}

	// Try to get edit sections correct by munging around the parser's guts.
	return [
		$text,
		'title' => $title,
		'replaceHeadings' => true,
		'headingOffset' => $skiphead,
		'noparse' => false,
		'noargs' => false,
	];
}
64
65	/*
66	* And now, the labeled section transclusion
67	*/
68
/**
 * Parser tag hook for <section>.
 *
 * Section markers are not paired and carry no output of their own, so the
 * hook ignores all of its arguments and renders nothing.
 *
 * @param string $in Tag content (unused)
 * @param array $assocArgs Tag attributes (unused)
 * @param Parser|null $parser (unused)
 * @return string HTML output, always the empty string
 */
public static function noop( $in, $assocArgs = [], $parser = null ) {
	$html = '';
	return $html;
}
81
/**
 * Generate a regex fragment matching the attribute portion of a section tag.
 *
 * The fragment accepts the canonical attribute name ($type) and, when
 * Hooks::getLocalName() provides one, its localised alias, matched
 * case-insensitively. Whitespace around "=" is optional and the section
 * name may be unquoted or wrapped in matching single or double quotes.
 * The fragment has no delimiters or anchors; callers add those.
 *
 * @param string $sec Name of the target section
 * @param string $type Either "begin" or "end" depending on the type of section tag to be matched
 * @param string $lang
 * @return string
 */
private static function getAttrPattern( $sec, $type, $lang ) {
	$sec = preg_quote( $sec, '/' );
	// Similar to $ws = "\s*", but special for attributes: it also swallows
	// any other attributes that precede or follow the one we look for.
	$ws = "(?:\s+[^>]*)?";
	$attrs = [ $type ];
	$localName = Hooks::getLocalName( $type, $lang );
	if ( $localName !== null ) {
		$attrs[] = $localName;
	}
	// Join with a bare "|" so the names are regex alternatives; an escaped
	// pipe would only match a literal "|" character.
	$attrName = '(?i:' . implode( '|', $attrs ) . ')';
	// \s*=\s* lets both "begin=foo" and "begin = foo" match.
	return "$ws\s+$attrName\s*=\s*([\"']?)$sec\\1$ws";
}
101
/**
 * Count the wikitext headings that end at or before a given offset.
 *
 * Count skipped headings, so parser (as of r18218) can skip them, to
 * prevent wrong heading links (see bug 6563).
 *
 * @param string $text
 * @param int $limit Cutoff point in the text to stop searching
 * @return int Number of matches
 */
private static function countHeadings( $text, $limit ) {
	// The empty trailing group exists only so that PREG_OFFSET_CAPTURE
	// reports the offset at which the heading match ended.
	$pat = '^(={1,6}).+\1\s*$()';
	$regex = "/$pat/im";

	$headings = 0;
	$pos = 0;
	$match = [];
	while ( true ) {
		if ( !preg_match( $regex, $text, $match, PREG_OFFSET_CAPTURE, $pos ) ) {
			break;
		}

		$matchEnd = $match[2][1];
		if ( $matchEnd > $limit ) {
			break;
		}

		$headings++;
		// Resume the search where this heading ended.
		$pos = $matchEnd;
	}

	return $headings;
}
129
/**
 * Fetches content of target page if valid and found, otherwise
 * produces wikitext of a link to the target page.
 *
 * Note that an unparsable or interwiki title is not reported as "not
 * found": $text is set to the empty string and true is returned. In the
 * unparsable case $title is left as null.
 *
 * @param Parser $parser
 * @param string $page title text of target page
 * @param Title|null &$title normalized title object
 * @param string &$text wikitext output
 * @return bool true if returning text, false if target not found
 */
private static function getTemplateText( $parser, $page, &$title, &$text ) {
	$title = Title::newFromText( $page );

	if ( $title === null || $title->isExternal() ) {
		$text = '';
		return true;
	}

	[ $text, $title ] = $parser->fetchTemplateAndTitle( $title );

	// if article doesn't exist, return a red link.
	if ( $text === false ) {
		$text = "[[" . $title->getPrefixedText() . "]]";
		return false;
	}

	return true;
}
158
/**
 * Shared argument handling for the #lst and #lstx parser functions.
 *
 * The first argument is the target page; the following ones are the begin
 * section name, (for 'lstx' only) the replacement text, and the end section
 * name, which defaults to the begin name.
 *
 * A string is returned when the call can be answered right away:
 *  - '' (and the invalid-section tracking category is added) when there are
 *    no arguments or the title is invalid or interwiki;
 *  - an error span when the frame's loop check fails;
 *  - a wikitext link when the target page has no template DOM;
 *  - the fully expanded page when no section name was given.
 * Otherwise an array with the keys 'root', 'newFrame', 'repl',
 * 'beginRegex', 'begin' and 'endRegex' is returned for the caller to walk.
 *
 * @param Parser $parser
 * @param PPFrame $frame
 * @param array $args
 * @param string $func Either 'lst' or 'lstx'
 * @return array|string
 */
private static function setupPfunc12( $parser, $frame, $args, $func = 'lst' ) {
	if ( !count( $args ) ) {
		$parser->addTrackingCategory( "lst-invalid-section-category" );
		return '';
	}

	$title = Title::newFromText( trim( $frame->expand( array_shift( $args ) ) ) );
	if ( !$title || $title->isExternal() ) {
		$parser->addTrackingCategory( "lst-invalid-section-category" );
		return '';
	}
	if ( !$frame->loopCheck( $title ) ) {
		return '<span class="error">'
			. wfMessage( 'parser-template-loop-warning', $title->getPrefixedText() )
				->inContentLanguage()->text()
			. '</span>';
	}

	[ $root, $finalTitle ] = $parser->getTemplateDom( $title );

	// if article doesn't exist, return a red link.
	if ( $root === false ) {
		return "[[" . $title->getPrefixedText() . "]]";
	}

	$newFrame = $frame->newChild( false, $finalTitle );
	// No section requested: transclude the whole page.
	if ( !count( $args ) ) {
		return $newFrame->expand( $root );
	}

	$begin = trim( $frame->expand( array_shift( $args ) ) );

	// Only #lstx takes a replacement text, as its third argument.
	$repl = null;
	if ( $func == 'lstx' ) {
		if ( !count( $args ) ) {
			$repl = '';
		} else {
			$repl = trim( $frame->expand( array_shift( $args ) ) );
		}
	}

	// Without an explicit end name the section ends at its own name.
	if ( !count( $args ) ) {
		$end = $begin;
	} else {
		$end = trim( $frame->expand( array_shift( $args ) ) );
	}

	$lang = $parser->getContentLanguage()->getCode();
	$beginAttr = self::getAttrPattern( $begin, 'begin', $lang );
	$beginRegex = "/^$beginAttr$/s";
	$endAttr = self::getAttrPattern( $end, 'end', $lang );
	$endRegex = "/^$endAttr$/s";

	return [
		'root' => $root,
		'newFrame' => $newFrame,
		'repl' => $repl,
		'beginRegex' => $beginRegex,
		'begin' => $begin,
		'endRegex' => $endRegex,
	];
}
229
/**
 * Returns true if the given extension tag name is "section", or the
 * localised name that Hooks::getLocalName() reports for it. The comparison
 * is done on lower-cased names.
 *
 * @param string $name
 * @param string $lang
 * @return bool
 */
private static function isSection( $name, $lang ) {
	$name = strtolower( $name );
	$sectionLocal = Hooks::getLocalName( 'section', $lang );
	return (
		$name === 'section'
		|| ( $sectionLocal !== null && $name === strtolower( $sectionLocal ) )
	);
}
244
/**
 * Returns the text for the inside of a split <section> node.
 *
 * A node without an 'inner' part contributes nothing; otherwise the inner
 * text is passed through the parser's replaceVariables() in the given frame.
 *
 * @param Parser $parser
 * @param PPFrame $frame
 * @param array $parts Parts of the node as split by the caller
 * @return string
 */
private static function expandSectionNode( $parser, $frame, $parts ) {
	if ( !isset( $parts['inner'] ) ) {
		return '';
	}

	return $parser->replaceVariables( $parts['inner'], $frame );
}
259
/**
 * Parser function body that transcludes the text lying between matching
 * begin and end <section> markers of another page.
 *
 * Top-level nodes of the target page are walked in order. When a begin
 * name was given, nodes are skipped until a matching begin marker is
 * found; from there every node is expanded into the output until a
 * matching end marker is reached, and the search then resumes so that
 * every matching section is included. With an empty begin name the text
 * from the start of the page up to the first matching end marker is used.
 * If no marker matched at all, the invalid-section tracking category is
 * added.
 *
 * @param Parser $parser
 * @param PPFrame $frame
 * @param array $args
 * @return string
 */
public static function pfuncIncludeObj( $parser, $frame, $args ) {
	$setup = self::setupPfunc12( $parser, $frame, $args, 'lst' );
	if ( !is_array( $setup ) ) {
		// setupPfunc12() already produced the final output.
		return $setup;
	}

	/**
	 * @var $root PPNode
	 */
	$root = $setup['root'];
	/**
	 * @var $newFrame PPFrame
	 */
	$newFrame = $setup['newFrame'];
	$beginRegex = $setup['beginRegex'];
	$endRegex = $setup['endRegex'];
	$begin = $setup['begin'];

	$lang = $parser->getContentLanguage()->getCode();
	$text = '';
	$node = $root->getFirstChild();
	$foundSection = false;
	while ( $node ) {
		// If the name of the begin node was specified, find it.
		// Otherwise transclude everything from the beginning of the page.
		if ( $begin !== '' ) {
			// Find the begin node
			$found = false;
			for ( ; $node; $node = $node->getNextSibling() ) {
				if ( $node->getName() !== 'ext' ) {
					continue;
				}
				$parts = $node->splitExt();
				$parts = array_map( [ $newFrame, 'expand' ], $parts );
				if ( self::isSection( $parts['name'], $lang ) ) {
					// @phan-suppress-next-line SecurityCheck-ReDoS
					if ( preg_match( $beginRegex, $parts['attr'] ) ) {
						$found = true;
						$foundSection = true;
						break;
					}
				}
			}
			if ( !$found || !$node ) {
				break;
			}
		}

		// Write the text out while looking for the end node
		$found = false;
		for ( ; $node; $node = $node->getNextSibling() ) {
			if ( $node->getName() === 'ext' ) {
				$parts = $node->splitExt();
				$parts = array_map( [ $newFrame, 'expand' ], $parts );
				if ( self::isSection( $parts['name'], $lang ) ) {
					// @phan-suppress-next-line SecurityCheck-ReDoS
					if ( preg_match( $endRegex, $parts['attr'] ) ) {
						$found = true;
						$foundSection = true;
						break;
					}
					// Any other section marker: keep only its inner text.
					$text .= self::expandSectionNode( $parser, $newFrame, $parts );
				} else {
					$text .= $newFrame->expand( $node );
				}
			} else {
				$text .= $newFrame->expand( $node );
			}
		}
		if ( !$found ) {
			break;
		} elseif ( $begin === '' ) {
			// When the end node was found and text is transcluded from
			// the beginning of the page, finish the transclusion
			break;
		}

		// Step past the end marker and look for the next begin marker.
		$node = $node->getNextSibling();
	}
	if ( !$foundSection ) {
		$parser->addTrackingCategory( "lst-invalid-section-category" );
	}
	return $text;
}
350
/**
 * Parser function body that transcludes another page while leaving out the
 * text between matching begin and end <section> markers.
 *
 * Top-level nodes of the target page are expanded into the output until a
 * matching begin marker is met. The replacement text is then appended and
 * nodes are skipped up to a matching end marker, after which copying
 * resumes. This repeats for every matching section on the page.
 *
 * @param Parser $parser
 * @param PPFrame $frame
 * @param array $args
 * @return string
 */
public static function pfuncExcludeObj( $parser, $frame, $args ) {
	$setup = self::setupPfunc12( $parser, $frame, $args, 'lstx' );
	if ( !is_array( $setup ) ) {
		// setupPfunc12() already produced the final output.
		return $setup;
	}

	/**
	 * @var $root PPNode
	 */
	$root = $setup['root'];
	/**
	 * @var $newFrame PPFrame
	 */
	$newFrame = $setup['newFrame'];
	$beginRegex = $setup['beginRegex'];
	$endRegex = $setup['endRegex'];
	$repl = $setup['repl'];

	$lang = $parser->getContentLanguage()->getCode();
	$text = '';
	$node = $root->getFirstChild();
	while ( $node ) {
		// Phase 1: copy nodes to the output until the start tag shows up.
		$sawBegin = false;
		while ( $node ) {
			if ( $node->getName() == 'ext' ) {
				$parts = $node->splitExt();
				$parts = array_map( [ $newFrame, 'expand' ], $parts );
				if ( !self::isSection( $parts['name'], $lang ) ) {
					$text .= $newFrame->expand( $node );
				// @phan-suppress-next-line SecurityCheck-ReDoS
				} elseif ( preg_match( $beginRegex, $parts['attr'] ) ) {
					$sawBegin = true;
					break;
				} else {
					$text .= self::expandSectionNode( $parser, $newFrame, $parts );
				}
			} else {
				$text .= $newFrame->expand( $node );
			}
			$node = $node->getNextSibling();
		}

		if ( !$sawBegin ) {
			break;
		}

		// Append replacement text
		$text .= $repl;

		// Phase 2: drop nodes until the end tag shows up.
		while ( $node ) {
			if ( $node->getName() == 'ext' ) {
				$parts = $node->splitExt();
				$parts = array_map( [ $newFrame, 'expand' ], $parts );
				if ( self::isSection( $parts['name'], $lang ) ) {
					// @phan-suppress-next-line SecurityCheck-ReDoS
					if ( preg_match( $endRegex, $parts['attr'] ) ) {
						$text .= self::expandSectionNode( $parser, $newFrame, $parts );
						break;
					}
				}
			}
			$node = $node->getNextSibling();
		}

		// Step past the end tag; the node is already exhausted when no end
		// tag was found.
		$node = $node ? $node->getNextSibling() : false;
	}
	return $text;
}
424
/**
 * section inclusion - include all matching sections
 *
 * A parser extension that further extends labeled section transclusion,
 * adding a function, #lsth for transcluding marked sections of text,
 *
 * The included text starts right after the heading named $sec (or at the
 * top of the page when $sec is empty) and stops before the heading named
 * $to if one is found, otherwise before the next heading that has no more
 * "=" signs than the $sec heading. If the $sec heading cannot be found,
 * the invalid-section tracking category is added and '' is returned.
 *
 * @todo MW 1.12 version, as per #lst/#lstx
 *
 * @param Parser $parser
 * @param string $page
 * @param string $sec
 * @param string $to
 * @return mixed|string
 */
public static function pfuncIncludeHeading( $parser, $page = '', $sec = '', $to = '' ) {
	if ( !self::getTemplateText( $parser, $page, $title, $text ) ) {
		// Target page not found: $text holds a link to it.
		return $text;
	}

	// Generate a regex to match the === classical heading section(s) === we're
	// interested in.
	if ( $sec == '' ) {
		$begin_off = 0;
		$head_len = 6;
	} else {
		// Whitespace between the "=" signs and the heading text is optional.
		// The trailing ($) group captures the offset of the end of the line.
		$pat = '^(={1,6})\s*' . preg_quote( $sec, '/' ) . '\s*\1\s*($)';
		if ( preg_match( "/$pat/im", $text, $m, PREG_OFFSET_CAPTURE ) ) {
			$begin_off = $m[2][1];
			$head_len = strlen( $m[1][0] );
		} else {
			$parser->addTrackingCategory( "lst-invalid-section-category" );
			return '';
		}
	}

	$end_off = null;
	if ( $to != '' ) {
		// if $to is supplied, try and match it. If we don't match, just
		// ignore it.
		$pat = '^(={1,6})\s*' . preg_quote( $to, '/' ) . '\s*\1\s*$';
		if ( preg_match( "/$pat/im", $text, $m, PREG_OFFSET_CAPTURE, $begin_off ) ) {
			$end_off = $m[0][1] - 1;
		}
	}

	if ( $end_off === null ) {
		// Next heading of the same or a higher level: at most $head_len
		// "=" signs, any heading text, and the same run of "=" to close it.
		$pat = '^(={1,' . $head_len . '})(?!=).*?\1\s*$';
		if ( preg_match( "/$pat/im", $text, $m, PREG_OFFSET_CAPTURE, $begin_off ) ) {
			$end_off = $m[0][1] - 1;
		}
	}

	$nhead = self::countHeadings( $text, $begin_off );

	if ( $end_off !== null ) {
		// A heading at offset 0 gives $end_off = -1; clamp the length so
		// substr() does not treat it as an offset from the end of the text.
		$result = substr( $text, $begin_off, max( 0, $end_off - $begin_off ) );
	} else {
		$result = substr( $text, $begin_off );
	}

	$frame = $parser->getPreprocessor()->newFrame();
	$dom = $parser->preprocessToDom( $result, Parser::PTD_FOR_INCLUSION );
	$result = $frame->expand( $dom );
	$result = trim( $result );

	return self::parse( $parser, $title, $result, "#lsth:{$page}|{$sec}", $nhead );
}
493	}