MediaWiki  1.27.1
MediaWikiTitleCodecTest.php
Go to the documentation of this file.
1 <?php
30 
31  public function setUp() {
32  parent::setUp();
33 
34  $this->setMwGlobals( [
35  'wgAllowUserJs' => false,
36  'wgDefaultLanguageVariant' => false,
37  'wgMetaNamespace' => 'Project',
38  'wgLocalInterwikis' => [ 'localtestiw' ],
39  'wgCapitalLinks' => true,
40 
41  // NOTE: this is why global state is evil.
42  // TODO: refactor access to the interwiki codes so it can be injected.
43  'wgHooks' => [
44  'InterwikiLoadPrefix' => [
45  function ( $prefix, &$data ) {
46  if ( $prefix === 'localtestiw' ) {
47  $data = [ 'iw_url' => 'localtestiw' ];
48  } elseif ( $prefix === 'remotetestiw' ) {
49  $data = [ 'iw_url' => 'remotetestiw' ];
50  }
51  return false;
52  }
53  ]
54  ]
55  ] );
56  $this->setUserLang( 'en' );
57  $this->setContentLang( 'en' );
58  }
59 
66  private function getGenderCache() {
67  $genderCache = $this->getMockBuilder( 'GenderCache' )
68  ->disableOriginalConstructor()
69  ->getMock();
70 
71  $genderCache->expects( $this->any() )
72  ->method( 'getGenderOf' )
73  ->will( $this->returnCallback( function ( $userName ) {
74  return preg_match( '/^[^- _]+a( |_|$)/u', $userName ) ? 'female' : 'male';
75  } ) );
76 
77  return $genderCache;
78  }
79 
80  protected function makeCodec( $lang ) {
81  $gender = $this->getGenderCache();
83  // language object can came from cache, which does not respect test settings
84  $lang->resetNamespaces();
85  return new MediaWikiTitleCodec( $lang, $gender );
86  }
87 
88  public static function provideFormat() {
89  return [
90  [ NS_MAIN, 'Foo_Bar', '', '', 'en', 'Foo Bar' ],
91  [ NS_USER, 'Hansi_Maier', 'stuff_and_so_on', '', 'en', 'User:Hansi Maier#stuff and so on' ],
92  [ false, 'Hansi_Maier', '', '', 'en', 'Hansi Maier' ],
93  [
95  'hansi__maier',
96  '',
97  '',
98  'en',
99  'User talk:hansi maier',
100  'User talk:Hansi maier'
101  ],
102 
103  // getGenderCache() provides a mock that considers first
104  // names ending in "a" to be female.
105  [ NS_USER, 'Lisa_Müller', '', '', 'de', 'Benutzerin:Lisa Müller' ],
106  [ NS_MAIN, 'FooBar', '', 'remotetestiw', 'en', 'remotetestiw:FooBar' ],
107  ];
108  }
109 
113  public function testFormat( $namespace, $text, $fragment, $interwiki, $lang, $expected,
114  $normalized = null
115  ) {
116  if ( $normalized === null ) {
117  $normalized = $expected;
118  }
119 
120  $codec = $this->makeCodec( $lang );
121  $actual = $codec->formatTitle( $namespace, $text, $fragment, $interwiki );
122 
123  $this->assertEquals( $expected, $actual, 'formatted' );
124 
125  // test round trip
126  $parsed = $codec->parseTitle( $actual, NS_MAIN );
127  $actual2 = $codec->formatTitle(
128  $parsed->getNamespace(),
129  $parsed->getText(),
130  $parsed->getFragment(),
131  $parsed->getInterwiki()
132  );
133 
134  $this->assertEquals( $normalized, $actual2, 'normalized after round trip' );
135  }
136 
137  public static function provideGetText() {
138  return [
139  [ NS_MAIN, 'Foo_Bar', '', 'en', 'Foo Bar' ],
140  [ NS_USER, 'Hansi_Maier', 'stuff_and_so_on', 'en', 'Hansi Maier' ],
141  ];
142  }
143 
147  public function testGetText( $namespace, $dbkey, $fragment, $lang, $expected ) {
148  $codec = $this->makeCodec( $lang );
149  $title = new TitleValue( $namespace, $dbkey, $fragment );
150 
151  $actual = $codec->getText( $title );
152 
153  $this->assertEquals( $expected, $actual );
154  }
155 
156  public static function provideGetPrefixedText() {
157  return [
158  [ NS_MAIN, 'Foo_Bar', '', 'en', 'Foo Bar' ],
159  [ NS_USER, 'Hansi_Maier', 'stuff_and_so_on', 'en', 'User:Hansi Maier' ],
160 
161  // No capitalization or normalization is applied while formatting!
162  [ NS_USER_TALK, 'hansi__maier', '', 'en', 'User talk:hansi maier' ],
163 
164  // getGenderCache() provides a mock that considers first
165  // names ending in "a" to be female.
166  [ NS_USER, 'Lisa_Müller', '', 'de', 'Benutzerin:Lisa Müller' ],
167  ];
168  }
169 
173  public function testGetPrefixedText( $namespace, $dbkey, $fragment, $lang, $expected ) {
174  $codec = $this->makeCodec( $lang );
175  $title = new TitleValue( $namespace, $dbkey, $fragment );
176 
177  $actual = $codec->getPrefixedText( $title );
178 
179  $this->assertEquals( $expected, $actual );
180  }
181 
182  public static function provideGetPrefixedDBkey() {
183  return [
184  [ NS_MAIN, 'Foo_Bar', '', '', 'en', 'Foo_Bar' ],
185  [ NS_USER, 'Hansi_Maier', 'stuff_and_so_on', '', 'en', 'User:Hansi_Maier' ],
186 
187  // No capitalization or normalization is applied while formatting!
188  [ NS_USER_TALK, 'hansi__maier', '', '', 'en', 'User_talk:hansi__maier' ],
189 
190  // getGenderCache() provides a mock that considers first
191  // names ending in "a" to be female.
192  [ NS_USER, 'Lisa_Müller', '', '', 'de', 'Benutzerin:Lisa_Müller' ],
193 
194  [ NS_MAIN, 'Remote_page', '', 'remotetestiw', 'en', 'remotetestiw:Remote_page' ],
195 
196  // non-existent namespace
197  [ 10000000, 'Foobar', '', '', 'en', ':Foobar' ],
198  ];
199  }
200 
204  public function testGetPrefixedDBkey( $namespace, $dbkey, $fragment,
205  $interwiki, $lang, $expected
206  ) {
207  $codec = $this->makeCodec( $lang );
208  $title = new TitleValue( $namespace, $dbkey, $fragment, $interwiki );
209 
210  $actual = $codec->getPrefixedDBkey( $title );
211 
212  $this->assertEquals( $expected, $actual );
213  }
214 
215  public static function provideGetFullText() {
216  return [
217  [ NS_MAIN, 'Foo_Bar', '', 'en', 'Foo Bar' ],
218  [ NS_USER, 'Hansi_Maier', 'stuff_and_so_on', 'en', 'User:Hansi Maier#stuff and so on' ],
219 
220  // No capitalization or normalization is applied while formatting!
221  [ NS_USER_TALK, 'hansi__maier', '', 'en', 'User talk:hansi maier' ],
222  ];
223  }
224 
228  public function testGetFullText( $namespace, $dbkey, $fragment, $lang, $expected ) {
229  $codec = $this->makeCodec( $lang );
230  $title = new TitleValue( $namespace, $dbkey, $fragment );
231 
232  $actual = $codec->getFullText( $title );
233 
234  $this->assertEquals( $expected, $actual );
235  }
236 
237  public static function provideParseTitle() {
238  // TODO: test capitalization and trimming
239  // TODO: test unicode normalization
240 
241  return [
242  [ ' : Hansi_Maier _ ', NS_MAIN, 'en',
243  new TitleValue( NS_MAIN, 'Hansi_Maier', '' ) ],
244  [ 'User:::1', NS_MAIN, 'de',
245  new TitleValue( NS_USER, '0:0:0:0:0:0:0:1', '' ) ],
246  [ ' lisa Müller', NS_USER, 'de',
247  new TitleValue( NS_USER, 'Lisa_Müller', '' ) ],
248  [ 'benutzerin:lisa Müller#stuff', NS_MAIN, 'de',
249  new TitleValue( NS_USER, 'Lisa_Müller', 'stuff' ) ],
250 
251  [ ':Category:Quux', NS_MAIN, 'en',
252  new TitleValue( NS_CATEGORY, 'Quux', '' ) ],
253  [ 'Category:Quux', NS_MAIN, 'en',
254  new TitleValue( NS_CATEGORY, 'Quux', '' ) ],
255  [ 'Category:Quux', NS_CATEGORY, 'en',
256  new TitleValue( NS_CATEGORY, 'Quux', '' ) ],
257  [ 'Quux', NS_CATEGORY, 'en',
258  new TitleValue( NS_CATEGORY, 'Quux', '' ) ],
259  [ ':Quux', NS_CATEGORY, 'en',
260  new TitleValue( NS_MAIN, 'Quux', '' ) ],
261 
262  // getGenderCache() provides a mock that considers first
263  // names ending in "a" to be female.
264 
265  [ 'a b c', NS_MAIN, 'en',
266  new TitleValue( NS_MAIN, 'A_b_c' ) ],
267  [ ' a b c ', NS_MAIN, 'en',
268  new TitleValue( NS_MAIN, 'A_b_c' ) ],
269  [ ' _ Foo __ Bar_ _', NS_MAIN, 'en',
270  new TitleValue( NS_MAIN, 'Foo_Bar' ) ],
271 
272  // NOTE: cases copied from TitleTest::testSecureAndSplit. Keep in sync.
273  [ 'Sandbox', NS_MAIN, 'en', ],
274  [ 'A "B"', NS_MAIN, 'en', ],
275  [ 'A \'B\'', NS_MAIN, 'en', ],
276  [ '.com', NS_MAIN, 'en', ],
277  [ '~', NS_MAIN, 'en', ],
278  [ '"', NS_MAIN, 'en', ],
279  [ '\'', NS_MAIN, 'en', ],
280 
281  [ 'Talk:Sandbox', NS_MAIN, 'en',
282  new TitleValue( NS_TALK, 'Sandbox' ) ],
283  [ 'Talk:Foo:Sandbox', NS_MAIN, 'en',
284  new TitleValue( NS_TALK, 'Foo:Sandbox' ) ],
285  [ 'File:Example.svg', NS_MAIN, 'en',
286  new TitleValue( NS_FILE, 'Example.svg' ) ],
287  [ 'File_talk:Example.svg', NS_MAIN, 'en',
288  new TitleValue( NS_FILE_TALK, 'Example.svg' ) ],
289  [ 'Foo/.../Sandbox', NS_MAIN, 'en',
290  'Foo/.../Sandbox' ],
291  [ 'Sandbox/...', NS_MAIN, 'en',
292  'Sandbox/...' ],
293  [ 'A~~', NS_MAIN, 'en',
294  'A~~' ],
295  // Length is 256 total, but only title part matters
296  [ 'Category:' . str_repeat( 'x', 248 ), NS_MAIN, 'en',
297  new TitleValue( NS_CATEGORY,
298  'X' . str_repeat( 'x', 247 ) ) ],
299  [ str_repeat( 'x', 252 ), NS_MAIN, 'en',
300  'X' . str_repeat( 'x', 251 ) ]
301  ];
302  }
303 
307  public function testParseTitle( $text, $ns, $lang, $title = null ) {
308  if ( $title === null ) {
309  $title = str_replace( ' ', '_', trim( $text ) );
310  }
311 
312  if ( is_string( $title ) ) {
313  $title = new TitleValue( NS_MAIN, $title, '' );
314  }
315 
316  $codec = $this->makeCodec( $lang );
317  $actual = $codec->parseTitle( $text, $ns );
318 
319  $this->assertEquals( $title, $actual );
320  }
321 
322  public static function provideParseTitle_invalid() {
323  // TODO: test unicode errors
324 
325  return [
326  [ '#' ],
327  [ '::' ],
328  [ '::xx' ],
329  [ '::##' ],
330  [ ' :: x' ],
331 
332  [ 'Talk:File:Foo.jpg' ],
333  [ 'Talk:localtestiw:Foo' ],
334  [ '::1' ], // only valid in user namespace
335  [ 'User::x' ], // leading ":" in a user name is only valid of IPv6 addresses
336 
337  // NOTE: cases copied from TitleTest::testSecureAndSplit. Keep in sync.
338  [ '' ],
339  [ ':' ],
340  [ '__ __' ],
341  [ ' __ ' ],
342  // Bad characters forbidden regardless of wgLegalTitleChars
343  [ 'A [ B' ],
344  [ 'A ] B' ],
345  [ 'A { B' ],
346  [ 'A } B' ],
347  [ 'A < B' ],
348  [ 'A > B' ],
349  [ 'A | B' ],
350  // URL encoding
351  [ 'A%20B' ],
352  [ 'A%23B' ],
353  [ 'A%2523B' ],
354  // XML/HTML character entity references
355  // Note: Commented out because they are not marked invalid by the PHP test as
356  // Title::newFromText runs Sanitizer::decodeCharReferencesAndNormalize first.
357  // array( 'A &eacute; B' ),
358  // array( 'A &#233; B' ),
359  // array( 'A &#x00E9; B' ),
360  // Subject of NS_TALK does not roundtrip to NS_MAIN
361  [ 'Talk:File:Example.svg' ],
362  // Directory navigation
363  [ '.' ],
364  [ '..' ],
365  [ './Sandbox' ],
366  [ '../Sandbox' ],
367  [ 'Foo/./Sandbox' ],
368  [ 'Foo/../Sandbox' ],
369  [ 'Sandbox/.' ],
370  [ 'Sandbox/..' ],
371  // Tilde
372  [ 'A ~~~ Name' ],
373  [ 'A ~~~~ Signature' ],
374  [ 'A ~~~~~ Timestamp' ],
375  [ str_repeat( 'x', 256 ) ],
376  // Namespace prefix without actual title
377  [ 'Talk:' ],
378  [ 'Category: ' ],
379  [ 'Category: #bar' ]
380  ];
381  }
382 
386  public function testParseTitle_invalid( $text ) {
387  $this->setExpectedException( 'MalformedTitleException' );
388 
389  $codec = $this->makeCodec( 'en' );
390  $codec->parseTitle( $text, NS_MAIN );
391  }
392 
393  public static function provideGetNamespaceName() {
394  return [
395  [ NS_MAIN, 'Foo', 'en', '' ],
396  [ NS_USER, 'Foo', 'en', 'User' ],
397  [ NS_USER, 'Hansi Maier', 'de', 'Benutzer' ],
398 
399  // getGenderCache() provides a mock that considers first
400  // names ending in "a" to be female.
401  [ NS_USER, 'Lisa Müller', 'de', 'Benutzerin' ],
402  ];
403  }
404 
408  public function testGetNamespaceName( $namespace, $text, $lang, $expected ) {
409  $codec = $this->makeCodec( $lang );
410  $name = $codec->getNamespaceName( $namespace, $text );
411 
412  $this->assertEquals( $expected, $name );
413  }
414 }
A codec for MediaWiki page titles.
testGetPrefixedText($namespace, $dbkey, $fragment, $lang, $expected)
provideGetPrefixedText
testGetText($namespace, $dbkey, $fragment, $lang, $expected)
provideGetText
const NS_MAIN
Definition: Defines.php:69
if(!isset($args[0])) $lang
Represents a page (or page fragment) title within MediaWiki.
Definition: TitleValue.php:36
testGetFullText($namespace, $dbkey, $fragment, $lang, $expected)
provideGetFullText
getGenderCache()
Returns a mock GenderCache that will consider a user "female" if the first part of the user name ends...
testGetPrefixedDBkey($namespace, $dbkey, $fragment, $interwiki, $lang, $expected)
provideGetPrefixedDBkey
const NS_CATEGORY
Definition: Defines.php:83
namespace and then decline to actually register it file or subcat img or subcat $title
Definition: hooks.txt:912
const NS_FILE
Definition: Defines.php:75
testGetNamespaceName($namespace, $text, $lang, $expected)
provideGetNamespaceName
const NS_FILE_TALK
Definition: Defines.php:76
injection txt This is an overview of how MediaWiki makes use of dependency injection The design described here grew from the discussion of RFC T384 The term dependency this means that anything an object needs to operate should be injected from the the object itself should only know narrow no concrete implementation of the logic it relies on The requirement to inject everything typically results in an architecture that based on two main types of and essentially stateless service objects that use other service objects to operate on the value objects As of the beginning MediaWiki is only starting to use the DI approach Much of the code still relies on global state or direct resulting in a highly cyclical dependency which acts as the top level factory for services in MediaWiki which can be used to gain access to default instances of various services MediaWikiServices however also allows new services to be defined and default services to be redefined Services are defined or redefined by providing a callback the instantiator that will return a new instance of the service When it will create an instance of MediaWikiServices and populate it with the services defined in the files listed by thereby bootstrapping the DI framework Per $wgServiceWiringFiles lists includes ServiceWiring php
Definition: injection.txt:35
testParseTitle($text, $ns, $lang, $title=null)
provideParseTitle
testFormat($namespace, $text, $fragment, $interwiki, $lang, $expected, $normalized=null)
provideFormat
testParseTitle_invalid($text)
provideParseTitle_invalid
const NS_TALK
Definition: Defines.php:70
static factory($code)
Get a cached or new language object for a given language code.
Definition: Language.php:179
setMwGlobals($pairs, $value=null)
const NS_USER_TALK
Definition: Defines.php:72
Allows to change the fields on the form that will be generated $name
Definition: hooks.txt:310