MediaWiki REL1_30
SearchEngine.php
Go to the documentation of this file.
1<?php
29
34abstract class SearchEngine {
/** @const string profile type for completionSearch */
const COMPLETION_PROFILE_TYPE = 'completionSearchProfile';

/** @const string profile type for query independent ranking features */
const FT_QUERY_INDEP_PROFILE_TYPE = 'fulltextQueryIndepProfile';

/** @const int flag for legalSearchChars: includes all chars allowed in a search query */
const CHARS_ALL = 1;

/** @const int flag for legalSearchChars: includes all chars allowed in a search term */
const CHARS_NO_SYNTAX = 2;

/** @var string */
public $prefix = '';

/** @var int[]|null Namespaces the search should include; replacePrefixes() may set this to null */
public $namespaces = [ NS_MAIN ];

/** @var int Maximum number of results to return */
protected $limit = 10;

/** @var int Number of results to skip before returning the first */
protected $offset = 0;

/** @var array|string */
protected $searchTerms = [];

/** @var bool Whether the searcher should try to build a suggestion */
protected $showSuggestion = true;

/** @var string Sort direction of the search results; see getValidSorts() */
private $sort = 'relevance';

/** @var array Feature values, keyed by feature name */
protected $features = [];
68
/**
 * Perform a full text search query and return a result set.
 *
 * This base implementation does not search anything and always yields null.
 *
 * @param string $term Search term
 * @return null
 */
function searchText( $term ) {
	// Nothing to search with in the base class.
	return null;
}
80
/**
 * Perform a title search in the article archive.
 *
 * The base implementation finds nothing and reports success with an
 * empty list of matches.
 *
 * @param string $term Search term
 * @return Status Good status wrapping an empty array
 */
function searchArchiveTitle( $term ) {
	return Status::newGood( [] );
}
95
/**
 * Perform a title-only search query and return a result set.
 *
 * This base implementation does not search anything and always yields null.
 *
 * @param string $term Search term
 * @return null
 */
function searchTitle( $term ) {
	// Nothing to search with in the base class.
	return null;
}
107
/**
 * Tell whether this engine supports the named feature.
 *
 * Only 'search-update' is supported by the base class; every other
 * feature name (including 'title-suffix-filter') is reported as
 * unsupported.
 *
 * @param string $feature Feature name
 * @return bool
 */
public function supports( $feature ) {
	// Loose comparison on purpose: it mirrors the matching rules of a
	// switch statement.
	return $feature == 'search-update';
}
122
/**
 * Way to pass custom data for engines.
 *
 * Any value previously stored under the same feature name is overwritten.
 *
 * @param string $feature Feature name, used as the storage key
 * @param mixed $data Value to remember for that feature
 */
public function setFeatureData( $feature, $data ) {
	$this->features[$feature] = $data;
}
132
/**
 * Way to retrieve custom data set by setFeatureData or by the engine itself.
 *
 * @param string $feature Feature name
 * @return mixed Stored value, or null when nothing (or null) is stored
 */
public function getFeatureData( $feature ) {
	return isset( $this->features[$feature] )
		? $this->features[$feature]
		: null;
}
146
/**
 * When overridden in a derived class, performs database-specific
 * conversions on text to be used for searching or updating the index.
 *
 * The base implementation only applies the content language's word
 * segmentation, which some languages such as Chinese require.
 *
 * @param string $string Text to normalize
 * @return string Result of the content language's segmentByWord()
 */
public function normalizeText( $string ) {
	global $wgContLang;

	$segmented = $wgContLang->segmentByWord( $string );
	return $segmented;
}
161
/**
 * Transform the search term in cases when parts of the query came as
 * different GET params (when supported).
 *
 * The base implementation returns the term untouched.
 *
 * @param string $term Search term
 * @return string The same term
 */
public function transformSearchTerm( $term ) {
	// No transformation in the base class.
	return $term;
}
172
/**
 * Get the service class for finding near matches.
 *
 * @param Config $config Configuration handed to the matcher
 * @return SearchNearMatcher Matcher bound to the content language
 */
public function getNearMatcher( Config $config ) {
	global $wgContLang;

	$matcher = new SearchNearMatcher( $config, $wgContLang );
	return $matcher;
}
182
/**
 * Get the near matcher for the default SearchEngine.
 *
 * @return SearchNearMatcher Whatever getNearMatcher() of a freshly
 *  created default engine returns for the main config
 */
protected static function defaultNearMatcher() {
	$mainConfig = MediaWikiServices::getInstance()->getMainConfig();
	$engine = MediaWikiServices::getInstance()->newSearchEngine();

	return $engine->getNearMatcher( $mainConfig );
}
191
/**
 * If an exact title match can be found, or a very slightly close match,
 * return the title.
 *
 * Delegates to the default near matcher (late static binding applies).
 *
 * @param string $searchterm Term to match
 * @return mixed Whatever the near matcher's getNearMatch() returns
 */
public static function getNearMatch( $searchterm ) {
	$matcher = static::defaultNearMatcher();
	return $matcher->getNearMatch( $searchterm );
}
202
/**
 * Do a near match (see SearchEngine::getNearMatch) and wrap it into a
 * SearchResultSet.
 *
 * Delegates to the default near matcher (late static binding applies).
 *
 * @param string $searchterm Term to match
 * @return mixed Whatever the near matcher's getNearMatchResultSet() returns
 */
public static function getNearMatchResultSet( $searchterm ) {
	$matcher = static::defaultNearMatcher();
	return $matcher->getNearMatchResultSet( $searchterm );
}
213
/**
 * Get chars legal for search.
 * NOTE: usage as static is deprecated and preserved only as BC measure.
 *
 * The base implementation ignores $type and always returns the same set.
 *
 * @param int $type One of the CHARS_* flags
 * @return string Character-class fragment listing the legal characters
 */
public static function legalSearchChars( $type = self::CHARS_ALL ) {
	$legalChars = "A-Za-z_'.0-9\\x80-\\xFF\\-";
	return $legalChars;
}
224
/**
 * Set the maximum number of results to return and how many to skip
 * before returning the first.
 *
 * Both values are coerced to integers before being stored.
 *
 * @param int $limit Maximum number of results
 * @param int $offset Number of results to skip
 */
function setLimitOffset( $limit, $offset = 0 ) {
	$this->limit = (int)$limit;
	$this->offset = (int)$offset;
}
236
/**
 * Set which namespaces the search should include.
 *
 * Non-negative namespace IDs that are not searchable are dropped;
 * negative IDs are always kept. Any empty/falsy input results in an
 * empty namespace list.
 *
 * @param int[]|null $namespaces Namespace IDs to search
 */
function setNamespaces( $namespaces ) {
	if ( $namespaces ) {
		// Filter namespaces to only keep valid ones
		$validNs = $this->searchableNamespaces();
		$namespaces = array_filter( $namespaces, function ( $ns ) use( $validNs ) {
			return $ns < 0 || isset( $validNs[$ns] );
		} );
	} else {
		$namespaces = [];
	}
	$this->namespaces = $namespaces;
}
255
/**
 * Set whether the searcher should try to build a suggestion.
 *
 * The value is stored as given, without any coercion.
 *
 * @param bool $showSuggestion
 */
function setShowSuggestion( $showSuggestion ) {
	$this->showSuggestion = $showSuggestion;
}
266
/**
 * Get the valid sort directions.
 *
 * The base class only knows about 'relevance'.
 *
 * @return string[] Names accepted by setSort()
 */
public function getValidSorts() {
	$sorts = [ 'relevance' ];
	return $sorts;
}
277
/**
 * Set the sort direction of the search results.
 *
 * The value must be one of the names returned by getValidSorts(). The
 * check is strict, so non-string values such as 0 or true cannot slip
 * through PHP's loose string comparison rules.
 *
 * @param string $sort Sort direction name
 * @throws InvalidArgumentException When $sort is not a valid sort name
 */
public function setSort( $sort ) {
	// Ask once: the list is needed for both the check and the message.
	$validSorts = $this->getValidSorts();
	if ( !in_array( $sort, $validSorts, true ) ) {
		throw new InvalidArgumentException( "Invalid sort: $sort. " .
			"Must be one of: " . implode( ', ', $validSorts ) );
	}
	$this->sort = $sort;
}
293
/**
 * Get the sort direction of the search results.
 *
 * @return string Value last accepted by setSort(), 'relevance' by default
 */
public function getSort() {
	$current = $this->sort;
	return $current;
}
303
/**
 * Parse some common prefixes: all (search everything) or namespace
 * names, and set the list of namespaces of this instance accordingly.
 *
 * When no prefix is recognised, the namespaces are left untouched and
 * the query is returned unchanged.
 *
 * @param string $query Search query, possibly carrying a prefix
 * @return string The query with a recognised prefix removed
 */
function replacePrefixes( $query ) {
	$queryAndNs = self::parseNamespacePrefixes( $query );
	if ( $queryAndNs === false ) {
		return $query;
	}
	// Element 1 is the namespace list; null stands for the "all" keyword.
	$this->namespaces = $queryAndNs[1];
	return $queryAndNs[0];
}
320
/**
 * Parse some common prefixes: all (search everything) or namespace names.
 *
 * @param string $query Search query
 * @return false|array False when the query has no colon or its prefix is
 *  not a known namespace. Otherwise a two element array: the query
 *  without its prefix (or the whole query if nothing but the prefix was
 *  given), and either a single-element list holding the namespace index
 *  or null when the "all" keyword was used.
 */
public static function parseNamespacePrefixes( $query ) {
	global $wgContLang;

	$colonPos = strpos( $query, ':' );
	if ( $colonPos === false ) {
		// No colon, hence no prefix: nothing to do
		return false;
	}

	$allKeyword = wfMessage( 'searchall' )->inContentLanguage()->text() . ":";
	$allKeywordLength = strlen( $allKeyword );

	if ( strncmp( $query, $allKeyword, $allKeywordLength ) === 0 ) {
		// "all:" prefix, no namespace restriction is extracted
		$namespaces = null;
		$remainder = substr( $query, $allKeywordLength );
	} else {
		// TODO: should we unify with PrefixSearch::extractNamespace ?
		$nsName = str_replace( ' ', '_', substr( $query, 0, $colonPos ) );
		$nsIndex = $wgContLang->getNsIndex( $nsName );
		if ( $nsIndex === false ) {
			return false;
		}
		$namespaces = [ $nsIndex ];
		$remainder = substr( $query, strlen( $nsName ) + 1 );
	}

	if ( trim( $remainder ) === '' ) {
		// prefix was the whole query
		$remainder = $query;
	}

	return [ $remainder, $namespaces ];
}
361
/**
 * Find snippet highlight settings for all users.
 *
 * Both values are hardcoded.
 *
 * @return int[] Two elements: number of context lines (2) and number of
 *  context characters (75)
 */
public static function userHighlightPrefs() {
	return [
		2, // context lines
		75, // context characters
	];
}
371
/**
 * Create or update the search index record for the given page.
 *
 * The base implementation does nothing.
 *
 * @param int $id
 * @param string $title
 * @param string $text
 */
function update( $id, $title, $text ) {
	// no-op
}
384
/**
 * Update a search index record's title only.
 *
 * The base implementation does nothing.
 *
 * @param int $id
 * @param string $title
 */
function updateTitle( $id, $title ) {
	// no-op
}
396
/**
 * Presumably meant to remove the given page from the search index in
 * engines that maintain one (TODO confirm against subclasses).
 *
 * The base implementation does nothing.
 *
 * @param int $id
 * @param string $title
 */
function delete( $id, $title ) {
	// no-op
}
408
/**
 * Get OpenSearch suggestion template.
 *
 * @deprecated since 1.25 Use ApiOpenSearch::getOpenSearchTemplate()
 * @return mixed Template ApiOpenSearch provides for the JSON
 *  suggestions type
 */
public static function getOpenSearchTemplate() {
	wfDeprecated( __METHOD__, '1.25' );

	$suggestionsType = 'application/x-suggestions+json';
	return ApiOpenSearch::getOpenSearchTemplate( $suggestionsType );
}
419
/**
 * Get the raw text for updating the index from a content object.
 *
 * @param Title $t Title the content belongs to (unused here)
 * @param Content|null $c Content to extract the text from
 * @return string Text for the search index, or '' when no content is given
 */
public function getTextFromContent( Title $t, Content $c = null ) {
	if ( !$c ) {
		return '';
	}
	return $c->getTextForSearchIndex();
}
433
/**
 * Tell whether this engine handles all of its own text processing in
 * getTextFromContent().
 *
 * The base implementation always answers no.
 *
 * @return bool
 */
public function textAlreadyUpdatedForIndex() {
	// The base class does no text processing of its own.
	return false;
}
444
/**
 * Makes search simple string if it was namespaced.
 * Sets namespaces of the search to the namespaces extracted from the string.
 *
 * @param string $search Search string, possibly with a namespace prefix
 * @return string The search string with the namespace prefix removed
 */
protected function normalizeNamespaces( $search ) {
	$namespaces = $this->namespaces;
	// Set when no explicit namespace was found and extensions get a say.
	$askHook = false;

	$title = Title::newFromText( $search );
	if ( $title && !$title->isExternal() ) {
		$titleNs = $title->getNamespace();
		$search = $title->getText();
		if ( $titleNs == NS_MAIN ) {
			// no explicit prefix, use default namespaces
			$askHook = true;
		} else {
			$namespaces = [ $titleNs ];
		}
	} else {
		// The string may be a bare namespace prefix such as "Talk:".
		// Append a dummy page name to find out.
		$probe = Title::newFromText( $search . 'Dummy' );
		if ( $probe && $probe->getText() == 'Dummy'
			&& $probe->getNamespace() != NS_MAIN
			&& !$probe->isExternal()
		) {
			$namespaces = [ $probe->getNamespace() ];
			$search = '';
		} else {
			$askHook = true;
		}
	}

	if ( $askHook ) {
		Hooks::run( 'PrefixSearchExtractNamespace', [ &$namespaces, &$search ] );
	}

	// Searches in the Media namespace are carried out in the File namespace
	$namespaces = array_map( function ( $space ) {
		return $space == NS_MEDIA ? NS_FILE : $space;
	}, $namespaces );

	$this->setNamespaces( $namespaces );
	return $search;
}
482
/**
 * Perform a completion search.
 *
 * Unless the Special namespace is being searched, the
 * PrefixSearchBackend hook gets the first chance to answer; otherwise,
 * or when the hook does not handle the query, the simple prefix search
 * is used.
 *
 * @param string $search Search string
 * @return SearchSuggestionSet
 */
protected function completionSearchBackend( $search ) {
	$search = trim( $search );
	$results = [];

	// We do not run hook on Special: search
	if ( !in_array( NS_SPECIAL, $this->namespaces ) ) {
		$hookPassed = Hooks::run( 'PrefixSearchBackend',
			[ $this->namespaces, $search, $this->limit, &$results, $this->offset ]
		);
		if ( !$hookPassed ) {
			// False means hook worked.
			// FIXME: Yes, the API is weird. That's why it is going to be deprecated.
			return SearchSuggestionSet::fromStrings( $results );
		}
	}

	// Hook did not do the job, use default simple search
	$titles = $this->simplePrefixSearch( $search );
	return SearchSuggestionSet::fromTitles( $titles );
}
509
/**
 * Perform a completion search.
 *
 * Does not resolve namespaces and does not check variants.
 *
 * @param string $search Search string
 * @return SearchSuggestionSet Empty set when the search string is blank
 */
public function completionSearch( $search ) {
	if ( trim( $search ) === '' ) {
		// Return empty result
		return SearchSuggestionSet::emptySuggestionSet();
	}

	$search = $this->normalizeNamespaces( $search );
	$suggestions = $this->completionSearchBackend( $search );

	return $this->processCompletionResults( $search, $suggestions );
}
522
/**
 * Perform a completion search with variants.
 *
 * When the plain search yields fewer results than the limit, the search
 * is repeated for every language variant of the search string until the
 * limit is filled.
 *
 * @param string $search Search string
 * @return SearchSuggestionSet Empty set when the search string is blank
 */
public function completionSearchWithVariants( $search ) {
	if ( trim( $search ) === '' ) {
		return SearchSuggestionSet::emptySuggestionSet(); // Return empty result
	}
	$search = $this->normalizeNamespaces( $search );

	$results = $this->completionSearchBackend( $search );
	$fallbackLimit = $this->limit - $results->getSize();
	if ( $fallbackLimit > 0 ) {
		global $wgContLang;

		$fallbackSearches = $wgContLang->autoConvertToAllVariants( $search );
		$fallbackSearches = array_diff( array_unique( $fallbackSearches ), [ $search ] );

		// The fallback searches temporarily shrink the limit (and reset
		// the offset). Remember the caller's values so they can be put
		// back, even if one of the searches throws.
		$origLimit = $this->limit;
		$origOffset = $this->offset;
		try {
			foreach ( $fallbackSearches as $fbs ) {
				$this->setLimitOffset( $fallbackLimit );
				$fallbackSearchResult = $this->completionSearch( $fbs );
				$results->appendAll( $fallbackSearchResult );
				// A suggestion set reports its size through getSize();
				// count() is not reliable on it.
				$fallbackLimit -= $fallbackSearchResult->getSize();
				if ( $fallbackLimit <= 0 ) {
					break;
				}
			}
		} finally {
			$this->setLimitOffset( $origLimit, $origOffset );
		}
	}
	return $this->processCompletionResults( $search, $results );
}
554
/**
 * Extract titles from completion results.
 *
 * @param SearchSuggestionSet $completionResults
 * @return array The suggested title of every suggestion in the set
 */
public function extractTitles( SearchSuggestionSet $completionResults ) {
	$toTitle = function ( SearchSuggestion $sugg ) {
		return $sugg->getSuggestedTitle();
	};
	return $completionResults->map( $toTitle );
}
565
/**
 * Process completion search results.
 *
 * Preloads the suggested titles and, for the first page of results,
 * makes sure an exact title match ends up in first position.
 *
 * @param string $search Search string
 * @param SearchSuggestionSet $suggestions Suggestions found by the backend
 * @return SearchSuggestionSet The same set object, possibly reordered,
 *  extended with an exact match and shrunk to the limit
 */
protected function processCompletionResults( $search, SearchSuggestionSet $suggestions ) {
	$search = trim( $search );

	// preload the titles with LinkBatch
	$titleObjects = $suggestions->map( function ( SearchSuggestion $sugg ) {
		return $sugg->getSuggestedTitle();
	} );
	$batch = new LinkBatch( $titleObjects );
	$batch->setCaller( __METHOD__ );
	$batch->execute();

	$titleTexts = $suggestions->map( function ( SearchSuggestion $sugg ) {
		return $sugg->getSuggestedTitle()->getPrefixedText();
	} );

	if ( $this->offset === 0 ) {
		// Rescore results with an exact title match
		// NOTE: in some cases like cross-namespace redirects
		// (frequently used as shortcuts e.g. WP:WP on huwiki) some
		// backends like Cirrus will return no results. We should still
		// try an exact title match to workaround this limitation
		$rescorer = new SearchExactMatchRescorer();
		$ranked = $rescorer->rescore( $search, $this->namespaces, $titleTexts, $this->limit );
	} else {
		// No need to rescore if offset is not 0
		// The exact match must have been returned at position 0
		// if it existed.
		$ranked = $titleTexts;
	}

	if ( count( $ranked ) === 0 ) {
		return $suggestions;
	}

	$position = array_search( $ranked[0], $titleTexts );
	if ( $position === false ) {
		// If the first result is not in the previous array it
		// means that we found a new exact match
		$exactMatch = SearchSuggestion::fromTitle( 0, Title::newFromText( $ranked[0] ) );
		$suggestions->prepend( $exactMatch );
		$suggestions->shrink( $this->limit );
	} elseif ( $position > 0 ) {
		// if the first result is not the same we need to rescore
		$suggestions->rescore( $position );
	}

	return $suggestions;
}
620
/**
 * Simple prefix search for subpages.
 *
 * @param string $search Search string
 * @return array Whatever simplePrefixSearch() finds; an empty array when
 *  the search string is blank
 */
public function defaultPrefixSearch( $search ) {
	$isBlank = trim( $search ) === '';
	if ( $isBlank ) {
		return [];
	}

	$normalized = $this->normalizeNamespaces( $search );
	return $this->simplePrefixSearch( $normalized );
}
634
/**
 * Call out to simple search backend.
 *
 * Uses the default database prefix search with the namespaces, limit
 * and offset currently set on this engine.
 *
 * @param string $search Search string
 * @return array Result of TitlePrefixSearch::defaultSearchBackend()
 */
protected function simplePrefixSearch( $search ) {
	$prefixSearch = new TitlePrefixSearch();

	return $prefixSearch->defaultSearchBackend(
		$this->namespaces,
		$search,
		$this->limit,
		$this->offset
	);
}
646
/**
 * Make a list of searchable namespaces and their canonical names.
 *
 * Thin wrapper around the SearchEngineConfig service.
 *
 * @return array
 */
public static function searchableNamespaces() {
	$searchConfig = MediaWikiServices::getInstance()->getSearchEngineConfig();
	return $searchConfig->searchableNamespaces();
}
655
/**
 * Extract default namespaces to search from the given user's settings,
 * returning a list of index numbers.
 *
 * Thin wrapper around the SearchEngineConfig service.
 *
 * @param User $user
 * @return array
 */
public static function userNamespaces( $user ) {
	$searchConfig = MediaWikiServices::getInstance()->getSearchEngineConfig();
	return $searchConfig->userNamespaces( $user );
}
666
/**
 * An array of namespaces indexes to be searched by default.
 *
 * Thin wrapper around the SearchEngineConfig service.
 *
 * @return array
 */
public static function defaultNamespaces() {
	$searchConfig = MediaWikiServices::getInstance()->getSearchEngineConfig();
	return $searchConfig->defaultNamespaces();
}
675
/**
 * Get a list of namespace names useful for showing in tooltips and
 * preferences.
 *
 * Thin wrapper around the SearchEngineConfig service.
 *
 * @param array $namespaces
 * @return array
 */
public static function namespacesAsText( $namespaces ) {
	$searchConfig = MediaWikiServices::getInstance()->getSearchEngineConfig();
	return $searchConfig->namespacesAsText( $namespaces );
}
686
/**
 * Load up the appropriate search engine class for the currently active
 * database backend, and return a configured instance.
 *
 * Thin wrapper around the SearchEngineFactory service.
 *
 * @param string|null $type Type of search backend, if not the default
 * @return SearchEngine
 */
public static function create( $type = null ) {
	$factory = MediaWikiServices::getInstance()->getSearchEngineFactory();
	return $factory->create( $type );
}
697
/**
 * Return the search engines we support.
 *
 * Thin wrapper around the SearchEngineConfig service.
 *
 * @return array
 */
public static function getSearchTypes() {
	$searchConfig = MediaWikiServices::getInstance()->getSearchEngineConfig();
	return $searchConfig->getSearchTypes();
}
707
/**
 * Get a list of supported profiles.
 *
 * The base implementation knows no profiles and always returns null.
 *
 * @param string $profileType Type of profile, e.g. one of the
 *  *_PROFILE_TYPE constants
 * @param User|null $user
 * @return null
 */
public function getProfiles( $profileType, User $user = null ) {
	// No profiles in the base class.
	return null;
}
726
/**
 * Create a search field definition.
 *
 * The base implementation ignores both arguments and hands out a null
 * field, meaning the engine does not implement the field.
 *
 * @param string $name
 * @param int $type
 * @return NullIndexField
 */
public function makeSearchFieldMapping( $name, $type ) {
	$field = new NullIndexField();
	return $field;
}
738
/**
 * Get fields for search index.
 *
 * Collects the field definitions of every registered content model's
 * handler, merges definitions sharing a name, and finally lets
 * extensions adjust the result through the SearchIndexFields hook.
 *
 * @return array Field definitions, keyed by field name
 * @throws InvalidArgumentException When two definitions of the same
 *  field cannot be merged
 */
public function getSearchIndexFields() {
	$models = ContentHandler::getContentModels();
	$fields = [];
	$seenHandlers = new SplObjectStorage();
	foreach ( $models as $model ) {
		try {
			$handler = ContentHandler::getForModelID( $model );
		}
		catch ( MWUnknownContentModelException $e ) {
			// If we can find no handler, ignore it
			continue;
		}
		// Several models can have the same handler, so avoid processing it repeatedly
		if ( $seenHandlers->contains( $handler ) ) {
			// We already did this one
			continue;
		}
		$seenHandlers->attach( $handler );
		$handlerFields = $handler->getFieldsForSearchIndex( $this );
		foreach ( $handlerFields as $fieldName => $fieldData ) {
			if ( empty( $fields[$fieldName] ) ) {
				$fields[$fieldName] = $fieldData;
			} else {
				// TODO: do we allow some clashes with the same type or reject all of them?
				$mergeDef = $fields[$fieldName]->merge( $fieldData );
				if ( !$mergeDef ) {
					throw new InvalidArgumentException( "Duplicate field $fieldName for model $model" );
				}
				$fields[$fieldName] = $mergeDef;
			}
		}
	}
	// Hook to allow extensions to produce search mapping fields
	Hooks::run( 'SearchIndexFields', [ &$fields, $this ] );
	return $fields;
}
780
/**
 * Augment search results with extra data.
 *
 * Augmentors are collected through the SearchResultsAugment hook; the
 * data each one produces is attached to the result set under the
 * augmentor's name.
 *
 * @param SearchResultSet $resultSet Result set to augment in place
 * @throws InvalidArgumentException When a name is registered both as a
 *  row augmentor and as a set augmentor
 */
public function augmentSearchResults( SearchResultSet $resultSet ) {
	$setAugmentors = [];
	$rowAugmentors = [];
	Hooks::run( "SearchResultsAugment", [ &$setAugmentors, &$rowAugmentors ] );

	if ( !( $setAugmentors || $rowAugmentors ) ) {
		// We're done here
		return;
	}

	// Convert row augmentors to set augmentor
	foreach ( $rowAugmentors as $name => $rowAugmentor ) {
		if ( isset( $setAugmentors[$name] ) ) {
			throw new InvalidArgumentException( "Both row and set augmentors are defined for $name" );
		}
		$setAugmentors[$name] = new PerRowAugmentor( $rowAugmentor );
	}

	foreach ( $setAugmentors as $name => $augmentor ) {
		$augmented = $augmentor->augmentAll( $resultSet );
		if ( !$augmented ) {
			// Nothing to attach for this augmentor
			continue;
		}
		$resultSet->setAugmentedData( $name, $augmented );
	}
}
811}
812
/**
 * Dummy class to be used when non-supported Database engine is present.
 */
class SearchEngineDummy extends SearchEngine {
	// no-op
}
to move a page: You are moving the page across namespaces
wfDeprecated( $function, $version=false, $component=false, $callerOffset=2)
Throws a warning that $function is deprecated.
as see the revision history and available at free of to any person obtaining a copy of this software and associated documentation to deal in the Software without including without limitation the rights to use
static getOpenSearchTemplate( $type)
Fetch the template for a type.
static getForModelID( $modelId)
Returns the ContentHandler singleton for the given model ID.
static getContentModels()
Class representing a list of titles The execute() method checks them all for existence and adds them ...
Definition LinkBatch.php:34
Exception thrown when an unregistered content model is requested.
MediaWikiServices is the service locator for the application scope of MediaWiki.
Null index field - means search engine does not implement this field.
Perform augmentation of each row and return composite result, indexed by ID.
defaultSearchBackend( $namespaces, $search, $limit, $offset)
Unless overridden by PrefixSearchBackend hook... This is case-sensitive (First character may be autom...
Dummy class to be used when non-supported Database engine is present.
Contain a class for special pages.
static searchableNamespaces()
Make a list of searchable namespaces and their canonical names.
static userNamespaces( $user)
Extract default namespaces to search from the given user's settings, returning a list of index number...
makeSearchFieldMapping( $name, $type)
Create a search field definition.
getNearMatcher(Config $config)
Get the service class for finding near matches.
searchTitle( $term)
Perform a title-only search query and return a result set.
supports( $feature)
processCompletionResults( $search, SearchSuggestionSet $suggestions)
Process completion search results.
static namespacesAsText( $namespaces)
Get a list of namespace names useful for showing in tooltips and preferences.
getFeatureData( $feature)
Way to retrieve custom data set by setFeatureData or by the engine itself.
update( $id, $title, $text)
Create or update the search index record for the given page.
setNamespaces( $namespaces)
Set which namespaces the search should include.
augmentSearchResults(SearchResultSet $resultSet)
Augment search results with extra data.
array $features
Feature values.
static parseNamespacePrefixes( $query)
Parse some common prefixes: all (search everything) or namespace names.
replacePrefixes( $query)
Parse some common prefixes: all (search everything) or namespace names and set the list of namespaces...
static defaultNamespaces()
An array of namespaces indexes to be searched by default.
array|string $searchTerms
textAlreadyUpdatedForIndex()
If an implementation of SearchEngine handles all of its own text processing in getTextFromContent() a...
defaultPrefixSearch( $search)
Simple prefix search for subpages.
searchArchiveTitle( $term)
Perform a title search in the article archive.
normalizeText( $string)
When overridden in derived class, performs database-specific conversions on text to be used for searc...
setFeatureData( $feature, $data)
Way to pass custom data for engines.
completionSearchBackend( $search)
Perform a completion search.
getTextFromContent(Title $t, Content $c=null)
Get the raw text for updating the index from a content object Nicer search backends could possibly do...
static create( $type=null)
Load up the appropriate search engine class for the currently active database backend,...
getProfiles( $profileType, User $user=null)
Get a list of supported profiles.
transformSearchTerm( $term)
Transform search term in cases when parts of the query came as different GET params (when supported),...
static getNearMatch( $searchterm)
If an exact title match can be found, or a very slightly close match, return the title.
getSort()
Get the sort direction of the search results.
static defaultNearMatcher()
Get near matcher for default SearchEngine.
getSearchIndexFields()
Get fields for search index.
getValidSorts()
Get the valid sort directions.
static userHighlightPrefs()
Find snippet highlight settings for all users.
updateTitle( $id, $title)
Update a search index record's title only.
completionSearchWithVariants( $search)
Perform a completion search with variants.
normalizeNamespaces( $search)
Makes search simple string if it was namespaced.
const CHARS_ALL
@const int flag for legalSearchChars: includes all chars allowed in a search query
static getOpenSearchTemplate()
Get OpenSearch suggestion template.
static getSearchTypes()
Return the search engines we support.
completionSearch( $search)
Perform a completion search.
setLimitOffset( $limit, $offset=0)
Set the maximum number of results to return and how many to skip before returning the first.
const CHARS_NO_SYNTAX
@const int flag for legalSearchChars: includes all chars allowed in a search term
setShowSuggestion( $showSuggestion)
Set whether the searcher should try to build a suggestion.
static getNearMatchResultSet( $searchterm)
Do a near match (see SearchEngine::getNearMatch) and wrap it into a SearchResultSet.
simplePrefixSearch( $search)
Call out to simple search backend.
setSort( $sort)
Set the sort direction of the search results.
const FT_QUERY_INDEP_PROFILE_TYPE
@const string profile type for query independent ranking features
searchText( $term)
Perform a full text search query and return a result set.
extractTitles(SearchSuggestionSet $completionResults)
Extract titles from completion results.
const COMPLETION_PROFILE_TYPE
@const string profile type for completionSearch
static legalSearchChars( $type=self::CHARS_ALL)
Get chars legal for search NOTE: usage as static is deprecated and preserved only as BC measure.
A utility class to rescore search results by looking for an exact match in the db and add the page f...
Implementation of near match title search.
setAugmentedData( $name, $data)
Sets augmented data for result set.
Search suggestion sets.
rescore( $key)
Move the suggestion at index $key to the first position.
shrink( $limit)
Remove any extra elements in the suggestions set.
static fromStrings(array $titles)
Builds a new set of suggestion based on a string array.
map( $callback)
Call array_map on the suggestions array.
static fromTitles(array $titles)
Builds a new set of suggestion based on a title array.
prepend(SearchSuggestion $suggestion)
Add a new suggestion at the top.
Search suggestion.
static fromTitle( $score, Title $title)
Create suggestion from Title.
Performs prefix search, returning Title objects.
Represents a title within MediaWiki.
Definition Title.php:39
The User object encapsulates all of the user-specific settings (user_id, name, rights,...
Definition User.php:51
this class mediates it Skin Encapsulates a look and feel for the wiki All of the functions that render HTML and make choices about how to render it are here and are called from various other places when and is meant to be subclassed with other skins that may override some of its functions The User object contains a reference to a and so rather than having a global skin object we just rely on the global User and get the skin with $wgUser and also has some character encoding functions and other locale stuff The current user interface language is instantiated as and the local content language as $wgContLang
Definition design.txt:57
external whereas SearchGetNearMatch runs after $term
Definition hooks.txt:2814
namespace and then decline to actually register it & $namespaces
Definition hooks.txt:932
the value to return A Title object or null for latest all implement SearchIndexField must implement ResultSetAugmentor & $rowAugmentors
Definition hooks.txt:2851
namespace and then decline to actually register it file or subcat img or subcat $title
Definition hooks.txt:962
either a unescaped string or a HtmlArmor object after in associative array form externallinks including delete and has completed for all link tables whether this was an auto creation default is conds Array Extra conditions for the No matching items in log is displayed if loglist is empty msgKey Array If you want a nice box with a set this to the key of the message First element is the message additional optional elements are parameters for the key that are processed with wfMessage() -> params() ->parseAsBlock() - offset Set to overwrite offset parameter in $wgRequest set to '' to unset offset - wrap String Wrap the message in html(usually something like "&lt;div ...>$1&lt;/div>"). - flags Integer display flags(NO_ACTION_LINK, NO_EXTRA_USER_LINKS) 'LogException':Called before an exception(or PHP error) is logged. This is meant for integration with external error aggregation services
Allows to change the fields on the form that will be generated $name
Definition hooks.txt:302
this hook is for auditing only or null if authentication failed before getting that far or null if we can t even determine that probably a stub it is not rendered in wiki pages or galleries in category pages allow injecting custom HTML after the section Any uses of the hook need to handle escaping see BaseTemplate::getToolbox and BaseTemplate::makeListItem for details on the format of individual items inside of this array or by returning and letting standard HTTP rendering take place modifiable or by returning false and taking over the output modifiable modifiable after all normalizations have been except for the $wgMaxImageArea check set to true or false to override the $wgMaxImageArea check result gives extension the possibility to transform it themselves $handler
Definition hooks.txt:901
null for the local wiki Added should default to null in handler for backwards compatibility add a value to it if you want to add a cookie that have to vary cache options can modify $query
Definition hooks.txt:1610
returning false will NOT prevent logging $e
Definition hooks.txt:2146
const NS_FILE
Definition Defines.php:71
const NS_MAIN
Definition Defines.php:65
const NS_SPECIAL
Definition Defines.php:54
const NS_MEDIA
Definition Defines.php:53
Base interface for content objects.
Definition Content.php:34
linkcache txt The LinkCache class maintains a list of article titles and the information about whether or not the article exists in the database This is used to mark up links when displaying a page If the same link appears more than once on any page then it only has to be looked up once In most cases link lookups are done in batches with the LinkBatch class or the equivalent in so the link cache is mostly useful for short snippets of parsed and for links in the navigation areas of the skin The link cache was formerly used to track links used in a document for the purposes of updating the link tables This application is now deprecated To create a you can use the following $titles
Definition linkcache.txt:17
$sort