44 'spam' =>
'SpamBlacklist',
45 'email' =>
'EmailBlacklist',
61 foreach ( $settings as $name =>
$value ) {
72 abstract public function filter( array $links,
Title $title, $preventLog =
false );
81 self::$blacklistTypes[
$type] = $class;
116 if ( !isset( self::$blacklistTypes[
$type] ) ) {
117 throw new Exception(
"Invalid blacklist type '$type' passed to " . __METHOD__ );
120 if ( !isset( self::$instances[
$type] ) ) {
121 global $wgBlacklistSettings;
124 if ( !isset( $wgBlacklistSettings[
$type] ) ) {
125 $wgBlacklistSettings[
$type] = [];
128 $class = self::$blacklistTypes[
$type];
129 self::$instances[
$type] =
new $class( $wgBlacklistSettings[
$type] );
132 return self::$instances[
$type];
151 if ( $title->getNamespace() == NS_MEDIAWIKI ) {
153 foreach ( self::$blacklistTypes as
$type => $class ) {
161 if ( in_array( $title->getDBkey(), $sources ) ) {
167 $thisHttpRegex =
'/^' . preg_quote( $thisHttp,
'/' ) .
'(?:&.*)?$/';
170 foreach ( self::$blacklistTypes as
$type => $class ) {
171 if ( isset( $wgBlacklistSettings[
$type][
'files'] ) ) {
176 foreach (
$files as $fileName ) {
178 if ( preg_match(
'/^DB: (\w*) (.*)$/', $fileName,
$matches ) ) {
180 if (
$matches[2] == $title->getPrefixedDbKey() ) {
185 } elseif ( preg_match( $thisHttpRegex, $fileName ) ) {
204 $types = array_map( [
$wgContLang,
'ucfirst' ], array_keys( self::$blacklistTypes ) );
205 $regex =
'/(' . implode(
'|', $types ).
')-(?:blacklist|whitelist)/';
207 if ( preg_match( $regex, $title->getDBkey(), $m ) ) {
208 return strtolower( $m[1] );
220 if ( $this->regexes ===
false ) {
221 $this->regexes = array_merge(
237 return ObjectCache::getMainWANInstance()->getWithSetCallback(
240 function () use ( $that,
$type ) {
255 return ObjectCache::getMainWANInstance()->getWithSetCallback(
258 function () use ( $that,
$type ) {
271 wfDebugLog(
'SpamBlacklist',
"Loading $listType regex..." );
273 if ( count( $this->
files ) == 0 ) {
275 wfDebugLog(
'SpamBlacklist',
"no files specified\n" );
282 $regexes = ObjectCache::getMainWANInstance()->getWithSetCallback(
285 wfMemcKey(
'spamblacklist', $listType,
'shared-blacklist-regex' ),
287 function () use ( $that, &$miss ) {
289 return $that->buildSharedBlacklists();
294 wfDebugLog(
'SpamBlacklist',
"Got shared spam regexes from cache\n" );
308 $cache = ObjectCache::getMainWANInstance();
309 $cache->delete(
wfMemcKey(
'spamblacklist', $listType,
'shared-blacklist-regex' ) );
310 $cache->delete(
wfMemcKey(
'spamblacklist', $listType,
'blacklist-regex' ) );
311 $cache->delete(
wfMemcKey(
'spamblacklist', $listType,
'whitelist-regex' ) );
313 wfDebugLog(
'SpamBlacklist',
"$listType blacklist local cache cleared.\n" );
320 wfDebugLog(
'SpamBlacklist',
"Constructing $listType blacklist\n" );
321 foreach ( $this->
files as $fileName ) {
323 if ( preg_match(
'/^DB: ([\w-]*) (.*)$/', $fileName,
$matches ) ) {
325 } elseif ( preg_match(
'/^(https?:)?\/\//', $fileName ) ) {
328 $text = file_get_contents( $fileName );
329 wfDebugLog(
'SpamBlacklist',
"got from file $fileName\n" );
349 # To keep requests to a minimum, we save results into $messageMemc, which is
350 # similar to $wgMemc except almost certain to exist. By default, it is stored
352 # There are two keys: when the warning key expires, a random thread will refresh
353 # the real key. This reduces the chance of multiple requests under high traffic
355 $key =
"{$listType}_blacklist_file:$fileName";
356 $warningKey =
"$wgDBname:{$listType}filewarning:$fileName";
360 if ( !is_string( $httpText ) || ( !$warning && !mt_rand( 0, $this->warningChance ) ) ) {
361 wfDebugLog(
'SpamBlacklist',
"Loading $listType blacklist from $fileName\n" );
363 if ( $httpText ===
false ) {
364 wfDebugLog(
'SpamBlacklist',
"Error loading $listType blacklist from $fileName\n" );
366 $messageMemc->set( $warningKey, 1, $this->warningTime );
367 $messageMemc->set( $key, $httpText, $this->expiryTime );
369 wfDebugLog(
'SpamBlacklist',
"Got $listType blacklist from HTTP cache for $fileName\n" );
384 "Fetching {$this->getBlacklistType()} blacklist from '$article' on '$wiki'...\n" );
386 $title = Title::newFromText( $article );
390 if ( is_callable( [ Revision::class,
'getQueryInfo' ] ) ) {
391 $revQuery = Revision::getQueryInfo( [
'page',
'text' ] );
394 'tables' => [
'revision',
'page',
'text' ],
395 'fields' => array_merge(
396 Revision::selectFields(),
397 Revision::selectPageFields(),
398 Revision::selectTextFields()
401 'text' => [
'JOIN',
'old_id=rev_text_id' ]
409 'page_namespace' => $title->getNamespace(),
410 'page_title' => $title->getDBkey(),
414 [
'page' => [
'JOIN',
'rev_id=page_latest' ] ] +
$revQuery[
'joins']
418 ? ContentHandler::getContentText( Revision::newFromRow( $row )->getContent() )
428 return '/[a-z0-9_\-.]*';
438 return ( $batchSize > 0 ) ?
'/Sim' :
'/im';
c) Accompany it with the information you received as to the offer to distribute corresponding source code. [...] Complete source code means all the source code for all modules it contains, plus any associated interface definition files
wfGetDB( $db, $groups=[], $wiki=false)
Get a Database object.
wfExpandUrl( $url, $defaultProto=PROTO_CURRENT)
Expand a potentially local URL to a fully-qualified URL.
wfMemcKey()
Make a cache key for the local wiki.
wfDebugLog( $logGroup, $text, $dest='all', array $context=[])
Send a line to a supplementary debug log file, if configured, or main debug log if not.
Base class for different kinds of blacklists.
static array $blacklistTypes
Array containing blacklists that extend BaseBlacklist.
getLocalBlacklists()
Returns the local blacklist.
static getBlacklistTypes()
Return the array of blacklist types currently defined.
array $files
Array of blacklist sources.
static getEmailBlacklist()
__construct( $settings=[])
Constructor.
static getSpamBlacklist()
getBlacklists()
Fetch local and (possibly cached) remote blacklists.
clearCache()
Clear all primary blacklist cache keys.
filter(array $links, Title $title, $preventLog=false)
getWhitelists()
Returns the (local) whitelist.
getSharedBlacklists()
Fetch (possibly cached) remote blacklists.
getBlacklistType()
Returns the code for the blacklist implementation.
getRegexStart()
Returns the start of the regex for matches.
static getInstance( $type)
Returns an instance of the given blacklist.
getArticleText( $wiki, $article)
Fetch an article from this or another local MediaWiki database.
static getTypeFromTitle(Title $title)
Returns the type of blacklist from the given title.
bool|array $regexes
Array containing regexes to test against.
static isLocalSource(Title $title)
Check if the given local page title is a spam regex source.
static array $instances
Array of blacklist instances.
static addBlacklistType( $type, $class)
Adds a blacklist class to the registry.
int $warningChance
Chance of receiving a warning when the filter is hit.
getRegexEnd( $batchSize)
Returns the end of the regex for matches.
warmCachesForFilter(Title $title, array $entries)
static get( $url, $options=[], $caller=__METHOD__)
Simple wrapper for Http::request( 'GET' )
static regexesFromMessage( $message, BaseBlacklist $blacklist)
Build a set of regular expressions from a MediaWiki message.
static regexesFromText( $source, BaseBlacklist $blacklist, $fileName=false)
Build a set of regular expressions from the given multiline input text, with empty lines and comments...
Represents a title within MediaWiki.
this class mediates it. Skin: Encapsulates a look and feel for the wiki. All of the functions that render HTML, and make choices about how to render it, are here, and are called from various other places when needed. It is meant to be subclassed with other skins that may override some of its functions. The User object contains a reference to a skin, and so rather than having a global skin object we just rely on the global User and get the skin with $wgUser. The Language class also has some character encoding functions and other locale stuff. The current user interface language is instantiated as $wgLang, and the local content language as $wgContLang.
globals will be eliminated from MediaWiki, replaced by an application object which would be passed to constructors. Whether that would be a convenient solution remains to be seen, but certainly PHP makes such object-oriented programming models easier than they were in previous versions. For the time being, MediaWiki programmers will have to work in an environment with some global context. At the time of writing, globals were initialised on startup by MediaWiki; some of these were configuration settings, which are documented in DefaultSettings.php. There is no comprehensive documentation for the remaining globals; however, some of the most important ones are listed below. They are typically initialised either in index.php or in Setup.php. For a description of the classes, see design.txt. $wgTitle: Title object created from the request URL. $wgOut: OutputPage object for HTTP response. $wgUser: User object for the user associated with the current request. $wgLang: Language object selected by user preferences. $wgContLang: Language object associated with the wiki being viewed. $wgParser: Parser object; parser extensions register their hooks here. $wgRequest: WebRequest object, to get request data. $messageMemc
controlled by $wgMainCacheType; controlled by $wgParserCacheType; controlled by $wgMessageCacheType. If you set one of the three control variables to CACHE_NONE (the default value), MediaWiki still creates a cache client object, but requests to it are no-ops and we always fall through to the database. If the cache daemon can't be contacted, it should also disable itself fairly smoothly. By default, $wgMemc is used, but when it is $parserMemc or $messageMemc this is mentioned. $wgDBname