44 'spam' =>
'SpamBlacklist',
45 'email' =>
'EmailBlacklist',
61 foreach ( $settings as $name =>
$value ) {
72 abstract public function filter( array $links,
Title $title, $preventLog =
false );
81 self::$blacklistTypes[
$type] = $class;
101 if ( !isset( self::$blacklistTypes[
$type] ) ) {
102 throw new Exception(
"Invalid blacklist type '$type' passed to " . __METHOD__ );
105 if ( !isset( self::$instances[
$type] ) ) {
106 global $wgBlacklistSettings;
109 if ( !isset( $wgBlacklistSettings[
$type] ) ) {
110 $wgBlacklistSettings[
$type] = [];
113 $class = self::$blacklistTypes[
$type];
114 self::$instances[
$type] =
new $class( $wgBlacklistSettings[
$type] );
117 return self::$instances[
$type];
136 if ( $title->getNamespace() == NS_MEDIAWIKI ) {
138 foreach ( self::$blacklistTypes as
$type => $class ) {
146 if ( in_array( $title->getDBkey(), $sources ) ) {
152 $thisHttpRegex =
'/^' . preg_quote( $thisHttp,
'/' ) .
'(?:&.*)?$/';
155 foreach ( self::$blacklistTypes as
$type => $class ) {
156 if ( isset( $wgBlacklistSettings[
$type][
'files'] ) ) {
161 foreach (
$files as $fileName ) {
163 if ( preg_match(
'/^DB: (\w*) (.*)$/', $fileName,
$matches ) ) {
165 if (
$matches[2] == $title->getPrefixedDbKey() ) {
170 } elseif ( preg_match( $thisHttpRegex, $fileName ) ) {
189 $types = array_map( [
$wgContLang,
'ucfirst' ], array_keys( self::$blacklistTypes ) );
190 $regex =
'/(' . implode(
'|', $types ).
')-(?:blacklist|whitelist)/';
192 if ( preg_match( $regex, $title->getDBkey(), $m ) ) {
193 return strtolower( $m[1] );
205 if ( $this->regexes ===
false ) {
206 $this->regexes = array_merge(
222 return ObjectCache::getMainWANInstance()->getWithSetCallback(
225 function () use ( $that,
$type ) {
240 return ObjectCache::getMainWANInstance()->getWithSetCallback(
243 function () use ( $that,
$type ) {
256 wfDebugLog(
'SpamBlacklist',
"Loading $listType regex..." );
258 if ( count( $this->
files ) == 0 ) {
260 wfDebugLog(
'SpamBlacklist',
"no files specified\n" );
267 $regexes = ObjectCache::getMainWANInstance()->getWithSetCallback(
270 wfMemcKey(
'spamblacklist', $listType,
'shared-blacklist-regex' ),
272 function () use ( $that, &$miss ) {
274 return $that->buildSharedBlacklists();
279 wfDebugLog(
'SpamBlacklist',
"Got shared spam regexes from cache\n" );
293 $cache = ObjectCache::getMainWANInstance();
294 $cache->delete(
wfMemcKey(
'spamblacklist', $listType,
'shared-blacklist-regex' ) );
295 $cache->delete(
wfMemcKey(
'spamblacklist', $listType,
'blacklist-regex' ) );
296 $cache->delete(
wfMemcKey(
'spamblacklist', $listType,
'whitelist-regex' ) );
298 wfDebugLog(
'SpamBlacklist',
"$listType blacklist local cache cleared.\n" );
305 wfDebugLog(
'SpamBlacklist',
"Constructing $listType blacklist\n" );
306 foreach ( $this->
files as $fileName ) {
308 if ( preg_match(
'/^DB: ([\w-]*) (.*)$/', $fileName,
$matches ) ) {
310 } elseif ( preg_match(
'/^(https?:)?\/\//', $fileName ) ) {
313 $text = file_get_contents( $fileName );
314 wfDebugLog(
'SpamBlacklist',
"got from file $fileName\n" );
334 # To keep requests to a minimum, we save results into $messageMemc, which is
335 # similar to $wgMemc except almost certain to exist. By default, it is stored
337 # There are two keys, when the warning key expires, a random thread will refresh
338 # the real key. This reduces the chance of multiple requests under high traffic
340 $key =
"{$listType}_blacklist_file:$fileName";
341 $warningKey =
"$wgDBname:{$listType}filewarning:$fileName";
345 if ( !is_string( $httpText ) || ( !$warning && !mt_rand( 0, $this->warningChance ) ) ) {
346 wfDebugLog(
'SpamBlacklist',
"Loading $listType blacklist from $fileName\n" );
347 $httpText = Http::get( $fileName );
348 if ( $httpText ===
false ) {
349 wfDebugLog(
'SpamBlacklist',
"Error loading $listType blacklist from $fileName\n" );
351 $messageMemc->set( $warningKey, 1, $this->warningTime );
352 $messageMemc->set( $key, $httpText, $this->expiryTime );
354 wfDebugLog(
'SpamBlacklist',
"Got $listType blacklist from HTTP cache for $fileName\n" );
369 "Fetching {$this->getBlacklistType()} blacklist from '$article' on '$wiki'...\n" );
371 $title = Title::newFromText( $article );
376 [
'page',
'revision',
'text' ],
383 'page_namespace' => $title->getNamespace(),
384 'page_title' => $title->getDBkey(),
385 'rev_id=page_latest',
402 return '/[a-z0-9_\-.]*';
412 return ( $batchSize > 0 ) ?
'/Sim' :
'/im';
c) Accompany it with the information you received as to the offer to distribute corresponding source code. [...] For an executable work, complete source code means all the source code for all modules it contains, plus any associated interface definition files [...]
wfGetDB( $db, $groups=[], $wiki=false)
Get a Database object.
wfExpandUrl( $url, $defaultProto=PROTO_CURRENT)
Expand a potentially local URL to a fully-qualified URL.
wfMemcKey()
Make a cache key for the local wiki.
wfDebugLog( $logGroup, $text, $dest='all', array $context=[])
Send a line to a supplementary debug log file, if configured, or main debug log if not.
Base class for different kinds of blacklists.
static array $blacklistTypes
Array containing blacklists that extend BaseBlacklist.
getLocalBlacklists()
Returns the local blacklist.
static getBlacklistTypes()
Return the array of blacklist types currently defined.
array $files
Array of blacklist sources.
__construct( $settings=[])
Constructor.
getBlacklists()
Fetch local and (possibly cached) remote blacklists.
clearCache()
Clear all primary blacklist cache keys.
filter(array $links, Title $title, $preventLog=false)
getWhitelists()
Returns the (local) whitelist.
getSharedBlacklists()
Fetch (possibly cached) remote blacklists.
getBlacklistType()
Returns the code for the blacklist implementation.
getRegexStart()
Returns the start of the regex for matches.
static getInstance( $type)
Returns an instance of the given blacklist.
getArticleText( $wiki, $article)
Fetch an article from this or another local MediaWiki database.
static getTypeFromTitle(Title $title)
Returns the type of blacklist from the given title.
bool|array $regexes
Array containing regexes to test against.
static isLocalSource(Title $title)
Check if the given local page title is a spam regex source.
static array $instances
Array of blacklist instances.
static addBlacklistType( $type, $class)
Adds a blacklist class to the registry.
int $warningChance
Chance of receiving a warning when the filter is hit.
getRegexEnd( $batchSize)
Returns the end of the regex for matches.
warmCachesForFilter(Title $title, array $entries)
static getContentText(Content $content=null)
Convenience function for getting flat text from a Content object.
static selectTextFields()
Return the list of text fields that should be selected to read the revision text.
static selectPageFields()
Return the list of page fields that should be selected from page table.
static selectFields()
Return the list of revision fields that should be selected to create a new revision.
static regexesFromMessage( $message, BaseBlacklist $blacklist)
Build a set of regular expressions from a MediaWiki message.
static regexesFromText( $source, BaseBlacklist $blacklist, $fileName=false)
Build a set of regular expressions from the given multiline input text, with empty lines and comments stripped.
Represents a title within MediaWiki.
this class mediates it Skin Encapsulates a look and feel for the wiki All of the functions that render HTML and make choices about how to render it are here and are called from various other places when and is meant to be subclassed with other skins that may override some of its functions The User object contains a reference to a and so rather than having a global skin object we just rely on the global User and get the skin with $wgUser and also has some character encoding functions and other locale stuff The current user interface language is instantiated as and the local content language as $wgContLang
globals will be eliminated from MediaWiki replaced by an application object which would be passed to constructors Whether that would be an convenient solution remains to be but certainly PHP makes such object oriented programming models easier than they were in previous versions For the time being MediaWiki programmers will have to work in an environment with some global context At the time of globals were initialised on startup by MediaWiki of these were configuration which are documented in DefaultSettings php There is no comprehensive documentation for the remaining however some of the most important ones are listed below They are typically initialised either in index php or in Setup php For a description of the see design txt $wgTitle Title object created from the request URL $wgOut OutputPage object for HTTP response $wgUser User object for the user associated with the current request $wgLang Language object selected by user preferences $wgContLang Language object associated with the wiki being viewed $wgParser Parser object Parser extensions register their hooks here $wgRequest WebRequest to get request data $messageMemc
controlled by $wgMainCacheType controlled by $wgParserCacheType controlled by $wgMessageCacheType If you set CACHE_NONE to one of the three control default value for MediaWiki still create a but requests to it are no ops and we always fall through to the database If the cache daemon can t be it should also disable itself fairly smoothly By $wgMemc is used but when it is $parserMemc or $messageMemc this is mentioned $wgDBname