MediaWiki  1.27.2
CdnCacheUpdate.php
Go to the documentation of this file.
1 <?php
26 
/** @var string[] Collection of URLs to purge */
33  protected $urls = [];
34 
/**
 * Create an update that will purge the given URLs.
 *
 * @param string[] $urlArr Collection of URLs to purge
 */
public function __construct( array $urlArr ) {
	// Stored as-is; de-duplication happens later in purge()
	$this->urls = $urlArr;
}
41 
/**
 * Merge this update with $update by appending its URLs to this
 * update's URL list.
 *
 * @param MergeableUpdate $update Update whose URLs are absorbed
 */
public function merge( MergeableUpdate $update ) {
	// NOTE(review): presumably rejects any $update that is not an instance
	// of this class, so that reading its $urls below is safe — confirm
	// against the Assert library.
	Assert::parameterType( __CLASS__, $update, '$update' );

	$combined = array_merge( $this->urls, $update->urls );
	$this->urls = $combined;
}
48 
/**
 * Create an update object from an array of Title objects, or a
 * TitleArray object.
 *
 * @param Traversable|Title[] $titles Titles whose CDN URLs should be purged
 * @param string[] $urlArr Extra URLs to purge in addition to the titles' own
 * @return CdnCacheUpdate
 */
public static function newFromTitles( $titles, $urlArr = [] ) {
	foreach ( $titles as $title ) {
		// Append every CDN URL of this title to the running list
		$titleUrls = $title->getCdnUrls();
		$urlArr = array_merge( $urlArr, $titleUrls );
	}

	$update = new CdnCacheUpdate( $urlArr );

	return $update;
}
64 
/**
 * Create an update that purges the CDN URLs of a single title.
 *
 * @param Title $title Title whose CDN URLs should be purged
 * @return CdnCacheUpdate
 */
public static function newSimplePurge( Title $title ) {
	$titleUrls = $title->getCdnUrls();

	return new CdnCacheUpdate( $titleUrls );
}
73 
/**
 * Purges the list of URLs passed to the constructor.
 *
 * When $wgCdnReboundPurgeDelay is positive, a CdnPurgeJob for the same
 * URLs is also queued, released no earlier than that many seconds from now.
 */
public function doUpdate() {
	// Without this declaration the variable below would be an (undefined)
	// local and the rebound purge would never be scheduled.
	global $wgCdnReboundPurgeDelay;

	self::purge( $this->urls );

	if ( $wgCdnReboundPurgeDelay > 0 ) {
		JobQueueGroup::singleton()->lazyPush( new CdnPurgeJob(
			// The job needs a title; a placeholder special-page title is used
			Title::makeTitle( NS_SPECIAL, 'Badtitle/' . __CLASS__ ),
			[
				'urls' => $this->urls,
				'jobReleaseTimestamp' => time() + $wgCdnReboundPurgeDelay
			]
		) );
	}
}
92 
/**
 * Purges a list of URLs from the CDN.
 *
 * The purge is always relayed on the 'cdn-url-purges' event channel. It is
 * additionally sent via HTCP when $wgHTCPRouting is set, and sent directly
 * to every server listed in $wgSquidServers when that list is non-empty.
 *
 * @param string[] $urlArr URLs to purge; duplicates are removed
 */
public static function purge( array $urlArr ) {
	// Without this declaration both settings would be undefined locals and
	// the HTCP and direct-purge branches below could never run.
	global $wgSquidServers, $wgHTCPRouting;

	if ( !$urlArr ) {
		return;
	}

	// Remove duplicate URLs from list
	$urlArr = array_unique( $urlArr );

	wfDebugLog( 'squid', __METHOD__ . ': ' . implode( ' ', $urlArr ) );

	// Reliably broadcast the purge to all edge nodes
	$relayer = MediaWikiServices::getInstance()->getEventRelayerGroup()
		->getRelayer( 'cdn-url-purges' );
	$relayer->notify(
		'cdn-url-purges',
		[
			// array_unique() keeps original keys; re-index so this is a JSON array
			'urls' => array_values( $urlArr ), // JSON array
			'timestamp' => microtime( true )
		]
	);

	// Send lossy UDP broadcasting if enabled
	if ( $wgHTCPRouting ) {
		self::HTCPPurge( $urlArr );
	}

	// Do direct server purges if enabled (this does not scale very well)
	if ( $wgSquidServers ) {
		// Maximum number of parallel connections per squid
		$maxSocketsPerSquid = 8;
		// Number of requests to send per socket
		// 400 seems to be a good tradeoff, opening a socket takes a while
		$urlsPerSocket = 400;
		// $urlArr is non-empty here, so this is always at least 1
		$socketsPerSquid = ceil( count( $urlArr ) / $urlsPerSocket );
		if ( $socketsPerSquid > $maxSocketsPerSquid ) {
			$socketsPerSquid = $maxSocketsPerSquid;
		}

		$pool = new SquidPurgeClientPool;
		// Split the URLs evenly across the sockets opened to each server
		$chunks = array_chunk( $urlArr, ceil( count( $urlArr ) / $socketsPerSquid ) );
		foreach ( $wgSquidServers as $server ) {
			foreach ( $chunks as $chunk ) {
				// One client (socket) per chunk per server
				$client = new SquidPurgeClient( $server );
				foreach ( $chunk as $url ) {
					$client->queuePurge( $url );
				}
				$pool->addClient( $client );
			}
		}

		$pool->run();
	}
}
155 
/**
 * Send Hyper Text Caching Protocol (HTCP) CLR requests.
 *
 * Each URL is expanded, matched against $wgHTCPRouting, and a CLR packet
 * is sent over UDP to every host/port of the matching rule. URLs with no
 * matching rule are logged and skipped.
 *
 * @param string[] $urlArr Collection of URLs to purge
 * @throws MWException If a URL is not a string or its routing rule lacks
 *  a 'host' or 'port' entry
 */
private static function HTCPPurge( array $urlArr ) {
	// Without this declaration both settings would be undefined locals
	global $wgHTCPRouting, $wgHTCPMulticastTTL;

	// HTCP CLR operation
	$htcpOpCLR = 4;

	// @todo FIXME: PHP doesn't support these socket constants (include/linux/in.h)
	if ( !defined( "IPPROTO_IP" ) ) {
		define( "IPPROTO_IP", 0 );
		define( "IP_MULTICAST_LOOP", 34 );
		define( "IP_MULTICAST_TTL", 33 );
	}

	// pfsockopen doesn't work because we need set_sock_opt
	$conn = socket_create( AF_INET, SOCK_DGRAM, SOL_UDP );
	if ( !$conn ) {
		$errstr = socket_strerror( socket_last_error() );
		wfDebugLog( 'squid', __METHOD__ .
			": Error opening UDP socket: $errstr" );

		return;
	}

	// Set socket options
	socket_set_option( $conn, IPPROTO_IP, IP_MULTICAST_LOOP, 0 );
	if ( $wgHTCPMulticastTTL != 1 ) {
		// Set multicast time to live (hop count) option on socket
		socket_set_option( $conn, IPPROTO_IP, IP_MULTICAST_TTL,
			$wgHTCPMulticastTTL );
	}

	// Get sequential trx IDs for packet loss counting
	$ids = UIDGenerator::newSequentialPerNodeIDs(
		'squidhtcppurge', 32, count( $urlArr ), UIDGenerator::QUICK_VOLATILE
	);

	foreach ( $urlArr as $url ) {
		if ( !is_string( $url ) ) {
			throw new MWException( 'Bad purge URL' );
		}
		$url = self::expand( $url );
		$conf = self::getRuleForURL( $url, $wgHTCPRouting );
		if ( !$conf ) {
			wfDebugLog( 'squid', __METHOD__ .
				"No HTCP rule configured for URL {$url} , skipping" );
			continue;
		}

		if ( isset( $conf['host'] ) && isset( $conf['port'] ) ) {
			// Normalize single entries
			$conf = [ $conf ];
		}
		// Validate every destination before sending anything for this URL
		foreach ( $conf as $subconf ) {
			if ( !isset( $subconf['host'] ) || !isset( $subconf['port'] ) ) {
				throw new MWException( "Invalid HTCP rule for URL $url\n" );
			}
		}

		// Construct a minimal HTCP request diagram
		// as per RFC 2756
		// Opcode 'CLR', no response desired, no auth
		// One transaction ID is consumed per URL that reaches this point
		$htcpTransID = current( $ids );
		next( $ids );

		// Specifier: three length-prefixed strings (method, URL, version)
		// followed by a zero 16-bit length
		$htcpSpecifier = pack( 'na4na*na8n',
			4, 'HEAD', strlen( $url ), $url,
			8, 'HTTP/1.0', 0 );

		$htcpDataLen = 8 + 2 + strlen( $htcpSpecifier );
		$htcpLen = 4 + $htcpDataLen + 2;

		// Note! Squid gets the bit order of the first
		// word wrong, wrt the RFC. Apparently no other
		// implementation exists, so adapt to Squid
		$htcpPacket = pack( 'nxxnCxNxxa*n',
			$htcpLen, $htcpDataLen, $htcpOpCLR,
			$htcpTransID, $htcpSpecifier, 2 );

		wfDebugLog( 'squid', __METHOD__ .
			"Purging URL $url via HTCP" );
		foreach ( $conf as $subconf ) {
			socket_sendto( $conn, $htcpPacket, $htcpLen, 0,
				$subconf['host'], $subconf['port'] );
		}
	}
}
248 
/**
 * Expand a potentially local URL to a fully-qualified URL, using the
 * internal protocol (PROTO_INTERNAL).
 *
 * @param string $url URL to expand
 * @return string Whatever wfExpandUrl() returns for $url
 */
public static function expand( $url ) {
	$expanded = wfExpandUrl( $url, PROTO_INTERNAL );

	return $expanded;
}
266 
/**
 * Find the HTCP routing rule to use for a given URL.
 *
 * Rules are tried in array order and the first match wins. An empty
 * string key matches every URL.
 *
 * @param string $url URL to match
 * @param array $rules Map of regex => routing configuration
 * @return mixed Routing configuration of the first matching rule, or
 *  false if no rule matches
 */
private static function getRuleForURL( $url, $rules ) {
	foreach ( $rules as $pattern => $target ) {
		// Skip rules with a non-empty pattern that does not match
		if ( $pattern !== '' && !preg_match( $pattern, $url ) ) {
			continue;
		}

		return $target;
	}

	return false;
}
282 }
283 
288  // Keep class name for b/c
289 }
const QUICK_VOLATILE
the array() calling protocol came about after MediaWiki 1.4rc1.
static HTCPPurge(array $urlArr)
Send Hyper Text Caching Protocol (HTCP) CLR requests.
$wgSquidServers
List of proxy servers to purge on changes; default port is 80.
static purge(array $urlArr)
Purges a list of CDN nodes defined in $wgSquidServers.
Interface that deferrable updates should implement.
Apache License January AND DISTRIBUTION Definitions License shall mean the terms and conditions for use
static newSequentialPerNodeIDs($bucket, $bits, $count, $flags=0)
Return IDs that are sequential only for this node and bucket.
static newSimplePurge(Title $title)
Handles purging appropriate CDN URLs given a title (or titles)
Interface that deferrable updates can implement.
const NS_SPECIAL
Definition: Defines.php:58
injection txt This is an overview of how MediaWiki makes use of dependency injection The design described here grew from the discussion of RFC T384 The term dependency this means that anything an object needs to operate should be injected from the the object itself should only know narrow no concrete implementation of the logic it relies on The requirement to inject everything typically results in an architecture that based on two main types of and essentially stateless service objects that use other service objects to operate on the value objects As of the beginning MediaWiki is only starting to use the DI approach Much of the code still relies on global state or direct resulting in a highly cyclical dependency MediaWikiServices
Definition: injection.txt:23
Represents a title within MediaWiki.
Definition: Title.php:34
When a variable name is used in a function, it is silently declared as a new local, masking the global.
Definition: design.txt:93
wfExpandUrl($url, $defaultProto=PROTO_CURRENT)
Expand a potentially local URL to a fully-qualified URL.
static getRuleForURL($url, $rules)
Find the HTCP routing rule to use for a given URL.
wfDebugLog($logGroup, $text, $dest= 'all', array $context=[])
Send a line to a supplementary debug log file, if configured, or main debug log if not...
const PROTO_INTERNAL
Definition: Defines.php:266
string[] $urls
Collection of URLs to purge.
An HTTP 1.0 client built for the purposes of purging Squid and Varnish.
doUpdate()
Purges the list of URLs passed to the constructor.
getCdnUrls()
Get a list of URLs to purge from the CDN cache when this page changes.
Definition: Title.php:3572
merge(MergeableUpdate $update)
Merge this update with $update.
__construct(array $urlArr)
namespace and then decline to actually register it file or subcat img or subcat $title
Definition: hooks.txt:912
static expand($url)
Expand local URLs to fully-qualified URLs using the internal protocol and host defined in $wgInternal...
$wgHTCPMulticastTTL
HTCP multicast TTL.
This document is intended to provide useful advice for parties seeking to redistribute MediaWiki to end users. It's targeted particularly at maintainers for Linux, since it's been observed that distribution packages of MediaWiki often break. We've consistently had to recommend that users seeking support use official tarballs instead of their distribution's, and this often solves whatever problem the user is having. It would be nice if this could such as
Definition: distributors.txt:9
static singleton($wiki=false)
injection txt This is an overview of how MediaWiki makes use of dependency injection The design described here grew from the discussion of RFC T384 The term dependency this means that anything an object needs to operate should be injected from the the object itself should only know narrow no concrete implementation of the logic it relies on The requirement to inject everything typically results in an architecture that based on two main types of and essentially stateless service objects that use other service objects to operate on the value objects As of the beginning MediaWiki is only starting to use the DI approach Much of the code still relies on global state or direct resulting in a highly cyclical dependency which acts as the top level factory for services in MediaWiki which can be used to gain access to default instances of various services MediaWikiServices however also allows new services to be defined and default services to be redefined Services are defined or redefined by providing a callback the instantiator that will return a new instance of the service When it will create an instance of MediaWikiServices and populate it with the services defined in the files listed by thereby bootstrapping the DI framework Per $wgServiceWiringFiles lists includes ServiceWiring php
Definition: injection.txt:35
linkcache txt The LinkCache class maintains a list of article titles and the information about whether or not the article exists in the database This is used to mark up links when displaying a page If the same link appears more than once on any page then it only has to be looked up once In most cases link lookups are done in batches with the LinkBatch class or the equivalent in so the link cache is mostly useful for short snippets of parsed and for links in the navigation areas of the skin The link cache was formerly used to track links used in a document for the purposes of updating the link tables This application is now deprecated To create a you can use the following $titles
Definition: linkcache.txt:17
$wgHTCPRouting
Routing configuration for HTCP multicast purging.
static & makeTitle($ns, $title, $fragment= '', $interwiki= '')
Create a new Title from a namespace index and a DB key.
Definition: Title.php:524
Job to purge a set of URLs from CDN.
Definition: CdnPurgeJob.php:30
static newFromTitles($titles, $urlArr=[])
Create an update object from an array of Title objects, or a TitleArray object.
$wgCdnReboundPurgeDelay
If set, any SquidPurge call on a URL or URLs will send a second purge no less than this many seconds ...