MediaWiki master
orphanStats.php
Go to the documentation of this file.
1<?php
24// @codeCoverageIgnoreStart
25require_once __DIR__ . '/../Maintenance.php';
26// @codeCoverageIgnoreEnd
27
/**
 * Maintenance script that shows some statistics on the blob_orphans table,
 * created with trackBlobs.php.
 */
class OrphanStats extends Maintenance {
	public function __construct() {
		parent::__construct();
		$this->addDescription(
			"Show some statistics on the blob_orphans table, created with trackBlobs.php" );
	}

	/**
	 * Get a maintenance connection to an external cluster.
	 *
	 * @param int $db Connection index handed to the cluster's load balancer
	 *   (execute() passes DB_REPLICA)
	 * @param string $cluster Cluster identifier handed to getExternalLB()
	 *   (execute() passes the bo_cluster value of a blob_orphans row)
	 * @return object Connection handle as returned by getMaintenanceConnectionRef()
	 */
	protected function getExternalDB( $db, $cluster ) {
		$lbFactory = $this->getServiceContainer()->getDBLoadBalancerFactory();
		$lb = $lbFactory->getExternalLB( $cluster );

		return $lb->getMaintenanceConnectionRef( $db );
	}

	/**
	 * Walk every row of blob_orphans, look up the referenced blob on its
	 * external cluster and print the orphan count, average size, maximum size
	 * and number of distinct texts.
	 *
	 * Orphan rows whose blob can no longer be found are counted and reported
	 * separately; they do not contribute to the size or uniqueness figures.
	 */
	public function execute() {
		if ( !$this->getDB( DB_PRIMARY )->tableExists( 'blob_orphans', __METHOD__ ) ) {
			$this->fatalError( "blob_orphans doesn't seem to exist, need to run trackBlobs.php first" );
		}
		$dbr = $this->getReplicaDB();
		// Only the two columns read in the loop below are needed.
		$res = $dbr->newSelectQueryBuilder()
			->select( [ 'bo_cluster', 'bo_blob_id' ] )
			->from( 'blob_orphans' )
			->caller( __METHOD__ )->fetchResultSet();

		$num = 0;
		$missing = 0;
		$totalSize = 0;
		$hashes = [];
		$maxSize = 0;

		foreach ( $res as $row ) {
			$num++;

			$extDB = $this->getExternalDB( DB_REPLICA, $row->bo_cluster );
			$blobRow = $extDB->newSelectQueryBuilder()
				->select( 'blob_text' )
				->from( 'blobs' )
				->where( [ 'blob_id' => $row->bo_blob_id ] )
				->caller( __METHOD__ )->fetchRow();

			// fetchRow() yields false when no row matches. Dereferencing that
			// would raise a warning and register a bogus zero-length text, so
			// track such orphans separately and leave them out of the stats.
			if ( $blobRow === false ) {
				$missing++;
				continue;
			}

			$text = (string)$blobRow->blob_text;
			$size = strlen( $text );
			$totalSize += $size;
			// Keyed by hash so that identical texts collapse into one entry.
			$hashes[sha1( $text )] = true;
			$maxSize = max( $size, $maxSize );
		}
		unset( $res );

		$this->output( "Number of orphans: $num\n" );
		if ( $missing > 0 ) {
			$this->output( "Number of orphans whose blob row is missing: $missing\n" );
		}

		// Average over the blobs that were actually read; this also guards
		// against dividing by zero when every blob is missing.
		$found = $num - $missing;
		if ( $found > 0 ) {
			$this->output( "Average size: " . round( $totalSize / $found, 0 ) . " bytes\n" .
				"Max size: $maxSize\n" .
				"Number of unique texts: " . count( $hashes ) . "\n" );
		}
	}
}
87
88// @codeCoverageIgnoreStart
89$maintClass = OrphanStats::class;
90require_once RUN_MAINTENANCE_IF_MAIN;
91// @codeCoverageIgnoreEnd
Abstract maintenance class for quickly writing and churning out maintenance scripts with minimal effort.
getDB( $db, $groups=[], $dbDomain=false)
Returns a database to be used by current maintenance script.
output( $out, $channel=null)
Throw some output to the user.
getServiceContainer()
Returns the main service container.
addDescription( $text)
Set the description text.
fatalError( $msg, $exitCode=1)
Output a message and terminate the current script.
Maintenance script that shows some statistics on the blob_orphans table, created with trackBlobs.php.
getExternalDB( $db, $cluster)
__construct()
Default constructor.
execute()
Do the actual work.
$maintClass
const DB_REPLICA
Definition defines.php:26
const DB_PRIMARY
Definition defines.php:28