MediaWiki 1.40.4
populateFilearchiveSha1.php
Go to the documentation of this file.
1<?php
24require_once __DIR__ . '/Maintenance.php';
25
/**
 * Set up the maintenance script and register its help description.
 */
public function __construct() {
	parent::__construct();

	$description = 'Populate the fa_sha1 field from fa_storage_key';
	$this->addDescription( $description );
}
37
/**
 * Name under which this update is identified.
 *
 * @return string Always 'populate fa_sha1'
 */
protected function getUpdateKey() {
	$updateKey = 'populate fa_sha1';

	return $updateKey;
}
41
/**
 * Text reported when this update is skipped.
 *
 * @return string Human-readable notice that fa_sha1 is already populated
 */
protected function updateSkippedMessage() {
	$notice = 'fa_sha1 column of filearchive table already populated.';

	return $notice;
}
45
/**
 * Populate filearchive.fa_sha1 from fa_storage_key, one batch at a time.
 *
 * Rows are selected where fa_sha1 is the empty string and fa_storage_key
 * is not NULL. Each batch is ordered by fa_id and starts after the last
 * fa_id already seen, so every matching row is visited exactly once.
 * Rows whose fa_storage_key is the empty string are skipped and keep an
 * empty fa_sha1; because the scan is keyed on fa_id they no longer end
 * the run early or get selected again.
 *
 * @return bool False if the fa_sha1 column does not exist, true once all
 *  matching rows have been visited
 */
public function doDBUpdates() {
	$startTime = microtime( true );
	$dbw = $this->getDB( DB_PRIMARY );
	$table = 'filearchive';
	$conds = [ 'fa_sha1' => '', 'fa_storage_key IS NOT NULL' ];

	if ( !$dbw->fieldExists( $table, 'fa_sha1', __METHOD__ ) ) {
		$this->output( "fa_sha1 column does not exist\n\n", true );

		return false;
	}

	$this->output( "Populating fa_sha1 field from fa_storage_key\n" );
	// Highest fa_id in the table; only used for the progress display.
	$endId = (int)$dbw->selectField( $table, 'MAX(fa_id)', '', __METHOD__ );

	$batchSize = $this->getBatchSize();
	$done = 0;
	// Pagination cursor: highest fa_id seen so far.
	// NOTE(review): assumes fa_id values are positive integers - confirm against the schema.
	$lastId = 0;

	do {
		$batchConds = $conds;
		// $lastId is always an int, so concatenating it here is safe.
		$batchConds[] = 'fa_id > ' . $lastId;

		$res = $dbw->select(
			$table,
			[ 'fa_id', 'fa_storage_key' ],
			$batchConds,
			__METHOD__,
			[ 'ORDER BY' => 'fa_id', 'LIMIT' => $batchSize ]
		);

		$fetched = 0;
		foreach ( $res as $row ) {
			// Advance the cursor for every row, including skipped ones,
			// so the next batch never re-reads this row.
			$fetched++;
			$lastId = (int)$row->fa_id;

			if ( $row->fa_storage_key == '' ) {
				// Revision was missing pre-deletion
				continue;
			}

			$sha1 = LocalRepo::getHashFromKey( $row->fa_storage_key );
			$dbw->update( $table,
				[ 'fa_sha1' => $sha1 ],
				[ 'fa_id' => $row->fa_id ],
				__METHOD__
			);
			$done++;
		}

		// A short (or empty) batch means there is nothing left to scan.
		// The count is of rows fetched, not rows updated, so skipped
		// rows cannot end the run prematurely.
		if ( $fetched === 0 || $fetched < $batchSize ) {
			break;
		}

		// print status and let replica DBs catch up
		$percent = $endId > 0 ? $lastId / $endId * 100 : 100.0;
		$this->output( sprintf(
			"id %d done (up to %d), %5.3f%% \r", $lastId, $endId, $percent ) );
		$this->waitForReplication();
	} while ( true );

	$processingTime = microtime( true ) - $startTime;
	$this->output( sprintf( "\nDone %d files in %.1f seconds\n", $done, $processingTime ) );

	// Every matching row has been visited, so report success.
	// NOTE(review): the parent class presumably records the update key
	// when this returns true - confirm in LoggedUpdateMaintenance.
	return true;
}
107}
108
// Store the fully-qualified name of the PopulateFilearchiveSha1 class in $maintClass.
109$maintClass = PopulateFilearchiveSha1::class;
// Load (once) the file whose path is held in the RUN_MAINTENANCE_IF_MAIN constant.
// NOTE(review): presumably that file runs $maintClass when this script is the entry point - confirm.
110require_once RUN_MAINTENANCE_IF_MAIN;
getDB()
Class for scripts that perform database maintenance and want to log the update in the updatelog table so that it can be skipped on later runs.
output( $out, $channel=null)
Throw some output to the user.
waitForReplication()
Wait for replica DBs to catch up.
getBatchSize()
Returns batch size.
addDescription( $text)
Set the description text.
Maintenance script to populate the fa_sha1 field.
__construct()
Default constructor.
updateSkippedMessage()
Message to show that the update was done already and was just skipped.
getUpdateKey()
Get the update key name to go in the update log table.
const DB_PRIMARY
Definition defines.php:28