MediaWiki master
resolveStubs.php
Go to the documentation of this file.
1<?php
27
28// @codeCoverageIgnoreStart
29require_once __DIR__ . '/../Maintenance.php';
30// @codeCoverageIgnoreEnd
31
/**
 * Maintenance script that converts history stubs pointing to an external row
 * into direct external pointers.
 */
class ResolveStubs extends Maintenance {
	/** @var UndoLog Performs the row updates; set by execute() or setUndoLog() */
	private $undoLog;

	public function __construct() {
		parent::__construct();
		$this->setBatchSize( 1000 );
		$this->addOption( 'dry-run', 'Don\'t update any rows' );
		$this->addOption( 'undo', 'Undo log location', false, true );
	}

	/**
	 * Convert history stubs that point to an external row to direct external pointers.
	 *
	 * Walks the text table in old_id ranges of the configured batch size, selects
	 * the rows that look like serialized HistoryBlobStub objects and passes each
	 * one to resolveStub(). Progress and a final summary are written to the output.
	 */
	public function execute() {
		$dbw = $this->getPrimaryDB();
		$dbr = $this->getReplicaDB();
		$maxID = $dbr->newSelectQueryBuilder()
			->select( 'MAX(old_id)' )
			->from( 'text' )
			->caller( __METHOD__ )->fetchField();
		$blockSize = $this->getBatchSize();
		$dryRun = $this->getOption( 'dry-run' );
		$this->setUndoLog( new UndoLog( $this->getOption( 'undo' ), $dbw ) );

		// The "+ 1" covers the final, partially filled block of IDs
		$numBlocks = intval( $maxID / $blockSize ) + 1;
		$numResolved = 0;
		$numTotal = 0;

		for ( $b = 0; $b < $numBlocks; $b++ ) {
			$this->waitForReplication();

			$this->output( sprintf( "%5.2f%%\n", $b / $numBlocks * 100 ) );
			// Inclusive old_id range of this block: [start, end]
			$start = $blockSize * $b + 1;
			$end = $blockSize * ( $b + 1 );

			$res = $dbr->newSelectQueryBuilder()
				->select( [ 'old_id', 'old_text', 'old_flags' ] )
				->from( 'text' )
				->where(
					"old_id>=$start AND old_id<=$end " .
					"AND old_flags LIKE '%object%' AND old_flags NOT LIKE '%external%' " .
					// LOWER() doesn't work on binary text, need to convert
					'AND LOWER(CONVERT(LEFT(old_text,22) USING latin1)) = \'o:15:"historyblobstub"\''
				)
				->caller( __METHOD__ )->fetchResultSet();
			foreach ( $res as $row ) {
				if ( $this->resolveStub( $row, $dryRun ) ) {
					$numResolved++;
				}
				$numTotal++;
			}
		}
		$this->output( "100%\n" );
		$this->output( "$numResolved of $numTotal stubs resolved\n" );
	}

	/**
	 * Set the UndoLog used by resolveStub() to update rows.
	 *
	 * @param UndoLog $undoLog
	 */
	public function setUndoLog( UndoLog $undoLog ) {
		$this->undoLog = $undoLog;
	}

	/**
	 * Resolve a history stub.
	 *
	 * Unserializes the stub stored in the row, looks up the text row it points
	 * to, and, if that row holds a plain "DB://x/y" external address, rewrites
	 * the stub row as an external pointer "DB://x/y/<hash>".
	 *
	 * @param stdClass $row Row of the text table with the fields old_id,
	 *   old_text and old_flags
	 * @param bool $dryRun If true, only print what would be changed
	 * @return bool True if the stub was resolved (or would be, in a dry run),
	 *   false if it was skipped because of an error
	 */
	public function resolveStub( $row, $dryRun ) {
		$id = $row->old_id;
		// NOTE(review): unserialize() runs on data read from the text table;
		// it returns false when the blob cannot be decoded.
		$stub = unserialize( $row->old_text );
		$flags = SqlBlobStore::explodeFlags( $row->old_flags );

		if ( !( $stub instanceof HistoryBlobStub ) ) {
			// get_class() only accepts objects, so describe scalars (such as the
			// false returned by a failed unserialize()) by their type instead.
			$found = is_object( $stub )
				? 'object of class ' . get_class( $stub )
				: 'value of type ' . gettype( $stub );
			print "Error at old_id $id: found $found, expecting HistoryBlobStub\n";
			return false;
		}

		$mainId = $stub->getLocation();
		if ( !$mainId ) {
			print "Error at old_id $id: falsey location\n";
			return false;
		}

		# Get the main text row
		$mainTextRow = $this->getReplicaDB()->newSelectQueryBuilder()
			->select( [ 'old_text', 'old_flags' ] )
			->from( 'text' )
			->where( [ 'old_id' => $mainId ] )
			->caller( __METHOD__ )->fetchRow();

		if ( !$mainTextRow ) {
			print "Error at old_id $id: can't find main text row old_id $mainId\n";
			return false;
		}

		$mainFlags = SqlBlobStore::explodeFlags( $mainTextRow->old_flags );
		$mainText = $mainTextRow->old_text;

		if ( !in_array( 'external', $mainFlags ) ) {
			print "Error at old_id $id: target $mainId is not external\n";
			return false;
		}
		# Only a bare two-component address can have the stub's hash appended;
		# addresses that already carry a third component are rejected.
		if ( preg_match( '!^DB://([^/]*)/([^/]*)/[0-9a-f]{32}$!', $mainText ) ) {
			print "Error at old_id $id: target $mainId is a CGZ pointer\n";
			return false;
		}
		if ( preg_match( '!^DB://([^/]*)/([^/]*)/[0-9]{1,6}$!', $mainText ) ) {
			print "Error at old_id $id: target $mainId is a DHB pointer\n";
			return false;
		}
		if ( !preg_match( '!^DB://([^/]*)/([^/]*)$!', $mainText ) ) {
			print "Error at old_id $id: target $mainId has unrecognised text\n";
			return false;
		}

		# Preserve the legacy encoding flag, but switch from object to external
		if ( in_array( 'utf-8', $flags ) ) {
			$newFlags = 'utf-8,external';
		} else {
			$newFlags = 'external';
		}
		$newText = $mainText . '/' . $stub->getHash();

		# Update the row
		if ( $dryRun ) {
			$this->output( "Resolve $id => $newFlags $newText\n" );
			return true;
		}

		// The row as originally read is passed along with the new values;
		// presumably it serves as the match condition, so a row that changed
		// in the meantime is left alone (confirm against UndoLog::update()).
		$updated = $this->undoLog->update(
			'text',
			[
				'old_flags' => $newFlags,
				'old_text' => $newText
			],
			(array)$row,
			__METHOD__
		);
		if ( !$updated ) {
			$this->output( "Update of old_id $id failed to match\n" );
			return false;
		}
		return true;
	}
}
181
182// @codeCoverageIgnoreStart
183$maintClass = ResolveStubs::class;
184require_once RUN_MAINTENANCE_IF_MAIN;
185// @codeCoverageIgnoreEnd
Pointer object for an item within a CGZ blob stored in the text table.
Update a database while optionally writing SQL that reverses the update to a file.
Definition UndoLog.php:11
Service for storing and loading Content objects representing revision data blobs.
setUndoLog(UndoLog $undoLog)
resolveStub( $row, $dryRun)
Resolve a history stub.
execute()
Convert history stubs that point to an external row to direct external pointers.
$maintClass