91 return $zdr->execute();
138 if ( isset( $options[
'zip64'] ) ) {
139 $this->zip64 = $options[
'zip64'];
149 $this->file = fopen( $this->fileName,
'r' );
151 if ( !$this->file ) {
152 return Status::newFatal(
'zip-file-open-error' );
155 $status = Status::newGood();
158 if ( $this->zip64 ) {
162 if ( $this->eocdr[
'CD size'] == 0xffffffff
163 || $this->eocdr[
'CD offset'] == 0xffffffff
164 || $this->eocdr[
'CD entries total'] == 0xffff
166 $this->
error(
'zip-unsupported',
'Central directory header indicates ZIP64, ' .
167 'but we are in legacy mode. Rejecting this upload is necessary to avoid ' .
168 'opening vulnerabilities on clients using OpenJDK 7 or later.' );
178 fclose( $this->file );
189 private function error( $code, $debugMessage ) {
190 wfDebug( __CLASS__ .
": Fatal error: $debugMessage" );
203 'CD start disk' => 2,
204 'CD entries this disk' => 2,
205 'CD entries total' => 2,
208 'file comment length' => 2,
212 if ( $startPos < 0 ) {
217 $this->
error(
'zip-wrong-format',
"The file is empty." );
220 $block = $this->
getBlock( $startPos );
221 $sigPos = strrpos( $block,
"PK\x05\x06" );
222 if ( $sigPos ===
false ) {
223 $this->
error(
'zip-wrong-format',
224 "zip file lacks EOCDR signature. It probably isn't a zip file." );
227 $this->eocdr = $this->
unpack( substr( $block, $sigPos ), $info );
228 $this->eocdr[
'EOCDR size'] = $structSize + $this->eocdr[
'file comment length'];
230 if ( $structSize + $this->eocdr[
'file comment length'] != strlen( $block ) - $sigPos ) {
232 $this->
error(
'zip-wrong-format',
'there is a ZIP signature but it is not at ' .
233 'the end of the file. It could be an OLE file with a ZIP file embedded.' );
235 if ( $this->eocdr[
'disk'] !== 0
236 || $this->eocdr[
'CD start disk'] !== 0
238 $this->
error(
'zip-unsupported',
'more than one disk (in EOCDR)' );
240 $this->eocdr += $this->
unpack(
242 [
'file comment' => [
'string', $this->eocdr[
'file comment length'] ] ],
243 $sigPos + $structSize );
244 $this->eocdr[
'position'] = $startPos + $sigPos;
253 'signature' => [
'string', 4 ],
254 'eocdr64 start disk' => 4,
255 'eocdr64 offset' => 8,
256 'number of disks' => 4,
260 $start = $this->
getFileLength() - $this->eocdr[
'EOCDR size'] - $structSize;
261 $block = $this->
getBlock( $start, $structSize );
262 $this->eocdr64Locator =
$data = $this->
unpack( $block, $info );
264 if (
$data[
'signature'] !==
"PK\x06\x07" ) {
268 $this->
error(
'zip-bad',
'wrong signature on Zip64 end of central directory locator' );
277 if ( $this->eocdr64Locator[
'eocdr64 start disk'] != 0
278 || $this->eocdr64Locator[
'number of disks'] != 0
280 $this->
error(
'zip-unsupported',
'more than one disk (in EOCDR64 locator)' );
284 'signature' => [
'string', 4 ],
286 'version made by' => 2,
287 'version needed' => 2,
289 'CD start disk' => 4,
290 'CD entries this disk' => 8,
291 'CD entries total' => 8,
296 $block = $this->
getBlock( $this->eocdr64Locator[
'eocdr64 offset'], $structSize );
297 $this->eocdr64 =
$data = $this->
unpack( $block, $info );
298 if (
$data[
'signature'] !==
"PK\x06\x06" ) {
299 $this->
error(
'zip-bad',
'wrong signature on Zip64 end of central directory record' );
301 if (
$data[
'disk'] !== 0
302 ||
$data[
'CD start disk'] !== 0
304 $this->
error(
'zip-unsupported',
'more than one disk (in EOCDR64)' );
315 $size = $this->eocdr[
'CD size'];
316 $offset = $this->eocdr[
'CD offset'];
317 $endPos = $this->eocdr[
'position'];
321 if ( $offset + $size != $endPos ) {
322 $this->
error(
'zip-bad',
'the central directory does not immediately precede the end ' .
323 'of central directory record' );
326 return [ $offset, $size ];
339 $size = $this->eocdr[
'CD size'];
340 $offset = $this->eocdr[
'CD offset'];
341 $numEntries = $this->eocdr[
'CD entries total'];
342 $endPos = $this->eocdr[
'position'];
343 if ( $size == 0xffffffff
344 || $offset == 0xffffffff
345 || $numEntries == 0xffff
349 if ( isset( $this->eocdr64Locator[
'eocdr64 offset'] ) ) {
351 if ( isset( $this->eocdr64[
'CD offset'] ) ) {
352 $size = $this->eocdr64[
'CD size'];
353 $offset = $this->eocdr64[
'CD offset'];
354 $endPos = $this->eocdr64Locator[
'eocdr64 offset'];
360 if ( $offset + $size != $endPos ) {
361 $this->
error(
'zip-bad',
'the central directory does not immediately precede the end ' .
362 'of central directory record' );
365 return [ $offset, $size ];
374 $block = $this->
getBlock( $offset, $size );
377 'signature' => [
'string', 4 ],
378 'version made by' => 2,
379 'version needed' => 2,
381 'compression method' => 2,
385 'compressed size' => 4,
386 'uncompressed size' => 4,
388 'extra field length' => 2,
389 'comment length' => 2,
390 'disk number start' => 2,
391 'internal attrs' => 2,
392 'external attrs' => 4,
393 'local header offset' => 4,
398 while ( $pos < $size ) {
402 if (
$data[
'signature'] !==
"PK\x01\x02" ) {
403 $this->
error(
'zip-bad',
'Invalid signature found in directory entry' );
407 'name' => [
'string',
$data[
'name length'] ],
408 'extra field' => [
'string',
$data[
'extra field length'] ],
409 'comment' => [
'string',
$data[
'comment length'] ],
411 $data += $this->
unpack( $block, $variableInfo, $pos );
414 if ( $this->zip64 && (
415 $data[
'compressed size'] == 0xffffffff
416 ||
$data[
'uncompressed size'] == 0xffffffff
417 ||
$data[
'local header offset'] == 0xffffffff )
425 if ( $this->
testBit(
$data[
'general bits'], self::GENERAL_CD_ENCRYPTED ) ) {
426 $this->
error(
'zip-unsupported',
'central directory encryption is not supported' );
432 $time =
$data[
'mod time'];
433 $date =
$data[
'mod date'];
435 $year = 1980 + ( $date >> 9 );
436 $month = ( $date >> 5 ) & 15;
438 $hour = ( $time >> 11 ) & 31;
439 $minute = ( $time >> 5 ) & 63;
440 $second = ( $time & 31 ) * 2;
441 $timestamp = sprintf(
"%04d%02d%02d%02d%02d%02d",
442 $year, $month, $day, $hour, $minute, $second );
445 if ( $this->
testBit(
$data[
'general bits'], self::GENERAL_UTF8 ) ) {
446 $name =
$data[
'name'];
448 $name = iconv(
'CP437',
'UTF-8',
$data[
'name'] );
454 'mtime' => $timestamp,
455 'size' =>
$data[
'uncompressed size'],
457 call_user_func( $this->callback, $userData );
474 'uncompressed size' => 8,
475 'compressed size' => 8,
476 'local header offset' => 8,
477 'disk number start' => 4,
481 while ( $extraPos < strlen( $extraField ) ) {
482 $extra = $this->
unpack( $extraField, $extraHeaderInfo, $extraPos );
483 $extraPos += $extraHeaderSize;
484 $extra += $this->
unpack( $extraField,
485 [
'data' => [
'string', $extra[
'size'] ] ],
487 $extraPos += $extra[
'size'];
489 if ( $extra[
'id'] == self::ZIP64_EXTRA_HEADER ) {
490 return $this->
unpack( $extra[
'data'], $zip64ExtraInfo );
502 if ( $this->fileLength ===
null ) {
503 $stat = fstat( $this->file );
504 $this->fileLength = $stat[
'size'];
520 private function getBlock( $start, $length =
null ) {
523 $this->
error(
'zip-bad',
"getBlock() requested position $start, " .
524 "file length is $fileLength" );
526 if ( $length ===
null ) {
529 $end = $start + $length;
531 $this->
error(
'zip-bad',
"getBlock() requested end position $end, " .
532 "file length is $fileLength" );
534 $startSeg = floor( $start / self::SEGSIZE );
535 $endSeg = ceil( $end / self::SEGSIZE );
538 for ( $segIndex = $startSeg; $segIndex <= $endSeg; $segIndex++ ) {
542 $block = substr( $block,
543 $start - $startSeg * self::SEGSIZE,
546 if ( strlen( $block ) < $length ) {
547 $this->
error(
'zip-bad',
'getBlock() returned an unexpectedly small amount of data' );
567 if ( !isset( $this->buffer[$segIndex] ) ) {
570 $this->buffer[$segIndex] =
'';
574 if ( fseek( $this->file, $bytePos ) ) {
575 $this->
error(
'zip-bad',
"seek to $bytePos failed" );
577 $seg = fread( $this->file, self::SEGSIZE );
578 if ( $seg ===
false ) {
579 $this->
error(
'zip-bad',
"read from $bytePos failed" );
581 $this->buffer[$segIndex] = $seg;
584 return $this->buffer[$segIndex];
594 foreach ( $struct as
$type ) {
595 if ( is_array(
$type ) ) {
596 list( , $fieldSize ) =
$type;
628 private function unpack( $string, $struct, $offset = 0 ) {
630 if ( $offset + $size > strlen( $string ) ) {
631 $this->
error(
'zip-bad',
'unpack() would run past the end of the supplied string' );
636 foreach ( $struct as $key =>
$type ) {
637 if ( is_array(
$type ) ) {
638 list( $typeName, $fieldSize ) =
$type;
639 switch ( $typeName ) {
641 $data[$key] = substr( $string, $pos, $fieldSize );
645 throw new MWException( __METHOD__ .
": invalid type \"$typeName\"" );
649 $length = intval(
$type );
654 for ( $i = $length - 1; $i >= 0; $i-- ) {
656 $value += ord( $string[$pos + $i] );
660 if ( $value > 2 ** 52 ) {
661 $this->
error(
'zip-unsupported',
'number too large to be stored in a double. ' .
662 'This could happen if we tried to unpack a 64-bit structure ' .
663 'at an invalid location.' );
665 $data[$key] = $value;
681 private function testBit( $value, $bitIndex ) {
682 return (
bool)( ( $value >> $bitIndex ) & 1 );
wfDebug( $text, $dest='all', array $context=[])
Sends a line to the debug log if enabled or, optionally, to a comment in output.
Internal exception class.
A class for reading ZIP file directories, for the purposes of upload verification.
$callback
The file data callback.
const GENERAL_UTF8
The index of the "general field" bit for UTF-8 file names.
readEndOfCentralDirectoryRecord()
Read the header which is at the end of the central directory, unimaginatively called the "end of central directory record".
error( $code, $debugMessage)
Throw an error, and log a debug message.
execute()
Read the directory according to settings in $this.
__construct( $fileName, $callback, $options)
readZip64EndOfCentralDirectoryRecord()
Read the header called the "ZIP64 end of central directory record".
getSegment( $segIndex)
Get a section of the file starting at position $segIndex * self::SEGSIZE, of length self::SEGSIZE.
const ZIP64_EXTRA_HEADER
The "extra field" ID for ZIP64 central directory entries.
findZip64CentralDirectory()
Find the location of the central directory, as would be seen by a ZIP64-compliant reader.
$file
The opened file resource.
static read( $fileName, $callback, $options=[])
Read a ZIP file and call a function for each file discovered in it.
testBit( $value, $bitIndex)
Returns a bit from a given position in an integer value, converted to boolean.
getFileLength()
Get the length of the file.
const GENERAL_CD_ENCRYPTED
The index of the "general field" bit for central directory encryption.
getStructSize( $struct)
Get the size of a structure in bytes.
readZip64EndOfCentralDirectoryLocator()
Read the header called the "ZIP64 end of central directory locator".
findOldCentralDirectory()
Find the location of the central directory, as would be seen by a non-ZIP64 reader.
$buffer
A segmented cache of the file contents.
getBlock( $start, $length=null)
Get the file contents from a given offset.
unpack( $string, $struct, $offset=0)
Unpack a binary structure.
const SEGSIZE
The segment size for the file contents cache.
$fileLength
The cached length of the file, or null if it has not been loaded yet.
readCentralDirectory( $offset, $size)
Read the central directory at the given location.
unpackZip64Extra( $extraField)
Interpret ZIP64 "extra field" data and return an associative array.