This project does not seem to handle request data directly as such no vulnerable execution paths were found.
include
, or for example
via PHP's auto-loading mechanism.
These results are based on our legacy PHP analysis, consider migrating to our new PHP analysis engine instead. Learn more
1 | <?php |
||
2 | /** |
||
3 | * ZIP file directories reader, for the purposes of upload verification. |
||
4 | * |
||
5 | * This program is free software; you can redistribute it and/or modify |
||
6 | * it under the terms of the GNU General Public License as published by |
||
7 | * the Free Software Foundation; either version 2 of the License, or |
||
8 | * (at your option) any later version. |
||
9 | * |
||
10 | * This program is distributed in the hope that it will be useful, |
||
11 | * but WITHOUT ANY WARRANTY; without even the implied warranty of |
||
12 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
||
13 | * GNU General Public License for more details. |
||
14 | * |
||
15 | * You should have received a copy of the GNU General Public License along |
||
16 | * with this program; if not, write to the Free Software Foundation, Inc., |
||
17 | * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA. |
||
18 | * http://www.gnu.org/copyleft/gpl.html |
||
19 | * |
||
20 | * @file |
||
21 | */ |
||
22 | |||
23 | /** |
||
24 | * A class for reading ZIP file directories, for the purposes of upload |
||
25 | * verification. |
||
26 | * |
||
27 | * Only a functional interface is provided: ZipFileReader::read(). No access is |
||
28 | * given to object instances. |
||
29 | * |
||
30 | */ |
||
31 | class ZipDirectoryReader { |
||
32 | /** |
||
33 | * Read a ZIP file and call a function for each file discovered in it. |
||
34 | * |
||
35 | * Because this class is aimed at verification, an error is raised on |
||
36 | * suspicious or ambiguous input, instead of emulating some standard |
||
37 | * behavior. |
||
38 | * |
||
39 | * @param string $fileName The archive file name |
||
40 | * @param array $callback The callback function. It will be called for each file |
||
41 | * with a single associative array each time, with members: |
||
42 | * |
||
43 | * - name: The file name. Directories conventionally have a trailing |
||
44 | * slash. |
||
45 | * |
||
46 | * - mtime: The file modification time, in MediaWiki 14-char format |
||
47 | * |
||
48 | * - size: The uncompressed file size |
||
49 | * |
||
50 | * @param array $options An associative array of read options, with the option |
||
51 | * name in the key. This may currently contain: |
||
52 | * |
||
53 | * - zip64: If this is set to true, then we will emulate a |
||
54 | * library with ZIP64 support, like OpenJDK 7. If it is set to |
||
55 | * false, then we will emulate a library with no knowledge of |
||
56 | * ZIP64. |
||
57 | * |
||
58 | * NOTE: The ZIP64 code is untested and probably doesn't work. It |
||
59 | * turned out to be easier to just reject ZIP64 archive uploads, |
||
60 | * since they are likely to be very rare. Confirming safety of a |
||
61 | * ZIP64 file is fairly complex. What do you do with a file that is |
||
62 | * ambiguous and broken when read with a non-ZIP64 reader, but valid |
||
63 | * when read with a ZIP64 reader? This situation is normal for a |
||
64 | * valid ZIP64 file, and working out what non-ZIP64 readers will make |
||
65 | * of such a file is not trivial. |
||
66 | * |
||
67 | * @return Status A Status object. The following fatal errors are defined: |
||
68 | * |
||
69 | * - zip-file-open-error: The file could not be opened. |
||
70 | * |
||
71 | * - zip-wrong-format: The file does not appear to be a ZIP file. |
||
72 | * |
||
73 | * - zip-bad: There was something wrong or ambiguous about the file |
||
74 | * data. |
||
75 | * |
||
76 | * - zip-unsupported: The ZIP file uses features which |
||
77 | * ZipDirectoryReader does not support. |
||
78 | * |
||
79 | * The default messages for those fatal errors are written in a way that |
||
80 | * makes sense for upload verification. |
||
81 | * |
||
82 | * If a fatal error is returned, more information about the error will be |
||
83 | * available in the debug log. |
||
84 | * |
||
85 | * Note that the callback function may be called any number of times before |
||
86 | * a fatal error is returned. If this occurs, the data sent to the callback |
||
87 | * function should be discarded. |
||
88 | */ |
||
89 | public static function read( $fileName, $callback, $options = [] ) { |
||
90 | $zdr = new self( $fileName, $callback, $options ); |
||
91 | |||
92 | return $zdr->execute(); |
||
93 | } |
||
94 | |||
95 | /** The file name */ |
||
96 | protected $fileName; |
||
97 | |||
98 | /** The opened file resource */ |
||
99 | protected $file; |
||
100 | |||
101 | /** The cached length of the file, or null if it has not been loaded yet. */ |
||
102 | protected $fileLength; |
||
103 | |||
104 | /** A segmented cache of the file contents */ |
||
105 | protected $buffer; |
||
106 | |||
107 | /** The file data callback */ |
||
108 | protected $callback; |
||
109 | |||
110 | /** The ZIP64 mode */ |
||
111 | protected $zip64 = false; |
||
112 | |||
113 | /** Stored headers */ |
||
114 | protected $eocdr, $eocdr64, $eocdr64Locator; |
||
0 ignored issues
–
show
|
|||
115 | |||
116 | protected $data; |
||
117 | |||
118 | /** The "extra field" ID for ZIP64 central directory entries */ |
||
119 | const ZIP64_EXTRA_HEADER = 0x0001; |
||
120 | |||
121 | /** The segment size for the file contents cache */ |
||
122 | const SEGSIZE = 16384; |
||
123 | |||
124 | /** The index of the "general field" bit for UTF-8 file names */ |
||
125 | const GENERAL_UTF8 = 11; |
||
126 | |||
127 | /** The index of the "general field" bit for central directory encryption */ |
||
128 | const GENERAL_CD_ENCRYPTED = 13; |
||
129 | |||
130 | /** |
||
131 | * Private constructor |
||
132 | * @param string $fileName |
||
133 | * @param callable $callback |
||
134 | * @param array $options |
||
135 | */ |
||
136 | protected function __construct( $fileName, $callback, $options ) { |
||
137 | $this->fileName = $fileName; |
||
138 | $this->callback = $callback; |
||
139 | |||
140 | if ( isset( $options['zip64'] ) ) { |
||
141 | $this->zip64 = $options['zip64']; |
||
142 | } |
||
143 | } |
||
144 | |||
145 | /** |
||
146 | * Read the directory according to settings in $this. |
||
147 | * |
||
148 | * @return Status |
||
149 | */ |
||
150 | function execute() { |
||
151 | $this->file = fopen( $this->fileName, 'r' ); |
||
152 | $this->data = []; |
||
153 | if ( !$this->file ) { |
||
154 | return Status::newFatal( 'zip-file-open-error' ); |
||
155 | } |
||
156 | |||
157 | $status = Status::newGood(); |
||
158 | try { |
||
159 | $this->readEndOfCentralDirectoryRecord(); |
||
160 | if ( $this->zip64 ) { |
||
161 | list( $offset, $size ) = $this->findZip64CentralDirectory(); |
||
162 | $this->readCentralDirectory( $offset, $size ); |
||
163 | } else { |
||
164 | if ( $this->eocdr['CD size'] == 0xffffffff |
||
165 | || $this->eocdr['CD offset'] == 0xffffffff |
||
166 | || $this->eocdr['CD entries total'] == 0xffff |
||
167 | ) { |
||
168 | $this->error( 'zip-unsupported', 'Central directory header indicates ZIP64, ' . |
||
169 | 'but we are in legacy mode. Rejecting this upload is necessary to avoid ' . |
||
170 | 'opening vulnerabilities on clients using OpenJDK 7 or later.' ); |
||
171 | } |
||
172 | |||
173 | list( $offset, $size ) = $this->findOldCentralDirectory(); |
||
174 | $this->readCentralDirectory( $offset, $size ); |
||
175 | } |
||
176 | } catch ( ZipDirectoryReaderError $e ) { |
||
177 | $status->fatal( $e->getErrorCode() ); |
||
178 | } |
||
179 | |||
180 | fclose( $this->file ); |
||
181 | |||
182 | return $status; |
||
183 | } |
||
184 | |||
185 | /** |
||
186 | * Throw an error, and log a debug message |
||
187 | * @param mixed $code |
||
188 | * @param string $debugMessage |
||
189 | * @throws ZipDirectoryReaderError |
||
190 | */ |
||
191 | function error( $code, $debugMessage ) { |
||
192 | wfDebug( __CLASS__ . ": Fatal error: $debugMessage\n" ); |
||
193 | throw new ZipDirectoryReaderError( $code ); |
||
194 | } |
||
195 | |||
196 | /** |
||
197 | * Read the header which is at the end of the central directory, |
||
198 | * unimaginatively called the "end of central directory record" by the ZIP |
||
199 | * spec. |
||
200 | */ |
||
201 | function readEndOfCentralDirectoryRecord() { |
||
202 | $info = [ |
||
203 | 'signature' => 4, |
||
204 | 'disk' => 2, |
||
205 | 'CD start disk' => 2, |
||
206 | 'CD entries this disk' => 2, |
||
207 | 'CD entries total' => 2, |
||
208 | 'CD size' => 4, |
||
209 | 'CD offset' => 4, |
||
210 | 'file comment length' => 2, |
||
211 | ]; |
||
212 | $structSize = $this->getStructSize( $info ); |
||
213 | $startPos = $this->getFileLength() - 65536 - $structSize; |
||
214 | if ( $startPos < 0 ) { |
||
215 | $startPos = 0; |
||
216 | } |
||
217 | |||
218 | if ( $this->getFileLength() === 0 ) { |
||
219 | $this->error( 'zip-wrong-format', "The file is empty." ); |
||
220 | } |
||
221 | |||
222 | $block = $this->getBlock( $startPos ); |
||
223 | $sigPos = strrpos( $block, "PK\x05\x06" ); |
||
224 | if ( $sigPos === false ) { |
||
225 | $this->error( 'zip-wrong-format', |
||
226 | "zip file lacks EOCDR signature. It probably isn't a zip file." ); |
||
227 | } |
||
228 | |||
229 | $this->eocdr = $this->unpack( substr( $block, $sigPos ), $info ); |
||
230 | $this->eocdr['EOCDR size'] = $structSize + $this->eocdr['file comment length']; |
||
231 | |||
232 | if ( $structSize + $this->eocdr['file comment length'] != strlen( $block ) - $sigPos ) { |
||
233 | $this->error( 'zip-bad', 'trailing bytes after the end of the file comment' ); |
||
234 | } |
||
235 | if ( $this->eocdr['disk'] !== 0 |
||
236 | || $this->eocdr['CD start disk'] !== 0 |
||
237 | ) { |
||
238 | $this->error( 'zip-unsupported', 'more than one disk (in EOCDR)' ); |
||
239 | } |
||
240 | $this->eocdr += $this->unpack( |
||
241 | $block, |
||
242 | [ 'file comment' => [ 'string', $this->eocdr['file comment length'] ] ], |
||
243 | $sigPos + $structSize ); |
||
244 | $this->eocdr['position'] = $startPos + $sigPos; |
||
245 | } |
||
246 | |||
247 | /** |
||
248 | * Read the header called the "ZIP64 end of central directory locator". An |
||
249 | * error will be raised if it does not exist. |
||
250 | */ |
||
251 | function readZip64EndOfCentralDirectoryLocator() { |
||
252 | $info = [ |
||
253 | 'signature' => [ 'string', 4 ], |
||
254 | 'eocdr64 start disk' => 4, |
||
255 | 'eocdr64 offset' => 8, |
||
256 | 'number of disks' => 4, |
||
257 | ]; |
||
258 | $structSize = $this->getStructSize( $info ); |
||
259 | |||
260 | $start = $this->getFileLength() - $this->eocdr['EOCDR size'] - $structSize; |
||
261 | $block = $this->getBlock( $start, $structSize ); |
||
262 | $this->eocdr64Locator = $data = $this->unpack( $block, $info ); |
||
263 | |||
264 | if ( $data['signature'] !== "PK\x06\x07" ) { |
||
265 | // Note: Java will allow this and continue to read the |
||
266 | // EOCDR64, so we have to reject the upload, we can't |
||
267 | // just use the EOCDR header instead. |
||
268 | $this->error( 'zip-bad', 'wrong signature on Zip64 end of central directory locator' ); |
||
269 | } |
||
270 | } |
||
271 | |||
272 | /** |
||
273 | * Read the header called the "ZIP64 end of central directory record". It |
||
274 | * may replace the regular "end of central directory record" in ZIP64 files. |
||
275 | */ |
||
276 | function readZip64EndOfCentralDirectoryRecord() { |
||
277 | if ( $this->eocdr64Locator['eocdr64 start disk'] != 0 |
||
278 | || $this->eocdr64Locator['number of disks'] != 0 |
||
279 | ) { |
||
280 | $this->error( 'zip-unsupported', 'more than one disk (in EOCDR64 locator)' ); |
||
281 | } |
||
282 | |||
283 | $info = [ |
||
284 | 'signature' => [ 'string', 4 ], |
||
285 | 'EOCDR64 size' => 8, |
||
286 | 'version made by' => 2, |
||
287 | 'version needed' => 2, |
||
288 | 'disk' => 4, |
||
289 | 'CD start disk' => 4, |
||
290 | 'CD entries this disk' => 8, |
||
291 | 'CD entries total' => 8, |
||
292 | 'CD size' => 8, |
||
293 | 'CD offset' => 8 |
||
294 | ]; |
||
295 | $structSize = $this->getStructSize( $info ); |
||
296 | $block = $this->getBlock( $this->eocdr64Locator['eocdr64 offset'], $structSize ); |
||
297 | $this->eocdr64 = $data = $this->unpack( $block, $info ); |
||
298 | if ( $data['signature'] !== "PK\x06\x06" ) { |
||
299 | $this->error( 'zip-bad', 'wrong signature on Zip64 end of central directory record' ); |
||
300 | } |
||
301 | if ( $data['disk'] !== 0 |
||
302 | || $data['CD start disk'] !== 0 |
||
303 | ) { |
||
304 | $this->error( 'zip-unsupported', 'more than one disk (in EOCDR64)' ); |
||
305 | } |
||
306 | } |
||
307 | |||
308 | /** |
||
309 | * Find the location of the central directory, as would be seen by a |
||
310 | * non-ZIP64 reader. |
||
311 | * |
||
312 | * @return array List containing offset, size and end position. |
||
313 | */ |
||
314 | function findOldCentralDirectory() { |
||
315 | $size = $this->eocdr['CD size']; |
||
316 | $offset = $this->eocdr['CD offset']; |
||
317 | $endPos = $this->eocdr['position']; |
||
318 | |||
319 | // Some readers use the EOCDR position instead of the offset field |
||
320 | // to find the directory, so to be safe, we check if they both agree. |
||
321 | if ( $offset + $size != $endPos ) { |
||
322 | $this->error( 'zip-bad', 'the central directory does not immediately precede the end ' . |
||
323 | 'of central directory record' ); |
||
324 | } |
||
325 | |||
326 | return [ $offset, $size ]; |
||
327 | } |
||
328 | |||
329 | /** |
||
330 | * Find the location of the central directory, as would be seen by a |
||
331 | * ZIP64-compliant reader. |
||
332 | * |
||
333 | * @return array List containing offset, size and end position. |
||
334 | */ |
||
335 | function findZip64CentralDirectory() { |
||
336 | // The spec is ambiguous about the exact rules of precedence between the |
||
337 | // ZIP64 headers and the original headers. Here we follow zip_util.c |
||
338 | // from OpenJDK 7. |
||
339 | $size = $this->eocdr['CD size']; |
||
340 | $offset = $this->eocdr['CD offset']; |
||
341 | $numEntries = $this->eocdr['CD entries total']; |
||
342 | $endPos = $this->eocdr['position']; |
||
343 | if ( $size == 0xffffffff |
||
344 | || $offset == 0xffffffff |
||
345 | || $numEntries == 0xffff |
||
346 | ) { |
||
347 | $this->readZip64EndOfCentralDirectoryLocator(); |
||
348 | |||
349 | if ( isset( $this->eocdr64Locator['eocdr64 offset'] ) ) { |
||
350 | $this->readZip64EndOfCentralDirectoryRecord(); |
||
351 | if ( isset( $this->eocdr64['CD offset'] ) ) { |
||
352 | $size = $this->eocdr64['CD size']; |
||
353 | $offset = $this->eocdr64['CD offset']; |
||
354 | $endPos = $this->eocdr64Locator['eocdr64 offset']; |
||
355 | } |
||
356 | } |
||
357 | } |
||
358 | // Some readers use the EOCDR position instead of the offset field |
||
359 | // to find the directory, so to be safe, we check if they both agree. |
||
360 | if ( $offset + $size != $endPos ) { |
||
361 | $this->error( 'zip-bad', 'the central directory does not immediately precede the end ' . |
||
362 | 'of central directory record' ); |
||
363 | } |
||
364 | |||
365 | return [ $offset, $size ]; |
||
366 | } |
||
367 | |||
368 | /** |
||
369 | * Read the central directory at the given location |
||
370 | * @param int $offset |
||
371 | * @param int $size |
||
372 | */ |
||
373 | function readCentralDirectory( $offset, $size ) { |
||
374 | $block = $this->getBlock( $offset, $size ); |
||
375 | |||
376 | $fixedInfo = [ |
||
377 | 'signature' => [ 'string', 4 ], |
||
378 | 'version made by' => 2, |
||
379 | 'version needed' => 2, |
||
380 | 'general bits' => 2, |
||
381 | 'compression method' => 2, |
||
382 | 'mod time' => 2, |
||
383 | 'mod date' => 2, |
||
384 | 'crc-32' => 4, |
||
385 | 'compressed size' => 4, |
||
386 | 'uncompressed size' => 4, |
||
387 | 'name length' => 2, |
||
388 | 'extra field length' => 2, |
||
389 | 'comment length' => 2, |
||
390 | 'disk number start' => 2, |
||
391 | 'internal attrs' => 2, |
||
392 | 'external attrs' => 4, |
||
393 | 'local header offset' => 4, |
||
394 | ]; |
||
395 | $fixedSize = $this->getStructSize( $fixedInfo ); |
||
396 | |||
397 | $pos = 0; |
||
398 | while ( $pos < $size ) { |
||
399 | $data = $this->unpack( $block, $fixedInfo, $pos ); |
||
400 | $pos += $fixedSize; |
||
401 | |||
402 | if ( $data['signature'] !== "PK\x01\x02" ) { |
||
403 | $this->error( 'zip-bad', 'Invalid signature found in directory entry' ); |
||
404 | } |
||
405 | |||
406 | $variableInfo = [ |
||
407 | 'name' => [ 'string', $data['name length'] ], |
||
408 | 'extra field' => [ 'string', $data['extra field length'] ], |
||
409 | 'comment' => [ 'string', $data['comment length'] ], |
||
410 | ]; |
||
411 | $data += $this->unpack( $block, $variableInfo, $pos ); |
||
412 | $pos += $this->getStructSize( $variableInfo ); |
||
413 | |||
414 | if ( $this->zip64 && ( |
||
415 | $data['compressed size'] == 0xffffffff |
||
416 | || $data['uncompressed size'] == 0xffffffff |
||
417 | || $data['local header offset'] == 0xffffffff ) |
||
418 | ) { |
||
419 | $zip64Data = $this->unpackZip64Extra( $data['extra field'] ); |
||
420 | if ( $zip64Data ) { |
||
421 | $data = $zip64Data + $data; |
||
422 | } |
||
423 | } |
||
424 | |||
425 | if ( $this->testBit( $data['general bits'], self::GENERAL_CD_ENCRYPTED ) ) { |
||
426 | $this->error( 'zip-unsupported', 'central directory encryption is not supported' ); |
||
427 | } |
||
428 | |||
429 | // Convert the timestamp into MediaWiki format |
||
430 | // For the format, please see the MS-DOS 2.0 Programmer's Reference, |
||
431 | // pages 3-5 and 3-6. |
||
432 | $time = $data['mod time']; |
||
433 | $date = $data['mod date']; |
||
434 | |||
435 | $year = 1980 + ( $date >> 9 ); |
||
436 | $month = ( $date >> 5 ) & 15; |
||
437 | $day = $date & 31; |
||
438 | $hour = ( $time >> 11 ) & 31; |
||
439 | $minute = ( $time >> 5 ) & 63; |
||
440 | $second = ( $time & 31 ) * 2; |
||
441 | $timestamp = sprintf( "%04d%02d%02d%02d%02d%02d", |
||
442 | $year, $month, $day, $hour, $minute, $second ); |
||
443 | |||
444 | // Convert the character set in the file name |
||
445 | if ( $this->testBit( $data['general bits'], self::GENERAL_UTF8 ) ) { |
||
446 | $name = $data['name']; |
||
447 | } else { |
||
448 | $name = iconv( 'CP437', 'UTF-8', $data['name'] ); |
||
449 | } |
||
450 | |||
451 | // Compile a data array for the user, with a sensible format |
||
452 | $userData = [ |
||
453 | 'name' => $name, |
||
454 | 'mtime' => $timestamp, |
||
455 | 'size' => $data['uncompressed size'], |
||
456 | ]; |
||
457 | call_user_func( $this->callback, $userData ); |
||
458 | } |
||
459 | } |
||
460 | |||
461 | /** |
||
462 | * Interpret ZIP64 "extra field" data and return an associative array. |
||
463 | * @param string $extraField |
||
464 | * @return array|bool |
||
465 | */ |
||
466 | function unpackZip64Extra( $extraField ) { |
||
467 | $extraHeaderInfo = [ |
||
468 | 'id' => 2, |
||
469 | 'size' => 2, |
||
470 | ]; |
||
471 | $extraHeaderSize = $this->getStructSize( $extraHeaderInfo ); |
||
472 | |||
473 | $zip64ExtraInfo = [ |
||
474 | 'uncompressed size' => 8, |
||
475 | 'compressed size' => 8, |
||
476 | 'local header offset' => 8, |
||
477 | 'disk number start' => 4, |
||
478 | ]; |
||
479 | |||
480 | $extraPos = 0; |
||
481 | while ( $extraPos < strlen( $extraField ) ) { |
||
482 | $extra = $this->unpack( $extraField, $extraHeaderInfo, $extraPos ); |
||
483 | $extraPos += $extraHeaderSize; |
||
484 | $extra += $this->unpack( $extraField, |
||
485 | [ 'data' => [ 'string', $extra['size'] ] ], |
||
486 | $extraPos ); |
||
487 | $extraPos += $extra['size']; |
||
488 | |||
489 | if ( $extra['id'] == self::ZIP64_EXTRA_HEADER ) { |
||
490 | return $this->unpack( $extra['data'], $zip64ExtraInfo ); |
||
491 | } |
||
492 | } |
||
493 | |||
494 | return false; |
||
495 | } |
||
496 | |||
497 | /** |
||
498 | * Get the length of the file. |
||
499 | * @return int |
||
500 | */ |
||
501 | function getFileLength() { |
||
502 | if ( $this->fileLength === null ) { |
||
503 | $stat = fstat( $this->file ); |
||
504 | $this->fileLength = $stat['size']; |
||
505 | } |
||
506 | |||
507 | return $this->fileLength; |
||
508 | } |
||
509 | |||
510 | /** |
||
511 | * Get the file contents from a given offset. If there are not enough bytes |
||
512 | * in the file to satisfy the request, an exception will be thrown. |
||
513 | * |
||
514 | * @param int $start The byte offset of the start of the block. |
||
515 | * @param int $length The number of bytes to return. If omitted, the remainder |
||
516 | * of the file will be returned. |
||
517 | * |
||
518 | * @return string |
||
519 | */ |
||
520 | function getBlock( $start, $length = null ) { |
||
521 | $fileLength = $this->getFileLength(); |
||
522 | if ( $start >= $fileLength ) { |
||
523 | $this->error( 'zip-bad', "getBlock() requested position $start, " . |
||
524 | "file length is $fileLength" ); |
||
525 | } |
||
526 | if ( $length === null ) { |
||
527 | $length = $fileLength - $start; |
||
528 | } |
||
529 | $end = $start + $length; |
||
530 | if ( $end > $fileLength ) { |
||
531 | $this->error( 'zip-bad', "getBlock() requested end position $end, " . |
||
532 | "file length is $fileLength" ); |
||
533 | } |
||
534 | $startSeg = floor( $start / self::SEGSIZE ); |
||
535 | $endSeg = ceil( $end / self::SEGSIZE ); |
||
536 | |||
537 | $block = ''; |
||
538 | for ( $segIndex = $startSeg; $segIndex <= $endSeg; $segIndex++ ) { |
||
539 | $block .= $this->getSegment( $segIndex ); |
||
540 | } |
||
541 | |||
542 | $block = substr( $block, |
||
543 | $start - $startSeg * self::SEGSIZE, |
||
544 | $length ); |
||
545 | |||
546 | if ( strlen( $block ) < $length ) { |
||
547 | $this->error( 'zip-bad', 'getBlock() returned an unexpectedly small amount of data' ); |
||
548 | } |
||
549 | |||
550 | return $block; |
||
551 | } |
||
552 | |||
553 | /** |
||
554 | * Get a section of the file starting at position $segIndex * self::SEGSIZE, |
||
555 | * of length self::SEGSIZE. The result is cached. This is a helper function |
||
556 | * for getBlock(). |
||
557 | * |
||
558 | * If there are not enough bytes in the file to satisfy the request, the |
||
559 | * return value will be truncated. If a request is made for a segment beyond |
||
560 | * the end of the file, an empty string will be returned. |
||
561 | * |
||
562 | * @param int $segIndex |
||
563 | * |
||
564 | * @return string |
||
565 | */ |
||
566 | function getSegment( $segIndex ) { |
||
567 | if ( !isset( $this->buffer[$segIndex] ) ) { |
||
568 | $bytePos = $segIndex * self::SEGSIZE; |
||
569 | if ( $bytePos >= $this->getFileLength() ) { |
||
570 | $this->buffer[$segIndex] = ''; |
||
571 | |||
572 | return ''; |
||
573 | } |
||
574 | if ( fseek( $this->file, $bytePos ) ) { |
||
575 | $this->error( 'zip-bad', "seek to $bytePos failed" ); |
||
576 | } |
||
577 | $seg = fread( $this->file, self::SEGSIZE ); |
||
578 | if ( $seg === false ) { |
||
579 | $this->error( 'zip-bad', "read from $bytePos failed" ); |
||
580 | } |
||
581 | $this->buffer[$segIndex] = $seg; |
||
582 | } |
||
583 | |||
584 | return $this->buffer[$segIndex]; |
||
585 | } |
||
586 | |||
587 | /** |
||
588 | * Get the size of a structure in bytes. See unpack() for the format of $struct. |
||
589 | * @param array $struct |
||
590 | * @return int |
||
591 | */ |
||
592 | function getStructSize( $struct ) { |
||
593 | $size = 0; |
||
594 | foreach ( $struct as $type ) { |
||
595 | if ( is_array( $type ) ) { |
||
596 | list( , $fieldSize ) = $type; |
||
597 | $size += $fieldSize; |
||
598 | } else { |
||
599 | $size += $type; |
||
600 | } |
||
601 | } |
||
602 | |||
603 | return $size; |
||
604 | } |
||
605 | |||
606 | /** |
||
607 | * Unpack a binary structure. This is like the built-in unpack() function |
||
608 | * except nicer. |
||
609 | * |
||
610 | * @param string $string The binary data input |
||
611 | * |
||
612 | * @param array $struct An associative array giving structure members and their |
||
613 | * types. In the key is the field name. The value may be either an |
||
614 | * integer, in which case the field is a little-endian unsigned integer |
||
615 | * encoded in the given number of bytes, or an array, in which case the |
||
616 | * first element of the array is the type name, and the subsequent |
||
617 | * elements are type-dependent parameters. Only one such type is defined: |
||
618 | * - "string": The second array element gives the length of string. |
||
619 | * Not null terminated. |
||
620 | * |
||
621 | * @param int $offset The offset into the string at which to start unpacking. |
||
622 | * |
||
623 | * @throws MWException |
||
624 | * @return array Unpacked associative array. Note that large integers in the input |
||
625 | * may be represented as floating point numbers in the return value, so |
||
626 | * the use of weak comparison is advised. |
||
627 | */ |
||
628 | function unpack( $string, $struct, $offset = 0 ) { |
||
629 | $size = $this->getStructSize( $struct ); |
||
630 | if ( $offset + $size > strlen( $string ) ) { |
||
631 | $this->error( 'zip-bad', 'unpack() would run past the end of the supplied string' ); |
||
632 | } |
||
633 | |||
634 | $data = []; |
||
635 | $pos = $offset; |
||
636 | foreach ( $struct as $key => $type ) { |
||
637 | if ( is_array( $type ) ) { |
||
638 | list( $typeName, $fieldSize ) = $type; |
||
639 | switch ( $typeName ) { |
||
640 | case 'string': |
||
641 | $data[$key] = substr( $string, $pos, $fieldSize ); |
||
642 | $pos += $fieldSize; |
||
643 | break; |
||
644 | default: |
||
645 | throw new MWException( __METHOD__ . ": invalid type \"$typeName\"" ); |
||
646 | } |
||
647 | } else { |
||
648 | // Unsigned little-endian integer |
||
649 | $length = intval( $type ); |
||
650 | |||
651 | // Calculate the value. Use an algorithm which automatically |
||
652 | // upgrades the value to floating point if necessary. |
||
653 | $value = 0; |
||
654 | for ( $i = $length - 1; $i >= 0; $i-- ) { |
||
655 | $value *= 256; |
||
656 | $value += ord( $string[$pos + $i] ); |
||
657 | } |
||
658 | |||
659 | // Throw an exception if there was loss of precision |
||
660 | if ( $value > pow( 2, 52 ) ) { |
||
661 | $this->error( 'zip-unsupported', 'number too large to be stored in a double. ' . |
||
662 | 'This could happen if we tried to unpack a 64-bit structure ' . |
||
663 | 'at an invalid location.' ); |
||
664 | } |
||
665 | $data[$key] = $value; |
||
666 | $pos += $length; |
||
667 | } |
||
668 | } |
||
669 | |||
670 | return $data; |
||
671 | } |
||
672 | |||
673 | /** |
||
674 | * Returns a bit from a given position in an integer value, converted to |
||
675 | * boolean. |
||
676 | * |
||
677 | * @param int $value |
||
678 | * @param int $bitIndex The index of the bit, where 0 is the LSB. |
||
679 | * @return bool |
||
680 | */ |
||
681 | function testBit( $value, $bitIndex ) { |
||
682 | return (bool)( ( $value >> $bitIndex ) & 1 ); |
||
683 | } |
||
684 | |||
685 | /** |
||
686 | * Debugging helper function which dumps a string in hexdump -C format. |
||
687 | * @param string $s |
||
688 | */ |
||
689 | function hexDump( $s ) { |
||
690 | $n = strlen( $s ); |
||
691 | for ( $i = 0; $i < $n; $i += 16 ) { |
||
692 | printf( "%08X ", $i ); |
||
693 | for ( $j = 0; $j < 16; $j++ ) { |
||
694 | print " "; |
||
695 | if ( $j == 8 ) { |
||
696 | print " "; |
||
697 | } |
||
698 | if ( $i + $j >= $n ) { |
||
699 | print " "; |
||
700 | } else { |
||
701 | printf( "%02X", ord( $s[$i + $j] ) ); |
||
702 | } |
||
703 | } |
||
704 | |||
705 | print " |"; |
||
706 | for ( $j = 0; $j < 16; $j++ ) { |
||
707 | if ( $i + $j >= $n ) { |
||
708 | print " "; |
||
709 | } elseif ( ctype_print( $s[$i + $j] ) ) { |
||
710 | print $s[$i + $j]; |
||
711 | } else { |
||
712 | print '.'; |
||
713 | } |
||
714 | } |
||
715 | print "|\n"; |
||
716 | } |
||
717 | } |
||
718 | } |
||
719 | |||
720 | /** |
||
721 | * Internal exception class. Will be caught by private code. |
||
722 | */ |
||
723 | class ZipDirectoryReaderError extends Exception { |
||
724 | protected $errorCode; |
||
725 | |||
726 | function __construct( $code ) { |
||
727 | $this->errorCode = $code; |
||
728 | parent::__construct( "ZipDirectoryReader error: $code" ); |
||
729 | } |
||
730 | |||
731 | /** |
||
732 | * @return mixed |
||
733 | */ |
||
734 | function getErrorCode() { |
||
735 | return $this->errorCode; |
||
736 | } |
||
737 | } |
||
738 |
Only declaring a single property per statement allows you to later on add doc comments more easily.
It is also recommended by PSR2, so it is a common style that many people expect.