/
archiver_zip.c
1715 lines (1389 loc) · 52.7 KB
1
2
3
/*
 * ZIP support routines for PhysicsFS.
 *
 * Please see the file LICENSE.txt in the source's root directory.
 *
 * This file written by Ryan C. Gordon, with some peeking at "unzip.c"
 * by Gilles Vollant.
 */
10
11
12
13
#define __PHYSICSFS_INTERNAL__
#include "physfs_internal.h"
#if PHYSFS_SUPPORTS_ZIP
14
15
#include <errno.h>
16
#include <time.h>
17
18
19
20
21
22
23
24
#define USE_MINIZ 1
#if USE_MINIZ
#include "physfs_miniz.h"
#else
#include <zlib.h>
#endif
25
/*
 * A buffer of ZIP_READBUFSIZE is allocated for each compressed file opened,
 * and is freed when you close the file; compressed data is read into
 * this buffer, and then is decompressed into the buffer passed to
 * PHYSFS_read().
 *
 * Uncompressed entries in a zipfile do not allocate this buffer; they just
 * read data directly into the buffer passed to PHYSFS_read().
 *
 * Depending on your speed and memory requirements, you should tweak this
 * value.
 */
#define ZIP_READBUFSIZE (16 * 1024)
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
/*
 * Every entry starts out "unresolved" and stays that way until it is first
 * opened. At that point its local file header is parsed and validated, its
 * data offset is moved past the header to the actual file data, and any
 * symlink is followed and optimized. This way we don't seek and read around
 * the archive until forced to, and later opens need less reading and
 * parsing, which is very CD-ROM friendly.
 */
typedef enum
{
    ZIP_UNRESOLVED_FILE,     /* regular entry, local header not parsed yet. */
    ZIP_UNRESOLVED_SYMLINK,  /* symlink entry, target not looked up yet. */
    ZIP_RESOLVING,           /* resolution in progress (loop detection). */
    ZIP_RESOLVED,            /* ready to use. */
    ZIP_BROKEN_FILE,         /* regular entry that failed to resolve. */
    ZIP_BROKEN_SYMLINK       /* symlink entry that failed to resolve. */
} ZipResolveType;
59
60
61
/*
* One ZIPentry is kept for each file in an open ZIP archive.
*/
62
typedef struct _ZIPentry
63
{
64
65
66
char *name; /* Name of file in archive */
struct _ZIPentry *symlink; /* NULL or file we symlink to */
ZipResolveType resolved; /* Have we resolved file/symlink? */
67
PHYSFS_uint64 offset; /* offset of data in archive */
68
69
70
71
PHYSFS_uint16 version; /* version made by */
PHYSFS_uint16 version_needed; /* version needed to extract */
PHYSFS_uint16 compression_method; /* compression method */
PHYSFS_uint32 crc; /* crc-32 */
72
73
PHYSFS_uint64 compressed_size; /* compressed size */
PHYSFS_uint64 uncompressed_size; /* uncompressed size */
74
PHYSFS_sint64 last_mod_time; /* last file mod time */
75
76
} ZIPentry;
77
78
79
/*
* One ZIPinfo is kept for each open ZIP archive.
*/
80
81
typedef struct
{
82
PHYSFS_Io *io;
83
84
85
int zip64; /* non-zero if this is a Zip64 archive. */
PHYSFS_uint64 entryCount; /* Number of files in ZIP. */
ZIPentry *entries; /* info on all files in ZIP. */
86
87
} ZIPinfo;
88
89
90
/*
* One ZIPfileinfo is kept for each open file in a ZIP archive.
*/
91
92
typedef struct
{
93
ZIPentry *entry; /* Info on file. */
94
PHYSFS_Io *io; /* physical file handle. */
95
96
97
98
PHYSFS_uint32 compressed_position; /* offset in compressed data. */
PHYSFS_uint32 uncompressed_position; /* tell() position. */
PHYSFS_uint8 *buffer; /* decompression buffer. */
z_stream stream; /* zlib stream state. */
99
100
101
} ZIPfileinfo;
102
/* Magic numbers... */
103
104
105
106
107
108
#define ZIP_LOCAL_FILE_SIG 0x04034b50
#define ZIP_CENTRAL_DIR_SIG 0x02014b50
#define ZIP_END_OF_CENTRAL_DIR_SIG 0x06054b50
#define ZIP64_END_OF_CENTRAL_DIR_SIG 0x06064b50
#define ZIP64_END_OF_CENTRAL_DIRECTORY_LOCATOR_SIG 0x07064b50
#define ZIP64_EXTENDED_INFO_EXTRA_FIELD_SIG 0x0001
109
110
111
112
113
114
/* compression methods... */
#define COMPMETH_NONE 0
/* ...and others... */
115
116
117
118
#define UNIX_FILETYPE_MASK 0170000
#define UNIX_FILETYPE_SYMLINK 0120000
119
120
121
122
123
/*
 * Bridge physfs allocation functions to zlib's format...
 *
 * zlib asks for (items) objects of (size) bytes each; (opaque) is the
 * PHYSFS_Allocator that was stored in the z_stream. Returns the new block,
 * or NULL if the allocator fails or the request can't be expressed as a
 * byte count.
 */
static voidpf zlibPhysfsAlloc(voidpf opaque, uInt items, uInt size)
{
    PHYSFS_Allocator *alloc = (PHYSFS_Allocator *) opaque;
    const size_t count = (size_t) items;
    const size_t each = (size_t) size;

    /*
     * Multiply in size_t instead of uInt so the product can't silently wrap
     * at the width of uInt, and refuse anything that still wouldn't fit.
     */
    if ((each != 0) && (count > (((size_t) -1) / each)))
        return NULL;

    return alloc->Malloc(count * each);
} /* zlibPhysfsAlloc */
/*
 * Counterpart of zlibPhysfsAlloc: hands a block zlib is done with back to
 * the PHYSFS_Allocator passed through (opaque).
 */
static void zlibPhysfsFree(voidpf opaque, voidpf address)
{
    PHYSFS_Allocator *alloc = (PHYSFS_Allocator *) opaque;
    alloc->Free(address);
} /* zlibPhysfsFree */
/*
 * Reset (pstr) to all zeroes and wire its allocation hooks to the physfs
 * allocator, so it is ready to be handed to inflateInit2().
 */
static void initializeZStream(z_stream *pstr)
{
    memset(pstr, '\0', sizeof (*pstr));

    pstr->opaque = &allocator;      /* passed back to the hooks below. */
    pstr->zalloc = zlibPhysfsAlloc;
    pstr->zfree = zlibPhysfsFree;
} /* initializeZStream */
148
static PHYSFS_ErrorCode zlib_error_code(int rc)
149
150
151
{
switch (rc)
{
152
153
154
155
156
case Z_OK: return PHYSFS_ERR_OK; /* not an error. */
case Z_STREAM_END: return PHYSFS_ERR_OK; /* not an error. */
case Z_ERRNO: return PHYSFS_ERR_IO;
case Z_MEM_ERROR: return PHYSFS_ERR_OUT_OF_MEMORY;
default: return PHYSFS_ERR_CORRUPT;
157
} /* switch */
158
159
} /* zlib_error_string */
160
161
162
163
/*
* Wrap all zlib calls in this, so the physfs error state is set appropriately.
*/
164
static int zlib_err(const int rc)
165
{
166
__PHYSFS_setError(zlib_error_code(rc));
167
return rc;
168
169
170
} /* zlib_err */
171
172
173
174
175
176
177
178
179
180
181
/*
 * Pull a little-endian unsigned 64-bit value from (io) and store it in
 * (*val) in native byte order. Returns 1 on success, 0 if the read failed
 * (in which case *val is left alone).
 */
static int readui64(PHYSFS_Io *io, PHYSFS_uint64 *val)
{
    PHYSFS_uint64 raw;
    BAIL_IF_MACRO(!__PHYSFS_readAll(io, &raw, sizeof (raw)), ERRPASS, 0);
    *val = PHYSFS_swapULE64(raw);
    return 1;
} /* readui64 */
182
183
184
/*
* Read an unsigned 32-bit int and swap to native byte order.
*/
185
static int readui32(PHYSFS_Io *io, PHYSFS_uint32 *val)
186
187
{
PHYSFS_uint32 v;
188
BAIL_IF_MACRO(!__PHYSFS_readAll(io, &v, sizeof (v)), ERRPASS, 0);
189
*val = PHYSFS_swapULE32(v);
190
return 1;
191
192
193
194
195
196
} /* readui32 */
/*
* Read an unsigned 16-bit int and swap to native byte order.
*/
197
static int readui16(PHYSFS_Io *io, PHYSFS_uint16 *val)
198
199
{
PHYSFS_uint16 v;
200
BAIL_IF_MACRO(!__PHYSFS_readAll(io, &v, sizeof (v)), ERRPASS, 0);
201
*val = PHYSFS_swapULE16(v);
202
return 1;
203
204
205
} /* readui16 */
206
/*
 * Read up to (len) bytes of the entry's uncompressed contents into (buf),
 * starting at the handle's current position. Stored entries are read
 * straight from the underlying i/o; everything else is inflated through
 * the handle's buffer. Returns the number of bytes produced (which may be
 * less than requested), and advances the tell() position by that amount.
 */
static PHYSFS_sint64 ZIP_read(PHYSFS_Io *_io, void *buf, PHYSFS_uint64 len)
{
    ZIPfileinfo *finfo = (ZIPfileinfo *) _io->opaque;
    ZIPentry *entry = finfo->entry;
    PHYSFS_Io *io = finfo->io;
    PHYSFS_sint64 produced = 0;
    PHYSFS_sint64 wanted = (PHYSFS_sint64) len;
    const PHYSFS_sint64 remaining = entry->uncompressed_size -
                                    finfo->uncompressed_position;

    /* never hand out more than what is left in the entry. */
    if (remaining < wanted)
        wanted = remaining;

    BAIL_IF_MACRO(wanted == 0, ERRPASS, 0);  /* quick rejection. */

    if (entry->compression_method != COMPMETH_NONE)
    {
        finfo->stream.next_out = buf;
        finfo->stream.avail_out = (uInt) wanted;

        while (produced < wanted)
        {
            PHYSFS_uint32 out_before = finfo->stream.total_out;
            int rc;

            /* inflater is starved: top up from the compressed data. */
            if (finfo->stream.avail_in == 0)
            {
                PHYSFS_sint64 chunk;
                chunk = entry->compressed_size - finfo->compressed_position;
                if (chunk > 0)
                {
                    if (chunk > ZIP_READBUFSIZE)
                        chunk = ZIP_READBUFSIZE;

                    chunk = io->read(io, finfo->buffer, (PHYSFS_uint64) chunk);
                    if (chunk <= 0)
                        break;

                    finfo->compressed_position += (PHYSFS_uint32) chunk;
                    finfo->stream.next_in = finfo->buffer;
                    finfo->stream.avail_in = (PHYSFS_uint32) chunk;
                }
            }

            rc = zlib_err(inflate(&finfo->stream, Z_SYNC_FLUSH));
            produced += (finfo->stream.total_out - out_before);

            if (rc != Z_OK)
                break;
        }
    }
    else
    {
        /* stored entry: no decoding needed. */
        produced = io->read(io, buf, wanted);
    }

    if (produced > 0)
        finfo->uncompressed_position += (PHYSFS_uint32) produced;

    return produced;
} /* ZIP_read */
268
/*
 * Write hook for ZIP file handles. Always fails: sets
 * PHYSFS_ERR_READ_ONLY and returns -1 without looking at its arguments.
 */
static PHYSFS_sint64 ZIP_write(PHYSFS_Io *io, const void *b, PHYSFS_uint64 len)
{
    BAIL_MACRO(PHYSFS_ERR_READ_ONLY, -1);
} /* ZIP_write */
274
/*
 * Report the handle's current position within the uncompressed data.
 */
static PHYSFS_sint64 ZIP_tell(PHYSFS_Io *io)
{
    const ZIPfileinfo *finfo = (ZIPfileinfo *) io->opaque;
    return finfo->uncompressed_position;
} /* ZIP_tell */
280
/*
 * Move the handle's position to (offset) bytes into the uncompressed data.
 *
 * Stored entries seek the underlying i/o directly. Compressed entries
 * can't be seeked, so the data is decoded and discarded until the target
 * is reached, restarting from the beginning of the entry first if the
 * target lies behind the current position.
 *
 * Returns 1 on success, 0 on failure. Seeking past the end of the entry
 * fails with PHYSFS_ERR_PAST_EOF.
 */
static int ZIP_seek(PHYSFS_Io *_io, PHYSFS_uint64 offset)
{
    ZIPfileinfo *finfo = (ZIPfileinfo *) _io->opaque;
    ZIPentry *entry = finfo->entry;
    PHYSFS_Io *io = finfo->io;

    BAIL_IF_MACRO(offset > entry->uncompressed_size, PHYSFS_ERR_PAST_EOF, 0);

    if (entry->compression_method == COMPMETH_NONE)
    {
        const PHYSFS_sint64 newpos = offset + entry->offset;
        BAIL_IF_MACRO(!io->seek(io, newpos), ERRPASS, 0);
        finfo->uncompressed_position = (PHYSFS_uint32) offset;
    } /* if */

    else
    {
        /*
         * If seeking backwards, we need to redecode the file
         * from the start and throw away the compressed bits until we hit
         * the offset we need. If seeking forward, we still need to
         * decode, but we don't rewind first.
         */
        if (offset < finfo->uncompressed_position)
        {
            /* we do a copy so state is sane if inflateInit2() fails. */
            z_stream str;
            initializeZStream(&str);
            if (zlib_err(inflateInit2(&str, -MAX_WBITS)) != Z_OK)
                return 0;

            if (!io->seek(io, entry->offset))
            {
                /* the new stream was never installed: release it here. */
                inflateEnd(&str);
                return 0;
            } /* if */

            inflateEnd(&finfo->stream);
            memcpy(&finfo->stream, &str, sizeof (z_stream));
            finfo->uncompressed_position = finfo->compressed_position = 0;
        } /* if */

        while (finfo->uncompressed_position != offset)
        {
            PHYSFS_uint8 buf[512];
            /* clamp in 64 bits so a huge gap can't truncate to zero. */
            const PHYSFS_uint64 gap = offset - finfo->uncompressed_position;
            PHYSFS_uint32 maxread = (PHYSFS_uint32) sizeof (buf);

            if (gap < sizeof (buf))
                maxread = (PHYSFS_uint32) gap;

            if (ZIP_read(_io, buf, maxread) != maxread)
                return 0;
        } /* while */
    } /* else */

    return 1;
} /* ZIP_seek */
337
/*
 * Report the total uncompressed size of the entry behind this handle.
 */
static PHYSFS_sint64 ZIP_length(PHYSFS_Io *io)
{
    const ZIPfileinfo *finfo = (ZIPfileinfo *) io->opaque;
    const ZIPentry *entry = finfo->entry;
    return (PHYSFS_sint64) entry->uncompressed_size;
} /* ZIP_length */
342
343
344
345
346
static PHYSFS_Io *zip_get_io(PHYSFS_Io *io, ZIPinfo *inf, ZIPentry *entry);
/*
 * Create a second, independent handle for the entry behind (io).
 *
 * The duplicate gets its own ZIPfileinfo, its own underlying i/o (obtained
 * from zip_get_io()) and, for compressed entries, its own read buffer and
 * inflate stream. Its positions start at zero; the original's position is
 * not carried over.
 *
 * Returns the new PHYSFS_Io, or NULL on failure (everything allocated up
 * to that point is released).
 */
static PHYSFS_Io *ZIP_duplicate(PHYSFS_Io *io)
{
    ZIPfileinfo *origfinfo = (ZIPfileinfo *) io->opaque;
    PHYSFS_Io *retval = (PHYSFS_Io *) allocator.Malloc(sizeof (PHYSFS_Io));
    ZIPfileinfo *finfo = (ZIPfileinfo *) allocator.Malloc(sizeof (ZIPfileinfo));

    /*
     * Zero this before anything can jump to the cleanup code, which looks
     * at finfo->io and finfo->buffer to decide what needs releasing.
     */
    if (finfo != NULL)
        memset(finfo, '\0', sizeof (*finfo));

    GOTO_IF_MACRO(!retval, PHYSFS_ERR_OUT_OF_MEMORY, failed);
    GOTO_IF_MACRO(!finfo, PHYSFS_ERR_OUT_OF_MEMORY, failed);

    finfo->entry = origfinfo->entry;
    finfo->io = zip_get_io(origfinfo->io, NULL, finfo->entry);
    GOTO_IF_MACRO(!finfo->io, ERRPASS, failed);

    if (finfo->entry->compression_method != COMPMETH_NONE)
    {
        finfo->buffer = (PHYSFS_uint8 *) allocator.Malloc(ZIP_READBUFSIZE);
        GOTO_IF_MACRO(!finfo->buffer, PHYSFS_ERR_OUT_OF_MEMORY, failed);

        /* route the stream's allocations through the physfs allocator. */
        initializeZStream(&finfo->stream);
        if (zlib_err(inflateInit2(&finfo->stream, -MAX_WBITS)) != Z_OK)
            goto failed;
    } /* if */

    memcpy(retval, io, sizeof (PHYSFS_Io));
    retval->opaque = finfo;
    return retval;

failed:
    if (finfo != NULL)
    {
        if (finfo->io != NULL)
            finfo->io->destroy(finfo->io);

        if (finfo->buffer != NULL)
        {
            allocator.Free(finfo->buffer);
            inflateEnd(&finfo->stream);
        } /* if */

        allocator.Free(finfo);
    } /* if */

    if (retval != NULL)
        allocator.Free(retval);

    return NULL;
} /* ZIP_duplicate */
/*
 * Flush hook for ZIP file handles. There is no write support, so there is
 * never anything to flush; always reports success.
 */
static int ZIP_flush(PHYSFS_Io *io)
{
    return 1;  /* no write support. */
} /* ZIP_flush */
/*
 * Tear down a ZIP file handle: destroys the underlying i/o, shuts down the
 * inflate stream (compressed entries only), releases the read buffer if
 * there is one, then frees the ZIPfileinfo and the PHYSFS_Io itself.
 */
static void ZIP_destroy(PHYSFS_Io *io)
{
    ZIPfileinfo *finfo = (ZIPfileinfo *) io->opaque;
    PHYSFS_Io *inner = finfo->io;
    const int compressed = (finfo->entry->compression_method != COMPMETH_NONE);

    inner->destroy(inner);

    if (compressed)
        inflateEnd(&finfo->stream);

    if (finfo->buffer != NULL)
        allocator.Free(finfo->buffer);

    allocator.Free(finfo);
    allocator.Free(io);
} /* ZIP_destroy */
static const PHYSFS_Io ZIP_Io =
{
412
CURRENT_PHYSFS_IO_API_VERSION, NULL,
413
414
415
416
417
418
419
ZIP_read,
ZIP_write,
ZIP_seek,
ZIP_tell,
ZIP_length,
ZIP_duplicate,
ZIP_flush,
420
ZIP_destroy
421
422
};
423
424
425
/*
 * Locate the end-of-central-directory signature by scanning backwards from
 * the end of (io).
 *
 * Returns the file offset of the signature, or -1 on any failure (i/o
 * error, or no signature found in the region searched). If (len) is not
 * NULL and the signature was found, (*len) receives the total length of
 * the file.
 */
static PHYSFS_sint64 zip_find_end_of_central_dir(PHYSFS_Io *io, PHYSFS_sint64 *len)
{
    PHYSFS_uint8 buf[256];
    PHYSFS_uint8 extra[4] = { 0, 0, 0, 0 };
    PHYSFS_sint32 i = 0;
    PHYSFS_sint64 filelen;
    PHYSFS_sint64 filepos;
    PHYSFS_sint32 maxread;
    PHYSFS_sint32 totalread = 0;
    int found = 0;

    filelen = io->length(io);
    /* -1, like every other failure here: 0 would look like a valid offset. */
    BAIL_IF_MACRO(filelen == -1, ERRPASS, -1);

    /*
     * Jump to the end of the file and start reading backwards.
     * The last thing in the file is the zipfile comment, which is variable
     * length, and the field that specifies its size is before it in the
     * file (argh!)...this means that we need to scan backwards until we
     * hit the end-of-central-dir signature. We can then sanity check that
     * the comment was as big as it should be to make sure we're in the
     * right place. The comment length field is 16 bits, so we can stop
     * searching for that signature after a little more than 64k at most,
     * and call it a corrupted zipfile.
     */
    if (sizeof (buf) < filelen)
    {
        filepos = filelen - sizeof (buf);
        maxread = sizeof (buf);
    } /* if */
    else
    {
        filepos = 0;
        maxread = (PHYSFS_uint32) filelen;
    } /* else */

    while ((totalread < filelen) && (totalread < 65557))
    {
        BAIL_IF_MACRO(!io->seek(io, filepos), ERRPASS, -1);

        /* make sure we catch a signature between buffers. */
        if (totalread != 0)
        {
            if (!__PHYSFS_readAll(io, buf, maxread - 4))
                return -1;
            memcpy(&buf[maxread - 4], &extra, sizeof (extra));
            totalread += maxread - 4;
        } /* if */
        else
        {
            if (!__PHYSFS_readAll(io, buf, maxread))
                return -1;
            totalread += maxread;
        } /* else */

        memcpy(&extra, buf, sizeof (extra));

        /*
         * Index 0 has to be checked too: in an archive with no entries the
         * end-of-central-dir record is the very first thing in the file.
         */
        for (i = maxread - 4; i >= 0; i--)
        {
            if ((buf[i + 0] == 0x50) &&
                (buf[i + 1] == 0x4B) &&
                (buf[i + 2] == 0x05) &&
                (buf[i + 3] == 0x06) )
            {
                found = 1;  /* that's the signature! */
                break;
            } /* if */
        } /* for */

        if (found)
            break;

        filepos -= (maxread - 4);
        if (filepos < 0)
            filepos = 0;
    } /* while */

    BAIL_IF_MACRO(!found, PHYSFS_ERR_UNSUPPORTED, -1);

    if (len != NULL)
        *len = filelen;

    return (filepos + i);
} /* zip_find_end_of_central_dir */
510
511
512
/*
 * Decide whether (io) looks like a ZIP archive. Returns non-zero if so.
 */
static int isZip(PHYSFS_Io *io)
{
    PHYSFS_uint32 magic = 0;

    if (!readui32(io, &magic))
        return 0;

    /*
     * The first thing in a zip file might be the signature of the
     * first local file record, so it makes for a quick determination.
     */
    if (magic == ZIP_LOCAL_FILE_SIG)
        return 1;

    /*
     * No sig...might be a ZIP with data at the start
     * (a self-extracting executable, etc), so we'll have to do
     * it the hard way...
     */
    return (zip_find_end_of_central_dir(io, NULL) != -1);
} /* isZip */
537
538
539
/*
 * Release the names of the first (max) items of (entries), then the
 * array itself.
 */
static void zip_free_entries(ZIPentry *entries, PHYSFS_uint64 max)
{
    PHYSFS_uint64 idx = 0;

    while (idx < max)
    {
        char *name = entries[idx].name;
        if (name != NULL)
            allocator.Free(name);
        idx++;
    }

    allocator.Free(entries);
} /* zip_free_entries */
553
554
555
556
557
/*
* This will find the ZIPentry associated with a path in platform-independent
* notation. Directories don't have ZIPentries associated with them, but
* (*isDir) will be set to non-zero if a dir was hit.
*/
558
559
static ZIPentry *zip_find_entry(const ZIPinfo *info, const char *path,
int *isDir)
560
561
{
ZIPentry *a = info->entries;
562
PHYSFS_sint32 pathlen = (PHYSFS_sint32) strlen(path);
563
564
565
PHYSFS_sint64 lo = 0;
PHYSFS_sint64 hi = (PHYSFS_sint64) (info->entryCount - 1);
PHYSFS_sint64 middle;
566
const char *thispath = NULL;
567
568
569
570
int rc;
while (lo <= hi)
{
571
572
573
middle = lo + ((hi - lo) / 2);
thispath = a[middle].name;
rc = strncmp(path, thispath, pathlen);
574
575
if (rc > 0)
576
lo = middle + 1;
577
578
else if (rc < 0)
579
hi = middle - 1;
580
581
582
else /* substring match...might be dir or entry or nothing. */
{
583
584
if (isDir != NULL)
{
585
586
*isDir = (thispath[pathlen] == '/');
if (*isDir)
587
return NULL;
588
589
590
} /* if */
if (thispath[pathlen] == '\0') /* found entry? */
591
return &a[middle];
592
593
594
/* adjust search params, try again. */
else if (thispath[pathlen] > '/')
hi = middle - 1;
595
else
596
lo = middle + 1;
597
598
} /* if */
} /* while */
599
600
601
if (isDir != NULL)
*isDir = 0;
602
603
BAIL_MACRO(PHYSFS_ERR_NO_SUCH_PATH, NULL);
604
} /* zip_find_entry */
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
/*
 * Convert paths from old, buggy DOS zippers: if the entry's "version made
 * by" host byte is 0 (FS_FAT_), every backslash in (path) is rewritten to
 * a forward slash, in place. Other hosts are left untouched.
 */
static void zip_convert_dos_path(ZIPentry *entry, char *path)
{
    const PHYSFS_uint8 host = (PHYSFS_uint8) ((entry->version >> 8) & 0xFF);
    char *ch;

    if (host != 0)  /* not FS_FAT_ */
        return;

    for (ch = path; *ch; ch++)
    {
        if (*ch == '\\')
            *ch = '/';
    }
} /* zip_convert_dos_path */
621
622
623
/*
 * Normalize a symlink target in place by resolving its "." and ".."
 * components:
 *
 *  - a "." component is dropped ("a/./b" -> "a/b", "a/." -> "a").
 *  - a ".." component removes the component before it
 *    ("a/b/../c" -> "a/c", "a/b/.." -> "a").
 *  - a ".." with nothing left to remove is kept as-is ("../a" stays
 *    "../a"), so the path simply fails to match any entry later on.
 *  - anything else, including names that merely start with dots
 *    (".hidden", "..data") and empty components, is copied unchanged.
 *
 * The result is never longer than the input, so it always fits in the
 * caller's buffer.
 */
static void zip_expand_symlink_path(char *path)
{
    char *src = path;   /* start of the component being examined. */
    char *dst = path;   /* end of the normalized output so far. */
    size_t kept = 0;    /* number of components currently in the output. */

    while (1)
    {
        char *slash = strchr(src, '/');
        const size_t len = (slash != NULL) ? (size_t) (slash - src)
                                           : strlen(src);
        const int is_dot = ((len == 1) && (src[0] == '.'));
        const int is_dotdot = ((len == 2) && (src[0] == '.') &&
                               (src[1] == '.'));
        int emit = !is_dot;

        if (is_dotdot && (kept > 0))
        {
            /* find where the last component of the output begins. */
            char *last = dst;
            while ((last != path) && (*(last - 1) != '/'))
                last--;

            /* an unresolved ".." can't be cancelled by another "..". */
            if (!(((dst - last) == 2) && (last[0] == '.') && (last[1] == '.')))
            {
                /* drop that component, and its separator if it had one. */
                dst = (kept > 1) ? (last - 1) : last;
                kept--;
                emit = 0;
            } /* if */
        } /* if */

        if (emit)
        {
            /* (dst) never passes (src), so this can't clobber unread input. */
            if (kept > 0)
                *(dst++) = '/';
            memmove(dst, src, len);
            dst += len;
            kept++;
        } /* if */

        if (slash == NULL)
            break;

        src = slash + 1;
    } /* while */

    *dst = '\0';
} /* zip_expand_symlink_path */
680
681
/* (forward reference: zip_follow_symlink and zip_resolve call each other.) */
682
static int zip_resolve(PHYSFS_Io *io, ZIPinfo *info, ZIPentry *entry);
683
684
/*
685
686
687
* Look for the entry named by (path). If it exists, resolve it, and return
* a pointer to that entry. If it's another symlink, keep resolving until you
* hit a real file and then return a pointer to the final non-symlink entry.
688
* If there's a problem, return NULL.
689
*/
690
static ZIPentry *zip_follow_symlink(PHYSFS_Io *io, ZIPinfo *info, char *path)
691
{
692
693
694
ZIPentry *entry;
zip_expand_symlink_path(path);
695
entry = zip_find_entry(info, path, NULL);
696
697
if (entry != NULL)
{
698
if (!zip_resolve(io, info, entry)) /* recursive! */
699
700
701
702
703
704
705
706
entry = NULL;
else
{
if (entry->symlink != NULL)
entry = entry->symlink;
} /* else */
} /* if */
707
return entry;
708
} /* zip_follow_symlink */
709
710
711
/*
 * Read the target path stored in a symlink entry's data, follow it, and
 * store the entry it leads to in entry->symlink.
 *
 * Returns non-zero if entry->symlink ended up non-NULL, zero otherwise.
 */
static int zip_resolve_symlink(PHYSFS_Io *io, ZIPinfo *info, ZIPentry *entry)
{
    const PHYSFS_uint64 size = entry->uncompressed_size;
    char *path = NULL;
    int rc = 0;

    /*
     * We've already parsed the local file header of the symlink at this
     * point. Now we need to read the actual link from the file data and
     * follow it.
     */
    BAIL_IF_MACRO(!io->seek(io, entry->offset), ERRPASS, 0);

    path = (char *) __PHYSFS_smallAlloc(size + 1);
    BAIL_IF_MACRO(!path, PHYSFS_ERR_OUT_OF_MEMORY, 0);

    if (entry->compression_method == COMPMETH_NONE)
        rc = __PHYSFS_readAll(io, path, size);

    else  /* symlink target path is compressed... */
    {
        z_stream stream;
        const PHYSFS_uint64 complen = entry->compressed_size;
        PHYSFS_uint8 *compressed = (PHYSFS_uint8*) __PHYSFS_smallAlloc(complen);
        if (compressed == NULL)
        {
            /* don't fail silently: tell the caller why. */
            __PHYSFS_setError(PHYSFS_ERR_OUT_OF_MEMORY);
        } /* if */
        else
        {
            if (__PHYSFS_readAll(io, compressed, complen))
            {
                initializeZStream(&stream);
                stream.next_in = compressed;
                stream.avail_in = complen;
                stream.next_out = (unsigned char *) path;
                stream.avail_out = size;
                if (zlib_err(inflateInit2(&stream, -MAX_WBITS)) == Z_OK)
                {
                    rc = zlib_err(inflate(&stream, Z_FINISH));
                    inflateEnd(&stream);

                    /* both are acceptable outcomes... */
                    rc = ((rc == Z_OK) || (rc == Z_STREAM_END));
                } /* if */
            } /* if */
            __PHYSFS_smallFree(compressed);
        } /* else */
    } /* else */

    if (rc)
    {
        path[entry->uncompressed_size] = '\0';    /* null-terminate it. */
        zip_convert_dos_path(entry, path);
        entry->symlink = zip_follow_symlink(io, info, path);
    } /* if */

    __PHYSFS_smallFree(path);

    return (entry->symlink != NULL);
} /* zip_resolve_symlink */
/*
* Parse the local file header of an entry, and update entry->offset.
*/
774
static int zip_parse_local(PHYSFS_Io *io, ZIPentry *entry)
775
776
777
778
779
780
{
PHYSFS_uint32 ui32;
PHYSFS_uint16 ui16;
PHYSFS_uint16 fnamelen;
PHYSFS_uint16 extralen;
781
782
783
784
785
/*
* crc and (un)compressed_size are always zero if this is a "JAR"
* archive created with Sun's Java tools, apparently. We only
* consider this archive corrupted if those entries don't match and
* aren't zero. That seems to work well.
786
787
* We also ignore a mismatch if the value is 0xFFFFFFFF here, since it's
* possible that's a Zip64 thing.
788
789
*/
790
791
792
793
794
795
796
797
798
799
800
BAIL_IF_MACRO(!io->seek(io, entry->offset), ERRPASS, 0);
BAIL_IF_MACRO(!readui32(io, &ui32), ERRPASS, 0);
BAIL_IF_MACRO(ui32 != ZIP_LOCAL_FILE_SIG, PHYSFS_ERR_CORRUPT, 0);
BAIL_IF_MACRO(!readui16(io, &ui16), ERRPASS, 0);
BAIL_IF_MACRO(ui16 != entry->version_needed, PHYSFS_ERR_CORRUPT, 0);
BAIL_IF_MACRO(!readui16(io, &ui16), ERRPASS, 0); /* general bits. */
BAIL_IF_MACRO(!readui16(io, &ui16), ERRPASS, 0);
BAIL_IF_MACRO(ui16 != entry->compression_method, PHYSFS_ERR_CORRUPT, 0);
BAIL_IF_MACRO(!readui32(io, &ui32), ERRPASS, 0); /* date/time */
BAIL_IF_MACRO(!readui32(io, &ui32), ERRPASS, 0);
BAIL_IF_MACRO(ui32 && (ui32 != entry->crc), PHYSFS_ERR_CORRUPT, 0);
801
802
BAIL_IF_MACRO(!readui32(io, &ui32), ERRPASS, 0);
803
804
805
BAIL_IF_MACRO(ui32 && (ui32 != 0xFFFFFFFF) &&
(ui32 != entry->compressed_size), PHYSFS_ERR_CORRUPT, 0);
806
BAIL_IF_MACRO(!readui32(io, &ui32), ERRPASS, 0);
807
808
809
BAIL_IF_MACRO(ui32 && (ui32 != 0xFFFFFFFF) &&
(ui32 != entry->uncompressed_size), PHYSFS_ERR_CORRUPT, 0);
810
811
BAIL_IF_MACRO(!readui16(io, &fnamelen), ERRPASS, 0);
BAIL_IF_MACRO(!readui16(io, &extralen), ERRPASS, 0);
812
813
entry->offset += fnamelen + extralen + 30;
814
return 1;
815
816
817
} /* zip_parse_local */
818
/*
 * Make (entry) ready for use: parse its local file header and, for
 * symlinks, chase down the entry it points to. The outcome is cached in
 * entry->resolved, so later calls return immediately. Returns non-zero
 * on success, zero on failure.
 */
static int zip_resolve(PHYSFS_Io *io, ZIPinfo *info, ZIPentry *entry)
{
    const ZipResolveType initial = entry->resolved;
    const int was_symlink = (initial == ZIP_UNRESOLVED_SYMLINK);
    int ok;

    /* Don't bother if we've failed to resolve this entry before. */
    BAIL_IF_MACRO((initial == ZIP_BROKEN_FILE) ||
                  (initial == ZIP_BROKEN_SYMLINK), PHYSFS_ERR_CORRUPT, 0);

    /* uhoh...infinite symlink loop! */
    BAIL_IF_MACRO(initial == ZIP_RESOLVING, PHYSFS_ERR_SYMLINK_LOOP, 0);

    if (initial == ZIP_RESOLVED)
        return 1;  /* already done on an earlier call. */

    /*
     * We fix up the offset to point to the actual data on the
     * first open, since we don't want to seek across the whole file on
     * archive open (can be SLOW on large, CD-stored files), but we
     * need to check the local file header...not just for corruption,
     * but since it stores offset info the central directory does not.
     */
    entry->resolved = ZIP_RESOLVING;
    ok = zip_parse_local(io, entry);

    /*
     * If it's a symlink, find the original file. This will cause
     * resolution of other entries (other symlinks and, eventually,
     * the real file) if all goes well.
     */
    if (ok && was_symlink)
        ok = zip_resolve_symlink(io, info, entry);

    /* remember how it went. */
    if (was_symlink)
        entry->resolved = ok ? ZIP_RESOLVED : ZIP_BROKEN_SYMLINK;
    else if (initial == ZIP_UNRESOLVED_FILE)
        entry->resolved = ok ? ZIP_RESOLVED : ZIP_BROKEN_FILE;

    return ok;
} /* zip_resolve */
861
862
863
/*
 * Given a "version made by" field, report whether the host system named
 * in its second byte is one that could have stored symlinks in an
 * archive. Returns 1 if so, 0 if not.
 */
static int zip_version_does_symlinks(PHYSFS_uint32 version)
{
    const PHYSFS_uint8 host = (PHYSFS_uint8) ((version >> 8) & 0xFF);

    switch (host)
    {
        /*
         * These are the platforms that can NOT build an archive with
         * symlinks, according to the Info-ZIP project.
         */
        case 0:   /* FS_FAT_  */
        case 1:   /* AMIGA_   */
        case 2:   /* VMS_     */
        case 4:   /* VM_CSM_  */
        case 6:   /* FS_HPFS_ */
        case 11:  /* FS_NTFS_ */
        case 13:  /* ACORN_   */
        case 14:  /* FS_VFAT_ */
        case 15:  /* MVS_     */
        case 18:  /* THEOS_   */
            return 0;

        default:  /* assume the rest to be unix-like. */
            return 1;
    }
} /* zip_version_does_symlinks */
895
static int zip_entry_is_symlink(const ZIPentry *entry)
896
{
897
898
899
return ((entry->resolved == ZIP_UNRESOLVED_SYMLINK) ||
(entry->resolved == ZIP_BROKEN_SYMLINK) ||
(entry->symlink));
900
} /* zip_entry_is_symlink */
901
902
903
/*
 * Decide from the external attributes whether (entry) is a symlink. All
 * three must hold: the archive came from a host that can store symlinks,
 * the entry has data, and the file-type bits in the upper 16 bits of
 * (extern_attr) say "symlink". Returns 1 or 0.
 */
static int zip_has_symlink_attr(ZIPentry *entry, PHYSFS_uint32 extern_attr)
{
    const PHYSFS_uint16 mode = ((extern_attr >> 16) & 0xFFFF);

    if (!zip_version_does_symlinks(entry->version))
        return 0;

    if (!(entry->uncompressed_size > 0))
        return 0;

    return ((mode & UNIX_FILETYPE_MASK) == UNIX_FILETYPE_SYMLINK);
} /* zip_has_symlink_attr */
910
911
912
/*
 * Convert a packed DOS timestamp (date in the upper 16 bits, time in the
 * lower 16) to the value mktime() produces for the same broken-down time.
 */
static PHYSFS_sint64 zip_dos_time_to_physfs_time(PHYSFS_uint32 dostime)
{
    const PHYSFS_uint32 datebits = (PHYSFS_uint32) ((dostime >> 16) & 0xFFFF);
    const PHYSFS_uint32 timebits = (dostime & 0xFFFF);
    struct tm when;

    memset(&when, '\0', sizeof (when));

    /* time of day; seconds are stored halved. */
    when.tm_sec  = ((timebits <<  1) & 0x3E);
    when.tm_min  = ((timebits >>  5) & 0x3F);
    when.tm_hour = ((timebits >> 11) & 0x1F);

    /* calendar date; the year is stored as an offset from 1980. */
    when.tm_mday = ((datebits      ) & 0x1F);
    when.tm_mon  = ((datebits >>  5) & 0x0F) - 1;
    when.tm_year = ((datebits >>  9) & 0x7F) + 80;

    /* let mktime calculate daylight savings time. */
    when.tm_isdst = -1;

    return ((PHYSFS_sint64) mktime(&when));
} /* zip_dos_time_to_physfs_time */
936
937
938
939
static int zip_load_entry(PHYSFS_Io *io, const int zip64, ZIPentry *entry,
PHYSFS_uint64 ofs_fixup)
940
941
942
{
PHYSFS_uint16 fnamelen, extralen, commentlen;
PHYSFS_uint32 external_attr;
943
944
PHYSFS_uint32 starting_disk;
PHYSFS_uint64 offset;
945
946
947
948
949
PHYSFS_uint16 ui16;
PHYSFS_uint32 ui32;
PHYSFS_sint64 si64;
/* sanity check with central directory signature... */
950
951
BAIL_IF_MACRO(!readui32(io, &ui32), ERRPASS, 0);
BAIL_IF_MACRO(ui32 != ZIP_CENTRAL_DIR_SIG, PHYSFS_ERR_CORRUPT, 0);
952
953
/* Get the pertinent parts of the record... */
954
955
956
957
958
BAIL_IF_MACRO(!readui16(io, &entry->version), ERRPASS, 0);
BAIL_IF_MACRO(!readui16(io, &entry->version_needed), ERRPASS, 0);
BAIL_IF_MACRO(!readui16(io, &ui16), ERRPASS, 0); /* general bits */
BAIL_IF_MACRO(!readui16(io, &entry->compression_method), ERRPASS, 0);
BAIL_IF_MACRO(!readui32(io, &ui32), ERRPASS, 0);
959
entry->last_mod_time = zip_dos_time_to_physfs_time(ui32);
960
BAIL_IF_MACRO(!readui32(io, &entry->crc), ERRPASS, 0);
961
962
963
964
BAIL_IF_MACRO(!readui32(io, &ui32), ERRPASS, 0);
entry->compressed_size = (PHYSFS_uint64) ui32;
BAIL_IF_MACRO(!readui32(io, &ui32), ERRPASS, 0);
entry->uncompressed_size = (PHYSFS_uint64) ui32;
965
966
967
BAIL_IF_MACRO(!readui16(io, &fnamelen), ERRPASS, 0);
BAIL_IF_MACRO(!readui16(io, &extralen), ERRPASS, 0);
BAIL_IF_MACRO(!readui16(io, &commentlen), ERRPASS, 0);
968
969
BAIL_IF_MACRO(!readui16(io, &ui16), ERRPASS, 0);
starting_disk = (PHYSFS_uint32) ui16;
970
971
BAIL_IF_MACRO(!readui16(io, &ui16), ERRPASS, 0); /* internal file attribs */
BAIL_IF_MACRO(!readui32(io, &external_attr), ERRPASS, 0);
972
973
BAIL_IF_MACRO(!readui32(io, &ui32), ERRPASS, 0);
offset = (PHYSFS_uint64) ui32;
974
975
976
977
entry->symlink = NULL; /* will be resolved later, if necessary. */
entry->resolved = (zip_has_symlink_attr(entry, external_attr)) ?
ZIP_UNRESOLVED_SYMLINK : ZIP_UNRESOLVED_FILE;
978
979
entry->name = (char *) allocator.Malloc(fnamelen + 1);
980
BAIL_IF_MACRO(entry->name == NULL, PHYSFS_ERR_OUT_OF_MEMORY, 0);
981
if (!__PHYSFS_readAll(io, entry->name, fnamelen))
982
goto zip_load_entry_puked;
983
984
entry->name[fnamelen] = '\0'; /* null-terminate the filename. */
985
zip_convert_dos_path(entry, entry->name);
986
987
si64 = io->tell(io);
988
if (si64 == -1)
989
goto zip_load_entry_puked;
990
991
992
993
994
995
996
997
998
999
1000
/*
* The actual sizes didn't fit in 32-bits; look for the Zip64
* extended information extra field...
*/
if ( (zip64) &&
((offset == 0xFFFFFFFF) ||
(starting_disk == 0xFFFFFFFF) ||
(entry->compressed_size == 0xFFFFFFFF) ||
(entry->uncompressed_size == 0xFFFFFFFF)) )
{