/*
 * ZIP support routines for PhysicsFS.
 *
 * Please see the file LICENSE.txt in the source's root directory.
 *
 *  This file written by Ryan C. Gordon, with some peeking at "unzip.c"
 *   by Gilles Vollant.
 */
10
11
12
13
#define __PHYSICSFS_INTERNAL__
#include "physfs_internal.h"
#if PHYSFS_SUPPORTS_ZIP
14
15
#include <errno.h>
16
#include <time.h>
17
18
19
#include "physfs_miniz.h"
20
/*
 * Size, in bytes, of the scratch buffer allocated for every compressed file
 *  that gets opened (and released again when that file is closed).
 *  Compressed bytes are read from the archive into this buffer and are then
 *  decompressed into the buffer handed to PHYSFS_read().
 *
 * Entries stored without compression never allocate this buffer; their data
 *  is read directly into the buffer handed to PHYSFS_read().
 *
 * Tweak this value to match your speed and memory requirements.
 */
#define ZIP_READBUFSIZE   (16 * 1024)
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
/*
 * Entries are "unresolved" until they are first opened. At that time,
 *  local file headers are parsed/validated, data offsets are updated to look
 *  at the actual file data instead of the header, and symlinks are followed
 *  and optimized. This means that we don't seek and read around the archive
 *  until forced to do so, and after the first time, we have to do less
 *  reading and parsing, which is very CD-ROM friendly.
 */
typedef enum
{
    ZIP_UNRESOLVED_FILE,     /* regular entry, local header not parsed yet. */
    ZIP_UNRESOLVED_SYMLINK,  /* symlink entry, target not followed yet.     */
    ZIP_RESOLVING,           /* resolution in progress (loop detection).    */
    ZIP_RESOLVED,            /* resolution finished successfully.           */
    ZIP_BROKEN_FILE,         /* regular entry that failed to resolve.       */
    ZIP_BROKEN_SYMLINK       /* symlink entry that failed to resolve.       */
} ZipResolveType;
54
55
56
/*
* One ZIPentry is kept for each file in an open ZIP archive.
*/
57
typedef struct _ZIPentry
58
{
59
60
61
char *name; /* Name of file in archive */
struct _ZIPentry *symlink; /* NULL or file we symlink to */
ZipResolveType resolved; /* Have we resolved file/symlink? */
62
PHYSFS_uint64 offset; /* offset of data in archive */
63
64
65
66
PHYSFS_uint16 version; /* version made by */
PHYSFS_uint16 version_needed; /* version needed to extract */
PHYSFS_uint16 compression_method; /* compression method */
PHYSFS_uint32 crc; /* crc-32 */
67
68
PHYSFS_uint64 compressed_size; /* compressed size */
PHYSFS_uint64 uncompressed_size; /* uncompressed size */
69
PHYSFS_sint64 last_mod_time; /* last file mod time */
70
71
} ZIPentry;
72
73
74
/*
* One ZIPinfo is kept for each open ZIP archive.
*/
75
76
typedef struct
{
77
PHYSFS_Io *io; /* the i/o interface for this archive. */
78
79
80
int zip64; /* non-zero if this is a Zip64 archive. */
PHYSFS_uint64 entryCount; /* Number of files in ZIP. */
ZIPentry *entries; /* info on all files in ZIP. */
81
82
} ZIPinfo;
83
84
85
/*
* One ZIPfileinfo is kept for each open file in a ZIP archive.
*/
86
87
typedef struct
{
88
ZIPentry *entry; /* Info on file. */
89
PHYSFS_Io *io; /* physical file handle. */
90
91
92
93
PHYSFS_uint32 compressed_position; /* offset in compressed data. */
PHYSFS_uint32 uncompressed_position; /* tell() position. */
PHYSFS_uint8 *buffer; /* decompression buffer. */
z_stream stream; /* zlib stream state. */
94
95
96
} ZIPfileinfo;
97
/* Magic numbers: record signatures as they read after little-endian decode. */
#define ZIP_LOCAL_FILE_SIG                          0x04034b50
#define ZIP_CENTRAL_DIR_SIG                         0x02014b50
#define ZIP_END_OF_CENTRAL_DIR_SIG                  0x06054b50
#define ZIP64_END_OF_CENTRAL_DIR_SIG                0x06064b50
#define ZIP64_END_OF_CENTRAL_DIRECTORY_LOCATOR_SIG  0x07064b50
#define ZIP64_EXTENDED_INFO_EXTRA_FIELD_SIG         0x0001

/* compression methods... */
#define COMPMETH_NONE 0
/* ...and others... */

/* Unix file type bits, compared against the top 16 bits of external attrs. */
#define UNIX_FILETYPE_MASK    0170000
#define UNIX_FILETYPE_SYMLINK 0120000
114
115
116
117
118
/*
 * zlib allocation hook: forwards a request for (items * size) bytes to the
 *  Malloc entry point of the PHYSFS_Allocator passed in through (opaque).
 */
static voidpf zlibPhysfsAlloc(voidpf opaque, uInt items, uInt size)
{
    PHYSFS_Allocator *physfsalloc = (PHYSFS_Allocator *) opaque;
    return physfsalloc->Malloc(items * size);
} /* zlibPhysfsAlloc */
/*
 * zlib deallocation hook: hands (address) to the Free entry point of the
 *  PHYSFS_Allocator passed in through (opaque).
 */
static void zlibPhysfsFree(voidpf opaque, voidpf address)
{
    PHYSFS_Allocator *physfsalloc = (PHYSFS_Allocator *) opaque;
    physfsalloc->Free(address);
} /* zlibPhysfsFree */
/*
 * Put a z_stream into a sane starting state: every field zeroed, then the
 *  allocation hooks pointed at the bridge functions with the file's
 *  (allocator) as their opaque argument.
 */
static void initializeZStream(z_stream *pstr)
{
    memset(pstr, '\0', sizeof (*pstr));
    pstr->opaque = &allocator;
    pstr->zfree = zlibPhysfsFree;
    pstr->zalloc = zlibPhysfsAlloc;
} /* initializeZStream */
143
static PHYSFS_ErrorCode zlib_error_code(int rc)
144
145
146
{
switch (rc)
{
147
148
149
150
151
case Z_OK: return PHYSFS_ERR_OK; /* not an error. */
case Z_STREAM_END: return PHYSFS_ERR_OK; /* not an error. */
case Z_ERRNO: return PHYSFS_ERR_IO;
case Z_MEM_ERROR: return PHYSFS_ERR_OUT_OF_MEMORY;
default: return PHYSFS_ERR_CORRUPT;
152
} /* switch */
153
154
} /* zlib_error_string */
155
156
157
158
/*
* Wrap all zlib calls in this, so the physfs error state is set appropriately.
*/
159
static int zlib_err(const int rc)
160
{
161
PHYSFS_setErrorCode(zlib_error_code(rc));
162
return rc;
163
164
165
} /* zlib_err */
166
167
168
169
170
171
172
173
174
175
176
/*
 * Read an unsigned 64-bit int from (io) and store it, converted with
 *  PHYSFS_swapULE64(), in (*val). Returns 1 on success, 0 if the read fails.
 */
static int readui64(PHYSFS_Io *io, PHYSFS_uint64 *val)
{
    PHYSFS_uint64 raw;
    BAIL_IF_MACRO(!__PHYSFS_readAll(io, &raw, sizeof (raw)), ERRPASS, 0);
    *val = PHYSFS_swapULE64(raw);
    return 1;
} /* readui64 */
177
178
179
/*
* Read an unsigned 32-bit int and swap to native byte order.
*/
180
static int readui32(PHYSFS_Io *io, PHYSFS_uint32 *val)
181
182
{
PHYSFS_uint32 v;
183
BAIL_IF_MACRO(!__PHYSFS_readAll(io, &v, sizeof (v)), ERRPASS, 0);
184
*val = PHYSFS_swapULE32(v);
185
return 1;
186
187
188
189
190
191
} /* readui32 */
/*
* Read an unsigned 16-bit int and swap to native byte order.
*/
192
static int readui16(PHYSFS_Io *io, PHYSFS_uint16 *val)
193
194
{
PHYSFS_uint16 v;
195
BAIL_IF_MACRO(!__PHYSFS_readAll(io, &v, sizeof (v)), ERRPASS, 0);
196
*val = PHYSFS_swapULE16(v);
197
return 1;
198
199
200
} /* readui16 */
201
/*
 * PHYSFS_Io read handler for a file inside a ZIP archive.
 *
 * Copies up to (len) bytes of the entry's uncompressed data into (buf),
 *  never going past the end of the entry. Stored entries are read straight
 *  from the underlying i/o; compressed entries are refilled through
 *  finfo->buffer in chunks of at most ZIP_READBUFSIZE and inflated into
 *  (buf). Returns the byte count produced by the underlying read/inflate
 *  and advances the tell() position by that amount when it is positive.
 */
static PHYSFS_sint64 ZIP_read(PHYSFS_Io *_io, void *buf, PHYSFS_uint64 len)
{
    ZIPfileinfo *finfo = (ZIPfileinfo *) _io->opaque;
    ZIPentry *entry = finfo->entry;
    PHYSFS_Io *io = finfo->io;
    const PHYSFS_sint64 remaining = entry->uncompressed_size -
                                    finfo->uncompressed_position;
    PHYSFS_sint64 want = (PHYSFS_sint64) len;
    PHYSFS_sint64 got = 0;

    if (remaining < want)
        want = remaining;  /* don't run past the end of the entry. */

    BAIL_IF_MACRO(want == 0, ERRPASS, 0);  /* quick rejection. */

    if (entry->compression_method == COMPMETH_NONE)
        got = io->read(io, buf, want);

    else
    {
        z_stream *zs = &finfo->stream;

        zs->next_out = buf;
        zs->avail_out = (uInt) want;

        while (got < want)
        {
            const PHYSFS_uint32 before = zs->total_out;
            int rc;

            /* input exhausted: pull the next chunk of compressed bytes. */
            if (zs->avail_in == 0)
            {
                PHYSFS_sint64 br = entry->compressed_size -
                                   finfo->compressed_position;
                if (br > 0)
                {
                    if (br > ZIP_READBUFSIZE)
                        br = ZIP_READBUFSIZE;

                    br = io->read(io, finfo->buffer, (PHYSFS_uint64) br);
                    if (br <= 0)
                        break;

                    finfo->compressed_position += (PHYSFS_uint32) br;
                    zs->next_in = finfo->buffer;
                    zs->avail_in = (PHYSFS_uint32) br;
                } /* if */
            } /* if */

            rc = zlib_err(inflate(zs, Z_SYNC_FLUSH));
            got += (zs->total_out - before);

            if (rc != Z_OK)
                break;
        } /* while */
    } /* else */

    if (got > 0)
        finfo->uncompressed_position += (PHYSFS_uint32) got;

    return got;
} /* ZIP_read */
263
/*
 * PHYSFS_Io write handler: this i/o has no write support, so every call
 *  fails with PHYSFS_ERR_READ_ONLY and returns -1.
 */
static PHYSFS_sint64 ZIP_write(PHYSFS_Io *io, const void *b, PHYSFS_uint64 len)
{
    /* nothing is ever written; the arguments are ignored. */
    BAIL_MACRO(PHYSFS_ERR_READ_ONLY, -1);
} /* ZIP_write */
269
/*
 * PHYSFS_Io tell handler: reports the current position within the entry's
 *  uncompressed data.
 */
static PHYSFS_sint64 ZIP_tell(PHYSFS_Io *io)
{
    const ZIPfileinfo *finfo = (const ZIPfileinfo *) io->opaque;
    return finfo->uncompressed_position;
} /* ZIP_tell */
275
/*
 * PHYSFS_Io seek handler for a file inside a ZIP archive.
 *
 * (offset) is a position within the entry's uncompressed data; seeking past
 *  the uncompressed size fails with PHYSFS_ERR_PAST_EOF. Stored entries map
 *  directly to a seek on the underlying i/o. Compressed entries cannot be
 *  randomly accessed: a backwards seek restarts decompression from the
 *  beginning of the entry's data, and in either direction the stream is then
 *  decoded and discarded until (offset) is reached.
 *
 * Returns 1 on success, 0 on failure.
 */
static int ZIP_seek(PHYSFS_Io *_io, PHYSFS_uint64 offset)
{
    ZIPfileinfo *finfo = (ZIPfileinfo *) _io->opaque;
    ZIPentry *entry = finfo->entry;
    PHYSFS_Io *io = finfo->io;

    BAIL_IF_MACRO(offset > entry->uncompressed_size, PHYSFS_ERR_PAST_EOF, 0);

    if (entry->compression_method == COMPMETH_NONE)
    {
        const PHYSFS_sint64 newpos = offset + entry->offset;
        BAIL_IF_MACRO(!io->seek(io, newpos), ERRPASS, 0);
        finfo->uncompressed_position = (PHYSFS_uint32) offset;
    } /* if */

    else
    {
        /*
         * If seeking backwards, we need to redecode the file
         *  from the start and throw away the compressed bits until we hit
         *  the offset we need. If seeking forward, we still need to
         *  decode, but we don't rewind first.
         */
        if (offset < finfo->uncompressed_position)
        {
            /* we do a copy so state is sane if inflateInit2() fails. */
            z_stream str;
            initializeZStream(&str);
            if (zlib_err(inflateInit2(&str, -MAX_WBITS)) != Z_OK)
                return 0;

            if (!io->seek(io, entry->offset))
            {
                /*
                 * The replacement stream was initialized but will never be
                 *  installed; release it so its state isn't leaked. The
                 *  existing stream in (finfo) is left untouched.
                 */
                inflateEnd(&str);
                return 0;
            } /* if */

            inflateEnd(&finfo->stream);
            memcpy(&finfo->stream, &str, sizeof (z_stream));
            finfo->uncompressed_position = finfo->compressed_position = 0;
        } /* if */

        /* decode and discard, at most sizeof (buf) bytes at a time. */
        while (finfo->uncompressed_position != offset)
        {
            PHYSFS_uint8 buf[512];
            PHYSFS_uint32 maxread;

            maxread = (PHYSFS_uint32) (offset - finfo->uncompressed_position);
            if (maxread > sizeof (buf))
                maxread = sizeof (buf);

            if (ZIP_read(_io, buf, maxread) != maxread)
                return 0;
        } /* while */
    } /* else */

    return 1;
} /* ZIP_seek */
332
/*
 * PHYSFS_Io length handler: the length of an open file is the uncompressed
 *  size recorded in its ZIPentry.
 */
static PHYSFS_sint64 ZIP_length(PHYSFS_Io *io)
{
    const ZIPfileinfo *finfo = (ZIPfileinfo *) io->opaque;
    const ZIPentry *entry = finfo->entry;
    return (PHYSFS_sint64) entry->uncompressed_size;
} /* ZIP_length */
337
338
339
340
341
/* (forward reference: defined further down in this file.) */
static PHYSFS_Io *zip_get_io(PHYSFS_Io *io, ZIPinfo *inf, ZIPentry *entry);

/*
 * PHYSFS_Io duplicate handler.
 *
 * Builds a second, independent handle on the same ZIPentry: a new
 *  ZIPfileinfo with its own underlying i/o (from zip_get_io()) and, for
 *  compressed entries, its own read buffer and inflate stream. The new
 *  handle's positions start at zero.
 *
 * Returns the new PHYSFS_Io, or NULL on failure, in which case everything
 *  allocated here has been released again.
 */
static PHYSFS_Io *ZIP_duplicate(PHYSFS_Io *io)
{
    ZIPfileinfo *origfinfo = (ZIPfileinfo *) io->opaque;
    PHYSFS_Io *retval = (PHYSFS_Io *) allocator.Malloc(sizeof (PHYSFS_Io));
    ZIPfileinfo *finfo = (ZIPfileinfo *) allocator.Malloc(sizeof (ZIPfileinfo));

    /*
     * Zero (finfo) before anything can jump to the cleanup code, which
     *  inspects finfo->io and finfo->buffer; otherwise a failed (retval)
     *  allocation would make it read indeterminate pointers.
     */
    if (finfo != NULL)
        memset(finfo, '\0', sizeof (*finfo));

    GOTO_IF_MACRO(!retval, PHYSFS_ERR_OUT_OF_MEMORY, failed);
    GOTO_IF_MACRO(!finfo, PHYSFS_ERR_OUT_OF_MEMORY, failed);

    finfo->entry = origfinfo->entry;
    finfo->io = zip_get_io(origfinfo->io, NULL, finfo->entry);
    GOTO_IF_MACRO(!finfo->io, ERRPASS, failed);

    if (finfo->entry->compression_method != COMPMETH_NONE)
    {
        finfo->buffer = (PHYSFS_uint8 *) allocator.Malloc(ZIP_READBUFSIZE);
        GOTO_IF_MACRO(!finfo->buffer, PHYSFS_ERR_OUT_OF_MEMORY, failed);

        /* install the allocator hooks, same as ZIP_seek() does. */
        initializeZStream(&finfo->stream);
        if (zlib_err(inflateInit2(&finfo->stream, -MAX_WBITS)) != Z_OK)
            goto failed;
    } /* if */

    /* start from the original's function table, then attach our state. */
    memcpy(retval, io, sizeof (PHYSFS_Io));
    retval->opaque = finfo;
    return retval;

failed:
    if (finfo != NULL)
    {
        if (finfo->io != NULL)
            finfo->io->destroy(finfo->io);

        if (finfo->buffer != NULL)
        {
            allocator.Free(finfo->buffer);
            inflateEnd(&finfo->stream);
        } /* if */

        allocator.Free(finfo);
    } /* if */

    if (retval != NULL)
        allocator.Free(retval);

    return NULL;
} /* ZIP_duplicate */
/*
 * PHYSFS_Io flush handler: always reports success.
 */
static int ZIP_flush(PHYSFS_Io *io)
{
    return 1;  /* no write support. */
} /* ZIP_flush */
/*
 * PHYSFS_Io destroy handler: closes the underlying i/o, shuts down the
 *  inflate stream of a compressed entry, and frees the read buffer, the
 *  ZIPfileinfo and the PHYSFS_Io itself.
 */
static void ZIP_destroy(PHYSFS_Io *io)
{
    ZIPfileinfo *finfo = (ZIPfileinfo *) io->opaque;
    PHYSFS_Io *under = finfo->io;

    under->destroy(under);

    if (finfo->entry->compression_method != COMPMETH_NONE)
        inflateEnd(&finfo->stream);

    if (finfo->buffer != NULL)
        allocator.Free(finfo->buffer);

    allocator.Free(finfo);
    allocator.Free(io);
} /* ZIP_destroy */
static const PHYSFS_Io ZIP_Io =
{
407
CURRENT_PHYSFS_IO_API_VERSION, NULL,
408
409
410
411
412
413
414
ZIP_read,
ZIP_write,
ZIP_seek,
ZIP_tell,
ZIP_length,
ZIP_duplicate,
ZIP_flush,
415
ZIP_destroy
416
417
};
418
419
420
/*
 * Locate the end-of-central-directory record by scanning backwards from the
 *  end of the file for its 4-byte signature (0x50 0x4B 0x05 0x06).
 *
 * On success, returns the file offset of the signature and, if (len) is not
 *  NULL, stores the total file length in (*len). Returns -1 on failure:
 *  i/o errors are passed through, and a missing signature is reported as
 *  PHYSFS_ERR_UNSUPPORTED.
 */
static PHYSFS_sint64 zip_find_end_of_central_dir(PHYSFS_Io *io, PHYSFS_sint64 *len)
{
    PHYSFS_uint8 buf[256];
    PHYSFS_uint8 extra[4] = { 0, 0, 0, 0 };
    PHYSFS_sint32 i = 0;
    PHYSFS_sint64 filelen;
    PHYSFS_sint64 filepos;
    PHYSFS_sint32 maxread;
    PHYSFS_sint32 totalread = 0;
    int found = 0;

    filelen = io->length(io);
    BAIL_IF_MACRO(filelen == -1, ERRPASS, -1);

    /*
     * Jump to the end of the file and start reading backwards.
     *  The last thing in the file is the zipfile comment, which is variable
     *  length, and the field that specifies its size is before it in the
     *  file (argh!)...this means that we need to scan backwards until we
     *  hit the end-of-central-dir signature. We can then sanity check that
     *  the comment was as big as it should be to make sure we're in the
     *  right place. The comment length field is 16 bits, so we can stop
     *  searching for that signature after a little more than 64k at most,
     *  and call it a corrupted zipfile.
     */

    if (sizeof (buf) < filelen)
    {
        filepos = filelen - sizeof (buf);
        maxread = sizeof (buf);
    } /* if */
    else
    {
        filepos = 0;
        maxread = (PHYSFS_uint32) filelen;
    } /* else */

    while ((totalread < filelen) && (totalread < 65557))
    {
        BAIL_IF_MACRO(!io->seek(io, filepos), ERRPASS, -1);

        /* make sure we catch a signature between buffers. */
        if (totalread != 0)
        {
            /* new data in front, first 4 bytes of the last pass behind it. */
            if (!__PHYSFS_readAll(io, buf, maxread - 4))
                return -1;
            memcpy(&buf[maxread - 4], &extra, sizeof (extra));
            totalread += maxread - 4;
        } /* if */
        else
        {
            if (!__PHYSFS_readAll(io, buf, maxread))
                return -1;
            totalread += maxread;
        } /* else */

        memcpy(&extra, buf, sizeof (extra));

        /*
         * Scan this window from its end down to, and including, index 0.
         *  Index 0 has to be tested too: when the window starts at file
         *  offset 0 there is no later pass that could pick it up, which is
         *  the case for an archive that consists of nothing but the
         *  end-of-central-dir record.
         */
        for (i = maxread - 4; i >= 0; i--)
        {
            if ((buf[i + 0] == 0x50) &&
                (buf[i + 1] == 0x4B) &&
                (buf[i + 2] == 0x05) &&
                (buf[i + 3] == 0x06) )
            {
                found = 1;  /* that's the signature! */
                break;
            } /* if */
        } /* for */

        if (found)
            break;

        filepos -= (maxread - 4);
        if (filepos < 0)
            filepos = 0;
    } /* while */

    BAIL_IF_MACRO(!found, PHYSFS_ERR_UNSUPPORTED, -1);

    if (len != NULL)
        *len = filelen;

    return (filepos + i);
} /* zip_find_end_of_central_dir */
505
506
507
/*
 * Decide whether (io) looks like a ZIP archive. Returns non-zero if it
 *  does, zero if it doesn't or if the first four bytes can't be read.
 */
static int isZip(PHYSFS_Io *io)
{
    PHYSFS_uint32 sig = 0;

    /*
     * The first thing in a zip file might be the signature of the
     *  first local file record, so it makes for a quick determination.
     */
    if (!readui32(io, &sig))
        return 0;

    if (sig == ZIP_LOCAL_FILE_SIG)
        return 1;

    /*
     * No sig...might be a ZIP with data at the start
     *  (a self-extracting executable, etc), so we'll have to do
     *  it the hard way...
     */
    return (zip_find_end_of_central_dir(io, NULL) != -1);
} /* isZip */
532
533
534
/*
 * Free the name of each of the first (max) items in (entries), then free
 *  the (entries) array itself.
 */
static void zip_free_entries(ZIPentry *entries, PHYSFS_uint64 max)
{
    ZIPentry *cur = entries;
    PHYSFS_uint64 remaining;

    for (remaining = max; remaining > 0; remaining--, cur++)
    {
        if (cur->name != NULL)
            allocator.Free(cur->name);
    } /* for */

    allocator.Free(entries);
} /* zip_free_entries */
548
549
550
551
552
/*
* This will find the ZIPentry associated with a path in platform-independent
* notation. Directories don't have ZIPentries associated with them, but
* (*isDir) will be set to non-zero if a dir was hit.
*/
553
554
static ZIPentry *zip_find_entry(const ZIPinfo *info, const char *path,
int *isDir)
555
556
{
ZIPentry *a = info->entries;
557
PHYSFS_sint32 pathlen = (PHYSFS_sint32) strlen(path);
558
559
560
PHYSFS_sint64 lo = 0;
PHYSFS_sint64 hi = (PHYSFS_sint64) (info->entryCount - 1);
PHYSFS_sint64 middle;
561
const char *thispath = NULL;
562
563
564
565
int rc;
while (lo <= hi)
{
566
567
568
middle = lo + ((hi - lo) / 2);
thispath = a[middle].name;
rc = strncmp(path, thispath, pathlen);
569
570
if (rc > 0)
571
lo = middle + 1;
572
573
else if (rc < 0)
574
hi = middle - 1;
575
576
577
else /* substring match...might be dir or entry or nothing. */
{
578
579
if (isDir != NULL)
{
580
581
*isDir = (thispath[pathlen] == '/');
if (*isDir)
582
return NULL;
583
584
585
} /* if */
if (thispath[pathlen] == '\0') /* found entry? */
586
return &a[middle];
587
588
589
/* adjust search params, try again. */
else if (thispath[pathlen] > '/')
hi = middle - 1;
590
else
591
lo = middle + 1;
592
593
} /* if */
} /* while */
594
595
596
if (isDir != NULL)
*isDir = 0;
597
598
BAIL_MACRO(PHYSFS_ERR_NOT_FOUND, NULL);
599
} /* zip_find_entry */
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
/*
 * Convert paths from old, buggy DOS zippers: when the host type in the high
 *  byte of the entry's "version made by" field is 0 (FS_FAT_), every
 *  backslash in (path) is replaced, in place, by a forward slash.
 */
static void zip_convert_dos_path(ZIPentry *entry, char *path)
{
    const PHYSFS_uint8 hosttype = (PHYSFS_uint8) ((entry->version >> 8) & 0xFF);
    char *ptr;

    if (hosttype != 0)  /* not FS_FAT_: leave the path alone. */
        return;

    for (ptr = path; *ptr != '\0'; ptr++)
    {
        if (*ptr == '\\')
            *ptr = '/';
    } /* for */
} /* zip_convert_dos_path */
616
617
618
/*
 * Normalize a symlink target, in place, by resolving "." and ".." path
 *  components. The result is never longer than the input.
 *
 *  - A "." component is dropped.
 *  - A ".." component removes the component before it, when there is a
 *    real one to remove. A ".." that has nothing to cancel (at the start of
 *    the path, or right after an empty component) is kept as-is, so a
 *    target that points outside of the archive still fails to look up
 *    instead of silently resolving to something else.
 *  - Every other component, including names that merely start with a dot
 *    (".hidden", "..data") and empty components (leading, trailing or
 *    doubled slashes), is copied through untouched.
 */
static void zip_expand_symlink_path(char *path)
{
    const char *src = path;  /* next unread component of the input.     */
    char *dst = path;        /* end of the normalized output so far.    */
    int emitted = 0;         /* components currently held in the output. */

    /*
     * The output is built over the start of the input. That is safe: by
     *  the time something is written, at least that many input bytes
     *  (components plus separators) have already been consumed.
     */
    while (1)
    {
        const char *sep = strchr(src, '/');
        const size_t len = (sep != NULL) ? (size_t) (sep - src) : strlen(src);
        int keep = 1;

        if ((len == 1) && (src[0] == '.'))
            keep = 0;  /* current dir: ditch it. */

        else if ((len == 2) && (src[0] == '.') && (src[1] == '.') &&
                 (emitted > 0))
        {
            /* parent dir: move back one, if possible. */
            char *last = dst;
            size_t lastlen;

            while ((last != path) && (*(last - 1) != '/'))
                last--;  /* find where the last emitted component starts. */
            lastlen = (size_t) (dst - last);

            if ((lastlen > 0) &&
                !((lastlen == 2) && (last[0] == '.') && (last[1] == '.')))
            {
                /* drop that component along with the slash in front of it. */
                dst = (last != path) ? (last - 1) : path;
                emitted--;
                keep = 0;
            } /* if */
        } /* else if */

        if (keep)
        {
            if (emitted > 0)
                *(dst++) = '/';
            memmove(dst, src, len);
            dst += len;
            emitted++;
        } /* if */

        if (sep == NULL)
            break;
        src = sep + 1;
    } /* while */

    *dst = '\0';
} /* zip_expand_symlink_path */
675
676
/* (forward reference: zip_follow_symlink and zip_resolve call each other.) */
677
static int zip_resolve(PHYSFS_Io *io, ZIPinfo *info, ZIPentry *entry);
678
679
/*
680
681
682
* Look for the entry named by (path). If it exists, resolve it, and return
* a pointer to that entry. If it's another symlink, keep resolving until you
* hit a real file and then return a pointer to the final non-symlink entry.
683
* If there's a problem, return NULL.
684
*/
685
static ZIPentry *zip_follow_symlink(PHYSFS_Io *io, ZIPinfo *info, char *path)
686
{
687
688
689
ZIPentry *entry;
zip_expand_symlink_path(path);
690
entry = zip_find_entry(info, path, NULL);
691
692
if (entry != NULL)
{
693
if (!zip_resolve(io, info, entry)) /* recursive! */
694
695
696
697
698
699
700
701
entry = NULL;
else
{
if (entry->symlink != NULL)
entry = entry->symlink;
} /* else */
} /* if */
702
return entry;
703
} /* zip_follow_symlink */
704
705
706
/*
 * Read the target path stored as the data of symlink (entry), inflating it
 *  first if the entry is compressed, and point entry->symlink at the entry
 *  that path leads to.
 *
 * Returns non-zero if entry->symlink ended up non-NULL, zero otherwise.
 */
static int zip_resolve_symlink(PHYSFS_Io *io, ZIPinfo *info, ZIPentry *entry)
{
    const PHYSFS_uint64 size = entry->uncompressed_size;
    char *path = NULL;
    int rc = 0;

    /*
     * We've already parsed the local file header of the symlink at this
     *  point. Now we need to read the actual link from the file data and
     *  follow it.
     */

    BAIL_IF_MACRO(!io->seek(io, entry->offset), ERRPASS, 0);

    path = (char *) __PHYSFS_smallAlloc(size + 1);  /* +1 for terminator. */
    BAIL_IF_MACRO(!path, PHYSFS_ERR_OUT_OF_MEMORY, 0);

    if (entry->compression_method == COMPMETH_NONE)
        rc = __PHYSFS_readAll(io, path, size);

    else  /* symlink target path is compressed... */
    {
        z_stream stream;
        const PHYSFS_uint64 complen = entry->compressed_size;
        PHYSFS_uint8 *compressed = (PHYSFS_uint8*) __PHYSFS_smallAlloc(complen);

        if (compressed != NULL)
        {
            /* set up the whole-buffer inflate before touching the file. */
            initializeZStream(&stream);
            stream.next_in = compressed;
            stream.avail_in = complen;
            stream.next_out = (unsigned char *) path;
            stream.avail_out = size;

            if ( (__PHYSFS_readAll(io, compressed, complen)) &&
                 (zlib_err(inflateInit2(&stream, -MAX_WBITS)) == Z_OK) )
            {
                const int zrc = zlib_err(inflate(&stream, Z_FINISH));
                inflateEnd(&stream);

                /* both are acceptable outcomes... */
                rc = ((zrc == Z_OK) || (zrc == Z_STREAM_END));
            } /* if */

            __PHYSFS_smallFree(compressed);
        } /* if */
    } /* else */

    if (rc)
    {
        path[size] = '\0';  /* null-terminate it. */
        zip_convert_dos_path(entry, path);
        entry->symlink = zip_follow_symlink(io, info, path);
    } /* if */

    __PHYSFS_smallFree(path);

    return (entry->symlink != NULL);
} /* zip_resolve_symlink */
/*
* Parse the local file header of an entry, and update entry->offset.
*/
769
static int zip_parse_local(PHYSFS_Io *io, ZIPentry *entry)
770
771
772
773
774
775
{
PHYSFS_uint32 ui32;
PHYSFS_uint16 ui16;
PHYSFS_uint16 fnamelen;
PHYSFS_uint16 extralen;
776
777
778
779
780
/*
* crc and (un)compressed_size are always zero if this is a "JAR"
* archive created with Sun's Java tools, apparently. We only
* consider this archive corrupted if those entries don't match and
* aren't zero. That seems to work well.
781
782
* We also ignore a mismatch if the value is 0xFFFFFFFF here, since it's
* possible that's a Zip64 thing.
783
784
*/
785
786
787
788
789
790
791
792
793
794
795
BAIL_IF_MACRO(!io->seek(io, entry->offset), ERRPASS, 0);
BAIL_IF_MACRO(!readui32(io, &ui32), ERRPASS, 0);
BAIL_IF_MACRO(ui32 != ZIP_LOCAL_FILE_SIG, PHYSFS_ERR_CORRUPT, 0);
BAIL_IF_MACRO(!readui16(io, &ui16), ERRPASS, 0);
BAIL_IF_MACRO(ui16 != entry->version_needed, PHYSFS_ERR_CORRUPT, 0);
BAIL_IF_MACRO(!readui16(io, &ui16), ERRPASS, 0); /* general bits. */
BAIL_IF_MACRO(!readui16(io, &ui16), ERRPASS, 0);
BAIL_IF_MACRO(ui16 != entry->compression_method, PHYSFS_ERR_CORRUPT, 0);
BAIL_IF_MACRO(!readui32(io, &ui32), ERRPASS, 0); /* date/time */
BAIL_IF_MACRO(!readui32(io, &ui32), ERRPASS, 0);
BAIL_IF_MACRO(ui32 && (ui32 != entry->crc), PHYSFS_ERR_CORRUPT, 0);
796
797
BAIL_IF_MACRO(!readui32(io, &ui32), ERRPASS, 0);
798
799
800
BAIL_IF_MACRO(ui32 && (ui32 != 0xFFFFFFFF) &&
(ui32 != entry->compressed_size), PHYSFS_ERR_CORRUPT, 0);
801
BAIL_IF_MACRO(!readui32(io, &ui32), ERRPASS, 0);
802
803
804
BAIL_IF_MACRO(ui32 && (ui32 != 0xFFFFFFFF) &&
(ui32 != entry->uncompressed_size), PHYSFS_ERR_CORRUPT, 0);
805
806
BAIL_IF_MACRO(!readui16(io, &fnamelen), ERRPASS, 0);
BAIL_IF_MACRO(!readui16(io, &extralen), ERRPASS, 0);
807
808
entry->offset += fnamelen + extralen + 30;
809
return 1;
810
811
812
} /* zip_parse_local */
813
/*
 * Make sure (entry) is resolved: its local header validated, its offset
 *  pointing at the file data and, for a symlink, its target located.
 *
 * Returns non-zero on success. Entries that already failed to resolve are
 *  reported as PHYSFS_ERR_CORRUPT without trying again, and an entry that is
 *  reached again while it is still being resolved is reported as
 *  PHYSFS_ERR_SYMLINK_LOOP.
 */
static int zip_resolve(PHYSFS_Io *io, ZIPinfo *info, ZIPentry *entry)
{
    const ZipResolveType prior = entry->resolved;
    int is_symlink;
    int ok;

    /* Don't bother if we've failed to resolve this entry before. */
    BAIL_IF_MACRO(prior == ZIP_BROKEN_FILE, PHYSFS_ERR_CORRUPT, 0);
    BAIL_IF_MACRO(prior == ZIP_BROKEN_SYMLINK, PHYSFS_ERR_CORRUPT, 0);

    /* uhoh...infinite symlink loop! */
    BAIL_IF_MACRO(prior == ZIP_RESOLVING, PHYSFS_ERR_SYMLINK_LOOP, 0);

    if (prior == ZIP_RESOLVED)
        return 1;  /* all the work was done on an earlier call. */

    /*
     * We fix up the offset to point to the actual data on the
     *  first open, since we don't want to seek across the whole file on
     *  archive open (can be SLOW on large, CD-stored files), but we
     *  need to check the local file header...not just for corruption,
     *  but since it stores offset info the central directory does not.
     */
    is_symlink = (prior == ZIP_UNRESOLVED_SYMLINK);
    entry->resolved = ZIP_RESOLVING;

    ok = zip_parse_local(io, entry);

    /*
     * If it's a symlink, find the original file. This will cause
     *  resolution of other entries (other symlinks and, eventually,
     *  the real file) if all goes well.
     */
    if (ok && is_symlink)
        ok = zip_resolve_symlink(io, info, entry);

    if (is_symlink)
        entry->resolved = ((ok) ? ZIP_RESOLVED : ZIP_BROKEN_SYMLINK);
    else if (prior == ZIP_UNRESOLVED_FILE)
        entry->resolved = ((ok) ? ZIP_RESOLVED : ZIP_BROKEN_FILE);

    return ok;
} /* zip_resolve */
856
857
858
/*
 * Report whether the platform that made an entry could have stored a
 *  symlink. The host type is the high byte of the low 16 bits of (version).
 *  Returns 0 for the listed host types and 1 for everything else.
 */
static int zip_version_does_symlinks(PHYSFS_uint32 version)
{
    const PHYSFS_uint8 hosttype = (PHYSFS_uint8) ((version >> 8) & 0xFF);

    switch (hosttype)
    {
        /*
         * These are the platforms that can NOT build an archive with
         *  symlinks, according to the Info-ZIP project.
         */
        case 0:   /* FS_FAT_  */
        case 1:   /* AMIGA_   */
        case 2:   /* VMS_     */
        case 4:   /* VM_CSM_  */
        case 6:   /* FS_HPFS_ */
        case 11:  /* FS_NTFS_ */
        case 14:  /* FS_VFAT_ */
        case 13:  /* ACORN_   */
        case 15:  /* MVS_     */
        case 18:  /* THEOS_   */
            return 0;

        default:  /* assume the rest to be unix-like. */
            break;
    } /* switch */

    return 1;
} /* zip_version_does_symlinks */
890
static int zip_entry_is_symlink(const ZIPentry *entry)
891
{
892
893
894
return ((entry->resolved == ZIP_UNRESOLVED_SYMLINK) ||
(entry->resolved == ZIP_BROKEN_SYMLINK) ||
(entry->symlink));
895
} /* zip_entry_is_symlink */
896
897
898
/*
 * Non-zero if (entry) should be treated as a symlink: its creating platform
 *  can store symlinks, it has a non-zero uncompressed size, and the Unix
 *  file type held in the top 16 bits of (extern_attr) says "symlink".
 */
static int zip_has_symlink_attr(ZIPentry *entry, PHYSFS_uint32 extern_attr)
{
    const PHYSFS_uint16 xattr = ((extern_attr >> 16) & 0xFFFF);

    if (!zip_version_does_symlinks(entry->version))
        return 0;

    if (entry->uncompressed_size == 0)
        return 0;

    return ((xattr & UNIX_FILETYPE_MASK) == UNIX_FILETYPE_SYMLINK);
} /* zip_has_symlink_attr */
905
906
907
/*
 * Convert a packed DOS timestamp (date in the high 16 bits, time in the low
 *  16 bits) to the value mktime() produces for the same broken-down time.
 */
static PHYSFS_sint64 zip_dos_time_to_physfs_time(PHYSFS_uint32 dostime)
{
    const PHYSFS_uint32 dosdate = (PHYSFS_uint32) ((dostime >> 16) & 0xFFFF);
    const PHYSFS_uint32 dosclock = dostime & 0xFFFF;
    struct tm unixtime;

    memset(&unixtime, '\0', sizeof (unixtime));

    /* dissect date */
    unixtime.tm_mday = ((dosdate     ) & 0x1F);
    unixtime.tm_mon  = ((dosdate >> 5) & 0x0F) - 1;   /* tm_mon is 0-based. */
    unixtime.tm_year = ((dosdate >> 9) & 0x7F) + 80;  /* DOS counts from 1980. */

    /* dissect time */
    unixtime.tm_sec  = ((dosclock <<  1) & 0x3E);     /* stored as secs / 2. */
    unixtime.tm_min  = ((dosclock >>  5) & 0x3F);
    unixtime.tm_hour = ((dosclock >> 11) & 0x1F);

    /* let mktime calculate daylight savings time. */
    unixtime.tm_isdst = -1;

    return ((PHYSFS_sint64) mktime(&unixtime));
} /* zip_dos_time_to_physfs_time */
931
932
933
934
static int zip_load_entry(PHYSFS_Io *io, const int zip64, ZIPentry *entry,
PHYSFS_uint64 ofs_fixup)
935
936
937
{
PHYSFS_uint16 fnamelen, extralen, commentlen;
PHYSFS_uint32 external_attr;
938
939
PHYSFS_uint32 starting_disk;
PHYSFS_uint64 offset;
940
941
942
943
944
PHYSFS_uint16 ui16;
PHYSFS_uint32 ui32;
PHYSFS_sint64 si64;
/* sanity check with central directory signature... */
945
946
BAIL_IF_MACRO(!readui32(io, &ui32), ERRPASS, 0);
BAIL_IF_MACRO(ui32 != ZIP_CENTRAL_DIR_SIG, PHYSFS_ERR_CORRUPT, 0);
947
948
/* Get the pertinent parts of the record... */
949
950
951
952
953
BAIL_IF_MACRO(!readui16(io, &entry->version), ERRPASS, 0);
BAIL_IF_MACRO(!readui16(io, &entry->version_needed), ERRPASS, 0);
BAIL_IF_MACRO(!readui16(io, &ui16), ERRPASS, 0); /* general bits */
BAIL_IF_MACRO(!readui16(io, &entry->compression_method), ERRPASS, 0);
BAIL_IF_MACRO(!readui32(io, &ui32), ERRPASS, 0);
954
entry->last_mod_time = zip_dos_time_to_physfs_time(ui32);
955
BAIL_IF_MACRO(!readui32(io, &entry->crc), ERRPASS, 0);
956
957
958
959
BAIL_IF_MACRO(!readui32(io, &ui32), ERRPASS, 0);
entry->compressed_size = (PHYSFS_uint64) ui32;
BAIL_IF_MACRO(!readui32(io, &ui32), ERRPASS, 0);
entry->uncompressed_size = (PHYSFS_uint64) ui32;
960
961
962
BAIL_IF_MACRO(!readui16(io, &fnamelen), ERRPASS, 0);
BAIL_IF_MACRO(!readui16(io, &extralen), ERRPASS, 0);
BAIL_IF_MACRO(!readui16(io, &commentlen), ERRPASS, 0);
963
964
BAIL_IF_MACRO(!readui16(io, &ui16), ERRPASS, 0);
starting_disk = (PHYSFS_uint32) ui16;
965
966
BAIL_IF_MACRO(!readui16(io, &ui16), ERRPASS, 0); /* internal file attribs */
BAIL_IF_MACRO(!readui32(io, &external_attr), ERRPASS, 0);
967
968
BAIL_IF_MACRO(!readui32(io, &ui32), ERRPASS, 0);
offset = (PHYSFS_uint64) ui32;
969
970
971
972
entry->symlink = NULL; /* will be resolved later, if necessary. */
entry->resolved = (zip_has_symlink_attr(entry, external_attr)) ?
ZIP_UNRESOLVED_SYMLINK : ZIP_UNRESOLVED_FILE;
973
974
entry->name = (char *) allocator.Malloc(fnamelen + 1);
975
BAIL_IF_MACRO(entry->name == NULL, PHYSFS_ERR_OUT_OF_MEMORY, 0);
976
if (!__PHYSFS_readAll(io, entry->name, fnamelen))
977
goto zip_load_entry_puked;
978
979
entry->name[fnamelen] = '\0'; /* null-terminate the filename. */
980
zip_convert_dos_path(entry, entry->name);
981
982
si64 = io->tell(io);
983
if (si64 == -1)
984
goto zip_load_entry_puked;
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
/*
* The actual sizes didn't fit in 32-bits; look for the Zip64
* extended information extra field...
*/
if ( (zip64) &&
((offset == 0xFFFFFFFF) ||
(starting_disk == 0xFFFFFFFF) ||
(entry->compressed_size == 0xFFFFFFFF) ||
(entry->uncompressed_size == 0xFFFFFFFF)) )
{
int found = 0;
PHYSFS_uint16 sig, len;
while (extralen > 4)
{
if (!readui16(io, &sig))