/
zip.c
1440 lines (1172 loc) · 43.6 KB
1
2
3
4
5
/*
 * ZIP support routines for PhysicsFS.
 *
 * Please see the file LICENSE in the source's root directory.
 *
 *  This file written by Ryan C. Gordon, with some peeking at "unzip.c"
 *   by Gilles Vollant.
 */
10
11
#if (defined PHYSFS_SUPPORTS_ZIP)
12
13
#include <stdio.h>
#include <stdlib.h>
14
#include <string.h>
15
#ifndef _WIN32_WCE
16
#include <errno.h>
17
#include <time.h>
18
#endif
19
20
#include "physfs.h"
#include "zlib.h"
21
22
23
24
#define __PHYSICSFS_INTERNAL__
#include "physfs_internal.h"
25
/*
 * Size, in bytes, of the staging buffer allocated for each compressed file
 *  that gets opened; the buffer is freed again when the file is closed.
 *  Compressed data is read from the archive into this buffer and is then
 *  decompressed into the buffer passed to PHYSFS_read().
 *
 * Uncompressed entries in a zipfile never allocate this buffer; their data
 *  is read directly into the buffer passed to PHYSFS_read().
 *
 * Tweak this value to match your speed and memory requirements.
 */
#define ZIP_READBUFSIZE (16 * 1024)
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
/*
 * Resolution state of an archive entry.
 *
 * Entries are "unresolved" until they are first opened. At that time, the
 *  local file header is parsed and validated, the data offset is updated to
 *  point at the actual file data instead of the header, and symlinks are
 *  followed and optimized. This means we don't seek and read around the
 *  archive until forced to do so, and after the first time we have less
 *  reading and parsing to do, which is very CD-ROM friendly.
 */
typedef enum
{
    ZIP_UNRESOLVED_FILE,     /* regular file; local header not parsed yet.  */
    ZIP_UNRESOLVED_SYMLINK,  /* symlink; target not looked up yet.          */
    ZIP_RESOLVING,           /* resolution in progress (loop detection).    */
    ZIP_RESOLVED,            /* fully resolved and ready for use.           */
    ZIP_BROKEN_FILE,         /* an earlier resolve of this file failed.     */
    ZIP_BROKEN_SYMLINK       /* an earlier resolve of this symlink failed.  */
} ZipResolveType;
59
60
61
/*
* One ZIPentry is kept for each file in an open ZIP archive.
*/
62
typedef struct _ZIPentry
63
{
64
65
66
67
68
69
70
71
72
73
74
char *name; /* Name of file in archive */
struct _ZIPentry *symlink; /* NULL or file we symlink to */
ZipResolveType resolved; /* Have we resolved file/symlink? */
PHYSFS_uint32 offset; /* offset of data in archive */
PHYSFS_uint16 version; /* version made by */
PHYSFS_uint16 version_needed; /* version needed to extract */
PHYSFS_uint16 compression_method; /* compression method */
PHYSFS_uint32 crc; /* crc-32 */
PHYSFS_uint32 compressed_size; /* compressed size */
PHYSFS_uint32 uncompressed_size; /* uncompressed size */
PHYSFS_sint64 last_mod_time; /* last file mod time */
75
76
} ZIPentry;
77
78
79
/*
* One ZIPinfo is kept for each open ZIP archive.
*/
80
81
typedef struct
{
82
83
84
char *archiveName; /* path to ZIP in platform-dependent notation. */
PHYSFS_uint16 entryCount; /* Number of files in ZIP. */
ZIPentry *entries; /* info on all files in ZIP. */
85
86
} ZIPinfo;
87
88
89
/*
* One ZIPfileinfo is kept for each open file in a ZIP archive.
*/
90
91
typedef struct
{
92
93
94
95
96
97
ZIPentry *entry; /* Info on file. */
void *handle; /* physical file handle. */
PHYSFS_uint32 compressed_position; /* offset in compressed data. */
PHYSFS_uint32 uncompressed_position; /* tell() position. */
PHYSFS_uint8 *buffer; /* decompression buffer. */
z_stream stream; /* zlib stream state. */
98
99
100
} ZIPfileinfo;
101
102
103
104
105
106
107
108
109
110
/* Record signatures, as 32-bit values read in little-endian byte order... */
#define ZIP_LOCAL_FILE_SIG          0x04034b50
#define ZIP_CENTRAL_DIR_SIG         0x02014b50
#define ZIP_END_OF_CENTRAL_DIR_SIG  0x06054b50

/* Compression methods... */
#define COMPMETH_NONE 0
/* ...and others... */

/*
 * Unix file-type bits; these get tested against the upper 16 bits of an
 *  entry's external attributes to spot symbolic links.
 */
#define UNIX_FILETYPE_MASK    0170000
#define UNIX_FILETYPE_SYMLINK 0120000
115
116
117
118
119
/*
 * zlib allocation hook: forwards the request to the PHYSFS_Allocator that
 *  was handed to zlib as (opaque), asking it for (items * size) bytes.
 */
static voidpf zlibPhysfsAlloc(voidpf opaque, uInt items, uInt size)
{
    PHYSFS_Allocator *alloc = (PHYSFS_Allocator *) opaque;
    return alloc->Malloc(items * size);
} /* zlibPhysfsAlloc */
/*
 * zlib deallocation hook: hands (address) back to the PHYSFS_Allocator that
 *  was given to zlib as (opaque).
 */
static void zlibPhysfsFree(voidpf opaque, voidpf address)
{
    PHYSFS_Allocator *alloc = (PHYSFS_Allocator *) opaque;
    alloc->Free(address);
} /* zlibPhysfsFree */
/*
 * Put a z_stream into a known state: every field zeroed, with the memory
 *  hooks routed through the PhysicsFS allocator. This does not call any of
 *  zlib's own init functions; the caller still has to do that.
 */
static void initializeZStream(z_stream *pstr)
{
    memset(pstr, '\0', sizeof (*pstr));
    pstr->opaque = &allocator;
    pstr->zalloc = zlibPhysfsAlloc;
    pstr->zfree = zlibPhysfsFree;
} /* initializeZStream */
144
static const char *zlib_error_string(int rc)
145
146
147
{
switch (rc)
{
148
149
case Z_OK: return(NULL); /* not an error. */
case Z_STREAM_END: return(NULL); /* not an error. */
150
#ifndef _WIN32_WCE
151
case Z_ERRNO: return(strerror(errno));
152
#endif
153
154
155
156
157
158
case Z_NEED_DICT: return(ERR_NEED_DICT);
case Z_DATA_ERROR: return(ERR_DATA_ERROR);
case Z_MEM_ERROR: return(ERR_MEMORY_ERROR);
case Z_BUF_ERROR: return(ERR_BUFFER_ERROR);
case Z_VERSION_ERROR: return(ERR_VERSION_ERROR);
default: return(ERR_UNKNOWN_ERROR);
159
160
} /* switch */
161
162
163
return(NULL);
} /* zlib_error_string */
164
165
166
167
168
169
170
171
172
/*
 * Pass-through wrapper for zlib return codes: if (rc) denotes an error, the
 *  matching message is stored as the PhysicsFS error state. The code itself
 *  is always handed back unchanged, so calls can be wrapped inline.
 */
static int zlib_err(int rc)
{
    const char *msg = zlib_error_string(rc);

    if (msg != NULL)
        __PHYSFS_setError(msg);

    return rc;
} /* zlib_err */
/*
 * Read one little-endian unsigned 32-bit value from (in) and store it in
 *  (*val) in native byte order.
 *
 * Returns 1 on success, 0 if the read failed ((*val) is untouched then).
 */
static int readui32(void *in, PHYSFS_uint32 *val)
{
    PHYSFS_uint32 raw;
    const PHYSFS_sint64 got = __PHYSFS_platformRead(in, &raw, sizeof (raw), 1);

    BAIL_IF_MACRO(got != 1, NULL, 0);
    *val = PHYSFS_swapULE32(raw);
    return 1;
} /* readui32 */
/*
 * Read one little-endian unsigned 16-bit value from (in) and store it in
 *  (*val) in native byte order.
 *
 * Returns 1 on success, 0 if the read failed ((*val) is untouched then).
 */
static int readui16(void *in, PHYSFS_uint16 *val)
{
    PHYSFS_uint16 raw;
    const PHYSFS_sint64 got = __PHYSFS_platformRead(in, &raw, sizeof (raw), 1);

    BAIL_IF_MACRO(got != 1, NULL, 0);
    *val = PHYSFS_swapULE16(raw);
    return 1;
} /* readui16 */
201
/*
 * Read up to (objCount) objects of (objSize) bytes each from an open ZIP
 *  entry into (buf).
 *
 * Stored (uncompressed) entries are read straight from the archive. For
 *  compressed entries, compressed data is pulled into the handle's staging
 *  buffer in pieces of at most ZIP_READBUFSIZE bytes and inflated into (buf).
 *
 * If fewer bytes remain than were requested, the request is trimmed to a
 *  whole number of objects and ERR_PAST_EOF is set as the error state.
 *
 * Returns the number of objects read; the handle's logical position is
 *  advanced by that many objects when the count is positive.
 */
static PHYSFS_sint64 ZIP_read(fvoid *opaque, void *buf,
                              PHYSFS_uint32 objSize, PHYSFS_uint32 objCount)
{
    ZIPfileinfo *finfo = (ZIPfileinfo *) opaque;
    ZIPentry *entry = finfo->entry;
    PHYSFS_sint64 retval = 0;
    PHYSFS_sint64 maxread = ((PHYSFS_sint64) objSize) * objCount;
    PHYSFS_sint64 avail = entry->uncompressed_size -
                          finfo->uncompressed_position;

    BAIL_IF_MACRO(maxread == 0, NULL, 0);    /* nothing was asked for. */

    if (avail < maxread)
    {
        /* trim the request down to the whole objects that are left. */
        maxread = avail - (avail % objSize);
        objCount = (PHYSFS_uint32) (maxread / objSize);
        BAIL_IF_MACRO(objCount == 0, ERR_PAST_EOF, 0);
        __PHYSFS_setError(ERR_PAST_EOF);    /* short read: always true here. */
    }

    if (entry->compression_method == COMPMETH_NONE)
        retval = __PHYSFS_platformRead(finfo->handle, buf, objSize, objCount);
    else
    {
        z_stream *zs = &finfo->stream;

        zs->next_out = buf;
        zs->avail_out = objSize * objCount;

        while (retval < maxread)
        {
            PHYSFS_uint32 before = zs->total_out;
            int rc;

            if (zs->avail_in == 0)
            {
                /* staging buffer is drained; refill it from the archive. */
                PHYSFS_sint64 br = entry->compressed_size -
                                   finfo->compressed_position;

                if (br > 0)
                {
                    if (br > ZIP_READBUFSIZE)
                        br = ZIP_READBUFSIZE;

                    br = __PHYSFS_platformRead(finfo->handle, finfo->buffer,
                                               1, (PHYSFS_uint32) br);
                    if (br <= 0)
                        break;

                    finfo->compressed_position += (PHYSFS_uint32) br;
                    zs->next_in = finfo->buffer;
                    zs->avail_in = (PHYSFS_uint32) br;
                }
            }

            rc = zlib_err(inflate(zs, Z_SYNC_FLUSH));
            retval += (zs->total_out - before);

            if (rc != Z_OK)
                break;
        }

        retval /= objSize;    /* bytes produced -> whole objects. */
    }

    if (retval > 0)
        finfo->uncompressed_position += (PHYSFS_uint32) (retval * objSize);

    return retval;
} /* ZIP_read */
275
/*
 * Writing into ZIP entries is not implemented: this always sets
 *  ERR_NOT_SUPPORTED and returns -1. None of the arguments are examined.
 */
static PHYSFS_sint64 ZIP_write(fvoid *opaque, const void *buf,
                               PHYSFS_uint32 objSize, PHYSFS_uint32 objCount)
{
    BAIL_MACRO(ERR_NOT_SUPPORTED, -1);
} /* ZIP_write */
282
/*
 * Report whether the handle's logical position has reached (or passed) the
 *  entry's uncompressed size. Returns non-zero at end of file.
 */
static int ZIP_eof(fvoid *opaque)
{
    const ZIPfileinfo *finfo = (const ZIPfileinfo *) opaque;
    const ZIPentry *entry = finfo->entry;

    return (finfo->uncompressed_position >= entry->uncompressed_size);
} /* ZIP_eof */
289
/*
 * Return the handle's current logical (uncompressed) position.
 */
static PHYSFS_sint64 ZIP_tell(fvoid *opaque)
{
    const ZIPfileinfo *finfo = (const ZIPfileinfo *) opaque;
    return finfo->uncompressed_position;
} /* ZIP_tell */
295
/*
 * Move the logical (uncompressed) position of an open ZIP entry to (offset).
 *
 * Stored entries seek the physical file directly. Compressed entries cannot
 *  be entered at an arbitrary point: seeking backwards restarts decoding
 *  from the beginning of the entry's data, and in either direction the data
 *  between the current position and (offset) is decoded and thrown away.
 *
 * Returns 1 on success, 0 on failure. ERR_PAST_EOF is set if (offset) lies
 *  beyond the uncompressed size of the entry.
 */
static int ZIP_seek(fvoid *opaque, PHYSFS_uint64 offset)
{
    ZIPfileinfo *finfo = (ZIPfileinfo *) opaque;
    ZIPentry *entry = finfo->entry;
    void *in = finfo->handle;

    BAIL_IF_MACRO(offset > entry->uncompressed_size, ERR_PAST_EOF, 0);

    if (entry->compression_method == COMPMETH_NONE)
    {
        PHYSFS_sint64 newpos = offset + entry->offset;
        BAIL_IF_MACRO(!__PHYSFS_platformSeek(in, newpos), NULL, 0);
        finfo->uncompressed_position = (PHYSFS_uint32) offset;
    } /* if */

    else
    {
        /*
         * If seeking backwards, we need to redecode the file
         *  from the start and throw away the compressed bits until we hit
         *  the offset we need. If seeking forward, we still need to
         *  decode, but we don't rewind first.
         */
        if (offset < finfo->uncompressed_position)
        {
            /*
             * Set up a fresh stream on the side first, so the handle's
             *  current state stays sane if anything below fails.
             */
            z_stream str;
            int rc;

            initializeZStream(&str);
            if (zlib_err(inflateInit2(&str, -MAX_WBITS)) != Z_OK)
                return(0);

            if (!__PHYSFS_platformSeek(in, entry->offset))
            {
                inflateEnd(&str);  /* don't leak the stream we just made. */
                return(0);
            } /* if */

            /*
             * zlib keeps a back-pointer from its internal state to the
             *  z_stream it was initialized on, so an initialized stream
             *  must not be moved with memcpy(); inflateCopy() duplicates
             *  it properly, after which the temporary can be released.
             */
            inflateEnd(&finfo->stream);
            rc = inflateCopy(&finfo->stream, &str);
            inflateEnd(&str);
            if (zlib_err(rc) != Z_OK)
                return(0);

            finfo->uncompressed_position = finfo->compressed_position = 0;
        } /* if */

        /* decode and discard until we arrive at the requested offset. */
        while (finfo->uncompressed_position != offset)
        {
            PHYSFS_uint8 buf[512];
            PHYSFS_uint32 maxread;

            maxread = (PHYSFS_uint32) (offset - finfo->uncompressed_position);
            if (maxread > sizeof (buf))
                maxread = sizeof (buf);

            if (ZIP_read(finfo, buf, maxread, 1) != 1)
                return(0);
        } /* while */
    } /* else */

    return(1);
} /* ZIP_seek */
352
/*
 * Return the length of an open ZIP entry, which is its uncompressed size.
 */
static PHYSFS_sint64 ZIP_fileLength(fvoid *opaque)
{
    const ZIPfileinfo *finfo = (const ZIPfileinfo *) opaque;
    const ZIPentry *entry = finfo->entry;

    return entry->uncompressed_size;
} /* ZIP_fileLength */
359
/*
 * Close an open ZIP entry: closes the physical file handle, shuts down the
 *  zlib stream (compressed entries only), and frees the staging buffer and
 *  the ZIPfileinfo itself.
 *
 * Returns 1 on success. If the physical handle fails to close, 0 is
 *  returned and nothing has been freed.
 */
static int ZIP_fileClose(fvoid *opaque)
{
    ZIPfileinfo *finfo = (ZIPfileinfo *) opaque;
    int closed = __PHYSFS_platformClose(finfo->handle);

    BAIL_IF_MACRO(!closed, NULL, 0);

    if (finfo->entry->compression_method != COMPMETH_NONE)
        inflateEnd(&finfo->stream);

    if (finfo->buffer != NULL)
        allocator.Free(finfo->buffer);

    allocator.Free(finfo);
    return 1;
} /* ZIP_fileClose */
375
/*
 * Locate the end-of-central-directory record of the ZIP file open on (in).
 *
 * Returns the file offset of the record's signature, or -1 on any failure
 *  (error state is set; ERR_NOT_AN_ARCHIVE if no signature was found). Note
 *  that offset 0 is a legitimate result: an archive without any entries
 *  consists of nothing but this record. If (len) is not NULL, it receives
 *  the total length of the file on success.
 */
static PHYSFS_sint64 zip_find_end_of_central_dir(void *in, PHYSFS_sint64 *len)
{
    PHYSFS_uint8 buf[256];
    PHYSFS_uint8 extra[4] = { 0, 0, 0, 0 };  /* head of the previous block. */
    PHYSFS_sint32 i = 0;
    PHYSFS_sint64 filelen;
    PHYSFS_sint64 filepos;
    PHYSFS_sint32 chunk;        /* bytes to read from the file this pass. */
    PHYSFS_sint32 scanlen;      /* bytes of (buf) that are valid to scan. */
    PHYSFS_sint32 totalread = 0;
    int found = 0;

    /* every failure reports -1: callers compare against that, not zero. */
    filelen = __PHYSFS_platformFileLength(in);
    BAIL_IF_MACRO(filelen == -1, NULL, -1);
    /* !!! FIXME: unlocalized string */
    BAIL_IF_MACRO(filelen > 0xFFFFFFFF, "ZIP bigger than 2 gigs?!", -1);

    /*
     * Jump to the end of the file and start reading backwards.
     *  The last thing in the file is the zipfile comment, which is variable
     *  length, and the field that specifies its size is before it in the
     *  file (argh!)...this means that we need to scan backwards until we
     *  hit the end-of-central-dir signature. We can then sanity check that
     *  the comment was as big as it should be to make sure we're in the
     *  right place. The comment length field is 16 bits, so we can stop
     *  searching for that signature after a little more than 64k at most,
     *  and call it a corrupted zipfile.
     */

    if (filelen > (PHYSFS_sint64) sizeof (buf))
        chunk = (PHYSFS_sint32) sizeof (buf);
    else
        chunk = (PHYSFS_sint32) filelen;

    filepos = filelen - chunk;

    while ((totalread < filelen) && (totalread < 65557))
    {
        BAIL_IF_MACRO(!__PHYSFS_platformSeek(in, filepos), NULL, -1);

        if (__PHYSFS_platformRead(in, buf, chunk, 1) != 1)
            return(-1);

        totalread += chunk;
        scanlen = chunk;

        /*
         * Make sure we catch a signature between buffers: on every pass but
         *  the first, the first four bytes of the block read previously
         *  (which directly follows this one in the file) are appended.
         *  Those passes read at most sizeof (buf) - 4 bytes, so this fits.
         */
        if ((filepos + chunk) < filelen)
        {
            memcpy(&buf[chunk], extra, sizeof (extra));
            scanlen += (PHYSFS_sint32) sizeof (extra);
        } /* if */

        memcpy(extra, buf, sizeof (extra));

        /* offset zero counts, too: the file may start with the record. */
        for (i = scanlen - 4; i >= 0; i--)
        {
            if ((buf[i + 0] == 0x50) &&
                (buf[i + 1] == 0x4B) &&
                (buf[i + 2] == 0x05) &&
                (buf[i + 3] == 0x06) )
            {
                found = 1;  /* that's the signature! */
                break;
            } /* if */
        } /* for */

        if (found)
            break;

        /* step back one block, but never past the start of the file. */
        chunk = (PHYSFS_sint32) sizeof (buf) - 4;
        if (filepos < chunk)
            chunk = (PHYSFS_sint32) filepos;
        filepos -= chunk;
    } /* while */

    BAIL_IF_MACRO(!found, ERR_NOT_AN_ARCHIVE, -1);

    if (len != NULL)
        *len = filelen;

    return(filepos + i);
} /* zip_find_end_of_central_dir */
459
460
461
462
static int ZIP_isArchive(const char *filename, int forWriting)
{
463
PHYSFS_uint32 sig;
464
int retval = 0;
465
void *in;
466
467
468
469
470
471
472
473
in = __PHYSFS_platformOpenRead(filename);
BAIL_IF_MACRO(in == NULL, NULL, 0);
/*
* The first thing in a zip file might be the signature of the
* first local file record, so it makes for a quick determination.
*/
474
if (readui32(in, &sig))
475
{
476
477
478
479
480
481
482
483
484
485
retval = (sig == ZIP_LOCAL_FILE_SIG);
if (!retval)
{
/*
* No sig...might be a ZIP with data at the start
* (a self-extracting executable, etc), so we'll have to do
* it the hard way...
*/
retval = (zip_find_end_of_central_dir(in, NULL) != -1);
} /* if */
486
487
} /* if */
488
__PHYSFS_platformClose(in);
489
return(retval);
490
491
492
} /* ZIP_isArchive */
493
/*
 * Free the names of the first (max) records in (entries), then the array
 *  itself.
 */
static void zip_free_entries(ZIPentry *entries, PHYSFS_uint32 max)
{
    PHYSFS_uint32 idx;

    for (idx = 0; idx < max; idx++)
    {
        char *name = entries[idx].name;
        if (name != NULL)
            allocator.Free(name);
    }

    allocator.Free(entries);
} /* zip_free_entries */
507
508
509
510
511
512
/*
 * This will find the ZIPentry associated with a path in platform-independent
 *  notation. Directories don't have ZIPentries associated with them, but
 *  (*isDir) will be set to non-zero if a dir was hit.
 *
 * Returns the entry whose name is exactly (path). Otherwise returns NULL:
 *  if (isDir) is not NULL and some entry's name starts with (path) followed
 *  by '/', (*isDir) is set to 1 and the error state is left alone; in every
 *  other case (*isDir) (if given) is zero and ERR_NO_SUCH_FILE is set.
 *
 * Both lookups are binary searches, which relies on the entry array being
 *  sorted by name in strcmp() order (as zip_entry_cmp does).
 */
static ZIPentry *zip_find_entry(ZIPinfo *info, const char *path, int *isDir)
{
    ZIPentry *a = info->entries;
    const PHYSFS_sint32 pathlen = (PHYSFS_sint32) strlen(path);
    const PHYSFS_sint32 last = (PHYSFS_sint32) (info->entryCount - 1);
    PHYSFS_sint32 lo;
    PHYSFS_sint32 hi;
    PHYSFS_sint32 middle;
    int rc;

    if (isDir != NULL)
        *isDir = 0;

    /* first pass: look for an entry with exactly this name. */
    lo = 0;
    hi = last;
    while (lo <= hi)
    {
        middle = lo + ((hi - lo) / 2);
        rc = strcmp(path, a[middle].name);
        if (rc > 0)
            lo = middle + 1;
        else if (rc < 0)
            hi = middle - 1;
        else
            return(&a[middle]);
    } /* while */

    /*
     * Second pass: look for any entry living below (path) as a directory,
     *  that is, one named (path) + '/' + something. Entries that merely
     *  share the prefix ("foo.txt" vs "foo") can sort on either side of
     *  those, so the character following the prefix picks the direction.
     */
    if (isDir != NULL)
    {
        lo = 0;
        hi = last;
        while (lo <= hi)
        {
            const char *thispath;

            middle = lo + ((hi - lo) / 2);
            thispath = a[middle].name;
            rc = strncmp(path, thispath, pathlen);
            if (rc == 0)
            {
                /* strcmp() orders by unsigned char value; so do we. */
                const unsigned char next = (unsigned char) thispath[pathlen];
                if (next == '/')
                {
                    *isDir = 1;
                    return(NULL);
                } /* if */

                rc = (next < '/') ? 1 : -1;
            } /* if */

            if (rc > 0)
                lo = middle + 1;
            else
                hi = middle - 1;
        } /* while */
    } /* if */

    BAIL_MACRO(ERR_NO_SUCH_FILE, NULL);
} /* zip_find_entry */
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
/*
 * Convert paths from old, buggy DOS zippers: if the host byte of the
 *  entry's "version made by" field is 0 (FS_FAT_), every backslash in
 *  (path) is replaced, in place, with a forward slash. Paths written by any
 *  other host type are left untouched.
 */
static void zip_convert_dos_path(ZIPentry *entry, char *path)
{
    const PHYSFS_uint8 hosttype = (PHYSFS_uint8) ((entry->version >> 8) & 0xFF);
    char *ch;

    if (hosttype != 0)  /* not FS_FAT_ */
        return;

    for (ch = path; *ch != '\0'; ch++)
    {
        if (*ch == '\\')
            *ch = '/';
    }
} /* zip_convert_dos_path */
571
572
573
/*
 * Normalize a '/'-separated path in place by resolving its "." and ".."
 *  components:
 *
 *   - "."  components are dropped.
 *   - ".." components drop the component before them, if there is one; a
 *     ".." with nothing left to back out of is simply dropped.
 *   - all other components (including names that merely start with a dot,
 *     and empty ones produced by doubled, leading or trailing slashes) are
 *     kept as they are.
 *
 * The result is never longer than the input, so it is built on top of the
 *  original string and always ends up null-terminated.
 */
static void zip_expand_symlink_path(char *path)
{
    char *src = path;   /* start of the component being looked at.     */
    char *dst = path;   /* end of the normalized output written so far. */
    int kept = 0;       /* components currently held in the output.    */

    while (1)
    {
        char *sep = strchr(src, '/');
        const size_t len = (sep != NULL) ? (size_t) (sep - src) : strlen(src);

        if ((len == 1) && (src[0] == '.'))
        {
            /* current dir: ditch it. */
        } /* if */

        else if ((len == 2) && (src[0] == '.') && (src[1] == '.'))
        {
            /* parent dir: move back one, if possible. */
            if (kept > 0)
            {
                while ((dst != path) && (*(dst - 1) != '/'))
                    dst--;

                kept--;
                if (kept > 0)
                    dst--;  /* the separator in front of it goes, too. */
            } /* if */
        } /* else if */

        else
        {
            /*
             * Keep this one. The output always trails the input by at
             *  least one byte once something was kept, so neither write
             *  below can touch input that hasn't been examined yet.
             */
            if (kept > 0)
                *(dst++) = '/';

            memmove(dst, src, len);
            dst += len;
            kept++;
        } /* else */

        if (sep == NULL)
            break;

        src = sep + 1;
    } /* while */

    *dst = '\0';
} /* zip_expand_symlink_path */
629
630
631
/* (forward reference: zip_follow_symlink and zip_resolve call each other.) */
static int zip_resolve(void *in, ZIPinfo *info, ZIPentry *entry);
632
633
/*
634
635
636
637
638
* Look for the entry named by (path). If it exists, resolve it, and return
* a pointer to that entry. If it's another symlink, keep resolving until you
* hit a real file and then return a pointer to the final non-symlink entry.
* If there's a problem, return NULL. (path) is always free()'d by this
* function.
639
*/
640
static ZIPentry *zip_follow_symlink(void *in, ZIPinfo *info, char *path)
641
{
642
643
644
ZIPentry *entry;
zip_expand_symlink_path(path);
645
entry = zip_find_entry(info, path, NULL);
646
647
648
649
650
651
652
653
654
655
656
if (entry != NULL)
{
if (!zip_resolve(in, info, entry)) /* recursive! */
entry = NULL;
else
{
if (entry->symlink != NULL)
entry = entry->symlink;
} /* else */
} /* if */
657
allocator.Free(path);
658
659
return(entry);
} /* zip_follow_symlink */
660
661
662
/*
 * Resolve a symlink entry: read the link's target path out of the entry's
 *  file data (inflating it if the data is compressed), then follow that
 *  path and store the entry it leads to in (entry->symlink).
 *
 * The local file header of the symlink must already have been parsed, so
 *  that (entry->offset) points at the file data.
 *
 * Returns non-zero if (entry->symlink) ended up non-NULL, zero otherwise.
 */
static int zip_resolve_symlink(void *in, ZIPinfo *info, ZIPentry *entry)
{
    const PHYSFS_uint32 size = entry->uncompressed_size;
    char *path;
    int ok = 0;

    BAIL_IF_MACRO(!__PHYSFS_platformSeek(in, entry->offset), NULL, 0);

    path = (char *) allocator.Malloc(size + 1);  /* +1 for the terminator. */
    BAIL_IF_MACRO(path == NULL, ERR_OUT_OF_MEMORY, 0);

    if (entry->compression_method == COMPMETH_NONE)
        ok = (__PHYSFS_platformRead(in, path, size, 1) == 1);

    else  /* symlink target path is compressed... */
    {
        const PHYSFS_uint32 compsize = entry->compressed_size;
        PHYSFS_uint8 *compressed = (PHYSFS_uint8 *) allocator.Malloc(compsize);

        if (compressed != NULL)
        {
            if (__PHYSFS_platformRead(in, compressed, compsize, 1) == 1)
            {
                z_stream stream;

                initializeZStream(&stream);
                stream.next_in = compressed;
                stream.avail_in = compsize;
                stream.next_out = (unsigned char *) path;
                stream.avail_out = size;

                if (zlib_err(inflateInit2(&stream, -MAX_WBITS)) == Z_OK)
                {
                    const int zrc = zlib_err(inflate(&stream, Z_FINISH));
                    inflateEnd(&stream);

                    /* both are acceptable outcomes... */
                    ok = ((zrc == Z_OK) || (zrc == Z_STREAM_END));
                }
            }

            allocator.Free(compressed);
        }
    }

    if (ok)
    {
        path[entry->uncompressed_size] = '\0';  /* null-terminate it. */
        zip_convert_dos_path(entry, path);
        /* zip_follow_symlink() takes over (and frees) the path. */
        entry->symlink = zip_follow_symlink(in, info, path);
    }
    else
        allocator.Free(path);

    return (entry->symlink != NULL);
} /* zip_resolve_symlink */
/*
 * Parse the local file header of an entry, and update entry->offset.
 *
 * The header is read from (entry->offset) and checked against what is
 *  already stored in (entry); any mismatch sets ERR_CORRUPTED. On success,
 *  (entry->offset) is advanced past the header so that it points at the
 *  entry's data.
 *
 * Returns 1 on success, 0 on failure.
 */
static int zip_parse_local(void *in, ZIPentry *entry)
{
    PHYSFS_uint32 val32;
    PHYSFS_uint16 val16;
    PHYSFS_uint16 fnamelen;
    PHYSFS_uint16 extralen;

    BAIL_IF_MACRO(!__PHYSFS_platformSeek(in, entry->offset), NULL, 0);

    /* signature. */
    BAIL_IF_MACRO(!readui32(in, &val32), NULL, 0);
    BAIL_IF_MACRO(val32 != ZIP_LOCAL_FILE_SIG, ERR_CORRUPTED, 0);

    /* version needed to extract. */
    BAIL_IF_MACRO(!readui16(in, &val16), NULL, 0);
    BAIL_IF_MACRO(val16 != entry->version_needed, ERR_CORRUPTED, 0);

    /* general bits: read, not checked. */
    BAIL_IF_MACRO(!readui16(in, &val16), NULL, 0);

    /* compression method. */
    BAIL_IF_MACRO(!readui16(in, &val16), NULL, 0);
    BAIL_IF_MACRO(val16 != entry->compression_method, ERR_CORRUPTED, 0);

    /* date/time: read, not checked. */
    BAIL_IF_MACRO(!readui32(in, &val32), NULL, 0);

    /*
     * crc and (un)compressed_size are always zero if this is a "JAR"
     *  archive created with Sun's Java tools, apparently. We only
     *  consider this archive corrupted if those entries don't match and
     *  aren't zero. That seems to work well.
     */
    BAIL_IF_MACRO(!readui32(in, &val32), NULL, 0);
    BAIL_IF_MACRO(val32 && (val32 != entry->crc), ERR_CORRUPTED, 0);

    BAIL_IF_MACRO(!readui32(in, &val32), NULL, 0);
    BAIL_IF_MACRO(val32 && (val32 != entry->compressed_size), ERR_CORRUPTED, 0);

    BAIL_IF_MACRO(!readui32(in, &val32), NULL, 0);
    BAIL_IF_MACRO(val32 && (val32 != entry->uncompressed_size),ERR_CORRUPTED,0);

    /* lengths of the variable-sized parts that follow. */
    BAIL_IF_MACRO(!readui16(in, &fnamelen), NULL, 0);
    BAIL_IF_MACRO(!readui16(in, &extralen), NULL, 0);

    /* 30 == size of the fixed-length fields that were just read. */
    entry->offset += fnamelen + extralen + 30;
    return 1;
} /* zip_parse_local */
/*
 * Resolve (entry) if that hasn't happened yet: parse its local file header
 *  and, for symlinks, find the file it points to. The outcome is recorded
 *  in (entry->resolved), so the work (or the failure) isn't repeated.
 *
 * The offset is fixed up to point to the actual data on the first open
 *  since we don't want to seek across the whole file on archive open (can
 *  be SLOW on large, CD-stored files), but the local file header needs to
 *  be checked...not just for corruption, but since it stores offset info
 *  the central directory does not.
 *
 * Returns non-zero on success (or if already resolved), zero on failure:
 *  ERR_CORRUPTED for entries that failed before, ERR_SYMLINK_LOOP if the
 *  entry is in the middle of being resolved.
 */
static int zip_resolve(void *in, ZIPinfo *info, ZIPentry *entry)
{
    const ZipResolveType initial = entry->resolved;
    int retval;

    /* Don't bother if we've failed to resolve this entry before. */
    BAIL_IF_MACRO(initial == ZIP_BROKEN_FILE, ERR_CORRUPTED, 0);
    BAIL_IF_MACRO(initial == ZIP_BROKEN_SYMLINK, ERR_CORRUPTED, 0);

    /* uhoh...infinite symlink loop! */
    BAIL_IF_MACRO(initial == ZIP_RESOLVING, ERR_SYMLINK_LOOP, 0);

    if (initial == ZIP_RESOLVED)
        return 1;  /* nothing left to do. */

    entry->resolved = ZIP_RESOLVING;
    retval = zip_parse_local(in, entry);

    /*
     * If it's a symlink, find the original file. This will cause
     *  resolution of other entries (other symlinks and, eventually,
     *  the real file) if all goes well.
     */
    if (retval && (initial == ZIP_UNRESOLVED_SYMLINK))
        retval = zip_resolve_symlink(in, info, entry);

    if (initial == ZIP_UNRESOLVED_SYMLINK)
        entry->resolved = ((retval) ? ZIP_RESOLVED : ZIP_BROKEN_SYMLINK);
    else if (initial == ZIP_UNRESOLVED_FILE)
        entry->resolved = ((retval) ? ZIP_RESOLVED : ZIP_BROKEN_FILE);

    return retval;
} /* zip_resolve */
805
806
807
/*
 * Tell whether the host system encoded in bits 8-15 of a "version made by"
 *  value is one that can put symlinks into an archive.
 *
 * Returns 0 for the host types listed below, 1 for everything else.
 */
static int zip_version_does_symlinks(PHYSFS_uint32 version)
{
    const PHYSFS_uint8 hosttype = (PHYSFS_uint8) ((version >> 8) & 0xFF);

    switch (hosttype)
    {
        /*
         * These are the platforms that can NOT build an archive with
         *  symlinks, according to the Info-ZIP project.
         */
        case 0:   /* FS_FAT_  */
        case 1:   /* AMIGA_   */
        case 2:   /* VMS_     */
        case 4:   /* VM_CSM_  */
        case 6:   /* FS_HPFS_ */
        case 11:  /* FS_NTFS_ */
        case 13:  /* ACORN_   */
        case 14:  /* FS_VFAT_ */
        case 15:  /* MVS_     */
        case 18:  /* THEOS_   */
            return 0;

        default:  /* assume the rest to be unix-like. */
            break;
    }

    return 1;
} /* zip_version_does_symlinks */
/*
 * Tell whether (entry) is a symlink: it either has a link target attached,
 *  or its state is one of the two symlink-only states (not yet resolved, or
 *  broken). Returns 1 if so, 0 if not.
 */
static int zip_entry_is_symlink(ZIPentry *entry)
{
    if (entry->symlink != NULL)
        return 1;

    return ((entry->resolved == ZIP_UNRESOLVED_SYMLINK) ||
            (entry->resolved == ZIP_BROKEN_SYMLINK));
} /* zip_entry_is_symlink */
845
846
847
/*
 * Decide from central directory data whether (entry) is a symlink. All of
 *  these must hold: the archive was made on a host that does symlinks, the
 *  entry has data in it, and the file type bits in the upper 16 bits of
 *  (extern_attr) say "symbolic link".
 *
 * Returns 1 if so, 0 if not.
 */
static int zip_has_symlink_attr(ZIPentry *entry, PHYSFS_uint32 extern_attr)
{
    const PHYSFS_uint16 xattr = ((extern_attr >> 16) & 0xFFFF);

    if (!zip_version_does_symlinks(entry->version))
        return 0;

    if (entry->uncompressed_size == 0)
        return 0;

    return ((xattr & UNIX_FILETYPE_MASK) == UNIX_FILETYPE_SYMLINK);
} /* zip_has_symlink_attr */
857
858
859
/*
 * Convert a packed DOS timestamp (date in the upper 16 bits, time of day in
 *  the lower 16) to the value mktime() produces for it; daylight savings is
 *  left for mktime() to work out.
 *
 * On Windows CE builds this always returns -1.
 */
static PHYSFS_sint64 zip_dos_time_to_physfs_time(PHYSFS_uint32 dostime)
{
#ifdef _WIN32_WCE
    /* We have no struct tm and no mktime right now.
       FIXME: This should probably be fixed at some point.
    */
    return -1;
#else
    const PHYSFS_uint32 datebits = (PHYSFS_uint32) ((dostime >> 16) & 0xFFFF);
    const PHYSFS_uint32 timebits = dostime & 0xFFFF;
    struct tm unixtime;

    memset(&unixtime, '\0', sizeof (unixtime));

    /* date: years count from 1980 (tm_year from 1900), months from 1. */
    unixtime.tm_year = ((datebits >> 9) & 0x7F) + 80;
    unixtime.tm_mon  = ((datebits >> 5) & 0x0F) - 1;
    unixtime.tm_mday = ((datebits     ) & 0x1F);

    /* time of day: seconds are stored halved. */
    unixtime.tm_hour = ((timebits >> 11) & 0x1F);
    unixtime.tm_min  = ((timebits >>  5) & 0x3F);
    unixtime.tm_sec  = ((timebits <<  1) & 0x3E);

    /* let mktime calculate daylight savings time. */
    unixtime.tm_isdst = -1;

    return (PHYSFS_sint64) mktime(&unixtime);
#endif
} /* zip_dos_time_to_physfs_time */
890
891
892
/*
 * Read one central directory record from the current position of (in) and
 *  fill in (entry) from it. (ofs_fixup) is added to the data offset stored
 *  in the record. On success, (in) is left at the start of the next record.
 *
 * Returns 1 on success, 0 on failure. After a failure, (entry->name) does
 *  not point to valid memory and must not be freed.
 */
static int zip_load_entry(void *in, ZIPentry *entry, PHYSFS_uint32 ofs_fixup)
{
    PHYSFS_uint16 fnamelen, extralen, commentlen;
    PHYSFS_uint32 external_attr;
    PHYSFS_uint16 skipped16;
    PHYSFS_uint32 val32;
    PHYSFS_sint64 pos;

    /* sanity check with central directory signature... */
    BAIL_IF_MACRO(!readui32(in, &val32), NULL, 0);
    BAIL_IF_MACRO(val32 != ZIP_CENTRAL_DIR_SIG, ERR_CORRUPTED, 0);

    /* Get the pertinent parts of the record... */
    BAIL_IF_MACRO(!readui16(in, &entry->version), NULL, 0);
    BAIL_IF_MACRO(!readui16(in, &entry->version_needed), NULL, 0);
    BAIL_IF_MACRO(!readui16(in, &skipped16), NULL, 0);  /* general bits */
    BAIL_IF_MACRO(!readui16(in, &entry->compression_method), NULL, 0);

    BAIL_IF_MACRO(!readui32(in, &val32), NULL, 0);      /* DOS date/time */
    entry->last_mod_time = zip_dos_time_to_physfs_time(val32);

    BAIL_IF_MACRO(!readui32(in, &entry->crc), NULL, 0);
    BAIL_IF_MACRO(!readui32(in, &entry->compressed_size), NULL, 0);
    BAIL_IF_MACRO(!readui32(in, &entry->uncompressed_size), NULL, 0);
    BAIL_IF_MACRO(!readui16(in, &fnamelen), NULL, 0);
    BAIL_IF_MACRO(!readui16(in, &extralen), NULL, 0);
    BAIL_IF_MACRO(!readui16(in, &commentlen), NULL, 0);
    BAIL_IF_MACRO(!readui16(in, &skipped16), NULL, 0);  /* disk number start */
    BAIL_IF_MACRO(!readui16(in, &skipped16), NULL, 0);  /* internal file attribs */
    BAIL_IF_MACRO(!readui32(in, &external_attr), NULL, 0);
    BAIL_IF_MACRO(!readui32(in, &entry->offset), NULL, 0);
    entry->offset += ofs_fixup;

    entry->symlink = NULL;  /* will be resolved later, if necessary. */
    if (zip_has_symlink_attr(entry, external_attr))
        entry->resolved = ZIP_UNRESOLVED_SYMLINK;
    else
        entry->resolved = ZIP_UNRESOLVED_FILE;

    /* the filename comes right after the fixed-size part of the record. */
    entry->name = (char *) allocator.Malloc(fnamelen + 1);
    BAIL_IF_MACRO(entry->name == NULL, ERR_OUT_OF_MEMORY, 0);
    if (__PHYSFS_platformRead(in, entry->name, fnamelen, 1) != 1)
        goto zip_load_entry_failed;

    entry->name[fnamelen] = '\0';  /* null-terminate the filename. */
    zip_convert_dos_path(entry, entry->name);

    pos = __PHYSFS_platformTell(in);
    if (pos == -1)
        goto zip_load_entry_failed;

    /* seek to the start of the next entry in the central directory... */
    if (!__PHYSFS_platformSeek(in, pos + extralen + commentlen))
        goto zip_load_entry_failed;

    return 1;  /* success. */

zip_load_entry_failed:
    allocator.Free(entry->name);
    return 0;  /* failure. */
} /* zip_load_entry */
951
/*
 * Sort callback: compare elements (one) and (two) of the ZIPentry array
 *  (_a) by name, with strcmp() semantics.
 */
static int zip_entry_cmp(void *_a, PHYSFS_uint32 one, PHYSFS_uint32 two)
{
    const ZIPentry *entries = (const ZIPentry *) _a;
    const char *lhs = entries[one].name;
    const char *rhs = entries[two].name;

    return strcmp(lhs, rhs);
} /* zip_entry_cmp */
956
957
958
/*
 * Sort callback: exchange elements (one) and (two) of the ZIPentry array
 *  (_a). Whole records are swapped, by value.
 */
static void zip_entry_swap(void *_a, PHYSFS_uint32 one, PHYSFS_uint32 two)
{
    ZIPentry *entries = (ZIPentry *) _a;
    const ZIPentry tmp = entries[one];

    entries[one] = entries[two];
    entries[two] = tmp;
} /* zip_entry_swap */
967
968
969
/*
 * Load the whole central directory: seek (in) to (central_ofs), allocate
 *  (info->entries) with room for (info->entryCount) records, read every
 *  record (passing (data_ofs) on as the offset fixup), and finally sort
 *  the array by entry name.
 *
 * Returns 1 on success, 0 on failure. If a record fails to load, the
 *  records loaded so far and the array itself are freed again;
 *  (info->entries) is not reset in that case.
 */
static int zip_load_entries(void *in, ZIPinfo *info,
                            PHYSFS_uint32 data_ofs, PHYSFS_uint32 central_ofs)
{
    const PHYSFS_uint32 count = info->entryCount;
    PHYSFS_uint32 loaded;

    BAIL_IF_MACRO(!__PHYSFS_platformSeek(in, central_ofs), NULL, 0);

    info->entries = (ZIPentry *) allocator.Malloc(sizeof (ZIPentry) * count);
    BAIL_IF_MACRO(info->entries == NULL, ERR_OUT_OF_MEMORY, 0);

    for (loaded = 0; loaded < count; loaded++)
    {
        if (zip_load_entry(in, &info->entries[loaded], data_ofs))
            continue;

        /* only the records before this one have names to free. */
        zip_free_entries(info->entries, loaded);
        return 0;
    }

    __PHYSFS_sort(info->entries, count, zip_entry_cmp, zip_entry_swap);
    return 1;
} /* zip_load_entries */
992
993
994
static int zip_parse_end_of_central_dir(void *in, ZIPinfo *info,
995
996
PHYSFS_uint32 *data_start,
PHYSFS_uint32 *central_dir_ofs)
997
{
998
999
1000
PHYSFS_uint32 ui32;
PHYSFS_uint16 ui16;
PHYSFS_sint64 len;