Kaizen/external/unarr/zip/parse-zip.c

327 lines
11 KiB
C

/* Copyright 2015 the unarr project authors (see AUTHORS file).
License: LGPLv3 */
#include "zip.h"
#if defined(_MSC_VER) && !defined(inline)
#define inline __inline
#endif
static inline uint16_t uint16le(unsigned char *data) { return data[0] | data[1] << 8; }
static inline uint32_t uint32le(unsigned char *data) { return data[0] | data[1] << 8 | data[2] << 16 | (uint32_t) data[3] << 24; }
static inline uint64_t uint64le(unsigned char *data) { return (uint64_t)uint32le(data) | (uint64_t)uint32le(data + 4) << 32; }
bool zip_seek_to_compressed_data(ar_archive_zip *zip)
{
struct zip_entry entry;
if (!ar_seek(zip->super.stream, zip->entry.offset, SEEK_SET))
return false;
if (!zip_parse_local_file_entry(zip, &entry))
return false;
if (zip->entry.method != entry.method) {
warn("Compression methods don't match: %d != %d", zip->entry.method, entry.method);
if (!zip->entry.method)
zip->entry.method = entry.method;
}
if (zip->entry.dosdate != entry.dosdate) {
warn("Timestamps don't match");
if (!zip->entry.dosdate) {
zip->entry.dosdate = entry.dosdate;
zip->super.entry_filetime = ar_conv_dosdate_to_filetime(zip->entry.dosdate);
}
}
return ar_seek(zip->super.stream, zip->entry.offset + ZIP_LOCAL_ENTRY_FIXED_SIZE + entry.namelen + entry.extralen, SEEK_SET);
}
static bool zip_parse_extra_fields(ar_archive_zip *zip, struct zip_entry *entry)
{
uint8_t *extra;
if (!entry->extralen)
return true;
/* read ZIP64 values where needed */
if (!ar_skip(zip->super.stream, entry->namelen))
return false;
extra = malloc(entry->extralen);
if (!extra || ar_read(zip->super.stream, extra, entry->extralen) != entry->extralen) {
free(extra);
return false;
}
for (uint32_t idx = 0; idx + 4 < entry->extralen; idx += 4 + uint16le(&extra[idx + 2])) {
if (uint16le(&extra[idx]) == 0x0001) {
uint16_t size = uint16le(&extra[idx + 2]);
if (size + idx + 1 > entry->extralen) {
free(extra);
return false;
}
uint16_t offset = 0;
if (entry->uncompressed == UINT32_MAX && offset + 8 <= size) {
entry->uncompressed = uint64le(&extra[idx + 4 + offset]);
offset += 8;
}
if (entry->datasize == UINT32_MAX && offset + 8 <= size) {
entry->datasize = uint64le(&extra[idx + 4 + offset]);
offset += 8;
}
if (entry->header_offset == UINT32_MAX && offset + 8 <= size) {
entry->header_offset = (off64_t)uint64le(&extra[idx + 4 + offset]);
offset += 8;
}
if (entry->disk == UINT16_MAX && offset + 4 <= size) {
entry->disk = uint32le(&extra[idx + 4 + offset]);
offset += 4;
}
break;
}
}
free(extra);
return true;
}
bool zip_parse_local_file_entry(ar_archive_zip *zip, struct zip_entry *entry)
{
uint8_t data[ZIP_LOCAL_ENTRY_FIXED_SIZE];
if (ar_read(zip->super.stream, data, sizeof(data)) != sizeof(data))
return false;
memset(entry, 0, sizeof(*entry));
entry->signature = uint32le(data + 0);
entry->version = uint16le(data + 4);
entry->flags = uint16le(data + 6);
entry->method = uint16le(data + 8);
entry->dosdate = uint32le(data + 10);
entry->crc = uint32le(data + 14);
entry->datasize = uint32le(data + 18);
entry->uncompressed = uint32le(data + 22);
entry->namelen = uint16le(data + 26);
entry->extralen = uint16le(data + 28);
if (entry->signature != SIG_LOCAL_FILE_HEADER)
return false;
return zip_parse_extra_fields(zip, entry);
}
off64_t zip_find_next_local_file_entry(ar_stream *stream, off64_t offset)
{
uint8_t data[512];
int count, i;
if (!ar_seek(stream, offset, SEEK_SET))
return -1;
count = (int)ar_read(stream, data, sizeof(data));
while (count >= ZIP_LOCAL_ENTRY_FIXED_SIZE) {
for (i = 0; i < count - 4; i++) {
if (uint32le(data + i) == SIG_LOCAL_FILE_HEADER)
return offset + i;
}
memmove(data, data + count - 4, 4);
offset += count - 4;
count = (int)ar_read(stream, data + 4, sizeof(data) - 4) + 4;
}
return -1;
}
bool zip_parse_directory_entry(ar_archive_zip *zip, struct zip_entry *entry)
{
uint8_t data[ZIP_DIR_ENTRY_FIXED_SIZE];
if (ar_read(zip->super.stream, data, sizeof(data)) != sizeof(data))
return false;
entry->signature = uint32le(data + 0);
entry->version = uint16le(data + 4);
entry->min_version = uint16le(data + 6);
entry->flags = uint16le(data + 8);
entry->method = uint16le(data + 10);
entry->dosdate = uint32le(data + 12);
entry->crc = uint32le(data + 16);
entry->datasize = uint32le(data + 20);
entry->uncompressed = uint32le(data + 24);
entry->namelen = uint16le(data + 28);
entry->extralen = uint16le(data + 30);
entry->commentlen = uint16le(data + 32);
entry->disk = uint16le(data + 34);
entry->attr_internal = uint16le(data + 36);
entry->attr_external = uint32le(data + 38);
entry->header_offset = uint32le(data + 42);
if (entry->signature != SIG_CENTRAL_DIRECTORY)
return false;
return zip_parse_extra_fields(zip, entry);
}
off64_t zip_find_end_of_last_directory_entry(ar_stream *stream, struct zip_eocd64 *eocd)
{
uint8_t data[ZIP_DIR_ENTRY_FIXED_SIZE];
uint64_t i;
if (!ar_seek(stream, eocd->dir_offset, SEEK_SET))
return -1;
for (i = 0; i < eocd->numentries; i++) {
if (ar_read(stream, data, sizeof(data)) != sizeof(data))
return -1;
if (uint32le(data + 0) != SIG_CENTRAL_DIRECTORY)
return -1;
if (!ar_skip(stream, uint16le(data + 28) + uint16le(data + 30) + uint16le(data + 32)))
return -1;
}
return ar_tell(stream);
}
bool zip_parse_end_of_central_directory(ar_stream *stream, struct zip_eocd64 *eocd)
{
uint8_t data[56];
if (ar_read(stream, data, ZIP_END_OF_CENTRAL_DIR_SIZE) != ZIP_END_OF_CENTRAL_DIR_SIZE)
return false;
eocd->signature = uint32le(data + 0);
eocd->diskno = uint16le(data + 4);
eocd->diskno_dir = uint16le(data + 6);
eocd->numentries_disk = uint16le(data + 8);
eocd->numentries = uint16le(data + 10);
eocd->dir_size = uint32le(data + 12);
eocd->dir_offset = uint32le(data + 16);
eocd->commentlen = uint16le(data + 20);
if (eocd->signature != SIG_END_OF_CENTRAL_DIRECTORY)
return false;
/* try to locate the ZIP64 end of central directory */
if (!ar_skip(stream, -42))
return eocd->dir_size < 20;
if (ar_read(stream, data, 20) != 20)
return false;
if (uint32le(data + 0) != SIG_END_OF_CENTRAL_DIRECTORY_64_LOCATOR)
return true;
if ((eocd->diskno != UINT16_MAX && uint32le(data + 4) != eocd->diskno) || uint32le(data + 16) != 1) {
warn("Archive spanning isn't supported");
return false;
}
if (!ar_seek(stream, (off64_t)uint64le(data + 8), SEEK_SET))
return false;
if (ar_read(stream, data, 56) != 56)
return false;
/* use data from ZIP64 end of central directory (when necessary) */
eocd->signature = uint32le(data + 0);
eocd->version = uint16le(data + 12);
eocd->min_version = uint16le(data + 14);
if (eocd->diskno == UINT16_MAX)
eocd->diskno = uint32le(data + 16);
if (eocd->diskno_dir == UINT16_MAX)
eocd->diskno_dir = uint32le(data + 20);
if (eocd->numentries_disk == UINT16_MAX)
eocd->numentries_disk = uint64le(data + 24);
if (eocd->numentries == UINT16_MAX)
eocd->numentries = uint64le(data + 32);
if (eocd->dir_size == UINT32_MAX)
eocd->dir_size = uint64le(data + 40);
if (eocd->dir_offset == UINT32_MAX)
eocd->dir_offset = (off64_t)uint64le(data + 48);
if (eocd->signature != SIG_END_OF_CENTRAL_DIRECTORY_64)
return false;
if (eocd->diskno != eocd->diskno_dir || eocd->numentries != eocd->numentries_disk) {
warn("Archive spanning isn't supported");
return false;
}
if (uint64le(data + 4) > 44)
log("ZIP64 extensible data sector present @" PRIi64, ar_tell(stream));
return true;
}
off64_t zip_find_end_of_central_directory(ar_stream *stream)
{
uint8_t data[512];
off64_t filesize;
int fromend = 0;
int count, i;
if (!ar_seek(stream, 0, SEEK_END))
return -1;
filesize = ar_tell(stream);
while (fromend < UINT16_MAX + ZIP_END_OF_CENTRAL_DIR_SIZE && fromend < filesize) {
count = (filesize - fromend < (int)sizeof(data) ? (int)(filesize - fromend) : (int)sizeof(data));
fromend += count;
if (count < ZIP_END_OF_CENTRAL_DIR_SIZE)
return -1;
if (!ar_seek(stream, -fromend, SEEK_END))
return -1;
if (ar_read(stream, data, count) != (size_t)count)
return -1;
for (i = count - ZIP_END_OF_CENTRAL_DIR_SIZE; i >= 0; i--) {
if (uint32le(data + i) == SIG_END_OF_CENTRAL_DIRECTORY)
return filesize - fromend + i;
}
fromend -= ZIP_END_OF_CENTRAL_DIR_SIZE - 1;
}
return -1;
}
const char *zip_get_name(ar_archive *ar, bool raw)
{
ar_archive_zip *zip = (ar_archive_zip *)ar;
if (!zip->entry.name) {
struct zip_entry entry;
char *name;
if (zip->dir.end_offset >= 0) {
if (!ar_seek(ar->stream, ar->entry_offset, SEEK_SET))
return NULL;
if (!zip_parse_directory_entry(zip, &entry))
return NULL;
if (!ar_seek(ar->stream, ar->entry_offset + ZIP_DIR_ENTRY_FIXED_SIZE, SEEK_SET))
return NULL;
}
else {
if (!ar_seek(ar->stream, zip->entry.offset, SEEK_SET))
return NULL;
if (!zip_parse_local_file_entry(zip, &entry))
return NULL;
if (!ar_seek(ar->stream, ar->entry_offset + ZIP_LOCAL_ENTRY_FIXED_SIZE, SEEK_SET))
return NULL;
}
name = malloc(entry.namelen + 1);
if (!name || ar_read(ar->stream, name, entry.namelen) != entry.namelen) {
free(name);
return NULL;
}
name[entry.namelen] = '\0';
zip->entry.raw_name = malloc(entry.namelen + 1);
if (zip->entry.raw_name) {
memcpy(zip->entry.raw_name, name, entry.namelen + 1);
}
if ((entry.flags & (1 << 11))) {
zip->entry.name = name;
}
else {
zip->entry.name = ar_conv_dos_to_utf8(name);
free(name);
}
/* normalize path separators */
if (zip->entry.name) {
char *p = zip->entry.name;
while ((p = strchr(p, '\\')) != NULL) {
*p = '/';
}
}
}
return raw ? zip->entry.raw_name : zip->entry.name;
}