/* Copyright 2015 the unarr project authors (see AUTHORS file). License: LGPLv3 */ #include "zip.h" #if defined(_MSC_VER) && !defined(inline) #define inline __inline #endif static inline uint16_t uint16le(unsigned char *data) { return data[0] | data[1] << 8; } static inline uint32_t uint32le(unsigned char *data) { return data[0] | data[1] << 8 | data[2] << 16 | (uint32_t) data[3] << 24; } static inline uint64_t uint64le(unsigned char *data) { return (uint64_t)uint32le(data) | (uint64_t)uint32le(data + 4) << 32; } bool zip_seek_to_compressed_data(ar_archive_zip *zip) { struct zip_entry entry; if (!ar_seek(zip->super.stream, zip->entry.offset, SEEK_SET)) return false; if (!zip_parse_local_file_entry(zip, &entry)) return false; if (zip->entry.method != entry.method) { warn("Compression methods don't match: %d != %d", zip->entry.method, entry.method); if (!zip->entry.method) zip->entry.method = entry.method; } if (zip->entry.dosdate != entry.dosdate) { warn("Timestamps don't match"); if (!zip->entry.dosdate) { zip->entry.dosdate = entry.dosdate; zip->super.entry_filetime = ar_conv_dosdate_to_filetime(zip->entry.dosdate); } } return ar_seek(zip->super.stream, zip->entry.offset + ZIP_LOCAL_ENTRY_FIXED_SIZE + entry.namelen + entry.extralen, SEEK_SET); } static bool zip_parse_extra_fields(ar_archive_zip *zip, struct zip_entry *entry) { uint8_t *extra; if (!entry->extralen) return true; /* read ZIP64 values where needed */ if (!ar_skip(zip->super.stream, entry->namelen)) return false; extra = malloc(entry->extralen); if (!extra || ar_read(zip->super.stream, extra, entry->extralen) != entry->extralen) { free(extra); return false; } for (uint32_t idx = 0; idx + 4 < entry->extralen; idx += 4 + uint16le(&extra[idx + 2])) { if (uint16le(&extra[idx]) == 0x0001) { uint16_t size = uint16le(&extra[idx + 2]); if (size + idx + 1 > entry->extralen) { free(extra); return false; } uint16_t offset = 0; if (entry->uncompressed == UINT32_MAX && offset + 8 <= size) { entry->uncompressed = uint64le(&extra[idx + 4 + offset]); offset += 8; } if (entry->datasize == UINT32_MAX && offset + 8 <= size) { entry->datasize = uint64le(&extra[idx + 4 + offset]); offset += 8; } if (entry->header_offset == UINT32_MAX && offset + 8 <= size) { entry->header_offset = (off64_t)uint64le(&extra[idx + 4 + offset]); offset += 8; } if (entry->disk == UINT16_MAX && offset + 4 <= size) { entry->disk = uint32le(&extra[idx + 4 + offset]); offset += 4; } break; } } free(extra); return true; } bool zip_parse_local_file_entry(ar_archive_zip *zip, struct zip_entry *entry) { uint8_t data[ZIP_LOCAL_ENTRY_FIXED_SIZE]; if (ar_read(zip->super.stream, data, sizeof(data)) != sizeof(data)) return false; memset(entry, 0, sizeof(*entry)); entry->signature = uint32le(data + 0); entry->version = uint16le(data + 4); entry->flags = uint16le(data + 6); entry->method = uint16le(data + 8); entry->dosdate = uint32le(data + 10); entry->crc = uint32le(data + 14); entry->datasize = uint32le(data + 18); entry->uncompressed = uint32le(data + 22); entry->namelen = uint16le(data + 26); entry->extralen = uint16le(data + 28); if (entry->signature != SIG_LOCAL_FILE_HEADER) return false; return zip_parse_extra_fields(zip, entry); } off64_t zip_find_next_local_file_entry(ar_stream *stream, off64_t offset) { uint8_t data[512]; int count, i; if (!ar_seek(stream, offset, SEEK_SET)) return -1; count = (int)ar_read(stream, data, sizeof(data)); while (count >= ZIP_LOCAL_ENTRY_FIXED_SIZE) { for (i = 0; i < count - 4; i++) { if (uint32le(data + i) == SIG_LOCAL_FILE_HEADER) return offset + i; } memmove(data, data + count - 4, 4); offset += count - 4; count = (int)ar_read(stream, data + 4, sizeof(data) - 4) + 4; } return -1; } bool zip_parse_directory_entry(ar_archive_zip *zip, struct zip_entry *entry) { uint8_t data[ZIP_DIR_ENTRY_FIXED_SIZE]; if (ar_read(zip->super.stream, data, sizeof(data)) != sizeof(data)) return false; entry->signature = uint32le(data + 0); entry->version = uint16le(data + 4); entry->min_version = uint16le(data + 6); entry->flags = uint16le(data + 8); entry->method = uint16le(data + 10); entry->dosdate = uint32le(data + 12); entry->crc = uint32le(data + 16); entry->datasize = uint32le(data + 20); entry->uncompressed = uint32le(data + 24); entry->namelen = uint16le(data + 28); entry->extralen = uint16le(data + 30); entry->commentlen = uint16le(data + 32); entry->disk = uint16le(data + 34); entry->attr_internal = uint16le(data + 36); entry->attr_external = uint32le(data + 38); entry->header_offset = uint32le(data + 42); if (entry->signature != SIG_CENTRAL_DIRECTORY) return false; return zip_parse_extra_fields(zip, entry); } off64_t zip_find_end_of_last_directory_entry(ar_stream *stream, struct zip_eocd64 *eocd) { uint8_t data[ZIP_DIR_ENTRY_FIXED_SIZE]; uint64_t i; if (!ar_seek(stream, eocd->dir_offset, SEEK_SET)) return -1; for (i = 0; i < eocd->numentries; i++) { if (ar_read(stream, data, sizeof(data)) != sizeof(data)) return -1; if (uint32le(data + 0) != SIG_CENTRAL_DIRECTORY) return -1; if (!ar_skip(stream, uint16le(data + 28) + uint16le(data + 30) + uint16le(data + 32))) return -1; } return ar_tell(stream); } bool zip_parse_end_of_central_directory(ar_stream *stream, struct zip_eocd64 *eocd) { uint8_t data[56]; if (ar_read(stream, data, ZIP_END_OF_CENTRAL_DIR_SIZE) != ZIP_END_OF_CENTRAL_DIR_SIZE) return false; eocd->signature = uint32le(data + 0); eocd->diskno = uint16le(data + 4); eocd->diskno_dir = uint16le(data + 6); eocd->numentries_disk = uint16le(data + 8); eocd->numentries = uint16le(data + 10); eocd->dir_size = uint32le(data + 12); eocd->dir_offset = uint32le(data + 16); eocd->commentlen = uint16le(data + 20); if (eocd->signature != SIG_END_OF_CENTRAL_DIRECTORY) return false; /* try to locate the ZIP64 end of central directory */ if (!ar_skip(stream, -42)) return eocd->dir_size < 20; if (ar_read(stream, data, 20) != 20) return false; if (uint32le(data + 0) != SIG_END_OF_CENTRAL_DIRECTORY_64_LOCATOR) return true; if ((eocd->diskno != UINT16_MAX && uint32le(data + 4) != eocd->diskno) || uint32le(data + 16) != 1) { warn("Archive spanning isn't supported"); return false; } if (!ar_seek(stream, (off64_t)uint64le(data + 8), SEEK_SET)) return false; if (ar_read(stream, data, 56) != 56) return false; /* use data from ZIP64 end of central directory (when necessary) */ eocd->signature = uint32le(data + 0); eocd->version = uint16le(data + 12); eocd->min_version = uint16le(data + 14); if (eocd->diskno == UINT16_MAX) eocd->diskno = uint32le(data + 16); if (eocd->diskno_dir == UINT16_MAX) eocd->diskno_dir = uint32le(data + 20); if (eocd->numentries_disk == UINT16_MAX) eocd->numentries_disk = uint64le(data + 24); if (eocd->numentries == UINT16_MAX) eocd->numentries = uint64le(data + 32); if (eocd->dir_size == UINT32_MAX) eocd->dir_size = uint64le(data + 40); if (eocd->dir_offset == UINT32_MAX) eocd->dir_offset = (off64_t)uint64le(data + 48); if (eocd->signature != SIG_END_OF_CENTRAL_DIRECTORY_64) return false; if (eocd->diskno != eocd->diskno_dir || eocd->numentries != eocd->numentries_disk) { warn("Archive spanning isn't supported"); return false; } if (uint64le(data + 4) > 44) log("ZIP64 extensible data sector present @" PRIi64, ar_tell(stream)); return true; } off64_t zip_find_end_of_central_directory(ar_stream *stream) { uint8_t data[512]; off64_t filesize; int fromend = 0; int count, i; if (!ar_seek(stream, 0, SEEK_END)) return -1; filesize = ar_tell(stream); while (fromend < UINT16_MAX + ZIP_END_OF_CENTRAL_DIR_SIZE && fromend < filesize) { count = (filesize - fromend < (int)sizeof(data) ? (int)(filesize - fromend) : (int)sizeof(data)); fromend += count; if (count < ZIP_END_OF_CENTRAL_DIR_SIZE) return -1; if (!ar_seek(stream, -fromend, SEEK_END)) return -1; if (ar_read(stream, data, count) != (size_t)count) return -1; for (i = count - ZIP_END_OF_CENTRAL_DIR_SIZE; i >= 0; i--) { if (uint32le(data + i) == SIG_END_OF_CENTRAL_DIRECTORY) return filesize - fromend + i; } fromend -= ZIP_END_OF_CENTRAL_DIR_SIZE - 1; } return -1; } const char *zip_get_name(ar_archive *ar, bool raw) { ar_archive_zip *zip = (ar_archive_zip *)ar; if (!zip->entry.name) { struct zip_entry entry; char *name; if (zip->dir.end_offset >= 0) { if (!ar_seek(ar->stream, ar->entry_offset, SEEK_SET)) return NULL; if (!zip_parse_directory_entry(zip, &entry)) return NULL; if (!ar_seek(ar->stream, ar->entry_offset + ZIP_DIR_ENTRY_FIXED_SIZE, SEEK_SET)) return NULL; } else { if (!ar_seek(ar->stream, zip->entry.offset, SEEK_SET)) return NULL; if (!zip_parse_local_file_entry(zip, &entry)) return NULL; if (!ar_seek(ar->stream, ar->entry_offset + ZIP_LOCAL_ENTRY_FIXED_SIZE, SEEK_SET)) return NULL; } name = malloc(entry.namelen + 1); if (!name || ar_read(ar->stream, name, entry.namelen) != entry.namelen) { free(name); return NULL; } name[entry.namelen] = '\0'; zip->entry.raw_name = malloc(entry.namelen + 1); if (zip->entry.raw_name) { memcpy(zip->entry.raw_name, name, entry.namelen + 1); } if ((entry.flags & (1 << 11))) { zip->entry.name = name; } else { zip->entry.name = ar_conv_dos_to_utf8(name); free(name); } /* normalize path separators */ if (zip->entry.name) { char *p = zip->entry.name; while ((p = strchr(p, '\\')) != NULL) { *p = '/'; } } } return raw ? zip->entry.raw_name : zip->entry.name; }