// SPDX-License-Identifier: (LGPL-2.1 OR BSD-2-Clause) /* * Routines for dealing with .zip archives. * * Copyright (c) Meta Platforms, Inc. and affiliates. */ #include <errno.h> #include <fcntl.h> #include <stdint.h> #include <stdlib.h> #include <string.h> #include <sys/mman.h> #include <unistd.h> #include "libbpf_internal.h" #include "zip.h" #pragma GCC diagnostic push #pragma GCC diagnostic ignored "-Wpacked" #pragma GCC diagnostic ignored "-Wattributes" /* Specification of ZIP file format can be found here: * https://pkware.cachefly.net/webdocs/casestudies/APPNOTE.TXT * For a high level overview of the structure of a ZIP file see * sections 4.3.1 - 4.3.6. * * Data structures appearing in ZIP files do not contain any * padding and they might be misaligned. To allow us to safely * operate on pointers to such structures and their members, we * declare the types as packed. */ #define END_OF_CD_RECORD_MAGIC 0x06054b50 /* See section 4.3.16 of the spec. */ struct end_of_cd_record { /* Magic value equal to END_OF_CD_RECORD_MAGIC */ __u32 magic; /* Number of the file containing this structure or 0xFFFF if ZIP64 archive. * Zip archive might span multiple files (disks). */ __u16 this_disk; /* Number of the file containing the beginning of the central directory or * 0xFFFF if ZIP64 archive. */ __u16 cd_disk; /* Number of central directory records on this disk or 0xFFFF if ZIP64 * archive. */ __u16 cd_records; /* Number of central directory records on all disks or 0xFFFF if ZIP64 * archive. */ __u16 cd_records_total; /* Size of the central directory record or 0xFFFFFFFF if ZIP64 archive. */ __u32 cd_size; /* Offset of the central directory from the beginning of the archive or * 0xFFFFFFFF if ZIP64 archive. */ __u32 cd_offset; /* Length of comment data following end of central directory record. */ __u16 comment_length; /* Up to 64k of arbitrary bytes. */ /* uint8_t comment[comment_length] */ } __attribute__((packed)); #define CD_FILE_HEADER_MAGIC 0x02014b50 #define FLAG_ENCRYPTED (1 << 0) #define FLAG_HAS_DATA_DESCRIPTOR (1 << 3) /* See section 4.3.12 of the spec. */ struct cd_file_header { /* Magic value equal to CD_FILE_HEADER_MAGIC. */ __u32 magic; __u16 version; /* Minimum zip version needed to extract the file. */ __u16 min_version; __u16 flags; __u16 compression; __u16 last_modified_time; __u16 last_modified_date; __u32 crc; __u32 compressed_size; __u32 uncompressed_size; __u16 file_name_length; __u16 extra_field_length; __u16 file_comment_length; /* Number of the disk where the file starts or 0xFFFF if ZIP64 archive. */ __u16 disk; __u16 internal_attributes; __u32 external_attributes; /* Offset from the start of the disk containing the local file header to the * start of the local file header. */ __u32 offset; } __attribute__((packed)); #define LOCAL_FILE_HEADER_MAGIC 0x04034b50 /* See section 4.3.7 of the spec. */ struct local_file_header { /* Magic value equal to LOCAL_FILE_HEADER_MAGIC. */ __u32 magic; /* Minimum zip version needed to extract the file. */ __u16 min_version; __u16 flags; __u16 compression; __u16 last_modified_time; __u16 last_modified_date; __u32 crc; __u32 compressed_size; __u32 uncompressed_size; __u16 file_name_length; __u16 extra_field_length; } __attribute__((packed)); #pragma GCC diagnostic pop struct zip_archive { void *data; __u32 size; __u32 cd_offset; __u32 cd_records; }; static void *check_access(struct zip_archive *archive, __u32 offset, __u32 size) { if (offset + size > archive->size || offset > offset + size) return NULL; return archive->data + offset; } /* Returns 0 on success, -EINVAL on error and -ENOTSUP if the eocd indicates the * archive uses features which are not supported. */ static int try_parse_end_of_cd(struct zip_archive *archive, __u32 offset) { __u16 comment_length, cd_records; struct end_of_cd_record *eocd; __u32 cd_offset, cd_size; eocd = check_access(archive, offset, sizeof(*eocd)); if (!eocd || eocd->magic != END_OF_CD_RECORD_MAGIC) return -EINVAL; comment_length = eocd->comment_length; if (offset + sizeof(*eocd) + comment_length != archive->size) return -EINVAL; cd_records = eocd->cd_records; if (eocd->this_disk != 0 || eocd->cd_disk != 0 || eocd->cd_records_total != cd_records) /* This is a valid eocd, but we only support single-file non-ZIP64 archives. */ return -ENOTSUP; cd_offset = eocd->cd_offset; cd_size = eocd->cd_size; if (!check_access(archive, cd_offset, cd_size)) return -EINVAL; archive->cd_offset = cd_offset; archive->cd_records = cd_records; return 0; } static int find_cd(struct zip_archive *archive) { int64_t limit, offset; int rc = -EINVAL; if (archive->size <= sizeof(struct end_of_cd_record)) return -EINVAL; /* Because the end of central directory ends with a variable length array of * up to 0xFFFF bytes we can't know exactly where it starts and need to * search for it at the end of the file, scanning the (limit, offset] range. */ offset = archive->size - sizeof(struct end_of_cd_record); limit = (int64_t)offset - (1 << 16); for (; offset >= 0 && offset > limit && rc != 0; offset--) { rc = try_parse_end_of_cd(archive, offset); if (rc == -ENOTSUP) break; } return rc; } struct zip_archive *zip_archive_open(const char *path) { struct zip_archive *archive; int err, fd; off_t size; void *data; fd = open(path, O_RDONLY | O_CLOEXEC); if (fd < 0) return ERR_PTR(-errno); size = lseek(fd, 0, SEEK_END); if (size == (off_t)-1 || size > UINT32_MAX) { close(fd); return ERR_PTR(-EINVAL); } data = mmap(NULL, size, PROT_READ, MAP_PRIVATE, fd, 0); err = -errno; close(fd); if (data == MAP_FAILED) return ERR_PTR(err); archive = malloc(sizeof(*archive)); if (!archive) { munmap(data, size); return ERR_PTR(-ENOMEM); }; archive->data = data; archive->size = size; err = find_cd(archive); if (err) { munmap(data, size); free(archive); return ERR_PTR(err); } return archive; } void zip_archive_close(struct zip_archive *archive) { munmap(archive->data, archive->size); free(archive); } static struct local_file_header *local_file_header_at_offset(struct zip_archive *archive, __u32 offset) { struct local_file_header *lfh; lfh = check_access(archive, offset, sizeof(*lfh)); if (!lfh || lfh->magic != LOCAL_FILE_HEADER_MAGIC) return NULL; return lfh; } static int get_entry_at_offset(struct zip_archive *archive, __u32 offset, struct zip_entry *out) { struct local_file_header *lfh; __u32 compressed_size; const char *name; void *data; lfh = local_file_header_at_offset(archive, offset); if (!lfh) return -EINVAL; offset += sizeof(*lfh); if ((lfh->flags & FLAG_ENCRYPTED) || (lfh->flags & FLAG_HAS_DATA_DESCRIPTOR)) return -EINVAL; name = check_access(archive, offset, lfh->file_name_length); if (!name) return -EINVAL; offset += lfh->file_name_length; if (!check_access(archive, offset, lfh->extra_field_length)) return -EINVAL; offset += lfh->extra_field_length; compressed_size = lfh->compressed_size; data = check_access(archive, offset, compressed_size); if (!data) return -EINVAL; out->compression = lfh->compression; out->name_length = lfh->file_name_length; out->name = name; out->data = data; out->data_length = compressed_size; out->data_offset = offset; return 0; } int zip_archive_find_entry(struct zip_archive *archive, const char *file_name, struct zip_entry *out) { size_t file_name_length = strlen(file_name); __u32 i, offset = archive->cd_offset; for (i = 0; i < archive->cd_records; ++i) { __u16 cdfh_name_length, cdfh_flags; struct cd_file_header *cdfh; const char *cdfh_name; cdfh = check_access(archive, offset, sizeof(*cdfh)); if (!cdfh || cdfh->magic != CD_FILE_HEADER_MAGIC) return -EINVAL; offset += sizeof(*cdfh); cdfh_name_length = cdfh->file_name_length; cdfh_name = check_access(archive, offset, cdfh_name_length); if (!cdfh_name) return -EINVAL; cdfh_flags = cdfh->flags; if ((cdfh_flags & FLAG_ENCRYPTED) == 0 && (cdfh_flags & FLAG_HAS_DATA_DESCRIPTOR) == 0 && file_name_length == cdfh_name_length && memcmp(file_name, archive->data + offset, file_name_length) == 0) { return get_entry_at_offset(archive, cdfh->offset, out); } offset += cdfh_name_length; offset += cdfh->extra_field_length; offset += cdfh->file_comment_length; } return -ENOENT; }