You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
383 lines
14 KiB
383 lines
14 KiB
/*
|
|
* Copyright (C) 2013 The Android Open Source Project
|
|
*
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
* you may not use this file except in compliance with the License.
|
|
* You may obtain a copy of the License at
|
|
*
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
*
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
* See the License for the specific language governing permissions and
|
|
* limitations under the License.
|
|
*/
|
|
|
|
#pragma once
|
|
|
|
/*
|
|
* Read-only access to Zip archives, with minimal heap allocation.
|
|
*/
|
|
|
|
#include <stdint.h>
|
|
#include <string.h>
|
|
#include <sys/cdefs.h>
|
|
#include <sys/types.h>
|
|
|
|
#include <functional>
|
|
#include <string>
|
|
#include <string_view>
|
|
|
|
#include "android-base/off64_t.h"
|
|
|
|
/* Zip compression methods we support */
|
|
enum {
|
|
kCompressStored = 0, // no compression
|
|
kCompressDeflated = 8, // standard deflate
|
|
};
|
|
|
|
// This struct holds the common information of a zip entry other than the
|
|
// the entry size. The compressed and uncompressed length will be handled
|
|
// separately in the derived class.
|
|
struct ZipEntryCommon {
|
|
// Compression method. One of kCompressStored or kCompressDeflated.
|
|
// See also `gpbf` for deflate subtypes.
|
|
uint16_t method;
|
|
|
|
// Modification time. The zipfile format specifies
|
|
// that the first two little endian bytes contain the time
|
|
// and the last two little endian bytes contain the date.
|
|
// See `GetModificationTime`. Use signed integer to avoid the
|
|
// sub-overflow.
|
|
// TODO: should be overridden by extra time field, if present.
|
|
int32_t mod_time;
|
|
|
|
// Returns `mod_time` as a broken-down struct tm.
|
|
struct tm GetModificationTime() const;
|
|
|
|
// Suggested Unix mode for this entry, from the zip archive if created on
|
|
// Unix, or a default otherwise. See also `external_file_attributes`.
|
|
mode_t unix_mode;
|
|
|
|
// 1 if this entry contains a data descriptor segment, 0
|
|
// otherwise.
|
|
uint8_t has_data_descriptor;
|
|
|
|
// Crc32 value of this ZipEntry. This information might
|
|
// either be stored in the local file header or in a special
|
|
// Data descriptor footer at the end of the file entry.
|
|
uint32_t crc32;
|
|
|
|
// If the value of uncompressed length and compressed length are stored in
|
|
// the zip64 extended info of the extra field.
|
|
bool zip64_format_size{false};
|
|
|
|
// The offset to the start of data for this ZipEntry.
|
|
off64_t offset;
|
|
|
|
// The version of zip and the host file system this came from (for zipinfo).
|
|
uint16_t version_made_by;
|
|
|
|
// The raw attributes, whose interpretation depends on the host
|
|
// file system in `version_made_by` (for zipinfo). See also `unix_mode`.
|
|
uint32_t external_file_attributes;
|
|
|
|
// Specifics about the deflation (for zipinfo).
|
|
uint16_t gpbf;
|
|
// Whether this entry is believed to be text or binary (for zipinfo).
|
|
bool is_text;
|
|
};
|
|
|
|
struct ZipEntry64;
|
|
// Many users of the library assume the entry size is capped at UNIT32_MAX. So we keep
|
|
// the interface for the old ZipEntry here; and we could switch them over to the new
|
|
// ZipEntry64 later.
|
|
struct ZipEntry : public ZipEntryCommon {
|
|
// Compressed length of this ZipEntry. The maximum value is UNIT32_MAX.
|
|
// Might be present either in the local file header or in the data
|
|
// descriptor footer.
|
|
uint32_t compressed_length{0};
|
|
|
|
// Uncompressed length of this ZipEntry. The maximum value is UNIT32_MAX.
|
|
// Might be present either in the local file header or in the data
|
|
// descriptor footer.
|
|
uint32_t uncompressed_length{0};
|
|
|
|
// Copies the contents of a ZipEntry64 object to a 32 bits ZipEntry. Returns 0 if the
|
|
// size of the entry fits into uint32_t, returns a negative error code
|
|
// (kUnsupportedEntrySize) otherwise.
|
|
static int32_t CopyFromZipEntry64(ZipEntry* dst, const ZipEntry64* src);
|
|
|
|
private:
|
|
ZipEntry& operator=(const ZipEntryCommon& other) {
|
|
ZipEntryCommon::operator=(other);
|
|
return *this;
|
|
}
|
|
};
|
|
|
|
// Represents information about a zip entry in a zip file.
|
|
struct ZipEntry64 : public ZipEntryCommon {
|
|
// Compressed length of this ZipEntry. The maximum value is UNIT64_MAX.
|
|
// Might be present either in the local file header, the zip64 extended field,
|
|
// or in the data descriptor footer.
|
|
uint64_t compressed_length{0};
|
|
|
|
// Uncompressed length of this ZipEntry. The maximum value is UNIT64_MAX.
|
|
// Might be present either in the local file header, the zip64 extended field,
|
|
// or in the data descriptor footer.
|
|
uint64_t uncompressed_length{0};
|
|
|
|
explicit ZipEntry64() = default;
|
|
explicit ZipEntry64(const ZipEntry& zip_entry) : ZipEntryCommon(zip_entry) {
|
|
compressed_length = zip_entry.compressed_length;
|
|
uncompressed_length = zip_entry.uncompressed_length;
|
|
}
|
|
};
|
|
|
|
struct ZipArchive;
|
|
typedef ZipArchive* ZipArchiveHandle;
|
|
|
|
/*
|
|
* Open a Zip archive, and sets handle to the value of the opaque
|
|
* handle for the file. This handle must be released by calling
|
|
* CloseArchive with this handle.
|
|
*
|
|
* Returns 0 on success, and negative values on failure.
|
|
*/
|
|
int32_t OpenArchive(const char* fileName, ZipArchiveHandle* handle);
|
|
|
|
/*
|
|
* Like OpenArchive, but takes a file descriptor open for reading
|
|
* at the start of the file. The descriptor must be mappable (this does
|
|
* not allow access to a stream).
|
|
*
|
|
* Sets handle to the value of the opaque handle for this file descriptor.
|
|
* This handle must be released by calling CloseArchive with this handle.
|
|
*
|
|
* If assume_ownership parameter is 'true' calling CloseArchive will close
|
|
* the file.
|
|
*
|
|
* This function maps and scans the central directory and builds a table
|
|
* of entries for future lookups.
|
|
*
|
|
* "debugFileName" will appear in error messages, but is not otherwise used.
|
|
*
|
|
* Returns 0 on success, and negative values on failure.
|
|
*/
|
|
int32_t OpenArchiveFd(const int fd, const char* debugFileName, ZipArchiveHandle* handle,
|
|
bool assume_ownership = true);
|
|
|
|
int32_t OpenArchiveFdRange(const int fd, const char* debugFileName, ZipArchiveHandle* handle,
|
|
off64_t length, off64_t offset, bool assume_ownership = true);
|
|
|
|
int32_t OpenArchiveFromMemory(const void* address, size_t length, const char* debugFileName,
|
|
ZipArchiveHandle* handle);
|
|
/*
|
|
* Close archive, releasing resources associated with it. This will
|
|
* unmap the central directory of the zipfile and free all internal
|
|
* data structures associated with the file. It is an error to use
|
|
* this handle for any further operations without an intervening
|
|
* call to one of the OpenArchive variants.
|
|
*/
|
|
void CloseArchive(ZipArchiveHandle archive);
|
|
|
|
/** See GetArchiveInfo(). */
|
|
struct ZipArchiveInfo {
|
|
/** The size in bytes of the archive itself. Used by zipinfo. */
|
|
off64_t archive_size;
|
|
/** The number of entries in the archive. */
|
|
uint64_t entry_count;
|
|
};
|
|
|
|
/**
|
|
* Returns information about the given archive.
|
|
*/
|
|
ZipArchiveInfo GetArchiveInfo(ZipArchiveHandle archive);
|
|
|
|
/*
|
|
* Find an entry in the Zip archive, by name. |data| must be non-null.
|
|
*
|
|
* Returns 0 if an entry is found, and populates |data| with information
|
|
* about this entry. Returns negative values otherwise.
|
|
*
|
|
* It's important to note that |data->crc32|, |data->compLen| and
|
|
* |data->uncompLen| might be set to values from the central directory
|
|
* if this file entry contains a data descriptor footer. To verify crc32s
|
|
* and length, a call to VerifyCrcAndLengths must be made after entry data
|
|
* has been processed.
|
|
*
|
|
* On non-Windows platforms this method does not modify internal state and
|
|
* can be called concurrently.
|
|
*/
|
|
int32_t FindEntry(const ZipArchiveHandle archive, const std::string_view entryName,
|
|
ZipEntry64* data);
|
|
|
|
/*
|
|
* Start iterating over all entries of a zip file. The order of iteration
|
|
* is not guaranteed to be the same as the order of elements
|
|
* in the central directory but is stable for a given zip file. |cookie| will
|
|
* contain the value of an opaque cookie which can be used to make one or more
|
|
* calls to Next. All calls to StartIteration must be matched by a call to
|
|
* EndIteration to free any allocated memory.
|
|
*
|
|
* This method also accepts optional prefix and suffix to restrict iteration to
|
|
* entry names that start with |optional_prefix| or end with |optional_suffix|.
|
|
*
|
|
* Returns 0 on success and negative values on failure.
|
|
*/
|
|
int32_t StartIteration(ZipArchiveHandle archive, void** cookie_ptr,
|
|
const std::string_view optional_prefix = "",
|
|
const std::string_view optional_suffix = "");
|
|
|
|
/*
|
|
* Start iterating over all entries of a zip file. Use the matcher functor to
|
|
* restrict iteration to entry names that make the functor return true.
|
|
*
|
|
* Returns 0 on success and negative values on failure.
|
|
*/
|
|
int32_t StartIteration(ZipArchiveHandle archive, void** cookie_ptr,
|
|
std::function<bool(std::string_view entry_name)> matcher);
|
|
|
|
/*
|
|
* Advance to the next element in the zipfile in iteration order.
|
|
*
|
|
* Returns 0 on success, -1 if there are no more elements in this
|
|
* archive and lower negative values on failure.
|
|
*/
|
|
int32_t Next(void* cookie, ZipEntry64* data, std::string_view* name);
|
|
int32_t Next(void* cookie, ZipEntry64* data, std::string* name);
|
|
|
|
/*
|
|
* End iteration over all entries of a zip file and frees the memory allocated
|
|
* in StartIteration.
|
|
*/
|
|
void EndIteration(void* cookie);
|
|
|
|
/*
|
|
* Uncompress and write an entry to an open file identified by |fd|.
|
|
* |entry->uncompressed_length| bytes will be written to the file at
|
|
* its current offset, and the file will be truncated at the end of
|
|
* the uncompressed data (no truncation if |fd| references a block
|
|
* device).
|
|
*
|
|
* Returns 0 on success and negative values on failure.
|
|
*/
|
|
int32_t ExtractEntryToFile(ZipArchiveHandle archive, const ZipEntry64* entry, int fd);
|
|
|
|
/**
|
|
* Uncompress a given zip entry to the memory region at |begin| and of
|
|
* size |size|. This size is expected to be the same as the *declared*
|
|
* uncompressed length of the zip entry. It is an error if the *actual*
|
|
* number of uncompressed bytes differs from this number.
|
|
*
|
|
* Returns 0 on success and negative values on failure.
|
|
*/
|
|
int32_t ExtractToMemory(ZipArchiveHandle archive, const ZipEntry64* entry, uint8_t* begin,
|
|
size_t size);
|
|
|
|
int GetFileDescriptor(const ZipArchiveHandle archive);
|
|
|
|
/**
|
|
* Returns the offset of the zip archive in the backing file descriptor, or 0 if the zip archive is
|
|
* not backed by a file descriptor.
|
|
*/
|
|
off64_t GetFileDescriptorOffset(const ZipArchiveHandle archive);
|
|
|
|
const char* ErrorCodeString(int32_t error_code);
|
|
|
|
// Many users of libziparchive assume the entry size to be 32 bits long. So we keep these
|
|
// interfaces that use 32 bit ZipEntry to make old code work. TODO(xunchang) Remove the 32 bit
|
|
// wrapper functions once we switch all users to recognize ZipEntry64.
|
|
int32_t FindEntry(const ZipArchiveHandle archive, const std::string_view entryName, ZipEntry* data);
|
|
int32_t Next(void* cookie, ZipEntry* data, std::string* name);
|
|
int32_t Next(void* cookie, ZipEntry* data, std::string_view* name);
|
|
int32_t ExtractEntryToFile(ZipArchiveHandle archive, const ZipEntry* entry, int fd);
|
|
int32_t ExtractToMemory(ZipArchiveHandle archive, const ZipEntry* entry, uint8_t* begin,
|
|
size_t size);
|
|
|
|
//
|
|
// This gets defined for the version of the library that need to control all
|
|
// code accessing the zip file. Details in incfs_support/signal_handling.h
|
|
//
|
|
#if !ZIPARCHIVE_DISABLE_CALLBACK_API
|
|
|
|
#if !defined(_WIN32)
|
|
typedef bool (*ProcessZipEntryFunction)(const uint8_t* buf, size_t buf_size, void* cookie);
|
|
|
|
/*
|
|
* Stream the uncompressed data through the supplied function,
|
|
* passing cookie to it each time it gets called.
|
|
*/
|
|
int32_t ProcessZipEntryContents(ZipArchiveHandle archive, const ZipEntry* entry,
|
|
ProcessZipEntryFunction func, void* cookie);
|
|
int32_t ProcessZipEntryContents(ZipArchiveHandle archive, const ZipEntry64* entry,
|
|
ProcessZipEntryFunction func, void* cookie);
|
|
#endif // !defined(_WIN32)
|
|
|
|
#endif // !ZIPARCHIVE_DISABLE_CALLBACK_API
|
|
|
|
namespace zip_archive {
|
|
|
|
class Writer {
|
|
public:
|
|
virtual bool Append(uint8_t* buf, size_t buf_size) = 0;
|
|
virtual ~Writer();
|
|
|
|
protected:
|
|
Writer() = default;
|
|
|
|
private:
|
|
Writer(const Writer&) = delete;
|
|
void operator=(const Writer&) = delete;
|
|
};
|
|
|
|
class Reader {
|
|
public:
|
|
virtual bool ReadAtOffset(uint8_t* buf, size_t len, off64_t offset) const = 0;
|
|
virtual ~Reader();
|
|
|
|
protected:
|
|
Reader() = default;
|
|
|
|
private:
|
|
Reader(const Reader&) = delete;
|
|
void operator=(const Reader&) = delete;
|
|
};
|
|
|
|
//
|
|
// This gets defined for the version of the library that need to control all
|
|
// code accessing the zip file. Details in incfs_support/signal_handling.h
|
|
//
|
|
#if !ZIPARCHIVE_DISABLE_CALLBACK_API
|
|
|
|
/**
|
|
* Uncompress a given zip entry to given |writer|.
|
|
*
|
|
* Returns 0 on success and negative values on failure.
|
|
*/
|
|
int32_t ExtractToWriter(ZipArchiveHandle handle, const ZipEntry64* entry,
|
|
zip_archive::Writer* writer);
|
|
|
|
#endif // !ZIPARCHIVE_DISABLE_CALLBACK_API
|
|
|
|
/*
|
|
* Inflates the first |compressed_length| bytes of |reader| to a given |writer|.
|
|
* |crc_out| is set to the CRC32 checksum of the uncompressed data.
|
|
*
|
|
* Returns 0 on success and negative values on failure, for example if |reader|
|
|
* cannot supply the right amount of data, or if the number of bytes written to
|
|
* data does not match |uncompressed_length|.
|
|
*
|
|
* If |crc_out| is not nullptr, it is set to the crc32 checksum of the
|
|
* uncompressed data.
|
|
*
|
|
* NOTE: in the IncFS version of the library this function remains
|
|
* unprotected, because the data |reader| is supplying is under the full reader's
|
|
* control; it's the reader's duty to ensure it is available and OK to access.
|
|
*/
|
|
int32_t Inflate(const Reader& reader, const uint64_t compressed_length,
|
|
const uint64_t uncompressed_length, Writer* writer, uint64_t* crc_out);
|
|
|
|
} // namespace zip_archive
|