blob: bc7103b9685c273197443bc43a904693020685cc [file] [log] [blame]
Narayan Kamath7462f022013-11-21 13:05:04 +00001/*
2 * Copyright (C) 2008 The Android Open Source Project
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 * http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
16
17/*
18 * Read-only access to Zip archives, with minimal heap allocation.
19 */
Narayan Kamath7462f022013-11-21 13:05:04 +000020
Mark Salyzyncfd5b082016-10-17 14:28:00 -070021#define LOG_TAG "ziparchive"
22
Elliott Hughese8f4b142018-10-19 16:09:39 -070023#include "ziparchive/zip_archive.h"
24
Narayan Kamath7462f022013-11-21 13:05:04 +000025#include <errno.h>
Mark Salyzyn99ef9912014-03-14 14:26:22 -070026#include <fcntl.h>
27#include <inttypes.h>
Narayan Kamath7462f022013-11-21 13:05:04 +000028#include <limits.h>
Narayan Kamath7462f022013-11-21 13:05:04 +000029#include <stdlib.h>
30#include <string.h>
Elliott Hughes55fd2932017-05-28 22:59:04 -070031#include <time.h>
Narayan Kamath7462f022013-11-21 13:05:04 +000032#include <unistd.h>
33
Dan Albert1ae07642015-04-09 14:11:18 -070034#include <memory>
35#include <vector>
36
Elliott Hughes9c8bd662018-10-26 16:14:21 -070037#if defined(__APPLE__)
38#define lseek64 lseek
39#endif
40
Josh Gao1b496342018-07-17 11:08:48 -070041#if defined(__BIONIC__)
42#include <android/fdsan.h>
43#endif
44
Mark Salyzynff2dcd92016-09-28 15:54:45 -070045#include <android-base/file.h>
46#include <android-base/logging.h>
47#include <android-base/macros.h> // TEMP_FAILURE_RETRY may or may not be in unistd
Elliott Hughese8f4b142018-10-19 16:09:39 -070048#include <android-base/mapped_file.h>
Mark Salyzynff2dcd92016-09-28 15:54:45 -070049#include <android-base/memory.h>
Ryan Mitchellc77f9d32018-08-25 14:06:29 -070050#include <android-base/utf8.h>
Mark Salyzyncfd5b082016-10-17 14:28:00 -070051#include <log/log.h>
Dan Albert1ae07642015-04-09 14:11:18 -070052#include "zlib.h"
Narayan Kamath7462f022013-11-21 13:05:04 +000053
Narayan Kamath044bc8e2014-12-03 18:22:53 +000054#include "entry_name_utils-inl.h"
Adam Lesinskiad4ad8c2015-10-05 18:16:18 -070055#include "zip_archive_common.h"
Christopher Ferrise6884ce2015-11-10 14:55:12 -080056#include "zip_archive_private.h"
Mark Salyzyn99ef9912014-03-14 14:26:22 -070057
Dan Albert1ae07642015-04-09 14:11:18 -070058using android::base::get_unaligned;
Narayan Kamath044bc8e2014-12-03 18:22:53 +000059
// Compile-time switch for CRC verification: when true, the CRC of the
// extracted content is compared against the values recorded in the local
// file header and the central directory. Currently disabled.
static constexpr bool kCrcChecksEnabled = false;
63
Narayan Kamath926973e2014-06-09 14:18:14 +010064// The maximum number of bytes to scan backwards for the EOCD start.
65static const uint32_t kMaxEOCDSearch = kMaxCommentLen + sizeof(EocdRecord);
66
Narayan Kamath7462f022013-11-21 13:05:04 +000067/*
68 * A Read-only Zip archive.
69 *
70 * We want "open" and "find entry by name" to be fast operations, and
71 * we want to use as little memory as possible. We memory-map the zip
72 * central directory, and load a hash table with pointers to the filenames
73 * (which aren't null-terminated). The other fields are at a fixed offset
74 * from the filename, so we don't need to extract those (but we do need
75 * to byte-read and endian-swap them every time we want them).
76 *
77 * It's possible that somebody has handed us a massive (~1GB) zip archive,
78 * so we can't expect to mmap the entire file.
79 *
80 * To speed comparisons when doing a lookup by name, we could make the mapping
81 * "private" (copy-on-write) and null-terminate the filenames after verifying
82 * the record structure. However, this requires a private mapping of
83 * every page that the Central Directory touches. Easier to tuck a copy
84 * of the string length into the hash table entry.
85 */
Narayan Kamath7462f022013-11-21 13:05:04 +000086
/*
 * Returns the smallest power of two that is >= |val|.
 *
 * Works by smearing the highest set bit of (val - 1) into every lower bit
 * and then adding one (see
 * http://graphics.stanford.edu/~seander/bithacks.html). Inputs of 0 and
 * inputs above 2^31 wrap around and yield 0.
 */
static uint32_t RoundUpPower2(uint32_t val) {
  uint32_t smeared = val - 1;
  // Shift widths 1, 2, 4, 8, 16 cover all 32 bits.
  for (uint32_t shift = 1; shift <= 16; shift <<= 1) {
    smeared |= smeared >> shift;
  }
  return smeared + 1;
}
103
Yusuke Sato07447542015-06-25 14:39:19 -0700104static uint32_t ComputeHash(const ZipString& name) {
Nick Kralevichc0bf3662019-04-05 09:10:34 -0700105 return static_cast<uint32_t>(std::hash<std::string_view>{}(
106 std::string_view(reinterpret_cast<const char*>(name.name), name.name_length)));
Narayan Kamath7462f022013-11-21 13:05:04 +0000107}
108
Zimuzo5a503ef2018-09-17 19:49:55 +0100109static bool isZipStringEqual(const uint8_t* start, const ZipString& zip_string,
110 const ZipStringOffset& zip_string_offset) {
111 const ZipString from_offset = zip_string_offset.GetZipString(start);
112 return from_offset == zip_string;
113}
114
115/**
116 * Returns offset of ZipString#name from the start of the central directory in the memory map.
117 * For valid ZipStrings contained in the zip archive mmap, 0 < offset < 0xffffff.
118 */
119static inline uint32_t GetOffset(const uint8_t* name, const uint8_t* start) {
120 CHECK_GT(name, start);
121 CHECK_LT(name, start + 0xffffff);
122 return static_cast<uint32_t>(name - start);
123}
124
Narayan Kamath7462f022013-11-21 13:05:04 +0000125/*
126 * Convert a ZipEntry to a hash table index, verifying that it's in a
127 * valid range.
128 */
Zimuzo5a503ef2018-09-17 19:49:55 +0100129static int64_t EntryToIndex(const ZipStringOffset* hash_table, const uint32_t hash_table_size,
130 const ZipString& name, const uint8_t* start) {
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100131 const uint32_t hash = ComputeHash(name);
Narayan Kamath7462f022013-11-21 13:05:04 +0000132
133 // NOTE: (hash_table_size - 1) is guaranteed to be non-negative.
134 uint32_t ent = hash & (hash_table_size - 1);
Zimuzo5a503ef2018-09-17 19:49:55 +0100135 while (hash_table[ent].name_offset != 0) {
136 if (isZipStringEqual(start, name, hash_table[ent])) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000137 return ent;
138 }
Narayan Kamath7462f022013-11-21 13:05:04 +0000139 ent = (ent + 1) & (hash_table_size - 1);
140 }
141
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100142 ALOGV("Zip: Unable to find entry %.*s", name.name_length, name.name);
Narayan Kamath7462f022013-11-21 13:05:04 +0000143 return kEntryNotFound;
144}
145
146/*
147 * Add a new entry to the hash table.
148 */
Andreas Gampe964b95c2019-04-05 13:48:02 -0700149static int32_t AddToHash(ZipStringOffset* hash_table, const uint32_t hash_table_size,
Zimuzo5a503ef2018-09-17 19:49:55 +0100150 const ZipString& name, const uint8_t* start) {
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100151 const uint64_t hash = ComputeHash(name);
Narayan Kamath7462f022013-11-21 13:05:04 +0000152 uint32_t ent = hash & (hash_table_size - 1);
153
154 /*
155 * We over-allocated the table, so we're guaranteed to find an empty slot.
156 * Further, we guarantee that the hashtable size is not 0.
157 */
Zimuzo5a503ef2018-09-17 19:49:55 +0100158 while (hash_table[ent].name_offset != 0) {
159 if (isZipStringEqual(start, name, hash_table[ent])) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000160 // We've found a duplicate entry. We don't accept it
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100161 ALOGW("Zip: Found duplicate entry %.*s", name.name_length, name.name);
Narayan Kamath7462f022013-11-21 13:05:04 +0000162 return kDuplicateEntry;
163 }
164 ent = (ent + 1) & (hash_table_size - 1);
165 }
Zimuzo5a503ef2018-09-17 19:49:55 +0100166 hash_table[ent].name_offset = GetOffset(name.name, start);
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100167 hash_table[ent].name_length = name.name_length;
Narayan Kamath7462f022013-11-21 13:05:04 +0000168 return 0;
169}
170
Josh Gaoabdfc242018-09-07 12:44:40 -0700171#if defined(__BIONIC__)
172uint64_t GetOwnerTag(const ZipArchive* archive) {
173 return android_fdsan_create_owner_tag(ANDROID_FDSAN_OWNER_TYPE_ZIPARCHIVE,
174 reinterpret_cast<uint64_t>(archive));
175}
176#endif
177
Josh Gao1b496342018-07-17 11:08:48 -0700178ZipArchive::ZipArchive(const int fd, bool assume_ownership)
179 : mapped_zip(fd),
180 close_file(assume_ownership),
181 directory_offset(0),
182 central_directory(),
Elliott Hughese8f4b142018-10-19 16:09:39 -0700183 directory_map(),
Josh Gao1b496342018-07-17 11:08:48 -0700184 num_entries(0),
185 hash_table_size(0),
186 hash_table(nullptr) {
187#if defined(__BIONIC__)
188 if (assume_ownership) {
Josh Gaoabdfc242018-09-07 12:44:40 -0700189 android_fdsan_exchange_owner_tag(fd, 0, GetOwnerTag(this));
Josh Gao1b496342018-07-17 11:08:48 -0700190 }
191#endif
192}
193
194ZipArchive::ZipArchive(void* address, size_t length)
195 : mapped_zip(address, length),
196 close_file(false),
197 directory_offset(0),
198 central_directory(),
Elliott Hughese8f4b142018-10-19 16:09:39 -0700199 directory_map(),
Josh Gao1b496342018-07-17 11:08:48 -0700200 num_entries(0),
201 hash_table_size(0),
202 hash_table(nullptr) {}
203
204ZipArchive::~ZipArchive() {
205 if (close_file && mapped_zip.GetFileDescriptor() >= 0) {
206#if defined(__BIONIC__)
Josh Gaoabdfc242018-09-07 12:44:40 -0700207 android_fdsan_close_with_tag(mapped_zip.GetFileDescriptor(), GetOwnerTag(this));
Josh Gao1b496342018-07-17 11:08:48 -0700208#else
209 close(mapped_zip.GetFileDescriptor());
210#endif
211 }
212
213 free(hash_table);
214}
215
Tianjie Xu18c25922016-09-29 15:27:41 -0700216static int32_t MapCentralDirectory0(const char* debug_file_name, ZipArchive* archive,
Andreas Gampe964b95c2019-04-05 13:48:02 -0700217 off64_t file_length, uint32_t read_amount,
Zimuzo5a503ef2018-09-17 19:49:55 +0100218 uint8_t* scan_buffer) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000219 const off64_t search_start = file_length - read_amount;
220
Jiyong Parkcd997e62017-06-30 17:23:33 +0900221 if (!archive->mapped_zip.ReadAtOffset(scan_buffer, read_amount, search_start)) {
222 ALOGE("Zip: read %" PRId64 " from offset %" PRId64 " failed", static_cast<int64_t>(read_amount),
223 static_cast<int64_t>(search_start));
Narayan Kamath7462f022013-11-21 13:05:04 +0000224 return kIoError;
225 }
226
227 /*
228 * Scan backward for the EOCD magic. In an archive without a trailing
229 * comment, we'll find it on the first try. (We may want to consider
230 * doing an initial minimal read; if we don't find it, retry with a
231 * second read as above.)
232 */
Andreas Gampe964b95c2019-04-05 13:48:02 -0700233 CHECK_LE(read_amount, std::numeric_limits<int32_t>::max());
234 int32_t i = read_amount - sizeof(EocdRecord);
Narayan Kamath926973e2014-06-09 14:18:14 +0100235 for (; i >= 0; i--) {
Dan Albert1ae07642015-04-09 14:11:18 -0700236 if (scan_buffer[i] == 0x50) {
237 uint32_t* sig_addr = reinterpret_cast<uint32_t*>(&scan_buffer[i]);
238 if (get_unaligned<uint32_t>(sig_addr) == EocdRecord::kSignature) {
239 ALOGV("+++ Found EOCD at buf+%d", i);
240 break;
241 }
Narayan Kamath7462f022013-11-21 13:05:04 +0000242 }
243 }
244 if (i < 0) {
245 ALOGD("Zip: EOCD not found, %s is not zip", debug_file_name);
246 return kInvalidFile;
247 }
248
249 const off64_t eocd_offset = search_start + i;
Narayan Kamath926973e2014-06-09 14:18:14 +0100250 const EocdRecord* eocd = reinterpret_cast<const EocdRecord*>(scan_buffer + i);
Narayan Kamath7462f022013-11-21 13:05:04 +0000251 /*
Narayan Kamath926973e2014-06-09 14:18:14 +0100252 * Verify that there's no trailing space at the end of the central directory
253 * and its comment.
Narayan Kamath7462f022013-11-21 13:05:04 +0000254 */
Jiyong Parkcd997e62017-06-30 17:23:33 +0900255 const off64_t calculated_length = eocd_offset + sizeof(EocdRecord) + eocd->comment_length;
Narayan Kamath926973e2014-06-09 14:18:14 +0100256 if (calculated_length != file_length) {
Narayan Kamath4f6b4992014-06-03 13:59:23 +0100257 ALOGW("Zip: %" PRId64 " extraneous bytes at the end of the central directory",
Narayan Kamath926973e2014-06-09 14:18:14 +0100258 static_cast<int64_t>(file_length - calculated_length));
Narayan Kamath4f6b4992014-06-03 13:59:23 +0100259 return kInvalidFile;
260 }
Narayan Kamath7462f022013-11-21 13:05:04 +0000261
Narayan Kamath926973e2014-06-09 14:18:14 +0100262 /*
263 * Grab the CD offset and size, and the number of entries in the
264 * archive and verify that they look reasonable.
265 */
Tianjie Xu1ee48922016-09-21 14:58:11 -0700266 if (static_cast<off64_t>(eocd->cd_start_offset) + eocd->cd_size > eocd_offset) {
Narayan Kamath926973e2014-06-09 14:18:14 +0100267 ALOGW("Zip: bad offsets (dir %" PRIu32 ", size %" PRIu32 ", eocd %" PRId64 ")",
Jiyong Parkcd997e62017-06-30 17:23:33 +0900268 eocd->cd_start_offset, eocd->cd_size, static_cast<int64_t>(eocd_offset));
Narayan Kamath7462f022013-11-21 13:05:04 +0000269 return kInvalidOffset;
270 }
Narayan Kamath926973e2014-06-09 14:18:14 +0100271 if (eocd->num_records == 0) {
Adam Lesinskib354dce2018-03-01 21:32:13 +0000272#if defined(__ANDROID__)
Narayan Kamath7462f022013-11-21 13:05:04 +0000273 ALOGW("Zip: empty archive?");
Adam Lesinskib354dce2018-03-01 21:32:13 +0000274#endif
Narayan Kamath7462f022013-11-21 13:05:04 +0000275 return kEmptyArchive;
276 }
277
Jiyong Parkcd997e62017-06-30 17:23:33 +0900278 ALOGV("+++ num_entries=%" PRIu32 " dir_size=%" PRIu32 " dir_offset=%" PRIu32, eocd->num_records,
279 eocd->cd_size, eocd->cd_start_offset);
Narayan Kamath7462f022013-11-21 13:05:04 +0000280
281 /*
282 * It all looks good. Create a mapping for the CD, and set the fields
283 * in archive.
284 */
Tianjie Xu18c25922016-09-29 15:27:41 -0700285
Elliott Hughese8f4b142018-10-19 16:09:39 -0700286 if (!archive->InitializeCentralDirectory(static_cast<off64_t>(eocd->cd_start_offset),
Tianjie Xu18c25922016-09-29 15:27:41 -0700287 static_cast<size_t>(eocd->cd_size))) {
288 ALOGE("Zip: failed to intialize central directory.\n");
Narayan Kamatheaf98852013-12-11 14:51:51 +0000289 return kMmapFailed;
Narayan Kamath7462f022013-11-21 13:05:04 +0000290 }
291
Narayan Kamath926973e2014-06-09 14:18:14 +0100292 archive->num_entries = eocd->num_records;
293 archive->directory_offset = eocd->cd_start_offset;
Narayan Kamath7462f022013-11-21 13:05:04 +0000294
295 return 0;
296}
297
298/*
299 * Find the zip Central Directory and memory-map it.
300 *
301 * On success, returns 0 after populating fields from the EOCD area:
302 * directory_offset
Tianjie Xu18c25922016-09-29 15:27:41 -0700303 * directory_ptr
Narayan Kamath7462f022013-11-21 13:05:04 +0000304 * num_entries
305 */
Tianjie Xu18c25922016-09-29 15:27:41 -0700306static int32_t MapCentralDirectory(const char* debug_file_name, ZipArchive* archive) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000307 // Test file length. We use lseek64 to make sure the file
308 // is small enough to be a zip file (Its size must be less than
309 // 0xffffffff bytes).
Tianjie Xu18c25922016-09-29 15:27:41 -0700310 off64_t file_length = archive->mapped_zip.GetFileLength();
Narayan Kamath7462f022013-11-21 13:05:04 +0000311 if (file_length == -1) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000312 return kInvalidFile;
313 }
314
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800315 if (file_length > static_cast<off64_t>(0xffffffff)) {
Narayan Kamath926973e2014-06-09 14:18:14 +0100316 ALOGV("Zip: zip file too long %" PRId64, static_cast<int64_t>(file_length));
Narayan Kamath7462f022013-11-21 13:05:04 +0000317 return kInvalidFile;
318 }
319
Narayan Kamath926973e2014-06-09 14:18:14 +0100320 if (file_length < static_cast<off64_t>(sizeof(EocdRecord))) {
321 ALOGV("Zip: length %" PRId64 " is too small to be zip", static_cast<int64_t>(file_length));
Narayan Kamath7462f022013-11-21 13:05:04 +0000322 return kInvalidFile;
323 }
324
325 /*
326 * Perform the traditional EOCD snipe hunt.
327 *
328 * We're searching for the End of Central Directory magic number,
329 * which appears at the start of the EOCD block. It's followed by
330 * 18 bytes of EOCD stuff and up to 64KB of archive comment. We
331 * need to read the last part of the file into a buffer, dig through
332 * it to find the magic number, parse some values out, and use those
333 * to determine the extent of the CD.
334 *
335 * We start by pulling in the last part of the file.
336 */
Andreas Gampe964b95c2019-04-05 13:48:02 -0700337 uint32_t read_amount = kMaxEOCDSearch;
Narayan Kamath926973e2014-06-09 14:18:14 +0100338 if (file_length < read_amount) {
Andreas Gampe964b95c2019-04-05 13:48:02 -0700339 read_amount = static_cast<uint32_t>(file_length);
Narayan Kamath7462f022013-11-21 13:05:04 +0000340 }
341
Tianjie Xu18c25922016-09-29 15:27:41 -0700342 std::vector<uint8_t> scan_buffer(read_amount);
Jiyong Parkcd997e62017-06-30 17:23:33 +0900343 int32_t result =
344 MapCentralDirectory0(debug_file_name, archive, file_length, read_amount, scan_buffer.data());
Narayan Kamath7462f022013-11-21 13:05:04 +0000345 return result;
346}
347
348/*
349 * Parses the Zip archive's Central Directory. Allocates and populates the
350 * hash table.
351 *
352 * Returns 0 on success.
353 */
354static int32_t ParseZipArchive(ZipArchive* archive) {
Tianjie Xu18c25922016-09-29 15:27:41 -0700355 const uint8_t* const cd_ptr = archive->central_directory.GetBasePtr();
356 const size_t cd_length = archive->central_directory.GetMapLength();
Narayan Kamath926973e2014-06-09 14:18:14 +0100357 const uint16_t num_entries = archive->num_entries;
Narayan Kamath7462f022013-11-21 13:05:04 +0000358
359 /*
360 * Create hash table. We have a minimum 75% load factor, possibly as
361 * low as 50% after we round off to a power of 2. There must be at
362 * least one unused entry to avoid an infinite loop during creation.
363 */
364 archive->hash_table_size = RoundUpPower2(1 + (num_entries * 4) / 3);
Jiyong Parkcd997e62017-06-30 17:23:33 +0900365 archive->hash_table =
Zimuzo5a503ef2018-09-17 19:49:55 +0100366 reinterpret_cast<ZipStringOffset*>(calloc(archive->hash_table_size, sizeof(ZipStringOffset)));
Tianjie Xu9e020e22016-10-10 12:11:30 -0700367 if (archive->hash_table == nullptr) {
368 ALOGW("Zip: unable to allocate the %u-entry hash_table, entry size: %zu",
369 archive->hash_table_size, sizeof(ZipString));
370 return -1;
371 }
Narayan Kamath7462f022013-11-21 13:05:04 +0000372
373 /*
374 * Walk through the central directory, adding entries to the hash
375 * table and verifying values.
376 */
Narayan Kamath926973e2014-06-09 14:18:14 +0100377 const uint8_t* const cd_end = cd_ptr + cd_length;
Narayan Kamath7462f022013-11-21 13:05:04 +0000378 const uint8_t* ptr = cd_ptr;
379 for (uint16_t i = 0; i < num_entries; i++) {
Tianjie Xu0fda1cf2017-04-05 14:46:27 -0700380 if (ptr > cd_end - sizeof(CentralDirectoryRecord)) {
381 ALOGW("Zip: ran off the end (at %" PRIu16 ")", i);
382#if defined(__ANDROID__)
383 android_errorWriteLog(0x534e4554, "36392138");
384#endif
385 return -1;
386 }
387
Jiyong Parkcd997e62017-06-30 17:23:33 +0900388 const CentralDirectoryRecord* cdr = reinterpret_cast<const CentralDirectoryRecord*>(ptr);
Narayan Kamath926973e2014-06-09 14:18:14 +0100389 if (cdr->record_signature != CentralDirectoryRecord::kSignature) {
Mark Salyzyn088bf902014-05-08 16:02:20 -0700390 ALOGW("Zip: missed a central dir sig (at %" PRIu16 ")", i);
Dmitriy Ivanov3ea93da2015-03-06 11:48:47 -0800391 return -1;
Narayan Kamath7462f022013-11-21 13:05:04 +0000392 }
393
Narayan Kamath926973e2014-06-09 14:18:14 +0100394 const off64_t local_header_offset = cdr->local_file_header_offset;
Narayan Kamath7462f022013-11-21 13:05:04 +0000395 if (local_header_offset >= archive->directory_offset) {
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800396 ALOGW("Zip: bad LFH offset %" PRId64 " at entry %" PRIu16,
Jiyong Parkcd997e62017-06-30 17:23:33 +0900397 static_cast<int64_t>(local_header_offset), i);
Dmitriy Ivanov3ea93da2015-03-06 11:48:47 -0800398 return -1;
Narayan Kamath7462f022013-11-21 13:05:04 +0000399 }
400
Narayan Kamath926973e2014-06-09 14:18:14 +0100401 const uint16_t file_name_length = cdr->file_name_length;
402 const uint16_t extra_length = cdr->extra_field_length;
403 const uint16_t comment_length = cdr->comment_length;
Piotr Jastrzebski78271ba2014-08-15 12:53:00 +0100404 const uint8_t* file_name = ptr + sizeof(CentralDirectoryRecord);
405
Tianjie Xu9e020e22016-10-10 12:11:30 -0700406 if (file_name + file_name_length > cd_end) {
Jiyong Parkcd997e62017-06-30 17:23:33 +0900407 ALOGW(
408 "Zip: file name boundary exceeds the central directory range, file_name_length: "
409 "%" PRIx16 ", cd_length: %zu",
410 file_name_length, cd_length);
Tianjie Xu9e020e22016-10-10 12:11:30 -0700411 return -1;
412 }
Narayan Kamath044bc8e2014-12-03 18:22:53 +0000413 /* check that file name is valid UTF-8 and doesn't contain NUL (U+0000) characters */
414 if (!IsValidEntryName(file_name, file_name_length)) {
Dmitriy Ivanov3ea93da2015-03-06 11:48:47 -0800415 return -1;
Piotr Jastrzebski78271ba2014-08-15 12:53:00 +0100416 }
Narayan Kamath7462f022013-11-21 13:05:04 +0000417
418 /* add the CDE filename to the hash table */
Yusuke Sato07447542015-06-25 14:39:19 -0700419 ZipString entry_name;
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100420 entry_name.name = file_name;
421 entry_name.name_length = file_name_length;
Zimuzo5a503ef2018-09-17 19:49:55 +0100422 const int add_result = AddToHash(archive->hash_table, archive->hash_table_size, entry_name,
423 archive->central_directory.GetBasePtr());
Dmitriy Ivanov3ea93da2015-03-06 11:48:47 -0800424 if (add_result != 0) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000425 ALOGW("Zip: Error adding entry to hash table %d", add_result);
Dmitriy Ivanov3ea93da2015-03-06 11:48:47 -0800426 return add_result;
Narayan Kamath7462f022013-11-21 13:05:04 +0000427 }
428
Narayan Kamath926973e2014-06-09 14:18:14 +0100429 ptr += sizeof(CentralDirectoryRecord) + file_name_length + extra_length + comment_length;
430 if ((ptr - cd_ptr) > static_cast<int64_t>(cd_length)) {
Jiyong Parkcd997e62017-06-30 17:23:33 +0900431 ALOGW("Zip: bad CD advance (%tu vs %zu) at entry %" PRIu16, ptr - cd_ptr, cd_length, i);
Dmitriy Ivanov3ea93da2015-03-06 11:48:47 -0800432 return -1;
Narayan Kamath7462f022013-11-21 13:05:04 +0000433 }
434 }
Narayan Kamathc1a56dc2017-08-09 18:32:09 +0100435
436 uint32_t lfh_start_bytes;
437 if (!archive->mapped_zip.ReadAtOffset(reinterpret_cast<uint8_t*>(&lfh_start_bytes),
438 sizeof(uint32_t), 0)) {
439 ALOGW("Zip: Unable to read header for entry at offset == 0.");
440 return -1;
441 }
442
443 if (lfh_start_bytes != LocalFileHeader::kSignature) {
444 ALOGW("Zip: Entry at offset zero has invalid LFH signature %" PRIx32, lfh_start_bytes);
445#if defined(__ANDROID__)
446 android_errorWriteLog(0x534e4554, "64211847");
447#endif
448 return -1;
449 }
450
Mark Salyzyn088bf902014-05-08 16:02:20 -0700451 ALOGV("+++ zip good scan %" PRIu16 " entries", num_entries);
Narayan Kamath7462f022013-11-21 13:05:04 +0000452
Dmitriy Ivanov3ea93da2015-03-06 11:48:47 -0800453 return 0;
Narayan Kamath7462f022013-11-21 13:05:04 +0000454}
455
Jiyong Parkcd997e62017-06-30 17:23:33 +0900456static int32_t OpenArchiveInternal(ZipArchive* archive, const char* debug_file_name) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000457 int32_t result = -1;
Tianjie Xu18c25922016-09-29 15:27:41 -0700458 if ((result = MapCentralDirectory(debug_file_name, archive)) != 0) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000459 return result;
460 }
461
462 if ((result = ParseZipArchive(archive))) {
463 return result;
464 }
465
466 return 0;
467}
468
Jiyong Parkcd997e62017-06-30 17:23:33 +0900469int32_t OpenArchiveFd(int fd, const char* debug_file_name, ZipArchiveHandle* handle,
470 bool assume_ownership) {
Dmitriy Ivanov40b52b22014-07-15 19:33:00 -0700471 ZipArchive* archive = new ZipArchive(fd, assume_ownership);
Narayan Kamath7462f022013-11-21 13:05:04 +0000472 *handle = archive;
Narayan Kamath7462f022013-11-21 13:05:04 +0000473 return OpenArchiveInternal(archive, debug_file_name);
474}
475
476int32_t OpenArchive(const char* fileName, ZipArchiveHandle* handle) {
Nick Kralevich3bdf7442018-12-18 12:48:06 -0800477 const int fd = ::android::base::utf8::open(fileName, O_RDONLY | O_BINARY | O_CLOEXEC, 0);
Dmitriy Ivanov40b52b22014-07-15 19:33:00 -0700478 ZipArchive* archive = new ZipArchive(fd, true);
Narayan Kamath7462f022013-11-21 13:05:04 +0000479 *handle = archive;
480
Narayan Kamath7462f022013-11-21 13:05:04 +0000481 if (fd < 0) {
482 ALOGW("Unable to open '%s': %s", fileName, strerror(errno));
483 return kIoError;
Narayan Kamath7462f022013-11-21 13:05:04 +0000484 }
Dmitriy Ivanov40b52b22014-07-15 19:33:00 -0700485
Narayan Kamath7462f022013-11-21 13:05:04 +0000486 return OpenArchiveInternal(archive, fileName);
487}
488
Tianjie Xu18c25922016-09-29 15:27:41 -0700489int32_t OpenArchiveFromMemory(void* address, size_t length, const char* debug_file_name,
Jiyong Parkcd997e62017-06-30 17:23:33 +0900490 ZipArchiveHandle* handle) {
Tianjie Xu18c25922016-09-29 15:27:41 -0700491 ZipArchive* archive = new ZipArchive(address, length);
492 *handle = archive;
493 return OpenArchiveInternal(archive, debug_file_name);
494}
495
Narayan Kamath7462f022013-11-21 13:05:04 +0000496/*
497 * Close a ZipArchive, closing the file and freeing the contents.
498 */
Ryan Prichard3673f992018-10-10 22:41:14 -0700499void CloseArchive(ZipArchiveHandle archive) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000500 ALOGV("Closing archive %p", archive);
Neil Fullerb1a113f2014-07-25 14:43:04 +0100501 delete archive;
Narayan Kamath7462f022013-11-21 13:05:04 +0000502}
503
Narayan Kamath162b7052017-06-05 13:21:12 +0100504static int32_t ValidateDataDescriptor(MappedZipFile& mapped_zip, ZipEntry* entry) {
Narayan Kamath926973e2014-06-09 14:18:14 +0100505 uint8_t ddBuf[sizeof(DataDescriptor) + sizeof(DataDescriptor::kOptSignature)];
Adam Lesinskide117e42017-06-19 10:27:38 -0700506 off64_t offset = entry->offset;
507 if (entry->method != kCompressStored) {
508 offset += entry->compressed_length;
509 } else {
510 offset += entry->uncompressed_length;
511 }
512
513 if (!mapped_zip.ReadAtOffset(ddBuf, sizeof(ddBuf), offset)) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000514 return kIoError;
515 }
516
Narayan Kamath926973e2014-06-09 14:18:14 +0100517 const uint32_t ddSignature = *(reinterpret_cast<const uint32_t*>(ddBuf));
Adam Lesinskide117e42017-06-19 10:27:38 -0700518 const uint16_t ddOffset = (ddSignature == DataDescriptor::kOptSignature) ? 4 : 0;
519 const DataDescriptor* descriptor = reinterpret_cast<const DataDescriptor*>(ddBuf + ddOffset);
Narayan Kamath7462f022013-11-21 13:05:04 +0000520
Narayan Kamath162b7052017-06-05 13:21:12 +0100521 // Validate that the values in the data descriptor match those in the central
522 // directory.
523 if (entry->compressed_length != descriptor->compressed_size ||
524 entry->uncompressed_length != descriptor->uncompressed_size ||
525 entry->crc32 != descriptor->crc32) {
526 ALOGW("Zip: size/crc32 mismatch. expected {%" PRIu32 ", %" PRIu32 ", %" PRIx32
527 "}, was {%" PRIu32 ", %" PRIu32 ", %" PRIx32 "}",
528 entry->compressed_length, entry->uncompressed_length, entry->crc32,
529 descriptor->compressed_size, descriptor->uncompressed_size, descriptor->crc32);
530 return kInconsistentInformation;
531 }
Narayan Kamath7462f022013-11-21 13:05:04 +0000532
533 return 0;
534}
535
Andreas Gampe964b95c2019-04-05 13:48:02 -0700536static int32_t FindEntry(const ZipArchive* archive, const int32_t ent, ZipEntry* data) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000537 const uint16_t nameLen = archive->hash_table[ent].name_length;
Narayan Kamath7462f022013-11-21 13:05:04 +0000538
539 // Recover the start of the central directory entry from the filename
540 // pointer. The filename is the first entry past the fixed-size data,
541 // so we can just subtract back from that.
Zimuzo5a503ef2018-09-17 19:49:55 +0100542 const ZipString from_offset =
543 archive->hash_table[ent].GetZipString(archive->central_directory.GetBasePtr());
544 const uint8_t* ptr = from_offset.name;
Narayan Kamath926973e2014-06-09 14:18:14 +0100545 ptr -= sizeof(CentralDirectoryRecord);
Narayan Kamath7462f022013-11-21 13:05:04 +0000546
547 // This is the base of our mmapped region, we have to sanity check that
548 // the name that's in the hash table is a pointer to a location within
549 // this mapped region.
Tianjie Xu18c25922016-09-29 15:27:41 -0700550 const uint8_t* base_ptr = archive->central_directory.GetBasePtr();
551 if (ptr < base_ptr || ptr > base_ptr + archive->central_directory.GetMapLength()) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000552 ALOGW("Zip: Invalid entry pointer");
553 return kInvalidOffset;
554 }
555
Jiyong Parkcd997e62017-06-30 17:23:33 +0900556 const CentralDirectoryRecord* cdr = reinterpret_cast<const CentralDirectoryRecord*>(ptr);
Narayan Kamath926973e2014-06-09 14:18:14 +0100557
Narayan Kamath7462f022013-11-21 13:05:04 +0000558 // The offset of the start of the central directory in the zipfile.
559 // We keep this lying around so that we can sanity check all our lengths
560 // and our per-file structures.
561 const off64_t cd_offset = archive->directory_offset;
562
563 // Fill out the compression method, modification time, crc32
564 // and other interesting attributes from the central directory. These
565 // will later be compared against values from the local file header.
Narayan Kamath926973e2014-06-09 14:18:14 +0100566 data->method = cdr->compression_method;
beonit0e99a2f2015-07-18 02:08:16 +0900567 data->mod_time = cdr->last_mod_date << 16 | cdr->last_mod_time;
Narayan Kamath926973e2014-06-09 14:18:14 +0100568 data->crc32 = cdr->crc32;
569 data->compressed_length = cdr->compressed_size;
570 data->uncompressed_length = cdr->uncompressed_size;
Narayan Kamath7462f022013-11-21 13:05:04 +0000571
572 // Figure out the local header offset from the central directory. The
573 // actual file data will begin after the local header and the name /
574 // extra comments.
Narayan Kamath926973e2014-06-09 14:18:14 +0100575 const off64_t local_header_offset = cdr->local_file_header_offset;
576 if (local_header_offset + static_cast<off64_t>(sizeof(LocalFileHeader)) >= cd_offset) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000577 ALOGW("Zip: bad local hdr offset in zip");
578 return kInvalidOffset;
579 }
580
Narayan Kamath926973e2014-06-09 14:18:14 +0100581 uint8_t lfh_buf[sizeof(LocalFileHeader)];
Tianjie Xu18c25922016-09-29 15:27:41 -0700582 if (!archive->mapped_zip.ReadAtOffset(lfh_buf, sizeof(lfh_buf), local_header_offset)) {
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800583 ALOGW("Zip: failed reading lfh name from offset %" PRId64,
Jiyong Parkcd997e62017-06-30 17:23:33 +0900584 static_cast<int64_t>(local_header_offset));
Narayan Kamath7462f022013-11-21 13:05:04 +0000585 return kIoError;
586 }
587
Jiyong Parkcd997e62017-06-30 17:23:33 +0900588 const LocalFileHeader* lfh = reinterpret_cast<const LocalFileHeader*>(lfh_buf);
Narayan Kamath926973e2014-06-09 14:18:14 +0100589
590 if (lfh->lfh_signature != LocalFileHeader::kSignature) {
Mark Salyzyn99ef9912014-03-14 14:26:22 -0700591 ALOGW("Zip: didn't find signature at start of lfh, offset=%" PRId64,
Jiyong Parkcd997e62017-06-30 17:23:33 +0900592 static_cast<int64_t>(local_header_offset));
Narayan Kamath7462f022013-11-21 13:05:04 +0000593 return kInvalidOffset;
594 }
595
596 // Paranoia: Match the values specified in the local file header
597 // to those specified in the central directory.
Adam Lesinskid987c9d2017-04-06 18:55:47 -0700598
Narayan Kamath162b7052017-06-05 13:21:12 +0100599 // Warn if central directory and local file header don't agree on the use
600 // of a trailing Data Descriptor. The reference implementation is inconsistent
601 // and appears to use the LFH value during extraction (unzip) but the CD value
602 // while displayng information about archives (zipinfo). The spec remains
603 // silent on this inconsistency as well.
604 //
605 // For now, always use the version from the LFH but make sure that the values
606 // specified in the central directory match those in the data descriptor.
607 //
608 // NOTE: It's also worth noting that unzip *does* warn about inconsistencies in
609 // bit 11 (EFS: The language encoding flag, marking that filename and comment are
610 // encoded using UTF-8). This implementation does not check for the presence of
611 // that flag and always enforces that entry names are valid UTF-8.
612 if ((lfh->gpb_flags & kGPBDDFlagMask) != (cdr->gpb_flags & kGPBDDFlagMask)) {
613 ALOGW("Zip: gpb flag mismatch at bit 3. expected {%04" PRIx16 "}, was {%04" PRIx16 "}",
Adam Lesinskid987c9d2017-04-06 18:55:47 -0700614 cdr->gpb_flags, lfh->gpb_flags);
Adam Lesinskid987c9d2017-04-06 18:55:47 -0700615 }
616
617 // If there is no trailing data descriptor, verify that the central directory and local file
618 // header agree on the crc, compressed, and uncompressed sizes of the entry.
Narayan Kamath926973e2014-06-09 14:18:14 +0100619 if ((lfh->gpb_flags & kGPBDDFlagMask) == 0) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000620 data->has_data_descriptor = 0;
Jiyong Parkcd997e62017-06-30 17:23:33 +0900621 if (data->compressed_length != lfh->compressed_size ||
622 data->uncompressed_length != lfh->uncompressed_size || data->crc32 != lfh->crc32) {
623 ALOGW("Zip: size/crc32 mismatch. expected {%" PRIu32 ", %" PRIu32 ", %" PRIx32
624 "}, was {%" PRIu32 ", %" PRIu32 ", %" PRIx32 "}",
625 data->compressed_length, data->uncompressed_length, data->crc32, lfh->compressed_size,
626 lfh->uncompressed_size, lfh->crc32);
Narayan Kamath7462f022013-11-21 13:05:04 +0000627 return kInconsistentInformation;
628 }
629 } else {
630 data->has_data_descriptor = 1;
631 }
632
Elliott Hughes55fd2932017-05-28 22:59:04 -0700633 // 4.4.2.1: the upper byte of `version_made_by` gives the source OS. Unix is 3.
634 if ((cdr->version_made_by >> 8) == 3) {
635 data->unix_mode = (cdr->external_file_attributes >> 16) & 0xffff;
636 } else {
637 data->unix_mode = 0777;
638 }
639
Narayan Kamath7462f022013-11-21 13:05:04 +0000640 // Check that the local file header name matches the declared
641 // name in the central directory.
Narayan Kamath926973e2014-06-09 14:18:14 +0100642 if (lfh->file_name_length == nameLen) {
643 const off64_t name_offset = local_header_offset + sizeof(LocalFileHeader);
Mykola Kondratenko50afc152014-09-08 12:46:37 +0200644 if (name_offset + lfh->file_name_length > cd_offset) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000645 ALOGW("Zip: Invalid declared length");
646 return kInvalidOffset;
647 }
648
Tianjie Xu18c25922016-09-29 15:27:41 -0700649 std::vector<uint8_t> name_buf(nameLen);
650 if (!archive->mapped_zip.ReadAtOffset(name_buf.data(), nameLen, name_offset)) {
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800651 ALOGW("Zip: failed reading lfh name from offset %" PRId64, static_cast<int64_t>(name_offset));
Narayan Kamath7462f022013-11-21 13:05:04 +0000652 return kIoError;
653 }
Zimuzo5a503ef2018-09-17 19:49:55 +0100654 const ZipString from_offset =
655 archive->hash_table[ent].GetZipString(archive->central_directory.GetBasePtr());
656 if (memcmp(from_offset.name, name_buf.data(), nameLen)) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000657 return kInconsistentInformation;
658 }
659
Narayan Kamath7462f022013-11-21 13:05:04 +0000660 } else {
661 ALOGW("Zip: lfh name did not match central directory.");
662 return kInconsistentInformation;
663 }
664
Jiyong Parkcd997e62017-06-30 17:23:33 +0900665 const off64_t data_offset = local_header_offset + sizeof(LocalFileHeader) +
666 lfh->file_name_length + lfh->extra_field_length;
Narayan Kamath48953a12014-01-24 12:32:39 +0000667 if (data_offset > cd_offset) {
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800668 ALOGW("Zip: bad data offset %" PRId64 " in zip", static_cast<int64_t>(data_offset));
Narayan Kamath7462f022013-11-21 13:05:04 +0000669 return kInvalidOffset;
670 }
671
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800672 if (static_cast<off64_t>(data_offset + data->compressed_length) > cd_offset) {
Mark Salyzyn088bf902014-05-08 16:02:20 -0700673 ALOGW("Zip: bad compressed length in zip (%" PRId64 " + %" PRIu32 " > %" PRId64 ")",
Jiyong Parkcd997e62017-06-30 17:23:33 +0900674 static_cast<int64_t>(data_offset), data->compressed_length,
675 static_cast<int64_t>(cd_offset));
Narayan Kamath7462f022013-11-21 13:05:04 +0000676 return kInvalidOffset;
677 }
678
679 if (data->method == kCompressStored &&
Jiyong Parkcd997e62017-06-30 17:23:33 +0900680 static_cast<off64_t>(data_offset + data->uncompressed_length) > cd_offset) {
681 ALOGW("Zip: bad uncompressed length in zip (%" PRId64 " + %" PRIu32 " > %" PRId64 ")",
682 static_cast<int64_t>(data_offset), data->uncompressed_length,
683 static_cast<int64_t>(cd_offset));
684 return kInvalidOffset;
Narayan Kamath7462f022013-11-21 13:05:04 +0000685 }
686
687 data->offset = data_offset;
688 return 0;
689}
690
691struct IterationHandle {
692 uint32_t position;
Elliott Hughesb17bf522019-05-03 22:38:44 -0700693 // TODO: switch these to std::string now that Windows uses libc++ too.
Yusuke Sato07447542015-06-25 14:39:19 -0700694 ZipString prefix;
695 ZipString suffix;
Narayan Kamath7462f022013-11-21 13:05:04 +0000696 ZipArchive* archive;
Piotr Jastrzebski8e085362014-08-18 11:37:45 +0100697
Jiyong Parkcd997e62017-06-30 17:23:33 +0900698 IterationHandle(const ZipString* in_prefix, const ZipString* in_suffix) {
Yusuke Sato07447542015-06-25 14:39:19 -0700699 if (in_prefix) {
700 uint8_t* name_copy = new uint8_t[in_prefix->name_length];
701 memcpy(name_copy, in_prefix->name, in_prefix->name_length);
702 prefix.name = name_copy;
703 prefix.name_length = in_prefix->name_length;
704 } else {
705 prefix.name = NULL;
706 prefix.name_length = 0;
Yusuke Satof1d3d3b2015-06-25 14:09:00 -0700707 }
Yusuke Sato07447542015-06-25 14:39:19 -0700708 if (in_suffix) {
709 uint8_t* name_copy = new uint8_t[in_suffix->name_length];
710 memcpy(name_copy, in_suffix->name, in_suffix->name_length);
711 suffix.name = name_copy;
712 suffix.name_length = in_suffix->name_length;
713 } else {
714 suffix.name = NULL;
715 suffix.name_length = 0;
Yusuke Satof1d3d3b2015-06-25 14:09:00 -0700716 }
Piotr Jastrzebski8e085362014-08-18 11:37:45 +0100717 }
718
719 ~IterationHandle() {
Yusuke Sato07447542015-06-25 14:39:19 -0700720 delete[] prefix.name;
721 delete[] suffix.name;
Piotr Jastrzebski8e085362014-08-18 11:37:45 +0100722 }
Narayan Kamath7462f022013-11-21 13:05:04 +0000723};
724
Ryan Prichard3673f992018-10-10 22:41:14 -0700725int32_t StartIteration(ZipArchiveHandle archive, void** cookie_ptr,
726 const ZipString* optional_prefix, const ZipString* optional_suffix) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000727 if (archive == NULL || archive->hash_table == NULL) {
728 ALOGW("Zip: Invalid ZipArchiveHandle");
729 return kInvalidHandle;
730 }
731
Yusuke Satof1d3d3b2015-06-25 14:09:00 -0700732 IterationHandle* cookie = new IterationHandle(optional_prefix, optional_suffix);
Narayan Kamath7462f022013-11-21 13:05:04 +0000733 cookie->position = 0;
Narayan Kamath7462f022013-11-21 13:05:04 +0000734 cookie->archive = archive;
Narayan Kamath7462f022013-11-21 13:05:04 +0000735
Jiyong Parkcd997e62017-06-30 17:23:33 +0900736 *cookie_ptr = cookie;
Narayan Kamath7462f022013-11-21 13:05:04 +0000737 return 0;
738}
739
Piotr Jastrzebski79c8b342014-08-08 14:02:17 +0100740void EndIteration(void* cookie) {
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100741 delete reinterpret_cast<IterationHandle*>(cookie);
Piotr Jastrzebski79c8b342014-08-08 14:02:17 +0100742}
743
Elliott Hughesb17bf522019-05-03 22:38:44 -0700744// TODO: remove this internally.
Ryan Prichard3673f992018-10-10 22:41:14 -0700745int32_t FindEntry(const ZipArchiveHandle archive, const ZipString& entryName, ZipEntry* data) {
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100746 if (entryName.name_length == 0) {
747 ALOGW("Zip: Invalid filename %.*s", entryName.name_length, entryName.name);
Narayan Kamath7462f022013-11-21 13:05:04 +0000748 return kInvalidEntryName;
749 }
750
Zimuzo5a503ef2018-09-17 19:49:55 +0100751 const int64_t ent = EntryToIndex(archive->hash_table, archive->hash_table_size, entryName,
752 archive->central_directory.GetBasePtr());
Narayan Kamath7462f022013-11-21 13:05:04 +0000753 if (ent < 0) {
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100754 ALOGV("Zip: Could not find entry %.*s", entryName.name_length, entryName.name);
Andreas Gampe964b95c2019-04-05 13:48:02 -0700755 return static_cast<int32_t>(ent); // kEntryNotFound is safe to truncate.
Narayan Kamath7462f022013-11-21 13:05:04 +0000756 }
Andreas Gampe964b95c2019-04-05 13:48:02 -0700757 // We know there are at most hast_table_size entries, safe to truncate.
758 return FindEntry(archive, static_cast<uint32_t>(ent), data);
Narayan Kamath7462f022013-11-21 13:05:04 +0000759}
760
Elliott Hughesb17bf522019-05-03 22:38:44 -0700761int32_t FindEntry(const ZipArchiveHandle archive, const std::string_view entryName,
762 ZipEntry* data) {
763 if (entryName.empty() || entryName.size() > static_cast<size_t>(UINT16_MAX)) {
764 ALOGW("Zip: Invalid filename of length %zu", entryName.size());
765 return kInvalidEntryName;
766 }
767
768 const int64_t ent = EntryToIndex(archive->hash_table, archive->hash_table_size,
769 ZipString(entryName), archive->central_directory.GetBasePtr());
770 if (ent < 0) {
771 ALOGV("Zip: Could not find entry %.*s", static_cast<int>(entryName.size()), entryName.data());
772 return static_cast<int32_t>(ent); // kEntryNotFound is safe to truncate.
773 }
774 // We know there are at most hast_table_size entries, safe to truncate.
775 return FindEntry(archive, static_cast<uint32_t>(ent), data);
776}
777
Yusuke Sato07447542015-06-25 14:39:19 -0700778int32_t Next(void* cookie, ZipEntry* data, ZipString* name) {
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800779 IterationHandle* handle = reinterpret_cast<IterationHandle*>(cookie);
Narayan Kamath7462f022013-11-21 13:05:04 +0000780 if (handle == NULL) {
Zimuzo5a503ef2018-09-17 19:49:55 +0100781 ALOGW("Zip: Null ZipArchiveHandle");
Narayan Kamath7462f022013-11-21 13:05:04 +0000782 return kInvalidHandle;
783 }
784
785 ZipArchive* archive = handle->archive;
786 if (archive == NULL || archive->hash_table == NULL) {
787 ALOGW("Zip: Invalid ZipArchiveHandle");
788 return kInvalidHandle;
789 }
790
791 const uint32_t currentOffset = handle->position;
792 const uint32_t hash_table_length = archive->hash_table_size;
Zimuzo5a503ef2018-09-17 19:49:55 +0100793 const ZipStringOffset* hash_table = archive->hash_table;
Narayan Kamath7462f022013-11-21 13:05:04 +0000794 for (uint32_t i = currentOffset; i < hash_table_length; ++i) {
Zimuzo5a503ef2018-09-17 19:49:55 +0100795 const ZipString from_offset =
796 hash_table[i].GetZipString(archive->central_directory.GetBasePtr());
797 if (hash_table[i].name_offset != 0 &&
798 (handle->prefix.name_length == 0 || from_offset.StartsWith(handle->prefix)) &&
799 (handle->suffix.name_length == 0 || from_offset.EndsWith(handle->suffix))) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000800 handle->position = (i + 1);
801 const int error = FindEntry(archive, i, data);
802 if (!error) {
Zimuzo5a503ef2018-09-17 19:49:55 +0100803 name->name = from_offset.name;
Narayan Kamath7462f022013-11-21 13:05:04 +0000804 name->name_length = hash_table[i].name_length;
805 }
Narayan Kamath7462f022013-11-21 13:05:04 +0000806 return error;
807 }
808 }
809
810 handle->position = 0;
811 return kIterationEnd;
812}
813
Narayan Kamathf899bd52015-04-17 11:53:14 +0100814// A Writer that writes data to a fixed size memory region.
815// The size of the memory region must be equal to the total size of
816// the data appended to it.
Narayan Kamath485b3642017-10-26 14:42:39 +0100817class MemoryWriter : public zip_archive::Writer {
Narayan Kamathf899bd52015-04-17 11:53:14 +0100818 public:
Jiyong Parkcd997e62017-06-30 17:23:33 +0900819 MemoryWriter(uint8_t* buf, size_t size) : Writer(), buf_(buf), size_(size), bytes_written_(0) {}
Narayan Kamathf899bd52015-04-17 11:53:14 +0100820
821 virtual bool Append(uint8_t* buf, size_t buf_size) override {
822 if (bytes_written_ + buf_size > size_) {
Elliott Hughese8f4b142018-10-19 16:09:39 -0700823 ALOGW("Zip: Unexpected size %zu (declared) vs %zu (actual)", size_,
Jiyong Parkcd997e62017-06-30 17:23:33 +0900824 bytes_written_ + buf_size);
Narayan Kamathf899bd52015-04-17 11:53:14 +0100825 return false;
826 }
827
828 memcpy(buf_ + bytes_written_, buf, buf_size);
829 bytes_written_ += buf_size;
830 return true;
831 }
832
833 private:
834 uint8_t* const buf_;
835 const size_t size_;
836 size_t bytes_written_;
837};
838
839// A Writer that appends data to a file |fd| at its current position.
840// The file will be truncated to the end of the written data.
Narayan Kamath485b3642017-10-26 14:42:39 +0100841class FileWriter : public zip_archive::Writer {
Narayan Kamathf899bd52015-04-17 11:53:14 +0100842 public:
Narayan Kamathf899bd52015-04-17 11:53:14 +0100843 // Creates a FileWriter for |fd| and prepare to write |entry| to it,
844 // guaranteeing that the file descriptor is valid and that there's enough
845 // space on the volume to write out the entry completely and that the file
Tao Baoa456c212016-11-15 10:08:07 -0800846 // is truncated to the correct length (no truncation if |fd| references a
847 // block device).
Narayan Kamathf899bd52015-04-17 11:53:14 +0100848 //
849 // Returns a valid FileWriter on success, |nullptr| if an error occurred.
Yurii Zubrytskyi834326c2017-12-20 01:01:01 -0800850 static FileWriter Create(int fd, const ZipEntry* entry) {
Narayan Kamathf899bd52015-04-17 11:53:14 +0100851 const uint32_t declared_length = entry->uncompressed_length;
852 const off64_t current_offset = lseek64(fd, 0, SEEK_CUR);
853 if (current_offset == -1) {
854 ALOGW("Zip: unable to seek to current location on fd %d: %s", fd, strerror(errno));
Yurii Zubrytskyi834326c2017-12-20 01:01:01 -0800855 return FileWriter{};
Narayan Kamathf899bd52015-04-17 11:53:14 +0100856 }
857
Narayan Kamathf899bd52015-04-17 11:53:14 +0100858#if defined(__linux__)
859 if (declared_length > 0) {
860 // Make sure we have enough space on the volume to extract the compressed
861 // entry. Note that the call to ftruncate below will change the file size but
862 // will not allocate space on disk and this call to fallocate will not
863 // change the file size.
Badhri Jagan Sridharana68d0d12015-06-02 14:47:57 -0700864 // Note: fallocate is only supported by the following filesystems -
865 // btrfs, ext4, ocfs2, and xfs. Therefore fallocate might fail with
866 // EOPNOTSUPP error when issued in other filesystems.
867 // Hence, check for the return error code before concluding that the
868 // disk does not have enough space.
Andreas Gampe964b95c2019-04-05 13:48:02 -0700869 long result = TEMP_FAILURE_RETRY(fallocate(fd, 0, current_offset, declared_length));
Badhri Jagan Sridharana68d0d12015-06-02 14:47:57 -0700870 if (result == -1 && errno == ENOSPC) {
Elliott Hughes4089d342017-10-27 14:21:12 -0700871 ALOGW("Zip: unable to allocate %" PRId64 " bytes at offset %" PRId64 ": %s",
Narayan Kamathd5d7abe2016-08-10 12:24:05 +0100872 static_cast<int64_t>(declared_length), static_cast<int64_t>(current_offset),
873 strerror(errno));
Yurii Zubrytskyi834326c2017-12-20 01:01:01 -0800874 return FileWriter{};
Narayan Kamathf899bd52015-04-17 11:53:14 +0100875 }
876 }
877#endif // __linux__
878
Tao Baoa456c212016-11-15 10:08:07 -0800879 struct stat sb;
880 if (fstat(fd, &sb) == -1) {
881 ALOGW("Zip: unable to fstat file: %s", strerror(errno));
Yurii Zubrytskyi834326c2017-12-20 01:01:01 -0800882 return FileWriter{};
Narayan Kamathf899bd52015-04-17 11:53:14 +0100883 }
884
Tao Baoa456c212016-11-15 10:08:07 -0800885 // Block device doesn't support ftruncate(2).
886 if (!S_ISBLK(sb.st_mode)) {
Andreas Gampe964b95c2019-04-05 13:48:02 -0700887 long result = TEMP_FAILURE_RETRY(ftruncate(fd, declared_length + current_offset));
Tao Baoa456c212016-11-15 10:08:07 -0800888 if (result == -1) {
889 ALOGW("Zip: unable to truncate file to %" PRId64 ": %s",
890 static_cast<int64_t>(declared_length + current_offset), strerror(errno));
Yurii Zubrytskyi834326c2017-12-20 01:01:01 -0800891 return FileWriter{};
Tao Baoa456c212016-11-15 10:08:07 -0800892 }
893 }
894
Yurii Zubrytskyi834326c2017-12-20 01:01:01 -0800895 return FileWriter(fd, declared_length);
Narayan Kamathf899bd52015-04-17 11:53:14 +0100896 }
897
Chih-Hung Hsieh747eb142018-09-25 11:16:22 -0700898 FileWriter(FileWriter&& other) noexcept
Yurii Zubrytskyi834326c2017-12-20 01:01:01 -0800899 : fd_(other.fd_),
900 declared_length_(other.declared_length_),
901 total_bytes_written_(other.total_bytes_written_) {
902 other.fd_ = -1;
903 }
904
905 bool IsValid() const { return fd_ != -1; }
906
Narayan Kamathf899bd52015-04-17 11:53:14 +0100907 virtual bool Append(uint8_t* buf, size_t buf_size) override {
908 if (total_bytes_written_ + buf_size > declared_length_) {
Elliott Hughese8f4b142018-10-19 16:09:39 -0700909 ALOGW("Zip: Unexpected size %zu (declared) vs %zu (actual)", declared_length_,
Jiyong Parkcd997e62017-06-30 17:23:33 +0900910 total_bytes_written_ + buf_size);
Narayan Kamathf899bd52015-04-17 11:53:14 +0100911 return false;
912 }
913
Narayan Kamathe97e66e2015-04-27 16:25:53 +0100914 const bool result = android::base::WriteFully(fd_, buf, buf_size);
915 if (result) {
916 total_bytes_written_ += buf_size;
917 } else {
Elliott Hughese8f4b142018-10-19 16:09:39 -0700918 ALOGW("Zip: unable to write %zu bytes to file; %s", buf_size, strerror(errno));
Narayan Kamathf899bd52015-04-17 11:53:14 +0100919 }
920
Narayan Kamathe97e66e2015-04-27 16:25:53 +0100921 return result;
Narayan Kamathf899bd52015-04-17 11:53:14 +0100922 }
Jiyong Parkcd997e62017-06-30 17:23:33 +0900923
Narayan Kamathf899bd52015-04-17 11:53:14 +0100924 private:
Yurii Zubrytskyi834326c2017-12-20 01:01:01 -0800925 explicit FileWriter(const int fd = -1, const size_t declared_length = 0)
Jiyong Parkcd997e62017-06-30 17:23:33 +0900926 : Writer(), fd_(fd), declared_length_(declared_length), total_bytes_written_(0) {}
Narayan Kamathf899bd52015-04-17 11:53:14 +0100927
Yurii Zubrytskyi834326c2017-12-20 01:01:01 -0800928 int fd_;
Narayan Kamathf899bd52015-04-17 11:53:14 +0100929 const size_t declared_length_;
930 size_t total_bytes_written_;
931};
932
Narayan Kamath485b3642017-10-26 14:42:39 +0100933class EntryReader : public zip_archive::Reader {
Narayan Kamath8b8faed2017-10-26 14:08:38 +0100934 public:
935 EntryReader(const MappedZipFile& zip_file, const ZipEntry* entry)
936 : Reader(), zip_file_(zip_file), entry_(entry) {}
937
938 virtual bool ReadAtOffset(uint8_t* buf, size_t len, uint32_t offset) const {
939 return zip_file_.ReadAtOffset(buf, len, entry_->offset + offset);
940 }
941
942 virtual ~EntryReader() {}
943
944 private:
945 const MappedZipFile& zip_file_;
946 const ZipEntry* entry_;
947};
948
Dmitriy Ivanovf94e1592015-03-06 13:27:59 -0800949// This method is using libz macros with old-style-casts
950#pragma GCC diagnostic push
951#pragma GCC diagnostic ignored "-Wold-style-cast"
952static inline int zlib_inflateInit2(z_stream* stream, int window_bits) {
953 return inflateInit2(stream, window_bits);
954}
955#pragma GCC diagnostic pop
956
Narayan Kamath485b3642017-10-26 14:42:39 +0100957namespace zip_archive {
958
959// Moved out of line to avoid -Wweak-vtables.
960Reader::~Reader() {}
961Writer::~Writer() {}
962
963int32_t Inflate(const Reader& reader, const uint32_t compressed_length,
964 const uint32_t uncompressed_length, Writer* writer, uint64_t* crc_out) {
Dmitriy Ivanovedbabfe2015-03-12 09:58:15 -0700965 const size_t kBufSize = 32768;
966 std::vector<uint8_t> read_buf(kBufSize);
967 std::vector<uint8_t> write_buf(kBufSize);
Narayan Kamath7462f022013-11-21 13:05:04 +0000968 z_stream zstream;
969 int zerr;
970
971 /*
972 * Initialize the zlib stream struct.
973 */
974 memset(&zstream, 0, sizeof(zstream));
975 zstream.zalloc = Z_NULL;
976 zstream.zfree = Z_NULL;
977 zstream.opaque = Z_NULL;
978 zstream.next_in = NULL;
979 zstream.avail_in = 0;
Dmitriy Ivanovedbabfe2015-03-12 09:58:15 -0700980 zstream.next_out = &write_buf[0];
Narayan Kamath7462f022013-11-21 13:05:04 +0000981 zstream.avail_out = kBufSize;
982 zstream.data_type = Z_UNKNOWN;
983
984 /*
985 * Use the undocumented "negative window bits" feature to tell zlib
986 * that there's no zlib header waiting for it.
987 */
Dmitriy Ivanovf94e1592015-03-06 13:27:59 -0800988 zerr = zlib_inflateInit2(&zstream, -MAX_WBITS);
Narayan Kamath7462f022013-11-21 13:05:04 +0000989 if (zerr != Z_OK) {
990 if (zerr == Z_VERSION_ERROR) {
Jiyong Parkcd997e62017-06-30 17:23:33 +0900991 ALOGE("Installed zlib is not compatible with linked version (%s)", ZLIB_VERSION);
Narayan Kamath7462f022013-11-21 13:05:04 +0000992 } else {
993 ALOGW("Call to inflateInit2 failed (zerr=%d)", zerr);
994 }
995
996 return kZlibError;
997 }
998
Dmitriy Ivanov1f741e52015-03-06 14:26:37 -0800999 auto zstream_deleter = [](z_stream* stream) {
Jiyong Parkcd997e62017-06-30 17:23:33 +09001000 inflateEnd(stream); /* free up any allocated structures */
Dmitriy Ivanov1f741e52015-03-06 14:26:37 -08001001 };
1002
1003 std::unique_ptr<z_stream, decltype(zstream_deleter)> zstream_guard(&zstream, zstream_deleter);
1004
Narayan Kamath2d1e23f2017-10-30 11:17:28 +00001005 const bool compute_crc = (crc_out != nullptr);
Andreas Gampe964b95c2019-04-05 13:48:02 -07001006 uLong crc = 0;
Narayan Kamath8b8faed2017-10-26 14:08:38 +01001007 uint32_t remaining_bytes = compressed_length;
Narayan Kamath7462f022013-11-21 13:05:04 +00001008 do {
1009 /* read as much as we can */
1010 if (zstream.avail_in == 0) {
Andreas Gampe964b95c2019-04-05 13:48:02 -07001011 const uint32_t read_size = (remaining_bytes > kBufSize) ? kBufSize : remaining_bytes;
Narayan Kamath8b8faed2017-10-26 14:08:38 +01001012 const uint32_t offset = (compressed_length - remaining_bytes);
Adam Lesinskide117e42017-06-19 10:27:38 -07001013 // Make sure to read at offset to ensure concurrent access to the fd.
Narayan Kamath8b8faed2017-10-26 14:08:38 +01001014 if (!reader.ReadAtOffset(read_buf.data(), read_size, offset)) {
Andreas Gampe964b95c2019-04-05 13:48:02 -07001015 ALOGW("Zip: inflate read failed, getSize = %u: %s", read_size, strerror(errno));
Dmitriy Ivanov1f741e52015-03-06 14:26:37 -08001016 return kIoError;
Narayan Kamath7462f022013-11-21 13:05:04 +00001017 }
1018
Narayan Kamath8b8faed2017-10-26 14:08:38 +01001019 remaining_bytes -= read_size;
Narayan Kamath7462f022013-11-21 13:05:04 +00001020
Dmitriy Ivanovedbabfe2015-03-12 09:58:15 -07001021 zstream.next_in = &read_buf[0];
Narayan Kamath8b8faed2017-10-26 14:08:38 +01001022 zstream.avail_in = read_size;
Narayan Kamath7462f022013-11-21 13:05:04 +00001023 }
1024
1025 /* uncompress the data */
1026 zerr = inflate(&zstream, Z_NO_FLUSH);
1027 if (zerr != Z_OK && zerr != Z_STREAM_END) {
Jiyong Parkcd997e62017-06-30 17:23:33 +09001028 ALOGW("Zip: inflate zerr=%d (nIn=%p aIn=%u nOut=%p aOut=%u)", zerr, zstream.next_in,
1029 zstream.avail_in, zstream.next_out, zstream.avail_out);
Dmitriy Ivanov1f741e52015-03-06 14:26:37 -08001030 return kZlibError;
Narayan Kamath7462f022013-11-21 13:05:04 +00001031 }
1032
1033 /* write when we're full or when we're done */
Jiyong Parkcd997e62017-06-30 17:23:33 +09001034 if (zstream.avail_out == 0 || (zerr == Z_STREAM_END && zstream.avail_out != kBufSize)) {
Dmitriy Ivanovedbabfe2015-03-12 09:58:15 -07001035 const size_t write_size = zstream.next_out - &write_buf[0];
Narayan Kamathf899bd52015-04-17 11:53:14 +01001036 if (!writer->Append(&write_buf[0], write_size)) {
Narayan Kamath2d1e23f2017-10-30 11:17:28 +00001037 return kIoError;
1038 } else if (compute_crc) {
Andreas Gampe964b95c2019-04-05 13:48:02 -07001039 DCHECK_LE(write_size, kBufSize);
1040 crc = crc32(crc, &write_buf[0], static_cast<uint32_t>(write_size));
Narayan Kamath7462f022013-11-21 13:05:04 +00001041 }
Narayan Kamath7462f022013-11-21 13:05:04 +00001042
Dmitriy Ivanovedbabfe2015-03-12 09:58:15 -07001043 zstream.next_out = &write_buf[0];
Narayan Kamath7462f022013-11-21 13:05:04 +00001044 zstream.avail_out = kBufSize;
1045 }
1046 } while (zerr == Z_OK);
1047
Elliott Hughese8f4b142018-10-19 16:09:39 -07001048 CHECK_EQ(zerr, Z_STREAM_END); /* other errors should've been caught */
Narayan Kamath7462f022013-11-21 13:05:04 +00001049
Narayan Kamath162b7052017-06-05 13:21:12 +01001050 // NOTE: zstream.adler is always set to 0, because we're using the -MAX_WBITS
1051 // "feature" of zlib to tell it there won't be a zlib file header. zlib
1052 // doesn't bother calculating the checksum in that scenario. We just do
1053 // it ourselves above because there are no additional gains to be made by
1054 // having zlib calculate it for us, since they do it by calling crc32 in
1055 // the same manner that we have above.
Narayan Kamath2d1e23f2017-10-30 11:17:28 +00001056 if (compute_crc) {
1057 *crc_out = crc;
1058 }
Narayan Kamath7462f022013-11-21 13:05:04 +00001059
Narayan Kamath8b8faed2017-10-26 14:08:38 +01001060 if (zstream.total_out != uncompressed_length || remaining_bytes != 0) {
Jiyong Parkcd997e62017-06-30 17:23:33 +09001061 ALOGW("Zip: size mismatch on inflated file (%lu vs %" PRIu32 ")", zstream.total_out,
1062 uncompressed_length);
Dmitriy Ivanov1f741e52015-03-06 14:26:37 -08001063 return kInconsistentInformation;
Narayan Kamath7462f022013-11-21 13:05:04 +00001064 }
1065
Dmitriy Ivanov1f741e52015-03-06 14:26:37 -08001066 return 0;
Narayan Kamath7462f022013-11-21 13:05:04 +00001067}
Narayan Kamath485b3642017-10-26 14:42:39 +01001068} // namespace zip_archive
Narayan Kamath7462f022013-11-21 13:05:04 +00001069
Narayan Kamath8b8faed2017-10-26 14:08:38 +01001070static int32_t InflateEntryToWriter(MappedZipFile& mapped_zip, const ZipEntry* entry,
Narayan Kamath485b3642017-10-26 14:42:39 +01001071 zip_archive::Writer* writer, uint64_t* crc_out) {
Narayan Kamath8b8faed2017-10-26 14:08:38 +01001072 const EntryReader reader(mapped_zip, entry);
1073
Narayan Kamath485b3642017-10-26 14:42:39 +01001074 return zip_archive::Inflate(reader, entry->compressed_length, entry->uncompressed_length, writer,
1075 crc_out);
Narayan Kamath8b8faed2017-10-26 14:08:38 +01001076}
1077
Narayan Kamath485b3642017-10-26 14:42:39 +01001078static int32_t CopyEntryToWriter(MappedZipFile& mapped_zip, const ZipEntry* entry,
1079 zip_archive::Writer* writer, uint64_t* crc_out) {
Narayan Kamathf899bd52015-04-17 11:53:14 +01001080 static const uint32_t kBufSize = 32768;
1081 std::vector<uint8_t> buf(kBufSize);
1082
1083 const uint32_t length = entry->uncompressed_length;
1084 uint32_t count = 0;
Andreas Gampe964b95c2019-04-05 13:48:02 -07001085 uLong crc = 0;
Narayan Kamathf899bd52015-04-17 11:53:14 +01001086 while (count < length) {
1087 uint32_t remaining = length - count;
Adam Lesinskide117e42017-06-19 10:27:38 -07001088 off64_t offset = entry->offset + count;
Narayan Kamathf899bd52015-04-17 11:53:14 +01001089
Adam Lesinskide117e42017-06-19 10:27:38 -07001090 // Safe conversion because kBufSize is narrow enough for a 32 bit signed value.
Andreas Gampe964b95c2019-04-05 13:48:02 -07001091 const uint32_t block_size = (remaining > kBufSize) ? kBufSize : remaining;
Adam Lesinskide117e42017-06-19 10:27:38 -07001092
1093 // Make sure to read at offset to ensure concurrent access to the fd.
1094 if (!mapped_zip.ReadAtOffset(buf.data(), block_size, offset)) {
Andreas Gampe964b95c2019-04-05 13:48:02 -07001095 ALOGW("CopyFileToFile: copy read failed, block_size = %u, offset = %" PRId64 ": %s",
Adam Lesinskide117e42017-06-19 10:27:38 -07001096 block_size, static_cast<int64_t>(offset), strerror(errno));
Narayan Kamathf899bd52015-04-17 11:53:14 +01001097 return kIoError;
1098 }
1099
1100 if (!writer->Append(&buf[0], block_size)) {
1101 return kIoError;
1102 }
1103 crc = crc32(crc, &buf[0], block_size);
1104 count += block_size;
1105 }
1106
1107 *crc_out = crc;
1108
1109 return 0;
1110}
1111
Ryan Prichard3673f992018-10-10 22:41:14 -07001112int32_t ExtractToWriter(ZipArchiveHandle archive, ZipEntry* entry, zip_archive::Writer* writer) {
Narayan Kamath7462f022013-11-21 13:05:04 +00001113 const uint16_t method = entry->method;
Narayan Kamath7462f022013-11-21 13:05:04 +00001114
1115 // this should default to kUnknownCompressionMethod.
1116 int32_t return_value = -1;
1117 uint64_t crc = 0;
1118 if (method == kCompressStored) {
Tianjie Xu18c25922016-09-29 15:27:41 -07001119 return_value = CopyEntryToWriter(archive->mapped_zip, entry, writer, &crc);
Narayan Kamath7462f022013-11-21 13:05:04 +00001120 } else if (method == kCompressDeflated) {
Tianjie Xu18c25922016-09-29 15:27:41 -07001121 return_value = InflateEntryToWriter(archive->mapped_zip, entry, writer, &crc);
Narayan Kamath7462f022013-11-21 13:05:04 +00001122 }
1123
1124 if (!return_value && entry->has_data_descriptor) {
Narayan Kamath162b7052017-06-05 13:21:12 +01001125 return_value = ValidateDataDescriptor(archive->mapped_zip, entry);
Narayan Kamath7462f022013-11-21 13:05:04 +00001126 if (return_value) {
1127 return return_value;
1128 }
1129 }
1130
Narayan Kamath162b7052017-06-05 13:21:12 +01001131 // Validate that the CRC matches the calculated value.
1132 if (kCrcChecksEnabled && (entry->crc32 != static_cast<uint32_t>(crc))) {
Mark Salyzyn088bf902014-05-08 16:02:20 -07001133 ALOGW("Zip: crc mismatch: expected %" PRIu32 ", was %" PRIu64, entry->crc32, crc);
Narayan Kamath7462f022013-11-21 13:05:04 +00001134 return kInconsistentInformation;
1135 }
1136
1137 return return_value;
1138}
1139
Ryan Prichard3673f992018-10-10 22:41:14 -07001140int32_t ExtractToMemory(ZipArchiveHandle archive, ZipEntry* entry, uint8_t* begin, uint32_t size) {
Yurii Zubrytskyi834326c2017-12-20 01:01:01 -08001141 MemoryWriter writer(begin, size);
Ryan Prichard3673f992018-10-10 22:41:14 -07001142 return ExtractToWriter(archive, entry, &writer);
Narayan Kamathf899bd52015-04-17 11:53:14 +01001143}
1144
Ryan Prichard3673f992018-10-10 22:41:14 -07001145int32_t ExtractEntryToFile(ZipArchiveHandle archive, ZipEntry* entry, int fd) {
Yurii Zubrytskyi834326c2017-12-20 01:01:01 -08001146 auto writer = FileWriter::Create(fd, entry);
1147 if (!writer.IsValid()) {
Narayan Kamath7462f022013-11-21 13:05:04 +00001148 return kIoError;
1149 }
1150
Ryan Prichard3673f992018-10-10 22:41:14 -07001151 return ExtractToWriter(archive, entry, &writer);
Narayan Kamath7462f022013-11-21 13:05:04 +00001152}
1153
1154const char* ErrorCodeString(int32_t error_code) {
Narayan Kamath1ef9d2d2017-06-15 13:58:25 +01001155 // Make sure that the number of entries in kErrorMessages and ErrorCodes
1156 // match.
1157 static_assert((-kLastErrorCode + 1) == arraysize(kErrorMessages),
1158 "(-kLastErrorCode + 1) != arraysize(kErrorMessages)");
1159
1160 const uint32_t idx = -error_code;
1161 if (idx < arraysize(kErrorMessages)) {
1162 return kErrorMessages[idx];
Narayan Kamath7462f022013-11-21 13:05:04 +00001163 }
1164
Narayan Kamath1ef9d2d2017-06-15 13:58:25 +01001165 return "Unknown return code";
Narayan Kamath7462f022013-11-21 13:05:04 +00001166}
1167
Ryan Prichard3673f992018-10-10 22:41:14 -07001168int GetFileDescriptor(const ZipArchiveHandle archive) {
1169 return archive->mapped_zip.GetFileDescriptor();
Narayan Kamath7462f022013-11-21 13:05:04 +00001170}
Colin Cross7c6c7f02016-09-16 10:15:51 -07001171
Elliott Hughesb17bf522019-05-03 22:38:44 -07001172ZipString::ZipString(std::string_view entry_name)
1173 : name(reinterpret_cast<const uint8_t*>(entry_name.data())) {
1174 size_t len = entry_name.size();
Colin Cross7c6c7f02016-09-16 10:15:51 -07001175 CHECK_LE(len, static_cast<size_t>(UINT16_MAX));
1176 name_length = static_cast<uint16_t>(len);
1177}
Tianjie Xu18c25922016-09-29 15:27:41 -07001178
1179#if !defined(_WIN32)
Narayan Kamath485b3642017-10-26 14:42:39 +01001180class ProcessWriter : public zip_archive::Writer {
Tianjie Xu18c25922016-09-29 15:27:41 -07001181 public:
Jiyong Parkcd997e62017-06-30 17:23:33 +09001182 ProcessWriter(ProcessZipEntryFunction func, void* cookie)
1183 : Writer(), proc_function_(func), cookie_(cookie) {}
Tianjie Xu18c25922016-09-29 15:27:41 -07001184
1185 virtual bool Append(uint8_t* buf, size_t buf_size) override {
1186 return proc_function_(buf, buf_size, cookie_);
1187 }
1188
1189 private:
1190 ProcessZipEntryFunction proc_function_;
1191 void* cookie_;
1192};
1193
Ryan Prichard3673f992018-10-10 22:41:14 -07001194int32_t ProcessZipEntryContents(ZipArchiveHandle archive, ZipEntry* entry,
Tianjie Xu18c25922016-09-29 15:27:41 -07001195 ProcessZipEntryFunction func, void* cookie) {
1196 ProcessWriter writer(func, cookie);
Ryan Prichard3673f992018-10-10 22:41:14 -07001197 return ExtractToWriter(archive, entry, &writer);
Tianjie Xu18c25922016-09-29 15:27:41 -07001198}
1199
Jiyong Parkcd997e62017-06-30 17:23:33 +09001200#endif //! defined(_WIN32)
Tianjie Xu18c25922016-09-29 15:27:41 -07001201
1202int MappedZipFile::GetFileDescriptor() const {
1203 if (!has_fd_) {
1204 ALOGW("Zip: MappedZipFile doesn't have a file descriptor.");
1205 return -1;
1206 }
1207 return fd_;
1208}
1209
1210void* MappedZipFile::GetBasePtr() const {
1211 if (has_fd_) {
1212 ALOGW("Zip: MappedZipFile doesn't have a base pointer.");
1213 return nullptr;
1214 }
1215 return base_ptr_;
1216}
1217
1218off64_t MappedZipFile::GetFileLength() const {
1219 if (has_fd_) {
1220 off64_t result = lseek64(fd_, 0, SEEK_END);
1221 if (result == -1) {
1222 ALOGE("Zip: lseek on fd %d failed: %s", fd_, strerror(errno));
1223 }
1224 return result;
1225 } else {
1226 if (base_ptr_ == nullptr) {
1227 ALOGE("Zip: invalid file map\n");
1228 return -1;
1229 }
1230 return static_cast<off64_t>(data_length_);
1231 }
1232}
1233
Tianjie Xu18c25922016-09-29 15:27:41 -07001234// Attempts to read |len| bytes into |buf| at offset |off|.
Narayan Kamath8b8faed2017-10-26 14:08:38 +01001235bool MappedZipFile::ReadAtOffset(uint8_t* buf, size_t len, off64_t off) const {
Tianjie Xu18c25922016-09-29 15:27:41 -07001236 if (has_fd_) {
Adam Lesinskide117e42017-06-19 10:27:38 -07001237 if (!android::base::ReadFullyAtOffset(fd_, buf, len, off)) {
Tianjie Xu18c25922016-09-29 15:27:41 -07001238 ALOGE("Zip: failed to read at offset %" PRId64 "\n", off);
1239 return false;
1240 }
Adam Lesinskide117e42017-06-19 10:27:38 -07001241 } else {
1242 if (off < 0 || off > static_cast<off64_t>(data_length_)) {
1243 ALOGE("Zip: invalid offset: %" PRId64 ", data length: %" PRId64 "\n", off, data_length_);
1244 return false;
1245 }
1246 memcpy(buf, static_cast<uint8_t*>(base_ptr_) + off, len);
Tianjie Xu18c25922016-09-29 15:27:41 -07001247 }
Adam Lesinskide117e42017-06-19 10:27:38 -07001248 return true;
Tianjie Xu18c25922016-09-29 15:27:41 -07001249}
1250
1251void CentralDirectory::Initialize(void* map_base_ptr, off64_t cd_start_offset, size_t cd_size) {
1252 base_ptr_ = static_cast<uint8_t*>(map_base_ptr) + cd_start_offset;
1253 length_ = cd_size;
1254}
1255
Elliott Hughese8f4b142018-10-19 16:09:39 -07001256bool ZipArchive::InitializeCentralDirectory(off64_t cd_start_offset, size_t cd_size) {
Tianjie Xu18c25922016-09-29 15:27:41 -07001257 if (mapped_zip.HasFd()) {
Elliott Hughese8f4b142018-10-19 16:09:39 -07001258 directory_map = android::base::MappedFile::FromFd(mapped_zip.GetFileDescriptor(),
1259 cd_start_offset, cd_size, PROT_READ);
1260 if (!directory_map) return false;
Tianjie Xu18c25922016-09-29 15:27:41 -07001261
Elliott Hughese8f4b142018-10-19 16:09:39 -07001262 CHECK_EQ(directory_map->size(), cd_size);
1263 central_directory.Initialize(directory_map->data(), 0 /*offset*/, cd_size);
Tianjie Xu18c25922016-09-29 15:27:41 -07001264 } else {
1265 if (mapped_zip.GetBasePtr() == nullptr) {
1266 ALOGE("Zip: Failed to map central directory, bad mapped_zip base pointer\n");
1267 return false;
1268 }
1269 if (static_cast<off64_t>(cd_start_offset) + static_cast<off64_t>(cd_size) >
1270 mapped_zip.GetFileLength()) {
Jiyong Parkcd997e62017-06-30 17:23:33 +09001271 ALOGE(
1272 "Zip: Failed to map central directory, offset exceeds mapped memory region ("
1273 "start_offset %" PRId64 ", cd_size %zu, mapped_region_size %" PRId64 ")",
1274 static_cast<int64_t>(cd_start_offset), cd_size, mapped_zip.GetFileLength());
Tianjie Xu18c25922016-09-29 15:27:41 -07001275 return false;
1276 }
1277
1278 central_directory.Initialize(mapped_zip.GetBasePtr(), cd_start_offset, cd_size);
1279 }
1280 return true;
1281}
Elliott Hughes55fd2932017-05-28 22:59:04 -07001282
1283tm ZipEntry::GetModificationTime() const {
1284 tm t = {};
1285
1286 t.tm_hour = (mod_time >> 11) & 0x1f;
1287 t.tm_min = (mod_time >> 5) & 0x3f;
1288 t.tm_sec = (mod_time & 0x1f) << 1;
1289
1290 t.tm_year = ((mod_time >> 25) & 0x7f) + 80;
1291 t.tm_mon = ((mod_time >> 21) & 0xf) - 1;
1292 t.tm_mday = (mod_time >> 16) & 0x1f;
1293
1294 return t;
1295}