blob: a07df30a75d440ca9035bd960db421a40578c9af [file] [log] [blame]
/*
 * Copyright (C) 2008 The Android Open Source Project
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

/*
 * Read-only access to Zip archives, with minimal heap allocation.
 */
Narayan Kamath7462f022013-11-21 13:05:04 +000020
Mark Salyzyncfd5b082016-10-17 14:28:00 -070021#define LOG_TAG "ziparchive"
22
Narayan Kamath7462f022013-11-21 13:05:04 +000023#include <assert.h>
24#include <errno.h>
Mark Salyzyn99ef9912014-03-14 14:26:22 -070025#include <fcntl.h>
26#include <inttypes.h>
Narayan Kamath7462f022013-11-21 13:05:04 +000027#include <limits.h>
Narayan Kamath7462f022013-11-21 13:05:04 +000028#include <stdlib.h>
29#include <string.h>
Narayan Kamath7462f022013-11-21 13:05:04 +000030#include <unistd.h>
31
Dan Albert1ae07642015-04-09 14:11:18 -070032#include <memory>
33#include <vector>
34
Mark Salyzynff2dcd92016-09-28 15:54:45 -070035#include <android-base/file.h>
36#include <android-base/logging.h>
37#include <android-base/macros.h> // TEMP_FAILURE_RETRY may or may not be in unistd
38#include <android-base/memory.h>
Mark Salyzyncfd5b082016-10-17 14:28:00 -070039#include <log/log.h>
Mark Salyzynff2dcd92016-09-28 15:54:45 -070040#include <utils/Compat.h>
41#include <utils/FileMap.h>
Christopher Ferrise6884ce2015-11-10 14:55:12 -080042#include "ziparchive/zip_archive.h"
Dan Albert1ae07642015-04-09 14:11:18 -070043#include "zlib.h"
Narayan Kamath7462f022013-11-21 13:05:04 +000044
Narayan Kamath044bc8e2014-12-03 18:22:53 +000045#include "entry_name_utils-inl.h"
Adam Lesinskiad4ad8c2015-10-05 18:16:18 -070046#include "zip_archive_common.h"
Christopher Ferrise6884ce2015-11-10 14:55:12 -080047#include "zip_archive_private.h"
Mark Salyzyn99ef9912014-03-14 14:26:22 -070048
Dan Albert1ae07642015-04-09 14:11:18 -070049using android::base::get_unaligned;
Narayan Kamath044bc8e2014-12-03 18:22:53 +000050
// Windows only: a file that is not opened in binary mode misbehaves when read.
// Where the platform headers do not provide O_BINARY, define it as 0 so that
// it can be OR-ed into open() flags without effect.
#if !defined(O_BINARY)
#define O_BINARY 0
#endif
56
Narayan Kamath926973e2014-06-09 14:18:14 +010057// The maximum number of bytes to scan backwards for the EOCD start.
58static const uint32_t kMaxEOCDSearch = kMaxCommentLen + sizeof(EocdRecord);
59
// Human readable descriptions of the error codes declared below. The strings
// are listed in order of decreasing code value, so the description of error
// code |c| sits at index |-c|. Index 0 holds a generic "unknown" message.
static const char* kErrorMessages[] = {
  "Unknown return code.",
  "Iteration ended",
  "Zlib error",
  "Invalid file",
  "Invalid handle",
  "Duplicate entries in archive",
  "Empty archive",
  "Entry not found",
  "Invalid offset",
  "Inconsistent information",
  "Invalid entry name",
  "I/O Error",
  "File mapping failed"
};

// Exclusive upper bound of the error code range described by kErrorMessages.
static constexpr int32_t kErrorMessageUpperBound = 0;

// Iteration over the archive has finished.
static constexpr int32_t kIterationEnd = -1;

// Zlib reported an error while inflating a stream from this file. This
// usually indicates file corruption.
static constexpr int32_t kZlibError = -2;

// The input cannot be processed as a zip archive, usually because it is too
// small, too large or does not carry a valid signature.
static constexpr int32_t kInvalidFile = -3;

// An invalid iteration / ziparchive handle was supplied as an argument.
static constexpr int32_t kInvalidHandle = -4;

// Two (or possibly more) entries in the archive share the same name.
static constexpr int32_t kDuplicateEntry = -5;

// The archive does not contain any entries.
static constexpr int32_t kEmptyArchive = -6;

// The requested entry does not exist in the archive.
static constexpr int32_t kEntryNotFound = -7;

// The archive contains an invalid local file header pointer.
static constexpr int32_t kInvalidOffset = -8;

// The archive contains inconsistent entry information: either the central
// directory and the local file header disagree, or the actual uncompressed
// length or crc32 does not match the declared value.
static constexpr int32_t kInconsistentInformation = -9;

// An entry with an invalid name was encountered.
static constexpr int32_t kInvalidEntryName = -10;

// An I/O related system call (read, lseek, ftruncate, map) failed.
static constexpr int32_t kIoError = -11;

// The central directory or the entry contents could not be mmapped.
static constexpr int32_t kMmapFailed = -12;

// Exclusive lower bound of the error code range described by kErrorMessages.
static constexpr int32_t kErrorMessageLowerBound = -13;
Narayan Kamath7462f022013-11-21 13:05:04 +0000121
/*
 * A Read-only Zip archive.
 *
 * We want "open" and "find entry by name" to be fast operations, and
 * we want to use as little memory as possible.  We memory-map the zip
 * central directory, and load a hash table with pointers to the filenames
 * (which aren't null-terminated).  The other fields are at a fixed offset
 * from the filename, so we don't need to extract those (but we do need
 * to byte-read and endian-swap them every time we want them).
 *
 * It's possible that somebody has handed us a massive (~1GB) zip archive,
 * so we can't expect to mmap the entire file.
 *
 * To speed comparisons when doing a lookup by name, we could make the mapping
 * "private" (copy-on-write) and null-terminate the filenames after verifying
 * the record structure.  However, this requires a private mapping of
 * every page that the Central Directory touches.  Easier to tuck a copy
 * of the string length into the hash table entry.
 */
Narayan Kamath7462f022013-11-21 13:05:04 +0000141
/*
 * Round up to the next highest power of 2.
 *
 * Found on http://graphics.stanford.edu/~seander/bithacks.html.
 *
 * A value that already is a power of 2 is returned unchanged. An input of 0
 * yields 1 (the smallest power of 2), so the result can always be used as a
 * table size whose (size - 1) is a valid index mask. Inputs greater than
 * 2^31 have no representable answer and wrap around to 0.
 */
static uint32_t RoundUpPower2(uint32_t val) {
  // The bit smearing below would map 0 to 0, which is not a power of 2.
  if (val == 0) {
    return 1;
  }

  // Copy the highest set bit of (val - 1) into every lower bit position,
  // then add one to reach the next power of 2.
  val--;
  for (uint32_t shift = 1; shift < 32; shift <<= 1) {
    val |= val >> shift;
  }

  return val + 1;
}
158
Yusuke Sato07447542015-06-25 14:39:19 -0700159static uint32_t ComputeHash(const ZipString& name) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000160 uint32_t hash = 0;
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100161 uint16_t len = name.name_length;
162 const uint8_t* str = name.name;
Narayan Kamath7462f022013-11-21 13:05:04 +0000163
164 while (len--) {
165 hash = hash * 31 + *str++;
166 }
167
168 return hash;
169}
170
171/*
172 * Convert a ZipEntry to a hash table index, verifying that it's in a
173 * valid range.
174 */
Yusuke Sato07447542015-06-25 14:39:19 -0700175static int64_t EntryToIndex(const ZipString* hash_table,
Narayan Kamath7462f022013-11-21 13:05:04 +0000176 const uint32_t hash_table_size,
Yusuke Sato07447542015-06-25 14:39:19 -0700177 const ZipString& name) {
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100178 const uint32_t hash = ComputeHash(name);
Narayan Kamath7462f022013-11-21 13:05:04 +0000179
180 // NOTE: (hash_table_size - 1) is guaranteed to be non-negative.
181 uint32_t ent = hash & (hash_table_size - 1);
182 while (hash_table[ent].name != NULL) {
Yusuke Sato07447542015-06-25 14:39:19 -0700183 if (hash_table[ent] == name) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000184 return ent;
185 }
186
187 ent = (ent + 1) & (hash_table_size - 1);
188 }
189
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100190 ALOGV("Zip: Unable to find entry %.*s", name.name_length, name.name);
Narayan Kamath7462f022013-11-21 13:05:04 +0000191 return kEntryNotFound;
192}
193
194/*
195 * Add a new entry to the hash table.
196 */
Yusuke Sato07447542015-06-25 14:39:19 -0700197static int32_t AddToHash(ZipString *hash_table, const uint64_t hash_table_size,
198 const ZipString& name) {
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100199 const uint64_t hash = ComputeHash(name);
Narayan Kamath7462f022013-11-21 13:05:04 +0000200 uint32_t ent = hash & (hash_table_size - 1);
201
202 /*
203 * We over-allocated the table, so we're guaranteed to find an empty slot.
204 * Further, we guarantee that the hashtable size is not 0.
205 */
206 while (hash_table[ent].name != NULL) {
Yusuke Sato07447542015-06-25 14:39:19 -0700207 if (hash_table[ent] == name) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000208 // We've found a duplicate entry. We don't accept it
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100209 ALOGW("Zip: Found duplicate entry %.*s", name.name_length, name.name);
Narayan Kamath7462f022013-11-21 13:05:04 +0000210 return kDuplicateEntry;
211 }
212 ent = (ent + 1) & (hash_table_size - 1);
213 }
214
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100215 hash_table[ent].name = name.name;
216 hash_table[ent].name_length = name.name_length;
Narayan Kamath7462f022013-11-21 13:05:04 +0000217 return 0;
218}
219
Tianjie Xu18c25922016-09-29 15:27:41 -0700220static int32_t MapCentralDirectory0(const char* debug_file_name, ZipArchive* archive,
221 off64_t file_length, off64_t read_amount,
222 uint8_t* scan_buffer) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000223 const off64_t search_start = file_length - read_amount;
224
Tianjie Xu18c25922016-09-29 15:27:41 -0700225 if(!archive->mapped_zip.ReadAtOffset(scan_buffer, read_amount, search_start)) {
226 ALOGE("Zip: read %" PRId64 " from offset %" PRId64 " failed",
227 static_cast<int64_t>(read_amount), static_cast<int64_t>(search_start));
Narayan Kamath7462f022013-11-21 13:05:04 +0000228 return kIoError;
229 }
230
231 /*
232 * Scan backward for the EOCD magic. In an archive without a trailing
233 * comment, we'll find it on the first try. (We may want to consider
234 * doing an initial minimal read; if we don't find it, retry with a
235 * second read as above.)
236 */
Narayan Kamath926973e2014-06-09 14:18:14 +0100237 int i = read_amount - sizeof(EocdRecord);
238 for (; i >= 0; i--) {
Dan Albert1ae07642015-04-09 14:11:18 -0700239 if (scan_buffer[i] == 0x50) {
240 uint32_t* sig_addr = reinterpret_cast<uint32_t*>(&scan_buffer[i]);
241 if (get_unaligned<uint32_t>(sig_addr) == EocdRecord::kSignature) {
242 ALOGV("+++ Found EOCD at buf+%d", i);
243 break;
244 }
Narayan Kamath7462f022013-11-21 13:05:04 +0000245 }
246 }
247 if (i < 0) {
248 ALOGD("Zip: EOCD not found, %s is not zip", debug_file_name);
249 return kInvalidFile;
250 }
251
252 const off64_t eocd_offset = search_start + i;
Narayan Kamath926973e2014-06-09 14:18:14 +0100253 const EocdRecord* eocd = reinterpret_cast<const EocdRecord*>(scan_buffer + i);
Narayan Kamath7462f022013-11-21 13:05:04 +0000254 /*
Narayan Kamath926973e2014-06-09 14:18:14 +0100255 * Verify that there's no trailing space at the end of the central directory
256 * and its comment.
Narayan Kamath7462f022013-11-21 13:05:04 +0000257 */
Narayan Kamath926973e2014-06-09 14:18:14 +0100258 const off64_t calculated_length = eocd_offset + sizeof(EocdRecord)
259 + eocd->comment_length;
260 if (calculated_length != file_length) {
Narayan Kamath4f6b4992014-06-03 13:59:23 +0100261 ALOGW("Zip: %" PRId64 " extraneous bytes at the end of the central directory",
Narayan Kamath926973e2014-06-09 14:18:14 +0100262 static_cast<int64_t>(file_length - calculated_length));
Narayan Kamath4f6b4992014-06-03 13:59:23 +0100263 return kInvalidFile;
264 }
Narayan Kamath7462f022013-11-21 13:05:04 +0000265
Narayan Kamath926973e2014-06-09 14:18:14 +0100266 /*
267 * Grab the CD offset and size, and the number of entries in the
268 * archive and verify that they look reasonable.
269 */
Tianjie Xu1ee48922016-09-21 14:58:11 -0700270 if (static_cast<off64_t>(eocd->cd_start_offset) + eocd->cd_size > eocd_offset) {
Narayan Kamath926973e2014-06-09 14:18:14 +0100271 ALOGW("Zip: bad offsets (dir %" PRIu32 ", size %" PRIu32 ", eocd %" PRId64 ")",
272 eocd->cd_start_offset, eocd->cd_size, static_cast<int64_t>(eocd_offset));
Tianjie Xu1ee48922016-09-21 14:58:11 -0700273#if defined(__ANDROID__)
274 if (eocd->cd_start_offset + eocd->cd_size <= eocd_offset) {
275 android_errorWriteLog(0x534e4554, "31251826");
276 }
277#endif
Narayan Kamath7462f022013-11-21 13:05:04 +0000278 return kInvalidOffset;
279 }
Narayan Kamath926973e2014-06-09 14:18:14 +0100280 if (eocd->num_records == 0) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000281 ALOGW("Zip: empty archive?");
282 return kEmptyArchive;
283 }
284
Elliott Hughese49236b2015-06-04 15:21:59 -0700285 ALOGV("+++ num_entries=%" PRIu32 " dir_size=%" PRIu32 " dir_offset=%" PRIu32,
Narayan Kamath926973e2014-06-09 14:18:14 +0100286 eocd->num_records, eocd->cd_size, eocd->cd_start_offset);
Narayan Kamath7462f022013-11-21 13:05:04 +0000287
288 /*
289 * It all looks good. Create a mapping for the CD, and set the fields
290 * in archive.
291 */
Tianjie Xu18c25922016-09-29 15:27:41 -0700292
293 if (!archive->InitializeCentralDirectory(debug_file_name,
294 static_cast<off64_t>(eocd->cd_start_offset),
295 static_cast<size_t>(eocd->cd_size))) {
296 ALOGE("Zip: failed to intialize central directory.\n");
Narayan Kamatheaf98852013-12-11 14:51:51 +0000297 return kMmapFailed;
Narayan Kamath7462f022013-11-21 13:05:04 +0000298 }
299
Narayan Kamath926973e2014-06-09 14:18:14 +0100300 archive->num_entries = eocd->num_records;
301 archive->directory_offset = eocd->cd_start_offset;
Narayan Kamath7462f022013-11-21 13:05:04 +0000302
303 return 0;
304}
305
306/*
307 * Find the zip Central Directory and memory-map it.
308 *
309 * On success, returns 0 after populating fields from the EOCD area:
310 * directory_offset
Tianjie Xu18c25922016-09-29 15:27:41 -0700311 * directory_ptr
Narayan Kamath7462f022013-11-21 13:05:04 +0000312 * num_entries
313 */
Tianjie Xu18c25922016-09-29 15:27:41 -0700314static int32_t MapCentralDirectory(const char* debug_file_name, ZipArchive* archive) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000315
316 // Test file length. We use lseek64 to make sure the file
317 // is small enough to be a zip file (Its size must be less than
318 // 0xffffffff bytes).
Tianjie Xu18c25922016-09-29 15:27:41 -0700319 off64_t file_length = archive->mapped_zip.GetFileLength();
Narayan Kamath7462f022013-11-21 13:05:04 +0000320 if (file_length == -1) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000321 return kInvalidFile;
322 }
323
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800324 if (file_length > static_cast<off64_t>(0xffffffff)) {
Narayan Kamath926973e2014-06-09 14:18:14 +0100325 ALOGV("Zip: zip file too long %" PRId64, static_cast<int64_t>(file_length));
Narayan Kamath7462f022013-11-21 13:05:04 +0000326 return kInvalidFile;
327 }
328
Narayan Kamath926973e2014-06-09 14:18:14 +0100329 if (file_length < static_cast<off64_t>(sizeof(EocdRecord))) {
330 ALOGV("Zip: length %" PRId64 " is too small to be zip", static_cast<int64_t>(file_length));
Narayan Kamath7462f022013-11-21 13:05:04 +0000331 return kInvalidFile;
332 }
333
334 /*
335 * Perform the traditional EOCD snipe hunt.
336 *
337 * We're searching for the End of Central Directory magic number,
338 * which appears at the start of the EOCD block. It's followed by
339 * 18 bytes of EOCD stuff and up to 64KB of archive comment. We
340 * need to read the last part of the file into a buffer, dig through
341 * it to find the magic number, parse some values out, and use those
342 * to determine the extent of the CD.
343 *
344 * We start by pulling in the last part of the file.
345 */
Narayan Kamath926973e2014-06-09 14:18:14 +0100346 off64_t read_amount = kMaxEOCDSearch;
347 if (file_length < read_amount) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000348 read_amount = file_length;
349 }
350
Tianjie Xu18c25922016-09-29 15:27:41 -0700351 std::vector<uint8_t> scan_buffer(read_amount);
352 int32_t result = MapCentralDirectory0(debug_file_name, archive, file_length, read_amount,
353 scan_buffer.data());
Narayan Kamath7462f022013-11-21 13:05:04 +0000354 return result;
355}
356
357/*
358 * Parses the Zip archive's Central Directory. Allocates and populates the
359 * hash table.
360 *
361 * Returns 0 on success.
362 */
363static int32_t ParseZipArchive(ZipArchive* archive) {
Tianjie Xu18c25922016-09-29 15:27:41 -0700364 const uint8_t* const cd_ptr = archive->central_directory.GetBasePtr();
365 const size_t cd_length = archive->central_directory.GetMapLength();
Narayan Kamath926973e2014-06-09 14:18:14 +0100366 const uint16_t num_entries = archive->num_entries;
Narayan Kamath7462f022013-11-21 13:05:04 +0000367
368 /*
369 * Create hash table. We have a minimum 75% load factor, possibly as
370 * low as 50% after we round off to a power of 2. There must be at
371 * least one unused entry to avoid an infinite loop during creation.
372 */
373 archive->hash_table_size = RoundUpPower2(1 + (num_entries * 4) / 3);
Yusuke Sato07447542015-06-25 14:39:19 -0700374 archive->hash_table = reinterpret_cast<ZipString*>(calloc(archive->hash_table_size,
375 sizeof(ZipString)));
Narayan Kamath7462f022013-11-21 13:05:04 +0000376
377 /*
378 * Walk through the central directory, adding entries to the hash
379 * table and verifying values.
380 */
Narayan Kamath926973e2014-06-09 14:18:14 +0100381 const uint8_t* const cd_end = cd_ptr + cd_length;
Narayan Kamath7462f022013-11-21 13:05:04 +0000382 const uint8_t* ptr = cd_ptr;
383 for (uint16_t i = 0; i < num_entries; i++) {
Narayan Kamath926973e2014-06-09 14:18:14 +0100384 const CentralDirectoryRecord* cdr =
385 reinterpret_cast<const CentralDirectoryRecord*>(ptr);
386 if (cdr->record_signature != CentralDirectoryRecord::kSignature) {
Mark Salyzyn088bf902014-05-08 16:02:20 -0700387 ALOGW("Zip: missed a central dir sig (at %" PRIu16 ")", i);
Dmitriy Ivanov3ea93da2015-03-06 11:48:47 -0800388 return -1;
Narayan Kamath7462f022013-11-21 13:05:04 +0000389 }
390
Narayan Kamath926973e2014-06-09 14:18:14 +0100391 if (ptr + sizeof(CentralDirectoryRecord) > cd_end) {
Mark Salyzyn088bf902014-05-08 16:02:20 -0700392 ALOGW("Zip: ran off the end (at %" PRIu16 ")", i);
Dmitriy Ivanov3ea93da2015-03-06 11:48:47 -0800393 return -1;
Narayan Kamath7462f022013-11-21 13:05:04 +0000394 }
395
Narayan Kamath926973e2014-06-09 14:18:14 +0100396 const off64_t local_header_offset = cdr->local_file_header_offset;
Narayan Kamath7462f022013-11-21 13:05:04 +0000397 if (local_header_offset >= archive->directory_offset) {
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800398 ALOGW("Zip: bad LFH offset %" PRId64 " at entry %" PRIu16,
399 static_cast<int64_t>(local_header_offset), i);
Dmitriy Ivanov3ea93da2015-03-06 11:48:47 -0800400 return -1;
Narayan Kamath7462f022013-11-21 13:05:04 +0000401 }
402
Narayan Kamath926973e2014-06-09 14:18:14 +0100403 const uint16_t file_name_length = cdr->file_name_length;
404 const uint16_t extra_length = cdr->extra_field_length;
405 const uint16_t comment_length = cdr->comment_length;
Piotr Jastrzebski78271ba2014-08-15 12:53:00 +0100406 const uint8_t* file_name = ptr + sizeof(CentralDirectoryRecord);
407
Narayan Kamath044bc8e2014-12-03 18:22:53 +0000408 /* check that file name is valid UTF-8 and doesn't contain NUL (U+0000) characters */
409 if (!IsValidEntryName(file_name, file_name_length)) {
Dmitriy Ivanov3ea93da2015-03-06 11:48:47 -0800410 return -1;
Piotr Jastrzebski78271ba2014-08-15 12:53:00 +0100411 }
Narayan Kamath7462f022013-11-21 13:05:04 +0000412
413 /* add the CDE filename to the hash table */
Yusuke Sato07447542015-06-25 14:39:19 -0700414 ZipString entry_name;
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100415 entry_name.name = file_name;
416 entry_name.name_length = file_name_length;
Narayan Kamath7462f022013-11-21 13:05:04 +0000417 const int add_result = AddToHash(archive->hash_table,
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100418 archive->hash_table_size, entry_name);
Dmitriy Ivanov3ea93da2015-03-06 11:48:47 -0800419 if (add_result != 0) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000420 ALOGW("Zip: Error adding entry to hash table %d", add_result);
Dmitriy Ivanov3ea93da2015-03-06 11:48:47 -0800421 return add_result;
Narayan Kamath7462f022013-11-21 13:05:04 +0000422 }
423
Narayan Kamath926973e2014-06-09 14:18:14 +0100424 ptr += sizeof(CentralDirectoryRecord) + file_name_length + extra_length + comment_length;
425 if ((ptr - cd_ptr) > static_cast<int64_t>(cd_length)) {
Mark Salyzyn088bf902014-05-08 16:02:20 -0700426 ALOGW("Zip: bad CD advance (%tu vs %zu) at entry %" PRIu16,
427 ptr - cd_ptr, cd_length, i);
Dmitriy Ivanov3ea93da2015-03-06 11:48:47 -0800428 return -1;
Narayan Kamath7462f022013-11-21 13:05:04 +0000429 }
430 }
Mark Salyzyn088bf902014-05-08 16:02:20 -0700431 ALOGV("+++ zip good scan %" PRIu16 " entries", num_entries);
Narayan Kamath7462f022013-11-21 13:05:04 +0000432
Dmitriy Ivanov3ea93da2015-03-06 11:48:47 -0800433 return 0;
Narayan Kamath7462f022013-11-21 13:05:04 +0000434}
435
436static int32_t OpenArchiveInternal(ZipArchive* archive,
437 const char* debug_file_name) {
438 int32_t result = -1;
Tianjie Xu18c25922016-09-29 15:27:41 -0700439 if ((result = MapCentralDirectory(debug_file_name, archive)) != 0) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000440 return result;
441 }
442
443 if ((result = ParseZipArchive(archive))) {
444 return result;
445 }
446
447 return 0;
448}
449
450int32_t OpenArchiveFd(int fd, const char* debug_file_name,
Dmitriy Ivanov40b52b22014-07-15 19:33:00 -0700451 ZipArchiveHandle* handle, bool assume_ownership) {
452 ZipArchive* archive = new ZipArchive(fd, assume_ownership);
Narayan Kamath7462f022013-11-21 13:05:04 +0000453 *handle = archive;
Narayan Kamath7462f022013-11-21 13:05:04 +0000454 return OpenArchiveInternal(archive, debug_file_name);
455}
456
457int32_t OpenArchive(const char* fileName, ZipArchiveHandle* handle) {
Neil Fullerb1a113f2014-07-25 14:43:04 +0100458 const int fd = open(fileName, O_RDONLY | O_BINARY, 0);
Dmitriy Ivanov40b52b22014-07-15 19:33:00 -0700459 ZipArchive* archive = new ZipArchive(fd, true);
Narayan Kamath7462f022013-11-21 13:05:04 +0000460 *handle = archive;
461
Narayan Kamath7462f022013-11-21 13:05:04 +0000462 if (fd < 0) {
463 ALOGW("Unable to open '%s': %s", fileName, strerror(errno));
464 return kIoError;
Narayan Kamath7462f022013-11-21 13:05:04 +0000465 }
Dmitriy Ivanov40b52b22014-07-15 19:33:00 -0700466
Narayan Kamath7462f022013-11-21 13:05:04 +0000467 return OpenArchiveInternal(archive, fileName);
468}
469
Tianjie Xu18c25922016-09-29 15:27:41 -0700470int32_t OpenArchiveFromMemory(void* address, size_t length, const char* debug_file_name,
471 ZipArchiveHandle *handle) {
472 ZipArchive* archive = new ZipArchive(address, length);
473 *handle = archive;
474 return OpenArchiveInternal(archive, debug_file_name);
475}
476
Narayan Kamath7462f022013-11-21 13:05:04 +0000477/*
478 * Close a ZipArchive, closing the file and freeing the contents.
479 */
480void CloseArchive(ZipArchiveHandle handle) {
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800481 ZipArchive* archive = reinterpret_cast<ZipArchive*>(handle);
Narayan Kamath7462f022013-11-21 13:05:04 +0000482 ALOGV("Closing archive %p", archive);
Neil Fullerb1a113f2014-07-25 14:43:04 +0100483 delete archive;
Narayan Kamath7462f022013-11-21 13:05:04 +0000484}
485
Tianjie Xu18c25922016-09-29 15:27:41 -0700486static int32_t UpdateEntryFromDataDescriptor(MappedZipFile& mapped_zip,
Narayan Kamath7462f022013-11-21 13:05:04 +0000487 ZipEntry *entry) {
Narayan Kamath926973e2014-06-09 14:18:14 +0100488 uint8_t ddBuf[sizeof(DataDescriptor) + sizeof(DataDescriptor::kOptSignature)];
Tianjie Xu18c25922016-09-29 15:27:41 -0700489 if (!mapped_zip.ReadData(ddBuf, sizeof(ddBuf))) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000490 return kIoError;
491 }
492
Narayan Kamath926973e2014-06-09 14:18:14 +0100493 const uint32_t ddSignature = *(reinterpret_cast<const uint32_t*>(ddBuf));
494 const uint16_t offset = (ddSignature == DataDescriptor::kOptSignature) ? 4 : 0;
495 const DataDescriptor* descriptor = reinterpret_cast<const DataDescriptor*>(ddBuf + offset);
Narayan Kamath7462f022013-11-21 13:05:04 +0000496
Narayan Kamath926973e2014-06-09 14:18:14 +0100497 entry->crc32 = descriptor->crc32;
498 entry->compressed_length = descriptor->compressed_size;
499 entry->uncompressed_length = descriptor->uncompressed_size;
Narayan Kamath7462f022013-11-21 13:05:04 +0000500
501 return 0;
502}
503
Narayan Kamath7462f022013-11-21 13:05:04 +0000504static int32_t FindEntry(const ZipArchive* archive, const int ent,
505 ZipEntry* data) {
506 const uint16_t nameLen = archive->hash_table[ent].name_length;
Narayan Kamath7462f022013-11-21 13:05:04 +0000507
508 // Recover the start of the central directory entry from the filename
509 // pointer. The filename is the first entry past the fixed-size data,
510 // so we can just subtract back from that.
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100511 const uint8_t* ptr = archive->hash_table[ent].name;
Narayan Kamath926973e2014-06-09 14:18:14 +0100512 ptr -= sizeof(CentralDirectoryRecord);
Narayan Kamath7462f022013-11-21 13:05:04 +0000513
514 // This is the base of our mmapped region, we have to sanity check that
515 // the name that's in the hash table is a pointer to a location within
516 // this mapped region.
Tianjie Xu18c25922016-09-29 15:27:41 -0700517 const uint8_t* base_ptr = archive->central_directory.GetBasePtr();
518 if (ptr < base_ptr || ptr > base_ptr + archive->central_directory.GetMapLength()) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000519 ALOGW("Zip: Invalid entry pointer");
520 return kInvalidOffset;
521 }
522
Narayan Kamath926973e2014-06-09 14:18:14 +0100523 const CentralDirectoryRecord *cdr =
524 reinterpret_cast<const CentralDirectoryRecord*>(ptr);
525
Narayan Kamath7462f022013-11-21 13:05:04 +0000526 // The offset of the start of the central directory in the zipfile.
527 // We keep this lying around so that we can sanity check all our lengths
528 // and our per-file structures.
529 const off64_t cd_offset = archive->directory_offset;
530
531 // Fill out the compression method, modification time, crc32
532 // and other interesting attributes from the central directory. These
533 // will later be compared against values from the local file header.
Narayan Kamath926973e2014-06-09 14:18:14 +0100534 data->method = cdr->compression_method;
beonit0e99a2f2015-07-18 02:08:16 +0900535 data->mod_time = cdr->last_mod_date << 16 | cdr->last_mod_time;
Narayan Kamath926973e2014-06-09 14:18:14 +0100536 data->crc32 = cdr->crc32;
537 data->compressed_length = cdr->compressed_size;
538 data->uncompressed_length = cdr->uncompressed_size;
Narayan Kamath7462f022013-11-21 13:05:04 +0000539
540 // Figure out the local header offset from the central directory. The
541 // actual file data will begin after the local header and the name /
542 // extra comments.
Narayan Kamath926973e2014-06-09 14:18:14 +0100543 const off64_t local_header_offset = cdr->local_file_header_offset;
544 if (local_header_offset + static_cast<off64_t>(sizeof(LocalFileHeader)) >= cd_offset) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000545 ALOGW("Zip: bad local hdr offset in zip");
546 return kInvalidOffset;
547 }
548
Narayan Kamath926973e2014-06-09 14:18:14 +0100549 uint8_t lfh_buf[sizeof(LocalFileHeader)];
Tianjie Xu18c25922016-09-29 15:27:41 -0700550 if (!archive->mapped_zip.ReadAtOffset(lfh_buf, sizeof(lfh_buf), local_header_offset)) {
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800551 ALOGW("Zip: failed reading lfh name from offset %" PRId64,
552 static_cast<int64_t>(local_header_offset));
Narayan Kamath7462f022013-11-21 13:05:04 +0000553 return kIoError;
554 }
555
Narayan Kamath926973e2014-06-09 14:18:14 +0100556 const LocalFileHeader *lfh = reinterpret_cast<const LocalFileHeader*>(lfh_buf);
557
558 if (lfh->lfh_signature != LocalFileHeader::kSignature) {
Mark Salyzyn99ef9912014-03-14 14:26:22 -0700559 ALOGW("Zip: didn't find signature at start of lfh, offset=%" PRId64,
Narayan Kamath926973e2014-06-09 14:18:14 +0100560 static_cast<int64_t>(local_header_offset));
Narayan Kamath7462f022013-11-21 13:05:04 +0000561 return kInvalidOffset;
562 }
563
564 // Paranoia: Match the values specified in the local file header
565 // to those specified in the central directory.
Narayan Kamath926973e2014-06-09 14:18:14 +0100566 if ((lfh->gpb_flags & kGPBDDFlagMask) == 0) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000567 data->has_data_descriptor = 0;
Narayan Kamath926973e2014-06-09 14:18:14 +0100568 if (data->compressed_length != lfh->compressed_size
569 || data->uncompressed_length != lfh->uncompressed_size
570 || data->crc32 != lfh->crc32) {
Mark Salyzyn088bf902014-05-08 16:02:20 -0700571 ALOGW("Zip: size/crc32 mismatch. expected {%" PRIu32 ", %" PRIu32
572 ", %" PRIx32 "}, was {%" PRIu32 ", %" PRIu32 ", %" PRIx32 "}",
Narayan Kamath7462f022013-11-21 13:05:04 +0000573 data->compressed_length, data->uncompressed_length, data->crc32,
Narayan Kamath926973e2014-06-09 14:18:14 +0100574 lfh->compressed_size, lfh->uncompressed_size, lfh->crc32);
Narayan Kamath7462f022013-11-21 13:05:04 +0000575 return kInconsistentInformation;
576 }
577 } else {
578 data->has_data_descriptor = 1;
579 }
580
581 // Check that the local file header name matches the declared
582 // name in the central directory.
Narayan Kamath926973e2014-06-09 14:18:14 +0100583 if (lfh->file_name_length == nameLen) {
584 const off64_t name_offset = local_header_offset + sizeof(LocalFileHeader);
Mykola Kondratenko50afc152014-09-08 12:46:37 +0200585 if (name_offset + lfh->file_name_length > cd_offset) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000586 ALOGW("Zip: Invalid declared length");
587 return kInvalidOffset;
588 }
589
Tianjie Xu18c25922016-09-29 15:27:41 -0700590 std::vector<uint8_t> name_buf(nameLen);
591 if (!archive->mapped_zip.ReadAtOffset(name_buf.data(), nameLen, name_offset)) {
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800592 ALOGW("Zip: failed reading lfh name from offset %" PRId64, static_cast<int64_t>(name_offset));
Narayan Kamath7462f022013-11-21 13:05:04 +0000593 return kIoError;
594 }
595
Tianjie Xu18c25922016-09-29 15:27:41 -0700596 if (memcmp(archive->hash_table[ent].name, name_buf.data(), nameLen)) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000597 return kInconsistentInformation;
598 }
599
Narayan Kamath7462f022013-11-21 13:05:04 +0000600 } else {
601 ALOGW("Zip: lfh name did not match central directory.");
602 return kInconsistentInformation;
603 }
604
Narayan Kamath926973e2014-06-09 14:18:14 +0100605 const off64_t data_offset = local_header_offset + sizeof(LocalFileHeader)
606 + lfh->file_name_length + lfh->extra_field_length;
Narayan Kamath48953a12014-01-24 12:32:39 +0000607 if (data_offset > cd_offset) {
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800608 ALOGW("Zip: bad data offset %" PRId64 " in zip", static_cast<int64_t>(data_offset));
Narayan Kamath7462f022013-11-21 13:05:04 +0000609 return kInvalidOffset;
610 }
611
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800612 if (static_cast<off64_t>(data_offset + data->compressed_length) > cd_offset) {
Mark Salyzyn088bf902014-05-08 16:02:20 -0700613 ALOGW("Zip: bad compressed length in zip (%" PRId64 " + %" PRIu32 " > %" PRId64 ")",
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800614 static_cast<int64_t>(data_offset), data->compressed_length, static_cast<int64_t>(cd_offset));
Narayan Kamath7462f022013-11-21 13:05:04 +0000615 return kInvalidOffset;
616 }
617
618 if (data->method == kCompressStored &&
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800619 static_cast<off64_t>(data_offset + data->uncompressed_length) > cd_offset) {
Mark Salyzyn088bf902014-05-08 16:02:20 -0700620 ALOGW("Zip: bad uncompressed length in zip (%" PRId64 " + %" PRIu32 " > %" PRId64 ")",
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800621 static_cast<int64_t>(data_offset), data->uncompressed_length,
622 static_cast<int64_t>(cd_offset));
Narayan Kamath7462f022013-11-21 13:05:04 +0000623 return kInvalidOffset;
624 }
625
626 data->offset = data_offset;
627 return 0;
628}
629
630struct IterationHandle {
631 uint32_t position;
Piotr Jastrzebski10aa9a02014-08-19 09:01:20 +0100632 // We're not using vector here because this code is used in the Windows SDK
633 // where the STL is not available.
Yusuke Sato07447542015-06-25 14:39:19 -0700634 ZipString prefix;
635 ZipString suffix;
Narayan Kamath7462f022013-11-21 13:05:04 +0000636 ZipArchive* archive;
Piotr Jastrzebski8e085362014-08-18 11:37:45 +0100637
Yusuke Sato07447542015-06-25 14:39:19 -0700638 IterationHandle(const ZipString* in_prefix,
639 const ZipString* in_suffix) {
640 if (in_prefix) {
641 uint8_t* name_copy = new uint8_t[in_prefix->name_length];
642 memcpy(name_copy, in_prefix->name, in_prefix->name_length);
643 prefix.name = name_copy;
644 prefix.name_length = in_prefix->name_length;
645 } else {
646 prefix.name = NULL;
647 prefix.name_length = 0;
Yusuke Satof1d3d3b2015-06-25 14:09:00 -0700648 }
Yusuke Sato07447542015-06-25 14:39:19 -0700649 if (in_suffix) {
650 uint8_t* name_copy = new uint8_t[in_suffix->name_length];
651 memcpy(name_copy, in_suffix->name, in_suffix->name_length);
652 suffix.name = name_copy;
653 suffix.name_length = in_suffix->name_length;
654 } else {
655 suffix.name = NULL;
656 suffix.name_length = 0;
Yusuke Satof1d3d3b2015-06-25 14:09:00 -0700657 }
Piotr Jastrzebski8e085362014-08-18 11:37:45 +0100658 }
659
660 ~IterationHandle() {
Yusuke Sato07447542015-06-25 14:39:19 -0700661 delete[] prefix.name;
662 delete[] suffix.name;
Piotr Jastrzebski8e085362014-08-18 11:37:45 +0100663 }
Narayan Kamath7462f022013-11-21 13:05:04 +0000664};
665
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100666int32_t StartIteration(ZipArchiveHandle handle, void** cookie_ptr,
Yusuke Sato07447542015-06-25 14:39:19 -0700667 const ZipString* optional_prefix,
668 const ZipString* optional_suffix) {
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800669 ZipArchive* archive = reinterpret_cast<ZipArchive*>(handle);
Narayan Kamath7462f022013-11-21 13:05:04 +0000670
671 if (archive == NULL || archive->hash_table == NULL) {
672 ALOGW("Zip: Invalid ZipArchiveHandle");
673 return kInvalidHandle;
674 }
675
Yusuke Satof1d3d3b2015-06-25 14:09:00 -0700676 IterationHandle* cookie = new IterationHandle(optional_prefix, optional_suffix);
Narayan Kamath7462f022013-11-21 13:05:04 +0000677 cookie->position = 0;
Narayan Kamath7462f022013-11-21 13:05:04 +0000678 cookie->archive = archive;
Narayan Kamath7462f022013-11-21 13:05:04 +0000679
680 *cookie_ptr = cookie ;
681 return 0;
682}
683
Piotr Jastrzebski79c8b342014-08-08 14:02:17 +0100684void EndIteration(void* cookie) {
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100685 delete reinterpret_cast<IterationHandle*>(cookie);
Piotr Jastrzebski79c8b342014-08-08 14:02:17 +0100686}
687
Yusuke Sato07447542015-06-25 14:39:19 -0700688int32_t FindEntry(const ZipArchiveHandle handle, const ZipString& entryName,
Narayan Kamath7462f022013-11-21 13:05:04 +0000689 ZipEntry* data) {
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800690 const ZipArchive* archive = reinterpret_cast<ZipArchive*>(handle);
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100691 if (entryName.name_length == 0) {
692 ALOGW("Zip: Invalid filename %.*s", entryName.name_length, entryName.name);
Narayan Kamath7462f022013-11-21 13:05:04 +0000693 return kInvalidEntryName;
694 }
695
696 const int64_t ent = EntryToIndex(archive->hash_table,
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100697 archive->hash_table_size, entryName);
Narayan Kamath7462f022013-11-21 13:05:04 +0000698
699 if (ent < 0) {
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100700 ALOGV("Zip: Could not find entry %.*s", entryName.name_length, entryName.name);
Narayan Kamath7462f022013-11-21 13:05:04 +0000701 return ent;
702 }
703
704 return FindEntry(archive, ent, data);
705}
706
Yusuke Sato07447542015-06-25 14:39:19 -0700707int32_t Next(void* cookie, ZipEntry* data, ZipString* name) {
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800708 IterationHandle* handle = reinterpret_cast<IterationHandle*>(cookie);
Narayan Kamath7462f022013-11-21 13:05:04 +0000709 if (handle == NULL) {
710 return kInvalidHandle;
711 }
712
713 ZipArchive* archive = handle->archive;
714 if (archive == NULL || archive->hash_table == NULL) {
715 ALOGW("Zip: Invalid ZipArchiveHandle");
716 return kInvalidHandle;
717 }
718
719 const uint32_t currentOffset = handle->position;
720 const uint32_t hash_table_length = archive->hash_table_size;
Yusuke Sato07447542015-06-25 14:39:19 -0700721 const ZipString* hash_table = archive->hash_table;
Narayan Kamath7462f022013-11-21 13:05:04 +0000722
723 for (uint32_t i = currentOffset; i < hash_table_length; ++i) {
724 if (hash_table[i].name != NULL &&
Yusuke Sato07447542015-06-25 14:39:19 -0700725 (handle->prefix.name_length == 0 ||
726 hash_table[i].StartsWith(handle->prefix)) &&
727 (handle->suffix.name_length == 0 ||
728 hash_table[i].EndsWith(handle->suffix))) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000729 handle->position = (i + 1);
730 const int error = FindEntry(archive, i, data);
731 if (!error) {
732 name->name = hash_table[i].name;
733 name->name_length = hash_table[i].name_length;
734 }
735
736 return error;
737 }
738 }
739
740 handle->position = 0;
741 return kIterationEnd;
742}
743
Narayan Kamathf899bd52015-04-17 11:53:14 +0100744class Writer {
745 public:
746 virtual bool Append(uint8_t* buf, size_t buf_size) = 0;
747 virtual ~Writer() {}
748 protected:
749 Writer() = default;
750 private:
751 DISALLOW_COPY_AND_ASSIGN(Writer);
752};
753
754// A Writer that writes data to a fixed size memory region.
755// The size of the memory region must be equal to the total size of
756// the data appended to it.
757class MemoryWriter : public Writer {
758 public:
759 MemoryWriter(uint8_t* buf, size_t size) : Writer(),
760 buf_(buf), size_(size), bytes_written_(0) {
761 }
762
763 virtual bool Append(uint8_t* buf, size_t buf_size) override {
764 if (bytes_written_ + buf_size > size_) {
765 ALOGW("Zip: Unexpected size " ZD " (declared) vs " ZD " (actual)",
766 size_, bytes_written_ + buf_size);
767 return false;
768 }
769
770 memcpy(buf_ + bytes_written_, buf, buf_size);
771 bytes_written_ += buf_size;
772 return true;
773 }
774
775 private:
776 uint8_t* const buf_;
777 const size_t size_;
778 size_t bytes_written_;
779};
780
781// A Writer that appends data to a file |fd| at its current position.
782// The file will be truncated to the end of the written data.
783class FileWriter : public Writer {
784 public:
785
786 // Creates a FileWriter for |fd| and prepare to write |entry| to it,
787 // guaranteeing that the file descriptor is valid and that there's enough
788 // space on the volume to write out the entry completely and that the file
789 // is truncated to the correct length.
790 //
791 // Returns a valid FileWriter on success, |nullptr| if an error occurred.
792 static std::unique_ptr<FileWriter> Create(int fd, const ZipEntry* entry) {
793 const uint32_t declared_length = entry->uncompressed_length;
794 const off64_t current_offset = lseek64(fd, 0, SEEK_CUR);
795 if (current_offset == -1) {
796 ALOGW("Zip: unable to seek to current location on fd %d: %s", fd, strerror(errno));
797 return nullptr;
798 }
799
800 int result = 0;
801#if defined(__linux__)
802 if (declared_length > 0) {
803 // Make sure we have enough space on the volume to extract the compressed
804 // entry. Note that the call to ftruncate below will change the file size but
805 // will not allocate space on disk and this call to fallocate will not
806 // change the file size.
Badhri Jagan Sridharana68d0d12015-06-02 14:47:57 -0700807 // Note: fallocate is only supported by the following filesystems -
808 // btrfs, ext4, ocfs2, and xfs. Therefore fallocate might fail with
809 // EOPNOTSUPP error when issued in other filesystems.
810 // Hence, check for the return error code before concluding that the
811 // disk does not have enough space.
Narayan Kamathf899bd52015-04-17 11:53:14 +0100812 result = TEMP_FAILURE_RETRY(fallocate(fd, 0, current_offset, declared_length));
Badhri Jagan Sridharana68d0d12015-06-02 14:47:57 -0700813 if (result == -1 && errno == ENOSPC) {
Narayan Kamathd5d7abe2016-08-10 12:24:05 +0100814 ALOGW("Zip: unable to allocate %" PRId64 " bytes at offset %" PRId64 " : %s",
815 static_cast<int64_t>(declared_length), static_cast<int64_t>(current_offset),
816 strerror(errno));
Narayan Kamathf899bd52015-04-17 11:53:14 +0100817 return std::unique_ptr<FileWriter>(nullptr);
818 }
819 }
820#endif // __linux__
821
822 result = TEMP_FAILURE_RETRY(ftruncate(fd, declared_length + current_offset));
823 if (result == -1) {
824 ALOGW("Zip: unable to truncate file to %" PRId64 ": %s",
825 static_cast<int64_t>(declared_length + current_offset), strerror(errno));
826 return std::unique_ptr<FileWriter>(nullptr);
827 }
828
829 return std::unique_ptr<FileWriter>(new FileWriter(fd, declared_length));
830 }
831
832 virtual bool Append(uint8_t* buf, size_t buf_size) override {
833 if (total_bytes_written_ + buf_size > declared_length_) {
834 ALOGW("Zip: Unexpected size " ZD " (declared) vs " ZD " (actual)",
835 declared_length_, total_bytes_written_ + buf_size);
836 return false;
837 }
838
Narayan Kamathe97e66e2015-04-27 16:25:53 +0100839 const bool result = android::base::WriteFully(fd_, buf, buf_size);
840 if (result) {
841 total_bytes_written_ += buf_size;
842 } else {
843 ALOGW("Zip: unable to write " ZD " bytes to file; %s", buf_size, strerror(errno));
Narayan Kamathf899bd52015-04-17 11:53:14 +0100844 }
845
Narayan Kamathe97e66e2015-04-27 16:25:53 +0100846 return result;
Narayan Kamathf899bd52015-04-17 11:53:14 +0100847 }
848 private:
849 FileWriter(const int fd, const size_t declared_length) :
850 Writer(),
851 fd_(fd),
852 declared_length_(declared_length),
853 total_bytes_written_(0) {
854 }
855
856 const int fd_;
857 const size_t declared_length_;
858 size_t total_bytes_written_;
859};
860
Dmitriy Ivanovf94e1592015-03-06 13:27:59 -0800861// This method is using libz macros with old-style-casts
862#pragma GCC diagnostic push
863#pragma GCC diagnostic ignored "-Wold-style-cast"
864static inline int zlib_inflateInit2(z_stream* stream, int window_bits) {
865 return inflateInit2(stream, window_bits);
866}
867#pragma GCC diagnostic pop
868
Tianjie Xu18c25922016-09-29 15:27:41 -0700869static int32_t InflateEntryToWriter(MappedZipFile& mapped_zip, const ZipEntry* entry,
Narayan Kamathf899bd52015-04-17 11:53:14 +0100870 Writer* writer, uint64_t* crc_out) {
Dmitriy Ivanovedbabfe2015-03-12 09:58:15 -0700871 const size_t kBufSize = 32768;
872 std::vector<uint8_t> read_buf(kBufSize);
873 std::vector<uint8_t> write_buf(kBufSize);
Narayan Kamath7462f022013-11-21 13:05:04 +0000874 z_stream zstream;
875 int zerr;
876
877 /*
878 * Initialize the zlib stream struct.
879 */
880 memset(&zstream, 0, sizeof(zstream));
881 zstream.zalloc = Z_NULL;
882 zstream.zfree = Z_NULL;
883 zstream.opaque = Z_NULL;
884 zstream.next_in = NULL;
885 zstream.avail_in = 0;
Dmitriy Ivanovedbabfe2015-03-12 09:58:15 -0700886 zstream.next_out = &write_buf[0];
Narayan Kamath7462f022013-11-21 13:05:04 +0000887 zstream.avail_out = kBufSize;
888 zstream.data_type = Z_UNKNOWN;
889
890 /*
891 * Use the undocumented "negative window bits" feature to tell zlib
892 * that there's no zlib header waiting for it.
893 */
Dmitriy Ivanovf94e1592015-03-06 13:27:59 -0800894 zerr = zlib_inflateInit2(&zstream, -MAX_WBITS);
Narayan Kamath7462f022013-11-21 13:05:04 +0000895 if (zerr != Z_OK) {
896 if (zerr == Z_VERSION_ERROR) {
897 ALOGE("Installed zlib is not compatible with linked version (%s)",
898 ZLIB_VERSION);
899 } else {
900 ALOGW("Call to inflateInit2 failed (zerr=%d)", zerr);
901 }
902
903 return kZlibError;
904 }
905
Dmitriy Ivanov1f741e52015-03-06 14:26:37 -0800906 auto zstream_deleter = [](z_stream* stream) {
907 inflateEnd(stream); /* free up any allocated structures */
908 };
909
910 std::unique_ptr<z_stream, decltype(zstream_deleter)> zstream_guard(&zstream, zstream_deleter);
911
Narayan Kamath7462f022013-11-21 13:05:04 +0000912 const uint32_t uncompressed_length = entry->uncompressed_length;
913
914 uint32_t compressed_length = entry->compressed_length;
Narayan Kamath7462f022013-11-21 13:05:04 +0000915 do {
916 /* read as much as we can */
917 if (zstream.avail_in == 0) {
Yabin Cuib2a77002016-02-08 16:26:33 -0800918 const size_t getSize = (compressed_length > kBufSize) ? kBufSize : compressed_length;
Tianjie Xu18c25922016-09-29 15:27:41 -0700919 if (!mapped_zip.ReadData(read_buf.data(), getSize)) {
Yabin Cuib2a77002016-02-08 16:26:33 -0800920 ALOGW("Zip: inflate read failed, getSize = %zu: %s", getSize, strerror(errno));
Dmitriy Ivanov1f741e52015-03-06 14:26:37 -0800921 return kIoError;
Narayan Kamath7462f022013-11-21 13:05:04 +0000922 }
923
924 compressed_length -= getSize;
925
Dmitriy Ivanovedbabfe2015-03-12 09:58:15 -0700926 zstream.next_in = &read_buf[0];
Narayan Kamath7462f022013-11-21 13:05:04 +0000927 zstream.avail_in = getSize;
928 }
929
930 /* uncompress the data */
931 zerr = inflate(&zstream, Z_NO_FLUSH);
932 if (zerr != Z_OK && zerr != Z_STREAM_END) {
933 ALOGW("Zip: inflate zerr=%d (nIn=%p aIn=%u nOut=%p aOut=%u)",
934 zerr, zstream.next_in, zstream.avail_in,
935 zstream.next_out, zstream.avail_out);
Dmitriy Ivanov1f741e52015-03-06 14:26:37 -0800936 return kZlibError;
Narayan Kamath7462f022013-11-21 13:05:04 +0000937 }
938
939 /* write when we're full or when we're done */
940 if (zstream.avail_out == 0 ||
941 (zerr == Z_STREAM_END && zstream.avail_out != kBufSize)) {
Dmitriy Ivanovedbabfe2015-03-12 09:58:15 -0700942 const size_t write_size = zstream.next_out - &write_buf[0];
Narayan Kamathf899bd52015-04-17 11:53:14 +0100943 if (!writer->Append(&write_buf[0], write_size)) {
944 // The file might have declared a bogus length.
945 return kInconsistentInformation;
Narayan Kamath7462f022013-11-21 13:05:04 +0000946 }
Narayan Kamath7462f022013-11-21 13:05:04 +0000947
Dmitriy Ivanovedbabfe2015-03-12 09:58:15 -0700948 zstream.next_out = &write_buf[0];
Narayan Kamath7462f022013-11-21 13:05:04 +0000949 zstream.avail_out = kBufSize;
950 }
951 } while (zerr == Z_OK);
952
953 assert(zerr == Z_STREAM_END); /* other errors should've been caught */
954
955 // stream.adler holds the crc32 value for such streams.
956 *crc_out = zstream.adler;
957
958 if (zstream.total_out != uncompressed_length || compressed_length != 0) {
Mark Salyzyn088bf902014-05-08 16:02:20 -0700959 ALOGW("Zip: size mismatch on inflated file (%lu vs %" PRIu32 ")",
Narayan Kamath7462f022013-11-21 13:05:04 +0000960 zstream.total_out, uncompressed_length);
Dmitriy Ivanov1f741e52015-03-06 14:26:37 -0800961 return kInconsistentInformation;
Narayan Kamath7462f022013-11-21 13:05:04 +0000962 }
963
Dmitriy Ivanov1f741e52015-03-06 14:26:37 -0800964 return 0;
Narayan Kamath7462f022013-11-21 13:05:04 +0000965}
966
Tianjie Xu18c25922016-09-29 15:27:41 -0700967static int32_t CopyEntryToWriter(MappedZipFile& mapped_zip, const ZipEntry* entry, Writer* writer,
Narayan Kamathf899bd52015-04-17 11:53:14 +0100968 uint64_t *crc_out) {
969 static const uint32_t kBufSize = 32768;
970 std::vector<uint8_t> buf(kBufSize);
971
972 const uint32_t length = entry->uncompressed_length;
973 uint32_t count = 0;
974 uint64_t crc = 0;
975 while (count < length) {
976 uint32_t remaining = length - count;
977
978 // Safe conversion because kBufSize is narrow enough for a 32 bit signed
979 // value.
Yabin Cuib2a77002016-02-08 16:26:33 -0800980 const size_t block_size = (remaining > kBufSize) ? kBufSize : remaining;
Tianjie Xu18c25922016-09-29 15:27:41 -0700981 if (!mapped_zip.ReadData(buf.data(), block_size)) {
Yabin Cuib2a77002016-02-08 16:26:33 -0800982 ALOGW("CopyFileToFile: copy read failed, block_size = %zu: %s", block_size, strerror(errno));
Narayan Kamathf899bd52015-04-17 11:53:14 +0100983 return kIoError;
984 }
985
986 if (!writer->Append(&buf[0], block_size)) {
987 return kIoError;
988 }
989 crc = crc32(crc, &buf[0], block_size);
990 count += block_size;
991 }
992
993 *crc_out = crc;
994
995 return 0;
996}
997
998int32_t ExtractToWriter(ZipArchiveHandle handle,
999 ZipEntry* entry, Writer* writer) {
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -08001000 ZipArchive* archive = reinterpret_cast<ZipArchive*>(handle);
Narayan Kamath7462f022013-11-21 13:05:04 +00001001 const uint16_t method = entry->method;
1002 off64_t data_offset = entry->offset;
1003
Tianjie Xu18c25922016-09-29 15:27:41 -07001004 if (!archive->mapped_zip.SeekToOffset(data_offset)) {
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -08001005 ALOGW("Zip: lseek to data at %" PRId64 " failed", static_cast<int64_t>(data_offset));
Narayan Kamath7462f022013-11-21 13:05:04 +00001006 return kIoError;
1007 }
1008
1009 // this should default to kUnknownCompressionMethod.
1010 int32_t return_value = -1;
1011 uint64_t crc = 0;
1012 if (method == kCompressStored) {
Tianjie Xu18c25922016-09-29 15:27:41 -07001013 return_value = CopyEntryToWriter(archive->mapped_zip, entry, writer, &crc);
Narayan Kamath7462f022013-11-21 13:05:04 +00001014 } else if (method == kCompressDeflated) {
Tianjie Xu18c25922016-09-29 15:27:41 -07001015 return_value = InflateEntryToWriter(archive->mapped_zip, entry, writer, &crc);
Narayan Kamath7462f022013-11-21 13:05:04 +00001016 }
1017
1018 if (!return_value && entry->has_data_descriptor) {
Tianjie Xu18c25922016-09-29 15:27:41 -07001019 return_value = UpdateEntryFromDataDescriptor(archive->mapped_zip, entry);
Narayan Kamath7462f022013-11-21 13:05:04 +00001020 if (return_value) {
1021 return return_value;
1022 }
1023 }
1024
1025 // TODO: Fix this check by passing the right flags to inflate2 so that
1026 // it calculates the CRC for us.
1027 if (entry->crc32 != crc && false) {
Mark Salyzyn088bf902014-05-08 16:02:20 -07001028 ALOGW("Zip: crc mismatch: expected %" PRIu32 ", was %" PRIu64, entry->crc32, crc);
Narayan Kamath7462f022013-11-21 13:05:04 +00001029 return kInconsistentInformation;
1030 }
1031
1032 return return_value;
1033}
1034
Narayan Kamathf899bd52015-04-17 11:53:14 +01001035int32_t ExtractToMemory(ZipArchiveHandle handle, ZipEntry* entry,
1036 uint8_t* begin, uint32_t size) {
1037 std::unique_ptr<Writer> writer(new MemoryWriter(begin, size));
1038 return ExtractToWriter(handle, entry, writer.get());
1039}
1040
Narayan Kamath7462f022013-11-21 13:05:04 +00001041int32_t ExtractEntryToFile(ZipArchiveHandle handle,
1042 ZipEntry* entry, int fd) {
Narayan Kamathf899bd52015-04-17 11:53:14 +01001043 std::unique_ptr<Writer> writer(FileWriter::Create(fd, entry));
1044 if (writer.get() == nullptr) {
Narayan Kamath7462f022013-11-21 13:05:04 +00001045 return kIoError;
1046 }
1047
Narayan Kamathf899bd52015-04-17 11:53:14 +01001048 return ExtractToWriter(handle, entry, writer.get());
Narayan Kamath7462f022013-11-21 13:05:04 +00001049}
1050
1051const char* ErrorCodeString(int32_t error_code) {
1052 if (error_code > kErrorMessageLowerBound && error_code < kErrorMessageUpperBound) {
1053 return kErrorMessages[error_code * -1];
1054 }
1055
1056 return kErrorMessages[0];
1057}
1058
1059int GetFileDescriptor(const ZipArchiveHandle handle) {
Tianjie Xu18c25922016-09-29 15:27:41 -07001060 return reinterpret_cast<ZipArchive*>(handle)->mapped_zip.GetFileDescriptor();
Narayan Kamath7462f022013-11-21 13:05:04 +00001061}
Colin Cross7c6c7f02016-09-16 10:15:51 -07001062
1063ZipString::ZipString(const char* entry_name)
1064 : name(reinterpret_cast<const uint8_t*>(entry_name)) {
1065 size_t len = strlen(entry_name);
1066 CHECK_LE(len, static_cast<size_t>(UINT16_MAX));
1067 name_length = static_cast<uint16_t>(len);
1068}
Tianjie Xu18c25922016-09-29 15:27:41 -07001069
1070#if !defined(_WIN32)
1071class ProcessWriter : public Writer {
1072 public:
1073 ProcessWriter(ProcessZipEntryFunction func, void* cookie) : Writer(),
1074 proc_function_(func),
1075 cookie_(cookie) {
1076 }
1077
1078 virtual bool Append(uint8_t* buf, size_t buf_size) override {
1079 return proc_function_(buf, buf_size, cookie_);
1080 }
1081
1082 private:
1083 ProcessZipEntryFunction proc_function_;
1084 void* cookie_;
1085};
1086
1087int32_t ProcessZipEntryContents(ZipArchiveHandle handle, ZipEntry* entry,
1088 ProcessZipEntryFunction func, void* cookie) {
1089 ProcessWriter writer(func, cookie);
1090 return ExtractToWriter(handle, entry, &writer);
1091}
1092
1093#endif //!defined(_WIN32)
1094
1095int MappedZipFile::GetFileDescriptor() const {
1096 if (!has_fd_) {
1097 ALOGW("Zip: MappedZipFile doesn't have a file descriptor.");
1098 return -1;
1099 }
1100 return fd_;
1101}
1102
1103void* MappedZipFile::GetBasePtr() const {
1104 if (has_fd_) {
1105 ALOGW("Zip: MappedZipFile doesn't have a base pointer.");
1106 return nullptr;
1107 }
1108 return base_ptr_;
1109}
1110
1111off64_t MappedZipFile::GetFileLength() const {
1112 if (has_fd_) {
1113 off64_t result = lseek64(fd_, 0, SEEK_END);
1114 if (result == -1) {
1115 ALOGE("Zip: lseek on fd %d failed: %s", fd_, strerror(errno));
1116 }
1117 return result;
1118 } else {
1119 if (base_ptr_ == nullptr) {
1120 ALOGE("Zip: invalid file map\n");
1121 return -1;
1122 }
1123 return static_cast<off64_t>(data_length_);
1124 }
1125}
1126
1127bool MappedZipFile::SeekToOffset(off64_t offset) {
1128 if (has_fd_) {
1129 if (lseek64(fd_, offset, SEEK_SET) != offset) {
1130 ALOGE("Zip: lseek to %" PRId64 " failed: %s\n", offset, strerror(errno));
1131 return false;
1132 }
1133 return true;
1134 } else {
1135 if (offset < 0 || offset > static_cast<off64_t>(data_length_)) {
1136 ALOGE("Zip: invalid offset: %" PRId64 ", data length: %" PRId64 "\n" , offset,
1137 data_length_);
1138 return false;
1139 }
1140
1141 read_pos_ = offset;
1142 return true;
1143 }
1144}
1145
1146bool MappedZipFile::ReadData(uint8_t* buffer, size_t read_amount) {
1147 if (has_fd_) {
1148 if(!android::base::ReadFully(fd_, buffer, read_amount)) {
1149 ALOGE("Zip: read from %d failed\n", fd_);
1150 return false;
1151 }
1152 } else {
1153 memcpy(buffer, static_cast<uint8_t*>(base_ptr_) + read_pos_, read_amount);
1154 read_pos_ += read_amount;
1155 }
1156 return true;
1157}
1158
1159// Attempts to read |len| bytes into |buf| at offset |off|.
1160bool MappedZipFile::ReadAtOffset(uint8_t* buf, size_t len, off64_t off) {
1161#if !defined(_WIN32)
1162 if (has_fd_) {
1163 if (static_cast<size_t>(TEMP_FAILURE_RETRY(pread64(fd_, buf, len, off))) != len) {
1164 ALOGE("Zip: failed to read at offset %" PRId64 "\n", off);
1165 return false;
1166 }
1167 return true;
1168 }
1169#endif
1170 if (!SeekToOffset(off)) {
1171 return false;
1172 }
1173 return ReadData(buf, len);
1174
1175}
1176
1177void CentralDirectory::Initialize(void* map_base_ptr, off64_t cd_start_offset, size_t cd_size) {
1178 base_ptr_ = static_cast<uint8_t*>(map_base_ptr) + cd_start_offset;
1179 length_ = cd_size;
1180}
1181
1182bool ZipArchive::InitializeCentralDirectory(const char* debug_file_name, off64_t cd_start_offset,
1183 size_t cd_size) {
1184 if (mapped_zip.HasFd()) {
1185 if (!directory_map->create(debug_file_name, mapped_zip.GetFileDescriptor(),
1186 cd_start_offset, cd_size, true /* read only */)) {
1187 return false;
1188 }
1189
1190 CHECK_EQ(directory_map->getDataLength(), cd_size);
1191 central_directory.Initialize(directory_map->getDataPtr(), 0/*offset*/, cd_size);
1192 } else {
1193 if (mapped_zip.GetBasePtr() == nullptr) {
1194 ALOGE("Zip: Failed to map central directory, bad mapped_zip base pointer\n");
1195 return false;
1196 }
1197 if (static_cast<off64_t>(cd_start_offset) + static_cast<off64_t>(cd_size) >
1198 mapped_zip.GetFileLength()) {
1199 ALOGE("Zip: Failed to map central directory, offset exceeds mapped memory region ("
1200 "start_offset %" PRId64 ", cd_size %zu, mapped_region_size %" PRId64 ")",
1201 static_cast<int64_t>(cd_start_offset), cd_size, mapped_zip.GetFileLength());
1202 return false;
1203 }
1204
1205 central_directory.Initialize(mapped_zip.GetBasePtr(), cd_start_offset, cd_size);
1206 }
1207 return true;
1208}