blob: ebbab9f21cbc14907fe99881551572170b50d2ee [file] [log] [blame]
Narayan Kamath7462f022013-11-21 13:05:04 +00001/*
2 * Copyright (C) 2008 The Android Open Source Project
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 * http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
16
17/*
18 * Read-only access to Zip archives, with minimal heap allocation.
19 */
Narayan Kamath7462f022013-11-21 13:05:04 +000020
21#include <assert.h>
22#include <errno.h>
Mark Salyzyn99ef9912014-03-14 14:26:22 -070023#include <fcntl.h>
24#include <inttypes.h>
Narayan Kamath7462f022013-11-21 13:05:04 +000025#include <limits.h>
26#include <log/log.h>
Narayan Kamath7462f022013-11-21 13:05:04 +000027#include <stdlib.h>
28#include <string.h>
Narayan Kamath7462f022013-11-21 13:05:04 +000029#include <unistd.h>
Mark Salyzyn51d562d2014-05-05 14:38:05 -070030#include <utils/Compat.h>
Narayan Kamatheaf98852013-12-11 14:51:51 +000031#include <utils/FileMap.h>
Mark Salyzyn99ef9912014-03-14 14:26:22 -070032#include <zlib.h>
Narayan Kamath7462f022013-11-21 13:05:04 +000033
34#include <JNIHelp.h> // TEMP_FAILURE_RETRY may or may not be in unistd
35
Narayan Kamath044bc8e2014-12-03 18:22:53 +000036#include "entry_name_utils-inl.h"
Mark Salyzyn99ef9912014-03-14 14:26:22 -070037#include "ziparchive/zip_archive.h"
38
Narayan Kamath044bc8e2014-12-03 18:22:53 +000039
// Needed for Windows, where archives must be opened in binary mode (weird
// things happen otherwise). When <fcntl.h> does not provide O_BINARY, define
// it as 0 so that it can be OR-ed into open() flags without any effect.
#if !defined(O_BINARY)
#define O_BINARY 0
#endif
45
// Declares (without defining) the default constructor, the copy constructor
// and the copy-assignment operator of |Type|. Meant to be expanded inside a
// private section so that the type can be neither default-constructed nor
// copied by outside code.
#define DISALLOW_IMPLICIT_CONSTRUCTORS(Type) \
  Type();                                    \
  Type(const Type&);                         \
  void operator=(const Type&)
Narayan Kamath7462f022013-11-21 13:05:04 +000050
Narayan Kamath926973e2014-06-09 14:18:14 +010051// The "end of central directory" (EOCD) record. Each archive
52// contains exactly once such record which appears at the end of
53// the archive. It contains archive wide information like the
54// number of entries in the archive and the offset to the central
55// directory of the offset.
56struct EocdRecord {
57 static const uint32_t kSignature = 0x06054b50;
Narayan Kamath7462f022013-11-21 13:05:04 +000058
Narayan Kamath926973e2014-06-09 14:18:14 +010059 // End of central directory signature, should always be
60 // |kSignature|.
61 uint32_t eocd_signature;
62 // The number of the current "disk", i.e, the "disk" that this
63 // central directory is on.
64 //
65 // This implementation assumes that each archive spans a single
66 // disk only. i.e, that disk_num == 1.
67 uint16_t disk_num;
68 // The disk where the central directory starts.
69 //
70 // This implementation assumes that each archive spans a single
71 // disk only. i.e, that cd_start_disk == 1.
72 uint16_t cd_start_disk;
73 // The number of central directory records on this disk.
74 //
75 // This implementation assumes that each archive spans a single
76 // disk only. i.e, that num_records_on_disk == num_records.
77 uint16_t num_records_on_disk;
78 // The total number of central directory records.
79 uint16_t num_records;
80 // The size of the central directory (in bytes).
81 uint32_t cd_size;
82 // The offset of the start of the central directory, relative
83 // to the start of the file.
84 uint32_t cd_start_offset;
85 // Length of the central directory comment.
86 uint16_t comment_length;
87 private:
88 DISALLOW_IMPLICIT_CONSTRUCTORS(EocdRecord);
89} __attribute__((packed));
Narayan Kamath7462f022013-11-21 13:05:04 +000090
Narayan Kamath926973e2014-06-09 14:18:14 +010091// A structure representing the fixed length fields for a single
92// record in the central directory of the archive. In addition to
93// the fixed length fields listed here, each central directory
94// record contains a variable length "file_name" and "extra_field"
95// whose lengths are given by |file_name_length| and |extra_field_length|
96// respectively.
97struct CentralDirectoryRecord {
98 static const uint32_t kSignature = 0x02014b50;
Narayan Kamath7462f022013-11-21 13:05:04 +000099
Narayan Kamath926973e2014-06-09 14:18:14 +0100100 // The start of record signature. Must be |kSignature|.
101 uint32_t record_signature;
102 // Tool version. Ignored by this implementation.
103 uint16_t version_made_by;
104 // Tool version. Ignored by this implementation.
105 uint16_t version_needed;
106 // The "general purpose bit flags" for this entry. The only
107 // flag value that we currently check for is the "data descriptor"
108 // flag.
109 uint16_t gpb_flags;
110 // The compression method for this entry, one of |kCompressStored|
111 // and |kCompressDeflated|.
112 uint16_t compression_method;
113 // The file modification time and date for this entry.
114 uint16_t last_mod_time;
115 uint16_t last_mod_date;
116 // The CRC-32 checksum for this entry.
117 uint32_t crc32;
118 // The compressed size (in bytes) of this entry.
119 uint32_t compressed_size;
120 // The uncompressed size (in bytes) of this entry.
121 uint32_t uncompressed_size;
122 // The length of the entry file name in bytes. The file name
123 // will appear immediately after this record.
124 uint16_t file_name_length;
125 // The length of the extra field info (in bytes). This data
126 // will appear immediately after the entry file name.
127 uint16_t extra_field_length;
128 // The length of the entry comment (in bytes). This data will
129 // appear immediately after the extra field.
130 uint16_t comment_length;
131 // The start disk for this entry. Ignored by this implementation).
132 uint16_t file_start_disk;
133 // File attributes. Ignored by this implementation.
134 uint16_t internal_file_attributes;
135 // File attributes. Ignored by this implementation.
136 uint32_t external_file_attributes;
137 // The offset to the local file header for this entry, from the
138 // beginning of this archive.
139 uint32_t local_file_header_offset;
140 private:
141 DISALLOW_IMPLICIT_CONSTRUCTORS(CentralDirectoryRecord);
142} __attribute__((packed));
Narayan Kamath7462f022013-11-21 13:05:04 +0000143
Narayan Kamath926973e2014-06-09 14:18:14 +0100144// The local file header for a given entry. This duplicates information
145// present in the central directory of the archive. It is an error for
146// the information here to be different from the central directory
147// information for a given entry.
148struct LocalFileHeader {
149 static const uint32_t kSignature = 0x04034b50;
Narayan Kamath7462f022013-11-21 13:05:04 +0000150
Narayan Kamath926973e2014-06-09 14:18:14 +0100151 // The local file header signature, must be |kSignature|.
152 uint32_t lfh_signature;
153 // Tool version. Ignored by this implementation.
154 uint16_t version_needed;
155 // The "general purpose bit flags" for this entry. The only
156 // flag value that we currently check for is the "data descriptor"
157 // flag.
158 uint16_t gpb_flags;
159 // The compression method for this entry, one of |kCompressStored|
160 // and |kCompressDeflated|.
161 uint16_t compression_method;
162 // The file modification time and date for this entry.
163 uint16_t last_mod_time;
164 uint16_t last_mod_date;
165 // The CRC-32 checksum for this entry.
166 uint32_t crc32;
167 // The compressed size (in bytes) of this entry.
168 uint32_t compressed_size;
169 // The uncompressed size (in bytes) of this entry.
170 uint32_t uncompressed_size;
171 // The length of the entry file name in bytes. The file name
172 // will appear immediately after this record.
173 uint16_t file_name_length;
174 // The length of the extra field info (in bytes). This data
175 // will appear immediately after the entry file name.
176 uint16_t extra_field_length;
177 private:
178 DISALLOW_IMPLICIT_CONSTRUCTORS(LocalFileHeader);
179} __attribute__((packed));
180
181struct DataDescriptor {
182 // The *optional* data descriptor start signature.
183 static const uint32_t kOptSignature = 0x08074b50;
184
185 // CRC-32 checksum of the entry.
186 uint32_t crc32;
187 // Compressed size of the entry.
188 uint32_t compressed_size;
189 // Uncompressed size of the entry.
190 uint32_t uncompressed_size;
191 private:
192 DISALLOW_IMPLICIT_CONSTRUCTORS(DataDescriptor);
193} __attribute__((packed));
194
195#undef DISALLOW_IMPLICIT_CONSTRUCTORS
196
Piotr Jastrzebskibd0a7482014-08-13 09:49:25 +0000197static const uint32_t kGPBDDFlagMask = 0x0008; // mask value that signifies that the entry has a DD
Narayan Kamath7462f022013-11-21 13:05:04 +0000198
Narayan Kamath926973e2014-06-09 14:18:14 +0100199// The maximum size of a central directory or a file
200// comment in bytes.
201static const uint32_t kMaxCommentLen = 65535;
202
203// The maximum number of bytes to scan backwards for the EOCD start.
204static const uint32_t kMaxEOCDSearch = kMaxCommentLen + sizeof(EocdRecord);
205
// Human readable descriptions of the error codes defined below. The entry
// at index i lines up with error code -i (for example index 1 matches
// kIterationEnd and index 12 matches kMmapFailed); index 0 is the fallback
// text for unrecognised codes.
static const char* kErrorMessages[] = {
  "Unknown return code.",          //   0
  "Iteration ended",               //  -1
  "Zlib error",                    //  -2
  "Invalid file",                  //  -3
  "Invalid handle",                //  -4
  "Duplicate entries in archive",  //  -5
  "Empty archive",                 //  -6
  "Entry not found",               //  -7
  "Invalid offset",                //  -8
  "Inconsistent information",      //  -9
  "Invalid entry name",            // -10
  "I/O Error",                     // -11
  "File mapping failed"            // -12
};
221
// One above the largest defined error code (-1).
static const int32_t kErrorMessageUpperBound = 0;

// Code whose message is "Iteration ended".
static const int32_t kIterationEnd = -1;

// We encountered a Zlib error when inflating a stream from this file.
// Usually indicates file corruption.
static const int32_t kZlibError = -2;

// The input file cannot be processed as a zip archive. Usually because
// it's too small, too large or does not have a valid signature.
static const int32_t kInvalidFile = -3;

// An invalid iteration / ziparchive handle was passed in as an input
// argument.
static const int32_t kInvalidHandle = -4;

// The zip archive contained two (or possibly more) entries with the same
// name.
static const int32_t kDuplicateEntry = -5;

// The zip archive contains no entries.
static const int32_t kEmptyArchive = -6;

// The specified entry was not found in the archive.
static const int32_t kEntryNotFound = -7;

// The zip archive contained an invalid local file header pointer.
static const int32_t kInvalidOffset = -8;

// The zip archive contained inconsistent entry information. This could
// be because the central directory & local file header did not agree, or
// because the actual uncompressed length or crc32 do not match their
// declared values.
static const int32_t kInconsistentInformation = -9;

// An invalid entry name was encountered.
static const int32_t kInvalidEntryName = -10;

// An I/O related system call (read, lseek, ftruncate, map) failed.
static const int32_t kIoError = -11;

// We were not able to mmap the central directory or entry contents.
static const int32_t kMmapFailed = -12;

// One below the smallest defined error code (-12).
static const int32_t kErrorMessageLowerBound = -13;

// Debug name string for temporary file mappings.
static const char kTempMappingFileName[] = "zip: ExtractFileToFile";
Narayan Kamath7462f022013-11-21 13:05:04 +0000269
270/*
271 * A Read-only Zip archive.
272 *
273 * We want "open" and "find entry by name" to be fast operations, and
274 * we want to use as little memory as possible. We memory-map the zip
275 * central directory, and load a hash table with pointers to the filenames
276 * (which aren't null-terminated). The other fields are at a fixed offset
277 * from the filename, so we don't need to extract those (but we do need
278 * to byte-read and endian-swap them every time we want them).
279 *
280 * It's possible that somebody has handed us a massive (~1GB) zip archive,
281 * so we can't expect to mmap the entire file.
282 *
283 * To speed comparisons when doing a lookup by name, we could make the mapping
284 * "private" (copy-on-write) and null-terminate the filenames after verifying
285 * the record structure. However, this requires a private mapping of
286 * every page that the Central Directory touches. Easier to tuck a copy
287 * of the string length into the hash table entry.
288 */
289struct ZipArchive {
290 /* open Zip archive */
Neil Fullerb1a113f2014-07-25 14:43:04 +0100291 const int fd;
Dmitriy Ivanov40b52b22014-07-15 19:33:00 -0700292 const bool close_file;
Narayan Kamath7462f022013-11-21 13:05:04 +0000293
294 /* mapped central directory area */
295 off64_t directory_offset;
Narayan Kamatheaf98852013-12-11 14:51:51 +0000296 android::FileMap* directory_map;
Narayan Kamath7462f022013-11-21 13:05:04 +0000297
298 /* number of entries in the Zip archive */
299 uint16_t num_entries;
300
301 /*
302 * We know how many entries are in the Zip archive, so we can have a
303 * fixed-size hash table. We define a load factor of 0.75 and overallocat
304 * so the maximum number entries can never be higher than
305 * ((4 * UINT16_MAX) / 3 + 1) which can safely fit into a uint32_t.
306 */
307 uint32_t hash_table_size;
308 ZipEntryName* hash_table;
Neil Fullerb1a113f2014-07-25 14:43:04 +0100309
Dmitriy Ivanov40b52b22014-07-15 19:33:00 -0700310 ZipArchive(const int fd, bool assume_ownership) :
Neil Fullerb1a113f2014-07-25 14:43:04 +0100311 fd(fd),
Dmitriy Ivanov40b52b22014-07-15 19:33:00 -0700312 close_file(assume_ownership),
Neil Fullerb1a113f2014-07-25 14:43:04 +0100313 directory_offset(0),
314 directory_map(NULL),
315 num_entries(0),
316 hash_table_size(0),
317 hash_table(NULL) {}
318
319 ~ZipArchive() {
Dmitriy Ivanov40b52b22014-07-15 19:33:00 -0700320 if (close_file && fd >= 0) {
Neil Fullerb1a113f2014-07-25 14:43:04 +0100321 close(fd);
322 }
323
Narayan Kamath6832a7a2015-02-23 15:43:35 +0000324 delete directory_map;
Neil Fullerb1a113f2014-07-25 14:43:04 +0100325 free(hash_table);
326 }
Narayan Kamath7462f022013-11-21 13:05:04 +0000327};
328
329// Returns 0 on success and negative values on failure.
Narayan Kamatheaf98852013-12-11 14:51:51 +0000330static android::FileMap* MapFileSegment(const int fd, const off64_t start,
331 const size_t length, const bool read_only,
332 const char* debug_file_name) {
333 android::FileMap* file_map = new android::FileMap;
334 const bool success = file_map->create(debug_file_name, fd, start, length, read_only);
335 if (!success) {
Narayan Kamath6832a7a2015-02-23 15:43:35 +0000336 delete file_map;
Narayan Kamatheaf98852013-12-11 14:51:51 +0000337 return NULL;
Narayan Kamath7462f022013-11-21 13:05:04 +0000338 }
339
Narayan Kamatheaf98852013-12-11 14:51:51 +0000340 return file_map;
Narayan Kamath7462f022013-11-21 13:05:04 +0000341}
342
343static int32_t CopyFileToFile(int fd, uint8_t* begin, const uint32_t length, uint64_t *crc_out) {
344 static const uint32_t kBufSize = 32768;
345 uint8_t buf[kBufSize];
346
347 uint32_t count = 0;
348 uint64_t crc = 0;
Narayan Kamath58aaf462013-12-10 16:47:14 +0000349 while (count < length) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000350 uint32_t remaining = length - count;
351
352 // Safe conversion because kBufSize is narrow enough for a 32 bit signed
353 // value.
354 ssize_t get_size = (remaining > kBufSize) ? kBufSize : remaining;
355 ssize_t actual = TEMP_FAILURE_RETRY(read(fd, buf, get_size));
356
357 if (actual != get_size) {
Mark Salyzyn51d562d2014-05-05 14:38:05 -0700358 ALOGW("CopyFileToFile: copy read failed (" ZD " vs " ZD ")", actual, get_size);
Narayan Kamath7462f022013-11-21 13:05:04 +0000359 return kIoError;
360 }
361
362 memcpy(begin + count, buf, get_size);
363 crc = crc32(crc, buf, get_size);
364 count += get_size;
365 }
366
367 *crc_out = crc;
368
369 return 0;
370}
371
/*
 * Rounds |val| up to the nearest power of 2; a value that already is a
 * power of 2 is returned unchanged.
 *
 * Works by smearing the highest set bit of (val - 1) into every lower bit
 * and then adding one. Note that 0, and any value above 2^31, yields 0
 * because the arithmetic wraps around.
 *
 * Found on http://graphics.stanford.edu/~seander/bithacks.html.
 */
static uint32_t RoundUpPower2(uint32_t val) {
  uint32_t smeared = val - 1;
  for (uint32_t shift = 1; shift <= 16; shift <<= 1) {
    smeared |= smeared >> shift;
  }

  return smeared + 1;
}
388
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100389static uint32_t ComputeHash(const ZipEntryName& name) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000390 uint32_t hash = 0;
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100391 uint16_t len = name.name_length;
392 const uint8_t* str = name.name;
Narayan Kamath7462f022013-11-21 13:05:04 +0000393
394 while (len--) {
395 hash = hash * 31 + *str++;
396 }
397
398 return hash;
399}
400
401/*
402 * Convert a ZipEntry to a hash table index, verifying that it's in a
403 * valid range.
404 */
405static int64_t EntryToIndex(const ZipEntryName* hash_table,
406 const uint32_t hash_table_size,
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100407 const ZipEntryName& name) {
408 const uint32_t hash = ComputeHash(name);
Narayan Kamath7462f022013-11-21 13:05:04 +0000409
410 // NOTE: (hash_table_size - 1) is guaranteed to be non-negative.
411 uint32_t ent = hash & (hash_table_size - 1);
412 while (hash_table[ent].name != NULL) {
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100413 if (hash_table[ent].name_length == name.name_length &&
414 memcmp(hash_table[ent].name, name.name, name.name_length) == 0) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000415 return ent;
416 }
417
418 ent = (ent + 1) & (hash_table_size - 1);
419 }
420
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100421 ALOGV("Zip: Unable to find entry %.*s", name.name_length, name.name);
Narayan Kamath7462f022013-11-21 13:05:04 +0000422 return kEntryNotFound;
423}
424
425/*
426 * Add a new entry to the hash table.
427 */
428static int32_t AddToHash(ZipEntryName *hash_table, const uint64_t hash_table_size,
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100429 const ZipEntryName& name) {
430 const uint64_t hash = ComputeHash(name);
Narayan Kamath7462f022013-11-21 13:05:04 +0000431 uint32_t ent = hash & (hash_table_size - 1);
432
433 /*
434 * We over-allocated the table, so we're guaranteed to find an empty slot.
435 * Further, we guarantee that the hashtable size is not 0.
436 */
437 while (hash_table[ent].name != NULL) {
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100438 if (hash_table[ent].name_length == name.name_length &&
439 memcmp(hash_table[ent].name, name.name, name.name_length) == 0) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000440 // We've found a duplicate entry. We don't accept it
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100441 ALOGW("Zip: Found duplicate entry %.*s", name.name_length, name.name);
Narayan Kamath7462f022013-11-21 13:05:04 +0000442 return kDuplicateEntry;
443 }
444 ent = (ent + 1) & (hash_table_size - 1);
445 }
446
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100447 hash_table[ent].name = name.name;
448 hash_table[ent].name_length = name.name_length;
Narayan Kamath7462f022013-11-21 13:05:04 +0000449 return 0;
450}
451
Narayan Kamath7462f022013-11-21 13:05:04 +0000452static int32_t MapCentralDirectory0(int fd, const char* debug_file_name,
453 ZipArchive* archive, off64_t file_length,
Narayan Kamath926973e2014-06-09 14:18:14 +0100454 off64_t read_amount, uint8_t* scan_buffer) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000455 const off64_t search_start = file_length - read_amount;
456
457 if (lseek64(fd, search_start, SEEK_SET) != search_start) {
Narayan Kamath926973e2014-06-09 14:18:14 +0100458 ALOGW("Zip: seek %" PRId64 " failed: %s", static_cast<int64_t>(search_start),
459 strerror(errno));
Narayan Kamath7462f022013-11-21 13:05:04 +0000460 return kIoError;
461 }
Narayan Kamath926973e2014-06-09 14:18:14 +0100462 ssize_t actual = TEMP_FAILURE_RETRY(
463 read(fd, scan_buffer, static_cast<size_t>(read_amount)));
464 if (actual != static_cast<ssize_t>(read_amount)) {
465 ALOGW("Zip: read %" PRId64 " failed: %s", static_cast<int64_t>(read_amount),
466 strerror(errno));
Narayan Kamath7462f022013-11-21 13:05:04 +0000467 return kIoError;
468 }
469
470 /*
471 * Scan backward for the EOCD magic. In an archive without a trailing
472 * comment, we'll find it on the first try. (We may want to consider
473 * doing an initial minimal read; if we don't find it, retry with a
474 * second read as above.)
475 */
Narayan Kamath926973e2014-06-09 14:18:14 +0100476 int i = read_amount - sizeof(EocdRecord);
477 for (; i >= 0; i--) {
478 if (scan_buffer[i] == 0x50 &&
479 ((*reinterpret_cast<uint32_t*>(&scan_buffer[i])) == EocdRecord::kSignature)) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000480 ALOGV("+++ Found EOCD at buf+%d", i);
481 break;
482 }
483 }
484 if (i < 0) {
485 ALOGD("Zip: EOCD not found, %s is not zip", debug_file_name);
486 return kInvalidFile;
487 }
488
489 const off64_t eocd_offset = search_start + i;
Narayan Kamath926973e2014-06-09 14:18:14 +0100490 const EocdRecord* eocd = reinterpret_cast<const EocdRecord*>(scan_buffer + i);
Narayan Kamath7462f022013-11-21 13:05:04 +0000491 /*
Narayan Kamath926973e2014-06-09 14:18:14 +0100492 * Verify that there's no trailing space at the end of the central directory
493 * and its comment.
Narayan Kamath7462f022013-11-21 13:05:04 +0000494 */
Narayan Kamath926973e2014-06-09 14:18:14 +0100495 const off64_t calculated_length = eocd_offset + sizeof(EocdRecord)
496 + eocd->comment_length;
497 if (calculated_length != file_length) {
Narayan Kamath4f6b4992014-06-03 13:59:23 +0100498 ALOGW("Zip: %" PRId64 " extraneous bytes at the end of the central directory",
Narayan Kamath926973e2014-06-09 14:18:14 +0100499 static_cast<int64_t>(file_length - calculated_length));
Narayan Kamath4f6b4992014-06-03 13:59:23 +0100500 return kInvalidFile;
501 }
Narayan Kamath7462f022013-11-21 13:05:04 +0000502
Narayan Kamath926973e2014-06-09 14:18:14 +0100503 /*
504 * Grab the CD offset and size, and the number of entries in the
505 * archive and verify that they look reasonable.
506 */
507 if (eocd->cd_start_offset + eocd->cd_size > eocd_offset) {
508 ALOGW("Zip: bad offsets (dir %" PRIu32 ", size %" PRIu32 ", eocd %" PRId64 ")",
509 eocd->cd_start_offset, eocd->cd_size, static_cast<int64_t>(eocd_offset));
Narayan Kamath7462f022013-11-21 13:05:04 +0000510 return kInvalidOffset;
511 }
Narayan Kamath926973e2014-06-09 14:18:14 +0100512 if (eocd->num_records == 0) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000513 ALOGW("Zip: empty archive?");
514 return kEmptyArchive;
515 }
516
Narayan Kamath926973e2014-06-09 14:18:14 +0100517 ALOGV("+++ num_entries=%" PRIu32 "dir_size=%" PRIu32 " dir_offset=%" PRIu32,
518 eocd->num_records, eocd->cd_size, eocd->cd_start_offset);
Narayan Kamath7462f022013-11-21 13:05:04 +0000519
520 /*
521 * It all looks good. Create a mapping for the CD, and set the fields
522 * in archive.
523 */
Narayan Kamath926973e2014-06-09 14:18:14 +0100524 android::FileMap* map = MapFileSegment(fd,
525 static_cast<off64_t>(eocd->cd_start_offset),
526 static_cast<size_t>(eocd->cd_size),
527 true /* read only */, debug_file_name);
Narayan Kamatheaf98852013-12-11 14:51:51 +0000528 if (map == NULL) {
529 archive->directory_map = NULL;
530 return kMmapFailed;
Narayan Kamath7462f022013-11-21 13:05:04 +0000531 }
532
Narayan Kamatheaf98852013-12-11 14:51:51 +0000533 archive->directory_map = map;
Narayan Kamath926973e2014-06-09 14:18:14 +0100534 archive->num_entries = eocd->num_records;
535 archive->directory_offset = eocd->cd_start_offset;
Narayan Kamath7462f022013-11-21 13:05:04 +0000536
537 return 0;
538}
539
540/*
541 * Find the zip Central Directory and memory-map it.
542 *
543 * On success, returns 0 after populating fields from the EOCD area:
544 * directory_offset
545 * directory_map
546 * num_entries
547 */
548static int32_t MapCentralDirectory(int fd, const char* debug_file_name,
549 ZipArchive* archive) {
550
551 // Test file length. We use lseek64 to make sure the file
552 // is small enough to be a zip file (Its size must be less than
553 // 0xffffffff bytes).
554 off64_t file_length = lseek64(fd, 0, SEEK_END);
555 if (file_length == -1) {
556 ALOGV("Zip: lseek on fd %d failed", fd);
557 return kInvalidFile;
558 }
559
560 if (file_length > (off64_t) 0xffffffff) {
Narayan Kamath926973e2014-06-09 14:18:14 +0100561 ALOGV("Zip: zip file too long %" PRId64, static_cast<int64_t>(file_length));
Narayan Kamath7462f022013-11-21 13:05:04 +0000562 return kInvalidFile;
563 }
564
Narayan Kamath926973e2014-06-09 14:18:14 +0100565 if (file_length < static_cast<off64_t>(sizeof(EocdRecord))) {
566 ALOGV("Zip: length %" PRId64 " is too small to be zip", static_cast<int64_t>(file_length));
Narayan Kamath7462f022013-11-21 13:05:04 +0000567 return kInvalidFile;
568 }
569
570 /*
571 * Perform the traditional EOCD snipe hunt.
572 *
573 * We're searching for the End of Central Directory magic number,
574 * which appears at the start of the EOCD block. It's followed by
575 * 18 bytes of EOCD stuff and up to 64KB of archive comment. We
576 * need to read the last part of the file into a buffer, dig through
577 * it to find the magic number, parse some values out, and use those
578 * to determine the extent of the CD.
579 *
580 * We start by pulling in the last part of the file.
581 */
Narayan Kamath926973e2014-06-09 14:18:14 +0100582 off64_t read_amount = kMaxEOCDSearch;
583 if (file_length < read_amount) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000584 read_amount = file_length;
585 }
586
Narayan Kamath926973e2014-06-09 14:18:14 +0100587 uint8_t* scan_buffer = reinterpret_cast<uint8_t*>(malloc(read_amount));
Narayan Kamath7462f022013-11-21 13:05:04 +0000588 int32_t result = MapCentralDirectory0(fd, debug_file_name, archive,
589 file_length, read_amount, scan_buffer);
590
591 free(scan_buffer);
592 return result;
593}
594
595/*
596 * Parses the Zip archive's Central Directory. Allocates and populates the
597 * hash table.
598 *
599 * Returns 0 on success.
600 */
601static int32_t ParseZipArchive(ZipArchive* archive) {
602 int32_t result = -1;
Narayan Kamath926973e2014-06-09 14:18:14 +0100603 const uint8_t* const cd_ptr = (const uint8_t*) archive->directory_map->getDataPtr();
604 const size_t cd_length = archive->directory_map->getDataLength();
605 const uint16_t num_entries = archive->num_entries;
Narayan Kamath7462f022013-11-21 13:05:04 +0000606
607 /*
608 * Create hash table. We have a minimum 75% load factor, possibly as
609 * low as 50% after we round off to a power of 2. There must be at
610 * least one unused entry to avoid an infinite loop during creation.
611 */
612 archive->hash_table_size = RoundUpPower2(1 + (num_entries * 4) / 3);
613 archive->hash_table = (ZipEntryName*) calloc(archive->hash_table_size,
614 sizeof(ZipEntryName));
615
616 /*
617 * Walk through the central directory, adding entries to the hash
618 * table and verifying values.
619 */
Narayan Kamath926973e2014-06-09 14:18:14 +0100620 const uint8_t* const cd_end = cd_ptr + cd_length;
Narayan Kamath7462f022013-11-21 13:05:04 +0000621 const uint8_t* ptr = cd_ptr;
622 for (uint16_t i = 0; i < num_entries; i++) {
Narayan Kamath926973e2014-06-09 14:18:14 +0100623 const CentralDirectoryRecord* cdr =
624 reinterpret_cast<const CentralDirectoryRecord*>(ptr);
625 if (cdr->record_signature != CentralDirectoryRecord::kSignature) {
Mark Salyzyn088bf902014-05-08 16:02:20 -0700626 ALOGW("Zip: missed a central dir sig (at %" PRIu16 ")", i);
Narayan Kamath7462f022013-11-21 13:05:04 +0000627 goto bail;
628 }
629
Narayan Kamath926973e2014-06-09 14:18:14 +0100630 if (ptr + sizeof(CentralDirectoryRecord) > cd_end) {
Mark Salyzyn088bf902014-05-08 16:02:20 -0700631 ALOGW("Zip: ran off the end (at %" PRIu16 ")", i);
Narayan Kamath7462f022013-11-21 13:05:04 +0000632 goto bail;
633 }
634
Narayan Kamath926973e2014-06-09 14:18:14 +0100635 const off64_t local_header_offset = cdr->local_file_header_offset;
Narayan Kamath7462f022013-11-21 13:05:04 +0000636 if (local_header_offset >= archive->directory_offset) {
Mark Salyzyn56a90a02014-05-08 17:20:55 -0700637 ALOGW("Zip: bad LFH offset %" PRId64 " at entry %" PRIu16, (int64_t)local_header_offset, i);
Narayan Kamath7462f022013-11-21 13:05:04 +0000638 goto bail;
639 }
640
Narayan Kamath926973e2014-06-09 14:18:14 +0100641 const uint16_t file_name_length = cdr->file_name_length;
642 const uint16_t extra_length = cdr->extra_field_length;
643 const uint16_t comment_length = cdr->comment_length;
Piotr Jastrzebski78271ba2014-08-15 12:53:00 +0100644 const uint8_t* file_name = ptr + sizeof(CentralDirectoryRecord);
645
Narayan Kamath044bc8e2014-12-03 18:22:53 +0000646 /* check that file name is valid UTF-8 and doesn't contain NUL (U+0000) characters */
647 if (!IsValidEntryName(file_name, file_name_length)) {
Piotr Jastrzebski78271ba2014-08-15 12:53:00 +0100648 goto bail;
649 }
Narayan Kamath7462f022013-11-21 13:05:04 +0000650
651 /* add the CDE filename to the hash table */
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100652 ZipEntryName entry_name;
653 entry_name.name = file_name;
654 entry_name.name_length = file_name_length;
Narayan Kamath7462f022013-11-21 13:05:04 +0000655 const int add_result = AddToHash(archive->hash_table,
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100656 archive->hash_table_size, entry_name);
Narayan Kamath7462f022013-11-21 13:05:04 +0000657 if (add_result) {
658 ALOGW("Zip: Error adding entry to hash table %d", add_result);
659 result = add_result;
660 goto bail;
661 }
662
Narayan Kamath926973e2014-06-09 14:18:14 +0100663 ptr += sizeof(CentralDirectoryRecord) + file_name_length + extra_length + comment_length;
664 if ((ptr - cd_ptr) > static_cast<int64_t>(cd_length)) {
Mark Salyzyn088bf902014-05-08 16:02:20 -0700665 ALOGW("Zip: bad CD advance (%tu vs %zu) at entry %" PRIu16,
666 ptr - cd_ptr, cd_length, i);
Narayan Kamath7462f022013-11-21 13:05:04 +0000667 goto bail;
668 }
669 }
Mark Salyzyn088bf902014-05-08 16:02:20 -0700670 ALOGV("+++ zip good scan %" PRIu16 " entries", num_entries);
Narayan Kamath7462f022013-11-21 13:05:04 +0000671
672 result = 0;
673
674bail:
675 return result;
676}
677
678static int32_t OpenArchiveInternal(ZipArchive* archive,
679 const char* debug_file_name) {
680 int32_t result = -1;
681 if ((result = MapCentralDirectory(archive->fd, debug_file_name, archive))) {
682 return result;
683 }
684
685 if ((result = ParseZipArchive(archive))) {
686 return result;
687 }
688
689 return 0;
690}
691
692int32_t OpenArchiveFd(int fd, const char* debug_file_name,
Dmitriy Ivanov40b52b22014-07-15 19:33:00 -0700693 ZipArchiveHandle* handle, bool assume_ownership) {
694 ZipArchive* archive = new ZipArchive(fd, assume_ownership);
Narayan Kamath7462f022013-11-21 13:05:04 +0000695 *handle = archive;
Narayan Kamath7462f022013-11-21 13:05:04 +0000696 return OpenArchiveInternal(archive, debug_file_name);
697}
698
699int32_t OpenArchive(const char* fileName, ZipArchiveHandle* handle) {
Neil Fullerb1a113f2014-07-25 14:43:04 +0100700 const int fd = open(fileName, O_RDONLY | O_BINARY, 0);
Dmitriy Ivanov40b52b22014-07-15 19:33:00 -0700701 ZipArchive* archive = new ZipArchive(fd, true);
Narayan Kamath7462f022013-11-21 13:05:04 +0000702 *handle = archive;
703
Narayan Kamath7462f022013-11-21 13:05:04 +0000704 if (fd < 0) {
705 ALOGW("Unable to open '%s': %s", fileName, strerror(errno));
706 return kIoError;
Narayan Kamath7462f022013-11-21 13:05:04 +0000707 }
Dmitriy Ivanov40b52b22014-07-15 19:33:00 -0700708
Narayan Kamath7462f022013-11-21 13:05:04 +0000709 return OpenArchiveInternal(archive, fileName);
710}
711
712/*
713 * Close a ZipArchive, closing the file and freeing the contents.
714 */
715void CloseArchive(ZipArchiveHandle handle) {
716 ZipArchive* archive = (ZipArchive*) handle;
717 ALOGV("Closing archive %p", archive);
Neil Fullerb1a113f2014-07-25 14:43:04 +0100718 delete archive;
Narayan Kamath7462f022013-11-21 13:05:04 +0000719}
720
721static int32_t UpdateEntryFromDataDescriptor(int fd,
722 ZipEntry *entry) {
Narayan Kamath926973e2014-06-09 14:18:14 +0100723 uint8_t ddBuf[sizeof(DataDescriptor) + sizeof(DataDescriptor::kOptSignature)];
Narayan Kamath7462f022013-11-21 13:05:04 +0000724 ssize_t actual = TEMP_FAILURE_RETRY(read(fd, ddBuf, sizeof(ddBuf)));
725 if (actual != sizeof(ddBuf)) {
726 return kIoError;
727 }
728
Narayan Kamath926973e2014-06-09 14:18:14 +0100729 const uint32_t ddSignature = *(reinterpret_cast<const uint32_t*>(ddBuf));
730 const uint16_t offset = (ddSignature == DataDescriptor::kOptSignature) ? 4 : 0;
731 const DataDescriptor* descriptor = reinterpret_cast<const DataDescriptor*>(ddBuf + offset);
Narayan Kamath7462f022013-11-21 13:05:04 +0000732
Narayan Kamath926973e2014-06-09 14:18:14 +0100733 entry->crc32 = descriptor->crc32;
734 entry->compressed_length = descriptor->compressed_size;
735 entry->uncompressed_length = descriptor->uncompressed_size;
Narayan Kamath7462f022013-11-21 13:05:04 +0000736
737 return 0;
738}
739
// Attempts to read |len| bytes from |fd| into |buf|, starting at file
// offset |off|. Returns the number of bytes read, or a negative value on
// failure.
//
// pread64 is used where it is available; on Windows the same effect is
// obtained with lseek64 followed by read. Because the two paths differ in
// whether they move the descriptor's file position, callers must not rely
// on the |fd| offset being incremented as a side effect of this call.
static inline ssize_t ReadAtOffset(int fd, uint8_t* buf, size_t len,
                                   off64_t off) {
#if defined(_WIN32)
  // The only supported platform that doesn't support pread at the moment
  // is Windows. Only recent versions of windows support unix like forks,
  // and even there the semantics are quite different.
  const off64_t landed_at = lseek64(fd, off, SEEK_SET);
  if (landed_at != off) {
    ALOGW("Zip: failed seek to offset %" PRId64, off);
    return kIoError;
  }

  return TEMP_FAILURE_RETRY(read(fd, buf, len));
#else
  return TEMP_FAILURE_RETRY(pread64(fd, buf, len, off));
#endif
}
762
763static int32_t FindEntry(const ZipArchive* archive, const int ent,
764 ZipEntry* data) {
765 const uint16_t nameLen = archive->hash_table[ent].name_length;
Narayan Kamath7462f022013-11-21 13:05:04 +0000766
767 // Recover the start of the central directory entry from the filename
768 // pointer. The filename is the first entry past the fixed-size data,
769 // so we can just subtract back from that.
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100770 const uint8_t* ptr = archive->hash_table[ent].name;
Narayan Kamath926973e2014-06-09 14:18:14 +0100771 ptr -= sizeof(CentralDirectoryRecord);
Narayan Kamath7462f022013-11-21 13:05:04 +0000772
773 // This is the base of our mmapped region, we have to sanity check that
774 // the name that's in the hash table is a pointer to a location within
775 // this mapped region.
Narayan Kamath926973e2014-06-09 14:18:14 +0100776 const uint8_t* base_ptr = reinterpret_cast<const uint8_t*>(
777 archive->directory_map->getDataPtr());
Narayan Kamatheaf98852013-12-11 14:51:51 +0000778 if (ptr < base_ptr || ptr > base_ptr + archive->directory_map->getDataLength()) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000779 ALOGW("Zip: Invalid entry pointer");
780 return kInvalidOffset;
781 }
782
Narayan Kamath926973e2014-06-09 14:18:14 +0100783 const CentralDirectoryRecord *cdr =
784 reinterpret_cast<const CentralDirectoryRecord*>(ptr);
785
Narayan Kamath7462f022013-11-21 13:05:04 +0000786 // The offset of the start of the central directory in the zipfile.
787 // We keep this lying around so that we can sanity check all our lengths
788 // and our per-file structures.
789 const off64_t cd_offset = archive->directory_offset;
790
791 // Fill out the compression method, modification time, crc32
792 // and other interesting attributes from the central directory. These
793 // will later be compared against values from the local file header.
Narayan Kamath926973e2014-06-09 14:18:14 +0100794 data->method = cdr->compression_method;
795 data->mod_time = cdr->last_mod_time;
796 data->crc32 = cdr->crc32;
797 data->compressed_length = cdr->compressed_size;
798 data->uncompressed_length = cdr->uncompressed_size;
Narayan Kamath7462f022013-11-21 13:05:04 +0000799
800 // Figure out the local header offset from the central directory. The
801 // actual file data will begin after the local header and the name /
802 // extra comments.
Narayan Kamath926973e2014-06-09 14:18:14 +0100803 const off64_t local_header_offset = cdr->local_file_header_offset;
804 if (local_header_offset + static_cast<off64_t>(sizeof(LocalFileHeader)) >= cd_offset) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000805 ALOGW("Zip: bad local hdr offset in zip");
806 return kInvalidOffset;
807 }
808
Narayan Kamath926973e2014-06-09 14:18:14 +0100809 uint8_t lfh_buf[sizeof(LocalFileHeader)];
Narayan Kamath7462f022013-11-21 13:05:04 +0000810 ssize_t actual = ReadAtOffset(archive->fd, lfh_buf, sizeof(lfh_buf),
811 local_header_offset);
812 if (actual != sizeof(lfh_buf)) {
Mark Salyzyn56a90a02014-05-08 17:20:55 -0700813 ALOGW("Zip: failed reading lfh name from offset %" PRId64, (int64_t)local_header_offset);
Narayan Kamath7462f022013-11-21 13:05:04 +0000814 return kIoError;
815 }
816
Narayan Kamath926973e2014-06-09 14:18:14 +0100817 const LocalFileHeader *lfh = reinterpret_cast<const LocalFileHeader*>(lfh_buf);
818
819 if (lfh->lfh_signature != LocalFileHeader::kSignature) {
Mark Salyzyn99ef9912014-03-14 14:26:22 -0700820 ALOGW("Zip: didn't find signature at start of lfh, offset=%" PRId64,
Narayan Kamath926973e2014-06-09 14:18:14 +0100821 static_cast<int64_t>(local_header_offset));
Narayan Kamath7462f022013-11-21 13:05:04 +0000822 return kInvalidOffset;
823 }
824
825 // Paranoia: Match the values specified in the local file header
826 // to those specified in the central directory.
Narayan Kamath926973e2014-06-09 14:18:14 +0100827 if ((lfh->gpb_flags & kGPBDDFlagMask) == 0) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000828 data->has_data_descriptor = 0;
Narayan Kamath926973e2014-06-09 14:18:14 +0100829 if (data->compressed_length != lfh->compressed_size
830 || data->uncompressed_length != lfh->uncompressed_size
831 || data->crc32 != lfh->crc32) {
Mark Salyzyn088bf902014-05-08 16:02:20 -0700832 ALOGW("Zip: size/crc32 mismatch. expected {%" PRIu32 ", %" PRIu32
833 ", %" PRIx32 "}, was {%" PRIu32 ", %" PRIu32 ", %" PRIx32 "}",
Narayan Kamath7462f022013-11-21 13:05:04 +0000834 data->compressed_length, data->uncompressed_length, data->crc32,
Narayan Kamath926973e2014-06-09 14:18:14 +0100835 lfh->compressed_size, lfh->uncompressed_size, lfh->crc32);
Narayan Kamath7462f022013-11-21 13:05:04 +0000836 return kInconsistentInformation;
837 }
838 } else {
839 data->has_data_descriptor = 1;
840 }
841
842 // Check that the local file header name matches the declared
843 // name in the central directory.
Narayan Kamath926973e2014-06-09 14:18:14 +0100844 if (lfh->file_name_length == nameLen) {
845 const off64_t name_offset = local_header_offset + sizeof(LocalFileHeader);
846 if (name_offset + lfh->file_name_length >= cd_offset) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000847 ALOGW("Zip: Invalid declared length");
848 return kInvalidOffset;
849 }
850
851 uint8_t* name_buf = (uint8_t*) malloc(nameLen);
852 ssize_t actual = ReadAtOffset(archive->fd, name_buf, nameLen,
853 name_offset);
854
855 if (actual != nameLen) {
Mark Salyzyn56a90a02014-05-08 17:20:55 -0700856 ALOGW("Zip: failed reading lfh name from offset %" PRId64, (int64_t)name_offset);
Narayan Kamath7462f022013-11-21 13:05:04 +0000857 free(name_buf);
858 return kIoError;
859 }
860
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100861 if (memcmp(archive->hash_table[ent].name, name_buf, nameLen)) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000862 free(name_buf);
863 return kInconsistentInformation;
864 }
865
866 free(name_buf);
867 } else {
868 ALOGW("Zip: lfh name did not match central directory.");
869 return kInconsistentInformation;
870 }
871
Narayan Kamath926973e2014-06-09 14:18:14 +0100872 const off64_t data_offset = local_header_offset + sizeof(LocalFileHeader)
873 + lfh->file_name_length + lfh->extra_field_length;
Narayan Kamath48953a12014-01-24 12:32:39 +0000874 if (data_offset > cd_offset) {
Mark Salyzyn56a90a02014-05-08 17:20:55 -0700875 ALOGW("Zip: bad data offset %" PRId64 " in zip", (int64_t)data_offset);
Narayan Kamath7462f022013-11-21 13:05:04 +0000876 return kInvalidOffset;
877 }
878
879 if ((off64_t)(data_offset + data->compressed_length) > cd_offset) {
Mark Salyzyn088bf902014-05-08 16:02:20 -0700880 ALOGW("Zip: bad compressed length in zip (%" PRId64 " + %" PRIu32 " > %" PRId64 ")",
Mark Salyzyn56a90a02014-05-08 17:20:55 -0700881 (int64_t)data_offset, data->compressed_length, (int64_t)cd_offset);
Narayan Kamath7462f022013-11-21 13:05:04 +0000882 return kInvalidOffset;
883 }
884
885 if (data->method == kCompressStored &&
886 (off64_t)(data_offset + data->uncompressed_length) > cd_offset) {
Mark Salyzyn088bf902014-05-08 16:02:20 -0700887 ALOGW("Zip: bad uncompressed length in zip (%" PRId64 " + %" PRIu32 " > %" PRId64 ")",
Mark Salyzyn96c5c992014-05-08 19:16:40 -0700888 (int64_t)data_offset, data->uncompressed_length, (int64_t)cd_offset);
Narayan Kamath7462f022013-11-21 13:05:04 +0000889 return kInvalidOffset;
890 }
891
892 data->offset = data_offset;
893 return 0;
894}
895
896struct IterationHandle {
897 uint32_t position;
Piotr Jastrzebski10aa9a02014-08-19 09:01:20 +0100898 // We're not using vector here because this code is used in the Windows SDK
899 // where the STL is not available.
Piotr Jastrzebski8e085362014-08-18 11:37:45 +0100900 const uint8_t* prefix;
901 uint16_t prefix_len;
Narayan Kamath7462f022013-11-21 13:05:04 +0000902 ZipArchive* archive;
Piotr Jastrzebski8e085362014-08-18 11:37:45 +0100903
904 IterationHandle() : prefix(NULL), prefix_len(0) {}
905
906 IterationHandle(const ZipEntryName& prefix_name)
907 : prefix_len(prefix_name.name_length) {
908 uint8_t* prefix_copy = new uint8_t[prefix_len];
Piotr Jastrzebski10aa9a02014-08-19 09:01:20 +0100909 memcpy(prefix_copy, prefix_name.name, prefix_len);
Piotr Jastrzebski8e085362014-08-18 11:37:45 +0100910 prefix = prefix_copy;
911 }
912
913 ~IterationHandle() {
Piotr Jastrzebski10aa9a02014-08-19 09:01:20 +0100914 delete[] prefix;
Piotr Jastrzebski8e085362014-08-18 11:37:45 +0100915 }
Narayan Kamath7462f022013-11-21 13:05:04 +0000916};
917
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100918int32_t StartIteration(ZipArchiveHandle handle, void** cookie_ptr,
919 const ZipEntryName* optional_prefix) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000920 ZipArchive* archive = (ZipArchive *) handle;
921
922 if (archive == NULL || archive->hash_table == NULL) {
923 ALOGW("Zip: Invalid ZipArchiveHandle");
924 return kInvalidHandle;
925 }
926
Piotr Jastrzebski8e085362014-08-18 11:37:45 +0100927 IterationHandle* cookie =
928 optional_prefix != NULL ? new IterationHandle(*optional_prefix) : new IterationHandle();
Narayan Kamath7462f022013-11-21 13:05:04 +0000929 cookie->position = 0;
Narayan Kamath7462f022013-11-21 13:05:04 +0000930 cookie->archive = archive;
Narayan Kamath7462f022013-11-21 13:05:04 +0000931
932 *cookie_ptr = cookie ;
933 return 0;
934}
935
Piotr Jastrzebski79c8b342014-08-08 14:02:17 +0100936void EndIteration(void* cookie) {
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100937 delete reinterpret_cast<IterationHandle*>(cookie);
Piotr Jastrzebski79c8b342014-08-08 14:02:17 +0100938}
939
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100940int32_t FindEntry(const ZipArchiveHandle handle, const ZipEntryName& entryName,
Narayan Kamath7462f022013-11-21 13:05:04 +0000941 ZipEntry* data) {
942 const ZipArchive* archive = (ZipArchive*) handle;
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100943 if (entryName.name_length == 0) {
944 ALOGW("Zip: Invalid filename %.*s", entryName.name_length, entryName.name);
Narayan Kamath7462f022013-11-21 13:05:04 +0000945 return kInvalidEntryName;
946 }
947
948 const int64_t ent = EntryToIndex(archive->hash_table,
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100949 archive->hash_table_size, entryName);
Narayan Kamath7462f022013-11-21 13:05:04 +0000950
951 if (ent < 0) {
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100952 ALOGV("Zip: Could not find entry %.*s", entryName.name_length, entryName.name);
Narayan Kamath7462f022013-11-21 13:05:04 +0000953 return ent;
954 }
955
956 return FindEntry(archive, ent, data);
957}
958
959int32_t Next(void* cookie, ZipEntry* data, ZipEntryName* name) {
960 IterationHandle* handle = (IterationHandle *) cookie;
961 if (handle == NULL) {
962 return kInvalidHandle;
963 }
964
965 ZipArchive* archive = handle->archive;
966 if (archive == NULL || archive->hash_table == NULL) {
967 ALOGW("Zip: Invalid ZipArchiveHandle");
968 return kInvalidHandle;
969 }
970
971 const uint32_t currentOffset = handle->position;
972 const uint32_t hash_table_length = archive->hash_table_size;
973 const ZipEntryName *hash_table = archive->hash_table;
974
975 for (uint32_t i = currentOffset; i < hash_table_length; ++i) {
976 if (hash_table[i].name != NULL &&
Piotr Jastrzebski8e085362014-08-18 11:37:45 +0100977 (handle->prefix_len == 0 ||
978 (memcmp(handle->prefix, hash_table[i].name, handle->prefix_len) == 0))) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000979 handle->position = (i + 1);
980 const int error = FindEntry(archive, i, data);
981 if (!error) {
982 name->name = hash_table[i].name;
983 name->name_length = hash_table[i].name_length;
984 }
985
986 return error;
987 }
988 }
989
990 handle->position = 0;
991 return kIterationEnd;
992}
993
994static int32_t InflateToFile(int fd, const ZipEntry* entry,
995 uint8_t* begin, uint32_t length,
996 uint64_t* crc_out) {
997 int32_t result = -1;
998 const uint32_t kBufSize = 32768;
999 uint8_t read_buf[kBufSize];
1000 uint8_t write_buf[kBufSize];
1001 z_stream zstream;
1002 int zerr;
1003
1004 /*
1005 * Initialize the zlib stream struct.
1006 */
1007 memset(&zstream, 0, sizeof(zstream));
1008 zstream.zalloc = Z_NULL;
1009 zstream.zfree = Z_NULL;
1010 zstream.opaque = Z_NULL;
1011 zstream.next_in = NULL;
1012 zstream.avail_in = 0;
1013 zstream.next_out = (Bytef*) write_buf;
1014 zstream.avail_out = kBufSize;
1015 zstream.data_type = Z_UNKNOWN;
1016
1017 /*
1018 * Use the undocumented "negative window bits" feature to tell zlib
1019 * that there's no zlib header waiting for it.
1020 */
1021 zerr = inflateInit2(&zstream, -MAX_WBITS);
1022 if (zerr != Z_OK) {
1023 if (zerr == Z_VERSION_ERROR) {
1024 ALOGE("Installed zlib is not compatible with linked version (%s)",
1025 ZLIB_VERSION);
1026 } else {
1027 ALOGW("Call to inflateInit2 failed (zerr=%d)", zerr);
1028 }
1029
1030 return kZlibError;
1031 }
1032
1033 const uint32_t uncompressed_length = entry->uncompressed_length;
1034
1035 uint32_t compressed_length = entry->compressed_length;
1036 uint32_t write_count = 0;
1037 do {
1038 /* read as much as we can */
1039 if (zstream.avail_in == 0) {
Mark Salyzyn51d562d2014-05-05 14:38:05 -07001040 const ZD_TYPE getSize = (compressed_length > kBufSize) ? kBufSize : compressed_length;
1041 const ZD_TYPE actual = TEMP_FAILURE_RETRY(read(fd, read_buf, getSize));
Narayan Kamath7462f022013-11-21 13:05:04 +00001042 if (actual != getSize) {
Mark Salyzyn51d562d2014-05-05 14:38:05 -07001043 ALOGW("Zip: inflate read failed (" ZD " vs " ZD ")", actual, getSize);
Narayan Kamath7462f022013-11-21 13:05:04 +00001044 result = kIoError;
1045 goto z_bail;
1046 }
1047
1048 compressed_length -= getSize;
1049
1050 zstream.next_in = read_buf;
1051 zstream.avail_in = getSize;
1052 }
1053
1054 /* uncompress the data */
1055 zerr = inflate(&zstream, Z_NO_FLUSH);
1056 if (zerr != Z_OK && zerr != Z_STREAM_END) {
1057 ALOGW("Zip: inflate zerr=%d (nIn=%p aIn=%u nOut=%p aOut=%u)",
1058 zerr, zstream.next_in, zstream.avail_in,
1059 zstream.next_out, zstream.avail_out);
1060 result = kZlibError;
1061 goto z_bail;
1062 }
1063
1064 /* write when we're full or when we're done */
1065 if (zstream.avail_out == 0 ||
1066 (zerr == Z_STREAM_END && zstream.avail_out != kBufSize)) {
1067 const size_t write_size = zstream.next_out - write_buf;
1068 // The file might have declared a bogus length.
1069 if (write_size + write_count > length) {
1070 goto z_bail;
1071 }
1072 memcpy(begin + write_count, write_buf, write_size);
1073 write_count += write_size;
1074
1075 zstream.next_out = write_buf;
1076 zstream.avail_out = kBufSize;
1077 }
1078 } while (zerr == Z_OK);
1079
1080 assert(zerr == Z_STREAM_END); /* other errors should've been caught */
1081
1082 // stream.adler holds the crc32 value for such streams.
1083 *crc_out = zstream.adler;
1084
1085 if (zstream.total_out != uncompressed_length || compressed_length != 0) {
Mark Salyzyn088bf902014-05-08 16:02:20 -07001086 ALOGW("Zip: size mismatch on inflated file (%lu vs %" PRIu32 ")",
Narayan Kamath7462f022013-11-21 13:05:04 +00001087 zstream.total_out, uncompressed_length);
1088 result = kInconsistentInformation;
1089 goto z_bail;
1090 }
1091
1092 result = 0;
1093
1094z_bail:
1095 inflateEnd(&zstream); /* free up any allocated structures */
1096
1097 return result;
1098}
1099
1100int32_t ExtractToMemory(ZipArchiveHandle handle,
1101 ZipEntry* entry, uint8_t* begin, uint32_t size) {
1102 ZipArchive* archive = (ZipArchive*) handle;
1103 const uint16_t method = entry->method;
1104 off64_t data_offset = entry->offset;
1105
1106 if (lseek64(archive->fd, data_offset, SEEK_SET) != data_offset) {
Mark Salyzyn56a90a02014-05-08 17:20:55 -07001107 ALOGW("Zip: lseek to data at %" PRId64 " failed", (int64_t)data_offset);
Narayan Kamath7462f022013-11-21 13:05:04 +00001108 return kIoError;
1109 }
1110
1111 // this should default to kUnknownCompressionMethod.
1112 int32_t return_value = -1;
1113 uint64_t crc = 0;
1114 if (method == kCompressStored) {
1115 return_value = CopyFileToFile(archive->fd, begin, size, &crc);
1116 } else if (method == kCompressDeflated) {
1117 return_value = InflateToFile(archive->fd, entry, begin, size, &crc);
1118 }
1119
1120 if (!return_value && entry->has_data_descriptor) {
1121 return_value = UpdateEntryFromDataDescriptor(archive->fd, entry);
1122 if (return_value) {
1123 return return_value;
1124 }
1125 }
1126
1127 // TODO: Fix this check by passing the right flags to inflate2 so that
1128 // it calculates the CRC for us.
1129 if (entry->crc32 != crc && false) {
Mark Salyzyn088bf902014-05-08 16:02:20 -07001130 ALOGW("Zip: crc mismatch: expected %" PRIu32 ", was %" PRIu64, entry->crc32, crc);
Narayan Kamath7462f022013-11-21 13:05:04 +00001131 return kInconsistentInformation;
1132 }
1133
1134 return return_value;
1135}
1136
1137int32_t ExtractEntryToFile(ZipArchiveHandle handle,
1138 ZipEntry* entry, int fd) {
1139 const int32_t declared_length = entry->uncompressed_length;
1140
Narayan Kamath00a258c2013-12-13 16:06:19 +00001141 const off64_t current_offset = lseek64(fd, 0, SEEK_CUR);
1142 if (current_offset == -1) {
1143 ALOGW("Zip: unable to seek to current location on fd %d: %s", fd,
1144 strerror(errno));
Narayan Kamath7462f022013-11-21 13:05:04 +00001145 return kIoError;
1146 }
1147
Narayan Kamath00a258c2013-12-13 16:06:19 +00001148 int result = TEMP_FAILURE_RETRY(ftruncate(fd, declared_length + current_offset));
1149 if (result == -1) {
Mark Salyzyn99ef9912014-03-14 14:26:22 -07001150 ALOGW("Zip: unable to truncate file to %" PRId64 ": %s",
Mark Salyzyn56a90a02014-05-08 17:20:55 -07001151 (int64_t)(declared_length + current_offset), strerror(errno));
Narayan Kamath00a258c2013-12-13 16:06:19 +00001152 return kIoError;
1153 }
1154
Narayan Kamath48953a12014-01-24 12:32:39 +00001155 // Don't attempt to map a region of length 0. We still need the
1156 // ftruncate() though, since the API guarantees that we will truncate
1157 // the file to the end of the uncompressed output.
1158 if (declared_length == 0) {
1159 return 0;
1160 }
1161
Narayan Kamath00a258c2013-12-13 16:06:19 +00001162 android::FileMap* map = MapFileSegment(fd, current_offset, declared_length,
Narayan Kamatheaf98852013-12-11 14:51:51 +00001163 false, kTempMappingFileName);
1164 if (map == NULL) {
1165 return kMmapFailed;
Narayan Kamath7462f022013-11-21 13:05:04 +00001166 }
1167
Narayan Kamatheaf98852013-12-11 14:51:51 +00001168 const int32_t error = ExtractToMemory(handle, entry,
1169 reinterpret_cast<uint8_t*>(map->getDataPtr()),
1170 map->getDataLength());
Narayan Kamath6832a7a2015-02-23 15:43:35 +00001171 delete map;
Narayan Kamath7462f022013-11-21 13:05:04 +00001172 return error;
1173}
1174
1175const char* ErrorCodeString(int32_t error_code) {
1176 if (error_code > kErrorMessageLowerBound && error_code < kErrorMessageUpperBound) {
1177 return kErrorMessages[error_code * -1];
1178 }
1179
1180 return kErrorMessages[0];
1181}
1182
1183int GetFileDescriptor(const ZipArchiveHandle handle) {
1184 return ((ZipArchive*) handle)->fd;
1185}
1186