blob: 7cc9ac39df3f835114871d9ce84d95bc21ac3498 [file] [log] [blame]
Narayan Kamath7462f022013-11-21 13:05:04 +00001/*
2 * Copyright (C) 2008 The Android Open Source Project
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 * http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
16
17/*
18 * Read-only access to Zip archives, with minimal heap allocation.
19 */
Narayan Kamath7462f022013-11-21 13:05:04 +000020
21#include <assert.h>
22#include <errno.h>
Mark Salyzyn99ef9912014-03-14 14:26:22 -070023#include <fcntl.h>
24#include <inttypes.h>
Narayan Kamath7462f022013-11-21 13:05:04 +000025#include <limits.h>
26#include <log/log.h>
Narayan Kamath7462f022013-11-21 13:05:04 +000027#include <stdlib.h>
28#include <string.h>
Narayan Kamath7462f022013-11-21 13:05:04 +000029#include <unistd.h>
Mark Salyzyn51d562d2014-05-05 14:38:05 -070030#include <utils/Compat.h>
Narayan Kamatheaf98852013-12-11 14:51:51 +000031#include <utils/FileMap.h>
Mark Salyzyn99ef9912014-03-14 14:26:22 -070032#include <zlib.h>
Narayan Kamath7462f022013-11-21 13:05:04 +000033
34#include <JNIHelp.h> // TEMP_FAILURE_RETRY may or may not be in unistd
35
Mark Salyzyn99ef9912014-03-14 14:26:22 -070036#include "ziparchive/zip_archive.h"
37
Narayan Kamath926973e2014-06-09 14:18:14 +010038// This is for windows. If we don't open a file in binary mode, weird
Narayan Kamath7462f022013-11-21 13:05:04 +000039// things will happen.
40#ifndef O_BINARY
41#define O_BINARY 0
42#endif
43
Narayan Kamath926973e2014-06-09 14:18:14 +010044#define DISALLOW_IMPLICIT_CONSTRUCTORS(TypeName) \
45 TypeName(); \
46 TypeName(const TypeName&); \
47 void operator=(const TypeName&)
Narayan Kamath7462f022013-11-21 13:05:04 +000048
Narayan Kamath926973e2014-06-09 14:18:14 +010049// The "end of central directory" (EOCD) record. Each archive
50// contains exactly once such record which appears at the end of
51// the archive. It contains archive wide information like the
52// number of entries in the archive and the offset to the central
53// directory of the offset.
54struct EocdRecord {
55 static const uint32_t kSignature = 0x06054b50;
Narayan Kamath7462f022013-11-21 13:05:04 +000056
Narayan Kamath926973e2014-06-09 14:18:14 +010057 // End of central directory signature, should always be
58 // |kSignature|.
59 uint32_t eocd_signature;
60 // The number of the current "disk", i.e, the "disk" that this
61 // central directory is on.
62 //
63 // This implementation assumes that each archive spans a single
64 // disk only. i.e, that disk_num == 1.
65 uint16_t disk_num;
66 // The disk where the central directory starts.
67 //
68 // This implementation assumes that each archive spans a single
69 // disk only. i.e, that cd_start_disk == 1.
70 uint16_t cd_start_disk;
71 // The number of central directory records on this disk.
72 //
73 // This implementation assumes that each archive spans a single
74 // disk only. i.e, that num_records_on_disk == num_records.
75 uint16_t num_records_on_disk;
76 // The total number of central directory records.
77 uint16_t num_records;
78 // The size of the central directory (in bytes).
79 uint32_t cd_size;
80 // The offset of the start of the central directory, relative
81 // to the start of the file.
82 uint32_t cd_start_offset;
83 // Length of the central directory comment.
84 uint16_t comment_length;
85 private:
86 DISALLOW_IMPLICIT_CONSTRUCTORS(EocdRecord);
87} __attribute__((packed));
Narayan Kamath7462f022013-11-21 13:05:04 +000088
Narayan Kamath926973e2014-06-09 14:18:14 +010089// A structure representing the fixed length fields for a single
90// record in the central directory of the archive. In addition to
91// the fixed length fields listed here, each central directory
92// record contains a variable length "file_name" and "extra_field"
93// whose lengths are given by |file_name_length| and |extra_field_length|
94// respectively.
95struct CentralDirectoryRecord {
96 static const uint32_t kSignature = 0x02014b50;
Narayan Kamath7462f022013-11-21 13:05:04 +000097
Narayan Kamath926973e2014-06-09 14:18:14 +010098 // The start of record signature. Must be |kSignature|.
99 uint32_t record_signature;
100 // Tool version. Ignored by this implementation.
101 uint16_t version_made_by;
102 // Tool version. Ignored by this implementation.
103 uint16_t version_needed;
104 // The "general purpose bit flags" for this entry. The only
105 // flag value that we currently check for is the "data descriptor"
106 // flag.
107 uint16_t gpb_flags;
108 // The compression method for this entry, one of |kCompressStored|
109 // and |kCompressDeflated|.
110 uint16_t compression_method;
111 // The file modification time and date for this entry.
112 uint16_t last_mod_time;
113 uint16_t last_mod_date;
114 // The CRC-32 checksum for this entry.
115 uint32_t crc32;
116 // The compressed size (in bytes) of this entry.
117 uint32_t compressed_size;
118 // The uncompressed size (in bytes) of this entry.
119 uint32_t uncompressed_size;
120 // The length of the entry file name in bytes. The file name
121 // will appear immediately after this record.
122 uint16_t file_name_length;
123 // The length of the extra field info (in bytes). This data
124 // will appear immediately after the entry file name.
125 uint16_t extra_field_length;
126 // The length of the entry comment (in bytes). This data will
127 // appear immediately after the extra field.
128 uint16_t comment_length;
129 // The start disk for this entry. Ignored by this implementation).
130 uint16_t file_start_disk;
131 // File attributes. Ignored by this implementation.
132 uint16_t internal_file_attributes;
133 // File attributes. Ignored by this implementation.
134 uint32_t external_file_attributes;
135 // The offset to the local file header for this entry, from the
136 // beginning of this archive.
137 uint32_t local_file_header_offset;
138 private:
139 DISALLOW_IMPLICIT_CONSTRUCTORS(CentralDirectoryRecord);
140} __attribute__((packed));
Narayan Kamath7462f022013-11-21 13:05:04 +0000141
Narayan Kamath926973e2014-06-09 14:18:14 +0100142// The local file header for a given entry. This duplicates information
143// present in the central directory of the archive. It is an error for
144// the information here to be different from the central directory
145// information for a given entry.
146struct LocalFileHeader {
147 static const uint32_t kSignature = 0x04034b50;
Narayan Kamath7462f022013-11-21 13:05:04 +0000148
Narayan Kamath926973e2014-06-09 14:18:14 +0100149 // The local file header signature, must be |kSignature|.
150 uint32_t lfh_signature;
151 // Tool version. Ignored by this implementation.
152 uint16_t version_needed;
153 // The "general purpose bit flags" for this entry. The only
154 // flag value that we currently check for is the "data descriptor"
155 // flag.
156 uint16_t gpb_flags;
157 // The compression method for this entry, one of |kCompressStored|
158 // and |kCompressDeflated|.
159 uint16_t compression_method;
160 // The file modification time and date for this entry.
161 uint16_t last_mod_time;
162 uint16_t last_mod_date;
163 // The CRC-32 checksum for this entry.
164 uint32_t crc32;
165 // The compressed size (in bytes) of this entry.
166 uint32_t compressed_size;
167 // The uncompressed size (in bytes) of this entry.
168 uint32_t uncompressed_size;
169 // The length of the entry file name in bytes. The file name
170 // will appear immediately after this record.
171 uint16_t file_name_length;
172 // The length of the extra field info (in bytes). This data
173 // will appear immediately after the entry file name.
174 uint16_t extra_field_length;
175 private:
176 DISALLOW_IMPLICIT_CONSTRUCTORS(LocalFileHeader);
177} __attribute__((packed));
178
179struct DataDescriptor {
180 // The *optional* data descriptor start signature.
181 static const uint32_t kOptSignature = 0x08074b50;
182
183 // CRC-32 checksum of the entry.
184 uint32_t crc32;
185 // Compressed size of the entry.
186 uint32_t compressed_size;
187 // Uncompressed size of the entry.
188 uint32_t uncompressed_size;
189 private:
190 DISALLOW_IMPLICIT_CONSTRUCTORS(DataDescriptor);
191} __attribute__((packed));
192
193#undef DISALLOW_IMPLICIT_CONSTRUCTORS
194
195static const uint32_t kGPBDDFlagMask = 0x0008; // mask value that signifies that the entry has a DD
Narayan Kamath7462f022013-11-21 13:05:04 +0000196static const uint32_t kMaxErrorLen = 1024;
197
Narayan Kamath926973e2014-06-09 14:18:14 +0100198// The maximum size of a central directory or a file
199// comment in bytes.
200static const uint32_t kMaxCommentLen = 65535;
201
202// The maximum number of bytes to scan backwards for the EOCD start.
203static const uint32_t kMaxEOCDSearch = kMaxCommentLen + sizeof(EocdRecord);
204
Narayan Kamath7462f022013-11-21 13:05:04 +0000205static const char* kErrorMessages[] = {
206 "Unknown return code.",
Narayan Kamatheb41ad22013-12-09 16:26:36 +0000207 "Iteration ended",
Narayan Kamath7462f022013-11-21 13:05:04 +0000208 "Zlib error",
209 "Invalid file",
210 "Invalid handle",
211 "Duplicate entries in archive",
212 "Empty archive",
213 "Entry not found",
214 "Invalid offset",
215 "Inconsistent information",
216 "Invalid entry name",
Narayan Kamatheb41ad22013-12-09 16:26:36 +0000217 "I/O Error",
Narayan Kamatheaf98852013-12-11 14:51:51 +0000218 "File mapping failed"
Narayan Kamath7462f022013-11-21 13:05:04 +0000219};
220
221static const int32_t kErrorMessageUpperBound = 0;
222
Narayan Kamatheb41ad22013-12-09 16:26:36 +0000223static const int32_t kIterationEnd = -1;
Narayan Kamath7462f022013-11-21 13:05:04 +0000224
225// We encountered a Zlib error when inflating a stream from this file.
226// Usually indicates file corruption.
227static const int32_t kZlibError = -2;
228
229// The input file cannot be processed as a zip archive. Usually because
230// it's too small, too large or does not have a valid signature.
231static const int32_t kInvalidFile = -3;
232
233// An invalid iteration / ziparchive handle was passed in as an input
234// argument.
235static const int32_t kInvalidHandle = -4;
236
237// The zip archive contained two (or possibly more) entries with the same
238// name.
239static const int32_t kDuplicateEntry = -5;
240
241// The zip archive contains no entries.
242static const int32_t kEmptyArchive = -6;
243
244// The specified entry was not found in the archive.
245static const int32_t kEntryNotFound = -7;
246
247// The zip archive contained an invalid local file header pointer.
248static const int32_t kInvalidOffset = -8;
249
250// The zip archive contained inconsistent entry information. This could
251// be because the central directory & local file header did not agree, or
252// if the actual uncompressed length or crc32 do not match their declared
253// values.
254static const int32_t kInconsistentInformation = -9;
255
256// An invalid entry name was encountered.
257static const int32_t kInvalidEntryName = -10;
258
Narayan Kamatheb41ad22013-12-09 16:26:36 +0000259// An I/O related system call (read, lseek, ftruncate, map) failed.
260static const int32_t kIoError = -11;
Narayan Kamath7462f022013-11-21 13:05:04 +0000261
Narayan Kamatheaf98852013-12-11 14:51:51 +0000262// We were not able to mmap the central directory or entry contents.
263static const int32_t kMmapFailed = -12;
Narayan Kamath7462f022013-11-21 13:05:04 +0000264
Narayan Kamatheaf98852013-12-11 14:51:51 +0000265static const int32_t kErrorMessageLowerBound = -13;
Narayan Kamath7462f022013-11-21 13:05:04 +0000266
Narayan Kamatheaf98852013-12-11 14:51:51 +0000267static const char kTempMappingFileName[] = "zip: ExtractFileToFile";
Narayan Kamath7462f022013-11-21 13:05:04 +0000268
269/*
270 * A Read-only Zip archive.
271 *
272 * We want "open" and "find entry by name" to be fast operations, and
273 * we want to use as little memory as possible. We memory-map the zip
274 * central directory, and load a hash table with pointers to the filenames
275 * (which aren't null-terminated). The other fields are at a fixed offset
276 * from the filename, so we don't need to extract those (but we do need
277 * to byte-read and endian-swap them every time we want them).
278 *
279 * It's possible that somebody has handed us a massive (~1GB) zip archive,
280 * so we can't expect to mmap the entire file.
281 *
282 * To speed comparisons when doing a lookup by name, we could make the mapping
283 * "private" (copy-on-write) and null-terminate the filenames after verifying
284 * the record structure. However, this requires a private mapping of
285 * every page that the Central Directory touches. Easier to tuck a copy
286 * of the string length into the hash table entry.
287 */
288struct ZipArchive {
289 /* open Zip archive */
Neil Fuller00473682014-07-25 14:43:04 +0100290 const int fd;
Narayan Kamath7462f022013-11-21 13:05:04 +0000291
292 /* mapped central directory area */
293 off64_t directory_offset;
Narayan Kamatheaf98852013-12-11 14:51:51 +0000294 android::FileMap* directory_map;
Narayan Kamath7462f022013-11-21 13:05:04 +0000295
296 /* number of entries in the Zip archive */
297 uint16_t num_entries;
298
299 /*
300 * We know how many entries are in the Zip archive, so we can have a
301 * fixed-size hash table. We define a load factor of 0.75 and overallocat
302 * so the maximum number entries can never be higher than
303 * ((4 * UINT16_MAX) / 3 + 1) which can safely fit into a uint32_t.
304 */
305 uint32_t hash_table_size;
306 ZipEntryName* hash_table;
Neil Fuller00473682014-07-25 14:43:04 +0100307
308 ZipArchive(const int fd) :
309 fd(fd),
310 directory_offset(0),
311 directory_map(NULL),
312 num_entries(0),
313 hash_table_size(0),
314 hash_table(NULL) {}
315
316 ~ZipArchive() {
317 if (fd >= 0) {
318 close(fd);
319 }
320
321 if (directory_map != NULL) {
322 directory_map->release();
323 }
324 free(hash_table);
325 }
Narayan Kamath7462f022013-11-21 13:05:04 +0000326};
327
328// Returns 0 on success and negative values on failure.
Narayan Kamatheaf98852013-12-11 14:51:51 +0000329static android::FileMap* MapFileSegment(const int fd, const off64_t start,
330 const size_t length, const bool read_only,
331 const char* debug_file_name) {
332 android::FileMap* file_map = new android::FileMap;
333 const bool success = file_map->create(debug_file_name, fd, start, length, read_only);
334 if (!success) {
335 file_map->release();
336 return NULL;
Narayan Kamath7462f022013-11-21 13:05:04 +0000337 }
338
Narayan Kamatheaf98852013-12-11 14:51:51 +0000339 return file_map;
Narayan Kamath7462f022013-11-21 13:05:04 +0000340}
341
342static int32_t CopyFileToFile(int fd, uint8_t* begin, const uint32_t length, uint64_t *crc_out) {
343 static const uint32_t kBufSize = 32768;
344 uint8_t buf[kBufSize];
345
346 uint32_t count = 0;
347 uint64_t crc = 0;
Narayan Kamath58aaf462013-12-10 16:47:14 +0000348 while (count < length) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000349 uint32_t remaining = length - count;
350
351 // Safe conversion because kBufSize is narrow enough for a 32 bit signed
352 // value.
353 ssize_t get_size = (remaining > kBufSize) ? kBufSize : remaining;
354 ssize_t actual = TEMP_FAILURE_RETRY(read(fd, buf, get_size));
355
356 if (actual != get_size) {
Mark Salyzyn51d562d2014-05-05 14:38:05 -0700357 ALOGW("CopyFileToFile: copy read failed (" ZD " vs " ZD ")", actual, get_size);
Narayan Kamath7462f022013-11-21 13:05:04 +0000358 return kIoError;
359 }
360
361 memcpy(begin + count, buf, get_size);
362 crc = crc32(crc, buf, get_size);
363 count += get_size;
364 }
365
366 *crc_out = crc;
367
368 return 0;
369}
370
371/*
372 * Round up to the next highest power of 2.
373 *
374 * Found on http://graphics.stanford.edu/~seander/bithacks.html.
375 */
376static uint32_t RoundUpPower2(uint32_t val) {
377 val--;
378 val |= val >> 1;
379 val |= val >> 2;
380 val |= val >> 4;
381 val |= val >> 8;
382 val |= val >> 16;
383 val++;
384
385 return val;
386}
387
388static uint32_t ComputeHash(const char* str, uint16_t len) {
389 uint32_t hash = 0;
390
391 while (len--) {
392 hash = hash * 31 + *str++;
393 }
394
395 return hash;
396}
397
398/*
399 * Convert a ZipEntry to a hash table index, verifying that it's in a
400 * valid range.
401 */
402static int64_t EntryToIndex(const ZipEntryName* hash_table,
403 const uint32_t hash_table_size,
404 const char* name, uint16_t length) {
405 const uint32_t hash = ComputeHash(name, length);
406
407 // NOTE: (hash_table_size - 1) is guaranteed to be non-negative.
408 uint32_t ent = hash & (hash_table_size - 1);
409 while (hash_table[ent].name != NULL) {
410 if (hash_table[ent].name_length == length &&
411 memcmp(hash_table[ent].name, name, length) == 0) {
412 return ent;
413 }
414
415 ent = (ent + 1) & (hash_table_size - 1);
416 }
417
Colin Crossf4b0b792014-02-06 20:07:15 -0800418 ALOGV("Zip: Unable to find entry %.*s", length, name);
Narayan Kamath7462f022013-11-21 13:05:04 +0000419 return kEntryNotFound;
420}
421
422/*
423 * Add a new entry to the hash table.
424 */
425static int32_t AddToHash(ZipEntryName *hash_table, const uint64_t hash_table_size,
426 const char* name, uint16_t length) {
427 const uint64_t hash = ComputeHash(name, length);
428 uint32_t ent = hash & (hash_table_size - 1);
429
430 /*
431 * We over-allocated the table, so we're guaranteed to find an empty slot.
432 * Further, we guarantee that the hashtable size is not 0.
433 */
434 while (hash_table[ent].name != NULL) {
435 if (hash_table[ent].name_length == length &&
436 memcmp(hash_table[ent].name, name, length) == 0) {
437 // We've found a duplicate entry. We don't accept it
438 ALOGW("Zip: Found duplicate entry %.*s", length, name);
439 return kDuplicateEntry;
440 }
441 ent = (ent + 1) & (hash_table_size - 1);
442 }
443
444 hash_table[ent].name = name;
445 hash_table[ent].name_length = length;
446 return 0;
447}
448
Narayan Kamath7462f022013-11-21 13:05:04 +0000449static int32_t MapCentralDirectory0(int fd, const char* debug_file_name,
450 ZipArchive* archive, off64_t file_length,
Narayan Kamath926973e2014-06-09 14:18:14 +0100451 off64_t read_amount, uint8_t* scan_buffer) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000452 const off64_t search_start = file_length - read_amount;
453
454 if (lseek64(fd, search_start, SEEK_SET) != search_start) {
Narayan Kamath926973e2014-06-09 14:18:14 +0100455 ALOGW("Zip: seek %" PRId64 " failed: %s", static_cast<int64_t>(search_start),
456 strerror(errno));
Narayan Kamath7462f022013-11-21 13:05:04 +0000457 return kIoError;
458 }
Narayan Kamath926973e2014-06-09 14:18:14 +0100459 ssize_t actual = TEMP_FAILURE_RETRY(
460 read(fd, scan_buffer, static_cast<size_t>(read_amount)));
461 if (actual != static_cast<ssize_t>(read_amount)) {
462 ALOGW("Zip: read %" PRId64 " failed: %s", static_cast<int64_t>(read_amount),
463 strerror(errno));
Narayan Kamath7462f022013-11-21 13:05:04 +0000464 return kIoError;
465 }
466
467 /*
468 * Scan backward for the EOCD magic. In an archive without a trailing
469 * comment, we'll find it on the first try. (We may want to consider
470 * doing an initial minimal read; if we don't find it, retry with a
471 * second read as above.)
472 */
Narayan Kamath926973e2014-06-09 14:18:14 +0100473 int i = read_amount - sizeof(EocdRecord);
474 for (; i >= 0; i--) {
475 if (scan_buffer[i] == 0x50 &&
476 ((*reinterpret_cast<uint32_t*>(&scan_buffer[i])) == EocdRecord::kSignature)) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000477 ALOGV("+++ Found EOCD at buf+%d", i);
478 break;
479 }
480 }
481 if (i < 0) {
482 ALOGD("Zip: EOCD not found, %s is not zip", debug_file_name);
483 return kInvalidFile;
484 }
485
486 const off64_t eocd_offset = search_start + i;
Narayan Kamath926973e2014-06-09 14:18:14 +0100487 const EocdRecord* eocd = reinterpret_cast<const EocdRecord*>(scan_buffer + i);
Narayan Kamath7462f022013-11-21 13:05:04 +0000488 /*
Narayan Kamath926973e2014-06-09 14:18:14 +0100489 * Verify that there's no trailing space at the end of the central directory
490 * and its comment.
Narayan Kamath7462f022013-11-21 13:05:04 +0000491 */
Narayan Kamath926973e2014-06-09 14:18:14 +0100492 const off64_t calculated_length = eocd_offset + sizeof(EocdRecord)
493 + eocd->comment_length;
494 if (calculated_length != file_length) {
Narayan Kamath4f6b4992014-06-03 13:59:23 +0100495 ALOGW("Zip: %" PRId64 " extraneous bytes at the end of the central directory",
Narayan Kamath926973e2014-06-09 14:18:14 +0100496 static_cast<int64_t>(file_length - calculated_length));
Narayan Kamath4f6b4992014-06-03 13:59:23 +0100497 return kInvalidFile;
498 }
Narayan Kamath7462f022013-11-21 13:05:04 +0000499
Narayan Kamath926973e2014-06-09 14:18:14 +0100500 /*
501 * Grab the CD offset and size, and the number of entries in the
502 * archive and verify that they look reasonable.
503 */
Tianjie Xu1ee48922016-09-21 14:58:11 -0700504 if (static_cast<off64_t>(eocd->cd_start_offset) + eocd->cd_size > eocd_offset) {
Narayan Kamath926973e2014-06-09 14:18:14 +0100505 ALOGW("Zip: bad offsets (dir %" PRIu32 ", size %" PRIu32 ", eocd %" PRId64 ")",
506 eocd->cd_start_offset, eocd->cd_size, static_cast<int64_t>(eocd_offset));
Tianjie Xu1ee48922016-09-21 14:58:11 -0700507#if defined(__ANDROID__)
508 if (eocd->cd_start_offset + eocd->cd_size <= eocd_offset) {
509 android_errorWriteLog(0x534e4554, "31251826");
510 }
511#endif
Narayan Kamath7462f022013-11-21 13:05:04 +0000512 return kInvalidOffset;
513 }
Narayan Kamath926973e2014-06-09 14:18:14 +0100514 if (eocd->num_records == 0) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000515 ALOGW("Zip: empty archive?");
516 return kEmptyArchive;
517 }
518
Narayan Kamath926973e2014-06-09 14:18:14 +0100519 ALOGV("+++ num_entries=%" PRIu32 "dir_size=%" PRIu32 " dir_offset=%" PRIu32,
520 eocd->num_records, eocd->cd_size, eocd->cd_start_offset);
Narayan Kamath7462f022013-11-21 13:05:04 +0000521
522 /*
523 * It all looks good. Create a mapping for the CD, and set the fields
524 * in archive.
525 */
Narayan Kamath926973e2014-06-09 14:18:14 +0100526 android::FileMap* map = MapFileSegment(fd,
527 static_cast<off64_t>(eocd->cd_start_offset),
528 static_cast<size_t>(eocd->cd_size),
529 true /* read only */, debug_file_name);
Narayan Kamatheaf98852013-12-11 14:51:51 +0000530 if (map == NULL) {
531 archive->directory_map = NULL;
532 return kMmapFailed;
Narayan Kamath7462f022013-11-21 13:05:04 +0000533 }
534
Narayan Kamatheaf98852013-12-11 14:51:51 +0000535 archive->directory_map = map;
Narayan Kamath926973e2014-06-09 14:18:14 +0100536 archive->num_entries = eocd->num_records;
537 archive->directory_offset = eocd->cd_start_offset;
Narayan Kamath7462f022013-11-21 13:05:04 +0000538
539 return 0;
540}
541
542/*
543 * Find the zip Central Directory and memory-map it.
544 *
545 * On success, returns 0 after populating fields from the EOCD area:
546 * directory_offset
547 * directory_map
548 * num_entries
549 */
550static int32_t MapCentralDirectory(int fd, const char* debug_file_name,
551 ZipArchive* archive) {
552
553 // Test file length. We use lseek64 to make sure the file
554 // is small enough to be a zip file (Its size must be less than
555 // 0xffffffff bytes).
556 off64_t file_length = lseek64(fd, 0, SEEK_END);
557 if (file_length == -1) {
558 ALOGV("Zip: lseek on fd %d failed", fd);
559 return kInvalidFile;
560 }
561
562 if (file_length > (off64_t) 0xffffffff) {
Narayan Kamath926973e2014-06-09 14:18:14 +0100563 ALOGV("Zip: zip file too long %" PRId64, static_cast<int64_t>(file_length));
Narayan Kamath7462f022013-11-21 13:05:04 +0000564 return kInvalidFile;
565 }
566
Narayan Kamath926973e2014-06-09 14:18:14 +0100567 if (file_length < static_cast<off64_t>(sizeof(EocdRecord))) {
568 ALOGV("Zip: length %" PRId64 " is too small to be zip", static_cast<int64_t>(file_length));
Narayan Kamath7462f022013-11-21 13:05:04 +0000569 return kInvalidFile;
570 }
571
572 /*
573 * Perform the traditional EOCD snipe hunt.
574 *
575 * We're searching for the End of Central Directory magic number,
576 * which appears at the start of the EOCD block. It's followed by
577 * 18 bytes of EOCD stuff and up to 64KB of archive comment. We
578 * need to read the last part of the file into a buffer, dig through
579 * it to find the magic number, parse some values out, and use those
580 * to determine the extent of the CD.
581 *
582 * We start by pulling in the last part of the file.
583 */
Narayan Kamath926973e2014-06-09 14:18:14 +0100584 off64_t read_amount = kMaxEOCDSearch;
585 if (file_length < read_amount) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000586 read_amount = file_length;
587 }
588
Narayan Kamath926973e2014-06-09 14:18:14 +0100589 uint8_t* scan_buffer = reinterpret_cast<uint8_t*>(malloc(read_amount));
Narayan Kamath7462f022013-11-21 13:05:04 +0000590 int32_t result = MapCentralDirectory0(fd, debug_file_name, archive,
591 file_length, read_amount, scan_buffer);
592
593 free(scan_buffer);
594 return result;
595}
596
Narayan Kamatheeb93c92017-09-14 10:41:28 +0100597static inline ssize_t ReadAtOffset(int fd, uint8_t* buf, size_t len, off64_t off);
598
Narayan Kamath7462f022013-11-21 13:05:04 +0000599/*
600 * Parses the Zip archive's Central Directory. Allocates and populates the
601 * hash table.
602 *
603 * Returns 0 on success.
604 */
605static int32_t ParseZipArchive(ZipArchive* archive) {
606 int32_t result = -1;
Narayan Kamath926973e2014-06-09 14:18:14 +0100607 const uint8_t* const cd_ptr = (const uint8_t*) archive->directory_map->getDataPtr();
608 const size_t cd_length = archive->directory_map->getDataLength();
609 const uint16_t num_entries = archive->num_entries;
Narayan Kamath7462f022013-11-21 13:05:04 +0000610
611 /*
612 * Create hash table. We have a minimum 75% load factor, possibly as
613 * low as 50% after we round off to a power of 2. There must be at
614 * least one unused entry to avoid an infinite loop during creation.
615 */
616 archive->hash_table_size = RoundUpPower2(1 + (num_entries * 4) / 3);
617 archive->hash_table = (ZipEntryName*) calloc(archive->hash_table_size,
618 sizeof(ZipEntryName));
619
620 /*
621 * Walk through the central directory, adding entries to the hash
622 * table and verifying values.
623 */
Narayan Kamath926973e2014-06-09 14:18:14 +0100624 const uint8_t* const cd_end = cd_ptr + cd_length;
Narayan Kamath7462f022013-11-21 13:05:04 +0000625 const uint8_t* ptr = cd_ptr;
626 for (uint16_t i = 0; i < num_entries; i++) {
Tianjie Xu6fdfd582017-04-05 14:46:27 -0700627 if (ptr > cd_end - sizeof(CentralDirectoryRecord)) {
628 ALOGW("Zip: ran off the end (at %" PRIu16 ")", i);
629#if defined(__ANDROID__)
630 android_errorWriteLog(0x534e4554, "36392138");
631#endif
632 goto bail;
633 }
634
Narayan Kamath926973e2014-06-09 14:18:14 +0100635 const CentralDirectoryRecord* cdr =
636 reinterpret_cast<const CentralDirectoryRecord*>(ptr);
637 if (cdr->record_signature != CentralDirectoryRecord::kSignature) {
Mark Salyzyn088bf902014-05-08 16:02:20 -0700638 ALOGW("Zip: missed a central dir sig (at %" PRIu16 ")", i);
Narayan Kamath7462f022013-11-21 13:05:04 +0000639 goto bail;
640 }
641
Narayan Kamath926973e2014-06-09 14:18:14 +0100642 const off64_t local_header_offset = cdr->local_file_header_offset;
Narayan Kamath7462f022013-11-21 13:05:04 +0000643 if (local_header_offset >= archive->directory_offset) {
Mark Salyzyn56a90a02014-05-08 17:20:55 -0700644 ALOGW("Zip: bad LFH offset %" PRId64 " at entry %" PRIu16, (int64_t)local_header_offset, i);
Narayan Kamath7462f022013-11-21 13:05:04 +0000645 goto bail;
646 }
647
Narayan Kamath926973e2014-06-09 14:18:14 +0100648 const uint16_t file_name_length = cdr->file_name_length;
649 const uint16_t extra_length = cdr->extra_field_length;
650 const uint16_t comment_length = cdr->comment_length;
Piotr Jastrzebski0c1b8942014-08-15 12:53:00 +0100651 const char* file_name = reinterpret_cast<const char*>(ptr + sizeof(CentralDirectoryRecord));
652
653 /* check that file name doesn't contain \0 character */
654 if (memchr(file_name, 0, file_name_length) != NULL) {
655 ALOGW("Zip: entry name can't contain \\0 character");
656 goto bail;
657 }
Narayan Kamath7462f022013-11-21 13:05:04 +0000658
659 /* add the CDE filename to the hash table */
660 const int add_result = AddToHash(archive->hash_table,
Narayan Kamath926973e2014-06-09 14:18:14 +0100661 archive->hash_table_size, file_name, file_name_length);
Narayan Kamath7462f022013-11-21 13:05:04 +0000662 if (add_result) {
663 ALOGW("Zip: Error adding entry to hash table %d", add_result);
664 result = add_result;
665 goto bail;
666 }
667
Narayan Kamath926973e2014-06-09 14:18:14 +0100668 ptr += sizeof(CentralDirectoryRecord) + file_name_length + extra_length + comment_length;
669 if ((ptr - cd_ptr) > static_cast<int64_t>(cd_length)) {
Mark Salyzyn088bf902014-05-08 16:02:20 -0700670 ALOGW("Zip: bad CD advance (%tu vs %zu) at entry %" PRIu16,
671 ptr - cd_ptr, cd_length, i);
Narayan Kamath7462f022013-11-21 13:05:04 +0000672 goto bail;
673 }
674 }
Narayan Kamath2d516d22017-08-09 18:32:09 +0100675
676 uint32_t lfh_start_bytes;
Narayan Kamatheeb93c92017-09-14 10:41:28 +0100677 if (ReadAtOffset(archive->fd, reinterpret_cast<uint8_t*>(&lfh_start_bytes),
678 sizeof(uint32_t), 0) != sizeof(uint32_t)) {
Narayan Kamath2d516d22017-08-09 18:32:09 +0100679 ALOGW("Zip: Unable to read header for entry at offset == 0.");
680 return -1;
681 }
682
683 if (lfh_start_bytes != LocalFileHeader::kSignature) {
684 ALOGW("Zip: Entry at offset zero has invalid LFH signature %" PRIx32, lfh_start_bytes);
685#if defined(__ANDROID__)
686 android_errorWriteLog(0x534e4554, "64211847");
687#endif
688 return -1;
689 }
690
Mark Salyzyn088bf902014-05-08 16:02:20 -0700691 ALOGV("+++ zip good scan %" PRIu16 " entries", num_entries);
Narayan Kamath7462f022013-11-21 13:05:04 +0000692
693 result = 0;
694
695bail:
696 return result;
697}
698
699static int32_t OpenArchiveInternal(ZipArchive* archive,
700 const char* debug_file_name) {
701 int32_t result = -1;
702 if ((result = MapCentralDirectory(archive->fd, debug_file_name, archive))) {
703 return result;
704 }
705
706 if ((result = ParseZipArchive(archive))) {
707 return result;
708 }
709
710 return 0;
711}
712
713int32_t OpenArchiveFd(int fd, const char* debug_file_name,
714 ZipArchiveHandle* handle) {
Neil Fuller00473682014-07-25 14:43:04 +0100715 ZipArchive* archive = new ZipArchive(fd);
Narayan Kamath7462f022013-11-21 13:05:04 +0000716 *handle = archive;
Narayan Kamath7462f022013-11-21 13:05:04 +0000717 return OpenArchiveInternal(archive, debug_file_name);
718}
719
720int32_t OpenArchive(const char* fileName, ZipArchiveHandle* handle) {
Neil Fuller00473682014-07-25 14:43:04 +0100721 const int fd = open(fileName, O_RDONLY | O_BINARY, 0);
722 ZipArchive* archive = new ZipArchive(fd);
Narayan Kamath7462f022013-11-21 13:05:04 +0000723 *handle = archive;
724
Narayan Kamath7462f022013-11-21 13:05:04 +0000725 if (fd < 0) {
726 ALOGW("Unable to open '%s': %s", fileName, strerror(errno));
727 return kIoError;
Narayan Kamath7462f022013-11-21 13:05:04 +0000728 }
Narayan Kamath7462f022013-11-21 13:05:04 +0000729 return OpenArchiveInternal(archive, fileName);
730}
731
732/*
733 * Close a ZipArchive, closing the file and freeing the contents.
734 */
735void CloseArchive(ZipArchiveHandle handle) {
736 ZipArchive* archive = (ZipArchive*) handle;
737 ALOGV("Closing archive %p", archive);
Neil Fuller00473682014-07-25 14:43:04 +0100738 delete archive;
Narayan Kamath7462f022013-11-21 13:05:04 +0000739}
740
741static int32_t UpdateEntryFromDataDescriptor(int fd,
742 ZipEntry *entry) {
Narayan Kamath926973e2014-06-09 14:18:14 +0100743 uint8_t ddBuf[sizeof(DataDescriptor) + sizeof(DataDescriptor::kOptSignature)];
Narayan Kamath7462f022013-11-21 13:05:04 +0000744 ssize_t actual = TEMP_FAILURE_RETRY(read(fd, ddBuf, sizeof(ddBuf)));
745 if (actual != sizeof(ddBuf)) {
746 return kIoError;
747 }
748
Narayan Kamath926973e2014-06-09 14:18:14 +0100749 const uint32_t ddSignature = *(reinterpret_cast<const uint32_t*>(ddBuf));
750 const uint16_t offset = (ddSignature == DataDescriptor::kOptSignature) ? 4 : 0;
751 const DataDescriptor* descriptor = reinterpret_cast<const DataDescriptor*>(ddBuf + offset);
Narayan Kamath7462f022013-11-21 13:05:04 +0000752
Narayan Kamath926973e2014-06-09 14:18:14 +0100753 entry->crc32 = descriptor->crc32;
754 entry->compressed_length = descriptor->compressed_size;
755 entry->uncompressed_length = descriptor->uncompressed_size;
Narayan Kamath7462f022013-11-21 13:05:04 +0000756
757 return 0;
758}
759
760// Attempts to read |len| bytes into |buf| at offset |off|.
761//
762// This method uses pread64 on platforms that support it and
763// lseek64 + read on platforms that don't. This implies that
764// callers should not rely on the |fd| offset being incremented
765// as a side effect of this call.
766static inline ssize_t ReadAtOffset(int fd, uint8_t* buf, size_t len,
767 off64_t off) {
768#ifdef HAVE_PREAD
769 return TEMP_FAILURE_RETRY(pread64(fd, buf, len, off));
770#else
771 // The only supported platform that doesn't support pread at the moment
772 // is Windows. Only recent versions of windows support unix like forks,
773 // and even there the semantics are quite different.
774 if (lseek64(fd, off, SEEK_SET) != off) {
Mark Salyzyn99ef9912014-03-14 14:26:22 -0700775 ALOGW("Zip: failed seek to offset %" PRId64, off);
Narayan Kamath7462f022013-11-21 13:05:04 +0000776 return kIoError;
777 }
778
779 return TEMP_FAILURE_RETRY(read(fd, buf, len));
780#endif // HAVE_PREAD
781}
782
783static int32_t FindEntry(const ZipArchive* archive, const int ent,
784 ZipEntry* data) {
785 const uint16_t nameLen = archive->hash_table[ent].name_length;
786 const char* name = archive->hash_table[ent].name;
787
788 // Recover the start of the central directory entry from the filename
789 // pointer. The filename is the first entry past the fixed-size data,
790 // so we can just subtract back from that.
Narayan Kamath926973e2014-06-09 14:18:14 +0100791 const uint8_t* ptr = reinterpret_cast<const uint8_t*>(name);
792 ptr -= sizeof(CentralDirectoryRecord);
Narayan Kamath7462f022013-11-21 13:05:04 +0000793
794 // This is the base of our mmapped region, we have to sanity check that
795 // the name that's in the hash table is a pointer to a location within
796 // this mapped region.
Narayan Kamath926973e2014-06-09 14:18:14 +0100797 const uint8_t* base_ptr = reinterpret_cast<const uint8_t*>(
798 archive->directory_map->getDataPtr());
Narayan Kamatheaf98852013-12-11 14:51:51 +0000799 if (ptr < base_ptr || ptr > base_ptr + archive->directory_map->getDataLength()) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000800 ALOGW("Zip: Invalid entry pointer");
801 return kInvalidOffset;
802 }
803
Narayan Kamath926973e2014-06-09 14:18:14 +0100804 const CentralDirectoryRecord *cdr =
805 reinterpret_cast<const CentralDirectoryRecord*>(ptr);
806
Narayan Kamath7462f022013-11-21 13:05:04 +0000807 // The offset of the start of the central directory in the zipfile.
808 // We keep this lying around so that we can sanity check all our lengths
809 // and our per-file structures.
810 const off64_t cd_offset = archive->directory_offset;
811
812 // Fill out the compression method, modification time, crc32
813 // and other interesting attributes from the central directory. These
814 // will later be compared against values from the local file header.
Narayan Kamath926973e2014-06-09 14:18:14 +0100815 data->method = cdr->compression_method;
816 data->mod_time = cdr->last_mod_time;
817 data->crc32 = cdr->crc32;
818 data->compressed_length = cdr->compressed_size;
819 data->uncompressed_length = cdr->uncompressed_size;
Narayan Kamath7462f022013-11-21 13:05:04 +0000820
821 // Figure out the local header offset from the central directory. The
822 // actual file data will begin after the local header and the name /
823 // extra comments.
Narayan Kamath926973e2014-06-09 14:18:14 +0100824 const off64_t local_header_offset = cdr->local_file_header_offset;
825 if (local_header_offset + static_cast<off64_t>(sizeof(LocalFileHeader)) >= cd_offset) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000826 ALOGW("Zip: bad local hdr offset in zip");
827 return kInvalidOffset;
828 }
829
Narayan Kamath926973e2014-06-09 14:18:14 +0100830 uint8_t lfh_buf[sizeof(LocalFileHeader)];
Narayan Kamath7462f022013-11-21 13:05:04 +0000831 ssize_t actual = ReadAtOffset(archive->fd, lfh_buf, sizeof(lfh_buf),
832 local_header_offset);
833 if (actual != sizeof(lfh_buf)) {
Mark Salyzyn56a90a02014-05-08 17:20:55 -0700834 ALOGW("Zip: failed reading lfh name from offset %" PRId64, (int64_t)local_header_offset);
Narayan Kamath7462f022013-11-21 13:05:04 +0000835 return kIoError;
836 }
837
Narayan Kamath926973e2014-06-09 14:18:14 +0100838 const LocalFileHeader *lfh = reinterpret_cast<const LocalFileHeader*>(lfh_buf);
839
840 if (lfh->lfh_signature != LocalFileHeader::kSignature) {
Mark Salyzyn99ef9912014-03-14 14:26:22 -0700841 ALOGW("Zip: didn't find signature at start of lfh, offset=%" PRId64,
Narayan Kamath926973e2014-06-09 14:18:14 +0100842 static_cast<int64_t>(local_header_offset));
Narayan Kamath7462f022013-11-21 13:05:04 +0000843 return kInvalidOffset;
844 }
845
846 // Paranoia: Match the values specified in the local file header
847 // to those specified in the central directory.
Narayan Kamath926973e2014-06-09 14:18:14 +0100848 if ((lfh->gpb_flags & kGPBDDFlagMask) == 0) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000849 data->has_data_descriptor = 0;
Narayan Kamath926973e2014-06-09 14:18:14 +0100850 if (data->compressed_length != lfh->compressed_size
851 || data->uncompressed_length != lfh->uncompressed_size
852 || data->crc32 != lfh->crc32) {
Mark Salyzyn088bf902014-05-08 16:02:20 -0700853 ALOGW("Zip: size/crc32 mismatch. expected {%" PRIu32 ", %" PRIu32
854 ", %" PRIx32 "}, was {%" PRIu32 ", %" PRIu32 ", %" PRIx32 "}",
Narayan Kamath7462f022013-11-21 13:05:04 +0000855 data->compressed_length, data->uncompressed_length, data->crc32,
Narayan Kamath926973e2014-06-09 14:18:14 +0100856 lfh->compressed_size, lfh->uncompressed_size, lfh->crc32);
Narayan Kamath7462f022013-11-21 13:05:04 +0000857 return kInconsistentInformation;
858 }
859 } else {
860 data->has_data_descriptor = 1;
861 }
862
863 // Check that the local file header name matches the declared
864 // name in the central directory.
Narayan Kamath926973e2014-06-09 14:18:14 +0100865 if (lfh->file_name_length == nameLen) {
866 const off64_t name_offset = local_header_offset + sizeof(LocalFileHeader);
867 if (name_offset + lfh->file_name_length >= cd_offset) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000868 ALOGW("Zip: Invalid declared length");
869 return kInvalidOffset;
870 }
871
872 uint8_t* name_buf = (uint8_t*) malloc(nameLen);
873 ssize_t actual = ReadAtOffset(archive->fd, name_buf, nameLen,
874 name_offset);
875
876 if (actual != nameLen) {
Mark Salyzyn56a90a02014-05-08 17:20:55 -0700877 ALOGW("Zip: failed reading lfh name from offset %" PRId64, (int64_t)name_offset);
Narayan Kamath7462f022013-11-21 13:05:04 +0000878 free(name_buf);
879 return kIoError;
880 }
881
882 if (memcmp(name, name_buf, nameLen)) {
883 free(name_buf);
884 return kInconsistentInformation;
885 }
886
887 free(name_buf);
888 } else {
889 ALOGW("Zip: lfh name did not match central directory.");
890 return kInconsistentInformation;
891 }
892
Narayan Kamath926973e2014-06-09 14:18:14 +0100893 const off64_t data_offset = local_header_offset + sizeof(LocalFileHeader)
894 + lfh->file_name_length + lfh->extra_field_length;
Narayan Kamath48953a12014-01-24 12:32:39 +0000895 if (data_offset > cd_offset) {
Mark Salyzyn56a90a02014-05-08 17:20:55 -0700896 ALOGW("Zip: bad data offset %" PRId64 " in zip", (int64_t)data_offset);
Narayan Kamath7462f022013-11-21 13:05:04 +0000897 return kInvalidOffset;
898 }
899
900 if ((off64_t)(data_offset + data->compressed_length) > cd_offset) {
Mark Salyzyn088bf902014-05-08 16:02:20 -0700901 ALOGW("Zip: bad compressed length in zip (%" PRId64 " + %" PRIu32 " > %" PRId64 ")",
Mark Salyzyn56a90a02014-05-08 17:20:55 -0700902 (int64_t)data_offset, data->compressed_length, (int64_t)cd_offset);
Narayan Kamath7462f022013-11-21 13:05:04 +0000903 return kInvalidOffset;
904 }
905
906 if (data->method == kCompressStored &&
907 (off64_t)(data_offset + data->uncompressed_length) > cd_offset) {
Mark Salyzyn088bf902014-05-08 16:02:20 -0700908 ALOGW("Zip: bad uncompressed length in zip (%" PRId64 " + %" PRIu32 " > %" PRId64 ")",
Mark Salyzyn96c5c992014-05-08 19:16:40 -0700909 (int64_t)data_offset, data->uncompressed_length, (int64_t)cd_offset);
Narayan Kamath7462f022013-11-21 13:05:04 +0000910 return kInvalidOffset;
911 }
912
913 data->offset = data_offset;
914 return 0;
915}
916
917struct IterationHandle {
918 uint32_t position;
919 const char* prefix;
920 uint16_t prefix_len;
921 ZipArchive* archive;
922};
923
924int32_t StartIteration(ZipArchiveHandle handle, void** cookie_ptr, const char* prefix) {
925 ZipArchive* archive = (ZipArchive *) handle;
926
927 if (archive == NULL || archive->hash_table == NULL) {
928 ALOGW("Zip: Invalid ZipArchiveHandle");
929 return kInvalidHandle;
930 }
931
932 IterationHandle* cookie = (IterationHandle*) malloc(sizeof(IterationHandle));
933 cookie->position = 0;
934 cookie->prefix = prefix;
935 cookie->archive = archive;
936 if (prefix != NULL) {
937 cookie->prefix_len = strlen(prefix);
938 }
939
940 *cookie_ptr = cookie ;
941 return 0;
942}
943
944int32_t FindEntry(const ZipArchiveHandle handle, const char* entryName,
945 ZipEntry* data) {
946 const ZipArchive* archive = (ZipArchive*) handle;
947 const int nameLen = strlen(entryName);
948 if (nameLen == 0 || nameLen > 65535) {
949 ALOGW("Zip: Invalid filename %s", entryName);
950 return kInvalidEntryName;
951 }
952
953 const int64_t ent = EntryToIndex(archive->hash_table,
954 archive->hash_table_size, entryName, nameLen);
955
956 if (ent < 0) {
Narayan Kamatha1ff8012013-12-31 10:27:59 +0000957 ALOGV("Zip: Could not find entry %.*s", nameLen, entryName);
Narayan Kamath7462f022013-11-21 13:05:04 +0000958 return ent;
959 }
960
961 return FindEntry(archive, ent, data);
962}
963
964int32_t Next(void* cookie, ZipEntry* data, ZipEntryName* name) {
965 IterationHandle* handle = (IterationHandle *) cookie;
966 if (handle == NULL) {
967 return kInvalidHandle;
968 }
969
970 ZipArchive* archive = handle->archive;
971 if (archive == NULL || archive->hash_table == NULL) {
972 ALOGW("Zip: Invalid ZipArchiveHandle");
973 return kInvalidHandle;
974 }
975
976 const uint32_t currentOffset = handle->position;
977 const uint32_t hash_table_length = archive->hash_table_size;
978 const ZipEntryName *hash_table = archive->hash_table;
979
980 for (uint32_t i = currentOffset; i < hash_table_length; ++i) {
981 if (hash_table[i].name != NULL &&
982 (handle->prefix == NULL ||
983 (memcmp(handle->prefix, hash_table[i].name, handle->prefix_len) == 0))) {
984 handle->position = (i + 1);
985 const int error = FindEntry(archive, i, data);
986 if (!error) {
987 name->name = hash_table[i].name;
988 name->name_length = hash_table[i].name_length;
989 }
990
991 return error;
992 }
993 }
994
995 handle->position = 0;
996 return kIterationEnd;
997}
998
999static int32_t InflateToFile(int fd, const ZipEntry* entry,
1000 uint8_t* begin, uint32_t length,
1001 uint64_t* crc_out) {
1002 int32_t result = -1;
1003 const uint32_t kBufSize = 32768;
1004 uint8_t read_buf[kBufSize];
1005 uint8_t write_buf[kBufSize];
1006 z_stream zstream;
1007 int zerr;
1008
1009 /*
1010 * Initialize the zlib stream struct.
1011 */
1012 memset(&zstream, 0, sizeof(zstream));
1013 zstream.zalloc = Z_NULL;
1014 zstream.zfree = Z_NULL;
1015 zstream.opaque = Z_NULL;
1016 zstream.next_in = NULL;
1017 zstream.avail_in = 0;
1018 zstream.next_out = (Bytef*) write_buf;
1019 zstream.avail_out = kBufSize;
1020 zstream.data_type = Z_UNKNOWN;
1021
1022 /*
1023 * Use the undocumented "negative window bits" feature to tell zlib
1024 * that there's no zlib header waiting for it.
1025 */
1026 zerr = inflateInit2(&zstream, -MAX_WBITS);
1027 if (zerr != Z_OK) {
1028 if (zerr == Z_VERSION_ERROR) {
1029 ALOGE("Installed zlib is not compatible with linked version (%s)",
1030 ZLIB_VERSION);
1031 } else {
1032 ALOGW("Call to inflateInit2 failed (zerr=%d)", zerr);
1033 }
1034
1035 return kZlibError;
1036 }
1037
1038 const uint32_t uncompressed_length = entry->uncompressed_length;
1039
1040 uint32_t compressed_length = entry->compressed_length;
1041 uint32_t write_count = 0;
1042 do {
1043 /* read as much as we can */
1044 if (zstream.avail_in == 0) {
Mark Salyzyn51d562d2014-05-05 14:38:05 -07001045 const ZD_TYPE getSize = (compressed_length > kBufSize) ? kBufSize : compressed_length;
1046 const ZD_TYPE actual = TEMP_FAILURE_RETRY(read(fd, read_buf, getSize));
Narayan Kamath7462f022013-11-21 13:05:04 +00001047 if (actual != getSize) {
Mark Salyzyn51d562d2014-05-05 14:38:05 -07001048 ALOGW("Zip: inflate read failed (" ZD " vs " ZD ")", actual, getSize);
Narayan Kamath7462f022013-11-21 13:05:04 +00001049 result = kIoError;
1050 goto z_bail;
1051 }
1052
1053 compressed_length -= getSize;
1054
1055 zstream.next_in = read_buf;
1056 zstream.avail_in = getSize;
1057 }
1058
1059 /* uncompress the data */
1060 zerr = inflate(&zstream, Z_NO_FLUSH);
1061 if (zerr != Z_OK && zerr != Z_STREAM_END) {
1062 ALOGW("Zip: inflate zerr=%d (nIn=%p aIn=%u nOut=%p aOut=%u)",
1063 zerr, zstream.next_in, zstream.avail_in,
1064 zstream.next_out, zstream.avail_out);
1065 result = kZlibError;
1066 goto z_bail;
1067 }
1068
1069 /* write when we're full or when we're done */
1070 if (zstream.avail_out == 0 ||
1071 (zerr == Z_STREAM_END && zstream.avail_out != kBufSize)) {
1072 const size_t write_size = zstream.next_out - write_buf;
1073 // The file might have declared a bogus length.
1074 if (write_size + write_count > length) {
1075 goto z_bail;
1076 }
1077 memcpy(begin + write_count, write_buf, write_size);
1078 write_count += write_size;
1079
1080 zstream.next_out = write_buf;
1081 zstream.avail_out = kBufSize;
1082 }
1083 } while (zerr == Z_OK);
1084
1085 assert(zerr == Z_STREAM_END); /* other errors should've been caught */
1086
1087 // stream.adler holds the crc32 value for such streams.
1088 *crc_out = zstream.adler;
1089
1090 if (zstream.total_out != uncompressed_length || compressed_length != 0) {
Mark Salyzyn088bf902014-05-08 16:02:20 -07001091 ALOGW("Zip: size mismatch on inflated file (%lu vs %" PRIu32 ")",
Narayan Kamath7462f022013-11-21 13:05:04 +00001092 zstream.total_out, uncompressed_length);
1093 result = kInconsistentInformation;
1094 goto z_bail;
1095 }
1096
1097 result = 0;
1098
1099z_bail:
1100 inflateEnd(&zstream); /* free up any allocated structures */
1101
1102 return result;
1103}
1104
1105int32_t ExtractToMemory(ZipArchiveHandle handle,
1106 ZipEntry* entry, uint8_t* begin, uint32_t size) {
1107 ZipArchive* archive = (ZipArchive*) handle;
1108 const uint16_t method = entry->method;
1109 off64_t data_offset = entry->offset;
1110
1111 if (lseek64(archive->fd, data_offset, SEEK_SET) != data_offset) {
Mark Salyzyn56a90a02014-05-08 17:20:55 -07001112 ALOGW("Zip: lseek to data at %" PRId64 " failed", (int64_t)data_offset);
Narayan Kamath7462f022013-11-21 13:05:04 +00001113 return kIoError;
1114 }
1115
1116 // this should default to kUnknownCompressionMethod.
1117 int32_t return_value = -1;
1118 uint64_t crc = 0;
1119 if (method == kCompressStored) {
1120 return_value = CopyFileToFile(archive->fd, begin, size, &crc);
1121 } else if (method == kCompressDeflated) {
1122 return_value = InflateToFile(archive->fd, entry, begin, size, &crc);
1123 }
1124
1125 if (!return_value && entry->has_data_descriptor) {
1126 return_value = UpdateEntryFromDataDescriptor(archive->fd, entry);
1127 if (return_value) {
1128 return return_value;
1129 }
1130 }
1131
1132 // TODO: Fix this check by passing the right flags to inflate2 so that
1133 // it calculates the CRC for us.
1134 if (entry->crc32 != crc && false) {
Mark Salyzyn088bf902014-05-08 16:02:20 -07001135 ALOGW("Zip: crc mismatch: expected %" PRIu32 ", was %" PRIu64, entry->crc32, crc);
Narayan Kamath7462f022013-11-21 13:05:04 +00001136 return kInconsistentInformation;
1137 }
1138
1139 return return_value;
1140}
1141
1142int32_t ExtractEntryToFile(ZipArchiveHandle handle,
1143 ZipEntry* entry, int fd) {
1144 const int32_t declared_length = entry->uncompressed_length;
1145
Narayan Kamath00a258c2013-12-13 16:06:19 +00001146 const off64_t current_offset = lseek64(fd, 0, SEEK_CUR);
1147 if (current_offset == -1) {
1148 ALOGW("Zip: unable to seek to current location on fd %d: %s", fd,
1149 strerror(errno));
Narayan Kamath7462f022013-11-21 13:05:04 +00001150 return kIoError;
1151 }
1152
Narayan Kamath00a258c2013-12-13 16:06:19 +00001153 int result = TEMP_FAILURE_RETRY(ftruncate(fd, declared_length + current_offset));
1154 if (result == -1) {
Mark Salyzyn99ef9912014-03-14 14:26:22 -07001155 ALOGW("Zip: unable to truncate file to %" PRId64 ": %s",
Mark Salyzyn56a90a02014-05-08 17:20:55 -07001156 (int64_t)(declared_length + current_offset), strerror(errno));
Narayan Kamath00a258c2013-12-13 16:06:19 +00001157 return kIoError;
1158 }
1159
Narayan Kamath48953a12014-01-24 12:32:39 +00001160 // Don't attempt to map a region of length 0. We still need the
1161 // ftruncate() though, since the API guarantees that we will truncate
1162 // the file to the end of the uncompressed output.
1163 if (declared_length == 0) {
1164 return 0;
1165 }
1166
Narayan Kamath00a258c2013-12-13 16:06:19 +00001167 android::FileMap* map = MapFileSegment(fd, current_offset, declared_length,
Narayan Kamatheaf98852013-12-11 14:51:51 +00001168 false, kTempMappingFileName);
1169 if (map == NULL) {
1170 return kMmapFailed;
Narayan Kamath7462f022013-11-21 13:05:04 +00001171 }
1172
Narayan Kamatheaf98852013-12-11 14:51:51 +00001173 const int32_t error = ExtractToMemory(handle, entry,
1174 reinterpret_cast<uint8_t*>(map->getDataPtr()),
1175 map->getDataLength());
1176 map->release();
Narayan Kamath7462f022013-11-21 13:05:04 +00001177 return error;
1178}
1179
1180const char* ErrorCodeString(int32_t error_code) {
1181 if (error_code > kErrorMessageLowerBound && error_code < kErrorMessageUpperBound) {
1182 return kErrorMessages[error_code * -1];
1183 }
1184
1185 return kErrorMessages[0];
1186}
1187
1188int GetFileDescriptor(const ZipArchiveHandle handle) {
1189 return ((ZipArchive*) handle)->fd;
1190}
1191