blob: e6e0276a3af29c16d0d526434f2aa778944878bf [file] [log] [blame]
Narayan Kamath7462f022013-11-21 13:05:04 +00001/*
2 * Copyright (C) 2008 The Android Open Source Project
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 * http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
16
17/*
18 * Read-only access to Zip archives, with minimal heap allocation.
19 */
Narayan Kamath7462f022013-11-21 13:05:04 +000020
Mark Salyzyncfd5b082016-10-17 14:28:00 -070021#define LOG_TAG "ziparchive"
22
Narayan Kamath7462f022013-11-21 13:05:04 +000023#include <assert.h>
24#include <errno.h>
Mark Salyzyn99ef9912014-03-14 14:26:22 -070025#include <fcntl.h>
26#include <inttypes.h>
Narayan Kamath7462f022013-11-21 13:05:04 +000027#include <limits.h>
Narayan Kamath7462f022013-11-21 13:05:04 +000028#include <stdlib.h>
29#include <string.h>
Narayan Kamath7462f022013-11-21 13:05:04 +000030#include <unistd.h>
31
Dan Albert1ae07642015-04-09 14:11:18 -070032#include <memory>
33#include <vector>
34
Mark Salyzynff2dcd92016-09-28 15:54:45 -070035#include <android-base/file.h>
36#include <android-base/logging.h>
37#include <android-base/macros.h> // TEMP_FAILURE_RETRY may or may not be in unistd
38#include <android-base/memory.h>
Mark Salyzyncfd5b082016-10-17 14:28:00 -070039#include <log/log.h>
Mark Salyzynff2dcd92016-09-28 15:54:45 -070040#include <utils/Compat.h>
41#include <utils/FileMap.h>
Christopher Ferrise6884ce2015-11-10 14:55:12 -080042#include "ziparchive/zip_archive.h"
Dan Albert1ae07642015-04-09 14:11:18 -070043#include "zlib.h"
Narayan Kamath7462f022013-11-21 13:05:04 +000044
Narayan Kamath044bc8e2014-12-03 18:22:53 +000045#include "entry_name_utils-inl.h"
Adam Lesinskiad4ad8c2015-10-05 18:16:18 -070046#include "zip_archive_common.h"
Christopher Ferrise6884ce2015-11-10 14:55:12 -080047#include "zip_archive_private.h"
Mark Salyzyn99ef9912014-03-14 14:26:22 -070048
Dan Albert1ae07642015-04-09 14:11:18 -070049using android::base::get_unaligned;
Narayan Kamath044bc8e2014-12-03 18:22:53 +000050
// Windows distinguishes text and binary file modes; a zip file must be opened
// in binary mode or the bytes read back will not match the file contents.
// Platforms without O_BINARY get a no-op definition.
53#ifndef O_BINARY
54#define O_BINARY 0
55#endif
56
Narayan Kamath926973e2014-06-09 14:18:14 +010057// The maximum number of bytes to scan backwards for the EOCD start.
58static const uint32_t kMaxEOCDSearch = kMaxCommentLen + sizeof(EocdRecord);
59
// Human-readable text for each return code. Entry i describes code -i
// (entry 0 is the "Unknown return code." text), so the order here must match
// the numeric values of the constants below.
static const char* kErrorMessages[] = {
  "Unknown return code.",           //   0
  "Iteration ended",                //  -1  kIterationEnd
  "Zlib error",                     //  -2  kZlibError
  "Invalid file",                   //  -3  kInvalidFile
  "Invalid handle",                 //  -4  kInvalidHandle
  "Duplicate entries in archive",   //  -5  kDuplicateEntry
  "Empty archive",                  //  -6  kEmptyArchive
  "Entry not found",                //  -7  kEntryNotFound
  "Invalid offset",                 //  -8  kInvalidOffset
  "Inconsistent information",       //  -9  kInconsistentInformation
  "Invalid entry name",             // -10  kInvalidEntryName
  "I/O Error",                      // -11  kIoError
  "File mapping failed"             // -12  kMmapFailed
};

// Every error code defined below lies strictly between kErrorMessageLowerBound
// and kErrorMessageUpperBound.
static const int32_t kErrorMessageUpperBound = 0;

// Matches the "Iteration ended" message.
static const int32_t kIterationEnd = -1;

// Zlib reported an error while inflating a stream from the file; this usually
// means the file is corrupt.
static const int32_t kZlibError = -2;

// The input cannot be handled as a zip archive, typically because it is too
// small, too large, or lacks a valid signature.
static const int32_t kInvalidFile = -3;

// The caller supplied an invalid iteration or archive handle.
static const int32_t kInvalidHandle = -4;

// Two or more entries in the archive share the same name.
static const int32_t kDuplicateEntry = -5;

// The archive has no entries.
static const int32_t kEmptyArchive = -6;

// The requested entry is not present in the archive.
static const int32_t kEntryNotFound = -7;

// The archive contains an invalid local file header pointer.
static const int32_t kInvalidOffset = -8;

// Entry information is inconsistent: the central directory and local file
// header disagree, or the actual uncompressed length / crc32 differ from the
// declared values.
static const int32_t kInconsistentInformation = -9;

// An entry name in the archive is invalid.
static const int32_t kInvalidEntryName = -10;

// An I/O related system call (read, lseek, ftruncate, map) failed.
static const int32_t kIoError = -11;

// The central directory or the entry contents could not be mmapped.
static const int32_t kMmapFailed = -12;

static const int32_t kErrorMessageLowerBound = -13;
Narayan Kamath7462f022013-11-21 13:05:04 +0000121
Narayan Kamath7462f022013-11-21 13:05:04 +0000122/*
123 * A Read-only Zip archive.
124 *
125 * We want "open" and "find entry by name" to be fast operations, and
126 * we want to use as little memory as possible. We memory-map the zip
127 * central directory, and load a hash table with pointers to the filenames
128 * (which aren't null-terminated). The other fields are at a fixed offset
129 * from the filename, so we don't need to extract those (but we do need
130 * to byte-read and endian-swap them every time we want them).
131 *
132 * It's possible that somebody has handed us a massive (~1GB) zip archive,
133 * so we can't expect to mmap the entire file.
134 *
135 * To speed comparisons when doing a lookup by name, we could make the mapping
136 * "private" (copy-on-write) and null-terminate the filenames after verifying
137 * the record structure. However, this requires a private mapping of
138 * every page that the Central Directory touches. Easier to tuck a copy
139 * of the string length into the hash table entry.
140 */
Narayan Kamath7462f022013-11-21 13:05:04 +0000141
/*
 * Returns the smallest power of 2 that is >= val.
 *
 * Works by smearing the highest set bit of (val - 1) into every lower bit
 * position and then adding one (the bit trick published at
 * http://graphics.stanford.edu/~seander/bithacks.html). Inputs of 0 and
 * inputs above 2^31 wrap around and yield 0.
 */
static uint32_t RoundUpPower2(uint32_t val) {
  uint32_t smeared = val - 1;
  for (uint32_t shift = 1; shift < 32; shift <<= 1) {
    smeared |= smeared >> shift;
  }
  return smeared + 1;
}
158
Yusuke Sato07447542015-06-25 14:39:19 -0700159static uint32_t ComputeHash(const ZipString& name) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000160 uint32_t hash = 0;
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100161 uint16_t len = name.name_length;
162 const uint8_t* str = name.name;
Narayan Kamath7462f022013-11-21 13:05:04 +0000163
164 while (len--) {
165 hash = hash * 31 + *str++;
166 }
167
168 return hash;
169}
170
171/*
172 * Convert a ZipEntry to a hash table index, verifying that it's in a
173 * valid range.
174 */
Yusuke Sato07447542015-06-25 14:39:19 -0700175static int64_t EntryToIndex(const ZipString* hash_table,
Narayan Kamath7462f022013-11-21 13:05:04 +0000176 const uint32_t hash_table_size,
Yusuke Sato07447542015-06-25 14:39:19 -0700177 const ZipString& name) {
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100178 const uint32_t hash = ComputeHash(name);
Narayan Kamath7462f022013-11-21 13:05:04 +0000179
180 // NOTE: (hash_table_size - 1) is guaranteed to be non-negative.
181 uint32_t ent = hash & (hash_table_size - 1);
182 while (hash_table[ent].name != NULL) {
Yusuke Sato07447542015-06-25 14:39:19 -0700183 if (hash_table[ent] == name) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000184 return ent;
185 }
186
187 ent = (ent + 1) & (hash_table_size - 1);
188 }
189
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100190 ALOGV("Zip: Unable to find entry %.*s", name.name_length, name.name);
Narayan Kamath7462f022013-11-21 13:05:04 +0000191 return kEntryNotFound;
192}
193
194/*
195 * Add a new entry to the hash table.
196 */
Yusuke Sato07447542015-06-25 14:39:19 -0700197static int32_t AddToHash(ZipString *hash_table, const uint64_t hash_table_size,
198 const ZipString& name) {
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100199 const uint64_t hash = ComputeHash(name);
Narayan Kamath7462f022013-11-21 13:05:04 +0000200 uint32_t ent = hash & (hash_table_size - 1);
201
202 /*
203 * We over-allocated the table, so we're guaranteed to find an empty slot.
204 * Further, we guarantee that the hashtable size is not 0.
205 */
206 while (hash_table[ent].name != NULL) {
Yusuke Sato07447542015-06-25 14:39:19 -0700207 if (hash_table[ent] == name) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000208 // We've found a duplicate entry. We don't accept it
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100209 ALOGW("Zip: Found duplicate entry %.*s", name.name_length, name.name);
Narayan Kamath7462f022013-11-21 13:05:04 +0000210 return kDuplicateEntry;
211 }
212 ent = (ent + 1) & (hash_table_size - 1);
213 }
214
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100215 hash_table[ent].name = name.name;
216 hash_table[ent].name_length = name.name_length;
Narayan Kamath7462f022013-11-21 13:05:04 +0000217 return 0;
218}
219
Tianjie Xu18c25922016-09-29 15:27:41 -0700220static int32_t MapCentralDirectory0(const char* debug_file_name, ZipArchive* archive,
221 off64_t file_length, off64_t read_amount,
222 uint8_t* scan_buffer) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000223 const off64_t search_start = file_length - read_amount;
224
Tianjie Xu18c25922016-09-29 15:27:41 -0700225 if(!archive->mapped_zip.ReadAtOffset(scan_buffer, read_amount, search_start)) {
226 ALOGE("Zip: read %" PRId64 " from offset %" PRId64 " failed",
227 static_cast<int64_t>(read_amount), static_cast<int64_t>(search_start));
Narayan Kamath7462f022013-11-21 13:05:04 +0000228 return kIoError;
229 }
230
231 /*
232 * Scan backward for the EOCD magic. In an archive without a trailing
233 * comment, we'll find it on the first try. (We may want to consider
234 * doing an initial minimal read; if we don't find it, retry with a
235 * second read as above.)
236 */
Narayan Kamath926973e2014-06-09 14:18:14 +0100237 int i = read_amount - sizeof(EocdRecord);
238 for (; i >= 0; i--) {
Dan Albert1ae07642015-04-09 14:11:18 -0700239 if (scan_buffer[i] == 0x50) {
240 uint32_t* sig_addr = reinterpret_cast<uint32_t*>(&scan_buffer[i]);
241 if (get_unaligned<uint32_t>(sig_addr) == EocdRecord::kSignature) {
242 ALOGV("+++ Found EOCD at buf+%d", i);
243 break;
244 }
Narayan Kamath7462f022013-11-21 13:05:04 +0000245 }
246 }
247 if (i < 0) {
248 ALOGD("Zip: EOCD not found, %s is not zip", debug_file_name);
249 return kInvalidFile;
250 }
251
252 const off64_t eocd_offset = search_start + i;
Narayan Kamath926973e2014-06-09 14:18:14 +0100253 const EocdRecord* eocd = reinterpret_cast<const EocdRecord*>(scan_buffer + i);
Narayan Kamath7462f022013-11-21 13:05:04 +0000254 /*
Narayan Kamath926973e2014-06-09 14:18:14 +0100255 * Verify that there's no trailing space at the end of the central directory
256 * and its comment.
Narayan Kamath7462f022013-11-21 13:05:04 +0000257 */
Narayan Kamath926973e2014-06-09 14:18:14 +0100258 const off64_t calculated_length = eocd_offset + sizeof(EocdRecord)
259 + eocd->comment_length;
260 if (calculated_length != file_length) {
Narayan Kamath4f6b4992014-06-03 13:59:23 +0100261 ALOGW("Zip: %" PRId64 " extraneous bytes at the end of the central directory",
Narayan Kamath926973e2014-06-09 14:18:14 +0100262 static_cast<int64_t>(file_length - calculated_length));
Narayan Kamath4f6b4992014-06-03 13:59:23 +0100263 return kInvalidFile;
264 }
Narayan Kamath7462f022013-11-21 13:05:04 +0000265
Narayan Kamath926973e2014-06-09 14:18:14 +0100266 /*
267 * Grab the CD offset and size, and the number of entries in the
268 * archive and verify that they look reasonable.
269 */
270 if (eocd->cd_start_offset + eocd->cd_size > eocd_offset) {
271 ALOGW("Zip: bad offsets (dir %" PRIu32 ", size %" PRIu32 ", eocd %" PRId64 ")",
272 eocd->cd_start_offset, eocd->cd_size, static_cast<int64_t>(eocd_offset));
Narayan Kamath7462f022013-11-21 13:05:04 +0000273 return kInvalidOffset;
274 }
Narayan Kamath926973e2014-06-09 14:18:14 +0100275 if (eocd->num_records == 0) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000276 ALOGW("Zip: empty archive?");
277 return kEmptyArchive;
278 }
279
Elliott Hughese49236b2015-06-04 15:21:59 -0700280 ALOGV("+++ num_entries=%" PRIu32 " dir_size=%" PRIu32 " dir_offset=%" PRIu32,
Narayan Kamath926973e2014-06-09 14:18:14 +0100281 eocd->num_records, eocd->cd_size, eocd->cd_start_offset);
Narayan Kamath7462f022013-11-21 13:05:04 +0000282
283 /*
284 * It all looks good. Create a mapping for the CD, and set the fields
285 * in archive.
286 */
Tianjie Xu18c25922016-09-29 15:27:41 -0700287
288 if (!archive->InitializeCentralDirectory(debug_file_name,
289 static_cast<off64_t>(eocd->cd_start_offset),
290 static_cast<size_t>(eocd->cd_size))) {
291 ALOGE("Zip: failed to intialize central directory.\n");
Narayan Kamatheaf98852013-12-11 14:51:51 +0000292 return kMmapFailed;
Narayan Kamath7462f022013-11-21 13:05:04 +0000293 }
294
Narayan Kamath926973e2014-06-09 14:18:14 +0100295 archive->num_entries = eocd->num_records;
296 archive->directory_offset = eocd->cd_start_offset;
Narayan Kamath7462f022013-11-21 13:05:04 +0000297
298 return 0;
299}
300
301/*
302 * Find the zip Central Directory and memory-map it.
303 *
304 * On success, returns 0 after populating fields from the EOCD area:
305 * directory_offset
Tianjie Xu18c25922016-09-29 15:27:41 -0700306 * directory_ptr
Narayan Kamath7462f022013-11-21 13:05:04 +0000307 * num_entries
308 */
Tianjie Xu18c25922016-09-29 15:27:41 -0700309static int32_t MapCentralDirectory(const char* debug_file_name, ZipArchive* archive) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000310
311 // Test file length. We use lseek64 to make sure the file
312 // is small enough to be a zip file (Its size must be less than
313 // 0xffffffff bytes).
Tianjie Xu18c25922016-09-29 15:27:41 -0700314 off64_t file_length = archive->mapped_zip.GetFileLength();
Narayan Kamath7462f022013-11-21 13:05:04 +0000315 if (file_length == -1) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000316 return kInvalidFile;
317 }
318
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800319 if (file_length > static_cast<off64_t>(0xffffffff)) {
Narayan Kamath926973e2014-06-09 14:18:14 +0100320 ALOGV("Zip: zip file too long %" PRId64, static_cast<int64_t>(file_length));
Narayan Kamath7462f022013-11-21 13:05:04 +0000321 return kInvalidFile;
322 }
323
Narayan Kamath926973e2014-06-09 14:18:14 +0100324 if (file_length < static_cast<off64_t>(sizeof(EocdRecord))) {
325 ALOGV("Zip: length %" PRId64 " is too small to be zip", static_cast<int64_t>(file_length));
Narayan Kamath7462f022013-11-21 13:05:04 +0000326 return kInvalidFile;
327 }
328
329 /*
330 * Perform the traditional EOCD snipe hunt.
331 *
332 * We're searching for the End of Central Directory magic number,
333 * which appears at the start of the EOCD block. It's followed by
334 * 18 bytes of EOCD stuff and up to 64KB of archive comment. We
335 * need to read the last part of the file into a buffer, dig through
336 * it to find the magic number, parse some values out, and use those
337 * to determine the extent of the CD.
338 *
339 * We start by pulling in the last part of the file.
340 */
Narayan Kamath926973e2014-06-09 14:18:14 +0100341 off64_t read_amount = kMaxEOCDSearch;
342 if (file_length < read_amount) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000343 read_amount = file_length;
344 }
345
Tianjie Xu18c25922016-09-29 15:27:41 -0700346 std::vector<uint8_t> scan_buffer(read_amount);
347 int32_t result = MapCentralDirectory0(debug_file_name, archive, file_length, read_amount,
348 scan_buffer.data());
Narayan Kamath7462f022013-11-21 13:05:04 +0000349 return result;
350}
351
352/*
353 * Parses the Zip archive's Central Directory. Allocates and populates the
354 * hash table.
355 *
356 * Returns 0 on success.
357 */
358static int32_t ParseZipArchive(ZipArchive* archive) {
Tianjie Xu18c25922016-09-29 15:27:41 -0700359 const uint8_t* const cd_ptr = archive->central_directory.GetBasePtr();
360 const size_t cd_length = archive->central_directory.GetMapLength();
Narayan Kamath926973e2014-06-09 14:18:14 +0100361 const uint16_t num_entries = archive->num_entries;
Narayan Kamath7462f022013-11-21 13:05:04 +0000362
363 /*
364 * Create hash table. We have a minimum 75% load factor, possibly as
365 * low as 50% after we round off to a power of 2. There must be at
366 * least one unused entry to avoid an infinite loop during creation.
367 */
368 archive->hash_table_size = RoundUpPower2(1 + (num_entries * 4) / 3);
Yusuke Sato07447542015-06-25 14:39:19 -0700369 archive->hash_table = reinterpret_cast<ZipString*>(calloc(archive->hash_table_size,
370 sizeof(ZipString)));
Narayan Kamath7462f022013-11-21 13:05:04 +0000371
372 /*
373 * Walk through the central directory, adding entries to the hash
374 * table and verifying values.
375 */
Narayan Kamath926973e2014-06-09 14:18:14 +0100376 const uint8_t* const cd_end = cd_ptr + cd_length;
Narayan Kamath7462f022013-11-21 13:05:04 +0000377 const uint8_t* ptr = cd_ptr;
378 for (uint16_t i = 0; i < num_entries; i++) {
Narayan Kamath926973e2014-06-09 14:18:14 +0100379 const CentralDirectoryRecord* cdr =
380 reinterpret_cast<const CentralDirectoryRecord*>(ptr);
381 if (cdr->record_signature != CentralDirectoryRecord::kSignature) {
Mark Salyzyn088bf902014-05-08 16:02:20 -0700382 ALOGW("Zip: missed a central dir sig (at %" PRIu16 ")", i);
Dmitriy Ivanov3ea93da2015-03-06 11:48:47 -0800383 return -1;
Narayan Kamath7462f022013-11-21 13:05:04 +0000384 }
385
Narayan Kamath926973e2014-06-09 14:18:14 +0100386 if (ptr + sizeof(CentralDirectoryRecord) > cd_end) {
Mark Salyzyn088bf902014-05-08 16:02:20 -0700387 ALOGW("Zip: ran off the end (at %" PRIu16 ")", i);
Dmitriy Ivanov3ea93da2015-03-06 11:48:47 -0800388 return -1;
Narayan Kamath7462f022013-11-21 13:05:04 +0000389 }
390
Narayan Kamath926973e2014-06-09 14:18:14 +0100391 const off64_t local_header_offset = cdr->local_file_header_offset;
Narayan Kamath7462f022013-11-21 13:05:04 +0000392 if (local_header_offset >= archive->directory_offset) {
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800393 ALOGW("Zip: bad LFH offset %" PRId64 " at entry %" PRIu16,
394 static_cast<int64_t>(local_header_offset), i);
Dmitriy Ivanov3ea93da2015-03-06 11:48:47 -0800395 return -1;
Narayan Kamath7462f022013-11-21 13:05:04 +0000396 }
397
Narayan Kamath926973e2014-06-09 14:18:14 +0100398 const uint16_t file_name_length = cdr->file_name_length;
399 const uint16_t extra_length = cdr->extra_field_length;
400 const uint16_t comment_length = cdr->comment_length;
Piotr Jastrzebski78271ba2014-08-15 12:53:00 +0100401 const uint8_t* file_name = ptr + sizeof(CentralDirectoryRecord);
402
Narayan Kamath044bc8e2014-12-03 18:22:53 +0000403 /* check that file name is valid UTF-8 and doesn't contain NUL (U+0000) characters */
404 if (!IsValidEntryName(file_name, file_name_length)) {
Dmitriy Ivanov3ea93da2015-03-06 11:48:47 -0800405 return -1;
Piotr Jastrzebski78271ba2014-08-15 12:53:00 +0100406 }
Narayan Kamath7462f022013-11-21 13:05:04 +0000407
408 /* add the CDE filename to the hash table */
Yusuke Sato07447542015-06-25 14:39:19 -0700409 ZipString entry_name;
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100410 entry_name.name = file_name;
411 entry_name.name_length = file_name_length;
Narayan Kamath7462f022013-11-21 13:05:04 +0000412 const int add_result = AddToHash(archive->hash_table,
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100413 archive->hash_table_size, entry_name);
Dmitriy Ivanov3ea93da2015-03-06 11:48:47 -0800414 if (add_result != 0) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000415 ALOGW("Zip: Error adding entry to hash table %d", add_result);
Dmitriy Ivanov3ea93da2015-03-06 11:48:47 -0800416 return add_result;
Narayan Kamath7462f022013-11-21 13:05:04 +0000417 }
418
Narayan Kamath926973e2014-06-09 14:18:14 +0100419 ptr += sizeof(CentralDirectoryRecord) + file_name_length + extra_length + comment_length;
420 if ((ptr - cd_ptr) > static_cast<int64_t>(cd_length)) {
Mark Salyzyn088bf902014-05-08 16:02:20 -0700421 ALOGW("Zip: bad CD advance (%tu vs %zu) at entry %" PRIu16,
422 ptr - cd_ptr, cd_length, i);
Dmitriy Ivanov3ea93da2015-03-06 11:48:47 -0800423 return -1;
Narayan Kamath7462f022013-11-21 13:05:04 +0000424 }
425 }
Mark Salyzyn088bf902014-05-08 16:02:20 -0700426 ALOGV("+++ zip good scan %" PRIu16 " entries", num_entries);
Narayan Kamath7462f022013-11-21 13:05:04 +0000427
Dmitriy Ivanov3ea93da2015-03-06 11:48:47 -0800428 return 0;
Narayan Kamath7462f022013-11-21 13:05:04 +0000429}
430
431static int32_t OpenArchiveInternal(ZipArchive* archive,
432 const char* debug_file_name) {
433 int32_t result = -1;
Tianjie Xu18c25922016-09-29 15:27:41 -0700434 if ((result = MapCentralDirectory(debug_file_name, archive)) != 0) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000435 return result;
436 }
437
438 if ((result = ParseZipArchive(archive))) {
439 return result;
440 }
441
442 return 0;
443}
444
445int32_t OpenArchiveFd(int fd, const char* debug_file_name,
Dmitriy Ivanov40b52b22014-07-15 19:33:00 -0700446 ZipArchiveHandle* handle, bool assume_ownership) {
447 ZipArchive* archive = new ZipArchive(fd, assume_ownership);
Narayan Kamath7462f022013-11-21 13:05:04 +0000448 *handle = archive;
Narayan Kamath7462f022013-11-21 13:05:04 +0000449 return OpenArchiveInternal(archive, debug_file_name);
450}
451
452int32_t OpenArchive(const char* fileName, ZipArchiveHandle* handle) {
Neil Fullerb1a113f2014-07-25 14:43:04 +0100453 const int fd = open(fileName, O_RDONLY | O_BINARY, 0);
Dmitriy Ivanov40b52b22014-07-15 19:33:00 -0700454 ZipArchive* archive = new ZipArchive(fd, true);
Narayan Kamath7462f022013-11-21 13:05:04 +0000455 *handle = archive;
456
Narayan Kamath7462f022013-11-21 13:05:04 +0000457 if (fd < 0) {
458 ALOGW("Unable to open '%s': %s", fileName, strerror(errno));
459 return kIoError;
Narayan Kamath7462f022013-11-21 13:05:04 +0000460 }
Dmitriy Ivanov40b52b22014-07-15 19:33:00 -0700461
Narayan Kamath7462f022013-11-21 13:05:04 +0000462 return OpenArchiveInternal(archive, fileName);
463}
464
Tianjie Xu18c25922016-09-29 15:27:41 -0700465int32_t OpenArchiveFromMemory(void* address, size_t length, const char* debug_file_name,
466 ZipArchiveHandle *handle) {
467 ZipArchive* archive = new ZipArchive(address, length);
468 *handle = archive;
469 return OpenArchiveInternal(archive, debug_file_name);
470}
471
Narayan Kamath7462f022013-11-21 13:05:04 +0000472/*
473 * Close a ZipArchive, closing the file and freeing the contents.
474 */
475void CloseArchive(ZipArchiveHandle handle) {
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800476 ZipArchive* archive = reinterpret_cast<ZipArchive*>(handle);
Narayan Kamath7462f022013-11-21 13:05:04 +0000477 ALOGV("Closing archive %p", archive);
Neil Fullerb1a113f2014-07-25 14:43:04 +0100478 delete archive;
Narayan Kamath7462f022013-11-21 13:05:04 +0000479}
480
Tianjie Xu18c25922016-09-29 15:27:41 -0700481static int32_t UpdateEntryFromDataDescriptor(MappedZipFile& mapped_zip,
Narayan Kamath7462f022013-11-21 13:05:04 +0000482 ZipEntry *entry) {
Narayan Kamath926973e2014-06-09 14:18:14 +0100483 uint8_t ddBuf[sizeof(DataDescriptor) + sizeof(DataDescriptor::kOptSignature)];
Tianjie Xu18c25922016-09-29 15:27:41 -0700484 if (!mapped_zip.ReadData(ddBuf, sizeof(ddBuf))) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000485 return kIoError;
486 }
487
Narayan Kamath926973e2014-06-09 14:18:14 +0100488 const uint32_t ddSignature = *(reinterpret_cast<const uint32_t*>(ddBuf));
489 const uint16_t offset = (ddSignature == DataDescriptor::kOptSignature) ? 4 : 0;
490 const DataDescriptor* descriptor = reinterpret_cast<const DataDescriptor*>(ddBuf + offset);
Narayan Kamath7462f022013-11-21 13:05:04 +0000491
Narayan Kamath926973e2014-06-09 14:18:14 +0100492 entry->crc32 = descriptor->crc32;
493 entry->compressed_length = descriptor->compressed_size;
494 entry->uncompressed_length = descriptor->uncompressed_size;
Narayan Kamath7462f022013-11-21 13:05:04 +0000495
496 return 0;
497}
498
Narayan Kamath7462f022013-11-21 13:05:04 +0000499static int32_t FindEntry(const ZipArchive* archive, const int ent,
500 ZipEntry* data) {
501 const uint16_t nameLen = archive->hash_table[ent].name_length;
Narayan Kamath7462f022013-11-21 13:05:04 +0000502
503 // Recover the start of the central directory entry from the filename
504 // pointer. The filename is the first entry past the fixed-size data,
505 // so we can just subtract back from that.
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100506 const uint8_t* ptr = archive->hash_table[ent].name;
Narayan Kamath926973e2014-06-09 14:18:14 +0100507 ptr -= sizeof(CentralDirectoryRecord);
Narayan Kamath7462f022013-11-21 13:05:04 +0000508
509 // This is the base of our mmapped region, we have to sanity check that
510 // the name that's in the hash table is a pointer to a location within
511 // this mapped region.
Tianjie Xu18c25922016-09-29 15:27:41 -0700512 const uint8_t* base_ptr = archive->central_directory.GetBasePtr();
513 if (ptr < base_ptr || ptr > base_ptr + archive->central_directory.GetMapLength()) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000514 ALOGW("Zip: Invalid entry pointer");
515 return kInvalidOffset;
516 }
517
Narayan Kamath926973e2014-06-09 14:18:14 +0100518 const CentralDirectoryRecord *cdr =
519 reinterpret_cast<const CentralDirectoryRecord*>(ptr);
520
Narayan Kamath7462f022013-11-21 13:05:04 +0000521 // The offset of the start of the central directory in the zipfile.
522 // We keep this lying around so that we can sanity check all our lengths
523 // and our per-file structures.
524 const off64_t cd_offset = archive->directory_offset;
525
526 // Fill out the compression method, modification time, crc32
527 // and other interesting attributes from the central directory. These
528 // will later be compared against values from the local file header.
Narayan Kamath926973e2014-06-09 14:18:14 +0100529 data->method = cdr->compression_method;
beonit0e99a2f2015-07-18 02:08:16 +0900530 data->mod_time = cdr->last_mod_date << 16 | cdr->last_mod_time;
Narayan Kamath926973e2014-06-09 14:18:14 +0100531 data->crc32 = cdr->crc32;
532 data->compressed_length = cdr->compressed_size;
533 data->uncompressed_length = cdr->uncompressed_size;
Narayan Kamath7462f022013-11-21 13:05:04 +0000534
535 // Figure out the local header offset from the central directory. The
536 // actual file data will begin after the local header and the name /
537 // extra comments.
Narayan Kamath926973e2014-06-09 14:18:14 +0100538 const off64_t local_header_offset = cdr->local_file_header_offset;
539 if (local_header_offset + static_cast<off64_t>(sizeof(LocalFileHeader)) >= cd_offset) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000540 ALOGW("Zip: bad local hdr offset in zip");
541 return kInvalidOffset;
542 }
543
Narayan Kamath926973e2014-06-09 14:18:14 +0100544 uint8_t lfh_buf[sizeof(LocalFileHeader)];
Tianjie Xu18c25922016-09-29 15:27:41 -0700545 if (!archive->mapped_zip.ReadAtOffset(lfh_buf, sizeof(lfh_buf), local_header_offset)) {
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800546 ALOGW("Zip: failed reading lfh name from offset %" PRId64,
547 static_cast<int64_t>(local_header_offset));
Narayan Kamath7462f022013-11-21 13:05:04 +0000548 return kIoError;
549 }
550
Narayan Kamath926973e2014-06-09 14:18:14 +0100551 const LocalFileHeader *lfh = reinterpret_cast<const LocalFileHeader*>(lfh_buf);
552
553 if (lfh->lfh_signature != LocalFileHeader::kSignature) {
Mark Salyzyn99ef9912014-03-14 14:26:22 -0700554 ALOGW("Zip: didn't find signature at start of lfh, offset=%" PRId64,
Narayan Kamath926973e2014-06-09 14:18:14 +0100555 static_cast<int64_t>(local_header_offset));
Narayan Kamath7462f022013-11-21 13:05:04 +0000556 return kInvalidOffset;
557 }
558
559 // Paranoia: Match the values specified in the local file header
560 // to those specified in the central directory.
Narayan Kamath926973e2014-06-09 14:18:14 +0100561 if ((lfh->gpb_flags & kGPBDDFlagMask) == 0) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000562 data->has_data_descriptor = 0;
Narayan Kamath926973e2014-06-09 14:18:14 +0100563 if (data->compressed_length != lfh->compressed_size
564 || data->uncompressed_length != lfh->uncompressed_size
565 || data->crc32 != lfh->crc32) {
Mark Salyzyn088bf902014-05-08 16:02:20 -0700566 ALOGW("Zip: size/crc32 mismatch. expected {%" PRIu32 ", %" PRIu32
567 ", %" PRIx32 "}, was {%" PRIu32 ", %" PRIu32 ", %" PRIx32 "}",
Narayan Kamath7462f022013-11-21 13:05:04 +0000568 data->compressed_length, data->uncompressed_length, data->crc32,
Narayan Kamath926973e2014-06-09 14:18:14 +0100569 lfh->compressed_size, lfh->uncompressed_size, lfh->crc32);
Narayan Kamath7462f022013-11-21 13:05:04 +0000570 return kInconsistentInformation;
571 }
572 } else {
573 data->has_data_descriptor = 1;
574 }
575
576 // Check that the local file header name matches the declared
577 // name in the central directory.
Narayan Kamath926973e2014-06-09 14:18:14 +0100578 if (lfh->file_name_length == nameLen) {
579 const off64_t name_offset = local_header_offset + sizeof(LocalFileHeader);
Mykola Kondratenko50afc152014-09-08 12:46:37 +0200580 if (name_offset + lfh->file_name_length > cd_offset) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000581 ALOGW("Zip: Invalid declared length");
582 return kInvalidOffset;
583 }
584
Tianjie Xu18c25922016-09-29 15:27:41 -0700585 std::vector<uint8_t> name_buf(nameLen);
586 if (!archive->mapped_zip.ReadAtOffset(name_buf.data(), nameLen, name_offset)) {
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800587 ALOGW("Zip: failed reading lfh name from offset %" PRId64, static_cast<int64_t>(name_offset));
Narayan Kamath7462f022013-11-21 13:05:04 +0000588 return kIoError;
589 }
590
Tianjie Xu18c25922016-09-29 15:27:41 -0700591 if (memcmp(archive->hash_table[ent].name, name_buf.data(), nameLen)) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000592 return kInconsistentInformation;
593 }
594
Narayan Kamath7462f022013-11-21 13:05:04 +0000595 } else {
596 ALOGW("Zip: lfh name did not match central directory.");
597 return kInconsistentInformation;
598 }
599
Narayan Kamath926973e2014-06-09 14:18:14 +0100600 const off64_t data_offset = local_header_offset + sizeof(LocalFileHeader)
601 + lfh->file_name_length + lfh->extra_field_length;
Narayan Kamath48953a12014-01-24 12:32:39 +0000602 if (data_offset > cd_offset) {
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800603 ALOGW("Zip: bad data offset %" PRId64 " in zip", static_cast<int64_t>(data_offset));
Narayan Kamath7462f022013-11-21 13:05:04 +0000604 return kInvalidOffset;
605 }
606
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800607 if (static_cast<off64_t>(data_offset + data->compressed_length) > cd_offset) {
Mark Salyzyn088bf902014-05-08 16:02:20 -0700608 ALOGW("Zip: bad compressed length in zip (%" PRId64 " + %" PRIu32 " > %" PRId64 ")",
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800609 static_cast<int64_t>(data_offset), data->compressed_length, static_cast<int64_t>(cd_offset));
Narayan Kamath7462f022013-11-21 13:05:04 +0000610 return kInvalidOffset;
611 }
612
613 if (data->method == kCompressStored &&
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800614 static_cast<off64_t>(data_offset + data->uncompressed_length) > cd_offset) {
Mark Salyzyn088bf902014-05-08 16:02:20 -0700615 ALOGW("Zip: bad uncompressed length in zip (%" PRId64 " + %" PRIu32 " > %" PRId64 ")",
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800616 static_cast<int64_t>(data_offset), data->uncompressed_length,
617 static_cast<int64_t>(cd_offset));
Narayan Kamath7462f022013-11-21 13:05:04 +0000618 return kInvalidOffset;
619 }
620
621 data->offset = data_offset;
622 return 0;
623}
624
625struct IterationHandle {
626 uint32_t position;
Piotr Jastrzebski10aa9a02014-08-19 09:01:20 +0100627 // We're not using vector here because this code is used in the Windows SDK
628 // where the STL is not available.
Yusuke Sato07447542015-06-25 14:39:19 -0700629 ZipString prefix;
630 ZipString suffix;
Narayan Kamath7462f022013-11-21 13:05:04 +0000631 ZipArchive* archive;
Piotr Jastrzebski8e085362014-08-18 11:37:45 +0100632
Yusuke Sato07447542015-06-25 14:39:19 -0700633 IterationHandle(const ZipString* in_prefix,
634 const ZipString* in_suffix) {
635 if (in_prefix) {
636 uint8_t* name_copy = new uint8_t[in_prefix->name_length];
637 memcpy(name_copy, in_prefix->name, in_prefix->name_length);
638 prefix.name = name_copy;
639 prefix.name_length = in_prefix->name_length;
640 } else {
641 prefix.name = NULL;
642 prefix.name_length = 0;
Yusuke Satof1d3d3b2015-06-25 14:09:00 -0700643 }
Yusuke Sato07447542015-06-25 14:39:19 -0700644 if (in_suffix) {
645 uint8_t* name_copy = new uint8_t[in_suffix->name_length];
646 memcpy(name_copy, in_suffix->name, in_suffix->name_length);
647 suffix.name = name_copy;
648 suffix.name_length = in_suffix->name_length;
649 } else {
650 suffix.name = NULL;
651 suffix.name_length = 0;
Yusuke Satof1d3d3b2015-06-25 14:09:00 -0700652 }
Piotr Jastrzebski8e085362014-08-18 11:37:45 +0100653 }
654
655 ~IterationHandle() {
Yusuke Sato07447542015-06-25 14:39:19 -0700656 delete[] prefix.name;
657 delete[] suffix.name;
Piotr Jastrzebski8e085362014-08-18 11:37:45 +0100658 }
Narayan Kamath7462f022013-11-21 13:05:04 +0000659};
660
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100661int32_t StartIteration(ZipArchiveHandle handle, void** cookie_ptr,
Yusuke Sato07447542015-06-25 14:39:19 -0700662 const ZipString* optional_prefix,
663 const ZipString* optional_suffix) {
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800664 ZipArchive* archive = reinterpret_cast<ZipArchive*>(handle);
Narayan Kamath7462f022013-11-21 13:05:04 +0000665
666 if (archive == NULL || archive->hash_table == NULL) {
667 ALOGW("Zip: Invalid ZipArchiveHandle");
668 return kInvalidHandle;
669 }
670
Yusuke Satof1d3d3b2015-06-25 14:09:00 -0700671 IterationHandle* cookie = new IterationHandle(optional_prefix, optional_suffix);
Narayan Kamath7462f022013-11-21 13:05:04 +0000672 cookie->position = 0;
Narayan Kamath7462f022013-11-21 13:05:04 +0000673 cookie->archive = archive;
Narayan Kamath7462f022013-11-21 13:05:04 +0000674
675 *cookie_ptr = cookie ;
676 return 0;
677}
678
Piotr Jastrzebski79c8b342014-08-08 14:02:17 +0100679void EndIteration(void* cookie) {
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100680 delete reinterpret_cast<IterationHandle*>(cookie);
Piotr Jastrzebski79c8b342014-08-08 14:02:17 +0100681}
682
Yusuke Sato07447542015-06-25 14:39:19 -0700683int32_t FindEntry(const ZipArchiveHandle handle, const ZipString& entryName,
Narayan Kamath7462f022013-11-21 13:05:04 +0000684 ZipEntry* data) {
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800685 const ZipArchive* archive = reinterpret_cast<ZipArchive*>(handle);
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100686 if (entryName.name_length == 0) {
687 ALOGW("Zip: Invalid filename %.*s", entryName.name_length, entryName.name);
Narayan Kamath7462f022013-11-21 13:05:04 +0000688 return kInvalidEntryName;
689 }
690
691 const int64_t ent = EntryToIndex(archive->hash_table,
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100692 archive->hash_table_size, entryName);
Narayan Kamath7462f022013-11-21 13:05:04 +0000693
694 if (ent < 0) {
Piotr Jastrzebskiecccc5a2014-08-11 16:35:11 +0100695 ALOGV("Zip: Could not find entry %.*s", entryName.name_length, entryName.name);
Narayan Kamath7462f022013-11-21 13:05:04 +0000696 return ent;
697 }
698
699 return FindEntry(archive, ent, data);
700}
701
Yusuke Sato07447542015-06-25 14:39:19 -0700702int32_t Next(void* cookie, ZipEntry* data, ZipString* name) {
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -0800703 IterationHandle* handle = reinterpret_cast<IterationHandle*>(cookie);
Narayan Kamath7462f022013-11-21 13:05:04 +0000704 if (handle == NULL) {
705 return kInvalidHandle;
706 }
707
708 ZipArchive* archive = handle->archive;
709 if (archive == NULL || archive->hash_table == NULL) {
710 ALOGW("Zip: Invalid ZipArchiveHandle");
711 return kInvalidHandle;
712 }
713
714 const uint32_t currentOffset = handle->position;
715 const uint32_t hash_table_length = archive->hash_table_size;
Yusuke Sato07447542015-06-25 14:39:19 -0700716 const ZipString* hash_table = archive->hash_table;
Narayan Kamath7462f022013-11-21 13:05:04 +0000717
718 for (uint32_t i = currentOffset; i < hash_table_length; ++i) {
719 if (hash_table[i].name != NULL &&
Yusuke Sato07447542015-06-25 14:39:19 -0700720 (handle->prefix.name_length == 0 ||
721 hash_table[i].StartsWith(handle->prefix)) &&
722 (handle->suffix.name_length == 0 ||
723 hash_table[i].EndsWith(handle->suffix))) {
Narayan Kamath7462f022013-11-21 13:05:04 +0000724 handle->position = (i + 1);
725 const int error = FindEntry(archive, i, data);
726 if (!error) {
727 name->name = hash_table[i].name;
728 name->name_length = hash_table[i].name_length;
729 }
730
731 return error;
732 }
733 }
734
735 handle->position = 0;
736 return kIterationEnd;
737}
738
Narayan Kamathf899bd52015-04-17 11:53:14 +0100739class Writer {
740 public:
741 virtual bool Append(uint8_t* buf, size_t buf_size) = 0;
742 virtual ~Writer() {}
743 protected:
744 Writer() = default;
745 private:
746 DISALLOW_COPY_AND_ASSIGN(Writer);
747};
748
749// A Writer that writes data to a fixed size memory region.
750// The size of the memory region must be equal to the total size of
751// the data appended to it.
752class MemoryWriter : public Writer {
753 public:
754 MemoryWriter(uint8_t* buf, size_t size) : Writer(),
755 buf_(buf), size_(size), bytes_written_(0) {
756 }
757
758 virtual bool Append(uint8_t* buf, size_t buf_size) override {
759 if (bytes_written_ + buf_size > size_) {
760 ALOGW("Zip: Unexpected size " ZD " (declared) vs " ZD " (actual)",
761 size_, bytes_written_ + buf_size);
762 return false;
763 }
764
765 memcpy(buf_ + bytes_written_, buf, buf_size);
766 bytes_written_ += buf_size;
767 return true;
768 }
769
770 private:
771 uint8_t* const buf_;
772 const size_t size_;
773 size_t bytes_written_;
774};
775
776// A Writer that appends data to a file |fd| at its current position.
777// The file will be truncated to the end of the written data.
778class FileWriter : public Writer {
779 public:
780
781 // Creates a FileWriter for |fd| and prepare to write |entry| to it,
782 // guaranteeing that the file descriptor is valid and that there's enough
783 // space on the volume to write out the entry completely and that the file
Tao Baoa456c212016-11-15 10:08:07 -0800784 // is truncated to the correct length (no truncation if |fd| references a
785 // block device).
Narayan Kamathf899bd52015-04-17 11:53:14 +0100786 //
787 // Returns a valid FileWriter on success, |nullptr| if an error occurred.
788 static std::unique_ptr<FileWriter> Create(int fd, const ZipEntry* entry) {
789 const uint32_t declared_length = entry->uncompressed_length;
790 const off64_t current_offset = lseek64(fd, 0, SEEK_CUR);
791 if (current_offset == -1) {
792 ALOGW("Zip: unable to seek to current location on fd %d: %s", fd, strerror(errno));
793 return nullptr;
794 }
795
796 int result = 0;
797#if defined(__linux__)
798 if (declared_length > 0) {
799 // Make sure we have enough space on the volume to extract the compressed
800 // entry. Note that the call to ftruncate below will change the file size but
801 // will not allocate space on disk and this call to fallocate will not
802 // change the file size.
Badhri Jagan Sridharana68d0d12015-06-02 14:47:57 -0700803 // Note: fallocate is only supported by the following filesystems -
804 // btrfs, ext4, ocfs2, and xfs. Therefore fallocate might fail with
805 // EOPNOTSUPP error when issued in other filesystems.
806 // Hence, check for the return error code before concluding that the
807 // disk does not have enough space.
Narayan Kamathf899bd52015-04-17 11:53:14 +0100808 result = TEMP_FAILURE_RETRY(fallocate(fd, 0, current_offset, declared_length));
Badhri Jagan Sridharana68d0d12015-06-02 14:47:57 -0700809 if (result == -1 && errno == ENOSPC) {
Narayan Kamathd5d7abe2016-08-10 12:24:05 +0100810 ALOGW("Zip: unable to allocate %" PRId64 " bytes at offset %" PRId64 " : %s",
811 static_cast<int64_t>(declared_length), static_cast<int64_t>(current_offset),
812 strerror(errno));
Narayan Kamathf899bd52015-04-17 11:53:14 +0100813 return std::unique_ptr<FileWriter>(nullptr);
814 }
815 }
816#endif // __linux__
817
Tao Baoa456c212016-11-15 10:08:07 -0800818 struct stat sb;
819 if (fstat(fd, &sb) == -1) {
820 ALOGW("Zip: unable to fstat file: %s", strerror(errno));
Narayan Kamathf899bd52015-04-17 11:53:14 +0100821 return std::unique_ptr<FileWriter>(nullptr);
822 }
823
Tao Baoa456c212016-11-15 10:08:07 -0800824 // Block device doesn't support ftruncate(2).
825 if (!S_ISBLK(sb.st_mode)) {
826 result = TEMP_FAILURE_RETRY(ftruncate(fd, declared_length + current_offset));
827 if (result == -1) {
828 ALOGW("Zip: unable to truncate file to %" PRId64 ": %s",
829 static_cast<int64_t>(declared_length + current_offset), strerror(errno));
830 return std::unique_ptr<FileWriter>(nullptr);
831 }
832 }
833
Narayan Kamathf899bd52015-04-17 11:53:14 +0100834 return std::unique_ptr<FileWriter>(new FileWriter(fd, declared_length));
835 }
836
837 virtual bool Append(uint8_t* buf, size_t buf_size) override {
838 if (total_bytes_written_ + buf_size > declared_length_) {
839 ALOGW("Zip: Unexpected size " ZD " (declared) vs " ZD " (actual)",
840 declared_length_, total_bytes_written_ + buf_size);
841 return false;
842 }
843
Narayan Kamathe97e66e2015-04-27 16:25:53 +0100844 const bool result = android::base::WriteFully(fd_, buf, buf_size);
845 if (result) {
846 total_bytes_written_ += buf_size;
847 } else {
848 ALOGW("Zip: unable to write " ZD " bytes to file; %s", buf_size, strerror(errno));
Narayan Kamathf899bd52015-04-17 11:53:14 +0100849 }
850
Narayan Kamathe97e66e2015-04-27 16:25:53 +0100851 return result;
Narayan Kamathf899bd52015-04-17 11:53:14 +0100852 }
853 private:
854 FileWriter(const int fd, const size_t declared_length) :
855 Writer(),
856 fd_(fd),
857 declared_length_(declared_length),
858 total_bytes_written_(0) {
859 }
860
861 const int fd_;
862 const size_t declared_length_;
863 size_t total_bytes_written_;
864};
865
Dmitriy Ivanovf94e1592015-03-06 13:27:59 -0800866// This method is using libz macros with old-style-casts
867#pragma GCC diagnostic push
868#pragma GCC diagnostic ignored "-Wold-style-cast"
869static inline int zlib_inflateInit2(z_stream* stream, int window_bits) {
870 return inflateInit2(stream, window_bits);
871}
872#pragma GCC diagnostic pop
873
Tianjie Xu18c25922016-09-29 15:27:41 -0700874static int32_t InflateEntryToWriter(MappedZipFile& mapped_zip, const ZipEntry* entry,
Narayan Kamathf899bd52015-04-17 11:53:14 +0100875 Writer* writer, uint64_t* crc_out) {
Dmitriy Ivanovedbabfe2015-03-12 09:58:15 -0700876 const size_t kBufSize = 32768;
877 std::vector<uint8_t> read_buf(kBufSize);
878 std::vector<uint8_t> write_buf(kBufSize);
Narayan Kamath7462f022013-11-21 13:05:04 +0000879 z_stream zstream;
880 int zerr;
881
882 /*
883 * Initialize the zlib stream struct.
884 */
885 memset(&zstream, 0, sizeof(zstream));
886 zstream.zalloc = Z_NULL;
887 zstream.zfree = Z_NULL;
888 zstream.opaque = Z_NULL;
889 zstream.next_in = NULL;
890 zstream.avail_in = 0;
Dmitriy Ivanovedbabfe2015-03-12 09:58:15 -0700891 zstream.next_out = &write_buf[0];
Narayan Kamath7462f022013-11-21 13:05:04 +0000892 zstream.avail_out = kBufSize;
893 zstream.data_type = Z_UNKNOWN;
894
895 /*
896 * Use the undocumented "negative window bits" feature to tell zlib
897 * that there's no zlib header waiting for it.
898 */
Dmitriy Ivanovf94e1592015-03-06 13:27:59 -0800899 zerr = zlib_inflateInit2(&zstream, -MAX_WBITS);
Narayan Kamath7462f022013-11-21 13:05:04 +0000900 if (zerr != Z_OK) {
901 if (zerr == Z_VERSION_ERROR) {
902 ALOGE("Installed zlib is not compatible with linked version (%s)",
903 ZLIB_VERSION);
904 } else {
905 ALOGW("Call to inflateInit2 failed (zerr=%d)", zerr);
906 }
907
908 return kZlibError;
909 }
910
Dmitriy Ivanov1f741e52015-03-06 14:26:37 -0800911 auto zstream_deleter = [](z_stream* stream) {
912 inflateEnd(stream); /* free up any allocated structures */
913 };
914
915 std::unique_ptr<z_stream, decltype(zstream_deleter)> zstream_guard(&zstream, zstream_deleter);
916
Narayan Kamath7462f022013-11-21 13:05:04 +0000917 const uint32_t uncompressed_length = entry->uncompressed_length;
918
919 uint32_t compressed_length = entry->compressed_length;
Narayan Kamath7462f022013-11-21 13:05:04 +0000920 do {
921 /* read as much as we can */
922 if (zstream.avail_in == 0) {
Yabin Cuib2a77002016-02-08 16:26:33 -0800923 const size_t getSize = (compressed_length > kBufSize) ? kBufSize : compressed_length;
Tianjie Xu18c25922016-09-29 15:27:41 -0700924 if (!mapped_zip.ReadData(read_buf.data(), getSize)) {
Yabin Cuib2a77002016-02-08 16:26:33 -0800925 ALOGW("Zip: inflate read failed, getSize = %zu: %s", getSize, strerror(errno));
Dmitriy Ivanov1f741e52015-03-06 14:26:37 -0800926 return kIoError;
Narayan Kamath7462f022013-11-21 13:05:04 +0000927 }
928
929 compressed_length -= getSize;
930
Dmitriy Ivanovedbabfe2015-03-12 09:58:15 -0700931 zstream.next_in = &read_buf[0];
Narayan Kamath7462f022013-11-21 13:05:04 +0000932 zstream.avail_in = getSize;
933 }
934
935 /* uncompress the data */
936 zerr = inflate(&zstream, Z_NO_FLUSH);
937 if (zerr != Z_OK && zerr != Z_STREAM_END) {
938 ALOGW("Zip: inflate zerr=%d (nIn=%p aIn=%u nOut=%p aOut=%u)",
939 zerr, zstream.next_in, zstream.avail_in,
940 zstream.next_out, zstream.avail_out);
Dmitriy Ivanov1f741e52015-03-06 14:26:37 -0800941 return kZlibError;
Narayan Kamath7462f022013-11-21 13:05:04 +0000942 }
943
944 /* write when we're full or when we're done */
945 if (zstream.avail_out == 0 ||
946 (zerr == Z_STREAM_END && zstream.avail_out != kBufSize)) {
Dmitriy Ivanovedbabfe2015-03-12 09:58:15 -0700947 const size_t write_size = zstream.next_out - &write_buf[0];
Narayan Kamathf899bd52015-04-17 11:53:14 +0100948 if (!writer->Append(&write_buf[0], write_size)) {
949 // The file might have declared a bogus length.
950 return kInconsistentInformation;
Narayan Kamath7462f022013-11-21 13:05:04 +0000951 }
Narayan Kamath7462f022013-11-21 13:05:04 +0000952
Dmitriy Ivanovedbabfe2015-03-12 09:58:15 -0700953 zstream.next_out = &write_buf[0];
Narayan Kamath7462f022013-11-21 13:05:04 +0000954 zstream.avail_out = kBufSize;
955 }
956 } while (zerr == Z_OK);
957
958 assert(zerr == Z_STREAM_END); /* other errors should've been caught */
959
960 // stream.adler holds the crc32 value for such streams.
961 *crc_out = zstream.adler;
962
963 if (zstream.total_out != uncompressed_length || compressed_length != 0) {
Mark Salyzyn088bf902014-05-08 16:02:20 -0700964 ALOGW("Zip: size mismatch on inflated file (%lu vs %" PRIu32 ")",
Narayan Kamath7462f022013-11-21 13:05:04 +0000965 zstream.total_out, uncompressed_length);
Dmitriy Ivanov1f741e52015-03-06 14:26:37 -0800966 return kInconsistentInformation;
Narayan Kamath7462f022013-11-21 13:05:04 +0000967 }
968
Dmitriy Ivanov1f741e52015-03-06 14:26:37 -0800969 return 0;
Narayan Kamath7462f022013-11-21 13:05:04 +0000970}
971
Tianjie Xu18c25922016-09-29 15:27:41 -0700972static int32_t CopyEntryToWriter(MappedZipFile& mapped_zip, const ZipEntry* entry, Writer* writer,
Narayan Kamathf899bd52015-04-17 11:53:14 +0100973 uint64_t *crc_out) {
974 static const uint32_t kBufSize = 32768;
975 std::vector<uint8_t> buf(kBufSize);
976
977 const uint32_t length = entry->uncompressed_length;
978 uint32_t count = 0;
979 uint64_t crc = 0;
980 while (count < length) {
981 uint32_t remaining = length - count;
982
983 // Safe conversion because kBufSize is narrow enough for a 32 bit signed
984 // value.
Yabin Cuib2a77002016-02-08 16:26:33 -0800985 const size_t block_size = (remaining > kBufSize) ? kBufSize : remaining;
Tianjie Xu18c25922016-09-29 15:27:41 -0700986 if (!mapped_zip.ReadData(buf.data(), block_size)) {
Yabin Cuib2a77002016-02-08 16:26:33 -0800987 ALOGW("CopyFileToFile: copy read failed, block_size = %zu: %s", block_size, strerror(errno));
Narayan Kamathf899bd52015-04-17 11:53:14 +0100988 return kIoError;
989 }
990
991 if (!writer->Append(&buf[0], block_size)) {
992 return kIoError;
993 }
994 crc = crc32(crc, &buf[0], block_size);
995 count += block_size;
996 }
997
998 *crc_out = crc;
999
1000 return 0;
1001}
1002
1003int32_t ExtractToWriter(ZipArchiveHandle handle,
1004 ZipEntry* entry, Writer* writer) {
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -08001005 ZipArchive* archive = reinterpret_cast<ZipArchive*>(handle);
Narayan Kamath7462f022013-11-21 13:05:04 +00001006 const uint16_t method = entry->method;
1007 off64_t data_offset = entry->offset;
1008
Tianjie Xu18c25922016-09-29 15:27:41 -07001009 if (!archive->mapped_zip.SeekToOffset(data_offset)) {
Dmitriy Ivanovf4cb8e22015-03-06 10:50:56 -08001010 ALOGW("Zip: lseek to data at %" PRId64 " failed", static_cast<int64_t>(data_offset));
Narayan Kamath7462f022013-11-21 13:05:04 +00001011 return kIoError;
1012 }
1013
1014 // this should default to kUnknownCompressionMethod.
1015 int32_t return_value = -1;
1016 uint64_t crc = 0;
1017 if (method == kCompressStored) {
Tianjie Xu18c25922016-09-29 15:27:41 -07001018 return_value = CopyEntryToWriter(archive->mapped_zip, entry, writer, &crc);
Narayan Kamath7462f022013-11-21 13:05:04 +00001019 } else if (method == kCompressDeflated) {
Tianjie Xu18c25922016-09-29 15:27:41 -07001020 return_value = InflateEntryToWriter(archive->mapped_zip, entry, writer, &crc);
Narayan Kamath7462f022013-11-21 13:05:04 +00001021 }
1022
1023 if (!return_value && entry->has_data_descriptor) {
Tianjie Xu18c25922016-09-29 15:27:41 -07001024 return_value = UpdateEntryFromDataDescriptor(archive->mapped_zip, entry);
Narayan Kamath7462f022013-11-21 13:05:04 +00001025 if (return_value) {
1026 return return_value;
1027 }
1028 }
1029
1030 // TODO: Fix this check by passing the right flags to inflate2 so that
1031 // it calculates the CRC for us.
1032 if (entry->crc32 != crc && false) {
Mark Salyzyn088bf902014-05-08 16:02:20 -07001033 ALOGW("Zip: crc mismatch: expected %" PRIu32 ", was %" PRIu64, entry->crc32, crc);
Narayan Kamath7462f022013-11-21 13:05:04 +00001034 return kInconsistentInformation;
1035 }
1036
1037 return return_value;
1038}
1039
Narayan Kamathf899bd52015-04-17 11:53:14 +01001040int32_t ExtractToMemory(ZipArchiveHandle handle, ZipEntry* entry,
1041 uint8_t* begin, uint32_t size) {
1042 std::unique_ptr<Writer> writer(new MemoryWriter(begin, size));
1043 return ExtractToWriter(handle, entry, writer.get());
1044}
1045
Narayan Kamath7462f022013-11-21 13:05:04 +00001046int32_t ExtractEntryToFile(ZipArchiveHandle handle,
1047 ZipEntry* entry, int fd) {
Narayan Kamathf899bd52015-04-17 11:53:14 +01001048 std::unique_ptr<Writer> writer(FileWriter::Create(fd, entry));
1049 if (writer.get() == nullptr) {
Narayan Kamath7462f022013-11-21 13:05:04 +00001050 return kIoError;
1051 }
1052
Narayan Kamathf899bd52015-04-17 11:53:14 +01001053 return ExtractToWriter(handle, entry, writer.get());
Narayan Kamath7462f022013-11-21 13:05:04 +00001054}
1055
1056const char* ErrorCodeString(int32_t error_code) {
1057 if (error_code > kErrorMessageLowerBound && error_code < kErrorMessageUpperBound) {
1058 return kErrorMessages[error_code * -1];
1059 }
1060
1061 return kErrorMessages[0];
1062}
1063
1064int GetFileDescriptor(const ZipArchiveHandle handle) {
Tianjie Xu18c25922016-09-29 15:27:41 -07001065 return reinterpret_cast<ZipArchive*>(handle)->mapped_zip.GetFileDescriptor();
Narayan Kamath7462f022013-11-21 13:05:04 +00001066}
Colin Cross7c6c7f02016-09-16 10:15:51 -07001067
1068ZipString::ZipString(const char* entry_name)
1069 : name(reinterpret_cast<const uint8_t*>(entry_name)) {
1070 size_t len = strlen(entry_name);
1071 CHECK_LE(len, static_cast<size_t>(UINT16_MAX));
1072 name_length = static_cast<uint16_t>(len);
1073}
Tianjie Xu18c25922016-09-29 15:27:41 -07001074
1075#if !defined(_WIN32)
1076class ProcessWriter : public Writer {
1077 public:
1078 ProcessWriter(ProcessZipEntryFunction func, void* cookie) : Writer(),
1079 proc_function_(func),
1080 cookie_(cookie) {
1081 }
1082
1083 virtual bool Append(uint8_t* buf, size_t buf_size) override {
1084 return proc_function_(buf, buf_size, cookie_);
1085 }
1086
1087 private:
1088 ProcessZipEntryFunction proc_function_;
1089 void* cookie_;
1090};
1091
1092int32_t ProcessZipEntryContents(ZipArchiveHandle handle, ZipEntry* entry,
1093 ProcessZipEntryFunction func, void* cookie) {
1094 ProcessWriter writer(func, cookie);
1095 return ExtractToWriter(handle, entry, &writer);
1096}
1097
1098#endif //!defined(_WIN32)
1099
1100int MappedZipFile::GetFileDescriptor() const {
1101 if (!has_fd_) {
1102 ALOGW("Zip: MappedZipFile doesn't have a file descriptor.");
1103 return -1;
1104 }
1105 return fd_;
1106}
1107
1108void* MappedZipFile::GetBasePtr() const {
1109 if (has_fd_) {
1110 ALOGW("Zip: MappedZipFile doesn't have a base pointer.");
1111 return nullptr;
1112 }
1113 return base_ptr_;
1114}
1115
1116off64_t MappedZipFile::GetFileLength() const {
1117 if (has_fd_) {
1118 off64_t result = lseek64(fd_, 0, SEEK_END);
1119 if (result == -1) {
1120 ALOGE("Zip: lseek on fd %d failed: %s", fd_, strerror(errno));
1121 }
1122 return result;
1123 } else {
1124 if (base_ptr_ == nullptr) {
1125 ALOGE("Zip: invalid file map\n");
1126 return -1;
1127 }
1128 return static_cast<off64_t>(data_length_);
1129 }
1130}
1131
1132bool MappedZipFile::SeekToOffset(off64_t offset) {
1133 if (has_fd_) {
1134 if (lseek64(fd_, offset, SEEK_SET) != offset) {
1135 ALOGE("Zip: lseek to %" PRId64 " failed: %s\n", offset, strerror(errno));
1136 return false;
1137 }
1138 return true;
1139 } else {
1140 if (offset < 0 || offset > static_cast<off64_t>(data_length_)) {
1141 ALOGE("Zip: invalid offset: %" PRId64 ", data length: %" PRId64 "\n" , offset,
1142 data_length_);
1143 return false;
1144 }
1145
1146 read_pos_ = offset;
1147 return true;
1148 }
1149}
1150
1151bool MappedZipFile::ReadData(uint8_t* buffer, size_t read_amount) {
1152 if (has_fd_) {
1153 if(!android::base::ReadFully(fd_, buffer, read_amount)) {
1154 ALOGE("Zip: read from %d failed\n", fd_);
1155 return false;
1156 }
1157 } else {
1158 memcpy(buffer, static_cast<uint8_t*>(base_ptr_) + read_pos_, read_amount);
1159 read_pos_ += read_amount;
1160 }
1161 return true;
1162}
1163
1164// Attempts to read |len| bytes into |buf| at offset |off|.
1165bool MappedZipFile::ReadAtOffset(uint8_t* buf, size_t len, off64_t off) {
1166#if !defined(_WIN32)
1167 if (has_fd_) {
1168 if (static_cast<size_t>(TEMP_FAILURE_RETRY(pread64(fd_, buf, len, off))) != len) {
1169 ALOGE("Zip: failed to read at offset %" PRId64 "\n", off);
1170 return false;
1171 }
1172 return true;
1173 }
1174#endif
1175 if (!SeekToOffset(off)) {
1176 return false;
1177 }
1178 return ReadData(buf, len);
1179
1180}
1181
1182void CentralDirectory::Initialize(void* map_base_ptr, off64_t cd_start_offset, size_t cd_size) {
1183 base_ptr_ = static_cast<uint8_t*>(map_base_ptr) + cd_start_offset;
1184 length_ = cd_size;
1185}
1186
1187bool ZipArchive::InitializeCentralDirectory(const char* debug_file_name, off64_t cd_start_offset,
1188 size_t cd_size) {
1189 if (mapped_zip.HasFd()) {
1190 if (!directory_map->create(debug_file_name, mapped_zip.GetFileDescriptor(),
1191 cd_start_offset, cd_size, true /* read only */)) {
1192 return false;
1193 }
1194
1195 CHECK_EQ(directory_map->getDataLength(), cd_size);
1196 central_directory.Initialize(directory_map->getDataPtr(), 0/*offset*/, cd_size);
1197 } else {
1198 if (mapped_zip.GetBasePtr() == nullptr) {
1199 ALOGE("Zip: Failed to map central directory, bad mapped_zip base pointer\n");
1200 return false;
1201 }
1202 if (static_cast<off64_t>(cd_start_offset) + static_cast<off64_t>(cd_size) >
1203 mapped_zip.GetFileLength()) {
1204 ALOGE("Zip: Failed to map central directory, offset exceeds mapped memory region ("
1205 "start_offset %" PRId64 ", cd_size %zu, mapped_region_size %" PRId64 ")",
1206 static_cast<int64_t>(cd_start_offset), cd_size, mapped_zip.GetFileLength());
1207 return false;
1208 }
1209
1210 central_directory.Initialize(mapped_zip.GetBasePtr(), cd_start_offset, cd_size);
1211 }
1212 return true;
1213}