• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 /*
2  * Copyright (C) 2007 The Android Open Source Project
3  *
4  * Licensed under the Apache License, Version 2.0 (the "License");
5  * you may not use this file except in compliance with the License.
6  * You may obtain a copy of the License at
7  *
8  *      http://www.apache.org/licenses/LICENSE-2.0
9  *
10  * Unless required by applicable law or agreed to in writing, software
11  * distributed under the License is distributed on an "AS IS" BASIS,
12  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13  * See the License for the specific language governing permissions and
14  * limitations under the License.
15  */
16 
17 //
18 // Read-only access to Zip archives, with minimal heap allocation.
19 //
20 #define LOG_TAG "zipro"
21 //#define LOG_NDEBUG 0
22 #include <utils/Log.h>
23 #include <utils/ZipFileRO.h>
24 #include <utils/misc.h>
25 #include <utils/threads.h>
26 
27 #include <zlib.h>
28 
29 #include <string.h>
30 #include <fcntl.h>
31 #include <errno.h>
32 #include <assert.h>
33 #include <unistd.h>
34 
35 #if HAVE_PRINTF_ZD
36 #  define ZD "%zd"
37 #  define ZD_TYPE ssize_t
38 #else
39 #  define ZD "%ld"
40 #  define ZD_TYPE long
41 #endif
42 
43 /*
44  * We must open binary files using open(path, ... | O_BINARY) under Windows.
45  * Otherwise strange read errors will happen.
46  */
47 #ifndef O_BINARY
48 #  define O_BINARY  0
49 #endif
50 
51 /*
52  * TEMP_FAILURE_RETRY is defined by some, but not all, versions of
53  * <unistd.h>. (Alas, it is not as standard as we'd hoped!) So, if it's
54  * not already defined, then define it here.
55  */
56 #ifndef TEMP_FAILURE_RETRY
57 /* Used to retry syscalls that can return EINTR. */
58 #define TEMP_FAILURE_RETRY(exp) ({         \
59     typeof (exp) _rc;                      \
60     do {                                   \
61         _rc = (exp);                       \
62     } while (_rc == -1 && errno == EINTR); \
63     _rc; })
64 #endif
65 
66 using namespace android;
67 
68 /*
69  * Zip file constants.
70  */
71 #define kEOCDSignature      0x06054b50
72 #define kEOCDLen            22
73 #define kEOCDNumEntries     8               // offset to #of entries in file
74 #define kEOCDSize           12              // size of the central directory
75 #define kEOCDFileOffset     16              // offset to central directory
76 
77 #define kMaxCommentLen      65535           // longest possible in ushort
78 #define kMaxEOCDSearch      (kMaxCommentLen + kEOCDLen)
79 
80 #define kLFHSignature       0x04034b50
81 #define kLFHLen             30              // excluding variable-len fields
82 #define kLFHNameLen         26              // offset to filename length
83 #define kLFHExtraLen        28              // offset to extra length
84 
85 #define kCDESignature       0x02014b50
86 #define kCDELen             46              // excluding variable-len fields
87 #define kCDEMethod          10              // offset to compression method
88 #define kCDEModWhen         12              // offset to modification timestamp
89 #define kCDECRC             16              // offset to entry CRC
90 #define kCDECompLen         20              // offset to compressed length
91 #define kCDEUncompLen       24              // offset to uncompressed length
92 #define kCDENameLen         28              // offset to filename length
93 #define kCDEExtraLen        30              // offset to extra length
94 #define kCDECommentLen      32              // offset to comment length
95 #define kCDELocalOffset     42              // offset to local hdr
96 
97 /*
98  * The values we return for ZipEntryRO use 0 as an invalid value, so we
99  * want to adjust the hash table index by a fixed amount.  Using a large
100  * value helps insure that people don't mix & match arguments, e.g. to
101  * findEntryByIndex().
102  */
103 #define kZipEntryAdj        10000
104 
~ZipFileRO()105 ZipFileRO::~ZipFileRO() {
106     free(mHashTable);
107     if (mDirectoryMap)
108         mDirectoryMap->release();
109     if (mFd >= 0)
110         TEMP_FAILURE_RETRY(close(mFd));
111     if (mFileName)
112         free(mFileName);
113 }
114 
115 /*
116  * Convert a ZipEntryRO to a hash table index, verifying that it's in a
117  * valid range.
118  */
entryToIndex(const ZipEntryRO entry) const119 int ZipFileRO::entryToIndex(const ZipEntryRO entry) const
120 {
121     long ent = ((intptr_t) entry) - kZipEntryAdj;
122     if (ent < 0 || ent >= mHashTableSize || mHashTable[ent].name == NULL) {
123         ALOGW("Invalid ZipEntryRO %p (%ld)\n", entry, ent);
124         return -1;
125     }
126     return ent;
127 }
128 
129 
130 /*
131  * Open the specified file read-only.  We memory-map the entire thing and
132  * close the file before returning.
133  */
open(const char * zipFileName)134 status_t ZipFileRO::open(const char* zipFileName)
135 {
136     int fd = -1;
137 
138     assert(mDirectoryMap == NULL);
139 
140     /*
141      * Open and map the specified file.
142      */
143     fd = TEMP_FAILURE_RETRY(::open(zipFileName, O_RDONLY | O_BINARY));
144     if (fd < 0) {
145         ALOGW("Unable to open zip '%s': %s\n", zipFileName, strerror(errno));
146         return NAME_NOT_FOUND;
147     }
148 
149     mFileLength = lseek64(fd, 0, SEEK_END);
150     if (mFileLength < kEOCDLen) {
151         TEMP_FAILURE_RETRY(close(fd));
152         return UNKNOWN_ERROR;
153     }
154 
155     if (mFileName != NULL) {
156         free(mFileName);
157     }
158     mFileName = strdup(zipFileName);
159 
160     mFd = fd;
161 
162     /*
163      * Find the Central Directory and store its size and number of entries.
164      */
165     if (!mapCentralDirectory()) {
166         goto bail;
167     }
168 
169     /*
170      * Verify Central Directory and create data structures for fast access.
171      */
172     if (!parseZipArchive()) {
173         goto bail;
174     }
175 
176     return OK;
177 
178 bail:
179     free(mFileName);
180     mFileName = NULL;
181     TEMP_FAILURE_RETRY(close(fd));
182     return UNKNOWN_ERROR;
183 }
184 
185 /*
186  * Parse the Zip archive, verifying its contents and initializing internal
187  * data structures.
188  */
mapCentralDirectory(void)189 bool ZipFileRO::mapCentralDirectory(void)
190 {
191     ssize_t readAmount = kMaxEOCDSearch;
192     if (readAmount > (ssize_t) mFileLength)
193         readAmount = mFileLength;
194 
195     unsigned char* scanBuf = (unsigned char*) malloc(readAmount);
196     if (scanBuf == NULL) {
197         ALOGW("couldn't allocate scanBuf: %s", strerror(errno));
198         free(scanBuf);
199         return false;
200     }
201 
202     /*
203      * Make sure this is a Zip archive.
204      */
205     if (lseek64(mFd, 0, SEEK_SET) != 0) {
206         ALOGW("seek to start failed: %s", strerror(errno));
207         free(scanBuf);
208         return false;
209     }
210 
211     ssize_t actual = TEMP_FAILURE_RETRY(read(mFd, scanBuf, sizeof(int32_t)));
212     if (actual != (ssize_t) sizeof(int32_t)) {
213         ALOGI("couldn't read first signature from zip archive: %s", strerror(errno));
214         free(scanBuf);
215         return false;
216     }
217 
218     {
219         unsigned int header = get4LE(scanBuf);
220         if (header == kEOCDSignature) {
221             ALOGI("Found Zip archive, but it looks empty\n");
222             free(scanBuf);
223             return false;
224         } else if (header != kLFHSignature) {
225             ALOGV("Not a Zip archive (found 0x%08x)\n", header);
226             free(scanBuf);
227             return false;
228         }
229     }
230 
231     /*
232      * Perform the traditional EOCD snipe hunt.
233      *
234      * We're searching for the End of Central Directory magic number,
235      * which appears at the start of the EOCD block.  It's followed by
236      * 18 bytes of EOCD stuff and up to 64KB of archive comment.  We
237      * need to read the last part of the file into a buffer, dig through
238      * it to find the magic number, parse some values out, and use those
239      * to determine the extent of the CD.
240      *
241      * We start by pulling in the last part of the file.
242      */
243     off64_t searchStart = mFileLength - readAmount;
244 
245     if (lseek64(mFd, searchStart, SEEK_SET) != searchStart) {
246         ALOGW("seek %ld failed: %s\n",  (long) searchStart, strerror(errno));
247         free(scanBuf);
248         return false;
249     }
250     actual = TEMP_FAILURE_RETRY(read(mFd, scanBuf, readAmount));
251     if (actual != (ssize_t) readAmount) {
252         ALOGW("Zip: read " ZD ", expected " ZD ". Failed: %s\n",
253             (ZD_TYPE) actual, (ZD_TYPE) readAmount, strerror(errno));
254         free(scanBuf);
255         return false;
256     }
257 
258     /*
259      * Scan backward for the EOCD magic.  In an archive without a trailing
260      * comment, we'll find it on the first try.  (We may want to consider
261      * doing an initial minimal read; if we don't find it, retry with a
262      * second read as above.)
263      */
264     int i;
265     for (i = readAmount - kEOCDLen; i >= 0; i--) {
266         if (scanBuf[i] == 0x50 && get4LE(&scanBuf[i]) == kEOCDSignature) {
267             ALOGV("+++ Found EOCD at buf+%d\n", i);
268             break;
269         }
270     }
271     if (i < 0) {
272         ALOGD("Zip: EOCD not found, %s is not zip\n", mFileName);
273         free(scanBuf);
274         return false;
275     }
276 
277     off64_t eocdOffset = searchStart + i;
278     const unsigned char* eocdPtr = scanBuf + i;
279 
280     assert(eocdOffset < mFileLength);
281 
282     /*
283      * Grab the CD offset and size, and the number of entries in the
284      * archive. After that, we can release our EOCD hunt buffer.
285      */
286     unsigned int numEntries = get2LE(eocdPtr + kEOCDNumEntries);
287     unsigned int dirSize = get4LE(eocdPtr + kEOCDSize);
288     unsigned int dirOffset = get4LE(eocdPtr + kEOCDFileOffset);
289     free(scanBuf);
290 
291     // Verify that they look reasonable.
292     if ((long long) dirOffset + (long long) dirSize > (long long) eocdOffset) {
293         ALOGW("bad offsets (dir %ld, size %u, eocd %ld)\n",
294             (long) dirOffset, dirSize, (long) eocdOffset);
295         return false;
296     }
297     if (numEntries == 0) {
298         ALOGW("empty archive?\n");
299         return false;
300     }
301 
302     ALOGV("+++ numEntries=%d dirSize=%d dirOffset=%d\n",
303         numEntries, dirSize, dirOffset);
304 
305     mDirectoryMap = new FileMap();
306     if (mDirectoryMap == NULL) {
307         ALOGW("Unable to create directory map: %s", strerror(errno));
308         return false;
309     }
310 
311     if (!mDirectoryMap->create(mFileName, mFd, dirOffset, dirSize, true)) {
312         ALOGW("Unable to map '%s' (" ZD " to " ZD "): %s\n", mFileName,
313                 (ZD_TYPE) dirOffset, (ZD_TYPE) (dirOffset + dirSize), strerror(errno));
314         return false;
315     }
316 
317     mNumEntries = numEntries;
318     mDirectoryOffset = dirOffset;
319 
320     return true;
321 }
322 
323 
324 /*
325  * Round up to the next highest power of 2.
326  *
327  * Found on http://graphics.stanford.edu/~seander/bithacks.html.
328  */
roundUpPower2(unsigned int val)329 static unsigned int roundUpPower2(unsigned int val)
330 {
331     val--;
332     val |= val >> 1;
333     val |= val >> 2;
334     val |= val >> 4;
335     val |= val >> 8;
336     val |= val >> 16;
337     val++;
338 
339     return val;
340 }
341 
parseZipArchive(void)342 bool ZipFileRO::parseZipArchive(void)
343 {
344     bool result = false;
345     const unsigned char* cdPtr = (const unsigned char*) mDirectoryMap->getDataPtr();
346     size_t cdLength = mDirectoryMap->getDataLength();
347     int numEntries = mNumEntries;
348 
349     /*
350      * Create hash table.  We have a minimum 75% load factor, possibly as
351      * low as 50% after we round off to a power of 2.
352      */
353     mHashTableSize = roundUpPower2(1 + (numEntries * 4) / 3);
354     mHashTable = (HashEntry*) calloc(mHashTableSize, sizeof(HashEntry));
355 
356     /*
357      * Walk through the central directory, adding entries to the hash
358      * table.
359      */
360     const unsigned char* ptr = cdPtr;
361     for (int i = 0; i < numEntries; i++) {
362         if (get4LE(ptr) != kCDESignature) {
363             ALOGW("Missed a central dir sig (at %d)\n", i);
364             goto bail;
365         }
366         if (ptr + kCDELen > cdPtr + cdLength) {
367             ALOGW("Ran off the end (at %d)\n", i);
368             goto bail;
369         }
370 
371         long localHdrOffset = (long) get4LE(ptr + kCDELocalOffset);
372         if (localHdrOffset >= mDirectoryOffset) {
373             ALOGW("bad LFH offset %ld at entry %d\n", localHdrOffset, i);
374             goto bail;
375         }
376 
377         unsigned int fileNameLen, extraLen, commentLen, hash;
378 
379         fileNameLen = get2LE(ptr + kCDENameLen);
380         extraLen = get2LE(ptr + kCDEExtraLen);
381         commentLen = get2LE(ptr + kCDECommentLen);
382 
383         /* add the CDE filename to the hash table */
384         hash = computeHash((const char*)ptr + kCDELen, fileNameLen);
385         addToHash((const char*)ptr + kCDELen, fileNameLen, hash);
386 
387         ptr += kCDELen + fileNameLen + extraLen + commentLen;
388         if ((size_t)(ptr - cdPtr) > cdLength) {
389             ALOGW("bad CD advance (%d vs " ZD ") at entry %d\n",
390                 (int) (ptr - cdPtr), (ZD_TYPE) cdLength, i);
391             goto bail;
392         }
393     }
394     ALOGV("+++ zip good scan %d entries\n", numEntries);
395     result = true;
396 
397 bail:
398     return result;
399 }
400 
401 /*
402  * Simple string hash function for non-null-terminated strings.
403  */
computeHash(const char * str,int len)404 /*static*/ unsigned int ZipFileRO::computeHash(const char* str, int len)
405 {
406     unsigned int hash = 0;
407 
408     while (len--)
409         hash = hash * 31 + *str++;
410 
411     return hash;
412 }
413 
414 /*
415  * Add a new entry to the hash table.
416  */
addToHash(const char * str,int strLen,unsigned int hash)417 void ZipFileRO::addToHash(const char* str, int strLen, unsigned int hash)
418 {
419     int ent = hash & (mHashTableSize-1);
420 
421     /*
422      * We over-allocate the table, so we're guaranteed to find an empty slot.
423      */
424     while (mHashTable[ent].name != NULL)
425         ent = (ent + 1) & (mHashTableSize-1);
426 
427     mHashTable[ent].name = str;
428     mHashTable[ent].nameLen = strLen;
429 }
430 
431 /*
432  * Find a matching entry.
433  *
434  * Returns NULL if not found.
435  */
findEntryByName(const char * fileName) const436 ZipEntryRO ZipFileRO::findEntryByName(const char* fileName) const
437 {
438     /*
439      * If the ZipFileRO instance is not initialized, the entry number will
440      * end up being garbage since mHashTableSize is -1.
441      */
442     if (mHashTableSize <= 0) {
443         return NULL;
444     }
445 
446     int nameLen = strlen(fileName);
447     unsigned int hash = computeHash(fileName, nameLen);
448     int ent = hash & (mHashTableSize-1);
449 
450     while (mHashTable[ent].name != NULL) {
451         if (mHashTable[ent].nameLen == nameLen &&
452             memcmp(mHashTable[ent].name, fileName, nameLen) == 0)
453         {
454             /* match */
455             return (ZipEntryRO)(long)(ent + kZipEntryAdj);
456         }
457 
458         ent = (ent + 1) & (mHashTableSize-1);
459     }
460 
461     return NULL;
462 }
463 
464 /*
465  * Find the Nth entry.
466  *
467  * This currently involves walking through the sparse hash table, counting
468  * non-empty entries.  If we need to speed this up we can either allocate
469  * a parallel lookup table or (perhaps better) provide an iterator interface.
470  */
findEntryByIndex(int idx) const471 ZipEntryRO ZipFileRO::findEntryByIndex(int idx) const
472 {
473     if (idx < 0 || idx >= mNumEntries) {
474         ALOGW("Invalid index %d\n", idx);
475         return NULL;
476     }
477 
478     for (int ent = 0; ent < mHashTableSize; ent++) {
479         if (mHashTable[ent].name != NULL) {
480             if (idx-- == 0)
481                 return (ZipEntryRO) (intptr_t)(ent + kZipEntryAdj);
482         }
483     }
484 
485     return NULL;
486 }
487 
488 /*
489  * Get the useful fields from the zip entry.
490  *
491  * Returns "false" if the offsets to the fields or the contents of the fields
492  * appear to be bogus.
493  */
getEntryInfo(ZipEntryRO entry,int * pMethod,size_t * pUncompLen,size_t * pCompLen,off64_t * pOffset,long * pModWhen,long * pCrc32) const494 bool ZipFileRO::getEntryInfo(ZipEntryRO entry, int* pMethod, size_t* pUncompLen,
495     size_t* pCompLen, off64_t* pOffset, long* pModWhen, long* pCrc32) const
496 {
497     bool ret = false;
498 
499     const int ent = entryToIndex(entry);
500     if (ent < 0)
501         return false;
502 
503     HashEntry hashEntry = mHashTable[ent];
504 
505     /*
506      * Recover the start of the central directory entry from the filename
507      * pointer.  The filename is the first entry past the fixed-size data,
508      * so we can just subtract back from that.
509      */
510     const unsigned char* ptr = (const unsigned char*) hashEntry.name;
511     off64_t cdOffset = mDirectoryOffset;
512 
513     ptr -= kCDELen;
514 
515     int method = get2LE(ptr + kCDEMethod);
516     if (pMethod != NULL)
517         *pMethod = method;
518 
519     if (pModWhen != NULL)
520         *pModWhen = get4LE(ptr + kCDEModWhen);
521     if (pCrc32 != NULL)
522         *pCrc32 = get4LE(ptr + kCDECRC);
523 
524     size_t compLen = get4LE(ptr + kCDECompLen);
525     if (pCompLen != NULL)
526         *pCompLen = compLen;
527     size_t uncompLen = get4LE(ptr + kCDEUncompLen);
528     if (pUncompLen != NULL)
529         *pUncompLen = uncompLen;
530 
531     /*
532      * If requested, determine the offset of the start of the data.  All we
533      * have is the offset to the Local File Header, which is variable size,
534      * so we have to read the contents of the struct to figure out where
535      * the actual data starts.
536      *
537      * We also need to make sure that the lengths are not so large that
538      * somebody trying to map the compressed or uncompressed data runs
539      * off the end of the mapped region.
540      *
541      * Note we don't verify compLen/uncompLen if they don't request the
542      * dataOffset, because dataOffset is expensive to determine.  However,
543      * if they don't have the file offset, they're not likely to be doing
544      * anything with the contents.
545      */
546     if (pOffset != NULL) {
547         long localHdrOffset = get4LE(ptr + kCDELocalOffset);
548         if (localHdrOffset + kLFHLen >= cdOffset) {
549             ALOGE("ERROR: bad local hdr offset in zip\n");
550             return false;
551         }
552 
553         unsigned char lfhBuf[kLFHLen];
554 
555 #ifdef HAVE_PREAD
556         /*
557          * This file descriptor might be from zygote's preloaded assets,
558          * so we need to do an pread64() instead of a lseek64() + read() to
559          * guarantee atomicity across the processes with the shared file
560          * descriptors.
561          */
562         ssize_t actual =
563                 TEMP_FAILURE_RETRY(pread64(mFd, lfhBuf, sizeof(lfhBuf), localHdrOffset));
564 
565         if (actual != sizeof(lfhBuf)) {
566             ALOGW("failed reading lfh from offset %ld\n", localHdrOffset);
567             return false;
568         }
569 
570         if (get4LE(lfhBuf) != kLFHSignature) {
571             ALOGW("didn't find signature at start of lfh; wanted: offset=%ld data=0x%08x; "
572                     "got: data=0x%08lx\n",
573                     localHdrOffset, kLFHSignature, get4LE(lfhBuf));
574             return false;
575         }
576 #else /* HAVE_PREAD */
577         /*
578          * For hosts don't have pread64() we cannot guarantee atomic reads from
579          * an offset in a file. Android should never run on those platforms.
580          * File descriptors inherited from a fork() share file offsets and
581          * there would be nothing to protect from two different processes
582          * calling lseek64() concurrently.
583          */
584 
585         {
586             AutoMutex _l(mFdLock);
587 
588             if (lseek64(mFd, localHdrOffset, SEEK_SET) != localHdrOffset) {
589                 ALOGW("failed seeking to lfh at offset %ld\n", localHdrOffset);
590                 return false;
591             }
592 
593             ssize_t actual =
594                     TEMP_FAILURE_RETRY(read(mFd, lfhBuf, sizeof(lfhBuf)));
595             if (actual != sizeof(lfhBuf)) {
596                 ALOGW("failed reading lfh from offset %ld\n", localHdrOffset);
597                 return false;
598             }
599 
600             if (get4LE(lfhBuf) != kLFHSignature) {
601                 off64_t actualOffset = lseek64(mFd, 0, SEEK_CUR);
602                 ALOGW("didn't find signature at start of lfh; wanted: offset=%ld data=0x%08x; "
603                         "got: offset=" ZD " data=0x%08lx\n",
604                         localHdrOffset, kLFHSignature, (ZD_TYPE) actualOffset, get4LE(lfhBuf));
605                 return false;
606             }
607         }
608 #endif /* HAVE_PREAD */
609 
610         off64_t dataOffset = localHdrOffset + kLFHLen
611             + get2LE(lfhBuf + kLFHNameLen) + get2LE(lfhBuf + kLFHExtraLen);
612         if (dataOffset >= cdOffset) {
613             ALOGW("bad data offset %ld in zip\n", (long) dataOffset);
614             return false;
615         }
616 
617         /* check lengths */
618         if ((off64_t)(dataOffset + compLen) > cdOffset) {
619             ALOGW("bad compressed length in zip (%ld + " ZD " > %ld)\n",
620                 (long) dataOffset, (ZD_TYPE) compLen, (long) cdOffset);
621             return false;
622         }
623 
624         if (method == kCompressStored &&
625             (off64_t)(dataOffset + uncompLen) > cdOffset)
626         {
627             ALOGE("ERROR: bad uncompressed length in zip (%ld + " ZD " > %ld)\n",
628                 (long) dataOffset, (ZD_TYPE) uncompLen, (long) cdOffset);
629             return false;
630         }
631 
632         *pOffset = dataOffset;
633     }
634 
635     return true;
636 }
637 
638 /*
639  * Copy the entry's filename to the buffer.
640  */
getEntryFileName(ZipEntryRO entry,char * buffer,int bufLen) const641 int ZipFileRO::getEntryFileName(ZipEntryRO entry, char* buffer, int bufLen)
642     const
643 {
644     int ent = entryToIndex(entry);
645     if (ent < 0)
646         return -1;
647 
648     int nameLen = mHashTable[ent].nameLen;
649     if (bufLen < nameLen+1)
650         return nameLen+1;
651 
652     memcpy(buffer, mHashTable[ent].name, nameLen);
653     buffer[nameLen] = '\0';
654     return 0;
655 }
656 
657 /*
658  * Create a new FileMap object that spans the data in "entry".
659  */
createEntryFileMap(ZipEntryRO entry) const660 FileMap* ZipFileRO::createEntryFileMap(ZipEntryRO entry) const
661 {
662     /*
663      * TODO: the efficient way to do this is to modify FileMap to allow
664      * sub-regions of a file to be mapped.  A reference-counting scheme
665      * can manage the base memory mapping.  For now, we just create a brand
666      * new mapping off of the Zip archive file descriptor.
667      */
668 
669     FileMap* newMap;
670     size_t compLen;
671     off64_t offset;
672 
673     if (!getEntryInfo(entry, NULL, NULL, &compLen, &offset, NULL, NULL))
674         return NULL;
675 
676     newMap = new FileMap();
677     if (!newMap->create(mFileName, mFd, offset, compLen, true)) {
678         newMap->release();
679         return NULL;
680     }
681 
682     return newMap;
683 }
684 
685 /*
686  * Uncompress an entry, in its entirety, into the provided output buffer.
687  *
688  * This doesn't verify the data's CRC, which might be useful for
689  * uncompressed data.  The caller should be able to manage it.
690  */
uncompressEntry(ZipEntryRO entry,void * buffer) const691 bool ZipFileRO::uncompressEntry(ZipEntryRO entry, void* buffer) const
692 {
693     const size_t kSequentialMin = 32768;
694     bool result = false;
695     int ent = entryToIndex(entry);
696     if (ent < 0)
697         return -1;
698 
699     int method;
700     size_t uncompLen, compLen;
701     off64_t offset;
702     const unsigned char* ptr;
703 
704     getEntryInfo(entry, &method, &uncompLen, &compLen, &offset, NULL, NULL);
705 
706     FileMap* file = createEntryFileMap(entry);
707     if (file == NULL) {
708         goto bail;
709     }
710 
711     ptr = (const unsigned char*) file->getDataPtr();
712 
713     /*
714      * Experiment with madvise hint.  When we want to uncompress a file,
715      * we pull some stuff out of the central dir entry and then hit a
716      * bunch of compressed or uncompressed data sequentially.  The CDE
717      * visit will cause a limited amount of read-ahead because it's at
718      * the end of the file.  We could end up doing lots of extra disk
719      * access if the file we're prying open is small.  Bottom line is we
720      * probably don't want to turn MADV_SEQUENTIAL on and leave it on.
721      *
722      * So, if the compressed size of the file is above a certain minimum
723      * size, temporarily boost the read-ahead in the hope that the extra
724      * pair of system calls are negated by a reduction in page faults.
725      */
726     if (compLen > kSequentialMin)
727         file->advise(FileMap::SEQUENTIAL);
728 
729     if (method == kCompressStored) {
730         memcpy(buffer, ptr, uncompLen);
731     } else {
732         if (!inflateBuffer(buffer, ptr, uncompLen, compLen))
733             goto unmap;
734     }
735 
736     if (compLen > kSequentialMin)
737         file->advise(FileMap::NORMAL);
738 
739     result = true;
740 
741 unmap:
742     file->release();
743 bail:
744     return result;
745 }
746 
747 /*
748  * Uncompress an entry, in its entirety, to an open file descriptor.
749  *
750  * This doesn't verify the data's CRC, but probably should.
751  */
uncompressEntry(ZipEntryRO entry,int fd) const752 bool ZipFileRO::uncompressEntry(ZipEntryRO entry, int fd) const
753 {
754     bool result = false;
755     int ent = entryToIndex(entry);
756     if (ent < 0)
757         return -1;
758 
759     int method;
760     size_t uncompLen, compLen;
761     off64_t offset;
762     const unsigned char* ptr;
763 
764     getEntryInfo(entry, &method, &uncompLen, &compLen, &offset, NULL, NULL);
765 
766     FileMap* file = createEntryFileMap(entry);
767     if (file == NULL) {
768         goto bail;
769     }
770 
771     ptr = (const unsigned char*) file->getDataPtr();
772 
773     if (method == kCompressStored) {
774         ssize_t actual = TEMP_FAILURE_RETRY(write(fd, ptr, uncompLen));
775         if (actual < 0) {
776             ALOGE("Write failed: %s\n", strerror(errno));
777             goto unmap;
778         } else if ((size_t) actual != uncompLen) {
779             ALOGE("Partial write during uncompress (" ZD " of " ZD ")\n",
780                 (ZD_TYPE) actual, (ZD_TYPE) uncompLen);
781             goto unmap;
782         } else {
783             ALOGI("+++ successful write\n");
784         }
785     } else {
786         if (!inflateBuffer(fd, ptr, uncompLen, compLen))
787             goto unmap;
788     }
789 
790     result = true;
791 
792 unmap:
793     file->release();
794 bail:
795     return result;
796 }
797 
798 /*
799  * Uncompress "deflate" data from one buffer to another.
800  */
inflateBuffer(void * outBuf,const void * inBuf,size_t uncompLen,size_t compLen)801 /*static*/ bool ZipFileRO::inflateBuffer(void* outBuf, const void* inBuf,
802     size_t uncompLen, size_t compLen)
803 {
804     bool result = false;
805     z_stream zstream;
806     int zerr;
807 
808     /*
809      * Initialize the zlib stream struct.
810      */
811     memset(&zstream, 0, sizeof(zstream));
812     zstream.zalloc = Z_NULL;
813     zstream.zfree = Z_NULL;
814     zstream.opaque = Z_NULL;
815     zstream.next_in = (Bytef*)inBuf;
816     zstream.avail_in = compLen;
817     zstream.next_out = (Bytef*) outBuf;
818     zstream.avail_out = uncompLen;
819     zstream.data_type = Z_UNKNOWN;
820 
821     /*
822      * Use the undocumented "negative window bits" feature to tell zlib
823      * that there's no zlib header waiting for it.
824      */
825     zerr = inflateInit2(&zstream, -MAX_WBITS);
826     if (zerr != Z_OK) {
827         if (zerr == Z_VERSION_ERROR) {
828             ALOGE("Installed zlib is not compatible with linked version (%s)\n",
829                 ZLIB_VERSION);
830         } else {
831             ALOGE("Call to inflateInit2 failed (zerr=%d)\n", zerr);
832         }
833         goto bail;
834     }
835 
836     /*
837      * Expand data.
838      */
839     zerr = inflate(&zstream, Z_FINISH);
840     if (zerr != Z_STREAM_END) {
841         ALOGW("Zip inflate failed, zerr=%d (nIn=%p aIn=%u nOut=%p aOut=%u)\n",
842             zerr, zstream.next_in, zstream.avail_in,
843             zstream.next_out, zstream.avail_out);
844         goto z_bail;
845     }
846 
847     /* paranoia */
848     if (zstream.total_out != uncompLen) {
849         ALOGW("Size mismatch on inflated file (%ld vs " ZD ")\n",
850             zstream.total_out, (ZD_TYPE) uncompLen);
851         goto z_bail;
852     }
853 
854     result = true;
855 
856 z_bail:
857     inflateEnd(&zstream);        /* free up any allocated structures */
858 
859 bail:
860     return result;
861 }
862 
863 /*
864  * Uncompress "deflate" data from one buffer to an open file descriptor.
865  */
inflateBuffer(int fd,const void * inBuf,size_t uncompLen,size_t compLen)866 /*static*/ bool ZipFileRO::inflateBuffer(int fd, const void* inBuf,
867     size_t uncompLen, size_t compLen)
868 {
869     bool result = false;
870     const size_t kWriteBufSize = 32768;
871     unsigned char writeBuf[kWriteBufSize];
872     z_stream zstream;
873     int zerr;
874 
875     /*
876      * Initialize the zlib stream struct.
877      */
878     memset(&zstream, 0, sizeof(zstream));
879     zstream.zalloc = Z_NULL;
880     zstream.zfree = Z_NULL;
881     zstream.opaque = Z_NULL;
882     zstream.next_in = (Bytef*)inBuf;
883     zstream.avail_in = compLen;
884     zstream.next_out = (Bytef*) writeBuf;
885     zstream.avail_out = sizeof(writeBuf);
886     zstream.data_type = Z_UNKNOWN;
887 
888     /*
889      * Use the undocumented "negative window bits" feature to tell zlib
890      * that there's no zlib header waiting for it.
891      */
892     zerr = inflateInit2(&zstream, -MAX_WBITS);
893     if (zerr != Z_OK) {
894         if (zerr == Z_VERSION_ERROR) {
895             ALOGE("Installed zlib is not compatible with linked version (%s)\n",
896                 ZLIB_VERSION);
897         } else {
898             ALOGE("Call to inflateInit2 failed (zerr=%d)\n", zerr);
899         }
900         goto bail;
901     }
902 
903     /*
904      * Loop while we have more to do.
905      */
906     do {
907         /*
908          * Expand data.
909          */
910         zerr = inflate(&zstream, Z_NO_FLUSH);
911         if (zerr != Z_OK && zerr != Z_STREAM_END) {
912             ALOGW("zlib inflate: zerr=%d (nIn=%p aIn=%u nOut=%p aOut=%u)\n",
913                 zerr, zstream.next_in, zstream.avail_in,
914                 zstream.next_out, zstream.avail_out);
915             goto z_bail;
916         }
917 
918         /* write when we're full or when we're done */
919         if (zstream.avail_out == 0 ||
920             (zerr == Z_STREAM_END && zstream.avail_out != sizeof(writeBuf)))
921         {
922             long writeSize = zstream.next_out - writeBuf;
923             int cc = TEMP_FAILURE_RETRY(write(fd, writeBuf, writeSize));
924             if (cc < 0) {
925                 ALOGW("write failed in inflate: %s", strerror(errno));
926                 goto z_bail;
927             } else if (cc != (int) writeSize) {
928                 ALOGW("write failed in inflate (%d vs %ld)", cc, writeSize);
929                 goto z_bail;
930             }
931 
932             zstream.next_out = writeBuf;
933             zstream.avail_out = sizeof(writeBuf);
934         }
935     } while (zerr == Z_OK);
936 
937     assert(zerr == Z_STREAM_END);       /* other errors should've been caught */
938 
939     /* paranoia */
940     if (zstream.total_out != uncompLen) {
941         ALOGW("Size mismatch on inflated file (%ld vs " ZD ")\n",
942             zstream.total_out, (ZD_TYPE) uncompLen);
943         goto z_bail;
944     }
945 
946     result = true;
947 
948 z_bail:
949     inflateEnd(&zstream);        /* free up any allocated structures */
950 
951 bail:
952     return result;
953 }
954