zip_archive.h revision 761600567d73b23324ae0251e871c15d6849ffd8
1b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom/*
2b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom * Copyright (C) 2008 The Android Open Source Project
3b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom *
4b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom * Licensed under the Apache License, Version 2.0 (the "License");
5b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom * you may not use this file except in compliance with the License.
6b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom * You may obtain a copy of the License at
7b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom *
8b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom *      http://www.apache.org/licenses/LICENSE-2.0
9b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom *
10b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom * Unless required by applicable law or agreed to in writing, software
11b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom * distributed under the License is distributed on an "AS IS" BASIS,
12b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom * See the License for the specific language governing permissions and
14b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom * limitations under the License.
15b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom */
16b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
17b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom#ifndef ART_SRC_ZIP_ARCHIVE_H_
18b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom#define ART_SRC_ZIP_ARCHIVE_H_
19b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
20b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom#include <stdint.h>
21b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom#include <zlib.h>
22b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
23761600567d73b23324ae0251e871c15d6849ffd8Elliott Hughes#include "base/unix_file/random_access_file.h"
24b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom#include "globals.h"
25b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom#include "logging.h"
26db4d54081f09abcbe97ffdf615874f2809a9e777Brian Carlstrom#include "mem_map.h"
27761600567d73b23324ae0251e871c15d6849ffd8Elliott Hughes#include "os.h"
28a0e180632411f7fe0edf454e571c42209ee7b540Elliott Hughes#include "safe_map.h"
29b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom#include "stringpiece.h"
30e5448b5a12003b405b22cde3b94f962ab4888a87Elliott Hughes#include "UniquePtr.h"
31b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
32b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstromnamespace art {
33b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
34b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstromclass ZipArchive;
35b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstromclass MemMap;
36b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
37b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstromclass ZipEntry {
38b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom public:
3989521898b56f2ebc3fb68acfb6bc6dde9b6f5c38Brian Carlstrom  bool ExtractToFile(File& file);
4089521898b56f2ebc3fb68acfb6bc6dde9b6f5c38Brian Carlstrom  bool ExtractToMemory(MemMap& mem_map);
41b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
4289521898b56f2ebc3fb68acfb6bc6dde9b6f5c38Brian Carlstrom  uint32_t GetUncompressedLength();
43b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  uint32_t GetCrc32();
44b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
45b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom private:
46a6cc893c4b142cd410fc956963b6f5a014e983adBrian Carlstrom  ZipEntry(const ZipArchive* zip_archive, const byte* ptr) : zip_archive_(zip_archive), ptr_(ptr) {}
47b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
48b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  // Zip compression methods
49b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  enum {
50b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom    kCompressStored     = 0,        // no compression
51b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom    kCompressDeflated   = 8,        // standard deflate
52b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  };
53b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
54b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  // kCompressStored, kCompressDeflated, ...
55b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  uint16_t GetCompressionMethod();
56b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
57b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  uint32_t GetCompressedLength();
58b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
59b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  // returns -1 on error
60b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  off_t GetDataOffset();
61b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
62a6cc893c4b142cd410fc956963b6f5a014e983adBrian Carlstrom  const ZipArchive* zip_archive_;
63b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
64b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  // pointer to zip entry within central directory
65db4d54081f09abcbe97ffdf615874f2809a9e777Brian Carlstrom  const byte* ptr_;
66b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
67b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  friend class ZipArchive;
68a21039c3ae2b20e44ceb2735251c04d0aac89afdElliott Hughes  DISALLOW_COPY_AND_ASSIGN(ZipEntry);
69b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom};
70b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
71b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstromclass ZipArchive {
72b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom public:
73b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  // Zip file constants.
74b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static const uint32_t kEOCDSignature  = 0x06054b50;
75b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static const int32_t kEOCDLen         = 22;
76b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static const int32_t kEOCDNumEntries  =  8;  // offset to #of entries in file
77b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static const int32_t kEOCDSize        = 12;  // size of the central directory
78b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static const int32_t kEOCDFileOffset  = 16;  // offset to central directory
79b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
80b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static const int32_t kMaxCommentLen = 65535;  // longest possible in uint16_t
81b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static const int32_t kMaxEOCDSearch = (kMaxCommentLen + kEOCDLen);
82b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
83b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static const uint32_t kLFHSignature = 0x04034b50;
84b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static const int32_t kLFHLen        = 30;  // excluding variable-len fields
85b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static const int32_t kLFHNameLen    = 26;  // offset to filename length
86b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static const int32_t kLFHExtraLen   = 28;  // offset to extra length
87b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
88b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static const uint32_t kCDESignature   = 0x02014b50;
89b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static const int32_t kCDELen          = 46;  // excluding variable-len fields
90b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static const int32_t kCDEMethod       = 10;  // offset to compression method
91b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static const int32_t kCDEModWhen      = 12;  // offset to modification timestamp
92b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static const int32_t kCDECRC          = 16;  // offset to entry CRC
93b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static const int32_t kCDECompLen      = 20;  // offset to compressed length
94b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static const int32_t kCDEUncompLen    = 24;  // offset to uncompressed length
95b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static const int32_t kCDENameLen      = 28;  // offset to filename length
96b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static const int32_t kCDEExtraLen     = 30;  // offset to extra length
97b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static const int32_t kCDECommentLen   = 32;  // offset to comment length
98b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static const int32_t kCDELocalOffset  = 42;  // offset to local hdr
99b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
100b7bbba49d88eae58223d9878da4069bf6d7140bfBrian Carlstrom  // return new ZipArchive instance on success, NULL on error.
101b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static ZipArchive* Open(const std::string& filename);
102a6cc893c4b142cd410fc956963b6f5a014e983adBrian Carlstrom  static ZipArchive* OpenFromFd(int fd);
103b7bbba49d88eae58223d9878da4069bf6d7140bfBrian Carlstrom
104a6cc893c4b142cd410fc956963b6f5a014e983adBrian Carlstrom  ZipEntry* Find(const char* name) const;
105b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
106b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  ~ZipArchive() {
107b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom    Close();
108b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  }
109b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
110b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom private:
111a51a3dd5603daf3d368b7735067e1d9eb54c4c40Elliott Hughes  explicit ZipArchive(int fd) : fd_(fd), num_entries_(0), dir_offset_(0) {}
112b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
113b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  bool MapCentralDirectory();
114b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  bool Parse();
115b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  void Close();
116b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
117b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  int fd_;
118b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  uint16_t num_entries_;
119b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  off_t dir_offset_;
12090a3369d3b6238f1a4c9b19ca68978dab1c39bc4Elliott Hughes  UniquePtr<MemMap> dir_map_;
121a0e180632411f7fe0edf454e571c42209ee7b540Elliott Hughes  typedef SafeMap<StringPiece, const byte*> DirEntries;
1227e93b50433cde2a44d99212e8040299bde498546Brian Carlstrom  DirEntries dir_entries_;
123b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
124b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  friend class ZipEntry;
125a21039c3ae2b20e44ceb2735251c04d0aac89afdElliott Hughes
126a21039c3ae2b20e44ceb2735251c04d0aac89afdElliott Hughes  DISALLOW_COPY_AND_ASSIGN(ZipArchive);
127b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom};
128b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
129b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom}  // namespace art
130b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
131b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom#endif  // ART_SRC_ZIP_ARCHIVE_H_
132