zip_archive.h revision 89521898b56f2ebc3fb68acfb6bc6dde9b6f5c38
1b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom/*
2b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom * Copyright (C) 2008 The Android Open Source Project
3b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom *
4b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom * Licensed under the Apache License, Version 2.0 (the "License");
5b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom * you may not use this file except in compliance with the License.
6b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom * You may obtain a copy of the License at
7b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom *
8b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom *      http://www.apache.org/licenses/LICENSE-2.0
9b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom *
10b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom * Unless required by applicable law or agreed to in writing, software
11b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom * distributed under the License is distributed on an "AS IS" BASIS,
12b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom * See the License for the specific language governing permissions and
14b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom * limitations under the License.
15b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom */
16b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
17b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom#ifndef ART_SRC_ZIP_ARCHIVE_H_
18b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom#define ART_SRC_ZIP_ARCHIVE_H_
19b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
20b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom#include <stdint.h>
21b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom#include <sys/mman.h>
22b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom#include <zlib.h>
23b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
2490a3369d3b6238f1a4c9b19ca68978dab1c39bc4Elliott Hughes#include <map>
2590a3369d3b6238f1a4c9b19ca68978dab1c39bc4Elliott Hughes
2690a3369d3b6238f1a4c9b19ca68978dab1c39bc4Elliott Hughes#include "UniquePtr.h"
27db4d54081f09abcbe97ffdf615874f2809a9e777Brian Carlstrom#include "file.h"
28b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom#include "globals.h"
29b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom#include "logging.h"
30db4d54081f09abcbe97ffdf615874f2809a9e777Brian Carlstrom#include "mem_map.h"
31b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom#include "stringpiece.h"
327e93b50433cde2a44d99212e8040299bde498546Brian Carlstrom#include "unordered_map.h"
33b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
34b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstromnamespace art {
35b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
36b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstromclass ZipArchive;
37b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstromclass MemMap;
38b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
39b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstromclass ZipEntry {
40b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom public:
4189521898b56f2ebc3fb68acfb6bc6dde9b6f5c38Brian Carlstrom  bool ExtractToFile(File& file);
4289521898b56f2ebc3fb68acfb6bc6dde9b6f5c38Brian Carlstrom  bool ExtractToMemory(MemMap& mem_map);
43b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
4489521898b56f2ebc3fb68acfb6bc6dde9b6f5c38Brian Carlstrom  uint32_t GetUncompressedLength();
45b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  uint32_t GetCrc32();
46b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
47b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom private:
48b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
49362f9bc807169bcfc8761dde067bbfb79b5ad0fdElliott Hughes  ZipEntry(ZipArchive* zip_archive, const byte* ptr) : zip_archive_(zip_archive), ptr_(ptr) {}
50b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
51b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  // Zip compression methods
52b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  enum {
53b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom    kCompressStored     = 0,        // no compression
54b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom    kCompressDeflated   = 8,        // standard deflate
55b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  };
56b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
57b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  // kCompressStored, kCompressDeflated, ...
58b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  uint16_t GetCompressionMethod();
59b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
60b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  uint32_t GetCompressedLength();
61b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
62b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  // returns -1 on error
63b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  off_t GetDataOffset();
64b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
65b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  ZipArchive* zip_archive_;
66b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
67b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  // pointer to zip entry within central directory
68db4d54081f09abcbe97ffdf615874f2809a9e777Brian Carlstrom  const byte* ptr_;
69b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
70b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  friend class ZipArchive;
71b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom};
72b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
73b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstromclass ZipArchive {
74b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom public:
75b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
76b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  // Zip file constants.
77b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static const uint32_t kEOCDSignature  = 0x06054b50;
78b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static const int32_t kEOCDLen         = 22;
79b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static const int32_t kEOCDNumEntries  =  8;  // offset to #of entries in file
80b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static const int32_t kEOCDSize        = 12;  // size of the central directory
81b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static const int32_t kEOCDFileOffset  = 16;  // offset to central directory
82b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
83b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static const int32_t kMaxCommentLen = 65535;  // longest possible in uint16_t
84b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static const int32_t kMaxEOCDSearch = (kMaxCommentLen + kEOCDLen);
85b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
86b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static const uint32_t kLFHSignature = 0x04034b50;
87b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static const int32_t kLFHLen        = 30;  // excluding variable-len fields
88b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static const int32_t kLFHNameLen    = 26;  // offset to filename length
89b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static const int32_t kLFHExtraLen   = 28;  // offset to extra length
90b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
91b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static const uint32_t kCDESignature   = 0x02014b50;
92b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static const int32_t kCDELen          = 46;  // excluding variable-len fields
93b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static const int32_t kCDEMethod       = 10;  // offset to compression method
94b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static const int32_t kCDEModWhen      = 12;  // offset to modification timestamp
95b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static const int32_t kCDECRC          = 16;  // offset to entry CRC
96b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static const int32_t kCDECompLen      = 20;  // offset to compressed length
97b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static const int32_t kCDEUncompLen    = 24;  // offset to uncompressed length
98b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static const int32_t kCDENameLen      = 28;  // offset to filename length
99b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static const int32_t kCDEExtraLen     = 30;  // offset to extra length
100b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static const int32_t kCDECommentLen   = 32;  // offset to comment length
101b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static const int32_t kCDELocalOffset  = 42;  // offset to local hdr
102b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
103b7bbba49d88eae58223d9878da4069bf6d7140bfBrian Carlstrom  // return new ZipArchive instance on success, NULL on error.
104b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  static ZipArchive* Open(const std::string& filename);
105b7bbba49d88eae58223d9878da4069bf6d7140bfBrian Carlstrom  static ZipArchive* Open(int fd);
106b7bbba49d88eae58223d9878da4069bf6d7140bfBrian Carlstrom
107c1f143de3d0370a17a4561eb83bf10a5d7908aa3Elliott Hughes  ZipEntry* Find(const char* name);
108b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
109b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  ~ZipArchive() {
110b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom    Close();
111b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  }
112b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
113b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom private:
114a51a3dd5603daf3d368b7735067e1d9eb54c4c40Elliott Hughes  explicit ZipArchive(int fd) : fd_(fd), num_entries_(0), dir_offset_(0) {}
115b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
116b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  bool MapCentralDirectory();
117b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  bool Parse();
118b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  void Close();
119b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
120b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  int fd_;
121b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  uint16_t num_entries_;
122b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  off_t dir_offset_;
12390a3369d3b6238f1a4c9b19ca68978dab1c39bc4Elliott Hughes  UniquePtr<MemMap> dir_map_;
124a663ea5de4c9ab6b1510fdebd6d8eca77ba699aeBrian Carlstrom  typedef std::tr1::unordered_map<StringPiece, const byte*, StringPieceHash> DirEntries;
1257e93b50433cde2a44d99212e8040299bde498546Brian Carlstrom  DirEntries dir_entries_;
126b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
127b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom  friend class ZipEntry;
128b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom};
129b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
130b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom}  // namespace art
131b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom
132b0460eaa2cb131f1dbdd5a7217bd36b9a9f1b995Brian Carlstrom#endif  // ART_SRC_ZIP_ARCHIVE_H_
133