dex_file.h revision b0fa5dc7769c1e054032f39de0a3f6d6dd06f8cf
1/*
2 * Copyright (C) 2011 The Android Open Source Project
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 *      http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
16
17#ifndef ART_RUNTIME_DEX_FILE_H_
18#define ART_RUNTIME_DEX_FILE_H_
19
20#include <string>
21#include <vector>
22
23#include "base/logging.h"
24#include "base/mutex.h"  // For Locks::mutator_lock_.
25#include "globals.h"
26#include "invoke_type.h"
27#include "jni.h"
28#include "mem_map.h"
29#include "modifiers.h"
30#include "safe_map.h"
31#include "UniquePtr.h"
32
33namespace art {
34
35// TODO: remove dependencies on mirror classes, primarily by moving
36// EncodedStaticFieldValueIterator to its own file.
37namespace mirror {
38  class ArtField;
39  class ArtMethod;
40  class ClassLoader;
41  class DexCache;
42}  // namespace mirror
43class ClassLinker;
44class Signature;
45template <typename T>
46class SirtRef;
47class StringPiece;
48class ZipArchive;
49
50// TODO: move all of the macro functionality into the DexCache class.
51class DexFile {
52 public:
53  static const byte kDexMagic[];
54  static const byte kDexMagicVersion[];
55  static const size_t kSha1DigestSize = 20;
56  static const uint32_t kDexEndianConstant = 0x12345678;
57
58  // name of the DexFile entry within a zip archive
59  static const char* kClassesDex;
60
61  // The value of an invalid index.
62  static const uint32_t kDexNoIndex = 0xFFFFFFFF;
63
64  // The value of an invalid index.
65  static const uint16_t kDexNoIndex16 = 0xFFFF;
66
67  // Raw header_item.
68  struct Header {
69    uint8_t magic_[8];
70    uint32_t checksum_;  // See also location_checksum_
71    uint8_t signature_[kSha1DigestSize];
72    uint32_t file_size_;  // size of entire file
73    uint32_t header_size_;  // offset to start of next section
74    uint32_t endian_tag_;
75    uint32_t link_size_;  // unused
76    uint32_t link_off_;  // unused
77    uint32_t map_off_;  // unused
78    uint32_t string_ids_size_;  // number of StringIds
79    uint32_t string_ids_off_;  // file offset of StringIds array
80    uint32_t type_ids_size_;  // number of TypeIds, we don't support more than 65535
81    uint32_t type_ids_off_;  // file offset of TypeIds array
82    uint32_t proto_ids_size_;  // number of ProtoIds, we don't support more than 65535
83    uint32_t proto_ids_off_;  // file offset of ProtoIds array
84    uint32_t field_ids_size_;  // number of FieldIds
85    uint32_t field_ids_off_;  // file offset of FieldIds array
86    uint32_t method_ids_size_;  // number of MethodIds
87    uint32_t method_ids_off_;  // file offset of MethodIds array
88    uint32_t class_defs_size_;  // number of ClassDefs
89    uint32_t class_defs_off_;  // file offset of ClassDef array
90    uint32_t data_size_;  // unused
91    uint32_t data_off_;  // unused
92
93   private:
94    DISALLOW_COPY_AND_ASSIGN(Header);
95  };
96
97  // Map item type codes.
98  enum {
99    kDexTypeHeaderItem               = 0x0000,
100    kDexTypeStringIdItem             = 0x0001,
101    kDexTypeTypeIdItem               = 0x0002,
102    kDexTypeProtoIdItem              = 0x0003,
103    kDexTypeFieldIdItem              = 0x0004,
104    kDexTypeMethodIdItem             = 0x0005,
105    kDexTypeClassDefItem             = 0x0006,
106    kDexTypeMapList                  = 0x1000,
107    kDexTypeTypeList                 = 0x1001,
108    kDexTypeAnnotationSetRefList     = 0x1002,
109    kDexTypeAnnotationSetItem        = 0x1003,
110    kDexTypeClassDataItem            = 0x2000,
111    kDexTypeCodeItem                 = 0x2001,
112    kDexTypeStringDataItem           = 0x2002,
113    kDexTypeDebugInfoItem            = 0x2003,
114    kDexTypeAnnotationItem           = 0x2004,
115    kDexTypeEncodedArrayItem         = 0x2005,
116    kDexTypeAnnotationsDirectoryItem = 0x2006,
117  };
118
119  struct MapItem {
120    uint16_t type_;
121    uint16_t unused_;
122    uint32_t size_;
123    uint32_t offset_;
124
125   private:
126    DISALLOW_COPY_AND_ASSIGN(MapItem);
127  };
128
129  struct MapList {
130    uint32_t size_;
131    MapItem list_[1];
132
133   private:
134    DISALLOW_COPY_AND_ASSIGN(MapList);
135  };
136
137  // Raw string_id_item.
138  struct StringId {
139    uint32_t string_data_off_;  // offset in bytes from the base address
140
141   private:
142    DISALLOW_COPY_AND_ASSIGN(StringId);
143  };
144
145  // Raw type_id_item.
146  struct TypeId {
147    uint32_t descriptor_idx_;  // index into string_ids
148
149   private:
150    DISALLOW_COPY_AND_ASSIGN(TypeId);
151  };
152
153  // Raw field_id_item.
154  struct FieldId {
155    uint16_t class_idx_;  // index into type_ids_ array for defining class
156    uint16_t type_idx_;  // index into type_ids_ array for field type
157    uint32_t name_idx_;  // index into string_ids_ array for field name
158
159   private:
160    DISALLOW_COPY_AND_ASSIGN(FieldId);
161  };
162
163  // Raw method_id_item.
164  struct MethodId {
165    uint16_t class_idx_;  // index into type_ids_ array for defining class
166    uint16_t proto_idx_;  // index into proto_ids_ array for method prototype
167    uint32_t name_idx_;  // index into string_ids_ array for method name
168
169   private:
170    DISALLOW_COPY_AND_ASSIGN(MethodId);
171  };
172
173  // Raw proto_id_item.
174  struct ProtoId {
175    uint32_t shorty_idx_;  // index into string_ids array for shorty descriptor
176    uint16_t return_type_idx_;  // index into type_ids array for return type
177    uint16_t pad_;             // padding = 0
178    uint32_t parameters_off_;  // file offset to type_list for parameter types
179
180   private:
181    DISALLOW_COPY_AND_ASSIGN(ProtoId);
182  };
183
184  // Raw class_def_item.
185  struct ClassDef {
186    uint16_t class_idx_;  // index into type_ids_ array for this class
187    uint16_t pad1_;  // padding = 0
188    uint32_t access_flags_;
189    uint16_t superclass_idx_;  // index into type_ids_ array for superclass
190    uint16_t pad2_;  // padding = 0
191    uint32_t interfaces_off_;  // file offset to TypeList
192    uint32_t source_file_idx_;  // index into string_ids_ for source file name
193    uint32_t annotations_off_;  // file offset to annotations_directory_item
194    uint32_t class_data_off_;  // file offset to class_data_item
195    uint32_t static_values_off_;  // file offset to EncodedArray
196
197   private:
198    DISALLOW_COPY_AND_ASSIGN(ClassDef);
199  };
200
201  // Raw type_item.
202  struct TypeItem {
203    uint16_t type_idx_;  // index into type_ids section
204
205   private:
206    DISALLOW_COPY_AND_ASSIGN(TypeItem);
207  };
208
209  // Raw type_list.
210  class TypeList {
211   public:
212    uint32_t Size() const {
213      return size_;
214    }
215
216    const TypeItem& GetTypeItem(uint32_t idx) const {
217      DCHECK_LT(idx, this->size_);
218      return this->list_[idx];
219    }
220
221   private:
222    uint32_t size_;  // size of the list, in entries
223    TypeItem list_[1];  // elements of the list
224    DISALLOW_COPY_AND_ASSIGN(TypeList);
225  };
226
227  // Raw code_item.
228  struct CodeItem {
229    uint16_t registers_size_;
230    uint16_t ins_size_;
231    uint16_t outs_size_;
232    uint16_t tries_size_;
233    uint32_t debug_info_off_;  // file offset to debug info stream
234    uint32_t insns_size_in_code_units_;  // size of the insns array, in 2 byte code units
235    uint16_t insns_[1];
236
237   private:
238    DISALLOW_COPY_AND_ASSIGN(CodeItem);
239  };
240
241  // Raw try_item.
242  struct TryItem {
243    uint32_t start_addr_;
244    uint16_t insn_count_;
245    uint16_t handler_off_;
246
247   private:
248    DISALLOW_COPY_AND_ASSIGN(TryItem);
249  };
250
251  // Annotation constants.
252  enum {
253    kDexVisibilityBuild         = 0x00,     /* annotation visibility */
254    kDexVisibilityRuntime       = 0x01,
255    kDexVisibilitySystem        = 0x02,
256
257    kDexAnnotationByte          = 0x00,
258    kDexAnnotationShort         = 0x02,
259    kDexAnnotationChar          = 0x03,
260    kDexAnnotationInt           = 0x04,
261    kDexAnnotationLong          = 0x06,
262    kDexAnnotationFloat         = 0x10,
263    kDexAnnotationDouble        = 0x11,
264    kDexAnnotationString        = 0x17,
265    kDexAnnotationType          = 0x18,
266    kDexAnnotationField         = 0x19,
267    kDexAnnotationMethod        = 0x1a,
268    kDexAnnotationEnum          = 0x1b,
269    kDexAnnotationArray         = 0x1c,
270    kDexAnnotationAnnotation    = 0x1d,
271    kDexAnnotationNull          = 0x1e,
272    kDexAnnotationBoolean       = 0x1f,
273
274    kDexAnnotationValueTypeMask = 0x1f,     /* low 5 bits */
275    kDexAnnotationValueArgShift = 5,
276  };
277
278  struct AnnotationsDirectoryItem {
279    uint32_t class_annotations_off_;
280    uint32_t fields_size_;
281    uint32_t methods_size_;
282    uint32_t parameters_size_;
283
284   private:
285    DISALLOW_COPY_AND_ASSIGN(AnnotationsDirectoryItem);
286  };
287
288  struct FieldAnnotationsItem {
289    uint32_t field_idx_;
290    uint32_t annotations_off_;
291
292   private:
293    DISALLOW_COPY_AND_ASSIGN(FieldAnnotationsItem);
294  };
295
296  struct MethodAnnotationsItem {
297    uint32_t method_idx_;
298    uint32_t annotations_off_;
299
300   private:
301    DISALLOW_COPY_AND_ASSIGN(MethodAnnotationsItem);
302  };
303
304  struct ParameterAnnotationsItem {
305    uint32_t method_idx_;
306    uint32_t annotations_off_;
307
308   private:
309    DISALLOW_COPY_AND_ASSIGN(ParameterAnnotationsItem);
310  };
311
312  struct AnnotationSetRefItem {
313    uint32_t annotations_off_;
314
315   private:
316    DISALLOW_COPY_AND_ASSIGN(AnnotationSetRefItem);
317  };
318
319  struct AnnotationSetRefList {
320    uint32_t size_;
321    AnnotationSetRefItem list_[1];
322
323   private:
324    DISALLOW_COPY_AND_ASSIGN(AnnotationSetRefList);
325  };
326
327  struct AnnotationSetItem {
328    uint32_t size_;
329    uint32_t entries_[1];
330
331   private:
332    DISALLOW_COPY_AND_ASSIGN(AnnotationSetItem);
333  };
334
335  struct AnnotationItem {
336    uint8_t visibility_;
337    uint8_t annotation_[1];
338
339   private:
340    DISALLOW_COPY_AND_ASSIGN(AnnotationItem);
341  };
342
343  typedef std::pair<const DexFile*, const DexFile::ClassDef*> ClassPathEntry;
344  typedef std::vector<const DexFile*> ClassPath;
345
346  // Search a collection of DexFiles for a descriptor
347  static ClassPathEntry FindInClassPath(const char* descriptor,
348                                        const ClassPath& class_path);
349
350  // Returns the checksum of a file for comparison with GetLocationChecksum().
351  // For .dex files, this is the header checksum.
352  // For zip files, this is the classes.dex zip entry CRC32 checksum.
353  // Return true if the checksum could be found, false otherwise.
354  static bool GetChecksum(const char* filename, uint32_t* checksum, std::string* error_msg);
355
356  // Opens .dex file, guessing the container format based on file extension
357  static const DexFile* Open(const char* filename, const char* location, std::string* error_msg);
358
359  // Opens .dex file, backed by existing memory
360  static const DexFile* Open(const uint8_t* base, size_t size,
361                             const std::string& location,
362                             uint32_t location_checksum,
363                             std::string* error_msg) {
364    return OpenMemory(base, size, location, location_checksum, NULL, error_msg);
365  }
366
367  // Opens .dex file from the classes.dex in a zip archive
368  static const DexFile* Open(const ZipArchive& zip_archive, const std::string& location,
369                             std::string* error_msg);
370
371  // Closes a .dex file.
372  virtual ~DexFile();
373
374  const std::string& GetLocation() const {
375    return location_;
376  }
377
378  // For DexFiles directly from .dex files, this is the checksum from the DexFile::Header.
379  // For DexFiles opened from a zip files, this will be the ZipEntry CRC32 of classes.dex.
380  uint32_t GetLocationChecksum() const {
381    return location_checksum_;
382  }
383
384  const Header& GetHeader() const {
385    DCHECK(header_ != NULL) << GetLocation();
386    return *header_;
387  }
388
389  // Decode the dex magic version
390  uint32_t GetVersion() const;
391
392  // Returns true if the byte string points to the magic value.
393  static bool IsMagicValid(const byte* magic);
394
395  // Returns true if the byte string after the magic is the correct value.
396  static bool IsVersionValid(const byte* magic);
397
398  // Returns the number of string identifiers in the .dex file.
399  size_t NumStringIds() const {
400    DCHECK(header_ != NULL) << GetLocation();
401    return header_->string_ids_size_;
402  }
403
404  // Returns the StringId at the specified index.
405  const StringId& GetStringId(uint32_t idx) const {
406    DCHECK_LT(idx, NumStringIds()) << GetLocation();
407    return string_ids_[idx];
408  }
409
410  uint32_t GetIndexForStringId(const StringId& string_id) const {
411    CHECK_GE(&string_id, string_ids_) << GetLocation();
412    CHECK_LT(&string_id, string_ids_ + header_->string_ids_size_) << GetLocation();
413    return &string_id - string_ids_;
414  }
415
416  int32_t GetStringLength(const StringId& string_id) const;
417
418  // Returns a pointer to the UTF-8 string data referred to by the given string_id as well as the
419  // length of the string when decoded as a UTF-16 string. Note the UTF-16 length is not the same
420  // as the string length of the string data.
421  const char* GetStringDataAndUtf16Length(const StringId& string_id, uint32_t* utf16_length) const;
422
423  const char* GetStringData(const StringId& string_id) const {
424    uint32_t ignored;
425    return GetStringDataAndUtf16Length(string_id, &ignored);
426  }
427
428  // Index version of GetStringDataAndUtf16Length.
429  const char* StringDataAndUtf16LengthByIdx(uint32_t idx, uint32_t* utf16_length) const {
430    if (idx == kDexNoIndex) {
431      *utf16_length = 0;
432      return NULL;
433    }
434    const StringId& string_id = GetStringId(idx);
435    return GetStringDataAndUtf16Length(string_id, utf16_length);
436  }
437
438  const char* StringDataByIdx(uint32_t idx) const {
439    uint32_t unicode_length;
440    return StringDataAndUtf16LengthByIdx(idx, &unicode_length);
441  }
442
443  // Looks up a string id for a given modified utf8 string.
444  const StringId* FindStringId(const char* string) const;
445
446  // Looks up a string id for a given utf16 string.
447  const StringId* FindStringId(const uint16_t* string) const;
448
449  // Returns the number of type identifiers in the .dex file.
450  size_t NumTypeIds() const {
451    DCHECK(header_ != NULL) << GetLocation();
452    return header_->type_ids_size_;
453  }
454
455  // Returns the TypeId at the specified index.
456  const TypeId& GetTypeId(uint32_t idx) const {
457    DCHECK_LT(idx, NumTypeIds()) << GetLocation();
458    return type_ids_[idx];
459  }
460
461  uint16_t GetIndexForTypeId(const TypeId& type_id) const {
462    CHECK_GE(&type_id, type_ids_) << GetLocation();
463    CHECK_LT(&type_id, type_ids_ + header_->type_ids_size_) << GetLocation();
464    size_t result = &type_id - type_ids_;
465    DCHECK_LT(result, 65536U) << GetLocation();
466    return static_cast<uint16_t>(result);
467  }
468
469  // Get the descriptor string associated with a given type index.
470  const char* StringByTypeIdx(uint32_t idx, uint32_t* unicode_length) const {
471    const TypeId& type_id = GetTypeId(idx);
472    return StringDataAndUtf16LengthByIdx(type_id.descriptor_idx_, unicode_length);
473  }
474
475  const char* StringByTypeIdx(uint32_t idx) const {
476    const TypeId& type_id = GetTypeId(idx);
477    return StringDataByIdx(type_id.descriptor_idx_);
478  }
479
480  // Returns the type descriptor string of a type id.
481  const char* GetTypeDescriptor(const TypeId& type_id) const {
482    return StringDataByIdx(type_id.descriptor_idx_);
483  }
484
485  // Looks up a type for the given string index
486  const TypeId* FindTypeId(uint32_t string_idx) const;
487
488  // Returns the number of field identifiers in the .dex file.
489  size_t NumFieldIds() const {
490    DCHECK(header_ != NULL) << GetLocation();
491    return header_->field_ids_size_;
492  }
493
494  // Returns the FieldId at the specified index.
495  const FieldId& GetFieldId(uint32_t idx) const {
496    DCHECK_LT(idx, NumFieldIds()) << GetLocation();
497    return field_ids_[idx];
498  }
499
500  uint32_t GetIndexForFieldId(const FieldId& field_id) const {
501    CHECK_GE(&field_id, field_ids_) << GetLocation();
502    CHECK_LT(&field_id, field_ids_ + header_->field_ids_size_) << GetLocation();
503    return &field_id - field_ids_;
504  }
505
506  // Looks up a field by its declaring class, name and type
507  const FieldId* FindFieldId(const DexFile::TypeId& declaring_klass,
508                             const DexFile::StringId& name,
509                             const DexFile::TypeId& type) const;
510
511  // Returns the declaring class descriptor string of a field id.
512  const char* GetFieldDeclaringClassDescriptor(const FieldId& field_id) const {
513    const DexFile::TypeId& type_id = GetTypeId(field_id.class_idx_);
514    return GetTypeDescriptor(type_id);
515  }
516
517  // Returns the class descriptor string of a field id.
518  const char* GetFieldTypeDescriptor(const FieldId& field_id) const {
519    const DexFile::TypeId& type_id = GetTypeId(field_id.type_idx_);
520    return GetTypeDescriptor(type_id);
521  }
522
523  // Returns the name of a field id.
524  const char* GetFieldName(const FieldId& field_id) const {
525    return StringDataByIdx(field_id.name_idx_);
526  }
527
528  // Returns the number of method identifiers in the .dex file.
529  size_t NumMethodIds() const {
530    DCHECK(header_ != NULL) << GetLocation();
531    return header_->method_ids_size_;
532  }
533
534  // Returns the MethodId at the specified index.
535  const MethodId& GetMethodId(uint32_t idx) const {
536    DCHECK_LT(idx, NumMethodIds()) << GetLocation();
537    return method_ids_[idx];
538  }
539
540  uint32_t GetIndexForMethodId(const MethodId& method_id) const {
541    CHECK_GE(&method_id, method_ids_) << GetLocation();
542    CHECK_LT(&method_id, method_ids_ + header_->method_ids_size_) << GetLocation();
543    return &method_id - method_ids_;
544  }
545
546  // Looks up a method by its declaring class, name and proto_id
547  const MethodId* FindMethodId(const DexFile::TypeId& declaring_klass,
548                               const DexFile::StringId& name,
549                               const DexFile::ProtoId& signature) const;
550
551  // Returns the declaring class descriptor string of a method id.
552  const char* GetMethodDeclaringClassDescriptor(const MethodId& method_id) const {
553    const DexFile::TypeId& type_id = GetTypeId(method_id.class_idx_);
554    return GetTypeDescriptor(type_id);
555  }
556
557  // Returns the prototype of a method id.
558  const ProtoId& GetMethodPrototype(const MethodId& method_id) const {
559    return GetProtoId(method_id.proto_idx_);
560  }
561
562  // Returns a representation of the signature of a method id.
563  const Signature GetMethodSignature(const MethodId& method_id) const;
564
565  // Returns the name of a method id.
566  const char* GetMethodName(const MethodId& method_id) const {
567    return StringDataByIdx(method_id.name_idx_);
568  }
569
570  // Returns the shorty of a method id.
571  const char* GetMethodShorty(const MethodId& method_id) const {
572    return StringDataByIdx(GetProtoId(method_id.proto_idx_).shorty_idx_);
573  }
574  const char* GetMethodShorty(const MethodId& method_id, uint32_t* length) const {
575    // Using the UTF16 length is safe here as shorties are guaranteed to be ASCII characters.
576    return StringDataAndUtf16LengthByIdx(GetProtoId(method_id.proto_idx_).shorty_idx_, length);
577  }
578  // Returns the number of class definitions in the .dex file.
579  size_t NumClassDefs() const {
580    DCHECK(header_ != NULL) << GetLocation();
581    return header_->class_defs_size_;
582  }
583
584  // Returns the ClassDef at the specified index.
585  const ClassDef& GetClassDef(uint16_t idx) const {
586    DCHECK_LT(idx, NumClassDefs()) << GetLocation();
587    return class_defs_[idx];
588  }
589
590  uint16_t GetIndexForClassDef(const ClassDef& class_def) const {
591    CHECK_GE(&class_def, class_defs_) << GetLocation();
592    CHECK_LT(&class_def, class_defs_ + header_->class_defs_size_) << GetLocation();
593    return &class_def - class_defs_;
594  }
595
596  // Returns the class descriptor string of a class definition.
597  const char* GetClassDescriptor(const ClassDef& class_def) const {
598    return StringByTypeIdx(class_def.class_idx_);
599  }
600
601  // Looks up a class definition by its class descriptor.
602  const ClassDef* FindClassDef(const char* descriptor) const;
603
604  // Looks up a class definition by its type index.
605  const ClassDef* FindClassDef(uint16_t type_idx) const;
606
607  const TypeList* GetInterfacesList(const ClassDef& class_def) const {
608    if (class_def.interfaces_off_ == 0) {
609        return NULL;
610    } else {
611      const byte* addr = begin_ + class_def.interfaces_off_;
612      return reinterpret_cast<const TypeList*>(addr);
613    }
614  }
615
616  // Returns a pointer to the raw memory mapped class_data_item
617  const byte* GetClassData(const ClassDef& class_def) const {
618    if (class_def.class_data_off_ == 0) {
619      return NULL;
620    } else {
621      return begin_ + class_def.class_data_off_;
622    }
623  }
624
625  //
626  const CodeItem* GetCodeItem(const uint32_t code_off) const {
627    if (code_off == 0) {
628      return NULL;  // native or abstract method
629    } else {
630      const byte* addr = begin_ + code_off;
631      return reinterpret_cast<const CodeItem*>(addr);
632    }
633  }
634
635  const char* GetReturnTypeDescriptor(const ProtoId& proto_id) const {
636    return StringByTypeIdx(proto_id.return_type_idx_);
637  }
638
639  // Returns the number of prototype identifiers in the .dex file.
640  size_t NumProtoIds() const {
641    DCHECK(header_ != NULL) << GetLocation();
642    return header_->proto_ids_size_;
643  }
644
645  // Returns the ProtoId at the specified index.
646  const ProtoId& GetProtoId(uint32_t idx) const {
647    DCHECK_LT(idx, NumProtoIds()) << GetLocation();
648    return proto_ids_[idx];
649  }
650
651  uint16_t GetIndexForProtoId(const ProtoId& proto_id) const {
652    CHECK_GE(&proto_id, proto_ids_) << GetLocation();
653    CHECK_LT(&proto_id, proto_ids_ + header_->proto_ids_size_) << GetLocation();
654    return &proto_id - proto_ids_;
655  }
656
657  // Looks up a proto id for a given return type and signature type list
658  const ProtoId* FindProtoId(uint16_t return_type_idx,
659                             const uint16_t* signature_type_idxs, uint32_t signature_length) const;
660  const ProtoId* FindProtoId(uint16_t return_type_idx,
661                             const std::vector<uint16_t>& signature_type_idxs) const {
662    return FindProtoId(return_type_idx, &signature_type_idxs[0], signature_type_idxs.size());
663  }
664
665  // Given a signature place the type ids into the given vector, returns true on success
666  bool CreateTypeList(const StringPiece& signature, uint16_t* return_type_idx,
667                      std::vector<uint16_t>* param_type_idxs) const;
668
669  // Create a Signature from the given string signature or return Signature::NoSignature if not
670  // possible.
671  const Signature CreateSignature(const StringPiece& signature) const;
672
673  // Returns the short form method descriptor for the given prototype.
674  const char* GetShorty(uint32_t proto_idx) const {
675    const ProtoId& proto_id = GetProtoId(proto_idx);
676    return StringDataByIdx(proto_id.shorty_idx_);
677  }
678
679  const TypeList* GetProtoParameters(const ProtoId& proto_id) const {
680    if (proto_id.parameters_off_ == 0) {
681      return NULL;
682    } else {
683      const byte* addr = begin_ + proto_id.parameters_off_;
684      return reinterpret_cast<const TypeList*>(addr);
685    }
686  }
687
688  const byte* GetEncodedStaticFieldValuesArray(const ClassDef& class_def) const {
689    if (class_def.static_values_off_ == 0) {
690      return 0;
691    } else {
692      return begin_ + class_def.static_values_off_;
693    }
694  }
695
696  static const TryItem* GetTryItems(const CodeItem& code_item, uint32_t offset);
697
698  // Get the base of the encoded data for the given DexCode.
699  static const byte* GetCatchHandlerData(const CodeItem& code_item, uint32_t offset) {
700    const byte* handler_data =
701        reinterpret_cast<const byte*>(GetTryItems(code_item, code_item.tries_size_));
702    return handler_data + offset;
703  }
704
705  // Find which try region is associated with the given address (ie dex pc). Returns -1 if none.
706  static int32_t FindTryItem(const CodeItem &code_item, uint32_t address);
707
708  // Find the handler offset associated with the given address (ie dex pc). Returns -1 if none.
709  static int32_t FindCatchHandlerOffset(const CodeItem &code_item, uint32_t address);
710
711  // Get the pointer to the start of the debugging data
712  const byte* GetDebugInfoStream(const CodeItem* code_item) const {
713    if (code_item->debug_info_off_ == 0) {
714      return NULL;
715    } else {
716      return begin_ + code_item->debug_info_off_;
717    }
718  }
719
720  // Callback for "new position table entry".
721  // Returning true causes the decoder to stop early.
722  typedef bool (*DexDebugNewPositionCb)(void* context, uint32_t address, uint32_t line_num);
723
724  // Callback for "new locals table entry". "signature" is an empty string
725  // if no signature is available for an entry.
726  typedef void (*DexDebugNewLocalCb)(void* context, uint16_t reg,
727                                     uint32_t start_address,
728                                     uint32_t end_address,
729                                     const char* name,
730                                     const char* descriptor,
731                                     const char* signature);
732
733  static bool LineNumForPcCb(void* context, uint32_t address, uint32_t line_num);
734
735  // Debug info opcodes and constants
736  enum {
737    DBG_END_SEQUENCE         = 0x00,
738    DBG_ADVANCE_PC           = 0x01,
739    DBG_ADVANCE_LINE         = 0x02,
740    DBG_START_LOCAL          = 0x03,
741    DBG_START_LOCAL_EXTENDED = 0x04,
742    DBG_END_LOCAL            = 0x05,
743    DBG_RESTART_LOCAL        = 0x06,
744    DBG_SET_PROLOGUE_END     = 0x07,
745    DBG_SET_EPILOGUE_BEGIN   = 0x08,
746    DBG_SET_FILE             = 0x09,
747    DBG_FIRST_SPECIAL        = 0x0a,
748    DBG_LINE_BASE            = -4,
749    DBG_LINE_RANGE           = 15,
750  };
751
752  struct LocalInfo {
753    LocalInfo()
754        : name_(NULL), descriptor_(NULL), signature_(NULL), start_address_(0), is_live_(false) {}
755
756    const char* name_;  // E.g., list
757    const char* descriptor_;  // E.g., Ljava/util/LinkedList;
758    const char* signature_;  // E.g., java.util.LinkedList<java.lang.Integer>
759    uint16_t start_address_;  // PC location where the local is first defined.
760    bool is_live_;  // Is the local defined and live.
761
762   private:
763    DISALLOW_COPY_AND_ASSIGN(LocalInfo);
764  };
765
766  struct LineNumFromPcContext {
767    LineNumFromPcContext(uint32_t address, uint32_t line_num)
768        : address_(address), line_num_(line_num) {}
769    uint32_t address_;
770    uint32_t line_num_;
771   private:
772    DISALLOW_COPY_AND_ASSIGN(LineNumFromPcContext);
773  };
774
775  void InvokeLocalCbIfLive(void* context, int reg, uint32_t end_address,
776                           LocalInfo* local_in_reg, DexDebugNewLocalCb local_cb) const {
777    if (local_cb != NULL && local_in_reg[reg].is_live_) {
778      local_cb(context, reg, local_in_reg[reg].start_address_, end_address,
779          local_in_reg[reg].name_, local_in_reg[reg].descriptor_,
780          local_in_reg[reg].signature_ != NULL ? local_in_reg[reg].signature_ : "");
781    }
782  }
783
784  // Determine the source file line number based on the program counter.
785  // "pc" is an offset, in 16-bit units, from the start of the method's code.
786  //
787  // Returns -1 if no match was found (possibly because the source files were
788  // compiled without "-g", so no line number information is present).
789  // Returns -2 for native methods (as expected in exception traces).
790  //
791  // This is used by runtime; therefore use art::Method not art::DexFile::Method.
792  int32_t GetLineNumFromPC(mirror::ArtMethod* method, uint32_t rel_pc) const
793      SHARED_LOCKS_REQUIRED(Locks::mutator_lock_);
794
795  void DecodeDebugInfo(const CodeItem* code_item, bool is_static, uint32_t method_idx,
796                       DexDebugNewPositionCb position_cb, DexDebugNewLocalCb local_cb,
797                       void* context) const;
798
799  const char* GetSourceFile(const ClassDef& class_def) const {
800    if (class_def.source_file_idx_ == 0xffffffff) {
801      return NULL;
802    } else {
803      return StringDataByIdx(class_def.source_file_idx_);
804    }
805  }
806
807  int GetPermissions() const;
808
809  bool IsReadOnly() const;
810
811  bool EnableWrite() const;
812
813  bool DisableWrite() const;
814
815  const byte* Begin() const {
816    return begin_;
817  }
818
819  size_t Size() const {
820    return size_;
821  }
822
823 private:
824  // Opens a .dex file
825  static const DexFile* OpenFile(int fd, const char* location, bool verify, std::string* error_msg);
826
827  // Opens a dex file from within a .jar, .zip, or .apk file
828  static const DexFile* OpenZip(int fd, const std::string& location, std::string* error_msg);
829
830  // Opens a .dex file at the given address backed by a MemMap
831  static const DexFile* OpenMemory(const std::string& location,
832                                   uint32_t location_checksum,
833                                   MemMap* mem_map,
834                                   std::string* error_msg);
835
836  // Opens a .dex file at the given address, optionally backed by a MemMap
837  static const DexFile* OpenMemory(const byte* dex_file,
838                                   size_t size,
839                                   const std::string& location,
840                                   uint32_t location_checksum,
841                                   MemMap* mem_map,
842                                   std::string* error_msg);
843
844  DexFile(const byte* base, size_t size,
845          const std::string& location,
846          uint32_t location_checksum,
847          MemMap* mem_map);
848
849  // Top-level initializer that calls other Init methods.
850  bool Init(std::string* error_msg);
851
852  // Returns true if the header magic and version numbers are of the expected values.
853  bool CheckMagicAndVersion(std::string* error_msg) const;
854
855  void DecodeDebugInfo0(const CodeItem* code_item, bool is_static, uint32_t method_idx,
856      DexDebugNewPositionCb position_cb, DexDebugNewLocalCb local_cb,
857      void* context, const byte* stream, LocalInfo* local_in_reg) const;
858
859  // The base address of the memory mapping.
860  const byte* const begin_;
861
862  // The size of the underlying memory allocation in bytes.
863  const size_t size_;
864
865  // Typically the dex file name when available, alternatively some identifying string.
866  //
867  // The ClassLinker will use this to match DexFiles the boot class
868  // path to DexCache::GetLocation when loading from an image.
869  const std::string location_;
870
871  const uint32_t location_checksum_;
872
873  // Manages the underlying memory allocation.
874  UniquePtr<MemMap> mem_map_;
875
876  // Points to the header section.
877  const Header* const header_;
878
879  // Points to the base of the string identifier list.
880  const StringId* const string_ids_;
881
882  // Points to the base of the type identifier list.
883  const TypeId* const type_ids_;
884
885  // Points to the base of the field identifier list.
886  const FieldId* const field_ids_;
887
888  // Points to the base of the method identifier list.
889  const MethodId* const method_ids_;
890
891  // Points to the base of the prototype identifier list.
892  const ProtoId* const proto_ids_;
893
894  // Points to the base of the class definition list.
895  const ClassDef* const class_defs_;
896};
897std::ostream& operator<<(std::ostream& os, const DexFile& dex_file);
898
899// Iterate over a dex file's ProtoId's paramters
900class DexFileParameterIterator {
901 public:
902  DexFileParameterIterator(const DexFile& dex_file, const DexFile::ProtoId& proto_id)
903      : dex_file_(dex_file), size_(0), pos_(0) {
904    type_list_ = dex_file_.GetProtoParameters(proto_id);
905    if (type_list_ != NULL) {
906      size_ = type_list_->Size();
907    }
908  }
909  bool HasNext() const { return pos_ < size_; }
910  void Next() { ++pos_; }
911  uint16_t GetTypeIdx() {
912    return type_list_->GetTypeItem(pos_).type_idx_;
913  }
914  const char* GetDescriptor() {
915    return dex_file_.StringByTypeIdx(GetTypeIdx());
916  }
917 private:
918  const DexFile& dex_file_;
919  const DexFile::TypeList* type_list_;
920  uint32_t size_;
921  uint32_t pos_;
922  DISALLOW_IMPLICIT_CONSTRUCTORS(DexFileParameterIterator);
923};
924
925// Abstract the signature of a method.
926class Signature {
927 public:
928  std::string ToString() const;
929
930  static Signature NoSignature() {
931    return Signature();
932  }
933
934  bool operator==(const Signature& rhs) const;
935  bool operator!=(const Signature& rhs) const {
936    return !(*this == rhs);
937  }
938
939  bool operator==(const StringPiece& rhs) const;
940
941 private:
942  Signature(const DexFile* dex, const DexFile::ProtoId& proto) : dex_file_(dex), proto_id_(&proto) {
943  }
944
945  Signature() : dex_file_(nullptr), proto_id_(nullptr) {
946  }
947
948  friend class DexFile;
949
950  const DexFile* const dex_file_;
951  const DexFile::ProtoId* const proto_id_;
952};
953std::ostream& operator<<(std::ostream& os, const Signature& sig);
954
955// Iterate and decode class_data_item
956class ClassDataItemIterator {
957 public:
958  ClassDataItemIterator(const DexFile& dex_file, const byte* raw_class_data_item)
959      : dex_file_(dex_file), pos_(0), ptr_pos_(raw_class_data_item), last_idx_(0) {
960    ReadClassDataHeader();
961    if (EndOfInstanceFieldsPos() > 0) {
962      ReadClassDataField();
963    } else if (EndOfVirtualMethodsPos() > 0) {
964      ReadClassDataMethod();
965    }
966  }
967  uint32_t NumStaticFields() const {
968    return header_.static_fields_size_;
969  }
970  uint32_t NumInstanceFields() const {
971    return header_.instance_fields_size_;
972  }
973  uint32_t NumDirectMethods() const {
974    return header_.direct_methods_size_;
975  }
976  uint32_t NumVirtualMethods() const {
977    return header_.virtual_methods_size_;
978  }
979  bool HasNextStaticField() const {
980    return pos_ < EndOfStaticFieldsPos();
981  }
982  bool HasNextInstanceField() const {
983    return pos_ >= EndOfStaticFieldsPos() && pos_ < EndOfInstanceFieldsPos();
984  }
985  bool HasNextDirectMethod() const {
986    return pos_ >= EndOfInstanceFieldsPos() && pos_ < EndOfDirectMethodsPos();
987  }
988  bool HasNextVirtualMethod() const {
989    return pos_ >= EndOfDirectMethodsPos() && pos_ < EndOfVirtualMethodsPos();
990  }
991  bool HasNext() const {
992    return pos_ < EndOfVirtualMethodsPos();
993  }
994  inline void Next() {
995    pos_++;
996    if (pos_ < EndOfStaticFieldsPos()) {
997      last_idx_ = GetMemberIndex();
998      ReadClassDataField();
999    } else if (pos_ == EndOfStaticFieldsPos() && NumInstanceFields() > 0) {
1000      last_idx_ = 0;  // transition to next array, reset last index
1001      ReadClassDataField();
1002    } else if (pos_ < EndOfInstanceFieldsPos()) {
1003      last_idx_ = GetMemberIndex();
1004      ReadClassDataField();
1005    } else if (pos_ == EndOfInstanceFieldsPos() && NumDirectMethods() > 0) {
1006      last_idx_ = 0;  // transition to next array, reset last index
1007      ReadClassDataMethod();
1008    } else if (pos_ < EndOfDirectMethodsPos()) {
1009      last_idx_ = GetMemberIndex();
1010      ReadClassDataMethod();
1011    } else if (pos_ == EndOfDirectMethodsPos() && NumVirtualMethods() > 0) {
1012      last_idx_ = 0;  // transition to next array, reset last index
1013      ReadClassDataMethod();
1014    } else if (pos_ < EndOfVirtualMethodsPos()) {
1015      last_idx_ = GetMemberIndex();
1016      ReadClassDataMethod();
1017    } else {
1018      DCHECK(!HasNext());
1019    }
1020  }
1021  uint32_t GetMemberIndex() const {
1022    if (pos_ < EndOfInstanceFieldsPos()) {
1023      return last_idx_ + field_.field_idx_delta_;
1024    } else {
1025      DCHECK_LT(pos_, EndOfVirtualMethodsPos());
1026      return last_idx_ + method_.method_idx_delta_;
1027    }
1028  }
1029  uint32_t GetMemberAccessFlags() const {
1030    if (pos_ < EndOfInstanceFieldsPos()) {
1031      return field_.access_flags_;
1032    } else {
1033      DCHECK_LT(pos_, EndOfVirtualMethodsPos());
1034      return method_.access_flags_;
1035    }
1036  }
1037  InvokeType GetMethodInvokeType(const DexFile::ClassDef& class_def) const {
1038    if (HasNextDirectMethod()) {
1039      if ((GetMemberAccessFlags() & kAccStatic) != 0) {
1040        return kStatic;
1041      } else {
1042        return kDirect;
1043      }
1044    } else {
1045      DCHECK_EQ(GetMemberAccessFlags() & kAccStatic, 0U);
1046      if ((class_def.access_flags_ & kAccInterface) != 0) {
1047        return kInterface;
1048      } else if ((GetMemberAccessFlags() & kAccConstructor) != 0) {
1049        return kSuper;
1050      } else {
1051        return kVirtual;
1052      }
1053    }
1054  }
1055  const DexFile::CodeItem* GetMethodCodeItem() const {
1056    return dex_file_.GetCodeItem(method_.code_off_);
1057  }
1058  uint32_t GetMethodCodeItemOffset() const {
1059    return method_.code_off_;
1060  }
1061  const byte* EndDataPointer() const {
1062    CHECK(!HasNext());
1063    return ptr_pos_;
1064  }
1065
1066 private:
1067  // A dex file's class_data_item is leb128 encoded, this structure holds a decoded form of the
1068  // header for a class_data_item
1069  struct ClassDataHeader {
1070    uint32_t static_fields_size_;  // the number of static fields
1071    uint32_t instance_fields_size_;  // the number of instance fields
1072    uint32_t direct_methods_size_;  // the number of direct methods
1073    uint32_t virtual_methods_size_;  // the number of virtual methods
1074  } header_;
1075
1076  // Read and decode header from a class_data_item stream into header
1077  void ReadClassDataHeader();
1078
1079  uint32_t EndOfStaticFieldsPos() const {
1080    return header_.static_fields_size_;
1081  }
1082  uint32_t EndOfInstanceFieldsPos() const {
1083    return EndOfStaticFieldsPos() + header_.instance_fields_size_;
1084  }
1085  uint32_t EndOfDirectMethodsPos() const {
1086    return EndOfInstanceFieldsPos() + header_.direct_methods_size_;
1087  }
1088  uint32_t EndOfVirtualMethodsPos() const {
1089    return EndOfDirectMethodsPos() + header_.virtual_methods_size_;
1090  }
1091
1092  // A decoded version of the field of a class_data_item
1093  struct ClassDataField {
1094    uint32_t field_idx_delta_;  // delta of index into the field_ids array for FieldId
1095    uint32_t access_flags_;  // access flags for the field
1096    ClassDataField() :  field_idx_delta_(0), access_flags_(0) {}
1097
1098   private:
1099    DISALLOW_COPY_AND_ASSIGN(ClassDataField);
1100  };
1101  ClassDataField field_;
1102
1103  // Read and decode a field from a class_data_item stream into field
1104  void ReadClassDataField();
1105
1106  // A decoded version of the method of a class_data_item
1107  struct ClassDataMethod {
1108    uint32_t method_idx_delta_;  // delta of index into the method_ids array for MethodId
1109    uint32_t access_flags_;
1110    uint32_t code_off_;
1111    ClassDataMethod() : method_idx_delta_(0), access_flags_(0), code_off_(0) {}
1112
1113   private:
1114    DISALLOW_COPY_AND_ASSIGN(ClassDataMethod);
1115  };
1116  ClassDataMethod method_;
1117
1118  // Read and decode a method from a class_data_item stream into method
1119  void ReadClassDataMethod();
1120
1121  const DexFile& dex_file_;
1122  size_t pos_;  // integral number of items passed
1123  const byte* ptr_pos_;  // pointer into stream of class_data_item
1124  uint32_t last_idx_;  // last read field or method index to apply delta to
1125  DISALLOW_IMPLICIT_CONSTRUCTORS(ClassDataItemIterator);
1126};
1127
1128class EncodedStaticFieldValueIterator {
1129 public:
1130  EncodedStaticFieldValueIterator(const DexFile& dex_file, SirtRef<mirror::DexCache>* dex_cache,
1131                                  SirtRef<mirror::ClassLoader>* class_loader,
1132                                  ClassLinker* linker, const DexFile::ClassDef& class_def)
1133      SHARED_LOCKS_REQUIRED(Locks::mutator_lock_);
1134
1135  template<bool kTransactionActive>
1136  void ReadValueToField(mirror::ArtField* field) const SHARED_LOCKS_REQUIRED(Locks::mutator_lock_);
1137
1138  bool HasNext() { return pos_ < array_size_; }
1139
1140  void Next();
1141
1142  enum ValueType {
1143    kByte = 0x00,
1144    kShort = 0x02,
1145    kChar = 0x03,
1146    kInt = 0x04,
1147    kLong = 0x06,
1148    kFloat = 0x10,
1149    kDouble = 0x11,
1150    kString = 0x17,
1151    kType = 0x18,
1152    kField = 0x19,
1153    kMethod = 0x1a,
1154    kEnum = 0x1b,
1155    kArray = 0x1c,
1156    kAnnotation = 0x1d,
1157    kNull = 0x1e,
1158    kBoolean = 0x1f
1159  };
1160
1161 private:
1162  static const byte kEncodedValueTypeMask = 0x1f;  // 0b11111
1163  static const byte kEncodedValueArgShift = 5;
1164
1165  const DexFile& dex_file_;
1166  SirtRef<mirror::DexCache>* const dex_cache_;  // Dex cache to resolve literal objects.
1167  SirtRef<mirror::ClassLoader>* const class_loader_;  // ClassLoader to resolve types.
1168  ClassLinker* linker_;  // Linker to resolve literal objects.
1169  size_t array_size_;  // Size of array.
1170  size_t pos_;  // Current position.
1171  const byte* ptr_;  // Pointer into encoded data array.
1172  ValueType type_;  // Type of current encoded value.
1173  jvalue jval_;  // Value of current encoded value.
1174  DISALLOW_IMPLICIT_CONSTRUCTORS(EncodedStaticFieldValueIterator);
1175};
1176std::ostream& operator<<(std::ostream& os, const EncodedStaticFieldValueIterator::ValueType& code);
1177
1178class CatchHandlerIterator {
1179  public:
1180    CatchHandlerIterator(const DexFile::CodeItem& code_item, uint32_t address);
1181
1182    CatchHandlerIterator(const DexFile::CodeItem& code_item,
1183                         const DexFile::TryItem& try_item);
1184
1185    explicit CatchHandlerIterator(const byte* handler_data) {
1186      Init(handler_data);
1187    }
1188
1189    uint16_t GetHandlerTypeIndex() const {
1190      return handler_.type_idx_;
1191    }
1192    uint32_t GetHandlerAddress() const {
1193      return handler_.address_;
1194    }
1195    void Next();
1196    bool HasNext() const {
1197      return remaining_count_ != -1 || catch_all_;
1198    }
1199    // End of this set of catch blocks, convenience method to locate next set of catch blocks
1200    const byte* EndDataPointer() const {
1201      CHECK(!HasNext());
1202      return current_data_;
1203    }
1204
1205  private:
1206    void Init(const DexFile::CodeItem& code_item, int32_t offset);
1207    void Init(const byte* handler_data);
1208
1209    struct CatchHandlerItem {
1210      uint16_t type_idx_;  // type index of the caught exception type
1211      uint32_t address_;  // handler address
1212    } handler_;
1213    const byte *current_data_;  // the current handler in dex file.
1214    int32_t remaining_count_;   // number of handlers not read.
1215    bool catch_all_;            // is there a handler that will catch all exceptions in case
1216                                // that all typed handler does not match.
1217};
1218
1219}  // namespace art
1220
1221#endif  // ART_RUNTIME_DEX_FILE_H_
1222