dex_file.h revision 5c96e6b4dc354a7439b211b93462fbe8edea5e57
1/*
2 * Copyright (C) 2011 The Android Open Source Project
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 *      http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
16
17#ifndef ART_RUNTIME_DEX_FILE_H_
18#define ART_RUNTIME_DEX_FILE_H_
19
20#include <string>
21#include <vector>
22
23#include "base/logging.h"
24#include "base/mutex.h"
25#include "base/stringpiece.h"
26#include "globals.h"
27#include "invoke_type.h"
28#include "jni.h"
29#include "mem_map.h"
30#include "modifiers.h"
31#include "safe_map.h"
32#include "UniquePtr.h"
33
34namespace art {
35
36// TODO: remove dependencies on mirror classes, primarily by moving
37// EncodedStaticFieldValueIterator to its own file.
38namespace mirror {
39  class ArtField;
40  class ArtMethod;
41  class ClassLoader;
42  class DexCache;
43}  // namespace mirror
44class ClassLinker;
45class Signature;
46template <typename T>
47class SirtRef;
48class StringPiece;
49class ZipArchive;
50
51// TODO: move all of the macro functionality into the DexCache class.
52class DexFile {
53 public:
54  static const byte kDexMagic[];
55  static const byte kDexMagicVersion[];
56  static const size_t kSha1DigestSize = 20;
57  static const uint32_t kDexEndianConstant = 0x12345678;
58
59  // name of the DexFile entry within a zip archive
60  static const char* kClassesDex;
61
62  // The value of an invalid index.
63  static const uint32_t kDexNoIndex = 0xFFFFFFFF;
64
65  // The value of an invalid index.
66  static const uint16_t kDexNoIndex16 = 0xFFFF;
67
68  // Raw header_item.
69  struct Header {
70    uint8_t magic_[8];
71    uint32_t checksum_;  // See also location_checksum_
72    uint8_t signature_[kSha1DigestSize];
73    uint32_t file_size_;  // size of entire file
74    uint32_t header_size_;  // offset to start of next section
75    uint32_t endian_tag_;
76    uint32_t link_size_;  // unused
77    uint32_t link_off_;  // unused
78    uint32_t map_off_;  // unused
79    uint32_t string_ids_size_;  // number of StringIds
80    uint32_t string_ids_off_;  // file offset of StringIds array
81    uint32_t type_ids_size_;  // number of TypeIds, we don't support more than 65535
82    uint32_t type_ids_off_;  // file offset of TypeIds array
83    uint32_t proto_ids_size_;  // number of ProtoIds, we don't support more than 65535
84    uint32_t proto_ids_off_;  // file offset of ProtoIds array
85    uint32_t field_ids_size_;  // number of FieldIds
86    uint32_t field_ids_off_;  // file offset of FieldIds array
87    uint32_t method_ids_size_;  // number of MethodIds
88    uint32_t method_ids_off_;  // file offset of MethodIds array
89    uint32_t class_defs_size_;  // number of ClassDefs
90    uint32_t class_defs_off_;  // file offset of ClassDef array
91    uint32_t data_size_;  // unused
92    uint32_t data_off_;  // unused
93
94   private:
95    DISALLOW_COPY_AND_ASSIGN(Header);
96  };
97
98  // Map item type codes.
99  enum {
100    kDexTypeHeaderItem               = 0x0000,
101    kDexTypeStringIdItem             = 0x0001,
102    kDexTypeTypeIdItem               = 0x0002,
103    kDexTypeProtoIdItem              = 0x0003,
104    kDexTypeFieldIdItem              = 0x0004,
105    kDexTypeMethodIdItem             = 0x0005,
106    kDexTypeClassDefItem             = 0x0006,
107    kDexTypeMapList                  = 0x1000,
108    kDexTypeTypeList                 = 0x1001,
109    kDexTypeAnnotationSetRefList     = 0x1002,
110    kDexTypeAnnotationSetItem        = 0x1003,
111    kDexTypeClassDataItem            = 0x2000,
112    kDexTypeCodeItem                 = 0x2001,
113    kDexTypeStringDataItem           = 0x2002,
114    kDexTypeDebugInfoItem            = 0x2003,
115    kDexTypeAnnotationItem           = 0x2004,
116    kDexTypeEncodedArrayItem         = 0x2005,
117    kDexTypeAnnotationsDirectoryItem = 0x2006,
118  };
119
120  struct MapItem {
121    uint16_t type_;
122    uint16_t unused_;
123    uint32_t size_;
124    uint32_t offset_;
125
126   private:
127    DISALLOW_COPY_AND_ASSIGN(MapItem);
128  };
129
130  struct MapList {
131    uint32_t size_;
132    MapItem list_[1];
133
134   private:
135    DISALLOW_COPY_AND_ASSIGN(MapList);
136  };
137
138  // Raw string_id_item.
139  struct StringId {
140    uint32_t string_data_off_;  // offset in bytes from the base address
141
142   private:
143    DISALLOW_COPY_AND_ASSIGN(StringId);
144  };
145
146  // Raw type_id_item.
147  struct TypeId {
148    uint32_t descriptor_idx_;  // index into string_ids
149
150   private:
151    DISALLOW_COPY_AND_ASSIGN(TypeId);
152  };
153
154  // Raw field_id_item.
155  struct FieldId {
156    uint16_t class_idx_;  // index into type_ids_ array for defining class
157    uint16_t type_idx_;  // index into type_ids_ array for field type
158    uint32_t name_idx_;  // index into string_ids_ array for field name
159
160   private:
161    DISALLOW_COPY_AND_ASSIGN(FieldId);
162  };
163
164  // Raw method_id_item.
165  struct MethodId {
166    uint16_t class_idx_;  // index into type_ids_ array for defining class
167    uint16_t proto_idx_;  // index into proto_ids_ array for method prototype
168    uint32_t name_idx_;  // index into string_ids_ array for method name
169
170   private:
171    DISALLOW_COPY_AND_ASSIGN(MethodId);
172  };
173
174  // Raw proto_id_item.
175  struct ProtoId {
176    uint32_t shorty_idx_;  // index into string_ids array for shorty descriptor
177    uint16_t return_type_idx_;  // index into type_ids array for return type
178    uint16_t pad_;             // padding = 0
179    uint32_t parameters_off_;  // file offset to type_list for parameter types
180
181   private:
182    DISALLOW_COPY_AND_ASSIGN(ProtoId);
183  };
184
185  // Raw class_def_item.
186  struct ClassDef {
187    uint16_t class_idx_;  // index into type_ids_ array for this class
188    uint16_t pad1_;  // padding = 0
189    uint32_t access_flags_;
190    uint16_t superclass_idx_;  // index into type_ids_ array for superclass
191    uint16_t pad2_;  // padding = 0
192    uint32_t interfaces_off_;  // file offset to TypeList
193    uint32_t source_file_idx_;  // index into string_ids_ for source file name
194    uint32_t annotations_off_;  // file offset to annotations_directory_item
195    uint32_t class_data_off_;  // file offset to class_data_item
196    uint32_t static_values_off_;  // file offset to EncodedArray
197
198   private:
199    DISALLOW_COPY_AND_ASSIGN(ClassDef);
200  };
201
202  // Raw type_item.
203  struct TypeItem {
204    uint16_t type_idx_;  // index into type_ids section
205
206   private:
207    DISALLOW_COPY_AND_ASSIGN(TypeItem);
208  };
209
210  // Raw type_list.
211  class TypeList {
212   public:
213    uint32_t Size() const {
214      return size_;
215    }
216
217    const TypeItem& GetTypeItem(uint32_t idx) const {
218      DCHECK_LT(idx, this->size_);
219      return this->list_[idx];
220    }
221
222   private:
223    uint32_t size_;  // size of the list, in entries
224    TypeItem list_[1];  // elements of the list
225    DISALLOW_COPY_AND_ASSIGN(TypeList);
226  };
227
228  // Raw code_item.
229  struct CodeItem {
230    uint16_t registers_size_;
231    uint16_t ins_size_;
232    uint16_t outs_size_;
233    uint16_t tries_size_;
234    uint32_t debug_info_off_;  // file offset to debug info stream
235    uint32_t insns_size_in_code_units_;  // size of the insns array, in 2 byte code units
236    uint16_t insns_[1];
237
238   private:
239    DISALLOW_COPY_AND_ASSIGN(CodeItem);
240  };
241
242  // Raw try_item.
243  struct TryItem {
244    uint32_t start_addr_;
245    uint16_t insn_count_;
246    uint16_t handler_off_;
247
248   private:
249    DISALLOW_COPY_AND_ASSIGN(TryItem);
250  };
251
252  // Annotation constants.
253  enum {
254    kDexVisibilityBuild         = 0x00,     /* annotation visibility */
255    kDexVisibilityRuntime       = 0x01,
256    kDexVisibilitySystem        = 0x02,
257
258    kDexAnnotationByte          = 0x00,
259    kDexAnnotationShort         = 0x02,
260    kDexAnnotationChar          = 0x03,
261    kDexAnnotationInt           = 0x04,
262    kDexAnnotationLong          = 0x06,
263    kDexAnnotationFloat         = 0x10,
264    kDexAnnotationDouble        = 0x11,
265    kDexAnnotationString        = 0x17,
266    kDexAnnotationType          = 0x18,
267    kDexAnnotationField         = 0x19,
268    kDexAnnotationMethod        = 0x1a,
269    kDexAnnotationEnum          = 0x1b,
270    kDexAnnotationArray         = 0x1c,
271    kDexAnnotationAnnotation    = 0x1d,
272    kDexAnnotationNull          = 0x1e,
273    kDexAnnotationBoolean       = 0x1f,
274
275    kDexAnnotationValueTypeMask = 0x1f,     /* low 5 bits */
276    kDexAnnotationValueArgShift = 5,
277  };
278
279  struct AnnotationsDirectoryItem {
280    uint32_t class_annotations_off_;
281    uint32_t fields_size_;
282    uint32_t methods_size_;
283    uint32_t parameters_size_;
284
285   private:
286    DISALLOW_COPY_AND_ASSIGN(AnnotationsDirectoryItem);
287  };
288
289  struct FieldAnnotationsItem {
290    uint32_t field_idx_;
291    uint32_t annotations_off_;
292
293   private:
294    DISALLOW_COPY_AND_ASSIGN(FieldAnnotationsItem);
295  };
296
297  struct MethodAnnotationsItem {
298    uint32_t method_idx_;
299    uint32_t annotations_off_;
300
301   private:
302    DISALLOW_COPY_AND_ASSIGN(MethodAnnotationsItem);
303  };
304
305  struct ParameterAnnotationsItem {
306    uint32_t method_idx_;
307    uint32_t annotations_off_;
308
309   private:
310    DISALLOW_COPY_AND_ASSIGN(ParameterAnnotationsItem);
311  };
312
313  struct AnnotationSetRefItem {
314    uint32_t annotations_off_;
315
316   private:
317    DISALLOW_COPY_AND_ASSIGN(AnnotationSetRefItem);
318  };
319
320  struct AnnotationSetRefList {
321    uint32_t size_;
322    AnnotationSetRefItem list_[1];
323
324   private:
325    DISALLOW_COPY_AND_ASSIGN(AnnotationSetRefList);
326  };
327
328  struct AnnotationSetItem {
329    uint32_t size_;
330    uint32_t entries_[1];
331
332   private:
333    DISALLOW_COPY_AND_ASSIGN(AnnotationSetItem);
334  };
335
336  struct AnnotationItem {
337    uint8_t visibility_;
338    uint8_t annotation_[1];
339
340   private:
341    DISALLOW_COPY_AND_ASSIGN(AnnotationItem);
342  };
343
344  typedef std::pair<const DexFile*, const DexFile::ClassDef*> ClassPathEntry;
345  typedef std::vector<const DexFile*> ClassPath;
346
347  // Search a collection of DexFiles for a descriptor
348  static ClassPathEntry FindInClassPath(const char* descriptor,
349                                        const ClassPath& class_path);
350
351  // Returns the checksum of a file for comparison with GetLocationChecksum().
352  // For .dex files, this is the header checksum.
353  // For zip files, this is the classes.dex zip entry CRC32 checksum.
354  // Return true if the checksum could be found, false otherwise.
355  static bool GetChecksum(const char* filename, uint32_t* checksum, std::string* error_msg);
356
357  // Opens .dex file, guessing the container format based on file extension
358  static const DexFile* Open(const char* filename, const char* location, std::string* error_msg);
359
360  // Opens .dex file, backed by existing memory
361  static const DexFile* Open(const uint8_t* base, size_t size,
362                             const std::string& location,
363                             uint32_t location_checksum,
364                             std::string* error_msg) {
365    return OpenMemory(base, size, location, location_checksum, NULL, error_msg);
366  }
367
368  // Opens .dex file from the classes.dex in a zip archive
369  static const DexFile* Open(const ZipArchive& zip_archive, const std::string& location,
370                             std::string* error_msg);
371
372  // Closes a .dex file.
373  virtual ~DexFile();
374
375  const std::string& GetLocation() const {
376    return location_;
377  }
378
379  // For DexFiles directly from .dex files, this is the checksum from the DexFile::Header.
380  // For DexFiles opened from a zip files, this will be the ZipEntry CRC32 of classes.dex.
381  uint32_t GetLocationChecksum() const {
382    return location_checksum_;
383  }
384
385  const Header& GetHeader() const {
386    DCHECK(header_ != NULL) << GetLocation();
387    return *header_;
388  }
389
390  Mutex& GetModificationLock() {
391    return modification_lock;
392  }
393
394  // Decode the dex magic version
395  uint32_t GetVersion() const;
396
397  // Returns true if the byte string points to the magic value.
398  static bool IsMagicValid(const byte* magic);
399
400  // Returns true if the byte string after the magic is the correct value.
401  static bool IsVersionValid(const byte* magic);
402
403  // Returns the number of string identifiers in the .dex file.
404  size_t NumStringIds() const {
405    DCHECK(header_ != NULL) << GetLocation();
406    return header_->string_ids_size_;
407  }
408
409  // Returns the StringId at the specified index.
410  const StringId& GetStringId(uint32_t idx) const {
411    DCHECK_LT(idx, NumStringIds()) << GetLocation();
412    return string_ids_[idx];
413  }
414
415  uint32_t GetIndexForStringId(const StringId& string_id) const {
416    CHECK_GE(&string_id, string_ids_) << GetLocation();
417    CHECK_LT(&string_id, string_ids_ + header_->string_ids_size_) << GetLocation();
418    return &string_id - string_ids_;
419  }
420
421  int32_t GetStringLength(const StringId& string_id) const;
422
423  // Returns a pointer to the UTF-8 string data referred to by the given string_id as well as the
424  // length of the string when decoded as a UTF-16 string. Note the UTF-16 length is not the same
425  // as the string length of the string data.
426  const char* GetStringDataAndUtf16Length(const StringId& string_id, uint32_t* utf16_length) const;
427
428  const char* GetStringData(const StringId& string_id) const {
429    uint32_t ignored;
430    return GetStringDataAndUtf16Length(string_id, &ignored);
431  }
432
433  // Index version of GetStringDataAndUtf16Length.
434  const char* StringDataAndUtf16LengthByIdx(uint32_t idx, uint32_t* utf16_length) const {
435    if (idx == kDexNoIndex) {
436      *utf16_length = 0;
437      return NULL;
438    }
439    const StringId& string_id = GetStringId(idx);
440    return GetStringDataAndUtf16Length(string_id, utf16_length);
441  }
442
443  const char* StringDataByIdx(uint32_t idx) const {
444    uint32_t unicode_length;
445    return StringDataAndUtf16LengthByIdx(idx, &unicode_length);
446  }
447
448  // Looks up a string id for a given modified utf8 string.
449  const StringId* FindStringId(const char* string) const;
450
451  // Looks up a string id for a given utf16 string.
452  const StringId* FindStringId(const uint16_t* string) const;
453
454  // Returns the number of type identifiers in the .dex file.
455  size_t NumTypeIds() const {
456    DCHECK(header_ != NULL) << GetLocation();
457    return header_->type_ids_size_;
458  }
459
460  // Returns the TypeId at the specified index.
461  const TypeId& GetTypeId(uint32_t idx) const {
462    DCHECK_LT(idx, NumTypeIds()) << GetLocation();
463    return type_ids_[idx];
464  }
465
466  uint16_t GetIndexForTypeId(const TypeId& type_id) const {
467    CHECK_GE(&type_id, type_ids_) << GetLocation();
468    CHECK_LT(&type_id, type_ids_ + header_->type_ids_size_) << GetLocation();
469    size_t result = &type_id - type_ids_;
470    DCHECK_LT(result, 65536U) << GetLocation();
471    return static_cast<uint16_t>(result);
472  }
473
474  // Get the descriptor string associated with a given type index.
475  const char* StringByTypeIdx(uint32_t idx, uint32_t* unicode_length) const {
476    const TypeId& type_id = GetTypeId(idx);
477    return StringDataAndUtf16LengthByIdx(type_id.descriptor_idx_, unicode_length);
478  }
479
480  const char* StringByTypeIdx(uint32_t idx) const {
481    const TypeId& type_id = GetTypeId(idx);
482    return StringDataByIdx(type_id.descriptor_idx_);
483  }
484
485  // Returns the type descriptor string of a type id.
486  const char* GetTypeDescriptor(const TypeId& type_id) const {
487    return StringDataByIdx(type_id.descriptor_idx_);
488  }
489
490  // Looks up a type for the given string index
491  const TypeId* FindTypeId(uint32_t string_idx) const;
492
493  // Returns the number of field identifiers in the .dex file.
494  size_t NumFieldIds() const {
495    DCHECK(header_ != NULL) << GetLocation();
496    return header_->field_ids_size_;
497  }
498
499  // Returns the FieldId at the specified index.
500  const FieldId& GetFieldId(uint32_t idx) const {
501    DCHECK_LT(idx, NumFieldIds()) << GetLocation();
502    return field_ids_[idx];
503  }
504
505  uint32_t GetIndexForFieldId(const FieldId& field_id) const {
506    CHECK_GE(&field_id, field_ids_) << GetLocation();
507    CHECK_LT(&field_id, field_ids_ + header_->field_ids_size_) << GetLocation();
508    return &field_id - field_ids_;
509  }
510
511  // Looks up a field by its declaring class, name and type
512  const FieldId* FindFieldId(const DexFile::TypeId& declaring_klass,
513                             const DexFile::StringId& name,
514                             const DexFile::TypeId& type) const;
515
516  // Returns the declaring class descriptor string of a field id.
517  const char* GetFieldDeclaringClassDescriptor(const FieldId& field_id) const {
518    const DexFile::TypeId& type_id = GetTypeId(field_id.class_idx_);
519    return GetTypeDescriptor(type_id);
520  }
521
522  // Returns the class descriptor string of a field id.
523  const char* GetFieldTypeDescriptor(const FieldId& field_id) const {
524    const DexFile::TypeId& type_id = GetTypeId(field_id.type_idx_);
525    return GetTypeDescriptor(type_id);
526  }
527
528  // Returns the name of a field id.
529  const char* GetFieldName(const FieldId& field_id) const {
530    return StringDataByIdx(field_id.name_idx_);
531  }
532
533  // Returns the number of method identifiers in the .dex file.
534  size_t NumMethodIds() const {
535    DCHECK(header_ != NULL) << GetLocation();
536    return header_->method_ids_size_;
537  }
538
539  // Returns the MethodId at the specified index.
540  const MethodId& GetMethodId(uint32_t idx) const {
541    DCHECK_LT(idx, NumMethodIds()) << GetLocation();
542    return method_ids_[idx];
543  }
544
545  uint32_t GetIndexForMethodId(const MethodId& method_id) const {
546    CHECK_GE(&method_id, method_ids_) << GetLocation();
547    CHECK_LT(&method_id, method_ids_ + header_->method_ids_size_) << GetLocation();
548    return &method_id - method_ids_;
549  }
550
551  // Looks up a method by its declaring class, name and proto_id
552  const MethodId* FindMethodId(const DexFile::TypeId& declaring_klass,
553                               const DexFile::StringId& name,
554                               const DexFile::ProtoId& signature) const;
555
556  // Returns the declaring class descriptor string of a method id.
557  const char* GetMethodDeclaringClassDescriptor(const MethodId& method_id) const {
558    const DexFile::TypeId& type_id = GetTypeId(method_id.class_idx_);
559    return GetTypeDescriptor(type_id);
560  }
561
562  // Returns the prototype of a method id.
563  const ProtoId& GetMethodPrototype(const MethodId& method_id) const {
564    return GetProtoId(method_id.proto_idx_);
565  }
566
567  // Returns a representation of the signature of a method id.
568  const Signature GetMethodSignature(const MethodId& method_id) const;
569
570  // Returns the name of a method id.
571  const char* GetMethodName(const MethodId& method_id) const {
572    return StringDataByIdx(method_id.name_idx_);
573  }
574
575  // Returns the shorty of a method id.
576  const char* GetMethodShorty(const MethodId& method_id) const {
577    return StringDataByIdx(GetProtoId(method_id.proto_idx_).shorty_idx_);
578  }
579  const char* GetMethodShorty(const MethodId& method_id, uint32_t* length) const {
580    // Using the UTF16 length is safe here as shorties are guaranteed to be ASCII characters.
581    return StringDataAndUtf16LengthByIdx(GetProtoId(method_id.proto_idx_).shorty_idx_, length);
582  }
583  // Returns the number of class definitions in the .dex file.
584  size_t NumClassDefs() const {
585    DCHECK(header_ != NULL) << GetLocation();
586    return header_->class_defs_size_;
587  }
588
589  // Returns the ClassDef at the specified index.
590  const ClassDef& GetClassDef(uint16_t idx) const {
591    DCHECK_LT(idx, NumClassDefs()) << GetLocation();
592    return class_defs_[idx];
593  }
594
595  uint16_t GetIndexForClassDef(const ClassDef& class_def) const {
596    CHECK_GE(&class_def, class_defs_) << GetLocation();
597    CHECK_LT(&class_def, class_defs_ + header_->class_defs_size_) << GetLocation();
598    return &class_def - class_defs_;
599  }
600
601  // Returns the class descriptor string of a class definition.
602  const char* GetClassDescriptor(const ClassDef& class_def) const {
603    return StringByTypeIdx(class_def.class_idx_);
604  }
605
606  // Looks up a class definition by its class descriptor.
607  const ClassDef* FindClassDef(const char* descriptor) const;
608
609  // Looks up a class definition by its type index.
610  const ClassDef* FindClassDef(uint16_t type_idx) const;
611
612  const TypeList* GetInterfacesList(const ClassDef& class_def) const {
613    if (class_def.interfaces_off_ == 0) {
614        return NULL;
615    } else {
616      const byte* addr = begin_ + class_def.interfaces_off_;
617      return reinterpret_cast<const TypeList*>(addr);
618    }
619  }
620
621  // Returns a pointer to the raw memory mapped class_data_item
622  const byte* GetClassData(const ClassDef& class_def) const {
623    if (class_def.class_data_off_ == 0) {
624      return NULL;
625    } else {
626      return begin_ + class_def.class_data_off_;
627    }
628  }
629
630  //
631  const CodeItem* GetCodeItem(const uint32_t code_off) const {
632    if (code_off == 0) {
633      return NULL;  // native or abstract method
634    } else {
635      const byte* addr = begin_ + code_off;
636      return reinterpret_cast<const CodeItem*>(addr);
637    }
638  }
639
640  const char* GetReturnTypeDescriptor(const ProtoId& proto_id) const {
641    return StringByTypeIdx(proto_id.return_type_idx_);
642  }
643
644  // Returns the number of prototype identifiers in the .dex file.
645  size_t NumProtoIds() const {
646    DCHECK(header_ != NULL) << GetLocation();
647    return header_->proto_ids_size_;
648  }
649
650  // Returns the ProtoId at the specified index.
651  const ProtoId& GetProtoId(uint32_t idx) const {
652    DCHECK_LT(idx, NumProtoIds()) << GetLocation();
653    return proto_ids_[idx];
654  }
655
656  uint16_t GetIndexForProtoId(const ProtoId& proto_id) const {
657    CHECK_GE(&proto_id, proto_ids_) << GetLocation();
658    CHECK_LT(&proto_id, proto_ids_ + header_->proto_ids_size_) << GetLocation();
659    return &proto_id - proto_ids_;
660  }
661
662  // Looks up a proto id for a given return type and signature type list
663  const ProtoId* FindProtoId(uint16_t return_type_idx,
664                             const uint16_t* signature_type_idxs, uint32_t signature_length) const;
665  const ProtoId* FindProtoId(uint16_t return_type_idx,
666                             const std::vector<uint16_t>& signature_type_idxs) const {
667    return FindProtoId(return_type_idx, &signature_type_idxs[0], signature_type_idxs.size());
668  }
669
670  // Given a signature place the type ids into the given vector, returns true on success
671  bool CreateTypeList(const StringPiece& signature, uint16_t* return_type_idx,
672                      std::vector<uint16_t>* param_type_idxs) const;
673
674  // Create a Signature from the given string signature or return Signature::NoSignature if not
675  // possible.
676  const Signature CreateSignature(const StringPiece& signature) const;
677
678  // Returns the short form method descriptor for the given prototype.
679  const char* GetShorty(uint32_t proto_idx) const {
680    const ProtoId& proto_id = GetProtoId(proto_idx);
681    return StringDataByIdx(proto_id.shorty_idx_);
682  }
683
684  const TypeList* GetProtoParameters(const ProtoId& proto_id) const {
685    if (proto_id.parameters_off_ == 0) {
686      return NULL;
687    } else {
688      const byte* addr = begin_ + proto_id.parameters_off_;
689      return reinterpret_cast<const TypeList*>(addr);
690    }
691  }
692
693  const byte* GetEncodedStaticFieldValuesArray(const ClassDef& class_def) const {
694    if (class_def.static_values_off_ == 0) {
695      return 0;
696    } else {
697      return begin_ + class_def.static_values_off_;
698    }
699  }
700
701  static const TryItem* GetTryItems(const CodeItem& code_item, uint32_t offset);
702
703  // Get the base of the encoded data for the given DexCode.
704  static const byte* GetCatchHandlerData(const CodeItem& code_item, uint32_t offset) {
705    const byte* handler_data =
706        reinterpret_cast<const byte*>(GetTryItems(code_item, code_item.tries_size_));
707    return handler_data + offset;
708  }
709
710  // Find which try region is associated with the given address (ie dex pc). Returns -1 if none.
711  static int32_t FindTryItem(const CodeItem &code_item, uint32_t address);
712
713  // Find the handler offset associated with the given address (ie dex pc). Returns -1 if none.
714  static int32_t FindCatchHandlerOffset(const CodeItem &code_item, uint32_t address);
715
716  // Get the pointer to the start of the debugging data
717  const byte* GetDebugInfoStream(const CodeItem* code_item) const {
718    if (code_item->debug_info_off_ == 0) {
719      return NULL;
720    } else {
721      return begin_ + code_item->debug_info_off_;
722    }
723  }
724
725  // Callback for "new position table entry".
726  // Returning true causes the decoder to stop early.
727  typedef bool (*DexDebugNewPositionCb)(void* context, uint32_t address, uint32_t line_num);
728
729  // Callback for "new locals table entry". "signature" is an empty string
730  // if no signature is available for an entry.
731  typedef void (*DexDebugNewLocalCb)(void* context, uint16_t reg,
732                                     uint32_t start_address,
733                                     uint32_t end_address,
734                                     const char* name,
735                                     const char* descriptor,
736                                     const char* signature);
737
738  static bool LineNumForPcCb(void* context, uint32_t address, uint32_t line_num);
739
740  // Debug info opcodes and constants
741  enum {
742    DBG_END_SEQUENCE         = 0x00,
743    DBG_ADVANCE_PC           = 0x01,
744    DBG_ADVANCE_LINE         = 0x02,
745    DBG_START_LOCAL          = 0x03,
746    DBG_START_LOCAL_EXTENDED = 0x04,
747    DBG_END_LOCAL            = 0x05,
748    DBG_RESTART_LOCAL        = 0x06,
749    DBG_SET_PROLOGUE_END     = 0x07,
750    DBG_SET_EPILOGUE_BEGIN   = 0x08,
751    DBG_SET_FILE             = 0x09,
752    DBG_FIRST_SPECIAL        = 0x0a,
753    DBG_LINE_BASE            = -4,
754    DBG_LINE_RANGE           = 15,
755  };
756
757  struct LocalInfo {
758    LocalInfo()
759        : name_(NULL), descriptor_(NULL), signature_(NULL), start_address_(0), is_live_(false) {}
760
761    const char* name_;  // E.g., list
762    const char* descriptor_;  // E.g., Ljava/util/LinkedList;
763    const char* signature_;  // E.g., java.util.LinkedList<java.lang.Integer>
764    uint16_t start_address_;  // PC location where the local is first defined.
765    bool is_live_;  // Is the local defined and live.
766
767   private:
768    DISALLOW_COPY_AND_ASSIGN(LocalInfo);
769  };
770
771  struct LineNumFromPcContext {
772    LineNumFromPcContext(uint32_t address, uint32_t line_num)
773        : address_(address), line_num_(line_num) {}
774    uint32_t address_;
775    uint32_t line_num_;
776   private:
777    DISALLOW_COPY_AND_ASSIGN(LineNumFromPcContext);
778  };
779
780  void InvokeLocalCbIfLive(void* context, int reg, uint32_t end_address,
781                           LocalInfo* local_in_reg, DexDebugNewLocalCb local_cb) const {
782    if (local_cb != NULL && local_in_reg[reg].is_live_) {
783      local_cb(context, reg, local_in_reg[reg].start_address_, end_address,
784          local_in_reg[reg].name_, local_in_reg[reg].descriptor_,
785          local_in_reg[reg].signature_ != NULL ? local_in_reg[reg].signature_ : "");
786    }
787  }
788
789  // Determine the source file line number based on the program counter.
790  // "pc" is an offset, in 16-bit units, from the start of the method's code.
791  //
792  // Returns -1 if no match was found (possibly because the source files were
793  // compiled without "-g", so no line number information is present).
794  // Returns -2 for native methods (as expected in exception traces).
795  //
796  // This is used by runtime; therefore use art::Method not art::DexFile::Method.
797  int32_t GetLineNumFromPC(const mirror::ArtMethod* method, uint32_t rel_pc) const
798      SHARED_LOCKS_REQUIRED(Locks::mutator_lock_);
799
800  void DecodeDebugInfo(const CodeItem* code_item, bool is_static, uint32_t method_idx,
801                       DexDebugNewPositionCb position_cb, DexDebugNewLocalCb local_cb,
802                       void* context) const;
803
804  const char* GetSourceFile(const ClassDef& class_def) const {
805    if (class_def.source_file_idx_ == 0xffffffff) {
806      return NULL;
807    } else {
808      return StringDataByIdx(class_def.source_file_idx_);
809    }
810  }
811
812  int GetPermissions() const;
813
814  bool IsReadOnly() const;
815
816  bool EnableWrite() const;
817
818  bool DisableWrite() const;
819
820  const byte* Begin() const {
821    return begin_;
822  }
823
824  size_t Size() const {
825    return size_;
826  }
827
828 private:
829  // Opens a .dex file
830  static const DexFile* OpenFile(int fd, const char* location, bool verify, std::string* error_msg);
831
832  // Opens a dex file from within a .jar, .zip, or .apk file
833  static const DexFile* OpenZip(int fd, const std::string& location, std::string* error_msg);
834
835  // Opens a .dex file at the given address backed by a MemMap
836  static const DexFile* OpenMemory(const std::string& location,
837                                   uint32_t location_checksum,
838                                   MemMap* mem_map,
839                                   std::string* error_msg);
840
841  // Opens a .dex file at the given address, optionally backed by a MemMap
842  static const DexFile* OpenMemory(const byte* dex_file,
843                                   size_t size,
844                                   const std::string& location,
845                                   uint32_t location_checksum,
846                                   MemMap* mem_map,
847                                   std::string* error_msg);
848
849  DexFile(const byte* base, size_t size,
850          const std::string& location,
851          uint32_t location_checksum,
852          MemMap* mem_map)
853      : begin_(base),
854        size_(size),
855        location_(location),
856        location_checksum_(location_checksum),
857        mem_map_(mem_map),
858        modification_lock("DEX modification lock"),
859        header_(0),
860        string_ids_(0),
861        type_ids_(0),
862        field_ids_(0),
863        method_ids_(0),
864        proto_ids_(0),
865        class_defs_(0) {
866    CHECK(begin_ != NULL) << GetLocation();
867    CHECK_GT(size_, 0U) << GetLocation();
868  }
869
  // Top-level initializer that calls other Init methods.
  // NOTE(review): presumably returns false with a description in |error_msg| on failure —
  // confirm in the .cc.
  bool Init(std::string* error_msg);

  // Caches pointers into the various file sections.
  void InitMembers();

  // Returns true if the header magic and version numbers are of the expected values.
  // NOTE(review): the expected values are presumably kDexMagic / kDexMagicVersion — confirm.
  bool CheckMagicAndVersion(std::string* error_msg) const;

  // NOTE(review): looks like the worker behind a public debug-info decoding entry point;
  // |position_cb| and |local_cb| are presumably invoked with |context| while |stream| is
  // decoded — confirm in the .cc.
  void DecodeDebugInfo0(const CodeItem* code_item, bool is_static, uint32_t method_idx,
      DexDebugNewPositionCb position_cb, DexDebugNewLocalCb local_cb,
      void* context, const byte* stream, LocalInfo* local_in_reg) const;
882
  // The base address of the memory mapping.
  const byte* const begin_;

  // The size of the underlying memory allocation in bytes.
  const size_t size_;

  // Typically the dex file name when available, alternatively some identifying string.
  //
  // The ClassLinker will use this to match DexFiles in the boot class
  // path to DexCache::GetLocation when loading from an image.
  const std::string location_;

  // Checksum supplied to the constructor together with location_.
  const uint32_t location_checksum_;

  // Manages the underlying memory allocation.
  UniquePtr<MemMap> mem_map_;

  // The DEX-to-DEX compiler uses this lock to ensure thread safety when
  // enabling write access to a read-only DEX file.
  // TODO: move to Locks::dex_file_modification_lock.
  Mutex modification_lock;

  // The section pointers below are null after construction.
  // NOTE(review): presumably filled in by InitMembers() — confirm in the .cc.

  // Points to the header section.
  const Header* header_;

  // Points to the base of the string identifier list.
  const StringId* string_ids_;

  // Points to the base of the type identifier list.
  const TypeId* type_ids_;

  // Points to the base of the field identifier list.
  const FieldId* field_ids_;

  // Points to the base of the method identifier list.
  const MethodId* method_ids_;

  // Points to the base of the prototype identifier list.
  const ProtoId* proto_ids_;

  // Points to the base of the class definition list.
  const ClassDef* class_defs_;
925};
926
// Iterate over a dex file's ProtoId's parameters
928class DexFileParameterIterator {
929 public:
930  DexFileParameterIterator(const DexFile& dex_file, const DexFile::ProtoId& proto_id)
931      : dex_file_(dex_file), size_(0), pos_(0) {
932    type_list_ = dex_file_.GetProtoParameters(proto_id);
933    if (type_list_ != NULL) {
934      size_ = type_list_->Size();
935    }
936  }
937  bool HasNext() const { return pos_ < size_; }
938  void Next() { ++pos_; }
939  uint16_t GetTypeIdx() {
940    return type_list_->GetTypeItem(pos_).type_idx_;
941  }
942  const char* GetDescriptor() {
943    return dex_file_.StringByTypeIdx(GetTypeIdx());
944  }
945 private:
946  const DexFile& dex_file_;
947  const DexFile::TypeList* type_list_;
948  uint32_t size_;
949  uint32_t pos_;
950  DISALLOW_IMPLICIT_CONSTRUCTORS(DexFileParameterIterator);
951};
952
953// Abstract the signature of a method.
954class Signature {
955 public:
956  std::string ToString() const;
957
958  static Signature NoSignature() {
959    return Signature();
960  }
961
962  bool operator==(const Signature& rhs) const;
963  bool operator!=(const Signature& rhs) const {
964    return !(*this == rhs);
965  }
966
967  bool operator==(const StringPiece& rhs) const {
968    // TODO: Avoid temporary string allocation.
969    return ToString() == rhs;
970  }
971
972 private:
973  Signature(const DexFile* dex, const DexFile::ProtoId& proto) : dex_file_(dex), proto_id_(&proto) {
974  }
975
976  Signature() : dex_file_(nullptr), proto_id_(nullptr) {
977  }
978
979  friend class DexFile;
980
981  const DexFile* const dex_file_;
982  const DexFile::ProtoId* const proto_id_;
983};
// Stream insertion for Signature.
// NOTE(review): presumably writes sig.ToString() — confirm in the .cc.
std::ostream& operator<<(std::ostream& os, const Signature& sig);
985
986// Iterate and decode class_data_item
987class ClassDataItemIterator {
988 public:
989  ClassDataItemIterator(const DexFile& dex_file, const byte* raw_class_data_item)
990      : dex_file_(dex_file), pos_(0), ptr_pos_(raw_class_data_item), last_idx_(0) {
991    ReadClassDataHeader();
992    if (EndOfInstanceFieldsPos() > 0) {
993      ReadClassDataField();
994    } else if (EndOfVirtualMethodsPos() > 0) {
995      ReadClassDataMethod();
996    }
997  }
998  uint32_t NumStaticFields() const {
999    return header_.static_fields_size_;
1000  }
1001  uint32_t NumInstanceFields() const {
1002    return header_.instance_fields_size_;
1003  }
1004  uint32_t NumDirectMethods() const {
1005    return header_.direct_methods_size_;
1006  }
1007  uint32_t NumVirtualMethods() const {
1008    return header_.virtual_methods_size_;
1009  }
1010  bool HasNextStaticField() const {
1011    return pos_ < EndOfStaticFieldsPos();
1012  }
1013  bool HasNextInstanceField() const {
1014    return pos_ >= EndOfStaticFieldsPos() && pos_ < EndOfInstanceFieldsPos();
1015  }
1016  bool HasNextDirectMethod() const {
1017    return pos_ >= EndOfInstanceFieldsPos() && pos_ < EndOfDirectMethodsPos();
1018  }
1019  bool HasNextVirtualMethod() const {
1020    return pos_ >= EndOfDirectMethodsPos() && pos_ < EndOfVirtualMethodsPos();
1021  }
1022  bool HasNext() const {
1023    return pos_ < EndOfVirtualMethodsPos();
1024  }
1025  inline void Next() {
1026    pos_++;
1027    if (pos_ < EndOfStaticFieldsPos()) {
1028      last_idx_ = GetMemberIndex();
1029      ReadClassDataField();
1030    } else if (pos_ == EndOfStaticFieldsPos() && NumInstanceFields() > 0) {
1031      last_idx_ = 0;  // transition to next array, reset last index
1032      ReadClassDataField();
1033    } else if (pos_ < EndOfInstanceFieldsPos()) {
1034      last_idx_ = GetMemberIndex();
1035      ReadClassDataField();
1036    } else if (pos_ == EndOfInstanceFieldsPos() && NumDirectMethods() > 0) {
1037      last_idx_ = 0;  // transition to next array, reset last index
1038      ReadClassDataMethod();
1039    } else if (pos_ < EndOfDirectMethodsPos()) {
1040      last_idx_ = GetMemberIndex();
1041      ReadClassDataMethod();
1042    } else if (pos_ == EndOfDirectMethodsPos() && NumVirtualMethods() > 0) {
1043      last_idx_ = 0;  // transition to next array, reset last index
1044      ReadClassDataMethod();
1045    } else if (pos_ < EndOfVirtualMethodsPos()) {
1046      last_idx_ = GetMemberIndex();
1047      ReadClassDataMethod();
1048    } else {
1049      DCHECK(!HasNext());
1050    }
1051  }
1052  uint32_t GetMemberIndex() const {
1053    if (pos_ < EndOfInstanceFieldsPos()) {
1054      return last_idx_ + field_.field_idx_delta_;
1055    } else {
1056      DCHECK_LT(pos_, EndOfVirtualMethodsPos());
1057      return last_idx_ + method_.method_idx_delta_;
1058    }
1059  }
1060  uint32_t GetMemberAccessFlags() const {
1061    if (pos_ < EndOfInstanceFieldsPos()) {
1062      return field_.access_flags_;
1063    } else {
1064      DCHECK_LT(pos_, EndOfVirtualMethodsPos());
1065      return method_.access_flags_;
1066    }
1067  }
1068  InvokeType GetMethodInvokeType(const DexFile::ClassDef& class_def) const {
1069    if (HasNextDirectMethod()) {
1070      if ((GetMemberAccessFlags() & kAccStatic) != 0) {
1071        return kStatic;
1072      } else {
1073        return kDirect;
1074      }
1075    } else {
1076      DCHECK_EQ(GetMemberAccessFlags() & kAccStatic, 0U);
1077      if ((class_def.access_flags_ & kAccInterface) != 0) {
1078        return kInterface;
1079      } else if ((GetMemberAccessFlags() & kAccConstructor) != 0) {
1080        return kSuper;
1081      } else {
1082        return kVirtual;
1083      }
1084    }
1085  }
1086  const DexFile::CodeItem* GetMethodCodeItem() const {
1087    return dex_file_.GetCodeItem(method_.code_off_);
1088  }
1089  uint32_t GetMethodCodeItemOffset() const {
1090    return method_.code_off_;
1091  }
1092  const byte* EndDataPointer() const {
1093    CHECK(!HasNext());
1094    return ptr_pos_;
1095  }
1096
1097 private:
1098  // A dex file's class_data_item is leb128 encoded, this structure holds a decoded form of the
1099  // header for a class_data_item
1100  struct ClassDataHeader {
1101    uint32_t static_fields_size_;  // the number of static fields
1102    uint32_t instance_fields_size_;  // the number of instance fields
1103    uint32_t direct_methods_size_;  // the number of direct methods
1104    uint32_t virtual_methods_size_;  // the number of virtual methods
1105  } header_;
1106
1107  // Read and decode header from a class_data_item stream into header
1108  void ReadClassDataHeader();
1109
1110  uint32_t EndOfStaticFieldsPos() const {
1111    return header_.static_fields_size_;
1112  }
1113  uint32_t EndOfInstanceFieldsPos() const {
1114    return EndOfStaticFieldsPos() + header_.instance_fields_size_;
1115  }
1116  uint32_t EndOfDirectMethodsPos() const {
1117    return EndOfInstanceFieldsPos() + header_.direct_methods_size_;
1118  }
1119  uint32_t EndOfVirtualMethodsPos() const {
1120    return EndOfDirectMethodsPos() + header_.virtual_methods_size_;
1121  }
1122
1123  // A decoded version of the field of a class_data_item
1124  struct ClassDataField {
1125    uint32_t field_idx_delta_;  // delta of index into the field_ids array for FieldId
1126    uint32_t access_flags_;  // access flags for the field
1127    ClassDataField() :  field_idx_delta_(0), access_flags_(0) {}
1128
1129   private:
1130    DISALLOW_COPY_AND_ASSIGN(ClassDataField);
1131  };
1132  ClassDataField field_;
1133
1134  // Read and decode a field from a class_data_item stream into field
1135  void ReadClassDataField();
1136
1137  // A decoded version of the method of a class_data_item
1138  struct ClassDataMethod {
1139    uint32_t method_idx_delta_;  // delta of index into the method_ids array for MethodId
1140    uint32_t access_flags_;
1141    uint32_t code_off_;
1142    ClassDataMethod() : method_idx_delta_(0), access_flags_(0), code_off_(0) {}
1143
1144   private:
1145    DISALLOW_COPY_AND_ASSIGN(ClassDataMethod);
1146  };
1147  ClassDataMethod method_;
1148
1149  // Read and decode a method from a class_data_item stream into method
1150  void ReadClassDataMethod();
1151
1152  const DexFile& dex_file_;
1153  size_t pos_;  // integral number of items passed
1154  const byte* ptr_pos_;  // pointer into stream of class_data_item
1155  uint32_t last_idx_;  // last read field or method index to apply delta to
1156  DISALLOW_IMPLICIT_CONSTRUCTORS(ClassDataItemIterator);
1157};
1158
1159class EncodedStaticFieldValueIterator {
1160 public:
1161  EncodedStaticFieldValueIterator(const DexFile& dex_file, SirtRef<mirror::DexCache>* dex_cache,
1162                                  SirtRef<mirror::ClassLoader>* class_loader,
1163                                  ClassLinker* linker, const DexFile::ClassDef& class_def)
1164      SHARED_LOCKS_REQUIRED(Locks::mutator_lock_);
1165
1166  void ReadValueToField(mirror::ArtField* field) const SHARED_LOCKS_REQUIRED(Locks::mutator_lock_);
1167
1168  bool HasNext() { return pos_ < array_size_; }
1169
1170  void Next();
1171
1172  enum ValueType {
1173    kByte = 0x00,
1174    kShort = 0x02,
1175    kChar = 0x03,
1176    kInt = 0x04,
1177    kLong = 0x06,
1178    kFloat = 0x10,
1179    kDouble = 0x11,
1180    kString = 0x17,
1181    kType = 0x18,
1182    kField = 0x19,
1183    kMethod = 0x1a,
1184    kEnum = 0x1b,
1185    kArray = 0x1c,
1186    kAnnotation = 0x1d,
1187    kNull = 0x1e,
1188    kBoolean = 0x1f
1189  };
1190
1191 private:
1192  static const byte kEncodedValueTypeMask = 0x1f;  // 0b11111
1193  static const byte kEncodedValueArgShift = 5;
1194
1195  const DexFile& dex_file_;
1196  SirtRef<mirror::DexCache>* const dex_cache_;  // Dex cache to resolve literal objects.
1197  SirtRef<mirror::ClassLoader>* const class_loader_;  // ClassLoader to resolve types.
1198  ClassLinker* linker_;  // Linker to resolve literal objects.
1199  size_t array_size_;  // Size of array.
1200  size_t pos_;  // Current position.
1201  const byte* ptr_;  // Pointer into encoded data array.
1202  ValueType type_;  // Type of current encoded value.
1203  jvalue jval_;  // Value of current encoded value.
1204  DISALLOW_IMPLICIT_CONSTRUCTORS(EncodedStaticFieldValueIterator);
1205};
// Stream insertion for EncodedStaticFieldValueIterator::ValueType.
// NOTE(review): the exact text written for each enumerator is defined in the .cc — confirm.
std::ostream& operator<<(std::ostream& os, const EncodedStaticFieldValueIterator::ValueType& code);
1207
1208class CatchHandlerIterator {
1209  public:
1210    CatchHandlerIterator(const DexFile::CodeItem& code_item, uint32_t address);
1211
1212    CatchHandlerIterator(const DexFile::CodeItem& code_item,
1213                         const DexFile::TryItem& try_item);
1214
1215    explicit CatchHandlerIterator(const byte* handler_data) {
1216      Init(handler_data);
1217    }
1218
1219    uint16_t GetHandlerTypeIndex() const {
1220      return handler_.type_idx_;
1221    }
1222    uint32_t GetHandlerAddress() const {
1223      return handler_.address_;
1224    }
1225    void Next();
1226    bool HasNext() const {
1227      return remaining_count_ != -1 || catch_all_;
1228    }
1229    // End of this set of catch blocks, convenience method to locate next set of catch blocks
1230    const byte* EndDataPointer() const {
1231      CHECK(!HasNext());
1232      return current_data_;
1233    }
1234
1235  private:
1236    void Init(const DexFile::CodeItem& code_item, int32_t offset);
1237    void Init(const byte* handler_data);
1238
1239    struct CatchHandlerItem {
1240      uint16_t type_idx_;  // type index of the caught exception type
1241      uint32_t address_;  // handler address
1242    } handler_;
1243    const byte *current_data_;  // the current handler in dex file.
1244    int32_t remaining_count_;   // number of handlers not read.
1245    bool catch_all_;            // is there a handler that will catch all exceptions in case
1246                                // that all typed handler does not match.
1247};
1248
1249}  // namespace art
1250
1251#endif  // ART_RUNTIME_DEX_FILE_H_
1252