dexlayout.cc revision 3ab96b460684781af58b3f9c5b9fb0e370de6b50
1/* 2 * Copyright (C) 2016 The Android Open Source Project 3 * 4 * Licensed under the Apache License, Version 2.0 (the "License"); 5 * you may not use this file except in compliance with the License. 6 * You may obtain a copy of the License at 7 * 8 * http://www.apache.org/licenses/LICENSE-2.0 9 * 10 * Unless required by applicable law or agreed to in writing, software 11 * distributed under the License is distributed on an "AS IS" BASIS, 12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 13 * See the License for the specific language governing permissions and 14 * limitations under the License. 15 * 16 * Implementation file of the dexlayout utility. 17 * 18 * This is a tool to read dex files into an internal representation, 19 * reorganize the representation, and emit dex files with a better 20 * file layout. 21 */ 22 23#include "dexlayout.h" 24 25#include <inttypes.h> 26#include <stdio.h> 27 28#include <iostream> 29#include <memory> 30#include <sstream> 31#include <vector> 32 33#include "base/unix_file/fd_file.h" 34#include "dex_ir_builder.h" 35#include "dex_file-inl.h" 36#include "dex_instruction-inl.h" 37#include "os.h" 38#include "utils.h" 39 40namespace art { 41 42/* 43 * Options parsed in main driver. 44 */ 45struct Options options_; 46 47/* 48 * Output file. Defaults to stdout. 49 */ 50FILE* out_file_ = stdout; 51 52/* 53 * Flags for use with createAccessFlagStr(). 54 */ 55enum AccessFor { 56 kAccessForClass = 0, kAccessForMethod = 1, kAccessForField = 2, kAccessForMAX 57}; 58const int kNumFlags = 18; 59 60/* 61 * Gets 2 little-endian bytes. 62 */ 63static inline uint16_t Get2LE(unsigned char const* src) { 64 return src[0] | (src[1] << 8); 65} 66 67/* 68 * Converts a type descriptor to human-readable "dotted" form. For 69 * example, "Ljava/lang/String;" becomes "java.lang.String", and 70 * "[I" becomes "int[]". Also converts '$' to '.', which means this 71 * form can't be converted back to a descriptor. 72 */ 73static std::string DescriptorToDotWrapper(const char* descriptor) { 74 std::string result = DescriptorToDot(descriptor); 75 size_t found = result.find('$'); 76 while (found != std::string::npos) { 77 result[found] = '.'; 78 found = result.find('$', found); 79 } 80 return result; 81} 82 83/* 84 * Converts the class name portion of a type descriptor to human-readable 85 * "dotted" form. For example, "Ljava/lang/String;" becomes "String". 86 */ 87static std::string DescriptorClassToDot(const char* str) { 88 std::string descriptor(str); 89 // Reduce to just the class name prefix. 90 size_t last_slash = descriptor.rfind('/'); 91 if (last_slash == std::string::npos) { 92 last_slash = 0; 93 } 94 // Start past the '/' or 'L'. 95 last_slash++; 96 97 // Copy class name over, trimming trailing ';'. 98 size_t size = descriptor.size() - 1 - last_slash; 99 std::string result(descriptor.substr(last_slash, size)); 100 101 // Replace '$' with '.'. 102 size_t dollar_sign = result.find('$'); 103 while (dollar_sign != std::string::npos) { 104 result[dollar_sign] = '.'; 105 dollar_sign = result.find('$', dollar_sign); 106 } 107 108 return result; 109} 110 111/* 112 * Returns string representing the boolean value. 113 */ 114static const char* StrBool(bool val) { 115 return val ? "true" : "false"; 116} 117 118/* 119 * Returns a quoted string representing the boolean value. 120 */ 121static const char* QuotedBool(bool val) { 122 return val ? "\"true\"" : "\"false\""; 123} 124 125/* 126 * Returns a quoted string representing the access flags. 127 */ 128static const char* QuotedVisibility(uint32_t access_flags) { 129 if (access_flags & kAccPublic) { 130 return "\"public\""; 131 } else if (access_flags & kAccProtected) { 132 return "\"protected\""; 133 } else if (access_flags & kAccPrivate) { 134 return "\"private\""; 135 } else { 136 return "\"package\""; 137 } 138} 139 140/* 141 * Counts the number of '1' bits in a word. 142 */ 143static int CountOnes(uint32_t val) { 144 val = val - ((val >> 1) & 0x55555555); 145 val = (val & 0x33333333) + ((val >> 2) & 0x33333333); 146 return (((val + (val >> 4)) & 0x0F0F0F0F) * 0x01010101) >> 24; 147} 148 149/* 150 * Creates a new string with human-readable access flags. 151 * 152 * In the base language the access_flags fields are type uint16_t; in Dalvik they're uint32_t. 153 */ 154static char* CreateAccessFlagStr(uint32_t flags, AccessFor for_what) { 155 static const char* kAccessStrings[kAccessForMAX][kNumFlags] = { 156 { 157 "PUBLIC", /* 0x00001 */ 158 "PRIVATE", /* 0x00002 */ 159 "PROTECTED", /* 0x00004 */ 160 "STATIC", /* 0x00008 */ 161 "FINAL", /* 0x00010 */ 162 "?", /* 0x00020 */ 163 "?", /* 0x00040 */ 164 "?", /* 0x00080 */ 165 "?", /* 0x00100 */ 166 "INTERFACE", /* 0x00200 */ 167 "ABSTRACT", /* 0x00400 */ 168 "?", /* 0x00800 */ 169 "SYNTHETIC", /* 0x01000 */ 170 "ANNOTATION", /* 0x02000 */ 171 "ENUM", /* 0x04000 */ 172 "?", /* 0x08000 */ 173 "VERIFIED", /* 0x10000 */ 174 "OPTIMIZED", /* 0x20000 */ 175 }, { 176 "PUBLIC", /* 0x00001 */ 177 "PRIVATE", /* 0x00002 */ 178 "PROTECTED", /* 0x00004 */ 179 "STATIC", /* 0x00008 */ 180 "FINAL", /* 0x00010 */ 181 "SYNCHRONIZED", /* 0x00020 */ 182 "BRIDGE", /* 0x00040 */ 183 "VARARGS", /* 0x00080 */ 184 "NATIVE", /* 0x00100 */ 185 "?", /* 0x00200 */ 186 "ABSTRACT", /* 0x00400 */ 187 "STRICT", /* 0x00800 */ 188 "SYNTHETIC", /* 0x01000 */ 189 "?", /* 0x02000 */ 190 "?", /* 0x04000 */ 191 "MIRANDA", /* 0x08000 */ 192 "CONSTRUCTOR", /* 0x10000 */ 193 "DECLARED_SYNCHRONIZED", /* 0x20000 */ 194 }, { 195 "PUBLIC", /* 0x00001 */ 196 "PRIVATE", /* 0x00002 */ 197 "PROTECTED", /* 0x00004 */ 198 "STATIC", /* 0x00008 */ 199 "FINAL", /* 0x00010 */ 200 "?", /* 0x00020 */ 201 "VOLATILE", /* 0x00040 */ 202 "TRANSIENT", /* 0x00080 */ 203 "?", /* 0x00100 */ 204 "?", /* 0x00200 */ 205 "?", /* 0x00400 */ 206 "?", /* 0x00800 */ 207 "SYNTHETIC", /* 0x01000 */ 208 "?", /* 0x02000 */ 209 "ENUM", /* 0x04000 */ 210 "?", /* 0x08000 */ 211 "?", /* 0x10000 */ 212 "?", /* 0x20000 */ 213 }, 214 }; 215 216 // Allocate enough storage to hold the expected number of strings, 217 // plus a space between each. We over-allocate, using the longest 218 // string above as the base metric. 219 const int kLongest = 21; // The strlen of longest string above. 220 const int count = CountOnes(flags); 221 char* str; 222 char* cp; 223 cp = str = reinterpret_cast<char*>(malloc(count * (kLongest + 1) + 1)); 224 225 for (int i = 0; i < kNumFlags; i++) { 226 if (flags & 0x01) { 227 const char* accessStr = kAccessStrings[for_what][i]; 228 const int len = strlen(accessStr); 229 if (cp != str) { 230 *cp++ = ' '; 231 } 232 memcpy(cp, accessStr, len); 233 cp += len; 234 } 235 flags >>= 1; 236 } // for 237 238 *cp = '\0'; 239 return str; 240} 241 242static std::string GetSignatureForProtoId(const dex_ir::ProtoId* proto) { 243 if (proto == nullptr) { 244 return "<no signature>"; 245 } 246 247 const std::vector<const dex_ir::TypeId*>& params = proto->Parameters(); 248 std::string result("("); 249 for (uint32_t i = 0; i < params.size(); ++i) { 250 result += params[i]->GetStringId()->Data(); 251 } 252 result += ")"; 253 result += proto->ReturnType()->GetStringId()->Data(); 254 return result; 255} 256 257/* 258 * Copies character data from "data" to "out", converting non-ASCII values 259 * to fprintf format chars or an ASCII filler ('.' or '?'). 260 * 261 * The output buffer must be able to hold (2*len)+1 bytes. The result is 262 * NULL-terminated. 263 */ 264static void Asciify(char* out, const unsigned char* data, size_t len) { 265 while (len--) { 266 if (*data < 0x20) { 267 // Could do more here, but we don't need them yet. 268 switch (*data) { 269 case '\0': 270 *out++ = '\\'; 271 *out++ = '0'; 272 break; 273 case '\n': 274 *out++ = '\\'; 275 *out++ = 'n'; 276 break; 277 default: 278 *out++ = '.'; 279 break; 280 } // switch 281 } else if (*data >= 0x80) { 282 *out++ = '?'; 283 } else { 284 *out++ = *data; 285 } 286 data++; 287 } // while 288 *out = '\0'; 289} 290 291/* 292 * Dumps a string value with some escape characters. 293 */ 294static void DumpEscapedString(const char* p) { 295 fputs("\"", out_file_); 296 for (; *p; p++) { 297 switch (*p) { 298 case '\\': 299 fputs("\\\\", out_file_); 300 break; 301 case '\"': 302 fputs("\\\"", out_file_); 303 break; 304 case '\t': 305 fputs("\\t", out_file_); 306 break; 307 case '\n': 308 fputs("\\n", out_file_); 309 break; 310 case '\r': 311 fputs("\\r", out_file_); 312 break; 313 default: 314 putc(*p, out_file_); 315 } // switch 316 } // for 317 fputs("\"", out_file_); 318} 319 320/* 321 * Dumps a string as an XML attribute value. 322 */ 323static void DumpXmlAttribute(const char* p) { 324 for (; *p; p++) { 325 switch (*p) { 326 case '&': 327 fputs("&", out_file_); 328 break; 329 case '<': 330 fputs("<", out_file_); 331 break; 332 case '>': 333 fputs(">", out_file_); 334 break; 335 case '"': 336 fputs(""", out_file_); 337 break; 338 case '\t': 339 fputs("	", out_file_); 340 break; 341 case '\n': 342 fputs("
", out_file_); 343 break; 344 case '\r': 345 fputs("
", out_file_); 346 break; 347 default: 348 putc(*p, out_file_); 349 } // switch 350 } // for 351} 352 353// Forward declare to resolve circular dependence. 354static void DumpEncodedValue(const dex_ir::EncodedValue* data); 355 356/* 357 * Dumps encoded annotation. 358 */ 359static void DumpEncodedAnnotation(dex_ir::EncodedAnnotation* annotation) { 360 fputs(annotation->GetType()->GetStringId()->Data(), out_file_); 361 // Display all name=value pairs. 362 for (auto& subannotation : *annotation->GetAnnotationElements()) { 363 fputc(' ', out_file_); 364 fputs(subannotation->GetName()->Data(), out_file_); 365 fputc('=', out_file_); 366 DumpEncodedValue(subannotation->GetValue()); 367 } 368} 369/* 370 * Dumps encoded value. 371 */ 372static void DumpEncodedValue(const dex_ir::EncodedValue* data) { 373 switch (data->Type()) { 374 case DexFile::kDexAnnotationByte: 375 fprintf(out_file_, "%" PRId8, data->GetByte()); 376 break; 377 case DexFile::kDexAnnotationShort: 378 fprintf(out_file_, "%" PRId16, data->GetShort()); 379 break; 380 case DexFile::kDexAnnotationChar: 381 fprintf(out_file_, "%" PRIu16, data->GetChar()); 382 break; 383 case DexFile::kDexAnnotationInt: 384 fprintf(out_file_, "%" PRId32, data->GetInt()); 385 break; 386 case DexFile::kDexAnnotationLong: 387 fprintf(out_file_, "%" PRId64, data->GetLong()); 388 break; 389 case DexFile::kDexAnnotationFloat: { 390 fprintf(out_file_, "%g", data->GetFloat()); 391 break; 392 } 393 case DexFile::kDexAnnotationDouble: { 394 fprintf(out_file_, "%g", data->GetDouble()); 395 break; 396 } 397 case DexFile::kDexAnnotationString: { 398 dex_ir::StringId* string_id = data->GetStringId(); 399 if (options_.output_format_ == kOutputPlain) { 400 DumpEscapedString(string_id->Data()); 401 } else { 402 DumpXmlAttribute(string_id->Data()); 403 } 404 break; 405 } 406 case DexFile::kDexAnnotationType: { 407 dex_ir::TypeId* type_id = data->GetTypeId(); 408 fputs(type_id->GetStringId()->Data(), out_file_); 409 break; 410 } 411 case DexFile::kDexAnnotationField: 412 case DexFile::kDexAnnotationEnum: { 413 dex_ir::FieldId* field_id = data->GetFieldId(); 414 fputs(field_id->Name()->Data(), out_file_); 415 break; 416 } 417 case DexFile::kDexAnnotationMethod: { 418 dex_ir::MethodId* method_id = data->GetMethodId(); 419 fputs(method_id->Name()->Data(), out_file_); 420 break; 421 } 422 case DexFile::kDexAnnotationArray: { 423 fputc('{', out_file_); 424 // Display all elements. 425 for (auto& value : *data->GetEncodedArray()->GetEncodedValues()) { 426 fputc(' ', out_file_); 427 DumpEncodedValue(value.get()); 428 } 429 fputs(" }", out_file_); 430 break; 431 } 432 case DexFile::kDexAnnotationAnnotation: { 433 DumpEncodedAnnotation(data->GetEncodedAnnotation()); 434 break; 435 } 436 case DexFile::kDexAnnotationNull: 437 fputs("null", out_file_); 438 break; 439 case DexFile::kDexAnnotationBoolean: 440 fputs(StrBool(data->GetBoolean()), out_file_); 441 break; 442 default: 443 fputs("????", out_file_); 444 break; 445 } // switch 446} 447 448/* 449 * Dumps the file header. 450 */ 451static void DumpFileHeader(dex_ir::Header* header) { 452 char sanitized[8 * 2 + 1]; 453 dex_ir::Collections& collections = header->GetCollections(); 454 fprintf(out_file_, "DEX file header:\n"); 455 Asciify(sanitized, header->Magic(), 8); 456 fprintf(out_file_, "magic : '%s'\n", sanitized); 457 fprintf(out_file_, "checksum : %08x\n", header->Checksum()); 458 fprintf(out_file_, "signature : %02x%02x...%02x%02x\n", 459 header->Signature()[0], header->Signature()[1], 460 header->Signature()[DexFile::kSha1DigestSize - 2], 461 header->Signature()[DexFile::kSha1DigestSize - 1]); 462 fprintf(out_file_, "file_size : %d\n", header->FileSize()); 463 fprintf(out_file_, "header_size : %d\n", header->HeaderSize()); 464 fprintf(out_file_, "link_size : %d\n", header->LinkSize()); 465 fprintf(out_file_, "link_off : %d (0x%06x)\n", 466 header->LinkOffset(), header->LinkOffset()); 467 fprintf(out_file_, "string_ids_size : %d\n", collections.StringIdsSize()); 468 fprintf(out_file_, "string_ids_off : %d (0x%06x)\n", 469 collections.StringIdsOffset(), collections.StringIdsOffset()); 470 fprintf(out_file_, "type_ids_size : %d\n", collections.TypeIdsSize()); 471 fprintf(out_file_, "type_ids_off : %d (0x%06x)\n", 472 collections.TypeIdsOffset(), collections.TypeIdsOffset()); 473 fprintf(out_file_, "proto_ids_size : %d\n", collections.ProtoIdsSize()); 474 fprintf(out_file_, "proto_ids_off : %d (0x%06x)\n", 475 collections.ProtoIdsOffset(), collections.ProtoIdsOffset()); 476 fprintf(out_file_, "field_ids_size : %d\n", collections.FieldIdsSize()); 477 fprintf(out_file_, "field_ids_off : %d (0x%06x)\n", 478 collections.FieldIdsOffset(), collections.FieldIdsOffset()); 479 fprintf(out_file_, "method_ids_size : %d\n", collections.MethodIdsSize()); 480 fprintf(out_file_, "method_ids_off : %d (0x%06x)\n", 481 collections.MethodIdsOffset(), collections.MethodIdsOffset()); 482 fprintf(out_file_, "class_defs_size : %d\n", collections.ClassDefsSize()); 483 fprintf(out_file_, "class_defs_off : %d (0x%06x)\n", 484 collections.ClassDefsOffset(), collections.ClassDefsOffset()); 485 fprintf(out_file_, "data_size : %d\n", header->DataSize()); 486 fprintf(out_file_, "data_off : %d (0x%06x)\n\n", 487 header->DataOffset(), header->DataOffset()); 488} 489 490/* 491 * Dumps a class_def_item. 492 */ 493static void DumpClassDef(dex_ir::Header* header, int idx) { 494 // General class information. 495 dex_ir::ClassDef* class_def = header->GetCollections().GetClassDef(idx); 496 fprintf(out_file_, "Class #%d header:\n", idx); 497 fprintf(out_file_, "class_idx : %d\n", class_def->ClassType()->GetIndex()); 498 fprintf(out_file_, "access_flags : %d (0x%04x)\n", 499 class_def->GetAccessFlags(), class_def->GetAccessFlags()); 500 uint32_t superclass_idx = class_def->Superclass() == nullptr ? 501 DexFile::kDexNoIndex16 : class_def->Superclass()->GetIndex(); 502 fprintf(out_file_, "superclass_idx : %d\n", superclass_idx); 503 fprintf(out_file_, "interfaces_off : %d (0x%06x)\n", 504 class_def->InterfacesOffset(), class_def->InterfacesOffset()); 505 uint32_t source_file_offset = 0xffffffffU; 506 if (class_def->SourceFile() != nullptr) { 507 source_file_offset = class_def->SourceFile()->GetIndex(); 508 } 509 fprintf(out_file_, "source_file_idx : %d\n", source_file_offset); 510 uint32_t annotations_offset = 0; 511 if (class_def->Annotations() != nullptr) { 512 annotations_offset = class_def->Annotations()->GetOffset(); 513 } 514 fprintf(out_file_, "annotations_off : %d (0x%06x)\n", 515 annotations_offset, annotations_offset); 516 if (class_def->GetClassData() == nullptr) { 517 fprintf(out_file_, "class_data_off : %d (0x%06x)\n", 0, 0); 518 } else { 519 fprintf(out_file_, "class_data_off : %d (0x%06x)\n", 520 class_def->GetClassData()->GetOffset(), class_def->GetClassData()->GetOffset()); 521 } 522 523 // Fields and methods. 524 dex_ir::ClassData* class_data = class_def->GetClassData(); 525 if (class_data != nullptr && class_data->StaticFields() != nullptr) { 526 fprintf(out_file_, "static_fields_size : %zu\n", class_data->StaticFields()->size()); 527 } else { 528 fprintf(out_file_, "static_fields_size : 0\n"); 529 } 530 if (class_data != nullptr && class_data->InstanceFields() != nullptr) { 531 fprintf(out_file_, "instance_fields_size: %zu\n", class_data->InstanceFields()->size()); 532 } else { 533 fprintf(out_file_, "instance_fields_size: 0\n"); 534 } 535 if (class_data != nullptr && class_data->DirectMethods() != nullptr) { 536 fprintf(out_file_, "direct_methods_size : %zu\n", class_data->DirectMethods()->size()); 537 } else { 538 fprintf(out_file_, "direct_methods_size : 0\n"); 539 } 540 if (class_data != nullptr && class_data->VirtualMethods() != nullptr) { 541 fprintf(out_file_, "virtual_methods_size: %zu\n", class_data->VirtualMethods()->size()); 542 } else { 543 fprintf(out_file_, "virtual_methods_size: 0\n"); 544 } 545 fprintf(out_file_, "\n"); 546} 547 548/** 549 * Dumps an annotation set item. 550 */ 551static void DumpAnnotationSetItem(dex_ir::AnnotationSetItem* set_item) { 552 if (set_item == nullptr || set_item->GetItems()->size() == 0) { 553 fputs(" empty-annotation-set\n", out_file_); 554 return; 555 } 556 for (dex_ir::AnnotationItem* annotation : *set_item->GetItems()) { 557 if (annotation == nullptr) { 558 continue; 559 } 560 fputs(" ", out_file_); 561 switch (annotation->GetVisibility()) { 562 case DexFile::kDexVisibilityBuild: fputs("VISIBILITY_BUILD ", out_file_); break; 563 case DexFile::kDexVisibilityRuntime: fputs("VISIBILITY_RUNTIME ", out_file_); break; 564 case DexFile::kDexVisibilitySystem: fputs("VISIBILITY_SYSTEM ", out_file_); break; 565 default: fputs("VISIBILITY_UNKNOWN ", out_file_); break; 566 } // switch 567 DumpEncodedAnnotation(annotation->GetAnnotation()); 568 fputc('\n', out_file_); 569 } 570} 571 572/* 573 * Dumps class annotations. 574 */ 575static void DumpClassAnnotations(dex_ir::Header* header, int idx) { 576 dex_ir::ClassDef* class_def = header->GetCollections().GetClassDef(idx); 577 dex_ir::AnnotationsDirectoryItem* annotations_directory = class_def->Annotations(); 578 if (annotations_directory == nullptr) { 579 return; // none 580 } 581 582 fprintf(out_file_, "Class #%d annotations:\n", idx); 583 584 dex_ir::AnnotationSetItem* class_set_item = annotations_directory->GetClassAnnotation(); 585 dex_ir::FieldAnnotationVector* fields = annotations_directory->GetFieldAnnotations(); 586 dex_ir::MethodAnnotationVector* methods = annotations_directory->GetMethodAnnotations(); 587 dex_ir::ParameterAnnotationVector* parameters = annotations_directory->GetParameterAnnotations(); 588 589 // Annotations on the class itself. 590 if (class_set_item != nullptr) { 591 fprintf(out_file_, "Annotations on class\n"); 592 DumpAnnotationSetItem(class_set_item); 593 } 594 595 // Annotations on fields. 596 if (fields != nullptr) { 597 for (auto& field : *fields) { 598 const dex_ir::FieldId* field_id = field->GetFieldId(); 599 const uint32_t field_idx = field_id->GetIndex(); 600 const char* field_name = field_id->Name()->Data(); 601 fprintf(out_file_, "Annotations on field #%u '%s'\n", field_idx, field_name); 602 DumpAnnotationSetItem(field->GetAnnotationSetItem()); 603 } 604 } 605 606 // Annotations on methods. 607 if (methods != nullptr) { 608 for (auto& method : *methods) { 609 const dex_ir::MethodId* method_id = method->GetMethodId(); 610 const uint32_t method_idx = method_id->GetIndex(); 611 const char* method_name = method_id->Name()->Data(); 612 fprintf(out_file_, "Annotations on method #%u '%s'\n", method_idx, method_name); 613 DumpAnnotationSetItem(method->GetAnnotationSetItem()); 614 } 615 } 616 617 // Annotations on method parameters. 618 if (parameters != nullptr) { 619 for (auto& parameter : *parameters) { 620 const dex_ir::MethodId* method_id = parameter->GetMethodId(); 621 const uint32_t method_idx = method_id->GetIndex(); 622 const char* method_name = method_id->Name()->Data(); 623 fprintf(out_file_, "Annotations on method #%u '%s' parameters\n", method_idx, method_name); 624 uint32_t j = 0; 625 for (dex_ir::AnnotationSetItem* annotation : *parameter->GetAnnotations()->GetItems()) { 626 fprintf(out_file_, "#%u\n", j); 627 DumpAnnotationSetItem(annotation); 628 ++j; 629 } 630 } 631 } 632 633 fputc('\n', out_file_); 634} 635 636/* 637 * Dumps an interface that a class declares to implement. 638 */ 639static void DumpInterface(const dex_ir::TypeId* type_item, int i) { 640 const char* interface_name = type_item->GetStringId()->Data(); 641 if (options_.output_format_ == kOutputPlain) { 642 fprintf(out_file_, " #%d : '%s'\n", i, interface_name); 643 } else { 644 std::string dot(DescriptorToDotWrapper(interface_name)); 645 fprintf(out_file_, "<implements name=\"%s\">\n</implements>\n", dot.c_str()); 646 } 647} 648 649/* 650 * Dumps the catches table associated with the code. 651 */ 652static void DumpCatches(const dex_ir::CodeItem* code) { 653 const uint16_t tries_size = code->TriesSize(); 654 655 // No catch table. 656 if (tries_size == 0) { 657 fprintf(out_file_, " catches : (none)\n"); 658 return; 659 } 660 661 // Dump all table entries. 662 fprintf(out_file_, " catches : %d\n", tries_size); 663 std::vector<std::unique_ptr<const dex_ir::TryItem>>* tries = code->Tries(); 664 for (uint32_t i = 0; i < tries_size; i++) { 665 const dex_ir::TryItem* try_item = (*tries)[i].get(); 666 const uint32_t start = try_item->StartAddr(); 667 const uint32_t end = start + try_item->InsnCount(); 668 fprintf(out_file_, " 0x%04x - 0x%04x\n", start, end); 669 for (auto& handler : try_item->GetHandlers()) { 670 const dex_ir::TypeId* type_id = handler->GetTypeId(); 671 const char* descriptor = (type_id == nullptr) ? "<any>" : type_id->GetStringId()->Data(); 672 fprintf(out_file_, " %s -> 0x%04x\n", descriptor, handler->GetAddress()); 673 } // for 674 } // for 675} 676 677/* 678 * Dumps all positions table entries associated with the code. 679 */ 680static void DumpPositionInfo(const dex_ir::CodeItem* code) { 681 dex_ir::DebugInfoItem* debug_info = code->DebugInfo(); 682 if (debug_info == nullptr) { 683 return; 684 } 685 std::vector<std::unique_ptr<dex_ir::PositionInfo>>& positions = debug_info->GetPositionInfo(); 686 for (size_t i = 0; i < positions.size(); ++i) { 687 fprintf(out_file_, " 0x%04x line=%d\n", positions[i]->address_, positions[i]->line_); 688 } 689} 690 691/* 692 * Dumps all locals table entries associated with the code. 693 */ 694static void DumpLocalInfo(const dex_ir::CodeItem* code) { 695 dex_ir::DebugInfoItem* debug_info = code->DebugInfo(); 696 if (debug_info == nullptr) { 697 return; 698 } 699 std::vector<std::unique_ptr<dex_ir::LocalInfo>>& locals = debug_info->GetLocalInfo(); 700 for (size_t i = 0; i < locals.size(); ++i) { 701 dex_ir::LocalInfo* entry = locals[i].get(); 702 fprintf(out_file_, " 0x%04x - 0x%04x reg=%d %s %s %s\n", 703 entry->start_address_, entry->end_address_, entry->reg_, 704 entry->name_.c_str(), entry->descriptor_.c_str(), entry->signature_.c_str()); 705 } 706} 707 708/* 709 * Helper for dumpInstruction(), which builds the string 710 * representation for the index in the given instruction. 711 * Returns a pointer to a buffer of sufficient size. 712 */ 713static std::unique_ptr<char[]> IndexString(dex_ir::Header* header, 714 const Instruction* dec_insn, 715 size_t buf_size) { 716 std::unique_ptr<char[]> buf(new char[buf_size]); 717 // Determine index and width of the string. 718 uint32_t index = 0; 719 uint32_t width = 4; 720 switch (Instruction::FormatOf(dec_insn->Opcode())) { 721 // SOME NOT SUPPORTED: 722 // case Instruction::k20bc: 723 case Instruction::k21c: 724 case Instruction::k35c: 725 // case Instruction::k35ms: 726 case Instruction::k3rc: 727 // case Instruction::k3rms: 728 // case Instruction::k35mi: 729 // case Instruction::k3rmi: 730 index = dec_insn->VRegB(); 731 width = 4; 732 break; 733 case Instruction::k31c: 734 index = dec_insn->VRegB(); 735 width = 8; 736 break; 737 case Instruction::k22c: 738 // case Instruction::k22cs: 739 index = dec_insn->VRegC(); 740 width = 4; 741 break; 742 default: 743 break; 744 } // switch 745 746 // Determine index type. 747 size_t outSize = 0; 748 switch (Instruction::IndexTypeOf(dec_insn->Opcode())) { 749 case Instruction::kIndexUnknown: 750 // This function should never get called for this type, but do 751 // something sensible here, just to help with debugging. 752 outSize = snprintf(buf.get(), buf_size, "<unknown-index>"); 753 break; 754 case Instruction::kIndexNone: 755 // This function should never get called for this type, but do 756 // something sensible here, just to help with debugging. 757 outSize = snprintf(buf.get(), buf_size, "<no-index>"); 758 break; 759 case Instruction::kIndexTypeRef: 760 if (index < header->GetCollections().TypeIdsSize()) { 761 const char* tp = header->GetCollections().GetTypeId(index)->GetStringId()->Data(); 762 outSize = snprintf(buf.get(), buf_size, "%s // type@%0*x", tp, width, index); 763 } else { 764 outSize = snprintf(buf.get(), buf_size, "<type?> // type@%0*x", width, index); 765 } 766 break; 767 case Instruction::kIndexStringRef: 768 if (index < header->GetCollections().StringIdsSize()) { 769 const char* st = header->GetCollections().GetStringId(index)->Data(); 770 outSize = snprintf(buf.get(), buf_size, "\"%s\" // string@%0*x", st, width, index); 771 } else { 772 outSize = snprintf(buf.get(), buf_size, "<string?> // string@%0*x", width, index); 773 } 774 break; 775 case Instruction::kIndexMethodRef: 776 if (index < header->GetCollections().MethodIdsSize()) { 777 dex_ir::MethodId* method_id = header->GetCollections().GetMethodId(index); 778 const char* name = method_id->Name()->Data(); 779 std::string type_descriptor = GetSignatureForProtoId(method_id->Proto()); 780 const char* back_descriptor = method_id->Class()->GetStringId()->Data(); 781 outSize = snprintf(buf.get(), buf_size, "%s.%s:%s // method@%0*x", 782 back_descriptor, name, type_descriptor.c_str(), width, index); 783 } else { 784 outSize = snprintf(buf.get(), buf_size, "<method?> // method@%0*x", width, index); 785 } 786 break; 787 case Instruction::kIndexFieldRef: 788 if (index < header->GetCollections().FieldIdsSize()) { 789 dex_ir::FieldId* field_id = header->GetCollections().GetFieldId(index); 790 const char* name = field_id->Name()->Data(); 791 const char* type_descriptor = field_id->Type()->GetStringId()->Data(); 792 const char* back_descriptor = field_id->Class()->GetStringId()->Data(); 793 outSize = snprintf(buf.get(), buf_size, "%s.%s:%s // field@%0*x", 794 back_descriptor, name, type_descriptor, width, index); 795 } else { 796 outSize = snprintf(buf.get(), buf_size, "<field?> // field@%0*x", width, index); 797 } 798 break; 799 case Instruction::kIndexVtableOffset: 800 outSize = snprintf(buf.get(), buf_size, "[%0*x] // vtable #%0*x", 801 width, index, width, index); 802 break; 803 case Instruction::kIndexFieldOffset: 804 outSize = snprintf(buf.get(), buf_size, "[obj+%0*x]", width, index); 805 break; 806 // SOME NOT SUPPORTED: 807 // case Instruction::kIndexVaries: 808 // case Instruction::kIndexInlineMethod: 809 default: 810 outSize = snprintf(buf.get(), buf_size, "<?>"); 811 break; 812 } // switch 813 814 // Determine success of string construction. 815 if (outSize >= buf_size) { 816 // The buffer wasn't big enough; retry with computed size. Note: snprintf() 817 // doesn't count/ the '\0' as part of its returned size, so we add explicit 818 // space for it here. 819 return IndexString(header, dec_insn, outSize + 1); 820 } 821 return buf; 822} 823 824/* 825 * Dumps a single instruction. 826 */ 827static void DumpInstruction(dex_ir::Header* header, const dex_ir::CodeItem* code, 828 uint32_t code_offset, uint32_t insn_idx, uint32_t insn_width, 829 const Instruction* dec_insn) { 830 // Address of instruction (expressed as byte offset). 831 fprintf(out_file_, "%06x:", code_offset + 0x10 + insn_idx * 2); 832 833 // Dump (part of) raw bytes. 834 const uint16_t* insns = code->Insns(); 835 for (uint32_t i = 0; i < 8; i++) { 836 if (i < insn_width) { 837 if (i == 7) { 838 fprintf(out_file_, " ... "); 839 } else { 840 // Print 16-bit value in little-endian order. 841 const uint8_t* bytePtr = (const uint8_t*) &insns[insn_idx + i]; 842 fprintf(out_file_, " %02x%02x", bytePtr[0], bytePtr[1]); 843 } 844 } else { 845 fputs(" ", out_file_); 846 } 847 } // for 848 849 // Dump pseudo-instruction or opcode. 850 if (dec_insn->Opcode() == Instruction::NOP) { 851 const uint16_t instr = Get2LE((const uint8_t*) &insns[insn_idx]); 852 if (instr == Instruction::kPackedSwitchSignature) { 853 fprintf(out_file_, "|%04x: packed-switch-data (%d units)", insn_idx, insn_width); 854 } else if (instr == Instruction::kSparseSwitchSignature) { 855 fprintf(out_file_, "|%04x: sparse-switch-data (%d units)", insn_idx, insn_width); 856 } else if (instr == Instruction::kArrayDataSignature) { 857 fprintf(out_file_, "|%04x: array-data (%d units)", insn_idx, insn_width); 858 } else { 859 fprintf(out_file_, "|%04x: nop // spacer", insn_idx); 860 } 861 } else { 862 fprintf(out_file_, "|%04x: %s", insn_idx, dec_insn->Name()); 863 } 864 865 // Set up additional argument. 866 std::unique_ptr<char[]> index_buf; 867 if (Instruction::IndexTypeOf(dec_insn->Opcode()) != Instruction::kIndexNone) { 868 index_buf = IndexString(header, dec_insn, 200); 869 } 870 871 // Dump the instruction. 872 // 873 // NOTE: pDecInsn->DumpString(pDexFile) differs too much from original. 874 // 875 switch (Instruction::FormatOf(dec_insn->Opcode())) { 876 case Instruction::k10x: // op 877 break; 878 case Instruction::k12x: // op vA, vB 879 fprintf(out_file_, " v%d, v%d", dec_insn->VRegA(), dec_insn->VRegB()); 880 break; 881 case Instruction::k11n: // op vA, #+B 882 fprintf(out_file_, " v%d, #int %d // #%x", 883 dec_insn->VRegA(), (int32_t) dec_insn->VRegB(), (uint8_t)dec_insn->VRegB()); 884 break; 885 case Instruction::k11x: // op vAA 886 fprintf(out_file_, " v%d", dec_insn->VRegA()); 887 break; 888 case Instruction::k10t: // op +AA 889 case Instruction::k20t: { // op +AAAA 890 const int32_t targ = (int32_t) dec_insn->VRegA(); 891 fprintf(out_file_, " %04x // %c%04x", 892 insn_idx + targ, 893 (targ < 0) ? '-' : '+', 894 (targ < 0) ? -targ : targ); 895 break; 896 } 897 case Instruction::k22x: // op vAA, vBBBB 898 fprintf(out_file_, " v%d, v%d", dec_insn->VRegA(), dec_insn->VRegB()); 899 break; 900 case Instruction::k21t: { // op vAA, +BBBB 901 const int32_t targ = (int32_t) dec_insn->VRegB(); 902 fprintf(out_file_, " v%d, %04x // %c%04x", dec_insn->VRegA(), 903 insn_idx + targ, 904 (targ < 0) ? '-' : '+', 905 (targ < 0) ? -targ : targ); 906 break; 907 } 908 case Instruction::k21s: // op vAA, #+BBBB 909 fprintf(out_file_, " v%d, #int %d // #%x", 910 dec_insn->VRegA(), (int32_t) dec_insn->VRegB(), (uint16_t)dec_insn->VRegB()); 911 break; 912 case Instruction::k21h: // op vAA, #+BBBB0000[00000000] 913 // The printed format varies a bit based on the actual opcode. 914 if (dec_insn->Opcode() == Instruction::CONST_HIGH16) { 915 const int32_t value = dec_insn->VRegB() << 16; 916 fprintf(out_file_, " v%d, #int %d // #%x", 917 dec_insn->VRegA(), value, (uint16_t) dec_insn->VRegB()); 918 } else { 919 const int64_t value = ((int64_t) dec_insn->VRegB()) << 48; 920 fprintf(out_file_, " v%d, #long %" PRId64 " // #%x", 921 dec_insn->VRegA(), value, (uint16_t) dec_insn->VRegB()); 922 } 923 break; 924 case Instruction::k21c: // op vAA, thing@BBBB 925 case Instruction::k31c: // op vAA, thing@BBBBBBBB 926 fprintf(out_file_, " v%d, %s", dec_insn->VRegA(), index_buf.get()); 927 break; 928 case Instruction::k23x: // op vAA, vBB, vCC 929 fprintf(out_file_, " v%d, v%d, v%d", 930 dec_insn->VRegA(), dec_insn->VRegB(), dec_insn->VRegC()); 931 break; 932 case Instruction::k22b: // op vAA, vBB, #+CC 933 fprintf(out_file_, " v%d, v%d, #int %d // #%02x", 934 dec_insn->VRegA(), dec_insn->VRegB(), 935 (int32_t) dec_insn->VRegC(), (uint8_t) dec_insn->VRegC()); 936 break; 937 case Instruction::k22t: { // op vA, vB, +CCCC 938 const int32_t targ = (int32_t) dec_insn->VRegC(); 939 fprintf(out_file_, " v%d, v%d, %04x // %c%04x", 940 dec_insn->VRegA(), dec_insn->VRegB(), 941 insn_idx + targ, 942 (targ < 0) ? '-' : '+', 943 (targ < 0) ? -targ : targ); 944 break; 945 } 946 case Instruction::k22s: // op vA, vB, #+CCCC 947 fprintf(out_file_, " v%d, v%d, #int %d // #%04x", 948 dec_insn->VRegA(), dec_insn->VRegB(), 949 (int32_t) dec_insn->VRegC(), (uint16_t) dec_insn->VRegC()); 950 break; 951 case Instruction::k22c: // op vA, vB, thing@CCCC 952 // NOT SUPPORTED: 953 // case Instruction::k22cs: // [opt] op vA, vB, field offset CCCC 954 fprintf(out_file_, " v%d, v%d, %s", 955 dec_insn->VRegA(), dec_insn->VRegB(), index_buf.get()); 956 break; 957 case Instruction::k30t: 958 fprintf(out_file_, " #%08x", dec_insn->VRegA()); 959 break; 960 case Instruction::k31i: { // op vAA, #+BBBBBBBB 961 // This is often, but not always, a float. 962 union { 963 float f; 964 uint32_t i; 965 } conv; 966 conv.i = dec_insn->VRegB(); 967 fprintf(out_file_, " v%d, #float %g // #%08x", 968 dec_insn->VRegA(), conv.f, dec_insn->VRegB()); 969 break; 970 } 971 case Instruction::k31t: // op vAA, offset +BBBBBBBB 972 fprintf(out_file_, " v%d, %08x // +%08x", 973 dec_insn->VRegA(), insn_idx + dec_insn->VRegB(), dec_insn->VRegB()); 974 break; 975 case Instruction::k32x: // op vAAAA, vBBBB 976 fprintf(out_file_, " v%d, v%d", dec_insn->VRegA(), dec_insn->VRegB()); 977 break; 978 case Instruction::k35c: { // op {vC, vD, vE, vF, vG}, thing@BBBB 979 // NOT SUPPORTED: 980 // case Instruction::k35ms: // [opt] invoke-virtual+super 981 // case Instruction::k35mi: // [opt] inline invoke 982 uint32_t arg[Instruction::kMaxVarArgRegs]; 983 dec_insn->GetVarArgs(arg); 984 fputs(" {", out_file_); 985 for (int i = 0, n = dec_insn->VRegA(); i < n; i++) { 986 if (i == 0) { 987 fprintf(out_file_, "v%d", arg[i]); 988 } else { 989 fprintf(out_file_, ", v%d", arg[i]); 990 } 991 } // for 992 fprintf(out_file_, "}, %s", index_buf.get()); 993 break; 994 } 995 case Instruction::k3rc: // op {vCCCC .. v(CCCC+AA-1)}, thing@BBBB 996 // NOT SUPPORTED: 997 // case Instruction::k3rms: // [opt] invoke-virtual+super/range 998 // case Instruction::k3rmi: // [opt] execute-inline/range 999 { 1000 // This doesn't match the "dx" output when some of the args are 1001 // 64-bit values -- dx only shows the first register. 1002 fputs(" {", out_file_); 1003 for (int i = 0, n = dec_insn->VRegA(); i < n; i++) { 1004 if (i == 0) { 1005 fprintf(out_file_, "v%d", dec_insn->VRegC() + i); 1006 } else { 1007 fprintf(out_file_, ", v%d", dec_insn->VRegC() + i); 1008 } 1009 } // for 1010 fprintf(out_file_, "}, %s", index_buf.get()); 1011 } 1012 break; 1013 case Instruction::k51l: { // op vAA, #+BBBBBBBBBBBBBBBB 1014 // This is often, but not always, a double. 1015 union { 1016 double d; 1017 uint64_t j; 1018 } conv; 1019 conv.j = dec_insn->WideVRegB(); 1020 fprintf(out_file_, " v%d, #double %g // #%016" PRIx64, 1021 dec_insn->VRegA(), conv.d, dec_insn->WideVRegB()); 1022 break; 1023 } 1024 // NOT SUPPORTED: 1025 // case Instruction::k00x: // unknown op or breakpoint 1026 // break; 1027 default: 1028 fprintf(out_file_, " ???"); 1029 break; 1030 } // switch 1031 1032 fputc('\n', out_file_); 1033} 1034 1035/* 1036 * Dumps a bytecode disassembly. 1037 */ 1038static void DumpBytecodes(dex_ir::Header* header, uint32_t idx, 1039 const dex_ir::CodeItem* code, uint32_t code_offset) { 1040 dex_ir::MethodId* method_id = header->GetCollections().GetMethodId(idx); 1041 const char* name = method_id->Name()->Data(); 1042 std::string type_descriptor = GetSignatureForProtoId(method_id->Proto()); 1043 const char* back_descriptor = method_id->Class()->GetStringId()->Data(); 1044 1045 // Generate header. 1046 std::string dot(DescriptorToDotWrapper(back_descriptor)); 1047 fprintf(out_file_, "%06x: |[%06x] %s.%s:%s\n", 1048 code_offset, code_offset, dot.c_str(), name, type_descriptor.c_str()); 1049 1050 // Iterate over all instructions. 1051 const uint16_t* insns = code->Insns(); 1052 for (uint32_t insn_idx = 0; insn_idx < code->InsnsSize();) { 1053 const Instruction* instruction = Instruction::At(&insns[insn_idx]); 1054 const uint32_t insn_width = instruction->SizeInCodeUnits(); 1055 if (insn_width == 0) { 1056 fprintf(stderr, "GLITCH: zero-width instruction at idx=0x%04x\n", insn_idx); 1057 break; 1058 } 1059 DumpInstruction(header, code, code_offset, insn_idx, insn_width, instruction); 1060 insn_idx += insn_width; 1061 } // for 1062} 1063 1064/* 1065 * Dumps code of a method. 1066 */ 1067static void DumpCode(dex_ir::Header* header, uint32_t idx, const dex_ir::CodeItem* code, 1068 uint32_t code_offset) { 1069 fprintf(out_file_, " registers : %d\n", code->RegistersSize()); 1070 fprintf(out_file_, " ins : %d\n", code->InsSize()); 1071 fprintf(out_file_, " outs : %d\n", code->OutsSize()); 1072 fprintf(out_file_, " insns size : %d 16-bit code units\n", 1073 code->InsnsSize()); 1074 1075 // Bytecode disassembly, if requested. 1076 if (options_.disassemble_) { 1077 DumpBytecodes(header, idx, code, code_offset); 1078 } 1079 1080 // Try-catch blocks. 1081 DumpCatches(code); 1082 1083 // Positions and locals table in the debug info. 1084 fprintf(out_file_, " positions : \n"); 1085 DumpPositionInfo(code); 1086 fprintf(out_file_, " locals : \n"); 1087 DumpLocalInfo(code); 1088} 1089 1090/* 1091 * Dumps a method. 1092 */ 1093static void DumpMethod(dex_ir::Header* header, uint32_t idx, uint32_t flags, 1094 const dex_ir::CodeItem* code, int i) { 1095 // Bail for anything private if export only requested. 1096 if (options_.exports_only_ && (flags & (kAccPublic | kAccProtected)) == 0) { 1097 return; 1098 } 1099 1100 dex_ir::MethodId* method_id = header->GetCollections().GetMethodId(idx); 1101 const char* name = method_id->Name()->Data(); 1102 char* type_descriptor = strdup(GetSignatureForProtoId(method_id->Proto()).c_str()); 1103 const char* back_descriptor = method_id->Class()->GetStringId()->Data(); 1104 char* access_str = CreateAccessFlagStr(flags, kAccessForMethod); 1105 1106 if (options_.output_format_ == kOutputPlain) { 1107 fprintf(out_file_, " #%d : (in %s)\n", i, back_descriptor); 1108 fprintf(out_file_, " name : '%s'\n", name); 1109 fprintf(out_file_, " type : '%s'\n", type_descriptor); 1110 fprintf(out_file_, " access : 0x%04x (%s)\n", flags, access_str); 1111 if (code == nullptr) { 1112 fprintf(out_file_, " code : (none)\n"); 1113 } else { 1114 fprintf(out_file_, " code -\n"); 1115 DumpCode(header, idx, code, code->GetOffset()); 1116 } 1117 if (options_.disassemble_) { 1118 fputc('\n', out_file_); 1119 } 1120 } else if (options_.output_format_ == kOutputXml) { 1121 const bool constructor = (name[0] == '<'); 1122 1123 // Method name and prototype. 1124 if (constructor) { 1125 std::string dot(DescriptorClassToDot(back_descriptor)); 1126 fprintf(out_file_, "<constructor name=\"%s\"\n", dot.c_str()); 1127 dot = DescriptorToDotWrapper(back_descriptor); 1128 fprintf(out_file_, " type=\"%s\"\n", dot.c_str()); 1129 } else { 1130 fprintf(out_file_, "<method name=\"%s\"\n", name); 1131 const char* return_type = strrchr(type_descriptor, ')'); 1132 if (return_type == nullptr) { 1133 fprintf(stderr, "bad method type descriptor '%s'\n", type_descriptor); 1134 goto bail; 1135 } 1136 std::string dot(DescriptorToDotWrapper(return_type + 1)); 1137 fprintf(out_file_, " return=\"%s\"\n", dot.c_str()); 1138 fprintf(out_file_, " abstract=%s\n", QuotedBool((flags & kAccAbstract) != 0)); 1139 fprintf(out_file_, " native=%s\n", QuotedBool((flags & kAccNative) != 0)); 1140 fprintf(out_file_, " synchronized=%s\n", QuotedBool( 1141 (flags & (kAccSynchronized | kAccDeclaredSynchronized)) != 0)); 1142 } 1143 1144 // Additional method flags. 1145 fprintf(out_file_, " static=%s\n", QuotedBool((flags & kAccStatic) != 0)); 1146 fprintf(out_file_, " final=%s\n", QuotedBool((flags & kAccFinal) != 0)); 1147 // The "deprecated=" not knowable w/o parsing annotations. 1148 fprintf(out_file_, " visibility=%s\n>\n", QuotedVisibility(flags)); 1149 1150 // Parameters. 1151 if (type_descriptor[0] != '(') { 1152 fprintf(stderr, "ERROR: bad descriptor '%s'\n", type_descriptor); 1153 goto bail; 1154 } 1155 char* tmp_buf = reinterpret_cast<char*>(malloc(strlen(type_descriptor) + 1)); 1156 const char* base = type_descriptor + 1; 1157 int arg_num = 0; 1158 while (*base != ')') { 1159 char* cp = tmp_buf; 1160 while (*base == '[') { 1161 *cp++ = *base++; 1162 } 1163 if (*base == 'L') { 1164 // Copy through ';'. 1165 do { 1166 *cp = *base++; 1167 } while (*cp++ != ';'); 1168 } else { 1169 // Primitive char, copy it. 1170 if (strchr("ZBCSIFJD", *base) == nullptr) { 1171 fprintf(stderr, "ERROR: bad method signature '%s'\n", base); 1172 break; // while 1173 } 1174 *cp++ = *base++; 1175 } 1176 // Null terminate and display. 1177 *cp++ = '\0'; 1178 std::string dot(DescriptorToDotWrapper(tmp_buf)); 1179 fprintf(out_file_, "<parameter name=\"arg%d\" type=\"%s\">\n" 1180 "</parameter>\n", arg_num++, dot.c_str()); 1181 } // while 1182 free(tmp_buf); 1183 if (constructor) { 1184 fprintf(out_file_, "</constructor>\n"); 1185 } else { 1186 fprintf(out_file_, "</method>\n"); 1187 } 1188 } 1189 1190 bail: 1191 free(type_descriptor); 1192 free(access_str); 1193} 1194 1195/* 1196 * Dumps a static (class) field. 1197 */ 1198static void DumpSField(dex_ir::Header* header, uint32_t idx, uint32_t flags, 1199 int i, dex_ir::EncodedValue* init) { 1200 // Bail for anything private if export only requested. 1201 if (options_.exports_only_ && (flags & (kAccPublic | kAccProtected)) == 0) { 1202 return; 1203 } 1204 1205 dex_ir::FieldId* field_id = header->GetCollections().GetFieldId(idx); 1206 const char* name = field_id->Name()->Data(); 1207 const char* type_descriptor = field_id->Type()->GetStringId()->Data(); 1208 const char* back_descriptor = field_id->Class()->GetStringId()->Data(); 1209 char* access_str = CreateAccessFlagStr(flags, kAccessForField); 1210 1211 if (options_.output_format_ == kOutputPlain) { 1212 fprintf(out_file_, " #%d : (in %s)\n", i, back_descriptor); 1213 fprintf(out_file_, " name : '%s'\n", name); 1214 fprintf(out_file_, " type : '%s'\n", type_descriptor); 1215 fprintf(out_file_, " access : 0x%04x (%s)\n", flags, access_str); 1216 if (init != nullptr) { 1217 fputs(" value : ", out_file_); 1218 DumpEncodedValue(init); 1219 fputs("\n", out_file_); 1220 } 1221 } else if (options_.output_format_ == kOutputXml) { 1222 fprintf(out_file_, "<field name=\"%s\"\n", name); 1223 std::string dot(DescriptorToDotWrapper(type_descriptor)); 1224 fprintf(out_file_, " type=\"%s\"\n", dot.c_str()); 1225 fprintf(out_file_, " transient=%s\n", QuotedBool((flags & kAccTransient) != 0)); 1226 fprintf(out_file_, " volatile=%s\n", QuotedBool((flags & kAccVolatile) != 0)); 1227 // The "value=" is not knowable w/o parsing annotations. 1228 fprintf(out_file_, " static=%s\n", QuotedBool((flags & kAccStatic) != 0)); 1229 fprintf(out_file_, " final=%s\n", QuotedBool((flags & kAccFinal) != 0)); 1230 // The "deprecated=" is not knowable w/o parsing annotations. 1231 fprintf(out_file_, " visibility=%s\n", QuotedVisibility(flags)); 1232 if (init != nullptr) { 1233 fputs(" value=\"", out_file_); 1234 DumpEncodedValue(init); 1235 fputs("\"\n", out_file_); 1236 } 1237 fputs(">\n</field>\n", out_file_); 1238 } 1239 1240 free(access_str); 1241} 1242 1243/* 1244 * Dumps an instance field. 1245 */ 1246static void DumpIField(dex_ir::Header* header, uint32_t idx, uint32_t flags, int i) { 1247 DumpSField(header, idx, flags, i, nullptr); 1248} 1249 1250/* 1251 * Dumping a CFG. Note that this will do duplicate work. utils.h doesn't expose the code-item 1252 * version, so the DumpMethodCFG code will have to iterate again to find it. But dexdump is a 1253 * tool, so this is not performance-critical. 1254 */ 1255 1256static void DumpCFG(const DexFile* dex_file, 1257 uint32_t dex_method_idx, 1258 const DexFile::CodeItem* code) { 1259 if (code != nullptr) { 1260 std::ostringstream oss; 1261 DumpMethodCFG(dex_file, dex_method_idx, oss); 1262 fprintf(out_file_, "%s", oss.str().c_str()); 1263 } 1264} 1265 1266static void DumpCFG(const DexFile* dex_file, int idx) { 1267 const DexFile::ClassDef& class_def = dex_file->GetClassDef(idx); 1268 const uint8_t* class_data = dex_file->GetClassData(class_def); 1269 if (class_data == nullptr) { // empty class such as a marker interface? 1270 return; 1271 } 1272 ClassDataItemIterator it(*dex_file, class_data); 1273 while (it.HasNextStaticField()) { 1274 it.Next(); 1275 } 1276 while (it.HasNextInstanceField()) { 1277 it.Next(); 1278 } 1279 while (it.HasNextDirectMethod()) { 1280 DumpCFG(dex_file, 1281 it.GetMemberIndex(), 1282 it.GetMethodCodeItem()); 1283 it.Next(); 1284 } 1285 while (it.HasNextVirtualMethod()) { 1286 DumpCFG(dex_file, 1287 it.GetMemberIndex(), 1288 it.GetMethodCodeItem()); 1289 it.Next(); 1290 } 1291} 1292 1293/* 1294 * Dumps the class. 1295 * 1296 * Note "idx" is a DexClassDef index, not a DexTypeId index. 1297 * 1298 * If "*last_package" is nullptr or does not match the current class' package, 1299 * the value will be replaced with a newly-allocated string. 1300 */ 1301static void DumpClass(const DexFile* dex_file, 1302 dex_ir::Header* header, 1303 int idx, 1304 char** last_package) { 1305 dex_ir::ClassDef* class_def = header->GetCollections().GetClassDef(idx); 1306 // Omitting non-public class. 1307 if (options_.exports_only_ && (class_def->GetAccessFlags() & kAccPublic) == 0) { 1308 return; 1309 } 1310 1311 if (options_.show_section_headers_) { 1312 DumpClassDef(header, idx); 1313 } 1314 1315 if (options_.show_annotations_) { 1316 DumpClassAnnotations(header, idx); 1317 } 1318 1319 if (options_.show_cfg_) { 1320 DumpCFG(dex_file, idx); 1321 return; 1322 } 1323 1324 // For the XML output, show the package name. Ideally we'd gather 1325 // up the classes, sort them, and dump them alphabetically so the 1326 // package name wouldn't jump around, but that's not a great plan 1327 // for something that needs to run on the device. 1328 const char* class_descriptor = 1329 header->GetCollections().GetClassDef(idx)->ClassType()->GetStringId()->Data(); 1330 if (!(class_descriptor[0] == 'L' && 1331 class_descriptor[strlen(class_descriptor)-1] == ';')) { 1332 // Arrays and primitives should not be defined explicitly. Keep going? 1333 fprintf(stderr, "Malformed class name '%s'\n", class_descriptor); 1334 } else if (options_.output_format_ == kOutputXml) { 1335 char* mangle = strdup(class_descriptor + 1); 1336 mangle[strlen(mangle)-1] = '\0'; 1337 1338 // Reduce to just the package name. 1339 char* last_slash = strrchr(mangle, '/'); 1340 if (last_slash != nullptr) { 1341 *last_slash = '\0'; 1342 } else { 1343 *mangle = '\0'; 1344 } 1345 1346 for (char* cp = mangle; *cp != '\0'; cp++) { 1347 if (*cp == '/') { 1348 *cp = '.'; 1349 } 1350 } // for 1351 1352 if (*last_package == nullptr || strcmp(mangle, *last_package) != 0) { 1353 // Start of a new package. 1354 if (*last_package != nullptr) { 1355 fprintf(out_file_, "</package>\n"); 1356 } 1357 fprintf(out_file_, "<package name=\"%s\"\n>\n", mangle); 1358 free(*last_package); 1359 *last_package = mangle; 1360 } else { 1361 free(mangle); 1362 } 1363 } 1364 1365 // General class information. 1366 char* access_str = CreateAccessFlagStr(class_def->GetAccessFlags(), kAccessForClass); 1367 const char* superclass_descriptor = nullptr; 1368 if (class_def->Superclass() != nullptr) { 1369 superclass_descriptor = class_def->Superclass()->GetStringId()->Data(); 1370 } 1371 if (options_.output_format_ == kOutputPlain) { 1372 fprintf(out_file_, "Class #%d -\n", idx); 1373 fprintf(out_file_, " Class descriptor : '%s'\n", class_descriptor); 1374 fprintf(out_file_, " Access flags : 0x%04x (%s)\n", 1375 class_def->GetAccessFlags(), access_str); 1376 if (superclass_descriptor != nullptr) { 1377 fprintf(out_file_, " Superclass : '%s'\n", superclass_descriptor); 1378 } 1379 fprintf(out_file_, " Interfaces -\n"); 1380 } else { 1381 std::string dot(DescriptorClassToDot(class_descriptor)); 1382 fprintf(out_file_, "<class name=\"%s\"\n", dot.c_str()); 1383 if (superclass_descriptor != nullptr) { 1384 dot = DescriptorToDotWrapper(superclass_descriptor); 1385 fprintf(out_file_, " extends=\"%s\"\n", dot.c_str()); 1386 } 1387 fprintf(out_file_, " interface=%s\n", 1388 QuotedBool((class_def->GetAccessFlags() & kAccInterface) != 0)); 1389 fprintf(out_file_, " abstract=%s\n", 1390 QuotedBool((class_def->GetAccessFlags() & kAccAbstract) != 0)); 1391 fprintf(out_file_, " static=%s\n", QuotedBool((class_def->GetAccessFlags() & kAccStatic) != 0)); 1392 fprintf(out_file_, " final=%s\n", QuotedBool((class_def->GetAccessFlags() & kAccFinal) != 0)); 1393 // The "deprecated=" not knowable w/o parsing annotations. 1394 fprintf(out_file_, " visibility=%s\n", QuotedVisibility(class_def->GetAccessFlags())); 1395 fprintf(out_file_, ">\n"); 1396 } 1397 1398 // Interfaces. 1399 const dex_ir::TypeIdVector* interfaces = class_def->Interfaces(); 1400 if (interfaces != nullptr) { 1401 for (uint32_t i = 0; i < interfaces->size(); i++) { 1402 DumpInterface((*interfaces)[i], i); 1403 } // for 1404 } 1405 1406 // Fields and methods. 1407 dex_ir::ClassData* class_data = class_def->GetClassData(); 1408 // Prepare data for static fields. 1409 dex_ir::EncodedArrayItem* static_values = class_def->StaticValues(); 1410 dex_ir::EncodedValueVector* encoded_values = 1411 static_values == nullptr ? nullptr : static_values->GetEncodedValues(); 1412 const uint32_t encoded_values_size = (encoded_values == nullptr) ? 0 : encoded_values->size(); 1413 1414 // Static fields. 1415 if (options_.output_format_ == kOutputPlain) { 1416 fprintf(out_file_, " Static fields -\n"); 1417 } 1418 if (class_data != nullptr) { 1419 dex_ir::FieldItemVector* static_fields = class_data->StaticFields(); 1420 if (static_fields != nullptr) { 1421 for (uint32_t i = 0; i < static_fields->size(); i++) { 1422 DumpSField(header, 1423 (*static_fields)[i]->GetFieldId()->GetIndex(), 1424 (*static_fields)[i]->GetAccessFlags(), 1425 i, 1426 i < encoded_values_size ? (*encoded_values)[i].get() : nullptr); 1427 } // for 1428 } 1429 } 1430 1431 // Instance fields. 1432 if (options_.output_format_ == kOutputPlain) { 1433 fprintf(out_file_, " Instance fields -\n"); 1434 } 1435 if (class_data != nullptr) { 1436 dex_ir::FieldItemVector* instance_fields = class_data->InstanceFields(); 1437 if (instance_fields != nullptr) { 1438 for (uint32_t i = 0; i < instance_fields->size(); i++) { 1439 DumpIField(header, 1440 (*instance_fields)[i]->GetFieldId()->GetIndex(), 1441 (*instance_fields)[i]->GetAccessFlags(), 1442 i); 1443 } // for 1444 } 1445 } 1446 1447 // Direct methods. 1448 if (options_.output_format_ == kOutputPlain) { 1449 fprintf(out_file_, " Direct methods -\n"); 1450 } 1451 if (class_data != nullptr) { 1452 dex_ir::MethodItemVector* direct_methods = class_data->DirectMethods(); 1453 if (direct_methods != nullptr) { 1454 for (uint32_t i = 0; i < direct_methods->size(); i++) { 1455 DumpMethod(header, 1456 (*direct_methods)[i]->GetMethodId()->GetIndex(), 1457 (*direct_methods)[i]->GetAccessFlags(), 1458 (*direct_methods)[i]->GetCodeItem(), 1459 i); 1460 } // for 1461 } 1462 } 1463 1464 // Virtual methods. 1465 if (options_.output_format_ == kOutputPlain) { 1466 fprintf(out_file_, " Virtual methods -\n"); 1467 } 1468 if (class_data != nullptr) { 1469 dex_ir::MethodItemVector* virtual_methods = class_data->VirtualMethods(); 1470 if (virtual_methods != nullptr) { 1471 for (uint32_t i = 0; i < virtual_methods->size(); i++) { 1472 DumpMethod(header, 1473 (*virtual_methods)[i]->GetMethodId()->GetIndex(), 1474 (*virtual_methods)[i]->GetAccessFlags(), 1475 (*virtual_methods)[i]->GetCodeItem(), 1476 i); 1477 } // for 1478 } 1479 } 1480 1481 // End of class. 1482 if (options_.output_format_ == kOutputPlain) { 1483 const char* file_name = "unknown"; 1484 if (class_def->SourceFile() != nullptr) { 1485 file_name = class_def->SourceFile()->Data(); 1486 } 1487 const dex_ir::StringId* source_file = class_def->SourceFile(); 1488 fprintf(out_file_, " source_file_idx : %d (%s)\n\n", 1489 source_file == nullptr ? 0xffffffffU : source_file->GetIndex(), file_name); 1490 } else if (options_.output_format_ == kOutputXml) { 1491 fprintf(out_file_, "</class>\n"); 1492 } 1493 1494 free(access_str); 1495} 1496 1497/* 1498static uint32_t GetDataSectionOffset(dex_ir::Header& header) { 1499 return dex_ir::Header::ItemSize() + 1500 header.GetCollections().StringIdsSize() * dex_ir::StringId::ItemSize() + 1501 header.GetCollections().TypeIdsSize() * dex_ir::TypeId::ItemSize() + 1502 header.GetCollections().ProtoIdsSize() * dex_ir::ProtoId::ItemSize() + 1503 header.GetCollections().FieldIdsSize() * dex_ir::FieldId::ItemSize() + 1504 header.GetCollections().MethodIdsSize() * dex_ir::MethodId::ItemSize() + 1505 header.GetCollections().ClassDefsSize() * dex_ir::ClassDef::ItemSize(); 1506} 1507 1508static bool Align(File* file, uint32_t& offset) { 1509 uint8_t zero_buffer[] = { 0, 0, 0 }; 1510 uint32_t zeroes = (-offset) & 3; 1511 if (zeroes > 0) { 1512 if (!file->PwriteFully(zero_buffer, zeroes, offset)) { 1513 return false; 1514 } 1515 offset += zeroes; 1516 } 1517 return true; 1518} 1519 1520static bool WriteStrings(File* dex_file, dex_ir::Header& header, 1521 uint32_t& index_offset, uint32_t& data_offset) { 1522 uint32_t index = 0; 1523 uint32_t index_buffer[1]; 1524 uint32_t string_length; 1525 uint32_t length_length; 1526 uint8_t length_buffer[8]; 1527 for (std::unique_ptr<dex_ir::StringId>& string_id : header.GetCollections().StringIds()) { 1528 string_id->SetOffset(index); 1529 index_buffer[0] = data_offset; 1530 string_length = strlen(string_id->Data()); 1531 length_length = UnsignedLeb128Size(string_length); 1532 EncodeUnsignedLeb128(length_buffer, string_length); 1533 1534 if (!dex_file->PwriteFully(index_buffer, 4, index_offset) || 1535 !dex_file->PwriteFully(length_buffer, length_length, data_offset) || 1536 !dex_file->PwriteFully(string_id->Data(), string_length, data_offset + length_length)) { 1537 return false; 1538 } 1539 1540 index++; 1541 index_offset += 4; 1542 data_offset += string_length + length_length; 1543 } 1544 return true; 1545} 1546 1547static bool WriteTypes(File* dex_file, dex_ir::Header& header, uint32_t& index_offset) { 1548 uint32_t index = 0; 1549 uint32_t index_buffer[1]; 1550 for (std::unique_ptr<dex_ir::TypeId>& type_id : header.GetCollections().TypeIds()) { 1551 type_id->SetIndex(index); 1552 index_buffer[0] = type_id->GetStringId()->GetOffset(); 1553 1554 if (!dex_file->PwriteFully(index_buffer, 4, index_offset)) { 1555 return false; 1556 } 1557 1558 index++; 1559 index_offset += 4; 1560 } 1561 return true; 1562} 1563 1564static bool WriteTypeLists(File* dex_file, dex_ir::Header& header, uint32_t& data_offset) { 1565 if (!Align(dex_file, data_offset)) { 1566 return false; 1567 } 1568 1569 return true; 1570} 1571 1572static void OutputDexFile(dex_ir::Header& header, const char* file_name) { 1573 LOG(INFO) << "FILE NAME: " << file_name; 1574 std::unique_ptr<File> dex_file(OS::CreateEmptyFileWriteOnly(file_name)); 1575 if (dex_file == nullptr) { 1576 fprintf(stderr, "Can't open %s\n", file_name); 1577 return; 1578 } 1579 1580 uint32_t index_offset = dex_ir::Header::ItemSize(); 1581 uint32_t data_offset = GetDataSectionOffset(header); 1582 WriteStrings(dex_file.get(), header, index_offset, data_offset); 1583 WriteTypes(dex_file.get(), header, index_offset); 1584} 1585*/ 1586 1587/* 1588 * Dumps the requested sections of the file. 1589 */ 1590static void ProcessDexFile(const char* file_name, const DexFile* dex_file) { 1591 if (options_.verbose_) { 1592 fprintf(out_file_, "Opened '%s', DEX version '%.3s'\n", 1593 file_name, dex_file->GetHeader().magic_ + 4); 1594 } 1595 std::unique_ptr<dex_ir::Header> header(dex_ir::DexIrBuilder(*dex_file)); 1596 1597 // Headers. 1598 if (options_.show_file_headers_) { 1599 DumpFileHeader(header.get()); 1600 } 1601 1602 // Open XML context. 1603 if (options_.output_format_ == kOutputXml) { 1604 fprintf(out_file_, "<api>\n"); 1605 } 1606 1607 // Iterate over all classes. 1608 char* package = nullptr; 1609 const uint32_t class_defs_size = header->GetCollections().ClassDefsSize(); 1610 for (uint32_t i = 0; i < class_defs_size; i++) { 1611 DumpClass(dex_file, header.get(), i, &package); 1612 } // for 1613 1614 // Free the last package allocated. 1615 if (package != nullptr) { 1616 fprintf(out_file_, "</package>\n"); 1617 free(package); 1618 } 1619 1620 // Close XML context. 1621 if (options_.output_format_ == kOutputXml) { 1622 fprintf(out_file_, "</api>\n"); 1623 } 1624 1625 /* 1626 // Output dex file. 1627 if (options_.output_dex_files_) { 1628 std::string output_dex_filename = dex_file->GetLocation() + ".out"; 1629 OutputDexFile(*header, output_dex_filename.c_str()); 1630 } 1631 */ 1632} 1633 1634/* 1635 * Processes a single file (either direct .dex or indirect .zip/.jar/.apk). 1636 */ 1637int ProcessFile(const char* file_name) { 1638 if (options_.verbose_) { 1639 fprintf(out_file_, "Processing '%s'...\n", file_name); 1640 } 1641 1642 // If the file is not a .dex file, the function tries .zip/.jar/.apk files, 1643 // all of which are Zip archives with "classes.dex" inside. 1644 const bool verify_checksum = !options_.ignore_bad_checksum_; 1645 std::string error_msg; 1646 std::vector<std::unique_ptr<const DexFile>> dex_files; 1647 if (!DexFile::Open(file_name, file_name, verify_checksum, &error_msg, &dex_files)) { 1648 // Display returned error message to user. Note that this error behavior 1649 // differs from the error messages shown by the original Dalvik dexdump. 1650 fputs(error_msg.c_str(), stderr); 1651 fputc('\n', stderr); 1652 return -1; 1653 } 1654 1655 // Success. Either report checksum verification or process 1656 // all dex files found in given file. 1657 if (options_.checksum_only_) { 1658 fprintf(out_file_, "Checksum verified\n"); 1659 } else { 1660 for (size_t i = 0; i < dex_files.size(); i++) { 1661 ProcessDexFile(file_name, dex_files[i].get()); 1662 } 1663 } 1664 return 0; 1665} 1666 1667} // namespace art 1668