| /* |
| * Copyright (C) 2016 The Android Open Source Project |
| * |
| * Licensed under the Apache License, Version 2.0 (the "License"); |
| * you may not use this file except in compliance with the License. |
| * You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| * |
| * Implementation file of the dexlayout utility. |
| * |
| * This is a tool to read dex files into an internal representation, |
| * reorganize the representation, and emit dex files with a better |
| * file layout. |
| */ |
| |
| #include "dexlayout.h" |
| |
| #include <inttypes.h> |
| #include <stdio.h> |
| #include <sys/mman.h> // For the PROT_* and MAP_* constants. |
| |
| #include <iostream> |
| #include <memory> |
| #include <sstream> |
| #include <vector> |
| |
| #include "android-base/stringprintf.h" |
| |
| #include "dex_file-inl.h" |
| #include "dex_file_layout.h" |
| #include "dex_file_loader.h" |
| #include "dex_file_types.h" |
| #include "dex_file_verifier.h" |
| #include "dex_instruction-inl.h" |
| #include "dex_ir_builder.h" |
| #include "dex_verify.h" |
| #include "dex_visualize.h" |
| #include "dex_writer.h" |
| #include "jit/profile_compilation_info.h" |
| #include "mem_map.h" |
| #include "os.h" |
| #include "utils.h" |
| |
| namespace art { |
| |
| using android::base::StringPrintf; |
| |
| // Setting this to false disables class def layout entirely, which is stronger than strictly |
| // necessary to ensure the partial order w.r.t. class derivation. TODO: Re-enable (b/68317550). |
| static constexpr bool kChangeClassDefOrder = false; |
| |
| static constexpr uint32_t kDataSectionAlignment = sizeof(uint32_t) * 2; |
| static constexpr uint32_t kDexCodeItemAlignment = 4; |
| |
| /* |
| * Flags for use with createAccessFlagStr(). |
| */ |
| enum AccessFor { |
| kAccessForClass = 0, kAccessForMethod = 1, kAccessForField = 2, kAccessForMAX |
| }; |
| const int kNumFlags = 18; |
| |
| /* |
| * Gets 2 little-endian bytes. |
| */ |
| static inline uint16_t Get2LE(unsigned char const* src) { |
| return src[0] | (src[1] << 8); |
| } |
| |
| /* |
| * Converts a type descriptor to human-readable "dotted" form. For |
| * example, "Ljava/lang/String;" becomes "java.lang.String", and |
| * "[I" becomes "int[]". Also converts '$' to '.', which means this |
| * form can't be converted back to a descriptor. |
| */ |
| static std::string DescriptorToDotWrapper(const char* descriptor) { |
| std::string result = DescriptorToDot(descriptor); |
| size_t found = result.find('$'); |
| while (found != std::string::npos) { |
| result[found] = '.'; |
| found = result.find('$', found); |
| } |
| return result; |
| } |
| |
| /* |
| * Converts the class name portion of a type descriptor to human-readable |
| * "dotted" form. For example, "Ljava/lang/String;" becomes "String". |
| */ |
| static std::string DescriptorClassToDot(const char* str) { |
| std::string descriptor(str); |
| // Reduce to just the class name prefix. |
| size_t last_slash = descriptor.rfind('/'); |
| if (last_slash == std::string::npos) { |
| last_slash = 0; |
| } |
| // Start past the '/' or 'L'. |
| last_slash++; |
| |
| // Copy class name over, trimming trailing ';'. |
| size_t size = descriptor.size() - 1 - last_slash; |
| std::string result(descriptor.substr(last_slash, size)); |
| |
| // Replace '$' with '.'. |
| size_t dollar_sign = result.find('$'); |
| while (dollar_sign != std::string::npos) { |
| result[dollar_sign] = '.'; |
| dollar_sign = result.find('$', dollar_sign); |
| } |
| |
| return result; |
| } |
| |
| /* |
| * Returns string representing the boolean value. |
| */ |
| static const char* StrBool(bool val) { |
| return val ? "true" : "false"; |
| } |
| |
| /* |
| * Returns a quoted string representing the boolean value. |
| */ |
| static const char* QuotedBool(bool val) { |
| return val ? "\"true\"" : "\"false\""; |
| } |
| |
| /* |
| * Returns a quoted string representing the access flags. |
| */ |
| static const char* QuotedVisibility(uint32_t access_flags) { |
| if (access_flags & kAccPublic) { |
| return "\"public\""; |
| } else if (access_flags & kAccProtected) { |
| return "\"protected\""; |
| } else if (access_flags & kAccPrivate) { |
| return "\"private\""; |
| } else { |
| return "\"package\""; |
| } |
| } |
| |
| /* |
| * Counts the number of '1' bits in a word. |
| */ |
| static int CountOnes(uint32_t val) { |
| val = val - ((val >> 1) & 0x55555555); |
| val = (val & 0x33333333) + ((val >> 2) & 0x33333333); |
| return (((val + (val >> 4)) & 0x0F0F0F0F) * 0x01010101) >> 24; |
| } |
| |
| /* |
| * Creates a new string with human-readable access flags. |
| * |
| * In the base language the access_flags fields are type uint16_t; in Dalvik they're uint32_t. |
| */ |
| static char* CreateAccessFlagStr(uint32_t flags, AccessFor for_what) { |
| static const char* kAccessStrings[kAccessForMAX][kNumFlags] = { |
| { |
| "PUBLIC", /* 0x00001 */ |
| "PRIVATE", /* 0x00002 */ |
| "PROTECTED", /* 0x00004 */ |
| "STATIC", /* 0x00008 */ |
| "FINAL", /* 0x00010 */ |
| "?", /* 0x00020 */ |
| "?", /* 0x00040 */ |
| "?", /* 0x00080 */ |
| "?", /* 0x00100 */ |
| "INTERFACE", /* 0x00200 */ |
| "ABSTRACT", /* 0x00400 */ |
| "?", /* 0x00800 */ |
| "SYNTHETIC", /* 0x01000 */ |
| "ANNOTATION", /* 0x02000 */ |
| "ENUM", /* 0x04000 */ |
| "?", /* 0x08000 */ |
| "VERIFIED", /* 0x10000 */ |
| "OPTIMIZED", /* 0x20000 */ |
| }, { |
| "PUBLIC", /* 0x00001 */ |
| "PRIVATE", /* 0x00002 */ |
| "PROTECTED", /* 0x00004 */ |
| "STATIC", /* 0x00008 */ |
| "FINAL", /* 0x00010 */ |
| "SYNCHRONIZED", /* 0x00020 */ |
| "BRIDGE", /* 0x00040 */ |
| "VARARGS", /* 0x00080 */ |
| "NATIVE", /* 0x00100 */ |
| "?", /* 0x00200 */ |
| "ABSTRACT", /* 0x00400 */ |
| "STRICT", /* 0x00800 */ |
| "SYNTHETIC", /* 0x01000 */ |
| "?", /* 0x02000 */ |
| "?", /* 0x04000 */ |
| "MIRANDA", /* 0x08000 */ |
| "CONSTRUCTOR", /* 0x10000 */ |
| "DECLARED_SYNCHRONIZED", /* 0x20000 */ |
| }, { |
| "PUBLIC", /* 0x00001 */ |
| "PRIVATE", /* 0x00002 */ |
| "PROTECTED", /* 0x00004 */ |
| "STATIC", /* 0x00008 */ |
| "FINAL", /* 0x00010 */ |
| "?", /* 0x00020 */ |
| "VOLATILE", /* 0x00040 */ |
| "TRANSIENT", /* 0x00080 */ |
| "?", /* 0x00100 */ |
| "?", /* 0x00200 */ |
| "?", /* 0x00400 */ |
| "?", /* 0x00800 */ |
| "SYNTHETIC", /* 0x01000 */ |
| "?", /* 0x02000 */ |
| "ENUM", /* 0x04000 */ |
| "?", /* 0x08000 */ |
| "?", /* 0x10000 */ |
| "?", /* 0x20000 */ |
| }, |
| }; |
| |
| // Allocate enough storage to hold the expected number of strings, |
| // plus a space between each. We over-allocate, using the longest |
| // string above as the base metric. |
| const int kLongest = 21; // The strlen of longest string above. |
| const int count = CountOnes(flags); |
| char* str; |
| char* cp; |
| cp = str = reinterpret_cast<char*>(malloc(count * (kLongest + 1) + 1)); |
| |
| for (int i = 0; i < kNumFlags; i++) { |
| if (flags & 0x01) { |
| const char* accessStr = kAccessStrings[for_what][i]; |
| const int len = strlen(accessStr); |
| if (cp != str) { |
| *cp++ = ' '; |
| } |
| memcpy(cp, accessStr, len); |
| cp += len; |
| } |
| flags >>= 1; |
| } // for |
| |
| *cp = '\0'; |
| return str; |
| } |
| |
| static std::string GetSignatureForProtoId(const dex_ir::ProtoId* proto) { |
| if (proto == nullptr) { |
| return "<no signature>"; |
| } |
| |
| std::string result("("); |
| const dex_ir::TypeList* type_list = proto->Parameters(); |
| if (type_list != nullptr) { |
| for (const dex_ir::TypeId* type_id : *type_list->GetTypeList()) { |
| result += type_id->GetStringId()->Data(); |
| } |
| } |
| result += ")"; |
| result += proto->ReturnType()->GetStringId()->Data(); |
| return result; |
| } |
| |
| /* |
| * Copies character data from "data" to "out", converting non-ASCII values |
| * to fprintf format chars or an ASCII filler ('.' or '?'). |
| * |
| * The output buffer must be able to hold (2*len)+1 bytes. The result is |
| * NULL-terminated. |
| */ |
| static void Asciify(char* out, const unsigned char* data, size_t len) { |
| while (len--) { |
| if (*data < 0x20) { |
| // Could do more here, but we don't need them yet. |
| switch (*data) { |
| case '\0': |
| *out++ = '\\'; |
| *out++ = '0'; |
| break; |
| case '\n': |
| *out++ = '\\'; |
| *out++ = 'n'; |
| break; |
| default: |
| *out++ = '.'; |
| break; |
| } // switch |
| } else if (*data >= 0x80) { |
| *out++ = '?'; |
| } else { |
| *out++ = *data; |
| } |
| data++; |
| } // while |
| *out = '\0'; |
| } |
| |
| /* |
| * Dumps a string value with some escape characters. |
| */ |
| static void DumpEscapedString(const char* p, FILE* out_file) { |
| fputs("\"", out_file); |
| for (; *p; p++) { |
| switch (*p) { |
| case '\\': |
| fputs("\\\\", out_file); |
| break; |
| case '\"': |
| fputs("\\\"", out_file); |
| break; |
| case '\t': |
| fputs("\\t", out_file); |
| break; |
| case '\n': |
| fputs("\\n", out_file); |
| break; |
| case '\r': |
| fputs("\\r", out_file); |
| break; |
| default: |
| putc(*p, out_file); |
| } // switch |
| } // for |
| fputs("\"", out_file); |
| } |
| |
| /* |
| * Dumps a string as an XML attribute value. |
| */ |
| static void DumpXmlAttribute(const char* p, FILE* out_file) { |
| for (; *p; p++) { |
| switch (*p) { |
| case '&': |
| fputs("&", out_file); |
| break; |
| case '<': |
| fputs("<", out_file); |
| break; |
| case '>': |
| fputs(">", out_file); |
| break; |
| case '"': |
| fputs(""", out_file); |
| break; |
| case '\t': |
| fputs("	", out_file); |
| break; |
| case '\n': |
| fputs("
", out_file); |
| break; |
| case '\r': |
| fputs("
", out_file); |
| break; |
| default: |
| putc(*p, out_file); |
| } // switch |
| } // for |
| } |
| |
| /* |
| * Helper for dumpInstruction(), which builds the string |
| * representation for the index in the given instruction. |
| * Returns a pointer to a buffer of sufficient size. |
| */ |
| static std::unique_ptr<char[]> IndexString(dex_ir::Header* header, |
| const Instruction* dec_insn, |
| size_t buf_size) { |
| std::unique_ptr<char[]> buf(new char[buf_size]); |
| // Determine index and width of the string. |
| uint32_t index = 0; |
| uint32_t secondary_index = dex::kDexNoIndex; |
| uint32_t width = 4; |
| switch (Instruction::FormatOf(dec_insn->Opcode())) { |
| // SOME NOT SUPPORTED: |
| // case Instruction::k20bc: |
| case Instruction::k21c: |
| case Instruction::k35c: |
| // case Instruction::k35ms: |
| case Instruction::k3rc: |
| // case Instruction::k3rms: |
| // case Instruction::k35mi: |
| // case Instruction::k3rmi: |
| index = dec_insn->VRegB(); |
| width = 4; |
| break; |
| case Instruction::k31c: |
| index = dec_insn->VRegB(); |
| width = 8; |
| break; |
| case Instruction::k22c: |
| // case Instruction::k22cs: |
| index = dec_insn->VRegC(); |
| width = 4; |
| break; |
| case Instruction::k45cc: |
| case Instruction::k4rcc: |
| index = dec_insn->VRegB(); |
| secondary_index = dec_insn->VRegH(); |
| width = 4; |
| break; |
| default: |
| break; |
| } // switch |
| |
| // Determine index type. |
| size_t outSize = 0; |
| switch (Instruction::IndexTypeOf(dec_insn->Opcode())) { |
| case Instruction::kIndexUnknown: |
| // This function should never get called for this type, but do |
| // something sensible here, just to help with debugging. |
| outSize = snprintf(buf.get(), buf_size, "<unknown-index>"); |
| break; |
| case Instruction::kIndexNone: |
| // This function should never get called for this type, but do |
| // something sensible here, just to help with debugging. |
| outSize = snprintf(buf.get(), buf_size, "<no-index>"); |
| break; |
| case Instruction::kIndexTypeRef: |
| if (index < header->GetCollections().TypeIdsSize()) { |
| const char* tp = header->GetCollections().GetTypeId(index)->GetStringId()->Data(); |
| outSize = snprintf(buf.get(), buf_size, "%s // type@%0*x", tp, width, index); |
| } else { |
| outSize = snprintf(buf.get(), buf_size, "<type?> // type@%0*x", width, index); |
| } |
| break; |
| case Instruction::kIndexStringRef: |
| if (index < header->GetCollections().StringIdsSize()) { |
| const char* st = header->GetCollections().GetStringId(index)->Data(); |
| outSize = snprintf(buf.get(), buf_size, "\"%s\" // string@%0*x", st, width, index); |
| } else { |
| outSize = snprintf(buf.get(), buf_size, "<string?> // string@%0*x", width, index); |
| } |
| break; |
| case Instruction::kIndexMethodRef: |
| if (index < header->GetCollections().MethodIdsSize()) { |
| dex_ir::MethodId* method_id = header->GetCollections().GetMethodId(index); |
| const char* name = method_id->Name()->Data(); |
| std::string type_descriptor = GetSignatureForProtoId(method_id->Proto()); |
| const char* back_descriptor = method_id->Class()->GetStringId()->Data(); |
| outSize = snprintf(buf.get(), buf_size, "%s.%s:%s // method@%0*x", |
| back_descriptor, name, type_descriptor.c_str(), width, index); |
| } else { |
| outSize = snprintf(buf.get(), buf_size, "<method?> // method@%0*x", width, index); |
| } |
| break; |
| case Instruction::kIndexFieldRef: |
| if (index < header->GetCollections().FieldIdsSize()) { |
| dex_ir::FieldId* field_id = header->GetCollections().GetFieldId(index); |
| const char* name = field_id->Name()->Data(); |
| const char* type_descriptor = field_id->Type()->GetStringId()->Data(); |
| const char* back_descriptor = field_id->Class()->GetStringId()->Data(); |
| outSize = snprintf(buf.get(), buf_size, "%s.%s:%s // field@%0*x", |
| back_descriptor, name, type_descriptor, width, index); |
| } else { |
| outSize = snprintf(buf.get(), buf_size, "<field?> // field@%0*x", width, index); |
| } |
| break; |
| case Instruction::kIndexVtableOffset: |
| outSize = snprintf(buf.get(), buf_size, "[%0*x] // vtable #%0*x", |
| width, index, width, index); |
| break; |
| case Instruction::kIndexFieldOffset: |
| outSize = snprintf(buf.get(), buf_size, "[obj+%0*x]", width, index); |
| break; |
| case Instruction::kIndexMethodAndProtoRef: { |
| std::string method("<method?>"); |
| std::string proto("<proto?>"); |
| if (index < header->GetCollections().MethodIdsSize()) { |
| dex_ir::MethodId* method_id = header->GetCollections().GetMethodId(index); |
| const char* name = method_id->Name()->Data(); |
| std::string type_descriptor = GetSignatureForProtoId(method_id->Proto()); |
| const char* back_descriptor = method_id->Class()->GetStringId()->Data(); |
| method = StringPrintf("%s.%s:%s", back_descriptor, name, type_descriptor.c_str()); |
| } |
| if (secondary_index < header->GetCollections().ProtoIdsSize()) { |
| dex_ir::ProtoId* proto_id = header->GetCollections().GetProtoId(secondary_index); |
| proto = GetSignatureForProtoId(proto_id); |
| } |
| outSize = snprintf(buf.get(), buf_size, "%s, %s // method@%0*x, proto@%0*x", |
| method.c_str(), proto.c_str(), width, index, width, secondary_index); |
| } |
| break; |
| // SOME NOT SUPPORTED: |
| // case Instruction::kIndexVaries: |
| // case Instruction::kIndexInlineMethod: |
| default: |
| outSize = snprintf(buf.get(), buf_size, "<?>"); |
| break; |
| } // switch |
| |
| // Determine success of string construction. |
| if (outSize >= buf_size) { |
| // The buffer wasn't big enough; retry with computed size. Note: snprintf() |
| // doesn't count/ the '\0' as part of its returned size, so we add explicit |
| // space for it here. |
| return IndexString(header, dec_insn, outSize + 1); |
| } |
| return buf; |
| } |
| |
| /* |
| * Dumps encoded annotation. |
| */ |
| void DexLayout::DumpEncodedAnnotation(dex_ir::EncodedAnnotation* annotation) { |
| fputs(annotation->GetType()->GetStringId()->Data(), out_file_); |
| // Display all name=value pairs. |
| for (auto& subannotation : *annotation->GetAnnotationElements()) { |
| fputc(' ', out_file_); |
| fputs(subannotation->GetName()->Data(), out_file_); |
| fputc('=', out_file_); |
| DumpEncodedValue(subannotation->GetValue()); |
| } |
| } |
| /* |
| * Dumps encoded value. |
| */ |
| void DexLayout::DumpEncodedValue(const dex_ir::EncodedValue* data) { |
| switch (data->Type()) { |
| case DexFile::kDexAnnotationByte: |
| fprintf(out_file_, "%" PRId8, data->GetByte()); |
| break; |
| case DexFile::kDexAnnotationShort: |
| fprintf(out_file_, "%" PRId16, data->GetShort()); |
| break; |
| case DexFile::kDexAnnotationChar: |
| fprintf(out_file_, "%" PRIu16, data->GetChar()); |
| break; |
| case DexFile::kDexAnnotationInt: |
| fprintf(out_file_, "%" PRId32, data->GetInt()); |
| break; |
| case DexFile::kDexAnnotationLong: |
| fprintf(out_file_, "%" PRId64, data->GetLong()); |
| break; |
| case DexFile::kDexAnnotationFloat: { |
| fprintf(out_file_, "%g", data->GetFloat()); |
| break; |
| } |
| case DexFile::kDexAnnotationDouble: { |
| fprintf(out_file_, "%g", data->GetDouble()); |
| break; |
| } |
| case DexFile::kDexAnnotationString: { |
| dex_ir::StringId* string_id = data->GetStringId(); |
| if (options_.output_format_ == kOutputPlain) { |
| DumpEscapedString(string_id->Data(), out_file_); |
| } else { |
| DumpXmlAttribute(string_id->Data(), out_file_); |
| } |
| break; |
| } |
| case DexFile::kDexAnnotationType: { |
| dex_ir::TypeId* type_id = data->GetTypeId(); |
| fputs(type_id->GetStringId()->Data(), out_file_); |
| break; |
| } |
| case DexFile::kDexAnnotationField: |
| case DexFile::kDexAnnotationEnum: { |
| dex_ir::FieldId* field_id = data->GetFieldId(); |
| fputs(field_id->Name()->Data(), out_file_); |
| break; |
| } |
| case DexFile::kDexAnnotationMethod: { |
| dex_ir::MethodId* method_id = data->GetMethodId(); |
| fputs(method_id->Name()->Data(), out_file_); |
| break; |
| } |
| case DexFile::kDexAnnotationArray: { |
| fputc('{', out_file_); |
| // Display all elements. |
| for (auto& value : *data->GetEncodedArray()->GetEncodedValues()) { |
| fputc(' ', out_file_); |
| DumpEncodedValue(value.get()); |
| } |
| fputs(" }", out_file_); |
| break; |
| } |
| case DexFile::kDexAnnotationAnnotation: { |
| DumpEncodedAnnotation(data->GetEncodedAnnotation()); |
| break; |
| } |
| case DexFile::kDexAnnotationNull: |
| fputs("null", out_file_); |
| break; |
| case DexFile::kDexAnnotationBoolean: |
| fputs(StrBool(data->GetBoolean()), out_file_); |
| break; |
| default: |
| fputs("????", out_file_); |
| break; |
| } // switch |
| } |
| |
| /* |
| * Dumps the file header. |
| */ |
| void DexLayout::DumpFileHeader() { |
| char sanitized[8 * 2 + 1]; |
| dex_ir::Collections& collections = header_->GetCollections(); |
| fprintf(out_file_, "DEX file header:\n"); |
| Asciify(sanitized, header_->Magic(), 8); |
| fprintf(out_file_, "magic : '%s'\n", sanitized); |
| fprintf(out_file_, "checksum : %08x\n", header_->Checksum()); |
| fprintf(out_file_, "signature : %02x%02x...%02x%02x\n", |
| header_->Signature()[0], header_->Signature()[1], |
| header_->Signature()[DexFile::kSha1DigestSize - 2], |
| header_->Signature()[DexFile::kSha1DigestSize - 1]); |
| fprintf(out_file_, "file_size : %d\n", header_->FileSize()); |
| fprintf(out_file_, "header_size : %d\n", header_->HeaderSize()); |
| fprintf(out_file_, "link_size : %d\n", header_->LinkSize()); |
| fprintf(out_file_, "link_off : %d (0x%06x)\n", |
| header_->LinkOffset(), header_->LinkOffset()); |
| fprintf(out_file_, "string_ids_size : %d\n", collections.StringIdsSize()); |
| fprintf(out_file_, "string_ids_off : %d (0x%06x)\n", |
| collections.StringIdsOffset(), collections.StringIdsOffset()); |
| fprintf(out_file_, "type_ids_size : %d\n", collections.TypeIdsSize()); |
| fprintf(out_file_, "type_ids_off : %d (0x%06x)\n", |
| collections.TypeIdsOffset(), collections.TypeIdsOffset()); |
| fprintf(out_file_, "proto_ids_size : %d\n", collections.ProtoIdsSize()); |
| fprintf(out_file_, "proto_ids_off : %d (0x%06x)\n", |
| collections.ProtoIdsOffset(), collections.ProtoIdsOffset()); |
| fprintf(out_file_, "field_ids_size : %d\n", collections.FieldIdsSize()); |
| fprintf(out_file_, "field_ids_off : %d (0x%06x)\n", |
| collections.FieldIdsOffset(), collections.FieldIdsOffset()); |
| fprintf(out_file_, "method_ids_size : %d\n", collections.MethodIdsSize()); |
| fprintf(out_file_, "method_ids_off : %d (0x%06x)\n", |
| collections.MethodIdsOffset(), collections.MethodIdsOffset()); |
| fprintf(out_file_, "class_defs_size : %d\n", collections.ClassDefsSize()); |
| fprintf(out_file_, "class_defs_off : %d (0x%06x)\n", |
| collections.ClassDefsOffset(), collections.ClassDefsOffset()); |
| fprintf(out_file_, "data_size : %d\n", header_->DataSize()); |
| fprintf(out_file_, "data_off : %d (0x%06x)\n\n", |
| header_->DataOffset(), header_->DataOffset()); |
| } |
| |
| /* |
| * Dumps a class_def_item. |
| */ |
| void DexLayout::DumpClassDef(int idx) { |
| // General class information. |
| dex_ir::ClassDef* class_def = header_->GetCollections().GetClassDef(idx); |
| fprintf(out_file_, "Class #%d header:\n", idx); |
| fprintf(out_file_, "class_idx : %d\n", class_def->ClassType()->GetIndex()); |
| fprintf(out_file_, "access_flags : %d (0x%04x)\n", |
| class_def->GetAccessFlags(), class_def->GetAccessFlags()); |
| uint32_t superclass_idx = class_def->Superclass() == nullptr ? |
| DexFile::kDexNoIndex16 : class_def->Superclass()->GetIndex(); |
| fprintf(out_file_, "superclass_idx : %d\n", superclass_idx); |
| fprintf(out_file_, "interfaces_off : %d (0x%06x)\n", |
| class_def->InterfacesOffset(), class_def->InterfacesOffset()); |
| uint32_t source_file_offset = 0xffffffffU; |
| if (class_def->SourceFile() != nullptr) { |
| source_file_offset = class_def->SourceFile()->GetIndex(); |
| } |
| fprintf(out_file_, "source_file_idx : %d\n", source_file_offset); |
| uint32_t annotations_offset = 0; |
| if (class_def->Annotations() != nullptr) { |
| annotations_offset = class_def->Annotations()->GetOffset(); |
| } |
| fprintf(out_file_, "annotations_off : %d (0x%06x)\n", |
| annotations_offset, annotations_offset); |
| if (class_def->GetClassData() == nullptr) { |
| fprintf(out_file_, "class_data_off : %d (0x%06x)\n", 0, 0); |
| } else { |
| fprintf(out_file_, "class_data_off : %d (0x%06x)\n", |
| class_def->GetClassData()->GetOffset(), class_def->GetClassData()->GetOffset()); |
| } |
| |
| // Fields and methods. |
| dex_ir::ClassData* class_data = class_def->GetClassData(); |
| if (class_data != nullptr && class_data->StaticFields() != nullptr) { |
| fprintf(out_file_, "static_fields_size : %zu\n", class_data->StaticFields()->size()); |
| } else { |
| fprintf(out_file_, "static_fields_size : 0\n"); |
| } |
| if (class_data != nullptr && class_data->InstanceFields() != nullptr) { |
| fprintf(out_file_, "instance_fields_size: %zu\n", class_data->InstanceFields()->size()); |
| } else { |
| fprintf(out_file_, "instance_fields_size: 0\n"); |
| } |
| if (class_data != nullptr && class_data->DirectMethods() != nullptr) { |
| fprintf(out_file_, "direct_methods_size : %zu\n", class_data->DirectMethods()->size()); |
| } else { |
| fprintf(out_file_, "direct_methods_size : 0\n"); |
| } |
| if (class_data != nullptr && class_data->VirtualMethods() != nullptr) { |
| fprintf(out_file_, "virtual_methods_size: %zu\n", class_data->VirtualMethods()->size()); |
| } else { |
| fprintf(out_file_, "virtual_methods_size: 0\n"); |
| } |
| fprintf(out_file_, "\n"); |
| } |
| |
| /** |
| * Dumps an annotation set item. |
| */ |
| void DexLayout::DumpAnnotationSetItem(dex_ir::AnnotationSetItem* set_item) { |
| if (set_item == nullptr || set_item->GetItems()->size() == 0) { |
| fputs(" empty-annotation-set\n", out_file_); |
| return; |
| } |
| for (dex_ir::AnnotationItem* annotation : *set_item->GetItems()) { |
| if (annotation == nullptr) { |
| continue; |
| } |
| fputs(" ", out_file_); |
| switch (annotation->GetVisibility()) { |
| case DexFile::kDexVisibilityBuild: fputs("VISIBILITY_BUILD ", out_file_); break; |
| case DexFile::kDexVisibilityRuntime: fputs("VISIBILITY_RUNTIME ", out_file_); break; |
| case DexFile::kDexVisibilitySystem: fputs("VISIBILITY_SYSTEM ", out_file_); break; |
| default: fputs("VISIBILITY_UNKNOWN ", out_file_); break; |
| } // switch |
| DumpEncodedAnnotation(annotation->GetAnnotation()); |
| fputc('\n', out_file_); |
| } |
| } |
| |
| /* |
| * Dumps class annotations. |
| */ |
| void DexLayout::DumpClassAnnotations(int idx) { |
| dex_ir::ClassDef* class_def = header_->GetCollections().GetClassDef(idx); |
| dex_ir::AnnotationsDirectoryItem* annotations_directory = class_def->Annotations(); |
| if (annotations_directory == nullptr) { |
| return; // none |
| } |
| |
| fprintf(out_file_, "Class #%d annotations:\n", idx); |
| |
| dex_ir::AnnotationSetItem* class_set_item = annotations_directory->GetClassAnnotation(); |
| dex_ir::FieldAnnotationVector* fields = annotations_directory->GetFieldAnnotations(); |
| dex_ir::MethodAnnotationVector* methods = annotations_directory->GetMethodAnnotations(); |
| dex_ir::ParameterAnnotationVector* parameters = annotations_directory->GetParameterAnnotations(); |
| |
| // Annotations on the class itself. |
| if (class_set_item != nullptr) { |
| fprintf(out_file_, "Annotations on class\n"); |
| DumpAnnotationSetItem(class_set_item); |
| } |
| |
| // Annotations on fields. |
| if (fields != nullptr) { |
| for (auto& field : *fields) { |
| const dex_ir::FieldId* field_id = field->GetFieldId(); |
| const uint32_t field_idx = field_id->GetIndex(); |
| const char* field_name = field_id->Name()->Data(); |
| fprintf(out_file_, "Annotations on field #%u '%s'\n", field_idx, field_name); |
| DumpAnnotationSetItem(field->GetAnnotationSetItem()); |
| } |
| } |
| |
| // Annotations on methods. |
| if (methods != nullptr) { |
| for (auto& method : *methods) { |
| const dex_ir::MethodId* method_id = method->GetMethodId(); |
| const uint32_t method_idx = method_id->GetIndex(); |
| const char* method_name = method_id->Name()->Data(); |
| fprintf(out_file_, "Annotations on method #%u '%s'\n", method_idx, method_name); |
| DumpAnnotationSetItem(method->GetAnnotationSetItem()); |
| } |
| } |
| |
| // Annotations on method parameters. |
| if (parameters != nullptr) { |
| for (auto& parameter : *parameters) { |
| const dex_ir::MethodId* method_id = parameter->GetMethodId(); |
| const uint32_t method_idx = method_id->GetIndex(); |
| const char* method_name = method_id->Name()->Data(); |
| fprintf(out_file_, "Annotations on method #%u '%s' parameters\n", method_idx, method_name); |
| uint32_t j = 0; |
| for (dex_ir::AnnotationSetItem* annotation : *parameter->GetAnnotations()->GetItems()) { |
| fprintf(out_file_, "#%u\n", j); |
| DumpAnnotationSetItem(annotation); |
| ++j; |
| } |
| } |
| } |
| |
| fputc('\n', out_file_); |
| } |
| |
| /* |
| * Dumps an interface that a class declares to implement. |
| */ |
| void DexLayout::DumpInterface(const dex_ir::TypeId* type_item, int i) { |
| const char* interface_name = type_item->GetStringId()->Data(); |
| if (options_.output_format_ == kOutputPlain) { |
| fprintf(out_file_, " #%d : '%s'\n", i, interface_name); |
| } else { |
| std::string dot(DescriptorToDotWrapper(interface_name)); |
| fprintf(out_file_, "<implements name=\"%s\">\n</implements>\n", dot.c_str()); |
| } |
| } |
| |
| /* |
| * Dumps the catches table associated with the code. |
| */ |
| void DexLayout::DumpCatches(const dex_ir::CodeItem* code) { |
| const uint16_t tries_size = code->TriesSize(); |
| |
| // No catch table. |
| if (tries_size == 0) { |
| fprintf(out_file_, " catches : (none)\n"); |
| return; |
| } |
| |
| // Dump all table entries. |
| fprintf(out_file_, " catches : %d\n", tries_size); |
| std::vector<std::unique_ptr<const dex_ir::TryItem>>* tries = code->Tries(); |
| for (uint32_t i = 0; i < tries_size; i++) { |
| const dex_ir::TryItem* try_item = (*tries)[i].get(); |
| const uint32_t start = try_item->StartAddr(); |
| const uint32_t end = start + try_item->InsnCount(); |
| fprintf(out_file_, " 0x%04x - 0x%04x\n", start, end); |
| for (auto& handler : *try_item->GetHandlers()->GetHandlers()) { |
| const dex_ir::TypeId* type_id = handler->GetTypeId(); |
| const char* descriptor = (type_id == nullptr) ? "<any>" : type_id->GetStringId()->Data(); |
| fprintf(out_file_, " %s -> 0x%04x\n", descriptor, handler->GetAddress()); |
| } // for |
| } // for |
| } |
| |
| /* |
| * Dumps a single instruction. |
| */ |
| void DexLayout::DumpInstruction(const dex_ir::CodeItem* code, |
| uint32_t code_offset, |
| uint32_t insn_idx, |
| uint32_t insn_width, |
| const Instruction* dec_insn) { |
| // Address of instruction (expressed as byte offset). |
| fprintf(out_file_, "%06x:", code_offset + 0x10 + insn_idx * 2); |
| |
| // Dump (part of) raw bytes. |
| const uint16_t* insns = code->Insns(); |
| for (uint32_t i = 0; i < 8; i++) { |
| if (i < insn_width) { |
| if (i == 7) { |
| fprintf(out_file_, " ... "); |
| } else { |
| // Print 16-bit value in little-endian order. |
| const uint8_t* bytePtr = (const uint8_t*) &insns[insn_idx + i]; |
| fprintf(out_file_, " %02x%02x", bytePtr[0], bytePtr[1]); |
| } |
| } else { |
| fputs(" ", out_file_); |
| } |
| } // for |
| |
| // Dump pseudo-instruction or opcode. |
| if (dec_insn->Opcode() == Instruction::NOP) { |
| const uint16_t instr = Get2LE((const uint8_t*) &insns[insn_idx]); |
| if (instr == Instruction::kPackedSwitchSignature) { |
| fprintf(out_file_, "|%04x: packed-switch-data (%d units)", insn_idx, insn_width); |
| } else if (instr == Instruction::kSparseSwitchSignature) { |
| fprintf(out_file_, "|%04x: sparse-switch-data (%d units)", insn_idx, insn_width); |
| } else if (instr == Instruction::kArrayDataSignature) { |
| fprintf(out_file_, "|%04x: array-data (%d units)", insn_idx, insn_width); |
| } else { |
| fprintf(out_file_, "|%04x: nop // spacer", insn_idx); |
| } |
| } else { |
| fprintf(out_file_, "|%04x: %s", insn_idx, dec_insn->Name()); |
| } |
| |
| // Set up additional argument. |
| std::unique_ptr<char[]> index_buf; |
| if (Instruction::IndexTypeOf(dec_insn->Opcode()) != Instruction::kIndexNone) { |
| index_buf = IndexString(header_, dec_insn, 200); |
| } |
| |
| // Dump the instruction. |
| // |
| // NOTE: pDecInsn->DumpString(pDexFile) differs too much from original. |
| // |
| switch (Instruction::FormatOf(dec_insn->Opcode())) { |
| case Instruction::k10x: // op |
| break; |
| case Instruction::k12x: // op vA, vB |
| fprintf(out_file_, " v%d, v%d", dec_insn->VRegA(), dec_insn->VRegB()); |
| break; |
| case Instruction::k11n: // op vA, #+B |
| fprintf(out_file_, " v%d, #int %d // #%x", |
| dec_insn->VRegA(), (int32_t) dec_insn->VRegB(), (uint8_t)dec_insn->VRegB()); |
| break; |
| case Instruction::k11x: // op vAA |
| fprintf(out_file_, " v%d", dec_insn->VRegA()); |
| break; |
| case Instruction::k10t: // op +AA |
| case Instruction::k20t: { // op +AAAA |
| const int32_t targ = (int32_t) dec_insn->VRegA(); |
| fprintf(out_file_, " %04x // %c%04x", |
| insn_idx + targ, |
| (targ < 0) ? '-' : '+', |
| (targ < 0) ? -targ : targ); |
| break; |
| } |
| case Instruction::k22x: // op vAA, vBBBB |
| fprintf(out_file_, " v%d, v%d", dec_insn->VRegA(), dec_insn->VRegB()); |
| break; |
| case Instruction::k21t: { // op vAA, +BBBB |
| const int32_t targ = (int32_t) dec_insn->VRegB(); |
| fprintf(out_file_, " v%d, %04x // %c%04x", dec_insn->VRegA(), |
| insn_idx + targ, |
| (targ < 0) ? '-' : '+', |
| (targ < 0) ? -targ : targ); |
| break; |
| } |
| case Instruction::k21s: // op vAA, #+BBBB |
| fprintf(out_file_, " v%d, #int %d // #%x", |
| dec_insn->VRegA(), (int32_t) dec_insn->VRegB(), (uint16_t)dec_insn->VRegB()); |
| break; |
| case Instruction::k21h: // op vAA, #+BBBB0000[00000000] |
| // The printed format varies a bit based on the actual opcode. |
| if (dec_insn->Opcode() == Instruction::CONST_HIGH16) { |
| const int32_t value = dec_insn->VRegB() << 16; |
| fprintf(out_file_, " v%d, #int %d // #%x", |
| dec_insn->VRegA(), value, (uint16_t) dec_insn->VRegB()); |
| } else { |
| const int64_t value = ((int64_t) dec_insn->VRegB()) << 48; |
| fprintf(out_file_, " v%d, #long %" PRId64 " // #%x", |
| dec_insn->VRegA(), value, (uint16_t) dec_insn->VRegB()); |
| } |
| break; |
| case Instruction::k21c: // op vAA, thing@BBBB |
| case Instruction::k31c: // op vAA, thing@BBBBBBBB |
| fprintf(out_file_, " v%d, %s", dec_insn->VRegA(), index_buf.get()); |
| break; |
| case Instruction::k23x: // op vAA, vBB, vCC |
| fprintf(out_file_, " v%d, v%d, v%d", |
| dec_insn->VRegA(), dec_insn->VRegB(), dec_insn->VRegC()); |
| break; |
| case Instruction::k22b: // op vAA, vBB, #+CC |
| fprintf(out_file_, " v%d, v%d, #int %d // #%02x", |
| dec_insn->VRegA(), dec_insn->VRegB(), |
| (int32_t) dec_insn->VRegC(), (uint8_t) dec_insn->VRegC()); |
| break; |
| case Instruction::k22t: { // op vA, vB, +CCCC |
| const int32_t targ = (int32_t) dec_insn->VRegC(); |
| fprintf(out_file_, " v%d, v%d, %04x // %c%04x", |
| dec_insn->VRegA(), dec_insn->VRegB(), |
| insn_idx + targ, |
| (targ < 0) ? '-' : '+', |
| (targ < 0) ? -targ : targ); |
| break; |
| } |
| case Instruction::k22s: // op vA, vB, #+CCCC |
| fprintf(out_file_, " v%d, v%d, #int %d // #%04x", |
| dec_insn->VRegA(), dec_insn->VRegB(), |
| (int32_t) dec_insn->VRegC(), (uint16_t) dec_insn->VRegC()); |
| break; |
| case Instruction::k22c: // op vA, vB, thing@CCCC |
| // NOT SUPPORTED: |
| // case Instruction::k22cs: // [opt] op vA, vB, field offset CCCC |
| fprintf(out_file_, " v%d, v%d, %s", |
| dec_insn->VRegA(), dec_insn->VRegB(), index_buf.get()); |
| break; |
| case Instruction::k30t: |
| fprintf(out_file_, " #%08x", dec_insn->VRegA()); |
| break; |
| case Instruction::k31i: { // op vAA, #+BBBBBBBB |
| // This is often, but not always, a float. |
| union { |
| float f; |
| uint32_t i; |
| } conv; |
| conv.i = dec_insn->VRegB(); |
| fprintf(out_file_, " v%d, #float %g // #%08x", |
| dec_insn->VRegA(), conv.f, dec_insn->VRegB()); |
| break; |
| } |
| case Instruction::k31t: // op vAA, offset +BBBBBBBB |
| fprintf(out_file_, " v%d, %08x // +%08x", |
| dec_insn->VRegA(), insn_idx + dec_insn->VRegB(), dec_insn->VRegB()); |
| break; |
| case Instruction::k32x: // op vAAAA, vBBBB |
| fprintf(out_file_, " v%d, v%d", dec_insn->VRegA(), dec_insn->VRegB()); |
| break; |
| case Instruction::k35c: // op {vC, vD, vE, vF, vG}, thing@BBBB |
| case Instruction::k45cc: { // op {vC, vD, vE, vF, vG}, meth@BBBB, proto@HHHH |
| // NOT SUPPORTED: |
| // case Instruction::k35ms: // [opt] invoke-virtual+super |
| // case Instruction::k35mi: // [opt] inline invoke |
| uint32_t arg[Instruction::kMaxVarArgRegs]; |
| dec_insn->GetVarArgs(arg); |
| fputs(" {", out_file_); |
| for (int i = 0, n = dec_insn->VRegA(); i < n; i++) { |
| if (i == 0) { |
| fprintf(out_file_, "v%d", arg[i]); |
| } else { |
| fprintf(out_file_, ", v%d", arg[i]); |
| } |
| } // for |
| fprintf(out_file_, "}, %s", index_buf.get()); |
| break; |
| } |
| case Instruction::k3rc: // op {vCCCC .. v(CCCC+AA-1)}, thing@BBBB |
| case Instruction::k4rcc: // op {vCCCC .. v(CCCC+AA-1)}, meth@BBBB, proto@HHHH |
| // NOT SUPPORTED: |
| // case Instruction::k3rms: // [opt] invoke-virtual+super/range |
| // case Instruction::k3rmi: // [opt] execute-inline/range |
| { |
| // This doesn't match the "dx" output when some of the args are |
| // 64-bit values -- dx only shows the first register. |
| fputs(" {", out_file_); |
| for (int i = 0, n = dec_insn->VRegA(); i < n; i++) { |
| if (i == 0) { |
| fprintf(out_file_, "v%d", dec_insn->VRegC() + i); |
| } else { |
| fprintf(out_file_, ", v%d", dec_insn->VRegC() + i); |
| } |
| } // for |
| fprintf(out_file_, "}, %s", index_buf.get()); |
| } |
| break; |
| case Instruction::k51l: { // op vAA, #+BBBBBBBBBBBBBBBB |
| // This is often, but not always, a double. |
| union { |
| double d; |
| uint64_t j; |
| } conv; |
| conv.j = dec_insn->WideVRegB(); |
| fprintf(out_file_, " v%d, #double %g // #%016" PRIx64, |
| dec_insn->VRegA(), conv.d, dec_insn->WideVRegB()); |
| break; |
| } |
| // NOT SUPPORTED: |
| // case Instruction::k00x: // unknown op or breakpoint |
| // break; |
| default: |
| fprintf(out_file_, " ???"); |
| break; |
| } // switch |
| |
| fputc('\n', out_file_); |
| } |
| |
| /* |
| * Dumps a bytecode disassembly. |
| */ |
| void DexLayout::DumpBytecodes(uint32_t idx, const dex_ir::CodeItem* code, uint32_t code_offset) { |
| dex_ir::MethodId* method_id = header_->GetCollections().GetMethodId(idx); |
| const char* name = method_id->Name()->Data(); |
| std::string type_descriptor = GetSignatureForProtoId(method_id->Proto()); |
| const char* back_descriptor = method_id->Class()->GetStringId()->Data(); |
| |
| // Generate header. |
| std::string dot(DescriptorToDotWrapper(back_descriptor)); |
| fprintf(out_file_, "%06x: |[%06x] %s.%s:%s\n", |
| code_offset, code_offset, dot.c_str(), name, type_descriptor.c_str()); |
| |
| // Iterate over all instructions. |
| for (const DexInstructionPcPair& inst : code->Instructions()) { |
| const uint32_t insn_width = inst->SizeInCodeUnits(); |
| if (insn_width == 0) { |
| fprintf(stderr, "GLITCH: zero-width instruction at idx=0x%04x\n", inst.DexPc()); |
| break; |
| } |
| DumpInstruction(code, code_offset, inst.DexPc(), insn_width, &inst.Inst()); |
| } // for |
| } |
| |
| /* |
| * Callback for dumping each positions table entry. |
| */ |
| static bool DumpPositionsCb(void* context, const DexFile::PositionInfo& entry) { |
| FILE* out_file = reinterpret_cast<FILE*>(context); |
| fprintf(out_file, " 0x%04x line=%d\n", entry.address_, entry.line_); |
| return false; |
| } |
| |
| /* |
| * Callback for dumping locals table entry. |
| */ |
| static void DumpLocalsCb(void* context, const DexFile::LocalInfo& entry) { |
| const char* signature = entry.signature_ != nullptr ? entry.signature_ : ""; |
| FILE* out_file = reinterpret_cast<FILE*>(context); |
| fprintf(out_file, " 0x%04x - 0x%04x reg=%d %s %s %s\n", |
| entry.start_address_, entry.end_address_, entry.reg_, |
| entry.name_, entry.descriptor_, signature); |
| } |
| |
| /* |
| * Lookup functions. |
| */ |
| static const char* StringDataByIdx(uint32_t idx, dex_ir::Collections& collections) { |
| dex_ir::StringId* string_id = collections.GetStringIdOrNullPtr(idx); |
| if (string_id == nullptr) { |
| return nullptr; |
| } |
| return string_id->Data(); |
| } |
| |
| static const char* StringDataByTypeIdx(uint16_t idx, dex_ir::Collections& collections) { |
| dex_ir::TypeId* type_id = collections.GetTypeIdOrNullPtr(idx); |
| if (type_id == nullptr) { |
| return nullptr; |
| } |
| dex_ir::StringId* string_id = type_id->GetStringId(); |
| if (string_id == nullptr) { |
| return nullptr; |
| } |
| return string_id->Data(); |
| } |
| |
| |
| /* |
| * Dumps code of a method. |
| */ |
| void DexLayout::DumpCode(uint32_t idx, |
| const dex_ir::CodeItem* code, |
| uint32_t code_offset, |
| const char* declaring_class_descriptor, |
| const char* method_name, |
| bool is_static, |
| const dex_ir::ProtoId* proto) { |
| fprintf(out_file_, " registers : %d\n", code->RegistersSize()); |
| fprintf(out_file_, " ins : %d\n", code->InsSize()); |
| fprintf(out_file_, " outs : %d\n", code->OutsSize()); |
| fprintf(out_file_, " insns size : %d 16-bit code units\n", |
| code->InsnsSize()); |
| |
| // Bytecode disassembly, if requested. |
| if (options_.disassemble_) { |
| DumpBytecodes(idx, code, code_offset); |
| } |
| |
| // Try-catch blocks. |
| DumpCatches(code); |
| |
| // Positions and locals table in the debug info. |
| dex_ir::DebugInfoItem* debug_info = code->DebugInfo(); |
| fprintf(out_file_, " positions : \n"); |
| if (debug_info != nullptr) { |
| DexFile::DecodeDebugPositionInfo(debug_info->GetDebugInfo(), |
| [this](uint32_t idx) { |
| return StringDataByIdx(idx, this->header_->GetCollections()); |
| }, |
| DumpPositionsCb, |
| out_file_); |
| } |
| fprintf(out_file_, " locals : \n"); |
| if (debug_info != nullptr) { |
| std::vector<const char*> arg_descriptors; |
| const dex_ir::TypeList* parameters = proto->Parameters(); |
| if (parameters != nullptr) { |
| const dex_ir::TypeIdVector* parameter_type_vector = parameters->GetTypeList(); |
| if (parameter_type_vector != nullptr) { |
| for (const dex_ir::TypeId* type_id : *parameter_type_vector) { |
| arg_descriptors.push_back(type_id->GetStringId()->Data()); |
| } |
| } |
| } |
| DexFile::DecodeDebugLocalInfo(debug_info->GetDebugInfo(), |
| "DexLayout in-memory", |
| declaring_class_descriptor, |
| arg_descriptors, |
| method_name, |
| is_static, |
| code->RegistersSize(), |
| code->InsSize(), |
| code->InsnsSize(), |
| [this](uint32_t idx) { |
| return StringDataByIdx(idx, this->header_->GetCollections()); |
| }, |
| [this](uint32_t idx) { |
| return |
| StringDataByTypeIdx(dchecked_integral_cast<uint16_t>(idx), |
| this->header_->GetCollections()); |
| }, |
| DumpLocalsCb, |
| out_file_); |
| } |
| } |
| |
| /* |
| * Dumps a method. |
| */ |
| void DexLayout::DumpMethod(uint32_t idx, uint32_t flags, const dex_ir::CodeItem* code, int i) { |
| // Bail for anything private if export only requested. |
| if (options_.exports_only_ && (flags & (kAccPublic | kAccProtected)) == 0) { |
| return; |
| } |
| |
| dex_ir::MethodId* method_id = header_->GetCollections().GetMethodId(idx); |
| const char* name = method_id->Name()->Data(); |
| char* type_descriptor = strdup(GetSignatureForProtoId(method_id->Proto()).c_str()); |
| const char* back_descriptor = method_id->Class()->GetStringId()->Data(); |
| char* access_str = CreateAccessFlagStr(flags, kAccessForMethod); |
| |
| if (options_.output_format_ == kOutputPlain) { |
| fprintf(out_file_, " #%d : (in %s)\n", i, back_descriptor); |
| fprintf(out_file_, " name : '%s'\n", name); |
| fprintf(out_file_, " type : '%s'\n", type_descriptor); |
| fprintf(out_file_, " access : 0x%04x (%s)\n", flags, access_str); |
| if (code == nullptr) { |
| fprintf(out_file_, " code : (none)\n"); |
| } else { |
| fprintf(out_file_, " code -\n"); |
| DumpCode(idx, |
| code, |
| code->GetOffset(), |
| back_descriptor, |
| name, |
| (flags & kAccStatic) != 0, |
| method_id->Proto()); |
| } |
| if (options_.disassemble_) { |
| fputc('\n', out_file_); |
| } |
| } else if (options_.output_format_ == kOutputXml) { |
| const bool constructor = (name[0] == '<'); |
| |
| // Method name and prototype. |
| if (constructor) { |
| std::string dot(DescriptorClassToDot(back_descriptor)); |
| fprintf(out_file_, "<constructor name=\"%s\"\n", dot.c_str()); |
| dot = DescriptorToDotWrapper(back_descriptor); |
| fprintf(out_file_, " type=\"%s\"\n", dot.c_str()); |
| } else { |
| fprintf(out_file_, "<method name=\"%s\"\n", name); |
| const char* return_type = strrchr(type_descriptor, ')'); |
| if (return_type == nullptr) { |
| fprintf(stderr, "bad method type descriptor '%s'\n", type_descriptor); |
| goto bail; |
| } |
| std::string dot(DescriptorToDotWrapper(return_type + 1)); |
| fprintf(out_file_, " return=\"%s\"\n", dot.c_str()); |
| fprintf(out_file_, " abstract=%s\n", QuotedBool((flags & kAccAbstract) != 0)); |
| fprintf(out_file_, " native=%s\n", QuotedBool((flags & kAccNative) != 0)); |
| fprintf(out_file_, " synchronized=%s\n", QuotedBool( |
| (flags & (kAccSynchronized | kAccDeclaredSynchronized)) != 0)); |
| } |
| |
| // Additional method flags. |
| fprintf(out_file_, " static=%s\n", QuotedBool((flags & kAccStatic) != 0)); |
| fprintf(out_file_, " final=%s\n", QuotedBool((flags & kAccFinal) != 0)); |
| // The "deprecated=" not knowable w/o parsing annotations. |
| fprintf(out_file_, " visibility=%s\n>\n", QuotedVisibility(flags)); |
| |
| // Parameters. |
| if (type_descriptor[0] != '(') { |
| fprintf(stderr, "ERROR: bad descriptor '%s'\n", type_descriptor); |
| goto bail; |
| } |
| char* tmp_buf = reinterpret_cast<char*>(malloc(strlen(type_descriptor) + 1)); |
| const char* base = type_descriptor + 1; |
| int arg_num = 0; |
| while (*base != ')') { |
| char* cp = tmp_buf; |
| while (*base == '[') { |
| *cp++ = *base++; |
| } |
| if (*base == 'L') { |
| // Copy through ';'. |
| do { |
| *cp = *base++; |
| } while (*cp++ != ';'); |
| } else { |
| // Primitive char, copy it. |
| if (strchr("ZBCSIFJD", *base) == nullptr) { |
| fprintf(stderr, "ERROR: bad method signature '%s'\n", base); |
| break; // while |
| } |
| *cp++ = *base++; |
| } |
| // Null terminate and display. |
| *cp++ = '\0'; |
| std::string dot(DescriptorToDotWrapper(tmp_buf)); |
| fprintf(out_file_, "<parameter name=\"arg%d\" type=\"%s\">\n" |
| "</parameter>\n", arg_num++, dot.c_str()); |
| } // while |
| free(tmp_buf); |
| if (constructor) { |
| fprintf(out_file_, "</constructor>\n"); |
| } else { |
| fprintf(out_file_, "</method>\n"); |
| } |
| } |
| |
| bail: |
| free(type_descriptor); |
| free(access_str); |
| } |
| |
| /* |
| * Dumps a static (class) field. |
| */ |
| void DexLayout::DumpSField(uint32_t idx, uint32_t flags, int i, dex_ir::EncodedValue* init) { |
| // Bail for anything private if export only requested. |
| if (options_.exports_only_ && (flags & (kAccPublic | kAccProtected)) == 0) { |
| return; |
| } |
| |
| dex_ir::FieldId* field_id = header_->GetCollections().GetFieldId(idx); |
| const char* name = field_id->Name()->Data(); |
| const char* type_descriptor = field_id->Type()->GetStringId()->Data(); |
| const char* back_descriptor = field_id->Class()->GetStringId()->Data(); |
| char* access_str = CreateAccessFlagStr(flags, kAccessForField); |
| |
| if (options_.output_format_ == kOutputPlain) { |
| fprintf(out_file_, " #%d : (in %s)\n", i, back_descriptor); |
| fprintf(out_file_, " name : '%s'\n", name); |
| fprintf(out_file_, " type : '%s'\n", type_descriptor); |
| fprintf(out_file_, " access : 0x%04x (%s)\n", flags, access_str); |
| if (init != nullptr) { |
| fputs(" value : ", out_file_); |
| DumpEncodedValue(init); |
| fputs("\n", out_file_); |
| } |
| } else if (options_.output_format_ == kOutputXml) { |
| fprintf(out_file_, "<field name=\"%s\"\n", name); |
| std::string dot(DescriptorToDotWrapper(type_descriptor)); |
| fprintf(out_file_, " type=\"%s\"\n", dot.c_str()); |
| fprintf(out_file_, " transient=%s\n", QuotedBool((flags & kAccTransient) != 0)); |
| fprintf(out_file_, " volatile=%s\n", QuotedBool((flags & kAccVolatile) != 0)); |
| // The "value=" is not knowable w/o parsing annotations. |
| fprintf(out_file_, " static=%s\n", QuotedBool((flags & kAccStatic) != 0)); |
| fprintf(out_file_, " final=%s\n", QuotedBool((flags & kAccFinal) != 0)); |
| // The "deprecated=" is not knowable w/o parsing annotations. |
| fprintf(out_file_, " visibility=%s\n", QuotedVisibility(flags)); |
| if (init != nullptr) { |
| fputs(" value=\"", out_file_); |
| DumpEncodedValue(init); |
| fputs("\"\n", out_file_); |
| } |
| fputs(">\n</field>\n", out_file_); |
| } |
| |
| free(access_str); |
| } |
| |
| /* |
| * Dumps an instance field. |
| */ |
| void DexLayout::DumpIField(uint32_t idx, uint32_t flags, int i) { |
| DumpSField(idx, flags, i, nullptr); |
| } |
| |
| /* |
| * Dumps the class. |
| * |
| * Note "idx" is a DexClassDef index, not a DexTypeId index. |
| * |
| * If "*last_package" is nullptr or does not match the current class' package, |
| * the value will be replaced with a newly-allocated string. |
| */ |
| void DexLayout::DumpClass(int idx, char** last_package) { |
| dex_ir::ClassDef* class_def = header_->GetCollections().GetClassDef(idx); |
| // Omitting non-public class. |
| if (options_.exports_only_ && (class_def->GetAccessFlags() & kAccPublic) == 0) { |
| return; |
| } |
| |
| if (options_.show_section_headers_) { |
| DumpClassDef(idx); |
| } |
| |
| if (options_.show_annotations_) { |
| DumpClassAnnotations(idx); |
| } |
| |
| // For the XML output, show the package name. Ideally we'd gather |
| // up the classes, sort them, and dump them alphabetically so the |
| // package name wouldn't jump around, but that's not a great plan |
| // for something that needs to run on the device. |
| const char* class_descriptor = |
| header_->GetCollections().GetClassDef(idx)->ClassType()->GetStringId()->Data(); |
| if (!(class_descriptor[0] == 'L' && |
| class_descriptor[strlen(class_descriptor)-1] == ';')) { |
| // Arrays and primitives should not be defined explicitly. Keep going? |
| fprintf(stderr, "Malformed class name '%s'\n", class_descriptor); |
| } else if (options_.output_format_ == kOutputXml) { |
| char* mangle = strdup(class_descriptor + 1); |
| mangle[strlen(mangle)-1] = '\0'; |
| |
| // Reduce to just the package name. |
| char* last_slash = strrchr(mangle, '/'); |
| if (last_slash != nullptr) { |
| *last_slash = '\0'; |
| } else { |
| *mangle = '\0'; |
| } |
| |
| for (char* cp = mangle; *cp != '\0'; cp++) { |
| if (*cp == '/') { |
| *cp = '.'; |
| } |
| } // for |
| |
| if (*last_package == nullptr || strcmp(mangle, *last_package) != 0) { |
| // Start of a new package. |
| if (*last_package != nullptr) { |
| fprintf(out_file_, "</package>\n"); |
| } |
| fprintf(out_file_, "<package name=\"%s\"\n>\n", mangle); |
| free(*last_package); |
| *last_package = mangle; |
| } else { |
| free(mangle); |
| } |
| } |
| |
| // General class information. |
| char* access_str = CreateAccessFlagStr(class_def->GetAccessFlags(), kAccessForClass); |
| const char* superclass_descriptor = nullptr; |
| if (class_def->Superclass() != nullptr) { |
| superclass_descriptor = class_def->Superclass()->GetStringId()->Data(); |
| } |
| if (options_.output_format_ == kOutputPlain) { |
| fprintf(out_file_, "Class #%d -\n", idx); |
| fprintf(out_file_, " Class descriptor : '%s'\n", class_descriptor); |
| fprintf(out_file_, " Access flags : 0x%04x (%s)\n", |
| class_def->GetAccessFlags(), access_str); |
| if (superclass_descriptor != nullptr) { |
| fprintf(out_file_, " Superclass : '%s'\n", superclass_descriptor); |
| } |
| fprintf(out_file_, " Interfaces -\n"); |
| } else { |
| std::string dot(DescriptorClassToDot(class_descriptor)); |
| fprintf(out_file_, "<class name=\"%s\"\n", dot.c_str()); |
| if (superclass_descriptor != nullptr) { |
| dot = DescriptorToDotWrapper(superclass_descriptor); |
| fprintf(out_file_, " extends=\"%s\"\n", dot.c_str()); |
| } |
| fprintf(out_file_, " interface=%s\n", |
| QuotedBool((class_def->GetAccessFlags() & kAccInterface) != 0)); |
| fprintf(out_file_, " abstract=%s\n", |
| QuotedBool((class_def->GetAccessFlags() & kAccAbstract) != 0)); |
| fprintf(out_file_, " static=%s\n", QuotedBool((class_def->GetAccessFlags() & kAccStatic) != 0)); |
| fprintf(out_file_, " final=%s\n", QuotedBool((class_def->GetAccessFlags() & kAccFinal) != 0)); |
| // The "deprecated=" not knowable w/o parsing annotations. |
| fprintf(out_file_, " visibility=%s\n", QuotedVisibility(class_def->GetAccessFlags())); |
| fprintf(out_file_, ">\n"); |
| } |
| |
| // Interfaces. |
| const dex_ir::TypeList* interfaces = class_def->Interfaces(); |
| if (interfaces != nullptr) { |
| const dex_ir::TypeIdVector* interfaces_vector = interfaces->GetTypeList(); |
| for (uint32_t i = 0; i < interfaces_vector->size(); i++) { |
| DumpInterface((*interfaces_vector)[i], i); |
| } // for |
| } |
| |
| // Fields and methods. |
| dex_ir::ClassData* class_data = class_def->GetClassData(); |
| // Prepare data for static fields. |
| dex_ir::EncodedArrayItem* static_values = class_def->StaticValues(); |
| dex_ir::EncodedValueVector* encoded_values = |
| static_values == nullptr ? nullptr : static_values->GetEncodedValues(); |
| const uint32_t encoded_values_size = (encoded_values == nullptr) ? 0 : encoded_values->size(); |
| |
| // Static fields. |
| if (options_.output_format_ == kOutputPlain) { |
| fprintf(out_file_, " Static fields -\n"); |
| } |
| if (class_data != nullptr) { |
| dex_ir::FieldItemVector* static_fields = class_data->StaticFields(); |
| if (static_fields != nullptr) { |
| for (uint32_t i = 0; i < static_fields->size(); i++) { |
| DumpSField((*static_fields)[i]->GetFieldId()->GetIndex(), |
| (*static_fields)[i]->GetAccessFlags(), |
| i, |
| i < encoded_values_size ? (*encoded_values)[i].get() : nullptr); |
| } // for |
| } |
| } |
| |
| // Instance fields. |
| if (options_.output_format_ == kOutputPlain) { |
| fprintf(out_file_, " Instance fields -\n"); |
| } |
| if (class_data != nullptr) { |
| dex_ir::FieldItemVector* instance_fields = class_data->InstanceFields(); |
| if (instance_fields != nullptr) { |
| for (uint32_t i = 0; i < instance_fields->size(); i++) { |
| DumpIField((*instance_fields)[i]->GetFieldId()->GetIndex(), |
| (*instance_fields)[i]->GetAccessFlags(), |
| i); |
| } // for |
| } |
| } |
| |
| // Direct methods. |
| if (options_.output_format_ == kOutputPlain) { |
| fprintf(out_file_, " Direct methods -\n"); |
| } |
| if (class_data != nullptr) { |
| dex_ir::MethodItemVector* direct_methods = class_data->DirectMethods(); |
| if (direct_methods != nullptr) { |
| for (uint32_t i = 0; i < direct_methods->size(); i++) { |
| DumpMethod((*direct_methods)[i]->GetMethodId()->GetIndex(), |
| (*direct_methods)[i]->GetAccessFlags(), |
| (*direct_methods)[i]->GetCodeItem(), |
| i); |
| } // for |
| } |
| } |
| |
| // Virtual methods. |
| if (options_.output_format_ == kOutputPlain) { |
| fprintf(out_file_, " Virtual methods -\n"); |
| } |
| if (class_data != nullptr) { |
| dex_ir::MethodItemVector* virtual_methods = class_data->VirtualMethods(); |
| if (virtual_methods != nullptr) { |
| for (uint32_t i = 0; i < virtual_methods->size(); i++) { |
| DumpMethod((*virtual_methods)[i]->GetMethodId()->GetIndex(), |
| (*virtual_methods)[i]->GetAccessFlags(), |
| (*virtual_methods)[i]->GetCodeItem(), |
| i); |
| } // for |
| } |
| } |
| |
| // End of class. |
| if (options_.output_format_ == kOutputPlain) { |
| const char* file_name = "unknown"; |
| if (class_def->SourceFile() != nullptr) { |
| file_name = class_def->SourceFile()->Data(); |
| } |
| const dex_ir::StringId* source_file = class_def->SourceFile(); |
| fprintf(out_file_, " source_file_idx : %d (%s)\n\n", |
| source_file == nullptr ? 0xffffffffU : source_file->GetIndex(), file_name); |
| } else if (options_.output_format_ == kOutputXml) { |
| fprintf(out_file_, "</class>\n"); |
| } |
| |
| free(access_str); |
| } |
| |
| void DexLayout::DumpDexFile() { |
| // Headers. |
| if (options_.show_file_headers_) { |
| DumpFileHeader(); |
| } |
| |
| // Open XML context. |
| if (options_.output_format_ == kOutputXml) { |
| fprintf(out_file_, "<api>\n"); |
| } |
| |
| // Iterate over all classes. |
| char* package = nullptr; |
| const uint32_t class_defs_size = header_->GetCollections().ClassDefsSize(); |
| for (uint32_t i = 0; i < class_defs_size; i++) { |
| DumpClass(i, &package); |
| } // for |
| |
| // Free the last package allocated. |
| if (package != nullptr) { |
| fprintf(out_file_, "</package>\n"); |
| free(package); |
| } |
| |
| // Close XML context. |
| if (options_.output_format_ == kOutputXml) { |
| fprintf(out_file_, "</api>\n"); |
| } |
| } |
| |
| std::vector<dex_ir::ClassData*> DexLayout::LayoutClassDefsAndClassData(const DexFile* dex_file) { |
| std::vector<dex_ir::ClassDef*> new_class_def_order; |
| for (std::unique_ptr<dex_ir::ClassDef>& class_def : header_->GetCollections().ClassDefs()) { |
| dex::TypeIndex type_idx(class_def->ClassType()->GetIndex()); |
| if (info_->ContainsClass(*dex_file, type_idx)) { |
| new_class_def_order.push_back(class_def.get()); |
| } |
| } |
| for (std::unique_ptr<dex_ir::ClassDef>& class_def : header_->GetCollections().ClassDefs()) { |
| dex::TypeIndex type_idx(class_def->ClassType()->GetIndex()); |
| if (!info_->ContainsClass(*dex_file, type_idx)) { |
| new_class_def_order.push_back(class_def.get()); |
| } |
| } |
| uint32_t class_defs_offset = header_->GetCollections().ClassDefsOffset(); |
| uint32_t class_data_offset = header_->GetCollections().ClassDatasOffset(); |
| std::unordered_set<dex_ir::ClassData*> visited_class_data; |
| std::vector<dex_ir::ClassData*> new_class_data_order; |
| for (uint32_t i = 0; i < new_class_def_order.size(); ++i) { |
| dex_ir::ClassDef* class_def = new_class_def_order[i]; |
| if (kChangeClassDefOrder) { |
| // This produces dex files that violate the spec since the super class class_def is supposed |
| // to occur before any subclasses. |
| class_def->SetIndex(i); |
| class_def->SetOffset(class_defs_offset); |
| class_defs_offset += dex_ir::ClassDef::ItemSize(); |
| } |
| dex_ir::ClassData* class_data = class_def->GetClassData(); |
| if (class_data != nullptr && visited_class_data.find(class_data) == visited_class_data.end()) { |
| class_data->SetOffset(class_data_offset); |
| class_data_offset += class_data->GetSize(); |
| visited_class_data.insert(class_data); |
| new_class_data_order.push_back(class_data); |
| } |
| } |
| return new_class_data_order; |
| } |
| |
| int32_t DexLayout::LayoutStringData(const DexFile* dex_file) { |
| const size_t num_strings = header_->GetCollections().StringIds().size(); |
| std::vector<bool> is_shorty(num_strings, false); |
| std::vector<bool> from_hot_method(num_strings, false); |
| for (std::unique_ptr<dex_ir::ClassDef>& class_def : header_->GetCollections().ClassDefs()) { |
| // A name of a profile class is probably going to get looked up by ClassTable::Lookup, mark it |
| // as hot. Add its super class and interfaces as well, which can be used during initialization. |
| const bool is_profile_class = |
| info_->ContainsClass(*dex_file, dex::TypeIndex(class_def->ClassType()->GetIndex())); |
| if (is_profile_class) { |
| from_hot_method[class_def->ClassType()->GetStringId()->GetIndex()] = true; |
| const dex_ir::TypeId* superclass = class_def->Superclass(); |
| if (superclass != nullptr) { |
| from_hot_method[superclass->GetStringId()->GetIndex()] = true; |
| } |
| const dex_ir::TypeList* interfaces = class_def->Interfaces(); |
| if (interfaces != nullptr) { |
| for (const dex_ir::TypeId* interface_type : *interfaces->GetTypeList()) { |
| from_hot_method[interface_type->GetStringId()->GetIndex()] = true; |
| } |
| } |
| } |
| dex_ir::ClassData* data = class_def->GetClassData(); |
| if (data == nullptr) { |
| continue; |
| } |
| for (size_t i = 0; i < 2; ++i) { |
| for (auto& method : *(i == 0 ? data->DirectMethods() : data->VirtualMethods())) { |
| const dex_ir::MethodId* method_id = method->GetMethodId(); |
| dex_ir::CodeItem* code_item = method->GetCodeItem(); |
| if (code_item == nullptr) { |
| continue; |
| } |
| const bool is_clinit = is_profile_class && |
| (method->GetAccessFlags() & kAccConstructor) != 0 && |
| (method->GetAccessFlags() & kAccStatic) != 0; |
| const bool method_executed = is_clinit || |
| info_->GetMethodHotness(MethodReference(dex_file, method_id->GetIndex())).IsInProfile(); |
| if (!method_executed) { |
| continue; |
| } |
| is_shorty[method_id->Proto()->Shorty()->GetIndex()] = true; |
| dex_ir::CodeFixups* fixups = code_item->GetCodeFixups(); |
| if (fixups == nullptr) { |
| continue; |
| } |
| // Add const-strings. |
| for (dex_ir::StringId* id : *fixups->StringIds()) { |
| from_hot_method[id->GetIndex()] = true; |
| } |
| // Add field classes, names, and types. |
| for (dex_ir::FieldId* id : *fixups->FieldIds()) { |
| // TODO: Only visit field ids from static getters and setters. |
| from_hot_method[id->Class()->GetStringId()->GetIndex()] = true; |
| from_hot_method[id->Name()->GetIndex()] = true; |
| from_hot_method[id->Type()->GetStringId()->GetIndex()] = true; |
| } |
| // For clinits, add referenced method classes, names, and protos. |
| if (is_clinit) { |
| for (dex_ir::MethodId* id : *fixups->MethodIds()) { |
| from_hot_method[id->Class()->GetStringId()->GetIndex()] = true; |
| from_hot_method[id->Name()->GetIndex()] = true; |
| is_shorty[id->Proto()->Shorty()->GetIndex()] = true; |
| } |
| } |
| } |
| } |
| } |
| // Sort string data by specified order. |
| std::vector<dex_ir::StringId*> string_ids; |
| size_t min_offset = std::numeric_limits<size_t>::max(); |
| size_t max_offset = 0; |
| size_t hot_bytes = 0; |
| for (auto& string_id : header_->GetCollections().StringIds()) { |
| string_ids.push_back(string_id.get()); |
| const size_t cur_offset = string_id->DataItem()->GetOffset(); |
| CHECK_NE(cur_offset, 0u); |
| min_offset = std::min(min_offset, cur_offset); |
| dex_ir::StringData* data = string_id->DataItem(); |
| const size_t element_size = data->GetSize() + 1; // Add one extra for null. |
| size_t end_offset = cur_offset + element_size; |
| if (is_shorty[string_id->GetIndex()] || from_hot_method[string_id->GetIndex()]) { |
| hot_bytes += element_size; |
| } |
| max_offset = std::max(max_offset, end_offset); |
| } |
| VLOG(compiler) << "Hot string data bytes " << hot_bytes << "/" << max_offset - min_offset; |
| std::sort(string_ids.begin(), |
| string_ids.end(), |
| [&is_shorty, &from_hot_method](const dex_ir::StringId* a, |
| const dex_ir::StringId* b) { |
| const bool a_is_hot = from_hot_method[a->GetIndex()]; |
| const bool b_is_hot = from_hot_method[b->GetIndex()]; |
| if (a_is_hot != b_is_hot) { |
| return a_is_hot < b_is_hot; |
| } |
| // After hot methods are partitioned, subpartition shorties. |
| const bool a_is_shorty = is_shorty[a->GetIndex()]; |
| const bool b_is_shorty = is_shorty[b->GetIndex()]; |
| if (a_is_shorty != b_is_shorty) { |
| return a_is_shorty < b_is_shorty; |
| } |
| // Preserve order. |
| return a->DataItem()->GetOffset() < b->DataItem()->GetOffset(); |
| }); |
| // Now we know what order we want the string data, reorder the offsets. |
| size_t offset = min_offset; |
| for (dex_ir::StringId* string_id : string_ids) { |
| dex_ir::StringData* data = string_id->DataItem(); |
| data->SetOffset(offset); |
| offset += data->GetSize() + 1; // Add one extra for null. |
| } |
| if (offset > max_offset) { |
| return offset - max_offset; |
| // If we expanded the string data section, we need to update the offsets or else we will |
| // corrupt the next section when writing out. |
| } |
| return 0; |
| } |
| |
| // Orders code items according to specified class data ordering. |
| // NOTE: If the section following the code items is byte aligned, the last code item is left in |
| // place to preserve alignment. Layout needs an overhaul to handle movement of other sections. |
| int32_t DexLayout::LayoutCodeItems(const DexFile* dex_file, |
| std::vector<dex_ir::ClassData*> new_class_data_order) { |
| // Do not move code items if class data section precedes code item section. |
| // ULEB encoding is variable length, causing problems determining the offset of the code items. |
| // TODO: We should swap the order of these sections in the future to avoid this issue. |
| uint32_t class_data_offset = header_->GetCollections().ClassDatasOffset(); |
| uint32_t code_item_offset = header_->GetCollections().CodeItemsOffset(); |
| if (class_data_offset < code_item_offset) { |
| return 0; |
| } |
| |
| // Find the last code item so we can leave it in place if the next section is not 4 byte aligned. |
| dex_ir::CodeItem* last_code_item = nullptr; |
| std::unordered_set<dex_ir::CodeItem*> visited_code_items; |
| bool is_code_item_aligned = IsNextSectionCodeItemAligned(code_item_offset); |
| if (!is_code_item_aligned) { |
| for (auto& code_item_pair : header_->GetCollections().CodeItems()) { |
| std::unique_ptr<dex_ir::CodeItem>& code_item = code_item_pair.second; |
| if (last_code_item == nullptr |
| || last_code_item->GetOffset() < code_item->GetOffset()) { |
| last_code_item = code_item.get(); |
| } |
| } |
| } |
| |
| static constexpr InvokeType invoke_types[] = { |
| kDirect, |
| kVirtual |
| }; |
| |
| const size_t num_layout_types = static_cast<size_t>(LayoutType::kLayoutTypeCount); |
| std::unordered_set<dex_ir::CodeItem*> code_items[num_layout_types]; |
| for (InvokeType invoke_type : invoke_types) { |
| for (std::unique_ptr<dex_ir::ClassDef>& class_def : header_->GetCollections().ClassDefs()) { |
| const bool is_profile_class = |
| info_->ContainsClass(*dex_file, dex::TypeIndex(class_def->ClassType()->GetIndex())); |
| |
| // Skip classes that are not defined in this dex file. |
| dex_ir::ClassData* class_data = class_def->GetClassData(); |
| if (class_data == nullptr) { |
| continue; |
| } |
| for (auto& method : *(invoke_type == InvokeType::kDirect |
| ? class_data->DirectMethods() |
| : class_data->VirtualMethods())) { |
| const dex_ir::MethodId *method_id = method->GetMethodId(); |
| dex_ir::CodeItem *code_item = method->GetCodeItem(); |
| if (code_item == last_code_item || code_item == nullptr) { |
| continue; |
| } |
| // Separate executed methods (clinits and profiled methods) from unexecuted methods. |
| const bool is_clinit = (method->GetAccessFlags() & kAccConstructor) != 0 && |
| (method->GetAccessFlags() & kAccStatic) != 0; |
| const bool is_startup_clinit = is_profile_class && is_clinit; |
| using Hotness = ProfileCompilationInfo::MethodHotness; |
| Hotness hotness = info_->GetMethodHotness(MethodReference(dex_file, method_id->GetIndex())); |
| LayoutType state = LayoutType::kLayoutTypeUnused; |
| if (hotness.IsHot()) { |
| // Hot code is compiled, maybe one day it won't be accessed. So lay it out together for |
| // now. |
| state = LayoutType::kLayoutTypeHot; |
| } else if (is_startup_clinit || hotness.GetFlags() == Hotness::kFlagStartup) { |
| // Startup clinit or a method that only has the startup flag. |
| state = LayoutType::kLayoutTypeStartupOnly; |
| } else if (is_clinit) { |
| state = LayoutType::kLayoutTypeUsedOnce; |
| } else if (hotness.IsInProfile()) { |
| state = LayoutType::kLayoutTypeSometimesUsed; |
| } |
| code_items[static_cast<size_t>(state)].insert(code_item); |
| } |
| } |
| } |
| |
| // Removing duplicate CodeItems may expose other issues with downstream |
| // optimizations such as quickening. But we need to ensure at least the weak |
| // forms of it currently in use do not break layout optimizations. |
| std::map<dex_ir::CodeItem*, uint32_t> original_code_item_offset; |
| // Total_diff includes diffs generated by clinits, executed, and non-executed methods. |
| int32_t total_diff = 0; |
| // The relative placement has no effect on correctness; it is used to ensure |
| // the layout is deterministic |
| for (size_t index = 0; index < num_layout_types; ++index) { |
| const std::unordered_set<dex_ir::CodeItem*>& code_items_set = code_items[index]; |
| // diff is reset for each class of code items. |
| int32_t diff = 0; |
| const uint32_t start_offset = code_item_offset; |
| for (dex_ir::ClassData* data : new_class_data_order) { |
| data->SetOffset(data->GetOffset() + diff); |
| for (InvokeType invoke_type : invoke_types) { |
| for (auto &method : *(invoke_type == InvokeType::kDirect |
| ? data->DirectMethods() |
| : data->VirtualMethods())) { |
| dex_ir::CodeItem* code_item = method->GetCodeItem(); |
| if (code_item != nullptr && |
| code_items_set.find(code_item) != code_items_set.end()) { |
| // Compute where the CodeItem was originally laid out. |
| uint32_t original_offset = code_item->GetOffset(); |
| auto it = original_code_item_offset.find(code_item); |
| if (it != original_code_item_offset.end()) { |
| original_offset = it->second; |
| } else { |
| original_code_item_offset[code_item] = code_item->GetOffset(); |
| // Assign the new offset and move the pointer to allocate space. |
| code_item->SetOffset(code_item_offset); |
| code_item_offset += |
| RoundUp(code_item->GetSize(), kDexCodeItemAlignment); |
| } |
| // Update the size of the encoded methods to reflect that the offset difference |
| // may have changed the ULEB128 length. |
| diff += |
| UnsignedLeb128Size(code_item->GetOffset()) - UnsignedLeb128Size(original_offset); |
| } |
| } |
| } |
| } |
| DexLayoutSection& code_section = dex_sections_.sections_[static_cast<size_t>( |
| DexLayoutSections::SectionType::kSectionTypeCode)]; |
| code_section.parts_[index].offset_ = start_offset; |
| code_section.parts_[index].size_ = code_item_offset - start_offset; |
| for (size_t i = 0; i < num_layout_types; ++i) { |
| VLOG(dex) << "Code item layout bucket " << i << " count=" << code_items[i].size() |
| << " bytes=" << code_section.parts_[i].size_; |
| } |
| total_diff += diff; |
| } |
| // Adjust diff to be 4-byte aligned. |
| return RoundUp(total_diff, kDexCodeItemAlignment); |
| } |
| |
| bool DexLayout::IsNextSectionCodeItemAligned(uint32_t offset) { |
| dex_ir::Collections& collections = header_->GetCollections(); |
| std::set<uint32_t> section_offsets; |
| section_offsets.insert(collections.MapListOffset()); |
| section_offsets.insert(collections.TypeListsOffset()); |
| section_offsets.insert(collections.AnnotationSetRefListsOffset()); |
| section_offsets.insert(collections.AnnotationSetItemsOffset()); |
| section_offsets.insert(collections.ClassDatasOffset()); |
| section_offsets.insert(collections.CodeItemsOffset()); |
| section_offsets.insert(collections.StringDatasOffset()); |
| section_offsets.insert(collections.DebugInfoItemsOffset()); |
| section_offsets.insert(collections.AnnotationItemsOffset()); |
| section_offsets.insert(collections.EncodedArrayItemsOffset()); |
| section_offsets.insert(collections.AnnotationsDirectoryItemsOffset()); |
| |
| auto found = section_offsets.find(offset); |
| if (found != section_offsets.end()) { |
| found++; |
| if (found != section_offsets.end()) { |
| return *found % kDexCodeItemAlignment == 0; |
| } |
| } |
| return false; |
| } |
| |
| // Adjust offsets of every item in the specified section by diff bytes. |
| template<class T> void DexLayout::FixupSection(std::map<uint32_t, std::unique_ptr<T>>& map, |
| uint32_t diff) { |
| for (auto& pair : map) { |
| std::unique_ptr<T>& item = pair.second; |
| item->SetOffset(item->GetOffset() + diff); |
| } |
| } |
| |
| // Adjust offsets of all sections with an address after the specified offset by diff bytes. |
| void DexLayout::FixupSections(uint32_t offset, uint32_t diff) { |
| dex_ir::Collections& collections = header_->GetCollections(); |
| uint32_t map_list_offset = collections.MapListOffset(); |
| if (map_list_offset > offset) { |
| collections.SetMapListOffset(map_list_offset + diff); |
| } |
| |
| uint32_t type_lists_offset = collections.TypeListsOffset(); |
| if (type_lists_offset > offset) { |
| collections.SetTypeListsOffset(type_lists_offset + diff); |
| FixupSection(collections.TypeLists(), diff); |
| } |
| |
| uint32_t annotation_set_ref_lists_offset = collections.AnnotationSetRefListsOffset(); |
| if (annotation_set_ref_lists_offset > offset) { |
| collections.SetAnnotationSetRefListsOffset(annotation_set_ref_lists_offset + diff); |
| FixupSection(collections.AnnotationSetRefLists(), diff); |
| } |
| |
| uint32_t annotation_set_items_offset = collections.AnnotationSetItemsOffset(); |
| if (annotation_set_items_offset > offset) { |
| collections.SetAnnotationSetItemsOffset(annotation_set_items_offset + diff); |
| FixupSection(collections.AnnotationSetItems(), diff); |
| } |
| |
| uint32_t class_datas_offset = collections.ClassDatasOffset(); |
| if (class_datas_offset > offset) { |
| collections.SetClassDatasOffset(class_datas_offset + diff); |
| FixupSection(collections.ClassDatas(), diff); |
| } |
| |
| uint32_t code_items_offset = collections.CodeItemsOffset(); |
| if (code_items_offset > offset) { |
| collections.SetCodeItemsOffset(code_items_offset + diff); |
| FixupSection(collections.CodeItems(), diff); |
| } |
| |
| uint32_t string_datas_offset = collections.StringDatasOffset(); |
| if (string_datas_offset > offset) { |
| collections.SetStringDatasOffset(string_datas_offset + diff); |
| FixupSection(collections.StringDatas(), diff); |
| } |
| |
| uint32_t debug_info_items_offset = collections.DebugInfoItemsOffset(); |
| if (debug_info_items_offset > offset) { |
| collections.SetDebugInfoItemsOffset(debug_info_items_offset + diff); |
| FixupSection(collections.DebugInfoItems(), diff); |
| } |
| |
| uint32_t annotation_items_offset = collections.AnnotationItemsOffset(); |
| if (annotation_items_offset > offset) { |
| collections.SetAnnotationItemsOffset(annotation_items_offset + diff); |
| FixupSection(collections.AnnotationItems(), diff); |
| } |
| |
| uint32_t encoded_array_items_offset = collections.EncodedArrayItemsOffset(); |
| if (encoded_array_items_offset > offset) { |
| collections.SetEncodedArrayItemsOffset(encoded_array_items_offset + diff); |
| FixupSection(collections.EncodedArrayItems(), diff); |
| } |
| |
| uint32_t annotations_directory_items_offset = collections.AnnotationsDirectoryItemsOffset(); |
| if (annotations_directory_items_offset > offset) { |
| collections.SetAnnotationsDirectoryItemsOffset(annotations_directory_items_offset + diff); |
| FixupSection(collections.AnnotationsDirectoryItems(), diff); |
| } |
| } |
| |
| void DexLayout::LayoutOutputFile(const DexFile* dex_file) { |
| const int32_t string_diff = LayoutStringData(dex_file); |
| // If we expanded the string data section, we need to update the offsets or else we will |
| // corrupt the next section when writing out. |
| FixupSections(header_->GetCollections().StringDatasOffset(), string_diff); |
| // Update file size. |
| header_->SetFileSize(header_->FileSize() + string_diff); |
| |
| std::vector<dex_ir::ClassData*> new_class_data_order = LayoutClassDefsAndClassData(dex_file); |
| const int32_t code_item_diff = LayoutCodeItems(dex_file, new_class_data_order); |
| // Move sections after ClassData by diff bytes. |
| FixupSections(header_->GetCollections().ClassDatasOffset(), code_item_diff); |
| |
| // Update file and data size. |
| // The data size must be aligned to kDataSectionAlignment. |
| const int32_t total_diff = code_item_diff + string_diff; |
| header_->SetDataSize(RoundUp(header_->DataSize() + total_diff, kDataSectionAlignment)); |
| header_->SetFileSize(header_->FileSize() + total_diff); |
| } |
| |
| void DexLayout::OutputDexFile(const DexFile* dex_file) { |
| const std::string& dex_file_location = dex_file->GetLocation(); |
| std::string error_msg; |
| std::unique_ptr<File> new_file; |
| if (!options_.output_to_memmap_) { |
| std::string output_location(options_.output_dex_directory_); |
| size_t last_slash = dex_file_location.rfind('/'); |
| std::string dex_file_directory = dex_file_location.substr(0, last_slash + 1); |
| if (output_location == dex_file_directory) { |
| output_location = dex_file_location + ".new"; |
| } else if (last_slash != std::string::npos) { |
| output_location += dex_file_location.substr(last_slash); |
| } else { |
| output_location += "/" + dex_file_location + ".new"; |
| } |
| new_file.reset(OS::CreateEmptyFile(output_location.c_str())); |
| if (new_file == nullptr) { |
| LOG(ERROR) << "Could not create dex writer output file: " << output_location; |
| return; |
| } |
| if (ftruncate(new_file->Fd(), header_->FileSize()) != 0) { |
| LOG(ERROR) << "Could not grow dex writer output file: " << output_location;; |
| new_file->Erase(); |
| return; |
| } |
| mem_map_.reset(MemMap::MapFile(header_->FileSize(), PROT_READ | PROT_WRITE, MAP_SHARED, |
| new_file->Fd(), 0, /*low_4gb*/ false, output_location.c_str(), &error_msg)); |
| } else { |
| mem_map_.reset(MemMap::MapAnonymous("layout dex", nullptr, header_->FileSize(), |
| PROT_READ | PROT_WRITE, /* low_4gb */ false, /* reuse */ false, &error_msg)); |
| } |
| if (mem_map_ == nullptr) { |
| LOG(ERROR) << "Could not create mem map for dex writer output: " << error_msg; |
| if (new_file != nullptr) { |
| new_file->Erase(); |
| } |
| return; |
| } |
| DexWriter::Output(header_, mem_map_.get(), options_.compact_dex_level_); |
| if (new_file != nullptr) { |
| UNUSED(new_file->FlushCloseOrErase()); |
| } |
| } |
| |
| /* |
| * Dumps the requested sections of the file. |
| */ |
| void DexLayout::ProcessDexFile(const char* file_name, |
| const DexFile* dex_file, |
| size_t dex_file_index) { |
| std::unique_ptr<dex_ir::Header> header(dex_ir::DexIrBuilder(*dex_file)); |
| SetHeader(header.get()); |
| |
| if (options_.verbose_) { |
| fprintf(out_file_, "Opened '%s', DEX version '%.3s'\n", |
| file_name, dex_file->GetHeader().magic_ + 4); |
| } |
| |
| if (options_.visualize_pattern_) { |
| VisualizeDexLayout(header_, dex_file, dex_file_index, info_); |
| return; |
| } |
| |
| if (options_.show_section_statistics_) { |
| ShowDexSectionStatistics(header_, dex_file_index); |
| return; |
| } |
| |
| // Dump dex file. |
| if (options_.dump_) { |
| DumpDexFile(); |
| } |
| |
| // In case we are outputting to a file, keep it open so we can verify. |
| if (options_.output_dex_directory_ != nullptr || options_.output_to_memmap_) { |
| if (info_ != nullptr) { |
| LayoutOutputFile(dex_file); |
| } |
| OutputDexFile(dex_file); |
| |
| // Clear header before verifying to reduce peak RAM usage. |
| header.reset(); |
| |
| // Verify the output dex file's structure, only enabled by default for debug builds. |
| if (options_.verify_output_) { |
| std::string error_msg; |
| std::string location = "memory mapped file for " + std::string(file_name); |
| std::unique_ptr<const DexFile> output_dex_file(DexFileLoader::Open(mem_map_->Begin(), |
| mem_map_->Size(), |
| location, |
| /* checksum */ 0, |
| /*oat_dex_file*/ nullptr, |
| /*verify*/ true, |
| /*verify_checksum*/ false, |
| &error_msg)); |
| CHECK(output_dex_file != nullptr) << "Failed to re-open output file:" << error_msg; |
| |
| // Do IR-level comparison between input and output. This check ignores potential differences |
| // due to layout, so offsets are not checked. Instead, it checks the data contents of each item. |
| // |
| // Regenerate output IR to catch any bugs that might happen during writing. |
| std::unique_ptr<dex_ir::Header> output_header(dex_ir::DexIrBuilder(*output_dex_file)); |
| std::unique_ptr<dex_ir::Header> orig_header(dex_ir::DexIrBuilder(*dex_file)); |
| CHECK(VerifyOutputDexFile(output_header.get(), orig_header.get(), &error_msg)) << error_msg; |
| } |
| } |
| } |
| |
| /* |
| * Processes a single file (either direct .dex or indirect .zip/.jar/.apk). |
| */ |
| int DexLayout::ProcessFile(const char* file_name) { |
| if (options_.verbose_) { |
| fprintf(out_file_, "Processing '%s'...\n", file_name); |
| } |
| |
| // If the file is not a .dex file, the function tries .zip/.jar/.apk files, |
| // all of which are Zip archives with "classes.dex" inside. |
| const bool verify_checksum = !options_.ignore_bad_checksum_; |
| std::string error_msg; |
| std::vector<std::unique_ptr<const DexFile>> dex_files; |
| if (!DexFileLoader::Open( |
| file_name, file_name, /* verify */ true, verify_checksum, &error_msg, &dex_files)) { |
| // Display returned error message to user. Note that this error behavior |
| // differs from the error messages shown by the original Dalvik dexdump. |
| fputs(error_msg.c_str(), stderr); |
| fputc('\n', stderr); |
| return -1; |
| } |
| |
| // Success. Either report checksum verification or process |
| // all dex files found in given file. |
| if (options_.checksum_only_) { |
| fprintf(out_file_, "Checksum verified\n"); |
| } else { |
| for (size_t i = 0; i < dex_files.size(); i++) { |
| ProcessDexFile(file_name, dex_files[i].get(), i); |
| } |
| } |
| return 0; |
| } |
| |
| } // namespace art |