diff options
Diffstat (limited to 'compiler')
| -rw-r--r-- | compiler/Android.mk | 2 | ||||
| -rw-r--r-- | compiler/optimizing/code_generator.cc | 2 | ||||
| -rw-r--r-- | compiler/optimizing/code_generator.h | 8 | ||||
| -rw-r--r-- | compiler/optimizing/code_generator_arm64.cc | 22 | ||||
| -rw-r--r-- | compiler/optimizing/code_generator_arm64.h | 2 | ||||
| -rw-r--r-- | compiler/optimizing/code_generator_x86.cc | 87 | ||||
| -rw-r--r-- | compiler/optimizing/code_generator_x86.h | 14 | ||||
| -rw-r--r-- | compiler/optimizing/code_generator_x86_64.cc | 29 | ||||
| -rw-r--r-- | compiler/optimizing/code_generator_x86_64.h | 2 | ||||
| -rw-r--r-- | compiler/optimizing/nodes.cc | 10 | ||||
| -rw-r--r-- | compiler/optimizing/nodes.h | 5 | ||||
| -rw-r--r-- | compiler/optimizing/optimizing_compiler.cc | 7 | ||||
| -rw-r--r-- | compiler/optimizing/pc_relative_fixups_x86.cc (renamed from compiler/optimizing/constant_area_fixups_x86.cc) | 32 | ||||
| -rw-r--r-- | compiler/optimizing/pc_relative_fixups_x86.h (renamed from compiler/optimizing/constant_area_fixups_x86.h) | 12 | 
14 files changed, 158 insertions, 76 deletions
| diff --git a/compiler/Android.mk b/compiler/Android.mk index e74a68f608..42ddfd83ab 100644 --- a/compiler/Android.mk +++ b/compiler/Android.mk @@ -67,7 +67,6 @@ LIBART_COMPILER_SRC_FILES := \  	optimizing/builder.cc \  	optimizing/code_generator.cc \  	optimizing/code_generator_utils.cc \ -	optimizing/constant_area_fixups_x86.cc \  	optimizing/constant_folding.cc \  	optimizing/dead_code_elimination.cc \  	optimizing/graph_checker.cc \ @@ -85,6 +84,7 @@ LIBART_COMPILER_SRC_FILES := \  	optimizing/optimization.cc \  	optimizing/optimizing_compiler.cc \  	optimizing/parallel_move_resolver.cc \ +	optimizing/pc_relative_fixups_x86.cc \  	optimizing/prepare_for_register_allocation.cc \  	optimizing/primitive_type_propagation.cc \  	optimizing/reference_type_propagation.cc \ diff --git a/compiler/optimizing/code_generator.cc b/compiler/optimizing/code_generator.cc index ce92470868..5188e115e0 100644 --- a/compiler/optimizing/code_generator.cc +++ b/compiler/optimizing/code_generator.cc @@ -208,6 +208,7 @@ class DisassemblyScope {  void CodeGenerator::GenerateSlowPaths() {    size_t code_start = 0;    for (SlowPathCode* slow_path : slow_paths_) { +    current_slow_path_ = slow_path;      if (disasm_info_ != nullptr) {        code_start = GetAssembler()->CodeSize();      } @@ -216,6 +217,7 @@ void CodeGenerator::GenerateSlowPaths() {        disasm_info_->AddSlowPathInterval(slow_path, code_start, GetAssembler()->CodeSize());      }    } +  current_slow_path_ = nullptr;  }  void CodeGenerator::CompileInternal(CodeAllocator* allocator, bool is_baseline) { diff --git a/compiler/optimizing/code_generator.h b/compiler/optimizing/code_generator.h index a92014dc79..2108abefcc 100644 --- a/compiler/optimizing/code_generator.h +++ b/compiler/optimizing/code_generator.h @@ -490,6 +490,7 @@ class CodeGenerator {          compiler_options_(compiler_options),          src_map_(graph->GetArena()->Adapter(kArenaAllocCodeGenerator)),          slow_paths_(graph->GetArena()->Adapter(kArenaAllocCodeGenerator)), +        current_slow_path_(nullptr),          current_block_index_(0),          is_leaf_(true),          requires_current_method_(false) { @@ -557,6 +558,10 @@ class CodeGenerator {      return raw_pointer_to_labels_array + block->GetBlockId();    } +  SlowPathCode* GetCurrentSlowPath() { +    return current_slow_path_; +  } +    // Frame size required for this method.    uint32_t frame_size_;    uint32_t core_spill_mask_; @@ -605,6 +610,9 @@ class CodeGenerator {    ArenaVector<SrcMapElem> src_map_;    ArenaVector<SlowPathCode*> slow_paths_; +  // The current slow path that we're generating code for. +  SlowPathCode* current_slow_path_; +    // The current block index in `block_order_` of the block    // we are generating code for.    size_t current_block_index_; diff --git a/compiler/optimizing/code_generator_arm64.cc b/compiler/optimizing/code_generator_arm64.cc index b0be446174..7e248b402a 100644 --- a/compiler/optimizing/code_generator_arm64.cc +++ b/compiler/optimizing/code_generator_arm64.cc @@ -598,7 +598,7 @@ CodeGeneratorARM64::CodeGeneratorARM64(HGraph* graph,        call_patches_(MethodReferenceComparator(),                      graph->GetArena()->Adapter(kArenaAllocCodeGenerator)),        relative_call_patches_(graph->GetArena()->Adapter(kArenaAllocCodeGenerator)), -      pc_rel_dex_cache_patches_(graph->GetArena()->Adapter(kArenaAllocCodeGenerator)) { +      pc_relative_dex_cache_patches_(graph->GetArena()->Adapter(kArenaAllocCodeGenerator)) {    // Save the link register (containing the return address) to mimic Quick.    AddAllocatedRegister(LocationFrom(lr));  } @@ -2872,21 +2872,21 @@ void CodeGeneratorARM64::GenerateStaticOrDirectCall(HInvokeStaticOrDirect* invok        break;      case HInvokeStaticOrDirect::MethodLoadKind::kDexCachePcRelative: {        // Add ADRP with its PC-relative DexCache access patch. -      pc_rel_dex_cache_patches_.emplace_back(*invoke->GetTargetMethod().dex_file, -                                             invoke->GetDexCacheArrayOffset()); -      vixl::Label* pc_insn_label = &pc_rel_dex_cache_patches_.back().label; +      pc_relative_dex_cache_patches_.emplace_back(*invoke->GetTargetMethod().dex_file, +                                                  invoke->GetDexCacheArrayOffset()); +      vixl::Label* pc_insn_label = &pc_relative_dex_cache_patches_.back().label;        {          vixl::SingleEmissionCheckScope guard(GetVIXLAssembler());          __ adrp(XRegisterFrom(temp).X(), 0);        }        __ Bind(pc_insn_label);  // Bind after ADRP. -      pc_rel_dex_cache_patches_.back().pc_insn_label = pc_insn_label; +      pc_relative_dex_cache_patches_.back().pc_insn_label = pc_insn_label;        // Add LDR with its PC-relative DexCache access patch. -      pc_rel_dex_cache_patches_.emplace_back(*invoke->GetTargetMethod().dex_file, -                                             invoke->GetDexCacheArrayOffset()); +      pc_relative_dex_cache_patches_.emplace_back(*invoke->GetTargetMethod().dex_file, +                                                  invoke->GetDexCacheArrayOffset());        __ Ldr(XRegisterFrom(temp).X(), MemOperand(XRegisterFrom(temp).X(), 0)); -      __ Bind(&pc_rel_dex_cache_patches_.back().label);  // Bind after LDR. -      pc_rel_dex_cache_patches_.back().pc_insn_label = pc_insn_label; +      __ Bind(&pc_relative_dex_cache_patches_.back().label);  // Bind after LDR. +      pc_relative_dex_cache_patches_.back().pc_insn_label = pc_insn_label;        break;      }      case HInvokeStaticOrDirect::MethodLoadKind::kDexCacheViaMethod: { @@ -2973,7 +2973,7 @@ void CodeGeneratorARM64::EmitLinkerPatches(ArenaVector<LinkerPatch>* linker_patc        method_patches_.size() +        call_patches_.size() +        relative_call_patches_.size() + -      pc_rel_dex_cache_patches_.size(); +      pc_relative_dex_cache_patches_.size();    linker_patches->reserve(size);    for (const auto& entry : method_patches_) {      const MethodReference& target_method = entry.first; @@ -2994,7 +2994,7 @@ void CodeGeneratorARM64::EmitLinkerPatches(ArenaVector<LinkerPatch>* linker_patc                                                               info.target_method.dex_file,                                                               info.target_method.dex_method_index));    } -  for (const PcRelativeDexCacheAccessInfo& info : pc_rel_dex_cache_patches_) { +  for (const PcRelativeDexCacheAccessInfo& info : pc_relative_dex_cache_patches_) {      linker_patches->push_back(LinkerPatch::DexCacheArrayPatch(info.label.location() - 4u,                                                                &info.target_dex_file,                                                                info.pc_insn_label->location() - 4u, diff --git a/compiler/optimizing/code_generator_arm64.h b/compiler/optimizing/code_generator_arm64.h index ab684ea538..aa5ad386e1 100644 --- a/compiler/optimizing/code_generator_arm64.h +++ b/compiler/optimizing/code_generator_arm64.h @@ -447,7 +447,7 @@ class CodeGeneratorARM64 : public CodeGenerator {    // Using ArenaDeque<> which retains element addresses on push/emplace_back().    ArenaDeque<MethodPatchInfo<vixl::Label>> relative_call_patches_;    // PC-relative DexCache access info. -  ArenaDeque<PcRelativeDexCacheAccessInfo> pc_rel_dex_cache_patches_; +  ArenaDeque<PcRelativeDexCacheAccessInfo> pc_relative_dex_cache_patches_;    DISALLOW_COPY_AND_ASSIGN(CodeGeneratorARM64);  }; diff --git a/compiler/optimizing/code_generator_x86.cc b/compiler/optimizing/code_generator_x86.cc index 8308d9ee20..d5d6c210bf 100644 --- a/compiler/optimizing/code_generator_x86.cc +++ b/compiler/optimizing/code_generator_x86.cc @@ -19,7 +19,6 @@  #include "art_method.h"  #include "code_generator_utils.h"  #include "compiled_method.h" -#include "constant_area_fixups_x86.h"  #include "entrypoints/quick/quick_entrypoints.h"  #include "entrypoints/quick/quick_entrypoints_enum.h"  #include "gc/accounting/card_table.h" @@ -27,6 +26,7 @@  #include "intrinsics_x86.h"  #include "mirror/array-inl.h"  #include "mirror/class-inl.h" +#include "pc_relative_fixups_x86.h"  #include "thread.h"  #include "utils/assembler.h"  #include "utils/stack_checks.h" @@ -533,6 +533,7 @@ CodeGeneratorX86::CodeGeneratorX86(HGraph* graph,        isa_features_(isa_features),        method_patches_(graph->GetArena()->Adapter(kArenaAllocCodeGenerator)),        relative_call_patches_(graph->GetArena()->Adapter(kArenaAllocCodeGenerator)), +      pc_relative_dex_cache_patches_(graph->GetArena()->Adapter(kArenaAllocCodeGenerator)),        fixups_to_jump_tables_(graph->GetArena()->Adapter(kArenaAllocCodeGenerator)) {    // Use a fake return address register to mimic Quick.    AddAllocatedRegister(Location::RegisterLocation(kFakeReturnRegister)); @@ -1696,11 +1697,20 @@ void LocationsBuilderX86::VisitInvokeStaticOrDirect(HInvokeStaticOrDirect* invok    IntrinsicLocationsBuilderX86 intrinsic(codegen_);    if (intrinsic.TryDispatch(invoke)) { +    if (invoke->GetLocations()->CanCall() && invoke->HasPcRelativeDexCache()) { +      invoke->GetLocations()->SetInAt(invoke->GetCurrentMethodInputIndex(), Location::Any()); +    }      return;    }    HandleInvoke(invoke); +  // For PC-relative dex cache the invoke has an extra input, the PC-relative address base. +  if (invoke->HasPcRelativeDexCache()) { +    invoke->GetLocations()->SetInAt(invoke->GetCurrentMethodInputIndex(), +                                    Location::RequiresRegister()); +  } +    if (codegen_->IsBaseline()) {      // Baseline does not have enough registers if the current method also      // needs a register. We therefore do not require a register for it, and let @@ -3779,16 +3789,6 @@ void InstructionCodeGeneratorX86::GenerateMemoryBarrier(MemBarrierKind kind) {  HInvokeStaticOrDirect::DispatchInfo CodeGeneratorX86::GetSupportedInvokeStaticOrDirectDispatch(        const HInvokeStaticOrDirect::DispatchInfo& desired_dispatch_info,        MethodReference target_method ATTRIBUTE_UNUSED) { -  if (desired_dispatch_info.method_load_kind == -      HInvokeStaticOrDirect::MethodLoadKind::kDexCachePcRelative) { -    // TODO: Implement this type. For the moment, we fall back to kDexCacheViaMethod. -    return HInvokeStaticOrDirect::DispatchInfo { -      HInvokeStaticOrDirect::MethodLoadKind::kDexCacheViaMethod, -      HInvokeStaticOrDirect::CodePtrLocation::kCallArtMethod, -      0u, -      0u -    }; -  }    switch (desired_dispatch_info.code_ptr_location) {      case HInvokeStaticOrDirect::CodePtrLocation::kCallDirectWithFixup:      case HInvokeStaticOrDirect::CodePtrLocation::kCallDirect: @@ -3805,6 +3805,32 @@ HInvokeStaticOrDirect::DispatchInfo CodeGeneratorX86::GetSupportedInvokeStaticOr    }  } +Register CodeGeneratorX86::GetInvokeStaticOrDirectExtraParameter(HInvokeStaticOrDirect* invoke, +                                                                 Register temp) { +  DCHECK_EQ(invoke->InputCount(), invoke->GetNumberOfArguments() + 1u); +  Location location = invoke->GetLocations()->InAt(invoke->GetCurrentMethodInputIndex()); +  if (!invoke->GetLocations()->Intrinsified()) { +    return location.AsRegister<Register>(); +  } +  // For intrinsics we allow any location, so it may be on the stack. +  if (!location.IsRegister()) { +    __ movl(temp, Address(ESP, location.GetStackIndex())); +    return temp; +  } +  // For register locations, check if the register was saved. If so, get it from the stack. +  // Note: There is a chance that the register was saved but not overwritten, so we could +  // save one load. However, since this is just an intrinsic slow path we prefer this +  // simple and more robust approach rather that trying to determine if that's the case. +  SlowPathCode* slow_path = GetCurrentSlowPath(); +  DCHECK(slow_path != nullptr);  // For intrinsified invokes the call is emitted on the slow path. +  if (slow_path->IsCoreRegisterSaved(location.AsRegister<Register>())) { +    int stack_offset = slow_path->GetStackOffsetOfCoreRegister(location.AsRegister<Register>()); +    __ movl(temp, Address(ESP, stack_offset)); +    return temp; +  } +  return location.AsRegister<Register>(); +} +  void CodeGeneratorX86::GenerateStaticOrDirectCall(HInvokeStaticOrDirect* invoke, Location temp) {    Location callee_method = temp;  // For all kinds except kRecursive, callee will be in temp.    switch (invoke->GetMethodLoadKind()) { @@ -3823,11 +3849,16 @@ void CodeGeneratorX86::GenerateStaticOrDirectCall(HInvokeStaticOrDirect* invoke,        method_patches_.emplace_back(invoke->GetTargetMethod());        __ Bind(&method_patches_.back().label);  // Bind the label at the end of the "movl" insn.        break; -    case HInvokeStaticOrDirect::MethodLoadKind::kDexCachePcRelative: -      // TODO: Implement this type. -      // Currently filtered out by GetSupportedInvokeStaticOrDirectDispatch(). -      LOG(FATAL) << "Unsupported"; -      UNREACHABLE(); +    case HInvokeStaticOrDirect::MethodLoadKind::kDexCachePcRelative: { +      Register base_reg = GetInvokeStaticOrDirectExtraParameter(invoke, +                                                                temp.AsRegister<Register>()); +      uint32_t offset = invoke->GetDexCacheArrayOffset(); +      __ movl(temp.AsRegister<Register>(), Address(base_reg, kDummy32BitOffset)); +      // Add the patch entry and bind its label at the end of the instruction. +      pc_relative_dex_cache_patches_.emplace_back(*invoke->GetTargetMethod().dex_file, offset); +      __ Bind(&pc_relative_dex_cache_patches_.back().label); +      break; +    }      case HInvokeStaticOrDirect::MethodLoadKind::kDexCacheViaMethod: {        Location current_method = invoke->GetLocations()->InAt(invoke->GetCurrentMethodInputIndex());        Register method_reg; @@ -3898,23 +3929,33 @@ void CodeGeneratorX86::GenerateVirtualCall(HInvokeVirtual* invoke, Location temp  void CodeGeneratorX86::EmitLinkerPatches(ArenaVector<LinkerPatch>* linker_patches) {    DCHECK(linker_patches->empty()); -  linker_patches->reserve(method_patches_.size() + relative_call_patches_.size()); +  size_t size = +      method_patches_.size() + +      relative_call_patches_.size() + +      pc_relative_dex_cache_patches_.size(); +  linker_patches->reserve(size); +  // The label points to the end of the "movl" insn but the literal offset for method +  // patch needs to point to the embedded constant which occupies the last 4 bytes. +  constexpr uint32_t kLabelPositionToLiteralOffsetAdjustment = 4u;    for (const MethodPatchInfo<Label>& info : method_patches_) { -    // The label points to the end of the "movl" insn but the literal offset for method -    // patch x86 needs to point to the embedded constant which occupies the last 4 bytes. -    uint32_t literal_offset = info.label.Position() - 4; +    uint32_t literal_offset = info.label.Position() - kLabelPositionToLiteralOffsetAdjustment;      linker_patches->push_back(LinkerPatch::MethodPatch(literal_offset,                                                         info.target_method.dex_file,                                                         info.target_method.dex_method_index));    }    for (const MethodPatchInfo<Label>& info : relative_call_patches_) { -    // The label points to the end of the "call" insn but the literal offset for method -    // patch x86 needs to point to the embedded constant which occupies the last 4 bytes. -    uint32_t literal_offset = info.label.Position() - 4; +    uint32_t literal_offset = info.label.Position() - kLabelPositionToLiteralOffsetAdjustment;      linker_patches->push_back(LinkerPatch::RelativeCodePatch(literal_offset,                                                               info.target_method.dex_file,                                                               info.target_method.dex_method_index));    } +  for (const PcRelativeDexCacheAccessInfo& info : pc_relative_dex_cache_patches_) { +    uint32_t literal_offset = info.label.Position() - kLabelPositionToLiteralOffsetAdjustment; +    linker_patches->push_back(LinkerPatch::DexCacheArrayPatch(literal_offset, +                                                              &info.target_dex_file, +                                                              GetMethodAddressOffset(), +                                                              info.element_offset)); +  }  }  void CodeGeneratorX86::MarkGCCard(Register temp, diff --git a/compiler/optimizing/code_generator_x86.h b/compiler/optimizing/code_generator_x86.h index ac3d06c23d..177a059df8 100644 --- a/compiler/optimizing/code_generator_x86.h +++ b/compiler/optimizing/code_generator_x86.h @@ -398,6 +398,18 @@ class CodeGeneratorX86 : public CodeGenerator {    void Finalize(CodeAllocator* allocator) OVERRIDE;   private: +  Register GetInvokeStaticOrDirectExtraParameter(HInvokeStaticOrDirect* invoke, Register temp); + +  struct PcRelativeDexCacheAccessInfo { +    PcRelativeDexCacheAccessInfo(const DexFile& dex_file, uint32_t element_off) +        : target_dex_file(dex_file), element_offset(element_off), label() { } + +    const DexFile& target_dex_file; +    uint32_t element_offset; +    // NOTE: Label is bound to the end of the instruction that has an embedded 32-bit offset. +    Label label; +  }; +    // Labels for each block that will be compiled.    Label* block_labels_;  // Indexed by block id.    Label frame_entry_label_; @@ -410,6 +422,8 @@ class CodeGeneratorX86 : public CodeGenerator {    // Method patch info. Using ArenaDeque<> which retains element addresses on push/emplace_back().    ArenaDeque<MethodPatchInfo<Label>> method_patches_;    ArenaDeque<MethodPatchInfo<Label>> relative_call_patches_; +  // PC-relative DexCache access info. +  ArenaDeque<PcRelativeDexCacheAccessInfo> pc_relative_dex_cache_patches_;    // Offset to the start of the constant area in the assembled code.    // Used for fixups to the constant area. diff --git a/compiler/optimizing/code_generator_x86_64.cc b/compiler/optimizing/code_generator_x86_64.cc index ee8a299c5e..e2ad6673c7 100644 --- a/compiler/optimizing/code_generator_x86_64.cc +++ b/compiler/optimizing/code_generator_x86_64.cc @@ -514,12 +514,12 @@ void CodeGeneratorX86_64::GenerateStaticOrDirectCall(HInvokeStaticOrDirect* invo        __ Bind(&method_patches_.back().label);  // Bind the label at the end of the "movl" insn.        break;      case HInvokeStaticOrDirect::MethodLoadKind::kDexCachePcRelative: -      pc_rel_dex_cache_patches_.emplace_back(*invoke->GetTargetMethod().dex_file, -                                             invoke->GetDexCacheArrayOffset()); +      pc_relative_dex_cache_patches_.emplace_back(*invoke->GetTargetMethod().dex_file, +                                                  invoke->GetDexCacheArrayOffset());        __ movq(temp.AsRegister<CpuRegister>(),                Address::Absolute(kDummy32BitOffset, false /* no_rip */));        // Bind the label at the end of the "movl" insn. -      __ Bind(&pc_rel_dex_cache_patches_.back().label); +      __ Bind(&pc_relative_dex_cache_patches_.back().label);        break;      case HInvokeStaticOrDirect::MethodLoadKind::kDexCacheViaMethod: {        Location current_method = invoke->GetLocations()->InAt(invoke->GetCurrentMethodInputIndex()); @@ -593,28 +593,27 @@ void CodeGeneratorX86_64::GenerateVirtualCall(HInvokeVirtual* invoke, Location t  void CodeGeneratorX86_64::EmitLinkerPatches(ArenaVector<LinkerPatch>* linker_patches) {    DCHECK(linker_patches->empty());    size_t size = -      method_patches_.size() + relative_call_patches_.size() + pc_rel_dex_cache_patches_.size(); +      method_patches_.size() + +      relative_call_patches_.size() + +      pc_relative_dex_cache_patches_.size();    linker_patches->reserve(size); +  // The label points to the end of the "movl" insn but the literal offset for method +  // patch needs to point to the embedded constant which occupies the last 4 bytes. +  constexpr uint32_t kLabelPositionToLiteralOffsetAdjustment = 4u;    for (const MethodPatchInfo<Label>& info : method_patches_) { -    // The label points to the end of the "movl" instruction but the literal offset for method -    // patch x86 needs to point to the embedded constant which occupies the last 4 bytes. -    uint32_t literal_offset = info.label.Position() - 4; +    uint32_t literal_offset = info.label.Position() - kLabelPositionToLiteralOffsetAdjustment;      linker_patches->push_back(LinkerPatch::MethodPatch(literal_offset,                                                         info.target_method.dex_file,                                                         info.target_method.dex_method_index));    }    for (const MethodPatchInfo<Label>& info : relative_call_patches_) { -    // The label points to the end of the "call" instruction but the literal offset for method -    // patch x86 needs to point to the embedded constant which occupies the last 4 bytes. -    uint32_t literal_offset = info.label.Position() - 4; +    uint32_t literal_offset = info.label.Position() - kLabelPositionToLiteralOffsetAdjustment;      linker_patches->push_back(LinkerPatch::RelativeCodePatch(literal_offset,                                                               info.target_method.dex_file,                                                               info.target_method.dex_method_index));    } -  for (const PcRelativeDexCacheAccessInfo& info : pc_rel_dex_cache_patches_) { -    // The label points to the end of the "mov" instruction but the literal offset for method -    // patch x86 needs to point to the embedded constant which occupies the last 4 bytes. -    uint32_t literal_offset = info.label.Position() - 4; +  for (const PcRelativeDexCacheAccessInfo& info : pc_relative_dex_cache_patches_) { +    uint32_t literal_offset = info.label.Position() - kLabelPositionToLiteralOffsetAdjustment;      linker_patches->push_back(LinkerPatch::DexCacheArrayPatch(literal_offset,                                                                &info.target_dex_file,                                                                info.label.Position(), @@ -695,7 +694,7 @@ CodeGeneratorX86_64::CodeGeneratorX86_64(HGraph* graph,          constant_area_start_(0),          method_patches_(graph->GetArena()->Adapter(kArenaAllocCodeGenerator)),          relative_call_patches_(graph->GetArena()->Adapter(kArenaAllocCodeGenerator)), -        pc_rel_dex_cache_patches_(graph->GetArena()->Adapter(kArenaAllocCodeGenerator)), +        pc_relative_dex_cache_patches_(graph->GetArena()->Adapter(kArenaAllocCodeGenerator)),          fixups_to_jump_tables_(graph->GetArena()->Adapter(kArenaAllocCodeGenerator)) {    AddAllocatedRegister(Location::RegisterLocation(kFakeReturnRegister));  } diff --git a/compiler/optimizing/code_generator_x86_64.h b/compiler/optimizing/code_generator_x86_64.h index 7a52473408..708450835d 100644 --- a/compiler/optimizing/code_generator_x86_64.h +++ b/compiler/optimizing/code_generator_x86_64.h @@ -401,7 +401,7 @@ class CodeGeneratorX86_64 : public CodeGenerator {    ArenaDeque<MethodPatchInfo<Label>> method_patches_;    ArenaDeque<MethodPatchInfo<Label>> relative_call_patches_;    // PC-relative DexCache access info. -  ArenaDeque<PcRelativeDexCacheAccessInfo> pc_rel_dex_cache_patches_; +  ArenaDeque<PcRelativeDexCacheAccessInfo> pc_relative_dex_cache_patches_;    // When we don't know the proper offset for the value, we use kDummy32BitOffset.    // We will fix this up in the linker later to have the right value. diff --git a/compiler/optimizing/nodes.cc b/compiler/optimizing/nodes.cc index de3f2668b6..83f53d791b 100644 --- a/compiler/optimizing/nodes.cc +++ b/compiler/optimizing/nodes.cc @@ -1972,6 +1972,16 @@ bool HInvokeStaticOrDirect::NeedsDexCacheOfDeclaringClass() const {    return !opt.GetDoesNotNeedDexCache();  } +void HInvokeStaticOrDirect::InsertInputAt(size_t index, HInstruction* input) { +  inputs_.insert(inputs_.begin() + index, HUserRecord<HInstruction*>(input)); +  input->AddUseAt(this, index); +  // Update indexes in use nodes of inputs that have been pushed further back by the insert(). +  for (size_t i = index + 1u, size = inputs_.size(); i != size; ++i) { +    DCHECK_EQ(InputRecordAt(i).GetUseNode()->GetIndex(), i - 1u); +    InputRecordAt(i).GetUseNode()->SetIndex(i); +  } +} +  void HInvokeStaticOrDirect::RemoveInputAt(size_t index) {    RemoveAsUserOfInput(index);    inputs_.erase(inputs_.begin() + index); diff --git a/compiler/optimizing/nodes.h b/compiler/optimizing/nodes.h index ab53e63300..4c4d0f268d 100644 --- a/compiler/optimizing/nodes.h +++ b/compiler/optimizing/nodes.h @@ -3436,6 +3436,7 @@ class HInvokeStaticOrDirect : public HInvoke {      dispatch_info_ = dispatch_info;    } +  void InsertInputAt(size_t index, HInstruction* input);    void RemoveInputAt(size_t index);    bool CanDoImplicitNullCheckOn(HInstruction* obj ATTRIBUTE_UNUSED) const OVERRIDE { @@ -3456,7 +3457,7 @@ class HInvokeStaticOrDirect : public HInvoke {    bool IsStringInit() const { return GetMethodLoadKind() == MethodLoadKind::kStringInit; }    uint32_t GetCurrentMethodInputIndex() const { return GetNumberOfArguments(); }    bool HasMethodAddress() const { return GetMethodLoadKind() == MethodLoadKind::kDirectAddress; } -  bool HasPcRelDexCache() const { +  bool HasPcRelativeDexCache() const {      return GetMethodLoadKind() == MethodLoadKind::kDexCachePcRelative;    }    bool HasCurrentMethodInput() const { @@ -3484,7 +3485,7 @@ class HInvokeStaticOrDirect : public HInvoke {    }    uint32_t GetDexCacheArrayOffset() const { -    DCHECK(HasPcRelDexCache()); +    DCHECK(HasPcRelativeDexCache());      return dispatch_info_.method_load_data;    } diff --git a/compiler/optimizing/optimizing_compiler.cc b/compiler/optimizing/optimizing_compiler.cc index 7e3c5e602e..6e85a82849 100644 --- a/compiler/optimizing/optimizing_compiler.cc +++ b/compiler/optimizing/optimizing_compiler.cc @@ -24,7 +24,7 @@  #endif  #ifdef ART_ENABLE_CODEGEN_x86 -#include "constant_area_fixups_x86.h" +#include "pc_relative_fixups_x86.h"  #endif  #include "art_method-inl.h" @@ -446,10 +446,9 @@ static void RunArchOptimizations(InstructionSet instruction_set,  #endif  #ifdef ART_ENABLE_CODEGEN_x86      case kX86: { -      x86::ConstantAreaFixups* constant_area_fixups = -          new (arena) x86::ConstantAreaFixups(graph, stats); +      x86::PcRelativeFixups* pc_relative_fixups = new (arena) x86::PcRelativeFixups(graph, stats);        HOptimization* x86_optimizations[] = { -        constant_area_fixups +          pc_relative_fixups        };        RunOptimizations(x86_optimizations, arraysize(x86_optimizations), pass_observer);        break; diff --git a/compiler/optimizing/constant_area_fixups_x86.cc b/compiler/optimizing/pc_relative_fixups_x86.cc index c3470002c5..c2894c7338 100644 --- a/compiler/optimizing/constant_area_fixups_x86.cc +++ b/compiler/optimizing/pc_relative_fixups_x86.cc @@ -14,7 +14,7 @@   * limitations under the License.   */ -#include "constant_area_fixups_x86.h" +#include "pc_relative_fixups_x86.h"  namespace art {  namespace x86 { @@ -22,9 +22,9 @@ namespace x86 {  /**   * Finds instructions that need the constant area base as an input.   */ -class ConstantHandlerVisitor : public HGraphVisitor { +class PCRelativeHandlerVisitor : public HGraphVisitor {   public: -  explicit ConstantHandlerVisitor(HGraph* graph) : HGraphVisitor(graph), base_(nullptr) {} +  explicit PCRelativeHandlerVisitor(HGraph* graph) : HGraphVisitor(graph), base_(nullptr) {}   private:    void VisitAdd(HAdd* add) OVERRIDE { @@ -72,7 +72,7 @@ class ConstantHandlerVisitor : public HGraphVisitor {    void VisitPackedSwitch(HPackedSwitch* switch_insn) OVERRIDE {      // We need to replace the HPackedSwitch with a HX86PackedSwitch in order to      // address the constant area. -    InitializeConstantAreaPointer(switch_insn); +    InitializePCRelativeBasePointer(switch_insn);      HGraph* graph = GetGraph();      HBasicBlock* block = switch_insn->GetBlock();      HX86PackedSwitch* x86_switch = new (graph->GetArena()) HX86PackedSwitch( @@ -84,7 +84,7 @@ class ConstantHandlerVisitor : public HGraphVisitor {      block->ReplaceAndRemoveInstructionWith(switch_insn, x86_switch);    } -  void InitializeConstantAreaPointer(HInstruction* user) { +  void InitializePCRelativeBasePointer(HInstruction* user) {      // Ensure we only initialize the pointer once.      if (base_ != nullptr) {        return; @@ -99,16 +99,24 @@ class ConstantHandlerVisitor : public HGraphVisitor {    }    void ReplaceInput(HInstruction* insn, HConstant* value, int input_index, bool materialize) { -    InitializeConstantAreaPointer(insn); -    HGraph* graph = GetGraph(); -    HBasicBlock* block = insn->GetBlock(); +    InitializePCRelativeBasePointer(insn);      HX86LoadFromConstantTable* load_constant = -        new (graph->GetArena()) HX86LoadFromConstantTable(base_, value, materialize); -    block->InsertInstructionBefore(load_constant, insn); +        new (GetGraph()->GetArena()) HX86LoadFromConstantTable(base_, value, materialize); +    insn->GetBlock()->InsertInstructionBefore(load_constant, insn);      insn->ReplaceInput(load_constant, input_index);    }    void HandleInvoke(HInvoke* invoke) { +    // If this is an invoke-static/-direct with PC-relative dex cache array +    // addressing, we need the PC-relative address base. +    HInvokeStaticOrDirect* invoke_static_or_direct = invoke->AsInvokeStaticOrDirect(); +    if (invoke_static_or_direct != nullptr && invoke_static_or_direct->HasPcRelativeDexCache()) { +      InitializePCRelativeBasePointer(invoke); +      // Add the extra parameter base_. +      uint32_t index = invoke_static_or_direct->GetCurrentMethodInputIndex(); +      DCHECK(!invoke_static_or_direct->HasCurrentMethodInput()); +      invoke_static_or_direct->InsertInputAt(index, base_); +    }      // Ensure that we can load FP arguments from the constant area.      for (size_t i = 0, e = invoke->InputCount(); i < e; i++) {        HConstant* input = invoke->InputAt(i)->AsConstant(); @@ -123,8 +131,8 @@ class ConstantHandlerVisitor : public HGraphVisitor {    HX86ComputeBaseMethodAddress* base_;  }; -void ConstantAreaFixups::Run() { -  ConstantHandlerVisitor visitor(graph_); +void PcRelativeFixups::Run() { +  PCRelativeHandlerVisitor visitor(graph_);    visitor.VisitInsertionOrder();  } diff --git a/compiler/optimizing/constant_area_fixups_x86.h b/compiler/optimizing/pc_relative_fixups_x86.h index 4138039cdd..af708acb03 100644 --- a/compiler/optimizing/constant_area_fixups_x86.h +++ b/compiler/optimizing/pc_relative_fixups_x86.h @@ -14,8 +14,8 @@   * limitations under the License.   */ -#ifndef ART_COMPILER_OPTIMIZING_CONSTANT_AREA_FIXUPS_X86_H_ -#define ART_COMPILER_OPTIMIZING_CONSTANT_AREA_FIXUPS_X86_H_ +#ifndef ART_COMPILER_OPTIMIZING_PC_RELATIVE_FIXUPS_X86_H_ +#define ART_COMPILER_OPTIMIZING_PC_RELATIVE_FIXUPS_X86_H_  #include "nodes.h"  #include "optimization.h" @@ -23,10 +23,10 @@  namespace art {  namespace x86 { -class ConstantAreaFixups : public HOptimization { +class PcRelativeFixups : public HOptimization {   public: -  ConstantAreaFixups(HGraph* graph, OptimizingCompilerStats* stats) -      : HOptimization(graph, "constant_area_fixups_x86", stats) {} +  PcRelativeFixups(HGraph* graph, OptimizingCompilerStats* stats) +      : HOptimization(graph, "pc_relative_fixups_x86", stats) {}    void Run() OVERRIDE;  }; @@ -34,4 +34,4 @@ class ConstantAreaFixups : public HOptimization {  }  // namespace x86  }  // namespace art -#endif  // ART_COMPILER_OPTIMIZING_CONSTANT_AREA_FIXUPS_X86_H_ +#endif  // ART_COMPILER_OPTIMIZING_PC_RELATIVE_FIXUPS_X86_H_ |