summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
-rw-r--r--compiler/jit/jit_compiler.cc4
-rw-r--r--compiler/jit/jit_compiler.h2
-rw-r--r--compiler/optimizing/code_generator_arm64.cc3
-rw-r--r--compiler/optimizing/code_generator_arm_vixl.cc3
-rw-r--r--compiler/optimizing/code_generator_riscv64.cc3
-rw-r--r--compiler/optimizing/code_generator_x86.cc3
-rw-r--r--compiler/optimizing/code_generator_x86_64.cc3
-rw-r--r--compiler/optimizing/graph_visualizer.cc3
-rw-r--r--compiler/optimizing/inliner.cc68
-rw-r--r--compiler/optimizing/inliner.h12
-rw-r--r--compiler/optimizing/optimization.cc1
-rw-r--r--compiler/optimizing/optimizing_compiler.cc36
-rw-r--r--compiler/optimizing/profiling_info_builder.cc59
-rw-r--r--compiler/optimizing/profiling_info_builder.h10
-rw-r--r--runtime/jit/jit.h1
-rw-r--r--runtime/jit/profiling_info.cc38
-rw-r--r--runtime/jit/profiling_info.h13
-rw-r--r--runtime/quick_exception_handler.cc43
18 files changed, 256 insertions, 49 deletions
diff --git a/compiler/jit/jit_compiler.cc b/compiler/jit/jit_compiler.cc
index 523a666f8a..c14d5d37e8 100644
--- a/compiler/jit/jit_compiler.cc
+++ b/compiler/jit/jit_compiler.cc
@@ -226,5 +226,9 @@ bool JitCompiler::IsBaselineCompiler() const {
return compiler_options_->IsBaseline();
}
+// Returns the inline-max-code-units setting held by `compiler_options_`, so that callers
+// going through `JitCompilerInterface` can read it.
+uint32_t JitCompiler::GetInlineMaxCodeUnits() const {
+ return compiler_options_->GetInlineMaxCodeUnits();
+}
+
} // namespace jit
} // namespace art
diff --git a/compiler/jit/jit_compiler.h b/compiler/jit/jit_compiler.h
index 5a919fb612..66aa545dd7 100644
--- a/compiler/jit/jit_compiler.h
+++ b/compiler/jit/jit_compiler.h
@@ -64,6 +64,8 @@ class JitCompiler : public JitCompilerInterface {
bool compress,
/*out*/ size_t* num_symbols) override;
+ uint32_t GetInlineMaxCodeUnits() const override;
+
private:
std::unique_ptr<CompilerOptions> compiler_options_;
std::unique_ptr<Compiler> compiler_;
diff --git a/compiler/optimizing/code_generator_arm64.cc b/compiler/optimizing/code_generator_arm64.cc
index 9027976165..907fdc04fa 100644
--- a/compiler/optimizing/code_generator_arm64.cc
+++ b/compiler/optimizing/code_generator_arm64.cc
@@ -4597,7 +4597,8 @@ void CodeGeneratorARM64::MaybeGenerateInlineCacheCheck(HInstruction* instruction
if (ProfilingInfoBuilder::IsInlineCacheUseful(instruction->AsInvoke(), this)) {
ProfilingInfo* info = GetGraph()->GetProfilingInfo();
DCHECK(info != nullptr);
- InlineCache* cache = ProfilingInfoBuilder::GetInlineCache(info, instruction->AsInvoke());
+ InlineCache* cache = ProfilingInfoBuilder::GetInlineCache(
+ info, GetCompilerOptions(), instruction->AsInvoke());
if (cache != nullptr) {
uint64_t address = reinterpret_cast64<uint64_t>(cache);
vixl::aarch64::Label done;
diff --git a/compiler/optimizing/code_generator_arm_vixl.cc b/compiler/optimizing/code_generator_arm_vixl.cc
index 00c14b0b46..144be63c6c 100644
--- a/compiler/optimizing/code_generator_arm_vixl.cc
+++ b/compiler/optimizing/code_generator_arm_vixl.cc
@@ -3687,7 +3687,8 @@ void CodeGeneratorARMVIXL::MaybeGenerateInlineCacheCheck(HInstruction* instructi
DCHECK_EQ(r0.GetCode(), klass.GetCode());
if (ProfilingInfoBuilder::IsInlineCacheUseful(instruction->AsInvoke(), this)) {
ProfilingInfo* info = GetGraph()->GetProfilingInfo();
- InlineCache* cache = ProfilingInfoBuilder::GetInlineCache(info, instruction->AsInvoke());
+ InlineCache* cache = ProfilingInfoBuilder::GetInlineCache(
+ info, GetCompilerOptions(), instruction->AsInvoke());
if (cache != nullptr) {
uint32_t address = reinterpret_cast32<uint32_t>(cache);
vixl32::Label done;
diff --git a/compiler/optimizing/code_generator_riscv64.cc b/compiler/optimizing/code_generator_riscv64.cc
index 182c1d4d05..9627fd2a5a 100644
--- a/compiler/optimizing/code_generator_riscv64.cc
+++ b/compiler/optimizing/code_generator_riscv64.cc
@@ -6724,7 +6724,8 @@ void CodeGeneratorRISCV64::MaybeGenerateInlineCacheCheck(HInstruction* instructi
if (ProfilingInfoBuilder::IsInlineCacheUseful(instruction->AsInvoke(), this)) {
ProfilingInfo* info = GetGraph()->GetProfilingInfo();
DCHECK(info != nullptr);
- InlineCache* cache = ProfilingInfoBuilder::GetInlineCache(info, instruction->AsInvoke());
+ InlineCache* cache = ProfilingInfoBuilder::GetInlineCache(
+ info, GetCompilerOptions(), instruction->AsInvoke());
if (cache != nullptr) {
uint64_t address = reinterpret_cast64<uint64_t>(cache);
Riscv64Label done;
diff --git a/compiler/optimizing/code_generator_x86.cc b/compiler/optimizing/code_generator_x86.cc
index 71db5c99af..95f4c7389d 100644
--- a/compiler/optimizing/code_generator_x86.cc
+++ b/compiler/optimizing/code_generator_x86.cc
@@ -2848,7 +2848,8 @@ void CodeGeneratorX86::MaybeGenerateInlineCacheCheck(HInstruction* instruction,
if (ProfilingInfoBuilder::IsInlineCacheUseful(instruction->AsInvoke(), this)) {
ProfilingInfo* info = GetGraph()->GetProfilingInfo();
DCHECK(info != nullptr);
- InlineCache* cache = ProfilingInfoBuilder::GetInlineCache(info, instruction->AsInvoke());
+ InlineCache* cache = ProfilingInfoBuilder::GetInlineCache(
+ info, GetCompilerOptions(), instruction->AsInvoke());
if (cache != nullptr) {
uint32_t address = reinterpret_cast32<uint32_t>(cache);
if (kIsDebugBuild) {
diff --git a/compiler/optimizing/code_generator_x86_64.cc b/compiler/optimizing/code_generator_x86_64.cc
index 81ffa9876c..d43d3dd95f 100644
--- a/compiler/optimizing/code_generator_x86_64.cc
+++ b/compiler/optimizing/code_generator_x86_64.cc
@@ -3098,7 +3098,8 @@ void CodeGeneratorX86_64::MaybeGenerateInlineCacheCheck(HInstruction* instructio
if (ProfilingInfoBuilder::IsInlineCacheUseful(instruction->AsInvoke(), this)) {
ProfilingInfo* info = GetGraph()->GetProfilingInfo();
DCHECK(info != nullptr);
- InlineCache* cache = ProfilingInfoBuilder::GetInlineCache(info, instruction->AsInvoke());
+ InlineCache* cache = ProfilingInfoBuilder::GetInlineCache(
+ info, GetCompilerOptions(), instruction->AsInvoke());
if (cache != nullptr) {
uint64_t address = reinterpret_cast64<uint64_t>(cache);
NearLabel done;
diff --git a/compiler/optimizing/graph_visualizer.cc b/compiler/optimizing/graph_visualizer.cc
index b7f7a0f550..afbf941355 100644
--- a/compiler/optimizing/graph_visualizer.cc
+++ b/compiler/optimizing/graph_visualizer.cc
@@ -867,7 +867,8 @@ class HGraphVisualizerPrinter : public HGraphDelegateVisitor {
std::ostringstream oss;
oss << pass_name_;
if (!IsDebugDump()) {
- oss << " (" << (is_after_pass_ ? "after" : "before")
+ oss << " (" << (GetGraph()->IsCompilingBaseline() ? "baseline " : "")
+ << (is_after_pass_ ? "after" : "before")
<< (graph_in_bad_state_ ? ", bad_state" : "") << ")";
}
PrintProperty("name", oss.str().c_str());
diff --git a/compiler/optimizing/inliner.cc b/compiler/optimizing/inliner.cc
index 37fa318403..d86e3b55c8 100644
--- a/compiler/optimizing/inliner.cc
+++ b/compiler/optimizing/inliner.cc
@@ -37,6 +37,7 @@
#include "mirror/object_array-alloc-inl.h"
#include "mirror/object_array-inl.h"
#include "nodes.h"
+#include "profiling_info_builder.h"
#include "reference_type_propagation.h"
#include "register_allocator_linear_scan.h"
#include "scoped_thread_state_change-inl.h"
@@ -519,6 +520,15 @@ bool HInliner::TryInline(HInvoke* invoke_instruction) {
return result;
}
+ if (graph_->IsCompilingBaseline()) {
+ LOG_FAIL_NO_STAT() << "Call to " << invoke_instruction->GetMethodReference().PrettyMethod()
+ << " not inlined because we are compiling baseline and we could not"
+ << " statically resolve the target";
+ // For baseline compilation, we will collect inline caches, so we should not
+ // try to inline using them.
+ return false;
+ }
+
DCHECK(!invoke_instruction->IsInvokeStaticOrDirect());
// No try catch inlining allowed here, or recursively. For try catch inlining we are banking on
@@ -669,17 +679,36 @@ HInliner::InlineCacheType HInliner::GetInlineCacheJIT(
ArtMethod* caller = graph_->GetArtMethod();
// Under JIT, we should always know the caller.
DCHECK(caller != nullptr);
- ProfilingInfo* profiling_info = graph_->GetProfilingInfo();
- if (profiling_info == nullptr) {
- return kInlineCacheNoData;
+
+ InlineCache* cache = nullptr;
+ // Start with the outer graph profiling info.
+ ProfilingInfo* profiling_info = outermost_graph_->GetProfilingInfo();
+ if (profiling_info != nullptr) {
+ if (depth_ == 0) {
+ cache = profiling_info->GetInlineCache(invoke_instruction->GetDexPc());
+ } else {
+ uint32_t dex_pc = ProfilingInfoBuilder::EncodeInlinedDexPc(
+ this, codegen_->GetCompilerOptions(), invoke_instruction);
+ if (dex_pc != kNoDexPc) {
+ cache = profiling_info->GetInlineCache(dex_pc);
+ }
+ }
+ }
+
+ if (cache == nullptr) {
+ // Check the current graph profiling info.
+ profiling_info = graph_->GetProfilingInfo();
+ if (profiling_info == nullptr) {
+ return kInlineCacheNoData;
+ }
+
+ cache = profiling_info->GetInlineCache(invoke_instruction->GetDexPc());
}
- InlineCache* cache = profiling_info->GetInlineCache(invoke_instruction->GetDexPc());
if (cache == nullptr) {
- // This shouldn't happen, but we don't guarantee that method resolution
- // between baseline compilation and optimizing compilation is identical. Be robust,
- // warn about it, and return that we don't have any inline cache data.
- LOG(WARNING) << "No inline cache found for " << caller->PrettyMethod();
+ // Either we never hit this invoke and we never compiled the callee,
+ // or the method wasn't resolved when we performed baseline compilation.
+ // Bail for now.
return kInlineCacheNoData;
}
Runtime::Current()->GetJit()->GetCodeCache()->CopyInlineCacheInto(*cache, classes);
@@ -705,6 +734,12 @@ HInliner::InlineCacheType HInliner::GetInlineCacheAOT(
const ProfileCompilationInfo::InlineCacheMap* inline_caches = hotness.GetInlineCacheMap();
DCHECK(inline_caches != nullptr);
+
+ // Inlined inline caches are not supported in AOT, so we use the dex pc directly, and don't
+ // call `InlineCache::EncodeDexPc`.
+ // To support it, we would need to ensure `inline_max_code_units` remains the
+ // same between dex2oat and runtime, for example by adding it to the boot
+ // image oat header.
const auto it = inline_caches->find(invoke_instruction->GetDexPc());
if (it == inline_caches->end()) {
return kInlineCacheUninitialized;
@@ -2074,6 +2109,20 @@ bool HInliner::CanInlineBody(const HGraph* callee_graph,
<< " could not be inlined because it needs a BSS check";
return false;
}
+
+ if (outermost_graph_->IsCompilingBaseline() &&
+ (current->IsInvokeVirtual() || current->IsInvokeInterface()) &&
+ ProfilingInfoBuilder::IsInlineCacheUseful(current->AsInvoke(), codegen_)) {
+ uint32_t maximum_inlining_depth_for_baseline =
+ InlineCache::MaxDexPcEncodingDepth(
+ outermost_graph_->GetArtMethod(),
+ codegen_->GetCompilerOptions().GetInlineMaxCodeUnits());
+ if (depth_ + 1 > maximum_inlining_depth_for_baseline) {
+ LOG_FAIL_NO_STAT() << "Reached maximum depth for inlining in baseline compilation: "
+ << depth_ << " for " << callee_graph->GetArtMethod()->PrettyMethod();
+ return false;
+ }
+ }
}
}
@@ -2185,6 +2234,7 @@ bool HInliner::TryBuildAndInlineHelper(HInvoke* invoke_instruction,
// The current invoke is not a try block.
!invoke_instruction->GetBlock()->IsTryBlock();
RunOptimizations(callee_graph,
+ invoke_instruction->GetEnvironment(),
code_item,
dex_compilation_unit,
try_catch_inlining_allowed_for_recursive_inline);
@@ -2224,6 +2274,7 @@ bool HInliner::TryBuildAndInlineHelper(HInvoke* invoke_instruction,
}
void HInliner::RunOptimizations(HGraph* callee_graph,
+ HEnvironment* caller_environment,
const dex::CodeItem* code_item,
const DexCompilationUnit& dex_compilation_unit,
bool try_catch_inlining_allowed_for_recursive_inline) {
@@ -2272,6 +2323,7 @@ void HInliner::RunOptimizations(HGraph* callee_graph,
total_number_of_dex_registers_ + accessor.RegistersSize(),
total_number_of_instructions_ + number_of_instructions,
this,
+ caller_environment,
depth_ + 1,
try_catch_inlining_allowed_for_recursive_inline);
inliner.Run();
diff --git a/compiler/optimizing/inliner.h b/compiler/optimizing/inliner.h
index af067dae73..a001404268 100644
--- a/compiler/optimizing/inliner.h
+++ b/compiler/optimizing/inliner.h
@@ -43,6 +43,7 @@ class HInliner : public HOptimization {
size_t total_number_of_dex_registers,
size_t total_number_of_instructions,
HInliner* parent,
+ HEnvironment* caller_environment,
size_t depth,
bool try_catch_inlining_allowed,
const char* name = kInlinerPassName)
@@ -54,6 +55,7 @@ class HInliner : public HOptimization {
total_number_of_dex_registers_(total_number_of_dex_registers),
total_number_of_instructions_(total_number_of_instructions),
parent_(parent),
+ caller_environment_(caller_environment),
depth_(depth),
inlining_budget_(0),
try_catch_inlining_allowed_(try_catch_inlining_allowed),
@@ -63,6 +65,12 @@ class HInliner : public HOptimization {
static constexpr const char* kInlinerPassName = "inliner";
+ // The inliner that requested `graph_` to be inlined; the top-level inliner is constructed
+ // with a null parent.
+ const HInliner* GetParent() const { return parent_; }
+ // The environment passed at construction: for a nested inliner this is the environment of
+ // the invoke being inlined, for the top-level inliner it is null.
+ const HEnvironment* GetCallerEnvironment() const { return caller_environment_; }
+
+ // Read-only access to `outermost_graph_`.
+ const HGraph* GetOutermostGraph() const { return outermost_graph_; }
+ // Read-only access to `graph_`, the graph this inliner works on.
+ const HGraph* GetGraph() const { return graph_; }
+
private:
enum InlineCacheType {
kInlineCacheNoData = 0,
@@ -108,6 +116,7 @@ class HInliner : public HOptimization {
// Run simple optimizations on `callee_graph`.
void RunOptimizations(HGraph* callee_graph,
+ HEnvironment* caller_environment,
const dex::CodeItem* code_item,
const DexCompilationUnit& dex_compilation_unit,
bool try_catch_inlining_allowed_for_recursive_inline)
@@ -320,9 +329,10 @@ class HInliner : public HOptimization {
const size_t total_number_of_dex_registers_;
size_t total_number_of_instructions_;
- // The 'parent' inliner, that means the inlinigng optimization that requested
+ // The 'parent' inliner, that means the inlining optimization that requested
// `graph_` to be inlined.
const HInliner* const parent_;
+ const HEnvironment* const caller_environment_;
const size_t depth_;
// The budget left for inlining, in number of instructions.
diff --git a/compiler/optimizing/optimization.cc b/compiler/optimizing/optimization.cc
index 16045d447c..a4df48c0ee 100644
--- a/compiler/optimizing/optimization.cc
+++ b/compiler/optimizing/optimization.cc
@@ -257,6 +257,7 @@ ArenaVector<HOptimization*> ConstructOptimizations(
accessor.RegistersSize(),
/* total_number_of_instructions= */ 0,
/* parent= */ nullptr,
+ /* caller_environment= */ nullptr,
/* depth= */ 0,
/* try_catch_inlining_allowed= */ true,
pass_name);
diff --git a/compiler/optimizing/optimizing_compiler.cc b/compiler/optimizing/optimizing_compiler.cc
index d458462226..5868f22ab8 100644
--- a/compiler/optimizing/optimizing_compiler.cc
+++ b/compiler/optimizing/optimizing_compiler.cc
@@ -368,10 +368,10 @@ class OptimizingCompiler final : public Compiler {
const DexCompilationUnit& dex_compilation_unit,
PassObserver* pass_observer) const;
- bool RunBaselineOptimizations(HGraph* graph,
- CodeGenerator* codegen,
- const DexCompilationUnit& dex_compilation_unit,
- PassObserver* pass_observer) const;
+ bool RunRequiredPasses(HGraph* graph,
+ CodeGenerator* codegen,
+ const DexCompilationUnit& dex_compilation_unit,
+ PassObserver* pass_observer) const;
std::vector<uint8_t> GenerateJitDebugInfo(const debug::MethodDebugInfo& method_debug_info);
@@ -444,10 +444,10 @@ static bool IsInstructionSetSupported(InstructionSet instruction_set) {
instruction_set == InstructionSet::kX86_64;
}
-bool OptimizingCompiler::RunBaselineOptimizations(HGraph* graph,
- CodeGenerator* codegen,
- const DexCompilationUnit& dex_compilation_unit,
- PassObserver* pass_observer) const {
+bool OptimizingCompiler::RunRequiredPasses(HGraph* graph,
+ CodeGenerator* codegen,
+ const DexCompilationUnit& dex_compilation_unit,
+ PassObserver* pass_observer) const {
switch (codegen->GetCompilerOptions().GetInstructionSet()) {
#if defined(ART_ENABLE_CODEGEN_arm)
case InstructionSet::kThumb2:
@@ -904,21 +904,15 @@ CodeGenerator* OptimizingCompiler::TryCompile(ArenaAllocator* allocator,
}
}
- if (compilation_kind == CompilationKind::kBaseline) {
- RunBaselineOptimizations(graph, codegen.get(), dex_compilation_unit, &pass_observer);
+ if (compilation_kind == CompilationKind::kBaseline && compiler_options.ProfileBranches()) {
+ // Branch profiling currently doesn't support running optimizations.
+ RunRequiredPasses(graph, codegen.get(), dex_compilation_unit, &pass_observer);
} else {
RunOptimizations(graph, codegen.get(), dex_compilation_unit, &pass_observer);
PassScope scope(WriteBarrierElimination::kWBEPassName, &pass_observer);
WriteBarrierElimination(graph, compilation_stats_.get()).Run();
}
- RegisterAllocator::Strategy regalloc_strategy =
- compiler_options.GetRegisterAllocationStrategy();
- AllocateRegisters(graph,
- codegen.get(),
- &pass_observer,
- regalloc_strategy,
- compilation_stats_.get());
// If we are compiling baseline and we haven't created a profiling info for
// this method already, do it now.
if (jit != nullptr &&
@@ -935,6 +929,14 @@ CodeGenerator* OptimizingCompiler::TryCompile(ArenaAllocator* allocator,
}
}
+ RegisterAllocator::Strategy regalloc_strategy =
+ compiler_options.GetRegisterAllocationStrategy();
+ AllocateRegisters(graph,
+ codegen.get(),
+ &pass_observer,
+ regalloc_strategy,
+ compilation_stats_.get());
+
codegen->Compile();
pass_observer.DumpDisassembly();
diff --git a/compiler/optimizing/profiling_info_builder.cc b/compiler/optimizing/profiling_info_builder.cc
index 7888753830..19795f5466 100644
--- a/compiler/optimizing/profiling_info_builder.cc
+++ b/compiler/optimizing/profiling_info_builder.cc
@@ -20,6 +20,7 @@
#include "code_generator.h"
#include "driver/compiler_options.h"
#include "dex/code_item_accessors-inl.h"
+#include "inliner.h"
#include "jit/profiling_info.h"
#include "optimizing_compiler_stats.h"
#include "scoped_thread_state_change-inl.h"
@@ -42,10 +43,53 @@ void ProfilingInfoBuilder::Run() {
ProfilingInfo::Create(soa.Self(), GetGraph()->GetArtMethod(), inline_caches_));
}
+
+// Computes the encoded dex pc of `invoke`, which belongs to the graph handled by the nested
+// inliner `inliner`. The invoke's own dex pc is chained with the dex pc of each caller
+// environment found while walking up the parent inliners, and the chain is handed to
+// `InlineCache::EncodeDexPc` together with the method of the outermost graph.
+uint32_t ProfilingInfoBuilder::EncodeInlinedDexPc(const HInliner* inliner,
+                                                  const CompilerOptions& compiler_options,
+                                                  HInvoke* invoke) {
+  DCHECK(inliner->GetCallerEnvironment() != nullptr);
+  DCHECK(inliner->GetParent() != nullptr);
+
+  // Innermost dex pc first, outermost last.
+  std::vector<uint32_t> dex_pc_chain;
+  dex_pc_chain.push_back(invoke->GetDexPc());
+  const HInliner* current = inliner;
+  for (const HEnvironment* caller_env = current->GetCallerEnvironment();
+       caller_env != nullptr;
+       caller_env = current->GetCallerEnvironment()) {
+    dex_pc_chain.push_back(caller_env->GetDexPc());
+    current = current->GetParent();
+  }
+
+  // The walk ends on the inliner that has no caller environment.
+  const HGraph* outermost_graph = current->GetOutermostGraph();
+  DCHECK_EQ(outermost_graph, current->GetGraph());
+  return InlineCache::EncodeDexPc(
+      outermost_graph->GetArtMethod(), dex_pc_chain, compiler_options.GetInlineMaxCodeUnits());
+}
+
+// Encodes the dex pc of `invoke` along with the dex pcs of all its parent environments
+// (innermost first). The method passed to `InlineCache::EncodeDexPc` is the one of the last
+// environment in the parent chain.
+static uint32_t EncodeDexPc(HInvoke* invoke, const CompilerOptions& compiler_options) {
+  std::vector<uint32_t> dex_pc_chain;
+  ArtMethod* outermost_method = nullptr;
+  HEnvironment* env = invoke->GetEnvironment();
+  while (env != nullptr) {
+    // Overwritten on every step so that the last environment visited wins.
+    outermost_method = env->GetMethod();
+    dex_pc_chain.push_back(env->GetDexPc());
+    env = env->GetParent();
+  }
+
+  ScopedObjectAccess soa(Thread::Current());
+  const uint32_t inline_max_code_units = compiler_options.GetInlineMaxCodeUnits();
+  return InlineCache::EncodeDexPc(outermost_method, dex_pc_chain, inline_max_code_units);
+}
+
+// Registers an inline cache for `invoke` when `IsInlineCacheUseful` reports that one is
+// needed. The cache is keyed by the encoded dex pc computed by `EncodeDexPc`.
void ProfilingInfoBuilder::HandleInvoke(HInvoke* invoke) {
- DCHECK(!invoke->GetEnvironment()->IsFromInlinedInvoke());
if (IsInlineCacheUseful(invoke, codegen_)) {
- inline_caches_.push_back(invoke->GetDexPc());
+ uint32_t dex_pc = EncodeDexPc(invoke, compiler_options_);
+ if (dex_pc != kNoDexPc) {
+ inline_caches_.push_back(dex_pc);
+ } else {
+ // The dex pc could not be encoded: no inline cache is registered for this invoke,
+ // and the failure is only reported in the log.
+ ScopedObjectAccess soa(Thread::Current());
+ LOG(WARNING) << "Could not encode dex pc for "
+ << invoke->GetResolvedMethod()->PrettyMethod();
+ }
}
}
}
@@ -81,10 +125,15 @@ bool ProfilingInfoBuilder::IsInlineCacheUseful(HInvoke* invoke, CodeGenerator* c
return true;
}
-InlineCache* ProfilingInfoBuilder::GetInlineCache(ProfilingInfo* info, HInvoke* instruction) {
- DCHECK(!instruction->GetEnvironment()->IsFromInlinedInvoke());
+// Looks up in `info` the inline cache of `instruction`, using its encoded dex pc as the key.
+// Returns nullptr when the dex pc cannot be encoded (`kNoDexPc`); otherwise returns whatever
+// `ProfilingInfo::GetInlineCache` returns for that key.
+InlineCache* ProfilingInfoBuilder::GetInlineCache(ProfilingInfo* info,
+ const CompilerOptions& compiler_options,
+ HInvoke* instruction) {
ScopedObjectAccess soa(Thread::Current());
- return info->GetInlineCache(instruction->GetDexPc());
+ uint32_t dex_pc = EncodeDexPc(instruction, compiler_options);
+ if (dex_pc == kNoDexPc) {
+ return nullptr;
+ }
+ return info->GetInlineCache(dex_pc);
}
} // namespace art
diff --git a/compiler/optimizing/profiling_info_builder.h b/compiler/optimizing/profiling_info_builder.h
index 2185b0eed3..c8dc59a03c 100644
--- a/compiler/optimizing/profiling_info_builder.h
+++ b/compiler/optimizing/profiling_info_builder.h
@@ -24,6 +24,7 @@ namespace art HIDDEN {
class CodeGenerator;
class CompilerOptions;
+class HInliner;
class InlineCache;
class ProfilingInfo;
@@ -42,8 +43,13 @@ class ProfilingInfoBuilder : public HGraphDelegateVisitor {
static constexpr const char* kProfilingInfoBuilderPassName =
"profiling_info_builder";
- static InlineCache* GetInlineCache(ProfilingInfo* info, HInvoke* invoke);
+ static InlineCache* GetInlineCache(ProfilingInfo* info,
+ const CompilerOptions& compiler_options,
+ HInvoke* invoke);
static bool IsInlineCacheUseful(HInvoke* invoke, CodeGenerator* codegen);
+ static uint32_t EncodeInlinedDexPc(
+ const HInliner* inliner, const CompilerOptions& compiler_options, HInvoke* invoke)
+ REQUIRES_SHARED(Locks::mutator_lock_);
private:
void VisitInvokeVirtual(HInvokeVirtual* invoke) override;
@@ -52,7 +58,7 @@ class ProfilingInfoBuilder : public HGraphDelegateVisitor {
void HandleInvoke(HInvoke* invoke);
CodeGenerator* codegen_;
- [[maybe_unused]] const CompilerOptions& compiler_options_;
+ const CompilerOptions& compiler_options_;
std::vector<uint32_t> inline_caches_;
DISALLOW_COPY_AND_ASSIGN(ProfilingInfoBuilder);
diff --git a/runtime/jit/jit.h b/runtime/jit/jit.h
index d5fcd35b3d..2acbbf7416 100644
--- a/runtime/jit/jit.h
+++ b/runtime/jit/jit.h
@@ -197,6 +197,7 @@ class JitCompilerInterface {
virtual void ParseCompilerOptions() = 0;
virtual bool IsBaselineCompiler() const = 0;
virtual void SetDebuggableCompilerOption(bool value) = 0;
+ virtual uint32_t GetInlineMaxCodeUnits() const = 0;
virtual std::vector<uint8_t> PackElfFileForJIT(ArrayRef<const JITCodeEntry*> elf_files,
ArrayRef<const void*> removed_symbols,
diff --git a/runtime/jit/profiling_info.cc b/runtime/jit/profiling_info.cc
index 2e94a41093..1aaf53e0a1 100644
--- a/runtime/jit/profiling_info.cc
+++ b/runtime/jit/profiling_info.cc
@@ -114,6 +114,9 @@ BranchCache* ProfilingInfo::GetBranchCache(uint32_t dex_pc) {
void ProfilingInfo::AddInvokeInfo(uint32_t dex_pc, mirror::Class* cls) {
InlineCache* cache = GetInlineCache(dex_pc);
+ if (cache == nullptr) {
+ return;
+ }
for (size_t i = 0; i < InlineCache::kIndividualCacheSize; ++i) {
mirror::Class* existing = cache->classes_[i].Read<kWithoutReadBarrier>();
mirror::Class* marked = ReadBarrier::IsMarked(existing);
@@ -159,4 +162,39 @@ ScopedProfilingInfoUse::~ScopedProfilingInfoUse() {
}
}
+// Packs `dex_pcs`, ordered from the innermost frame to the outermost one, into a single
+// 32-bit key. The outermost dex pc sits in the low bits, sized from the instruction count of
+// `method`. Each inlined level above it stores its dex pc plus one (so the stored value is
+// non-zero even for dex pc 0) in the next `MinimumBitsToStore(inline_max_code_units)` bits.
+//
+// Returns `static_cast<uint32_t>(-1)` when `dex_pcs` is empty or has more inlined levels
+// than `MaxDexPcEncodingDepth()` allows.
+uint32_t InlineCache::EncodeDexPc(ArtMethod* method,
+                                  const std::vector<uint32_t>& dex_pcs,
+                                  uint32_t inline_max_code_units) {
+  constexpr uint32_t kCannotEncode = static_cast<uint32_t>(-1);
+  if (kIsDebugBuild) {
+    // Make sure `inline_max_code_units` is always the same.
+    static uint32_t global_max_code_units = inline_max_code_units;
+    CHECK_EQ(global_max_code_units, inline_max_code_units);
+  }
+  if (dex_pcs.empty()) {
+    // Stated explicitly instead of relying on `size() - 1` wrapping around.
+    return kCannotEncode;
+  }
+  const size_t size = dex_pcs.size();
+  if (size == 1u) {
+    // No inlined frame: the key is the dex pc itself and no depth limit applies.
+    return dex_pcs[0];
+  }
+  if (size - 1u > MaxDexPcEncodingDepth(method, inline_max_code_units)) {
+    return kCannotEncode;
+  }
+  const uint32_t insns_size = method->DexInstructions().InsnsSizeInCodeUnits();
+  const uint32_t bits_per_level = MinimumBitsToStore(inline_max_code_units);
+
+  // Start from the outermost dex pc and stack each inlined level above it.
+  uint32_t dex_pc = dex_pcs[size - 1u];
+  uint32_t shift = MinimumBitsToStore(insns_size - 1);
+  for (size_t i = size - 1u; i > 0u; --i) {
+    DCHECK_LT(shift, BitSizeOf<uint32_t>());
+    dex_pc += ((dex_pcs[i - 1u] + 1u) << shift);
+    shift += bits_per_level;
+  }
+  return dex_pc;
+}
+
+// Returns how many inlined levels can be stacked on top of a dex pc of `method` inside a
+// 32-bit encoded dex pc, each level taking `MinimumBitsToStore(inline_max_code_units)` bits.
+uint32_t InlineCache::MaxDexPcEncodingDepth(ArtMethod* method, uint32_t inline_max_code_units) {
+  const uint32_t bits_per_level = MinimumBitsToStore(inline_max_code_units);
+  if (bits_per_level == 0u) {
+    // A level without any bit cannot hold a dex pc, and counting levels below would never
+    // run out of room. Report that no inlined level can be encoded.
+    return 0u;
+  }
+  const uint32_t insns_size = method->DexInstructions().InsnsSizeInCodeUnits();
+  // Bits taken by the outermost dex pc.
+  uint32_t num_bits = MinimumBitsToStore(insns_size - 1);
+  uint32_t depth = 0u;
+  // Count the levels that still fit entirely in the remaining bits.
+  while (num_bits + bits_per_level <= BitSizeOf<uint32_t>()) {
+    num_bits += bits_per_level;
+    ++depth;
+  }
+  return depth;
+}
+
} // namespace art
diff --git a/runtime/jit/profiling_info.h b/runtime/jit/profiling_info.h
index 62b431d7a2..4ce20ff66a 100644
--- a/runtime/jit/profiling_info.h
+++ b/runtime/jit/profiling_info.h
@@ -28,6 +28,7 @@
namespace art {
class ArtMethod;
+class CompilerOptions;
class ProfilingInfo;
namespace jit {
@@ -50,6 +51,18 @@ class InlineCache {
return MemberOffset(OFFSETOF_MEMBER(InlineCache, classes_));
}
+ // Encode the list of `dex_pcs` to fit into a uint32_t. `dex_pcs` is ordered from the
+ // innermost frame to the outermost one; the last entry is a dex pc of `method`.
+ // Returns -1 (converted to uint32_t) if the list is too deep to be encoded, see
+ // `MaxDexPcEncodingDepth`.
+ static uint32_t EncodeDexPc(ArtMethod* method,
+ const std::vector<uint32_t>& dex_pcs,
+ uint32_t inline_max_code_units)
+ REQUIRES_SHARED(Locks::mutator_lock_);
+
+ // Return the maximum inlining depth that we support to encode a list of dex
+ // pcs: the number of inlined levels that fit, next to a dex pc of `method`, in a
+ // uint32_t, based on the instruction count of `method` and on `inline_max_code_units`.
+ static uint32_t MaxDexPcEncodingDepth(ArtMethod* method,
+ uint32_t inline_max_code_units)
+ REQUIRES_SHARED(Locks::mutator_lock_);
+
private:
uint32_t dex_pc_;
GcRoot<mirror::Class> classes_[kIndividualCacheSize];
diff --git a/runtime/quick_exception_handler.cc b/runtime/quick_exception_handler.cc
index 590a596c1f..86a2ddabfd 100644
--- a/runtime/quick_exception_handler.cc
+++ b/runtime/quick_exception_handler.cc
@@ -407,6 +407,10 @@ class DeoptimizeStackVisitor final : public StackVisitor {
return bottom_shadow_frame_;
}
+ // Returns the dex pcs recorded, in visiting order, for the frames handled during a
+ // single-frame deoptimization. Nothing is recorded for other kinds of deoptimization.
+ const std::vector<uint32_t>& GetDexPcs() const {
+ return dex_pcs_;
+ }
+
void FinishStackWalk() REQUIRES_SHARED(Locks::mutator_lock_) {
// This is the upcall, or the next full frame in single-frame deopt, or the
// code isn't deoptimizeable. We remember the frame and last pc so that we
@@ -515,11 +519,14 @@ class DeoptimizeStackVisitor final : public StackVisitor {
}
prev_shadow_frame_ = new_frame;
- if (single_frame_deopt_ && !IsInInlinedFrame()) {
- // Single-frame deopt ends at the first non-inlined frame and needs to store that method.
- single_frame_done_ = true;
- single_frame_deopt_method_ = method;
- single_frame_deopt_quick_method_header_ = GetCurrentOatQuickMethodHeader();
+ if (single_frame_deopt_) {
+ dex_pcs_.push_back(GetDexPc());
+ if (!IsInInlinedFrame()) {
+ // Single-frame deopt ends at the first non-inlined frame and needs to store that method.
+ single_frame_done_ = true;
+ single_frame_deopt_method_ = method;
+ single_frame_deopt_quick_method_header_ = GetCurrentOatQuickMethodHeader();
+ }
}
callee_method_ = method;
return true;
@@ -659,6 +666,7 @@ class DeoptimizeStackVisitor final : public StackVisitor {
// a deopt after running method exit callbacks if the callback throws or requests events that
// need a deopt.
bool skip_method_exit_callbacks_;
+ std::vector<uint32_t> dex_pcs_;
DISALLOW_COPY_AND_ASSIGN(DeoptimizeStackVisitor);
};
@@ -739,11 +747,26 @@ void QuickExceptionHandler::DeoptimizeSingleFrame(DeoptimizationKind kind) {
case Instruction::INVOKE_VIRTUAL:
case Instruction::INVOKE_INTERFACE_RANGE:
case Instruction::INVOKE_VIRTUAL_RANGE: {
- runtime->GetJit()->GetCodeCache()->MaybeUpdateInlineCache(
- shadow_frame->GetMethod(),
- dex_pc,
- shadow_frame->GetVRegReference(inst->VRegC())->GetClass(),
- self_);
+ uint32_t encoded_dex_pc = InlineCache::EncodeDexPc(
+ visitor.GetSingleFrameDeoptMethod(),
+ visitor.GetDexPcs(),
+ runtime->GetJit()->GetJitCompiler()->GetInlineMaxCodeUnits());
+ if (encoded_dex_pc != static_cast<uint32_t>(-1)) {
+ // The inline cache comes from the top-level method.
+ runtime->GetJit()->GetCodeCache()->MaybeUpdateInlineCache(
+ visitor.GetSingleFrameDeoptMethod(),
+ encoded_dex_pc,
+ shadow_frame->GetVRegReference(inst->VRegC())->GetClass(),
+ self_);
+ } else {
+ // If the top-level inline cache did not exist, update the one for the
+ // bottom method, we know it's the one that was used for compilation.
+ runtime->GetJit()->GetCodeCache()->MaybeUpdateInlineCache(
+ shadow_frame->GetMethod(),
+ dex_pc,
+ shadow_frame->GetVRegReference(inst->VRegC())->GetClass(),
+ self_);
+ }
break;
}
default: {