| /* |
| * Copyright (C) 2014 The Android Open Source Project |
| * |
| * Licensed under the Apache License, Version 2.0 (the "License"); |
| * you may not use this file except in compliance with the License. |
| * You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| |
| #ifndef ART_COMPILER_OPTIMIZING_INLINER_H_ |
| #define ART_COMPILER_OPTIMIZING_INLINER_H_ |
| |
| #include "dex_file_types.h" |
| #include "invoke_type.h" |
| #include "optimization.h" |
| #include "jit/profile_compilation_info.h" |
| |
| namespace art { |
| |
| class CodeGenerator; |
| class CompilerDriver; |
| class DexCompilationUnit; |
| class HGraph; |
| class HInvoke; |
| class OptimizingCompilerStats; |
| |
| class HInliner : public HOptimization { |
| public: |
| HInliner(HGraph* outer_graph, |
| HGraph* outermost_graph, |
| CodeGenerator* codegen, |
| const DexCompilationUnit& outer_compilation_unit, |
| const DexCompilationUnit& caller_compilation_unit, |
| CompilerDriver* compiler_driver, |
| VariableSizedHandleScope* handles, |
| OptimizingCompilerStats* stats, |
| size_t total_number_of_dex_registers, |
| size_t depth) |
| : HOptimization(outer_graph, kInlinerPassName, stats), |
| outermost_graph_(outermost_graph), |
| outer_compilation_unit_(outer_compilation_unit), |
| caller_compilation_unit_(caller_compilation_unit), |
| codegen_(codegen), |
| compiler_driver_(compiler_driver), |
| total_number_of_dex_registers_(total_number_of_dex_registers), |
| depth_(depth), |
| number_of_inlined_instructions_(0), |
| handles_(handles), |
| inline_stats_(nullptr) {} |
| |
| void Run() OVERRIDE; |
| |
| static constexpr const char* kInlinerPassName = "inliner"; |
| |
| private: |
| enum InlineCacheType { |
| kInlineCacheNoData = 0, |
| kInlineCacheUninitialized = 1, |
| kInlineCacheMonomorphic = 2, |
| kInlineCachePolymorphic = 3, |
| kInlineCacheMegamorphic = 4, |
| kInlineCacheMissingTypes = 5 |
| }; |
| |
| bool TryInline(HInvoke* invoke_instruction); |
| |
| // Try to inline `resolved_method` in place of `invoke_instruction`. `do_rtp` is whether |
| // reference type propagation can run after the inlining. If the inlining is successful, this |
| // method will replace and remove the `invoke_instruction`. If `cha_devirtualize` is true, |
| // a CHA guard needs to be added for the inlining. |
| bool TryInlineAndReplace(HInvoke* invoke_instruction, |
| ArtMethod* resolved_method, |
| ReferenceTypeInfo receiver_type, |
| bool do_rtp, |
| bool cha_devirtualize) |
| REQUIRES_SHARED(Locks::mutator_lock_); |
| |
| bool TryBuildAndInline(HInvoke* invoke_instruction, |
| ArtMethod* resolved_method, |
| ReferenceTypeInfo receiver_type, |
| HInstruction** return_replacement) |
| REQUIRES_SHARED(Locks::mutator_lock_); |
| |
| bool TryBuildAndInlineHelper(HInvoke* invoke_instruction, |
| ArtMethod* resolved_method, |
| ReferenceTypeInfo receiver_type, |
| bool same_dex_file, |
| HInstruction** return_replacement); |
| |
| // Run simple optimizations on `callee_graph`. |
| // Returns the number of inlined instructions. |
| size_t RunOptimizations(HGraph* callee_graph, |
| const DexFile::CodeItem* code_item, |
| const DexCompilationUnit& dex_compilation_unit); |
| |
| // Try to recognize known simple patterns and replace invoke call with appropriate instructions. |
| bool TryPatternSubstitution(HInvoke* invoke_instruction, |
| ArtMethod* resolved_method, |
| HInstruction** return_replacement) |
| REQUIRES_SHARED(Locks::mutator_lock_); |
| |
| // Create a new HInstanceFieldGet. |
| HInstanceFieldGet* CreateInstanceFieldGet(uint32_t field_index, |
| ArtMethod* referrer, |
| HInstruction* obj); |
| // Create a new HInstanceFieldSet. |
| HInstanceFieldSet* CreateInstanceFieldSet(uint32_t field_index, |
| ArtMethod* referrer, |
| HInstruction* obj, |
| HInstruction* value, |
| bool* is_final = nullptr); |
| |
| // Try inlining the invoke instruction using inline caches. |
| bool TryInlineFromInlineCache( |
| const DexFile& caller_dex_file, |
| HInvoke* invoke_instruction, |
| ArtMethod* resolved_method) |
| REQUIRES_SHARED(Locks::mutator_lock_); |
| |
| // Try getting the inline cache from JIT code cache. |
| // Return true if the inline cache was successfully allocated and the |
| // invoke info was found in the profile info. |
| InlineCacheType GetInlineCacheJIT( |
| HInvoke* invoke_instruction, |
| StackHandleScope<1>* hs, |
| /*out*/Handle<mirror::ObjectArray<mirror::Class>>* inline_cache) |
| REQUIRES_SHARED(Locks::mutator_lock_); |
| |
| // Try getting the inline cache from AOT offline profile. |
| // Return true if the inline cache was successfully allocated and the |
| // invoke info was found in the profile info. |
| InlineCacheType GetInlineCacheAOT(const DexFile& caller_dex_file, |
| HInvoke* invoke_instruction, |
| StackHandleScope<1>* hs, |
| /*out*/Handle<mirror::ObjectArray<mirror::Class>>* inline_cache) |
| REQUIRES_SHARED(Locks::mutator_lock_); |
| |
| // Extract the mirror classes from the offline profile and add them to the `inline_cache`. |
| // Note that even if we have profile data for the invoke the inline_cache might contain |
| // only null entries if the types cannot be resolved. |
| InlineCacheType ExtractClassesFromOfflineProfile( |
| const HInvoke* invoke_instruction, |
| const ProfileCompilationInfo::OfflineProfileMethodInfo& offline_profile, |
| /*out*/Handle<mirror::ObjectArray<mirror::Class>> inline_cache) |
| REQUIRES_SHARED(Locks::mutator_lock_); |
| |
| // Compute the inline cache type. |
| InlineCacheType GetInlineCacheType( |
| const Handle<mirror::ObjectArray<mirror::Class>>& classes) |
| REQUIRES_SHARED(Locks::mutator_lock_); |
| |
| // Try to inline the target of a monomorphic call. If successful, the code |
| // in the graph will look like: |
| // if (receiver.getClass() != ic.GetMonomorphicType()) deopt |
| // ... // inlined code |
| bool TryInlineMonomorphicCall(HInvoke* invoke_instruction, |
| ArtMethod* resolved_method, |
| Handle<mirror::ObjectArray<mirror::Class>> classes) |
| REQUIRES_SHARED(Locks::mutator_lock_); |
| |
| // Try to inline targets of a polymorphic call. |
| bool TryInlinePolymorphicCall(HInvoke* invoke_instruction, |
| ArtMethod* resolved_method, |
| Handle<mirror::ObjectArray<mirror::Class>> classes) |
| REQUIRES_SHARED(Locks::mutator_lock_); |
| |
| bool TryInlinePolymorphicCallToSameTarget(HInvoke* invoke_instruction, |
| ArtMethod* resolved_method, |
| Handle<mirror::ObjectArray<mirror::Class>> classes) |
| REQUIRES_SHARED(Locks::mutator_lock_); |
| |
| // Try CHA-based devirtualization to change virtual method calls into |
| // direct calls. |
| // Returns the actual method that resolved_method can be devirtualized to. |
| ArtMethod* TryCHADevirtualization(ArtMethod* resolved_method) |
| REQUIRES_SHARED(Locks::mutator_lock_); |
| |
| // Add a CHA guard for a CHA-based devirtualized call. A CHA guard checks a |
| // should_deoptimize flag and if it's true, does deoptimization. |
| void AddCHAGuard(HInstruction* invoke_instruction, |
| uint32_t dex_pc, |
| HInstruction* cursor, |
| HBasicBlock* bb_cursor); |
| |
| HInstanceFieldGet* BuildGetReceiverClass(ClassLinker* class_linker, |
| HInstruction* receiver, |
| uint32_t dex_pc) const |
| REQUIRES_SHARED(Locks::mutator_lock_); |
| |
| void FixUpReturnReferenceType(ArtMethod* resolved_method, HInstruction* return_replacement) |
| REQUIRES_SHARED(Locks::mutator_lock_); |
| |
| // Creates an instance of ReferenceTypeInfo from `klass` if `klass` is |
| // admissible (see ReferenceTypePropagation::IsAdmissible for details). |
| // Otherwise returns inexact Object RTI. |
| ReferenceTypeInfo GetClassRTI(mirror::Class* klass) REQUIRES_SHARED(Locks::mutator_lock_); |
| |
| bool ArgumentTypesMoreSpecific(HInvoke* invoke_instruction, ArtMethod* resolved_method) |
| REQUIRES_SHARED(Locks::mutator_lock_); |
| |
| bool ReturnTypeMoreSpecific(HInvoke* invoke_instruction, HInstruction* return_replacement) |
| REQUIRES_SHARED(Locks::mutator_lock_); |
| |
| // Add a type guard on the given `receiver`. This will add to the graph: |
| // i0 = HFieldGet(receiver, klass) |
| // i1 = HLoadClass(class_index, is_referrer) |
| // i2 = HNotEqual(i0, i1) |
| // |
| // And if `with_deoptimization` is true: |
| // HDeoptimize(i2) |
| // |
| // The method returns the `HNotEqual`, that will be used for polymorphic inlining. |
| HInstruction* AddTypeGuard(HInstruction* receiver, |
| HInstruction* cursor, |
| HBasicBlock* bb_cursor, |
| dex::TypeIndex class_index, |
| Handle<mirror::Class> klass, |
| HInstruction* invoke_instruction, |
| bool with_deoptimization) |
| REQUIRES_SHARED(Locks::mutator_lock_); |
| |
| /* |
| * Ad-hoc implementation for implementing a diamond pattern in the graph for |
| * polymorphic inlining: |
| * 1) `compare` becomes the input of the new `HIf`. |
| * 2) Everything up until `invoke_instruction` is in the then branch (could |
| * contain multiple blocks). |
| * 3) `invoke_instruction` is moved to the otherwise block. |
| * 4) If `return_replacement` is not null, the merge block will have |
| * a phi whose inputs are `return_replacement` and `invoke_instruction`. |
| * |
| * Before: |
| * Block1 |
| * compare |
| * ... |
| * invoke_instruction |
| * |
| * After: |
| * Block1 |
| * compare |
| * if |
| * / \ |
| * / \ |
| * Then block Otherwise block |
| * ... invoke_instruction |
| * \ / |
| * \ / |
| * Merge block |
| * phi(return_replacement, invoke_instruction) |
| */ |
| void CreateDiamondPatternForPolymorphicInline(HInstruction* compare, |
| HInstruction* return_replacement, |
| HInstruction* invoke_instruction); |
| |
| HGraph* const outermost_graph_; |
| const DexCompilationUnit& outer_compilation_unit_; |
| const DexCompilationUnit& caller_compilation_unit_; |
| CodeGenerator* const codegen_; |
| CompilerDriver* const compiler_driver_; |
| const size_t total_number_of_dex_registers_; |
| const size_t depth_; |
| size_t number_of_inlined_instructions_; |
| VariableSizedHandleScope* const handles_; |
| |
| // Used to record stats about optimizations on the inlined graph. |
| // If the inlining is successful, these stats are merged to the caller graph's stats. |
| OptimizingCompilerStats* inline_stats_; |
| |
| DISALLOW_COPY_AND_ASSIGN(HInliner); |
| }; |
| |
| } // namespace art |
| |
| #endif // ART_COMPILER_OPTIMIZING_INLINER_H_ |