/*
 * Copyright (C) 2014 The Android Open Source Project
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

17#ifndef ART_COMPILER_OPTIMIZING_INLINER_H_
18#define ART_COMPILER_OPTIMIZING_INLINER_H_
19
David Sehr9e734c72018-01-04 17:56:19 -080020#include "dex/dex_file_types.h"
David Sehr8c0961f2018-01-23 16:11:38 -080021#include "dex/invoke_type.h"
Andreas Gampe8cf9cb32017-07-19 09:28:38 -070022#include "optimization.h"
David Sehr82d046e2018-04-23 08:14:19 -070023#include "profile/profile_compilation_info.h"
Nicolas Geoffraye53798a2014-12-01 10:31:54 +000024
Vladimir Marko0a516052019-10-14 13:00:44 +000025namespace art {
Nicolas Geoffraye53798a2014-12-01 10:31:54 +000026
Vladimir Markodc151b22015-10-15 18:02:30 +010027class CodeGenerator;
Nicolas Geoffraye53798a2014-12-01 10:31:54 +000028class DexCompilationUnit;
29class HGraph;
30class HInvoke;
31class OptimizingCompilerStats;
32
33class HInliner : public HOptimization {
34 public:
35 HInliner(HGraph* outer_graph,
Nicolas Geoffray73be1e82015-09-17 15:22:56 +010036 HGraph* outermost_graph,
Vladimir Markodc151b22015-10-15 18:02:30 +010037 CodeGenerator* codegen,
Nicolas Geoffraye53798a2014-12-01 10:31:54 +000038 const DexCompilationUnit& outer_compilation_unit,
Nicolas Geoffray9437b782015-03-25 10:08:51 +000039 const DexCompilationUnit& caller_compilation_unit,
Mathieu Chartiere8a3c572016-10-11 16:52:17 -070040 VariableSizedHandleScope* handles,
Nicolas Geoffrayef87c5d2015-01-30 12:41:14 +000041 OptimizingCompilerStats* stats,
Nicolas Geoffray5949fa02015-12-18 10:57:10 +000042 size_t total_number_of_dex_registers,
Nicolas Geoffrayf6d46682017-02-28 17:41:45 +000043 size_t total_number_of_instructions,
44 HInliner* parent,
Aart Bik2ca10eb2017-11-15 15:17:53 -080045 size_t depth = 0,
46 const char* name = kInlinerPassName)
47 : HOptimization(outer_graph, name, stats),
Nicolas Geoffray73be1e82015-09-17 15:22:56 +010048 outermost_graph_(outermost_graph),
Nicolas Geoffraye53798a2014-12-01 10:31:54 +000049 outer_compilation_unit_(outer_compilation_unit),
Nicolas Geoffray9437b782015-03-25 10:08:51 +000050 caller_compilation_unit_(caller_compilation_unit),
Vladimir Markodc151b22015-10-15 18:02:30 +010051 codegen_(codegen),
Nicolas Geoffray5949fa02015-12-18 10:57:10 +000052 total_number_of_dex_registers_(total_number_of_dex_registers),
Nicolas Geoffrayf6d46682017-02-28 17:41:45 +000053 total_number_of_instructions_(total_number_of_instructions),
54 parent_(parent),
Nicolas Geoffray454a4812015-06-09 10:37:32 +010055 depth_(depth),
Nicolas Geoffrayf6d46682017-02-28 17:41:45 +000056 inlining_budget_(0),
Vladimir Marko438709f2017-02-23 18:56:13 +000057 handles_(handles),
58 inline_stats_(nullptr) {}
Nicolas Geoffraye53798a2014-12-01 10:31:54 +000059
Roland Levillainbbc6e7e2018-08-24 16:58:47 +010060 bool Run() override;
Nicolas Geoffraye53798a2014-12-01 10:31:54 +000061
Andreas Gampe7c3952f2015-02-19 18:21:24 -080062 static constexpr const char* kInlinerPassName = "inliner";
63
Nicolas Geoffraye53798a2014-12-01 10:31:54 +000064 private:
Calin Juravle13439f02017-02-21 01:17:21 -080065 enum InlineCacheType {
66 kInlineCacheNoData = 0,
67 kInlineCacheUninitialized = 1,
68 kInlineCacheMonomorphic = 2,
69 kInlineCachePolymorphic = 3,
70 kInlineCacheMegamorphic = 4,
71 kInlineCacheMissingTypes = 5
72 };
73
Nicolas Geoffraye418dda2015-08-11 20:03:09 -070074 bool TryInline(HInvoke* invoke_instruction);
Nicolas Geoffray73be1e82015-09-17 15:22:56 +010075
Eric Holk1868de92020-02-12 09:10:21 -080076 // Attempt to resolve the target of the invoke instruction to an acutal call
77 // target.
78 //
79 // Returns the target directly in the case of static or direct invokes.
80 // Otherwise, uses CHA devirtualization or other methods to try to find the
81 // call target.
82 ArtMethod* FindActualCallTarget(HInvoke* invoke_instruction, bool* cha_devirtualize)
83 REQUIRES_SHARED(Locks::mutator_lock_);
84
Nicolas Geoffray73be1e82015-09-17 15:22:56 +010085 // Try to inline `resolved_method` in place of `invoke_instruction`. `do_rtp` is whether
Nicolas Geoffray55bd7492016-02-16 15:37:12 +000086 // reference type propagation can run after the inlining. If the inlining is successful, this
Mingyao Yang063fc772016-08-02 11:02:54 -070087 // method will replace and remove the `invoke_instruction`. If `cha_devirtualize` is true,
88 // a CHA guard needs to be added for the inlining.
89 bool TryInlineAndReplace(HInvoke* invoke_instruction,
90 ArtMethod* resolved_method,
Nicolas Geoffray0f001b72017-01-04 16:46:23 +000091 ReferenceTypeInfo receiver_type,
Mingyao Yang063fc772016-08-02 11:02:54 -070092 bool do_rtp,
93 bool cha_devirtualize)
Andreas Gampebdf7f1c2016-08-30 16:38:47 -070094 REQUIRES_SHARED(Locks::mutator_lock_);
Nicolas Geoffray73be1e82015-09-17 15:22:56 +010095
Nicolas Geoffray55bd7492016-02-16 15:37:12 +000096 bool TryBuildAndInline(HInvoke* invoke_instruction,
97 ArtMethod* resolved_method,
Nicolas Geoffray0f001b72017-01-04 16:46:23 +000098 ReferenceTypeInfo receiver_type,
Nicolas Geoffray55bd7492016-02-16 15:37:12 +000099 HInstruction** return_replacement)
Andreas Gampebdf7f1c2016-08-30 16:38:47 -0700100 REQUIRES_SHARED(Locks::mutator_lock_);
Nicolas Geoffray55bd7492016-02-16 15:37:12 +0000101
102 bool TryBuildAndInlineHelper(HInvoke* invoke_instruction,
103 ArtMethod* resolved_method,
Nicolas Geoffray0f001b72017-01-04 16:46:23 +0000104 ReferenceTypeInfo receiver_type,
Eric Holk1868de92020-02-12 09:10:21 -0800105 HInstruction** return_replacement)
106 REQUIRES_SHARED(Locks::mutator_lock_);
107
108 // Substitutes parameters in the callee graph with their values from the caller.
109 void SubstituteArguments(HGraph* callee_graph,
110 HInvoke* invoke_instruction,
111 ReferenceTypeInfo receiver_type,
112 const DexCompilationUnit& dex_compilation_unit)
113 REQUIRES_SHARED(Locks::mutator_lock_);
Nicolas Geoffray55bd7492016-02-16 15:37:12 +0000114
Roland Levillaina3aef2e2016-04-06 17:45:58 +0100115 // Run simple optimizations on `callee_graph`.
Nicolas Geoffrayf6d46682017-02-28 17:41:45 +0000116 void RunOptimizations(HGraph* callee_graph,
Andreas Gampe3f1dcd32018-12-28 09:39:56 -0800117 const dex::CodeItem* code_item,
Nicolas Geoffrayf6d46682017-02-28 17:41:45 +0000118 const DexCompilationUnit& dex_compilation_unit)
119 REQUIRES_SHARED(Locks::mutator_lock_);
Roland Levillaina3aef2e2016-04-06 17:45:58 +0100120
Vladimir Markobe10e8e2016-01-22 12:09:44 +0000121 // Try to recognize known simple patterns and replace invoke call with appropriate instructions.
Nicolas Geoffray55bd7492016-02-16 15:37:12 +0000122 bool TryPatternSubstitution(HInvoke* invoke_instruction,
123 ArtMethod* resolved_method,
124 HInstruction** return_replacement)
Andreas Gampebdf7f1c2016-08-30 16:38:47 -0700125 REQUIRES_SHARED(Locks::mutator_lock_);
Vladimir Markobe10e8e2016-01-22 12:09:44 +0000126
Eric Holk1868de92020-02-12 09:10:21 -0800127 // Returns whether inlining is allowed based on ART semantics.
128 bool IsInliningAllowed(art::ArtMethod* method, const CodeItemDataAccessor& accessor) const
129 REQUIRES_SHARED(Locks::mutator_lock_);
130
131
132 // Returns whether ART supports inlining this method.
133 //
134 // Some methods are not supported because they have features for which inlining
135 // is not implemented. For example, we do not currently support inlining throw
136 // instructions into a try block.
137 bool IsInliningSupported(const HInvoke* invoke_instruction,
138 art::ArtMethod* method,
139 const CodeItemDataAccessor& accessor) const
140 REQUIRES_SHARED(Locks::mutator_lock_);
141
142 // Returns whether the inlining budget allows inlining method.
143 //
144 // For example, this checks whether the function has grown too large and
145 // inlining should be prevented.
146 bool IsInliningBudgetAvailable(art::ArtMethod* method, const CodeItemDataAccessor& accessor) const
147 REQUIRES_SHARED(Locks::mutator_lock_);
148
149 // Inspects the body of a method (callee_graph) and returns whether it can be
150 // inlined.
151 //
152 // This checks for instructions and constructs that we do not support
153 // inlining, such as inlining a throw instruction into a try block.
154 bool CanInlineBody(const HGraph* callee_graph,
155 const HBasicBlock* target_block,
156 size_t* out_number_of_instructions) const
157 REQUIRES_SHARED(Locks::mutator_lock_);
158
Vladimir Markobe10e8e2016-01-22 12:09:44 +0000159 // Create a new HInstanceFieldGet.
Vladimir Markof44d36c2017-03-14 14:18:46 +0000160 HInstanceFieldGet* CreateInstanceFieldGet(uint32_t field_index,
161 ArtMethod* referrer,
Vladimir Markobe10e8e2016-01-22 12:09:44 +0000162 HInstruction* obj);
163 // Create a new HInstanceFieldSet.
Vladimir Markof44d36c2017-03-14 14:18:46 +0000164 HInstanceFieldSet* CreateInstanceFieldSet(uint32_t field_index,
165 ArtMethod* referrer,
Vladimir Markobe10e8e2016-01-22 12:09:44 +0000166 HInstruction* obj,
Vladimir Markof44d36c2017-03-14 14:18:46 +0000167 HInstruction* value,
168 bool* is_final = nullptr);
Vladimir Markobe10e8e2016-01-22 12:09:44 +0000169
Calin Juravle13439f02017-02-21 01:17:21 -0800170 // Try inlining the invoke instruction using inline caches.
171 bool TryInlineFromInlineCache(
172 const DexFile& caller_dex_file,
173 HInvoke* invoke_instruction,
174 ArtMethod* resolved_method)
175 REQUIRES_SHARED(Locks::mutator_lock_);
176
177 // Try getting the inline cache from JIT code cache.
178 // Return true if the inline cache was successfully allocated and the
179 // invoke info was found in the profile info.
180 InlineCacheType GetInlineCacheJIT(
181 HInvoke* invoke_instruction,
182 StackHandleScope<1>* hs,
183 /*out*/Handle<mirror::ObjectArray<mirror::Class>>* inline_cache)
184 REQUIRES_SHARED(Locks::mutator_lock_);
185
186 // Try getting the inline cache from AOT offline profile.
187 // Return true if the inline cache was successfully allocated and the
188 // invoke info was found in the profile info.
189 InlineCacheType GetInlineCacheAOT(const DexFile& caller_dex_file,
190 HInvoke* invoke_instruction,
191 StackHandleScope<1>* hs,
192 /*out*/Handle<mirror::ObjectArray<mirror::Class>>* inline_cache)
193 REQUIRES_SHARED(Locks::mutator_lock_);
194
195 // Extract the mirror classes from the offline profile and add them to the `inline_cache`.
196 // Note that even if we have profile data for the invoke the inline_cache might contain
197 // only null entries if the types cannot be resolved.
198 InlineCacheType ExtractClassesFromOfflineProfile(
199 const HInvoke* invoke_instruction,
200 const ProfileCompilationInfo::OfflineProfileMethodInfo& offline_profile,
201 /*out*/Handle<mirror::ObjectArray<mirror::Class>> inline_cache)
202 REQUIRES_SHARED(Locks::mutator_lock_);
203
204 // Compute the inline cache type.
205 InlineCacheType GetInlineCacheType(
206 const Handle<mirror::ObjectArray<mirror::Class>>& classes)
207 REQUIRES_SHARED(Locks::mutator_lock_);
208
Nicolas Geoffray73be1e82015-09-17 15:22:56 +0100209 // Try to inline the target of a monomorphic call. If successful, the code
210 // in the graph will look like:
211 // if (receiver.getClass() != ic.GetMonomorphicType()) deopt
212 // ... // inlined code
213 bool TryInlineMonomorphicCall(HInvoke* invoke_instruction,
214 ArtMethod* resolved_method,
Nicolas Geoffraye51ca8b2016-11-22 14:49:31 +0000215 Handle<mirror::ObjectArray<mirror::Class>> classes)
Andreas Gampebdf7f1c2016-08-30 16:38:47 -0700216 REQUIRES_SHARED(Locks::mutator_lock_);
Nicolas Geoffray73be1e82015-09-17 15:22:56 +0100217
Nicolas Geoffray916cc1d2016-02-18 11:12:31 +0000218 // Try to inline targets of a polymorphic call.
Nicolas Geoffray73be1e82015-09-17 15:22:56 +0100219 bool TryInlinePolymorphicCall(HInvoke* invoke_instruction,
220 ArtMethod* resolved_method,
Nicolas Geoffraye51ca8b2016-11-22 14:49:31 +0000221 Handle<mirror::ObjectArray<mirror::Class>> classes)
Andreas Gampebdf7f1c2016-08-30 16:38:47 -0700222 REQUIRES_SHARED(Locks::mutator_lock_);
Nicolas Geoffray73be1e82015-09-17 15:22:56 +0100223
Nicolas Geoffray916cc1d2016-02-18 11:12:31 +0000224 bool TryInlinePolymorphicCallToSameTarget(HInvoke* invoke_instruction,
225 ArtMethod* resolved_method,
Nicolas Geoffraye51ca8b2016-11-22 14:49:31 +0000226 Handle<mirror::ObjectArray<mirror::Class>> classes)
Andreas Gampebdf7f1c2016-08-30 16:38:47 -0700227 REQUIRES_SHARED(Locks::mutator_lock_);
Nicolas Geoffray916cc1d2016-02-18 11:12:31 +0000228
Calin Juravleaf44e6c2017-05-23 14:24:55 -0700229 // Returns whether or not we should use only polymorphic inlining with no deoptimizations.
230 bool UseOnlyPolymorphicInliningWithNoDeopt();
231
Mingyao Yang063fc772016-08-02 11:02:54 -0700232 // Try CHA-based devirtualization to change virtual method calls into
233 // direct calls.
234 // Returns the actual method that resolved_method can be devirtualized to.
235 ArtMethod* TryCHADevirtualization(ArtMethod* resolved_method)
236 REQUIRES_SHARED(Locks::mutator_lock_);
237
238 // Add a CHA guard for a CHA-based devirtualized call. A CHA guard checks a
239 // should_deoptimize flag and if it's true, does deoptimization.
240 void AddCHAGuard(HInstruction* invoke_instruction,
241 uint32_t dex_pc,
242 HInstruction* cursor,
243 HBasicBlock* bb_cursor);
Nicolas Geoffray916cc1d2016-02-18 11:12:31 +0000244
Nicolas Geoffraya42363f2015-12-17 14:57:09 +0000245 HInstanceFieldGet* BuildGetReceiverClass(ClassLinker* class_linker,
246 HInstruction* receiver,
247 uint32_t dex_pc) const
Andreas Gampebdf7f1c2016-08-30 16:38:47 -0700248 REQUIRES_SHARED(Locks::mutator_lock_);
Nicolas Geoffraya42363f2015-12-17 14:57:09 +0000249
David Brazdil94ab38f2016-06-21 17:48:19 +0100250 void FixUpReturnReferenceType(ArtMethod* resolved_method, HInstruction* return_replacement)
Andreas Gampebdf7f1c2016-08-30 16:38:47 -0700251 REQUIRES_SHARED(Locks::mutator_lock_);
David Brazdil94ab38f2016-06-21 17:48:19 +0100252
253 // Creates an instance of ReferenceTypeInfo from `klass` if `klass` is
254 // admissible (see ReferenceTypePropagation::IsAdmissible for details).
255 // Otherwise returns inexact Object RTI.
Vladimir Markob45528c2017-07-27 14:14:28 +0100256 ReferenceTypeInfo GetClassRTI(ObjPtr<mirror::Class> klass) REQUIRES_SHARED(Locks::mutator_lock_);
David Brazdil94ab38f2016-06-21 17:48:19 +0100257
258 bool ArgumentTypesMoreSpecific(HInvoke* invoke_instruction, ArtMethod* resolved_method)
Andreas Gampebdf7f1c2016-08-30 16:38:47 -0700259 REQUIRES_SHARED(Locks::mutator_lock_);
David Brazdil94ab38f2016-06-21 17:48:19 +0100260
261 bool ReturnTypeMoreSpecific(HInvoke* invoke_instruction, HInstruction* return_replacement)
Andreas Gampebdf7f1c2016-08-30 16:38:47 -0700262 REQUIRES_SHARED(Locks::mutator_lock_);
Vladimir Markobe10e8e2016-01-22 12:09:44 +0000263
Nicolas Geoffray916cc1d2016-02-18 11:12:31 +0000264 // Add a type guard on the given `receiver`. This will add to the graph:
265 // i0 = HFieldGet(receiver, klass)
266 // i1 = HLoadClass(class_index, is_referrer)
267 // i2 = HNotEqual(i0, i1)
268 //
269 // And if `with_deoptimization` is true:
270 // HDeoptimize(i2)
271 //
272 // The method returns the `HNotEqual`, that will be used for polymorphic inlining.
273 HInstruction* AddTypeGuard(HInstruction* receiver,
274 HInstruction* cursor,
275 HBasicBlock* bb_cursor,
Andreas Gampea5b09a62016-11-17 15:21:22 -0800276 dex::TypeIndex class_index,
Nicolas Geoffray5247c082017-01-13 14:17:29 +0000277 Handle<mirror::Class> klass,
Nicolas Geoffray916cc1d2016-02-18 11:12:31 +0000278 HInstruction* invoke_instruction,
279 bool with_deoptimization)
Andreas Gampebdf7f1c2016-08-30 16:38:47 -0700280 REQUIRES_SHARED(Locks::mutator_lock_);
Nicolas Geoffray916cc1d2016-02-18 11:12:31 +0000281
282 /*
283 * Ad-hoc implementation for implementing a diamond pattern in the graph for
284 * polymorphic inlining:
285 * 1) `compare` becomes the input of the new `HIf`.
286 * 2) Everything up until `invoke_instruction` is in the then branch (could
287 * contain multiple blocks).
288 * 3) `invoke_instruction` is moved to the otherwise block.
289 * 4) If `return_replacement` is not null, the merge block will have
290 * a phi whose inputs are `return_replacement` and `invoke_instruction`.
291 *
292 * Before:
293 * Block1
294 * compare
295 * ...
296 * invoke_instruction
297 *
298 * After:
299 * Block1
300 * compare
301 * if
302 * / \
303 * / \
304 * Then block Otherwise block
305 * ... invoke_instruction
306 * \ /
307 * \ /
308 * Merge block
309 * phi(return_replacement, invoke_instruction)
310 */
311 void CreateDiamondPatternForPolymorphicInline(HInstruction* compare,
312 HInstruction* return_replacement,
313 HInstruction* invoke_instruction);
314
Nicolas Geoffrayf6d46682017-02-28 17:41:45 +0000315 // Update the inlining budget based on `total_number_of_instructions_`.
316 void UpdateInliningBudget();
317
318 // Count the number of calls of `method` being inlined recursively.
319 size_t CountRecursiveCallsOf(ArtMethod* method) const;
320
321 // Pretty-print for spaces during logging.
322 std::string DepthString(int line) const;
323
Nicolas Geoffray73be1e82015-09-17 15:22:56 +0100324 HGraph* const outermost_graph_;
Nicolas Geoffraye53798a2014-12-01 10:31:54 +0000325 const DexCompilationUnit& outer_compilation_unit_;
Nicolas Geoffray9437b782015-03-25 10:08:51 +0000326 const DexCompilationUnit& caller_compilation_unit_;
Vladimir Markodc151b22015-10-15 18:02:30 +0100327 CodeGenerator* const codegen_;
Nicolas Geoffray5949fa02015-12-18 10:57:10 +0000328 const size_t total_number_of_dex_registers_;
Nicolas Geoffrayf6d46682017-02-28 17:41:45 +0000329 size_t total_number_of_instructions_;
330
331 // The 'parent' inliner, that means the inlinigng optimization that requested
332 // `graph_` to be inlined.
333 const HInliner* const parent_;
Nicolas Geoffrayef87c5d2015-01-30 12:41:14 +0000334 const size_t depth_;
Nicolas Geoffrayf6d46682017-02-28 17:41:45 +0000335
336 // The budget left for inlining, in number of instructions.
337 size_t inlining_budget_;
Mathieu Chartiere8a3c572016-10-11 16:52:17 -0700338 VariableSizedHandleScope* const handles_;
Nicolas Geoffraye53798a2014-12-01 10:31:54 +0000339
Vladimir Marko438709f2017-02-23 18:56:13 +0000340 // Used to record stats about optimizations on the inlined graph.
341 // If the inlining is successful, these stats are merged to the caller graph's stats.
342 OptimizingCompilerStats* inline_stats_;
343
Nicolas Geoffraye53798a2014-12-01 10:31:54 +0000344 DISALLOW_COPY_AND_ASSIGN(HInliner);
345};
346
347} // namespace art
348
349#endif // ART_COMPILER_OPTIMIZING_INLINER_H_