/*
 * Copyright (C) 2018 The Android Open Source Project
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
16
17#ifndef ART_COMPILER_OPTIMIZING_LOOP_ANALYSIS_H_
18#define ART_COMPILER_OPTIMIZING_LOOP_ANALYSIS_H_
19
20#include "nodes.h"
21
Vladimir Marko0a516052019-10-14 13:00:44 +000022namespace art {
Artem Serov121f2032017-10-23 19:19:06 +010023
// Forward declarations. This header only names these types (by pointer, by reference or in a
// friend declaration), so their full definitions are not required here.
class CodeGenerator;
class InductionVarRange;
class LoopAnalysis;
27
Artem Serov121f2032017-10-23 19:19:06 +010028// Class to hold cached information on properties of the loop.
29class LoopAnalysisInfo : public ValueObject {
30 public:
Artem Serov0e329082018-06-12 10:23:27 +010031 // No loop unrolling factor (just one copy of the loop-body).
32 static constexpr uint32_t kNoUnrollingFactor = 1;
33 // Used for unknown and non-constant trip counts (see InductionVarRange::HasKnownTripCount).
34 static constexpr int64_t kUnknownTripCount = -1;
35
Artem Serov121f2032017-10-23 19:19:06 +010036 explicit LoopAnalysisInfo(HLoopInformation* loop_info)
Artem Serov0e329082018-06-12 10:23:27 +010037 : trip_count_(kUnknownTripCount),
38 bb_num_(0),
Artem Serov121f2032017-10-23 19:19:06 +010039 instr_num_(0),
40 exits_num_(0),
Artem Serov0e329082018-06-12 10:23:27 +010041 invariant_exits_num_(0),
Artem Serov72411e62017-10-19 16:18:07 +010042 has_instructions_preventing_scalar_peeling_(false),
Artem Serov121f2032017-10-23 19:19:06 +010043 has_instructions_preventing_scalar_unrolling_(false),
Artem Serovcf43fb62018-02-15 14:43:48 +000044 has_long_type_instructions_(false),
Artem Serov121f2032017-10-23 19:19:06 +010045 loop_info_(loop_info) {}
46
Artem Serov0e329082018-06-12 10:23:27 +010047 int64_t GetTripCount() const { return trip_count_; }
Artem Serov121f2032017-10-23 19:19:06 +010048 size_t GetNumberOfBasicBlocks() const { return bb_num_; }
49 size_t GetNumberOfInstructions() const { return instr_num_; }
50 size_t GetNumberOfExits() const { return exits_num_; }
Artem Serov0e329082018-06-12 10:23:27 +010051 size_t GetNumberOfInvariantExits() const { return invariant_exits_num_; }
Artem Serov121f2032017-10-23 19:19:06 +010052
Artem Serov72411e62017-10-19 16:18:07 +010053 bool HasInstructionsPreventingScalarPeeling() const {
54 return has_instructions_preventing_scalar_peeling_;
55 }
56
Artem Serov121f2032017-10-23 19:19:06 +010057 bool HasInstructionsPreventingScalarUnrolling() const {
58 return has_instructions_preventing_scalar_unrolling_;
59 }
60
Artem Serov0e329082018-06-12 10:23:27 +010061 bool HasInstructionsPreventingScalarOpts() const {
62 return HasInstructionsPreventingScalarPeeling() || HasInstructionsPreventingScalarUnrolling();
63 }
64
Artem Serovcf43fb62018-02-15 14:43:48 +000065 bool HasLongTypeInstructions() const {
66 return has_long_type_instructions_;
67 }
68
Artem Serov0e329082018-06-12 10:23:27 +010069 HLoopInformation* GetLoopInfo() const { return loop_info_; }
Artem Serov121f2032017-10-23 19:19:06 +010070
71 private:
Artem Serov0e329082018-06-12 10:23:27 +010072 // Trip count of the loop if known, kUnknownTripCount otherwise.
73 int64_t trip_count_;
Artem Serov121f2032017-10-23 19:19:06 +010074 // Number of basic blocks in the loop body.
75 size_t bb_num_;
76 // Number of instructions in the loop body.
77 size_t instr_num_;
78 // Number of loop's exits.
79 size_t exits_num_;
Artem Serov0e329082018-06-12 10:23:27 +010080 // Number of "if" loop exits (with HIf instruction) whose condition is loop-invariant.
81 size_t invariant_exits_num_;
Artem Serov72411e62017-10-19 16:18:07 +010082 // Whether the loop has instructions which make scalar loop peeling non-beneficial.
83 bool has_instructions_preventing_scalar_peeling_;
Artem Serov121f2032017-10-23 19:19:06 +010084 // Whether the loop has instructions which make scalar loop unrolling non-beneficial.
85 bool has_instructions_preventing_scalar_unrolling_;
Artem Serovcf43fb62018-02-15 14:43:48 +000086 // Whether the loop has instructions of primitive long type; unrolling these loop will
87 // likely introduce spill/fills on 32-bit targets.
88 bool has_long_type_instructions_;
Artem Serov121f2032017-10-23 19:19:06 +010089
90 // Corresponding HLoopInformation.
Artem Serov0e329082018-06-12 10:23:27 +010091 HLoopInformation* loop_info_;
Artem Serov121f2032017-10-23 19:19:06 +010092
93 friend class LoopAnalysis;
94};
95
96// Placeholder class for methods and routines used to analyse loops, calculate loop properties
97// and characteristics.
98class LoopAnalysis : public ValueObject {
99 public:
100 // Calculates loops basic properties like body size, exits number, etc. and fills
101 // 'analysis_results' with this information.
102 static void CalculateLoopBasicProperties(HLoopInformation* loop_info,
Artem Serov0e329082018-06-12 10:23:27 +0100103 LoopAnalysisInfo* analysis_results,
104 int64_t trip_count);
Artem Serov121f2032017-10-23 19:19:06 +0100105
Artem Serov0e329082018-06-12 10:23:27 +0100106 // Returns the trip count of the loop if it is known and kUnknownTripCount otherwise.
107 static int64_t GetLoopTripCount(HLoopInformation* loop_info,
108 const InductionVarRange* induction_range);
Artem Serov72411e62017-10-19 16:18:07 +0100109
Artem Serov121f2032017-10-23 19:19:06 +0100110 private:
Artem Serov72411e62017-10-19 16:18:07 +0100111 // Returns whether an instruction makes scalar loop peeling/unrolling non-beneficial.
Artem Serov121f2032017-10-23 19:19:06 +0100112 //
113 // If in the loop body we have a dex/runtime call then its contribution to the whole
Artem Serov72411e62017-10-19 16:18:07 +0100114 // loop performance will probably prevail. So peeling/unrolling optimization will not bring
115 // any noticeable performance improvement. It will increase the code size.
116 static bool MakesScalarPeelingUnrollingNonBeneficial(HInstruction* instruction) {
Artem Serov121f2032017-10-23 19:19:06 +0100117 return (instruction->IsNewArray() ||
118 instruction->IsNewInstance() ||
119 instruction->IsUnresolvedInstanceFieldGet() ||
120 instruction->IsUnresolvedInstanceFieldSet() ||
121 instruction->IsUnresolvedStaticFieldGet() ||
122 instruction->IsUnresolvedStaticFieldSet() ||
Artem Serov72411e62017-10-19 16:18:07 +0100123 // TODO: Support loops with intrinsified invokes.
Artem Serova6e26142018-06-19 14:55:17 +0100124 instruction->IsInvoke());
Artem Serov121f2032017-10-23 19:19:06 +0100125 }
126};
127
128//
129// Helper class which holds target-dependent methods and constants needed for loop optimizations.
130//
131// To support peeling/unrolling for a new architecture one needs to create new helper class,
132// inherit it from this and add implementation for the following methods.
133//
Artem Serovcf43fb62018-02-15 14:43:48 +0000134class ArchNoOptsLoopHelper : public ArenaObject<kArenaAllocOptimization> {
Artem Serov121f2032017-10-23 19:19:06 +0100135 public:
Artem Serov8ba4de12019-12-04 21:10:23 +0000136 explicit ArchNoOptsLoopHelper(const CodeGenerator& codegen) : codegen_(codegen) {}
Artem Serovcf43fb62018-02-15 14:43:48 +0000137 virtual ~ArchNoOptsLoopHelper() {}
Artem Serov121f2032017-10-23 19:19:06 +0100138
139 // Creates an instance of specialised helper for the target or default helper if the target
140 // doesn't support loop peeling and unrolling.
Artem Serov8ba4de12019-12-04 21:10:23 +0000141 static ArchNoOptsLoopHelper* Create(const CodeGenerator& codegen, ArenaAllocator* allocator);
Artem Serov121f2032017-10-23 19:19:06 +0100142
Artem Serovcf43fb62018-02-15 14:43:48 +0000143 // Returns whether the loop is not beneficial for loop peeling/unrolling.
Artem Serov121f2032017-10-23 19:19:06 +0100144 //
Artem Serovcf43fb62018-02-15 14:43:48 +0000145 // For example, if the loop body has too many instructions then peeling/unrolling optimization
146 // will not bring any noticeable performance improvement however will increase the code size.
Artem Serov121f2032017-10-23 19:19:06 +0100147 //
148 // Returns 'true' by default, should be overridden by particular target loop helper.
Artem Serovcf43fb62018-02-15 14:43:48 +0000149 virtual bool IsLoopNonBeneficialForScalarOpts(
Artem Serov121f2032017-10-23 19:19:06 +0100150 LoopAnalysisInfo* loop_analysis_info ATTRIBUTE_UNUSED) const { return true; }
151
152 // Returns optimal scalar unrolling factor for the loop.
153 //
154 // Returns kNoUnrollingFactor by default, should be overridden by particular target loop helper.
Artem Serov0e329082018-06-12 10:23:27 +0100155 virtual uint32_t GetScalarUnrollingFactor(
156 const LoopAnalysisInfo* analysis_info ATTRIBUTE_UNUSED) const {
157 return LoopAnalysisInfo::kNoUnrollingFactor;
Artem Serov121f2032017-10-23 19:19:06 +0100158 }
159
Artem Serov72411e62017-10-19 16:18:07 +0100160 // Returns whether scalar loop peeling is enabled,
161 //
162 // Returns 'false' by default, should be overridden by particular target loop helper.
163 virtual bool IsLoopPeelingEnabled() const { return false; }
164
Artem Serov18ba1da2018-05-16 19:06:32 +0100165 // Returns whether it is beneficial to fully unroll the loop.
166 //
167 // Returns 'false' by default, should be overridden by particular target loop helper.
168 virtual bool IsFullUnrollingBeneficial(LoopAnalysisInfo* analysis_info ATTRIBUTE_UNUSED) const {
169 return false;
170 }
171
Artem Serov121f2032017-10-23 19:19:06 +0100172 // Returns optimal SIMD unrolling factor for the loop.
173 //
174 // Returns kNoUnrollingFactor by default, should be overridden by particular target loop helper.
175 virtual uint32_t GetSIMDUnrollingFactor(HBasicBlock* block ATTRIBUTE_UNUSED,
176 int64_t trip_count ATTRIBUTE_UNUSED,
177 uint32_t max_peel ATTRIBUTE_UNUSED,
178 uint32_t vector_length ATTRIBUTE_UNUSED) const {
Artem Serov0e329082018-06-12 10:23:27 +0100179 return LoopAnalysisInfo::kNoUnrollingFactor;
Artem Serov121f2032017-10-23 19:19:06 +0100180 }
Artem Serov8ba4de12019-12-04 21:10:23 +0000181
182 protected:
183 const CodeGenerator& codegen_;
Artem Serov121f2032017-10-23 19:19:06 +0100184};
185
186} // namespace art
187
188#endif // ART_COMPILER_OPTIMIZING_LOOP_ANALYSIS_H_