Nicolas Geoffray | d4dd255 | 2014-02-28 10:23:58 +0000 | [diff] [blame] | 1 | /* |
| 2 | * Copyright (C) 2014 The Android Open Source Project |
| 3 | * |
| 4 | * Licensed under the Apache License, Version 2.0 (the "License"); |
| 5 | * you may not use this file except in compliance with the License. |
| 6 | * You may obtain a copy of the License at |
| 7 | * |
| 8 | * http://www.apache.org/licenses/LICENSE-2.0 |
| 9 | * |
| 10 | * Unless required by applicable law or agreed to in writing, software |
| 11 | * distributed under the License is distributed on an "AS IS" BASIS, |
| 12 | * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| 13 | * See the License for the specific language governing permissions and |
| 14 | * limitations under the License. |
| 15 | */ |
| 16 | |
| 17 | #ifndef ART_COMPILER_OPTIMIZING_CODE_GENERATOR_H_ |
| 18 | #define ART_COMPILER_OPTIMIZING_CODE_GENERATOR_H_ |
| 19 | |
Ian Rogers | d582fa4 | 2014-11-05 23:46:43 -0800 | [diff] [blame] | 20 | #include "arch/instruction_set.h" |
Calin Juravle | 3416601 | 2014-12-19 17:22:29 +0000 | [diff] [blame] | 21 | #include "arch/instruction_set_features.h" |
Vladimir Marko | f9f6441 | 2015-09-02 14:05:49 +0100 | [diff] [blame] | 22 | #include "base/arena_containers.h" |
| 23 | #include "base/arena_object.h" |
Nicolas Geoffray | 01bc96d | 2014-04-11 17:43:50 +0100 | [diff] [blame] | 24 | #include "base/bit_field.h" |
Nicolas Geoffray | d28b969 | 2015-11-04 14:36:55 +0000 | [diff] [blame] | 25 | #include "compiled_method.h" |
Calin Juravle | cd6dffe | 2015-01-08 17:35:35 +0000 | [diff] [blame] | 26 | #include "driver/compiler_options.h" |
Nicolas Geoffray | bab4ed7 | 2014-03-11 17:53:17 +0000 | [diff] [blame] | 27 | #include "globals.h" |
Alexandre Rames | eb7b739 | 2015-06-19 14:47:01 +0100 | [diff] [blame] | 28 | #include "graph_visualizer.h" |
Nicolas Geoffray | 4e3d23a | 2014-05-22 18:32:45 +0100 | [diff] [blame] | 29 | #include "locations.h" |
Nicolas Geoffray | d4dd255 | 2014-02-28 10:23:58 +0000 | [diff] [blame] | 30 | #include "memory_region.h" |
| 31 | #include "nodes.h" |
Serban Constantinescu | ecc4366 | 2015-08-13 13:33:12 +0100 | [diff] [blame] | 32 | #include "optimizing_compiler_stats.h" |
Nicolas Geoffray | 3946844 | 2014-09-02 15:17:15 +0100 | [diff] [blame] | 33 | #include "stack_map_stream.h" |
Andreas Gampe | 85b62f2 | 2015-09-09 13:15:38 -0700 | [diff] [blame] | 34 | #include "utils/label.h" |
Nicolas Geoffray | d4dd255 | 2014-02-28 10:23:58 +0000 | [diff] [blame] | 35 | |
| 36 | namespace art { |
| 37 | |
// Binary encoding of 2^32 for type double
// (sign 0, biased exponent 0x41F = 1023 + 32, zero mantissa).
static constexpr int64_t k2Pow32EncodingForDouble = INT64_C(0x41F0000000000000);
// Binary encoding of 2^31 for type double
// (sign 0, biased exponent 0x41E = 1023 + 31, zero mantissa).
static constexpr int64_t k2Pow31EncodingForDouble = INT64_C(0x41E0000000000000);

// Minimum value for a primitive integer.
// Spelled with the <stdint.h> limit macro rather than the literal 0x80000000:
// that literal has an unsigned type, so it only reached the intended value
// through an out-of-range unsigned-to-signed conversion.
static constexpr int32_t kPrimIntMin = INT32_MIN;
// Minimum value for a primitive long (same reasoning as for kPrimIntMin).
static constexpr int64_t kPrimLongMin = INT64_MIN;

// Maximum value for a primitive integer.
static constexpr int32_t kPrimIntMax = INT32_MAX;
// Maximum value for a primitive long.
static constexpr int64_t kPrimLongMax = INT64_MAX;
Roland Levillain | 3f8f936 | 2014-12-02 17:45:01 +0000 | [diff] [blame] | 52 | |
// Forward declarations of types that this header only names (e.g. as pointer,
// reference or template arguments) in the declarations below.
class Assembler;
class CodeGenerator;
class CompilerDriver;
class LinkerPatch;
class ParallelMoveResolver;
Nicolas Geoffray | 92cf83e | 2014-03-18 17:59:20 +0000 | [diff] [blame] | 58 | |
Nicolas Geoffray | d4dd255 | 2014-02-28 10:23:58 +0000 | [diff] [blame] | 59 | class CodeAllocator { |
| 60 | public: |
Nicolas Geoffray | e503832 | 2014-07-04 09:41:32 +0100 | [diff] [blame] | 61 | CodeAllocator() {} |
| 62 | virtual ~CodeAllocator() {} |
Nicolas Geoffray | d4dd255 | 2014-02-28 10:23:58 +0000 | [diff] [blame] | 63 | |
| 64 | virtual uint8_t* Allocate(size_t size) = 0; |
| 65 | |
| 66 | private: |
| 67 | DISALLOW_COPY_AND_ASSIGN(CodeAllocator); |
| 68 | }; |
| 69 | |
Ian Rogers | 6a3c1fc | 2014-10-31 00:33:20 -0700 | [diff] [blame] | 70 | class SlowPathCode : public ArenaObject<kArenaAllocSlowPaths> { |
Nicolas Geoffray | e503832 | 2014-07-04 09:41:32 +0100 | [diff] [blame] | 71 | public: |
David Srbecky | 9cd6d37 | 2016-02-09 15:24:47 +0000 | [diff] [blame^] | 72 | explicit SlowPathCode(HInstruction* instruction) : instruction_(instruction) { |
Nicolas Geoffray | eeefa12 | 2015-03-13 18:52:59 +0000 | [diff] [blame] | 73 | for (size_t i = 0; i < kMaximumNumberOfExpectedRegisters; ++i) { |
| 74 | saved_core_stack_offsets_[i] = kRegisterNotSaved; |
| 75 | saved_fpu_stack_offsets_[i] = kRegisterNotSaved; |
| 76 | } |
| 77 | } |
| 78 | |
Nicolas Geoffray | e503832 | 2014-07-04 09:41:32 +0100 | [diff] [blame] | 79 | virtual ~SlowPathCode() {} |
| 80 | |
Nicolas Geoffray | e503832 | 2014-07-04 09:41:32 +0100 | [diff] [blame] | 81 | virtual void EmitNativeCode(CodeGenerator* codegen) = 0; |
| 82 | |
Zheng Xu | da40309 | 2015-04-24 17:35:39 +0800 | [diff] [blame] | 83 | virtual void SaveLiveRegisters(CodeGenerator* codegen, LocationSummary* locations); |
| 84 | virtual void RestoreLiveRegisters(CodeGenerator* codegen, LocationSummary* locations); |
Nicolas Geoffray | a8ac913 | 2015-03-13 16:36:36 +0000 | [diff] [blame] | 85 | |
Nicolas Geoffray | eeefa12 | 2015-03-13 18:52:59 +0000 | [diff] [blame] | 86 | bool IsCoreRegisterSaved(int reg) const { |
| 87 | return saved_core_stack_offsets_[reg] != kRegisterNotSaved; |
| 88 | } |
| 89 | |
| 90 | bool IsFpuRegisterSaved(int reg) const { |
| 91 | return saved_fpu_stack_offsets_[reg] != kRegisterNotSaved; |
| 92 | } |
| 93 | |
| 94 | uint32_t GetStackOffsetOfCoreRegister(int reg) const { |
| 95 | return saved_core_stack_offsets_[reg]; |
| 96 | } |
| 97 | |
| 98 | uint32_t GetStackOffsetOfFpuRegister(int reg) const { |
| 99 | return saved_fpu_stack_offsets_[reg]; |
| 100 | } |
| 101 | |
Alexandre Rames | 8158f28 | 2015-08-07 10:26:17 +0100 | [diff] [blame] | 102 | virtual bool IsFatal() const { return false; } |
| 103 | |
Alexandre Rames | 9931f31 | 2015-06-19 14:47:01 +0100 | [diff] [blame] | 104 | virtual const char* GetDescription() const = 0; |
| 105 | |
Andreas Gampe | 85b62f2 | 2015-09-09 13:15:38 -0700 | [diff] [blame] | 106 | Label* GetEntryLabel() { return &entry_label_; } |
| 107 | Label* GetExitLabel() { return &exit_label_; } |
| 108 | |
David Srbecky | 9cd6d37 | 2016-02-09 15:24:47 +0000 | [diff] [blame^] | 109 | uint32_t GetDexPc() const { |
| 110 | return instruction_ != nullptr ? instruction_->GetDexPc() : kNoDexPc; |
| 111 | } |
| 112 | |
Zheng Xu | da40309 | 2015-04-24 17:35:39 +0800 | [diff] [blame] | 113 | protected: |
Nicolas Geoffray | eeefa12 | 2015-03-13 18:52:59 +0000 | [diff] [blame] | 114 | static constexpr size_t kMaximumNumberOfExpectedRegisters = 32; |
| 115 | static constexpr uint32_t kRegisterNotSaved = -1; |
David Srbecky | 9cd6d37 | 2016-02-09 15:24:47 +0000 | [diff] [blame^] | 116 | // The instruction where this slow path is happening. |
| 117 | HInstruction* instruction_; |
Nicolas Geoffray | eeefa12 | 2015-03-13 18:52:59 +0000 | [diff] [blame] | 118 | uint32_t saved_core_stack_offsets_[kMaximumNumberOfExpectedRegisters]; |
| 119 | uint32_t saved_fpu_stack_offsets_[kMaximumNumberOfExpectedRegisters]; |
Zheng Xu | da40309 | 2015-04-24 17:35:39 +0800 | [diff] [blame] | 120 | |
| 121 | private: |
Andreas Gampe | 85b62f2 | 2015-09-09 13:15:38 -0700 | [diff] [blame] | 122 | Label entry_label_; |
| 123 | Label exit_label_; |
| 124 | |
Nicolas Geoffray | e503832 | 2014-07-04 09:41:32 +0100 | [diff] [blame] | 125 | DISALLOW_COPY_AND_ASSIGN(SlowPathCode); |
| 126 | }; |
| 127 | |
Roland Levillain | 2d27c8e | 2015-04-28 15:48:45 +0100 | [diff] [blame] | 128 | class InvokeDexCallingConventionVisitor { |
| 129 | public: |
| 130 | virtual Location GetNextLocation(Primitive::Type type) = 0; |
Nicolas Geoffray | fd88f16 | 2015-06-03 11:23:52 +0100 | [diff] [blame] | 131 | virtual Location GetReturnLocation(Primitive::Type type) const = 0; |
| 132 | virtual Location GetMethodLocation() const = 0; |
Roland Levillain | 2d27c8e | 2015-04-28 15:48:45 +0100 | [diff] [blame] | 133 | |
| 134 | protected: |
| 135 | InvokeDexCallingConventionVisitor() {} |
| 136 | virtual ~InvokeDexCallingConventionVisitor() {} |
| 137 | |
| 138 | // The current index for core registers. |
| 139 | uint32_t gp_index_ = 0u; |
| 140 | // The current index for floating-point registers. |
| 141 | uint32_t float_index_ = 0u; |
| 142 | // The current stack index. |
| 143 | uint32_t stack_index_ = 0u; |
| 144 | |
| 145 | private: |
| 146 | DISALLOW_COPY_AND_ASSIGN(InvokeDexCallingConventionVisitor); |
| 147 | }; |
| 148 | |
Calin Juravle | e460d1d | 2015-09-29 04:52:17 +0100 | [diff] [blame] | 149 | class FieldAccessCallingConvention { |
| 150 | public: |
| 151 | virtual Location GetObjectLocation() const = 0; |
| 152 | virtual Location GetFieldIndexLocation() const = 0; |
| 153 | virtual Location GetReturnLocation(Primitive::Type type) const = 0; |
| 154 | virtual Location GetSetValueLocation(Primitive::Type type, bool is_instance) const = 0; |
| 155 | virtual Location GetFpuLocation(Primitive::Type type) const = 0; |
| 156 | virtual ~FieldAccessCallingConvention() {} |
| 157 | |
| 158 | protected: |
| 159 | FieldAccessCallingConvention() {} |
| 160 | |
| 161 | private: |
| 162 | DISALLOW_COPY_AND_ASSIGN(FieldAccessCallingConvention); |
| 163 | }; |
| 164 | |
Nicolas Geoffray | 12df9eb | 2015-01-09 14:53:50 +0000 | [diff] [blame] | 165 | class CodeGenerator { |
Nicolas Geoffray | d4dd255 | 2014-02-28 10:23:58 +0000 | [diff] [blame] | 166 | public: |
// Compiles the graph to executable instructions.
void Compile(CodeAllocator* allocator);
// Factory for a code generator for `graph` and `instruction_set`.
// `stats` is optional and defaults to nullptr.
// NOTE(review): presumably returns nullptr for an unsupported instruction
// set - confirm in the definition, which is not part of this header.
static CodeGenerator* Create(HGraph* graph,
                             InstructionSet instruction_set,
                             const InstructionSetFeatures& isa_features,
                             const CompilerOptions& compiler_options,
                             OptimizingCompilerStats* stats = nullptr);
virtual ~CodeGenerator() {}

// Get the graph. This is the outermost graph, never the graph of a method being inlined.
HGraph* GetGraph() const { return graph_; }

// Block-ordering queries; all three are defined outside this header.
// NOTE(review): the names suggest they are used to decide whether a branch
// to `next` can be replaced by falling through - confirm in the .cc file.
HBasicBlock* GetNextBlockToEmit() const;
HBasicBlock* FirstNonEmptyBlock(HBasicBlock* block) const;
bool GoesToNextBlock(HBasicBlock* current, HBasicBlock* next) const;
Nicolas Geoffray | 86dbb9a | 2014-06-04 11:12:39 +0100 | [diff] [blame] | 183 | size_t GetStackSlotOfParameter(HParameterValue* parameter) const { |
| 184 | // Note that this follows the current calling convention. |
| 185 | return GetFrameSize() |
Mathieu Chartier | e401d14 | 2015-04-22 13:56:20 -0700 | [diff] [blame] | 186 | + InstructionSetPointerSize(GetInstructionSet()) // Art method |
Nicolas Geoffray | e27f31a | 2014-06-12 17:53:14 +0100 | [diff] [blame] | 187 | + parameter->GetIndex() * kVRegSize; |
Nicolas Geoffray | 86dbb9a | 2014-06-04 11:12:39 +0100 | [diff] [blame] | 188 | } |
| 189 | |
// Hooks for concrete code generators. The `= 0` members must be implemented
// by subclasses; Finalize() and EmitLinkerPatches() are virtual with a base
// implementation defined outside this header.
virtual void Initialize() = 0;
virtual void Finalize(CodeAllocator* allocator);
virtual void EmitLinkerPatches(ArenaVector<LinkerPatch>* linker_patches);
virtual void GenerateFrameEntry() = 0;
virtual void GenerateFrameExit() = 0;
virtual void Bind(HBasicBlock* block) = 0;
virtual void MoveConstant(Location destination, int32_t value) = 0;
virtual void MoveLocation(Location dst, Location src, Primitive::Type dst_type) = 0;
virtual void AddLocationAsTemp(Location location, LocationSummary* locations) = 0;

// Mutable and read-only access to the assembler owned by the subclass.
virtual Assembler* GetAssembler() = 0;
virtual const Assembler& GetAssembler() const = 0;
virtual size_t GetWordSize() const = 0;
virtual size_t GetFloatingPointSpillSlotSize() const = 0;
virtual uintptr_t GetAddressOf(HBasicBlock* block) const = 0;
// Defined outside this header.
// NOTE(review): presumably computes the frame layout (and frame_size_) from
// these register-allocation results - confirm in the .cc file.
void InitializeCodeGeneration(size_t number_of_spill_slots,
                              size_t maximum_number_of_live_core_registers,
                              size_t maximum_number_of_live_fpu_registers,
                              size_t number_of_out_slots,
                              const ArenaVector<HBasicBlock*>& block_order);
int32_t GetStackSlot(HLocal* local) const;

// Plain accessors for the frame size and the core / floating-point spill masks.
uint32_t GetFrameSize() const { return frame_size_; }
void SetFrameSize(uint32_t size) { frame_size_ = size; }
uint32_t GetCoreSpillMask() const { return core_spill_mask_; }
uint32_t GetFpuSpillMask() const { return fpu_spill_mask_; }

// Register counts as passed to the constructor.
size_t GetNumberOfCoreRegisters() const { return number_of_core_registers_; }
size_t GetNumberOfFloatingPointRegisters() const { return number_of_fpu_registers_; }
// Implemented by subclasses. Declared const.
// NOTE(review): presumably fills the arrays returned by
// GetBlockedCoreRegisters() / GetBlockedFloatingPointRegisters() - confirm.
virtual void SetupBlockedRegisters() const = 0;
Nicolas Geoffray | 71175b7 | 2014-10-09 22:13:55 +0100 | [diff] [blame] | 220 | |
Nicolas Geoffray | 4dee636 | 2015-01-23 18:23:14 +0000 | [diff] [blame] | 221 | virtual void ComputeSpillMask() { |
| 222 | core_spill_mask_ = allocated_registers_.GetCoreRegisters() & core_callee_save_mask_; |
| 223 | DCHECK_NE(core_spill_mask_, 0u) << "At least the return address register must be saved"; |
| 224 | fpu_spill_mask_ = allocated_registers_.GetFloatingPointRegisters() & fpu_callee_save_mask_; |
| 225 | } |
| 226 | |
// Builds a bit mask with bit `registers[i]` set for each of the first
// `length` entries of `registers`. Returns 0 when `length` is 0, in which
// case `registers` is not read. Each entry must be in [0, 31].
static uint32_t ComputeRegisterMask(const int* registers, size_t length) {
  uint32_t mask = 0;
  for (size_t i = 0; i < length; ++i) {
    // Shift an unsigned one: `1 << 31` overflows a signed int.
    mask |= (uint32_t{1} << registers[i]);
  }
  return mask;
}
| 234 | |
// Write a textual form of register `reg` to `stream`; implemented by subclasses.
virtual void DumpCoreRegister(std::ostream& stream, int reg) const = 0;
virtual void DumpFloatingPointRegister(std::ostream& stream, int reg) const = 0;
virtual InstructionSet GetInstructionSet() const = 0;

const CompilerOptions& GetCompilerOptions() const { return compiler_options_; }

// Defined outside this header; `count` defaults to 1.
// NOTE(review): "Maybe" presumably means nothing is recorded when no stats
// object was supplied - confirm in the .cc file.
void MaybeRecordStat(MethodCompilationStat compilation_stat, size_t count = 1) const;

// Saves the register in the stack. Returns the size taken on stack.
virtual size_t SaveCoreRegister(size_t stack_index, uint32_t reg_id) = 0;
// Restores the register from the stack. Returns the size taken on stack.
virtual size_t RestoreCoreRegister(size_t stack_index, uint32_t reg_id) = 0;

// Floating-point counterparts of SaveCoreRegister / RestoreCoreRegister.
virtual size_t SaveFloatingPointRegister(size_t stack_index, uint32_t reg_id) = 0;
virtual size_t RestoreFloatingPointRegister(size_t stack_index, uint32_t reg_id) = 0;

virtual bool NeedsTwoRegisters(Primitive::Type type) const = 0;
// Returns whether we should split long moves in parallel moves.
// The base implementation answers false; subclasses may override.
virtual bool ShouldSplitLongMoves() const { return false; }
Nicolas Geoffray | a7062e0 | 2014-05-22 12:50:17 +0100 | [diff] [blame] | 254 | |
Roland Levillain | 0d5a281 | 2015-11-13 10:07:31 +0000 | [diff] [blame] | 255 | size_t GetNumberOfCoreCalleeSaveRegisters() const { |
| 256 | return POPCOUNT(core_callee_save_mask_); |
| 257 | } |
| 258 | |
| 259 | size_t GetNumberOfCoreCallerSaveRegisters() const { |
| 260 | DCHECK_GE(GetNumberOfCoreRegisters(), GetNumberOfCoreCalleeSaveRegisters()); |
| 261 | return GetNumberOfCoreRegisters() - GetNumberOfCoreCalleeSaveRegisters(); |
| 262 | } |
| 263 | |
Nicolas Geoffray | 9889396 | 2015-01-21 12:32:32 +0000 | [diff] [blame] | 264 | bool IsCoreCalleeSaveRegister(int reg) const { |
| 265 | return (core_callee_save_mask_ & (1 << reg)) != 0; |
| 266 | } |
| 267 | |
| 268 | bool IsFloatingPointCalleeSaveRegister(int reg) const { |
| 269 | return (fpu_callee_save_mask_ & (1 << reg)) != 0; |
| 270 | } |
| 271 | |
// Record native to dex mapping for a suspend point. Required by runtime.
// `slow_path` is optional and defaults to nullptr.
void RecordPcInfo(HInstruction* instruction, uint32_t dex_pc, SlowPathCode* slow_path = nullptr);
// Check whether we have already recorded mapping at this PC.
bool HasStackMapAtCurrentPc();
// Record extra stack maps if we support native debugging.
void MaybeRecordNativeDebugInfo(HInstruction* instruction, uint32_t dex_pc);

// Implicit null check support; both are defined outside this header.
bool CanMoveNullCheckToUser(HNullCheck* null_check);
void MaybeRecordImplicitNullCheck(HInstruction* instruction);

// Records a stack map which the runtime might use to set catch phi values
// during exception delivery.
// TODO: Replace with a catch-entering instruction that records the environment.
void RecordCatchBlockInfo();

// Returns true if implicit null checks are allowed in the compiler options
// and if the null check is not inside a try block. We currently cannot do
// implicit null checks in that case because we need the NullCheckSlowPath to
// save live registers, which may be needed by the runtime to set catch phis.
bool IsImplicitNullCheckAllowed(HNullCheck* null_check) const;
| 292 | |
// Appends `slow_path` to the list of slow paths held by this code generator.
void AddSlowPath(SlowPathCode* slow_path) {
  slow_paths_.push_back(slow_path);
}

// Stack map construction; both are defined outside this header.
// NOTE(review): presumably `region` must be at least ComputeStackMapsSize()
// bytes - confirm in the .cc file.
void BuildStackMaps(MemoryRegion region, const DexFile::CodeItem& code_item);
size_t ComputeStackMapsSize();

// Returns the leaf flag, which MarkNotLeaf() clears.
bool IsLeafMethod() const {
  return is_leaf_;
}

// Clears the leaf flag. A non-leaf method is also flagged as requiring the
// current method.
void MarkNotLeaf() {
  is_leaf_ = false;
  requires_current_method_ = true;
}

// Flags the method as requiring the current method, without touching the
// leaf flag.
void SetRequiresCurrentMethod() {
  requires_current_method_ = true;
}

bool RequiresCurrentMethod() const {
  return requires_current_method_;
}
| 316 | |
// Clears the spill slots taken by loop phis in the `LocationSummary` of the
// suspend check. This is called when the code generator generates code
// for the suspend check at the back edge (instead of where the suspend check
// is, which is the loop entry). At this point, the spill slots for the phis
// have not been written to.
void ClearSpillSlotsFromLoopPhisInStackMap(HSuspendCheck* suspend_check) const;

// Return the arrays allocated by the constructor, one bool per core /
// floating-point register. The pointers are mutable even though the
// accessors are const.
bool* GetBlockedCoreRegisters() const { return blocked_core_registers_; }
bool* GetBlockedFloatingPointRegisters() const { return blocked_fpu_registers_; }

// Helper that returns the pointer offset of an index in an object array.
// Note: this method assumes we always have the same pointer size, regardless
// of the architecture.
static size_t GetCacheOffset(uint32_t index);
// Pointer variant for ArtMethod and ArtField arrays.
size_t GetCachePointerOffset(uint32_t index);

// Emits two moves, `from1` -> `to1` and `from2` -> `to2`, each with its own
// type. Defined outside this header.
// NOTE(review): presumably the pair goes through the parallel move resolver
// so overlapping locations are handled - confirm in the .cc file.
void EmitParallelMoves(Location from1,
                       Location to1,
                       Primitive::Type type1,
                       Location from2,
                       Location to2,
                       Primitive::Type type2);
Nicolas Geoffray | f0e3937 | 2014-11-12 17:50:07 +0000 | [diff] [blame] | 340 | |
Nicolas Geoffray | af07bc1 | 2014-11-12 18:08:09 +0000 | [diff] [blame] | 341 | static bool StoreNeedsWriteBarrier(Primitive::Type type, HInstruction* value) { |
David Brazdil | 522e224 | 2015-03-17 18:48:28 +0000 | [diff] [blame] | 342 | // Check that null value is not represented as an integer constant. |
| 343 | DCHECK(type != Primitive::kPrimNot || !value->IsIntConstant()); |
| 344 | return type == Primitive::kPrimNot && !value->IsNullConstant(); |
Nicolas Geoffray | af07bc1 | 2014-11-12 18:08:09 +0000 | [diff] [blame] | 345 | } |
| 346 | |
Alexandre Rames | 78e3ef6 | 2015-08-12 13:43:29 +0100 | [diff] [blame] | 347 | void ValidateInvokeRuntime(HInstruction* instruction, SlowPathCode* slow_path); |
| 348 | |
Nicolas Geoffray | 9889396 | 2015-01-21 12:32:32 +0000 | [diff] [blame] | 349 | void AddAllocatedRegister(Location location) { |
| 350 | allocated_registers_.Add(location); |
| 351 | } |
| 352 | |
Nicolas Geoffray | 45b83af | 2015-07-06 15:12:53 +0000 | [diff] [blame] | 353 | bool HasAllocatedRegister(bool is_core, int reg) const { |
| 354 | return is_core |
| 355 | ? allocated_registers_.ContainsCoreRegister(reg) |
| 356 | : allocated_registers_.ContainsFloatingPointRegister(reg); |
| 357 | } |
| 358 | |
Nicolas Geoffray | c0572a4 | 2015-02-06 14:35:25 +0000 | [diff] [blame] | 359 | void AllocateLocations(HInstruction* instruction); |
| 360 | |
Roland Levillain | aa9b7c4 | 2015-02-17 15:40:09 +0000 | [diff] [blame] | 361 | // Tells whether the stack frame of the compiled method is |
| 362 | // considered "empty", that is either actually having a size of zero, |
| 363 | // or just containing the saved return address register. |
| 364 | bool HasEmptyFrame() const { |
| 365 | return GetFrameSize() == (CallPushesPC() ? GetWordSize() : 0); |
| 366 | } |
| 367 | |
Nicolas Geoffray | d6138ef | 2015-02-18 14:48:53 +0000 | [diff] [blame] | 368 | static int32_t GetInt32ValueOf(HConstant* constant) { |
| 369 | if (constant->IsIntConstant()) { |
| 370 | return constant->AsIntConstant()->GetValue(); |
| 371 | } else if (constant->IsNullConstant()) { |
| 372 | return 0; |
| 373 | } else { |
| 374 | DCHECK(constant->IsFloatConstant()); |
Roland Levillain | da4d79b | 2015-03-24 14:36:11 +0000 | [diff] [blame] | 375 | return bit_cast<int32_t, float>(constant->AsFloatConstant()->GetValue()); |
Nicolas Geoffray | d6138ef | 2015-02-18 14:48:53 +0000 | [diff] [blame] | 376 | } |
| 377 | } |
| 378 | |
| 379 | static int64_t GetInt64ValueOf(HConstant* constant) { |
| 380 | if (constant->IsIntConstant()) { |
| 381 | return constant->AsIntConstant()->GetValue(); |
| 382 | } else if (constant->IsNullConstant()) { |
| 383 | return 0; |
| 384 | } else if (constant->IsFloatConstant()) { |
Roland Levillain | da4d79b | 2015-03-24 14:36:11 +0000 | [diff] [blame] | 385 | return bit_cast<int32_t, float>(constant->AsFloatConstant()->GetValue()); |
Nicolas Geoffray | d6138ef | 2015-02-18 14:48:53 +0000 | [diff] [blame] | 386 | } else if (constant->IsLongConstant()) { |
| 387 | return constant->AsLongConstant()->GetValue(); |
| 388 | } else { |
| 389 | DCHECK(constant->IsDoubleConstant()); |
Roland Levillain | da4d79b | 2015-03-24 14:36:11 +0000 | [diff] [blame] | 390 | return bit_cast<int64_t, double>(constant->AsDoubleConstant()->GetValue()); |
Nicolas Geoffray | d6138ef | 2015-02-18 14:48:53 +0000 | [diff] [blame] | 391 | } |
| 392 | } |
| 393 | |
// Plain accessor; the constructor initializes the value to 0.
size_t GetFirstRegisterSlotInSlowPath() const {
  return first_register_slot_in_slow_path_;
}

// Sum of the floating-point and core spill sizes.
uint32_t FrameEntrySpillSize() const {
  return GetFpuSpillSize() + GetCoreSpillSize();
}

// Implemented by subclasses.
virtual ParallelMoveResolver* GetMoveResolver() = 0;

// Location-summary and code-emission helpers. All are defined outside this
// header.
static void CreateCommonInvokeLocationSummary(
    HInvoke* invoke, InvokeDexCallingConventionVisitor* visitor);

void GenerateInvokeUnresolvedRuntimeCall(HInvokeUnresolved* invoke);

void CreateUnresolvedFieldLocationSummary(
    HInstruction* field_access,
    Primitive::Type field_type,
    const FieldAccessCallingConvention& calling_convention);

void GenerateUnresolvedFieldAccess(
    HInstruction* field_access,
    Primitive::Type field_type,
    uint32_t field_index,
    uint32_t dex_pc,
    const FieldAccessCallingConvention& calling_convention);

// TODO: This overlaps a bit with MoveFromReturnRegister. Refactor for a better design.
// `code_generator_supports_read_barrier` defaults to false.
static void CreateLoadClassLocationSummary(HLoadClass* cls,
                                           Location runtime_type_index_location,
                                           Location runtime_return_location,
                                           bool code_generator_supports_read_barrier = false);

static void CreateSystemArrayCopyLocationSummary(HInvoke* invoke);

// Plain setter/getter for the disassembly information pointer. The pointer
// is stored as given.
void SetDisassemblyInformation(DisassemblyInformation* info) { disasm_info_ = info; }
DisassemblyInformation* GetDisassemblyInformation() const { return disasm_info_; }
// Implemented by subclasses.
// NOTE(review): presumably emits a call to the runtime `entrypoint` on
// behalf of `instruction` and records pc info for `dex_pc` - confirm in the
// implementations.
virtual void InvokeRuntime(QuickEntrypointEnum entrypoint,
                           HInstruction* instruction,
                           uint32_t dex_pc,
                           SlowPathCode* slow_path) = 0;

// Check if the desired_dispatch_info is supported. If it is, return it,
// otherwise return a fall-back info that should be used instead.
virtual HInvokeStaticOrDirect::DispatchInfo GetSupportedInvokeStaticOrDirectDispatch(
    const HInvokeStaticOrDirect::DispatchInfo& desired_dispatch_info,
    MethodReference target_method) = 0;

// Generate a call to a static or direct method.
virtual void GenerateStaticOrDirectCall(HInvokeStaticOrDirect* invoke, Location temp) = 0;
// Generate a call to a virtual method.
virtual void GenerateVirtualCall(HInvokeVirtual* invoke, Location temp) = 0;

// Copy the result of a call into the given target.
virtual void MoveFromReturnRegister(Location trg, Primitive::Type type) = 0;

// Implemented by subclasses.
// NOTE(review): presumably emits a single no-op instruction - confirm in the
// implementations.
virtual void GenerateNop() = 0;
| 452 | |
Nicolas Geoffray | 787c307 | 2014-03-17 10:20:19 +0000 | [diff] [blame] | 453 | protected: |
Vladimir Marko | 5815501 | 2015-08-19 12:49:41 +0000 | [diff] [blame] | 454 | // Method patch info used for recording locations of required linker patches and |
| 455 | // target methods. The target method can be used for various purposes, whether for |
| 456 | // patching the address of the method or the code pointer or a PC-relative call. |
| 457 | template <typename LabelType> |
| 458 | struct MethodPatchInfo { |
| 459 | explicit MethodPatchInfo(MethodReference m) : target_method(m), label() { } |
| 460 | |
| 461 | MethodReference target_method; |
| 462 | LabelType label; |
| 463 | }; |
| 464 | |
Nicolas Geoffray | 71175b7 | 2014-10-09 22:13:55 +0100 | [diff] [blame] | 465 | CodeGenerator(HGraph* graph, |
| 466 | size_t number_of_core_registers, |
| 467 | size_t number_of_fpu_registers, |
Calin Juravle | cd6dffe | 2015-01-08 17:35:35 +0000 | [diff] [blame] | 468 | size_t number_of_register_pairs, |
Nicolas Geoffray | 9889396 | 2015-01-21 12:32:32 +0000 | [diff] [blame] | 469 | uint32_t core_callee_save_mask, |
| 470 | uint32_t fpu_callee_save_mask, |
Serban Constantinescu | ecc4366 | 2015-08-13 13:33:12 +0100 | [diff] [blame] | 471 | const CompilerOptions& compiler_options, |
| 472 | OptimizingCompilerStats* stats) |
Nicolas Geoffray | c0572a4 | 2015-02-06 14:35:25 +0000 | [diff] [blame] | 473 | : frame_size_(0), |
Nicolas Geoffray | 4361bef | 2014-08-20 04:59:12 +0100 | [diff] [blame] | 474 | core_spill_mask_(0), |
Nicolas Geoffray | d97dc40 | 2015-01-22 13:50:01 +0000 | [diff] [blame] | 475 | fpu_spill_mask_(0), |
Nicolas Geoffray | 3bca0df | 2014-09-19 11:01:00 +0100 | [diff] [blame] | 476 | first_register_slot_in_slow_path_(0), |
Vladimir Marko | 5233f93 | 2015-09-29 19:01:15 +0100 | [diff] [blame] | 477 | blocked_core_registers_(graph->GetArena()->AllocArray<bool>(number_of_core_registers, |
| 478 | kArenaAllocCodeGenerator)), |
| 479 | blocked_fpu_registers_(graph->GetArena()->AllocArray<bool>(number_of_fpu_registers, |
| 480 | kArenaAllocCodeGenerator)), |
| 481 | blocked_register_pairs_(graph->GetArena()->AllocArray<bool>(number_of_register_pairs, |
| 482 | kArenaAllocCodeGenerator)), |
Nicolas Geoffray | 71175b7 | 2014-10-09 22:13:55 +0100 | [diff] [blame] | 483 | number_of_core_registers_(number_of_core_registers), |
| 484 | number_of_fpu_registers_(number_of_fpu_registers), |
| 485 | number_of_register_pairs_(number_of_register_pairs), |
Nicolas Geoffray | 9889396 | 2015-01-21 12:32:32 +0000 | [diff] [blame] | 486 | core_callee_save_mask_(core_callee_save_mask), |
| 487 | fpu_callee_save_mask_(fpu_callee_save_mask), |
Vladimir Marko | cf93a5c | 2015-06-16 11:33:24 +0000 | [diff] [blame] | 488 | stack_map_stream_(graph->GetArena()), |
| 489 | block_order_(nullptr), |
Alexandre Rames | eb7b739 | 2015-06-19 14:47:01 +0100 | [diff] [blame] | 490 | disasm_info_(nullptr), |
Serban Constantinescu | ecc4366 | 2015-08-13 13:33:12 +0100 | [diff] [blame] | 491 | stats_(stats), |
Nicolas Geoffray | 787c307 | 2014-03-17 10:20:19 +0000 | [diff] [blame] | 492 | graph_(graph), |
Calin Juravle | cd6dffe | 2015-01-08 17:35:35 +0000 | [diff] [blame] | 493 | compiler_options_(compiler_options), |
Vladimir Marko | 225b646 | 2015-09-28 12:17:40 +0100 | [diff] [blame] | 494 | slow_paths_(graph->GetArena()->Adapter(kArenaAllocCodeGenerator)), |
Vladimir Marko | 0f7dca4 | 2015-11-02 14:36:43 +0000 | [diff] [blame] | 495 | current_slow_path_(nullptr), |
Nicolas Geoffray | 4c204ba | 2015-02-03 15:12:35 +0000 | [diff] [blame] | 496 | current_block_index_(0), |
Nicolas Geoffray | 3946844 | 2014-09-02 15:17:15 +0100 | [diff] [blame] | 497 | is_leaf_(true), |
Vladimir Marko | 225b646 | 2015-09-28 12:17:40 +0100 | [diff] [blame] | 498 | requires_current_method_(false) { |
| 499 | slow_paths_.reserve(8); |
| 500 | } |
Nicolas Geoffray | d4dd255 | 2014-02-28 10:23:58 +0000 | [diff] [blame] | 501 | |
// Pure virtual hook implemented per architecture.
// NOTE(review): presumably maps the local read by `load` to its stack
// location — confirm against the implementations.
Nicolas Geoffray | a7aca37 | 2014-04-28 17:47:12 +0100 | [diff] [blame] | 502 | virtual Location GetStackLocation(HLoadLocal* load) const = 0; |
| 503 | |
// Pure virtual accessors for the two graph visitors supplied by the concrete
// code generator.
// NOTE(review): presumably the first assigns locations to instructions and
// the second emits code for them — confirm.
Nicolas Geoffray | c0572a4 | 2015-02-06 14:35:25 +0000 | [diff] [blame] | 504 | virtual HGraphVisitor* GetLocationBuilder() = 0; |
| 505 | virtual HGraphVisitor* GetInstructionVisitor() = 0; |
Nicolas Geoffray | f0e3937 | 2014-11-12 17:50:07 +0000 | [diff] [blame] | 506 | |
Nicolas Geoffray | d97dc40 | 2015-01-22 13:50:01 +0000 | [diff] [blame] | 507 | // Returns the location of the first spilled entry for floating point registers, |
| 508 | // relative to the stack pointer. |
| 509 | uint32_t GetFpuSpillStart() const { |
Nicolas Geoffray | d97dc40 | 2015-01-22 13:50:01 +0000 | [diff] [blame] | 510 | return GetFrameSize() - FrameEntrySpillSize(); |
| 511 | } |
| 512 | |
| 513 | uint32_t GetFpuSpillSize() const { |
| 514 | return POPCOUNT(fpu_spill_mask_) * GetFloatingPointSpillSlotSize(); |
| 515 | } |
| 516 | |
| 517 | uint32_t GetCoreSpillSize() const { |
| 518 | return POPCOUNT(core_spill_mask_) * GetWordSize(); |
| 519 | } |
| 520 | |
Nicolas Geoffray | c0572a4 | 2015-02-06 14:35:25 +0000 | [diff] [blame] | 521 | bool HasAllocatedCalleeSaveRegisters() const { |
| 522 | // We check the core registers against 1 because it always comprises the return PC. |
| 523 | return (POPCOUNT(allocated_registers_.GetCoreRegisters() & core_callee_save_mask_) != 1) |
| 524 | || (POPCOUNT(allocated_registers_.GetFloatingPointRegisters() & fpu_callee_save_mask_) != 0); |
| 525 | } |
| 526 | |
| 527 | bool CallPushesPC() const { |
| 528 | InstructionSet instruction_set = GetInstructionSet(); |
| 529 | return instruction_set == kX86 || instruction_set == kX86_64; |
| 530 | } |
| 531 | |
Vladimir Marko | 225b646 | 2015-09-28 12:17:40 +0100 | [diff] [blame] | 532 | // Arm64 has its own type for a label, so we need to templatize these methods |
Nicolas Geoffray | dc23d83 | 2015-02-16 11:15:43 +0000 | [diff] [blame] | 533 | // to share the logic. |
Vladimir Marko | 225b646 | 2015-09-28 12:17:40 +0100 | [diff] [blame] | 534 | |
| 535 | template <typename LabelType> |
| 536 | LabelType* CommonInitializeLabels() { |
Vladimir Marko | b95fb77 | 2015-09-30 13:32:31 +0100 | [diff] [blame] | 537 | // We use raw array allocations instead of ArenaVector<> because Labels are |
| 538 | // non-constructible and non-movable and as such cannot be held in a vector. |
Vladimir Marko | 225b646 | 2015-09-28 12:17:40 +0100 | [diff] [blame] | 539 | size_t size = GetGraph()->GetBlocks().size(); |
| 540 | LabelType* labels = GetGraph()->GetArena()->AllocArray<LabelType>(size, |
| 541 | kArenaAllocCodeGenerator); |
| 542 | for (size_t i = 0; i != size; ++i) { |
| 543 | new(labels + i) LabelType(); |
| 544 | } |
| 545 | return labels; |
| 546 | } |
| 547 | |
Vladimir Marko | 5815501 | 2015-08-19 12:49:41 +0000 | [diff] [blame] | 548 | template <typename LabelType> |
| 549 | LabelType* CommonGetLabelOf(LabelType* raw_pointer_to_labels_array, HBasicBlock* block) const { |
Nicolas Geoffray | dc23d83 | 2015-02-16 11:15:43 +0000 | [diff] [blame] | 550 | block = FirstNonEmptyBlock(block); |
| 551 | return raw_pointer_to_labels_array + block->GetBlockId(); |
| 552 | } |
| 553 | |
// Returns current_slow_path_, i.e. the slow path code is currently being
// generated for. The constructor initializes it to nullptr.
Vladimir Marko | 0f7dca4 | 2015-11-02 14:36:43 +0000 | [diff] [blame] | 554 | SlowPathCode* GetCurrentSlowPath() { |
| 555 | return current_slow_path_; |
| 556 | } |
| 557 | |
Nicolas Geoffray | 8ccc3f5 | 2014-03-19 10:34:11 +0000 | [diff] [blame] | 558 | // Frame size required for this method. |
| 559 | uint32_t frame_size_; |
// Bit masks of spilled core / floating point registers. Their population
// counts size the spill areas (see GetCoreSpillSize() and GetFpuSpillSize()).
| 560 | uint32_t core_spill_mask_; |
Nicolas Geoffray | d97dc40 | 2015-01-22 13:50:01 +0000 | [diff] [blame] | 561 | uint32_t fpu_spill_mask_; |
// Initialized to 0 by the constructor.
// NOTE(review): presumably the stack slot where slow paths start saving live
// registers — confirm against the users of this field.
Nicolas Geoffray | 3bca0df | 2014-09-19 11:01:00 +0100 | [diff] [blame] | 562 | uint32_t first_register_slot_in_slow_path_; |
Nicolas Geoffray | 8ccc3f5 | 2014-03-19 10:34:11 +0000 | [diff] [blame] | 563 | |
Nicolas Geoffray | 9889396 | 2015-01-21 12:32:32 +0000 | [diff] [blame] | 564 | // Registers that were allocated during linear scan. |
| 565 | RegisterSet allocated_registers_; |
| 566 | |
Nicolas Geoffray | 71175b7 | 2014-10-09 22:13:55 +0100 | [diff] [blame] | 567 | // Arrays used when doing register allocation to know which |
| 568 | // registers we can allocate. `SetupBlockedRegisters` updates the |
| 569 | // arrays. |
// The constructor allocates the arrays from the graph's arena, sized by the
// matching number_of_*_ counts below.
| 570 | bool* const blocked_core_registers_; |
| 571 | bool* const blocked_fpu_registers_; |
| 572 | bool* const blocked_register_pairs_; |
| 573 | size_t number_of_core_registers_; |
| 574 | size_t number_of_fpu_registers_; |
| 575 | size_t number_of_register_pairs_; |
// Callee-save register masks, fixed at construction time.
Nicolas Geoffray | 9889396 | 2015-01-21 12:32:32 +0000 | [diff] [blame] | 576 | const uint32_t core_callee_save_mask_; |
| 577 | const uint32_t fpu_callee_save_mask_; |
Nicolas Geoffray | 71175b7 | 2014-10-09 22:13:55 +0100 | [diff] [blame] | 578 | |
// Constructed with the graph's arena.
Vladimir Marko | cf93a5c | 2015-06-16 11:33:24 +0000 | [diff] [blame] | 579 | StackMapStream stack_map_stream_; |
| 580 | |
| 581 | // The order to use for code generation. |
// nullptr after construction.
Vladimir Marko | fa6b93c | 2015-09-15 10:15:55 +0100 | [diff] [blame] | 582 | const ArenaVector<HBasicBlock*>* block_order_; |
Vladimir Marko | cf93a5c | 2015-06-16 11:33:24 +0000 | [diff] [blame] | 583 | |
// nullptr after construction; installed through SetDisassemblyInformation().
Alexandre Rames | eb7b739 | 2015-06-19 14:47:01 +0100 | [diff] [blame] | 584 | DisassemblyInformation* disasm_info_; |
| 585 | |
Nicolas Geoffray | bab4ed7 | 2014-03-11 17:53:17 +0000 | [diff] [blame] | 586 | private: |
// Private helpers, defined out of line.
// NOTE(review): the behavior of these four is not visible from this header;
// see their definitions before relying on the names alone.
Nicolas Geoffray | 3bca0df | 2014-09-19 11:01:00 +0100 | [diff] [blame] | 587 | size_t GetStackOffsetOfSavedRegister(size_t index); |
Alexandre Rames | eb7b739 | 2015-06-19 14:47:01 +0100 | [diff] [blame] | 588 | void GenerateSlowPaths(); |
Mark Mendell | 5f87418 | 2015-03-04 15:42:45 -0500 | [diff] [blame] | 589 | void BlockIfInRegister(Location location, bool is_out = false) const; |
Nicolas Geoffray | b1d0f3f | 2015-05-14 12:41:51 +0100 | [diff] [blame] | 590 | void EmitEnvironment(HEnvironment* environment, SlowPathCode* slow_path); |
Nicolas Geoffray | d4dd255 | 2014-02-28 10:23:58 +0000 | [diff] [blame] | 591 | |
// Statistics sink handed to the constructor.
Serban Constantinescu | ecc4366 | 2015-08-13 13:33:12 +0100 | [diff] [blame] | 592 | OptimizingCompilerStats* stats_; |
| 593 | |
// Graph and compiler options handed to the constructor; neither can be
// re-seated afterwards (const pointer / reference).
Nicolas Geoffray | 787c307 | 2014-03-17 10:20:19 +0000 | [diff] [blame] | 594 | HGraph* const graph_; |
Calin Juravle | cd6dffe | 2015-01-08 17:35:35 +0000 | [diff] [blame] | 595 | const CompilerOptions& compiler_options_; |
Nicolas Geoffray | d4dd255 | 2014-02-28 10:23:58 +0000 | [diff] [blame] | 596 | |
// Arena-backed list of slow paths; the constructor reserves room for 8.
Vladimir Marko | 225b646 | 2015-09-28 12:17:40 +0100 | [diff] [blame] | 597 | ArenaVector<SlowPathCode*> slow_paths_; |
Nicolas Geoffray | d4dd255 | 2014-02-28 10:23:58 +0000 | [diff] [blame] | 598 | |
Aart Bik | 42249c3 | 2016-01-07 15:33:50 -0800 | [diff] [blame] | 599 | // The current slow-path that we're generating code for. |
Vladimir Marko | 0f7dca4 | 2015-11-02 14:36:43 +0000 | [diff] [blame] | 600 | SlowPathCode* current_slow_path_; |
| 601 | |
Nicolas Geoffray | 4c204ba | 2015-02-03 15:12:35 +0000 | [diff] [blame] | 602 | // The current block index in `block_order_` of the block |
| 603 | // we are generating code for. |
| 604 | size_t current_block_index_; |
| 605 | |
Nicolas Geoffray | c0572a4 | 2015-02-06 14:35:25 +0000 | [diff] [blame] | 606 | // Whether the method is a leaf method. |
// Starts out true (see the constructor).
Nicolas Geoffray | f12feb8 | 2014-07-17 18:32:41 +0100 | [diff] [blame] | 607 | bool is_leaf_; |
| 608 | |
Nicolas Geoffray | c0572a4 | 2015-02-06 14:35:25 +0000 | [diff] [blame] | 609 | // Whether an instruction in the graph accesses the current method. |
// Starts out false (see the constructor).
| 610 | bool requires_current_method_; |
| 611 | |
David Srbecky | c6b4dd8 | 2015-04-07 20:32:43 +0100 | [diff] [blame] | 612 | friend class OptimizingCFITest; |
| 613 | |
Nicolas Geoffray | d4dd255 | 2014-02-28 10:23:58 +0000 | [diff] [blame] | 614 | DISALLOW_COPY_AND_ASSIGN(CodeGenerator); |
| 615 | }; |
| 616 | |
Nicolas Geoffray | 7fb49da | 2014-10-06 09:12:41 +0100 | [diff] [blame] | 617 | template <typename C, typename F> |
Nicolas Geoffray | 4a34a42 | 2014-04-03 10:38:37 +0100 | [diff] [blame] | 618 | class CallingConvention { |
| 619 | public: |
Nicolas Geoffray | 7fb49da | 2014-10-06 09:12:41 +0100 | [diff] [blame] | 620 | CallingConvention(const C* registers, |
| 621 | size_t number_of_registers, |
| 622 | const F* fpu_registers, |
Mathieu Chartier | e401d14 | 2015-04-22 13:56:20 -0700 | [diff] [blame] | 623 | size_t number_of_fpu_registers, |
| 624 | size_t pointer_size) |
Nicolas Geoffray | 7fb49da | 2014-10-06 09:12:41 +0100 | [diff] [blame] | 625 | : registers_(registers), |
| 626 | number_of_registers_(number_of_registers), |
| 627 | fpu_registers_(fpu_registers), |
Mathieu Chartier | e401d14 | 2015-04-22 13:56:20 -0700 | [diff] [blame] | 628 | number_of_fpu_registers_(number_of_fpu_registers), |
| 629 | pointer_size_(pointer_size) {} |
Nicolas Geoffray | 4a34a42 | 2014-04-03 10:38:37 +0100 | [diff] [blame] | 630 | |
| 631 | size_t GetNumberOfRegisters() const { return number_of_registers_; } |
Nicolas Geoffray | 7fb49da | 2014-10-06 09:12:41 +0100 | [diff] [blame] | 632 | size_t GetNumberOfFpuRegisters() const { return number_of_fpu_registers_; } |
Nicolas Geoffray | 4a34a42 | 2014-04-03 10:38:37 +0100 | [diff] [blame] | 633 | |
Nicolas Geoffray | 7fb49da | 2014-10-06 09:12:41 +0100 | [diff] [blame] | 634 | C GetRegisterAt(size_t index) const { |
Nicolas Geoffray | 4a34a42 | 2014-04-03 10:38:37 +0100 | [diff] [blame] | 635 | DCHECK_LT(index, number_of_registers_); |
| 636 | return registers_[index]; |
| 637 | } |
| 638 | |
Nicolas Geoffray | 7fb49da | 2014-10-06 09:12:41 +0100 | [diff] [blame] | 639 | F GetFpuRegisterAt(size_t index) const { |
| 640 | DCHECK_LT(index, number_of_fpu_registers_); |
| 641 | return fpu_registers_[index]; |
| 642 | } |
| 643 | |
| 644 | size_t GetStackOffsetOf(size_t index) const { |
Nicolas Geoffray | 4a34a42 | 2014-04-03 10:38:37 +0100 | [diff] [blame] | 645 | // We still reserve the space for parameters passed by registers. |
Mathieu Chartier | e401d14 | 2015-04-22 13:56:20 -0700 | [diff] [blame] | 646 | // Add space for the method pointer. |
| 647 | return pointer_size_ + index * kVRegSize; |
Nicolas Geoffray | 4a34a42 | 2014-04-03 10:38:37 +0100 | [diff] [blame] | 648 | } |
| 649 | |
| 650 | private: |
Nicolas Geoffray | 7fb49da | 2014-10-06 09:12:41 +0100 | [diff] [blame] | 651 | const C* registers_; |
Nicolas Geoffray | 4a34a42 | 2014-04-03 10:38:37 +0100 | [diff] [blame] | 652 | const size_t number_of_registers_; |
Nicolas Geoffray | 7fb49da | 2014-10-06 09:12:41 +0100 | [diff] [blame] | 653 | const F* fpu_registers_; |
| 654 | const size_t number_of_fpu_registers_; |
Mathieu Chartier | e401d14 | 2015-04-22 13:56:20 -0700 | [diff] [blame] | 655 | const size_t pointer_size_; |
Nicolas Geoffray | 4a34a42 | 2014-04-03 10:38:37 +0100 | [diff] [blame] | 656 | |
| 657 | DISALLOW_COPY_AND_ASSIGN(CallingConvention); |
| 658 | }; |
| 659 | |
Aart Bik | 42249c3 | 2016-01-07 15:33:50 -0800 | [diff] [blame] | 660 | /** |
| 661 | * A templated class SlowPathGenerator with a templated method NewSlowPath() |
| 662 | * that can be used by any code generator to share equivalent slow-paths with |
| 663 | * the objective of reducing generated code size. |
| 664 | * |
| 665 | * InstructionType: instruction that requires SlowPathCodeType |
| 666 | * SlowPathCodeType: subclass of SlowPathCode, with constructor SlowPathCodeType(InstructionType *) |
| 667 | */ |
| 668 | template <typename InstructionType> |
| 669 | class SlowPathGenerator { |
| 670 | static_assert(std::is_base_of<HInstruction, InstructionType>::value, |
| 671 | "InstructionType is not a subclass of art::HInstruction"); |
| 672 | |
| 673 | public: |
| 674 | SlowPathGenerator(HGraph* graph, CodeGenerator* codegen) |
| 675 | : graph_(graph), |
| 676 | codegen_(codegen), |
| 677 | slow_path_map_(std::less<uint32_t>(), graph->GetArena()->Adapter(kArenaAllocSlowPaths)) {} |
| 678 | |
| 679 | // Creates and adds a new slow-path, if needed, or returns existing one otherwise. |
| 680 | // Templating the method (rather than the whole class) on the slow-path type enables |
| 681 | // keeping this code at a generic, non architecture-specific place. |
| 682 | // |
| 683 | // NOTE: This approach assumes each InstructionType only generates one SlowPathCodeType. |
| 684 | // To relax this requirement, we would need some RTTI on the stored slow-paths, |
| 685 | // or template the class as a whole on SlowPathType. |
| 686 | template <typename SlowPathCodeType> |
| 687 | SlowPathCodeType* NewSlowPath(InstructionType* instruction) { |
| 688 | static_assert(std::is_base_of<SlowPathCode, SlowPathCodeType>::value, |
| 689 | "SlowPathCodeType is not a subclass of art::SlowPathCode"); |
| 690 | static_assert(std::is_constructible<SlowPathCodeType, InstructionType*>::value, |
| 691 | "SlowPathCodeType is not constructible from InstructionType*"); |
| 692 | // Iterate over potential candidates for sharing. Currently, only same-typed |
| 693 | // slow-paths with exactly the same dex-pc are viable candidates. |
| 694 | // TODO: pass dex-pc/slow-path-type to run-time to allow even more sharing? |
| 695 | const uint32_t dex_pc = instruction->GetDexPc(); |
| 696 | auto iter = slow_path_map_.find(dex_pc); |
| 697 | if (iter != slow_path_map_.end()) { |
| 698 | auto candidates = iter->second; |
| 699 | for (const auto& it : candidates) { |
| 700 | InstructionType* other_instruction = it.first; |
| 701 | SlowPathCodeType* other_slow_path = down_cast<SlowPathCodeType*>(it.second); |
| 702 | // Determine if the instructions allow for slow-path sharing. |
| 703 | if (HaveSameLiveRegisters(instruction, other_instruction) && |
| 704 | HaveSameStackMap(instruction, other_instruction)) { |
| 705 | // Can share: reuse existing one. |
| 706 | return other_slow_path; |
| 707 | } |
| 708 | } |
| 709 | } else { |
| 710 | // First time this dex-pc is seen. |
| 711 | iter = slow_path_map_.Put(dex_pc, {{}, {graph_->GetArena()->Adapter(kArenaAllocSlowPaths)}}); |
| 712 | } |
| 713 | // Cannot share: create and add new slow-path for this particular dex-pc. |
| 714 | SlowPathCodeType* slow_path = new (graph_->GetArena()) SlowPathCodeType(instruction); |
| 715 | iter->second.emplace_back(std::make_pair(instruction, slow_path)); |
| 716 | codegen_->AddSlowPath(slow_path); |
| 717 | return slow_path; |
| 718 | } |
| 719 | |
| 720 | private: |
| 721 | // Tests if both instructions have same set of live physical registers. This ensures |
| 722 | // the slow-path has exactly the same preamble on saving these registers to stack. |
| 723 | bool HaveSameLiveRegisters(const InstructionType* i1, const InstructionType* i2) const { |
| 724 | const uint32_t core_spill = ~codegen_->GetCoreSpillMask(); |
| 725 | const uint32_t fpu_spill = ~codegen_->GetFpuSpillMask(); |
| 726 | RegisterSet* live1 = i1->GetLocations()->GetLiveRegisters(); |
| 727 | RegisterSet* live2 = i2->GetLocations()->GetLiveRegisters(); |
| 728 | return (((live1->GetCoreRegisters() & core_spill) == |
| 729 | (live2->GetCoreRegisters() & core_spill)) && |
| 730 | ((live1->GetFloatingPointRegisters() & fpu_spill) == |
| 731 | (live2->GetFloatingPointRegisters() & fpu_spill))); |
| 732 | } |
| 733 | |
| 734 | // Tests if both instructions have the same stack map. This ensures the interpreter |
| 735 | // will find exactly the same dex-registers at the same entries. |
| 736 | bool HaveSameStackMap(const InstructionType* i1, const InstructionType* i2) const { |
| 737 | DCHECK(i1->HasEnvironment()); |
| 738 | DCHECK(i2->HasEnvironment()); |
| 739 | // We conservatively test if the two instructions find exactly the same instructions |
| 740 | // and location in each dex-register. This guarantees they will have the same stack map. |
| 741 | HEnvironment* e1 = i1->GetEnvironment(); |
| 742 | HEnvironment* e2 = i2->GetEnvironment(); |
| 743 | if (e1->GetParent() != e2->GetParent() || e1->Size() != e2->Size()) { |
| 744 | return false; |
| 745 | } |
| 746 | for (size_t i = 0, sz = e1->Size(); i < sz; ++i) { |
| 747 | if (e1->GetInstructionAt(i) != e2->GetInstructionAt(i) || |
| 748 | !e1->GetLocationAt(i).Equals(e2->GetLocationAt(i))) { |
| 749 | return false; |
| 750 | } |
| 751 | } |
| 752 | return true; |
| 753 | } |
| 754 | |
| 755 | HGraph* const graph_; |
| 756 | CodeGenerator* const codegen_; |
| 757 | |
| 758 | // Map from dex-pc to vector of already existing instruction/slow-path pairs. |
| 759 | ArenaSafeMap<uint32_t, ArenaVector<std::pair<InstructionType*, SlowPathCode*>>> slow_path_map_; |
| 760 | |
| 761 | DISALLOW_COPY_AND_ASSIGN(SlowPathGenerator); |
| 762 | }; |
| 763 | |
| 764 | class InstructionCodeGenerator : public HGraphVisitor { |
| 765 | public: |
| 766 | InstructionCodeGenerator(HGraph* graph, CodeGenerator* codegen) |
| 767 | : HGraphVisitor(graph), |
| 768 | deopt_slow_paths_(graph, codegen) {} |
| 769 | |
| 770 | protected: |
| 771 | // Add slow-path generator for each instruction/slow-path combination that desires sharing. |
| 772 | // TODO: under current regime, only deopt sharing make sense; extend later. |
| 773 | SlowPathGenerator<HDeoptimize> deopt_slow_paths_; |
| 774 | }; |
| 775 | |
Nicolas Geoffray | d4dd255 | 2014-02-28 10:23:58 +0000 | [diff] [blame] | 776 | } // namespace art |
| 777 | |
| 778 | #endif // ART_COMPILER_OPTIMIZING_CODE_GENERATOR_H_ |