blob: 28766d85ea8ec422ff5adec012d00d6e1821e1ca [file] [log] [blame]
/*
 * Copyright (C) 2014 The Android Open Source Project
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
16
17#ifndef ART_COMPILER_OPTIMIZING_CODE_GENERATOR_X86_H_
18#define ART_COMPILER_OPTIMIZING_CODE_GENERATOR_X86_H_
19
20#include "code_generator.h"
Calin Juravle52c48962014-12-16 17:02:57 +000021#include "dex/compiler_enums.h"
Calin Juravlecd6dffe2015-01-08 17:35:35 +000022#include "driver/compiler_options.h"
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +000023#include "nodes.h"
Nicolas Geoffray86dbb9a2014-06-04 11:12:39 +010024#include "parallel_move_resolver.h"
Nicolas Geoffray787c3072014-03-17 10:20:19 +000025#include "utils/x86/assembler_x86.h"
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +000026
27namespace art {
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +000028namespace x86 {
29
Nicolas Geoffray86a8d7a2014-11-19 08:47:18 +000030// Use a local definition to prevent copying mistakes.
31static constexpr size_t kX86WordSize = kX86PointerSize;
Nicolas Geoffray707c8092014-04-04 10:50:14 +010032
// Forward declarations. Both classes are defined further down in this header
// but are referred to (by pointer) by the classes declared before them.
class CodeGeneratorX86;
class SlowPathCodeX86;
Nicolas Geoffray01bc96d2014-04-11 17:43:50 +010035
Nicolas Geoffraya747a392014-04-17 14:56:23 +010036static constexpr Register kParameterCoreRegisters[] = { ECX, EDX, EBX };
37static constexpr RegisterPair kParameterCorePairRegisters[] = { ECX_EDX, EDX_EBX };
38static constexpr size_t kParameterCoreRegistersLength = arraysize(kParameterCoreRegisters);
Mark P Mendell966c3ae2015-01-27 15:45:27 +000039static constexpr XmmRegister kParameterFpuRegisters[] = { XMM0, XMM1, XMM2, XMM3 };
40static constexpr size_t kParameterFpuRegistersLength = arraysize(kParameterFpuRegisters);
Nicolas Geoffraya747a392014-04-17 14:56:23 +010041
Nicolas Geoffrayd75948a2015-03-27 09:53:16 +000042static constexpr Register kRuntimeParameterCoreRegisters[] = { EAX, ECX, EDX, EBX };
43static constexpr size_t kRuntimeParameterCoreRegistersLength =
44 arraysize(kRuntimeParameterCoreRegisters);
45static constexpr XmmRegister kRuntimeParameterFpuRegisters[] = { XMM0, XMM1, XMM2, XMM3 };
46static constexpr size_t kRuntimeParameterFpuRegistersLength =
47 arraysize(kRuntimeParameterFpuRegisters);
48
49class InvokeRuntimeCallingConvention : public CallingConvention<Register, XmmRegister> {
50 public:
51 InvokeRuntimeCallingConvention()
52 : CallingConvention(kRuntimeParameterCoreRegisters,
53 kRuntimeParameterCoreRegistersLength,
54 kRuntimeParameterFpuRegisters,
55 kRuntimeParameterFpuRegistersLength) {}
56
57 private:
58 DISALLOW_COPY_AND_ASSIGN(InvokeRuntimeCallingConvention);
59};
60
Nicolas Geoffray7fb49da2014-10-06 09:12:41 +010061class InvokeDexCallingConvention : public CallingConvention<Register, XmmRegister> {
Nicolas Geoffraya747a392014-04-17 14:56:23 +010062 public:
Nicolas Geoffray7fb49da2014-10-06 09:12:41 +010063 InvokeDexCallingConvention() : CallingConvention(
64 kParameterCoreRegisters,
65 kParameterCoreRegistersLength,
66 kParameterFpuRegisters,
67 kParameterFpuRegistersLength) {}
Nicolas Geoffraya747a392014-04-17 14:56:23 +010068
69 RegisterPair GetRegisterPairAt(size_t argument_index) {
70 DCHECK_LT(argument_index + 1, GetNumberOfRegisters());
71 return kParameterCorePairRegisters[argument_index];
72 }
73
74 private:
75 DISALLOW_COPY_AND_ASSIGN(InvokeDexCallingConvention);
76};
77
Roland Levillain2d27c8e2015-04-28 15:48:45 +010078class InvokeDexCallingConventionVisitorX86 : public InvokeDexCallingConventionVisitor {
Nicolas Geoffraya747a392014-04-17 14:56:23 +010079 public:
Roland Levillain2d27c8e2015-04-28 15:48:45 +010080 InvokeDexCallingConventionVisitorX86() {}
81 virtual ~InvokeDexCallingConventionVisitorX86() {}
Nicolas Geoffraya747a392014-04-17 14:56:23 +010082
Roland Levillain2d27c8e2015-04-28 15:48:45 +010083 Location GetNextLocation(Primitive::Type type) OVERRIDE;
Nicolas Geoffraya747a392014-04-17 14:56:23 +010084
85 private:
86 InvokeDexCallingConvention calling_convention;
Nicolas Geoffraya747a392014-04-17 14:56:23 +010087
Roland Levillain2d27c8e2015-04-28 15:48:45 +010088 DISALLOW_COPY_AND_ASSIGN(InvokeDexCallingConventionVisitorX86);
Nicolas Geoffraya747a392014-04-17 14:56:23 +010089};
90
Zheng Xuad4450e2015-04-17 18:48:56 +080091class ParallelMoveResolverX86 : public ParallelMoveResolverWithSwap {
Nicolas Geoffray86dbb9a2014-06-04 11:12:39 +010092 public:
93 ParallelMoveResolverX86(ArenaAllocator* allocator, CodeGeneratorX86* codegen)
Zheng Xuad4450e2015-04-17 18:48:56 +080094 : ParallelMoveResolverWithSwap(allocator), codegen_(codegen) {}
Nicolas Geoffray86dbb9a2014-06-04 11:12:39 +010095
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +000096 void EmitMove(size_t index) OVERRIDE;
97 void EmitSwap(size_t index) OVERRIDE;
98 void SpillScratch(int reg) OVERRIDE;
99 void RestoreScratch(int reg) OVERRIDE;
Nicolas Geoffray86dbb9a2014-06-04 11:12:39 +0100100
101 X86Assembler* GetAssembler() const;
102
103 private:
104 void Exchange(Register reg, int mem);
105 void Exchange(int mem1, int mem2);
Mark Mendell7c8d0092015-01-26 11:21:33 -0500106 void Exchange32(XmmRegister reg, int mem);
107 void MoveMemoryToMemory32(int dst, int src);
108 void MoveMemoryToMemory64(int dst, int src);
Nicolas Geoffray86dbb9a2014-06-04 11:12:39 +0100109
110 CodeGeneratorX86* const codegen_;
111
112 DISALLOW_COPY_AND_ASSIGN(ParallelMoveResolverX86);
113};
114
Nicolas Geoffraybab4ed72014-03-11 17:53:17 +0000115class LocationsBuilderX86 : public HGraphVisitor {
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000116 public:
Nicolas Geoffray01bc96d2014-04-11 17:43:50 +0100117 LocationsBuilderX86(HGraph* graph, CodeGeneratorX86* codegen)
118 : HGraphVisitor(graph), codegen_(codegen) {}
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000119
Nicolas Geoffray360231a2014-10-08 21:07:48 +0100120#define DECLARE_VISIT_INSTRUCTION(name, super) \
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000121 void Visit##name(H##name* instr) OVERRIDE;
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000122
Nicolas Geoffray96f89a22014-07-11 10:57:49 +0100123 FOR_EACH_CONCRETE_INSTRUCTION(DECLARE_VISIT_INSTRUCTION)
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000124
125#undef DECLARE_VISIT_INSTRUCTION
126
Nicolas Geoffray9574c4b2014-11-12 13:19:37 +0000127 private:
128 void HandleBitwiseOperation(HBinaryOperation* instruction);
Nicolas Geoffraye982f0b2014-08-13 02:11:24 +0100129 void HandleInvoke(HInvoke* invoke);
Calin Juravle9aec02f2014-11-18 23:06:35 +0000130 void HandleShift(HBinaryOperation* instruction);
Calin Juravle52c48962014-12-16 17:02:57 +0000131 void HandleFieldSet(HInstruction* instruction, const FieldInfo& field_info);
132 void HandleFieldGet(HInstruction* instruction, const FieldInfo& field_info);
Nicolas Geoffraye982f0b2014-08-13 02:11:24 +0100133
Nicolas Geoffray01bc96d2014-04-11 17:43:50 +0100134 CodeGeneratorX86* const codegen_;
Roland Levillain2d27c8e2015-04-28 15:48:45 +0100135 InvokeDexCallingConventionVisitorX86 parameter_visitor_;
Nicolas Geoffray01bc96d2014-04-11 17:43:50 +0100136
Nicolas Geoffraybab4ed72014-03-11 17:53:17 +0000137 DISALLOW_COPY_AND_ASSIGN(LocationsBuilderX86);
138};
139
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000140class InstructionCodeGeneratorX86 : public HGraphVisitor {
Nicolas Geoffraybab4ed72014-03-11 17:53:17 +0000141 public:
Nicolas Geoffray4a34a422014-04-03 10:38:37 +0100142 InstructionCodeGeneratorX86(HGraph* graph, CodeGeneratorX86* codegen);
Nicolas Geoffraybab4ed72014-03-11 17:53:17 +0000143
Nicolas Geoffray360231a2014-10-08 21:07:48 +0100144#define DECLARE_VISIT_INSTRUCTION(name, super) \
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000145 void Visit##name(H##name* instr) OVERRIDE;
Nicolas Geoffraybab4ed72014-03-11 17:53:17 +0000146
Nicolas Geoffray96f89a22014-07-11 10:57:49 +0100147 FOR_EACH_CONCRETE_INSTRUCTION(DECLARE_VISIT_INSTRUCTION)
Nicolas Geoffraybab4ed72014-03-11 17:53:17 +0000148
149#undef DECLARE_VISIT_INSTRUCTION
150
Nicolas Geoffray4a34a422014-04-03 10:38:37 +0100151 X86Assembler* GetAssembler() const { return assembler_; }
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000152
153 private:
Nicolas Geoffray3c049742014-09-24 18:10:46 +0100154 // Generate code for the given suspend check. If not null, `successor`
155 // is the block to branch to if the suspend check is not needed, and after
156 // the suspend call.
157 void GenerateSuspendCheck(HSuspendCheck* check, HBasicBlock* successor);
Nicolas Geoffray424f6762014-11-03 14:51:25 +0000158 void GenerateClassInitializationCheck(SlowPathCodeX86* slow_path, Register class_reg);
Nicolas Geoffray9574c4b2014-11-12 13:19:37 +0000159 void HandleBitwiseOperation(HBinaryOperation* instruction);
Calin Juravlebacfec32014-11-14 15:54:36 +0000160 void GenerateDivRemIntegral(HBinaryOperation* instruction);
Guillaume Sanchez0f88e872015-03-30 17:55:45 +0100161 void DivRemOneOrMinusOne(HBinaryOperation* instruction);
Guillaume Sanchezb19930c2015-04-09 21:12:15 +0100162 void DivByPowerOfTwo(HDiv* instruction);
Guillaume Sanchez0f88e872015-03-30 17:55:45 +0100163 void GenerateDivRemWithAnyConstant(HBinaryOperation* instruction);
Mark Mendell24f2dfa2015-01-14 19:51:45 -0500164 void GenerateRemFP(HRem *rem);
Calin Juravle9aec02f2014-11-18 23:06:35 +0000165 void HandleShift(HBinaryOperation* instruction);
166 void GenerateShlLong(const Location& loc, Register shifter);
167 void GenerateShrLong(const Location& loc, Register shifter);
168 void GenerateUShrLong(const Location& loc, Register shifter);
Mark P Mendell73945692015-04-29 14:56:17 +0000169 void GenerateShlLong(const Location& loc, int shift);
170 void GenerateShrLong(const Location& loc, int shift);
171 void GenerateUShrLong(const Location& loc, int shift);
Calin Juravle52c48962014-12-16 17:02:57 +0000172 void GenerateMemoryBarrier(MemBarrierKind kind);
Nicolas Geoffray07276db2015-05-18 14:22:09 +0100173 void HandleFieldSet(HInstruction* instruction,
174 const FieldInfo& field_info,
175 bool value_can_be_null);
Calin Juravle52c48962014-12-16 17:02:57 +0000176 void HandleFieldGet(HInstruction* instruction, const FieldInfo& field_info);
Roland Levillain232ade02015-04-20 15:14:36 +0100177 // Push value to FPU stack. `is_fp` specifies whether the value is floating point or not.
178 // `is_wide` specifies whether it is long/double or not.
Mark Mendell24f2dfa2015-01-14 19:51:45 -0500179 void PushOntoFPStack(Location source, uint32_t temp_offset,
Roland Levillain232ade02015-04-20 15:14:36 +0100180 uint32_t stack_adjustment, bool is_fp, bool is_wide);
Nicolas Geoffray3c049742014-09-24 18:10:46 +0100181
Calin Juravlecd6dffe2015-01-08 17:35:35 +0000182 void GenerateImplicitNullCheck(HNullCheck* instruction);
183 void GenerateExplicitNullCheck(HNullCheck* instruction);
Mingyao Yangd43b3ac2015-04-01 14:03:04 -0700184 void GenerateTestAndBranch(HInstruction* instruction,
185 Label* true_target,
186 Label* false_target,
187 Label* always_true_target);
Calin Juravlecd6dffe2015-01-08 17:35:35 +0000188
Nicolas Geoffray4a34a422014-04-03 10:38:37 +0100189 X86Assembler* const assembler_;
190 CodeGeneratorX86* const codegen_;
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000191
192 DISALLOW_COPY_AND_ASSIGN(InstructionCodeGeneratorX86);
193};
194
195class CodeGeneratorX86 : public CodeGenerator {
196 public:
Mark Mendellfb8d2792015-03-31 22:16:59 -0400197 CodeGeneratorX86(HGraph* graph,
198 const X86InstructionSetFeatures& isa_features,
199 const CompilerOptions& compiler_options);
Nicolas Geoffrayf12feb82014-07-17 18:32:41 +0100200 virtual ~CodeGeneratorX86() {}
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000201
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000202 void GenerateFrameEntry() OVERRIDE;
203 void GenerateFrameExit() OVERRIDE;
204 void Bind(HBasicBlock* block) OVERRIDE;
205 void Move(HInstruction* instruction, Location location, HInstruction* move_for) OVERRIDE;
206 size_t SaveCoreRegister(size_t stack_index, uint32_t reg_id) OVERRIDE;
207 size_t RestoreCoreRegister(size_t stack_index, uint32_t reg_id) OVERRIDE;
Mark Mendell7c8d0092015-01-26 11:21:33 -0500208 size_t SaveFloatingPointRegister(size_t stack_index, uint32_t reg_id) OVERRIDE;
209 size_t RestoreFloatingPointRegister(size_t stack_index, uint32_t reg_id) OVERRIDE;
Nicolas Geoffraybab4ed72014-03-11 17:53:17 +0000210
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000211 size_t GetWordSize() const OVERRIDE {
Nicolas Geoffray707c8092014-04-04 10:50:14 +0100212 return kX86WordSize;
213 }
214
Mark Mendellf85a9ca2015-01-13 09:20:58 -0500215 size_t GetFloatingPointSpillSlotSize() const OVERRIDE {
216 // 8 bytes == 2 words for each spill.
217 return 2 * kX86WordSize;
218 }
219
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000220 HGraphVisitor* GetLocationBuilder() OVERRIDE {
Nicolas Geoffraybab4ed72014-03-11 17:53:17 +0000221 return &location_builder_;
222 }
223
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000224 HGraphVisitor* GetInstructionVisitor() OVERRIDE {
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000225 return &instruction_visitor_;
226 }
227
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000228 X86Assembler* GetAssembler() OVERRIDE {
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000229 return &assembler_;
230 }
231
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000232 uintptr_t GetAddressOf(HBasicBlock* block) const OVERRIDE {
233 return GetLabelOf(block)->Position();
234 }
Calin Juravle34bacdf2014-10-07 20:23:36 +0100235
Nicolas Geoffray98893962015-01-21 12:32:32 +0000236 void SetupBlockedRegisters(bool is_baseline) const OVERRIDE;
Nicolas Geoffraya7aca372014-04-28 17:47:12 +0100237
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000238 Location AllocateFreeRegister(Primitive::Type type) const OVERRIDE;
Nicolas Geoffray4a34a422014-04-03 10:38:37 +0100239
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000240 Location GetStackLocation(HLoadLocal* load) const OVERRIDE;
241
242 void DumpCoreRegister(std::ostream& stream, int reg) const OVERRIDE;
243 void DumpFloatingPointRegister(std::ostream& stream, int reg) const OVERRIDE;
Nicolas Geoffraya7062e02014-05-22 12:50:17 +0100244
Calin Juravle34bacdf2014-10-07 20:23:36 +0100245 // Blocks all register pairs made out of blocked core registers.
246 void UpdateBlockedPairRegisters() const;
247
Nicolas Geoffrayf0e39372014-11-12 17:50:07 +0000248 ParallelMoveResolverX86* GetMoveResolver() OVERRIDE {
Nicolas Geoffray86dbb9a2014-06-04 11:12:39 +0100249 return &move_resolver_;
250 }
251
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000252 InstructionSet GetInstructionSet() const OVERRIDE {
Nicolas Geoffray412f10c2014-06-19 10:00:34 +0100253 return InstructionSet::kX86;
254 }
255
Nicolas Geoffray01bc96d2014-04-11 17:43:50 +0100256 // Helper method to move a 32bits value between two locations.
257 void Move32(Location destination, Location source);
258 // Helper method to move a 64bits value between two locations.
259 void Move64(Location destination, Location source);
260
Mark Mendell09ed1a32015-03-25 08:30:06 -0400261 // Generate a call to a static or direct method.
262 void GenerateStaticOrDirectCall(HInvokeStaticOrDirect* invoke, Register temp);
263
Nicolas Geoffray3c7bb982014-07-23 16:04:16 +0100264 // Emit a write barrier.
Nicolas Geoffray07276db2015-05-18 14:22:09 +0100265 void MarkGCCard(Register temp,
266 Register card,
267 Register object,
268 Register value,
269 bool value_can_be_null);
Nicolas Geoffray3c7bb982014-07-23 16:04:16 +0100270
Nicolas Geoffray19a19cf2014-10-22 16:07:05 +0100271 void LoadCurrentMethod(Register reg);
272
Nicolas Geoffray92a73ae2014-10-16 11:12:52 +0100273 Label* GetLabelOf(HBasicBlock* block) const {
Nicolas Geoffraydc23d832015-02-16 11:15:43 +0000274 return CommonGetLabelOf<Label>(block_labels_.GetRawStorage(), block);
Nicolas Geoffray92a73ae2014-10-16 11:12:52 +0100275 }
276
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000277 void Initialize() OVERRIDE {
Nicolas Geoffray92a73ae2014-10-16 11:12:52 +0100278 block_labels_.SetSize(GetGraph()->GetBlocks().Size());
279 }
280
Nicolas Geoffray840e5462015-01-07 16:01:24 +0000281 bool NeedsTwoRegisters(Primitive::Type type) const OVERRIDE {
282 return type == Primitive::kPrimLong;
283 }
284
Nicolas Geoffray234d69d2015-03-09 10:28:50 +0000285 bool ShouldSplitLongMoves() const OVERRIDE { return true; }
286
Nicolas Geoffray1cf95282014-12-12 19:22:03 +0000287 Label* GetFrameEntryLabel() { return &frame_entry_label_; }
288
Mark Mendellfb8d2792015-03-31 22:16:59 -0400289 const X86InstructionSetFeatures& GetInstructionSetFeatures() const {
290 return isa_features_;
291 }
292
Nicolas Geoffray3c7bb982014-07-23 16:04:16 +0100293 private:
Nicolas Geoffray92a73ae2014-10-16 11:12:52 +0100294 // Labels for each block that will be compiled.
295 GrowableArray<Label> block_labels_;
Nicolas Geoffray1cf95282014-12-12 19:22:03 +0000296 Label frame_entry_label_;
Nicolas Geoffraybab4ed72014-03-11 17:53:17 +0000297 LocationsBuilderX86 location_builder_;
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000298 InstructionCodeGeneratorX86 instruction_visitor_;
Nicolas Geoffray86dbb9a2014-06-04 11:12:39 +0100299 ParallelMoveResolverX86 move_resolver_;
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000300 X86Assembler assembler_;
Mark Mendellfb8d2792015-03-31 22:16:59 -0400301 const X86InstructionSetFeatures& isa_features_;
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000302
303 DISALLOW_COPY_AND_ASSIGN(CodeGeneratorX86);
304};
305
Mark Mendell09ed1a32015-03-25 08:30:06 -0400306class SlowPathCodeX86 : public SlowPathCode {
307 public:
308 SlowPathCodeX86() : entry_label_(), exit_label_() {}
309
310 Label* GetEntryLabel() { return &entry_label_; }
311 Label* GetExitLabel() { return &exit_label_; }
312
313 private:
314 Label entry_label_;
315 Label exit_label_;
316
317 DISALLOW_COPY_AND_ASSIGN(SlowPathCodeX86);
318};
319
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000320} // namespace x86
321} // namespace art
322
323#endif // ART_COMPILER_OPTIMIZING_CODE_GENERATOR_X86_H_