blob: e8912b39ab4d09196b3aaf70ae48ba4c243c8d03 [file] [log] [blame]
/*
 * Copyright (C) 2015 The Android Open Source Project
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
16
17#include "intrinsics_arm.h"
18
19#include "arch/arm/instruction_set_features_arm.h"
Mathieu Chartiere401d142015-04-22 13:56:20 -070020#include "art_method.h"
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -080021#include "code_generator_arm.h"
22#include "entrypoints/quick/quick_entrypoints.h"
23#include "intrinsics.h"
Andreas Gampe85b62f22015-09-09 13:15:38 -070024#include "intrinsics_utils.h"
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -080025#include "mirror/array-inl.h"
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -080026#include "mirror/string.h"
27#include "thread.h"
28#include "utils/arm/assembler_arm.h"
29
30namespace art {
31
32namespace arm {
33
34ArmAssembler* IntrinsicCodeGeneratorARM::GetAssembler() {
35 return codegen_->GetAssembler();
36}
37
38ArenaAllocator* IntrinsicCodeGeneratorARM::GetAllocator() {
39 return codegen_->GetGraph()->GetArena();
40}
41
Andreas Gampe85b62f22015-09-09 13:15:38 -070042using IntrinsicSlowPathARM = IntrinsicSlowPath<InvokeDexCallingConventionVisitorARM>;
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -080043
44bool IntrinsicLocationsBuilderARM::TryDispatch(HInvoke* invoke) {
45 Dispatch(invoke);
46 LocationSummary* res = invoke->GetLocations();
Roland Levillain3b359c72015-11-17 19:35:12 +000047 if (res == nullptr) {
48 return false;
49 }
50 if (kEmitCompilerReadBarrier && res->CanCall()) {
51 // Generating an intrinsic for this HInvoke may produce an
52 // IntrinsicSlowPathARM slow path. Currently this approach
53 // does not work when using read barriers, as the emitted
54 // calling sequence will make use of another slow path
55 // (ReadBarrierForRootSlowPathARM for HInvokeStaticOrDirect,
56 // ReadBarrierSlowPathARM for HInvokeVirtual). So we bail
57 // out in this case.
58 //
59 // TODO: Find a way to have intrinsics work with read barriers.
60 invoke->SetLocations(nullptr);
61 return false;
62 }
63 return res->Intrinsified();
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -080064}
65
// Shorthand used below: `__ insn(...)` expands to `assembler->insn(...)`, so a
// variable named `assembler` must be in scope wherever `__` is used.
#define __ assembler->
67
68static void CreateFPToIntLocations(ArenaAllocator* arena, HInvoke* invoke) {
69 LocationSummary* locations = new (arena) LocationSummary(invoke,
70 LocationSummary::kNoCall,
71 kIntrinsified);
72 locations->SetInAt(0, Location::RequiresFpuRegister());
73 locations->SetOut(Location::RequiresRegister());
74}
75
76static void CreateIntToFPLocations(ArenaAllocator* arena, HInvoke* invoke) {
77 LocationSummary* locations = new (arena) LocationSummary(invoke,
78 LocationSummary::kNoCall,
79 kIntrinsified);
80 locations->SetInAt(0, Location::RequiresRegister());
81 locations->SetOut(Location::RequiresFpuRegister());
82}
83
84static void MoveFPToInt(LocationSummary* locations, bool is64bit, ArmAssembler* assembler) {
85 Location input = locations->InAt(0);
86 Location output = locations->Out();
87 if (is64bit) {
88 __ vmovrrd(output.AsRegisterPairLow<Register>(),
89 output.AsRegisterPairHigh<Register>(),
90 FromLowSToD(input.AsFpuRegisterPairLow<SRegister>()));
91 } else {
92 __ vmovrs(output.AsRegister<Register>(), input.AsFpuRegister<SRegister>());
93 }
94}
95
96static void MoveIntToFP(LocationSummary* locations, bool is64bit, ArmAssembler* assembler) {
97 Location input = locations->InAt(0);
98 Location output = locations->Out();
99 if (is64bit) {
100 __ vmovdrr(FromLowSToD(output.AsFpuRegisterPairLow<SRegister>()),
101 input.AsRegisterPairLow<Register>(),
102 input.AsRegisterPairHigh<Register>());
103 } else {
104 __ vmovsr(output.AsFpuRegister<SRegister>(), input.AsRegister<Register>());
105 }
106}
107
108void IntrinsicLocationsBuilderARM::VisitDoubleDoubleToRawLongBits(HInvoke* invoke) {
109 CreateFPToIntLocations(arena_, invoke);
110}
111void IntrinsicLocationsBuilderARM::VisitDoubleLongBitsToDouble(HInvoke* invoke) {
112 CreateIntToFPLocations(arena_, invoke);
113}
114
115void IntrinsicCodeGeneratorARM::VisitDoubleDoubleToRawLongBits(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000116 MoveFPToInt(invoke->GetLocations(), /* is64bit */ true, GetAssembler());
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800117}
118void IntrinsicCodeGeneratorARM::VisitDoubleLongBitsToDouble(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000119 MoveIntToFP(invoke->GetLocations(), /* is64bit */ true, GetAssembler());
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800120}
121
122void IntrinsicLocationsBuilderARM::VisitFloatFloatToRawIntBits(HInvoke* invoke) {
123 CreateFPToIntLocations(arena_, invoke);
124}
125void IntrinsicLocationsBuilderARM::VisitFloatIntBitsToFloat(HInvoke* invoke) {
126 CreateIntToFPLocations(arena_, invoke);
127}
128
129void IntrinsicCodeGeneratorARM::VisitFloatFloatToRawIntBits(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000130 MoveFPToInt(invoke->GetLocations(), /* is64bit */ false, GetAssembler());
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800131}
132void IntrinsicCodeGeneratorARM::VisitFloatIntBitsToFloat(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000133 MoveIntToFP(invoke->GetLocations(), /* is64bit */ false, GetAssembler());
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800134}
135
136static void CreateIntToIntLocations(ArenaAllocator* arena, HInvoke* invoke) {
137 LocationSummary* locations = new (arena) LocationSummary(invoke,
138 LocationSummary::kNoCall,
139 kIntrinsified);
140 locations->SetInAt(0, Location::RequiresRegister());
141 locations->SetOut(Location::RequiresRegister(), Location::kNoOutputOverlap);
142}
143
144static void CreateFPToFPLocations(ArenaAllocator* arena, HInvoke* invoke) {
145 LocationSummary* locations = new (arena) LocationSummary(invoke,
146 LocationSummary::kNoCall,
147 kIntrinsified);
148 locations->SetInAt(0, Location::RequiresFpuRegister());
149 locations->SetOut(Location::RequiresFpuRegister(), Location::kNoOutputOverlap);
150}
151
Scott Wakeling611d3392015-07-10 11:42:06 +0100152static void GenNumberOfLeadingZeros(LocationSummary* locations,
153 Primitive::Type type,
154 ArmAssembler* assembler) {
155 Location in = locations->InAt(0);
156 Register out = locations->Out().AsRegister<Register>();
157
158 DCHECK((type == Primitive::kPrimInt) || (type == Primitive::kPrimLong));
159
160 if (type == Primitive::kPrimLong) {
161 Register in_reg_lo = in.AsRegisterPairLow<Register>();
162 Register in_reg_hi = in.AsRegisterPairHigh<Register>();
163 Label end;
164 __ clz(out, in_reg_hi);
165 __ CompareAndBranchIfNonZero(in_reg_hi, &end);
166 __ clz(out, in_reg_lo);
167 __ AddConstant(out, 32);
168 __ Bind(&end);
169 } else {
170 __ clz(out, in.AsRegister<Register>());
171 }
172}
173
174void IntrinsicLocationsBuilderARM::VisitIntegerNumberOfLeadingZeros(HInvoke* invoke) {
175 CreateIntToIntLocations(arena_, invoke);
176}
177
178void IntrinsicCodeGeneratorARM::VisitIntegerNumberOfLeadingZeros(HInvoke* invoke) {
179 GenNumberOfLeadingZeros(invoke->GetLocations(), Primitive::kPrimInt, GetAssembler());
180}
181
182void IntrinsicLocationsBuilderARM::VisitLongNumberOfLeadingZeros(HInvoke* invoke) {
183 LocationSummary* locations = new (arena_) LocationSummary(invoke,
184 LocationSummary::kNoCall,
185 kIntrinsified);
186 locations->SetInAt(0, Location::RequiresRegister());
187 locations->SetOut(Location::RequiresRegister(), Location::kOutputOverlap);
188}
189
190void IntrinsicCodeGeneratorARM::VisitLongNumberOfLeadingZeros(HInvoke* invoke) {
191 GenNumberOfLeadingZeros(invoke->GetLocations(), Primitive::kPrimLong, GetAssembler());
192}
193
Scott Wakeling9ee23f42015-07-23 10:44:35 +0100194static void GenNumberOfTrailingZeros(LocationSummary* locations,
195 Primitive::Type type,
196 ArmAssembler* assembler) {
197 DCHECK((type == Primitive::kPrimInt) || (type == Primitive::kPrimLong));
198
199 Register out = locations->Out().AsRegister<Register>();
200
201 if (type == Primitive::kPrimLong) {
202 Register in_reg_lo = locations->InAt(0).AsRegisterPairLow<Register>();
203 Register in_reg_hi = locations->InAt(0).AsRegisterPairHigh<Register>();
204 Label end;
205 __ rbit(out, in_reg_lo);
206 __ clz(out, out);
207 __ CompareAndBranchIfNonZero(in_reg_lo, &end);
208 __ rbit(out, in_reg_hi);
209 __ clz(out, out);
210 __ AddConstant(out, 32);
211 __ Bind(&end);
212 } else {
213 Register in = locations->InAt(0).AsRegister<Register>();
214 __ rbit(out, in);
215 __ clz(out, out);
216 }
217}
218
219void IntrinsicLocationsBuilderARM::VisitIntegerNumberOfTrailingZeros(HInvoke* invoke) {
220 LocationSummary* locations = new (arena_) LocationSummary(invoke,
221 LocationSummary::kNoCall,
222 kIntrinsified);
223 locations->SetInAt(0, Location::RequiresRegister());
224 locations->SetOut(Location::RequiresRegister(), Location::kNoOutputOverlap);
225}
226
227void IntrinsicCodeGeneratorARM::VisitIntegerNumberOfTrailingZeros(HInvoke* invoke) {
228 GenNumberOfTrailingZeros(invoke->GetLocations(), Primitive::kPrimInt, GetAssembler());
229}
230
231void IntrinsicLocationsBuilderARM::VisitLongNumberOfTrailingZeros(HInvoke* invoke) {
232 LocationSummary* locations = new (arena_) LocationSummary(invoke,
233 LocationSummary::kNoCall,
234 kIntrinsified);
235 locations->SetInAt(0, Location::RequiresRegister());
236 locations->SetOut(Location::RequiresRegister(), Location::kOutputOverlap);
237}
238
239void IntrinsicCodeGeneratorARM::VisitLongNumberOfTrailingZeros(HInvoke* invoke) {
240 GenNumberOfTrailingZeros(invoke->GetLocations(), Primitive::kPrimLong, GetAssembler());
241}
242
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800243static void MathAbsFP(LocationSummary* locations, bool is64bit, ArmAssembler* assembler) {
244 Location in = locations->InAt(0);
245 Location out = locations->Out();
246
247 if (is64bit) {
248 __ vabsd(FromLowSToD(out.AsFpuRegisterPairLow<SRegister>()),
249 FromLowSToD(in.AsFpuRegisterPairLow<SRegister>()));
250 } else {
251 __ vabss(out.AsFpuRegister<SRegister>(), in.AsFpuRegister<SRegister>());
252 }
253}
254
255void IntrinsicLocationsBuilderARM::VisitMathAbsDouble(HInvoke* invoke) {
256 CreateFPToFPLocations(arena_, invoke);
257}
258
259void IntrinsicCodeGeneratorARM::VisitMathAbsDouble(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000260 MathAbsFP(invoke->GetLocations(), /* is64bit */ true, GetAssembler());
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800261}
262
263void IntrinsicLocationsBuilderARM::VisitMathAbsFloat(HInvoke* invoke) {
264 CreateFPToFPLocations(arena_, invoke);
265}
266
267void IntrinsicCodeGeneratorARM::VisitMathAbsFloat(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000268 MathAbsFP(invoke->GetLocations(), /* is64bit */ false, GetAssembler());
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800269}
270
271static void CreateIntToIntPlusTemp(ArenaAllocator* arena, HInvoke* invoke) {
272 LocationSummary* locations = new (arena) LocationSummary(invoke,
273 LocationSummary::kNoCall,
274 kIntrinsified);
275 locations->SetInAt(0, Location::RequiresRegister());
276 locations->SetOut(Location::RequiresRegister(), Location::kNoOutputOverlap);
277
278 locations->AddTemp(Location::RequiresRegister());
279}
280
281static void GenAbsInteger(LocationSummary* locations,
282 bool is64bit,
283 ArmAssembler* assembler) {
284 Location in = locations->InAt(0);
285 Location output = locations->Out();
286
287 Register mask = locations->GetTemp(0).AsRegister<Register>();
288
289 if (is64bit) {
290 Register in_reg_lo = in.AsRegisterPairLow<Register>();
291 Register in_reg_hi = in.AsRegisterPairHigh<Register>();
292 Register out_reg_lo = output.AsRegisterPairLow<Register>();
293 Register out_reg_hi = output.AsRegisterPairHigh<Register>();
294
295 DCHECK_NE(out_reg_lo, in_reg_hi) << "Diagonal overlap unexpected.";
296
297 __ Asr(mask, in_reg_hi, 31);
298 __ adds(out_reg_lo, in_reg_lo, ShifterOperand(mask));
299 __ adc(out_reg_hi, in_reg_hi, ShifterOperand(mask));
300 __ eor(out_reg_lo, mask, ShifterOperand(out_reg_lo));
301 __ eor(out_reg_hi, mask, ShifterOperand(out_reg_hi));
302 } else {
303 Register in_reg = in.AsRegister<Register>();
304 Register out_reg = output.AsRegister<Register>();
305
306 __ Asr(mask, in_reg, 31);
307 __ add(out_reg, in_reg, ShifterOperand(mask));
308 __ eor(out_reg, mask, ShifterOperand(out_reg));
309 }
310}
311
312void IntrinsicLocationsBuilderARM::VisitMathAbsInt(HInvoke* invoke) {
313 CreateIntToIntPlusTemp(arena_, invoke);
314}
315
316void IntrinsicCodeGeneratorARM::VisitMathAbsInt(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000317 GenAbsInteger(invoke->GetLocations(), /* is64bit */ false, GetAssembler());
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800318}
319
320
321void IntrinsicLocationsBuilderARM::VisitMathAbsLong(HInvoke* invoke) {
322 CreateIntToIntPlusTemp(arena_, invoke);
323}
324
325void IntrinsicCodeGeneratorARM::VisitMathAbsLong(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000326 GenAbsInteger(invoke->GetLocations(), /* is64bit */ true, GetAssembler());
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800327}
328
329static void GenMinMax(LocationSummary* locations,
330 bool is_min,
331 ArmAssembler* assembler) {
332 Register op1 = locations->InAt(0).AsRegister<Register>();
333 Register op2 = locations->InAt(1).AsRegister<Register>();
334 Register out = locations->Out().AsRegister<Register>();
335
336 __ cmp(op1, ShifterOperand(op2));
337
338 __ it((is_min) ? Condition::LT : Condition::GT, kItElse);
339 __ mov(out, ShifterOperand(op1), is_min ? Condition::LT : Condition::GT);
340 __ mov(out, ShifterOperand(op2), is_min ? Condition::GE : Condition::LE);
341}
342
343static void CreateIntIntToIntLocations(ArenaAllocator* arena, HInvoke* invoke) {
344 LocationSummary* locations = new (arena) LocationSummary(invoke,
345 LocationSummary::kNoCall,
346 kIntrinsified);
347 locations->SetInAt(0, Location::RequiresRegister());
348 locations->SetInAt(1, Location::RequiresRegister());
349 locations->SetOut(Location::RequiresRegister(), Location::kNoOutputOverlap);
350}
351
352void IntrinsicLocationsBuilderARM::VisitMathMinIntInt(HInvoke* invoke) {
353 CreateIntIntToIntLocations(arena_, invoke);
354}
355
356void IntrinsicCodeGeneratorARM::VisitMathMinIntInt(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000357 GenMinMax(invoke->GetLocations(), /* is_min */ true, GetAssembler());
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800358}
359
360void IntrinsicLocationsBuilderARM::VisitMathMaxIntInt(HInvoke* invoke) {
361 CreateIntIntToIntLocations(arena_, invoke);
362}
363
364void IntrinsicCodeGeneratorARM::VisitMathMaxIntInt(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000365 GenMinMax(invoke->GetLocations(), /* is_min */ false, GetAssembler());
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800366}
367
368void IntrinsicLocationsBuilderARM::VisitMathSqrt(HInvoke* invoke) {
369 CreateFPToFPLocations(arena_, invoke);
370}
371
372void IntrinsicCodeGeneratorARM::VisitMathSqrt(HInvoke* invoke) {
373 LocationSummary* locations = invoke->GetLocations();
374 ArmAssembler* assembler = GetAssembler();
375 __ vsqrtd(FromLowSToD(locations->Out().AsFpuRegisterPairLow<SRegister>()),
376 FromLowSToD(locations->InAt(0).AsFpuRegisterPairLow<SRegister>()));
377}
378
379void IntrinsicLocationsBuilderARM::VisitMemoryPeekByte(HInvoke* invoke) {
380 CreateIntToIntLocations(arena_, invoke);
381}
382
383void IntrinsicCodeGeneratorARM::VisitMemoryPeekByte(HInvoke* invoke) {
384 ArmAssembler* assembler = GetAssembler();
385 // Ignore upper 4B of long address.
386 __ ldrsb(invoke->GetLocations()->Out().AsRegister<Register>(),
387 Address(invoke->GetLocations()->InAt(0).AsRegisterPairLow<Register>()));
388}
389
390void IntrinsicLocationsBuilderARM::VisitMemoryPeekIntNative(HInvoke* invoke) {
391 CreateIntToIntLocations(arena_, invoke);
392}
393
394void IntrinsicCodeGeneratorARM::VisitMemoryPeekIntNative(HInvoke* invoke) {
395 ArmAssembler* assembler = GetAssembler();
396 // Ignore upper 4B of long address.
397 __ ldr(invoke->GetLocations()->Out().AsRegister<Register>(),
398 Address(invoke->GetLocations()->InAt(0).AsRegisterPairLow<Register>()));
399}
400
401void IntrinsicLocationsBuilderARM::VisitMemoryPeekLongNative(HInvoke* invoke) {
402 CreateIntToIntLocations(arena_, invoke);
403}
404
405void IntrinsicCodeGeneratorARM::VisitMemoryPeekLongNative(HInvoke* invoke) {
406 ArmAssembler* assembler = GetAssembler();
407 // Ignore upper 4B of long address.
408 Register addr = invoke->GetLocations()->InAt(0).AsRegisterPairLow<Register>();
409 // Worst case: Control register bit SCTLR.A = 0. Then unaligned accesses throw a processor
410 // exception. So we can't use ldrd as addr may be unaligned.
411 Register lo = invoke->GetLocations()->Out().AsRegisterPairLow<Register>();
412 Register hi = invoke->GetLocations()->Out().AsRegisterPairHigh<Register>();
413 if (addr == lo) {
414 __ ldr(hi, Address(addr, 4));
415 __ ldr(lo, Address(addr, 0));
416 } else {
417 __ ldr(lo, Address(addr, 0));
418 __ ldr(hi, Address(addr, 4));
419 }
420}
421
422void IntrinsicLocationsBuilderARM::VisitMemoryPeekShortNative(HInvoke* invoke) {
423 CreateIntToIntLocations(arena_, invoke);
424}
425
426void IntrinsicCodeGeneratorARM::VisitMemoryPeekShortNative(HInvoke* invoke) {
427 ArmAssembler* assembler = GetAssembler();
428 // Ignore upper 4B of long address.
429 __ ldrsh(invoke->GetLocations()->Out().AsRegister<Register>(),
430 Address(invoke->GetLocations()->InAt(0).AsRegisterPairLow<Register>()));
431}
432
433static void CreateIntIntToVoidLocations(ArenaAllocator* arena, HInvoke* invoke) {
434 LocationSummary* locations = new (arena) LocationSummary(invoke,
435 LocationSummary::kNoCall,
436 kIntrinsified);
437 locations->SetInAt(0, Location::RequiresRegister());
438 locations->SetInAt(1, Location::RequiresRegister());
439}
440
441void IntrinsicLocationsBuilderARM::VisitMemoryPokeByte(HInvoke* invoke) {
442 CreateIntIntToVoidLocations(arena_, invoke);
443}
444
445void IntrinsicCodeGeneratorARM::VisitMemoryPokeByte(HInvoke* invoke) {
446 ArmAssembler* assembler = GetAssembler();
447 __ strb(invoke->GetLocations()->InAt(1).AsRegister<Register>(),
448 Address(invoke->GetLocations()->InAt(0).AsRegisterPairLow<Register>()));
449}
450
451void IntrinsicLocationsBuilderARM::VisitMemoryPokeIntNative(HInvoke* invoke) {
452 CreateIntIntToVoidLocations(arena_, invoke);
453}
454
455void IntrinsicCodeGeneratorARM::VisitMemoryPokeIntNative(HInvoke* invoke) {
456 ArmAssembler* assembler = GetAssembler();
457 __ str(invoke->GetLocations()->InAt(1).AsRegister<Register>(),
458 Address(invoke->GetLocations()->InAt(0).AsRegisterPairLow<Register>()));
459}
460
461void IntrinsicLocationsBuilderARM::VisitMemoryPokeLongNative(HInvoke* invoke) {
462 CreateIntIntToVoidLocations(arena_, invoke);
463}
464
465void IntrinsicCodeGeneratorARM::VisitMemoryPokeLongNative(HInvoke* invoke) {
466 ArmAssembler* assembler = GetAssembler();
467 // Ignore upper 4B of long address.
468 Register addr = invoke->GetLocations()->InAt(0).AsRegisterPairLow<Register>();
469 // Worst case: Control register bit SCTLR.A = 0. Then unaligned accesses throw a processor
470 // exception. So we can't use ldrd as addr may be unaligned.
471 __ str(invoke->GetLocations()->InAt(1).AsRegisterPairLow<Register>(), Address(addr, 0));
472 __ str(invoke->GetLocations()->InAt(1).AsRegisterPairHigh<Register>(), Address(addr, 4));
473}
474
475void IntrinsicLocationsBuilderARM::VisitMemoryPokeShortNative(HInvoke* invoke) {
476 CreateIntIntToVoidLocations(arena_, invoke);
477}
478
479void IntrinsicCodeGeneratorARM::VisitMemoryPokeShortNative(HInvoke* invoke) {
480 ArmAssembler* assembler = GetAssembler();
481 __ strh(invoke->GetLocations()->InAt(1).AsRegister<Register>(),
482 Address(invoke->GetLocations()->InAt(0).AsRegisterPairLow<Register>()));
483}
484
485void IntrinsicLocationsBuilderARM::VisitThreadCurrentThread(HInvoke* invoke) {
486 LocationSummary* locations = new (arena_) LocationSummary(invoke,
487 LocationSummary::kNoCall,
488 kIntrinsified);
489 locations->SetOut(Location::RequiresRegister());
490}
491
492void IntrinsicCodeGeneratorARM::VisitThreadCurrentThread(HInvoke* invoke) {
493 ArmAssembler* assembler = GetAssembler();
494 __ LoadFromOffset(kLoadWord,
495 invoke->GetLocations()->Out().AsRegister<Register>(),
496 TR,
497 Thread::PeerOffset<kArmPointerSize>().Int32Value());
498}
499
500static void GenUnsafeGet(HInvoke* invoke,
501 Primitive::Type type,
502 bool is_volatile,
503 CodeGeneratorARM* codegen) {
504 LocationSummary* locations = invoke->GetLocations();
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800505 ArmAssembler* assembler = codegen->GetAssembler();
Roland Levillain3b359c72015-11-17 19:35:12 +0000506 Location base_loc = locations->InAt(1);
507 Register base = base_loc.AsRegister<Register>(); // Object pointer.
508 Location offset_loc = locations->InAt(2);
509 Register offset = offset_loc.AsRegisterPairLow<Register>(); // Long offset, lo part only.
510 Location trg_loc = locations->Out();
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800511
Roland Levillainc9285912015-12-18 10:38:42 +0000512 switch (type) {
513 case Primitive::kPrimInt: {
514 Register trg = trg_loc.AsRegister<Register>();
515 __ ldr(trg, Address(base, offset));
516 if (is_volatile) {
517 __ dmb(ISH);
518 }
519 break;
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800520 }
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800521
Roland Levillainc9285912015-12-18 10:38:42 +0000522 case Primitive::kPrimNot: {
523 Register trg = trg_loc.AsRegister<Register>();
524 if (kEmitCompilerReadBarrier) {
525 if (kUseBakerReadBarrier) {
526 Location temp = locations->GetTemp(0);
527 codegen->GenerateArrayLoadWithBakerReadBarrier(
528 invoke, trg_loc, base, 0U, offset_loc, temp, /* needs_null_check */ false);
529 if (is_volatile) {
530 __ dmb(ISH);
531 }
532 } else {
533 __ ldr(trg, Address(base, offset));
534 if (is_volatile) {
535 __ dmb(ISH);
536 }
537 codegen->GenerateReadBarrierSlow(invoke, trg_loc, trg_loc, base_loc, 0U, offset_loc);
538 }
539 } else {
540 __ ldr(trg, Address(base, offset));
541 if (is_volatile) {
542 __ dmb(ISH);
543 }
544 __ MaybeUnpoisonHeapReference(trg);
545 }
546 break;
547 }
Roland Levillain4d027112015-07-01 15:41:14 +0100548
Roland Levillainc9285912015-12-18 10:38:42 +0000549 case Primitive::kPrimLong: {
550 Register trg_lo = trg_loc.AsRegisterPairLow<Register>();
551 __ add(IP, base, ShifterOperand(offset));
552 if (is_volatile && !codegen->GetInstructionSetFeatures().HasAtomicLdrdAndStrd()) {
553 Register trg_hi = trg_loc.AsRegisterPairHigh<Register>();
554 __ ldrexd(trg_lo, trg_hi, IP);
555 } else {
556 __ ldrd(trg_lo, Address(IP));
557 }
558 if (is_volatile) {
559 __ dmb(ISH);
560 }
561 break;
562 }
563
564 default:
565 LOG(FATAL) << "Unexpected type " << type;
566 UNREACHABLE();
Roland Levillain4d027112015-07-01 15:41:14 +0100567 }
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800568}
569
Roland Levillainc9285912015-12-18 10:38:42 +0000570static void CreateIntIntIntToIntLocations(ArenaAllocator* arena,
571 HInvoke* invoke,
572 Primitive::Type type) {
Roland Levillain3b359c72015-11-17 19:35:12 +0000573 bool can_call = kEmitCompilerReadBarrier &&
574 (invoke->GetIntrinsic() == Intrinsics::kUnsafeGetObject ||
575 invoke->GetIntrinsic() == Intrinsics::kUnsafeGetObjectVolatile);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800576 LocationSummary* locations = new (arena) LocationSummary(invoke,
Roland Levillain3b359c72015-11-17 19:35:12 +0000577 can_call ?
578 LocationSummary::kCallOnSlowPath :
579 LocationSummary::kNoCall,
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800580 kIntrinsified);
581 locations->SetInAt(0, Location::NoLocation()); // Unused receiver.
582 locations->SetInAt(1, Location::RequiresRegister());
583 locations->SetInAt(2, Location::RequiresRegister());
584 locations->SetOut(Location::RequiresRegister(), Location::kNoOutputOverlap);
Roland Levillainc9285912015-12-18 10:38:42 +0000585 if (type == Primitive::kPrimNot && kEmitCompilerReadBarrier && kUseBakerReadBarrier) {
586 // We need a temporary register for the read barrier marking slow
587 // path in InstructionCodeGeneratorARM::GenerateArrayLoadWithBakerReadBarrier.
588 locations->AddTemp(Location::RequiresRegister());
589 }
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800590}
591
592void IntrinsicLocationsBuilderARM::VisitUnsafeGet(HInvoke* invoke) {
Roland Levillainc9285912015-12-18 10:38:42 +0000593 CreateIntIntIntToIntLocations(arena_, invoke, Primitive::kPrimInt);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800594}
595void IntrinsicLocationsBuilderARM::VisitUnsafeGetVolatile(HInvoke* invoke) {
Roland Levillainc9285912015-12-18 10:38:42 +0000596 CreateIntIntIntToIntLocations(arena_, invoke, Primitive::kPrimInt);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800597}
598void IntrinsicLocationsBuilderARM::VisitUnsafeGetLong(HInvoke* invoke) {
Roland Levillainc9285912015-12-18 10:38:42 +0000599 CreateIntIntIntToIntLocations(arena_, invoke, Primitive::kPrimLong);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800600}
601void IntrinsicLocationsBuilderARM::VisitUnsafeGetLongVolatile(HInvoke* invoke) {
Roland Levillainc9285912015-12-18 10:38:42 +0000602 CreateIntIntIntToIntLocations(arena_, invoke, Primitive::kPrimLong);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800603}
604void IntrinsicLocationsBuilderARM::VisitUnsafeGetObject(HInvoke* invoke) {
Roland Levillainc9285912015-12-18 10:38:42 +0000605 CreateIntIntIntToIntLocations(arena_, invoke, Primitive::kPrimNot);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800606}
607void IntrinsicLocationsBuilderARM::VisitUnsafeGetObjectVolatile(HInvoke* invoke) {
Roland Levillainc9285912015-12-18 10:38:42 +0000608 CreateIntIntIntToIntLocations(arena_, invoke, Primitive::kPrimNot);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800609}
610
611void IntrinsicCodeGeneratorARM::VisitUnsafeGet(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000612 GenUnsafeGet(invoke, Primitive::kPrimInt, /* is_volatile */ false, codegen_);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800613}
614void IntrinsicCodeGeneratorARM::VisitUnsafeGetVolatile(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000615 GenUnsafeGet(invoke, Primitive::kPrimInt, /* is_volatile */ true, codegen_);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800616}
617void IntrinsicCodeGeneratorARM::VisitUnsafeGetLong(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000618 GenUnsafeGet(invoke, Primitive::kPrimLong, /* is_volatile */ false, codegen_);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800619}
620void IntrinsicCodeGeneratorARM::VisitUnsafeGetLongVolatile(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000621 GenUnsafeGet(invoke, Primitive::kPrimLong, /* is_volatile */ true, codegen_);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800622}
623void IntrinsicCodeGeneratorARM::VisitUnsafeGetObject(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000624 GenUnsafeGet(invoke, Primitive::kPrimNot, /* is_volatile */ false, codegen_);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800625}
626void IntrinsicCodeGeneratorARM::VisitUnsafeGetObjectVolatile(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000627 GenUnsafeGet(invoke, Primitive::kPrimNot, /* is_volatile */ true, codegen_);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800628}
629
630static void CreateIntIntIntIntToVoid(ArenaAllocator* arena,
631 const ArmInstructionSetFeatures& features,
632 Primitive::Type type,
633 bool is_volatile,
634 HInvoke* invoke) {
635 LocationSummary* locations = new (arena) LocationSummary(invoke,
636 LocationSummary::kNoCall,
637 kIntrinsified);
638 locations->SetInAt(0, Location::NoLocation()); // Unused receiver.
639 locations->SetInAt(1, Location::RequiresRegister());
640 locations->SetInAt(2, Location::RequiresRegister());
641 locations->SetInAt(3, Location::RequiresRegister());
642
643 if (type == Primitive::kPrimLong) {
644 // Potentially need temps for ldrexd-strexd loop.
645 if (is_volatile && !features.HasAtomicLdrdAndStrd()) {
646 locations->AddTemp(Location::RequiresRegister()); // Temp_lo.
647 locations->AddTemp(Location::RequiresRegister()); // Temp_hi.
648 }
649 } else if (type == Primitive::kPrimNot) {
650 // Temps for card-marking.
651 locations->AddTemp(Location::RequiresRegister()); // Temp.
652 locations->AddTemp(Location::RequiresRegister()); // Card.
653 }
654}
655
656void IntrinsicLocationsBuilderARM::VisitUnsafePut(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000657 CreateIntIntIntIntToVoid(arena_, features_, Primitive::kPrimInt, /* is_volatile */ false, invoke);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800658}
659void IntrinsicLocationsBuilderARM::VisitUnsafePutOrdered(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000660 CreateIntIntIntIntToVoid(arena_, features_, Primitive::kPrimInt, /* is_volatile */ false, invoke);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800661}
662void IntrinsicLocationsBuilderARM::VisitUnsafePutVolatile(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000663 CreateIntIntIntIntToVoid(arena_, features_, Primitive::kPrimInt, /* is_volatile */ true, invoke);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800664}
665void IntrinsicLocationsBuilderARM::VisitUnsafePutObject(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000666 CreateIntIntIntIntToVoid(arena_, features_, Primitive::kPrimNot, /* is_volatile */ false, invoke);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800667}
668void IntrinsicLocationsBuilderARM::VisitUnsafePutObjectOrdered(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000669 CreateIntIntIntIntToVoid(arena_, features_, Primitive::kPrimNot, /* is_volatile */ false, invoke);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800670}
671void IntrinsicLocationsBuilderARM::VisitUnsafePutObjectVolatile(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000672 CreateIntIntIntIntToVoid(arena_, features_, Primitive::kPrimNot, /* is_volatile */ true, invoke);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800673}
674void IntrinsicLocationsBuilderARM::VisitUnsafePutLong(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000675 CreateIntIntIntIntToVoid(
676 arena_, features_, Primitive::kPrimLong, /* is_volatile */ false, invoke);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800677}
678void IntrinsicLocationsBuilderARM::VisitUnsafePutLongOrdered(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000679 CreateIntIntIntIntToVoid(
680 arena_, features_, Primitive::kPrimLong, /* is_volatile */ false, invoke);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800681}
682void IntrinsicLocationsBuilderARM::VisitUnsafePutLongVolatile(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000683 CreateIntIntIntIntToVoid(
684 arena_, features_, Primitive::kPrimLong, /* is_volatile */ true, invoke);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800685}
686
687static void GenUnsafePut(LocationSummary* locations,
688 Primitive::Type type,
689 bool is_volatile,
690 bool is_ordered,
691 CodeGeneratorARM* codegen) {
692 ArmAssembler* assembler = codegen->GetAssembler();
693
694 Register base = locations->InAt(1).AsRegister<Register>(); // Object pointer.
695 Register offset = locations->InAt(2).AsRegisterPairLow<Register>(); // Long offset, lo part only.
696 Register value;
697
698 if (is_volatile || is_ordered) {
699 __ dmb(ISH);
700 }
701
702 if (type == Primitive::kPrimLong) {
703 Register value_lo = locations->InAt(3).AsRegisterPairLow<Register>();
704 value = value_lo;
705 if (is_volatile && !codegen->GetInstructionSetFeatures().HasAtomicLdrdAndStrd()) {
706 Register temp_lo = locations->GetTemp(0).AsRegister<Register>();
707 Register temp_hi = locations->GetTemp(1).AsRegister<Register>();
708 Register value_hi = locations->InAt(3).AsRegisterPairHigh<Register>();
709
710 __ add(IP, base, ShifterOperand(offset));
711 Label loop_head;
712 __ Bind(&loop_head);
713 __ ldrexd(temp_lo, temp_hi, IP);
714 __ strexd(temp_lo, value_lo, value_hi, IP);
715 __ cmp(temp_lo, ShifterOperand(0));
716 __ b(&loop_head, NE);
717 } else {
718 __ add(IP, base, ShifterOperand(offset));
719 __ strd(value_lo, Address(IP));
720 }
721 } else {
Roland Levillain4d027112015-07-01 15:41:14 +0100722 value = locations->InAt(3).AsRegister<Register>();
723 Register source = value;
724 if (kPoisonHeapReferences && type == Primitive::kPrimNot) {
725 Register temp = locations->GetTemp(0).AsRegister<Register>();
726 __ Mov(temp, value);
727 __ PoisonHeapReference(temp);
728 source = temp;
729 }
730 __ str(source, Address(base, offset));
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800731 }
732
733 if (is_volatile) {
734 __ dmb(ISH);
735 }
736
737 if (type == Primitive::kPrimNot) {
738 Register temp = locations->GetTemp(0).AsRegister<Register>();
739 Register card = locations->GetTemp(1).AsRegister<Register>();
Nicolas Geoffray07276db2015-05-18 14:22:09 +0100740 bool value_can_be_null = true; // TODO: Worth finding out this information?
741 codegen->MarkGCCard(temp, card, base, value, value_can_be_null);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800742 }
743}
744
745void IntrinsicCodeGeneratorARM::VisitUnsafePut(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000746 GenUnsafePut(invoke->GetLocations(),
747 Primitive::kPrimInt,
748 /* is_volatile */ false,
749 /* is_ordered */ false,
750 codegen_);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800751}
752void IntrinsicCodeGeneratorARM::VisitUnsafePutOrdered(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000753 GenUnsafePut(invoke->GetLocations(),
754 Primitive::kPrimInt,
755 /* is_volatile */ false,
756 /* is_ordered */ true,
757 codegen_);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800758}
759void IntrinsicCodeGeneratorARM::VisitUnsafePutVolatile(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000760 GenUnsafePut(invoke->GetLocations(),
761 Primitive::kPrimInt,
762 /* is_volatile */ true,
763 /* is_ordered */ false,
764 codegen_);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800765}
766void IntrinsicCodeGeneratorARM::VisitUnsafePutObject(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000767 GenUnsafePut(invoke->GetLocations(),
768 Primitive::kPrimNot,
769 /* is_volatile */ false,
770 /* is_ordered */ false,
771 codegen_);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800772}
773void IntrinsicCodeGeneratorARM::VisitUnsafePutObjectOrdered(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000774 GenUnsafePut(invoke->GetLocations(),
775 Primitive::kPrimNot,
776 /* is_volatile */ false,
777 /* is_ordered */ true,
778 codegen_);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800779}
780void IntrinsicCodeGeneratorARM::VisitUnsafePutObjectVolatile(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000781 GenUnsafePut(invoke->GetLocations(),
782 Primitive::kPrimNot,
783 /* is_volatile */ true,
784 /* is_ordered */ false,
785 codegen_);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800786}
787void IntrinsicCodeGeneratorARM::VisitUnsafePutLong(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000788 GenUnsafePut(invoke->GetLocations(),
789 Primitive::kPrimLong,
790 /* is_volatile */ false,
791 /* is_ordered */ false,
792 codegen_);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800793}
794void IntrinsicCodeGeneratorARM::VisitUnsafePutLongOrdered(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000795 GenUnsafePut(invoke->GetLocations(),
796 Primitive::kPrimLong,
797 /* is_volatile */ false,
798 /* is_ordered */ true,
799 codegen_);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800800}
801void IntrinsicCodeGeneratorARM::VisitUnsafePutLongVolatile(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000802 GenUnsafePut(invoke->GetLocations(),
803 Primitive::kPrimLong,
804 /* is_volatile */ true,
805 /* is_ordered */ false,
806 codegen_);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800807}
808
809static void CreateIntIntIntIntIntToIntPlusTemps(ArenaAllocator* arena,
Roland Levillain2e50ecb2016-01-27 14:08:33 +0000810 HInvoke* invoke,
811 Primitive::Type type) {
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800812 LocationSummary* locations = new (arena) LocationSummary(invoke,
813 LocationSummary::kNoCall,
814 kIntrinsified);
815 locations->SetInAt(0, Location::NoLocation()); // Unused receiver.
816 locations->SetInAt(1, Location::RequiresRegister());
817 locations->SetInAt(2, Location::RequiresRegister());
818 locations->SetInAt(3, Location::RequiresRegister());
819 locations->SetInAt(4, Location::RequiresRegister());
820
Roland Levillain2e50ecb2016-01-27 14:08:33 +0000821 // If heap poisoning is enabled, we don't want the unpoisoning
822 // operations to potentially clobber the output.
823 Location::OutputOverlap overlaps = (kPoisonHeapReferences && type == Primitive::kPrimNot)
824 ? Location::kOutputOverlap
825 : Location::kNoOutputOverlap;
826 locations->SetOut(Location::RequiresRegister(), overlaps);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800827
828 locations->AddTemp(Location::RequiresRegister()); // Pointer.
829 locations->AddTemp(Location::RequiresRegister()); // Temp 1.
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800830}
831
832static void GenCas(LocationSummary* locations, Primitive::Type type, CodeGeneratorARM* codegen) {
833 DCHECK_NE(type, Primitive::kPrimLong);
834
835 ArmAssembler* assembler = codegen->GetAssembler();
836
837 Register out = locations->Out().AsRegister<Register>(); // Boolean result.
838
839 Register base = locations->InAt(1).AsRegister<Register>(); // Object pointer.
840 Register offset = locations->InAt(2).AsRegisterPairLow<Register>(); // Offset (discard high 4B).
841 Register expected_lo = locations->InAt(3).AsRegister<Register>(); // Expected.
842 Register value_lo = locations->InAt(4).AsRegister<Register>(); // Value.
843
844 Register tmp_ptr = locations->GetTemp(0).AsRegister<Register>(); // Pointer to actual memory.
845 Register tmp_lo = locations->GetTemp(1).AsRegister<Register>(); // Value in memory.
846
847 if (type == Primitive::kPrimNot) {
848 // Mark card for object assuming new value is stored. Worst case we will mark an unchanged
849 // object and scan the receiver at the next GC for nothing.
Nicolas Geoffray07276db2015-05-18 14:22:09 +0100850 bool value_can_be_null = true; // TODO: Worth finding out this information?
851 codegen->MarkGCCard(tmp_ptr, tmp_lo, base, value_lo, value_can_be_null);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800852 }
853
854 // Prevent reordering with prior memory operations.
Roland Levillain4bedb382016-01-12 12:01:04 +0000855 // Emit a DMB ISH instruction instead of an DMB ISHST one, as the
856 // latter allows a preceding load to be delayed past the STXR
857 // instruction below.
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800858 __ dmb(ISH);
859
860 __ add(tmp_ptr, base, ShifterOperand(offset));
861
Roland Levillain4d027112015-07-01 15:41:14 +0100862 if (kPoisonHeapReferences && type == Primitive::kPrimNot) {
863 codegen->GetAssembler()->PoisonHeapReference(expected_lo);
Roland Levillain2e50ecb2016-01-27 14:08:33 +0000864 if (value_lo == expected_lo) {
865 // Do not poison `value_lo`, as it is the same register as
866 // `expected_lo`, which has just been poisoned.
867 } else {
868 codegen->GetAssembler()->PoisonHeapReference(value_lo);
869 }
Roland Levillain4d027112015-07-01 15:41:14 +0100870 }
871
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800872 // do {
873 // tmp = [r_ptr] - expected;
874 // } while (tmp == 0 && failure([r_ptr] <- r_new_value));
875 // result = tmp != 0;
876
877 Label loop_head;
878 __ Bind(&loop_head);
879
Roland Levillain391b8662015-12-18 11:43:38 +0000880 // TODO: When `type == Primitive::kPrimNot`, add a read barrier for
881 // the reference stored in the object before attempting the CAS,
882 // similar to the one in the art::Unsafe_compareAndSwapObject JNI
883 // implementation.
884 //
885 // Note that this code is not (yet) used when read barriers are
886 // enabled (see IntrinsicLocationsBuilderARM::VisitUnsafeCASObject).
887 DCHECK(!(type == Primitive::kPrimNot && kEmitCompilerReadBarrier));
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800888 __ ldrex(tmp_lo, tmp_ptr);
889
890 __ subs(tmp_lo, tmp_lo, ShifterOperand(expected_lo));
891
892 __ it(EQ, ItState::kItT);
893 __ strex(tmp_lo, value_lo, tmp_ptr, EQ);
894 __ cmp(tmp_lo, ShifterOperand(1), EQ);
895
896 __ b(&loop_head, EQ);
897
898 __ dmb(ISH);
899
900 __ rsbs(out, tmp_lo, ShifterOperand(1));
901 __ it(CC);
902 __ mov(out, ShifterOperand(0), CC);
Roland Levillain4d027112015-07-01 15:41:14 +0100903
904 if (kPoisonHeapReferences && type == Primitive::kPrimNot) {
Roland Levillain4d027112015-07-01 15:41:14 +0100905 codegen->GetAssembler()->UnpoisonHeapReference(expected_lo);
Roland Levillain2e50ecb2016-01-27 14:08:33 +0000906 if (value_lo == expected_lo) {
907 // Do not unpoison `value_lo`, as it is the same register as
908 // `expected_lo`, which has just been unpoisoned.
909 } else {
910 codegen->GetAssembler()->UnpoisonHeapReference(value_lo);
911 }
Roland Levillain4d027112015-07-01 15:41:14 +0100912 }
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800913}
914
Andreas Gampeca714582015-04-03 19:41:34 -0700915void IntrinsicLocationsBuilderARM::VisitUnsafeCASInt(HInvoke* invoke) {
Roland Levillain2e50ecb2016-01-27 14:08:33 +0000916 CreateIntIntIntIntIntToIntPlusTemps(arena_, invoke, Primitive::kPrimInt);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800917}
Andreas Gampeca714582015-04-03 19:41:34 -0700918void IntrinsicLocationsBuilderARM::VisitUnsafeCASObject(HInvoke* invoke) {
Roland Levillain391b8662015-12-18 11:43:38 +0000919 // The UnsafeCASObject intrinsic is missing a read barrier, and
920 // therefore sometimes does not work as expected (b/25883050).
921 // Turn it off temporarily as a quick fix, until the read barrier is
922 // implemented (see TODO in GenCAS below).
923 //
Roland Levillain2e50ecb2016-01-27 14:08:33 +0000924 // TODO(rpl): Fix this issue and re-enable this intrinsic with read barriers.
925 if (kEmitCompilerReadBarrier) {
Roland Levillain985ff702015-10-23 13:25:35 +0100926 return;
927 }
928
Roland Levillain2e50ecb2016-01-27 14:08:33 +0000929 CreateIntIntIntIntIntToIntPlusTemps(arena_, invoke, Primitive::kPrimNot);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800930}
931void IntrinsicCodeGeneratorARM::VisitUnsafeCASInt(HInvoke* invoke) {
932 GenCas(invoke->GetLocations(), Primitive::kPrimInt, codegen_);
933}
934void IntrinsicCodeGeneratorARM::VisitUnsafeCASObject(HInvoke* invoke) {
935 GenCas(invoke->GetLocations(), Primitive::kPrimNot, codegen_);
936}
937
938void IntrinsicLocationsBuilderARM::VisitStringCharAt(HInvoke* invoke) {
939 LocationSummary* locations = new (arena_) LocationSummary(invoke,
940 LocationSummary::kCallOnSlowPath,
941 kIntrinsified);
942 locations->SetInAt(0, Location::RequiresRegister());
943 locations->SetInAt(1, Location::RequiresRegister());
944 locations->SetOut(Location::RequiresRegister(), Location::kOutputOverlap);
945
946 locations->AddTemp(Location::RequiresRegister());
947 locations->AddTemp(Location::RequiresRegister());
948}
949
950void IntrinsicCodeGeneratorARM::VisitStringCharAt(HInvoke* invoke) {
951 ArmAssembler* assembler = GetAssembler();
952 LocationSummary* locations = invoke->GetLocations();
953
954 // Location of reference to data array
955 const MemberOffset value_offset = mirror::String::ValueOffset();
956 // Location of count
957 const MemberOffset count_offset = mirror::String::CountOffset();
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800958
959 Register obj = locations->InAt(0).AsRegister<Register>(); // String object pointer.
960 Register idx = locations->InAt(1).AsRegister<Register>(); // Index of character.
961 Register out = locations->Out().AsRegister<Register>(); // Result character.
962
963 Register temp = locations->GetTemp(0).AsRegister<Register>();
964 Register array_temp = locations->GetTemp(1).AsRegister<Register>();
965
966 // TODO: Maybe we can support range check elimination. Overall, though, I think it's not worth
967 // the cost.
968 // TODO: For simplicity, the index parameter is requested in a register, so different from Quick
969 // we will not optimize the code for constants (which would save a register).
970
Andreas Gampe85b62f22015-09-09 13:15:38 -0700971 SlowPathCode* slow_path = new (GetAllocator()) IntrinsicSlowPathARM(invoke);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800972 codegen_->AddSlowPath(slow_path);
973
974 __ ldr(temp, Address(obj, count_offset.Int32Value())); // temp = str.length.
975 codegen_->MaybeRecordImplicitNullCheck(invoke);
976 __ cmp(idx, ShifterOperand(temp));
977 __ b(slow_path->GetEntryLabel(), CS);
978
Jeff Hao848f70a2014-01-15 13:49:50 -0800979 __ add(array_temp, obj, ShifterOperand(value_offset.Int32Value())); // array_temp := str.value.
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800980
981 // Load the value.
Jeff Hao848f70a2014-01-15 13:49:50 -0800982 __ ldrh(out, Address(array_temp, idx, LSL, 1)); // out := array_temp[idx].
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800983
984 __ Bind(slow_path->GetExitLabel());
985}
986
Nicolas Geoffrayd75948a2015-03-27 09:53:16 +0000987void IntrinsicLocationsBuilderARM::VisitStringCompareTo(HInvoke* invoke) {
988 // The inputs plus one temp.
989 LocationSummary* locations = new (arena_) LocationSummary(invoke,
990 LocationSummary::kCall,
991 kIntrinsified);
992 InvokeRuntimeCallingConvention calling_convention;
993 locations->SetInAt(0, Location::RegisterLocation(calling_convention.GetRegisterAt(0)));
994 locations->SetInAt(1, Location::RegisterLocation(calling_convention.GetRegisterAt(1)));
995 locations->SetOut(Location::RegisterLocation(R0));
996}
997
998void IntrinsicCodeGeneratorARM::VisitStringCompareTo(HInvoke* invoke) {
999 ArmAssembler* assembler = GetAssembler();
1000 LocationSummary* locations = invoke->GetLocations();
1001
Nicolas Geoffray512e04d2015-03-27 17:21:24 +00001002 // Note that the null check must have been done earlier.
Calin Juravle641547a2015-04-21 22:08:51 +01001003 DCHECK(!invoke->CanDoImplicitNullCheckOn(invoke->InputAt(0)));
Nicolas Geoffrayd75948a2015-03-27 09:53:16 +00001004
1005 Register argument = locations->InAt(1).AsRegister<Register>();
1006 __ cmp(argument, ShifterOperand(0));
Andreas Gampe85b62f22015-09-09 13:15:38 -07001007 SlowPathCode* slow_path = new (GetAllocator()) IntrinsicSlowPathARM(invoke);
Nicolas Geoffrayd75948a2015-03-27 09:53:16 +00001008 codegen_->AddSlowPath(slow_path);
1009 __ b(slow_path->GetEntryLabel(), EQ);
1010
1011 __ LoadFromOffset(
1012 kLoadWord, LR, TR, QUICK_ENTRYPOINT_OFFSET(kArmWordSize, pStringCompareTo).Int32Value());
1013 __ blx(LR);
1014 __ Bind(slow_path->GetExitLabel());
1015}
1016
Agi Csaki289cd552015-08-18 17:10:38 -07001017void IntrinsicLocationsBuilderARM::VisitStringEquals(HInvoke* invoke) {
1018 LocationSummary* locations = new (arena_) LocationSummary(invoke,
1019 LocationSummary::kNoCall,
1020 kIntrinsified);
1021 InvokeRuntimeCallingConvention calling_convention;
1022 locations->SetInAt(0, Location::RequiresRegister());
1023 locations->SetInAt(1, Location::RequiresRegister());
1024 // Temporary registers to store lengths of strings and for calculations.
1025 // Using instruction cbz requires a low register, so explicitly set a temp to be R0.
1026 locations->AddTemp(Location::RegisterLocation(R0));
1027 locations->AddTemp(Location::RequiresRegister());
1028 locations->AddTemp(Location::RequiresRegister());
1029
1030 locations->SetOut(Location::RequiresRegister());
1031}
1032
1033void IntrinsicCodeGeneratorARM::VisitStringEquals(HInvoke* invoke) {
1034 ArmAssembler* assembler = GetAssembler();
1035 LocationSummary* locations = invoke->GetLocations();
1036
1037 Register str = locations->InAt(0).AsRegister<Register>();
1038 Register arg = locations->InAt(1).AsRegister<Register>();
1039 Register out = locations->Out().AsRegister<Register>();
1040
1041 Register temp = locations->GetTemp(0).AsRegister<Register>();
1042 Register temp1 = locations->GetTemp(1).AsRegister<Register>();
1043 Register temp2 = locations->GetTemp(2).AsRegister<Register>();
1044
1045 Label loop;
1046 Label end;
1047 Label return_true;
1048 Label return_false;
1049
1050 // Get offsets of count, value, and class fields within a string object.
1051 const uint32_t count_offset = mirror::String::CountOffset().Uint32Value();
1052 const uint32_t value_offset = mirror::String::ValueOffset().Uint32Value();
1053 const uint32_t class_offset = mirror::Object::ClassOffset().Uint32Value();
1054
1055 // Note that the null check must have been done earlier.
1056 DCHECK(!invoke->CanDoImplicitNullCheckOn(invoke->InputAt(0)));
1057
1058 // Check if input is null, return false if it is.
1059 __ CompareAndBranchIfZero(arg, &return_false);
1060
1061 // Instanceof check for the argument by comparing class fields.
1062 // All string objects must have the same type since String cannot be subclassed.
1063 // Receiver must be a string object, so its class field is equal to all strings' class fields.
1064 // If the argument is a string object, its class field must be equal to receiver's class field.
1065 __ ldr(temp, Address(str, class_offset));
1066 __ ldr(temp1, Address(arg, class_offset));
1067 __ cmp(temp, ShifterOperand(temp1));
1068 __ b(&return_false, NE);
1069
1070 // Load lengths of this and argument strings.
1071 __ ldr(temp, Address(str, count_offset));
1072 __ ldr(temp1, Address(arg, count_offset));
1073 // Check if lengths are equal, return false if they're not.
1074 __ cmp(temp, ShifterOperand(temp1));
1075 __ b(&return_false, NE);
1076 // Return true if both strings are empty.
1077 __ cbz(temp, &return_true);
1078
1079 // Reference equality check, return true if same reference.
1080 __ cmp(str, ShifterOperand(arg));
1081 __ b(&return_true, EQ);
1082
1083 // Assertions that must hold in order to compare strings 2 characters at a time.
1084 DCHECK_ALIGNED(value_offset, 4);
1085 static_assert(IsAligned<4>(kObjectAlignment), "String of odd length is not zero padded");
1086
Agi Csaki289cd552015-08-18 17:10:38 -07001087 __ LoadImmediate(temp1, value_offset);
Agi Csaki289cd552015-08-18 17:10:38 -07001088
1089 // Loop to compare strings 2 characters at a time starting at the front of the string.
1090 // Ok to do this because strings with an odd length are zero-padded.
1091 __ Bind(&loop);
1092 __ ldr(out, Address(str, temp1));
1093 __ ldr(temp2, Address(arg, temp1));
1094 __ cmp(out, ShifterOperand(temp2));
1095 __ b(&return_false, NE);
1096 __ add(temp1, temp1, ShifterOperand(sizeof(uint32_t)));
Vladimir Markoa63f0d42015-09-01 13:36:35 +01001097 __ subs(temp, temp, ShifterOperand(sizeof(uint32_t) / sizeof(uint16_t)));
1098 __ b(&loop, GT);
Agi Csaki289cd552015-08-18 17:10:38 -07001099
1100 // Return true and exit the function.
1101 // If loop does not result in returning false, we return true.
1102 __ Bind(&return_true);
1103 __ LoadImmediate(out, 1);
1104 __ b(&end);
1105
1106 // Return false and exit the function.
1107 __ Bind(&return_false);
1108 __ LoadImmediate(out, 0);
1109 __ Bind(&end);
1110}
1111
Andreas Gampeba6fdbc2015-05-07 22:31:55 -07001112static void GenerateVisitStringIndexOf(HInvoke* invoke,
1113 ArmAssembler* assembler,
1114 CodeGeneratorARM* codegen,
1115 ArenaAllocator* allocator,
1116 bool start_at_zero) {
1117 LocationSummary* locations = invoke->GetLocations();
1118 Register tmp_reg = locations->GetTemp(0).AsRegister<Register>();
1119
1120 // Note that the null check must have been done earlier.
1121 DCHECK(!invoke->CanDoImplicitNullCheckOn(invoke->InputAt(0)));
1122
1123 // Check for code points > 0xFFFF. Either a slow-path check when we don't know statically,
1124 // or directly dispatch if we have a constant.
Andreas Gampe85b62f22015-09-09 13:15:38 -07001125 SlowPathCode* slow_path = nullptr;
Andreas Gampeba6fdbc2015-05-07 22:31:55 -07001126 if (invoke->InputAt(1)->IsIntConstant()) {
1127 if (static_cast<uint32_t>(invoke->InputAt(1)->AsIntConstant()->GetValue()) >
1128 std::numeric_limits<uint16_t>::max()) {
1129 // Always needs the slow-path. We could directly dispatch to it, but this case should be
1130 // rare, so for simplicity just put the full slow-path down and branch unconditionally.
1131 slow_path = new (allocator) IntrinsicSlowPathARM(invoke);
1132 codegen->AddSlowPath(slow_path);
1133 __ b(slow_path->GetEntryLabel());
1134 __ Bind(slow_path->GetExitLabel());
1135 return;
1136 }
1137 } else {
1138 Register char_reg = locations->InAt(1).AsRegister<Register>();
1139 __ LoadImmediate(tmp_reg, std::numeric_limits<uint16_t>::max());
1140 __ cmp(char_reg, ShifterOperand(tmp_reg));
1141 slow_path = new (allocator) IntrinsicSlowPathARM(invoke);
1142 codegen->AddSlowPath(slow_path);
1143 __ b(slow_path->GetEntryLabel(), HI);
1144 }
1145
1146 if (start_at_zero) {
1147 DCHECK_EQ(tmp_reg, R2);
1148 // Start-index = 0.
1149 __ LoadImmediate(tmp_reg, 0);
1150 }
1151
1152 __ LoadFromOffset(kLoadWord, LR, TR,
1153 QUICK_ENTRYPOINT_OFFSET(kArmWordSize, pIndexOf).Int32Value());
1154 __ blx(LR);
1155
1156 if (slow_path != nullptr) {
1157 __ Bind(slow_path->GetExitLabel());
1158 }
1159}
1160
1161void IntrinsicLocationsBuilderARM::VisitStringIndexOf(HInvoke* invoke) {
1162 LocationSummary* locations = new (arena_) LocationSummary(invoke,
1163 LocationSummary::kCall,
1164 kIntrinsified);
1165 // We have a hand-crafted assembly stub that follows the runtime calling convention. So it's
1166 // best to align the inputs accordingly.
1167 InvokeRuntimeCallingConvention calling_convention;
1168 locations->SetInAt(0, Location::RegisterLocation(calling_convention.GetRegisterAt(0)));
1169 locations->SetInAt(1, Location::RegisterLocation(calling_convention.GetRegisterAt(1)));
1170 locations->SetOut(Location::RegisterLocation(R0));
1171
1172 // Need a temp for slow-path codepoint compare, and need to send start-index=0.
1173 locations->AddTemp(Location::RegisterLocation(calling_convention.GetRegisterAt(2)));
1174}
1175
1176void IntrinsicCodeGeneratorARM::VisitStringIndexOf(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +00001177 GenerateVisitStringIndexOf(
1178 invoke, GetAssembler(), codegen_, GetAllocator(), /* start_at_zero */ true);
Andreas Gampeba6fdbc2015-05-07 22:31:55 -07001179}
1180
1181void IntrinsicLocationsBuilderARM::VisitStringIndexOfAfter(HInvoke* invoke) {
1182 LocationSummary* locations = new (arena_) LocationSummary(invoke,
1183 LocationSummary::kCall,
1184 kIntrinsified);
1185 // We have a hand-crafted assembly stub that follows the runtime calling convention. So it's
1186 // best to align the inputs accordingly.
1187 InvokeRuntimeCallingConvention calling_convention;
1188 locations->SetInAt(0, Location::RegisterLocation(calling_convention.GetRegisterAt(0)));
1189 locations->SetInAt(1, Location::RegisterLocation(calling_convention.GetRegisterAt(1)));
1190 locations->SetInAt(2, Location::RegisterLocation(calling_convention.GetRegisterAt(2)));
1191 locations->SetOut(Location::RegisterLocation(R0));
1192
1193 // Need a temp for slow-path codepoint compare.
1194 locations->AddTemp(Location::RequiresRegister());
1195}
1196
1197void IntrinsicCodeGeneratorARM::VisitStringIndexOfAfter(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +00001198 GenerateVisitStringIndexOf(
1199 invoke, GetAssembler(), codegen_, GetAllocator(), /* start_at_zero */ false);
Andreas Gampeba6fdbc2015-05-07 22:31:55 -07001200}
1201
Jeff Hao848f70a2014-01-15 13:49:50 -08001202void IntrinsicLocationsBuilderARM::VisitStringNewStringFromBytes(HInvoke* invoke) {
1203 LocationSummary* locations = new (arena_) LocationSummary(invoke,
1204 LocationSummary::kCall,
1205 kIntrinsified);
1206 InvokeRuntimeCallingConvention calling_convention;
1207 locations->SetInAt(0, Location::RegisterLocation(calling_convention.GetRegisterAt(0)));
1208 locations->SetInAt(1, Location::RegisterLocation(calling_convention.GetRegisterAt(1)));
1209 locations->SetInAt(2, Location::RegisterLocation(calling_convention.GetRegisterAt(2)));
1210 locations->SetInAt(3, Location::RegisterLocation(calling_convention.GetRegisterAt(3)));
1211 locations->SetOut(Location::RegisterLocation(R0));
1212}
1213
1214void IntrinsicCodeGeneratorARM::VisitStringNewStringFromBytes(HInvoke* invoke) {
1215 ArmAssembler* assembler = GetAssembler();
1216 LocationSummary* locations = invoke->GetLocations();
1217
1218 Register byte_array = locations->InAt(0).AsRegister<Register>();
1219 __ cmp(byte_array, ShifterOperand(0));
Andreas Gampe85b62f22015-09-09 13:15:38 -07001220 SlowPathCode* slow_path = new (GetAllocator()) IntrinsicSlowPathARM(invoke);
Jeff Hao848f70a2014-01-15 13:49:50 -08001221 codegen_->AddSlowPath(slow_path);
1222 __ b(slow_path->GetEntryLabel(), EQ);
1223
1224 __ LoadFromOffset(
1225 kLoadWord, LR, TR, QUICK_ENTRYPOINT_OFFSET(kArmWordSize, pAllocStringFromBytes).Int32Value());
1226 codegen_->RecordPcInfo(invoke, invoke->GetDexPc());
1227 __ blx(LR);
1228 __ Bind(slow_path->GetExitLabel());
1229}
1230
1231void IntrinsicLocationsBuilderARM::VisitStringNewStringFromChars(HInvoke* invoke) {
1232 LocationSummary* locations = new (arena_) LocationSummary(invoke,
1233 LocationSummary::kCall,
1234 kIntrinsified);
1235 InvokeRuntimeCallingConvention calling_convention;
1236 locations->SetInAt(0, Location::RegisterLocation(calling_convention.GetRegisterAt(0)));
1237 locations->SetInAt(1, Location::RegisterLocation(calling_convention.GetRegisterAt(1)));
1238 locations->SetInAt(2, Location::RegisterLocation(calling_convention.GetRegisterAt(2)));
1239 locations->SetOut(Location::RegisterLocation(R0));
1240}
1241
1242void IntrinsicCodeGeneratorARM::VisitStringNewStringFromChars(HInvoke* invoke) {
1243 ArmAssembler* assembler = GetAssembler();
1244
1245 __ LoadFromOffset(
1246 kLoadWord, LR, TR, QUICK_ENTRYPOINT_OFFSET(kArmWordSize, pAllocStringFromChars).Int32Value());
1247 codegen_->RecordPcInfo(invoke, invoke->GetDexPc());
1248 __ blx(LR);
1249}
1250
1251void IntrinsicLocationsBuilderARM::VisitStringNewStringFromString(HInvoke* invoke) {
1252 LocationSummary* locations = new (arena_) LocationSummary(invoke,
1253 LocationSummary::kCall,
1254 kIntrinsified);
1255 InvokeRuntimeCallingConvention calling_convention;
1256 locations->SetInAt(0, Location::RegisterLocation(calling_convention.GetRegisterAt(0)));
1257 locations->SetOut(Location::RegisterLocation(R0));
1258}
1259
1260void IntrinsicCodeGeneratorARM::VisitStringNewStringFromString(HInvoke* invoke) {
1261 ArmAssembler* assembler = GetAssembler();
1262 LocationSummary* locations = invoke->GetLocations();
1263
1264 Register string_to_copy = locations->InAt(0).AsRegister<Register>();
1265 __ cmp(string_to_copy, ShifterOperand(0));
Andreas Gampe85b62f22015-09-09 13:15:38 -07001266 SlowPathCode* slow_path = new (GetAllocator()) IntrinsicSlowPathARM(invoke);
Jeff Hao848f70a2014-01-15 13:49:50 -08001267 codegen_->AddSlowPath(slow_path);
1268 __ b(slow_path->GetEntryLabel(), EQ);
1269
1270 __ LoadFromOffset(kLoadWord,
1271 LR, TR, QUICK_ENTRYPOINT_OFFSET(kArmWordSize, pAllocStringFromString).Int32Value());
1272 codegen_->RecordPcInfo(invoke, invoke->GetDexPc());
1273 __ blx(LR);
1274 __ Bind(slow_path->GetExitLabel());
1275}
1276
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001277void IntrinsicLocationsBuilderARM::VisitSystemArrayCopy(HInvoke* invoke) {
1278 CodeGenerator::CreateSystemArrayCopyLocationSummary(invoke);
1279 LocationSummary* locations = invoke->GetLocations();
1280 if (locations == nullptr) {
1281 return;
1282 }
1283
1284 HIntConstant* src_pos = invoke->InputAt(1)->AsIntConstant();
1285 HIntConstant* dest_pos = invoke->InputAt(3)->AsIntConstant();
1286 HIntConstant* length = invoke->InputAt(4)->AsIntConstant();
1287
1288 if (src_pos != nullptr && !assembler_->ShifterOperandCanAlwaysHold(src_pos->GetValue())) {
1289 locations->SetInAt(1, Location::RequiresRegister());
1290 }
1291 if (dest_pos != nullptr && !assembler_->ShifterOperandCanAlwaysHold(dest_pos->GetValue())) {
1292 locations->SetInAt(3, Location::RequiresRegister());
1293 }
1294 if (length != nullptr && !assembler_->ShifterOperandCanAlwaysHold(length->GetValue())) {
1295 locations->SetInAt(4, Location::RequiresRegister());
1296 }
1297}
1298
1299static void CheckPosition(ArmAssembler* assembler,
1300 Location pos,
1301 Register input,
1302 Location length,
1303 SlowPathCode* slow_path,
1304 Register input_len,
1305 Register temp,
1306 bool length_is_input_length = false) {
1307 // Where is the length in the Array?
1308 const uint32_t length_offset = mirror::Array::LengthOffset().Uint32Value();
1309
1310 if (pos.IsConstant()) {
1311 int32_t pos_const = pos.GetConstant()->AsIntConstant()->GetValue();
1312 if (pos_const == 0) {
1313 if (!length_is_input_length) {
1314 // Check that length(input) >= length.
1315 __ LoadFromOffset(kLoadWord, temp, input, length_offset);
1316 if (length.IsConstant()) {
1317 __ cmp(temp, ShifterOperand(length.GetConstant()->AsIntConstant()->GetValue()));
1318 } else {
1319 __ cmp(temp, ShifterOperand(length.AsRegister<Register>()));
1320 }
1321 __ b(slow_path->GetEntryLabel(), LT);
1322 }
1323 } else {
1324 // Check that length(input) >= pos.
1325 __ LoadFromOffset(kLoadWord, input_len, input, length_offset);
1326 __ subs(temp, input_len, ShifterOperand(pos_const));
1327 __ b(slow_path->GetEntryLabel(), LT);
1328
1329 // Check that (length(input) - pos) >= length.
1330 if (length.IsConstant()) {
1331 __ cmp(temp, ShifterOperand(length.GetConstant()->AsIntConstant()->GetValue()));
1332 } else {
1333 __ cmp(temp, ShifterOperand(length.AsRegister<Register>()));
1334 }
1335 __ b(slow_path->GetEntryLabel(), LT);
1336 }
1337 } else if (length_is_input_length) {
1338 // The only way the copy can succeed is if pos is zero.
1339 Register pos_reg = pos.AsRegister<Register>();
1340 __ CompareAndBranchIfNonZero(pos_reg, slow_path->GetEntryLabel());
1341 } else {
1342 // Check that pos >= 0.
1343 Register pos_reg = pos.AsRegister<Register>();
1344 __ cmp(pos_reg, ShifterOperand(0));
1345 __ b(slow_path->GetEntryLabel(), LT);
1346
1347 // Check that pos <= length(input).
1348 __ LoadFromOffset(kLoadWord, temp, input, length_offset);
1349 __ subs(temp, temp, ShifterOperand(pos_reg));
1350 __ b(slow_path->GetEntryLabel(), LT);
1351
1352 // Check that (length(input) - pos) >= length.
1353 if (length.IsConstant()) {
1354 __ cmp(temp, ShifterOperand(length.GetConstant()->AsIntConstant()->GetValue()));
1355 } else {
1356 __ cmp(temp, ShifterOperand(length.AsRegister<Register>()));
1357 }
1358 __ b(slow_path->GetEntryLabel(), LT);
1359 }
1360}
1361
Roland Levillain3b359c72015-11-17 19:35:12 +00001362// TODO: Implement read barriers in the SystemArrayCopy intrinsic.
1363// Note that this code path is not used (yet) because we do not
1364// intrinsify methods that can go into the IntrinsicSlowPathARM
1365// slow path.
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001366void IntrinsicCodeGeneratorARM::VisitSystemArrayCopy(HInvoke* invoke) {
1367 ArmAssembler* assembler = GetAssembler();
1368 LocationSummary* locations = invoke->GetLocations();
1369
1370 uint32_t class_offset = mirror::Object::ClassOffset().Int32Value();
1371 uint32_t super_offset = mirror::Class::SuperClassOffset().Int32Value();
1372 uint32_t component_offset = mirror::Class::ComponentTypeOffset().Int32Value();
1373 uint32_t primitive_offset = mirror::Class::PrimitiveTypeOffset().Int32Value();
1374
1375 Register src = locations->InAt(0).AsRegister<Register>();
1376 Location src_pos = locations->InAt(1);
1377 Register dest = locations->InAt(2).AsRegister<Register>();
1378 Location dest_pos = locations->InAt(3);
1379 Location length = locations->InAt(4);
1380 Register temp1 = locations->GetTemp(0).AsRegister<Register>();
1381 Register temp2 = locations->GetTemp(1).AsRegister<Register>();
1382 Register temp3 = locations->GetTemp(2).AsRegister<Register>();
1383
1384 SlowPathCode* slow_path = new (GetAllocator()) IntrinsicSlowPathARM(invoke);
1385 codegen_->AddSlowPath(slow_path);
1386
1387 Label ok;
1388 SystemArrayCopyOptimizations optimizations(invoke);
1389
1390 if (!optimizations.GetDestinationIsSource()) {
1391 if (!src_pos.IsConstant() || !dest_pos.IsConstant()) {
1392 __ cmp(src, ShifterOperand(dest));
1393 }
1394 }
1395
1396 // If source and destination are the same, we go to slow path if we need to do
1397 // forward copying.
1398 if (src_pos.IsConstant()) {
1399 int32_t src_pos_constant = src_pos.GetConstant()->AsIntConstant()->GetValue();
1400 if (dest_pos.IsConstant()) {
1401 // Checked when building locations.
1402 DCHECK(!optimizations.GetDestinationIsSource()
1403 || (src_pos_constant >= dest_pos.GetConstant()->AsIntConstant()->GetValue()));
1404 } else {
1405 if (!optimizations.GetDestinationIsSource()) {
1406 __ b(&ok, NE);
1407 }
1408 __ cmp(dest_pos.AsRegister<Register>(), ShifterOperand(src_pos_constant));
1409 __ b(slow_path->GetEntryLabel(), GT);
1410 }
1411 } else {
1412 if (!optimizations.GetDestinationIsSource()) {
1413 __ b(&ok, NE);
1414 }
1415 if (dest_pos.IsConstant()) {
1416 int32_t dest_pos_constant = dest_pos.GetConstant()->AsIntConstant()->GetValue();
1417 __ cmp(src_pos.AsRegister<Register>(), ShifterOperand(dest_pos_constant));
1418 } else {
1419 __ cmp(src_pos.AsRegister<Register>(), ShifterOperand(dest_pos.AsRegister<Register>()));
1420 }
1421 __ b(slow_path->GetEntryLabel(), LT);
1422 }
1423
1424 __ Bind(&ok);
1425
1426 if (!optimizations.GetSourceIsNotNull()) {
1427 // Bail out if the source is null.
1428 __ CompareAndBranchIfZero(src, slow_path->GetEntryLabel());
1429 }
1430
1431 if (!optimizations.GetDestinationIsNotNull() && !optimizations.GetDestinationIsSource()) {
1432 // Bail out if the destination is null.
1433 __ CompareAndBranchIfZero(dest, slow_path->GetEntryLabel());
1434 }
1435
1436 // If the length is negative, bail out.
1437 // We have already checked in the LocationsBuilder for the constant case.
1438 if (!length.IsConstant() &&
1439 !optimizations.GetCountIsSourceLength() &&
1440 !optimizations.GetCountIsDestinationLength()) {
1441 __ cmp(length.AsRegister<Register>(), ShifterOperand(0));
1442 __ b(slow_path->GetEntryLabel(), LT);
1443 }
1444
1445 // Validity checks: source.
1446 CheckPosition(assembler,
1447 src_pos,
1448 src,
1449 length,
1450 slow_path,
1451 temp1,
1452 temp2,
1453 optimizations.GetCountIsSourceLength());
1454
1455 // Validity checks: dest.
1456 CheckPosition(assembler,
1457 dest_pos,
1458 dest,
1459 length,
1460 slow_path,
1461 temp1,
1462 temp2,
1463 optimizations.GetCountIsDestinationLength());
1464
1465 if (!optimizations.GetDoesNotNeedTypeCheck()) {
1466 // Check whether all elements of the source array are assignable to the component
1467 // type of the destination array. We do two checks: the classes are the same,
1468 // or the destination is Object[]. If none of these checks succeed, we go to the
1469 // slow path.
1470 __ LoadFromOffset(kLoadWord, temp1, dest, class_offset);
1471 __ LoadFromOffset(kLoadWord, temp2, src, class_offset);
1472 bool did_unpoison = false;
1473 if (!optimizations.GetDestinationIsNonPrimitiveArray() ||
1474 !optimizations.GetSourceIsNonPrimitiveArray()) {
1475 // One or two of the references need to be unpoisoned. Unpoisoned them
1476 // both to make the identity check valid.
1477 __ MaybeUnpoisonHeapReference(temp1);
1478 __ MaybeUnpoisonHeapReference(temp2);
1479 did_unpoison = true;
1480 }
1481
1482 if (!optimizations.GetDestinationIsNonPrimitiveArray()) {
1483 // Bail out if the destination is not a non primitive array.
1484 __ LoadFromOffset(kLoadWord, temp3, temp1, component_offset);
1485 __ CompareAndBranchIfZero(temp3, slow_path->GetEntryLabel());
1486 __ MaybeUnpoisonHeapReference(temp3);
1487 __ LoadFromOffset(kLoadUnsignedHalfword, temp3, temp3, primitive_offset);
1488 static_assert(Primitive::kPrimNot == 0, "Expected 0 for kPrimNot");
1489 __ CompareAndBranchIfNonZero(temp3, slow_path->GetEntryLabel());
1490 }
1491
1492 if (!optimizations.GetSourceIsNonPrimitiveArray()) {
1493 // Bail out if the source is not a non primitive array.
1494 // Bail out if the destination is not a non primitive array.
1495 __ LoadFromOffset(kLoadWord, temp3, temp2, component_offset);
1496 __ CompareAndBranchIfZero(temp3, slow_path->GetEntryLabel());
1497 __ MaybeUnpoisonHeapReference(temp3);
1498 __ LoadFromOffset(kLoadUnsignedHalfword, temp3, temp3, primitive_offset);
1499 static_assert(Primitive::kPrimNot == 0, "Expected 0 for kPrimNot");
1500 __ CompareAndBranchIfNonZero(temp3, slow_path->GetEntryLabel());
1501 }
1502
1503 __ cmp(temp1, ShifterOperand(temp2));
1504
1505 if (optimizations.GetDestinationIsTypedObjectArray()) {
1506 Label do_copy;
1507 __ b(&do_copy, EQ);
1508 if (!did_unpoison) {
1509 __ MaybeUnpoisonHeapReference(temp1);
1510 }
1511 __ LoadFromOffset(kLoadWord, temp1, temp1, component_offset);
1512 __ MaybeUnpoisonHeapReference(temp1);
1513 __ LoadFromOffset(kLoadWord, temp1, temp1, super_offset);
1514 // No need to unpoison the result, we're comparing against null.
1515 __ CompareAndBranchIfNonZero(temp1, slow_path->GetEntryLabel());
1516 __ Bind(&do_copy);
1517 } else {
1518 __ b(slow_path->GetEntryLabel(), NE);
1519 }
1520 } else if (!optimizations.GetSourceIsNonPrimitiveArray()) {
1521 DCHECK(optimizations.GetDestinationIsNonPrimitiveArray());
1522 // Bail out if the source is not a non primitive array.
1523 __ LoadFromOffset(kLoadWord, temp1, src, class_offset);
1524 __ MaybeUnpoisonHeapReference(temp1);
1525 __ LoadFromOffset(kLoadWord, temp3, temp1, component_offset);
1526 __ CompareAndBranchIfZero(temp3, slow_path->GetEntryLabel());
1527 __ MaybeUnpoisonHeapReference(temp3);
1528 __ LoadFromOffset(kLoadUnsignedHalfword, temp3, temp3, primitive_offset);
1529 static_assert(Primitive::kPrimNot == 0, "Expected 0 for kPrimNot");
1530 __ CompareAndBranchIfNonZero(temp3, slow_path->GetEntryLabel());
1531 }
1532
1533 // Compute base source address, base destination address, and end source address.
1534
1535 uint32_t element_size = sizeof(int32_t);
1536 uint32_t offset = mirror::Array::DataOffset(element_size).Uint32Value();
1537 if (src_pos.IsConstant()) {
1538 int32_t constant = src_pos.GetConstant()->AsIntConstant()->GetValue();
1539 __ AddConstant(temp1, src, element_size * constant + offset);
1540 } else {
1541 __ add(temp1, src, ShifterOperand(src_pos.AsRegister<Register>(), LSL, 2));
1542 __ AddConstant(temp1, offset);
1543 }
1544
1545 if (dest_pos.IsConstant()) {
1546 int32_t constant = dest_pos.GetConstant()->AsIntConstant()->GetValue();
1547 __ AddConstant(temp2, dest, element_size * constant + offset);
1548 } else {
1549 __ add(temp2, dest, ShifterOperand(dest_pos.AsRegister<Register>(), LSL, 2));
1550 __ AddConstant(temp2, offset);
1551 }
1552
1553 if (length.IsConstant()) {
1554 int32_t constant = length.GetConstant()->AsIntConstant()->GetValue();
1555 __ AddConstant(temp3, temp1, element_size * constant);
1556 } else {
1557 __ add(temp3, temp1, ShifterOperand(length.AsRegister<Register>(), LSL, 2));
1558 }
1559
1560 // Iterate over the arrays and do a raw copy of the objects. We don't need to
1561 // poison/unpoison, nor do any read barrier as the next uses of the destination
1562 // array will do it.
1563 Label loop, done;
1564 __ cmp(temp1, ShifterOperand(temp3));
1565 __ b(&done, EQ);
1566 __ Bind(&loop);
1567 __ ldr(IP, Address(temp1, element_size, Address::PostIndex));
1568 __ str(IP, Address(temp2, element_size, Address::PostIndex));
1569 __ cmp(temp1, ShifterOperand(temp3));
1570 __ b(&loop, NE);
1571 __ Bind(&done);
1572
1573 // We only need one card marking on the destination array.
1574 codegen_->MarkGCCard(temp1,
1575 temp2,
1576 dest,
1577 Register(kNoRegister),
Roland Levillainbf84a3d2015-12-04 14:33:02 +00001578 /* can_be_null */ false);
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001579
1580 __ Bind(slow_path->GetExitLabel());
1581}
1582
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -08001583// Unimplemented intrinsics.
1584
1585#define UNIMPLEMENTED_INTRINSIC(Name) \
1586void IntrinsicLocationsBuilderARM::Visit ## Name(HInvoke* invoke ATTRIBUTE_UNUSED) { \
1587} \
1588void IntrinsicCodeGeneratorARM::Visit ## Name(HInvoke* invoke ATTRIBUTE_UNUSED) { \
1589}
1590
Aart Bik3f67e692016-01-15 14:35:12 -08001591UNIMPLEMENTED_INTRINSIC(IntegerBitCount)
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -08001592UNIMPLEMENTED_INTRINSIC(IntegerReverse)
1593UNIMPLEMENTED_INTRINSIC(IntegerReverseBytes)
Aart Bik3f67e692016-01-15 14:35:12 -08001594UNIMPLEMENTED_INTRINSIC(LongBitCount)
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -08001595UNIMPLEMENTED_INTRINSIC(LongReverse)
1596UNIMPLEMENTED_INTRINSIC(LongReverseBytes)
1597UNIMPLEMENTED_INTRINSIC(ShortReverseBytes)
1598UNIMPLEMENTED_INTRINSIC(MathMinDoubleDouble)
1599UNIMPLEMENTED_INTRINSIC(MathMinFloatFloat)
1600UNIMPLEMENTED_INTRINSIC(MathMaxDoubleDouble)
1601UNIMPLEMENTED_INTRINSIC(MathMaxFloatFloat)
1602UNIMPLEMENTED_INTRINSIC(MathMinLongLong)
1603UNIMPLEMENTED_INTRINSIC(MathMaxLongLong)
1604UNIMPLEMENTED_INTRINSIC(MathCeil) // Could be done by changing rounding mode, maybe?
1605UNIMPLEMENTED_INTRINSIC(MathFloor) // Could be done by changing rounding mode, maybe?
1606UNIMPLEMENTED_INTRINSIC(MathRint)
1607UNIMPLEMENTED_INTRINSIC(MathRoundDouble) // Could be done by changing rounding mode, maybe?
1608UNIMPLEMENTED_INTRINSIC(MathRoundFloat) // Could be done by changing rounding mode, maybe?
1609UNIMPLEMENTED_INTRINSIC(UnsafeCASLong) // High register pressure.
1610UNIMPLEMENTED_INTRINSIC(SystemArrayCopyChar)
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -08001611UNIMPLEMENTED_INTRINSIC(ReferenceGetReferent)
Jeff Hao848f70a2014-01-15 13:49:50 -08001612UNIMPLEMENTED_INTRINSIC(StringGetCharsNoCheck)
Mark Mendella4f12202015-08-06 15:23:34 -04001613UNIMPLEMENTED_INTRINSIC(MathCos)
1614UNIMPLEMENTED_INTRINSIC(MathSin)
1615UNIMPLEMENTED_INTRINSIC(MathAcos)
1616UNIMPLEMENTED_INTRINSIC(MathAsin)
1617UNIMPLEMENTED_INTRINSIC(MathAtan)
1618UNIMPLEMENTED_INTRINSIC(MathAtan2)
1619UNIMPLEMENTED_INTRINSIC(MathCbrt)
1620UNIMPLEMENTED_INTRINSIC(MathCosh)
1621UNIMPLEMENTED_INTRINSIC(MathExp)
1622UNIMPLEMENTED_INTRINSIC(MathExpm1)
1623UNIMPLEMENTED_INTRINSIC(MathHypot)
1624UNIMPLEMENTED_INTRINSIC(MathLog)
1625UNIMPLEMENTED_INTRINSIC(MathLog10)
1626UNIMPLEMENTED_INTRINSIC(MathNextAfter)
1627UNIMPLEMENTED_INTRINSIC(MathSinh)
1628UNIMPLEMENTED_INTRINSIC(MathTan)
1629UNIMPLEMENTED_INTRINSIC(MathTanh)
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -08001630
Aart Bik59c94542016-01-25 14:20:58 -08001631UNIMPLEMENTED_INTRINSIC(FloatIsInfinite)
1632UNIMPLEMENTED_INTRINSIC(DoubleIsInfinite)
1633UNIMPLEMENTED_INTRINSIC(FloatIsNaN)
1634UNIMPLEMENTED_INTRINSIC(DoubleIsNaN)
1635
1636UNIMPLEMENTED_INTRINSIC(IntegerCompare)
1637UNIMPLEMENTED_INTRINSIC(LongCompare)
1638UNIMPLEMENTED_INTRINSIC(IntegerHighestOneBit)
1639UNIMPLEMENTED_INTRINSIC(LongHighestOneBit)
1640UNIMPLEMENTED_INTRINSIC(IntegerLowestOneBit)
1641UNIMPLEMENTED_INTRINSIC(LongLowestOneBit)
1642UNIMPLEMENTED_INTRINSIC(IntegerSignum)
1643UNIMPLEMENTED_INTRINSIC(LongSignum)
1644
1645// Rotate operations are handled as HRor instructions.
1646UNIMPLEMENTED_INTRINSIC(IntegerRotateLeft)
1647UNIMPLEMENTED_INTRINSIC(IntegerRotateRight)
1648UNIMPLEMENTED_INTRINSIC(LongRotateLeft)
1649UNIMPLEMENTED_INTRINSIC(LongRotateRight)
1650
Roland Levillain4d027112015-07-01 15:41:14 +01001651#undef UNIMPLEMENTED_INTRINSIC
1652
1653#undef __
1654
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -08001655} // namespace arm
1656} // namespace art