blob: 96a6ecbee94e55657d513ca4daa9b9eb06cd1d66 [file] [log] [blame]
/*
 * Copyright (C) 2015 The Android Open Source Project
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
16
17#include "intrinsics_arm.h"
18
19#include "arch/arm/instruction_set_features_arm.h"
Mathieu Chartiere401d142015-04-22 13:56:20 -070020#include "art_method.h"
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -080021#include "code_generator_arm.h"
22#include "entrypoints/quick/quick_entrypoints.h"
23#include "intrinsics.h"
Andreas Gampe85b62f22015-09-09 13:15:38 -070024#include "intrinsics_utils.h"
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -080025#include "mirror/array-inl.h"
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -080026#include "mirror/string.h"
27#include "thread.h"
28#include "utils/arm/assembler_arm.h"
29
30namespace art {
31
32namespace arm {
33
34ArmAssembler* IntrinsicCodeGeneratorARM::GetAssembler() {
35 return codegen_->GetAssembler();
36}
37
38ArenaAllocator* IntrinsicCodeGeneratorARM::GetAllocator() {
39 return codegen_->GetGraph()->GetArena();
40}
41
Andreas Gampe85b62f22015-09-09 13:15:38 -070042using IntrinsicSlowPathARM = IntrinsicSlowPath<InvokeDexCallingConventionVisitorARM>;
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -080043
Roland Levillain0b671c02016-08-19 12:02:34 +010044// NOLINT on __ macro to suppress wrong warning/fix (misc-macro-parentheses) from clang-tidy.
45#define __ down_cast<ArmAssembler*>(codegen->GetAssembler())-> // NOLINT
46
47// Slow path implementing the SystemArrayCopy intrinsic copy loop with read barriers.
48class ReadBarrierSystemArrayCopySlowPathARM : public SlowPathCode {
49 public:
50 explicit ReadBarrierSystemArrayCopySlowPathARM(HInstruction* instruction)
51 : SlowPathCode(instruction) {
52 DCHECK(kEmitCompilerReadBarrier);
53 DCHECK(kUseBakerReadBarrier);
54 }
55
56 void EmitNativeCode(CodeGenerator* codegen) OVERRIDE {
57 CodeGeneratorARM* arm_codegen = down_cast<CodeGeneratorARM*>(codegen);
58 LocationSummary* locations = instruction_->GetLocations();
59 DCHECK(locations->CanCall());
60 DCHECK(instruction_->IsInvokeStaticOrDirect())
61 << "Unexpected instruction in read barrier arraycopy slow path: "
62 << instruction_->DebugName();
63 DCHECK(instruction_->GetLocations()->Intrinsified());
64 DCHECK_EQ(instruction_->AsInvoke()->GetIntrinsic(), Intrinsics::kSystemArrayCopy);
65
66 int32_t element_size = Primitive::ComponentSize(Primitive::kPrimNot);
67 uint32_t element_size_shift = Primitive::ComponentSizeShift(Primitive::kPrimNot);
68 uint32_t offset = mirror::Array::DataOffset(element_size).Uint32Value();
69
70 Register dest = locations->InAt(2).AsRegister<Register>();
71 Location dest_pos = locations->InAt(3);
72 Register src_curr_addr = locations->GetTemp(0).AsRegister<Register>();
73 Register dst_curr_addr = locations->GetTemp(1).AsRegister<Register>();
74 Register src_stop_addr = locations->GetTemp(2).AsRegister<Register>();
75 Register tmp = locations->GetTemp(3).AsRegister<Register>();
76
77 __ Bind(GetEntryLabel());
78 // Compute the base destination address in `dst_curr_addr`.
79 if (dest_pos.IsConstant()) {
80 int32_t constant = dest_pos.GetConstant()->AsIntConstant()->GetValue();
81 __ AddConstant(dst_curr_addr, dest, element_size * constant + offset);
82 } else {
83 __ add(dst_curr_addr,
84 dest,
85 ShifterOperand(dest_pos.AsRegister<Register>(), LSL, element_size_shift));
86 __ AddConstant(dst_curr_addr, offset);
87 }
88
89 Label loop;
90 __ Bind(&loop);
91 __ ldr(tmp, Address(src_curr_addr, element_size, Address::PostIndex));
92 __ MaybeUnpoisonHeapReference(tmp);
93 // TODO: Inline the mark bit check before calling the runtime?
94 // tmp = ReadBarrier::Mark(tmp);
95 // No need to save live registers; it's taken care of by the
96 // entrypoint. Also, there is no need to update the stack mask,
97 // as this runtime call will not trigger a garbage collection.
98 // (See ReadBarrierMarkSlowPathARM::EmitNativeCode for more
99 // explanations.)
100 DCHECK_NE(tmp, SP);
101 DCHECK_NE(tmp, LR);
102 DCHECK_NE(tmp, PC);
103 // IP is used internally by the ReadBarrierMarkRegX entry point
104 // as a temporary (and not preserved). It thus cannot be used by
105 // any live register in this slow path.
106 DCHECK_NE(src_curr_addr, IP);
107 DCHECK_NE(dst_curr_addr, IP);
108 DCHECK_NE(src_stop_addr, IP);
109 DCHECK_NE(tmp, IP);
110 DCHECK(0 <= tmp && tmp < kNumberOfCoreRegisters) << tmp;
111 int32_t entry_point_offset =
112 CodeGenerator::GetReadBarrierMarkEntryPointsOffset<kArmPointerSize>(tmp);
113 // This runtime call does not require a stack map.
114 arm_codegen->InvokeRuntimeWithoutRecordingPcInfo(entry_point_offset, instruction_, this);
115 __ MaybePoisonHeapReference(tmp);
116 __ str(tmp, Address(dst_curr_addr, element_size, Address::PostIndex));
117 __ cmp(src_curr_addr, ShifterOperand(src_stop_addr));
118 __ b(&loop, NE);
119 __ b(GetExitLabel());
120 }
121
122 const char* GetDescription() const OVERRIDE { return "ReadBarrierSystemArrayCopySlowPathARM"; }
123
124 private:
125 DISALLOW_COPY_AND_ASSIGN(ReadBarrierSystemArrayCopySlowPathARM);
126};
127
128#undef __
129
Vladimir Marko68c981f2016-08-26 13:13:33 +0100130IntrinsicLocationsBuilderARM::IntrinsicLocationsBuilderARM(CodeGeneratorARM* codegen)
131 : arena_(codegen->GetGraph()->GetArena()),
132 assembler_(codegen->GetAssembler()),
133 features_(codegen->GetInstructionSetFeatures()) {}
134
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800135bool IntrinsicLocationsBuilderARM::TryDispatch(HInvoke* invoke) {
136 Dispatch(invoke);
137 LocationSummary* res = invoke->GetLocations();
Roland Levillain3b359c72015-11-17 19:35:12 +0000138 if (res == nullptr) {
139 return false;
140 }
Roland Levillain3b359c72015-11-17 19:35:12 +0000141 return res->Intrinsified();
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800142}
143
144#define __ assembler->
145
146static void CreateFPToIntLocations(ArenaAllocator* arena, HInvoke* invoke) {
147 LocationSummary* locations = new (arena) LocationSummary(invoke,
148 LocationSummary::kNoCall,
149 kIntrinsified);
150 locations->SetInAt(0, Location::RequiresFpuRegister());
151 locations->SetOut(Location::RequiresRegister());
152}
153
154static void CreateIntToFPLocations(ArenaAllocator* arena, HInvoke* invoke) {
155 LocationSummary* locations = new (arena) LocationSummary(invoke,
156 LocationSummary::kNoCall,
157 kIntrinsified);
158 locations->SetInAt(0, Location::RequiresRegister());
159 locations->SetOut(Location::RequiresFpuRegister());
160}
161
162static void MoveFPToInt(LocationSummary* locations, bool is64bit, ArmAssembler* assembler) {
163 Location input = locations->InAt(0);
164 Location output = locations->Out();
165 if (is64bit) {
166 __ vmovrrd(output.AsRegisterPairLow<Register>(),
167 output.AsRegisterPairHigh<Register>(),
168 FromLowSToD(input.AsFpuRegisterPairLow<SRegister>()));
169 } else {
170 __ vmovrs(output.AsRegister<Register>(), input.AsFpuRegister<SRegister>());
171 }
172}
173
174static void MoveIntToFP(LocationSummary* locations, bool is64bit, ArmAssembler* assembler) {
175 Location input = locations->InAt(0);
176 Location output = locations->Out();
177 if (is64bit) {
178 __ vmovdrr(FromLowSToD(output.AsFpuRegisterPairLow<SRegister>()),
179 input.AsRegisterPairLow<Register>(),
180 input.AsRegisterPairHigh<Register>());
181 } else {
182 __ vmovsr(output.AsFpuRegister<SRegister>(), input.AsRegister<Register>());
183 }
184}
185
186void IntrinsicLocationsBuilderARM::VisitDoubleDoubleToRawLongBits(HInvoke* invoke) {
187 CreateFPToIntLocations(arena_, invoke);
188}
189void IntrinsicLocationsBuilderARM::VisitDoubleLongBitsToDouble(HInvoke* invoke) {
190 CreateIntToFPLocations(arena_, invoke);
191}
192
193void IntrinsicCodeGeneratorARM::VisitDoubleDoubleToRawLongBits(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000194 MoveFPToInt(invoke->GetLocations(), /* is64bit */ true, GetAssembler());
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800195}
196void IntrinsicCodeGeneratorARM::VisitDoubleLongBitsToDouble(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000197 MoveIntToFP(invoke->GetLocations(), /* is64bit */ true, GetAssembler());
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800198}
199
200void IntrinsicLocationsBuilderARM::VisitFloatFloatToRawIntBits(HInvoke* invoke) {
201 CreateFPToIntLocations(arena_, invoke);
202}
203void IntrinsicLocationsBuilderARM::VisitFloatIntBitsToFloat(HInvoke* invoke) {
204 CreateIntToFPLocations(arena_, invoke);
205}
206
207void IntrinsicCodeGeneratorARM::VisitFloatFloatToRawIntBits(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000208 MoveFPToInt(invoke->GetLocations(), /* is64bit */ false, GetAssembler());
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800209}
210void IntrinsicCodeGeneratorARM::VisitFloatIntBitsToFloat(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000211 MoveIntToFP(invoke->GetLocations(), /* is64bit */ false, GetAssembler());
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800212}
213
214static void CreateIntToIntLocations(ArenaAllocator* arena, HInvoke* invoke) {
215 LocationSummary* locations = new (arena) LocationSummary(invoke,
216 LocationSummary::kNoCall,
217 kIntrinsified);
218 locations->SetInAt(0, Location::RequiresRegister());
219 locations->SetOut(Location::RequiresRegister(), Location::kNoOutputOverlap);
220}
221
222static void CreateFPToFPLocations(ArenaAllocator* arena, HInvoke* invoke) {
223 LocationSummary* locations = new (arena) LocationSummary(invoke,
224 LocationSummary::kNoCall,
225 kIntrinsified);
226 locations->SetInAt(0, Location::RequiresFpuRegister());
227 locations->SetOut(Location::RequiresFpuRegister(), Location::kNoOutputOverlap);
228}
229
Scott Wakeling611d3392015-07-10 11:42:06 +0100230static void GenNumberOfLeadingZeros(LocationSummary* locations,
231 Primitive::Type type,
232 ArmAssembler* assembler) {
233 Location in = locations->InAt(0);
234 Register out = locations->Out().AsRegister<Register>();
235
236 DCHECK((type == Primitive::kPrimInt) || (type == Primitive::kPrimLong));
237
238 if (type == Primitive::kPrimLong) {
239 Register in_reg_lo = in.AsRegisterPairLow<Register>();
240 Register in_reg_hi = in.AsRegisterPairHigh<Register>();
241 Label end;
242 __ clz(out, in_reg_hi);
243 __ CompareAndBranchIfNonZero(in_reg_hi, &end);
244 __ clz(out, in_reg_lo);
245 __ AddConstant(out, 32);
246 __ Bind(&end);
247 } else {
248 __ clz(out, in.AsRegister<Register>());
249 }
250}
251
252void IntrinsicLocationsBuilderARM::VisitIntegerNumberOfLeadingZeros(HInvoke* invoke) {
253 CreateIntToIntLocations(arena_, invoke);
254}
255
256void IntrinsicCodeGeneratorARM::VisitIntegerNumberOfLeadingZeros(HInvoke* invoke) {
257 GenNumberOfLeadingZeros(invoke->GetLocations(), Primitive::kPrimInt, GetAssembler());
258}
259
260void IntrinsicLocationsBuilderARM::VisitLongNumberOfLeadingZeros(HInvoke* invoke) {
261 LocationSummary* locations = new (arena_) LocationSummary(invoke,
262 LocationSummary::kNoCall,
263 kIntrinsified);
264 locations->SetInAt(0, Location::RequiresRegister());
265 locations->SetOut(Location::RequiresRegister(), Location::kOutputOverlap);
266}
267
268void IntrinsicCodeGeneratorARM::VisitLongNumberOfLeadingZeros(HInvoke* invoke) {
269 GenNumberOfLeadingZeros(invoke->GetLocations(), Primitive::kPrimLong, GetAssembler());
270}
271
Scott Wakeling9ee23f42015-07-23 10:44:35 +0100272static void GenNumberOfTrailingZeros(LocationSummary* locations,
273 Primitive::Type type,
274 ArmAssembler* assembler) {
275 DCHECK((type == Primitive::kPrimInt) || (type == Primitive::kPrimLong));
276
277 Register out = locations->Out().AsRegister<Register>();
278
279 if (type == Primitive::kPrimLong) {
280 Register in_reg_lo = locations->InAt(0).AsRegisterPairLow<Register>();
281 Register in_reg_hi = locations->InAt(0).AsRegisterPairHigh<Register>();
282 Label end;
283 __ rbit(out, in_reg_lo);
284 __ clz(out, out);
285 __ CompareAndBranchIfNonZero(in_reg_lo, &end);
286 __ rbit(out, in_reg_hi);
287 __ clz(out, out);
288 __ AddConstant(out, 32);
289 __ Bind(&end);
290 } else {
291 Register in = locations->InAt(0).AsRegister<Register>();
292 __ rbit(out, in);
293 __ clz(out, out);
294 }
295}
296
297void IntrinsicLocationsBuilderARM::VisitIntegerNumberOfTrailingZeros(HInvoke* invoke) {
298 LocationSummary* locations = new (arena_) LocationSummary(invoke,
299 LocationSummary::kNoCall,
300 kIntrinsified);
301 locations->SetInAt(0, Location::RequiresRegister());
302 locations->SetOut(Location::RequiresRegister(), Location::kNoOutputOverlap);
303}
304
305void IntrinsicCodeGeneratorARM::VisitIntegerNumberOfTrailingZeros(HInvoke* invoke) {
306 GenNumberOfTrailingZeros(invoke->GetLocations(), Primitive::kPrimInt, GetAssembler());
307}
308
309void IntrinsicLocationsBuilderARM::VisitLongNumberOfTrailingZeros(HInvoke* invoke) {
310 LocationSummary* locations = new (arena_) LocationSummary(invoke,
311 LocationSummary::kNoCall,
312 kIntrinsified);
313 locations->SetInAt(0, Location::RequiresRegister());
314 locations->SetOut(Location::RequiresRegister(), Location::kOutputOverlap);
315}
316
317void IntrinsicCodeGeneratorARM::VisitLongNumberOfTrailingZeros(HInvoke* invoke) {
318 GenNumberOfTrailingZeros(invoke->GetLocations(), Primitive::kPrimLong, GetAssembler());
319}
320
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800321static void MathAbsFP(LocationSummary* locations, bool is64bit, ArmAssembler* assembler) {
322 Location in = locations->InAt(0);
323 Location out = locations->Out();
324
325 if (is64bit) {
326 __ vabsd(FromLowSToD(out.AsFpuRegisterPairLow<SRegister>()),
327 FromLowSToD(in.AsFpuRegisterPairLow<SRegister>()));
328 } else {
329 __ vabss(out.AsFpuRegister<SRegister>(), in.AsFpuRegister<SRegister>());
330 }
331}
332
333void IntrinsicLocationsBuilderARM::VisitMathAbsDouble(HInvoke* invoke) {
334 CreateFPToFPLocations(arena_, invoke);
335}
336
337void IntrinsicCodeGeneratorARM::VisitMathAbsDouble(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000338 MathAbsFP(invoke->GetLocations(), /* is64bit */ true, GetAssembler());
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800339}
340
341void IntrinsicLocationsBuilderARM::VisitMathAbsFloat(HInvoke* invoke) {
342 CreateFPToFPLocations(arena_, invoke);
343}
344
345void IntrinsicCodeGeneratorARM::VisitMathAbsFloat(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000346 MathAbsFP(invoke->GetLocations(), /* is64bit */ false, GetAssembler());
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800347}
348
349static void CreateIntToIntPlusTemp(ArenaAllocator* arena, HInvoke* invoke) {
350 LocationSummary* locations = new (arena) LocationSummary(invoke,
351 LocationSummary::kNoCall,
352 kIntrinsified);
353 locations->SetInAt(0, Location::RequiresRegister());
354 locations->SetOut(Location::RequiresRegister(), Location::kNoOutputOverlap);
355
356 locations->AddTemp(Location::RequiresRegister());
357}
358
359static void GenAbsInteger(LocationSummary* locations,
360 bool is64bit,
361 ArmAssembler* assembler) {
362 Location in = locations->InAt(0);
363 Location output = locations->Out();
364
365 Register mask = locations->GetTemp(0).AsRegister<Register>();
366
367 if (is64bit) {
368 Register in_reg_lo = in.AsRegisterPairLow<Register>();
369 Register in_reg_hi = in.AsRegisterPairHigh<Register>();
370 Register out_reg_lo = output.AsRegisterPairLow<Register>();
371 Register out_reg_hi = output.AsRegisterPairHigh<Register>();
372
373 DCHECK_NE(out_reg_lo, in_reg_hi) << "Diagonal overlap unexpected.";
374
375 __ Asr(mask, in_reg_hi, 31);
376 __ adds(out_reg_lo, in_reg_lo, ShifterOperand(mask));
377 __ adc(out_reg_hi, in_reg_hi, ShifterOperand(mask));
378 __ eor(out_reg_lo, mask, ShifterOperand(out_reg_lo));
379 __ eor(out_reg_hi, mask, ShifterOperand(out_reg_hi));
380 } else {
381 Register in_reg = in.AsRegister<Register>();
382 Register out_reg = output.AsRegister<Register>();
383
384 __ Asr(mask, in_reg, 31);
385 __ add(out_reg, in_reg, ShifterOperand(mask));
386 __ eor(out_reg, mask, ShifterOperand(out_reg));
387 }
388}
389
390void IntrinsicLocationsBuilderARM::VisitMathAbsInt(HInvoke* invoke) {
391 CreateIntToIntPlusTemp(arena_, invoke);
392}
393
394void IntrinsicCodeGeneratorARM::VisitMathAbsInt(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000395 GenAbsInteger(invoke->GetLocations(), /* is64bit */ false, GetAssembler());
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800396}
397
398
399void IntrinsicLocationsBuilderARM::VisitMathAbsLong(HInvoke* invoke) {
400 CreateIntToIntPlusTemp(arena_, invoke);
401}
402
403void IntrinsicCodeGeneratorARM::VisitMathAbsLong(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000404 GenAbsInteger(invoke->GetLocations(), /* is64bit */ true, GetAssembler());
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800405}
406
407static void GenMinMax(LocationSummary* locations,
408 bool is_min,
409 ArmAssembler* assembler) {
410 Register op1 = locations->InAt(0).AsRegister<Register>();
411 Register op2 = locations->InAt(1).AsRegister<Register>();
412 Register out = locations->Out().AsRegister<Register>();
413
414 __ cmp(op1, ShifterOperand(op2));
415
416 __ it((is_min) ? Condition::LT : Condition::GT, kItElse);
417 __ mov(out, ShifterOperand(op1), is_min ? Condition::LT : Condition::GT);
418 __ mov(out, ShifterOperand(op2), is_min ? Condition::GE : Condition::LE);
419}
420
421static void CreateIntIntToIntLocations(ArenaAllocator* arena, HInvoke* invoke) {
422 LocationSummary* locations = new (arena) LocationSummary(invoke,
423 LocationSummary::kNoCall,
424 kIntrinsified);
425 locations->SetInAt(0, Location::RequiresRegister());
426 locations->SetInAt(1, Location::RequiresRegister());
427 locations->SetOut(Location::RequiresRegister(), Location::kNoOutputOverlap);
428}
429
430void IntrinsicLocationsBuilderARM::VisitMathMinIntInt(HInvoke* invoke) {
431 CreateIntIntToIntLocations(arena_, invoke);
432}
433
434void IntrinsicCodeGeneratorARM::VisitMathMinIntInt(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000435 GenMinMax(invoke->GetLocations(), /* is_min */ true, GetAssembler());
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800436}
437
438void IntrinsicLocationsBuilderARM::VisitMathMaxIntInt(HInvoke* invoke) {
439 CreateIntIntToIntLocations(arena_, invoke);
440}
441
442void IntrinsicCodeGeneratorARM::VisitMathMaxIntInt(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000443 GenMinMax(invoke->GetLocations(), /* is_min */ false, GetAssembler());
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800444}
445
446void IntrinsicLocationsBuilderARM::VisitMathSqrt(HInvoke* invoke) {
447 CreateFPToFPLocations(arena_, invoke);
448}
449
450void IntrinsicCodeGeneratorARM::VisitMathSqrt(HInvoke* invoke) {
451 LocationSummary* locations = invoke->GetLocations();
452 ArmAssembler* assembler = GetAssembler();
453 __ vsqrtd(FromLowSToD(locations->Out().AsFpuRegisterPairLow<SRegister>()),
454 FromLowSToD(locations->InAt(0).AsFpuRegisterPairLow<SRegister>()));
455}
456
457void IntrinsicLocationsBuilderARM::VisitMemoryPeekByte(HInvoke* invoke) {
458 CreateIntToIntLocations(arena_, invoke);
459}
460
461void IntrinsicCodeGeneratorARM::VisitMemoryPeekByte(HInvoke* invoke) {
462 ArmAssembler* assembler = GetAssembler();
463 // Ignore upper 4B of long address.
464 __ ldrsb(invoke->GetLocations()->Out().AsRegister<Register>(),
465 Address(invoke->GetLocations()->InAt(0).AsRegisterPairLow<Register>()));
466}
467
468void IntrinsicLocationsBuilderARM::VisitMemoryPeekIntNative(HInvoke* invoke) {
469 CreateIntToIntLocations(arena_, invoke);
470}
471
472void IntrinsicCodeGeneratorARM::VisitMemoryPeekIntNative(HInvoke* invoke) {
473 ArmAssembler* assembler = GetAssembler();
474 // Ignore upper 4B of long address.
475 __ ldr(invoke->GetLocations()->Out().AsRegister<Register>(),
476 Address(invoke->GetLocations()->InAt(0).AsRegisterPairLow<Register>()));
477}
478
479void IntrinsicLocationsBuilderARM::VisitMemoryPeekLongNative(HInvoke* invoke) {
480 CreateIntToIntLocations(arena_, invoke);
481}
482
483void IntrinsicCodeGeneratorARM::VisitMemoryPeekLongNative(HInvoke* invoke) {
484 ArmAssembler* assembler = GetAssembler();
485 // Ignore upper 4B of long address.
486 Register addr = invoke->GetLocations()->InAt(0).AsRegisterPairLow<Register>();
487 // Worst case: Control register bit SCTLR.A = 0. Then unaligned accesses throw a processor
488 // exception. So we can't use ldrd as addr may be unaligned.
489 Register lo = invoke->GetLocations()->Out().AsRegisterPairLow<Register>();
490 Register hi = invoke->GetLocations()->Out().AsRegisterPairHigh<Register>();
491 if (addr == lo) {
492 __ ldr(hi, Address(addr, 4));
493 __ ldr(lo, Address(addr, 0));
494 } else {
495 __ ldr(lo, Address(addr, 0));
496 __ ldr(hi, Address(addr, 4));
497 }
498}
499
500void IntrinsicLocationsBuilderARM::VisitMemoryPeekShortNative(HInvoke* invoke) {
501 CreateIntToIntLocations(arena_, invoke);
502}
503
504void IntrinsicCodeGeneratorARM::VisitMemoryPeekShortNative(HInvoke* invoke) {
505 ArmAssembler* assembler = GetAssembler();
506 // Ignore upper 4B of long address.
507 __ ldrsh(invoke->GetLocations()->Out().AsRegister<Register>(),
508 Address(invoke->GetLocations()->InAt(0).AsRegisterPairLow<Register>()));
509}
510
511static void CreateIntIntToVoidLocations(ArenaAllocator* arena, HInvoke* invoke) {
512 LocationSummary* locations = new (arena) LocationSummary(invoke,
513 LocationSummary::kNoCall,
514 kIntrinsified);
515 locations->SetInAt(0, Location::RequiresRegister());
516 locations->SetInAt(1, Location::RequiresRegister());
517}
518
519void IntrinsicLocationsBuilderARM::VisitMemoryPokeByte(HInvoke* invoke) {
520 CreateIntIntToVoidLocations(arena_, invoke);
521}
522
523void IntrinsicCodeGeneratorARM::VisitMemoryPokeByte(HInvoke* invoke) {
524 ArmAssembler* assembler = GetAssembler();
525 __ strb(invoke->GetLocations()->InAt(1).AsRegister<Register>(),
526 Address(invoke->GetLocations()->InAt(0).AsRegisterPairLow<Register>()));
527}
528
529void IntrinsicLocationsBuilderARM::VisitMemoryPokeIntNative(HInvoke* invoke) {
530 CreateIntIntToVoidLocations(arena_, invoke);
531}
532
533void IntrinsicCodeGeneratorARM::VisitMemoryPokeIntNative(HInvoke* invoke) {
534 ArmAssembler* assembler = GetAssembler();
535 __ str(invoke->GetLocations()->InAt(1).AsRegister<Register>(),
536 Address(invoke->GetLocations()->InAt(0).AsRegisterPairLow<Register>()));
537}
538
539void IntrinsicLocationsBuilderARM::VisitMemoryPokeLongNative(HInvoke* invoke) {
540 CreateIntIntToVoidLocations(arena_, invoke);
541}
542
543void IntrinsicCodeGeneratorARM::VisitMemoryPokeLongNative(HInvoke* invoke) {
544 ArmAssembler* assembler = GetAssembler();
545 // Ignore upper 4B of long address.
546 Register addr = invoke->GetLocations()->InAt(0).AsRegisterPairLow<Register>();
547 // Worst case: Control register bit SCTLR.A = 0. Then unaligned accesses throw a processor
548 // exception. So we can't use ldrd as addr may be unaligned.
549 __ str(invoke->GetLocations()->InAt(1).AsRegisterPairLow<Register>(), Address(addr, 0));
550 __ str(invoke->GetLocations()->InAt(1).AsRegisterPairHigh<Register>(), Address(addr, 4));
551}
552
553void IntrinsicLocationsBuilderARM::VisitMemoryPokeShortNative(HInvoke* invoke) {
554 CreateIntIntToVoidLocations(arena_, invoke);
555}
556
557void IntrinsicCodeGeneratorARM::VisitMemoryPokeShortNative(HInvoke* invoke) {
558 ArmAssembler* assembler = GetAssembler();
559 __ strh(invoke->GetLocations()->InAt(1).AsRegister<Register>(),
560 Address(invoke->GetLocations()->InAt(0).AsRegisterPairLow<Register>()));
561}
562
563void IntrinsicLocationsBuilderARM::VisitThreadCurrentThread(HInvoke* invoke) {
564 LocationSummary* locations = new (arena_) LocationSummary(invoke,
565 LocationSummary::kNoCall,
566 kIntrinsified);
567 locations->SetOut(Location::RequiresRegister());
568}
569
570void IntrinsicCodeGeneratorARM::VisitThreadCurrentThread(HInvoke* invoke) {
571 ArmAssembler* assembler = GetAssembler();
572 __ LoadFromOffset(kLoadWord,
573 invoke->GetLocations()->Out().AsRegister<Register>(),
574 TR,
575 Thread::PeerOffset<kArmPointerSize>().Int32Value());
576}
577
578static void GenUnsafeGet(HInvoke* invoke,
579 Primitive::Type type,
580 bool is_volatile,
581 CodeGeneratorARM* codegen) {
582 LocationSummary* locations = invoke->GetLocations();
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800583 ArmAssembler* assembler = codegen->GetAssembler();
Roland Levillain3b359c72015-11-17 19:35:12 +0000584 Location base_loc = locations->InAt(1);
585 Register base = base_loc.AsRegister<Register>(); // Object pointer.
586 Location offset_loc = locations->InAt(2);
587 Register offset = offset_loc.AsRegisterPairLow<Register>(); // Long offset, lo part only.
588 Location trg_loc = locations->Out();
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800589
Roland Levillainc9285912015-12-18 10:38:42 +0000590 switch (type) {
591 case Primitive::kPrimInt: {
592 Register trg = trg_loc.AsRegister<Register>();
593 __ ldr(trg, Address(base, offset));
594 if (is_volatile) {
595 __ dmb(ISH);
596 }
597 break;
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800598 }
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800599
Roland Levillainc9285912015-12-18 10:38:42 +0000600 case Primitive::kPrimNot: {
601 Register trg = trg_loc.AsRegister<Register>();
602 if (kEmitCompilerReadBarrier) {
603 if (kUseBakerReadBarrier) {
604 Location temp = locations->GetTemp(0);
Roland Levillainbfea3352016-06-23 13:48:47 +0100605 codegen->GenerateReferenceLoadWithBakerReadBarrier(
606 invoke, trg_loc, base, 0U, offset_loc, TIMES_1, temp, /* needs_null_check */ false);
Roland Levillainc9285912015-12-18 10:38:42 +0000607 if (is_volatile) {
608 __ dmb(ISH);
609 }
610 } else {
611 __ ldr(trg, Address(base, offset));
612 if (is_volatile) {
613 __ dmb(ISH);
614 }
615 codegen->GenerateReadBarrierSlow(invoke, trg_loc, trg_loc, base_loc, 0U, offset_loc);
616 }
617 } else {
618 __ ldr(trg, Address(base, offset));
619 if (is_volatile) {
620 __ dmb(ISH);
621 }
622 __ MaybeUnpoisonHeapReference(trg);
623 }
624 break;
625 }
Roland Levillain4d027112015-07-01 15:41:14 +0100626
Roland Levillainc9285912015-12-18 10:38:42 +0000627 case Primitive::kPrimLong: {
628 Register trg_lo = trg_loc.AsRegisterPairLow<Register>();
629 __ add(IP, base, ShifterOperand(offset));
630 if (is_volatile && !codegen->GetInstructionSetFeatures().HasAtomicLdrdAndStrd()) {
631 Register trg_hi = trg_loc.AsRegisterPairHigh<Register>();
632 __ ldrexd(trg_lo, trg_hi, IP);
633 } else {
634 __ ldrd(trg_lo, Address(IP));
635 }
636 if (is_volatile) {
637 __ dmb(ISH);
638 }
639 break;
640 }
641
642 default:
643 LOG(FATAL) << "Unexpected type " << type;
644 UNREACHABLE();
Roland Levillain4d027112015-07-01 15:41:14 +0100645 }
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800646}
647
Roland Levillainc9285912015-12-18 10:38:42 +0000648static void CreateIntIntIntToIntLocations(ArenaAllocator* arena,
649 HInvoke* invoke,
650 Primitive::Type type) {
Roland Levillain3b359c72015-11-17 19:35:12 +0000651 bool can_call = kEmitCompilerReadBarrier &&
652 (invoke->GetIntrinsic() == Intrinsics::kUnsafeGetObject ||
653 invoke->GetIntrinsic() == Intrinsics::kUnsafeGetObjectVolatile);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800654 LocationSummary* locations = new (arena) LocationSummary(invoke,
Roland Levillain3b359c72015-11-17 19:35:12 +0000655 can_call ?
656 LocationSummary::kCallOnSlowPath :
657 LocationSummary::kNoCall,
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800658 kIntrinsified);
Vladimir Marko70e97462016-08-09 11:04:26 +0100659 if (can_call && kUseBakerReadBarrier) {
Vladimir Marko804b03f2016-09-14 16:26:36 +0100660 locations->SetCustomSlowPathCallerSaves(RegisterSet::Empty()); // No caller-save registers.
Vladimir Marko70e97462016-08-09 11:04:26 +0100661 }
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800662 locations->SetInAt(0, Location::NoLocation()); // Unused receiver.
663 locations->SetInAt(1, Location::RequiresRegister());
664 locations->SetInAt(2, Location::RequiresRegister());
Roland Levillainbfea3352016-06-23 13:48:47 +0100665 locations->SetOut(Location::RequiresRegister(),
666 can_call ? Location::kOutputOverlap : Location::kNoOutputOverlap);
Roland Levillainc9285912015-12-18 10:38:42 +0000667 if (type == Primitive::kPrimNot && kEmitCompilerReadBarrier && kUseBakerReadBarrier) {
668 // We need a temporary register for the read barrier marking slow
Roland Levillainbfea3352016-06-23 13:48:47 +0100669 // path in InstructionCodeGeneratorARM::GenerateReferenceLoadWithBakerReadBarrier.
Roland Levillainc9285912015-12-18 10:38:42 +0000670 locations->AddTemp(Location::RequiresRegister());
671 }
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800672}
673
674void IntrinsicLocationsBuilderARM::VisitUnsafeGet(HInvoke* invoke) {
Roland Levillainc9285912015-12-18 10:38:42 +0000675 CreateIntIntIntToIntLocations(arena_, invoke, Primitive::kPrimInt);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800676}
677void IntrinsicLocationsBuilderARM::VisitUnsafeGetVolatile(HInvoke* invoke) {
Roland Levillainc9285912015-12-18 10:38:42 +0000678 CreateIntIntIntToIntLocations(arena_, invoke, Primitive::kPrimInt);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800679}
680void IntrinsicLocationsBuilderARM::VisitUnsafeGetLong(HInvoke* invoke) {
Roland Levillainc9285912015-12-18 10:38:42 +0000681 CreateIntIntIntToIntLocations(arena_, invoke, Primitive::kPrimLong);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800682}
683void IntrinsicLocationsBuilderARM::VisitUnsafeGetLongVolatile(HInvoke* invoke) {
Roland Levillainc9285912015-12-18 10:38:42 +0000684 CreateIntIntIntToIntLocations(arena_, invoke, Primitive::kPrimLong);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800685}
686void IntrinsicLocationsBuilderARM::VisitUnsafeGetObject(HInvoke* invoke) {
Roland Levillainc9285912015-12-18 10:38:42 +0000687 CreateIntIntIntToIntLocations(arena_, invoke, Primitive::kPrimNot);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800688}
689void IntrinsicLocationsBuilderARM::VisitUnsafeGetObjectVolatile(HInvoke* invoke) {
Roland Levillainc9285912015-12-18 10:38:42 +0000690 CreateIntIntIntToIntLocations(arena_, invoke, Primitive::kPrimNot);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800691}
692
693void IntrinsicCodeGeneratorARM::VisitUnsafeGet(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000694 GenUnsafeGet(invoke, Primitive::kPrimInt, /* is_volatile */ false, codegen_);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800695}
696void IntrinsicCodeGeneratorARM::VisitUnsafeGetVolatile(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000697 GenUnsafeGet(invoke, Primitive::kPrimInt, /* is_volatile */ true, codegen_);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800698}
699void IntrinsicCodeGeneratorARM::VisitUnsafeGetLong(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000700 GenUnsafeGet(invoke, Primitive::kPrimLong, /* is_volatile */ false, codegen_);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800701}
702void IntrinsicCodeGeneratorARM::VisitUnsafeGetLongVolatile(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000703 GenUnsafeGet(invoke, Primitive::kPrimLong, /* is_volatile */ true, codegen_);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800704}
705void IntrinsicCodeGeneratorARM::VisitUnsafeGetObject(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000706 GenUnsafeGet(invoke, Primitive::kPrimNot, /* is_volatile */ false, codegen_);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800707}
708void IntrinsicCodeGeneratorARM::VisitUnsafeGetObjectVolatile(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000709 GenUnsafeGet(invoke, Primitive::kPrimNot, /* is_volatile */ true, codegen_);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800710}
711
712static void CreateIntIntIntIntToVoid(ArenaAllocator* arena,
713 const ArmInstructionSetFeatures& features,
714 Primitive::Type type,
715 bool is_volatile,
716 HInvoke* invoke) {
717 LocationSummary* locations = new (arena) LocationSummary(invoke,
718 LocationSummary::kNoCall,
719 kIntrinsified);
720 locations->SetInAt(0, Location::NoLocation()); // Unused receiver.
721 locations->SetInAt(1, Location::RequiresRegister());
722 locations->SetInAt(2, Location::RequiresRegister());
723 locations->SetInAt(3, Location::RequiresRegister());
724
725 if (type == Primitive::kPrimLong) {
726 // Potentially need temps for ldrexd-strexd loop.
727 if (is_volatile && !features.HasAtomicLdrdAndStrd()) {
728 locations->AddTemp(Location::RequiresRegister()); // Temp_lo.
729 locations->AddTemp(Location::RequiresRegister()); // Temp_hi.
730 }
731 } else if (type == Primitive::kPrimNot) {
732 // Temps for card-marking.
733 locations->AddTemp(Location::RequiresRegister()); // Temp.
734 locations->AddTemp(Location::RequiresRegister()); // Card.
735 }
736}
737
738void IntrinsicLocationsBuilderARM::VisitUnsafePut(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000739 CreateIntIntIntIntToVoid(arena_, features_, Primitive::kPrimInt, /* is_volatile */ false, invoke);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800740}
741void IntrinsicLocationsBuilderARM::VisitUnsafePutOrdered(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000742 CreateIntIntIntIntToVoid(arena_, features_, Primitive::kPrimInt, /* is_volatile */ false, invoke);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800743}
744void IntrinsicLocationsBuilderARM::VisitUnsafePutVolatile(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000745 CreateIntIntIntIntToVoid(arena_, features_, Primitive::kPrimInt, /* is_volatile */ true, invoke);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800746}
747void IntrinsicLocationsBuilderARM::VisitUnsafePutObject(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000748 CreateIntIntIntIntToVoid(arena_, features_, Primitive::kPrimNot, /* is_volatile */ false, invoke);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800749}
750void IntrinsicLocationsBuilderARM::VisitUnsafePutObjectOrdered(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000751 CreateIntIntIntIntToVoid(arena_, features_, Primitive::kPrimNot, /* is_volatile */ false, invoke);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800752}
753void IntrinsicLocationsBuilderARM::VisitUnsafePutObjectVolatile(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000754 CreateIntIntIntIntToVoid(arena_, features_, Primitive::kPrimNot, /* is_volatile */ true, invoke);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800755}
756void IntrinsicLocationsBuilderARM::VisitUnsafePutLong(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000757 CreateIntIntIntIntToVoid(
758 arena_, features_, Primitive::kPrimLong, /* is_volatile */ false, invoke);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800759}
760void IntrinsicLocationsBuilderARM::VisitUnsafePutLongOrdered(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000761 CreateIntIntIntIntToVoid(
762 arena_, features_, Primitive::kPrimLong, /* is_volatile */ false, invoke);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800763}
764void IntrinsicLocationsBuilderARM::VisitUnsafePutLongVolatile(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000765 CreateIntIntIntIntToVoid(
766 arena_, features_, Primitive::kPrimLong, /* is_volatile */ true, invoke);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800767}
768
769static void GenUnsafePut(LocationSummary* locations,
770 Primitive::Type type,
771 bool is_volatile,
772 bool is_ordered,
773 CodeGeneratorARM* codegen) {
774 ArmAssembler* assembler = codegen->GetAssembler();
775
776 Register base = locations->InAt(1).AsRegister<Register>(); // Object pointer.
777 Register offset = locations->InAt(2).AsRegisterPairLow<Register>(); // Long offset, lo part only.
778 Register value;
779
780 if (is_volatile || is_ordered) {
781 __ dmb(ISH);
782 }
783
784 if (type == Primitive::kPrimLong) {
785 Register value_lo = locations->InAt(3).AsRegisterPairLow<Register>();
786 value = value_lo;
787 if (is_volatile && !codegen->GetInstructionSetFeatures().HasAtomicLdrdAndStrd()) {
788 Register temp_lo = locations->GetTemp(0).AsRegister<Register>();
789 Register temp_hi = locations->GetTemp(1).AsRegister<Register>();
790 Register value_hi = locations->InAt(3).AsRegisterPairHigh<Register>();
791
792 __ add(IP, base, ShifterOperand(offset));
793 Label loop_head;
794 __ Bind(&loop_head);
795 __ ldrexd(temp_lo, temp_hi, IP);
796 __ strexd(temp_lo, value_lo, value_hi, IP);
797 __ cmp(temp_lo, ShifterOperand(0));
798 __ b(&loop_head, NE);
799 } else {
800 __ add(IP, base, ShifterOperand(offset));
801 __ strd(value_lo, Address(IP));
802 }
803 } else {
Roland Levillain4d027112015-07-01 15:41:14 +0100804 value = locations->InAt(3).AsRegister<Register>();
805 Register source = value;
806 if (kPoisonHeapReferences && type == Primitive::kPrimNot) {
807 Register temp = locations->GetTemp(0).AsRegister<Register>();
808 __ Mov(temp, value);
809 __ PoisonHeapReference(temp);
810 source = temp;
811 }
812 __ str(source, Address(base, offset));
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800813 }
814
815 if (is_volatile) {
816 __ dmb(ISH);
817 }
818
819 if (type == Primitive::kPrimNot) {
820 Register temp = locations->GetTemp(0).AsRegister<Register>();
821 Register card = locations->GetTemp(1).AsRegister<Register>();
Nicolas Geoffray07276db2015-05-18 14:22:09 +0100822 bool value_can_be_null = true; // TODO: Worth finding out this information?
823 codegen->MarkGCCard(temp, card, base, value, value_can_be_null);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800824 }
825}
826
827void IntrinsicCodeGeneratorARM::VisitUnsafePut(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000828 GenUnsafePut(invoke->GetLocations(),
829 Primitive::kPrimInt,
830 /* is_volatile */ false,
831 /* is_ordered */ false,
832 codegen_);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800833}
834void IntrinsicCodeGeneratorARM::VisitUnsafePutOrdered(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000835 GenUnsafePut(invoke->GetLocations(),
836 Primitive::kPrimInt,
837 /* is_volatile */ false,
838 /* is_ordered */ true,
839 codegen_);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800840}
841void IntrinsicCodeGeneratorARM::VisitUnsafePutVolatile(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000842 GenUnsafePut(invoke->GetLocations(),
843 Primitive::kPrimInt,
844 /* is_volatile */ true,
845 /* is_ordered */ false,
846 codegen_);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800847}
848void IntrinsicCodeGeneratorARM::VisitUnsafePutObject(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000849 GenUnsafePut(invoke->GetLocations(),
850 Primitive::kPrimNot,
851 /* is_volatile */ false,
852 /* is_ordered */ false,
853 codegen_);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800854}
855void IntrinsicCodeGeneratorARM::VisitUnsafePutObjectOrdered(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000856 GenUnsafePut(invoke->GetLocations(),
857 Primitive::kPrimNot,
858 /* is_volatile */ false,
859 /* is_ordered */ true,
860 codegen_);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800861}
862void IntrinsicCodeGeneratorARM::VisitUnsafePutObjectVolatile(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000863 GenUnsafePut(invoke->GetLocations(),
864 Primitive::kPrimNot,
865 /* is_volatile */ true,
866 /* is_ordered */ false,
867 codegen_);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800868}
869void IntrinsicCodeGeneratorARM::VisitUnsafePutLong(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000870 GenUnsafePut(invoke->GetLocations(),
871 Primitive::kPrimLong,
872 /* is_volatile */ false,
873 /* is_ordered */ false,
874 codegen_);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800875}
876void IntrinsicCodeGeneratorARM::VisitUnsafePutLongOrdered(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000877 GenUnsafePut(invoke->GetLocations(),
878 Primitive::kPrimLong,
879 /* is_volatile */ false,
880 /* is_ordered */ true,
881 codegen_);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800882}
883void IntrinsicCodeGeneratorARM::VisitUnsafePutLongVolatile(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000884 GenUnsafePut(invoke->GetLocations(),
885 Primitive::kPrimLong,
886 /* is_volatile */ true,
887 /* is_ordered */ false,
888 codegen_);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800889}
890
891static void CreateIntIntIntIntIntToIntPlusTemps(ArenaAllocator* arena,
Roland Levillain2e50ecb2016-01-27 14:08:33 +0000892 HInvoke* invoke,
893 Primitive::Type type) {
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800894 LocationSummary* locations = new (arena) LocationSummary(invoke,
895 LocationSummary::kNoCall,
896 kIntrinsified);
897 locations->SetInAt(0, Location::NoLocation()); // Unused receiver.
898 locations->SetInAt(1, Location::RequiresRegister());
899 locations->SetInAt(2, Location::RequiresRegister());
900 locations->SetInAt(3, Location::RequiresRegister());
901 locations->SetInAt(4, Location::RequiresRegister());
902
Roland Levillain2e50ecb2016-01-27 14:08:33 +0000903 // If heap poisoning is enabled, we don't want the unpoisoning
904 // operations to potentially clobber the output.
905 Location::OutputOverlap overlaps = (kPoisonHeapReferences && type == Primitive::kPrimNot)
906 ? Location::kOutputOverlap
907 : Location::kNoOutputOverlap;
908 locations->SetOut(Location::RequiresRegister(), overlaps);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800909
910 locations->AddTemp(Location::RequiresRegister()); // Pointer.
911 locations->AddTemp(Location::RequiresRegister()); // Temp 1.
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800912}
913
914static void GenCas(LocationSummary* locations, Primitive::Type type, CodeGeneratorARM* codegen) {
915 DCHECK_NE(type, Primitive::kPrimLong);
916
917 ArmAssembler* assembler = codegen->GetAssembler();
918
919 Register out = locations->Out().AsRegister<Register>(); // Boolean result.
920
921 Register base = locations->InAt(1).AsRegister<Register>(); // Object pointer.
922 Register offset = locations->InAt(2).AsRegisterPairLow<Register>(); // Offset (discard high 4B).
923 Register expected_lo = locations->InAt(3).AsRegister<Register>(); // Expected.
924 Register value_lo = locations->InAt(4).AsRegister<Register>(); // Value.
925
926 Register tmp_ptr = locations->GetTemp(0).AsRegister<Register>(); // Pointer to actual memory.
927 Register tmp_lo = locations->GetTemp(1).AsRegister<Register>(); // Value in memory.
928
929 if (type == Primitive::kPrimNot) {
930 // Mark card for object assuming new value is stored. Worst case we will mark an unchanged
931 // object and scan the receiver at the next GC for nothing.
Nicolas Geoffray07276db2015-05-18 14:22:09 +0100932 bool value_can_be_null = true; // TODO: Worth finding out this information?
933 codegen->MarkGCCard(tmp_ptr, tmp_lo, base, value_lo, value_can_be_null);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800934 }
935
936 // Prevent reordering with prior memory operations.
Roland Levillain4bedb382016-01-12 12:01:04 +0000937 // Emit a DMB ISH instruction instead of an DMB ISHST one, as the
938 // latter allows a preceding load to be delayed past the STXR
939 // instruction below.
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800940 __ dmb(ISH);
941
942 __ add(tmp_ptr, base, ShifterOperand(offset));
943
Roland Levillain4d027112015-07-01 15:41:14 +0100944 if (kPoisonHeapReferences && type == Primitive::kPrimNot) {
945 codegen->GetAssembler()->PoisonHeapReference(expected_lo);
Roland Levillain2e50ecb2016-01-27 14:08:33 +0000946 if (value_lo == expected_lo) {
947 // Do not poison `value_lo`, as it is the same register as
948 // `expected_lo`, which has just been poisoned.
949 } else {
950 codegen->GetAssembler()->PoisonHeapReference(value_lo);
951 }
Roland Levillain4d027112015-07-01 15:41:14 +0100952 }
953
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800954 // do {
955 // tmp = [r_ptr] - expected;
956 // } while (tmp == 0 && failure([r_ptr] <- r_new_value));
957 // result = tmp != 0;
958
959 Label loop_head;
960 __ Bind(&loop_head);
961
Roland Levillain391b8662015-12-18 11:43:38 +0000962 // TODO: When `type == Primitive::kPrimNot`, add a read barrier for
963 // the reference stored in the object before attempting the CAS,
964 // similar to the one in the art::Unsafe_compareAndSwapObject JNI
965 // implementation.
966 //
967 // Note that this code is not (yet) used when read barriers are
968 // enabled (see IntrinsicLocationsBuilderARM::VisitUnsafeCASObject).
969 DCHECK(!(type == Primitive::kPrimNot && kEmitCompilerReadBarrier));
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800970 __ ldrex(tmp_lo, tmp_ptr);
971
972 __ subs(tmp_lo, tmp_lo, ShifterOperand(expected_lo));
973
974 __ it(EQ, ItState::kItT);
975 __ strex(tmp_lo, value_lo, tmp_ptr, EQ);
976 __ cmp(tmp_lo, ShifterOperand(1), EQ);
977
978 __ b(&loop_head, EQ);
979
980 __ dmb(ISH);
981
982 __ rsbs(out, tmp_lo, ShifterOperand(1));
983 __ it(CC);
984 __ mov(out, ShifterOperand(0), CC);
Roland Levillain4d027112015-07-01 15:41:14 +0100985
986 if (kPoisonHeapReferences && type == Primitive::kPrimNot) {
Roland Levillain4d027112015-07-01 15:41:14 +0100987 codegen->GetAssembler()->UnpoisonHeapReference(expected_lo);
Roland Levillain2e50ecb2016-01-27 14:08:33 +0000988 if (value_lo == expected_lo) {
989 // Do not unpoison `value_lo`, as it is the same register as
990 // `expected_lo`, which has just been unpoisoned.
991 } else {
992 codegen->GetAssembler()->UnpoisonHeapReference(value_lo);
993 }
Roland Levillain4d027112015-07-01 15:41:14 +0100994 }
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800995}
996
Andreas Gampeca714582015-04-03 19:41:34 -0700997void IntrinsicLocationsBuilderARM::VisitUnsafeCASInt(HInvoke* invoke) {
Roland Levillain2e50ecb2016-01-27 14:08:33 +0000998 CreateIntIntIntIntIntToIntPlusTemps(arena_, invoke, Primitive::kPrimInt);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800999}
Andreas Gampeca714582015-04-03 19:41:34 -07001000void IntrinsicLocationsBuilderARM::VisitUnsafeCASObject(HInvoke* invoke) {
Roland Levillain391b8662015-12-18 11:43:38 +00001001 // The UnsafeCASObject intrinsic is missing a read barrier, and
1002 // therefore sometimes does not work as expected (b/25883050).
1003 // Turn it off temporarily as a quick fix, until the read barrier is
Roland Levillain3d312422016-06-23 13:53:42 +01001004 // implemented (see TODO in GenCAS).
Roland Levillain391b8662015-12-18 11:43:38 +00001005 //
Roland Levillain3d312422016-06-23 13:53:42 +01001006 // TODO(rpl): Implement read barrier support in GenCAS and re-enable
1007 // this intrinsic.
Roland Levillain2e50ecb2016-01-27 14:08:33 +00001008 if (kEmitCompilerReadBarrier) {
Roland Levillain985ff702015-10-23 13:25:35 +01001009 return;
1010 }
1011
Roland Levillain2e50ecb2016-01-27 14:08:33 +00001012 CreateIntIntIntIntIntToIntPlusTemps(arena_, invoke, Primitive::kPrimNot);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -08001013}
1014void IntrinsicCodeGeneratorARM::VisitUnsafeCASInt(HInvoke* invoke) {
1015 GenCas(invoke->GetLocations(), Primitive::kPrimInt, codegen_);
1016}
1017void IntrinsicCodeGeneratorARM::VisitUnsafeCASObject(HInvoke* invoke) {
Roland Levillain3d312422016-06-23 13:53:42 +01001018 // The UnsafeCASObject intrinsic is missing a read barrier, and
1019 // therefore sometimes does not work as expected (b/25883050).
1020 // Turn it off temporarily as a quick fix, until the read barrier is
1021 // implemented (see TODO in GenCAS).
1022 //
1023 // TODO(rpl): Implement read barrier support in GenCAS and re-enable
1024 // this intrinsic.
1025 DCHECK(!kEmitCompilerReadBarrier);
1026
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -08001027 GenCas(invoke->GetLocations(), Primitive::kPrimNot, codegen_);
1028}
1029
Nicolas Geoffrayd75948a2015-03-27 09:53:16 +00001030void IntrinsicLocationsBuilderARM::VisitStringCompareTo(HInvoke* invoke) {
1031 // The inputs plus one temp.
1032 LocationSummary* locations = new (arena_) LocationSummary(invoke,
Scott Wakelingc25cbf12016-04-18 09:00:11 +01001033 invoke->InputAt(1)->CanBeNull()
1034 ? LocationSummary::kCallOnSlowPath
1035 : LocationSummary::kNoCall,
Nicolas Geoffrayd75948a2015-03-27 09:53:16 +00001036 kIntrinsified);
Scott Wakelingc25cbf12016-04-18 09:00:11 +01001037 locations->SetInAt(0, Location::RequiresRegister());
1038 locations->SetInAt(1, Location::RequiresRegister());
1039 locations->AddTemp(Location::RequiresRegister());
1040 locations->AddTemp(Location::RequiresRegister());
1041 locations->AddTemp(Location::RequiresRegister());
jessicahandojo05765752016-09-09 19:01:32 -07001042 // Need temporary registers for String compression's feature.
1043 if (mirror::kUseStringCompression) {
1044 locations->AddTemp(Location::RequiresRegister());
1045 locations->AddTemp(Location::RequiresRegister());
1046 }
Scott Wakelingc25cbf12016-04-18 09:00:11 +01001047 locations->SetOut(Location::RequiresRegister(), Location::kOutputOverlap);
Nicolas Geoffrayd75948a2015-03-27 09:53:16 +00001048}
1049
1050void IntrinsicCodeGeneratorARM::VisitStringCompareTo(HInvoke* invoke) {
1051 ArmAssembler* assembler = GetAssembler();
1052 LocationSummary* locations = invoke->GetLocations();
1053
Scott Wakelingc25cbf12016-04-18 09:00:11 +01001054 Register str = locations->InAt(0).AsRegister<Register>();
1055 Register arg = locations->InAt(1).AsRegister<Register>();
1056 Register out = locations->Out().AsRegister<Register>();
1057
1058 Register temp0 = locations->GetTemp(0).AsRegister<Register>();
1059 Register temp1 = locations->GetTemp(1).AsRegister<Register>();
1060 Register temp2 = locations->GetTemp(2).AsRegister<Register>();
jessicahandojo05765752016-09-09 19:01:32 -07001061 Register temp3, temp4;
1062 if (mirror::kUseStringCompression) {
1063 temp3 = locations->GetTemp(3).AsRegister<Register>();
1064 temp4 = locations->GetTemp(4).AsRegister<Register>();
1065 }
Scott Wakelingc25cbf12016-04-18 09:00:11 +01001066
1067 Label loop;
1068 Label find_char_diff;
1069 Label end;
jessicahandojo05765752016-09-09 19:01:32 -07001070 Label different_compression;
Scott Wakelingc25cbf12016-04-18 09:00:11 +01001071
1072 // Get offsets of count and value fields within a string object.
1073 const int32_t count_offset = mirror::String::CountOffset().Int32Value();
1074 const int32_t value_offset = mirror::String::ValueOffset().Int32Value();
1075
Nicolas Geoffray512e04d2015-03-27 17:21:24 +00001076 // Note that the null check must have been done earlier.
Calin Juravle641547a2015-04-21 22:08:51 +01001077 DCHECK(!invoke->CanDoImplicitNullCheckOn(invoke->InputAt(0)));
Nicolas Geoffrayd75948a2015-03-27 09:53:16 +00001078
Scott Wakelingc25cbf12016-04-18 09:00:11 +01001079 // Take slow path and throw if input can be and is null.
1080 SlowPathCode* slow_path = nullptr;
1081 const bool can_slow_path = invoke->InputAt(1)->CanBeNull();
1082 if (can_slow_path) {
1083 slow_path = new (GetAllocator()) IntrinsicSlowPathARM(invoke);
1084 codegen_->AddSlowPath(slow_path);
1085 __ CompareAndBranchIfZero(arg, slow_path->GetEntryLabel());
1086 }
Nicolas Geoffrayd75948a2015-03-27 09:53:16 +00001087
Scott Wakelingc25cbf12016-04-18 09:00:11 +01001088 // Reference equality check, return 0 if same reference.
1089 __ subs(out, str, ShifterOperand(arg));
1090 __ b(&end, EQ);
jessicahandojo05765752016-09-09 19:01:32 -07001091 if (mirror::kUseStringCompression) {
1092 // Load lengths of this and argument strings.
1093 __ ldr(temp3, Address(str, count_offset));
1094 __ ldr(temp4, Address(arg, count_offset));
1095 // Clean out compression flag from lengths.
1096 __ bic(temp0, temp3, ShifterOperand(0x80000000));
1097 __ bic(IP, temp4, ShifterOperand(0x80000000));
1098 } else {
1099 // Load lengths of this and argument strings.
1100 __ ldr(temp0, Address(str, count_offset));
1101 __ ldr(IP, Address(arg, count_offset));
1102 }
Scott Wakelingc25cbf12016-04-18 09:00:11 +01001103 // out = length diff.
jessicahandojo05765752016-09-09 19:01:32 -07001104 __ subs(out, temp0, ShifterOperand(IP));
Scott Wakelingc25cbf12016-04-18 09:00:11 +01001105 // temp0 = min(len(str), len(arg)).
jessicahandojo05765752016-09-09 19:01:32 -07001106 __ it(GT);
1107 __ mov(temp0, ShifterOperand(IP), GT);
Scott Wakelingc25cbf12016-04-18 09:00:11 +01001108 // Shorter string is empty?
1109 __ CompareAndBranchIfZero(temp0, &end);
1110
jessicahandojo05765752016-09-09 19:01:32 -07001111 if (mirror::kUseStringCompression) {
1112 // Check if both strings using same compression style to use this comparison loop.
1113 __ eors(temp3, temp3, ShifterOperand(temp4));
1114 __ b(&different_compression, MI);
1115 }
Scott Wakelingc25cbf12016-04-18 09:00:11 +01001116 // Store offset of string value in preparation for comparison loop.
1117 __ mov(temp1, ShifterOperand(value_offset));
jessicahandojo05765752016-09-09 19:01:32 -07001118 if (mirror::kUseStringCompression) {
1119 // For string compression, calculate the number of bytes to compare (not chars).
1120 // This could in theory exceed INT32_MAX, so treat temp0 as unsigned.
1121 __ cmp(temp4, ShifterOperand(0));
1122 __ it(GE);
1123 __ add(temp0, temp0, ShifterOperand(temp0), GE);
1124 }
Scott Wakelingc25cbf12016-04-18 09:00:11 +01001125
1126 // Assertions that must hold in order to compare multiple characters at a time.
1127 CHECK_ALIGNED(value_offset, 8);
1128 static_assert(IsAligned<8>(kObjectAlignment),
1129 "String data must be 8-byte aligned for unrolled CompareTo loop.");
1130
1131 const size_t char_size = Primitive::ComponentSize(Primitive::kPrimChar);
1132 DCHECK_EQ(char_size, 2u);
1133
jessicahandojo05765752016-09-09 19:01:32 -07001134 Label find_char_diff_2nd_cmp;
Scott Wakelingc25cbf12016-04-18 09:00:11 +01001135 // Unrolled loop comparing 4x16-bit chars per iteration (ok because of string data alignment).
1136 __ Bind(&loop);
1137 __ ldr(IP, Address(str, temp1));
1138 __ ldr(temp2, Address(arg, temp1));
1139 __ cmp(IP, ShifterOperand(temp2));
1140 __ b(&find_char_diff, NE);
1141 __ add(temp1, temp1, ShifterOperand(char_size * 2));
Scott Wakelingc25cbf12016-04-18 09:00:11 +01001142
1143 __ ldr(IP, Address(str, temp1));
1144 __ ldr(temp2, Address(arg, temp1));
1145 __ cmp(IP, ShifterOperand(temp2));
jessicahandojo05765752016-09-09 19:01:32 -07001146 __ b(&find_char_diff_2nd_cmp, NE);
Scott Wakelingc25cbf12016-04-18 09:00:11 +01001147 __ add(temp1, temp1, ShifterOperand(char_size * 2));
jessicahandojo05765752016-09-09 19:01:32 -07001148 // With string compression, we have compared 8 bytes, otherwise 4 chars.
1149 __ subs(temp0, temp0, ShifterOperand(mirror::kUseStringCompression ? 8 : 4));
1150 __ b(&loop, HI);
Scott Wakelingc25cbf12016-04-18 09:00:11 +01001151 __ b(&end);
1152
jessicahandojo05765752016-09-09 19:01:32 -07001153 __ Bind(&find_char_diff_2nd_cmp);
1154 if (mirror::kUseStringCompression) {
1155 __ subs(temp0, temp0, ShifterOperand(4)); // 4 bytes previously compared.
1156 __ b(&end, LS); // Was the second comparison fully beyond the end?
1157 } else {
1158 // Without string compression, we can start treating temp0 as signed
1159 // and rely on the signed comparison below.
1160 __ sub(temp0, temp0, ShifterOperand(2));
1161 }
1162
1163 // Find the single character difference.
Scott Wakelingc25cbf12016-04-18 09:00:11 +01001164 __ Bind(&find_char_diff);
1165 // Get the bit position of the first character that differs.
1166 __ eor(temp1, temp2, ShifterOperand(IP));
1167 __ rbit(temp1, temp1);
1168 __ clz(temp1, temp1);
1169
jessicahandojo05765752016-09-09 19:01:32 -07001170 // temp0 = number of characters remaining to compare.
1171 // (Without string compression, it could be < 1 if a difference is found by the second CMP
1172 // in the comparison loop, and after the end of the shorter string data).
Scott Wakelingc25cbf12016-04-18 09:00:11 +01001173
jessicahandojo05765752016-09-09 19:01:32 -07001174 // Without string compression (temp1 >> 4) = character where difference occurs between the last
1175 // two words compared, in the interval [0,1].
1176 // (0 for low half-word different, 1 for high half-word different).
1177 // With string compression, (temp1 << 3) = byte where the difference occurs,
1178 // in the interval [0,3].
Scott Wakelingc25cbf12016-04-18 09:00:11 +01001179
jessicahandojo05765752016-09-09 19:01:32 -07001180 // If temp0 <= (temp1 >> (kUseStringCompression ? 3 : 4)), the difference occurs outside
1181 // the remaining string data, so just return length diff (out).
1182 // The comparison is unsigned for string compression, otherwise signed.
1183 __ cmp(temp0, ShifterOperand(temp1, LSR, mirror::kUseStringCompression ? 3 : 4));
1184 __ b(&end, mirror::kUseStringCompression ? LS : LE);
Scott Wakelingc25cbf12016-04-18 09:00:11 +01001185 // Extract the characters and calculate the difference.
jessicahandojo05765752016-09-09 19:01:32 -07001186 Label uncompressed_string, continue_process;
1187 if (mirror::kUseStringCompression) {
1188 __ cmp(temp4, ShifterOperand(0));
1189 __ b(&uncompressed_string, GE);
1190 __ bic(temp1, temp1, ShifterOperand(0x7));
1191 __ b(&continue_process);
1192 }
1193 __ Bind(&uncompressed_string);
Scott Wakelingc25cbf12016-04-18 09:00:11 +01001194 __ bic(temp1, temp1, ShifterOperand(0xf));
jessicahandojo05765752016-09-09 19:01:32 -07001195 __ Bind(&continue_process);
1196
Scott Wakelingc25cbf12016-04-18 09:00:11 +01001197 __ Lsr(temp2, temp2, temp1);
1198 __ Lsr(IP, IP, temp1);
jessicahandojo05765752016-09-09 19:01:32 -07001199 Label calculate_difference, uncompressed_string_extract_chars;
1200 if (mirror::kUseStringCompression) {
1201 __ cmp(temp4, ShifterOperand(0));
1202 __ b(&uncompressed_string_extract_chars, GE);
1203 __ ubfx(temp2, temp2, 0, 8);
1204 __ ubfx(IP, IP, 0, 8);
1205 __ b(&calculate_difference);
1206 }
1207 __ Bind(&uncompressed_string_extract_chars);
Scott Wakelingc25cbf12016-04-18 09:00:11 +01001208 __ movt(temp2, 0);
1209 __ movt(IP, 0);
jessicahandojo05765752016-09-09 19:01:32 -07001210 __ Bind(&calculate_difference);
Scott Wakelingc25cbf12016-04-18 09:00:11 +01001211 __ sub(out, IP, ShifterOperand(temp2));
jessicahandojo05765752016-09-09 19:01:32 -07001212 __ b(&end);
1213
1214 if (mirror::kUseStringCompression) {
1215 const size_t c_char_size = Primitive::ComponentSize(Primitive::kPrimByte);
1216 DCHECK_EQ(c_char_size, 1u);
1217 Label loop_arg_compressed, loop_this_compressed, find_diff;
1218 // Comparison for different compression style.
1219 // This part is when THIS is compressed and ARG is not.
1220 __ Bind(&different_compression);
1221 __ add(temp2, str, ShifterOperand(value_offset));
1222 __ add(temp3, arg, ShifterOperand(value_offset));
1223 __ cmp(temp4, ShifterOperand(0));
1224 __ b(&loop_arg_compressed, LT);
1225
1226 __ Bind(&loop_this_compressed);
1227 __ ldrb(IP, Address(temp2, c_char_size, Address::PostIndex));
1228 __ ldrh(temp4, Address(temp3, char_size, Address::PostIndex));
1229 __ cmp(IP, ShifterOperand(temp4));
1230 __ b(&find_diff, NE);
1231 __ subs(temp0, temp0, ShifterOperand(1));
1232 __ b(&loop_this_compressed, GT);
1233 __ b(&end);
1234
1235 // This part is when THIS is not compressed and ARG is.
1236 __ Bind(&loop_arg_compressed);
1237 __ ldrh(IP, Address(temp2, char_size, Address::PostIndex));
1238 __ ldrb(temp4, Address(temp3, c_char_size, Address::PostIndex));
1239 __ cmp(IP, ShifterOperand(temp4));
1240 __ b(&find_diff, NE);
1241 __ subs(temp0, temp0, ShifterOperand(1));
1242 __ b(&loop_arg_compressed, GT);
1243 __ b(&end);
1244
1245 // Calculate the difference.
1246 __ Bind(&find_diff);
1247 __ sub(out, IP, ShifterOperand(temp4));
1248 }
Scott Wakelingc25cbf12016-04-18 09:00:11 +01001249
1250 __ Bind(&end);
1251
1252 if (can_slow_path) {
1253 __ Bind(slow_path->GetExitLabel());
1254 }
Nicolas Geoffrayd75948a2015-03-27 09:53:16 +00001255}
1256
Agi Csaki289cd552015-08-18 17:10:38 -07001257void IntrinsicLocationsBuilderARM::VisitStringEquals(HInvoke* invoke) {
1258 LocationSummary* locations = new (arena_) LocationSummary(invoke,
1259 LocationSummary::kNoCall,
1260 kIntrinsified);
1261 InvokeRuntimeCallingConvention calling_convention;
1262 locations->SetInAt(0, Location::RequiresRegister());
1263 locations->SetInAt(1, Location::RequiresRegister());
1264 // Temporary registers to store lengths of strings and for calculations.
1265 // Using instruction cbz requires a low register, so explicitly set a temp to be R0.
1266 locations->AddTemp(Location::RegisterLocation(R0));
1267 locations->AddTemp(Location::RequiresRegister());
1268 locations->AddTemp(Location::RequiresRegister());
1269
1270 locations->SetOut(Location::RequiresRegister());
1271}
1272
1273void IntrinsicCodeGeneratorARM::VisitStringEquals(HInvoke* invoke) {
1274 ArmAssembler* assembler = GetAssembler();
1275 LocationSummary* locations = invoke->GetLocations();
1276
1277 Register str = locations->InAt(0).AsRegister<Register>();
1278 Register arg = locations->InAt(1).AsRegister<Register>();
1279 Register out = locations->Out().AsRegister<Register>();
1280
1281 Register temp = locations->GetTemp(0).AsRegister<Register>();
1282 Register temp1 = locations->GetTemp(1).AsRegister<Register>();
1283 Register temp2 = locations->GetTemp(2).AsRegister<Register>();
1284
jessicahandojo05765752016-09-09 19:01:32 -07001285 Label loop, preloop;
Agi Csaki289cd552015-08-18 17:10:38 -07001286 Label end;
1287 Label return_true;
1288 Label return_false;
1289
1290 // Get offsets of count, value, and class fields within a string object.
1291 const uint32_t count_offset = mirror::String::CountOffset().Uint32Value();
1292 const uint32_t value_offset = mirror::String::ValueOffset().Uint32Value();
1293 const uint32_t class_offset = mirror::Object::ClassOffset().Uint32Value();
1294
1295 // Note that the null check must have been done earlier.
1296 DCHECK(!invoke->CanDoImplicitNullCheckOn(invoke->InputAt(0)));
1297
Vladimir Marko53b52002016-05-24 19:30:45 +01001298 StringEqualsOptimizations optimizations(invoke);
1299 if (!optimizations.GetArgumentNotNull()) {
1300 // Check if input is null, return false if it is.
1301 __ CompareAndBranchIfZero(arg, &return_false);
1302 }
Agi Csaki289cd552015-08-18 17:10:38 -07001303
Vladimir Marko53b52002016-05-24 19:30:45 +01001304 if (!optimizations.GetArgumentIsString()) {
1305 // Instanceof check for the argument by comparing class fields.
1306 // All string objects must have the same type since String cannot be subclassed.
1307 // Receiver must be a string object, so its class field is equal to all strings' class fields.
1308 // If the argument is a string object, its class field must be equal to receiver's class field.
1309 __ ldr(temp, Address(str, class_offset));
1310 __ ldr(temp1, Address(arg, class_offset));
1311 __ cmp(temp, ShifterOperand(temp1));
1312 __ b(&return_false, NE);
1313 }
Agi Csaki289cd552015-08-18 17:10:38 -07001314
1315 // Load lengths of this and argument strings.
1316 __ ldr(temp, Address(str, count_offset));
1317 __ ldr(temp1, Address(arg, count_offset));
1318 // Check if lengths are equal, return false if they're not.
jessicahandojo05765752016-09-09 19:01:32 -07001319 // Also compares the compression style, if differs return false.
Agi Csaki289cd552015-08-18 17:10:38 -07001320 __ cmp(temp, ShifterOperand(temp1));
1321 __ b(&return_false, NE);
1322 // Return true if both strings are empty.
jessicahandojo05765752016-09-09 19:01:32 -07001323 if (mirror::kUseStringCompression) {
1324 // Length needs to be masked out first because 0 is treated as compressed.
1325 __ bic(temp, temp, ShifterOperand(0x80000000));
1326 }
Agi Csaki289cd552015-08-18 17:10:38 -07001327 __ cbz(temp, &return_true);
Agi Csaki289cd552015-08-18 17:10:38 -07001328 // Reference equality check, return true if same reference.
1329 __ cmp(str, ShifterOperand(arg));
1330 __ b(&return_true, EQ);
1331
1332 // Assertions that must hold in order to compare strings 2 characters at a time.
1333 DCHECK_ALIGNED(value_offset, 4);
Scott Wakelingc25cbf12016-04-18 09:00:11 +01001334 static_assert(IsAligned<4>(kObjectAlignment), "String data must be aligned for fast compare.");
Agi Csaki289cd552015-08-18 17:10:38 -07001335
jessicahandojo05765752016-09-09 19:01:32 -07001336 if (mirror::kUseStringCompression) {
1337 // If not compressed, directly to fast compare. Else do preprocess on length.
1338 __ cmp(temp1, ShifterOperand(0));
1339 __ b(&preloop, GT);
1340 // Mask out compression flag and adjust length for compressed string (8-bit)
1341 // as if it is a 16-bit data, new_length = (length + 1) / 2.
1342 __ add(temp, temp, ShifterOperand(1));
1343 __ Lsr(temp, temp, 1);
1344 __ Bind(&preloop);
1345 }
Agi Csaki289cd552015-08-18 17:10:38 -07001346 // Loop to compare strings 2 characters at a time starting at the front of the string.
1347 // Ok to do this because strings with an odd length are zero-padded.
jessicahandojo05765752016-09-09 19:01:32 -07001348 __ LoadImmediate(temp1, value_offset);
Agi Csaki289cd552015-08-18 17:10:38 -07001349 __ Bind(&loop);
1350 __ ldr(out, Address(str, temp1));
1351 __ ldr(temp2, Address(arg, temp1));
1352 __ cmp(out, ShifterOperand(temp2));
1353 __ b(&return_false, NE);
1354 __ add(temp1, temp1, ShifterOperand(sizeof(uint32_t)));
Vladimir Markoa63f0d42015-09-01 13:36:35 +01001355 __ subs(temp, temp, ShifterOperand(sizeof(uint32_t) / sizeof(uint16_t)));
1356 __ b(&loop, GT);
Agi Csaki289cd552015-08-18 17:10:38 -07001357
1358 // Return true and exit the function.
1359 // If loop does not result in returning false, we return true.
1360 __ Bind(&return_true);
1361 __ LoadImmediate(out, 1);
1362 __ b(&end);
1363
1364 // Return false and exit the function.
1365 __ Bind(&return_false);
1366 __ LoadImmediate(out, 0);
1367 __ Bind(&end);
1368}
1369
Andreas Gampeba6fdbc2015-05-07 22:31:55 -07001370static void GenerateVisitStringIndexOf(HInvoke* invoke,
1371 ArmAssembler* assembler,
1372 CodeGeneratorARM* codegen,
1373 ArenaAllocator* allocator,
1374 bool start_at_zero) {
1375 LocationSummary* locations = invoke->GetLocations();
Andreas Gampeba6fdbc2015-05-07 22:31:55 -07001376
1377 // Note that the null check must have been done earlier.
1378 DCHECK(!invoke->CanDoImplicitNullCheckOn(invoke->InputAt(0)));
1379
1380 // Check for code points > 0xFFFF. Either a slow-path check when we don't know statically,
Vladimir Markofb6c90a2016-05-06 15:52:12 +01001381 // or directly dispatch for a large constant, or omit slow-path for a small constant or a char.
Andreas Gampe85b62f22015-09-09 13:15:38 -07001382 SlowPathCode* slow_path = nullptr;
Vladimir Markofb6c90a2016-05-06 15:52:12 +01001383 HInstruction* code_point = invoke->InputAt(1);
1384 if (code_point->IsIntConstant()) {
Vladimir Markoda051082016-05-17 16:10:20 +01001385 if (static_cast<uint32_t>(code_point->AsIntConstant()->GetValue()) >
Andreas Gampeba6fdbc2015-05-07 22:31:55 -07001386 std::numeric_limits<uint16_t>::max()) {
1387 // Always needs the slow-path. We could directly dispatch to it, but this case should be
1388 // rare, so for simplicity just put the full slow-path down and branch unconditionally.
1389 slow_path = new (allocator) IntrinsicSlowPathARM(invoke);
1390 codegen->AddSlowPath(slow_path);
1391 __ b(slow_path->GetEntryLabel());
1392 __ Bind(slow_path->GetExitLabel());
1393 return;
1394 }
Vladimir Markofb6c90a2016-05-06 15:52:12 +01001395 } else if (code_point->GetType() != Primitive::kPrimChar) {
Andreas Gampeba6fdbc2015-05-07 22:31:55 -07001396 Register char_reg = locations->InAt(1).AsRegister<Register>();
Vladimir Markofb6c90a2016-05-06 15:52:12 +01001397 // 0xffff is not modified immediate but 0x10000 is, so use `>= 0x10000` instead of `> 0xffff`.
1398 __ cmp(char_reg,
1399 ShifterOperand(static_cast<uint32_t>(std::numeric_limits<uint16_t>::max()) + 1));
Andreas Gampeba6fdbc2015-05-07 22:31:55 -07001400 slow_path = new (allocator) IntrinsicSlowPathARM(invoke);
1401 codegen->AddSlowPath(slow_path);
Vladimir Markofb6c90a2016-05-06 15:52:12 +01001402 __ b(slow_path->GetEntryLabel(), HS);
Andreas Gampeba6fdbc2015-05-07 22:31:55 -07001403 }
1404
1405 if (start_at_zero) {
Vladimir Markofb6c90a2016-05-06 15:52:12 +01001406 Register tmp_reg = locations->GetTemp(0).AsRegister<Register>();
Andreas Gampeba6fdbc2015-05-07 22:31:55 -07001407 DCHECK_EQ(tmp_reg, R2);
1408 // Start-index = 0.
1409 __ LoadImmediate(tmp_reg, 0);
1410 }
1411
Serban Constantinescu4bb30ac2016-06-22 17:04:45 +01001412 codegen->InvokeRuntime(kQuickIndexOf, invoke, invoke->GetDexPc(), slow_path);
Roland Levillain42ad2882016-02-29 18:26:54 +00001413 CheckEntrypointTypes<kQuickIndexOf, int32_t, void*, uint32_t, uint32_t>();
Andreas Gampeba6fdbc2015-05-07 22:31:55 -07001414
1415 if (slow_path != nullptr) {
1416 __ Bind(slow_path->GetExitLabel());
1417 }
1418}
1419
1420void IntrinsicLocationsBuilderARM::VisitStringIndexOf(HInvoke* invoke) {
1421 LocationSummary* locations = new (arena_) LocationSummary(invoke,
Serban Constantinescu806f0122016-03-09 11:10:16 +00001422 LocationSummary::kCallOnMainAndSlowPath,
Andreas Gampeba6fdbc2015-05-07 22:31:55 -07001423 kIntrinsified);
1424 // We have a hand-crafted assembly stub that follows the runtime calling convention. So it's
1425 // best to align the inputs accordingly.
1426 InvokeRuntimeCallingConvention calling_convention;
1427 locations->SetInAt(0, Location::RegisterLocation(calling_convention.GetRegisterAt(0)));
1428 locations->SetInAt(1, Location::RegisterLocation(calling_convention.GetRegisterAt(1)));
1429 locations->SetOut(Location::RegisterLocation(R0));
1430
Vladimir Markofb6c90a2016-05-06 15:52:12 +01001431 // Need to send start-index=0.
Andreas Gampeba6fdbc2015-05-07 22:31:55 -07001432 locations->AddTemp(Location::RegisterLocation(calling_convention.GetRegisterAt(2)));
1433}
1434
1435void IntrinsicCodeGeneratorARM::VisitStringIndexOf(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +00001436 GenerateVisitStringIndexOf(
1437 invoke, GetAssembler(), codegen_, GetAllocator(), /* start_at_zero */ true);
Andreas Gampeba6fdbc2015-05-07 22:31:55 -07001438}
1439
1440void IntrinsicLocationsBuilderARM::VisitStringIndexOfAfter(HInvoke* invoke) {
1441 LocationSummary* locations = new (arena_) LocationSummary(invoke,
Serban Constantinescu806f0122016-03-09 11:10:16 +00001442 LocationSummary::kCallOnMainAndSlowPath,
Andreas Gampeba6fdbc2015-05-07 22:31:55 -07001443 kIntrinsified);
1444 // We have a hand-crafted assembly stub that follows the runtime calling convention. So it's
1445 // best to align the inputs accordingly.
1446 InvokeRuntimeCallingConvention calling_convention;
1447 locations->SetInAt(0, Location::RegisterLocation(calling_convention.GetRegisterAt(0)));
1448 locations->SetInAt(1, Location::RegisterLocation(calling_convention.GetRegisterAt(1)));
1449 locations->SetInAt(2, Location::RegisterLocation(calling_convention.GetRegisterAt(2)));
1450 locations->SetOut(Location::RegisterLocation(R0));
Andreas Gampeba6fdbc2015-05-07 22:31:55 -07001451}
1452
1453void IntrinsicCodeGeneratorARM::VisitStringIndexOfAfter(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +00001454 GenerateVisitStringIndexOf(
1455 invoke, GetAssembler(), codegen_, GetAllocator(), /* start_at_zero */ false);
Andreas Gampeba6fdbc2015-05-07 22:31:55 -07001456}
1457
Jeff Hao848f70a2014-01-15 13:49:50 -08001458void IntrinsicLocationsBuilderARM::VisitStringNewStringFromBytes(HInvoke* invoke) {
1459 LocationSummary* locations = new (arena_) LocationSummary(invoke,
Serban Constantinescu806f0122016-03-09 11:10:16 +00001460 LocationSummary::kCallOnMainAndSlowPath,
Jeff Hao848f70a2014-01-15 13:49:50 -08001461 kIntrinsified);
1462 InvokeRuntimeCallingConvention calling_convention;
1463 locations->SetInAt(0, Location::RegisterLocation(calling_convention.GetRegisterAt(0)));
1464 locations->SetInAt(1, Location::RegisterLocation(calling_convention.GetRegisterAt(1)));
1465 locations->SetInAt(2, Location::RegisterLocation(calling_convention.GetRegisterAt(2)));
1466 locations->SetInAt(3, Location::RegisterLocation(calling_convention.GetRegisterAt(3)));
1467 locations->SetOut(Location::RegisterLocation(R0));
1468}
1469
1470void IntrinsicCodeGeneratorARM::VisitStringNewStringFromBytes(HInvoke* invoke) {
1471 ArmAssembler* assembler = GetAssembler();
1472 LocationSummary* locations = invoke->GetLocations();
1473
1474 Register byte_array = locations->InAt(0).AsRegister<Register>();
1475 __ cmp(byte_array, ShifterOperand(0));
Andreas Gampe85b62f22015-09-09 13:15:38 -07001476 SlowPathCode* slow_path = new (GetAllocator()) IntrinsicSlowPathARM(invoke);
Jeff Hao848f70a2014-01-15 13:49:50 -08001477 codegen_->AddSlowPath(slow_path);
1478 __ b(slow_path->GetEntryLabel(), EQ);
1479
Serban Constantinescu4bb30ac2016-06-22 17:04:45 +01001480 codegen_->InvokeRuntime(kQuickAllocStringFromBytes, invoke, invoke->GetDexPc(), slow_path);
Roland Levillainf969a202016-03-09 16:14:00 +00001481 CheckEntrypointTypes<kQuickAllocStringFromBytes, void*, void*, int32_t, int32_t, int32_t>();
Jeff Hao848f70a2014-01-15 13:49:50 -08001482 __ Bind(slow_path->GetExitLabel());
1483}
1484
1485void IntrinsicLocationsBuilderARM::VisitStringNewStringFromChars(HInvoke* invoke) {
1486 LocationSummary* locations = new (arena_) LocationSummary(invoke,
Serban Constantinescu54ff4822016-07-07 18:03:19 +01001487 LocationSummary::kCallOnMainOnly,
Jeff Hao848f70a2014-01-15 13:49:50 -08001488 kIntrinsified);
1489 InvokeRuntimeCallingConvention calling_convention;
1490 locations->SetInAt(0, Location::RegisterLocation(calling_convention.GetRegisterAt(0)));
1491 locations->SetInAt(1, Location::RegisterLocation(calling_convention.GetRegisterAt(1)));
1492 locations->SetInAt(2, Location::RegisterLocation(calling_convention.GetRegisterAt(2)));
1493 locations->SetOut(Location::RegisterLocation(R0));
1494}
1495
1496void IntrinsicCodeGeneratorARM::VisitStringNewStringFromChars(HInvoke* invoke) {
Roland Levillaincc3839c2016-02-29 16:23:48 +00001497 // No need to emit code checking whether `locations->InAt(2)` is a null
1498 // pointer, as callers of the native method
1499 //
1500 // java.lang.StringFactory.newStringFromChars(int offset, int charCount, char[] data)
1501 //
1502 // all include a null check on `data` before calling that method.
Serban Constantinescu4bb30ac2016-06-22 17:04:45 +01001503 codegen_->InvokeRuntime(kQuickAllocStringFromChars, invoke, invoke->GetDexPc());
Roland Levillainf969a202016-03-09 16:14:00 +00001504 CheckEntrypointTypes<kQuickAllocStringFromChars, void*, int32_t, int32_t, void*>();
Jeff Hao848f70a2014-01-15 13:49:50 -08001505}
1506
1507void IntrinsicLocationsBuilderARM::VisitStringNewStringFromString(HInvoke* invoke) {
1508 LocationSummary* locations = new (arena_) LocationSummary(invoke,
Serban Constantinescu806f0122016-03-09 11:10:16 +00001509 LocationSummary::kCallOnMainAndSlowPath,
Jeff Hao848f70a2014-01-15 13:49:50 -08001510 kIntrinsified);
1511 InvokeRuntimeCallingConvention calling_convention;
1512 locations->SetInAt(0, Location::RegisterLocation(calling_convention.GetRegisterAt(0)));
1513 locations->SetOut(Location::RegisterLocation(R0));
1514}
1515
1516void IntrinsicCodeGeneratorARM::VisitStringNewStringFromString(HInvoke* invoke) {
1517 ArmAssembler* assembler = GetAssembler();
1518 LocationSummary* locations = invoke->GetLocations();
1519
1520 Register string_to_copy = locations->InAt(0).AsRegister<Register>();
1521 __ cmp(string_to_copy, ShifterOperand(0));
Andreas Gampe85b62f22015-09-09 13:15:38 -07001522 SlowPathCode* slow_path = new (GetAllocator()) IntrinsicSlowPathARM(invoke);
Jeff Hao848f70a2014-01-15 13:49:50 -08001523 codegen_->AddSlowPath(slow_path);
1524 __ b(slow_path->GetEntryLabel(), EQ);
1525
Serban Constantinescu4bb30ac2016-06-22 17:04:45 +01001526 codegen_->InvokeRuntime(kQuickAllocStringFromString, invoke, invoke->GetDexPc(), slow_path);
Roland Levillainf969a202016-03-09 16:14:00 +00001527 CheckEntrypointTypes<kQuickAllocStringFromString, void*, void*>();
Serban Constantinescu4bb30ac2016-06-22 17:04:45 +01001528
Jeff Hao848f70a2014-01-15 13:49:50 -08001529 __ Bind(slow_path->GetExitLabel());
1530}
1531
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001532void IntrinsicLocationsBuilderARM::VisitSystemArrayCopy(HInvoke* invoke) {
Roland Levillain0b671c02016-08-19 12:02:34 +01001533 // The only read barrier implementation supporting the
1534 // SystemArrayCopy intrinsic is the Baker-style read barriers.
1535 if (kEmitCompilerReadBarrier && !kUseBakerReadBarrier) {
Roland Levillain3d312422016-06-23 13:53:42 +01001536 return;
1537 }
1538
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001539 CodeGenerator::CreateSystemArrayCopyLocationSummary(invoke);
1540 LocationSummary* locations = invoke->GetLocations();
1541 if (locations == nullptr) {
1542 return;
1543 }
1544
1545 HIntConstant* src_pos = invoke->InputAt(1)->AsIntConstant();
1546 HIntConstant* dest_pos = invoke->InputAt(3)->AsIntConstant();
1547 HIntConstant* length = invoke->InputAt(4)->AsIntConstant();
1548
1549 if (src_pos != nullptr && !assembler_->ShifterOperandCanAlwaysHold(src_pos->GetValue())) {
1550 locations->SetInAt(1, Location::RequiresRegister());
1551 }
1552 if (dest_pos != nullptr && !assembler_->ShifterOperandCanAlwaysHold(dest_pos->GetValue())) {
1553 locations->SetInAt(3, Location::RequiresRegister());
1554 }
1555 if (length != nullptr && !assembler_->ShifterOperandCanAlwaysHold(length->GetValue())) {
1556 locations->SetInAt(4, Location::RequiresRegister());
1557 }
Roland Levillain0b671c02016-08-19 12:02:34 +01001558 if (kEmitCompilerReadBarrier && kUseBakerReadBarrier) {
1559 // Temporary register IP cannot be used in
Roland Levillain16d9f942016-08-25 17:27:56 +01001560 // ReadBarrierSystemArrayCopySlowPathARM (because that register
Roland Levillain0b671c02016-08-19 12:02:34 +01001561 // is clobbered by ReadBarrierMarkRegX entry points). Get an extra
1562 // temporary register from the register allocator.
1563 locations->AddTemp(Location::RequiresRegister());
1564 }
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001565}
1566
1567static void CheckPosition(ArmAssembler* assembler,
1568 Location pos,
1569 Register input,
1570 Location length,
1571 SlowPathCode* slow_path,
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001572 Register temp,
1573 bool length_is_input_length = false) {
1574 // Where is the length in the Array?
1575 const uint32_t length_offset = mirror::Array::LengthOffset().Uint32Value();
1576
1577 if (pos.IsConstant()) {
1578 int32_t pos_const = pos.GetConstant()->AsIntConstant()->GetValue();
1579 if (pos_const == 0) {
1580 if (!length_is_input_length) {
1581 // Check that length(input) >= length.
1582 __ LoadFromOffset(kLoadWord, temp, input, length_offset);
1583 if (length.IsConstant()) {
1584 __ cmp(temp, ShifterOperand(length.GetConstant()->AsIntConstant()->GetValue()));
1585 } else {
1586 __ cmp(temp, ShifterOperand(length.AsRegister<Register>()));
1587 }
1588 __ b(slow_path->GetEntryLabel(), LT);
1589 }
1590 } else {
1591 // Check that length(input) >= pos.
Nicolas Geoffrayfea1abd2016-07-06 12:09:12 +01001592 __ LoadFromOffset(kLoadWord, temp, input, length_offset);
1593 __ subs(temp, temp, ShifterOperand(pos_const));
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001594 __ b(slow_path->GetEntryLabel(), LT);
1595
1596 // Check that (length(input) - pos) >= length.
1597 if (length.IsConstant()) {
1598 __ cmp(temp, ShifterOperand(length.GetConstant()->AsIntConstant()->GetValue()));
1599 } else {
1600 __ cmp(temp, ShifterOperand(length.AsRegister<Register>()));
1601 }
1602 __ b(slow_path->GetEntryLabel(), LT);
1603 }
1604 } else if (length_is_input_length) {
1605 // The only way the copy can succeed is if pos is zero.
1606 Register pos_reg = pos.AsRegister<Register>();
1607 __ CompareAndBranchIfNonZero(pos_reg, slow_path->GetEntryLabel());
1608 } else {
1609 // Check that pos >= 0.
1610 Register pos_reg = pos.AsRegister<Register>();
1611 __ cmp(pos_reg, ShifterOperand(0));
1612 __ b(slow_path->GetEntryLabel(), LT);
1613
1614 // Check that pos <= length(input).
1615 __ LoadFromOffset(kLoadWord, temp, input, length_offset);
1616 __ subs(temp, temp, ShifterOperand(pos_reg));
1617 __ b(slow_path->GetEntryLabel(), LT);
1618
1619 // Check that (length(input) - pos) >= length.
1620 if (length.IsConstant()) {
1621 __ cmp(temp, ShifterOperand(length.GetConstant()->AsIntConstant()->GetValue()));
1622 } else {
1623 __ cmp(temp, ShifterOperand(length.AsRegister<Register>()));
1624 }
1625 __ b(slow_path->GetEntryLabel(), LT);
1626 }
1627}
1628
1629void IntrinsicCodeGeneratorARM::VisitSystemArrayCopy(HInvoke* invoke) {
Roland Levillain0b671c02016-08-19 12:02:34 +01001630 // The only read barrier implementation supporting the
1631 // SystemArrayCopy intrinsic is the Baker-style read barriers.
1632 DCHECK(!kEmitCompilerReadBarrier || kUseBakerReadBarrier);
Roland Levillain3d312422016-06-23 13:53:42 +01001633
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001634 ArmAssembler* assembler = GetAssembler();
1635 LocationSummary* locations = invoke->GetLocations();
1636
1637 uint32_t class_offset = mirror::Object::ClassOffset().Int32Value();
1638 uint32_t super_offset = mirror::Class::SuperClassOffset().Int32Value();
1639 uint32_t component_offset = mirror::Class::ComponentTypeOffset().Int32Value();
1640 uint32_t primitive_offset = mirror::Class::PrimitiveTypeOffset().Int32Value();
Roland Levillain0b671c02016-08-19 12:02:34 +01001641 uint32_t monitor_offset = mirror::Object::MonitorOffset().Int32Value();
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001642
1643 Register src = locations->InAt(0).AsRegister<Register>();
1644 Location src_pos = locations->InAt(1);
1645 Register dest = locations->InAt(2).AsRegister<Register>();
1646 Location dest_pos = locations->InAt(3);
1647 Location length = locations->InAt(4);
Roland Levillain0b671c02016-08-19 12:02:34 +01001648 Location temp1_loc = locations->GetTemp(0);
1649 Register temp1 = temp1_loc.AsRegister<Register>();
1650 Location temp2_loc = locations->GetTemp(1);
1651 Register temp2 = temp2_loc.AsRegister<Register>();
1652 Location temp3_loc = locations->GetTemp(2);
1653 Register temp3 = temp3_loc.AsRegister<Register>();
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001654
Roland Levillain0b671c02016-08-19 12:02:34 +01001655 SlowPathCode* intrinsic_slow_path = new (GetAllocator()) IntrinsicSlowPathARM(invoke);
1656 codegen_->AddSlowPath(intrinsic_slow_path);
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001657
Roland Levillainebea3d22016-04-12 15:42:57 +01001658 Label conditions_on_positions_validated;
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001659 SystemArrayCopyOptimizations optimizations(invoke);
1660
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001661 // If source and destination are the same, we go to slow path if we need to do
1662 // forward copying.
1663 if (src_pos.IsConstant()) {
1664 int32_t src_pos_constant = src_pos.GetConstant()->AsIntConstant()->GetValue();
1665 if (dest_pos.IsConstant()) {
Nicolas Geoffray9f65db82016-07-07 12:07:42 +01001666 int32_t dest_pos_constant = dest_pos.GetConstant()->AsIntConstant()->GetValue();
1667 if (optimizations.GetDestinationIsSource()) {
1668 // Checked when building locations.
1669 DCHECK_GE(src_pos_constant, dest_pos_constant);
1670 } else if (src_pos_constant < dest_pos_constant) {
1671 __ cmp(src, ShifterOperand(dest));
Roland Levillain0b671c02016-08-19 12:02:34 +01001672 __ b(intrinsic_slow_path->GetEntryLabel(), EQ);
Nicolas Geoffray9f65db82016-07-07 12:07:42 +01001673 }
1674
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001675 // Checked when building locations.
1676 DCHECK(!optimizations.GetDestinationIsSource()
1677 || (src_pos_constant >= dest_pos.GetConstant()->AsIntConstant()->GetValue()));
1678 } else {
1679 if (!optimizations.GetDestinationIsSource()) {
Nicolas Geoffray9f65db82016-07-07 12:07:42 +01001680 __ cmp(src, ShifterOperand(dest));
Roland Levillainebea3d22016-04-12 15:42:57 +01001681 __ b(&conditions_on_positions_validated, NE);
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001682 }
1683 __ cmp(dest_pos.AsRegister<Register>(), ShifterOperand(src_pos_constant));
Roland Levillain0b671c02016-08-19 12:02:34 +01001684 __ b(intrinsic_slow_path->GetEntryLabel(), GT);
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001685 }
1686 } else {
1687 if (!optimizations.GetDestinationIsSource()) {
Nicolas Geoffray9f65db82016-07-07 12:07:42 +01001688 __ cmp(src, ShifterOperand(dest));
Roland Levillainebea3d22016-04-12 15:42:57 +01001689 __ b(&conditions_on_positions_validated, NE);
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001690 }
1691 if (dest_pos.IsConstant()) {
1692 int32_t dest_pos_constant = dest_pos.GetConstant()->AsIntConstant()->GetValue();
1693 __ cmp(src_pos.AsRegister<Register>(), ShifterOperand(dest_pos_constant));
1694 } else {
1695 __ cmp(src_pos.AsRegister<Register>(), ShifterOperand(dest_pos.AsRegister<Register>()));
1696 }
Roland Levillain0b671c02016-08-19 12:02:34 +01001697 __ b(intrinsic_slow_path->GetEntryLabel(), LT);
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001698 }
1699
Roland Levillainebea3d22016-04-12 15:42:57 +01001700 __ Bind(&conditions_on_positions_validated);
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001701
1702 if (!optimizations.GetSourceIsNotNull()) {
1703 // Bail out if the source is null.
Roland Levillain0b671c02016-08-19 12:02:34 +01001704 __ CompareAndBranchIfZero(src, intrinsic_slow_path->GetEntryLabel());
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001705 }
1706
1707 if (!optimizations.GetDestinationIsNotNull() && !optimizations.GetDestinationIsSource()) {
1708 // Bail out if the destination is null.
Roland Levillain0b671c02016-08-19 12:02:34 +01001709 __ CompareAndBranchIfZero(dest, intrinsic_slow_path->GetEntryLabel());
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001710 }
1711
1712 // If the length is negative, bail out.
1713 // We have already checked in the LocationsBuilder for the constant case.
1714 if (!length.IsConstant() &&
1715 !optimizations.GetCountIsSourceLength() &&
1716 !optimizations.GetCountIsDestinationLength()) {
1717 __ cmp(length.AsRegister<Register>(), ShifterOperand(0));
Roland Levillain0b671c02016-08-19 12:02:34 +01001718 __ b(intrinsic_slow_path->GetEntryLabel(), LT);
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001719 }
1720
1721 // Validity checks: source.
1722 CheckPosition(assembler,
1723 src_pos,
1724 src,
1725 length,
Roland Levillain0b671c02016-08-19 12:02:34 +01001726 intrinsic_slow_path,
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001727 temp1,
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001728 optimizations.GetCountIsSourceLength());
1729
1730 // Validity checks: dest.
1731 CheckPosition(assembler,
1732 dest_pos,
1733 dest,
1734 length,
Roland Levillain0b671c02016-08-19 12:02:34 +01001735 intrinsic_slow_path,
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001736 temp1,
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001737 optimizations.GetCountIsDestinationLength());
1738
1739 if (!optimizations.GetDoesNotNeedTypeCheck()) {
1740 // Check whether all elements of the source array are assignable to the component
1741 // type of the destination array. We do two checks: the classes are the same,
1742 // or the destination is Object[]. If none of these checks succeed, we go to the
1743 // slow path.
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001744
Roland Levillain0b671c02016-08-19 12:02:34 +01001745 if (kEmitCompilerReadBarrier && kUseBakerReadBarrier) {
1746 if (!optimizations.GetSourceIsNonPrimitiveArray()) {
1747 // /* HeapReference<Class> */ temp1 = src->klass_
1748 codegen_->GenerateFieldLoadWithBakerReadBarrier(
1749 invoke, temp1_loc, src, class_offset, temp2_loc, /* needs_null_check */ false);
1750 // Bail out if the source is not a non primitive array.
1751 // /* HeapReference<Class> */ temp1 = temp1->component_type_
1752 codegen_->GenerateFieldLoadWithBakerReadBarrier(
1753 invoke, temp1_loc, temp1, component_offset, temp2_loc, /* needs_null_check */ false);
1754 __ CompareAndBranchIfZero(temp1, intrinsic_slow_path->GetEntryLabel());
1755 // If heap poisoning is enabled, `temp1` has been unpoisoned
1756 // by the previous call to GenerateFieldLoadWithBakerReadBarrier.
1757 // /* uint16_t */ temp1 = static_cast<uint16>(temp1->primitive_type_);
1758 __ LoadFromOffset(kLoadUnsignedHalfword, temp1, temp1, primitive_offset);
1759 static_assert(Primitive::kPrimNot == 0, "Expected 0 for kPrimNot");
1760 __ CompareAndBranchIfNonZero(temp1, intrinsic_slow_path->GetEntryLabel());
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001761 }
Roland Levillain0b671c02016-08-19 12:02:34 +01001762
1763 // /* HeapReference<Class> */ temp1 = dest->klass_
1764 codegen_->GenerateFieldLoadWithBakerReadBarrier(
1765 invoke, temp1_loc, dest, class_offset, temp2_loc, /* needs_null_check */ false);
1766
1767 if (!optimizations.GetDestinationIsNonPrimitiveArray()) {
1768 // Bail out if the destination is not a non primitive array.
1769 //
1770 // Register `temp1` is not trashed by the read barrier emitted
1771 // by GenerateFieldLoadWithBakerReadBarrier below, as that
1772 // method produces a call to a ReadBarrierMarkRegX entry point,
1773 // which saves all potentially live registers, including
1774 // temporaries such as `temp1`.
1775 // /* HeapReference<Class> */ temp2 = temp1->component_type_
1776 codegen_->GenerateFieldLoadWithBakerReadBarrier(
1777 invoke, temp2_loc, temp1, component_offset, temp3_loc, /* needs_null_check */ false);
1778 __ CompareAndBranchIfZero(temp2, intrinsic_slow_path->GetEntryLabel());
1779 // If heap poisoning is enabled, `temp2` has been unpoisoned
1780 // by the previous call to GenerateFieldLoadWithBakerReadBarrier.
1781 // /* uint16_t */ temp2 = static_cast<uint16>(temp2->primitive_type_);
1782 __ LoadFromOffset(kLoadUnsignedHalfword, temp2, temp2, primitive_offset);
1783 static_assert(Primitive::kPrimNot == 0, "Expected 0 for kPrimNot");
1784 __ CompareAndBranchIfNonZero(temp2, intrinsic_slow_path->GetEntryLabel());
1785 }
1786
1787 // For the same reason given earlier, `temp1` is not trashed by the
1788 // read barrier emitted by GenerateFieldLoadWithBakerReadBarrier below.
1789 // /* HeapReference<Class> */ temp2 = src->klass_
1790 codegen_->GenerateFieldLoadWithBakerReadBarrier(
1791 invoke, temp2_loc, src, class_offset, temp3_loc, /* needs_null_check */ false);
1792 // Note: if heap poisoning is on, we are comparing two unpoisoned references here.
1793 __ cmp(temp1, ShifterOperand(temp2));
1794
1795 if (optimizations.GetDestinationIsTypedObjectArray()) {
1796 Label do_copy;
1797 __ b(&do_copy, EQ);
1798 // /* HeapReference<Class> */ temp1 = temp1->component_type_
1799 codegen_->GenerateFieldLoadWithBakerReadBarrier(
1800 invoke, temp1_loc, temp1, component_offset, temp2_loc, /* needs_null_check */ false);
1801 // /* HeapReference<Class> */ temp1 = temp1->super_class_
1802 // We do not need to emit a read barrier for the following
1803 // heap reference load, as `temp1` is only used in a
1804 // comparison with null below, and this reference is not
1805 // kept afterwards.
1806 __ LoadFromOffset(kLoadWord, temp1, temp1, super_offset);
1807 __ CompareAndBranchIfNonZero(temp1, intrinsic_slow_path->GetEntryLabel());
1808 __ Bind(&do_copy);
1809 } else {
1810 __ b(intrinsic_slow_path->GetEntryLabel(), NE);
1811 }
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001812 } else {
Roland Levillain0b671c02016-08-19 12:02:34 +01001813 // Non read barrier code.
1814
1815 // /* HeapReference<Class> */ temp1 = dest->klass_
1816 __ LoadFromOffset(kLoadWord, temp1, dest, class_offset);
1817 // /* HeapReference<Class> */ temp2 = src->klass_
1818 __ LoadFromOffset(kLoadWord, temp2, src, class_offset);
1819 bool did_unpoison = false;
1820 if (!optimizations.GetDestinationIsNonPrimitiveArray() ||
1821 !optimizations.GetSourceIsNonPrimitiveArray()) {
1822 // One or two of the references need to be unpoisoned. Unpoison them
1823 // both to make the identity check valid.
1824 __ MaybeUnpoisonHeapReference(temp1);
1825 __ MaybeUnpoisonHeapReference(temp2);
1826 did_unpoison = true;
1827 }
1828
1829 if (!optimizations.GetDestinationIsNonPrimitiveArray()) {
1830 // Bail out if the destination is not a non primitive array.
1831 // /* HeapReference<Class> */ temp3 = temp1->component_type_
1832 __ LoadFromOffset(kLoadWord, temp3, temp1, component_offset);
1833 __ CompareAndBranchIfZero(temp3, intrinsic_slow_path->GetEntryLabel());
1834 __ MaybeUnpoisonHeapReference(temp3);
1835 // /* uint16_t */ temp3 = static_cast<uint16>(temp3->primitive_type_);
1836 __ LoadFromOffset(kLoadUnsignedHalfword, temp3, temp3, primitive_offset);
1837 static_assert(Primitive::kPrimNot == 0, "Expected 0 for kPrimNot");
1838 __ CompareAndBranchIfNonZero(temp3, intrinsic_slow_path->GetEntryLabel());
1839 }
1840
1841 if (!optimizations.GetSourceIsNonPrimitiveArray()) {
1842 // Bail out if the source is not a non primitive array.
1843 // /* HeapReference<Class> */ temp3 = temp2->component_type_
1844 __ LoadFromOffset(kLoadWord, temp3, temp2, component_offset);
1845 __ CompareAndBranchIfZero(temp3, intrinsic_slow_path->GetEntryLabel());
1846 __ MaybeUnpoisonHeapReference(temp3);
1847 // /* uint16_t */ temp3 = static_cast<uint16>(temp3->primitive_type_);
1848 __ LoadFromOffset(kLoadUnsignedHalfword, temp3, temp3, primitive_offset);
1849 static_assert(Primitive::kPrimNot == 0, "Expected 0 for kPrimNot");
1850 __ CompareAndBranchIfNonZero(temp3, intrinsic_slow_path->GetEntryLabel());
1851 }
1852
1853 __ cmp(temp1, ShifterOperand(temp2));
1854
1855 if (optimizations.GetDestinationIsTypedObjectArray()) {
1856 Label do_copy;
1857 __ b(&do_copy, EQ);
1858 if (!did_unpoison) {
1859 __ MaybeUnpoisonHeapReference(temp1);
1860 }
1861 // /* HeapReference<Class> */ temp1 = temp1->component_type_
1862 __ LoadFromOffset(kLoadWord, temp1, temp1, component_offset);
1863 __ MaybeUnpoisonHeapReference(temp1);
1864 // /* HeapReference<Class> */ temp1 = temp1->super_class_
1865 __ LoadFromOffset(kLoadWord, temp1, temp1, super_offset);
1866 // No need to unpoison the result, we're comparing against null.
1867 __ CompareAndBranchIfNonZero(temp1, intrinsic_slow_path->GetEntryLabel());
1868 __ Bind(&do_copy);
1869 } else {
1870 __ b(intrinsic_slow_path->GetEntryLabel(), NE);
1871 }
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001872 }
1873 } else if (!optimizations.GetSourceIsNonPrimitiveArray()) {
1874 DCHECK(optimizations.GetDestinationIsNonPrimitiveArray());
1875 // Bail out if the source is not a non primitive array.
Roland Levillain0b671c02016-08-19 12:02:34 +01001876 if (kEmitCompilerReadBarrier && kUseBakerReadBarrier) {
1877 // /* HeapReference<Class> */ temp1 = src->klass_
1878 codegen_->GenerateFieldLoadWithBakerReadBarrier(
1879 invoke, temp1_loc, src, class_offset, temp2_loc, /* needs_null_check */ false);
1880 // /* HeapReference<Class> */ temp3 = temp1->component_type_
1881 codegen_->GenerateFieldLoadWithBakerReadBarrier(
1882 invoke, temp3_loc, temp1, component_offset, temp2_loc, /* needs_null_check */ false);
1883 __ CompareAndBranchIfZero(temp3, intrinsic_slow_path->GetEntryLabel());
1884 // If heap poisoning is enabled, `temp3` has been unpoisoned
1885 // by the previous call to GenerateFieldLoadWithBakerReadBarrier.
1886 } else {
1887 // /* HeapReference<Class> */ temp1 = src->klass_
1888 __ LoadFromOffset(kLoadWord, temp1, src, class_offset);
1889 __ MaybeUnpoisonHeapReference(temp1);
1890 // /* HeapReference<Class> */ temp3 = temp1->component_type_
1891 __ LoadFromOffset(kLoadWord, temp3, temp1, component_offset);
1892 __ CompareAndBranchIfZero(temp3, intrinsic_slow_path->GetEntryLabel());
1893 __ MaybeUnpoisonHeapReference(temp3);
1894 }
1895 // /* uint16_t */ temp3 = static_cast<uint16>(temp3->primitive_type_);
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001896 __ LoadFromOffset(kLoadUnsignedHalfword, temp3, temp3, primitive_offset);
1897 static_assert(Primitive::kPrimNot == 0, "Expected 0 for kPrimNot");
Roland Levillain0b671c02016-08-19 12:02:34 +01001898 __ CompareAndBranchIfNonZero(temp3, intrinsic_slow_path->GetEntryLabel());
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001899 }
1900
Nicolas Geoffrayfea1abd2016-07-06 12:09:12 +01001901 int32_t element_size = Primitive::ComponentSize(Primitive::kPrimNot);
Roland Levillain0b671c02016-08-19 12:02:34 +01001902 uint32_t element_size_shift = Primitive::ComponentSizeShift(Primitive::kPrimNot);
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001903 uint32_t offset = mirror::Array::DataOffset(element_size).Uint32Value();
Roland Levillain0b671c02016-08-19 12:02:34 +01001904
1905 // Compute the base source address in `temp1`.
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001906 if (src_pos.IsConstant()) {
1907 int32_t constant = src_pos.GetConstant()->AsIntConstant()->GetValue();
1908 __ AddConstant(temp1, src, element_size * constant + offset);
1909 } else {
Roland Levillain0b671c02016-08-19 12:02:34 +01001910 __ add(temp1, src, ShifterOperand(src_pos.AsRegister<Register>(), LSL, element_size_shift));
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001911 __ AddConstant(temp1, offset);
1912 }
1913
Roland Levillain0b671c02016-08-19 12:02:34 +01001914 // Compute the end source address in `temp3`.
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001915 if (length.IsConstant()) {
1916 int32_t constant = length.GetConstant()->AsIntConstant()->GetValue();
1917 __ AddConstant(temp3, temp1, element_size * constant);
1918 } else {
Roland Levillain0b671c02016-08-19 12:02:34 +01001919 __ add(temp3, temp1, ShifterOperand(length.AsRegister<Register>(), LSL, element_size_shift));
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001920 }
1921
Roland Levillain0b671c02016-08-19 12:02:34 +01001922 if (kEmitCompilerReadBarrier && kUseBakerReadBarrier) {
1923 // The base destination address is computed later, as `temp2` is
1924 // used for intermediate computations.
1925
1926 // SystemArrayCopy implementation for Baker read barriers (see
1927 // also CodeGeneratorARM::GenerateReferenceLoadWithBakerReadBarrier):
1928 //
1929 // if (src_ptr != end_ptr) {
1930 // uint32_t rb_state = Lockword(src->monitor_).ReadBarrierState();
1931 // lfence; // Load fence or artificial data dependency to prevent load-load reordering
1932 // bool is_gray = (rb_state == ReadBarrier::gray_ptr_);
1933 // if (is_gray) {
1934 // // Slow-path copy.
1935 // do {
1936 // *dest_ptr++ = MaybePoison(ReadBarrier::Mark(MaybeUnpoison(*src_ptr++)));
1937 // } while (src_ptr != end_ptr)
1938 // } else {
1939 // // Fast-path copy.
1940 // do {
1941 // *dest_ptr++ = *src_ptr++;
1942 // } while (src_ptr != end_ptr)
1943 // }
1944 // }
1945
1946 Label loop, done;
1947
1948 // Don't enter copy loop if `length == 0`.
1949 __ cmp(temp1, ShifterOperand(temp3));
1950 __ b(&done, EQ);
1951
1952 // /* int32_t */ monitor = src->monitor_
1953 __ LoadFromOffset(kLoadWord, temp2, src, monitor_offset);
1954 // /* LockWord */ lock_word = LockWord(monitor)
1955 static_assert(sizeof(LockWord) == sizeof(int32_t),
1956 "art::LockWord and int32_t have different sizes.");
1957
1958 // Introduce a dependency on the lock_word including the rb_state,
1959 // which shall prevent load-load reordering without using
1960 // a memory barrier (which would be more expensive).
1961 // `src` is unchanged by this operation, but its value now depends
1962 // on `temp2`.
1963 __ add(src, src, ShifterOperand(temp2, LSR, 32));
1964
1965 // Slow path used to copy array when `src` is gray.
1966 SlowPathCode* read_barrier_slow_path =
1967 new (GetAllocator()) ReadBarrierSystemArrayCopySlowPathARM(invoke);
1968 codegen_->AddSlowPath(read_barrier_slow_path);
1969
1970 // Given the numeric representation, it's enough to check the low bit of the
1971 // rb_state. We do that by shifting the bit out of the lock word with LSRS
1972 // which can be a 16-bit instruction unlike the TST immediate.
1973 static_assert(ReadBarrier::white_ptr_ == 0, "Expecting white to have value 0");
1974 static_assert(ReadBarrier::gray_ptr_ == 1, "Expecting gray to have value 1");
1975 static_assert(ReadBarrier::black_ptr_ == 2, "Expecting black to have value 2");
1976 __ Lsrs(temp2, temp2, LockWord::kReadBarrierStateShift + 1);
1977 // Carry flag is the last bit shifted out by LSRS.
1978 __ b(read_barrier_slow_path->GetEntryLabel(), CS);
1979
1980 // Fast-path copy.
1981
1982 // Compute the base destination address in `temp2`.
1983 if (dest_pos.IsConstant()) {
1984 int32_t constant = dest_pos.GetConstant()->AsIntConstant()->GetValue();
1985 __ AddConstant(temp2, dest, element_size * constant + offset);
1986 } else {
1987 __ add(temp2, dest, ShifterOperand(dest_pos.AsRegister<Register>(), LSL, element_size_shift));
1988 __ AddConstant(temp2, offset);
1989 }
1990
1991 // Iterate over the arrays and do a raw copy of the objects. We don't need to
1992 // poison/unpoison.
1993 __ Bind(&loop);
1994 __ ldr(IP, Address(temp1, element_size, Address::PostIndex));
1995 __ str(IP, Address(temp2, element_size, Address::PostIndex));
1996 __ cmp(temp1, ShifterOperand(temp3));
1997 __ b(&loop, NE);
1998
1999 __ Bind(read_barrier_slow_path->GetExitLabel());
2000 __ Bind(&done);
2001 } else {
2002 // Non read barrier code.
2003
2004 // Compute the base destination address in `temp2`.
2005 if (dest_pos.IsConstant()) {
2006 int32_t constant = dest_pos.GetConstant()->AsIntConstant()->GetValue();
2007 __ AddConstant(temp2, dest, element_size * constant + offset);
2008 } else {
2009 __ add(temp2, dest, ShifterOperand(dest_pos.AsRegister<Register>(), LSL, element_size_shift));
2010 __ AddConstant(temp2, offset);
2011 }
2012
2013 // Iterate over the arrays and do a raw copy of the objects. We don't need to
2014 // poison/unpoison.
2015 Label loop, done;
2016 __ cmp(temp1, ShifterOperand(temp3));
2017 __ b(&done, EQ);
2018 __ Bind(&loop);
2019 __ ldr(IP, Address(temp1, element_size, Address::PostIndex));
2020 __ str(IP, Address(temp2, element_size, Address::PostIndex));
2021 __ cmp(temp1, ShifterOperand(temp3));
2022 __ b(&loop, NE);
2023 __ Bind(&done);
2024 }
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01002025
2026 // We only need one card marking on the destination array.
2027 codegen_->MarkGCCard(temp1,
2028 temp2,
2029 dest,
2030 Register(kNoRegister),
Roland Levillainebea3d22016-04-12 15:42:57 +01002031 /* value_can_be_null */ false);
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01002032
Roland Levillain0b671c02016-08-19 12:02:34 +01002033 __ Bind(intrinsic_slow_path->GetExitLabel());
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01002034}
2035
Anton Kirilovd70dc9d2016-02-04 14:59:04 +00002036static void CreateFPToFPCallLocations(ArenaAllocator* arena, HInvoke* invoke) {
2037 // If the graph is debuggable, all callee-saved floating-point registers are blocked by
2038 // the code generator. Furthermore, the register allocator creates fixed live intervals
2039 // for all caller-saved registers because we are doing a function call. As a result, if
2040 // the input and output locations are unallocated, the register allocator runs out of
2041 // registers and fails; however, a debuggable graph is not the common case.
2042 if (invoke->GetBlock()->GetGraph()->IsDebuggable()) {
2043 return;
2044 }
2045
2046 DCHECK_EQ(invoke->GetNumberOfArguments(), 1U);
2047 DCHECK_EQ(invoke->InputAt(0)->GetType(), Primitive::kPrimDouble);
2048 DCHECK_EQ(invoke->GetType(), Primitive::kPrimDouble);
2049
2050 LocationSummary* const locations = new (arena) LocationSummary(invoke,
Serban Constantinescu54ff4822016-07-07 18:03:19 +01002051 LocationSummary::kCallOnMainOnly,
Anton Kirilovd70dc9d2016-02-04 14:59:04 +00002052 kIntrinsified);
2053 const InvokeRuntimeCallingConvention calling_convention;
2054
2055 locations->SetInAt(0, Location::RequiresFpuRegister());
2056 locations->SetOut(Location::RequiresFpuRegister());
2057 // Native code uses the soft float ABI.
2058 locations->AddTemp(Location::RegisterLocation(calling_convention.GetRegisterAt(0)));
2059 locations->AddTemp(Location::RegisterLocation(calling_convention.GetRegisterAt(1)));
2060}
2061
2062static void CreateFPFPToFPCallLocations(ArenaAllocator* arena, HInvoke* invoke) {
2063 // If the graph is debuggable, all callee-saved floating-point registers are blocked by
2064 // the code generator. Furthermore, the register allocator creates fixed live intervals
2065 // for all caller-saved registers because we are doing a function call. As a result, if
2066 // the input and output locations are unallocated, the register allocator runs out of
2067 // registers and fails; however, a debuggable graph is not the common case.
2068 if (invoke->GetBlock()->GetGraph()->IsDebuggable()) {
2069 return;
2070 }
2071
2072 DCHECK_EQ(invoke->GetNumberOfArguments(), 2U);
2073 DCHECK_EQ(invoke->InputAt(0)->GetType(), Primitive::kPrimDouble);
2074 DCHECK_EQ(invoke->InputAt(1)->GetType(), Primitive::kPrimDouble);
2075 DCHECK_EQ(invoke->GetType(), Primitive::kPrimDouble);
2076
2077 LocationSummary* const locations = new (arena) LocationSummary(invoke,
Serban Constantinescu54ff4822016-07-07 18:03:19 +01002078 LocationSummary::kCallOnMainOnly,
Anton Kirilovd70dc9d2016-02-04 14:59:04 +00002079 kIntrinsified);
2080 const InvokeRuntimeCallingConvention calling_convention;
2081
2082 locations->SetInAt(0, Location::RequiresFpuRegister());
2083 locations->SetInAt(1, Location::RequiresFpuRegister());
2084 locations->SetOut(Location::RequiresFpuRegister());
2085 // Native code uses the soft float ABI.
2086 locations->AddTemp(Location::RegisterLocation(calling_convention.GetRegisterAt(0)));
2087 locations->AddTemp(Location::RegisterLocation(calling_convention.GetRegisterAt(1)));
2088 locations->AddTemp(Location::RegisterLocation(calling_convention.GetRegisterAt(2)));
2089 locations->AddTemp(Location::RegisterLocation(calling_convention.GetRegisterAt(3)));
2090}
2091
2092static void GenFPToFPCall(HInvoke* invoke,
2093 ArmAssembler* assembler,
2094 CodeGeneratorARM* codegen,
2095 QuickEntrypointEnum entry) {
2096 LocationSummary* const locations = invoke->GetLocations();
2097 const InvokeRuntimeCallingConvention calling_convention;
2098
2099 DCHECK_EQ(invoke->GetNumberOfArguments(), 1U);
2100 DCHECK(locations->WillCall() && locations->Intrinsified());
2101 DCHECK(!locations->GetLiveRegisters()->ContainsCoreRegister(calling_convention.GetRegisterAt(0)));
2102 DCHECK(!locations->GetLiveRegisters()->ContainsCoreRegister(calling_convention.GetRegisterAt(1)));
2103
Anton Kirilovd70dc9d2016-02-04 14:59:04 +00002104 // Native code uses the soft float ABI.
2105 __ vmovrrd(calling_convention.GetRegisterAt(0),
2106 calling_convention.GetRegisterAt(1),
2107 FromLowSToD(locations->InAt(0).AsFpuRegisterPairLow<SRegister>()));
Serban Constantinescu4bb30ac2016-06-22 17:04:45 +01002108 codegen->InvokeRuntime(entry, invoke, invoke->GetDexPc());
Anton Kirilovd70dc9d2016-02-04 14:59:04 +00002109 __ vmovdrr(FromLowSToD(locations->Out().AsFpuRegisterPairLow<SRegister>()),
2110 calling_convention.GetRegisterAt(0),
2111 calling_convention.GetRegisterAt(1));
2112}
2113
2114static void GenFPFPToFPCall(HInvoke* invoke,
2115 ArmAssembler* assembler,
2116 CodeGeneratorARM* codegen,
2117 QuickEntrypointEnum entry) {
2118 LocationSummary* const locations = invoke->GetLocations();
2119 const InvokeRuntimeCallingConvention calling_convention;
2120
2121 DCHECK_EQ(invoke->GetNumberOfArguments(), 2U);
2122 DCHECK(locations->WillCall() && locations->Intrinsified());
2123 DCHECK(!locations->GetLiveRegisters()->ContainsCoreRegister(calling_convention.GetRegisterAt(0)));
2124 DCHECK(!locations->GetLiveRegisters()->ContainsCoreRegister(calling_convention.GetRegisterAt(1)));
2125 DCHECK(!locations->GetLiveRegisters()->ContainsCoreRegister(calling_convention.GetRegisterAt(2)));
2126 DCHECK(!locations->GetLiveRegisters()->ContainsCoreRegister(calling_convention.GetRegisterAt(3)));
2127
Anton Kirilovd70dc9d2016-02-04 14:59:04 +00002128 // Native code uses the soft float ABI.
2129 __ vmovrrd(calling_convention.GetRegisterAt(0),
2130 calling_convention.GetRegisterAt(1),
2131 FromLowSToD(locations->InAt(0).AsFpuRegisterPairLow<SRegister>()));
2132 __ vmovrrd(calling_convention.GetRegisterAt(2),
2133 calling_convention.GetRegisterAt(3),
2134 FromLowSToD(locations->InAt(1).AsFpuRegisterPairLow<SRegister>()));
Serban Constantinescu4bb30ac2016-06-22 17:04:45 +01002135 codegen->InvokeRuntime(entry, invoke, invoke->GetDexPc());
Anton Kirilovd70dc9d2016-02-04 14:59:04 +00002136 __ vmovdrr(FromLowSToD(locations->Out().AsFpuRegisterPairLow<SRegister>()),
2137 calling_convention.GetRegisterAt(0),
2138 calling_convention.GetRegisterAt(1));
2139}
2140
2141void IntrinsicLocationsBuilderARM::VisitMathCos(HInvoke* invoke) {
2142 CreateFPToFPCallLocations(arena_, invoke);
2143}
2144
2145void IntrinsicCodeGeneratorARM::VisitMathCos(HInvoke* invoke) {
2146 GenFPToFPCall(invoke, GetAssembler(), codegen_, kQuickCos);
2147}
2148
2149void IntrinsicLocationsBuilderARM::VisitMathSin(HInvoke* invoke) {
2150 CreateFPToFPCallLocations(arena_, invoke);
2151}
2152
2153void IntrinsicCodeGeneratorARM::VisitMathSin(HInvoke* invoke) {
2154 GenFPToFPCall(invoke, GetAssembler(), codegen_, kQuickSin);
2155}
2156
2157void IntrinsicLocationsBuilderARM::VisitMathAcos(HInvoke* invoke) {
2158 CreateFPToFPCallLocations(arena_, invoke);
2159}
2160
2161void IntrinsicCodeGeneratorARM::VisitMathAcos(HInvoke* invoke) {
2162 GenFPToFPCall(invoke, GetAssembler(), codegen_, kQuickAcos);
2163}
2164
2165void IntrinsicLocationsBuilderARM::VisitMathAsin(HInvoke* invoke) {
2166 CreateFPToFPCallLocations(arena_, invoke);
2167}
2168
2169void IntrinsicCodeGeneratorARM::VisitMathAsin(HInvoke* invoke) {
2170 GenFPToFPCall(invoke, GetAssembler(), codegen_, kQuickAsin);
2171}
2172
2173void IntrinsicLocationsBuilderARM::VisitMathAtan(HInvoke* invoke) {
2174 CreateFPToFPCallLocations(arena_, invoke);
2175}
2176
2177void IntrinsicCodeGeneratorARM::VisitMathAtan(HInvoke* invoke) {
2178 GenFPToFPCall(invoke, GetAssembler(), codegen_, kQuickAtan);
2179}
2180
2181void IntrinsicLocationsBuilderARM::VisitMathCbrt(HInvoke* invoke) {
2182 CreateFPToFPCallLocations(arena_, invoke);
2183}
2184
2185void IntrinsicCodeGeneratorARM::VisitMathCbrt(HInvoke* invoke) {
2186 GenFPToFPCall(invoke, GetAssembler(), codegen_, kQuickCbrt);
2187}
2188
2189void IntrinsicLocationsBuilderARM::VisitMathCosh(HInvoke* invoke) {
2190 CreateFPToFPCallLocations(arena_, invoke);
2191}
2192
2193void IntrinsicCodeGeneratorARM::VisitMathCosh(HInvoke* invoke) {
2194 GenFPToFPCall(invoke, GetAssembler(), codegen_, kQuickCosh);
2195}
2196
2197void IntrinsicLocationsBuilderARM::VisitMathExp(HInvoke* invoke) {
2198 CreateFPToFPCallLocations(arena_, invoke);
2199}
2200
2201void IntrinsicCodeGeneratorARM::VisitMathExp(HInvoke* invoke) {
2202 GenFPToFPCall(invoke, GetAssembler(), codegen_, kQuickExp);
2203}
2204
2205void IntrinsicLocationsBuilderARM::VisitMathExpm1(HInvoke* invoke) {
2206 CreateFPToFPCallLocations(arena_, invoke);
2207}
2208
2209void IntrinsicCodeGeneratorARM::VisitMathExpm1(HInvoke* invoke) {
2210 GenFPToFPCall(invoke, GetAssembler(), codegen_, kQuickExpm1);
2211}
2212
2213void IntrinsicLocationsBuilderARM::VisitMathLog(HInvoke* invoke) {
2214 CreateFPToFPCallLocations(arena_, invoke);
2215}
2216
2217void IntrinsicCodeGeneratorARM::VisitMathLog(HInvoke* invoke) {
2218 GenFPToFPCall(invoke, GetAssembler(), codegen_, kQuickLog);
2219}
2220
2221void IntrinsicLocationsBuilderARM::VisitMathLog10(HInvoke* invoke) {
2222 CreateFPToFPCallLocations(arena_, invoke);
2223}
2224
2225void IntrinsicCodeGeneratorARM::VisitMathLog10(HInvoke* invoke) {
2226 GenFPToFPCall(invoke, GetAssembler(), codegen_, kQuickLog10);
2227}
2228
2229void IntrinsicLocationsBuilderARM::VisitMathSinh(HInvoke* invoke) {
2230 CreateFPToFPCallLocations(arena_, invoke);
2231}
2232
2233void IntrinsicCodeGeneratorARM::VisitMathSinh(HInvoke* invoke) {
2234 GenFPToFPCall(invoke, GetAssembler(), codegen_, kQuickSinh);
2235}
2236
2237void IntrinsicLocationsBuilderARM::VisitMathTan(HInvoke* invoke) {
2238 CreateFPToFPCallLocations(arena_, invoke);
2239}
2240
2241void IntrinsicCodeGeneratorARM::VisitMathTan(HInvoke* invoke) {
2242 GenFPToFPCall(invoke, GetAssembler(), codegen_, kQuickTan);
2243}
2244
2245void IntrinsicLocationsBuilderARM::VisitMathTanh(HInvoke* invoke) {
2246 CreateFPToFPCallLocations(arena_, invoke);
2247}
2248
2249void IntrinsicCodeGeneratorARM::VisitMathTanh(HInvoke* invoke) {
2250 GenFPToFPCall(invoke, GetAssembler(), codegen_, kQuickTanh);
2251}
2252
2253void IntrinsicLocationsBuilderARM::VisitMathAtan2(HInvoke* invoke) {
2254 CreateFPFPToFPCallLocations(arena_, invoke);
2255}
2256
2257void IntrinsicCodeGeneratorARM::VisitMathAtan2(HInvoke* invoke) {
2258 GenFPFPToFPCall(invoke, GetAssembler(), codegen_, kQuickAtan2);
2259}
2260
2261void IntrinsicLocationsBuilderARM::VisitMathHypot(HInvoke* invoke) {
2262 CreateFPFPToFPCallLocations(arena_, invoke);
2263}
2264
2265void IntrinsicCodeGeneratorARM::VisitMathHypot(HInvoke* invoke) {
2266 GenFPFPToFPCall(invoke, GetAssembler(), codegen_, kQuickHypot);
2267}
2268
2269void IntrinsicLocationsBuilderARM::VisitMathNextAfter(HInvoke* invoke) {
2270 CreateFPFPToFPCallLocations(arena_, invoke);
2271}
2272
2273void IntrinsicCodeGeneratorARM::VisitMathNextAfter(HInvoke* invoke) {
2274 GenFPFPToFPCall(invoke, GetAssembler(), codegen_, kQuickNextAfter);
2275}
2276
Artem Serovc257da72016-02-02 13:49:43 +00002277void IntrinsicLocationsBuilderARM::VisitIntegerReverse(HInvoke* invoke) {
2278 CreateIntToIntLocations(arena_, invoke);
2279}
2280
2281void IntrinsicCodeGeneratorARM::VisitIntegerReverse(HInvoke* invoke) {
2282 ArmAssembler* assembler = GetAssembler();
2283 LocationSummary* locations = invoke->GetLocations();
2284
2285 Register out = locations->Out().AsRegister<Register>();
2286 Register in = locations->InAt(0).AsRegister<Register>();
2287
2288 __ rbit(out, in);
2289}
2290
2291void IntrinsicLocationsBuilderARM::VisitLongReverse(HInvoke* invoke) {
2292 LocationSummary* locations = new (arena_) LocationSummary(invoke,
2293 LocationSummary::kNoCall,
2294 kIntrinsified);
2295 locations->SetInAt(0, Location::RequiresRegister());
2296 locations->SetOut(Location::RequiresRegister(), Location::kOutputOverlap);
2297}
2298
2299void IntrinsicCodeGeneratorARM::VisitLongReverse(HInvoke* invoke) {
2300 ArmAssembler* assembler = GetAssembler();
2301 LocationSummary* locations = invoke->GetLocations();
2302
2303 Register in_reg_lo = locations->InAt(0).AsRegisterPairLow<Register>();
2304 Register in_reg_hi = locations->InAt(0).AsRegisterPairHigh<Register>();
2305 Register out_reg_lo = locations->Out().AsRegisterPairLow<Register>();
2306 Register out_reg_hi = locations->Out().AsRegisterPairHigh<Register>();
2307
2308 __ rbit(out_reg_lo, in_reg_hi);
2309 __ rbit(out_reg_hi, in_reg_lo);
2310}
2311
2312void IntrinsicLocationsBuilderARM::VisitIntegerReverseBytes(HInvoke* invoke) {
2313 CreateIntToIntLocations(arena_, invoke);
2314}
2315
2316void IntrinsicCodeGeneratorARM::VisitIntegerReverseBytes(HInvoke* invoke) {
2317 ArmAssembler* assembler = GetAssembler();
2318 LocationSummary* locations = invoke->GetLocations();
2319
2320 Register out = locations->Out().AsRegister<Register>();
2321 Register in = locations->InAt(0).AsRegister<Register>();
2322
2323 __ rev(out, in);
2324}
2325
2326void IntrinsicLocationsBuilderARM::VisitLongReverseBytes(HInvoke* invoke) {
2327 LocationSummary* locations = new (arena_) LocationSummary(invoke,
2328 LocationSummary::kNoCall,
2329 kIntrinsified);
2330 locations->SetInAt(0, Location::RequiresRegister());
2331 locations->SetOut(Location::RequiresRegister(), Location::kOutputOverlap);
2332}
2333
2334void IntrinsicCodeGeneratorARM::VisitLongReverseBytes(HInvoke* invoke) {
2335 ArmAssembler* assembler = GetAssembler();
2336 LocationSummary* locations = invoke->GetLocations();
2337
2338 Register in_reg_lo = locations->InAt(0).AsRegisterPairLow<Register>();
2339 Register in_reg_hi = locations->InAt(0).AsRegisterPairHigh<Register>();
2340 Register out_reg_lo = locations->Out().AsRegisterPairLow<Register>();
2341 Register out_reg_hi = locations->Out().AsRegisterPairHigh<Register>();
2342
2343 __ rev(out_reg_lo, in_reg_hi);
2344 __ rev(out_reg_hi, in_reg_lo);
2345}
2346
2347void IntrinsicLocationsBuilderARM::VisitShortReverseBytes(HInvoke* invoke) {
2348 CreateIntToIntLocations(arena_, invoke);
2349}
2350
2351void IntrinsicCodeGeneratorARM::VisitShortReverseBytes(HInvoke* invoke) {
2352 ArmAssembler* assembler = GetAssembler();
2353 LocationSummary* locations = invoke->GetLocations();
2354
2355 Register out = locations->Out().AsRegister<Register>();
2356 Register in = locations->InAt(0).AsRegister<Register>();
2357
2358 __ revsh(out, in);
2359}
2360
xueliang.zhongf1073c82016-07-05 15:28:19 +01002361static void GenBitCount(HInvoke* instr, Primitive::Type type, ArmAssembler* assembler) {
2362 DCHECK(Primitive::IsIntOrLongType(type)) << type;
2363 DCHECK_EQ(instr->GetType(), Primitive::kPrimInt);
2364 DCHECK_EQ(Primitive::PrimitiveKind(instr->InputAt(0)->GetType()), type);
2365
2366 bool is_long = type == Primitive::kPrimLong;
2367 LocationSummary* locations = instr->GetLocations();
2368 Location in = locations->InAt(0);
2369 Register src_0 = is_long ? in.AsRegisterPairLow<Register>() : in.AsRegister<Register>();
2370 Register src_1 = is_long ? in.AsRegisterPairHigh<Register>() : src_0;
2371 SRegister tmp_s = locations->GetTemp(0).AsFpuRegisterPairLow<SRegister>();
2372 DRegister tmp_d = FromLowSToD(tmp_s);
2373 Register out_r = locations->Out().AsRegister<Register>();
2374
2375 // Move data from core register(s) to temp D-reg for bit count calculation, then move back.
2376 // According to Cortex A57 and A72 optimization guides, compared to transferring to full D-reg,
2377 // transferring data from core reg to upper or lower half of vfp D-reg requires extra latency,
2378 // That's why for integer bit count, we use 'vmov d0, r0, r0' instead of 'vmov d0[0], r0'.
2379 __ vmovdrr(tmp_d, src_1, src_0); // Temp DReg |--src_1|--src_0|
2380 __ vcntd(tmp_d, tmp_d); // Temp DReg |c|c|c|c|c|c|c|c|
2381 __ vpaddld(tmp_d, tmp_d, 8, /* is_unsigned */ true); // Temp DReg |--c|--c|--c|--c|
2382 __ vpaddld(tmp_d, tmp_d, 16, /* is_unsigned */ true); // Temp DReg |------c|------c|
2383 if (is_long) {
2384 __ vpaddld(tmp_d, tmp_d, 32, /* is_unsigned */ true); // Temp DReg |--------------c|
2385 }
2386 __ vmovrs(out_r, tmp_s);
2387}
2388
2389void IntrinsicLocationsBuilderARM::VisitIntegerBitCount(HInvoke* invoke) {
2390 CreateIntToIntLocations(arena_, invoke);
2391 invoke->GetLocations()->AddTemp(Location::RequiresFpuRegister());
2392}
2393
2394void IntrinsicCodeGeneratorARM::VisitIntegerBitCount(HInvoke* invoke) {
2395 GenBitCount(invoke, Primitive::kPrimInt, GetAssembler());
2396}
2397
2398void IntrinsicLocationsBuilderARM::VisitLongBitCount(HInvoke* invoke) {
2399 VisitIntegerBitCount(invoke);
2400}
2401
2402void IntrinsicCodeGeneratorARM::VisitLongBitCount(HInvoke* invoke) {
2403 GenBitCount(invoke, Primitive::kPrimLong, GetAssembler());
2404}
2405
Tim Zhang25abd6c2016-01-19 23:39:24 +08002406void IntrinsicLocationsBuilderARM::VisitStringGetCharsNoCheck(HInvoke* invoke) {
2407 LocationSummary* locations = new (arena_) LocationSummary(invoke,
2408 LocationSummary::kNoCall,
2409 kIntrinsified);
2410 locations->SetInAt(0, Location::RequiresRegister());
2411 locations->SetInAt(1, Location::RequiresRegister());
2412 locations->SetInAt(2, Location::RequiresRegister());
2413 locations->SetInAt(3, Location::RequiresRegister());
2414 locations->SetInAt(4, Location::RequiresRegister());
2415
Scott Wakeling3fdab772016-04-25 11:32:37 +01002416 // Temporary registers to store lengths of strings and for calculations.
Tim Zhang25abd6c2016-01-19 23:39:24 +08002417 locations->AddTemp(Location::RequiresRegister());
2418 locations->AddTemp(Location::RequiresRegister());
2419 locations->AddTemp(Location::RequiresRegister());
2420}
2421
2422void IntrinsicCodeGeneratorARM::VisitStringGetCharsNoCheck(HInvoke* invoke) {
2423 ArmAssembler* assembler = GetAssembler();
2424 LocationSummary* locations = invoke->GetLocations();
2425
2426 // Check assumption that sizeof(Char) is 2 (used in scaling below).
2427 const size_t char_size = Primitive::ComponentSize(Primitive::kPrimChar);
2428 DCHECK_EQ(char_size, 2u);
2429
2430 // Location of data in char array buffer.
2431 const uint32_t data_offset = mirror::Array::DataOffset(char_size).Uint32Value();
2432
2433 // Location of char array data in string.
2434 const uint32_t value_offset = mirror::String::ValueOffset().Uint32Value();
2435
2436 // void getCharsNoCheck(int srcBegin, int srcEnd, char[] dst, int dstBegin);
2437 // Since getChars() calls getCharsNoCheck() - we use registers rather than constants.
2438 Register srcObj = locations->InAt(0).AsRegister<Register>();
2439 Register srcBegin = locations->InAt(1).AsRegister<Register>();
2440 Register srcEnd = locations->InAt(2).AsRegister<Register>();
2441 Register dstObj = locations->InAt(3).AsRegister<Register>();
2442 Register dstBegin = locations->InAt(4).AsRegister<Register>();
2443
Scott Wakeling3fdab772016-04-25 11:32:37 +01002444 Register num_chr = locations->GetTemp(0).AsRegister<Register>();
2445 Register src_ptr = locations->GetTemp(1).AsRegister<Register>();
Tim Zhang25abd6c2016-01-19 23:39:24 +08002446 Register dst_ptr = locations->GetTemp(2).AsRegister<Register>();
Tim Zhang25abd6c2016-01-19 23:39:24 +08002447
jessicahandojo05765752016-09-09 19:01:32 -07002448 Label done, compressed_string_loop;
Tim Zhang25abd6c2016-01-19 23:39:24 +08002449 // dst to be copied.
2450 __ add(dst_ptr, dstObj, ShifterOperand(data_offset));
2451 __ add(dst_ptr, dst_ptr, ShifterOperand(dstBegin, LSL, 1));
2452
Scott Wakeling3fdab772016-04-25 11:32:37 +01002453 __ subs(num_chr, srcEnd, ShifterOperand(srcBegin));
Scott Wakeling3fdab772016-04-25 11:32:37 +01002454 // Early out for valid zero-length retrievals.
Tim Zhang25abd6c2016-01-19 23:39:24 +08002455 __ b(&done, EQ);
Scott Wakeling3fdab772016-04-25 11:32:37 +01002456
jessicahandojo05765752016-09-09 19:01:32 -07002457 // src range to copy.
2458 __ add(src_ptr, srcObj, ShifterOperand(value_offset));
2459 Label compressed_string_preloop;
2460 if (mirror::kUseStringCompression) {
2461 // Location of count in string.
2462 const uint32_t count_offset = mirror::String::CountOffset().Uint32Value();
2463 // String's length.
2464 __ ldr(IP, Address(srcObj, count_offset));
2465 __ cmp(IP, ShifterOperand(0));
2466 __ b(&compressed_string_preloop, LT);
2467 }
2468 __ add(src_ptr, src_ptr, ShifterOperand(srcBegin, LSL, 1));
2469
2470 // Do the copy.
2471 Label loop, remainder;
2472
Scott Wakeling3fdab772016-04-25 11:32:37 +01002473 // Save repairing the value of num_chr on the < 4 character path.
2474 __ subs(IP, num_chr, ShifterOperand(4));
2475 __ b(&remainder, LT);
2476
2477 // Keep the result of the earlier subs, we are going to fetch at least 4 characters.
2478 __ mov(num_chr, ShifterOperand(IP));
2479
2480 // Main loop used for longer fetches loads and stores 4x16-bit characters at a time.
2481 // (LDRD/STRD fault on unaligned addresses and it's not worth inlining extra code
2482 // to rectify these everywhere this intrinsic applies.)
2483 __ Bind(&loop);
2484 __ ldr(IP, Address(src_ptr, char_size * 2));
2485 __ subs(num_chr, num_chr, ShifterOperand(4));
2486 __ str(IP, Address(dst_ptr, char_size * 2));
2487 __ ldr(IP, Address(src_ptr, char_size * 4, Address::PostIndex));
2488 __ str(IP, Address(dst_ptr, char_size * 4, Address::PostIndex));
2489 __ b(&loop, GE);
2490
2491 __ adds(num_chr, num_chr, ShifterOperand(4));
2492 __ b(&done, EQ);
2493
2494 // Main loop for < 4 character case and remainder handling. Loads and stores one
2495 // 16-bit Java character at a time.
2496 __ Bind(&remainder);
2497 __ ldrh(IP, Address(src_ptr, char_size, Address::PostIndex));
2498 __ subs(num_chr, num_chr, ShifterOperand(1));
2499 __ strh(IP, Address(dst_ptr, char_size, Address::PostIndex));
2500 __ b(&remainder, GT);
jessicahandojo05765752016-09-09 19:01:32 -07002501 __ b(&done);
2502
2503 if (mirror::kUseStringCompression) {
2504 const size_t c_char_size = Primitive::ComponentSize(Primitive::kPrimByte);
2505 DCHECK_EQ(c_char_size, 1u);
2506 // Copy loop for compressed src, copying 1 character (8-bit) to (16-bit) at a time.
2507 __ Bind(&compressed_string_preloop);
2508 __ add(src_ptr, src_ptr, ShifterOperand(srcBegin));
2509 __ Bind(&compressed_string_loop);
2510 __ ldrb(IP, Address(src_ptr, c_char_size, Address::PostIndex));
2511 __ strh(IP, Address(dst_ptr, char_size, Address::PostIndex));
2512 __ subs(num_chr, num_chr, ShifterOperand(1));
2513 __ b(&compressed_string_loop, GT);
2514 }
Scott Wakeling3fdab772016-04-25 11:32:37 +01002515
Tim Zhang25abd6c2016-01-19 23:39:24 +08002516 __ Bind(&done);
2517}
2518
Anton Kirilova3ffea22016-04-07 17:02:37 +01002519void IntrinsicLocationsBuilderARM::VisitFloatIsInfinite(HInvoke* invoke) {
2520 CreateFPToIntLocations(arena_, invoke);
2521}
2522
2523void IntrinsicCodeGeneratorARM::VisitFloatIsInfinite(HInvoke* invoke) {
2524 ArmAssembler* const assembler = GetAssembler();
2525 LocationSummary* const locations = invoke->GetLocations();
2526 const Register out = locations->Out().AsRegister<Register>();
2527 // Shifting left by 1 bit makes the value encodable as an immediate operand;
2528 // we don't care about the sign bit anyway.
2529 constexpr uint32_t infinity = kPositiveInfinityFloat << 1U;
2530
2531 __ vmovrs(out, locations->InAt(0).AsFpuRegister<SRegister>());
2532 // We don't care about the sign bit, so shift left.
2533 __ Lsl(out, out, 1);
2534 __ eor(out, out, ShifterOperand(infinity));
2535 // If the result is 0, then it has 32 leading zeros, and less than that otherwise.
2536 __ clz(out, out);
2537 // Any number less than 32 logically shifted right by 5 bits results in 0;
2538 // the same operation on 32 yields 1.
2539 __ Lsr(out, out, 5);
2540}
2541
2542void IntrinsicLocationsBuilderARM::VisitDoubleIsInfinite(HInvoke* invoke) {
2543 CreateFPToIntLocations(arena_, invoke);
2544}
2545
2546void IntrinsicCodeGeneratorARM::VisitDoubleIsInfinite(HInvoke* invoke) {
2547 ArmAssembler* const assembler = GetAssembler();
2548 LocationSummary* const locations = invoke->GetLocations();
2549 const Register out = locations->Out().AsRegister<Register>();
2550 // The highest 32 bits of double precision positive infinity separated into
2551 // two constants encodable as immediate operands.
2552 constexpr uint32_t infinity_high = 0x7f000000U;
2553 constexpr uint32_t infinity_high2 = 0x00f00000U;
2554
2555 static_assert((infinity_high | infinity_high2) == static_cast<uint32_t>(kPositiveInfinityDouble >> 32U),
2556 "The constants do not add up to the high 32 bits of double precision positive infinity.");
2557 __ vmovrrd(IP, out, FromLowSToD(locations->InAt(0).AsFpuRegisterPairLow<SRegister>()));
2558 __ eor(out, out, ShifterOperand(infinity_high));
2559 __ eor(out, out, ShifterOperand(infinity_high2));
2560 // We don't care about the sign bit, so shift left.
2561 __ orr(out, IP, ShifterOperand(out, LSL, 1));
2562 // If the result is 0, then it has 32 leading zeros, and less than that otherwise.
2563 __ clz(out, out);
2564 // Any number less than 32 logically shifted right by 5 bits results in 0;
2565 // the same operation on 32 yields 1.
2566 __ Lsr(out, out, 5);
2567}
2568
Aart Bik2f9fcc92016-03-01 15:16:54 -08002569UNIMPLEMENTED_INTRINSIC(ARM, MathMinDoubleDouble)
2570UNIMPLEMENTED_INTRINSIC(ARM, MathMinFloatFloat)
2571UNIMPLEMENTED_INTRINSIC(ARM, MathMaxDoubleDouble)
2572UNIMPLEMENTED_INTRINSIC(ARM, MathMaxFloatFloat)
2573UNIMPLEMENTED_INTRINSIC(ARM, MathMinLongLong)
2574UNIMPLEMENTED_INTRINSIC(ARM, MathMaxLongLong)
2575UNIMPLEMENTED_INTRINSIC(ARM, MathCeil) // Could be done by changing rounding mode, maybe?
2576UNIMPLEMENTED_INTRINSIC(ARM, MathFloor) // Could be done by changing rounding mode, maybe?
2577UNIMPLEMENTED_INTRINSIC(ARM, MathRint)
2578UNIMPLEMENTED_INTRINSIC(ARM, MathRoundDouble) // Could be done by changing rounding mode, maybe?
2579UNIMPLEMENTED_INTRINSIC(ARM, MathRoundFloat) // Could be done by changing rounding mode, maybe?
2580UNIMPLEMENTED_INTRINSIC(ARM, UnsafeCASLong) // High register pressure.
2581UNIMPLEMENTED_INTRINSIC(ARM, SystemArrayCopyChar)
2582UNIMPLEMENTED_INTRINSIC(ARM, ReferenceGetReferent)
Aart Bik2f9fcc92016-03-01 15:16:54 -08002583UNIMPLEMENTED_INTRINSIC(ARM, IntegerHighestOneBit)
2584UNIMPLEMENTED_INTRINSIC(ARM, LongHighestOneBit)
2585UNIMPLEMENTED_INTRINSIC(ARM, IntegerLowestOneBit)
2586UNIMPLEMENTED_INTRINSIC(ARM, LongLowestOneBit)
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -08002587
Aart Bik0e54c012016-03-04 12:08:31 -08002588// 1.8.
2589UNIMPLEMENTED_INTRINSIC(ARM, UnsafeGetAndAddInt)
2590UNIMPLEMENTED_INTRINSIC(ARM, UnsafeGetAndAddLong)
2591UNIMPLEMENTED_INTRINSIC(ARM, UnsafeGetAndSetInt)
2592UNIMPLEMENTED_INTRINSIC(ARM, UnsafeGetAndSetLong)
2593UNIMPLEMENTED_INTRINSIC(ARM, UnsafeGetAndSetObject)
Aart Bik0e54c012016-03-04 12:08:31 -08002594
Aart Bik2f9fcc92016-03-01 15:16:54 -08002595UNREACHABLE_INTRINSICS(ARM)
Roland Levillain4d027112015-07-01 15:41:14 +01002596
2597#undef __
2598
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -08002599} // namespace arm
2600} // namespace art