blob: 5e5e9732a5b2435c6ad3829c3b141eefdfbb2b60 [file] [log] [blame]
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -08001/*
2 * Copyright (C) 2015 The Android Open Source Project
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 * http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
16
17#include "intrinsics_arm.h"
18
19#include "arch/arm/instruction_set_features_arm.h"
Mathieu Chartiere401d142015-04-22 13:56:20 -070020#include "art_method.h"
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -080021#include "code_generator_arm.h"
22#include "entrypoints/quick/quick_entrypoints.h"
23#include "intrinsics.h"
Andreas Gampe85b62f22015-09-09 13:15:38 -070024#include "intrinsics_utils.h"
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -080025#include "mirror/array-inl.h"
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -080026#include "mirror/string.h"
27#include "thread.h"
28#include "utils/arm/assembler_arm.h"
29
30namespace art {
31
32namespace arm {
33
34ArmAssembler* IntrinsicCodeGeneratorARM::GetAssembler() {
35 return codegen_->GetAssembler();
36}
37
38ArenaAllocator* IntrinsicCodeGeneratorARM::GetAllocator() {
39 return codegen_->GetGraph()->GetArena();
40}
41
Andreas Gampe85b62f22015-09-09 13:15:38 -070042using IntrinsicSlowPathARM = IntrinsicSlowPath<InvokeDexCallingConventionVisitorARM>;
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -080043
44bool IntrinsicLocationsBuilderARM::TryDispatch(HInvoke* invoke) {
45 Dispatch(invoke);
46 LocationSummary* res = invoke->GetLocations();
Roland Levillain3b359c72015-11-17 19:35:12 +000047 if (res == nullptr) {
48 return false;
49 }
50 if (kEmitCompilerReadBarrier && res->CanCall()) {
51 // Generating an intrinsic for this HInvoke may produce an
52 // IntrinsicSlowPathARM slow path. Currently this approach
53 // does not work when using read barriers, as the emitted
54 // calling sequence will make use of another slow path
55 // (ReadBarrierForRootSlowPathARM for HInvokeStaticOrDirect,
56 // ReadBarrierSlowPathARM for HInvokeVirtual). So we bail
57 // out in this case.
58 //
59 // TODO: Find a way to have intrinsics work with read barriers.
60 invoke->SetLocations(nullptr);
61 return false;
62 }
63 return res->Intrinsified();
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -080064}
65
66#define __ assembler->
67
68static void CreateFPToIntLocations(ArenaAllocator* arena, HInvoke* invoke) {
69 LocationSummary* locations = new (arena) LocationSummary(invoke,
70 LocationSummary::kNoCall,
71 kIntrinsified);
72 locations->SetInAt(0, Location::RequiresFpuRegister());
73 locations->SetOut(Location::RequiresRegister());
74}
75
76static void CreateIntToFPLocations(ArenaAllocator* arena, HInvoke* invoke) {
77 LocationSummary* locations = new (arena) LocationSummary(invoke,
78 LocationSummary::kNoCall,
79 kIntrinsified);
80 locations->SetInAt(0, Location::RequiresRegister());
81 locations->SetOut(Location::RequiresFpuRegister());
82}
83
84static void MoveFPToInt(LocationSummary* locations, bool is64bit, ArmAssembler* assembler) {
85 Location input = locations->InAt(0);
86 Location output = locations->Out();
87 if (is64bit) {
88 __ vmovrrd(output.AsRegisterPairLow<Register>(),
89 output.AsRegisterPairHigh<Register>(),
90 FromLowSToD(input.AsFpuRegisterPairLow<SRegister>()));
91 } else {
92 __ vmovrs(output.AsRegister<Register>(), input.AsFpuRegister<SRegister>());
93 }
94}
95
96static void MoveIntToFP(LocationSummary* locations, bool is64bit, ArmAssembler* assembler) {
97 Location input = locations->InAt(0);
98 Location output = locations->Out();
99 if (is64bit) {
100 __ vmovdrr(FromLowSToD(output.AsFpuRegisterPairLow<SRegister>()),
101 input.AsRegisterPairLow<Register>(),
102 input.AsRegisterPairHigh<Register>());
103 } else {
104 __ vmovsr(output.AsFpuRegister<SRegister>(), input.AsRegister<Register>());
105 }
106}
107
108void IntrinsicLocationsBuilderARM::VisitDoubleDoubleToRawLongBits(HInvoke* invoke) {
109 CreateFPToIntLocations(arena_, invoke);
110}
111void IntrinsicLocationsBuilderARM::VisitDoubleLongBitsToDouble(HInvoke* invoke) {
112 CreateIntToFPLocations(arena_, invoke);
113}
114
115void IntrinsicCodeGeneratorARM::VisitDoubleDoubleToRawLongBits(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000116 MoveFPToInt(invoke->GetLocations(), /* is64bit */ true, GetAssembler());
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800117}
118void IntrinsicCodeGeneratorARM::VisitDoubleLongBitsToDouble(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000119 MoveIntToFP(invoke->GetLocations(), /* is64bit */ true, GetAssembler());
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800120}
121
122void IntrinsicLocationsBuilderARM::VisitFloatFloatToRawIntBits(HInvoke* invoke) {
123 CreateFPToIntLocations(arena_, invoke);
124}
125void IntrinsicLocationsBuilderARM::VisitFloatIntBitsToFloat(HInvoke* invoke) {
126 CreateIntToFPLocations(arena_, invoke);
127}
128
129void IntrinsicCodeGeneratorARM::VisitFloatFloatToRawIntBits(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000130 MoveFPToInt(invoke->GetLocations(), /* is64bit */ false, GetAssembler());
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800131}
132void IntrinsicCodeGeneratorARM::VisitFloatIntBitsToFloat(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000133 MoveIntToFP(invoke->GetLocations(), /* is64bit */ false, GetAssembler());
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800134}
135
136static void CreateIntToIntLocations(ArenaAllocator* arena, HInvoke* invoke) {
137 LocationSummary* locations = new (arena) LocationSummary(invoke,
138 LocationSummary::kNoCall,
139 kIntrinsified);
140 locations->SetInAt(0, Location::RequiresRegister());
141 locations->SetOut(Location::RequiresRegister(), Location::kNoOutputOverlap);
142}
143
144static void CreateFPToFPLocations(ArenaAllocator* arena, HInvoke* invoke) {
145 LocationSummary* locations = new (arena) LocationSummary(invoke,
146 LocationSummary::kNoCall,
147 kIntrinsified);
148 locations->SetInAt(0, Location::RequiresFpuRegister());
149 locations->SetOut(Location::RequiresFpuRegister(), Location::kNoOutputOverlap);
150}
151
Scott Wakeling611d3392015-07-10 11:42:06 +0100152static void GenNumberOfLeadingZeros(LocationSummary* locations,
153 Primitive::Type type,
154 ArmAssembler* assembler) {
155 Location in = locations->InAt(0);
156 Register out = locations->Out().AsRegister<Register>();
157
158 DCHECK((type == Primitive::kPrimInt) || (type == Primitive::kPrimLong));
159
160 if (type == Primitive::kPrimLong) {
161 Register in_reg_lo = in.AsRegisterPairLow<Register>();
162 Register in_reg_hi = in.AsRegisterPairHigh<Register>();
163 Label end;
164 __ clz(out, in_reg_hi);
165 __ CompareAndBranchIfNonZero(in_reg_hi, &end);
166 __ clz(out, in_reg_lo);
167 __ AddConstant(out, 32);
168 __ Bind(&end);
169 } else {
170 __ clz(out, in.AsRegister<Register>());
171 }
172}
173
174void IntrinsicLocationsBuilderARM::VisitIntegerNumberOfLeadingZeros(HInvoke* invoke) {
175 CreateIntToIntLocations(arena_, invoke);
176}
177
178void IntrinsicCodeGeneratorARM::VisitIntegerNumberOfLeadingZeros(HInvoke* invoke) {
179 GenNumberOfLeadingZeros(invoke->GetLocations(), Primitive::kPrimInt, GetAssembler());
180}
181
182void IntrinsicLocationsBuilderARM::VisitLongNumberOfLeadingZeros(HInvoke* invoke) {
183 LocationSummary* locations = new (arena_) LocationSummary(invoke,
184 LocationSummary::kNoCall,
185 kIntrinsified);
186 locations->SetInAt(0, Location::RequiresRegister());
187 locations->SetOut(Location::RequiresRegister(), Location::kOutputOverlap);
188}
189
190void IntrinsicCodeGeneratorARM::VisitLongNumberOfLeadingZeros(HInvoke* invoke) {
191 GenNumberOfLeadingZeros(invoke->GetLocations(), Primitive::kPrimLong, GetAssembler());
192}
193
Scott Wakeling9ee23f42015-07-23 10:44:35 +0100194static void GenNumberOfTrailingZeros(LocationSummary* locations,
195 Primitive::Type type,
196 ArmAssembler* assembler) {
197 DCHECK((type == Primitive::kPrimInt) || (type == Primitive::kPrimLong));
198
199 Register out = locations->Out().AsRegister<Register>();
200
201 if (type == Primitive::kPrimLong) {
202 Register in_reg_lo = locations->InAt(0).AsRegisterPairLow<Register>();
203 Register in_reg_hi = locations->InAt(0).AsRegisterPairHigh<Register>();
204 Label end;
205 __ rbit(out, in_reg_lo);
206 __ clz(out, out);
207 __ CompareAndBranchIfNonZero(in_reg_lo, &end);
208 __ rbit(out, in_reg_hi);
209 __ clz(out, out);
210 __ AddConstant(out, 32);
211 __ Bind(&end);
212 } else {
213 Register in = locations->InAt(0).AsRegister<Register>();
214 __ rbit(out, in);
215 __ clz(out, out);
216 }
217}
218
219void IntrinsicLocationsBuilderARM::VisitIntegerNumberOfTrailingZeros(HInvoke* invoke) {
220 LocationSummary* locations = new (arena_) LocationSummary(invoke,
221 LocationSummary::kNoCall,
222 kIntrinsified);
223 locations->SetInAt(0, Location::RequiresRegister());
224 locations->SetOut(Location::RequiresRegister(), Location::kNoOutputOverlap);
225}
226
227void IntrinsicCodeGeneratorARM::VisitIntegerNumberOfTrailingZeros(HInvoke* invoke) {
228 GenNumberOfTrailingZeros(invoke->GetLocations(), Primitive::kPrimInt, GetAssembler());
229}
230
231void IntrinsicLocationsBuilderARM::VisitLongNumberOfTrailingZeros(HInvoke* invoke) {
232 LocationSummary* locations = new (arena_) LocationSummary(invoke,
233 LocationSummary::kNoCall,
234 kIntrinsified);
235 locations->SetInAt(0, Location::RequiresRegister());
236 locations->SetOut(Location::RequiresRegister(), Location::kOutputOverlap);
237}
238
239void IntrinsicCodeGeneratorARM::VisitLongNumberOfTrailingZeros(HInvoke* invoke) {
240 GenNumberOfTrailingZeros(invoke->GetLocations(), Primitive::kPrimLong, GetAssembler());
241}
242
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800243static void MathAbsFP(LocationSummary* locations, bool is64bit, ArmAssembler* assembler) {
244 Location in = locations->InAt(0);
245 Location out = locations->Out();
246
247 if (is64bit) {
248 __ vabsd(FromLowSToD(out.AsFpuRegisterPairLow<SRegister>()),
249 FromLowSToD(in.AsFpuRegisterPairLow<SRegister>()));
250 } else {
251 __ vabss(out.AsFpuRegister<SRegister>(), in.AsFpuRegister<SRegister>());
252 }
253}
254
255void IntrinsicLocationsBuilderARM::VisitMathAbsDouble(HInvoke* invoke) {
256 CreateFPToFPLocations(arena_, invoke);
257}
258
259void IntrinsicCodeGeneratorARM::VisitMathAbsDouble(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000260 MathAbsFP(invoke->GetLocations(), /* is64bit */ true, GetAssembler());
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800261}
262
263void IntrinsicLocationsBuilderARM::VisitMathAbsFloat(HInvoke* invoke) {
264 CreateFPToFPLocations(arena_, invoke);
265}
266
267void IntrinsicCodeGeneratorARM::VisitMathAbsFloat(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000268 MathAbsFP(invoke->GetLocations(), /* is64bit */ false, GetAssembler());
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800269}
270
271static void CreateIntToIntPlusTemp(ArenaAllocator* arena, HInvoke* invoke) {
272 LocationSummary* locations = new (arena) LocationSummary(invoke,
273 LocationSummary::kNoCall,
274 kIntrinsified);
275 locations->SetInAt(0, Location::RequiresRegister());
276 locations->SetOut(Location::RequiresRegister(), Location::kNoOutputOverlap);
277
278 locations->AddTemp(Location::RequiresRegister());
279}
280
281static void GenAbsInteger(LocationSummary* locations,
282 bool is64bit,
283 ArmAssembler* assembler) {
284 Location in = locations->InAt(0);
285 Location output = locations->Out();
286
287 Register mask = locations->GetTemp(0).AsRegister<Register>();
288
289 if (is64bit) {
290 Register in_reg_lo = in.AsRegisterPairLow<Register>();
291 Register in_reg_hi = in.AsRegisterPairHigh<Register>();
292 Register out_reg_lo = output.AsRegisterPairLow<Register>();
293 Register out_reg_hi = output.AsRegisterPairHigh<Register>();
294
295 DCHECK_NE(out_reg_lo, in_reg_hi) << "Diagonal overlap unexpected.";
296
297 __ Asr(mask, in_reg_hi, 31);
298 __ adds(out_reg_lo, in_reg_lo, ShifterOperand(mask));
299 __ adc(out_reg_hi, in_reg_hi, ShifterOperand(mask));
300 __ eor(out_reg_lo, mask, ShifterOperand(out_reg_lo));
301 __ eor(out_reg_hi, mask, ShifterOperand(out_reg_hi));
302 } else {
303 Register in_reg = in.AsRegister<Register>();
304 Register out_reg = output.AsRegister<Register>();
305
306 __ Asr(mask, in_reg, 31);
307 __ add(out_reg, in_reg, ShifterOperand(mask));
308 __ eor(out_reg, mask, ShifterOperand(out_reg));
309 }
310}
311
312void IntrinsicLocationsBuilderARM::VisitMathAbsInt(HInvoke* invoke) {
313 CreateIntToIntPlusTemp(arena_, invoke);
314}
315
316void IntrinsicCodeGeneratorARM::VisitMathAbsInt(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000317 GenAbsInteger(invoke->GetLocations(), /* is64bit */ false, GetAssembler());
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800318}
319
320
321void IntrinsicLocationsBuilderARM::VisitMathAbsLong(HInvoke* invoke) {
322 CreateIntToIntPlusTemp(arena_, invoke);
323}
324
325void IntrinsicCodeGeneratorARM::VisitMathAbsLong(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000326 GenAbsInteger(invoke->GetLocations(), /* is64bit */ true, GetAssembler());
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800327}
328
329static void GenMinMax(LocationSummary* locations,
330 bool is_min,
331 ArmAssembler* assembler) {
332 Register op1 = locations->InAt(0).AsRegister<Register>();
333 Register op2 = locations->InAt(1).AsRegister<Register>();
334 Register out = locations->Out().AsRegister<Register>();
335
336 __ cmp(op1, ShifterOperand(op2));
337
338 __ it((is_min) ? Condition::LT : Condition::GT, kItElse);
339 __ mov(out, ShifterOperand(op1), is_min ? Condition::LT : Condition::GT);
340 __ mov(out, ShifterOperand(op2), is_min ? Condition::GE : Condition::LE);
341}
342
343static void CreateIntIntToIntLocations(ArenaAllocator* arena, HInvoke* invoke) {
344 LocationSummary* locations = new (arena) LocationSummary(invoke,
345 LocationSummary::kNoCall,
346 kIntrinsified);
347 locations->SetInAt(0, Location::RequiresRegister());
348 locations->SetInAt(1, Location::RequiresRegister());
349 locations->SetOut(Location::RequiresRegister(), Location::kNoOutputOverlap);
350}
351
352void IntrinsicLocationsBuilderARM::VisitMathMinIntInt(HInvoke* invoke) {
353 CreateIntIntToIntLocations(arena_, invoke);
354}
355
356void IntrinsicCodeGeneratorARM::VisitMathMinIntInt(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000357 GenMinMax(invoke->GetLocations(), /* is_min */ true, GetAssembler());
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800358}
359
360void IntrinsicLocationsBuilderARM::VisitMathMaxIntInt(HInvoke* invoke) {
361 CreateIntIntToIntLocations(arena_, invoke);
362}
363
364void IntrinsicCodeGeneratorARM::VisitMathMaxIntInt(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000365 GenMinMax(invoke->GetLocations(), /* is_min */ false, GetAssembler());
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800366}
367
368void IntrinsicLocationsBuilderARM::VisitMathSqrt(HInvoke* invoke) {
369 CreateFPToFPLocations(arena_, invoke);
370}
371
372void IntrinsicCodeGeneratorARM::VisitMathSqrt(HInvoke* invoke) {
373 LocationSummary* locations = invoke->GetLocations();
374 ArmAssembler* assembler = GetAssembler();
375 __ vsqrtd(FromLowSToD(locations->Out().AsFpuRegisterPairLow<SRegister>()),
376 FromLowSToD(locations->InAt(0).AsFpuRegisterPairLow<SRegister>()));
377}
378
379void IntrinsicLocationsBuilderARM::VisitMemoryPeekByte(HInvoke* invoke) {
380 CreateIntToIntLocations(arena_, invoke);
381}
382
383void IntrinsicCodeGeneratorARM::VisitMemoryPeekByte(HInvoke* invoke) {
384 ArmAssembler* assembler = GetAssembler();
385 // Ignore upper 4B of long address.
386 __ ldrsb(invoke->GetLocations()->Out().AsRegister<Register>(),
387 Address(invoke->GetLocations()->InAt(0).AsRegisterPairLow<Register>()));
388}
389
390void IntrinsicLocationsBuilderARM::VisitMemoryPeekIntNative(HInvoke* invoke) {
391 CreateIntToIntLocations(arena_, invoke);
392}
393
394void IntrinsicCodeGeneratorARM::VisitMemoryPeekIntNative(HInvoke* invoke) {
395 ArmAssembler* assembler = GetAssembler();
396 // Ignore upper 4B of long address.
397 __ ldr(invoke->GetLocations()->Out().AsRegister<Register>(),
398 Address(invoke->GetLocations()->InAt(0).AsRegisterPairLow<Register>()));
399}
400
401void IntrinsicLocationsBuilderARM::VisitMemoryPeekLongNative(HInvoke* invoke) {
402 CreateIntToIntLocations(arena_, invoke);
403}
404
405void IntrinsicCodeGeneratorARM::VisitMemoryPeekLongNative(HInvoke* invoke) {
406 ArmAssembler* assembler = GetAssembler();
407 // Ignore upper 4B of long address.
408 Register addr = invoke->GetLocations()->InAt(0).AsRegisterPairLow<Register>();
409 // Worst case: Control register bit SCTLR.A = 0. Then unaligned accesses throw a processor
410 // exception. So we can't use ldrd as addr may be unaligned.
411 Register lo = invoke->GetLocations()->Out().AsRegisterPairLow<Register>();
412 Register hi = invoke->GetLocations()->Out().AsRegisterPairHigh<Register>();
413 if (addr == lo) {
414 __ ldr(hi, Address(addr, 4));
415 __ ldr(lo, Address(addr, 0));
416 } else {
417 __ ldr(lo, Address(addr, 0));
418 __ ldr(hi, Address(addr, 4));
419 }
420}
421
422void IntrinsicLocationsBuilderARM::VisitMemoryPeekShortNative(HInvoke* invoke) {
423 CreateIntToIntLocations(arena_, invoke);
424}
425
426void IntrinsicCodeGeneratorARM::VisitMemoryPeekShortNative(HInvoke* invoke) {
427 ArmAssembler* assembler = GetAssembler();
428 // Ignore upper 4B of long address.
429 __ ldrsh(invoke->GetLocations()->Out().AsRegister<Register>(),
430 Address(invoke->GetLocations()->InAt(0).AsRegisterPairLow<Register>()));
431}
432
433static void CreateIntIntToVoidLocations(ArenaAllocator* arena, HInvoke* invoke) {
434 LocationSummary* locations = new (arena) LocationSummary(invoke,
435 LocationSummary::kNoCall,
436 kIntrinsified);
437 locations->SetInAt(0, Location::RequiresRegister());
438 locations->SetInAt(1, Location::RequiresRegister());
439}
440
441void IntrinsicLocationsBuilderARM::VisitMemoryPokeByte(HInvoke* invoke) {
442 CreateIntIntToVoidLocations(arena_, invoke);
443}
444
445void IntrinsicCodeGeneratorARM::VisitMemoryPokeByte(HInvoke* invoke) {
446 ArmAssembler* assembler = GetAssembler();
447 __ strb(invoke->GetLocations()->InAt(1).AsRegister<Register>(),
448 Address(invoke->GetLocations()->InAt(0).AsRegisterPairLow<Register>()));
449}
450
451void IntrinsicLocationsBuilderARM::VisitMemoryPokeIntNative(HInvoke* invoke) {
452 CreateIntIntToVoidLocations(arena_, invoke);
453}
454
455void IntrinsicCodeGeneratorARM::VisitMemoryPokeIntNative(HInvoke* invoke) {
456 ArmAssembler* assembler = GetAssembler();
457 __ str(invoke->GetLocations()->InAt(1).AsRegister<Register>(),
458 Address(invoke->GetLocations()->InAt(0).AsRegisterPairLow<Register>()));
459}
460
461void IntrinsicLocationsBuilderARM::VisitMemoryPokeLongNative(HInvoke* invoke) {
462 CreateIntIntToVoidLocations(arena_, invoke);
463}
464
465void IntrinsicCodeGeneratorARM::VisitMemoryPokeLongNative(HInvoke* invoke) {
466 ArmAssembler* assembler = GetAssembler();
467 // Ignore upper 4B of long address.
468 Register addr = invoke->GetLocations()->InAt(0).AsRegisterPairLow<Register>();
469 // Worst case: Control register bit SCTLR.A = 0. Then unaligned accesses throw a processor
470 // exception. So we can't use ldrd as addr may be unaligned.
471 __ str(invoke->GetLocations()->InAt(1).AsRegisterPairLow<Register>(), Address(addr, 0));
472 __ str(invoke->GetLocations()->InAt(1).AsRegisterPairHigh<Register>(), Address(addr, 4));
473}
474
475void IntrinsicLocationsBuilderARM::VisitMemoryPokeShortNative(HInvoke* invoke) {
476 CreateIntIntToVoidLocations(arena_, invoke);
477}
478
479void IntrinsicCodeGeneratorARM::VisitMemoryPokeShortNative(HInvoke* invoke) {
480 ArmAssembler* assembler = GetAssembler();
481 __ strh(invoke->GetLocations()->InAt(1).AsRegister<Register>(),
482 Address(invoke->GetLocations()->InAt(0).AsRegisterPairLow<Register>()));
483}
484
485void IntrinsicLocationsBuilderARM::VisitThreadCurrentThread(HInvoke* invoke) {
486 LocationSummary* locations = new (arena_) LocationSummary(invoke,
487 LocationSummary::kNoCall,
488 kIntrinsified);
489 locations->SetOut(Location::RequiresRegister());
490}
491
492void IntrinsicCodeGeneratorARM::VisitThreadCurrentThread(HInvoke* invoke) {
493 ArmAssembler* assembler = GetAssembler();
494 __ LoadFromOffset(kLoadWord,
495 invoke->GetLocations()->Out().AsRegister<Register>(),
496 TR,
497 Thread::PeerOffset<kArmPointerSize>().Int32Value());
498}
499
500static void GenUnsafeGet(HInvoke* invoke,
501 Primitive::Type type,
502 bool is_volatile,
503 CodeGeneratorARM* codegen) {
504 LocationSummary* locations = invoke->GetLocations();
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800505 ArmAssembler* assembler = codegen->GetAssembler();
Roland Levillain3b359c72015-11-17 19:35:12 +0000506 Location base_loc = locations->InAt(1);
507 Register base = base_loc.AsRegister<Register>(); // Object pointer.
508 Location offset_loc = locations->InAt(2);
509 Register offset = offset_loc.AsRegisterPairLow<Register>(); // Long offset, lo part only.
510 Location trg_loc = locations->Out();
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800511
Roland Levillainc9285912015-12-18 10:38:42 +0000512 switch (type) {
513 case Primitive::kPrimInt: {
514 Register trg = trg_loc.AsRegister<Register>();
515 __ ldr(trg, Address(base, offset));
516 if (is_volatile) {
517 __ dmb(ISH);
518 }
519 break;
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800520 }
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800521
Roland Levillainc9285912015-12-18 10:38:42 +0000522 case Primitive::kPrimNot: {
523 Register trg = trg_loc.AsRegister<Register>();
524 if (kEmitCompilerReadBarrier) {
525 if (kUseBakerReadBarrier) {
526 Location temp = locations->GetTemp(0);
527 codegen->GenerateArrayLoadWithBakerReadBarrier(
528 invoke, trg_loc, base, 0U, offset_loc, temp, /* needs_null_check */ false);
529 if (is_volatile) {
530 __ dmb(ISH);
531 }
532 } else {
533 __ ldr(trg, Address(base, offset));
534 if (is_volatile) {
535 __ dmb(ISH);
536 }
537 codegen->GenerateReadBarrierSlow(invoke, trg_loc, trg_loc, base_loc, 0U, offset_loc);
538 }
539 } else {
540 __ ldr(trg, Address(base, offset));
541 if (is_volatile) {
542 __ dmb(ISH);
543 }
544 __ MaybeUnpoisonHeapReference(trg);
545 }
546 break;
547 }
Roland Levillain4d027112015-07-01 15:41:14 +0100548
Roland Levillainc9285912015-12-18 10:38:42 +0000549 case Primitive::kPrimLong: {
550 Register trg_lo = trg_loc.AsRegisterPairLow<Register>();
551 __ add(IP, base, ShifterOperand(offset));
552 if (is_volatile && !codegen->GetInstructionSetFeatures().HasAtomicLdrdAndStrd()) {
553 Register trg_hi = trg_loc.AsRegisterPairHigh<Register>();
554 __ ldrexd(trg_lo, trg_hi, IP);
555 } else {
556 __ ldrd(trg_lo, Address(IP));
557 }
558 if (is_volatile) {
559 __ dmb(ISH);
560 }
561 break;
562 }
563
564 default:
565 LOG(FATAL) << "Unexpected type " << type;
566 UNREACHABLE();
Roland Levillain4d027112015-07-01 15:41:14 +0100567 }
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800568}
569
Roland Levillainc9285912015-12-18 10:38:42 +0000570static void CreateIntIntIntToIntLocations(ArenaAllocator* arena,
571 HInvoke* invoke,
572 Primitive::Type type) {
Roland Levillain3b359c72015-11-17 19:35:12 +0000573 bool can_call = kEmitCompilerReadBarrier &&
574 (invoke->GetIntrinsic() == Intrinsics::kUnsafeGetObject ||
575 invoke->GetIntrinsic() == Intrinsics::kUnsafeGetObjectVolatile);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800576 LocationSummary* locations = new (arena) LocationSummary(invoke,
Roland Levillain3b359c72015-11-17 19:35:12 +0000577 can_call ?
578 LocationSummary::kCallOnSlowPath :
579 LocationSummary::kNoCall,
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800580 kIntrinsified);
581 locations->SetInAt(0, Location::NoLocation()); // Unused receiver.
582 locations->SetInAt(1, Location::RequiresRegister());
583 locations->SetInAt(2, Location::RequiresRegister());
584 locations->SetOut(Location::RequiresRegister(), Location::kNoOutputOverlap);
Roland Levillainc9285912015-12-18 10:38:42 +0000585 if (type == Primitive::kPrimNot && kEmitCompilerReadBarrier && kUseBakerReadBarrier) {
586 // We need a temporary register for the read barrier marking slow
587 // path in InstructionCodeGeneratorARM::GenerateArrayLoadWithBakerReadBarrier.
588 locations->AddTemp(Location::RequiresRegister());
589 }
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800590}
591
592void IntrinsicLocationsBuilderARM::VisitUnsafeGet(HInvoke* invoke) {
Roland Levillainc9285912015-12-18 10:38:42 +0000593 CreateIntIntIntToIntLocations(arena_, invoke, Primitive::kPrimInt);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800594}
595void IntrinsicLocationsBuilderARM::VisitUnsafeGetVolatile(HInvoke* invoke) {
Roland Levillainc9285912015-12-18 10:38:42 +0000596 CreateIntIntIntToIntLocations(arena_, invoke, Primitive::kPrimInt);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800597}
598void IntrinsicLocationsBuilderARM::VisitUnsafeGetLong(HInvoke* invoke) {
Roland Levillainc9285912015-12-18 10:38:42 +0000599 CreateIntIntIntToIntLocations(arena_, invoke, Primitive::kPrimLong);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800600}
601void IntrinsicLocationsBuilderARM::VisitUnsafeGetLongVolatile(HInvoke* invoke) {
Roland Levillainc9285912015-12-18 10:38:42 +0000602 CreateIntIntIntToIntLocations(arena_, invoke, Primitive::kPrimLong);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800603}
604void IntrinsicLocationsBuilderARM::VisitUnsafeGetObject(HInvoke* invoke) {
Roland Levillainc9285912015-12-18 10:38:42 +0000605 CreateIntIntIntToIntLocations(arena_, invoke, Primitive::kPrimNot);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800606}
607void IntrinsicLocationsBuilderARM::VisitUnsafeGetObjectVolatile(HInvoke* invoke) {
Roland Levillainc9285912015-12-18 10:38:42 +0000608 CreateIntIntIntToIntLocations(arena_, invoke, Primitive::kPrimNot);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800609}
610
611void IntrinsicCodeGeneratorARM::VisitUnsafeGet(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000612 GenUnsafeGet(invoke, Primitive::kPrimInt, /* is_volatile */ false, codegen_);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800613}
614void IntrinsicCodeGeneratorARM::VisitUnsafeGetVolatile(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000615 GenUnsafeGet(invoke, Primitive::kPrimInt, /* is_volatile */ true, codegen_);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800616}
617void IntrinsicCodeGeneratorARM::VisitUnsafeGetLong(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000618 GenUnsafeGet(invoke, Primitive::kPrimLong, /* is_volatile */ false, codegen_);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800619}
620void IntrinsicCodeGeneratorARM::VisitUnsafeGetLongVolatile(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000621 GenUnsafeGet(invoke, Primitive::kPrimLong, /* is_volatile */ true, codegen_);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800622}
623void IntrinsicCodeGeneratorARM::VisitUnsafeGetObject(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000624 GenUnsafeGet(invoke, Primitive::kPrimNot, /* is_volatile */ false, codegen_);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800625}
626void IntrinsicCodeGeneratorARM::VisitUnsafeGetObjectVolatile(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000627 GenUnsafeGet(invoke, Primitive::kPrimNot, /* is_volatile */ true, codegen_);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800628}
629
630static void CreateIntIntIntIntToVoid(ArenaAllocator* arena,
631 const ArmInstructionSetFeatures& features,
632 Primitive::Type type,
633 bool is_volatile,
634 HInvoke* invoke) {
635 LocationSummary* locations = new (arena) LocationSummary(invoke,
636 LocationSummary::kNoCall,
637 kIntrinsified);
638 locations->SetInAt(0, Location::NoLocation()); // Unused receiver.
639 locations->SetInAt(1, Location::RequiresRegister());
640 locations->SetInAt(2, Location::RequiresRegister());
641 locations->SetInAt(3, Location::RequiresRegister());
642
643 if (type == Primitive::kPrimLong) {
644 // Potentially need temps for ldrexd-strexd loop.
645 if (is_volatile && !features.HasAtomicLdrdAndStrd()) {
646 locations->AddTemp(Location::RequiresRegister()); // Temp_lo.
647 locations->AddTemp(Location::RequiresRegister()); // Temp_hi.
648 }
649 } else if (type == Primitive::kPrimNot) {
650 // Temps for card-marking.
651 locations->AddTemp(Location::RequiresRegister()); // Temp.
652 locations->AddTemp(Location::RequiresRegister()); // Card.
653 }
654}
655
656void IntrinsicLocationsBuilderARM::VisitUnsafePut(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000657 CreateIntIntIntIntToVoid(arena_, features_, Primitive::kPrimInt, /* is_volatile */ false, invoke);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800658}
659void IntrinsicLocationsBuilderARM::VisitUnsafePutOrdered(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000660 CreateIntIntIntIntToVoid(arena_, features_, Primitive::kPrimInt, /* is_volatile */ false, invoke);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800661}
662void IntrinsicLocationsBuilderARM::VisitUnsafePutVolatile(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000663 CreateIntIntIntIntToVoid(arena_, features_, Primitive::kPrimInt, /* is_volatile */ true, invoke);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800664}
665void IntrinsicLocationsBuilderARM::VisitUnsafePutObject(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000666 CreateIntIntIntIntToVoid(arena_, features_, Primitive::kPrimNot, /* is_volatile */ false, invoke);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800667}
668void IntrinsicLocationsBuilderARM::VisitUnsafePutObjectOrdered(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000669 CreateIntIntIntIntToVoid(arena_, features_, Primitive::kPrimNot, /* is_volatile */ false, invoke);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800670}
671void IntrinsicLocationsBuilderARM::VisitUnsafePutObjectVolatile(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000672 CreateIntIntIntIntToVoid(arena_, features_, Primitive::kPrimNot, /* is_volatile */ true, invoke);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800673}
674void IntrinsicLocationsBuilderARM::VisitUnsafePutLong(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000675 CreateIntIntIntIntToVoid(
676 arena_, features_, Primitive::kPrimLong, /* is_volatile */ false, invoke);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800677}
678void IntrinsicLocationsBuilderARM::VisitUnsafePutLongOrdered(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000679 CreateIntIntIntIntToVoid(
680 arena_, features_, Primitive::kPrimLong, /* is_volatile */ false, invoke);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800681}
682void IntrinsicLocationsBuilderARM::VisitUnsafePutLongVolatile(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000683 CreateIntIntIntIntToVoid(
684 arena_, features_, Primitive::kPrimLong, /* is_volatile */ true, invoke);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800685}
686
687static void GenUnsafePut(LocationSummary* locations,
688 Primitive::Type type,
689 bool is_volatile,
690 bool is_ordered,
691 CodeGeneratorARM* codegen) {
692 ArmAssembler* assembler = codegen->GetAssembler();
693
694 Register base = locations->InAt(1).AsRegister<Register>(); // Object pointer.
695 Register offset = locations->InAt(2).AsRegisterPairLow<Register>(); // Long offset, lo part only.
696 Register value;
697
698 if (is_volatile || is_ordered) {
699 __ dmb(ISH);
700 }
701
702 if (type == Primitive::kPrimLong) {
703 Register value_lo = locations->InAt(3).AsRegisterPairLow<Register>();
704 value = value_lo;
705 if (is_volatile && !codegen->GetInstructionSetFeatures().HasAtomicLdrdAndStrd()) {
706 Register temp_lo = locations->GetTemp(0).AsRegister<Register>();
707 Register temp_hi = locations->GetTemp(1).AsRegister<Register>();
708 Register value_hi = locations->InAt(3).AsRegisterPairHigh<Register>();
709
710 __ add(IP, base, ShifterOperand(offset));
711 Label loop_head;
712 __ Bind(&loop_head);
713 __ ldrexd(temp_lo, temp_hi, IP);
714 __ strexd(temp_lo, value_lo, value_hi, IP);
715 __ cmp(temp_lo, ShifterOperand(0));
716 __ b(&loop_head, NE);
717 } else {
718 __ add(IP, base, ShifterOperand(offset));
719 __ strd(value_lo, Address(IP));
720 }
721 } else {
Roland Levillain4d027112015-07-01 15:41:14 +0100722 value = locations->InAt(3).AsRegister<Register>();
723 Register source = value;
724 if (kPoisonHeapReferences && type == Primitive::kPrimNot) {
725 Register temp = locations->GetTemp(0).AsRegister<Register>();
726 __ Mov(temp, value);
727 __ PoisonHeapReference(temp);
728 source = temp;
729 }
730 __ str(source, Address(base, offset));
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800731 }
732
733 if (is_volatile) {
734 __ dmb(ISH);
735 }
736
737 if (type == Primitive::kPrimNot) {
738 Register temp = locations->GetTemp(0).AsRegister<Register>();
739 Register card = locations->GetTemp(1).AsRegister<Register>();
Nicolas Geoffray07276db2015-05-18 14:22:09 +0100740 bool value_can_be_null = true; // TODO: Worth finding out this information?
741 codegen->MarkGCCard(temp, card, base, value, value_can_be_null);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800742 }
743}
744
745void IntrinsicCodeGeneratorARM::VisitUnsafePut(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000746 GenUnsafePut(invoke->GetLocations(),
747 Primitive::kPrimInt,
748 /* is_volatile */ false,
749 /* is_ordered */ false,
750 codegen_);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800751}
752void IntrinsicCodeGeneratorARM::VisitUnsafePutOrdered(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000753 GenUnsafePut(invoke->GetLocations(),
754 Primitive::kPrimInt,
755 /* is_volatile */ false,
756 /* is_ordered */ true,
757 codegen_);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800758}
759void IntrinsicCodeGeneratorARM::VisitUnsafePutVolatile(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000760 GenUnsafePut(invoke->GetLocations(),
761 Primitive::kPrimInt,
762 /* is_volatile */ true,
763 /* is_ordered */ false,
764 codegen_);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800765}
766void IntrinsicCodeGeneratorARM::VisitUnsafePutObject(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000767 GenUnsafePut(invoke->GetLocations(),
768 Primitive::kPrimNot,
769 /* is_volatile */ false,
770 /* is_ordered */ false,
771 codegen_);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800772}
773void IntrinsicCodeGeneratorARM::VisitUnsafePutObjectOrdered(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000774 GenUnsafePut(invoke->GetLocations(),
775 Primitive::kPrimNot,
776 /* is_volatile */ false,
777 /* is_ordered */ true,
778 codegen_);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800779}
780void IntrinsicCodeGeneratorARM::VisitUnsafePutObjectVolatile(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000781 GenUnsafePut(invoke->GetLocations(),
782 Primitive::kPrimNot,
783 /* is_volatile */ true,
784 /* is_ordered */ false,
785 codegen_);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800786}
787void IntrinsicCodeGeneratorARM::VisitUnsafePutLong(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000788 GenUnsafePut(invoke->GetLocations(),
789 Primitive::kPrimLong,
790 /* is_volatile */ false,
791 /* is_ordered */ false,
792 codegen_);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800793}
794void IntrinsicCodeGeneratorARM::VisitUnsafePutLongOrdered(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000795 GenUnsafePut(invoke->GetLocations(),
796 Primitive::kPrimLong,
797 /* is_volatile */ false,
798 /* is_ordered */ true,
799 codegen_);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800800}
801void IntrinsicCodeGeneratorARM::VisitUnsafePutLongVolatile(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +0000802 GenUnsafePut(invoke->GetLocations(),
803 Primitive::kPrimLong,
804 /* is_volatile */ true,
805 /* is_ordered */ false,
806 codegen_);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800807}
808
809static void CreateIntIntIntIntIntToIntPlusTemps(ArenaAllocator* arena,
Roland Levillain2e50ecb2016-01-27 14:08:33 +0000810 HInvoke* invoke,
811 Primitive::Type type) {
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800812 LocationSummary* locations = new (arena) LocationSummary(invoke,
813 LocationSummary::kNoCall,
814 kIntrinsified);
815 locations->SetInAt(0, Location::NoLocation()); // Unused receiver.
816 locations->SetInAt(1, Location::RequiresRegister());
817 locations->SetInAt(2, Location::RequiresRegister());
818 locations->SetInAt(3, Location::RequiresRegister());
819 locations->SetInAt(4, Location::RequiresRegister());
820
Roland Levillain2e50ecb2016-01-27 14:08:33 +0000821 // If heap poisoning is enabled, we don't want the unpoisoning
822 // operations to potentially clobber the output.
823 Location::OutputOverlap overlaps = (kPoisonHeapReferences && type == Primitive::kPrimNot)
824 ? Location::kOutputOverlap
825 : Location::kNoOutputOverlap;
826 locations->SetOut(Location::RequiresRegister(), overlaps);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800827
828 locations->AddTemp(Location::RequiresRegister()); // Pointer.
829 locations->AddTemp(Location::RequiresRegister()); // Temp 1.
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800830}
831
832static void GenCas(LocationSummary* locations, Primitive::Type type, CodeGeneratorARM* codegen) {
833 DCHECK_NE(type, Primitive::kPrimLong);
834
835 ArmAssembler* assembler = codegen->GetAssembler();
836
837 Register out = locations->Out().AsRegister<Register>(); // Boolean result.
838
839 Register base = locations->InAt(1).AsRegister<Register>(); // Object pointer.
840 Register offset = locations->InAt(2).AsRegisterPairLow<Register>(); // Offset (discard high 4B).
841 Register expected_lo = locations->InAt(3).AsRegister<Register>(); // Expected.
842 Register value_lo = locations->InAt(4).AsRegister<Register>(); // Value.
843
844 Register tmp_ptr = locations->GetTemp(0).AsRegister<Register>(); // Pointer to actual memory.
845 Register tmp_lo = locations->GetTemp(1).AsRegister<Register>(); // Value in memory.
846
847 if (type == Primitive::kPrimNot) {
848 // Mark card for object assuming new value is stored. Worst case we will mark an unchanged
849 // object and scan the receiver at the next GC for nothing.
Nicolas Geoffray07276db2015-05-18 14:22:09 +0100850 bool value_can_be_null = true; // TODO: Worth finding out this information?
851 codegen->MarkGCCard(tmp_ptr, tmp_lo, base, value_lo, value_can_be_null);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800852 }
853
854 // Prevent reordering with prior memory operations.
Roland Levillain4bedb382016-01-12 12:01:04 +0000855 // Emit a DMB ISH instruction instead of an DMB ISHST one, as the
856 // latter allows a preceding load to be delayed past the STXR
857 // instruction below.
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800858 __ dmb(ISH);
859
860 __ add(tmp_ptr, base, ShifterOperand(offset));
861
Roland Levillain4d027112015-07-01 15:41:14 +0100862 if (kPoisonHeapReferences && type == Primitive::kPrimNot) {
863 codegen->GetAssembler()->PoisonHeapReference(expected_lo);
Roland Levillain2e50ecb2016-01-27 14:08:33 +0000864 if (value_lo == expected_lo) {
865 // Do not poison `value_lo`, as it is the same register as
866 // `expected_lo`, which has just been poisoned.
867 } else {
868 codegen->GetAssembler()->PoisonHeapReference(value_lo);
869 }
Roland Levillain4d027112015-07-01 15:41:14 +0100870 }
871
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800872 // do {
873 // tmp = [r_ptr] - expected;
874 // } while (tmp == 0 && failure([r_ptr] <- r_new_value));
875 // result = tmp != 0;
876
877 Label loop_head;
878 __ Bind(&loop_head);
879
Roland Levillain391b8662015-12-18 11:43:38 +0000880 // TODO: When `type == Primitive::kPrimNot`, add a read barrier for
881 // the reference stored in the object before attempting the CAS,
882 // similar to the one in the art::Unsafe_compareAndSwapObject JNI
883 // implementation.
884 //
885 // Note that this code is not (yet) used when read barriers are
886 // enabled (see IntrinsicLocationsBuilderARM::VisitUnsafeCASObject).
887 DCHECK(!(type == Primitive::kPrimNot && kEmitCompilerReadBarrier));
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800888 __ ldrex(tmp_lo, tmp_ptr);
889
890 __ subs(tmp_lo, tmp_lo, ShifterOperand(expected_lo));
891
892 __ it(EQ, ItState::kItT);
893 __ strex(tmp_lo, value_lo, tmp_ptr, EQ);
894 __ cmp(tmp_lo, ShifterOperand(1), EQ);
895
896 __ b(&loop_head, EQ);
897
898 __ dmb(ISH);
899
900 __ rsbs(out, tmp_lo, ShifterOperand(1));
901 __ it(CC);
902 __ mov(out, ShifterOperand(0), CC);
Roland Levillain4d027112015-07-01 15:41:14 +0100903
904 if (kPoisonHeapReferences && type == Primitive::kPrimNot) {
Roland Levillain4d027112015-07-01 15:41:14 +0100905 codegen->GetAssembler()->UnpoisonHeapReference(expected_lo);
Roland Levillain2e50ecb2016-01-27 14:08:33 +0000906 if (value_lo == expected_lo) {
907 // Do not unpoison `value_lo`, as it is the same register as
908 // `expected_lo`, which has just been unpoisoned.
909 } else {
910 codegen->GetAssembler()->UnpoisonHeapReference(value_lo);
911 }
Roland Levillain4d027112015-07-01 15:41:14 +0100912 }
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800913}
914
Andreas Gampeca714582015-04-03 19:41:34 -0700915void IntrinsicLocationsBuilderARM::VisitUnsafeCASInt(HInvoke* invoke) {
Roland Levillain2e50ecb2016-01-27 14:08:33 +0000916 CreateIntIntIntIntIntToIntPlusTemps(arena_, invoke, Primitive::kPrimInt);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800917}
Andreas Gampeca714582015-04-03 19:41:34 -0700918void IntrinsicLocationsBuilderARM::VisitUnsafeCASObject(HInvoke* invoke) {
Roland Levillain391b8662015-12-18 11:43:38 +0000919 // The UnsafeCASObject intrinsic is missing a read barrier, and
920 // therefore sometimes does not work as expected (b/25883050).
921 // Turn it off temporarily as a quick fix, until the read barrier is
922 // implemented (see TODO in GenCAS below).
923 //
Roland Levillain2e50ecb2016-01-27 14:08:33 +0000924 // TODO(rpl): Fix this issue and re-enable this intrinsic with read barriers.
925 if (kEmitCompilerReadBarrier) {
Roland Levillain985ff702015-10-23 13:25:35 +0100926 return;
927 }
928
Roland Levillain2e50ecb2016-01-27 14:08:33 +0000929 CreateIntIntIntIntIntToIntPlusTemps(arena_, invoke, Primitive::kPrimNot);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800930}
931void IntrinsicCodeGeneratorARM::VisitUnsafeCASInt(HInvoke* invoke) {
932 GenCas(invoke->GetLocations(), Primitive::kPrimInt, codegen_);
933}
934void IntrinsicCodeGeneratorARM::VisitUnsafeCASObject(HInvoke* invoke) {
935 GenCas(invoke->GetLocations(), Primitive::kPrimNot, codegen_);
936}
937
938void IntrinsicLocationsBuilderARM::VisitStringCharAt(HInvoke* invoke) {
939 LocationSummary* locations = new (arena_) LocationSummary(invoke,
940 LocationSummary::kCallOnSlowPath,
941 kIntrinsified);
942 locations->SetInAt(0, Location::RequiresRegister());
943 locations->SetInAt(1, Location::RequiresRegister());
944 locations->SetOut(Location::RequiresRegister(), Location::kOutputOverlap);
945
946 locations->AddTemp(Location::RequiresRegister());
947 locations->AddTemp(Location::RequiresRegister());
948}
949
950void IntrinsicCodeGeneratorARM::VisitStringCharAt(HInvoke* invoke) {
951 ArmAssembler* assembler = GetAssembler();
952 LocationSummary* locations = invoke->GetLocations();
953
954 // Location of reference to data array
955 const MemberOffset value_offset = mirror::String::ValueOffset();
956 // Location of count
957 const MemberOffset count_offset = mirror::String::CountOffset();
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800958
959 Register obj = locations->InAt(0).AsRegister<Register>(); // String object pointer.
960 Register idx = locations->InAt(1).AsRegister<Register>(); // Index of character.
961 Register out = locations->Out().AsRegister<Register>(); // Result character.
962
963 Register temp = locations->GetTemp(0).AsRegister<Register>();
964 Register array_temp = locations->GetTemp(1).AsRegister<Register>();
965
966 // TODO: Maybe we can support range check elimination. Overall, though, I think it's not worth
967 // the cost.
968 // TODO: For simplicity, the index parameter is requested in a register, so different from Quick
969 // we will not optimize the code for constants (which would save a register).
970
Andreas Gampe85b62f22015-09-09 13:15:38 -0700971 SlowPathCode* slow_path = new (GetAllocator()) IntrinsicSlowPathARM(invoke);
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800972 codegen_->AddSlowPath(slow_path);
973
974 __ ldr(temp, Address(obj, count_offset.Int32Value())); // temp = str.length.
975 codegen_->MaybeRecordImplicitNullCheck(invoke);
976 __ cmp(idx, ShifterOperand(temp));
977 __ b(slow_path->GetEntryLabel(), CS);
978
Jeff Hao848f70a2014-01-15 13:49:50 -0800979 __ add(array_temp, obj, ShifterOperand(value_offset.Int32Value())); // array_temp := str.value.
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800980
981 // Load the value.
Jeff Hao848f70a2014-01-15 13:49:50 -0800982 __ ldrh(out, Address(array_temp, idx, LSL, 1)); // out := array_temp[idx].
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -0800983
984 __ Bind(slow_path->GetExitLabel());
985}
986
Nicolas Geoffrayd75948a2015-03-27 09:53:16 +0000987void IntrinsicLocationsBuilderARM::VisitStringCompareTo(HInvoke* invoke) {
988 // The inputs plus one temp.
989 LocationSummary* locations = new (arena_) LocationSummary(invoke,
990 LocationSummary::kCall,
991 kIntrinsified);
992 InvokeRuntimeCallingConvention calling_convention;
993 locations->SetInAt(0, Location::RegisterLocation(calling_convention.GetRegisterAt(0)));
994 locations->SetInAt(1, Location::RegisterLocation(calling_convention.GetRegisterAt(1)));
995 locations->SetOut(Location::RegisterLocation(R0));
996}
997
998void IntrinsicCodeGeneratorARM::VisitStringCompareTo(HInvoke* invoke) {
999 ArmAssembler* assembler = GetAssembler();
1000 LocationSummary* locations = invoke->GetLocations();
1001
Nicolas Geoffray512e04d2015-03-27 17:21:24 +00001002 // Note that the null check must have been done earlier.
Calin Juravle641547a2015-04-21 22:08:51 +01001003 DCHECK(!invoke->CanDoImplicitNullCheckOn(invoke->InputAt(0)));
Nicolas Geoffrayd75948a2015-03-27 09:53:16 +00001004
1005 Register argument = locations->InAt(1).AsRegister<Register>();
1006 __ cmp(argument, ShifterOperand(0));
Andreas Gampe85b62f22015-09-09 13:15:38 -07001007 SlowPathCode* slow_path = new (GetAllocator()) IntrinsicSlowPathARM(invoke);
Nicolas Geoffrayd75948a2015-03-27 09:53:16 +00001008 codegen_->AddSlowPath(slow_path);
1009 __ b(slow_path->GetEntryLabel(), EQ);
1010
1011 __ LoadFromOffset(
1012 kLoadWord, LR, TR, QUICK_ENTRYPOINT_OFFSET(kArmWordSize, pStringCompareTo).Int32Value());
1013 __ blx(LR);
1014 __ Bind(slow_path->GetExitLabel());
1015}
1016
Agi Csaki289cd552015-08-18 17:10:38 -07001017void IntrinsicLocationsBuilderARM::VisitStringEquals(HInvoke* invoke) {
1018 LocationSummary* locations = new (arena_) LocationSummary(invoke,
1019 LocationSummary::kNoCall,
1020 kIntrinsified);
1021 InvokeRuntimeCallingConvention calling_convention;
1022 locations->SetInAt(0, Location::RequiresRegister());
1023 locations->SetInAt(1, Location::RequiresRegister());
1024 // Temporary registers to store lengths of strings and for calculations.
1025 // Using instruction cbz requires a low register, so explicitly set a temp to be R0.
1026 locations->AddTemp(Location::RegisterLocation(R0));
1027 locations->AddTemp(Location::RequiresRegister());
1028 locations->AddTemp(Location::RequiresRegister());
1029
1030 locations->SetOut(Location::RequiresRegister());
1031}
1032
1033void IntrinsicCodeGeneratorARM::VisitStringEquals(HInvoke* invoke) {
1034 ArmAssembler* assembler = GetAssembler();
1035 LocationSummary* locations = invoke->GetLocations();
1036
1037 Register str = locations->InAt(0).AsRegister<Register>();
1038 Register arg = locations->InAt(1).AsRegister<Register>();
1039 Register out = locations->Out().AsRegister<Register>();
1040
1041 Register temp = locations->GetTemp(0).AsRegister<Register>();
1042 Register temp1 = locations->GetTemp(1).AsRegister<Register>();
1043 Register temp2 = locations->GetTemp(2).AsRegister<Register>();
1044
1045 Label loop;
1046 Label end;
1047 Label return_true;
1048 Label return_false;
1049
1050 // Get offsets of count, value, and class fields within a string object.
1051 const uint32_t count_offset = mirror::String::CountOffset().Uint32Value();
1052 const uint32_t value_offset = mirror::String::ValueOffset().Uint32Value();
1053 const uint32_t class_offset = mirror::Object::ClassOffset().Uint32Value();
1054
1055 // Note that the null check must have been done earlier.
1056 DCHECK(!invoke->CanDoImplicitNullCheckOn(invoke->InputAt(0)));
1057
Vladimir Marko53b52002016-05-24 19:30:45 +01001058 StringEqualsOptimizations optimizations(invoke);
1059 if (!optimizations.GetArgumentNotNull()) {
1060 // Check if input is null, return false if it is.
1061 __ CompareAndBranchIfZero(arg, &return_false);
1062 }
Agi Csaki289cd552015-08-18 17:10:38 -07001063
Vladimir Marko53b52002016-05-24 19:30:45 +01001064 if (!optimizations.GetArgumentIsString()) {
1065 // Instanceof check for the argument by comparing class fields.
1066 // All string objects must have the same type since String cannot be subclassed.
1067 // Receiver must be a string object, so its class field is equal to all strings' class fields.
1068 // If the argument is a string object, its class field must be equal to receiver's class field.
1069 __ ldr(temp, Address(str, class_offset));
1070 __ ldr(temp1, Address(arg, class_offset));
1071 __ cmp(temp, ShifterOperand(temp1));
1072 __ b(&return_false, NE);
1073 }
Agi Csaki289cd552015-08-18 17:10:38 -07001074
1075 // Load lengths of this and argument strings.
1076 __ ldr(temp, Address(str, count_offset));
1077 __ ldr(temp1, Address(arg, count_offset));
1078 // Check if lengths are equal, return false if they're not.
1079 __ cmp(temp, ShifterOperand(temp1));
1080 __ b(&return_false, NE);
1081 // Return true if both strings are empty.
1082 __ cbz(temp, &return_true);
1083
1084 // Reference equality check, return true if same reference.
1085 __ cmp(str, ShifterOperand(arg));
1086 __ b(&return_true, EQ);
1087
1088 // Assertions that must hold in order to compare strings 2 characters at a time.
1089 DCHECK_ALIGNED(value_offset, 4);
1090 static_assert(IsAligned<4>(kObjectAlignment), "String of odd length is not zero padded");
1091
Agi Csaki289cd552015-08-18 17:10:38 -07001092 __ LoadImmediate(temp1, value_offset);
Agi Csaki289cd552015-08-18 17:10:38 -07001093
1094 // Loop to compare strings 2 characters at a time starting at the front of the string.
1095 // Ok to do this because strings with an odd length are zero-padded.
1096 __ Bind(&loop);
1097 __ ldr(out, Address(str, temp1));
1098 __ ldr(temp2, Address(arg, temp1));
1099 __ cmp(out, ShifterOperand(temp2));
1100 __ b(&return_false, NE);
1101 __ add(temp1, temp1, ShifterOperand(sizeof(uint32_t)));
Vladimir Markoa63f0d42015-09-01 13:36:35 +01001102 __ subs(temp, temp, ShifterOperand(sizeof(uint32_t) / sizeof(uint16_t)));
1103 __ b(&loop, GT);
Agi Csaki289cd552015-08-18 17:10:38 -07001104
1105 // Return true and exit the function.
1106 // If loop does not result in returning false, we return true.
1107 __ Bind(&return_true);
1108 __ LoadImmediate(out, 1);
1109 __ b(&end);
1110
1111 // Return false and exit the function.
1112 __ Bind(&return_false);
1113 __ LoadImmediate(out, 0);
1114 __ Bind(&end);
1115}
1116
Andreas Gampeba6fdbc2015-05-07 22:31:55 -07001117static void GenerateVisitStringIndexOf(HInvoke* invoke,
1118 ArmAssembler* assembler,
1119 CodeGeneratorARM* codegen,
1120 ArenaAllocator* allocator,
1121 bool start_at_zero) {
1122 LocationSummary* locations = invoke->GetLocations();
Andreas Gampeba6fdbc2015-05-07 22:31:55 -07001123
1124 // Note that the null check must have been done earlier.
1125 DCHECK(!invoke->CanDoImplicitNullCheckOn(invoke->InputAt(0)));
1126
1127 // Check for code points > 0xFFFF. Either a slow-path check when we don't know statically,
Vladimir Markofb6c90a2016-05-06 15:52:12 +01001128 // or directly dispatch for a large constant, or omit slow-path for a small constant or a char.
Andreas Gampe85b62f22015-09-09 13:15:38 -07001129 SlowPathCode* slow_path = nullptr;
Vladimir Markofb6c90a2016-05-06 15:52:12 +01001130 HInstruction* code_point = invoke->InputAt(1);
1131 if (code_point->IsIntConstant()) {
Vladimir Markoda051082016-05-17 16:10:20 +01001132 if (static_cast<uint32_t>(code_point->AsIntConstant()->GetValue()) >
Andreas Gampeba6fdbc2015-05-07 22:31:55 -07001133 std::numeric_limits<uint16_t>::max()) {
1134 // Always needs the slow-path. We could directly dispatch to it, but this case should be
1135 // rare, so for simplicity just put the full slow-path down and branch unconditionally.
1136 slow_path = new (allocator) IntrinsicSlowPathARM(invoke);
1137 codegen->AddSlowPath(slow_path);
1138 __ b(slow_path->GetEntryLabel());
1139 __ Bind(slow_path->GetExitLabel());
1140 return;
1141 }
Vladimir Markofb6c90a2016-05-06 15:52:12 +01001142 } else if (code_point->GetType() != Primitive::kPrimChar) {
Andreas Gampeba6fdbc2015-05-07 22:31:55 -07001143 Register char_reg = locations->InAt(1).AsRegister<Register>();
Vladimir Markofb6c90a2016-05-06 15:52:12 +01001144 // 0xffff is not modified immediate but 0x10000 is, so use `>= 0x10000` instead of `> 0xffff`.
1145 __ cmp(char_reg,
1146 ShifterOperand(static_cast<uint32_t>(std::numeric_limits<uint16_t>::max()) + 1));
Andreas Gampeba6fdbc2015-05-07 22:31:55 -07001147 slow_path = new (allocator) IntrinsicSlowPathARM(invoke);
1148 codegen->AddSlowPath(slow_path);
Vladimir Markofb6c90a2016-05-06 15:52:12 +01001149 __ b(slow_path->GetEntryLabel(), HS);
Andreas Gampeba6fdbc2015-05-07 22:31:55 -07001150 }
1151
1152 if (start_at_zero) {
Vladimir Markofb6c90a2016-05-06 15:52:12 +01001153 Register tmp_reg = locations->GetTemp(0).AsRegister<Register>();
Andreas Gampeba6fdbc2015-05-07 22:31:55 -07001154 DCHECK_EQ(tmp_reg, R2);
1155 // Start-index = 0.
1156 __ LoadImmediate(tmp_reg, 0);
1157 }
1158
1159 __ LoadFromOffset(kLoadWord, LR, TR,
1160 QUICK_ENTRYPOINT_OFFSET(kArmWordSize, pIndexOf).Int32Value());
Roland Levillain42ad2882016-02-29 18:26:54 +00001161 CheckEntrypointTypes<kQuickIndexOf, int32_t, void*, uint32_t, uint32_t>();
Andreas Gampeba6fdbc2015-05-07 22:31:55 -07001162 __ blx(LR);
1163
1164 if (slow_path != nullptr) {
1165 __ Bind(slow_path->GetExitLabel());
1166 }
1167}
1168
1169void IntrinsicLocationsBuilderARM::VisitStringIndexOf(HInvoke* invoke) {
1170 LocationSummary* locations = new (arena_) LocationSummary(invoke,
1171 LocationSummary::kCall,
1172 kIntrinsified);
1173 // We have a hand-crafted assembly stub that follows the runtime calling convention. So it's
1174 // best to align the inputs accordingly.
1175 InvokeRuntimeCallingConvention calling_convention;
1176 locations->SetInAt(0, Location::RegisterLocation(calling_convention.GetRegisterAt(0)));
1177 locations->SetInAt(1, Location::RegisterLocation(calling_convention.GetRegisterAt(1)));
1178 locations->SetOut(Location::RegisterLocation(R0));
1179
Vladimir Markofb6c90a2016-05-06 15:52:12 +01001180 // Need to send start-index=0.
Andreas Gampeba6fdbc2015-05-07 22:31:55 -07001181 locations->AddTemp(Location::RegisterLocation(calling_convention.GetRegisterAt(2)));
1182}
1183
1184void IntrinsicCodeGeneratorARM::VisitStringIndexOf(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +00001185 GenerateVisitStringIndexOf(
1186 invoke, GetAssembler(), codegen_, GetAllocator(), /* start_at_zero */ true);
Andreas Gampeba6fdbc2015-05-07 22:31:55 -07001187}
1188
1189void IntrinsicLocationsBuilderARM::VisitStringIndexOfAfter(HInvoke* invoke) {
1190 LocationSummary* locations = new (arena_) LocationSummary(invoke,
1191 LocationSummary::kCall,
1192 kIntrinsified);
1193 // We have a hand-crafted assembly stub that follows the runtime calling convention. So it's
1194 // best to align the inputs accordingly.
1195 InvokeRuntimeCallingConvention calling_convention;
1196 locations->SetInAt(0, Location::RegisterLocation(calling_convention.GetRegisterAt(0)));
1197 locations->SetInAt(1, Location::RegisterLocation(calling_convention.GetRegisterAt(1)));
1198 locations->SetInAt(2, Location::RegisterLocation(calling_convention.GetRegisterAt(2)));
1199 locations->SetOut(Location::RegisterLocation(R0));
Andreas Gampeba6fdbc2015-05-07 22:31:55 -07001200}
1201
1202void IntrinsicCodeGeneratorARM::VisitStringIndexOfAfter(HInvoke* invoke) {
Roland Levillainbf84a3d2015-12-04 14:33:02 +00001203 GenerateVisitStringIndexOf(
1204 invoke, GetAssembler(), codegen_, GetAllocator(), /* start_at_zero */ false);
Andreas Gampeba6fdbc2015-05-07 22:31:55 -07001205}
1206
Jeff Hao848f70a2014-01-15 13:49:50 -08001207void IntrinsicLocationsBuilderARM::VisitStringNewStringFromBytes(HInvoke* invoke) {
1208 LocationSummary* locations = new (arena_) LocationSummary(invoke,
1209 LocationSummary::kCall,
1210 kIntrinsified);
1211 InvokeRuntimeCallingConvention calling_convention;
1212 locations->SetInAt(0, Location::RegisterLocation(calling_convention.GetRegisterAt(0)));
1213 locations->SetInAt(1, Location::RegisterLocation(calling_convention.GetRegisterAt(1)));
1214 locations->SetInAt(2, Location::RegisterLocation(calling_convention.GetRegisterAt(2)));
1215 locations->SetInAt(3, Location::RegisterLocation(calling_convention.GetRegisterAt(3)));
1216 locations->SetOut(Location::RegisterLocation(R0));
1217}
1218
1219void IntrinsicCodeGeneratorARM::VisitStringNewStringFromBytes(HInvoke* invoke) {
1220 ArmAssembler* assembler = GetAssembler();
1221 LocationSummary* locations = invoke->GetLocations();
1222
1223 Register byte_array = locations->InAt(0).AsRegister<Register>();
1224 __ cmp(byte_array, ShifterOperand(0));
Andreas Gampe85b62f22015-09-09 13:15:38 -07001225 SlowPathCode* slow_path = new (GetAllocator()) IntrinsicSlowPathARM(invoke);
Jeff Hao848f70a2014-01-15 13:49:50 -08001226 codegen_->AddSlowPath(slow_path);
1227 __ b(slow_path->GetEntryLabel(), EQ);
1228
1229 __ LoadFromOffset(
1230 kLoadWord, LR, TR, QUICK_ENTRYPOINT_OFFSET(kArmWordSize, pAllocStringFromBytes).Int32Value());
Roland Levillainf969a202016-03-09 16:14:00 +00001231 CheckEntrypointTypes<kQuickAllocStringFromBytes, void*, void*, int32_t, int32_t, int32_t>();
Jeff Hao848f70a2014-01-15 13:49:50 -08001232 __ blx(LR);
Roland Levillainf969a202016-03-09 16:14:00 +00001233 codegen_->RecordPcInfo(invoke, invoke->GetDexPc());
Jeff Hao848f70a2014-01-15 13:49:50 -08001234 __ Bind(slow_path->GetExitLabel());
1235}
1236
1237void IntrinsicLocationsBuilderARM::VisitStringNewStringFromChars(HInvoke* invoke) {
1238 LocationSummary* locations = new (arena_) LocationSummary(invoke,
1239 LocationSummary::kCall,
1240 kIntrinsified);
1241 InvokeRuntimeCallingConvention calling_convention;
1242 locations->SetInAt(0, Location::RegisterLocation(calling_convention.GetRegisterAt(0)));
1243 locations->SetInAt(1, Location::RegisterLocation(calling_convention.GetRegisterAt(1)));
1244 locations->SetInAt(2, Location::RegisterLocation(calling_convention.GetRegisterAt(2)));
1245 locations->SetOut(Location::RegisterLocation(R0));
1246}
1247
1248void IntrinsicCodeGeneratorARM::VisitStringNewStringFromChars(HInvoke* invoke) {
1249 ArmAssembler* assembler = GetAssembler();
1250
Roland Levillaincc3839c2016-02-29 16:23:48 +00001251 // No need to emit code checking whether `locations->InAt(2)` is a null
1252 // pointer, as callers of the native method
1253 //
1254 // java.lang.StringFactory.newStringFromChars(int offset, int charCount, char[] data)
1255 //
1256 // all include a null check on `data` before calling that method.
Jeff Hao848f70a2014-01-15 13:49:50 -08001257 __ LoadFromOffset(
1258 kLoadWord, LR, TR, QUICK_ENTRYPOINT_OFFSET(kArmWordSize, pAllocStringFromChars).Int32Value());
Roland Levillainf969a202016-03-09 16:14:00 +00001259 CheckEntrypointTypes<kQuickAllocStringFromChars, void*, int32_t, int32_t, void*>();
Jeff Hao848f70a2014-01-15 13:49:50 -08001260 __ blx(LR);
Roland Levillainf969a202016-03-09 16:14:00 +00001261 codegen_->RecordPcInfo(invoke, invoke->GetDexPc());
Jeff Hao848f70a2014-01-15 13:49:50 -08001262}
1263
1264void IntrinsicLocationsBuilderARM::VisitStringNewStringFromString(HInvoke* invoke) {
1265 LocationSummary* locations = new (arena_) LocationSummary(invoke,
1266 LocationSummary::kCall,
1267 kIntrinsified);
1268 InvokeRuntimeCallingConvention calling_convention;
1269 locations->SetInAt(0, Location::RegisterLocation(calling_convention.GetRegisterAt(0)));
1270 locations->SetOut(Location::RegisterLocation(R0));
1271}
1272
1273void IntrinsicCodeGeneratorARM::VisitStringNewStringFromString(HInvoke* invoke) {
1274 ArmAssembler* assembler = GetAssembler();
1275 LocationSummary* locations = invoke->GetLocations();
1276
1277 Register string_to_copy = locations->InAt(0).AsRegister<Register>();
1278 __ cmp(string_to_copy, ShifterOperand(0));
Andreas Gampe85b62f22015-09-09 13:15:38 -07001279 SlowPathCode* slow_path = new (GetAllocator()) IntrinsicSlowPathARM(invoke);
Jeff Hao848f70a2014-01-15 13:49:50 -08001280 codegen_->AddSlowPath(slow_path);
1281 __ b(slow_path->GetEntryLabel(), EQ);
1282
1283 __ LoadFromOffset(kLoadWord,
1284 LR, TR, QUICK_ENTRYPOINT_OFFSET(kArmWordSize, pAllocStringFromString).Int32Value());
Roland Levillainf969a202016-03-09 16:14:00 +00001285 CheckEntrypointTypes<kQuickAllocStringFromString, void*, void*>();
Jeff Hao848f70a2014-01-15 13:49:50 -08001286 __ blx(LR);
Roland Levillainf969a202016-03-09 16:14:00 +00001287 codegen_->RecordPcInfo(invoke, invoke->GetDexPc());
Jeff Hao848f70a2014-01-15 13:49:50 -08001288 __ Bind(slow_path->GetExitLabel());
1289}
1290
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001291void IntrinsicLocationsBuilderARM::VisitSystemArrayCopy(HInvoke* invoke) {
1292 CodeGenerator::CreateSystemArrayCopyLocationSummary(invoke);
1293 LocationSummary* locations = invoke->GetLocations();
1294 if (locations == nullptr) {
1295 return;
1296 }
1297
1298 HIntConstant* src_pos = invoke->InputAt(1)->AsIntConstant();
1299 HIntConstant* dest_pos = invoke->InputAt(3)->AsIntConstant();
1300 HIntConstant* length = invoke->InputAt(4)->AsIntConstant();
1301
1302 if (src_pos != nullptr && !assembler_->ShifterOperandCanAlwaysHold(src_pos->GetValue())) {
1303 locations->SetInAt(1, Location::RequiresRegister());
1304 }
1305 if (dest_pos != nullptr && !assembler_->ShifterOperandCanAlwaysHold(dest_pos->GetValue())) {
1306 locations->SetInAt(3, Location::RequiresRegister());
1307 }
1308 if (length != nullptr && !assembler_->ShifterOperandCanAlwaysHold(length->GetValue())) {
1309 locations->SetInAt(4, Location::RequiresRegister());
1310 }
1311}
1312
1313static void CheckPosition(ArmAssembler* assembler,
1314 Location pos,
1315 Register input,
1316 Location length,
1317 SlowPathCode* slow_path,
1318 Register input_len,
1319 Register temp,
1320 bool length_is_input_length = false) {
1321 // Where is the length in the Array?
1322 const uint32_t length_offset = mirror::Array::LengthOffset().Uint32Value();
1323
1324 if (pos.IsConstant()) {
1325 int32_t pos_const = pos.GetConstant()->AsIntConstant()->GetValue();
1326 if (pos_const == 0) {
1327 if (!length_is_input_length) {
1328 // Check that length(input) >= length.
1329 __ LoadFromOffset(kLoadWord, temp, input, length_offset);
1330 if (length.IsConstant()) {
1331 __ cmp(temp, ShifterOperand(length.GetConstant()->AsIntConstant()->GetValue()));
1332 } else {
1333 __ cmp(temp, ShifterOperand(length.AsRegister<Register>()));
1334 }
1335 __ b(slow_path->GetEntryLabel(), LT);
1336 }
1337 } else {
1338 // Check that length(input) >= pos.
1339 __ LoadFromOffset(kLoadWord, input_len, input, length_offset);
1340 __ subs(temp, input_len, ShifterOperand(pos_const));
1341 __ b(slow_path->GetEntryLabel(), LT);
1342
1343 // Check that (length(input) - pos) >= length.
1344 if (length.IsConstant()) {
1345 __ cmp(temp, ShifterOperand(length.GetConstant()->AsIntConstant()->GetValue()));
1346 } else {
1347 __ cmp(temp, ShifterOperand(length.AsRegister<Register>()));
1348 }
1349 __ b(slow_path->GetEntryLabel(), LT);
1350 }
1351 } else if (length_is_input_length) {
1352 // The only way the copy can succeed is if pos is zero.
1353 Register pos_reg = pos.AsRegister<Register>();
1354 __ CompareAndBranchIfNonZero(pos_reg, slow_path->GetEntryLabel());
1355 } else {
1356 // Check that pos >= 0.
1357 Register pos_reg = pos.AsRegister<Register>();
1358 __ cmp(pos_reg, ShifterOperand(0));
1359 __ b(slow_path->GetEntryLabel(), LT);
1360
1361 // Check that pos <= length(input).
1362 __ LoadFromOffset(kLoadWord, temp, input, length_offset);
1363 __ subs(temp, temp, ShifterOperand(pos_reg));
1364 __ b(slow_path->GetEntryLabel(), LT);
1365
1366 // Check that (length(input) - pos) >= length.
1367 if (length.IsConstant()) {
1368 __ cmp(temp, ShifterOperand(length.GetConstant()->AsIntConstant()->GetValue()));
1369 } else {
1370 __ cmp(temp, ShifterOperand(length.AsRegister<Register>()));
1371 }
1372 __ b(slow_path->GetEntryLabel(), LT);
1373 }
1374}
1375
Roland Levillain3b359c72015-11-17 19:35:12 +00001376// TODO: Implement read barriers in the SystemArrayCopy intrinsic.
1377// Note that this code path is not used (yet) because we do not
1378// intrinsify methods that can go into the IntrinsicSlowPathARM
1379// slow path.
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001380void IntrinsicCodeGeneratorARM::VisitSystemArrayCopy(HInvoke* invoke) {
1381 ArmAssembler* assembler = GetAssembler();
1382 LocationSummary* locations = invoke->GetLocations();
1383
1384 uint32_t class_offset = mirror::Object::ClassOffset().Int32Value();
1385 uint32_t super_offset = mirror::Class::SuperClassOffset().Int32Value();
1386 uint32_t component_offset = mirror::Class::ComponentTypeOffset().Int32Value();
1387 uint32_t primitive_offset = mirror::Class::PrimitiveTypeOffset().Int32Value();
1388
1389 Register src = locations->InAt(0).AsRegister<Register>();
1390 Location src_pos = locations->InAt(1);
1391 Register dest = locations->InAt(2).AsRegister<Register>();
1392 Location dest_pos = locations->InAt(3);
1393 Location length = locations->InAt(4);
1394 Register temp1 = locations->GetTemp(0).AsRegister<Register>();
1395 Register temp2 = locations->GetTemp(1).AsRegister<Register>();
1396 Register temp3 = locations->GetTemp(2).AsRegister<Register>();
1397
1398 SlowPathCode* slow_path = new (GetAllocator()) IntrinsicSlowPathARM(invoke);
1399 codegen_->AddSlowPath(slow_path);
1400
Roland Levillainebea3d22016-04-12 15:42:57 +01001401 Label conditions_on_positions_validated;
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001402 SystemArrayCopyOptimizations optimizations(invoke);
1403
Roland Levillainebea3d22016-04-12 15:42:57 +01001404 if (!optimizations.GetDestinationIsSource() &&
1405 (!src_pos.IsConstant() || !dest_pos.IsConstant())) {
1406 __ cmp(src, ShifterOperand(dest));
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001407 }
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001408 // If source and destination are the same, we go to slow path if we need to do
1409 // forward copying.
1410 if (src_pos.IsConstant()) {
1411 int32_t src_pos_constant = src_pos.GetConstant()->AsIntConstant()->GetValue();
1412 if (dest_pos.IsConstant()) {
1413 // Checked when building locations.
1414 DCHECK(!optimizations.GetDestinationIsSource()
1415 || (src_pos_constant >= dest_pos.GetConstant()->AsIntConstant()->GetValue()));
1416 } else {
1417 if (!optimizations.GetDestinationIsSource()) {
Roland Levillainebea3d22016-04-12 15:42:57 +01001418 __ b(&conditions_on_positions_validated, NE);
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001419 }
1420 __ cmp(dest_pos.AsRegister<Register>(), ShifterOperand(src_pos_constant));
1421 __ b(slow_path->GetEntryLabel(), GT);
1422 }
1423 } else {
1424 if (!optimizations.GetDestinationIsSource()) {
Roland Levillainebea3d22016-04-12 15:42:57 +01001425 __ b(&conditions_on_positions_validated, NE);
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001426 }
1427 if (dest_pos.IsConstant()) {
1428 int32_t dest_pos_constant = dest_pos.GetConstant()->AsIntConstant()->GetValue();
1429 __ cmp(src_pos.AsRegister<Register>(), ShifterOperand(dest_pos_constant));
1430 } else {
1431 __ cmp(src_pos.AsRegister<Register>(), ShifterOperand(dest_pos.AsRegister<Register>()));
1432 }
1433 __ b(slow_path->GetEntryLabel(), LT);
1434 }
1435
Roland Levillainebea3d22016-04-12 15:42:57 +01001436 __ Bind(&conditions_on_positions_validated);
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001437
1438 if (!optimizations.GetSourceIsNotNull()) {
1439 // Bail out if the source is null.
1440 __ CompareAndBranchIfZero(src, slow_path->GetEntryLabel());
1441 }
1442
1443 if (!optimizations.GetDestinationIsNotNull() && !optimizations.GetDestinationIsSource()) {
1444 // Bail out if the destination is null.
1445 __ CompareAndBranchIfZero(dest, slow_path->GetEntryLabel());
1446 }
1447
1448 // If the length is negative, bail out.
1449 // We have already checked in the LocationsBuilder for the constant case.
1450 if (!length.IsConstant() &&
1451 !optimizations.GetCountIsSourceLength() &&
1452 !optimizations.GetCountIsDestinationLength()) {
1453 __ cmp(length.AsRegister<Register>(), ShifterOperand(0));
1454 __ b(slow_path->GetEntryLabel(), LT);
1455 }
1456
1457 // Validity checks: source.
1458 CheckPosition(assembler,
1459 src_pos,
1460 src,
1461 length,
1462 slow_path,
1463 temp1,
1464 temp2,
1465 optimizations.GetCountIsSourceLength());
1466
1467 // Validity checks: dest.
1468 CheckPosition(assembler,
1469 dest_pos,
1470 dest,
1471 length,
1472 slow_path,
1473 temp1,
1474 temp2,
1475 optimizations.GetCountIsDestinationLength());
1476
1477 if (!optimizations.GetDoesNotNeedTypeCheck()) {
1478 // Check whether all elements of the source array are assignable to the component
1479 // type of the destination array. We do two checks: the classes are the same,
1480 // or the destination is Object[]. If none of these checks succeed, we go to the
1481 // slow path.
1482 __ LoadFromOffset(kLoadWord, temp1, dest, class_offset);
1483 __ LoadFromOffset(kLoadWord, temp2, src, class_offset);
1484 bool did_unpoison = false;
1485 if (!optimizations.GetDestinationIsNonPrimitiveArray() ||
1486 !optimizations.GetSourceIsNonPrimitiveArray()) {
Roland Levillainebea3d22016-04-12 15:42:57 +01001487 // One or two of the references need to be unpoisoned. Unpoison them
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001488 // both to make the identity check valid.
1489 __ MaybeUnpoisonHeapReference(temp1);
1490 __ MaybeUnpoisonHeapReference(temp2);
1491 did_unpoison = true;
1492 }
1493
1494 if (!optimizations.GetDestinationIsNonPrimitiveArray()) {
1495 // Bail out if the destination is not a non primitive array.
Roland Levillainebea3d22016-04-12 15:42:57 +01001496 // /* HeapReference<Class> */ temp3 = temp1->component_type_
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001497 __ LoadFromOffset(kLoadWord, temp3, temp1, component_offset);
1498 __ CompareAndBranchIfZero(temp3, slow_path->GetEntryLabel());
1499 __ MaybeUnpoisonHeapReference(temp3);
1500 __ LoadFromOffset(kLoadUnsignedHalfword, temp3, temp3, primitive_offset);
1501 static_assert(Primitive::kPrimNot == 0, "Expected 0 for kPrimNot");
1502 __ CompareAndBranchIfNonZero(temp3, slow_path->GetEntryLabel());
1503 }
1504
1505 if (!optimizations.GetSourceIsNonPrimitiveArray()) {
1506 // Bail out if the source is not a non primitive array.
Roland Levillainebea3d22016-04-12 15:42:57 +01001507 // /* HeapReference<Class> */ temp3 = temp2->component_type_
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001508 __ LoadFromOffset(kLoadWord, temp3, temp2, component_offset);
1509 __ CompareAndBranchIfZero(temp3, slow_path->GetEntryLabel());
1510 __ MaybeUnpoisonHeapReference(temp3);
1511 __ LoadFromOffset(kLoadUnsignedHalfword, temp3, temp3, primitive_offset);
1512 static_assert(Primitive::kPrimNot == 0, "Expected 0 for kPrimNot");
1513 __ CompareAndBranchIfNonZero(temp3, slow_path->GetEntryLabel());
1514 }
1515
1516 __ cmp(temp1, ShifterOperand(temp2));
1517
1518 if (optimizations.GetDestinationIsTypedObjectArray()) {
1519 Label do_copy;
1520 __ b(&do_copy, EQ);
1521 if (!did_unpoison) {
1522 __ MaybeUnpoisonHeapReference(temp1);
1523 }
Roland Levillainebea3d22016-04-12 15:42:57 +01001524 // /* HeapReference<Class> */ temp1 = temp1->component_type_
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001525 __ LoadFromOffset(kLoadWord, temp1, temp1, component_offset);
1526 __ MaybeUnpoisonHeapReference(temp1);
Roland Levillainebea3d22016-04-12 15:42:57 +01001527 // /* HeapReference<Class> */ temp1 = temp1->super_class_
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001528 __ LoadFromOffset(kLoadWord, temp1, temp1, super_offset);
1529 // No need to unpoison the result, we're comparing against null.
1530 __ CompareAndBranchIfNonZero(temp1, slow_path->GetEntryLabel());
1531 __ Bind(&do_copy);
1532 } else {
1533 __ b(slow_path->GetEntryLabel(), NE);
1534 }
1535 } else if (!optimizations.GetSourceIsNonPrimitiveArray()) {
1536 DCHECK(optimizations.GetDestinationIsNonPrimitiveArray());
1537 // Bail out if the source is not a non primitive array.
Roland Levillainebea3d22016-04-12 15:42:57 +01001538 // /* HeapReference<Class> */ temp1 = src->klass_
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001539 __ LoadFromOffset(kLoadWord, temp1, src, class_offset);
1540 __ MaybeUnpoisonHeapReference(temp1);
Roland Levillainebea3d22016-04-12 15:42:57 +01001541 // /* HeapReference<Class> */ temp3 = temp1->component_type_
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001542 __ LoadFromOffset(kLoadWord, temp3, temp1, component_offset);
1543 __ CompareAndBranchIfZero(temp3, slow_path->GetEntryLabel());
1544 __ MaybeUnpoisonHeapReference(temp3);
1545 __ LoadFromOffset(kLoadUnsignedHalfword, temp3, temp3, primitive_offset);
1546 static_assert(Primitive::kPrimNot == 0, "Expected 0 for kPrimNot");
1547 __ CompareAndBranchIfNonZero(temp3, slow_path->GetEntryLabel());
1548 }
1549
1550 // Compute base source address, base destination address, and end source address.
1551
1552 uint32_t element_size = sizeof(int32_t);
1553 uint32_t offset = mirror::Array::DataOffset(element_size).Uint32Value();
1554 if (src_pos.IsConstant()) {
1555 int32_t constant = src_pos.GetConstant()->AsIntConstant()->GetValue();
1556 __ AddConstant(temp1, src, element_size * constant + offset);
1557 } else {
1558 __ add(temp1, src, ShifterOperand(src_pos.AsRegister<Register>(), LSL, 2));
1559 __ AddConstant(temp1, offset);
1560 }
1561
1562 if (dest_pos.IsConstant()) {
1563 int32_t constant = dest_pos.GetConstant()->AsIntConstant()->GetValue();
1564 __ AddConstant(temp2, dest, element_size * constant + offset);
1565 } else {
1566 __ add(temp2, dest, ShifterOperand(dest_pos.AsRegister<Register>(), LSL, 2));
1567 __ AddConstant(temp2, offset);
1568 }
1569
1570 if (length.IsConstant()) {
1571 int32_t constant = length.GetConstant()->AsIntConstant()->GetValue();
1572 __ AddConstant(temp3, temp1, element_size * constant);
1573 } else {
1574 __ add(temp3, temp1, ShifterOperand(length.AsRegister<Register>(), LSL, 2));
1575 }
1576
1577 // Iterate over the arrays and do a raw copy of the objects. We don't need to
1578 // poison/unpoison, nor do any read barrier as the next uses of the destination
1579 // array will do it.
1580 Label loop, done;
1581 __ cmp(temp1, ShifterOperand(temp3));
1582 __ b(&done, EQ);
1583 __ Bind(&loop);
1584 __ ldr(IP, Address(temp1, element_size, Address::PostIndex));
1585 __ str(IP, Address(temp2, element_size, Address::PostIndex));
1586 __ cmp(temp1, ShifterOperand(temp3));
1587 __ b(&loop, NE);
1588 __ Bind(&done);
1589
1590 // We only need one card marking on the destination array.
1591 codegen_->MarkGCCard(temp1,
1592 temp2,
1593 dest,
1594 Register(kNoRegister),
Roland Levillainebea3d22016-04-12 15:42:57 +01001595 /* value_can_be_null */ false);
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +01001596
1597 __ Bind(slow_path->GetExitLabel());
1598}
1599
Anton Kirilovd70dc9d2016-02-04 14:59:04 +00001600static void CreateFPToFPCallLocations(ArenaAllocator* arena, HInvoke* invoke) {
1601 // If the graph is debuggable, all callee-saved floating-point registers are blocked by
1602 // the code generator. Furthermore, the register allocator creates fixed live intervals
1603 // for all caller-saved registers because we are doing a function call. As a result, if
1604 // the input and output locations are unallocated, the register allocator runs out of
1605 // registers and fails; however, a debuggable graph is not the common case.
1606 if (invoke->GetBlock()->GetGraph()->IsDebuggable()) {
1607 return;
1608 }
1609
1610 DCHECK_EQ(invoke->GetNumberOfArguments(), 1U);
1611 DCHECK_EQ(invoke->InputAt(0)->GetType(), Primitive::kPrimDouble);
1612 DCHECK_EQ(invoke->GetType(), Primitive::kPrimDouble);
1613
1614 LocationSummary* const locations = new (arena) LocationSummary(invoke,
1615 LocationSummary::kCall,
1616 kIntrinsified);
1617 const InvokeRuntimeCallingConvention calling_convention;
1618
1619 locations->SetInAt(0, Location::RequiresFpuRegister());
1620 locations->SetOut(Location::RequiresFpuRegister());
1621 // Native code uses the soft float ABI.
1622 locations->AddTemp(Location::RegisterLocation(calling_convention.GetRegisterAt(0)));
1623 locations->AddTemp(Location::RegisterLocation(calling_convention.GetRegisterAt(1)));
1624}
1625
1626static void CreateFPFPToFPCallLocations(ArenaAllocator* arena, HInvoke* invoke) {
1627 // If the graph is debuggable, all callee-saved floating-point registers are blocked by
1628 // the code generator. Furthermore, the register allocator creates fixed live intervals
1629 // for all caller-saved registers because we are doing a function call. As a result, if
1630 // the input and output locations are unallocated, the register allocator runs out of
1631 // registers and fails; however, a debuggable graph is not the common case.
1632 if (invoke->GetBlock()->GetGraph()->IsDebuggable()) {
1633 return;
1634 }
1635
1636 DCHECK_EQ(invoke->GetNumberOfArguments(), 2U);
1637 DCHECK_EQ(invoke->InputAt(0)->GetType(), Primitive::kPrimDouble);
1638 DCHECK_EQ(invoke->InputAt(1)->GetType(), Primitive::kPrimDouble);
1639 DCHECK_EQ(invoke->GetType(), Primitive::kPrimDouble);
1640
1641 LocationSummary* const locations = new (arena) LocationSummary(invoke,
1642 LocationSummary::kCall,
1643 kIntrinsified);
1644 const InvokeRuntimeCallingConvention calling_convention;
1645
1646 locations->SetInAt(0, Location::RequiresFpuRegister());
1647 locations->SetInAt(1, Location::RequiresFpuRegister());
1648 locations->SetOut(Location::RequiresFpuRegister());
1649 // Native code uses the soft float ABI.
1650 locations->AddTemp(Location::RegisterLocation(calling_convention.GetRegisterAt(0)));
1651 locations->AddTemp(Location::RegisterLocation(calling_convention.GetRegisterAt(1)));
1652 locations->AddTemp(Location::RegisterLocation(calling_convention.GetRegisterAt(2)));
1653 locations->AddTemp(Location::RegisterLocation(calling_convention.GetRegisterAt(3)));
1654}
1655
1656static void GenFPToFPCall(HInvoke* invoke,
1657 ArmAssembler* assembler,
1658 CodeGeneratorARM* codegen,
1659 QuickEntrypointEnum entry) {
1660 LocationSummary* const locations = invoke->GetLocations();
1661 const InvokeRuntimeCallingConvention calling_convention;
1662
1663 DCHECK_EQ(invoke->GetNumberOfArguments(), 1U);
1664 DCHECK(locations->WillCall() && locations->Intrinsified());
1665 DCHECK(!locations->GetLiveRegisters()->ContainsCoreRegister(calling_convention.GetRegisterAt(0)));
1666 DCHECK(!locations->GetLiveRegisters()->ContainsCoreRegister(calling_convention.GetRegisterAt(1)));
1667
1668 __ LoadFromOffset(kLoadWord, LR, TR, GetThreadOffset<kArmWordSize>(entry).Int32Value());
1669 // Native code uses the soft float ABI.
1670 __ vmovrrd(calling_convention.GetRegisterAt(0),
1671 calling_convention.GetRegisterAt(1),
1672 FromLowSToD(locations->InAt(0).AsFpuRegisterPairLow<SRegister>()));
1673 __ blx(LR);
1674 codegen->RecordPcInfo(invoke, invoke->GetDexPc());
1675 __ vmovdrr(FromLowSToD(locations->Out().AsFpuRegisterPairLow<SRegister>()),
1676 calling_convention.GetRegisterAt(0),
1677 calling_convention.GetRegisterAt(1));
1678}
1679
1680static void GenFPFPToFPCall(HInvoke* invoke,
1681 ArmAssembler* assembler,
1682 CodeGeneratorARM* codegen,
1683 QuickEntrypointEnum entry) {
1684 LocationSummary* const locations = invoke->GetLocations();
1685 const InvokeRuntimeCallingConvention calling_convention;
1686
1687 DCHECK_EQ(invoke->GetNumberOfArguments(), 2U);
1688 DCHECK(locations->WillCall() && locations->Intrinsified());
1689 DCHECK(!locations->GetLiveRegisters()->ContainsCoreRegister(calling_convention.GetRegisterAt(0)));
1690 DCHECK(!locations->GetLiveRegisters()->ContainsCoreRegister(calling_convention.GetRegisterAt(1)));
1691 DCHECK(!locations->GetLiveRegisters()->ContainsCoreRegister(calling_convention.GetRegisterAt(2)));
1692 DCHECK(!locations->GetLiveRegisters()->ContainsCoreRegister(calling_convention.GetRegisterAt(3)));
1693
1694 __ LoadFromOffset(kLoadWord, LR, TR, GetThreadOffset<kArmWordSize>(entry).Int32Value());
1695 // Native code uses the soft float ABI.
1696 __ vmovrrd(calling_convention.GetRegisterAt(0),
1697 calling_convention.GetRegisterAt(1),
1698 FromLowSToD(locations->InAt(0).AsFpuRegisterPairLow<SRegister>()));
1699 __ vmovrrd(calling_convention.GetRegisterAt(2),
1700 calling_convention.GetRegisterAt(3),
1701 FromLowSToD(locations->InAt(1).AsFpuRegisterPairLow<SRegister>()));
1702 __ blx(LR);
1703 codegen->RecordPcInfo(invoke, invoke->GetDexPc());
1704 __ vmovdrr(FromLowSToD(locations->Out().AsFpuRegisterPairLow<SRegister>()),
1705 calling_convention.GetRegisterAt(0),
1706 calling_convention.GetRegisterAt(1));
1707}
1708
1709void IntrinsicLocationsBuilderARM::VisitMathCos(HInvoke* invoke) {
1710 CreateFPToFPCallLocations(arena_, invoke);
1711}
1712
1713void IntrinsicCodeGeneratorARM::VisitMathCos(HInvoke* invoke) {
1714 GenFPToFPCall(invoke, GetAssembler(), codegen_, kQuickCos);
1715}
1716
1717void IntrinsicLocationsBuilderARM::VisitMathSin(HInvoke* invoke) {
1718 CreateFPToFPCallLocations(arena_, invoke);
1719}
1720
1721void IntrinsicCodeGeneratorARM::VisitMathSin(HInvoke* invoke) {
1722 GenFPToFPCall(invoke, GetAssembler(), codegen_, kQuickSin);
1723}
1724
1725void IntrinsicLocationsBuilderARM::VisitMathAcos(HInvoke* invoke) {
1726 CreateFPToFPCallLocations(arena_, invoke);
1727}
1728
1729void IntrinsicCodeGeneratorARM::VisitMathAcos(HInvoke* invoke) {
1730 GenFPToFPCall(invoke, GetAssembler(), codegen_, kQuickAcos);
1731}
1732
1733void IntrinsicLocationsBuilderARM::VisitMathAsin(HInvoke* invoke) {
1734 CreateFPToFPCallLocations(arena_, invoke);
1735}
1736
1737void IntrinsicCodeGeneratorARM::VisitMathAsin(HInvoke* invoke) {
1738 GenFPToFPCall(invoke, GetAssembler(), codegen_, kQuickAsin);
1739}
1740
1741void IntrinsicLocationsBuilderARM::VisitMathAtan(HInvoke* invoke) {
1742 CreateFPToFPCallLocations(arena_, invoke);
1743}
1744
1745void IntrinsicCodeGeneratorARM::VisitMathAtan(HInvoke* invoke) {
1746 GenFPToFPCall(invoke, GetAssembler(), codegen_, kQuickAtan);
1747}
1748
1749void IntrinsicLocationsBuilderARM::VisitMathCbrt(HInvoke* invoke) {
1750 CreateFPToFPCallLocations(arena_, invoke);
1751}
1752
1753void IntrinsicCodeGeneratorARM::VisitMathCbrt(HInvoke* invoke) {
1754 GenFPToFPCall(invoke, GetAssembler(), codegen_, kQuickCbrt);
1755}
1756
1757void IntrinsicLocationsBuilderARM::VisitMathCosh(HInvoke* invoke) {
1758 CreateFPToFPCallLocations(arena_, invoke);
1759}
1760
1761void IntrinsicCodeGeneratorARM::VisitMathCosh(HInvoke* invoke) {
1762 GenFPToFPCall(invoke, GetAssembler(), codegen_, kQuickCosh);
1763}
1764
1765void IntrinsicLocationsBuilderARM::VisitMathExp(HInvoke* invoke) {
1766 CreateFPToFPCallLocations(arena_, invoke);
1767}
1768
1769void IntrinsicCodeGeneratorARM::VisitMathExp(HInvoke* invoke) {
1770 GenFPToFPCall(invoke, GetAssembler(), codegen_, kQuickExp);
1771}
1772
1773void IntrinsicLocationsBuilderARM::VisitMathExpm1(HInvoke* invoke) {
1774 CreateFPToFPCallLocations(arena_, invoke);
1775}
1776
1777void IntrinsicCodeGeneratorARM::VisitMathExpm1(HInvoke* invoke) {
1778 GenFPToFPCall(invoke, GetAssembler(), codegen_, kQuickExpm1);
1779}
1780
1781void IntrinsicLocationsBuilderARM::VisitMathLog(HInvoke* invoke) {
1782 CreateFPToFPCallLocations(arena_, invoke);
1783}
1784
1785void IntrinsicCodeGeneratorARM::VisitMathLog(HInvoke* invoke) {
1786 GenFPToFPCall(invoke, GetAssembler(), codegen_, kQuickLog);
1787}
1788
1789void IntrinsicLocationsBuilderARM::VisitMathLog10(HInvoke* invoke) {
1790 CreateFPToFPCallLocations(arena_, invoke);
1791}
1792
1793void IntrinsicCodeGeneratorARM::VisitMathLog10(HInvoke* invoke) {
1794 GenFPToFPCall(invoke, GetAssembler(), codegen_, kQuickLog10);
1795}
1796
1797void IntrinsicLocationsBuilderARM::VisitMathSinh(HInvoke* invoke) {
1798 CreateFPToFPCallLocations(arena_, invoke);
1799}
1800
1801void IntrinsicCodeGeneratorARM::VisitMathSinh(HInvoke* invoke) {
1802 GenFPToFPCall(invoke, GetAssembler(), codegen_, kQuickSinh);
1803}
1804
1805void IntrinsicLocationsBuilderARM::VisitMathTan(HInvoke* invoke) {
1806 CreateFPToFPCallLocations(arena_, invoke);
1807}
1808
1809void IntrinsicCodeGeneratorARM::VisitMathTan(HInvoke* invoke) {
1810 GenFPToFPCall(invoke, GetAssembler(), codegen_, kQuickTan);
1811}
1812
1813void IntrinsicLocationsBuilderARM::VisitMathTanh(HInvoke* invoke) {
1814 CreateFPToFPCallLocations(arena_, invoke);
1815}
1816
1817void IntrinsicCodeGeneratorARM::VisitMathTanh(HInvoke* invoke) {
1818 GenFPToFPCall(invoke, GetAssembler(), codegen_, kQuickTanh);
1819}
1820
1821void IntrinsicLocationsBuilderARM::VisitMathAtan2(HInvoke* invoke) {
1822 CreateFPFPToFPCallLocations(arena_, invoke);
1823}
1824
1825void IntrinsicCodeGeneratorARM::VisitMathAtan2(HInvoke* invoke) {
1826 GenFPFPToFPCall(invoke, GetAssembler(), codegen_, kQuickAtan2);
1827}
1828
1829void IntrinsicLocationsBuilderARM::VisitMathHypot(HInvoke* invoke) {
1830 CreateFPFPToFPCallLocations(arena_, invoke);
1831}
1832
1833void IntrinsicCodeGeneratorARM::VisitMathHypot(HInvoke* invoke) {
1834 GenFPFPToFPCall(invoke, GetAssembler(), codegen_, kQuickHypot);
1835}
1836
1837void IntrinsicLocationsBuilderARM::VisitMathNextAfter(HInvoke* invoke) {
1838 CreateFPFPToFPCallLocations(arena_, invoke);
1839}
1840
1841void IntrinsicCodeGeneratorARM::VisitMathNextAfter(HInvoke* invoke) {
1842 GenFPFPToFPCall(invoke, GetAssembler(), codegen_, kQuickNextAfter);
1843}
1844
Artem Serovc257da72016-02-02 13:49:43 +00001845void IntrinsicLocationsBuilderARM::VisitIntegerReverse(HInvoke* invoke) {
1846 CreateIntToIntLocations(arena_, invoke);
1847}
1848
1849void IntrinsicCodeGeneratorARM::VisitIntegerReverse(HInvoke* invoke) {
1850 ArmAssembler* assembler = GetAssembler();
1851 LocationSummary* locations = invoke->GetLocations();
1852
1853 Register out = locations->Out().AsRegister<Register>();
1854 Register in = locations->InAt(0).AsRegister<Register>();
1855
1856 __ rbit(out, in);
1857}
1858
1859void IntrinsicLocationsBuilderARM::VisitLongReverse(HInvoke* invoke) {
1860 LocationSummary* locations = new (arena_) LocationSummary(invoke,
1861 LocationSummary::kNoCall,
1862 kIntrinsified);
1863 locations->SetInAt(0, Location::RequiresRegister());
1864 locations->SetOut(Location::RequiresRegister(), Location::kOutputOverlap);
1865}
1866
1867void IntrinsicCodeGeneratorARM::VisitLongReverse(HInvoke* invoke) {
1868 ArmAssembler* assembler = GetAssembler();
1869 LocationSummary* locations = invoke->GetLocations();
1870
1871 Register in_reg_lo = locations->InAt(0).AsRegisterPairLow<Register>();
1872 Register in_reg_hi = locations->InAt(0).AsRegisterPairHigh<Register>();
1873 Register out_reg_lo = locations->Out().AsRegisterPairLow<Register>();
1874 Register out_reg_hi = locations->Out().AsRegisterPairHigh<Register>();
1875
1876 __ rbit(out_reg_lo, in_reg_hi);
1877 __ rbit(out_reg_hi, in_reg_lo);
1878}
1879
1880void IntrinsicLocationsBuilderARM::VisitIntegerReverseBytes(HInvoke* invoke) {
1881 CreateIntToIntLocations(arena_, invoke);
1882}
1883
1884void IntrinsicCodeGeneratorARM::VisitIntegerReverseBytes(HInvoke* invoke) {
1885 ArmAssembler* assembler = GetAssembler();
1886 LocationSummary* locations = invoke->GetLocations();
1887
1888 Register out = locations->Out().AsRegister<Register>();
1889 Register in = locations->InAt(0).AsRegister<Register>();
1890
1891 __ rev(out, in);
1892}
1893
1894void IntrinsicLocationsBuilderARM::VisitLongReverseBytes(HInvoke* invoke) {
1895 LocationSummary* locations = new (arena_) LocationSummary(invoke,
1896 LocationSummary::kNoCall,
1897 kIntrinsified);
1898 locations->SetInAt(0, Location::RequiresRegister());
1899 locations->SetOut(Location::RequiresRegister(), Location::kOutputOverlap);
1900}
1901
1902void IntrinsicCodeGeneratorARM::VisitLongReverseBytes(HInvoke* invoke) {
1903 ArmAssembler* assembler = GetAssembler();
1904 LocationSummary* locations = invoke->GetLocations();
1905
1906 Register in_reg_lo = locations->InAt(0).AsRegisterPairLow<Register>();
1907 Register in_reg_hi = locations->InAt(0).AsRegisterPairHigh<Register>();
1908 Register out_reg_lo = locations->Out().AsRegisterPairLow<Register>();
1909 Register out_reg_hi = locations->Out().AsRegisterPairHigh<Register>();
1910
1911 __ rev(out_reg_lo, in_reg_hi);
1912 __ rev(out_reg_hi, in_reg_lo);
1913}
1914
1915void IntrinsicLocationsBuilderARM::VisitShortReverseBytes(HInvoke* invoke) {
1916 CreateIntToIntLocations(arena_, invoke);
1917}
1918
1919void IntrinsicCodeGeneratorARM::VisitShortReverseBytes(HInvoke* invoke) {
1920 ArmAssembler* assembler = GetAssembler();
1921 LocationSummary* locations = invoke->GetLocations();
1922
1923 Register out = locations->Out().AsRegister<Register>();
1924 Register in = locations->InAt(0).AsRegister<Register>();
1925
1926 __ revsh(out, in);
1927}
1928
Tim Zhang25abd6c2016-01-19 23:39:24 +08001929void IntrinsicLocationsBuilderARM::VisitStringGetCharsNoCheck(HInvoke* invoke) {
1930 LocationSummary* locations = new (arena_) LocationSummary(invoke,
1931 LocationSummary::kNoCall,
1932 kIntrinsified);
1933 locations->SetInAt(0, Location::RequiresRegister());
1934 locations->SetInAt(1, Location::RequiresRegister());
1935 locations->SetInAt(2, Location::RequiresRegister());
1936 locations->SetInAt(3, Location::RequiresRegister());
1937 locations->SetInAt(4, Location::RequiresRegister());
1938
1939 locations->AddTemp(Location::RequiresRegister());
1940 locations->AddTemp(Location::RequiresRegister());
1941 locations->AddTemp(Location::RequiresRegister());
1942 locations->AddTemp(Location::RequiresRegister());
1943}
1944
1945void IntrinsicCodeGeneratorARM::VisitStringGetCharsNoCheck(HInvoke* invoke) {
1946 ArmAssembler* assembler = GetAssembler();
1947 LocationSummary* locations = invoke->GetLocations();
1948
1949 // Check assumption that sizeof(Char) is 2 (used in scaling below).
1950 const size_t char_size = Primitive::ComponentSize(Primitive::kPrimChar);
1951 DCHECK_EQ(char_size, 2u);
1952
1953 // Location of data in char array buffer.
1954 const uint32_t data_offset = mirror::Array::DataOffset(char_size).Uint32Value();
1955
1956 // Location of char array data in string.
1957 const uint32_t value_offset = mirror::String::ValueOffset().Uint32Value();
1958
1959 // void getCharsNoCheck(int srcBegin, int srcEnd, char[] dst, int dstBegin);
1960 // Since getChars() calls getCharsNoCheck() - we use registers rather than constants.
1961 Register srcObj = locations->InAt(0).AsRegister<Register>();
1962 Register srcBegin = locations->InAt(1).AsRegister<Register>();
1963 Register srcEnd = locations->InAt(2).AsRegister<Register>();
1964 Register dstObj = locations->InAt(3).AsRegister<Register>();
1965 Register dstBegin = locations->InAt(4).AsRegister<Register>();
1966
1967 Register src_ptr = locations->GetTemp(0).AsRegister<Register>();
1968 Register src_ptr_end = locations->GetTemp(1).AsRegister<Register>();
1969 Register dst_ptr = locations->GetTemp(2).AsRegister<Register>();
1970 Register tmp = locations->GetTemp(3).AsRegister<Register>();
1971
1972 // src range to copy.
1973 __ add(src_ptr, srcObj, ShifterOperand(value_offset));
1974 __ add(src_ptr_end, src_ptr, ShifterOperand(srcEnd, LSL, 1));
1975 __ add(src_ptr, src_ptr, ShifterOperand(srcBegin, LSL, 1));
1976
1977 // dst to be copied.
1978 __ add(dst_ptr, dstObj, ShifterOperand(data_offset));
1979 __ add(dst_ptr, dst_ptr, ShifterOperand(dstBegin, LSL, 1));
1980
1981 // Do the copy.
1982 Label loop, done;
1983 __ Bind(&loop);
1984 __ cmp(src_ptr, ShifterOperand(src_ptr_end));
1985 __ b(&done, EQ);
1986 __ ldrh(tmp, Address(src_ptr, char_size, Address::PostIndex));
1987 __ strh(tmp, Address(dst_ptr, char_size, Address::PostIndex));
1988 __ b(&loop);
1989 __ Bind(&done);
1990}
1991
Anton Kirilova3ffea22016-04-07 17:02:37 +01001992void IntrinsicLocationsBuilderARM::VisitFloatIsInfinite(HInvoke* invoke) {
1993 CreateFPToIntLocations(arena_, invoke);
1994}
1995
1996void IntrinsicCodeGeneratorARM::VisitFloatIsInfinite(HInvoke* invoke) {
1997 ArmAssembler* const assembler = GetAssembler();
1998 LocationSummary* const locations = invoke->GetLocations();
1999 const Register out = locations->Out().AsRegister<Register>();
2000 // Shifting left by 1 bit makes the value encodable as an immediate operand;
2001 // we don't care about the sign bit anyway.
2002 constexpr uint32_t infinity = kPositiveInfinityFloat << 1U;
2003
2004 __ vmovrs(out, locations->InAt(0).AsFpuRegister<SRegister>());
2005 // We don't care about the sign bit, so shift left.
2006 __ Lsl(out, out, 1);
2007 __ eor(out, out, ShifterOperand(infinity));
2008 // If the result is 0, then it has 32 leading zeros, and less than that otherwise.
2009 __ clz(out, out);
2010 // Any number less than 32 logically shifted right by 5 bits results in 0;
2011 // the same operation on 32 yields 1.
2012 __ Lsr(out, out, 5);
2013}
2014
2015void IntrinsicLocationsBuilderARM::VisitDoubleIsInfinite(HInvoke* invoke) {
2016 CreateFPToIntLocations(arena_, invoke);
2017}
2018
2019void IntrinsicCodeGeneratorARM::VisitDoubleIsInfinite(HInvoke* invoke) {
2020 ArmAssembler* const assembler = GetAssembler();
2021 LocationSummary* const locations = invoke->GetLocations();
2022 const Register out = locations->Out().AsRegister<Register>();
2023 // The highest 32 bits of double precision positive infinity separated into
2024 // two constants encodable as immediate operands.
2025 constexpr uint32_t infinity_high = 0x7f000000U;
2026 constexpr uint32_t infinity_high2 = 0x00f00000U;
2027
2028 static_assert((infinity_high | infinity_high2) == static_cast<uint32_t>(kPositiveInfinityDouble >> 32U),
2029 "The constants do not add up to the high 32 bits of double precision positive infinity.");
2030 __ vmovrrd(IP, out, FromLowSToD(locations->InAt(0).AsFpuRegisterPairLow<SRegister>()));
2031 __ eor(out, out, ShifterOperand(infinity_high));
2032 __ eor(out, out, ShifterOperand(infinity_high2));
2033 // We don't care about the sign bit, so shift left.
2034 __ orr(out, IP, ShifterOperand(out, LSL, 1));
2035 // If the result is 0, then it has 32 leading zeros, and less than that otherwise.
2036 __ clz(out, out);
2037 // Any number less than 32 logically shifted right by 5 bits results in 0;
2038 // the same operation on 32 yields 1.
2039 __ Lsr(out, out, 5);
2040}
2041
Aart Bik2f9fcc92016-03-01 15:16:54 -08002042UNIMPLEMENTED_INTRINSIC(ARM, IntegerBitCount)
2043UNIMPLEMENTED_INTRINSIC(ARM, LongBitCount)
2044UNIMPLEMENTED_INTRINSIC(ARM, MathMinDoubleDouble)
2045UNIMPLEMENTED_INTRINSIC(ARM, MathMinFloatFloat)
2046UNIMPLEMENTED_INTRINSIC(ARM, MathMaxDoubleDouble)
2047UNIMPLEMENTED_INTRINSIC(ARM, MathMaxFloatFloat)
2048UNIMPLEMENTED_INTRINSIC(ARM, MathMinLongLong)
2049UNIMPLEMENTED_INTRINSIC(ARM, MathMaxLongLong)
2050UNIMPLEMENTED_INTRINSIC(ARM, MathCeil) // Could be done by changing rounding mode, maybe?
2051UNIMPLEMENTED_INTRINSIC(ARM, MathFloor) // Could be done by changing rounding mode, maybe?
2052UNIMPLEMENTED_INTRINSIC(ARM, MathRint)
2053UNIMPLEMENTED_INTRINSIC(ARM, MathRoundDouble) // Could be done by changing rounding mode, maybe?
2054UNIMPLEMENTED_INTRINSIC(ARM, MathRoundFloat) // Could be done by changing rounding mode, maybe?
2055UNIMPLEMENTED_INTRINSIC(ARM, UnsafeCASLong) // High register pressure.
2056UNIMPLEMENTED_INTRINSIC(ARM, SystemArrayCopyChar)
2057UNIMPLEMENTED_INTRINSIC(ARM, ReferenceGetReferent)
Aart Bik2f9fcc92016-03-01 15:16:54 -08002058UNIMPLEMENTED_INTRINSIC(ARM, IntegerHighestOneBit)
2059UNIMPLEMENTED_INTRINSIC(ARM, LongHighestOneBit)
2060UNIMPLEMENTED_INTRINSIC(ARM, IntegerLowestOneBit)
2061UNIMPLEMENTED_INTRINSIC(ARM, LongLowestOneBit)
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -08002062
Aart Bik0e54c012016-03-04 12:08:31 -08002063// 1.8.
2064UNIMPLEMENTED_INTRINSIC(ARM, UnsafeGetAndAddInt)
2065UNIMPLEMENTED_INTRINSIC(ARM, UnsafeGetAndAddLong)
2066UNIMPLEMENTED_INTRINSIC(ARM, UnsafeGetAndSetInt)
2067UNIMPLEMENTED_INTRINSIC(ARM, UnsafeGetAndSetLong)
2068UNIMPLEMENTED_INTRINSIC(ARM, UnsafeGetAndSetObject)
Aart Bik0e54c012016-03-04 12:08:31 -08002069
Aart Bik2f9fcc92016-03-01 15:16:54 -08002070UNREACHABLE_INTRINSICS(ARM)
Roland Levillain4d027112015-07-01 15:41:14 +01002071
2072#undef __
2073
Andreas Gampe2bcf9bf2015-01-29 09:56:07 -08002074} // namespace arm
2075} // namespace art