blob: afb7fc371834e9939c0ed64d61999e1f75851254 [file] [log] [blame]
/*
 * Copyright (C) 2014 The Android Open Source Project
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
16
17#ifndef ART_COMPILER_OPTIMIZING_CODE_GENERATOR_ARM64_H_
18#define ART_COMPILER_OPTIMIZING_CODE_GENERATOR_ARM64_H_
19
20#include "code_generator.h"
Serban Constantinescu02d81cc2015-01-05 16:08:49 +000021#include "dex/compiler_enums.h"
Calin Juravlecd6dffe2015-01-08 17:35:35 +000022#include "driver/compiler_options.h"
Alexandre Rames5319def2014-10-23 10:03:10 +010023#include "nodes.h"
24#include "parallel_move_resolver.h"
25#include "utils/arm64/assembler_arm64.h"
26#include "a64/disasm-a64.h"
27#include "a64/macro-assembler-a64.h"
28#include "arch/arm64/quick_method_frame_info_arm64.h"
29
30namespace art {
31namespace arm64 {
32
33class CodeGeneratorARM64;
Andreas Gampe878d58c2015-01-15 23:24:00 -080034
35// TODO: Tune the use of Load-Acquire, Store-Release vs Data Memory Barriers.
36// For now we prefer the use of load-acquire, store-release over explicit memory barriers.
37static constexpr bool kUseAcquireRelease = true;
Alexandre Rames5319def2014-10-23 10:03:10 +010038
Nicolas Geoffray86a8d7a2014-11-19 08:47:18 +000039// Use a local definition to prevent copying mistakes.
40static constexpr size_t kArm64WordSize = kArm64PointerSize;
41
Alexandre Rames5319def2014-10-23 10:03:10 +010042static const vixl::Register kParameterCoreRegisters[] = {
43 vixl::x1, vixl::x2, vixl::x3, vixl::x4, vixl::x5, vixl::x6, vixl::x7
44};
45static constexpr size_t kParameterCoreRegistersLength = arraysize(kParameterCoreRegisters);
46static const vixl::FPRegister kParameterFPRegisters[] = {
47 vixl::d0, vixl::d1, vixl::d2, vixl::d3, vixl::d4, vixl::d5, vixl::d6, vixl::d7
48};
49static constexpr size_t kParameterFPRegistersLength = arraysize(kParameterFPRegisters);
50
Andreas Gampe878d58c2015-01-15 23:24:00 -080051const vixl::Register tr = vixl::x18; // Thread Register
52static const vixl::Register kArtMethodRegister = vixl::w0; // Method register on invoke.
Serban Constantinescu3d087de2015-01-28 11:57:05 +000053const vixl::Register kQuickSuspendRegister = vixl::x19;
Alexandre Rames5319def2014-10-23 10:03:10 +010054
55const vixl::CPURegList vixl_reserved_core_registers(vixl::ip0, vixl::ip1);
Alexandre Ramesa89086e2014-11-07 17:13:25 +000056const vixl::CPURegList vixl_reserved_fp_registers(vixl::d31);
Alexandre Rames5319def2014-10-23 10:03:10 +010057
Serban Constantinescu3d087de2015-01-28 11:57:05 +000058// TODO: When the runtime does not use kQuickSuspendRegister as a suspend
59// counter remove it from the reserved registers list.
60const vixl::CPURegList runtime_reserved_core_registers(tr, kQuickSuspendRegister, vixl::lr);
61
62// Callee-saved registers defined by AAPCS64.
63const vixl::CPURegList callee_saved_core_registers(vixl::CPURegister::kRegister,
64 vixl::kXRegSize,
65 vixl::x19.code(),
66 vixl::x30.code());
67const vixl::CPURegList callee_saved_fp_registers(vixl::CPURegister::kFPRegister,
68 vixl::kDRegSize,
69 vixl::d8.code(),
70 vixl::d15.code());
Alexandre Ramesa89086e2014-11-07 17:13:25 +000071Location ARM64ReturnLocation(Primitive::Type return_type);
72
Andreas Gampe878d58c2015-01-15 23:24:00 -080073class SlowPathCodeARM64 : public SlowPathCode {
74 public:
75 SlowPathCodeARM64() : entry_label_(), exit_label_() {}
76
77 vixl::Label* GetEntryLabel() { return &entry_label_; }
78 vixl::Label* GetExitLabel() { return &exit_label_; }
79
80 private:
81 vixl::Label entry_label_;
82 vixl::Label exit_label_;
83
84 DISALLOW_COPY_AND_ASSIGN(SlowPathCodeARM64);
85};
86
Alexandre Rames5319def2014-10-23 10:03:10 +010087class InvokeDexCallingConvention : public CallingConvention<vixl::Register, vixl::FPRegister> {
88 public:
89 InvokeDexCallingConvention()
90 : CallingConvention(kParameterCoreRegisters,
91 kParameterCoreRegistersLength,
92 kParameterFPRegisters,
93 kParameterFPRegistersLength) {}
94
95 Location GetReturnLocation(Primitive::Type return_type) {
Alexandre Ramesa89086e2014-11-07 17:13:25 +000096 return ARM64ReturnLocation(return_type);
Alexandre Rames5319def2014-10-23 10:03:10 +010097 }
98
99
100 private:
101 DISALLOW_COPY_AND_ASSIGN(InvokeDexCallingConvention);
102};
103
104class InvokeDexCallingConventionVisitor {
105 public:
Alexandre Ramesa89086e2014-11-07 17:13:25 +0000106 InvokeDexCallingConventionVisitor() : gp_index_(0), fp_index_(0), stack_index_(0) {}
Alexandre Rames5319def2014-10-23 10:03:10 +0100107
108 Location GetNextLocation(Primitive::Type type);
109 Location GetReturnLocation(Primitive::Type return_type) {
110 return calling_convention.GetReturnLocation(return_type);
111 }
112
113 private:
114 InvokeDexCallingConvention calling_convention;
115 // The current index for core registers.
116 uint32_t gp_index_;
Alexandre Ramesa89086e2014-11-07 17:13:25 +0000117 // The current index for floating-point registers.
118 uint32_t fp_index_;
Alexandre Rames5319def2014-10-23 10:03:10 +0100119 // The current stack index.
120 uint32_t stack_index_;
121
122 DISALLOW_COPY_AND_ASSIGN(InvokeDexCallingConventionVisitor);
123};
124
125class InstructionCodeGeneratorARM64 : public HGraphVisitor {
126 public:
127 InstructionCodeGeneratorARM64(HGraph* graph, CodeGeneratorARM64* codegen);
128
129#define DECLARE_VISIT_INSTRUCTION(name, super) \
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000130 void Visit##name(H##name* instr) OVERRIDE;
Alexandre Rames5319def2014-10-23 10:03:10 +0100131 FOR_EACH_CONCRETE_INSTRUCTION(DECLARE_VISIT_INSTRUCTION)
132#undef DECLARE_VISIT_INSTRUCTION
133
134 void LoadCurrentMethod(XRegister reg);
135
136 Arm64Assembler* GetAssembler() const { return assembler_; }
Alexandre Rames67555f72014-11-18 10:55:16 +0000137 vixl::MacroAssembler* GetVIXLAssembler() { return GetAssembler()->vixl_masm_; }
Alexandre Rames5319def2014-10-23 10:03:10 +0100138
139 private:
Alexandre Rames67555f72014-11-18 10:55:16 +0000140 void GenerateClassInitializationCheck(SlowPathCodeARM64* slow_path, vixl::Register class_reg);
Serban Constantinescu02d81cc2015-01-05 16:08:49 +0000141 void GenerateMemoryBarrier(MemBarrierKind kind);
Serban Constantinescu02164b32014-11-13 14:05:07 +0000142 void GenerateSuspendCheck(HSuspendCheck* instruction, HBasicBlock* successor);
Alexandre Rames67555f72014-11-18 10:55:16 +0000143 void HandleBinaryOp(HBinaryOperation* instr);
Serban Constantinescu02164b32014-11-13 14:05:07 +0000144 void HandleShift(HBinaryOperation* instr);
Calin Juravlecd6dffe2015-01-08 17:35:35 +0000145 void GenerateImplicitNullCheck(HNullCheck* instruction);
146 void GenerateExplicitNullCheck(HNullCheck* instruction);
Alexandre Rames5319def2014-10-23 10:03:10 +0100147
148 Arm64Assembler* const assembler_;
149 CodeGeneratorARM64* const codegen_;
150
151 DISALLOW_COPY_AND_ASSIGN(InstructionCodeGeneratorARM64);
152};
153
154class LocationsBuilderARM64 : public HGraphVisitor {
155 public:
156 explicit LocationsBuilderARM64(HGraph* graph, CodeGeneratorARM64* codegen)
157 : HGraphVisitor(graph), codegen_(codegen) {}
158
159#define DECLARE_VISIT_INSTRUCTION(name, super) \
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000160 void Visit##name(H##name* instr) OVERRIDE;
Alexandre Rames5319def2014-10-23 10:03:10 +0100161 FOR_EACH_CONCRETE_INSTRUCTION(DECLARE_VISIT_INSTRUCTION)
162#undef DECLARE_VISIT_INSTRUCTION
163
164 private:
Alexandre Rames67555f72014-11-18 10:55:16 +0000165 void HandleBinaryOp(HBinaryOperation* instr);
Serban Constantinescu02164b32014-11-13 14:05:07 +0000166 void HandleShift(HBinaryOperation* instr);
Alexandre Rames5319def2014-10-23 10:03:10 +0100167 void HandleInvoke(HInvoke* instr);
168
169 CodeGeneratorARM64* const codegen_;
170 InvokeDexCallingConventionVisitor parameter_visitor_;
171
172 DISALLOW_COPY_AND_ASSIGN(LocationsBuilderARM64);
173};
174
Alexandre Rames3e69f162014-12-10 10:36:50 +0000175class ParallelMoveResolverARM64 : public ParallelMoveResolver {
176 public:
177 ParallelMoveResolverARM64(ArenaAllocator* allocator, CodeGeneratorARM64* codegen)
178 : ParallelMoveResolver(allocator), codegen_(codegen) {}
179
180 void EmitMove(size_t index) OVERRIDE;
181 void EmitSwap(size_t index) OVERRIDE;
182 void RestoreScratch(int reg) OVERRIDE;
183 void SpillScratch(int reg) OVERRIDE;
184
185 private:
186 Arm64Assembler* GetAssembler() const;
187 vixl::MacroAssembler* GetVIXLAssembler() const {
188 return GetAssembler()->vixl_masm_;
189 }
190
191 CodeGeneratorARM64* const codegen_;
192
193 DISALLOW_COPY_AND_ASSIGN(ParallelMoveResolverARM64);
194};
195
Alexandre Rames5319def2014-10-23 10:03:10 +0100196class CodeGeneratorARM64 : public CodeGenerator {
197 public:
Calin Juravlecd6dffe2015-01-08 17:35:35 +0000198 CodeGeneratorARM64(HGraph* graph, const CompilerOptions& compiler_options);
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000199 virtual ~CodeGeneratorARM64() {}
Alexandre Rames5319def2014-10-23 10:03:10 +0100200
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000201 void GenerateFrameEntry() OVERRIDE;
202 void GenerateFrameExit() OVERRIDE;
Alexandre Rames5319def2014-10-23 10:03:10 +0100203
Serban Constantinescu3d087de2015-01-28 11:57:05 +0000204 vixl::CPURegList GetFramePreservedCoreRegisters() const {
205 return vixl::CPURegList(vixl::CPURegister::kRegister, vixl::kXRegSize,
206 core_spill_mask_);
207 }
208
209 vixl::CPURegList GetFramePreservedFPRegisters() const {
210 return vixl::CPURegList(vixl::CPURegister::kFPRegister, vixl::kDRegSize,
211 fpu_spill_mask_);
Alexandre Rames5319def2014-10-23 10:03:10 +0100212 }
Alexandre Rames5319def2014-10-23 10:03:10 +0100213
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000214 void Bind(HBasicBlock* block) OVERRIDE;
Alexandre Rames5319def2014-10-23 10:03:10 +0100215
216 vixl::Label* GetLabelOf(HBasicBlock* block) const {
Nicolas Geoffraydc23d832015-02-16 11:15:43 +0000217 return CommonGetLabelOf<vixl::Label>(block_labels_, block);
Alexandre Rames5319def2014-10-23 10:03:10 +0100218 }
219
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000220 void Move(HInstruction* instruction, Location location, HInstruction* move_for) OVERRIDE;
Alexandre Rames5319def2014-10-23 10:03:10 +0100221
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000222 size_t GetWordSize() const OVERRIDE {
Alexandre Rames5319def2014-10-23 10:03:10 +0100223 return kArm64WordSize;
224 }
225
Mark Mendellf85a9ca2015-01-13 09:20:58 -0500226 size_t GetFloatingPointSpillSlotSize() const OVERRIDE {
227 // Allocated in D registers, which are word sized.
228 return kArm64WordSize;
229 }
230
Alexandre Rames67555f72014-11-18 10:55:16 +0000231 uintptr_t GetAddressOf(HBasicBlock* block) const OVERRIDE {
232 vixl::Label* block_entry_label = GetLabelOf(block);
233 DCHECK(block_entry_label->IsBound());
234 return block_entry_label->location();
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000235 }
Alexandre Rames5319def2014-10-23 10:03:10 +0100236
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000237 HGraphVisitor* GetLocationBuilder() OVERRIDE { return &location_builder_; }
238 HGraphVisitor* GetInstructionVisitor() OVERRIDE { return &instruction_visitor_; }
239 Arm64Assembler* GetAssembler() OVERRIDE { return &assembler_; }
Alexandre Rames67555f72014-11-18 10:55:16 +0000240 vixl::MacroAssembler* GetVIXLAssembler() { return GetAssembler()->vixl_masm_; }
Alexandre Rames5319def2014-10-23 10:03:10 +0100241
242 // Emit a write barrier.
243 void MarkGCCard(vixl::Register object, vixl::Register value);
244
245 // Register allocation.
246
Nicolas Geoffray98893962015-01-21 12:32:32 +0000247 void SetupBlockedRegisters(bool is_baseline) const OVERRIDE;
Alexandre Rames5319def2014-10-23 10:03:10 +0100248 // AllocateFreeRegister() is only used when allocating registers locally
249 // during CompileBaseline().
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000250 Location AllocateFreeRegister(Primitive::Type type) const OVERRIDE;
Alexandre Rames5319def2014-10-23 10:03:10 +0100251
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000252 Location GetStackLocation(HLoadLocal* load) const OVERRIDE;
Alexandre Rames5319def2014-10-23 10:03:10 +0100253
Alexandre Rames3e69f162014-12-10 10:36:50 +0000254 size_t SaveCoreRegister(size_t stack_index, uint32_t reg_id);
255 size_t RestoreCoreRegister(size_t stack_index, uint32_t reg_id);
256 size_t SaveFloatingPointRegister(size_t stack_index, uint32_t reg_id);
257 size_t RestoreFloatingPointRegister(size_t stack_index, uint32_t reg_id);
Alexandre Rames5319def2014-10-23 10:03:10 +0100258
259 // The number of registers that can be allocated. The register allocator may
260 // decide to reserve and not use a few of them.
261 // We do not consider registers sp, xzr, wzr. They are either not allocatable
262 // (xzr, wzr), or make for poor allocatable registers (sp alignment
263 // requirements, etc.). This also facilitates our task as all other registers
264 // can easily be mapped via to or from their type and index or code.
Alexandre Ramesa89086e2014-11-07 17:13:25 +0000265 static const int kNumberOfAllocatableRegisters = vixl::kNumberOfRegisters - 1;
266 static const int kNumberOfAllocatableFPRegisters = vixl::kNumberOfFPRegisters;
Alexandre Rames5319def2014-10-23 10:03:10 +0100267 static constexpr int kNumberOfAllocatableRegisterPairs = 0;
268
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000269 void DumpCoreRegister(std::ostream& stream, int reg) const OVERRIDE;
270 void DumpFloatingPointRegister(std::ostream& stream, int reg) const OVERRIDE;
Alexandre Rames5319def2014-10-23 10:03:10 +0100271
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000272 InstructionSet GetInstructionSet() const OVERRIDE {
Alexandre Rames5319def2014-10-23 10:03:10 +0100273 return InstructionSet::kArm64;
274 }
275
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000276 void Initialize() OVERRIDE {
Alexandre Rames5319def2014-10-23 10:03:10 +0100277 HGraph* graph = GetGraph();
278 int length = graph->GetBlocks().Size();
279 block_labels_ = graph->GetArena()->AllocArray<vixl::Label>(length);
280 for (int i = 0; i < length; ++i) {
281 new(block_labels_ + i) vixl::Label();
282 }
283 }
284
Serban Constantinescu32f5b4d2014-11-25 20:05:46 +0000285 void Finalize(CodeAllocator* allocator) OVERRIDE;
286
Alexandre Ramesfc19de82014-11-07 17:13:31 +0000287 // Code generation helpers.
Alexandre Rames67555f72014-11-18 10:55:16 +0000288 void MoveConstant(vixl::CPURegister destination, HConstant* constant);
Alexandre Rames3e69f162014-12-10 10:36:50 +0000289 // The type is optional. When specified it must be coherent with the
290 // locations, and is used for optimisation and debugging.
291 void MoveLocation(Location destination, Location source,
292 Primitive::Type type = Primitive::kPrimVoid);
293 void SwapLocations(Location loc_1, Location loc_2);
Alexandre Rames67555f72014-11-18 10:55:16 +0000294 void Load(Primitive::Type type, vixl::CPURegister dst, const vixl::MemOperand& src);
295 void Store(Primitive::Type type, vixl::CPURegister rt, const vixl::MemOperand& dst);
296 void LoadCurrentMethod(vixl::Register current_method);
Calin Juravle77520bc2015-01-12 18:45:46 +0000297 void LoadAcquire(HInstruction* instruction, vixl::CPURegister dst, const vixl::MemOperand& src);
Serban Constantinescu02d81cc2015-01-05 16:08:49 +0000298 void StoreRelease(Primitive::Type type, vixl::CPURegister rt, const vixl::MemOperand& dst);
Alexandre Rames67555f72014-11-18 10:55:16 +0000299
300 // Generate code to invoke a runtime entry point.
301 void InvokeRuntime(int32_t offset, HInstruction* instruction, uint32_t dex_pc);
Alexandre Ramesfc19de82014-11-07 17:13:31 +0000302
Alexandre Rames3e69f162014-12-10 10:36:50 +0000303 ParallelMoveResolverARM64* GetMoveResolver() { return &move_resolver_; }
Nicolas Geoffrayf0e39372014-11-12 17:50:07 +0000304
Nicolas Geoffray840e5462015-01-07 16:01:24 +0000305 bool NeedsTwoRegisters(Primitive::Type type ATTRIBUTE_UNUSED) const OVERRIDE {
306 return false;
307 }
308
Andreas Gampe878d58c2015-01-15 23:24:00 -0800309 void GenerateStaticOrDirectCall(HInvokeStaticOrDirect* invoke, vixl::Register temp);
310
Alexandre Rames5319def2014-10-23 10:03:10 +0100311 private:
312 // Labels for each block that will be compiled.
313 vixl::Label* block_labels_;
Nicolas Geoffray1cf95282014-12-12 19:22:03 +0000314 vixl::Label frame_entry_label_;
Alexandre Rames5319def2014-10-23 10:03:10 +0100315
316 LocationsBuilderARM64 location_builder_;
317 InstructionCodeGeneratorARM64 instruction_visitor_;
Alexandre Rames3e69f162014-12-10 10:36:50 +0000318 ParallelMoveResolverARM64 move_resolver_;
Alexandre Rames5319def2014-10-23 10:03:10 +0100319 Arm64Assembler assembler_;
320
321 DISALLOW_COPY_AND_ASSIGN(CodeGeneratorARM64);
322};
323
Alexandre Rames3e69f162014-12-10 10:36:50 +0000324inline Arm64Assembler* ParallelMoveResolverARM64::GetAssembler() const {
325 return codegen_->GetAssembler();
326}
327
Alexandre Rames5319def2014-10-23 10:03:10 +0100328} // namespace arm64
329} // namespace art
330
331#endif // ART_COMPILER_OPTIMIZING_CODE_GENERATOR_ARM64_H_