blob: b8553d266dd967798cf7d4af27f50286b45a4f72 [file] [log] [blame]
/*
 * Copyright (C) 2014 The Android Open Source Project
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
16
17#ifndef ART_COMPILER_OPTIMIZING_CODE_GENERATOR_X86_H_
18#define ART_COMPILER_OPTIMIZING_CODE_GENERATOR_X86_H_
19
20#include "code_generator.h"
Calin Juravle52c48962014-12-16 17:02:57 +000021#include "dex/compiler_enums.h"
Calin Juravlecd6dffe2015-01-08 17:35:35 +000022#include "driver/compiler_options.h"
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +000023#include "nodes.h"
Nicolas Geoffray86dbb9a2014-06-04 11:12:39 +010024#include "parallel_move_resolver.h"
Nicolas Geoffray787c3072014-03-17 10:20:19 +000025#include "utils/x86/assembler_x86.h"
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +000026
27namespace art {
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +000028namespace x86 {
29
Nicolas Geoffray86a8d7a2014-11-19 08:47:18 +000030// Use a local definition to prevent copying mistakes.
31static constexpr size_t kX86WordSize = kX86PointerSize;
Nicolas Geoffray707c8092014-04-04 10:50:14 +010032
// Forward declarations: both classes are defined later in this header but are
// referenced (by pointer) by the classes declared before them.
class CodeGeneratorX86;
class SlowPathCodeX86;
Nicolas Geoffray01bc96d2014-04-11 17:43:50 +010035
Nicolas Geoffraya747a392014-04-17 14:56:23 +010036static constexpr Register kParameterCoreRegisters[] = { ECX, EDX, EBX };
37static constexpr RegisterPair kParameterCorePairRegisters[] = { ECX_EDX, EDX_EBX };
38static constexpr size_t kParameterCoreRegistersLength = arraysize(kParameterCoreRegisters);
Mark P Mendell966c3ae2015-01-27 15:45:27 +000039static constexpr XmmRegister kParameterFpuRegisters[] = { XMM0, XMM1, XMM2, XMM3 };
40static constexpr size_t kParameterFpuRegistersLength = arraysize(kParameterFpuRegisters);
Nicolas Geoffraya747a392014-04-17 14:56:23 +010041
Nicolas Geoffrayd75948a2015-03-27 09:53:16 +000042static constexpr Register kRuntimeParameterCoreRegisters[] = { EAX, ECX, EDX, EBX };
43static constexpr size_t kRuntimeParameterCoreRegistersLength =
44 arraysize(kRuntimeParameterCoreRegisters);
45static constexpr XmmRegister kRuntimeParameterFpuRegisters[] = { XMM0, XMM1, XMM2, XMM3 };
46static constexpr size_t kRuntimeParameterFpuRegistersLength =
47 arraysize(kRuntimeParameterFpuRegisters);
48
49class InvokeRuntimeCallingConvention : public CallingConvention<Register, XmmRegister> {
50 public:
51 InvokeRuntimeCallingConvention()
52 : CallingConvention(kRuntimeParameterCoreRegisters,
53 kRuntimeParameterCoreRegistersLength,
54 kRuntimeParameterFpuRegisters,
Mathieu Chartiere401d142015-04-22 13:56:20 -070055 kRuntimeParameterFpuRegistersLength,
56 kX86PointerSize) {}
Nicolas Geoffrayd75948a2015-03-27 09:53:16 +000057
58 private:
59 DISALLOW_COPY_AND_ASSIGN(InvokeRuntimeCallingConvention);
60};
61
Nicolas Geoffray7fb49da2014-10-06 09:12:41 +010062class InvokeDexCallingConvention : public CallingConvention<Register, XmmRegister> {
Nicolas Geoffraya747a392014-04-17 14:56:23 +010063 public:
Nicolas Geoffray7fb49da2014-10-06 09:12:41 +010064 InvokeDexCallingConvention() : CallingConvention(
65 kParameterCoreRegisters,
66 kParameterCoreRegistersLength,
67 kParameterFpuRegisters,
Mathieu Chartiere401d142015-04-22 13:56:20 -070068 kParameterFpuRegistersLength,
69 kX86PointerSize) {}
Nicolas Geoffraya747a392014-04-17 14:56:23 +010070
71 RegisterPair GetRegisterPairAt(size_t argument_index) {
72 DCHECK_LT(argument_index + 1, GetNumberOfRegisters());
73 return kParameterCorePairRegisters[argument_index];
74 }
75
76 private:
77 DISALLOW_COPY_AND_ASSIGN(InvokeDexCallingConvention);
78};
79
Roland Levillain2d27c8e2015-04-28 15:48:45 +010080class InvokeDexCallingConventionVisitorX86 : public InvokeDexCallingConventionVisitor {
Nicolas Geoffraya747a392014-04-17 14:56:23 +010081 public:
Roland Levillain2d27c8e2015-04-28 15:48:45 +010082 InvokeDexCallingConventionVisitorX86() {}
83 virtual ~InvokeDexCallingConventionVisitorX86() {}
Nicolas Geoffraya747a392014-04-17 14:56:23 +010084
Roland Levillain2d27c8e2015-04-28 15:48:45 +010085 Location GetNextLocation(Primitive::Type type) OVERRIDE;
Nicolas Geoffrayfd88f162015-06-03 11:23:52 +010086 Location GetReturnLocation(Primitive::Type type) const OVERRIDE;
87 Location GetMethodLocation() const OVERRIDE;
Nicolas Geoffraya747a392014-04-17 14:56:23 +010088
89 private:
90 InvokeDexCallingConvention calling_convention;
Nicolas Geoffraya747a392014-04-17 14:56:23 +010091
Roland Levillain2d27c8e2015-04-28 15:48:45 +010092 DISALLOW_COPY_AND_ASSIGN(InvokeDexCallingConventionVisitorX86);
Nicolas Geoffraya747a392014-04-17 14:56:23 +010093};
94
Zheng Xuad4450e2015-04-17 18:48:56 +080095class ParallelMoveResolverX86 : public ParallelMoveResolverWithSwap {
Nicolas Geoffray86dbb9a2014-06-04 11:12:39 +010096 public:
97 ParallelMoveResolverX86(ArenaAllocator* allocator, CodeGeneratorX86* codegen)
Zheng Xuad4450e2015-04-17 18:48:56 +080098 : ParallelMoveResolverWithSwap(allocator), codegen_(codegen) {}
Nicolas Geoffray86dbb9a2014-06-04 11:12:39 +010099
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000100 void EmitMove(size_t index) OVERRIDE;
101 void EmitSwap(size_t index) OVERRIDE;
102 void SpillScratch(int reg) OVERRIDE;
103 void RestoreScratch(int reg) OVERRIDE;
Nicolas Geoffray86dbb9a2014-06-04 11:12:39 +0100104
105 X86Assembler* GetAssembler() const;
106
107 private:
108 void Exchange(Register reg, int mem);
109 void Exchange(int mem1, int mem2);
Mark Mendell7c8d0092015-01-26 11:21:33 -0500110 void Exchange32(XmmRegister reg, int mem);
111 void MoveMemoryToMemory32(int dst, int src);
112 void MoveMemoryToMemory64(int dst, int src);
Nicolas Geoffray86dbb9a2014-06-04 11:12:39 +0100113
114 CodeGeneratorX86* const codegen_;
115
116 DISALLOW_COPY_AND_ASSIGN(ParallelMoveResolverX86);
117};
118
Nicolas Geoffraybab4ed72014-03-11 17:53:17 +0000119class LocationsBuilderX86 : public HGraphVisitor {
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000120 public:
Nicolas Geoffray01bc96d2014-04-11 17:43:50 +0100121 LocationsBuilderX86(HGraph* graph, CodeGeneratorX86* codegen)
122 : HGraphVisitor(graph), codegen_(codegen) {}
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000123
Nicolas Geoffray360231a2014-10-08 21:07:48 +0100124#define DECLARE_VISIT_INSTRUCTION(name, super) \
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000125 void Visit##name(H##name* instr) OVERRIDE;
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000126
Nicolas Geoffray96f89a22014-07-11 10:57:49 +0100127 FOR_EACH_CONCRETE_INSTRUCTION(DECLARE_VISIT_INSTRUCTION)
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000128
129#undef DECLARE_VISIT_INSTRUCTION
130
Nicolas Geoffray9574c4b2014-11-12 13:19:37 +0000131 private:
132 void HandleBitwiseOperation(HBinaryOperation* instruction);
Nicolas Geoffraye982f0b2014-08-13 02:11:24 +0100133 void HandleInvoke(HInvoke* invoke);
Calin Juravle9aec02f2014-11-18 23:06:35 +0000134 void HandleShift(HBinaryOperation* instruction);
Calin Juravle52c48962014-12-16 17:02:57 +0000135 void HandleFieldSet(HInstruction* instruction, const FieldInfo& field_info);
136 void HandleFieldGet(HInstruction* instruction, const FieldInfo& field_info);
Nicolas Geoffraye982f0b2014-08-13 02:11:24 +0100137
Nicolas Geoffray01bc96d2014-04-11 17:43:50 +0100138 CodeGeneratorX86* const codegen_;
Roland Levillain2d27c8e2015-04-28 15:48:45 +0100139 InvokeDexCallingConventionVisitorX86 parameter_visitor_;
Nicolas Geoffray01bc96d2014-04-11 17:43:50 +0100140
Nicolas Geoffraybab4ed72014-03-11 17:53:17 +0000141 DISALLOW_COPY_AND_ASSIGN(LocationsBuilderX86);
142};
143
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000144class InstructionCodeGeneratorX86 : public HGraphVisitor {
Nicolas Geoffraybab4ed72014-03-11 17:53:17 +0000145 public:
Nicolas Geoffray4a34a422014-04-03 10:38:37 +0100146 InstructionCodeGeneratorX86(HGraph* graph, CodeGeneratorX86* codegen);
Nicolas Geoffraybab4ed72014-03-11 17:53:17 +0000147
Nicolas Geoffray360231a2014-10-08 21:07:48 +0100148#define DECLARE_VISIT_INSTRUCTION(name, super) \
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000149 void Visit##name(H##name* instr) OVERRIDE;
Nicolas Geoffraybab4ed72014-03-11 17:53:17 +0000150
Nicolas Geoffray96f89a22014-07-11 10:57:49 +0100151 FOR_EACH_CONCRETE_INSTRUCTION(DECLARE_VISIT_INSTRUCTION)
Nicolas Geoffraybab4ed72014-03-11 17:53:17 +0000152
153#undef DECLARE_VISIT_INSTRUCTION
154
Nicolas Geoffray4a34a422014-04-03 10:38:37 +0100155 X86Assembler* GetAssembler() const { return assembler_; }
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000156
157 private:
Nicolas Geoffray3c049742014-09-24 18:10:46 +0100158 // Generate code for the given suspend check. If not null, `successor`
159 // is the block to branch to if the suspend check is not needed, and after
160 // the suspend call.
161 void GenerateSuspendCheck(HSuspendCheck* check, HBasicBlock* successor);
Nicolas Geoffray424f6762014-11-03 14:51:25 +0000162 void GenerateClassInitializationCheck(SlowPathCodeX86* slow_path, Register class_reg);
Nicolas Geoffray9574c4b2014-11-12 13:19:37 +0000163 void HandleBitwiseOperation(HBinaryOperation* instruction);
Calin Juravlebacfec32014-11-14 15:54:36 +0000164 void GenerateDivRemIntegral(HBinaryOperation* instruction);
Guillaume Sanchez0f88e872015-03-30 17:55:45 +0100165 void DivRemOneOrMinusOne(HBinaryOperation* instruction);
Guillaume Sanchezb19930c2015-04-09 21:12:15 +0100166 void DivByPowerOfTwo(HDiv* instruction);
Guillaume Sanchez0f88e872015-03-30 17:55:45 +0100167 void GenerateDivRemWithAnyConstant(HBinaryOperation* instruction);
Mark Mendell24f2dfa2015-01-14 19:51:45 -0500168 void GenerateRemFP(HRem *rem);
Calin Juravle9aec02f2014-11-18 23:06:35 +0000169 void HandleShift(HBinaryOperation* instruction);
170 void GenerateShlLong(const Location& loc, Register shifter);
171 void GenerateShrLong(const Location& loc, Register shifter);
172 void GenerateUShrLong(const Location& loc, Register shifter);
Mark P Mendell73945692015-04-29 14:56:17 +0000173 void GenerateShlLong(const Location& loc, int shift);
174 void GenerateShrLong(const Location& loc, int shift);
175 void GenerateUShrLong(const Location& loc, int shift);
Calin Juravle52c48962014-12-16 17:02:57 +0000176 void GenerateMemoryBarrier(MemBarrierKind kind);
Nicolas Geoffray07276db2015-05-18 14:22:09 +0100177 void HandleFieldSet(HInstruction* instruction,
178 const FieldInfo& field_info,
179 bool value_can_be_null);
Calin Juravle52c48962014-12-16 17:02:57 +0000180 void HandleFieldGet(HInstruction* instruction, const FieldInfo& field_info);
Roland Levillain232ade02015-04-20 15:14:36 +0100181 // Push value to FPU stack. `is_fp` specifies whether the value is floating point or not.
182 // `is_wide` specifies whether it is long/double or not.
Mark Mendell24f2dfa2015-01-14 19:51:45 -0500183 void PushOntoFPStack(Location source, uint32_t temp_offset,
Roland Levillain232ade02015-04-20 15:14:36 +0100184 uint32_t stack_adjustment, bool is_fp, bool is_wide);
Nicolas Geoffray3c049742014-09-24 18:10:46 +0100185
Calin Juravlecd6dffe2015-01-08 17:35:35 +0000186 void GenerateImplicitNullCheck(HNullCheck* instruction);
187 void GenerateExplicitNullCheck(HNullCheck* instruction);
Mingyao Yangd43b3ac2015-04-01 14:03:04 -0700188 void GenerateTestAndBranch(HInstruction* instruction,
189 Label* true_target,
190 Label* false_target,
191 Label* always_true_target);
Calin Juravlecd6dffe2015-01-08 17:35:35 +0000192
Nicolas Geoffray4a34a422014-04-03 10:38:37 +0100193 X86Assembler* const assembler_;
194 CodeGeneratorX86* const codegen_;
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000195
196 DISALLOW_COPY_AND_ASSIGN(InstructionCodeGeneratorX86);
197};
198
199class CodeGeneratorX86 : public CodeGenerator {
200 public:
Mark Mendellfb8d2792015-03-31 22:16:59 -0400201 CodeGeneratorX86(HGraph* graph,
202 const X86InstructionSetFeatures& isa_features,
203 const CompilerOptions& compiler_options);
Nicolas Geoffrayf12feb82014-07-17 18:32:41 +0100204 virtual ~CodeGeneratorX86() {}
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000205
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000206 void GenerateFrameEntry() OVERRIDE;
207 void GenerateFrameExit() OVERRIDE;
208 void Bind(HBasicBlock* block) OVERRIDE;
209 void Move(HInstruction* instruction, Location location, HInstruction* move_for) OVERRIDE;
210 size_t SaveCoreRegister(size_t stack_index, uint32_t reg_id) OVERRIDE;
211 size_t RestoreCoreRegister(size_t stack_index, uint32_t reg_id) OVERRIDE;
Mark Mendell7c8d0092015-01-26 11:21:33 -0500212 size_t SaveFloatingPointRegister(size_t stack_index, uint32_t reg_id) OVERRIDE;
213 size_t RestoreFloatingPointRegister(size_t stack_index, uint32_t reg_id) OVERRIDE;
Nicolas Geoffraybab4ed72014-03-11 17:53:17 +0000214
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000215 size_t GetWordSize() const OVERRIDE {
Nicolas Geoffray707c8092014-04-04 10:50:14 +0100216 return kX86WordSize;
217 }
218
Mark Mendellf85a9ca2015-01-13 09:20:58 -0500219 size_t GetFloatingPointSpillSlotSize() const OVERRIDE {
220 // 8 bytes == 2 words for each spill.
221 return 2 * kX86WordSize;
222 }
223
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000224 HGraphVisitor* GetLocationBuilder() OVERRIDE {
Nicolas Geoffraybab4ed72014-03-11 17:53:17 +0000225 return &location_builder_;
226 }
227
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000228 HGraphVisitor* GetInstructionVisitor() OVERRIDE {
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000229 return &instruction_visitor_;
230 }
231
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000232 X86Assembler* GetAssembler() OVERRIDE {
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000233 return &assembler_;
234 }
235
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000236 uintptr_t GetAddressOf(HBasicBlock* block) const OVERRIDE {
237 return GetLabelOf(block)->Position();
238 }
Calin Juravle34bacdf2014-10-07 20:23:36 +0100239
Nicolas Geoffray98893962015-01-21 12:32:32 +0000240 void SetupBlockedRegisters(bool is_baseline) const OVERRIDE;
Nicolas Geoffraya7aca372014-04-28 17:47:12 +0100241
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000242 Location AllocateFreeRegister(Primitive::Type type) const OVERRIDE;
Nicolas Geoffray4a34a422014-04-03 10:38:37 +0100243
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000244 Location GetStackLocation(HLoadLocal* load) const OVERRIDE;
245
246 void DumpCoreRegister(std::ostream& stream, int reg) const OVERRIDE;
247 void DumpFloatingPointRegister(std::ostream& stream, int reg) const OVERRIDE;
Nicolas Geoffraya7062e02014-05-22 12:50:17 +0100248
Calin Juravle34bacdf2014-10-07 20:23:36 +0100249 // Blocks all register pairs made out of blocked core registers.
250 void UpdateBlockedPairRegisters() const;
251
Nicolas Geoffrayf0e39372014-11-12 17:50:07 +0000252 ParallelMoveResolverX86* GetMoveResolver() OVERRIDE {
Nicolas Geoffray86dbb9a2014-06-04 11:12:39 +0100253 return &move_resolver_;
254 }
255
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000256 InstructionSet GetInstructionSet() const OVERRIDE {
Nicolas Geoffray412f10c2014-06-19 10:00:34 +0100257 return InstructionSet::kX86;
258 }
259
Nicolas Geoffray01bc96d2014-04-11 17:43:50 +0100260 // Helper method to move a 32bits value between two locations.
261 void Move32(Location destination, Location source);
262 // Helper method to move a 64bits value between two locations.
263 void Move64(Location destination, Location source);
264
Mark Mendell09ed1a32015-03-25 08:30:06 -0400265 // Generate a call to a static or direct method.
Nicolas Geoffray38207af2015-06-01 15:46:22 +0100266 void GenerateStaticOrDirectCall(HInvokeStaticOrDirect* invoke, Location temp);
Mark Mendell09ed1a32015-03-25 08:30:06 -0400267
Nicolas Geoffray3c7bb982014-07-23 16:04:16 +0100268 // Emit a write barrier.
Nicolas Geoffray07276db2015-05-18 14:22:09 +0100269 void MarkGCCard(Register temp,
270 Register card,
271 Register object,
272 Register value,
273 bool value_can_be_null);
Nicolas Geoffray3c7bb982014-07-23 16:04:16 +0100274
Nicolas Geoffray19a19cf2014-10-22 16:07:05 +0100275 void LoadCurrentMethod(Register reg);
276
Nicolas Geoffray92a73ae2014-10-16 11:12:52 +0100277 Label* GetLabelOf(HBasicBlock* block) const {
Nicolas Geoffraydc23d832015-02-16 11:15:43 +0000278 return CommonGetLabelOf<Label>(block_labels_.GetRawStorage(), block);
Nicolas Geoffray92a73ae2014-10-16 11:12:52 +0100279 }
280
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000281 void Initialize() OVERRIDE {
Nicolas Geoffray92a73ae2014-10-16 11:12:52 +0100282 block_labels_.SetSize(GetGraph()->GetBlocks().Size());
283 }
284
Nicolas Geoffray840e5462015-01-07 16:01:24 +0000285 bool NeedsTwoRegisters(Primitive::Type type) const OVERRIDE {
286 return type == Primitive::kPrimLong;
287 }
288
Nicolas Geoffray234d69d2015-03-09 10:28:50 +0000289 bool ShouldSplitLongMoves() const OVERRIDE { return true; }
290
Nicolas Geoffray1cf95282014-12-12 19:22:03 +0000291 Label* GetFrameEntryLabel() { return &frame_entry_label_; }
292
Mark Mendellfb8d2792015-03-31 22:16:59 -0400293 const X86InstructionSetFeatures& GetInstructionSetFeatures() const {
294 return isa_features_;
295 }
296
Nicolas Geoffray3c7bb982014-07-23 16:04:16 +0100297 private:
Nicolas Geoffray92a73ae2014-10-16 11:12:52 +0100298 // Labels for each block that will be compiled.
299 GrowableArray<Label> block_labels_;
Nicolas Geoffray1cf95282014-12-12 19:22:03 +0000300 Label frame_entry_label_;
Nicolas Geoffraybab4ed72014-03-11 17:53:17 +0000301 LocationsBuilderX86 location_builder_;
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000302 InstructionCodeGeneratorX86 instruction_visitor_;
Nicolas Geoffray86dbb9a2014-06-04 11:12:39 +0100303 ParallelMoveResolverX86 move_resolver_;
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000304 X86Assembler assembler_;
Mark Mendellfb8d2792015-03-31 22:16:59 -0400305 const X86InstructionSetFeatures& isa_features_;
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000306
307 DISALLOW_COPY_AND_ASSIGN(CodeGeneratorX86);
308};
309
Mark Mendell09ed1a32015-03-25 08:30:06 -0400310class SlowPathCodeX86 : public SlowPathCode {
311 public:
312 SlowPathCodeX86() : entry_label_(), exit_label_() {}
313
314 Label* GetEntryLabel() { return &entry_label_; }
315 Label* GetExitLabel() { return &exit_label_; }
316
317 private:
318 Label entry_label_;
319 Label exit_label_;
320
321 DISALLOW_COPY_AND_ASSIGN(SlowPathCodeX86);
322};
323
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000324} // namespace x86
325} // namespace art
326
327#endif // ART_COMPILER_OPTIMIZING_CODE_GENERATOR_X86_H_