blob: 1dcee29030426632899487177d07ff2381a14bc1 [file] [log] [blame]
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +00001/*
2 * Copyright (C) 2014 The Android Open Source Project
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 * http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
16
17#ifndef ART_COMPILER_OPTIMIZING_CODE_GENERATOR_H_
18#define ART_COMPILER_OPTIMIZING_CODE_GENERATOR_H_
19
Ian Rogersd582fa42014-11-05 23:46:43 -080020#include "arch/instruction_set.h"
Calin Juravle34166012014-12-19 17:22:29 +000021#include "arch/instruction_set_features.h"
Vladimir Markof9f64412015-09-02 14:05:49 +010022#include "base/arena_containers.h"
23#include "base/arena_object.h"
Nicolas Geoffray01bc96d2014-04-11 17:43:50 +010024#include "base/bit_field.h"
Vladimir Marko70e97462016-08-09 11:04:26 +010025#include "base/bit_utils.h"
Andreas Gampe542451c2016-07-26 09:02:02 -070026#include "base/enums.h"
Nicolas Geoffraybab4ed72014-03-11 17:53:17 +000027#include "globals.h"
Alexandre Rameseb7b7392015-06-19 14:47:01 +010028#include "graph_visualizer.h"
Nicolas Geoffray4e3d23a2014-05-22 18:32:45 +010029#include "locations.h"
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +000030#include "memory_region.h"
31#include "nodes.h"
Serban Constantinescuecc43662015-08-13 13:33:12 +010032#include "optimizing_compiler_stats.h"
Mathieu Chartier3af00dc2016-11-10 11:25:57 -080033#include "read_barrier_option.h"
Nicolas Geoffray39468442014-09-02 15:17:15 +010034#include "stack_map_stream.h"
Nicolas Geoffray132d8362016-11-16 09:19:42 +000035#include "string_reference.h"
Mathieu Chartierdbddc222017-05-24 12:04:13 -070036#include "type_reference.h"
Andreas Gampe85b62f22015-09-09 13:15:38 -070037#include "utils/label.h"
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +000038
39namespace art {
40
// Binary (IEEE 754 double-precision) encoding of 2^32 for type double.
static constexpr int64_t k2Pow32EncodingForDouble = INT64_C(0x41F0000000000000);
// Binary (IEEE 754 double-precision) encoding of 2^31 for type double.
static constexpr int64_t k2Pow31EncodingForDouble = INT64_C(0x41E0000000000000);

// Minimum value for a primitive integer.
// Spelled as INT32_MIN rather than 0x80000000: that hexadecimal literal has an
// unsigned type, so initializing a signed 32-bit constant from it depends on an
// implementation-defined out-of-range conversion.
static constexpr int32_t kPrimIntMin = INT32_MIN;
// Minimum value for a primitive long.
// Spelled as INT64_MIN for the same reason: 0x8000000000000000 does not fit in
// any signed 64-bit type, so the literal is unsigned.
static constexpr int64_t kPrimLongMin = INT64_MIN;

// Maximum value for a primitive integer.
static constexpr int32_t kPrimIntMax = INT32_MAX;
// Maximum value for a primitive long.
static constexpr int64_t kPrimLongMax = INT64_MAX;
Roland Levillain3f8f9362014-12-02 17:45:01 +000055
Mathieu Chartier3af00dc2016-11-10 11:25:57 -080056static constexpr ReadBarrierOption kCompilerReadBarrierOption =
57 kEmitCompilerReadBarrier ? kWithReadBarrier : kWithoutReadBarrier;
58
Nicolas Geoffray92a73ae2014-10-16 11:12:52 +010059class Assembler;
Nicolas Geoffraye5038322014-07-04 09:41:32 +010060class CodeGenerator;
Nicolas Geoffrayd28b9692015-11-04 14:36:55 +000061class CompilerDriver;
Vladimir Marko3a21e382016-09-02 12:38:38 +010062class CompilerOptions;
Vladimir Marko58155012015-08-19 12:49:41 +000063class LinkerPatch;
Nicolas Geoffrayf0e39372014-11-12 17:50:07 +000064class ParallelMoveResolver;
Nicolas Geoffray92cf83e2014-03-18 17:59:20 +000065
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +000066class CodeAllocator {
67 public:
Nicolas Geoffraye5038322014-07-04 09:41:32 +010068 CodeAllocator() {}
69 virtual ~CodeAllocator() {}
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +000070
71 virtual uint8_t* Allocate(size_t size) = 0;
72
73 private:
74 DISALLOW_COPY_AND_ASSIGN(CodeAllocator);
75};
76
Alexandre Ramesc01a6642016-04-15 11:54:06 +010077class SlowPathCode : public DeletableArenaObject<kArenaAllocSlowPaths> {
Nicolas Geoffraye5038322014-07-04 09:41:32 +010078 public:
David Srbecky9cd6d372016-02-09 15:24:47 +000079 explicit SlowPathCode(HInstruction* instruction) : instruction_(instruction) {
Nicolas Geoffrayeeefa122015-03-13 18:52:59 +000080 for (size_t i = 0; i < kMaximumNumberOfExpectedRegisters; ++i) {
81 saved_core_stack_offsets_[i] = kRegisterNotSaved;
82 saved_fpu_stack_offsets_[i] = kRegisterNotSaved;
83 }
84 }
85
Nicolas Geoffraye5038322014-07-04 09:41:32 +010086 virtual ~SlowPathCode() {}
87
Nicolas Geoffraye5038322014-07-04 09:41:32 +010088 virtual void EmitNativeCode(CodeGenerator* codegen) = 0;
89
Roland Levillain4359e612016-07-20 11:32:19 +010090 // Save live core and floating-point caller-save registers and
91 // update the stack mask in `locations` for registers holding object
92 // references.
Zheng Xuda403092015-04-24 17:35:39 +080093 virtual void SaveLiveRegisters(CodeGenerator* codegen, LocationSummary* locations);
Roland Levillain4359e612016-07-20 11:32:19 +010094 // Restore live core and floating-point caller-save registers.
Zheng Xuda403092015-04-24 17:35:39 +080095 virtual void RestoreLiveRegisters(CodeGenerator* codegen, LocationSummary* locations);
Nicolas Geoffraya8ac9132015-03-13 16:36:36 +000096
Nicolas Geoffrayeeefa122015-03-13 18:52:59 +000097 bool IsCoreRegisterSaved(int reg) const {
98 return saved_core_stack_offsets_[reg] != kRegisterNotSaved;
99 }
100
101 bool IsFpuRegisterSaved(int reg) const {
102 return saved_fpu_stack_offsets_[reg] != kRegisterNotSaved;
103 }
104
105 uint32_t GetStackOffsetOfCoreRegister(int reg) const {
106 return saved_core_stack_offsets_[reg];
107 }
108
109 uint32_t GetStackOffsetOfFpuRegister(int reg) const {
110 return saved_fpu_stack_offsets_[reg];
111 }
112
Alexandre Rames8158f282015-08-07 10:26:17 +0100113 virtual bool IsFatal() const { return false; }
114
Alexandre Rames9931f312015-06-19 14:47:01 +0100115 virtual const char* GetDescription() const = 0;
116
Andreas Gampe85b62f22015-09-09 13:15:38 -0700117 Label* GetEntryLabel() { return &entry_label_; }
118 Label* GetExitLabel() { return &exit_label_; }
119
David Srbeckyd28f4a02016-03-14 17:14:24 +0000120 HInstruction* GetInstruction() const {
121 return instruction_;
122 }
123
David Srbecky9cd6d372016-02-09 15:24:47 +0000124 uint32_t GetDexPc() const {
125 return instruction_ != nullptr ? instruction_->GetDexPc() : kNoDexPc;
126 }
127
Zheng Xuda403092015-04-24 17:35:39 +0800128 protected:
Nicolas Geoffrayeeefa122015-03-13 18:52:59 +0000129 static constexpr size_t kMaximumNumberOfExpectedRegisters = 32;
130 static constexpr uint32_t kRegisterNotSaved = -1;
David Srbecky9cd6d372016-02-09 15:24:47 +0000131 // The instruction where this slow path is happening.
132 HInstruction* instruction_;
Nicolas Geoffrayeeefa122015-03-13 18:52:59 +0000133 uint32_t saved_core_stack_offsets_[kMaximumNumberOfExpectedRegisters];
134 uint32_t saved_fpu_stack_offsets_[kMaximumNumberOfExpectedRegisters];
Zheng Xuda403092015-04-24 17:35:39 +0800135
136 private:
Andreas Gampe85b62f22015-09-09 13:15:38 -0700137 Label entry_label_;
138 Label exit_label_;
139
Nicolas Geoffraye5038322014-07-04 09:41:32 +0100140 DISALLOW_COPY_AND_ASSIGN(SlowPathCode);
141};
142
Roland Levillain2d27c8e2015-04-28 15:48:45 +0100143class InvokeDexCallingConventionVisitor {
144 public:
145 virtual Location GetNextLocation(Primitive::Type type) = 0;
Nicolas Geoffrayfd88f162015-06-03 11:23:52 +0100146 virtual Location GetReturnLocation(Primitive::Type type) const = 0;
147 virtual Location GetMethodLocation() const = 0;
Roland Levillain2d27c8e2015-04-28 15:48:45 +0100148
149 protected:
150 InvokeDexCallingConventionVisitor() {}
151 virtual ~InvokeDexCallingConventionVisitor() {}
152
153 // The current index for core registers.
154 uint32_t gp_index_ = 0u;
155 // The current index for floating-point registers.
156 uint32_t float_index_ = 0u;
157 // The current stack index.
158 uint32_t stack_index_ = 0u;
159
160 private:
161 DISALLOW_COPY_AND_ASSIGN(InvokeDexCallingConventionVisitor);
162};
163
Calin Juravlee460d1d2015-09-29 04:52:17 +0100164class FieldAccessCallingConvention {
165 public:
166 virtual Location GetObjectLocation() const = 0;
167 virtual Location GetFieldIndexLocation() const = 0;
168 virtual Location GetReturnLocation(Primitive::Type type) const = 0;
169 virtual Location GetSetValueLocation(Primitive::Type type, bool is_instance) const = 0;
170 virtual Location GetFpuLocation(Primitive::Type type) const = 0;
171 virtual ~FieldAccessCallingConvention() {}
172
173 protected:
174 FieldAccessCallingConvention() {}
175
176 private:
177 DISALLOW_COPY_AND_ASSIGN(FieldAccessCallingConvention);
178};
179
Vladimir Markod58b8372016-04-12 18:51:43 +0100180class CodeGenerator : public DeletableArenaObject<kArenaAllocCodeGenerator> {
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000181 public:
David Brazdil58282f42016-01-14 12:45:10 +0000182 // Compiles the graph to executable instructions.
183 void Compile(CodeAllocator* allocator);
Vladimir Markod58b8372016-04-12 18:51:43 +0100184 static std::unique_ptr<CodeGenerator> Create(HGraph* graph,
185 InstructionSet instruction_set,
186 const InstructionSetFeatures& isa_features,
187 const CompilerOptions& compiler_options,
188 OptimizingCompilerStats* stats = nullptr);
Nicolas Geoffray12df9eb2015-01-09 14:53:50 +0000189 virtual ~CodeGenerator() {}
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000190
Vladimir Markodc151b22015-10-15 18:02:30 +0100191 // Get the graph. This is the outermost graph, never the graph of a method being inlined.
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000192 HGraph* GetGraph() const { return graph_; }
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000193
Nicolas Geoffraydc23d832015-02-16 11:15:43 +0000194 HBasicBlock* GetNextBlockToEmit() const;
195 HBasicBlock* FirstNonEmptyBlock(HBasicBlock* block) const;
Nicolas Geoffraybab4ed72014-03-11 17:53:17 +0000196 bool GoesToNextBlock(HBasicBlock* current, HBasicBlock* next) const;
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000197
Nicolas Geoffray86dbb9a2014-06-04 11:12:39 +0100198 size_t GetStackSlotOfParameter(HParameterValue* parameter) const {
199 // Note that this follows the current calling convention.
200 return GetFrameSize()
Andreas Gampe542451c2016-07-26 09:02:02 -0700201 + static_cast<size_t>(InstructionSetPointerSize(GetInstructionSet())) // Art method
Nicolas Geoffraye27f31a2014-06-12 17:53:14 +0100202 + parameter->GetIndex() * kVRegSize;
Nicolas Geoffray86dbb9a2014-06-04 11:12:39 +0100203 }
204
Nicolas Geoffray92a73ae2014-10-16 11:12:52 +0100205 virtual void Initialize() = 0;
Serban Constantinescu32f5b4d2014-11-25 20:05:46 +0000206 virtual void Finalize(CodeAllocator* allocator);
Vladimir Marko58155012015-08-19 12:49:41 +0000207 virtual void EmitLinkerPatches(ArenaVector<LinkerPatch>* linker_patches);
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000208 virtual void GenerateFrameEntry() = 0;
209 virtual void GenerateFrameExit() = 0;
Nicolas Geoffray92a73ae2014-10-16 11:12:52 +0100210 virtual void Bind(HBasicBlock* block) = 0;
Calin Juravle175dc732015-08-25 15:42:32 +0100211 virtual void MoveConstant(Location destination, int32_t value) = 0;
Calin Juravlee460d1d2015-09-29 04:52:17 +0100212 virtual void MoveLocation(Location dst, Location src, Primitive::Type dst_type) = 0;
213 virtual void AddLocationAsTemp(Location location, LocationSummary* locations) = 0;
214
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000215 virtual Assembler* GetAssembler() = 0;
Alexandre Rameseb7b7392015-06-19 14:47:01 +0100216 virtual const Assembler& GetAssembler() const = 0;
Nicolas Geoffray707c8092014-04-04 10:50:14 +0100217 virtual size_t GetWordSize() const = 0;
Mark Mendellf85a9ca2015-01-13 09:20:58 -0500218 virtual size_t GetFloatingPointSpillSlotSize() const = 0;
Alexandre Ramesc01a6642016-04-15 11:54:06 +0100219 virtual uintptr_t GetAddressOf(HBasicBlock* block) = 0;
Nicolas Geoffray4c204ba2015-02-03 15:12:35 +0000220 void InitializeCodeGeneration(size_t number_of_spill_slots,
Vladimir Marko70e97462016-08-09 11:04:26 +0100221 size_t maximum_safepoint_spill_size,
Nicolas Geoffray4c204ba2015-02-03 15:12:35 +0000222 size_t number_of_out_slots,
Vladimir Markofa6b93c2015-09-15 10:15:55 +0100223 const ArenaVector<HBasicBlock*>& block_order);
Alexandre Rames68bd9b92016-07-15 17:41:13 +0100224 // Backends can override this as necessary. For most, no special alignment is required.
225 virtual uint32_t GetPreferredSlotsAlignment() const { return 1; }
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000226
227 uint32_t GetFrameSize() const { return frame_size_; }
228 void SetFrameSize(uint32_t size) { frame_size_ = size; }
Nicolas Geoffray8ccc3f52014-03-19 10:34:11 +0000229 uint32_t GetCoreSpillMask() const { return core_spill_mask_; }
Nicolas Geoffrayd97dc402015-01-22 13:50:01 +0000230 uint32_t GetFpuSpillMask() const { return fpu_spill_mask_; }
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000231
Nicolas Geoffray71175b72014-10-09 22:13:55 +0100232 size_t GetNumberOfCoreRegisters() const { return number_of_core_registers_; }
233 size_t GetNumberOfFloatingPointRegisters() const { return number_of_fpu_registers_; }
David Brazdil58282f42016-01-14 12:45:10 +0000234 virtual void SetupBlockedRegisters() const = 0;
Nicolas Geoffray71175b72014-10-09 22:13:55 +0100235
Nicolas Geoffray4dee6362015-01-23 18:23:14 +0000236 virtual void ComputeSpillMask() {
237 core_spill_mask_ = allocated_registers_.GetCoreRegisters() & core_callee_save_mask_;
238 DCHECK_NE(core_spill_mask_, 0u) << "At least the return address register must be saved";
239 fpu_spill_mask_ = allocated_registers_.GetFloatingPointRegisters() & fpu_callee_save_mask_;
240 }
241
// Builds a bit mask with bit `registers[i]` set for each of the first `length`
// entries of `registers`. Returns 0 when `length` is 0 (`registers` is not
// dereferenced in that case). Duplicate entries are harmless.
// Each register number must be in [0, 31]; shifting by any other amount is
// undefined behavior.
static uint32_t ComputeRegisterMask(const int* registers, size_t length) {
  uint32_t mask = 0u;
  for (size_t i = 0; i < length; ++i) {
    // Shift an unsigned one: `1 << 31` would shift into the sign bit of a
    // signed int before being converted back to the unsigned mask.
    mask |= (1u << registers[i]);
  }
  return mask;
}
249
Nicolas Geoffraya7062e02014-05-22 12:50:17 +0100250 virtual void DumpCoreRegister(std::ostream& stream, int reg) const = 0;
251 virtual void DumpFloatingPointRegister(std::ostream& stream, int reg) const = 0;
Nicolas Geoffray412f10c2014-06-19 10:00:34 +0100252 virtual InstructionSet GetInstructionSet() const = 0;
Calin Juravlecd6dffe2015-01-08 17:35:35 +0000253
254 const CompilerOptions& GetCompilerOptions() const { return compiler_options_; }
255
Serban Constantinescuecc43662015-08-13 13:33:12 +0100256 void MaybeRecordStat(MethodCompilationStat compilation_stat, size_t count = 1) const;
257
Nicolas Geoffray102cbed2014-10-15 18:31:05 +0100258 // Saves the register in the stack. Returns the size taken on stack.
259 virtual size_t SaveCoreRegister(size_t stack_index, uint32_t reg_id) = 0;
260 // Restores the register from the stack. Returns the size taken on stack.
261 virtual size_t RestoreCoreRegister(size_t stack_index, uint32_t reg_id) = 0;
Nicolas Geoffray234d69d2015-03-09 10:28:50 +0000262
263 virtual size_t SaveFloatingPointRegister(size_t stack_index, uint32_t reg_id) = 0;
264 virtual size_t RestoreFloatingPointRegister(size_t stack_index, uint32_t reg_id) = 0;
265
Nicolas Geoffray840e5462015-01-07 16:01:24 +0000266 virtual bool NeedsTwoRegisters(Primitive::Type type) const = 0;
Nicolas Geoffray234d69d2015-03-09 10:28:50 +0000267 // Returns whether we should split long moves in parallel moves.
268 virtual bool ShouldSplitLongMoves() const { return false; }
Nicolas Geoffraya7062e02014-05-22 12:50:17 +0100269
Roland Levillain0d5a2812015-11-13 10:07:31 +0000270 size_t GetNumberOfCoreCalleeSaveRegisters() const {
271 return POPCOUNT(core_callee_save_mask_);
272 }
273
274 size_t GetNumberOfCoreCallerSaveRegisters() const {
275 DCHECK_GE(GetNumberOfCoreRegisters(), GetNumberOfCoreCalleeSaveRegisters());
276 return GetNumberOfCoreRegisters() - GetNumberOfCoreCalleeSaveRegisters();
277 }
278
Nicolas Geoffray98893962015-01-21 12:32:32 +0000279 bool IsCoreCalleeSaveRegister(int reg) const {
280 return (core_callee_save_mask_ & (1 << reg)) != 0;
281 }
282
283 bool IsFloatingPointCalleeSaveRegister(int reg) const {
284 return (fpu_callee_save_mask_ & (1 << reg)) != 0;
285 }
286
Vladimir Marko70e97462016-08-09 11:04:26 +0100287 uint32_t GetSlowPathSpills(LocationSummary* locations, bool core_registers) const {
288 DCHECK(locations->OnlyCallsOnSlowPath() ||
289 (locations->Intrinsified() && locations->CallsOnMainAndSlowPath() &&
290 !locations->HasCustomSlowPathCallingConvention()));
291 uint32_t live_registers = core_registers
292 ? locations->GetLiveRegisters()->GetCoreRegisters()
293 : locations->GetLiveRegisters()->GetFloatingPointRegisters();
294 if (locations->HasCustomSlowPathCallingConvention()) {
295 // Save only the live registers that the custom calling convention wants us to save.
296 uint32_t caller_saves = core_registers
297 ? locations->GetCustomSlowPathCallerSaves().GetCoreRegisters()
298 : locations->GetCustomSlowPathCallerSaves().GetFloatingPointRegisters();
299 return live_registers & caller_saves;
300 } else {
301 // Default ABI, we need to spill non-callee-save live registers.
302 uint32_t callee_saves = core_registers ? core_callee_save_mask_ : fpu_callee_save_mask_;
303 return live_registers & ~callee_saves;
304 }
305 }
306
307 size_t GetNumberOfSlowPathSpills(LocationSummary* locations, bool core_registers) const {
308 return POPCOUNT(GetSlowPathSpills(locations, core_registers));
309 }
310
Mingyao Yang063fc772016-08-02 11:02:54 -0700311 size_t GetStackOffsetOfShouldDeoptimizeFlag() const {
312 DCHECK(GetGraph()->HasShouldDeoptimizeFlag());
313 DCHECK_GE(GetFrameSize(), FrameEntrySpillSize() + kShouldDeoptimizeFlagSize);
314 return GetFrameSize() - FrameEntrySpillSize() - kShouldDeoptimizeFlagSize;
315 }
316
Yevgeny Rouban2a7c1ef2015-07-22 18:36:24 +0600317 // Record native to dex mapping for a suspend point. Required by runtime.
Nicolas Geoffrayeeefa122015-03-13 18:52:59 +0000318 void RecordPcInfo(HInstruction* instruction, uint32_t dex_pc, SlowPathCode* slow_path = nullptr);
David Srbeckyb7070a22016-01-08 18:13:53 +0000319 // Check whether we have already recorded mapping at this PC.
320 bool HasStackMapAtCurrentPc();
David Srbeckyc7098ff2016-02-09 14:30:11 +0000321 // Record extra stack maps if we support native debugging.
David Srbeckyd28f4a02016-03-14 17:14:24 +0000322 void MaybeRecordNativeDebugInfo(HInstruction* instruction,
323 uint32_t dex_pc,
324 SlowPathCode* slow_path = nullptr);
Yevgeny Rouban2a7c1ef2015-07-22 18:36:24 +0600325
Calin Juravle77520bc2015-01-12 18:45:46 +0000326 bool CanMoveNullCheckToUser(HNullCheck* null_check);
327 void MaybeRecordImplicitNullCheck(HInstruction* instruction);
Vladimir Marko804b03f2016-09-14 16:26:36 +0100328 LocationSummary* CreateThrowingSlowPathLocations(
329 HInstruction* instruction, RegisterSet caller_saves = RegisterSet::Empty());
Calin Juravle2ae48182016-03-16 14:05:09 +0000330 void GenerateNullCheck(HNullCheck* null_check);
331 virtual void GenerateImplicitNullCheck(HNullCheck* null_check) = 0;
332 virtual void GenerateExplicitNullCheck(HNullCheck* null_check) = 0;
Nicolas Geoffray8ccc3f52014-03-19 10:34:11 +0000333
David Brazdil77a48ae2015-09-15 12:34:04 +0000334 // Records a stack map which the runtime might use to set catch phi values
335 // during exception delivery.
336 // TODO: Replace with a catch-entering instruction that records the environment.
337 void RecordCatchBlockInfo();
338
Alexandre Ramesc01a6642016-04-15 11:54:06 +0100339 // TODO: Avoid creating the `std::unique_ptr` here.
Nicolas Geoffraye5038322014-07-04 09:41:32 +0100340 void AddSlowPath(SlowPathCode* slow_path) {
Alexandre Ramesc01a6642016-04-15 11:54:06 +0100341 slow_paths_.push_back(std::unique_ptr<SlowPathCode>(slow_path));
Nicolas Geoffraye5038322014-07-04 09:41:32 +0100342 }
343
Mathieu Chartiercbcedbf2017-03-12 22:24:50 -0700344 void BuildStackMaps(MemoryRegion stack_map_region,
345 MemoryRegion method_info_region,
346 const DexFile::CodeItem& code_item);
347 void ComputeStackMapAndMethodInfoSize(size_t* stack_map_size, size_t* method_info_size);
Nicolas Geoffray132d8362016-11-16 09:19:42 +0000348 size_t GetNumberOfJitRoots() const {
Nicolas Geoffray22384ae2016-12-12 22:33:36 +0000349 return jit_string_roots_.size() + jit_class_roots_.size();
Nicolas Geoffray132d8362016-11-16 09:19:42 +0000350 }
351
352 // Fills the `literals` array with literals collected during code generation.
353 // Also emits literal patches.
354 void EmitJitRoots(uint8_t* code,
355 Handle<mirror::ObjectArray<mirror::Object>> roots,
Nicolas Geoffrayf0acfe72017-01-09 20:54:52 +0000356 const uint8_t* roots_data)
Nicolas Geoffray132d8362016-11-16 09:19:42 +0000357 REQUIRES_SHARED(Locks::mutator_lock_);
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000358
Nicolas Geoffrayf12feb82014-07-17 18:32:41 +0100359 bool IsLeafMethod() const {
360 return is_leaf_;
361 }
362
363 void MarkNotLeaf() {
364 is_leaf_ = false;
Nicolas Geoffrayc0572a42015-02-06 14:35:25 +0000365 requires_current_method_ = true;
366 }
367
368 void SetRequiresCurrentMethod() {
369 requires_current_method_ = true;
370 }
371
372 bool RequiresCurrentMethod() const {
373 return requires_current_method_;
Nicolas Geoffrayf12feb82014-07-17 18:32:41 +0100374 }
375
Nicolas Geoffray3c049742014-09-24 18:10:46 +0100376 // Clears the spill slots taken by loop phis in the `LocationSummary` of the
377 // suspend check. This is called when the code generator generates code
378 // for the suspend check at the back edge (instead of where the suspend check
379 // is, which is the loop entry). At this point, the spill slots for the phis
380 // have not been written to.
381 void ClearSpillSlotsFromLoopPhisInStackMap(HSuspendCheck* suspend_check) const;
382
Nicolas Geoffray71175b72014-10-09 22:13:55 +0100383 bool* GetBlockedCoreRegisters() const { return blocked_core_registers_; }
Nicolas Geoffray102cbed2014-10-15 18:31:05 +0100384 bool* GetBlockedFloatingPointRegisters() const { return blocked_fpu_registers_; }
Nicolas Geoffray71175b72014-10-09 22:13:55 +0100385
Matthew Gharrityd9ffd0d2016-06-22 10:27:55 -0700386 bool IsBlockedCoreRegister(size_t i) { return blocked_core_registers_[i]; }
387 bool IsBlockedFloatingPointRegister(size_t i) { return blocked_fpu_registers_[i]; }
388
Nicolas Geoffray19a19cf2014-10-22 16:07:05 +0100389 // Helper that returns the pointer offset of an index in an object array.
390 // Note: this method assumes we always have the same pointer size, regardless
391 // of the architecture.
392 static size_t GetCacheOffset(uint32_t index);
Mathieu Chartiere401d142015-04-22 13:56:20 -0700393 // Pointer variant for ArtMethod and ArtField arrays.
394 size_t GetCachePointerOffset(uint32_t index);
Nicolas Geoffray19a19cf2014-10-22 16:07:05 +0100395
Vladimir Markodce016e2016-04-28 13:10:02 +0100396 // Helper that returns the offset of the array's length field.
397 // Note: Besides the normal arrays, we also use the HArrayLength for
398 // accessing the String's `count` field in String intrinsics.
399 static uint32_t GetArrayLengthOffset(HArrayLength* array_length);
400
Vladimir Marko87f3fcb2016-04-28 15:52:11 +0100401 // Helper that returns the offset of the array's data.
402 // Note: Besides the normal arrays, we also use the HArrayGet for
403 // accessing the String's `value` field in String intrinsics.
404 static uint32_t GetArrayDataOffset(HArrayGet* array_get);
405
Roland Levillain02b75802016-07-13 11:54:35 +0100406 // Return the entry point offset for ReadBarrierMarkRegX, where X is `reg`.
Andreas Gampe542451c2016-07-26 09:02:02 -0700407 template <PointerSize pointer_size>
Roland Levillain02b75802016-07-13 11:54:35 +0100408 static int32_t GetReadBarrierMarkEntryPointsOffset(size_t reg) {
Roland Levillaind549c282016-07-25 12:49:15 +0100409 // The entry point list defines 30 ReadBarrierMarkRegX entry points.
410 DCHECK_LT(reg, 30u);
Roland Levillain02b75802016-07-13 11:54:35 +0100411 // The ReadBarrierMarkRegX entry points are ordered by increasing
412 // register number in Thread::tls_Ptr_.quick_entrypoints.
413 return QUICK_ENTRYPOINT_OFFSET(pointer_size, pReadBarrierMarkReg00).Int32Value()
Andreas Gampe542451c2016-07-26 09:02:02 -0700414 + static_cast<size_t>(pointer_size) * reg;
Roland Levillain02b75802016-07-13 11:54:35 +0100415 }
416
Nicolas Geoffray90218252015-04-15 11:56:51 +0100417 void EmitParallelMoves(Location from1,
418 Location to1,
419 Primitive::Type type1,
420 Location from2,
421 Location to2,
422 Primitive::Type type2);
Nicolas Geoffrayf0e39372014-11-12 17:50:07 +0000423
Nicolas Geoffrayaf07bc12014-11-12 18:08:09 +0000424 static bool StoreNeedsWriteBarrier(Primitive::Type type, HInstruction* value) {
David Brazdil522e2242015-03-17 18:48:28 +0000425 // Check that null value is not represented as an integer constant.
426 DCHECK(type != Primitive::kPrimNot || !value->IsIntConstant());
427 return type == Primitive::kPrimNot && !value->IsNullConstant();
Nicolas Geoffrayaf07bc12014-11-12 18:08:09 +0000428 }
429
Roland Levillaindec8f632016-07-22 17:10:06 +0100430
Orion Hodsonac141392017-01-13 11:53:47 +0000431 // Performs checks pertaining to an InvokeRuntime call.
Alexandre Rames91a65162016-09-19 13:54:30 +0100432 void ValidateInvokeRuntime(QuickEntrypointEnum entrypoint,
433 HInstruction* instruction,
434 SlowPathCode* slow_path);
Alexandre Rames78e3ef62015-08-12 13:43:29 +0100435
Orion Hodsonac141392017-01-13 11:53:47 +0000436 // Performs checks pertaining to an InvokeRuntimeWithoutRecordingPcInfo call.
Roland Levillaindec8f632016-07-22 17:10:06 +0100437 static void ValidateInvokeRuntimeWithoutRecordingPcInfo(HInstruction* instruction,
438 SlowPathCode* slow_path);
439
Nicolas Geoffray98893962015-01-21 12:32:32 +0000440 void AddAllocatedRegister(Location location) {
441 allocated_registers_.Add(location);
442 }
443
Nicolas Geoffray45b83af2015-07-06 15:12:53 +0000444 bool HasAllocatedRegister(bool is_core, int reg) const {
445 return is_core
446 ? allocated_registers_.ContainsCoreRegister(reg)
447 : allocated_registers_.ContainsFloatingPointRegister(reg);
448 }
449
Nicolas Geoffrayc0572a42015-02-06 14:35:25 +0000450 void AllocateLocations(HInstruction* instruction);
451
Roland Levillainaa9b7c42015-02-17 15:40:09 +0000452 // Tells whether the stack frame of the compiled method is
453 // considered "empty", that is either actually having a size of zero,
454 // or just containing the saved return address register.
455 bool HasEmptyFrame() const {
456 return GetFrameSize() == (CallPushesPC() ? GetWordSize() : 0);
457 }
458
Nicolas Geoffrayd6138ef2015-02-18 14:48:53 +0000459 static int32_t GetInt32ValueOf(HConstant* constant) {
460 if (constant->IsIntConstant()) {
461 return constant->AsIntConstant()->GetValue();
462 } else if (constant->IsNullConstant()) {
463 return 0;
464 } else {
465 DCHECK(constant->IsFloatConstant());
Roland Levillainda4d79b2015-03-24 14:36:11 +0000466 return bit_cast<int32_t, float>(constant->AsFloatConstant()->GetValue());
Nicolas Geoffrayd6138ef2015-02-18 14:48:53 +0000467 }
468 }
469
470 static int64_t GetInt64ValueOf(HConstant* constant) {
471 if (constant->IsIntConstant()) {
472 return constant->AsIntConstant()->GetValue();
473 } else if (constant->IsNullConstant()) {
474 return 0;
475 } else if (constant->IsFloatConstant()) {
Roland Levillainda4d79b2015-03-24 14:36:11 +0000476 return bit_cast<int32_t, float>(constant->AsFloatConstant()->GetValue());
Nicolas Geoffrayd6138ef2015-02-18 14:48:53 +0000477 } else if (constant->IsLongConstant()) {
478 return constant->AsLongConstant()->GetValue();
479 } else {
480 DCHECK(constant->IsDoubleConstant());
Roland Levillainda4d79b2015-03-24 14:36:11 +0000481 return bit_cast<int64_t, double>(constant->AsDoubleConstant()->GetValue());
Nicolas Geoffrayd6138ef2015-02-18 14:48:53 +0000482 }
483 }
484
Nicolas Geoffraya8ac9132015-03-13 16:36:36 +0000485 size_t GetFirstRegisterSlotInSlowPath() const {
486 return first_register_slot_in_slow_path_;
487 }
488
489 uint32_t FrameEntrySpillSize() const {
490 return GetFpuSpillSize() + GetCoreSpillSize();
491 }
492
Roland Levillainec525fc2015-04-28 15:50:20 +0100493 virtual ParallelMoveResolver* GetMoveResolver() = 0;
Nicolas Geoffraya8ac9132015-03-13 16:36:36 +0000494
Nicolas Geoffrayfd88f162015-06-03 11:23:52 +0100495 static void CreateCommonInvokeLocationSummary(
496 HInvoke* invoke, InvokeDexCallingConventionVisitor* visitor);
497
Vladimir Markoe7197bf2017-06-02 17:00:23 +0100498 void GenerateInvokeStaticOrDirectRuntimeCall(
499 HInvokeStaticOrDirect* invoke, Location temp, SlowPathCode* slow_path);
Calin Juravle175dc732015-08-25 15:42:32 +0100500 void GenerateInvokeUnresolvedRuntimeCall(HInvokeUnresolved* invoke);
501
Orion Hodsonac141392017-01-13 11:53:47 +0000502 void GenerateInvokePolymorphicCall(HInvokePolymorphic* invoke);
503
Calin Juravlee460d1d2015-09-29 04:52:17 +0100504 void CreateUnresolvedFieldLocationSummary(
505 HInstruction* field_access,
506 Primitive::Type field_type,
507 const FieldAccessCallingConvention& calling_convention);
508
509 void GenerateUnresolvedFieldAccess(
510 HInstruction* field_access,
511 Primitive::Type field_type,
512 uint32_t field_index,
513 uint32_t dex_pc,
514 const FieldAccessCallingConvention& calling_convention);
515
Vladimir Marko41559982017-01-06 14:04:23 +0000516 static void CreateLoadClassRuntimeCallLocationSummary(HLoadClass* cls,
517 Location runtime_type_index_location,
518 Location runtime_return_location);
519 void GenerateLoadClassRuntimeCall(HLoadClass* cls);
Calin Juravle98893e12015-10-02 21:05:03 +0100520
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +0100521 static void CreateSystemArrayCopyLocationSummary(HInvoke* invoke);
522
Alexandre Rameseb7b7392015-06-19 14:47:01 +0100523 void SetDisassemblyInformation(DisassemblyInformation* info) { disasm_info_ = info; }
524 DisassemblyInformation* GetDisassemblyInformation() const { return disasm_info_; }
525
Calin Juravle175dc732015-08-25 15:42:32 +0100526 virtual void InvokeRuntime(QuickEntrypointEnum entrypoint,
527 HInstruction* instruction,
528 uint32_t dex_pc,
Vladimir Marko41559982017-01-06 14:04:23 +0000529 SlowPathCode* slow_path = nullptr) = 0;
Calin Juravle175dc732015-08-25 15:42:32 +0100530
Vladimir Markocac5a7e2016-02-22 10:39:50 +0000531 // Check if the desired_string_load_kind is supported. If it is, return it,
Vladimir Markodbb7f5b2016-03-30 13:23:58 +0100532 // otherwise return a fall-back kind that should be used instead.
Vladimir Markocac5a7e2016-02-22 10:39:50 +0000533 virtual HLoadString::LoadKind GetSupportedLoadStringKind(
534 HLoadString::LoadKind desired_string_load_kind) = 0;
535
Vladimir Markodbb7f5b2016-03-30 13:23:58 +0100536 // Check if the desired_class_load_kind is supported. If it is, return it,
537 // otherwise return a fall-back kind that should be used instead.
538 virtual HLoadClass::LoadKind GetSupportedLoadClassKind(
539 HLoadClass::LoadKind desired_class_load_kind) = 0;
540
Nicolas Geoffray132d8362016-11-16 09:19:42 +0000541 static LocationSummary::CallKind GetLoadStringCallKind(HLoadString* load) {
542 switch (load->GetLoadKind()) {
543 case HLoadString::LoadKind::kBssEntry:
544 DCHECK(load->NeedsEnvironment());
545 return LocationSummary::kCallOnSlowPath;
546 case HLoadString::LoadKind::kDexCacheViaMethod:
547 DCHECK(load->NeedsEnvironment());
548 return LocationSummary::kCallOnMainOnly;
549 case HLoadString::LoadKind::kJitTableAddress:
550 DCHECK(!load->NeedsEnvironment());
551 return kEmitCompilerReadBarrier
552 ? LocationSummary::kCallOnSlowPath
553 : LocationSummary::kNoCall;
554 break;
555 default:
556 DCHECK(!load->NeedsEnvironment());
557 return LocationSummary::kNoCall;
558 }
559 }
560
Vladimir Markodc151b22015-10-15 18:02:30 +0100561 // Check if the desired_dispatch_info is supported. If it is, return it,
562 // otherwise return a fall-back info that should be used instead.
563 virtual HInvokeStaticOrDirect::DispatchInfo GetSupportedInvokeStaticOrDirectDispatch(
564 const HInvokeStaticOrDirect::DispatchInfo& desired_dispatch_info,
Nicolas Geoffray5e4e11e2016-09-22 13:17:41 +0100565 HInvokeStaticOrDirect* invoke) = 0;
Vladimir Markodc151b22015-10-15 18:02:30 +0100566
Andreas Gampe85b62f22015-09-09 13:15:38 -0700567 // Generate a call to a static or direct method.
Vladimir Markoe7197bf2017-06-02 17:00:23 +0100568 virtual void GenerateStaticOrDirectCall(
569 HInvokeStaticOrDirect* invoke, Location temp, SlowPathCode* slow_path = nullptr) = 0;
Andreas Gampe85b62f22015-09-09 13:15:38 -0700570 // Generate a call to a virtual method.
Vladimir Markoe7197bf2017-06-02 17:00:23 +0100571 virtual void GenerateVirtualCall(
572 HInvokeVirtual* invoke, Location temp, SlowPathCode* slow_path = nullptr) = 0;
Andreas Gampe85b62f22015-09-09 13:15:38 -0700573
574 // Copy the result of a call into the given target.
575 virtual void MoveFromReturnRegister(Location trg, Primitive::Type type) = 0;
576
David Srbeckyc7098ff2016-02-09 14:30:11 +0000577 virtual void GenerateNop() = 0;
578
Nicolas Geoffrayb048cb72017-01-23 22:50:24 +0000579 static QuickEntrypointEnum GetArrayAllocationEntrypoint(Handle<mirror::Class> array_klass);
580
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000581 protected:
Vladimir Markoaad75c62016-10-03 08:46:48 +0000582 // Patch info used for recording locations of required linker patches and their targets,
583 // i.e. target method, string, type or code identified by their dex file and index.
Vladimir Marko58155012015-08-19 12:49:41 +0000584 template <typename LabelType>
Vladimir Markoaad75c62016-10-03 08:46:48 +0000585 struct PatchInfo {
586 PatchInfo(const DexFile& target_dex_file, uint32_t target_index)
587 : dex_file(target_dex_file), index(target_index) { }
Vladimir Markocac5a7e2016-02-22 10:39:50 +0000588
589 const DexFile& dex_file;
Vladimir Markoaad75c62016-10-03 08:46:48 +0000590 uint32_t index;
Vladimir Markodbb7f5b2016-03-30 13:23:58 +0100591 LabelType label;
592 };
593
// Constructs the architecture-independent part of a code generator for `graph`.
//
// The register counts and callee-save masks are stored as given. Frame size,
// spill masks and the current block index start at zero, and the allocated
// register set starts empty. The blocked-register arrays and all arena-backed
// containers are allocated from the graph's arena. `compiler_options` is held
// by reference and `stats` by pointer; neither is copied.
CodeGenerator(HGraph* graph,
              size_t number_of_core_registers,
              size_t number_of_fpu_registers,
              size_t number_of_register_pairs,
              uint32_t core_callee_save_mask,
              uint32_t fpu_callee_save_mask,
              const CompilerOptions& compiler_options,
              OptimizingCompilerStats* stats)
    : frame_size_(0),
      core_spill_mask_(0),
      fpu_spill_mask_(0),
      first_register_slot_in_slow_path_(0),
      allocated_registers_(RegisterSet::Empty()),
      // One bool per register, allocated from the graph's arena.
      blocked_core_registers_(graph->GetArena()->AllocArray<bool>(number_of_core_registers,
                                                                  kArenaAllocCodeGenerator)),
      blocked_fpu_registers_(graph->GetArena()->AllocArray<bool>(number_of_fpu_registers,
                                                                 kArenaAllocCodeGenerator)),
      number_of_core_registers_(number_of_core_registers),
      number_of_fpu_registers_(number_of_fpu_registers),
      number_of_register_pairs_(number_of_register_pairs),
      core_callee_save_mask_(core_callee_save_mask),
      fpu_callee_save_mask_(fpu_callee_save_mask),
      stack_map_stream_(graph->GetArena(), graph->GetInstructionSet()),
      // No block order is known at construction time.
      block_order_(nullptr),
      jit_string_roots_(StringReferenceValueComparator(),
                        graph->GetArena()->Adapter(kArenaAllocCodeGenerator)),
      jit_class_roots_(TypeReferenceValueComparator(),
                       graph->GetArena()->Adapter(kArenaAllocCodeGenerator)),
      disasm_info_(nullptr),
      stats_(stats),
      graph_(graph),
      compiler_options_(compiler_options),
      slow_paths_(graph->GetArena()->Adapter(kArenaAllocCodeGenerator)),
      current_slow_path_(nullptr),
      current_block_index_(0),
      // The method is treated as a leaf that does not require the current
      // method until these flags are changed.
      is_leaf_(true),
      requires_current_method_(false) {
  // Pre-size the slow path vector for a handful of entries.
  slow_paths_.reserve(8);
}
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000633
Nicolas Geoffrayc0572a42015-02-06 14:35:25 +0000634 virtual HGraphVisitor* GetLocationBuilder() = 0;
635 virtual HGraphVisitor* GetInstructionVisitor() = 0;
Nicolas Geoffrayf0e39372014-11-12 17:50:07 +0000636
Nicolas Geoffrayd97dc402015-01-22 13:50:01 +0000637 // Returns the location of the first spilled entry for floating point registers,
638 // relative to the stack pointer.
639 uint32_t GetFpuSpillStart() const {
Nicolas Geoffrayd97dc402015-01-22 13:50:01 +0000640 return GetFrameSize() - FrameEntrySpillSize();
641 }
642
643 uint32_t GetFpuSpillSize() const {
644 return POPCOUNT(fpu_spill_mask_) * GetFloatingPointSpillSlotSize();
645 }
646
647 uint32_t GetCoreSpillSize() const {
648 return POPCOUNT(core_spill_mask_) * GetWordSize();
649 }
650
Alexey Frunze58320ce2016-08-30 21:40:46 -0700651 virtual bool HasAllocatedCalleeSaveRegisters() const {
Nicolas Geoffrayc0572a42015-02-06 14:35:25 +0000652 // We check the core registers against 1 because it always comprises the return PC.
653 return (POPCOUNT(allocated_registers_.GetCoreRegisters() & core_callee_save_mask_) != 1)
654 || (POPCOUNT(allocated_registers_.GetFloatingPointRegisters() & fpu_callee_save_mask_) != 0);
655 }
656
657 bool CallPushesPC() const {
658 InstructionSet instruction_set = GetInstructionSet();
659 return instruction_set == kX86 || instruction_set == kX86_64;
660 }
661
Vladimir Marko225b6462015-09-28 12:17:40 +0100662 // Arm64 has its own type for a label, so we need to templatize these methods
Nicolas Geoffraydc23d832015-02-16 11:15:43 +0000663 // to share the logic.
Vladimir Marko225b6462015-09-28 12:17:40 +0100664
665 template <typename LabelType>
666 LabelType* CommonInitializeLabels() {
Vladimir Markob95fb772015-09-30 13:32:31 +0100667 // We use raw array allocations instead of ArenaVector<> because Labels are
668 // non-constructible and non-movable and as such cannot be held in a vector.
Vladimir Marko225b6462015-09-28 12:17:40 +0100669 size_t size = GetGraph()->GetBlocks().size();
670 LabelType* labels = GetGraph()->GetArena()->AllocArray<LabelType>(size,
671 kArenaAllocCodeGenerator);
672 for (size_t i = 0; i != size; ++i) {
673 new(labels + i) LabelType();
674 }
675 return labels;
676 }
677
Vladimir Marko58155012015-08-19 12:49:41 +0000678 template <typename LabelType>
679 LabelType* CommonGetLabelOf(LabelType* raw_pointer_to_labels_array, HBasicBlock* block) const {
Nicolas Geoffraydc23d832015-02-16 11:15:43 +0000680 block = FirstNonEmptyBlock(block);
681 return raw_pointer_to_labels_array + block->GetBlockId();
682 }
683
Vladimir Marko0f7dca42015-11-02 14:36:43 +0000684 SlowPathCode* GetCurrentSlowPath() {
685 return current_slow_path_;
686 }
687
// Emit the patches associated with JIT roots. Only applies to JIT compiled code.
// This default implementation ignores both arguments and only DCHECKs that no
// JIT string root and no JIT class root has been recorded.
// NOTE(review): code generators that do record JIT roots presumably override
// this method — confirm against the architecture-specific generators.
virtual void EmitJitRootPatches(uint8_t* code ATTRIBUTE_UNUSED,
                                const uint8_t* roots_data ATTRIBUTE_UNUSED) {
  DCHECK_EQ(jit_string_roots_.size(), 0u);
  DCHECK_EQ(jit_class_roots_.size(), 0u);
}
694
Nicolas Geoffray8ccc3f52014-03-19 10:34:11 +0000695 // Frame size required for this method.
696 uint32_t frame_size_;
697 uint32_t core_spill_mask_;
Nicolas Geoffrayd97dc402015-01-22 13:50:01 +0000698 uint32_t fpu_spill_mask_;
Nicolas Geoffray3bca0df2014-09-19 11:01:00 +0100699 uint32_t first_register_slot_in_slow_path_;
Nicolas Geoffray8ccc3f52014-03-19 10:34:11 +0000700
Nicolas Geoffray98893962015-01-21 12:32:32 +0000701 // Registers that were allocated during linear scan.
702 RegisterSet allocated_registers_;
703
Nicolas Geoffray71175b72014-10-09 22:13:55 +0100704 // Arrays used when doing register allocation to know which
705 // registers we can allocate. `SetupBlockedRegisters` updates the
706 // arrays.
707 bool* const blocked_core_registers_;
708 bool* const blocked_fpu_registers_;
Nicolas Geoffray71175b72014-10-09 22:13:55 +0100709 size_t number_of_core_registers_;
710 size_t number_of_fpu_registers_;
711 size_t number_of_register_pairs_;
Nicolas Geoffray98893962015-01-21 12:32:32 +0000712 const uint32_t core_callee_save_mask_;
713 const uint32_t fpu_callee_save_mask_;
Nicolas Geoffray71175b72014-10-09 22:13:55 +0100714
Vladimir Markocf93a5c2015-06-16 11:33:24 +0000715 StackMapStream stack_map_stream_;
716
717 // The order to use for code generation.
Vladimir Markofa6b93c2015-09-15 10:15:55 +0100718 const ArenaVector<HBasicBlock*>* block_order_;
Vladimir Markocf93a5c2015-06-16 11:33:24 +0000719
// Maps a StringReference (dex_file, string_index) to the index in the literal table.
// Entries are initially added with a pointer in the handle zone, and `EmitJitRoots`
// will compute all the indices.
723 ArenaSafeMap<StringReference, uint64_t, StringReferenceValueComparator> jit_string_roots_;
Nicolas Geoffray22384ae2016-12-12 22:33:36 +0000724
// Maps a TypeReference (dex_file, type_index) to the index in the literal table.
// Entries are initially added with a pointer in the handle zone, and `EmitJitRoots`
// will compute all the indices.
728 ArenaSafeMap<TypeReference, uint64_t, TypeReferenceValueComparator> jit_class_roots_;
Nicolas Geoffray132d8362016-11-16 09:19:42 +0000729
Alexandre Rameseb7b7392015-06-19 14:47:01 +0100730 DisassemblyInformation* disasm_info_;
731
Nicolas Geoffraybab4ed72014-03-11 17:53:17 +0000732 private:
Nicolas Geoffray3bca0df2014-09-19 11:01:00 +0100733 size_t GetStackOffsetOfSavedRegister(size_t index);
Alexandre Rameseb7b7392015-06-19 14:47:01 +0100734 void GenerateSlowPaths();
Mark Mendell5f874182015-03-04 15:42:45 -0500735 void BlockIfInRegister(Location location, bool is_out = false) const;
Nicolas Geoffrayb1d0f3f2015-05-14 12:41:51 +0100736 void EmitEnvironment(HEnvironment* environment, SlowPathCode* slow_path);
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000737
Serban Constantinescuecc43662015-08-13 13:33:12 +0100738 OptimizingCompilerStats* stats_;
739
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000740 HGraph* const graph_;
Calin Juravlecd6dffe2015-01-08 17:35:35 +0000741 const CompilerOptions& compiler_options_;
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000742
Alexandre Ramesc01a6642016-04-15 11:54:06 +0100743 ArenaVector<std::unique_ptr<SlowPathCode>> slow_paths_;
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000744
Aart Bik42249c32016-01-07 15:33:50 -0800745 // The current slow-path that we're generating code for.
Vladimir Marko0f7dca42015-11-02 14:36:43 +0000746 SlowPathCode* current_slow_path_;
747
Nicolas Geoffray4c204ba2015-02-03 15:12:35 +0000748 // The current block index in `block_order_` of the block
749 // we are generating code for.
750 size_t current_block_index_;
751
Nicolas Geoffrayc0572a42015-02-06 14:35:25 +0000752 // Whether the method is a leaf method.
Nicolas Geoffrayf12feb82014-07-17 18:32:41 +0100753 bool is_leaf_;
754
Nicolas Geoffrayc0572a42015-02-06 14:35:25 +0000755 // Whether an instruction in the graph accesses the current method.
Vladimir Marko3b7537b2016-09-13 11:56:01 +0000756 // TODO: Rename: this actually indicates that some instruction in the method
757 // needs the environment including a valid stack frame.
Nicolas Geoffrayc0572a42015-02-06 14:35:25 +0000758 bool requires_current_method_;
759
David Srbeckyc6b4dd82015-04-07 20:32:43 +0100760 friend class OptimizingCFITest;
761
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000762 DISALLOW_COPY_AND_ASSIGN(CodeGenerator);
763};
764
Nicolas Geoffray7fb49da2014-10-06 09:12:41 +0100765template <typename C, typename F>
Nicolas Geoffray4a34a422014-04-03 10:38:37 +0100766class CallingConvention {
767 public:
Nicolas Geoffray7fb49da2014-10-06 09:12:41 +0100768 CallingConvention(const C* registers,
769 size_t number_of_registers,
770 const F* fpu_registers,
Mathieu Chartiere401d142015-04-22 13:56:20 -0700771 size_t number_of_fpu_registers,
Andreas Gampe542451c2016-07-26 09:02:02 -0700772 PointerSize pointer_size)
Nicolas Geoffray7fb49da2014-10-06 09:12:41 +0100773 : registers_(registers),
774 number_of_registers_(number_of_registers),
775 fpu_registers_(fpu_registers),
Mathieu Chartiere401d142015-04-22 13:56:20 -0700776 number_of_fpu_registers_(number_of_fpu_registers),
777 pointer_size_(pointer_size) {}
Nicolas Geoffray4a34a422014-04-03 10:38:37 +0100778
779 size_t GetNumberOfRegisters() const { return number_of_registers_; }
Nicolas Geoffray7fb49da2014-10-06 09:12:41 +0100780 size_t GetNumberOfFpuRegisters() const { return number_of_fpu_registers_; }
Nicolas Geoffray4a34a422014-04-03 10:38:37 +0100781
Nicolas Geoffray7fb49da2014-10-06 09:12:41 +0100782 C GetRegisterAt(size_t index) const {
Nicolas Geoffray4a34a422014-04-03 10:38:37 +0100783 DCHECK_LT(index, number_of_registers_);
784 return registers_[index];
785 }
786
Nicolas Geoffray7fb49da2014-10-06 09:12:41 +0100787 F GetFpuRegisterAt(size_t index) const {
788 DCHECK_LT(index, number_of_fpu_registers_);
789 return fpu_registers_[index];
790 }
791
792 size_t GetStackOffsetOf(size_t index) const {
Nicolas Geoffray4a34a422014-04-03 10:38:37 +0100793 // We still reserve the space for parameters passed by registers.
Mathieu Chartiere401d142015-04-22 13:56:20 -0700794 // Add space for the method pointer.
Andreas Gampe542451c2016-07-26 09:02:02 -0700795 return static_cast<size_t>(pointer_size_) + index * kVRegSize;
Nicolas Geoffray4a34a422014-04-03 10:38:37 +0100796 }
797
798 private:
Nicolas Geoffray7fb49da2014-10-06 09:12:41 +0100799 const C* registers_;
Nicolas Geoffray4a34a422014-04-03 10:38:37 +0100800 const size_t number_of_registers_;
Nicolas Geoffray7fb49da2014-10-06 09:12:41 +0100801 const F* fpu_registers_;
802 const size_t number_of_fpu_registers_;
Andreas Gampe542451c2016-07-26 09:02:02 -0700803 const PointerSize pointer_size_;
Nicolas Geoffray4a34a422014-04-03 10:38:37 +0100804
805 DISALLOW_COPY_AND_ASSIGN(CallingConvention);
806};
807
Aart Bik42249c32016-01-07 15:33:50 -0800808/**
809 * A templated class SlowPathGenerator with a templated method NewSlowPath()
810 * that can be used by any code generator to share equivalent slow-paths with
811 * the objective of reducing generated code size.
812 *
813 * InstructionType: instruction that requires SlowPathCodeType
814 * SlowPathCodeType: subclass of SlowPathCode, with constructor SlowPathCodeType(InstructionType *)
815 */
816template <typename InstructionType>
817class SlowPathGenerator {
818 static_assert(std::is_base_of<HInstruction, InstructionType>::value,
819 "InstructionType is not a subclass of art::HInstruction");
820
821 public:
822 SlowPathGenerator(HGraph* graph, CodeGenerator* codegen)
823 : graph_(graph),
824 codegen_(codegen),
825 slow_path_map_(std::less<uint32_t>(), graph->GetArena()->Adapter(kArenaAllocSlowPaths)) {}
826
827 // Creates and adds a new slow-path, if needed, or returns existing one otherwise.
828 // Templating the method (rather than the whole class) on the slow-path type enables
829 // keeping this code at a generic, non architecture-specific place.
830 //
831 // NOTE: This approach assumes each InstructionType only generates one SlowPathCodeType.
832 // To relax this requirement, we would need some RTTI on the stored slow-paths,
833 // or template the class as a whole on SlowPathType.
834 template <typename SlowPathCodeType>
835 SlowPathCodeType* NewSlowPath(InstructionType* instruction) {
836 static_assert(std::is_base_of<SlowPathCode, SlowPathCodeType>::value,
837 "SlowPathCodeType is not a subclass of art::SlowPathCode");
838 static_assert(std::is_constructible<SlowPathCodeType, InstructionType*>::value,
839 "SlowPathCodeType is not constructible from InstructionType*");
840 // Iterate over potential candidates for sharing. Currently, only same-typed
841 // slow-paths with exactly the same dex-pc are viable candidates.
842 // TODO: pass dex-pc/slow-path-type to run-time to allow even more sharing?
843 const uint32_t dex_pc = instruction->GetDexPc();
844 auto iter = slow_path_map_.find(dex_pc);
845 if (iter != slow_path_map_.end()) {
Vladimir Marko7d157fc2017-05-10 16:29:23 +0100846 const ArenaVector<std::pair<InstructionType*, SlowPathCode*>>& candidates = iter->second;
Aart Bik42249c32016-01-07 15:33:50 -0800847 for (const auto& it : candidates) {
848 InstructionType* other_instruction = it.first;
849 SlowPathCodeType* other_slow_path = down_cast<SlowPathCodeType*>(it.second);
850 // Determine if the instructions allow for slow-path sharing.
851 if (HaveSameLiveRegisters(instruction, other_instruction) &&
852 HaveSameStackMap(instruction, other_instruction)) {
853 // Can share: reuse existing one.
854 return other_slow_path;
855 }
856 }
857 } else {
858 // First time this dex-pc is seen.
859 iter = slow_path_map_.Put(dex_pc, {{}, {graph_->GetArena()->Adapter(kArenaAllocSlowPaths)}});
860 }
861 // Cannot share: create and add new slow-path for this particular dex-pc.
862 SlowPathCodeType* slow_path = new (graph_->GetArena()) SlowPathCodeType(instruction);
863 iter->second.emplace_back(std::make_pair(instruction, slow_path));
864 codegen_->AddSlowPath(slow_path);
865 return slow_path;
866 }
867
868 private:
869 // Tests if both instructions have same set of live physical registers. This ensures
870 // the slow-path has exactly the same preamble on saving these registers to stack.
871 bool HaveSameLiveRegisters(const InstructionType* i1, const InstructionType* i2) const {
872 const uint32_t core_spill = ~codegen_->GetCoreSpillMask();
873 const uint32_t fpu_spill = ~codegen_->GetFpuSpillMask();
874 RegisterSet* live1 = i1->GetLocations()->GetLiveRegisters();
875 RegisterSet* live2 = i2->GetLocations()->GetLiveRegisters();
876 return (((live1->GetCoreRegisters() & core_spill) ==
877 (live2->GetCoreRegisters() & core_spill)) &&
878 ((live1->GetFloatingPointRegisters() & fpu_spill) ==
879 (live2->GetFloatingPointRegisters() & fpu_spill)));
880 }
881
882 // Tests if both instructions have the same stack map. This ensures the interpreter
883 // will find exactly the same dex-registers at the same entries.
884 bool HaveSameStackMap(const InstructionType* i1, const InstructionType* i2) const {
885 DCHECK(i1->HasEnvironment());
886 DCHECK(i2->HasEnvironment());
887 // We conservatively test if the two instructions find exactly the same instructions
888 // and location in each dex-register. This guarantees they will have the same stack map.
889 HEnvironment* e1 = i1->GetEnvironment();
890 HEnvironment* e2 = i2->GetEnvironment();
891 if (e1->GetParent() != e2->GetParent() || e1->Size() != e2->Size()) {
892 return false;
893 }
894 for (size_t i = 0, sz = e1->Size(); i < sz; ++i) {
895 if (e1->GetInstructionAt(i) != e2->GetInstructionAt(i) ||
896 !e1->GetLocationAt(i).Equals(e2->GetLocationAt(i))) {
897 return false;
898 }
899 }
900 return true;
901 }
902
903 HGraph* const graph_;
904 CodeGenerator* const codegen_;
905
906 // Map from dex-pc to vector of already existing instruction/slow-path pairs.
907 ArenaSafeMap<uint32_t, ArenaVector<std::pair<InstructionType*, SlowPathCode*>>> slow_path_map_;
908
909 DISALLOW_COPY_AND_ASSIGN(SlowPathGenerator);
910};
911
912class InstructionCodeGenerator : public HGraphVisitor {
913 public:
914 InstructionCodeGenerator(HGraph* graph, CodeGenerator* codegen)
915 : HGraphVisitor(graph),
916 deopt_slow_paths_(graph, codegen) {}
917
918 protected:
919 // Add slow-path generator for each instruction/slow-path combination that desires sharing.
920 // TODO: under current regime, only deopt sharing make sense; extend later.
921 SlowPathGenerator<HDeoptimize> deopt_slow_paths_;
922};
923
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000924} // namespace art
925
926#endif // ART_COMPILER_OPTIMIZING_CODE_GENERATOR_H_