blob: 78a8afb156c522b77132d919ee4a32df643019aa [file] [log] [blame]
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +00001/*
2 * Copyright (C) 2014 The Android Open Source Project
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 * http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
16
17#ifndef ART_COMPILER_OPTIMIZING_CODE_GENERATOR_H_
18#define ART_COMPILER_OPTIMIZING_CODE_GENERATOR_H_
19
Ian Rogersd582fa42014-11-05 23:46:43 -080020#include "arch/instruction_set.h"
Calin Juravle34166012014-12-19 17:22:29 +000021#include "arch/instruction_set_features.h"
Vladimir Markof9f64412015-09-02 14:05:49 +010022#include "base/arena_containers.h"
23#include "base/arena_object.h"
Nicolas Geoffray01bc96d2014-04-11 17:43:50 +010024#include "base/bit_field.h"
Andreas Gampe542451c2016-07-26 09:02:02 -070025#include "base/enums.h"
Nicolas Geoffraybab4ed72014-03-11 17:53:17 +000026#include "globals.h"
Alexandre Rameseb7b7392015-06-19 14:47:01 +010027#include "graph_visualizer.h"
Nicolas Geoffray4e3d23a2014-05-22 18:32:45 +010028#include "locations.h"
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +000029#include "memory_region.h"
30#include "nodes.h"
Serban Constantinescuecc43662015-08-13 13:33:12 +010031#include "optimizing_compiler_stats.h"
Nicolas Geoffray39468442014-09-02 15:17:15 +010032#include "stack_map_stream.h"
Andreas Gampe85b62f22015-09-09 13:15:38 -070033#include "utils/label.h"
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +000034
35namespace art {
36
// Binary encoding of 2^32 for type double (bit pattern of 4294967296.0).
static constexpr int64_t k2Pow32EncodingForDouble = INT64_C(0x41F0000000000000);
// Binary encoding of 2^31 for type double (bit pattern of 2147483648.0).
static constexpr int64_t k2Pow31EncodingForDouble = INT64_C(0x41E0000000000000);

// Minimum value for a primitive integer.
// Spelled INT32_MIN rather than 0x80000000: that literal has an unsigned type,
// so initializing an int32_t from it relies on an out-of-range conversion.
static constexpr int32_t kPrimIntMin = INT32_MIN;
// Minimum value for a primitive long.
// Spelled INT64_MIN for the same reason: 0x8000000000000000 does not fit in a
// signed 64-bit literal.
static constexpr int64_t kPrimLongMin = INT64_MIN;

// Maximum value for a primitive integer.
static constexpr int32_t kPrimIntMax = INT32_MAX;
// Maximum value for a primitive long.
static constexpr int64_t kPrimLongMax = INT64_MAX;
Roland Levillain3f8f9362014-12-02 17:45:01 +000051
Nicolas Geoffray92a73ae2014-10-16 11:12:52 +010052class Assembler;
Nicolas Geoffraye5038322014-07-04 09:41:32 +010053class CodeGenerator;
Nicolas Geoffrayd28b9692015-11-04 14:36:55 +000054class CompilerDriver;
Vladimir Marko3a21e382016-09-02 12:38:38 +010055class CompilerOptions;
Vladimir Marko58155012015-08-19 12:49:41 +000056class LinkerPatch;
Nicolas Geoffrayf0e39372014-11-12 17:50:07 +000057class ParallelMoveResolver;
Nicolas Geoffray92cf83e2014-03-18 17:59:20 +000058
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +000059class CodeAllocator {
60 public:
Nicolas Geoffraye5038322014-07-04 09:41:32 +010061 CodeAllocator() {}
62 virtual ~CodeAllocator() {}
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +000063
64 virtual uint8_t* Allocate(size_t size) = 0;
65
66 private:
67 DISALLOW_COPY_AND_ASSIGN(CodeAllocator);
68};
69
Alexandre Ramesc01a6642016-04-15 11:54:06 +010070class SlowPathCode : public DeletableArenaObject<kArenaAllocSlowPaths> {
Nicolas Geoffraye5038322014-07-04 09:41:32 +010071 public:
David Srbecky9cd6d372016-02-09 15:24:47 +000072 explicit SlowPathCode(HInstruction* instruction) : instruction_(instruction) {
Nicolas Geoffrayeeefa122015-03-13 18:52:59 +000073 for (size_t i = 0; i < kMaximumNumberOfExpectedRegisters; ++i) {
74 saved_core_stack_offsets_[i] = kRegisterNotSaved;
75 saved_fpu_stack_offsets_[i] = kRegisterNotSaved;
76 }
77 }
78
Nicolas Geoffraye5038322014-07-04 09:41:32 +010079 virtual ~SlowPathCode() {}
80
Nicolas Geoffraye5038322014-07-04 09:41:32 +010081 virtual void EmitNativeCode(CodeGenerator* codegen) = 0;
82
Roland Levillain4359e612016-07-20 11:32:19 +010083 // Save live core and floating-point caller-save registers and
84 // update the stack mask in `locations` for registers holding object
85 // references.
Zheng Xuda403092015-04-24 17:35:39 +080086 virtual void SaveLiveRegisters(CodeGenerator* codegen, LocationSummary* locations);
Roland Levillain4359e612016-07-20 11:32:19 +010087 // Restore live core and floating-point caller-save registers.
Zheng Xuda403092015-04-24 17:35:39 +080088 virtual void RestoreLiveRegisters(CodeGenerator* codegen, LocationSummary* locations);
Nicolas Geoffraya8ac9132015-03-13 16:36:36 +000089
Nicolas Geoffrayeeefa122015-03-13 18:52:59 +000090 bool IsCoreRegisterSaved(int reg) const {
91 return saved_core_stack_offsets_[reg] != kRegisterNotSaved;
92 }
93
94 bool IsFpuRegisterSaved(int reg) const {
95 return saved_fpu_stack_offsets_[reg] != kRegisterNotSaved;
96 }
97
98 uint32_t GetStackOffsetOfCoreRegister(int reg) const {
99 return saved_core_stack_offsets_[reg];
100 }
101
102 uint32_t GetStackOffsetOfFpuRegister(int reg) const {
103 return saved_fpu_stack_offsets_[reg];
104 }
105
Alexandre Rames8158f282015-08-07 10:26:17 +0100106 virtual bool IsFatal() const { return false; }
107
Alexandre Rames9931f312015-06-19 14:47:01 +0100108 virtual const char* GetDescription() const = 0;
109
Andreas Gampe85b62f22015-09-09 13:15:38 -0700110 Label* GetEntryLabel() { return &entry_label_; }
111 Label* GetExitLabel() { return &exit_label_; }
112
David Srbeckyd28f4a02016-03-14 17:14:24 +0000113 HInstruction* GetInstruction() const {
114 return instruction_;
115 }
116
David Srbecky9cd6d372016-02-09 15:24:47 +0000117 uint32_t GetDexPc() const {
118 return instruction_ != nullptr ? instruction_->GetDexPc() : kNoDexPc;
119 }
120
Zheng Xuda403092015-04-24 17:35:39 +0800121 protected:
Nicolas Geoffrayeeefa122015-03-13 18:52:59 +0000122 static constexpr size_t kMaximumNumberOfExpectedRegisters = 32;
123 static constexpr uint32_t kRegisterNotSaved = -1;
David Srbecky9cd6d372016-02-09 15:24:47 +0000124 // The instruction where this slow path is happening.
125 HInstruction* instruction_;
Nicolas Geoffrayeeefa122015-03-13 18:52:59 +0000126 uint32_t saved_core_stack_offsets_[kMaximumNumberOfExpectedRegisters];
127 uint32_t saved_fpu_stack_offsets_[kMaximumNumberOfExpectedRegisters];
Zheng Xuda403092015-04-24 17:35:39 +0800128
129 private:
Andreas Gampe85b62f22015-09-09 13:15:38 -0700130 Label entry_label_;
131 Label exit_label_;
132
Nicolas Geoffraye5038322014-07-04 09:41:32 +0100133 DISALLOW_COPY_AND_ASSIGN(SlowPathCode);
134};
135
Roland Levillain2d27c8e2015-04-28 15:48:45 +0100136class InvokeDexCallingConventionVisitor {
137 public:
138 virtual Location GetNextLocation(Primitive::Type type) = 0;
Nicolas Geoffrayfd88f162015-06-03 11:23:52 +0100139 virtual Location GetReturnLocation(Primitive::Type type) const = 0;
140 virtual Location GetMethodLocation() const = 0;
Roland Levillain2d27c8e2015-04-28 15:48:45 +0100141
142 protected:
143 InvokeDexCallingConventionVisitor() {}
144 virtual ~InvokeDexCallingConventionVisitor() {}
145
146 // The current index for core registers.
147 uint32_t gp_index_ = 0u;
148 // The current index for floating-point registers.
149 uint32_t float_index_ = 0u;
150 // The current stack index.
151 uint32_t stack_index_ = 0u;
152
153 private:
154 DISALLOW_COPY_AND_ASSIGN(InvokeDexCallingConventionVisitor);
155};
156
Calin Juravlee460d1d2015-09-29 04:52:17 +0100157class FieldAccessCallingConvention {
158 public:
159 virtual Location GetObjectLocation() const = 0;
160 virtual Location GetFieldIndexLocation() const = 0;
161 virtual Location GetReturnLocation(Primitive::Type type) const = 0;
162 virtual Location GetSetValueLocation(Primitive::Type type, bool is_instance) const = 0;
163 virtual Location GetFpuLocation(Primitive::Type type) const = 0;
164 virtual ~FieldAccessCallingConvention() {}
165
166 protected:
167 FieldAccessCallingConvention() {}
168
169 private:
170 DISALLOW_COPY_AND_ASSIGN(FieldAccessCallingConvention);
171};
172
Vladimir Markod58b8372016-04-12 18:51:43 +0100173class CodeGenerator : public DeletableArenaObject<kArenaAllocCodeGenerator> {
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000174 public:
David Brazdil58282f42016-01-14 12:45:10 +0000175 // Compiles the graph to executable instructions.
176 void Compile(CodeAllocator* allocator);
Vladimir Markod58b8372016-04-12 18:51:43 +0100177 static std::unique_ptr<CodeGenerator> Create(HGraph* graph,
178 InstructionSet instruction_set,
179 const InstructionSetFeatures& isa_features,
180 const CompilerOptions& compiler_options,
181 OptimizingCompilerStats* stats = nullptr);
Nicolas Geoffray12df9eb2015-01-09 14:53:50 +0000182 virtual ~CodeGenerator() {}
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000183
Vladimir Markodc151b22015-10-15 18:02:30 +0100184 // Get the graph. This is the outermost graph, never the graph of a method being inlined.
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000185 HGraph* GetGraph() const { return graph_; }
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000186
Nicolas Geoffraydc23d832015-02-16 11:15:43 +0000187 HBasicBlock* GetNextBlockToEmit() const;
188 HBasicBlock* FirstNonEmptyBlock(HBasicBlock* block) const;
Nicolas Geoffraybab4ed72014-03-11 17:53:17 +0000189 bool GoesToNextBlock(HBasicBlock* current, HBasicBlock* next) const;
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000190
Nicolas Geoffray86dbb9a2014-06-04 11:12:39 +0100191 size_t GetStackSlotOfParameter(HParameterValue* parameter) const {
192 // Note that this follows the current calling convention.
193 return GetFrameSize()
Andreas Gampe542451c2016-07-26 09:02:02 -0700194 + static_cast<size_t>(InstructionSetPointerSize(GetInstructionSet())) // Art method
Nicolas Geoffraye27f31a2014-06-12 17:53:14 +0100195 + parameter->GetIndex() * kVRegSize;
Nicolas Geoffray86dbb9a2014-06-04 11:12:39 +0100196 }
197
Nicolas Geoffray92a73ae2014-10-16 11:12:52 +0100198 virtual void Initialize() = 0;
Serban Constantinescu32f5b4d2014-11-25 20:05:46 +0000199 virtual void Finalize(CodeAllocator* allocator);
Vladimir Marko58155012015-08-19 12:49:41 +0000200 virtual void EmitLinkerPatches(ArenaVector<LinkerPatch>* linker_patches);
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000201 virtual void GenerateFrameEntry() = 0;
202 virtual void GenerateFrameExit() = 0;
Nicolas Geoffray92a73ae2014-10-16 11:12:52 +0100203 virtual void Bind(HBasicBlock* block) = 0;
Calin Juravle175dc732015-08-25 15:42:32 +0100204 virtual void MoveConstant(Location destination, int32_t value) = 0;
Calin Juravlee460d1d2015-09-29 04:52:17 +0100205 virtual void MoveLocation(Location dst, Location src, Primitive::Type dst_type) = 0;
206 virtual void AddLocationAsTemp(Location location, LocationSummary* locations) = 0;
207
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000208 virtual Assembler* GetAssembler() = 0;
Alexandre Rameseb7b7392015-06-19 14:47:01 +0100209 virtual const Assembler& GetAssembler() const = 0;
Nicolas Geoffray707c8092014-04-04 10:50:14 +0100210 virtual size_t GetWordSize() const = 0;
Mark Mendellf85a9ca2015-01-13 09:20:58 -0500211 virtual size_t GetFloatingPointSpillSlotSize() const = 0;
Alexandre Ramesc01a6642016-04-15 11:54:06 +0100212 virtual uintptr_t GetAddressOf(HBasicBlock* block) = 0;
Nicolas Geoffray4c204ba2015-02-03 15:12:35 +0000213 void InitializeCodeGeneration(size_t number_of_spill_slots,
214 size_t maximum_number_of_live_core_registers,
Roland Levillain0d5a2812015-11-13 10:07:31 +0000215 size_t maximum_number_of_live_fpu_registers,
Nicolas Geoffray4c204ba2015-02-03 15:12:35 +0000216 size_t number_of_out_slots,
Vladimir Markofa6b93c2015-09-15 10:15:55 +0100217 const ArenaVector<HBasicBlock*>& block_order);
Alexandre Rames68bd9b92016-07-15 17:41:13 +0100218 // Backends can override this as necessary. For most, no special alignment is required.
219 virtual uint32_t GetPreferredSlotsAlignment() const { return 1; }
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000220
221 uint32_t GetFrameSize() const { return frame_size_; }
222 void SetFrameSize(uint32_t size) { frame_size_ = size; }
Nicolas Geoffray8ccc3f52014-03-19 10:34:11 +0000223 uint32_t GetCoreSpillMask() const { return core_spill_mask_; }
Nicolas Geoffrayd97dc402015-01-22 13:50:01 +0000224 uint32_t GetFpuSpillMask() const { return fpu_spill_mask_; }
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000225
Nicolas Geoffray71175b72014-10-09 22:13:55 +0100226 size_t GetNumberOfCoreRegisters() const { return number_of_core_registers_; }
227 size_t GetNumberOfFloatingPointRegisters() const { return number_of_fpu_registers_; }
David Brazdil58282f42016-01-14 12:45:10 +0000228 virtual void SetupBlockedRegisters() const = 0;
Nicolas Geoffray71175b72014-10-09 22:13:55 +0100229
Nicolas Geoffray4dee6362015-01-23 18:23:14 +0000230 virtual void ComputeSpillMask() {
231 core_spill_mask_ = allocated_registers_.GetCoreRegisters() & core_callee_save_mask_;
232 DCHECK_NE(core_spill_mask_, 0u) << "At least the return address register must be saved";
233 fpu_spill_mask_ = allocated_registers_.GetFloatingPointRegisters() & fpu_callee_save_mask_;
234 }
235
// Builds a bit mask with bit `registers[i]` set for each of the `length`
// entries of `registers`. Duplicate entries are harmless and a zero `length`
// yields 0 without reading `registers`.
// Every register number must be in the range [0, 31].
static uint32_t ComputeRegisterMask(const int* registers, size_t length) {
  uint32_t mask = 0u;
  for (size_t i = 0; i < length; ++i) {
    // Shift an unsigned one: `1 << 31` overflows a signed int.
    mask |= (1u << registers[i]);
  }
  return mask;
}
243
Nicolas Geoffraya7062e02014-05-22 12:50:17 +0100244 virtual void DumpCoreRegister(std::ostream& stream, int reg) const = 0;
245 virtual void DumpFloatingPointRegister(std::ostream& stream, int reg) const = 0;
Nicolas Geoffray412f10c2014-06-19 10:00:34 +0100246 virtual InstructionSet GetInstructionSet() const = 0;
Calin Juravlecd6dffe2015-01-08 17:35:35 +0000247
248 const CompilerOptions& GetCompilerOptions() const { return compiler_options_; }
249
Serban Constantinescuecc43662015-08-13 13:33:12 +0100250 void MaybeRecordStat(MethodCompilationStat compilation_stat, size_t count = 1) const;
251
Nicolas Geoffray102cbed2014-10-15 18:31:05 +0100252 // Saves the register in the stack. Returns the size taken on stack.
253 virtual size_t SaveCoreRegister(size_t stack_index, uint32_t reg_id) = 0;
254 // Restores the register from the stack. Returns the size taken on stack.
255 virtual size_t RestoreCoreRegister(size_t stack_index, uint32_t reg_id) = 0;
Nicolas Geoffray234d69d2015-03-09 10:28:50 +0000256
257 virtual size_t SaveFloatingPointRegister(size_t stack_index, uint32_t reg_id) = 0;
258 virtual size_t RestoreFloatingPointRegister(size_t stack_index, uint32_t reg_id) = 0;
259
Nicolas Geoffray840e5462015-01-07 16:01:24 +0000260 virtual bool NeedsTwoRegisters(Primitive::Type type) const = 0;
Nicolas Geoffray234d69d2015-03-09 10:28:50 +0000261 // Returns whether we should split long moves in parallel moves.
262 virtual bool ShouldSplitLongMoves() const { return false; }
Nicolas Geoffraya7062e02014-05-22 12:50:17 +0100263
Roland Levillain0d5a2812015-11-13 10:07:31 +0000264 size_t GetNumberOfCoreCalleeSaveRegisters() const {
265 return POPCOUNT(core_callee_save_mask_);
266 }
267
268 size_t GetNumberOfCoreCallerSaveRegisters() const {
269 DCHECK_GE(GetNumberOfCoreRegisters(), GetNumberOfCoreCalleeSaveRegisters());
270 return GetNumberOfCoreRegisters() - GetNumberOfCoreCalleeSaveRegisters();
271 }
272
Nicolas Geoffray98893962015-01-21 12:32:32 +0000273 bool IsCoreCalleeSaveRegister(int reg) const {
274 return (core_callee_save_mask_ & (1 << reg)) != 0;
275 }
276
277 bool IsFloatingPointCalleeSaveRegister(int reg) const {
278 return (fpu_callee_save_mask_ & (1 << reg)) != 0;
279 }
280
Yevgeny Rouban2a7c1ef2015-07-22 18:36:24 +0600281 // Record native to dex mapping for a suspend point. Required by runtime.
Nicolas Geoffrayeeefa122015-03-13 18:52:59 +0000282 void RecordPcInfo(HInstruction* instruction, uint32_t dex_pc, SlowPathCode* slow_path = nullptr);
David Srbeckyb7070a22016-01-08 18:13:53 +0000283 // Check whether we have already recorded mapping at this PC.
284 bool HasStackMapAtCurrentPc();
David Srbeckyc7098ff2016-02-09 14:30:11 +0000285 // Record extra stack maps if we support native debugging.
David Srbeckyd28f4a02016-03-14 17:14:24 +0000286 void MaybeRecordNativeDebugInfo(HInstruction* instruction,
287 uint32_t dex_pc,
288 SlowPathCode* slow_path = nullptr);
Yevgeny Rouban2a7c1ef2015-07-22 18:36:24 +0600289
Calin Juravle77520bc2015-01-12 18:45:46 +0000290 bool CanMoveNullCheckToUser(HNullCheck* null_check);
291 void MaybeRecordImplicitNullCheck(HInstruction* instruction);
Calin Juravle2ae48182016-03-16 14:05:09 +0000292 void GenerateNullCheck(HNullCheck* null_check);
293 virtual void GenerateImplicitNullCheck(HNullCheck* null_check) = 0;
294 virtual void GenerateExplicitNullCheck(HNullCheck* null_check) = 0;
Nicolas Geoffray8ccc3f52014-03-19 10:34:11 +0000295
David Brazdil77a48ae2015-09-15 12:34:04 +0000296 // Records a stack map which the runtime might use to set catch phi values
297 // during exception delivery.
298 // TODO: Replace with a catch-entering instruction that records the environment.
299 void RecordCatchBlockInfo();
300
301 // Returns true if implicit null checks are allowed in the compiler options
302 // and if the null check is not inside a try block. We currently cannot do
303 // implicit null checks in that case because we need the NullCheckSlowPath to
304 // save live registers, which may be needed by the runtime to set catch phis.
305 bool IsImplicitNullCheckAllowed(HNullCheck* null_check) const;
306
Alexandre Ramesc01a6642016-04-15 11:54:06 +0100307 // TODO: Avoid creating the `std::unique_ptr` here.
Nicolas Geoffraye5038322014-07-04 09:41:32 +0100308 void AddSlowPath(SlowPathCode* slow_path) {
Alexandre Ramesc01a6642016-04-15 11:54:06 +0100309 slow_paths_.push_back(std::unique_ptr<SlowPathCode>(slow_path));
Nicolas Geoffraye5038322014-07-04 09:41:32 +0100310 }
311
Nicolas Geoffrayb331feb2016-02-05 16:51:53 +0000312 void BuildStackMaps(MemoryRegion region, const DexFile::CodeItem& code_item);
Nicolas Geoffrayd28b9692015-11-04 14:36:55 +0000313 size_t ComputeStackMapsSize();
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000314
Nicolas Geoffrayf12feb82014-07-17 18:32:41 +0100315 bool IsLeafMethod() const {
316 return is_leaf_;
317 }
318
319 void MarkNotLeaf() {
320 is_leaf_ = false;
Nicolas Geoffrayc0572a42015-02-06 14:35:25 +0000321 requires_current_method_ = true;
322 }
323
324 void SetRequiresCurrentMethod() {
325 requires_current_method_ = true;
326 }
327
328 bool RequiresCurrentMethod() const {
329 return requires_current_method_;
Nicolas Geoffrayf12feb82014-07-17 18:32:41 +0100330 }
331
Nicolas Geoffray3c049742014-09-24 18:10:46 +0100332 // Clears the spill slots taken by loop phis in the `LocationSummary` of the
333 // suspend check. This is called when the code generator generates code
334 // for the suspend check at the back edge (instead of where the suspend check
335 // is, which is the loop entry). At this point, the spill slots for the phis
336 // have not been written to.
337 void ClearSpillSlotsFromLoopPhisInStackMap(HSuspendCheck* suspend_check) const;
338
Nicolas Geoffray71175b72014-10-09 22:13:55 +0100339 bool* GetBlockedCoreRegisters() const { return blocked_core_registers_; }
Nicolas Geoffray102cbed2014-10-15 18:31:05 +0100340 bool* GetBlockedFloatingPointRegisters() const { return blocked_fpu_registers_; }
Nicolas Geoffray71175b72014-10-09 22:13:55 +0100341
Matthew Gharrityd9ffd0d2016-06-22 10:27:55 -0700342 bool IsBlockedCoreRegister(size_t i) { return blocked_core_registers_[i]; }
343 bool IsBlockedFloatingPointRegister(size_t i) { return blocked_fpu_registers_[i]; }
344
Nicolas Geoffray19a19cf2014-10-22 16:07:05 +0100345 // Helper that returns the pointer offset of an index in an object array.
346 // Note: this method assumes we always have the same pointer size, regardless
347 // of the architecture.
348 static size_t GetCacheOffset(uint32_t index);
Mathieu Chartiere401d142015-04-22 13:56:20 -0700349 // Pointer variant for ArtMethod and ArtField arrays.
350 size_t GetCachePointerOffset(uint32_t index);
Nicolas Geoffray19a19cf2014-10-22 16:07:05 +0100351
Vladimir Markodce016e2016-04-28 13:10:02 +0100352 // Helper that returns the offset of the array's length field.
353 // Note: Besides the normal arrays, we also use the HArrayLength for
354 // accessing the String's `count` field in String intrinsics.
355 static uint32_t GetArrayLengthOffset(HArrayLength* array_length);
356
Vladimir Marko87f3fcb2016-04-28 15:52:11 +0100357 // Helper that returns the offset of the array's data.
358 // Note: Besides the normal arrays, we also use the HArrayGet for
359 // accessing the String's `value` field in String intrinsics.
360 static uint32_t GetArrayDataOffset(HArrayGet* array_get);
361
Roland Levillain02b75802016-07-13 11:54:35 +0100362 // Return the entry point offset for ReadBarrierMarkRegX, where X is `reg`.
Andreas Gampe542451c2016-07-26 09:02:02 -0700363 template <PointerSize pointer_size>
Roland Levillain02b75802016-07-13 11:54:35 +0100364 static int32_t GetReadBarrierMarkEntryPointsOffset(size_t reg) {
Roland Levillaind549c282016-07-25 12:49:15 +0100365 // The entry point list defines 30 ReadBarrierMarkRegX entry points.
366 DCHECK_LT(reg, 30u);
Roland Levillain02b75802016-07-13 11:54:35 +0100367 // The ReadBarrierMarkRegX entry points are ordered by increasing
368 // register number in Thread::tls_Ptr_.quick_entrypoints.
369 return QUICK_ENTRYPOINT_OFFSET(pointer_size, pReadBarrierMarkReg00).Int32Value()
Andreas Gampe542451c2016-07-26 09:02:02 -0700370 + static_cast<size_t>(pointer_size) * reg;
Roland Levillain02b75802016-07-13 11:54:35 +0100371 }
372
Nicolas Geoffray90218252015-04-15 11:56:51 +0100373 void EmitParallelMoves(Location from1,
374 Location to1,
375 Primitive::Type type1,
376 Location from2,
377 Location to2,
378 Primitive::Type type2);
Nicolas Geoffrayf0e39372014-11-12 17:50:07 +0000379
Nicolas Geoffrayaf07bc12014-11-12 18:08:09 +0000380 static bool StoreNeedsWriteBarrier(Primitive::Type type, HInstruction* value) {
David Brazdil522e2242015-03-17 18:48:28 +0000381 // Check that null value is not represented as an integer constant.
382 DCHECK(type != Primitive::kPrimNot || !value->IsIntConstant());
383 return type == Primitive::kPrimNot && !value->IsNullConstant();
Nicolas Geoffrayaf07bc12014-11-12 18:08:09 +0000384 }
385
Roland Levillaindec8f632016-07-22 17:10:06 +0100386
// Performs checks pertaining to an InvokeRuntime call.
Alexandre Rames78e3ef62015-08-12 13:43:29 +0100388 void ValidateInvokeRuntime(HInstruction* instruction, SlowPathCode* slow_path);
389
// Performs checks pertaining to an InvokeRuntimeWithoutRecordingPcInfo call.
391 static void ValidateInvokeRuntimeWithoutRecordingPcInfo(HInstruction* instruction,
392 SlowPathCode* slow_path);
393
Nicolas Geoffray98893962015-01-21 12:32:32 +0000394 void AddAllocatedRegister(Location location) {
395 allocated_registers_.Add(location);
396 }
397
Nicolas Geoffray45b83af2015-07-06 15:12:53 +0000398 bool HasAllocatedRegister(bool is_core, int reg) const {
399 return is_core
400 ? allocated_registers_.ContainsCoreRegister(reg)
401 : allocated_registers_.ContainsFloatingPointRegister(reg);
402 }
403
Nicolas Geoffrayc0572a42015-02-06 14:35:25 +0000404 void AllocateLocations(HInstruction* instruction);
405
Roland Levillainaa9b7c42015-02-17 15:40:09 +0000406 // Tells whether the stack frame of the compiled method is
407 // considered "empty", that is either actually having a size of zero,
408 // or just containing the saved return address register.
409 bool HasEmptyFrame() const {
410 return GetFrameSize() == (CallPushesPC() ? GetWordSize() : 0);
411 }
412
Nicolas Geoffrayd6138ef2015-02-18 14:48:53 +0000413 static int32_t GetInt32ValueOf(HConstant* constant) {
414 if (constant->IsIntConstant()) {
415 return constant->AsIntConstant()->GetValue();
416 } else if (constant->IsNullConstant()) {
417 return 0;
418 } else {
419 DCHECK(constant->IsFloatConstant());
Roland Levillainda4d79b2015-03-24 14:36:11 +0000420 return bit_cast<int32_t, float>(constant->AsFloatConstant()->GetValue());
Nicolas Geoffrayd6138ef2015-02-18 14:48:53 +0000421 }
422 }
423
424 static int64_t GetInt64ValueOf(HConstant* constant) {
425 if (constant->IsIntConstant()) {
426 return constant->AsIntConstant()->GetValue();
427 } else if (constant->IsNullConstant()) {
428 return 0;
429 } else if (constant->IsFloatConstant()) {
Roland Levillainda4d79b2015-03-24 14:36:11 +0000430 return bit_cast<int32_t, float>(constant->AsFloatConstant()->GetValue());
Nicolas Geoffrayd6138ef2015-02-18 14:48:53 +0000431 } else if (constant->IsLongConstant()) {
432 return constant->AsLongConstant()->GetValue();
433 } else {
434 DCHECK(constant->IsDoubleConstant());
Roland Levillainda4d79b2015-03-24 14:36:11 +0000435 return bit_cast<int64_t, double>(constant->AsDoubleConstant()->GetValue());
Nicolas Geoffrayd6138ef2015-02-18 14:48:53 +0000436 }
437 }
438
Nicolas Geoffraya8ac9132015-03-13 16:36:36 +0000439 size_t GetFirstRegisterSlotInSlowPath() const {
440 return first_register_slot_in_slow_path_;
441 }
442
443 uint32_t FrameEntrySpillSize() const {
444 return GetFpuSpillSize() + GetCoreSpillSize();
445 }
446
Roland Levillainec525fc2015-04-28 15:50:20 +0100447 virtual ParallelMoveResolver* GetMoveResolver() = 0;
Nicolas Geoffraya8ac9132015-03-13 16:36:36 +0000448
Nicolas Geoffrayfd88f162015-06-03 11:23:52 +0100449 static void CreateCommonInvokeLocationSummary(
450 HInvoke* invoke, InvokeDexCallingConventionVisitor* visitor);
451
Calin Juravle175dc732015-08-25 15:42:32 +0100452 void GenerateInvokeUnresolvedRuntimeCall(HInvokeUnresolved* invoke);
453
Calin Juravlee460d1d2015-09-29 04:52:17 +0100454 void CreateUnresolvedFieldLocationSummary(
455 HInstruction* field_access,
456 Primitive::Type field_type,
457 const FieldAccessCallingConvention& calling_convention);
458
459 void GenerateUnresolvedFieldAccess(
460 HInstruction* field_access,
461 Primitive::Type field_type,
462 uint32_t field_index,
463 uint32_t dex_pc,
464 const FieldAccessCallingConvention& calling_convention);
465
Calin Juravle98893e12015-10-02 21:05:03 +0100466 // TODO: This overlaps a bit with MoveFromReturnRegister. Refactor for a better design.
467 static void CreateLoadClassLocationSummary(HLoadClass* cls,
468 Location runtime_type_index_location,
Roland Levillain0d5a2812015-11-13 10:07:31 +0000469 Location runtime_return_location,
470 bool code_generator_supports_read_barrier = false);
Calin Juravle98893e12015-10-02 21:05:03 +0100471
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +0100472 static void CreateSystemArrayCopyLocationSummary(HInvoke* invoke);
473
Alexandre Rameseb7b7392015-06-19 14:47:01 +0100474 void SetDisassemblyInformation(DisassemblyInformation* info) { disasm_info_ = info; }
475 DisassemblyInformation* GetDisassemblyInformation() const { return disasm_info_; }
476
Calin Juravle175dc732015-08-25 15:42:32 +0100477 virtual void InvokeRuntime(QuickEntrypointEnum entrypoint,
478 HInstruction* instruction,
479 uint32_t dex_pc,
480 SlowPathCode* slow_path) = 0;
481
Vladimir Markocac5a7e2016-02-22 10:39:50 +0000482 // Check if the desired_string_load_kind is supported. If it is, return it,
Vladimir Markodbb7f5b2016-03-30 13:23:58 +0100483 // otherwise return a fall-back kind that should be used instead.
Vladimir Markocac5a7e2016-02-22 10:39:50 +0000484 virtual HLoadString::LoadKind GetSupportedLoadStringKind(
485 HLoadString::LoadKind desired_string_load_kind) = 0;
486
Vladimir Markodbb7f5b2016-03-30 13:23:58 +0100487 // Check if the desired_class_load_kind is supported. If it is, return it,
488 // otherwise return a fall-back kind that should be used instead.
489 virtual HLoadClass::LoadKind GetSupportedLoadClassKind(
490 HLoadClass::LoadKind desired_class_load_kind) = 0;
491
Vladimir Markodc151b22015-10-15 18:02:30 +0100492 // Check if the desired_dispatch_info is supported. If it is, return it,
493 // otherwise return a fall-back info that should be used instead.
494 virtual HInvokeStaticOrDirect::DispatchInfo GetSupportedInvokeStaticOrDirectDispatch(
495 const HInvokeStaticOrDirect::DispatchInfo& desired_dispatch_info,
496 MethodReference target_method) = 0;
497
Andreas Gampe85b62f22015-09-09 13:15:38 -0700498 // Generate a call to a static or direct method.
499 virtual void GenerateStaticOrDirectCall(HInvokeStaticOrDirect* invoke, Location temp) = 0;
500 // Generate a call to a virtual method.
501 virtual void GenerateVirtualCall(HInvokeVirtual* invoke, Location temp) = 0;
502
503 // Copy the result of a call into the given target.
504 virtual void MoveFromReturnRegister(Location trg, Primitive::Type type) = 0;
505
David Srbeckyc7098ff2016-02-09 14:30:11 +0000506 virtual void GenerateNop() = 0;
507
Serguei Katkov288c7a82016-05-16 11:53:15 +0600508 uint32_t GetReferenceSlowFlagOffset() const;
509 uint32_t GetReferenceDisableFlagOffset() const;
510
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000511 protected:
Vladimir Marko58155012015-08-19 12:49:41 +0000512 // Method patch info used for recording locations of required linker patches and
513 // target methods. The target method can be used for various purposes, whether for
514 // patching the address of the method or the code pointer or a PC-relative call.
515 template <typename LabelType>
516 struct MethodPatchInfo {
517 explicit MethodPatchInfo(MethodReference m) : target_method(m), label() { }
518
519 MethodReference target_method;
520 LabelType label;
521 };
522
Vladimir Markocac5a7e2016-02-22 10:39:50 +0000523 // String patch info used for recording locations of required linker patches and
524 // target strings. The actual string address can be absolute or PC-relative.
525 template <typename LabelType>
526 struct StringPatchInfo {
527 StringPatchInfo(const DexFile& df, uint32_t index)
528 : dex_file(df), string_index(index), label() { }
529
530 const DexFile& dex_file;
531 uint32_t string_index;
532 LabelType label;
533 };
534
Vladimir Markodbb7f5b2016-03-30 13:23:58 +0100535 // Type patch info used for recording locations of required linker patches and
536 // target types. The actual type address can be absolute or PC-relative.
537 // TODO: Consider merging with MethodPatchInfo and StringPatchInfo - all these
538 // classes contain the dex file, some index and the label.
539 template <typename LabelType>
540 struct TypePatchInfo {
541 TypePatchInfo(const DexFile& df, uint32_t index)
542 : dex_file(df), type_index(index), label() { }
543
544 const DexFile& dex_file;
545 uint32_t type_index;
546 LabelType label;
547 };
548
Nicolas Geoffray71175b72014-10-09 22:13:55 +0100549 CodeGenerator(HGraph* graph,
550 size_t number_of_core_registers,
551 size_t number_of_fpu_registers,
Calin Juravlecd6dffe2015-01-08 17:35:35 +0000552 size_t number_of_register_pairs,
Nicolas Geoffray98893962015-01-21 12:32:32 +0000553 uint32_t core_callee_save_mask,
554 uint32_t fpu_callee_save_mask,
Serban Constantinescuecc43662015-08-13 13:33:12 +0100555 const CompilerOptions& compiler_options,
556 OptimizingCompilerStats* stats)
Nicolas Geoffrayc0572a42015-02-06 14:35:25 +0000557 : frame_size_(0),
Nicolas Geoffray4361bef2014-08-20 04:59:12 +0100558 core_spill_mask_(0),
Nicolas Geoffrayd97dc402015-01-22 13:50:01 +0000559 fpu_spill_mask_(0),
Nicolas Geoffray3bca0df2014-09-19 11:01:00 +0100560 first_register_slot_in_slow_path_(0),
Vladimir Marko5233f932015-09-29 19:01:15 +0100561 blocked_core_registers_(graph->GetArena()->AllocArray<bool>(number_of_core_registers,
562 kArenaAllocCodeGenerator)),
563 blocked_fpu_registers_(graph->GetArena()->AllocArray<bool>(number_of_fpu_registers,
564 kArenaAllocCodeGenerator)),
565 blocked_register_pairs_(graph->GetArena()->AllocArray<bool>(number_of_register_pairs,
566 kArenaAllocCodeGenerator)),
Nicolas Geoffray71175b72014-10-09 22:13:55 +0100567 number_of_core_registers_(number_of_core_registers),
568 number_of_fpu_registers_(number_of_fpu_registers),
569 number_of_register_pairs_(number_of_register_pairs),
Nicolas Geoffray98893962015-01-21 12:32:32 +0000570 core_callee_save_mask_(core_callee_save_mask),
571 fpu_callee_save_mask_(fpu_callee_save_mask),
Vladimir Markocf93a5c2015-06-16 11:33:24 +0000572 stack_map_stream_(graph->GetArena()),
573 block_order_(nullptr),
Alexandre Rameseb7b7392015-06-19 14:47:01 +0100574 disasm_info_(nullptr),
Serban Constantinescuecc43662015-08-13 13:33:12 +0100575 stats_(stats),
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000576 graph_(graph),
Calin Juravlecd6dffe2015-01-08 17:35:35 +0000577 compiler_options_(compiler_options),
Vladimir Marko225b6462015-09-28 12:17:40 +0100578 slow_paths_(graph->GetArena()->Adapter(kArenaAllocCodeGenerator)),
Vladimir Marko0f7dca42015-11-02 14:36:43 +0000579 current_slow_path_(nullptr),
Nicolas Geoffray4c204ba2015-02-03 15:12:35 +0000580 current_block_index_(0),
Nicolas Geoffray39468442014-09-02 15:17:15 +0100581 is_leaf_(true),
Vladimir Marko225b6462015-09-28 12:17:40 +0100582 requires_current_method_(false) {
583 slow_paths_.reserve(8);
584 }
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000585
// Pure-virtual accessors for the two HGraphVisitor objects that every
// concrete code generator must provide.
// NOTE(review): judging by the names, these are the visitor that builds
// instruction locations and the visitor that emits code - confirm against
// the architecture-specific subclasses.
virtual HGraphVisitor* GetLocationBuilder() = 0;
virtual HGraphVisitor* GetInstructionVisitor() = 0;
Nicolas Geoffrayf0e39372014-11-12 17:50:07 +0000588
Nicolas Geoffrayd97dc402015-01-22 13:50:01 +0000589 // Returns the location of the first spilled entry for floating point registers,
590 // relative to the stack pointer.
591 uint32_t GetFpuSpillStart() const {
Nicolas Geoffrayd97dc402015-01-22 13:50:01 +0000592 return GetFrameSize() - FrameEntrySpillSize();
593 }
594
595 uint32_t GetFpuSpillSize() const {
596 return POPCOUNT(fpu_spill_mask_) * GetFloatingPointSpillSlotSize();
597 }
598
599 uint32_t GetCoreSpillSize() const {
600 return POPCOUNT(core_spill_mask_) * GetWordSize();
601 }
602
Nicolas Geoffrayc0572a42015-02-06 14:35:25 +0000603 bool HasAllocatedCalleeSaveRegisters() const {
604 // We check the core registers against 1 because it always comprises the return PC.
605 return (POPCOUNT(allocated_registers_.GetCoreRegisters() & core_callee_save_mask_) != 1)
606 || (POPCOUNT(allocated_registers_.GetFloatingPointRegisters() & fpu_callee_save_mask_) != 0);
607 }
608
609 bool CallPushesPC() const {
610 InstructionSet instruction_set = GetInstructionSet();
611 return instruction_set == kX86 || instruction_set == kX86_64;
612 }
613
Vladimir Marko225b6462015-09-28 12:17:40 +0100614 // Arm64 has its own type for a label, so we need to templatize these methods
Nicolas Geoffraydc23d832015-02-16 11:15:43 +0000615 // to share the logic.
Vladimir Marko225b6462015-09-28 12:17:40 +0100616
617 template <typename LabelType>
618 LabelType* CommonInitializeLabels() {
Vladimir Markob95fb772015-09-30 13:32:31 +0100619 // We use raw array allocations instead of ArenaVector<> because Labels are
620 // non-constructible and non-movable and as such cannot be held in a vector.
Vladimir Marko225b6462015-09-28 12:17:40 +0100621 size_t size = GetGraph()->GetBlocks().size();
622 LabelType* labels = GetGraph()->GetArena()->AllocArray<LabelType>(size,
623 kArenaAllocCodeGenerator);
624 for (size_t i = 0; i != size; ++i) {
625 new(labels + i) LabelType();
626 }
627 return labels;
628 }
629
Vladimir Marko58155012015-08-19 12:49:41 +0000630 template <typename LabelType>
631 LabelType* CommonGetLabelOf(LabelType* raw_pointer_to_labels_array, HBasicBlock* block) const {
Nicolas Geoffraydc23d832015-02-16 11:15:43 +0000632 block = FirstNonEmptyBlock(block);
633 return raw_pointer_to_labels_array + block->GetBlockId();
634 }
635
Vladimir Marko0f7dca42015-11-02 14:36:43 +0000636 SlowPathCode* GetCurrentSlowPath() {
637 return current_slow_path_;
638 }
639
// Frame size required for this method.
uint32_t frame_size_;
// Register spill masks; GetCoreSpillSize() and GetFpuSpillSize() count their
// set bits to compute the spill area sizes.
uint32_t core_spill_mask_;
uint32_t fpu_spill_mask_;
// NOTE(review): presumably the first stack slot used for saving registers in
// slow paths - confirm against its users. The constructor sets it to 0.
uint32_t first_register_slot_in_slow_path_;

// Registers that were allocated during linear scan.
RegisterSet allocated_registers_;

// Arrays used when doing register allocation to know which
// registers we can allocate. `SetupBlockedRegisters` updates the
// arrays. The constructor allocates them from the graph's arena with one
// bool per core register, FPU register and register pair respectively.
bool* const blocked_core_registers_;
bool* const blocked_fpu_registers_;
bool* const blocked_register_pairs_;
// Register counts passed to the constructor.
size_t number_of_core_registers_;
size_t number_of_fpu_registers_;
size_t number_of_register_pairs_;
// Callee-save register masks passed to the constructor.
const uint32_t core_callee_save_mask_;
const uint32_t fpu_callee_save_mask_;

// Stack map stream, constructed with the graph's arena.
StackMapStream stack_map_stream_;

// The order to use for code generation. Null until a block order is set.
const ArenaVector<HBasicBlock*>* block_order_;

// Disassembly information; null after construction.
DisassemblyInformation* disasm_info_;
667
private:
// Internal helpers; only their declarations are visible in this header.
size_t GetStackOffsetOfSavedRegister(size_t index);
void GenerateSlowPaths();
void BlockIfInRegister(Location location, bool is_out = false) const;
void EmitEnvironment(HEnvironment* environment, SlowPathCode* slow_path);

// Compiler statistics object passed to the constructor.
OptimizingCompilerStats* stats_;

// The graph this generator was constructed for.
HGraph* const graph_;
// Compiler options passed to the constructor, held by reference.
const CompilerOptions& compiler_options_;

// Slow paths, owned through std::unique_ptr. The constructor reserves room
// for eight entries.
ArenaVector<std::unique_ptr<SlowPathCode>> slow_paths_;

// The current slow-path that we're generating code for.
SlowPathCode* current_slow_path_;

// The current block index in `block_order_` of the block
// we are generating code for.
size_t current_block_index_;

// Whether the method is a leaf method. Starts out as true.
bool is_leaf_;

// Whether an instruction in the graph accesses the current method.
// Starts out as false.
bool requires_current_method_;

// Grants the CFI test access to the private members.
friend class OptimizingCFITest;

DISALLOW_COPY_AND_ASSIGN(CodeGenerator);
697};
698
Nicolas Geoffray7fb49da2014-10-06 09:12:41 +0100699template <typename C, typename F>
Nicolas Geoffray4a34a422014-04-03 10:38:37 +0100700class CallingConvention {
701 public:
Nicolas Geoffray7fb49da2014-10-06 09:12:41 +0100702 CallingConvention(const C* registers,
703 size_t number_of_registers,
704 const F* fpu_registers,
Mathieu Chartiere401d142015-04-22 13:56:20 -0700705 size_t number_of_fpu_registers,
Andreas Gampe542451c2016-07-26 09:02:02 -0700706 PointerSize pointer_size)
Nicolas Geoffray7fb49da2014-10-06 09:12:41 +0100707 : registers_(registers),
708 number_of_registers_(number_of_registers),
709 fpu_registers_(fpu_registers),
Mathieu Chartiere401d142015-04-22 13:56:20 -0700710 number_of_fpu_registers_(number_of_fpu_registers),
711 pointer_size_(pointer_size) {}
Nicolas Geoffray4a34a422014-04-03 10:38:37 +0100712
713 size_t GetNumberOfRegisters() const { return number_of_registers_; }
Nicolas Geoffray7fb49da2014-10-06 09:12:41 +0100714 size_t GetNumberOfFpuRegisters() const { return number_of_fpu_registers_; }
Nicolas Geoffray4a34a422014-04-03 10:38:37 +0100715
Nicolas Geoffray7fb49da2014-10-06 09:12:41 +0100716 C GetRegisterAt(size_t index) const {
Nicolas Geoffray4a34a422014-04-03 10:38:37 +0100717 DCHECK_LT(index, number_of_registers_);
718 return registers_[index];
719 }
720
Nicolas Geoffray7fb49da2014-10-06 09:12:41 +0100721 F GetFpuRegisterAt(size_t index) const {
722 DCHECK_LT(index, number_of_fpu_registers_);
723 return fpu_registers_[index];
724 }
725
726 size_t GetStackOffsetOf(size_t index) const {
Nicolas Geoffray4a34a422014-04-03 10:38:37 +0100727 // We still reserve the space for parameters passed by registers.
Mathieu Chartiere401d142015-04-22 13:56:20 -0700728 // Add space for the method pointer.
Andreas Gampe542451c2016-07-26 09:02:02 -0700729 return static_cast<size_t>(pointer_size_) + index * kVRegSize;
Nicolas Geoffray4a34a422014-04-03 10:38:37 +0100730 }
731
732 private:
Nicolas Geoffray7fb49da2014-10-06 09:12:41 +0100733 const C* registers_;
Nicolas Geoffray4a34a422014-04-03 10:38:37 +0100734 const size_t number_of_registers_;
Nicolas Geoffray7fb49da2014-10-06 09:12:41 +0100735 const F* fpu_registers_;
736 const size_t number_of_fpu_registers_;
Andreas Gampe542451c2016-07-26 09:02:02 -0700737 const PointerSize pointer_size_;
Nicolas Geoffray4a34a422014-04-03 10:38:37 +0100738
739 DISALLOW_COPY_AND_ASSIGN(CallingConvention);
740};
741
Aart Bik42249c32016-01-07 15:33:50 -0800742/**
743 * A templated class SlowPathGenerator with a templated method NewSlowPath()
744 * that can be used by any code generator to share equivalent slow-paths with
745 * the objective of reducing generated code size.
746 *
747 * InstructionType: instruction that requires SlowPathCodeType
748 * SlowPathCodeType: subclass of SlowPathCode, with constructor SlowPathCodeType(InstructionType *)
749 */
750template <typename InstructionType>
751class SlowPathGenerator {
752 static_assert(std::is_base_of<HInstruction, InstructionType>::value,
753 "InstructionType is not a subclass of art::HInstruction");
754
755 public:
756 SlowPathGenerator(HGraph* graph, CodeGenerator* codegen)
757 : graph_(graph),
758 codegen_(codegen),
759 slow_path_map_(std::less<uint32_t>(), graph->GetArena()->Adapter(kArenaAllocSlowPaths)) {}
760
761 // Creates and adds a new slow-path, if needed, or returns existing one otherwise.
762 // Templating the method (rather than the whole class) on the slow-path type enables
763 // keeping this code at a generic, non architecture-specific place.
764 //
765 // NOTE: This approach assumes each InstructionType only generates one SlowPathCodeType.
766 // To relax this requirement, we would need some RTTI on the stored slow-paths,
767 // or template the class as a whole on SlowPathType.
768 template <typename SlowPathCodeType>
769 SlowPathCodeType* NewSlowPath(InstructionType* instruction) {
770 static_assert(std::is_base_of<SlowPathCode, SlowPathCodeType>::value,
771 "SlowPathCodeType is not a subclass of art::SlowPathCode");
772 static_assert(std::is_constructible<SlowPathCodeType, InstructionType*>::value,
773 "SlowPathCodeType is not constructible from InstructionType*");
774 // Iterate over potential candidates for sharing. Currently, only same-typed
775 // slow-paths with exactly the same dex-pc are viable candidates.
776 // TODO: pass dex-pc/slow-path-type to run-time to allow even more sharing?
777 const uint32_t dex_pc = instruction->GetDexPc();
778 auto iter = slow_path_map_.find(dex_pc);
779 if (iter != slow_path_map_.end()) {
780 auto candidates = iter->second;
781 for (const auto& it : candidates) {
782 InstructionType* other_instruction = it.first;
783 SlowPathCodeType* other_slow_path = down_cast<SlowPathCodeType*>(it.second);
784 // Determine if the instructions allow for slow-path sharing.
785 if (HaveSameLiveRegisters(instruction, other_instruction) &&
786 HaveSameStackMap(instruction, other_instruction)) {
787 // Can share: reuse existing one.
788 return other_slow_path;
789 }
790 }
791 } else {
792 // First time this dex-pc is seen.
793 iter = slow_path_map_.Put(dex_pc, {{}, {graph_->GetArena()->Adapter(kArenaAllocSlowPaths)}});
794 }
795 // Cannot share: create and add new slow-path for this particular dex-pc.
796 SlowPathCodeType* slow_path = new (graph_->GetArena()) SlowPathCodeType(instruction);
797 iter->second.emplace_back(std::make_pair(instruction, slow_path));
798 codegen_->AddSlowPath(slow_path);
799 return slow_path;
800 }
801
802 private:
803 // Tests if both instructions have same set of live physical registers. This ensures
804 // the slow-path has exactly the same preamble on saving these registers to stack.
805 bool HaveSameLiveRegisters(const InstructionType* i1, const InstructionType* i2) const {
806 const uint32_t core_spill = ~codegen_->GetCoreSpillMask();
807 const uint32_t fpu_spill = ~codegen_->GetFpuSpillMask();
808 RegisterSet* live1 = i1->GetLocations()->GetLiveRegisters();
809 RegisterSet* live2 = i2->GetLocations()->GetLiveRegisters();
810 return (((live1->GetCoreRegisters() & core_spill) ==
811 (live2->GetCoreRegisters() & core_spill)) &&
812 ((live1->GetFloatingPointRegisters() & fpu_spill) ==
813 (live2->GetFloatingPointRegisters() & fpu_spill)));
814 }
815
816 // Tests if both instructions have the same stack map. This ensures the interpreter
817 // will find exactly the same dex-registers at the same entries.
818 bool HaveSameStackMap(const InstructionType* i1, const InstructionType* i2) const {
819 DCHECK(i1->HasEnvironment());
820 DCHECK(i2->HasEnvironment());
821 // We conservatively test if the two instructions find exactly the same instructions
822 // and location in each dex-register. This guarantees they will have the same stack map.
823 HEnvironment* e1 = i1->GetEnvironment();
824 HEnvironment* e2 = i2->GetEnvironment();
825 if (e1->GetParent() != e2->GetParent() || e1->Size() != e2->Size()) {
826 return false;
827 }
828 for (size_t i = 0, sz = e1->Size(); i < sz; ++i) {
829 if (e1->GetInstructionAt(i) != e2->GetInstructionAt(i) ||
830 !e1->GetLocationAt(i).Equals(e2->GetLocationAt(i))) {
831 return false;
832 }
833 }
834 return true;
835 }
836
837 HGraph* const graph_;
838 CodeGenerator* const codegen_;
839
840 // Map from dex-pc to vector of already existing instruction/slow-path pairs.
841 ArenaSafeMap<uint32_t, ArenaVector<std::pair<InstructionType*, SlowPathCode*>>> slow_path_map_;
842
843 DISALLOW_COPY_AND_ASSIGN(SlowPathGenerator);
844};
845
846class InstructionCodeGenerator : public HGraphVisitor {
847 public:
848 InstructionCodeGenerator(HGraph* graph, CodeGenerator* codegen)
849 : HGraphVisitor(graph),
850 deopt_slow_paths_(graph, codegen) {}
851
852 protected:
853 // Add slow-path generator for each instruction/slow-path combination that desires sharing.
854 // TODO: under current regime, only deopt sharing make sense; extend later.
855 SlowPathGenerator<HDeoptimize> deopt_slow_paths_;
856};
857
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000858} // namespace art
859
860#endif // ART_COMPILER_OPTIMIZING_CODE_GENERATOR_H_