Nicolas Geoffray | d4dd255 | 2014-02-28 10:23:58 +0000 | [diff] [blame] | 1 | /* |
| 2 | * Copyright (C) 2014 The Android Open Source Project |
| 3 | * |
| 4 | * Licensed under the Apache License, Version 2.0 (the "License"); |
| 5 | * you may not use this file except in compliance with the License. |
| 6 | * You may obtain a copy of the License at |
| 7 | * |
| 8 | * http://www.apache.org/licenses/LICENSE-2.0 |
| 9 | * |
| 10 | * Unless required by applicable law or agreed to in writing, software |
| 11 | * distributed under the License is distributed on an "AS IS" BASIS, |
| 12 | * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| 13 | * See the License for the specific language governing permissions and |
| 14 | * limitations under the License. |
| 15 | */ |
| 16 | |
| 17 | #ifndef ART_COMPILER_OPTIMIZING_CODE_GENERATOR_H_ |
| 18 | #define ART_COMPILER_OPTIMIZING_CODE_GENERATOR_H_ |
| 19 | |
Ian Rogers | d582fa4 | 2014-11-05 23:46:43 -0800 | [diff] [blame] | 20 | #include "arch/instruction_set.h" |
Calin Juravle | 3416601 | 2014-12-19 17:22:29 +0000 | [diff] [blame] | 21 | #include "arch/instruction_set_features.h" |
Vladimir Marko | f9f6441 | 2015-09-02 14:05:49 +0100 | [diff] [blame] | 22 | #include "base/arena_containers.h" |
| 23 | #include "base/arena_object.h" |
Nicolas Geoffray | 01bc96d | 2014-04-11 17:43:50 +0100 | [diff] [blame] | 24 | #include "base/bit_field.h" |
Nicolas Geoffray | d28b969 | 2015-11-04 14:36:55 +0000 | [diff] [blame] | 25 | #include "compiled_method.h" |
Calin Juravle | cd6dffe | 2015-01-08 17:35:35 +0000 | [diff] [blame] | 26 | #include "driver/compiler_options.h" |
Nicolas Geoffray | bab4ed7 | 2014-03-11 17:53:17 +0000 | [diff] [blame] | 27 | #include "globals.h" |
Alexandre Rames | eb7b739 | 2015-06-19 14:47:01 +0100 | [diff] [blame] | 28 | #include "graph_visualizer.h" |
Nicolas Geoffray | 4e3d23a | 2014-05-22 18:32:45 +0100 | [diff] [blame] | 29 | #include "locations.h" |
Nicolas Geoffray | d4dd255 | 2014-02-28 10:23:58 +0000 | [diff] [blame] | 30 | #include "memory_region.h" |
| 31 | #include "nodes.h" |
Serban Constantinescu | ecc4366 | 2015-08-13 13:33:12 +0100 | [diff] [blame] | 32 | #include "optimizing_compiler_stats.h" |
Nicolas Geoffray | 3946844 | 2014-09-02 15:17:15 +0100 | [diff] [blame] | 33 | #include "stack_map_stream.h" |
Andreas Gampe | 85b62f2 | 2015-09-09 13:15:38 -0700 | [diff] [blame] | 34 | #include "utils/label.h" |
Nicolas Geoffray | d4dd255 | 2014-02-28 10:23:58 +0000 | [diff] [blame] | 35 | |
| 36 | namespace art { |
| 37 | |
// Binary encoding of 2^32 for type double.
static int64_t constexpr k2Pow32EncodingForDouble = INT64_C(0x41F0000000000000);
// Binary encoding of 2^31 for type double.
static int64_t constexpr k2Pow31EncodingForDouble = INT64_C(0x41E0000000000000);

// Minimum value for a primitive integer.
// Spelled as `-max - 1` because the literal 0x80000000 has an unsigned type
// whose value does not fit in int32_t; converting it relies on
// implementation-defined behavior.
static int32_t constexpr kPrimIntMin = -0x7fffffff - 1;
// Minimum value for a primitive long.
// Spelled as `-max - 1` for the same reason as kPrimIntMin: the literal
// 0x8000000000000000 is unsigned and does not fit in int64_t.
static int64_t constexpr kPrimLongMin = -INT64_C(0x7fffffffffffffff) - 1;

// Maximum value for a primitive integer.
static int32_t constexpr kPrimIntMax = 0x7fffffff;
// Maximum value for a primitive long.
static int64_t constexpr kPrimLongMax = INT64_C(0x7fffffffffffffff);
Roland Levillain | 3f8f936 | 2014-12-02 17:45:01 +0000 | [diff] [blame] | 52 | |
Nicolas Geoffray | 92a73ae | 2014-10-16 11:12:52 +0100 | [diff] [blame] | 53 | class Assembler; |
Nicolas Geoffray | e503832 | 2014-07-04 09:41:32 +0100 | [diff] [blame] | 54 | class CodeGenerator; |
Nicolas Geoffray | d28b969 | 2015-11-04 14:36:55 +0000 | [diff] [blame] | 55 | class CompilerDriver; |
Vladimir Marko | 5815501 | 2015-08-19 12:49:41 +0000 | [diff] [blame] | 56 | class LinkerPatch; |
Nicolas Geoffray | f0e3937 | 2014-11-12 17:50:07 +0000 | [diff] [blame] | 57 | class ParallelMoveResolver; |
Nicolas Geoffray | 92cf83e | 2014-03-18 17:59:20 +0000 | [diff] [blame] | 58 | |
Nicolas Geoffray | d4dd255 | 2014-02-28 10:23:58 +0000 | [diff] [blame] | 59 | class CodeAllocator { |
| 60 | public: |
Nicolas Geoffray | e503832 | 2014-07-04 09:41:32 +0100 | [diff] [blame] | 61 | CodeAllocator() {} |
| 62 | virtual ~CodeAllocator() {} |
Nicolas Geoffray | d4dd255 | 2014-02-28 10:23:58 +0000 | [diff] [blame] | 63 | |
| 64 | virtual uint8_t* Allocate(size_t size) = 0; |
| 65 | |
| 66 | private: |
| 67 | DISALLOW_COPY_AND_ASSIGN(CodeAllocator); |
| 68 | }; |
| 69 | |
Alexandre Rames | c01a664 | 2016-04-15 11:54:06 +0100 | [diff] [blame] | 70 | class SlowPathCode : public DeletableArenaObject<kArenaAllocSlowPaths> { |
Nicolas Geoffray | e503832 | 2014-07-04 09:41:32 +0100 | [diff] [blame] | 71 | public: |
David Srbecky | 9cd6d37 | 2016-02-09 15:24:47 +0000 | [diff] [blame] | 72 | explicit SlowPathCode(HInstruction* instruction) : instruction_(instruction) { |
Nicolas Geoffray | eeefa12 | 2015-03-13 18:52:59 +0000 | [diff] [blame] | 73 | for (size_t i = 0; i < kMaximumNumberOfExpectedRegisters; ++i) { |
| 74 | saved_core_stack_offsets_[i] = kRegisterNotSaved; |
| 75 | saved_fpu_stack_offsets_[i] = kRegisterNotSaved; |
| 76 | } |
| 77 | } |
| 78 | |
Nicolas Geoffray | e503832 | 2014-07-04 09:41:32 +0100 | [diff] [blame] | 79 | virtual ~SlowPathCode() {} |
| 80 | |
Nicolas Geoffray | e503832 | 2014-07-04 09:41:32 +0100 | [diff] [blame] | 81 | virtual void EmitNativeCode(CodeGenerator* codegen) = 0; |
| 82 | |
Zheng Xu | da40309 | 2015-04-24 17:35:39 +0800 | [diff] [blame] | 83 | virtual void SaveLiveRegisters(CodeGenerator* codegen, LocationSummary* locations); |
| 84 | virtual void RestoreLiveRegisters(CodeGenerator* codegen, LocationSummary* locations); |
Nicolas Geoffray | a8ac913 | 2015-03-13 16:36:36 +0000 | [diff] [blame] | 85 | |
Nicolas Geoffray | eeefa12 | 2015-03-13 18:52:59 +0000 | [diff] [blame] | 86 | bool IsCoreRegisterSaved(int reg) const { |
| 87 | return saved_core_stack_offsets_[reg] != kRegisterNotSaved; |
| 88 | } |
| 89 | |
| 90 | bool IsFpuRegisterSaved(int reg) const { |
| 91 | return saved_fpu_stack_offsets_[reg] != kRegisterNotSaved; |
| 92 | } |
| 93 | |
| 94 | uint32_t GetStackOffsetOfCoreRegister(int reg) const { |
| 95 | return saved_core_stack_offsets_[reg]; |
| 96 | } |
| 97 | |
| 98 | uint32_t GetStackOffsetOfFpuRegister(int reg) const { |
| 99 | return saved_fpu_stack_offsets_[reg]; |
| 100 | } |
| 101 | |
Alexandre Rames | 8158f28 | 2015-08-07 10:26:17 +0100 | [diff] [blame] | 102 | virtual bool IsFatal() const { return false; } |
| 103 | |
Alexandre Rames | 9931f31 | 2015-06-19 14:47:01 +0100 | [diff] [blame] | 104 | virtual const char* GetDescription() const = 0; |
| 105 | |
Andreas Gampe | 85b62f2 | 2015-09-09 13:15:38 -0700 | [diff] [blame] | 106 | Label* GetEntryLabel() { return &entry_label_; } |
| 107 | Label* GetExitLabel() { return &exit_label_; } |
| 108 | |
David Srbecky | d28f4a0 | 2016-03-14 17:14:24 +0000 | [diff] [blame] | 109 | HInstruction* GetInstruction() const { |
| 110 | return instruction_; |
| 111 | } |
| 112 | |
David Srbecky | 9cd6d37 | 2016-02-09 15:24:47 +0000 | [diff] [blame] | 113 | uint32_t GetDexPc() const { |
| 114 | return instruction_ != nullptr ? instruction_->GetDexPc() : kNoDexPc; |
| 115 | } |
| 116 | |
Zheng Xu | da40309 | 2015-04-24 17:35:39 +0800 | [diff] [blame] | 117 | protected: |
Nicolas Geoffray | eeefa12 | 2015-03-13 18:52:59 +0000 | [diff] [blame] | 118 | static constexpr size_t kMaximumNumberOfExpectedRegisters = 32; |
| 119 | static constexpr uint32_t kRegisterNotSaved = -1; |
David Srbecky | 9cd6d37 | 2016-02-09 15:24:47 +0000 | [diff] [blame] | 120 | // The instruction where this slow path is happening. |
| 121 | HInstruction* instruction_; |
Nicolas Geoffray | eeefa12 | 2015-03-13 18:52:59 +0000 | [diff] [blame] | 122 | uint32_t saved_core_stack_offsets_[kMaximumNumberOfExpectedRegisters]; |
| 123 | uint32_t saved_fpu_stack_offsets_[kMaximumNumberOfExpectedRegisters]; |
Zheng Xu | da40309 | 2015-04-24 17:35:39 +0800 | [diff] [blame] | 124 | |
| 125 | private: |
Andreas Gampe | 85b62f2 | 2015-09-09 13:15:38 -0700 | [diff] [blame] | 126 | Label entry_label_; |
| 127 | Label exit_label_; |
| 128 | |
Nicolas Geoffray | e503832 | 2014-07-04 09:41:32 +0100 | [diff] [blame] | 129 | DISALLOW_COPY_AND_ASSIGN(SlowPathCode); |
| 130 | }; |
| 131 | |
Roland Levillain | 2d27c8e | 2015-04-28 15:48:45 +0100 | [diff] [blame] | 132 | class InvokeDexCallingConventionVisitor { |
| 133 | public: |
| 134 | virtual Location GetNextLocation(Primitive::Type type) = 0; |
Nicolas Geoffray | fd88f16 | 2015-06-03 11:23:52 +0100 | [diff] [blame] | 135 | virtual Location GetReturnLocation(Primitive::Type type) const = 0; |
| 136 | virtual Location GetMethodLocation() const = 0; |
Roland Levillain | 2d27c8e | 2015-04-28 15:48:45 +0100 | [diff] [blame] | 137 | |
| 138 | protected: |
| 139 | InvokeDexCallingConventionVisitor() {} |
| 140 | virtual ~InvokeDexCallingConventionVisitor() {} |
| 141 | |
| 142 | // The current index for core registers. |
| 143 | uint32_t gp_index_ = 0u; |
| 144 | // The current index for floating-point registers. |
| 145 | uint32_t float_index_ = 0u; |
| 146 | // The current stack index. |
| 147 | uint32_t stack_index_ = 0u; |
| 148 | |
| 149 | private: |
| 150 | DISALLOW_COPY_AND_ASSIGN(InvokeDexCallingConventionVisitor); |
| 151 | }; |
| 152 | |
Calin Juravle | e460d1d | 2015-09-29 04:52:17 +0100 | [diff] [blame] | 153 | class FieldAccessCallingConvention { |
| 154 | public: |
| 155 | virtual Location GetObjectLocation() const = 0; |
| 156 | virtual Location GetFieldIndexLocation() const = 0; |
| 157 | virtual Location GetReturnLocation(Primitive::Type type) const = 0; |
| 158 | virtual Location GetSetValueLocation(Primitive::Type type, bool is_instance) const = 0; |
| 159 | virtual Location GetFpuLocation(Primitive::Type type) const = 0; |
| 160 | virtual ~FieldAccessCallingConvention() {} |
| 161 | |
| 162 | protected: |
| 163 | FieldAccessCallingConvention() {} |
| 164 | |
| 165 | private: |
| 166 | DISALLOW_COPY_AND_ASSIGN(FieldAccessCallingConvention); |
| 167 | }; |
| 168 | |
Vladimir Marko | d58b837 | 2016-04-12 18:51:43 +0100 | [diff] [blame] | 169 | class CodeGenerator : public DeletableArenaObject<kArenaAllocCodeGenerator> { |
Nicolas Geoffray | d4dd255 | 2014-02-28 10:23:58 +0000 | [diff] [blame] | 170 | public: |
David Brazdil | 58282f4 | 2016-01-14 12:45:10 +0000 | [diff] [blame] | 171 | // Compiles the graph to executable instructions. |
| 172 | void Compile(CodeAllocator* allocator); |
Vladimir Marko | d58b837 | 2016-04-12 18:51:43 +0100 | [diff] [blame] | 173 | static std::unique_ptr<CodeGenerator> Create(HGraph* graph, |
| 174 | InstructionSet instruction_set, |
| 175 | const InstructionSetFeatures& isa_features, |
| 176 | const CompilerOptions& compiler_options, |
| 177 | OptimizingCompilerStats* stats = nullptr); |
Nicolas Geoffray | 12df9eb | 2015-01-09 14:53:50 +0000 | [diff] [blame] | 178 | virtual ~CodeGenerator() {} |
Nicolas Geoffray | d4dd255 | 2014-02-28 10:23:58 +0000 | [diff] [blame] | 179 | |
Vladimir Marko | dc151b2 | 2015-10-15 18:02:30 +0100 | [diff] [blame] | 180 | // Get the graph. This is the outermost graph, never the graph of a method being inlined. |
Nicolas Geoffray | 787c307 | 2014-03-17 10:20:19 +0000 | [diff] [blame] | 181 | HGraph* GetGraph() const { return graph_; } |
Nicolas Geoffray | d4dd255 | 2014-02-28 10:23:58 +0000 | [diff] [blame] | 182 | |
Nicolas Geoffray | dc23d83 | 2015-02-16 11:15:43 +0000 | [diff] [blame] | 183 | HBasicBlock* GetNextBlockToEmit() const; |
| 184 | HBasicBlock* FirstNonEmptyBlock(HBasicBlock* block) const; |
Nicolas Geoffray | bab4ed7 | 2014-03-11 17:53:17 +0000 | [diff] [blame] | 185 | bool GoesToNextBlock(HBasicBlock* current, HBasicBlock* next) const; |
Nicolas Geoffray | d4dd255 | 2014-02-28 10:23:58 +0000 | [diff] [blame] | 186 | |
Nicolas Geoffray | 86dbb9a | 2014-06-04 11:12:39 +0100 | [diff] [blame] | 187 | size_t GetStackSlotOfParameter(HParameterValue* parameter) const { |
| 188 | // Note that this follows the current calling convention. |
| 189 | return GetFrameSize() |
Mathieu Chartier | e401d14 | 2015-04-22 13:56:20 -0700 | [diff] [blame] | 190 | + InstructionSetPointerSize(GetInstructionSet()) // Art method |
Nicolas Geoffray | e27f31a | 2014-06-12 17:53:14 +0100 | [diff] [blame] | 191 | + parameter->GetIndex() * kVRegSize; |
Nicolas Geoffray | 86dbb9a | 2014-06-04 11:12:39 +0100 | [diff] [blame] | 192 | } |
| 193 | |
Nicolas Geoffray | 92a73ae | 2014-10-16 11:12:52 +0100 | [diff] [blame] | 194 | virtual void Initialize() = 0; |
Serban Constantinescu | 32f5b4d | 2014-11-25 20:05:46 +0000 | [diff] [blame] | 195 | virtual void Finalize(CodeAllocator* allocator); |
Vladimir Marko | 5815501 | 2015-08-19 12:49:41 +0000 | [diff] [blame] | 196 | virtual void EmitLinkerPatches(ArenaVector<LinkerPatch>* linker_patches); |
Nicolas Geoffray | d4dd255 | 2014-02-28 10:23:58 +0000 | [diff] [blame] | 197 | virtual void GenerateFrameEntry() = 0; |
| 198 | virtual void GenerateFrameExit() = 0; |
Nicolas Geoffray | 92a73ae | 2014-10-16 11:12:52 +0100 | [diff] [blame] | 199 | virtual void Bind(HBasicBlock* block) = 0; |
Calin Juravle | 175dc73 | 2015-08-25 15:42:32 +0100 | [diff] [blame] | 200 | virtual void MoveConstant(Location destination, int32_t value) = 0; |
Calin Juravle | e460d1d | 2015-09-29 04:52:17 +0100 | [diff] [blame] | 201 | virtual void MoveLocation(Location dst, Location src, Primitive::Type dst_type) = 0; |
| 202 | virtual void AddLocationAsTemp(Location location, LocationSummary* locations) = 0; |
| 203 | |
Nicolas Geoffray | 787c307 | 2014-03-17 10:20:19 +0000 | [diff] [blame] | 204 | virtual Assembler* GetAssembler() = 0; |
Alexandre Rames | eb7b739 | 2015-06-19 14:47:01 +0100 | [diff] [blame] | 205 | virtual const Assembler& GetAssembler() const = 0; |
Nicolas Geoffray | 707c809 | 2014-04-04 10:50:14 +0100 | [diff] [blame] | 206 | virtual size_t GetWordSize() const = 0; |
Mark Mendell | f85a9ca | 2015-01-13 09:20:58 -0500 | [diff] [blame] | 207 | virtual size_t GetFloatingPointSpillSlotSize() const = 0; |
Alexandre Rames | c01a664 | 2016-04-15 11:54:06 +0100 | [diff] [blame] | 208 | virtual uintptr_t GetAddressOf(HBasicBlock* block) = 0; |
Nicolas Geoffray | 4c204ba | 2015-02-03 15:12:35 +0000 | [diff] [blame] | 209 | void InitializeCodeGeneration(size_t number_of_spill_slots, |
| 210 | size_t maximum_number_of_live_core_registers, |
Roland Levillain | 0d5a281 | 2015-11-13 10:07:31 +0000 | [diff] [blame] | 211 | size_t maximum_number_of_live_fpu_registers, |
Nicolas Geoffray | 4c204ba | 2015-02-03 15:12:35 +0000 | [diff] [blame] | 212 | size_t number_of_out_slots, |
Vladimir Marko | fa6b93c | 2015-09-15 10:15:55 +0100 | [diff] [blame] | 213 | const ArenaVector<HBasicBlock*>& block_order); |
Nicolas Geoffray | 787c307 | 2014-03-17 10:20:19 +0000 | [diff] [blame] | 214 | |
| 215 | uint32_t GetFrameSize() const { return frame_size_; } |
| 216 | void SetFrameSize(uint32_t size) { frame_size_ = size; } |
Nicolas Geoffray | 8ccc3f5 | 2014-03-19 10:34:11 +0000 | [diff] [blame] | 217 | uint32_t GetCoreSpillMask() const { return core_spill_mask_; } |
Nicolas Geoffray | d97dc40 | 2015-01-22 13:50:01 +0000 | [diff] [blame] | 218 | uint32_t GetFpuSpillMask() const { return fpu_spill_mask_; } |
Nicolas Geoffray | 787c307 | 2014-03-17 10:20:19 +0000 | [diff] [blame] | 219 | |
Nicolas Geoffray | 71175b7 | 2014-10-09 22:13:55 +0100 | [diff] [blame] | 220 | size_t GetNumberOfCoreRegisters() const { return number_of_core_registers_; } |
| 221 | size_t GetNumberOfFloatingPointRegisters() const { return number_of_fpu_registers_; } |
David Brazdil | 58282f4 | 2016-01-14 12:45:10 +0000 | [diff] [blame] | 222 | virtual void SetupBlockedRegisters() const = 0; |
Nicolas Geoffray | 71175b7 | 2014-10-09 22:13:55 +0100 | [diff] [blame] | 223 | |
Nicolas Geoffray | 4dee636 | 2015-01-23 18:23:14 +0000 | [diff] [blame] | 224 | virtual void ComputeSpillMask() { |
| 225 | core_spill_mask_ = allocated_registers_.GetCoreRegisters() & core_callee_save_mask_; |
| 226 | DCHECK_NE(core_spill_mask_, 0u) << "At least the return address register must be saved"; |
| 227 | fpu_spill_mask_ = allocated_registers_.GetFloatingPointRegisters() & fpu_callee_save_mask_; |
| 228 | } |
| 229 | |
| 230 | static uint32_t ComputeRegisterMask(const int* registers, size_t length) { |
| 231 | uint32_t mask = 0; |
| 232 | for (size_t i = 0, e = length; i < e; ++i) { |
| 233 | mask |= (1 << registers[i]); |
| 234 | } |
| 235 | return mask; |
| 236 | } |
| 237 | |
Nicolas Geoffray | a7062e0 | 2014-05-22 12:50:17 +0100 | [diff] [blame] | 238 | virtual void DumpCoreRegister(std::ostream& stream, int reg) const = 0; |
| 239 | virtual void DumpFloatingPointRegister(std::ostream& stream, int reg) const = 0; |
Nicolas Geoffray | 412f10c | 2014-06-19 10:00:34 +0100 | [diff] [blame] | 240 | virtual InstructionSet GetInstructionSet() const = 0; |
Calin Juravle | cd6dffe | 2015-01-08 17:35:35 +0000 | [diff] [blame] | 241 | |
| 242 | const CompilerOptions& GetCompilerOptions() const { return compiler_options_; } |
| 243 | |
Serban Constantinescu | ecc4366 | 2015-08-13 13:33:12 +0100 | [diff] [blame] | 244 | void MaybeRecordStat(MethodCompilationStat compilation_stat, size_t count = 1) const; |
| 245 | |
Nicolas Geoffray | 102cbed | 2014-10-15 18:31:05 +0100 | [diff] [blame] | 246 | // Saves the register in the stack. Returns the size taken on stack. |
| 247 | virtual size_t SaveCoreRegister(size_t stack_index, uint32_t reg_id) = 0; |
| 248 | // Restores the register from the stack. Returns the size taken on stack. |
| 249 | virtual size_t RestoreCoreRegister(size_t stack_index, uint32_t reg_id) = 0; |
Nicolas Geoffray | 234d69d | 2015-03-09 10:28:50 +0000 | [diff] [blame] | 250 | |
| 251 | virtual size_t SaveFloatingPointRegister(size_t stack_index, uint32_t reg_id) = 0; |
| 252 | virtual size_t RestoreFloatingPointRegister(size_t stack_index, uint32_t reg_id) = 0; |
| 253 | |
Nicolas Geoffray | 840e546 | 2015-01-07 16:01:24 +0000 | [diff] [blame] | 254 | virtual bool NeedsTwoRegisters(Primitive::Type type) const = 0; |
Nicolas Geoffray | 234d69d | 2015-03-09 10:28:50 +0000 | [diff] [blame] | 255 | // Returns whether we should split long moves in parallel moves. |
| 256 | virtual bool ShouldSplitLongMoves() const { return false; } |
Nicolas Geoffray | a7062e0 | 2014-05-22 12:50:17 +0100 | [diff] [blame] | 257 | |
Roland Levillain | 0d5a281 | 2015-11-13 10:07:31 +0000 | [diff] [blame] | 258 | size_t GetNumberOfCoreCalleeSaveRegisters() const { |
| 259 | return POPCOUNT(core_callee_save_mask_); |
| 260 | } |
| 261 | |
| 262 | size_t GetNumberOfCoreCallerSaveRegisters() const { |
| 263 | DCHECK_GE(GetNumberOfCoreRegisters(), GetNumberOfCoreCalleeSaveRegisters()); |
| 264 | return GetNumberOfCoreRegisters() - GetNumberOfCoreCalleeSaveRegisters(); |
| 265 | } |
| 266 | |
Nicolas Geoffray | 9889396 | 2015-01-21 12:32:32 +0000 | [diff] [blame] | 267 | bool IsCoreCalleeSaveRegister(int reg) const { |
| 268 | return (core_callee_save_mask_ & (1 << reg)) != 0; |
| 269 | } |
| 270 | |
| 271 | bool IsFloatingPointCalleeSaveRegister(int reg) const { |
| 272 | return (fpu_callee_save_mask_ & (1 << reg)) != 0; |
| 273 | } |
| 274 | |
Yevgeny Rouban | 2a7c1ef | 2015-07-22 18:36:24 +0600 | [diff] [blame] | 275 | // Record native to dex mapping for a suspend point. Required by runtime. |
Nicolas Geoffray | eeefa12 | 2015-03-13 18:52:59 +0000 | [diff] [blame] | 276 | void RecordPcInfo(HInstruction* instruction, uint32_t dex_pc, SlowPathCode* slow_path = nullptr); |
David Srbecky | b7070a2 | 2016-01-08 18:13:53 +0000 | [diff] [blame] | 277 | // Check whether we have already recorded mapping at this PC. |
| 278 | bool HasStackMapAtCurrentPc(); |
David Srbecky | c7098ff | 2016-02-09 14:30:11 +0000 | [diff] [blame] | 279 | // Record extra stack maps if we support native debugging. |
David Srbecky | d28f4a0 | 2016-03-14 17:14:24 +0000 | [diff] [blame] | 280 | void MaybeRecordNativeDebugInfo(HInstruction* instruction, |
| 281 | uint32_t dex_pc, |
| 282 | SlowPathCode* slow_path = nullptr); |
Yevgeny Rouban | 2a7c1ef | 2015-07-22 18:36:24 +0600 | [diff] [blame] | 283 | |
Calin Juravle | 77520bc | 2015-01-12 18:45:46 +0000 | [diff] [blame] | 284 | bool CanMoveNullCheckToUser(HNullCheck* null_check); |
| 285 | void MaybeRecordImplicitNullCheck(HInstruction* instruction); |
Calin Juravle | 2ae4818 | 2016-03-16 14:05:09 +0000 | [diff] [blame] | 286 | void GenerateNullCheck(HNullCheck* null_check); |
| 287 | virtual void GenerateImplicitNullCheck(HNullCheck* null_check) = 0; |
| 288 | virtual void GenerateExplicitNullCheck(HNullCheck* null_check) = 0; |
Nicolas Geoffray | 8ccc3f5 | 2014-03-19 10:34:11 +0000 | [diff] [blame] | 289 | |
David Brazdil | 77a48ae | 2015-09-15 12:34:04 +0000 | [diff] [blame] | 290 | // Records a stack map which the runtime might use to set catch phi values |
| 291 | // during exception delivery. |
| 292 | // TODO: Replace with a catch-entering instruction that records the environment. |
| 293 | void RecordCatchBlockInfo(); |
| 294 | |
| 295 | // Returns true if implicit null checks are allowed in the compiler options |
| 296 | // and if the null check is not inside a try block. We currently cannot do |
| 297 | // implicit null checks in that case because we need the NullCheckSlowPath to |
| 298 | // save live registers, which may be needed by the runtime to set catch phis. |
| 299 | bool IsImplicitNullCheckAllowed(HNullCheck* null_check) const; |
| 300 | |
  // Appends `slow_path` to `slow_paths_`, wrapped in a `std::unique_ptr`, so
  // the container takes ownership of the pointer passed in.
  // TODO: Avoid creating the `std::unique_ptr` here.
  void AddSlowPath(SlowPathCode* slow_path) {
    slow_paths_.push_back(std::unique_ptr<SlowPathCode>(slow_path));
  }
| 305 | |
Nicolas Geoffray | b331feb | 2016-02-05 16:51:53 +0000 | [diff] [blame] | 306 | void BuildStackMaps(MemoryRegion region, const DexFile::CodeItem& code_item); |
Nicolas Geoffray | d28b969 | 2015-11-04 14:36:55 +0000 | [diff] [blame] | 307 | size_t ComputeStackMapsSize(); |
Nicolas Geoffray | 787c307 | 2014-03-17 10:20:19 +0000 | [diff] [blame] | 308 | |
Nicolas Geoffray | f12feb8 | 2014-07-17 18:32:41 +0100 | [diff] [blame] | 309 | bool IsLeafMethod() const { |
| 310 | return is_leaf_; |
| 311 | } |
| 312 | |
| 313 | void MarkNotLeaf() { |
| 314 | is_leaf_ = false; |
Nicolas Geoffray | c0572a4 | 2015-02-06 14:35:25 +0000 | [diff] [blame] | 315 | requires_current_method_ = true; |
| 316 | } |
| 317 | |
| 318 | void SetRequiresCurrentMethod() { |
| 319 | requires_current_method_ = true; |
| 320 | } |
| 321 | |
| 322 | bool RequiresCurrentMethod() const { |
| 323 | return requires_current_method_; |
Nicolas Geoffray | f12feb8 | 2014-07-17 18:32:41 +0100 | [diff] [blame] | 324 | } |
| 325 | |
Nicolas Geoffray | 3c04974 | 2014-09-24 18:10:46 +0100 | [diff] [blame] | 326 | // Clears the spill slots taken by loop phis in the `LocationSummary` of the |
| 327 | // suspend check. This is called when the code generator generates code |
| 328 | // for the suspend check at the back edge (instead of where the suspend check |
| 329 | // is, which is the loop entry). At this point, the spill slots for the phis |
| 330 | // have not been written to. |
| 331 | void ClearSpillSlotsFromLoopPhisInStackMap(HSuspendCheck* suspend_check) const; |
| 332 | |
Nicolas Geoffray | 71175b7 | 2014-10-09 22:13:55 +0100 | [diff] [blame] | 333 | bool* GetBlockedCoreRegisters() const { return blocked_core_registers_; } |
Nicolas Geoffray | 102cbed | 2014-10-15 18:31:05 +0100 | [diff] [blame] | 334 | bool* GetBlockedFloatingPointRegisters() const { return blocked_fpu_registers_; } |
Nicolas Geoffray | 71175b7 | 2014-10-09 22:13:55 +0100 | [diff] [blame] | 335 | |
Nicolas Geoffray | 19a19cf | 2014-10-22 16:07:05 +0100 | [diff] [blame] | 336 | // Helper that returns the pointer offset of an index in an object array. |
| 337 | // Note: this method assumes we always have the same pointer size, regardless |
| 338 | // of the architecture. |
| 339 | static size_t GetCacheOffset(uint32_t index); |
Mathieu Chartier | e401d14 | 2015-04-22 13:56:20 -0700 | [diff] [blame] | 340 | // Pointer variant for ArtMethod and ArtField arrays. |
| 341 | size_t GetCachePointerOffset(uint32_t index); |
Nicolas Geoffray | 19a19cf | 2014-10-22 16:07:05 +0100 | [diff] [blame] | 342 | |
Vladimir Marko | dce016e | 2016-04-28 13:10:02 +0100 | [diff] [blame] | 343 | // Helper that returns the offset of the array's length field. |
| 344 | // Note: Besides the normal arrays, we also use the HArrayLength for |
| 345 | // accessing the String's `count` field in String intrinsics. |
| 346 | static uint32_t GetArrayLengthOffset(HArrayLength* array_length); |
| 347 | |
Vladimir Marko | 87f3fcb | 2016-04-28 15:52:11 +0100 | [diff] [blame] | 348 | // Helper that returns the offset of the array's data. |
| 349 | // Note: Besides the normal arrays, we also use the HArrayGet for |
| 350 | // accessing the String's `value` field in String intrinsics. |
| 351 | static uint32_t GetArrayDataOffset(HArrayGet* array_get); |
| 352 | |
Roland Levillain | 02b7580 | 2016-07-13 11:54:35 +0100 | [diff] [blame^] | 353 | // Return the entry point offset for ReadBarrierMarkRegX, where X is `reg`. |
| 354 | template <size_t pointer_size> |
| 355 | static int32_t GetReadBarrierMarkEntryPointsOffset(size_t reg) { |
| 356 | DCHECK_LT(reg, 32u); |
| 357 | // The ReadBarrierMarkRegX entry points are ordered by increasing |
| 358 | // register number in Thread::tls_Ptr_.quick_entrypoints. |
| 359 | return QUICK_ENTRYPOINT_OFFSET(pointer_size, pReadBarrierMarkReg00).Int32Value() |
| 360 | + pointer_size * reg; |
| 361 | } |
| 362 | |
Nicolas Geoffray | 9021825 | 2015-04-15 11:56:51 +0100 | [diff] [blame] | 363 | void EmitParallelMoves(Location from1, |
| 364 | Location to1, |
| 365 | Primitive::Type type1, |
| 366 | Location from2, |
| 367 | Location to2, |
| 368 | Primitive::Type type2); |
Nicolas Geoffray | f0e3937 | 2014-11-12 17:50:07 +0000 | [diff] [blame] | 369 | |
Nicolas Geoffray | af07bc1 | 2014-11-12 18:08:09 +0000 | [diff] [blame] | 370 | static bool StoreNeedsWriteBarrier(Primitive::Type type, HInstruction* value) { |
David Brazdil | 522e224 | 2015-03-17 18:48:28 +0000 | [diff] [blame] | 371 | // Check that null value is not represented as an integer constant. |
| 372 | DCHECK(type != Primitive::kPrimNot || !value->IsIntConstant()); |
| 373 | return type == Primitive::kPrimNot && !value->IsNullConstant(); |
Nicolas Geoffray | af07bc1 | 2014-11-12 18:08:09 +0000 | [diff] [blame] | 374 | } |
| 375 | |
Alexandre Rames | 78e3ef6 | 2015-08-12 13:43:29 +0100 | [diff] [blame] | 376 | void ValidateInvokeRuntime(HInstruction* instruction, SlowPathCode* slow_path); |
| 377 | |
Nicolas Geoffray | 9889396 | 2015-01-21 12:32:32 +0000 | [diff] [blame] | 378 | void AddAllocatedRegister(Location location) { |
| 379 | allocated_registers_.Add(location); |
| 380 | } |
| 381 | |
Nicolas Geoffray | 45b83af | 2015-07-06 15:12:53 +0000 | [diff] [blame] | 382 | bool HasAllocatedRegister(bool is_core, int reg) const { |
| 383 | return is_core |
| 384 | ? allocated_registers_.ContainsCoreRegister(reg) |
| 385 | : allocated_registers_.ContainsFloatingPointRegister(reg); |
| 386 | } |
| 387 | |
Nicolas Geoffray | c0572a4 | 2015-02-06 14:35:25 +0000 | [diff] [blame] | 388 | void AllocateLocations(HInstruction* instruction); |
| 389 | |
Roland Levillain | aa9b7c4 | 2015-02-17 15:40:09 +0000 | [diff] [blame] | 390 | // Tells whether the stack frame of the compiled method is |
| 391 | // considered "empty", that is either actually having a size of zero, |
| 392 | // or just containing the saved return address register. |
| 393 | bool HasEmptyFrame() const { |
| 394 | return GetFrameSize() == (CallPushesPC() ? GetWordSize() : 0); |
| 395 | } |
| 396 | |
Nicolas Geoffray | d6138ef | 2015-02-18 14:48:53 +0000 | [diff] [blame] | 397 | static int32_t GetInt32ValueOf(HConstant* constant) { |
| 398 | if (constant->IsIntConstant()) { |
| 399 | return constant->AsIntConstant()->GetValue(); |
| 400 | } else if (constant->IsNullConstant()) { |
| 401 | return 0; |
| 402 | } else { |
| 403 | DCHECK(constant->IsFloatConstant()); |
Roland Levillain | da4d79b | 2015-03-24 14:36:11 +0000 | [diff] [blame] | 404 | return bit_cast<int32_t, float>(constant->AsFloatConstant()->GetValue()); |
Nicolas Geoffray | d6138ef | 2015-02-18 14:48:53 +0000 | [diff] [blame] | 405 | } |
| 406 | } |
| 407 | |
| 408 | static int64_t GetInt64ValueOf(HConstant* constant) { |
| 409 | if (constant->IsIntConstant()) { |
| 410 | return constant->AsIntConstant()->GetValue(); |
| 411 | } else if (constant->IsNullConstant()) { |
| 412 | return 0; |
| 413 | } else if (constant->IsFloatConstant()) { |
Roland Levillain | da4d79b | 2015-03-24 14:36:11 +0000 | [diff] [blame] | 414 | return bit_cast<int32_t, float>(constant->AsFloatConstant()->GetValue()); |
Nicolas Geoffray | d6138ef | 2015-02-18 14:48:53 +0000 | [diff] [blame] | 415 | } else if (constant->IsLongConstant()) { |
| 416 | return constant->AsLongConstant()->GetValue(); |
| 417 | } else { |
| 418 | DCHECK(constant->IsDoubleConstant()); |
Roland Levillain | da4d79b | 2015-03-24 14:36:11 +0000 | [diff] [blame] | 419 | return bit_cast<int64_t, double>(constant->AsDoubleConstant()->GetValue()); |
Nicolas Geoffray | d6138ef | 2015-02-18 14:48:53 +0000 | [diff] [blame] | 420 | } |
| 421 | } |
| 422 | |
Nicolas Geoffray | a8ac913 | 2015-03-13 16:36:36 +0000 | [diff] [blame] | 423 | size_t GetFirstRegisterSlotInSlowPath() const { |
| 424 | return first_register_slot_in_slow_path_; |
| 425 | } |
| 426 | |
| 427 | uint32_t FrameEntrySpillSize() const { |
| 428 | return GetFpuSpillSize() + GetCoreSpillSize(); |
| 429 | } |
| 430 | |
Roland Levillain | ec525fc | 2015-04-28 15:50:20 +0100 | [diff] [blame] | 431 | virtual ParallelMoveResolver* GetMoveResolver() = 0; |
Nicolas Geoffray | a8ac913 | 2015-03-13 16:36:36 +0000 | [diff] [blame] | 432 | |
Nicolas Geoffray | fd88f16 | 2015-06-03 11:23:52 +0100 | [diff] [blame] | 433 | static void CreateCommonInvokeLocationSummary( |
| 434 | HInvoke* invoke, InvokeDexCallingConventionVisitor* visitor); |
| 435 | |
Calin Juravle | 175dc73 | 2015-08-25 15:42:32 +0100 | [diff] [blame] | 436 | void GenerateInvokeUnresolvedRuntimeCall(HInvokeUnresolved* invoke); |
| 437 | |
Calin Juravle | e460d1d | 2015-09-29 04:52:17 +0100 | [diff] [blame] | 438 | void CreateUnresolvedFieldLocationSummary( |
| 439 | HInstruction* field_access, |
| 440 | Primitive::Type field_type, |
| 441 | const FieldAccessCallingConvention& calling_convention); |
| 442 | |
| 443 | void GenerateUnresolvedFieldAccess( |
| 444 | HInstruction* field_access, |
| 445 | Primitive::Type field_type, |
| 446 | uint32_t field_index, |
| 447 | uint32_t dex_pc, |
| 448 | const FieldAccessCallingConvention& calling_convention); |
| 449 | |
Calin Juravle | 98893e1 | 2015-10-02 21:05:03 +0100 | [diff] [blame] | 450 | // TODO: This overlaps a bit with MoveFromReturnRegister. Refactor for a better design. |
| 451 | static void CreateLoadClassLocationSummary(HLoadClass* cls, |
| 452 | Location runtime_type_index_location, |
Roland Levillain | 0d5a281 | 2015-11-13 10:07:31 +0000 | [diff] [blame] | 453 | Location runtime_return_location, |
| 454 | bool code_generator_supports_read_barrier = false); |
Calin Juravle | 98893e1 | 2015-10-02 21:05:03 +0100 | [diff] [blame] | 455 | |
Nicolas Geoffray | 5bd05a5 | 2015-10-13 09:48:30 +0100 | [diff] [blame] | 456 | static void CreateSystemArrayCopyLocationSummary(HInvoke* invoke); |
| 457 | |
Alexandre Rames | eb7b739 | 2015-06-19 14:47:01 +0100 | [diff] [blame] | 458 | void SetDisassemblyInformation(DisassemblyInformation* info) { disasm_info_ = info; } |
| 459 | DisassemblyInformation* GetDisassemblyInformation() const { return disasm_info_; } |
| 460 | |
Calin Juravle | 175dc73 | 2015-08-25 15:42:32 +0100 | [diff] [blame] | 461 | virtual void InvokeRuntime(QuickEntrypointEnum entrypoint, |
| 462 | HInstruction* instruction, |
| 463 | uint32_t dex_pc, |
| 464 | SlowPathCode* slow_path) = 0; |
| 465 | |
Vladimir Marko | cac5a7e | 2016-02-22 10:39:50 +0000 | [diff] [blame] | 466 | // Check if the desired_string_load_kind is supported. If it is, return it, |
Vladimir Marko | dbb7f5b | 2016-03-30 13:23:58 +0100 | [diff] [blame] | 467 | // otherwise return a fall-back kind that should be used instead. |
Vladimir Marko | cac5a7e | 2016-02-22 10:39:50 +0000 | [diff] [blame] | 468 | virtual HLoadString::LoadKind GetSupportedLoadStringKind( |
| 469 | HLoadString::LoadKind desired_string_load_kind) = 0; |
| 470 | |
Vladimir Marko | dbb7f5b | 2016-03-30 13:23:58 +0100 | [diff] [blame] | 471 | // Check if the desired_class_load_kind is supported. If it is, return it, |
| 472 | // otherwise return a fall-back kind that should be used instead. |
| 473 | virtual HLoadClass::LoadKind GetSupportedLoadClassKind( |
| 474 | HLoadClass::LoadKind desired_class_load_kind) = 0; |
| 475 | |
Vladimir Marko | dc151b2 | 2015-10-15 18:02:30 +0100 | [diff] [blame] | 476 | // Check if the desired_dispatch_info is supported. If it is, return it, |
| 477 | // otherwise return a fall-back info that should be used instead. |
| 478 | virtual HInvokeStaticOrDirect::DispatchInfo GetSupportedInvokeStaticOrDirectDispatch( |
| 479 | const HInvokeStaticOrDirect::DispatchInfo& desired_dispatch_info, |
| 480 | MethodReference target_method) = 0; |
| 481 | |
Andreas Gampe | 85b62f2 | 2015-09-09 13:15:38 -0700 | [diff] [blame] | 482 | // Generate a call to a static or direct method. |
| 483 | virtual void GenerateStaticOrDirectCall(HInvokeStaticOrDirect* invoke, Location temp) = 0; |
| 484 | // Generate a call to a virtual method. |
| 485 | virtual void GenerateVirtualCall(HInvokeVirtual* invoke, Location temp) = 0; |
| 486 | |
| 487 | // Copy the result of a call into the given target. |
| 488 | virtual void MoveFromReturnRegister(Location trg, Primitive::Type type) = 0; |
| 489 | |
David Srbecky | c7098ff | 2016-02-09 14:30:11 +0000 | [diff] [blame] | 490 | virtual void GenerateNop() = 0; |
| 491 | |
Serguei Katkov | 288c7a8 | 2016-05-16 11:53:15 +0600 | [diff] [blame] | 492 | uint32_t GetReferenceSlowFlagOffset() const; |
| 493 | uint32_t GetReferenceDisableFlagOffset() const; |
| 494 | |
Nicolas Geoffray | 787c307 | 2014-03-17 10:20:19 +0000 | [diff] [blame] | 495 | protected: |
Vladimir Marko | 5815501 | 2015-08-19 12:49:41 +0000 | [diff] [blame] | 496 | // Method patch info used for recording locations of required linker patches and |
| 497 | // target methods. The target method can be used for various purposes, whether for |
| 498 | // patching the address of the method or the code pointer or a PC-relative call. |
| 499 | template <typename LabelType> |
| 500 | struct MethodPatchInfo { |
| 501 | explicit MethodPatchInfo(MethodReference m) : target_method(m), label() { } |
| 502 | |
| 503 | MethodReference target_method; |
| 504 | LabelType label; |
| 505 | }; |
| 506 | |
Vladimir Marko | cac5a7e | 2016-02-22 10:39:50 +0000 | [diff] [blame] | 507 | // String patch info used for recording locations of required linker patches and |
| 508 | // target strings. The actual string address can be absolute or PC-relative. |
| 509 | template <typename LabelType> |
| 510 | struct StringPatchInfo { |
| 511 | StringPatchInfo(const DexFile& df, uint32_t index) |
| 512 | : dex_file(df), string_index(index), label() { } |
| 513 | |
| 514 | const DexFile& dex_file; |
| 515 | uint32_t string_index; |
| 516 | LabelType label; |
| 517 | }; |
| 518 | |
Vladimir Marko | dbb7f5b | 2016-03-30 13:23:58 +0100 | [diff] [blame] | 519 | // Type patch info used for recording locations of required linker patches and |
| 520 | // target types. The actual type address can be absolute or PC-relative. |
| 521 | // TODO: Consider merging with MethodPatchInfo and StringPatchInfo - all these |
| 522 | // classes contain the dex file, some index and the label. |
| 523 | template <typename LabelType> |
| 524 | struct TypePatchInfo { |
| 525 | TypePatchInfo(const DexFile& df, uint32_t index) |
| 526 | : dex_file(df), type_index(index), label() { } |
| 527 | |
| 528 | const DexFile& dex_file; |
| 529 | uint32_t type_index; |
| 530 | LabelType label; |
| 531 | }; |
| 532 | |
Nicolas Geoffray | 71175b7 | 2014-10-09 22:13:55 +0100 | [diff] [blame] | 533 | CodeGenerator(HGraph* graph, |
| 534 | size_t number_of_core_registers, |
| 535 | size_t number_of_fpu_registers, |
Calin Juravle | cd6dffe | 2015-01-08 17:35:35 +0000 | [diff] [blame] | 536 | size_t number_of_register_pairs, |
Nicolas Geoffray | 9889396 | 2015-01-21 12:32:32 +0000 | [diff] [blame] | 537 | uint32_t core_callee_save_mask, |
| 538 | uint32_t fpu_callee_save_mask, |
Serban Constantinescu | ecc4366 | 2015-08-13 13:33:12 +0100 | [diff] [blame] | 539 | const CompilerOptions& compiler_options, |
| 540 | OptimizingCompilerStats* stats) |
Nicolas Geoffray | c0572a4 | 2015-02-06 14:35:25 +0000 | [diff] [blame] | 541 | : frame_size_(0), |
Nicolas Geoffray | 4361bef | 2014-08-20 04:59:12 +0100 | [diff] [blame] | 542 | core_spill_mask_(0), |
Nicolas Geoffray | d97dc40 | 2015-01-22 13:50:01 +0000 | [diff] [blame] | 543 | fpu_spill_mask_(0), |
Nicolas Geoffray | 3bca0df | 2014-09-19 11:01:00 +0100 | [diff] [blame] | 544 | first_register_slot_in_slow_path_(0), |
Vladimir Marko | 5233f93 | 2015-09-29 19:01:15 +0100 | [diff] [blame] | 545 | blocked_core_registers_(graph->GetArena()->AllocArray<bool>(number_of_core_registers, |
| 546 | kArenaAllocCodeGenerator)), |
| 547 | blocked_fpu_registers_(graph->GetArena()->AllocArray<bool>(number_of_fpu_registers, |
| 548 | kArenaAllocCodeGenerator)), |
| 549 | blocked_register_pairs_(graph->GetArena()->AllocArray<bool>(number_of_register_pairs, |
| 550 | kArenaAllocCodeGenerator)), |
Nicolas Geoffray | 71175b7 | 2014-10-09 22:13:55 +0100 | [diff] [blame] | 551 | number_of_core_registers_(number_of_core_registers), |
| 552 | number_of_fpu_registers_(number_of_fpu_registers), |
| 553 | number_of_register_pairs_(number_of_register_pairs), |
Nicolas Geoffray | 9889396 | 2015-01-21 12:32:32 +0000 | [diff] [blame] | 554 | core_callee_save_mask_(core_callee_save_mask), |
| 555 | fpu_callee_save_mask_(fpu_callee_save_mask), |
Vladimir Marko | cf93a5c | 2015-06-16 11:33:24 +0000 | [diff] [blame] | 556 | stack_map_stream_(graph->GetArena()), |
| 557 | block_order_(nullptr), |
Alexandre Rames | eb7b739 | 2015-06-19 14:47:01 +0100 | [diff] [blame] | 558 | disasm_info_(nullptr), |
Serban Constantinescu | ecc4366 | 2015-08-13 13:33:12 +0100 | [diff] [blame] | 559 | stats_(stats), |
Nicolas Geoffray | 787c307 | 2014-03-17 10:20:19 +0000 | [diff] [blame] | 560 | graph_(graph), |
Calin Juravle | cd6dffe | 2015-01-08 17:35:35 +0000 | [diff] [blame] | 561 | compiler_options_(compiler_options), |
Vladimir Marko | 225b646 | 2015-09-28 12:17:40 +0100 | [diff] [blame] | 562 | slow_paths_(graph->GetArena()->Adapter(kArenaAllocCodeGenerator)), |
Vladimir Marko | 0f7dca4 | 2015-11-02 14:36:43 +0000 | [diff] [blame] | 563 | current_slow_path_(nullptr), |
Nicolas Geoffray | 4c204ba | 2015-02-03 15:12:35 +0000 | [diff] [blame] | 564 | current_block_index_(0), |
Nicolas Geoffray | 3946844 | 2014-09-02 15:17:15 +0100 | [diff] [blame] | 565 | is_leaf_(true), |
Vladimir Marko | 225b646 | 2015-09-28 12:17:40 +0100 | [diff] [blame] | 566 | requires_current_method_(false) { |
| 567 | slow_paths_.reserve(8); |
| 568 | } |
Nicolas Geoffray | d4dd255 | 2014-02-28 10:23:58 +0000 | [diff] [blame] | 569 | |
Nicolas Geoffray | c0572a4 | 2015-02-06 14:35:25 +0000 | [diff] [blame] | 570 | virtual HGraphVisitor* GetLocationBuilder() = 0; |
| 571 | virtual HGraphVisitor* GetInstructionVisitor() = 0; |
Nicolas Geoffray | f0e3937 | 2014-11-12 17:50:07 +0000 | [diff] [blame] | 572 | |
Nicolas Geoffray | d97dc40 | 2015-01-22 13:50:01 +0000 | [diff] [blame] | 573 | // Returns the location of the first spilled entry for floating point registers, |
| 574 | // relative to the stack pointer. |
| 575 | uint32_t GetFpuSpillStart() const { |
Nicolas Geoffray | d97dc40 | 2015-01-22 13:50:01 +0000 | [diff] [blame] | 576 | return GetFrameSize() - FrameEntrySpillSize(); |
| 577 | } |
| 578 | |
| 579 | uint32_t GetFpuSpillSize() const { |
| 580 | return POPCOUNT(fpu_spill_mask_) * GetFloatingPointSpillSlotSize(); |
| 581 | } |
| 582 | |
| 583 | uint32_t GetCoreSpillSize() const { |
| 584 | return POPCOUNT(core_spill_mask_) * GetWordSize(); |
| 585 | } |
| 586 | |
Nicolas Geoffray | c0572a4 | 2015-02-06 14:35:25 +0000 | [diff] [blame] | 587 | bool HasAllocatedCalleeSaveRegisters() const { |
| 588 | // We check the core registers against 1 because it always comprises the return PC. |
| 589 | return (POPCOUNT(allocated_registers_.GetCoreRegisters() & core_callee_save_mask_) != 1) |
| 590 | || (POPCOUNT(allocated_registers_.GetFloatingPointRegisters() & fpu_callee_save_mask_) != 0); |
| 591 | } |
| 592 | |
| 593 | bool CallPushesPC() const { |
| 594 | InstructionSet instruction_set = GetInstructionSet(); |
| 595 | return instruction_set == kX86 || instruction_set == kX86_64; |
| 596 | } |
| 597 | |
Vladimir Marko | 225b646 | 2015-09-28 12:17:40 +0100 | [diff] [blame] | 598 | // Arm64 has its own type for a label, so we need to templatize these methods |
Nicolas Geoffray | dc23d83 | 2015-02-16 11:15:43 +0000 | [diff] [blame] | 599 | // to share the logic. |
Vladimir Marko | 225b646 | 2015-09-28 12:17:40 +0100 | [diff] [blame] | 600 | |
| 601 | template <typename LabelType> |
| 602 | LabelType* CommonInitializeLabels() { |
Vladimir Marko | b95fb77 | 2015-09-30 13:32:31 +0100 | [diff] [blame] | 603 | // We use raw array allocations instead of ArenaVector<> because Labels are |
| 604 | // non-constructible and non-movable and as such cannot be held in a vector. |
Vladimir Marko | 225b646 | 2015-09-28 12:17:40 +0100 | [diff] [blame] | 605 | size_t size = GetGraph()->GetBlocks().size(); |
| 606 | LabelType* labels = GetGraph()->GetArena()->AllocArray<LabelType>(size, |
| 607 | kArenaAllocCodeGenerator); |
| 608 | for (size_t i = 0; i != size; ++i) { |
| 609 | new(labels + i) LabelType(); |
| 610 | } |
| 611 | return labels; |
| 612 | } |
| 613 | |
Vladimir Marko | 5815501 | 2015-08-19 12:49:41 +0000 | [diff] [blame] | 614 | template <typename LabelType> |
| 615 | LabelType* CommonGetLabelOf(LabelType* raw_pointer_to_labels_array, HBasicBlock* block) const { |
Nicolas Geoffray | dc23d83 | 2015-02-16 11:15:43 +0000 | [diff] [blame] | 616 | block = FirstNonEmptyBlock(block); |
| 617 | return raw_pointer_to_labels_array + block->GetBlockId(); |
| 618 | } |
| 619 | |
Vladimir Marko | 0f7dca4 | 2015-11-02 14:36:43 +0000 | [diff] [blame] | 620 | SlowPathCode* GetCurrentSlowPath() { |
| 621 | return current_slow_path_; |
| 622 | } |
| 623 | |
Nicolas Geoffray | 8ccc3f5 | 2014-03-19 10:34:11 +0000 | [diff] [blame] | 624 | // Frame size required for this method. |
| 625 | uint32_t frame_size_; |
| 626 | uint32_t core_spill_mask_; |
Nicolas Geoffray | d97dc40 | 2015-01-22 13:50:01 +0000 | [diff] [blame] | 627 | uint32_t fpu_spill_mask_; |
Nicolas Geoffray | 3bca0df | 2014-09-19 11:01:00 +0100 | [diff] [blame] | 628 | uint32_t first_register_slot_in_slow_path_; |
Nicolas Geoffray | 8ccc3f5 | 2014-03-19 10:34:11 +0000 | [diff] [blame] | 629 | |
Nicolas Geoffray | 9889396 | 2015-01-21 12:32:32 +0000 | [diff] [blame] | 630 | // Registers that were allocated during linear scan. |
| 631 | RegisterSet allocated_registers_; |
| 632 | |
Nicolas Geoffray | 71175b7 | 2014-10-09 22:13:55 +0100 | [diff] [blame] | 633 | // Arrays used when doing register allocation to know which |
| 634 | // registers we can allocate. `SetupBlockedRegisters` updates the |
| 635 | // arrays. |
| 636 | bool* const blocked_core_registers_; |
| 637 | bool* const blocked_fpu_registers_; |
| 638 | bool* const blocked_register_pairs_; |
| 639 | size_t number_of_core_registers_; |
| 640 | size_t number_of_fpu_registers_; |
| 641 | size_t number_of_register_pairs_; |
Nicolas Geoffray | 9889396 | 2015-01-21 12:32:32 +0000 | [diff] [blame] | 642 | const uint32_t core_callee_save_mask_; |
| 643 | const uint32_t fpu_callee_save_mask_; |
Nicolas Geoffray | 71175b7 | 2014-10-09 22:13:55 +0100 | [diff] [blame] | 644 | |
Vladimir Marko | cf93a5c | 2015-06-16 11:33:24 +0000 | [diff] [blame] | 645 | StackMapStream stack_map_stream_; |
| 646 | |
| 647 | // The order to use for code generation. |
Vladimir Marko | fa6b93c | 2015-09-15 10:15:55 +0100 | [diff] [blame] | 648 | const ArenaVector<HBasicBlock*>* block_order_; |
Vladimir Marko | cf93a5c | 2015-06-16 11:33:24 +0000 | [diff] [blame] | 649 | |
Alexandre Rames | eb7b739 | 2015-06-19 14:47:01 +0100 | [diff] [blame] | 650 | DisassemblyInformation* disasm_info_; |
| 651 | |
Nicolas Geoffray | bab4ed7 | 2014-03-11 17:53:17 +0000 | [diff] [blame] | 652 | private: |
Nicolas Geoffray | 3bca0df | 2014-09-19 11:01:00 +0100 | [diff] [blame] | 653 | size_t GetStackOffsetOfSavedRegister(size_t index); |
Alexandre Rames | eb7b739 | 2015-06-19 14:47:01 +0100 | [diff] [blame] | 654 | void GenerateSlowPaths(); |
Mark Mendell | 5f87418 | 2015-03-04 15:42:45 -0500 | [diff] [blame] | 655 | void BlockIfInRegister(Location location, bool is_out = false) const; |
Nicolas Geoffray | b1d0f3f | 2015-05-14 12:41:51 +0100 | [diff] [blame] | 656 | void EmitEnvironment(HEnvironment* environment, SlowPathCode* slow_path); |
Nicolas Geoffray | d4dd255 | 2014-02-28 10:23:58 +0000 | [diff] [blame] | 657 | |
Serban Constantinescu | ecc4366 | 2015-08-13 13:33:12 +0100 | [diff] [blame] | 658 | OptimizingCompilerStats* stats_; |
| 659 | |
Nicolas Geoffray | 787c307 | 2014-03-17 10:20:19 +0000 | [diff] [blame] | 660 | HGraph* const graph_; |
Calin Juravle | cd6dffe | 2015-01-08 17:35:35 +0000 | [diff] [blame] | 661 | const CompilerOptions& compiler_options_; |
Nicolas Geoffray | d4dd255 | 2014-02-28 10:23:58 +0000 | [diff] [blame] | 662 | |
Alexandre Rames | c01a664 | 2016-04-15 11:54:06 +0100 | [diff] [blame] | 663 | ArenaVector<std::unique_ptr<SlowPathCode>> slow_paths_; |
Nicolas Geoffray | d4dd255 | 2014-02-28 10:23:58 +0000 | [diff] [blame] | 664 | |
Aart Bik | 42249c3 | 2016-01-07 15:33:50 -0800 | [diff] [blame] | 665 | // The current slow-path that we're generating code for. |
Vladimir Marko | 0f7dca4 | 2015-11-02 14:36:43 +0000 | [diff] [blame] | 666 | SlowPathCode* current_slow_path_; |
| 667 | |
Nicolas Geoffray | 4c204ba | 2015-02-03 15:12:35 +0000 | [diff] [blame] | 668 | // The current block index in `block_order_` of the block |
| 669 | // we are generating code for. |
| 670 | size_t current_block_index_; |
| 671 | |
Nicolas Geoffray | c0572a4 | 2015-02-06 14:35:25 +0000 | [diff] [blame] | 672 | // Whether the method is a leaf method. |
Nicolas Geoffray | f12feb8 | 2014-07-17 18:32:41 +0100 | [diff] [blame] | 673 | bool is_leaf_; |
| 674 | |
Nicolas Geoffray | c0572a4 | 2015-02-06 14:35:25 +0000 | [diff] [blame] | 675 | // Whether an instruction in the graph accesses the current method. |
| 676 | bool requires_current_method_; |
| 677 | |
David Srbecky | c6b4dd8 | 2015-04-07 20:32:43 +0100 | [diff] [blame] | 678 | friend class OptimizingCFITest; |
| 679 | |
Nicolas Geoffray | d4dd255 | 2014-02-28 10:23:58 +0000 | [diff] [blame] | 680 | DISALLOW_COPY_AND_ASSIGN(CodeGenerator); |
| 681 | }; |
| 682 | |
Nicolas Geoffray | 7fb49da | 2014-10-06 09:12:41 +0100 | [diff] [blame] | 683 | template <typename C, typename F> |
Nicolas Geoffray | 4a34a42 | 2014-04-03 10:38:37 +0100 | [diff] [blame] | 684 | class CallingConvention { |
| 685 | public: |
Nicolas Geoffray | 7fb49da | 2014-10-06 09:12:41 +0100 | [diff] [blame] | 686 | CallingConvention(const C* registers, |
| 687 | size_t number_of_registers, |
| 688 | const F* fpu_registers, |
Mathieu Chartier | e401d14 | 2015-04-22 13:56:20 -0700 | [diff] [blame] | 689 | size_t number_of_fpu_registers, |
| 690 | size_t pointer_size) |
Nicolas Geoffray | 7fb49da | 2014-10-06 09:12:41 +0100 | [diff] [blame] | 691 | : registers_(registers), |
| 692 | number_of_registers_(number_of_registers), |
| 693 | fpu_registers_(fpu_registers), |
Mathieu Chartier | e401d14 | 2015-04-22 13:56:20 -0700 | [diff] [blame] | 694 | number_of_fpu_registers_(number_of_fpu_registers), |
| 695 | pointer_size_(pointer_size) {} |
Nicolas Geoffray | 4a34a42 | 2014-04-03 10:38:37 +0100 | [diff] [blame] | 696 | |
| 697 | size_t GetNumberOfRegisters() const { return number_of_registers_; } |
Nicolas Geoffray | 7fb49da | 2014-10-06 09:12:41 +0100 | [diff] [blame] | 698 | size_t GetNumberOfFpuRegisters() const { return number_of_fpu_registers_; } |
Nicolas Geoffray | 4a34a42 | 2014-04-03 10:38:37 +0100 | [diff] [blame] | 699 | |
Nicolas Geoffray | 7fb49da | 2014-10-06 09:12:41 +0100 | [diff] [blame] | 700 | C GetRegisterAt(size_t index) const { |
Nicolas Geoffray | 4a34a42 | 2014-04-03 10:38:37 +0100 | [diff] [blame] | 701 | DCHECK_LT(index, number_of_registers_); |
| 702 | return registers_[index]; |
| 703 | } |
| 704 | |
Nicolas Geoffray | 7fb49da | 2014-10-06 09:12:41 +0100 | [diff] [blame] | 705 | F GetFpuRegisterAt(size_t index) const { |
| 706 | DCHECK_LT(index, number_of_fpu_registers_); |
| 707 | return fpu_registers_[index]; |
| 708 | } |
| 709 | |
| 710 | size_t GetStackOffsetOf(size_t index) const { |
Nicolas Geoffray | 4a34a42 | 2014-04-03 10:38:37 +0100 | [diff] [blame] | 711 | // We still reserve the space for parameters passed by registers. |
Mathieu Chartier | e401d14 | 2015-04-22 13:56:20 -0700 | [diff] [blame] | 712 | // Add space for the method pointer. |
| 713 | return pointer_size_ + index * kVRegSize; |
Nicolas Geoffray | 4a34a42 | 2014-04-03 10:38:37 +0100 | [diff] [blame] | 714 | } |
| 715 | |
| 716 | private: |
Nicolas Geoffray | 7fb49da | 2014-10-06 09:12:41 +0100 | [diff] [blame] | 717 | const C* registers_; |
Nicolas Geoffray | 4a34a42 | 2014-04-03 10:38:37 +0100 | [diff] [blame] | 718 | const size_t number_of_registers_; |
Nicolas Geoffray | 7fb49da | 2014-10-06 09:12:41 +0100 | [diff] [blame] | 719 | const F* fpu_registers_; |
| 720 | const size_t number_of_fpu_registers_; |
Mathieu Chartier | e401d14 | 2015-04-22 13:56:20 -0700 | [diff] [blame] | 721 | const size_t pointer_size_; |
Nicolas Geoffray | 4a34a42 | 2014-04-03 10:38:37 +0100 | [diff] [blame] | 722 | |
| 723 | DISALLOW_COPY_AND_ASSIGN(CallingConvention); |
| 724 | }; |
| 725 | |
Aart Bik | 42249c3 | 2016-01-07 15:33:50 -0800 | [diff] [blame] | 726 | /** |
| 727 | * A templated class SlowPathGenerator with a templated method NewSlowPath() |
| 728 | * that can be used by any code generator to share equivalent slow-paths with |
| 729 | * the objective of reducing generated code size. |
| 730 | * |
| 731 | * InstructionType: instruction that requires SlowPathCodeType |
| 732 | * SlowPathCodeType: subclass of SlowPathCode, with constructor SlowPathCodeType(InstructionType *) |
| 733 | */ |
| 734 | template <typename InstructionType> |
| 735 | class SlowPathGenerator { |
| 736 | static_assert(std::is_base_of<HInstruction, InstructionType>::value, |
| 737 | "InstructionType is not a subclass of art::HInstruction"); |
| 738 | |
| 739 | public: |
| 740 | SlowPathGenerator(HGraph* graph, CodeGenerator* codegen) |
| 741 | : graph_(graph), |
| 742 | codegen_(codegen), |
| 743 | slow_path_map_(std::less<uint32_t>(), graph->GetArena()->Adapter(kArenaAllocSlowPaths)) {} |
| 744 | |
| 745 | // Creates and adds a new slow-path, if needed, or returns existing one otherwise. |
| 746 | // Templating the method (rather than the whole class) on the slow-path type enables |
| 747 | // keeping this code at a generic, non architecture-specific place. |
| 748 | // |
| 749 | // NOTE: This approach assumes each InstructionType only generates one SlowPathCodeType. |
| 750 | // To relax this requirement, we would need some RTTI on the stored slow-paths, |
| 751 | // or template the class as a whole on SlowPathType. |
| 752 | template <typename SlowPathCodeType> |
| 753 | SlowPathCodeType* NewSlowPath(InstructionType* instruction) { |
| 754 | static_assert(std::is_base_of<SlowPathCode, SlowPathCodeType>::value, |
| 755 | "SlowPathCodeType is not a subclass of art::SlowPathCode"); |
| 756 | static_assert(std::is_constructible<SlowPathCodeType, InstructionType*>::value, |
| 757 | "SlowPathCodeType is not constructible from InstructionType*"); |
| 758 | // Iterate over potential candidates for sharing. Currently, only same-typed |
| 759 | // slow-paths with exactly the same dex-pc are viable candidates. |
| 760 | // TODO: pass dex-pc/slow-path-type to run-time to allow even more sharing? |
| 761 | const uint32_t dex_pc = instruction->GetDexPc(); |
| 762 | auto iter = slow_path_map_.find(dex_pc); |
| 763 | if (iter != slow_path_map_.end()) { |
| 764 | auto candidates = iter->second; |
| 765 | for (const auto& it : candidates) { |
| 766 | InstructionType* other_instruction = it.first; |
| 767 | SlowPathCodeType* other_slow_path = down_cast<SlowPathCodeType*>(it.second); |
| 768 | // Determine if the instructions allow for slow-path sharing. |
| 769 | if (HaveSameLiveRegisters(instruction, other_instruction) && |
| 770 | HaveSameStackMap(instruction, other_instruction)) { |
| 771 | // Can share: reuse existing one. |
| 772 | return other_slow_path; |
| 773 | } |
| 774 | } |
| 775 | } else { |
| 776 | // First time this dex-pc is seen. |
| 777 | iter = slow_path_map_.Put(dex_pc, {{}, {graph_->GetArena()->Adapter(kArenaAllocSlowPaths)}}); |
| 778 | } |
| 779 | // Cannot share: create and add new slow-path for this particular dex-pc. |
| 780 | SlowPathCodeType* slow_path = new (graph_->GetArena()) SlowPathCodeType(instruction); |
| 781 | iter->second.emplace_back(std::make_pair(instruction, slow_path)); |
| 782 | codegen_->AddSlowPath(slow_path); |
| 783 | return slow_path; |
| 784 | } |
| 785 | |
| 786 | private: |
| 787 | // Tests if both instructions have same set of live physical registers. This ensures |
| 788 | // the slow-path has exactly the same preamble on saving these registers to stack. |
| 789 | bool HaveSameLiveRegisters(const InstructionType* i1, const InstructionType* i2) const { |
| 790 | const uint32_t core_spill = ~codegen_->GetCoreSpillMask(); |
| 791 | const uint32_t fpu_spill = ~codegen_->GetFpuSpillMask(); |
| 792 | RegisterSet* live1 = i1->GetLocations()->GetLiveRegisters(); |
| 793 | RegisterSet* live2 = i2->GetLocations()->GetLiveRegisters(); |
| 794 | return (((live1->GetCoreRegisters() & core_spill) == |
| 795 | (live2->GetCoreRegisters() & core_spill)) && |
| 796 | ((live1->GetFloatingPointRegisters() & fpu_spill) == |
| 797 | (live2->GetFloatingPointRegisters() & fpu_spill))); |
| 798 | } |
| 799 | |
| 800 | // Tests if both instructions have the same stack map. This ensures the interpreter |
| 801 | // will find exactly the same dex-registers at the same entries. |
| 802 | bool HaveSameStackMap(const InstructionType* i1, const InstructionType* i2) const { |
| 803 | DCHECK(i1->HasEnvironment()); |
| 804 | DCHECK(i2->HasEnvironment()); |
| 805 | // We conservatively test if the two instructions find exactly the same instructions |
| 806 | // and location in each dex-register. This guarantees they will have the same stack map. |
| 807 | HEnvironment* e1 = i1->GetEnvironment(); |
| 808 | HEnvironment* e2 = i2->GetEnvironment(); |
| 809 | if (e1->GetParent() != e2->GetParent() || e1->Size() != e2->Size()) { |
| 810 | return false; |
| 811 | } |
| 812 | for (size_t i = 0, sz = e1->Size(); i < sz; ++i) { |
| 813 | if (e1->GetInstructionAt(i) != e2->GetInstructionAt(i) || |
| 814 | !e1->GetLocationAt(i).Equals(e2->GetLocationAt(i))) { |
| 815 | return false; |
| 816 | } |
| 817 | } |
| 818 | return true; |
| 819 | } |
| 820 | |
| 821 | HGraph* const graph_; |
| 822 | CodeGenerator* const codegen_; |
| 823 | |
| 824 | // Map from dex-pc to vector of already existing instruction/slow-path pairs. |
| 825 | ArenaSafeMap<uint32_t, ArenaVector<std::pair<InstructionType*, SlowPathCode*>>> slow_path_map_; |
| 826 | |
| 827 | DISALLOW_COPY_AND_ASSIGN(SlowPathGenerator); |
| 828 | }; |
| 829 | |
| 830 | class InstructionCodeGenerator : public HGraphVisitor { |
| 831 | public: |
| 832 | InstructionCodeGenerator(HGraph* graph, CodeGenerator* codegen) |
| 833 | : HGraphVisitor(graph), |
| 834 | deopt_slow_paths_(graph, codegen) {} |
| 835 | |
| 836 | protected: |
| 837 | // Add slow-path generator for each instruction/slow-path combination that desires sharing. |
| 838 | // TODO: under current regime, only deopt sharing make sense; extend later. |
| 839 | SlowPathGenerator<HDeoptimize> deopt_slow_paths_; |
| 840 | }; |
| 841 | |
Nicolas Geoffray | d4dd255 | 2014-02-28 10:23:58 +0000 | [diff] [blame] | 842 | } // namespace art |
| 843 | |
| 844 | #endif // ART_COMPILER_OPTIMIZING_CODE_GENERATOR_H_ |