Nicolas Geoffray | d4dd255 | 2014-02-28 10:23:58 +0000 | [diff] [blame] | 1 | /* |
| 2 | * Copyright (C) 2014 The Android Open Source Project |
| 3 | * |
| 4 | * Licensed under the Apache License, Version 2.0 (the "License"); |
| 5 | * you may not use this file except in compliance with the License. |
| 6 | * You may obtain a copy of the License at |
| 7 | * |
| 8 | * http://www.apache.org/licenses/LICENSE-2.0 |
| 9 | * |
| 10 | * Unless required by applicable law or agreed to in writing, software |
| 11 | * distributed under the License is distributed on an "AS IS" BASIS, |
| 12 | * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| 13 | * See the License for the specific language governing permissions and |
| 14 | * limitations under the License. |
| 15 | */ |
| 16 | |
| 17 | #ifndef ART_COMPILER_OPTIMIZING_CODE_GENERATOR_H_ |
| 18 | #define ART_COMPILER_OPTIMIZING_CODE_GENERATOR_H_ |
| 19 | |
Ian Rogers | d582fa4 | 2014-11-05 23:46:43 -0800 | [diff] [blame] | 20 | #include "arch/instruction_set.h" |
Calin Juravle | 3416601 | 2014-12-19 17:22:29 +0000 | [diff] [blame] | 21 | #include "arch/instruction_set_features.h" |
Vladimir Marko | f9f6441 | 2015-09-02 14:05:49 +0100 | [diff] [blame] | 22 | #include "base/arena_containers.h" |
| 23 | #include "base/arena_object.h" |
Nicolas Geoffray | 01bc96d | 2014-04-11 17:43:50 +0100 | [diff] [blame] | 24 | #include "base/bit_field.h" |
Nicolas Geoffray | d28b969 | 2015-11-04 14:36:55 +0000 | [diff] [blame] | 25 | #include "compiled_method.h" |
Calin Juravle | cd6dffe | 2015-01-08 17:35:35 +0000 | [diff] [blame] | 26 | #include "driver/compiler_options.h" |
Nicolas Geoffray | bab4ed7 | 2014-03-11 17:53:17 +0000 | [diff] [blame] | 27 | #include "globals.h" |
Alexandre Rames | eb7b739 | 2015-06-19 14:47:01 +0100 | [diff] [blame] | 28 | #include "graph_visualizer.h" |
Nicolas Geoffray | 4e3d23a | 2014-05-22 18:32:45 +0100 | [diff] [blame] | 29 | #include "locations.h" |
Nicolas Geoffray | d4dd255 | 2014-02-28 10:23:58 +0000 | [diff] [blame] | 30 | #include "memory_region.h" |
| 31 | #include "nodes.h" |
Serban Constantinescu | ecc4366 | 2015-08-13 13:33:12 +0100 | [diff] [blame] | 32 | #include "optimizing_compiler_stats.h" |
Nicolas Geoffray | 3946844 | 2014-09-02 15:17:15 +0100 | [diff] [blame] | 33 | #include "stack_map_stream.h" |
Andreas Gampe | 85b62f2 | 2015-09-09 13:15:38 -0700 | [diff] [blame] | 34 | #include "utils/label.h" |
Nicolas Geoffray | d4dd255 | 2014-02-28 10:23:58 +0000 | [diff] [blame] | 35 | |
| 36 | namespace art { |
| 37 | |
// Binary encoding of 2^32 for type double.
static int64_t constexpr k2Pow32EncodingForDouble = INT64_C(0x41F0000000000000);
// Binary encoding of 2^31 for type double.
static int64_t constexpr k2Pow31EncodingForDouble = INT64_C(0x41E0000000000000);

// Minimum value for a primitive integer.
// Spelled as `-max - 1`: the literal 0x80000000 does not fit in a signed 32-bit
// int, so it has an unsigned type and initializing an int32_t from it relies on
// an implementation-defined conversion (before C++20).
static int32_t constexpr kPrimIntMin = -0x7fffffff - 1;
// Minimum value for a primitive long. Same `-max - 1` form, for the same reason.
static int64_t constexpr kPrimLongMin = -INT64_C(0x7fffffffffffffff) - 1;

// Maximum value for a primitive integer.
static int32_t constexpr kPrimIntMax = 0x7fffffff;
// Maximum value for a primitive long.
static int64_t constexpr kPrimLongMax = INT64_C(0x7fffffffffffffff);
Roland Levillain | 3f8f936 | 2014-12-02 17:45:01 +0000 | [diff] [blame] | 52 | |
Nicolas Geoffray | 92a73ae | 2014-10-16 11:12:52 +0100 | [diff] [blame] | 53 | class Assembler; |
Nicolas Geoffray | e503832 | 2014-07-04 09:41:32 +0100 | [diff] [blame] | 54 | class CodeGenerator; |
Nicolas Geoffray | d28b969 | 2015-11-04 14:36:55 +0000 | [diff] [blame] | 55 | class CompilerDriver; |
Vladimir Marko | 5815501 | 2015-08-19 12:49:41 +0000 | [diff] [blame] | 56 | class LinkerPatch; |
Nicolas Geoffray | f0e3937 | 2014-11-12 17:50:07 +0000 | [diff] [blame] | 57 | class ParallelMoveResolver; |
Nicolas Geoffray | 92cf83e | 2014-03-18 17:59:20 +0000 | [diff] [blame] | 58 | |
Nicolas Geoffray | d4dd255 | 2014-02-28 10:23:58 +0000 | [diff] [blame] | 59 | class CodeAllocator { |
| 60 | public: |
Nicolas Geoffray | e503832 | 2014-07-04 09:41:32 +0100 | [diff] [blame] | 61 | CodeAllocator() {} |
| 62 | virtual ~CodeAllocator() {} |
Nicolas Geoffray | d4dd255 | 2014-02-28 10:23:58 +0000 | [diff] [blame] | 63 | |
| 64 | virtual uint8_t* Allocate(size_t size) = 0; |
| 65 | |
| 66 | private: |
| 67 | DISALLOW_COPY_AND_ASSIGN(CodeAllocator); |
| 68 | }; |
| 69 | |
Ian Rogers | 6a3c1fc | 2014-10-31 00:33:20 -0700 | [diff] [blame] | 70 | class SlowPathCode : public ArenaObject<kArenaAllocSlowPaths> { |
Nicolas Geoffray | e503832 | 2014-07-04 09:41:32 +0100 | [diff] [blame] | 71 | public: |
Nicolas Geoffray | eeefa12 | 2015-03-13 18:52:59 +0000 | [diff] [blame] | 72 | SlowPathCode() { |
| 73 | for (size_t i = 0; i < kMaximumNumberOfExpectedRegisters; ++i) { |
| 74 | saved_core_stack_offsets_[i] = kRegisterNotSaved; |
| 75 | saved_fpu_stack_offsets_[i] = kRegisterNotSaved; |
| 76 | } |
| 77 | } |
| 78 | |
Nicolas Geoffray | e503832 | 2014-07-04 09:41:32 +0100 | [diff] [blame] | 79 | virtual ~SlowPathCode() {} |
| 80 | |
Nicolas Geoffray | e503832 | 2014-07-04 09:41:32 +0100 | [diff] [blame] | 81 | virtual void EmitNativeCode(CodeGenerator* codegen) = 0; |
| 82 | |
Zheng Xu | da40309 | 2015-04-24 17:35:39 +0800 | [diff] [blame] | 83 | virtual void SaveLiveRegisters(CodeGenerator* codegen, LocationSummary* locations); |
| 84 | virtual void RestoreLiveRegisters(CodeGenerator* codegen, LocationSummary* locations); |
Nicolas Geoffray | a8ac913 | 2015-03-13 16:36:36 +0000 | [diff] [blame] | 85 | |
Nicolas Geoffray | eeefa12 | 2015-03-13 18:52:59 +0000 | [diff] [blame] | 86 | bool IsCoreRegisterSaved(int reg) const { |
| 87 | return saved_core_stack_offsets_[reg] != kRegisterNotSaved; |
| 88 | } |
| 89 | |
| 90 | bool IsFpuRegisterSaved(int reg) const { |
| 91 | return saved_fpu_stack_offsets_[reg] != kRegisterNotSaved; |
| 92 | } |
| 93 | |
| 94 | uint32_t GetStackOffsetOfCoreRegister(int reg) const { |
| 95 | return saved_core_stack_offsets_[reg]; |
| 96 | } |
| 97 | |
| 98 | uint32_t GetStackOffsetOfFpuRegister(int reg) const { |
| 99 | return saved_fpu_stack_offsets_[reg]; |
| 100 | } |
| 101 | |
Alexandre Rames | 8158f28 | 2015-08-07 10:26:17 +0100 | [diff] [blame] | 102 | virtual bool IsFatal() const { return false; } |
| 103 | |
Alexandre Rames | 9931f31 | 2015-06-19 14:47:01 +0100 | [diff] [blame] | 104 | virtual const char* GetDescription() const = 0; |
| 105 | |
Andreas Gampe | 85b62f2 | 2015-09-09 13:15:38 -0700 | [diff] [blame] | 106 | Label* GetEntryLabel() { return &entry_label_; } |
| 107 | Label* GetExitLabel() { return &exit_label_; } |
| 108 | |
Zheng Xu | da40309 | 2015-04-24 17:35:39 +0800 | [diff] [blame] | 109 | protected: |
Nicolas Geoffray | eeefa12 | 2015-03-13 18:52:59 +0000 | [diff] [blame] | 110 | static constexpr size_t kMaximumNumberOfExpectedRegisters = 32; |
| 111 | static constexpr uint32_t kRegisterNotSaved = -1; |
| 112 | uint32_t saved_core_stack_offsets_[kMaximumNumberOfExpectedRegisters]; |
| 113 | uint32_t saved_fpu_stack_offsets_[kMaximumNumberOfExpectedRegisters]; |
Zheng Xu | da40309 | 2015-04-24 17:35:39 +0800 | [diff] [blame] | 114 | |
| 115 | private: |
Andreas Gampe | 85b62f2 | 2015-09-09 13:15:38 -0700 | [diff] [blame] | 116 | Label entry_label_; |
| 117 | Label exit_label_; |
| 118 | |
Nicolas Geoffray | e503832 | 2014-07-04 09:41:32 +0100 | [diff] [blame] | 119 | DISALLOW_COPY_AND_ASSIGN(SlowPathCode); |
| 120 | }; |
| 121 | |
Roland Levillain | 2d27c8e | 2015-04-28 15:48:45 +0100 | [diff] [blame] | 122 | class InvokeDexCallingConventionVisitor { |
| 123 | public: |
| 124 | virtual Location GetNextLocation(Primitive::Type type) = 0; |
Nicolas Geoffray | fd88f16 | 2015-06-03 11:23:52 +0100 | [diff] [blame] | 125 | virtual Location GetReturnLocation(Primitive::Type type) const = 0; |
| 126 | virtual Location GetMethodLocation() const = 0; |
Roland Levillain | 2d27c8e | 2015-04-28 15:48:45 +0100 | [diff] [blame] | 127 | |
| 128 | protected: |
| 129 | InvokeDexCallingConventionVisitor() {} |
| 130 | virtual ~InvokeDexCallingConventionVisitor() {} |
| 131 | |
| 132 | // The current index for core registers. |
| 133 | uint32_t gp_index_ = 0u; |
| 134 | // The current index for floating-point registers. |
| 135 | uint32_t float_index_ = 0u; |
| 136 | // The current stack index. |
| 137 | uint32_t stack_index_ = 0u; |
| 138 | |
| 139 | private: |
| 140 | DISALLOW_COPY_AND_ASSIGN(InvokeDexCallingConventionVisitor); |
| 141 | }; |
| 142 | |
Calin Juravle | e460d1d | 2015-09-29 04:52:17 +0100 | [diff] [blame] | 143 | class FieldAccessCallingConvention { |
| 144 | public: |
| 145 | virtual Location GetObjectLocation() const = 0; |
| 146 | virtual Location GetFieldIndexLocation() const = 0; |
| 147 | virtual Location GetReturnLocation(Primitive::Type type) const = 0; |
| 148 | virtual Location GetSetValueLocation(Primitive::Type type, bool is_instance) const = 0; |
| 149 | virtual Location GetFpuLocation(Primitive::Type type) const = 0; |
| 150 | virtual ~FieldAccessCallingConvention() {} |
| 151 | |
| 152 | protected: |
| 153 | FieldAccessCallingConvention() {} |
| 154 | |
| 155 | private: |
| 156 | DISALLOW_COPY_AND_ASSIGN(FieldAccessCallingConvention); |
| 157 | }; |
| 158 | |
Nicolas Geoffray | 12df9eb | 2015-01-09 14:53:50 +0000 | [diff] [blame] | 159 | class CodeGenerator { |
Nicolas Geoffray | d4dd255 | 2014-02-28 10:23:58 +0000 | [diff] [blame] | 160 | public: |
// Compiles the graph to executable instructions. Both compile entry points
// return void, so success or failure is not reported through a return value.
Nicolas Geoffray | 73e80c3 | 2014-07-22 17:47:56 +0100 | [diff] [blame] | 163 | void CompileBaseline(CodeAllocator* allocator, bool is_leaf = false); |
Nicolas Geoffray | 86dbb9a | 2014-06-04 11:12:39 +0100 | [diff] [blame] | 164 | void CompileOptimized(CodeAllocator* allocator); |
Nicolas Geoffray | 12df9eb | 2015-01-09 14:53:50 +0000 | [diff] [blame] | 165 | static CodeGenerator* Create(HGraph* graph, |
Calin Juravle | 3416601 | 2014-12-19 17:22:29 +0000 | [diff] [blame] | 166 | InstructionSet instruction_set, |
Calin Juravle | cd6dffe | 2015-01-08 17:35:35 +0000 | [diff] [blame] | 167 | const InstructionSetFeatures& isa_features, |
Serban Constantinescu | ecc4366 | 2015-08-13 13:33:12 +0100 | [diff] [blame] | 168 | const CompilerOptions& compiler_options, |
| 169 | OptimizingCompilerStats* stats = nullptr); |
Nicolas Geoffray | 12df9eb | 2015-01-09 14:53:50 +0000 | [diff] [blame] | 170 | virtual ~CodeGenerator() {} |
Nicolas Geoffray | d4dd255 | 2014-02-28 10:23:58 +0000 | [diff] [blame] | 171 | |
Vladimir Marko | dc151b2 | 2015-10-15 18:02:30 +0100 | [diff] [blame] | 172 | // Get the graph. This is the outermost graph, never the graph of a method being inlined. |
Nicolas Geoffray | 787c307 | 2014-03-17 10:20:19 +0000 | [diff] [blame] | 173 | HGraph* GetGraph() const { return graph_; } |
Nicolas Geoffray | d4dd255 | 2014-02-28 10:23:58 +0000 | [diff] [blame] | 174 | |
Nicolas Geoffray | dc23d83 | 2015-02-16 11:15:43 +0000 | [diff] [blame] | 175 | HBasicBlock* GetNextBlockToEmit() const; |
| 176 | HBasicBlock* FirstNonEmptyBlock(HBasicBlock* block) const; |
Nicolas Geoffray | bab4ed7 | 2014-03-11 17:53:17 +0000 | [diff] [blame] | 177 | bool GoesToNextBlock(HBasicBlock* current, HBasicBlock* next) const; |
Nicolas Geoffray | d4dd255 | 2014-02-28 10:23:58 +0000 | [diff] [blame] | 178 | |
Nicolas Geoffray | 86dbb9a | 2014-06-04 11:12:39 +0100 | [diff] [blame] | 179 | size_t GetStackSlotOfParameter(HParameterValue* parameter) const { |
| 180 | // Note that this follows the current calling convention. |
| 181 | return GetFrameSize() |
Mathieu Chartier | e401d14 | 2015-04-22 13:56:20 -0700 | [diff] [blame] | 182 | + InstructionSetPointerSize(GetInstructionSet()) // Art method |
Nicolas Geoffray | e27f31a | 2014-06-12 17:53:14 +0100 | [diff] [blame] | 183 | + parameter->GetIndex() * kVRegSize; |
Nicolas Geoffray | 86dbb9a | 2014-06-04 11:12:39 +0100 | [diff] [blame] | 184 | } |
| 185 | |
Nicolas Geoffray | 92a73ae | 2014-10-16 11:12:52 +0100 | [diff] [blame] | 186 | virtual void Initialize() = 0; |
Serban Constantinescu | 32f5b4d | 2014-11-25 20:05:46 +0000 | [diff] [blame] | 187 | virtual void Finalize(CodeAllocator* allocator); |
Vladimir Marko | 5815501 | 2015-08-19 12:49:41 +0000 | [diff] [blame] | 188 | virtual void EmitLinkerPatches(ArenaVector<LinkerPatch>* linker_patches); |
Nicolas Geoffray | d4dd255 | 2014-02-28 10:23:58 +0000 | [diff] [blame] | 189 | virtual void GenerateFrameEntry() = 0; |
| 190 | virtual void GenerateFrameExit() = 0; |
Nicolas Geoffray | 92a73ae | 2014-10-16 11:12:52 +0100 | [diff] [blame] | 191 | virtual void Bind(HBasicBlock* block) = 0; |
Nicolas Geoffray | 4a34a42 | 2014-04-03 10:38:37 +0100 | [diff] [blame] | 192 | virtual void Move(HInstruction* instruction, Location location, HInstruction* move_for) = 0; |
Calin Juravle | 175dc73 | 2015-08-25 15:42:32 +0100 | [diff] [blame] | 193 | virtual void MoveConstant(Location destination, int32_t value) = 0; |
Calin Juravle | e460d1d | 2015-09-29 04:52:17 +0100 | [diff] [blame] | 194 | virtual void MoveLocation(Location dst, Location src, Primitive::Type dst_type) = 0; |
| 195 | virtual void AddLocationAsTemp(Location location, LocationSummary* locations) = 0; |
| 196 | |
Nicolas Geoffray | 787c307 | 2014-03-17 10:20:19 +0000 | [diff] [blame] | 197 | virtual Assembler* GetAssembler() = 0; |
Alexandre Rames | eb7b739 | 2015-06-19 14:47:01 +0100 | [diff] [blame] | 198 | virtual const Assembler& GetAssembler() const = 0; |
Nicolas Geoffray | 707c809 | 2014-04-04 10:50:14 +0100 | [diff] [blame] | 199 | virtual size_t GetWordSize() const = 0; |
Mark Mendell | f85a9ca | 2015-01-13 09:20:58 -0500 | [diff] [blame] | 200 | virtual size_t GetFloatingPointSpillSlotSize() const = 0; |
Nicolas Geoffray | de58ab2 | 2014-11-05 12:46:03 +0000 | [diff] [blame] | 201 | virtual uintptr_t GetAddressOf(HBasicBlock* block) const = 0; |
Nicolas Geoffray | 4c204ba | 2015-02-03 15:12:35 +0000 | [diff] [blame] | 202 | void InitializeCodeGeneration(size_t number_of_spill_slots, |
| 203 | size_t maximum_number_of_live_core_registers, |
Roland Levillain | 0d5a281 | 2015-11-13 10:07:31 +0000 | [diff] [blame] | 204 | size_t maximum_number_of_live_fpu_registers, |
Nicolas Geoffray | 4c204ba | 2015-02-03 15:12:35 +0000 | [diff] [blame] | 205 | size_t number_of_out_slots, |
Vladimir Marko | fa6b93c | 2015-09-15 10:15:55 +0100 | [diff] [blame] | 206 | const ArenaVector<HBasicBlock*>& block_order); |
Nicolas Geoffray | ab032bc | 2014-07-15 12:55:21 +0100 | [diff] [blame] | 207 | int32_t GetStackSlot(HLocal* local) const; |
| 208 | Location GetTemporaryLocation(HTemporary* temp) const; |
Nicolas Geoffray | 787c307 | 2014-03-17 10:20:19 +0000 | [diff] [blame] | 209 | |
| 210 | uint32_t GetFrameSize() const { return frame_size_; } |
| 211 | void SetFrameSize(uint32_t size) { frame_size_ = size; } |
Nicolas Geoffray | 8ccc3f5 | 2014-03-19 10:34:11 +0000 | [diff] [blame] | 212 | uint32_t GetCoreSpillMask() const { return core_spill_mask_; } |
Nicolas Geoffray | d97dc40 | 2015-01-22 13:50:01 +0000 | [diff] [blame] | 213 | uint32_t GetFpuSpillMask() const { return fpu_spill_mask_; } |
Nicolas Geoffray | 787c307 | 2014-03-17 10:20:19 +0000 | [diff] [blame] | 214 | |
Nicolas Geoffray | 71175b7 | 2014-10-09 22:13:55 +0100 | [diff] [blame] | 215 | size_t GetNumberOfCoreRegisters() const { return number_of_core_registers_; } |
| 216 | size_t GetNumberOfFloatingPointRegisters() const { return number_of_fpu_registers_; } |
Nicolas Geoffray | 9889396 | 2015-01-21 12:32:32 +0000 | [diff] [blame] | 217 | virtual void SetupBlockedRegisters(bool is_baseline) const = 0; |
Nicolas Geoffray | 71175b7 | 2014-10-09 22:13:55 +0100 | [diff] [blame] | 218 | |
Nicolas Geoffray | 4dee636 | 2015-01-23 18:23:14 +0000 | [diff] [blame] | 219 | virtual void ComputeSpillMask() { |
| 220 | core_spill_mask_ = allocated_registers_.GetCoreRegisters() & core_callee_save_mask_; |
| 221 | DCHECK_NE(core_spill_mask_, 0u) << "At least the return address register must be saved"; |
| 222 | fpu_spill_mask_ = allocated_registers_.GetFloatingPointRegisters() & fpu_callee_save_mask_; |
| 223 | } |
| 224 | |
// Builds a 32-bit mask with bit `registers[i]` set for each of the first
// `length` entries of `registers`. Every register number must be in [0, 31].
// Returns 0 when `length` is 0, in which case `registers` is not read.
static uint32_t ComputeRegisterMask(const int* registers, size_t length) {
  uint32_t mask = 0;
  for (size_t i = 0; i < length; ++i) {
    // Shift an unsigned one: `1 << 31` would overflow a signed int.
    mask |= (1u << registers[i]);
  }
  return mask;
}
| 232 | |
Nicolas Geoffray | a7062e0 | 2014-05-22 12:50:17 +0100 | [diff] [blame] | 233 | virtual void DumpCoreRegister(std::ostream& stream, int reg) const = 0; |
| 234 | virtual void DumpFloatingPointRegister(std::ostream& stream, int reg) const = 0; |
Nicolas Geoffray | 412f10c | 2014-06-19 10:00:34 +0100 | [diff] [blame] | 235 | virtual InstructionSet GetInstructionSet() const = 0; |
Calin Juravle | cd6dffe | 2015-01-08 17:35:35 +0000 | [diff] [blame] | 236 | |
| 237 | const CompilerOptions& GetCompilerOptions() const { return compiler_options_; } |
| 238 | |
Serban Constantinescu | ecc4366 | 2015-08-13 13:33:12 +0100 | [diff] [blame] | 239 | void MaybeRecordStat(MethodCompilationStat compilation_stat, size_t count = 1) const; |
| 240 | |
Nicolas Geoffray | 102cbed | 2014-10-15 18:31:05 +0100 | [diff] [blame] | 241 | // Saves the register in the stack. Returns the size taken on stack. |
| 242 | virtual size_t SaveCoreRegister(size_t stack_index, uint32_t reg_id) = 0; |
| 243 | // Restores the register from the stack. Returns the size taken on stack. |
| 244 | virtual size_t RestoreCoreRegister(size_t stack_index, uint32_t reg_id) = 0; |
Nicolas Geoffray | 234d69d | 2015-03-09 10:28:50 +0000 | [diff] [blame] | 245 | |
| 246 | virtual size_t SaveFloatingPointRegister(size_t stack_index, uint32_t reg_id) = 0; |
| 247 | virtual size_t RestoreFloatingPointRegister(size_t stack_index, uint32_t reg_id) = 0; |
| 248 | |
Nicolas Geoffray | 840e546 | 2015-01-07 16:01:24 +0000 | [diff] [blame] | 249 | virtual bool NeedsTwoRegisters(Primitive::Type type) const = 0; |
Nicolas Geoffray | 234d69d | 2015-03-09 10:28:50 +0000 | [diff] [blame] | 250 | // Returns whether we should split long moves in parallel moves. |
| 251 | virtual bool ShouldSplitLongMoves() const { return false; } |
Nicolas Geoffray | a7062e0 | 2014-05-22 12:50:17 +0100 | [diff] [blame] | 252 | |
Roland Levillain | 0d5a281 | 2015-11-13 10:07:31 +0000 | [diff] [blame] | 253 | size_t GetNumberOfCoreCalleeSaveRegisters() const { |
| 254 | return POPCOUNT(core_callee_save_mask_); |
| 255 | } |
| 256 | |
| 257 | size_t GetNumberOfCoreCallerSaveRegisters() const { |
| 258 | DCHECK_GE(GetNumberOfCoreRegisters(), GetNumberOfCoreCalleeSaveRegisters()); |
| 259 | return GetNumberOfCoreRegisters() - GetNumberOfCoreCalleeSaveRegisters(); |
| 260 | } |
| 261 | |
Nicolas Geoffray | 9889396 | 2015-01-21 12:32:32 +0000 | [diff] [blame] | 262 | bool IsCoreCalleeSaveRegister(int reg) const { |
| 263 | return (core_callee_save_mask_ & (1 << reg)) != 0; |
| 264 | } |
| 265 | |
| 266 | bool IsFloatingPointCalleeSaveRegister(int reg) const { |
| 267 | return (fpu_callee_save_mask_ & (1 << reg)) != 0; |
| 268 | } |
| 269 | |
Yevgeny Rouban | 2a7c1ef | 2015-07-22 18:36:24 +0600 | [diff] [blame] | 270 | // Record native to dex mapping for a suspend point. Required by runtime. |
Nicolas Geoffray | eeefa12 | 2015-03-13 18:52:59 +0000 | [diff] [blame] | 271 | void RecordPcInfo(HInstruction* instruction, uint32_t dex_pc, SlowPathCode* slow_path = nullptr); |
David Srbecky | b7070a2 | 2016-01-08 18:13:53 +0000 | [diff] [blame] | 272 | // Check whether we have already recorded mapping at this PC. |
| 273 | bool HasStackMapAtCurrentPc(); |
Yevgeny Rouban | 2a7c1ef | 2015-07-22 18:36:24 +0600 | [diff] [blame] | 274 | |
Calin Juravle | 77520bc | 2015-01-12 18:45:46 +0000 | [diff] [blame] | 275 | bool CanMoveNullCheckToUser(HNullCheck* null_check); |
| 276 | void MaybeRecordImplicitNullCheck(HInstruction* instruction); |
Nicolas Geoffray | 8ccc3f5 | 2014-03-19 10:34:11 +0000 | [diff] [blame] | 277 | |
David Brazdil | 77a48ae | 2015-09-15 12:34:04 +0000 | [diff] [blame] | 278 | // Records a stack map which the runtime might use to set catch phi values |
| 279 | // during exception delivery. |
| 280 | // TODO: Replace with a catch-entering instruction that records the environment. |
| 281 | void RecordCatchBlockInfo(); |
| 282 | |
| 283 | // Returns true if implicit null checks are allowed in the compiler options |
| 284 | // and if the null check is not inside a try block. We currently cannot do |
| 285 | // implicit null checks in that case because we need the NullCheckSlowPath to |
| 286 | // save live registers, which may be needed by the runtime to set catch phis. |
| 287 | bool IsImplicitNullCheckAllowed(HNullCheck* null_check) const; |
| 288 | |
Nicolas Geoffray | e503832 | 2014-07-04 09:41:32 +0100 | [diff] [blame] | 289 | void AddSlowPath(SlowPathCode* slow_path) { |
Vladimir Marko | 225b646 | 2015-09-28 12:17:40 +0100 | [diff] [blame] | 290 | slow_paths_.push_back(slow_path); |
Nicolas Geoffray | e503832 | 2014-07-04 09:41:32 +0100 | [diff] [blame] | 291 | } |
| 292 | |
Vladimir Marko | f9f6441 | 2015-09-02 14:05:49 +0100 | [diff] [blame] | 293 | void BuildMappingTable(ArenaVector<uint8_t>* vector) const; |
| 294 | void BuildVMapTable(ArenaVector<uint8_t>* vector) const; |
Nicolas Geoffray | 92cf83e | 2014-03-18 17:59:20 +0000 | [diff] [blame] | 295 | void BuildNativeGCMap( |
Nicolas Geoffray | d28b969 | 2015-11-04 14:36:55 +0000 | [diff] [blame] | 296 | ArenaVector<uint8_t>* vector, const CompilerDriver& compiler_driver) const; |
| 297 | void BuildStackMaps(MemoryRegion region); |
| 298 | size_t ComputeStackMapsSize(); |
Nicolas Geoffray | 787c307 | 2014-03-17 10:20:19 +0000 | [diff] [blame] | 299 | |
Roland Levillain | 3e3d733 | 2015-04-28 11:00:54 +0100 | [diff] [blame] | 300 | bool IsBaseline() const { |
| 301 | return is_baseline_; |
| 302 | } |
| 303 | |
Nicolas Geoffray | f12feb8 | 2014-07-17 18:32:41 +0100 | [diff] [blame] | 304 | bool IsLeafMethod() const { |
| 305 | return is_leaf_; |
| 306 | } |
| 307 | |
| 308 | void MarkNotLeaf() { |
| 309 | is_leaf_ = false; |
Nicolas Geoffray | c0572a4 | 2015-02-06 14:35:25 +0000 | [diff] [blame] | 310 | requires_current_method_ = true; |
| 311 | } |
| 312 | |
| 313 | void SetRequiresCurrentMethod() { |
| 314 | requires_current_method_ = true; |
| 315 | } |
| 316 | |
| 317 | bool RequiresCurrentMethod() const { |
| 318 | return requires_current_method_; |
Nicolas Geoffray | f12feb8 | 2014-07-17 18:32:41 +0100 | [diff] [blame] | 319 | } |
| 320 | |
Nicolas Geoffray | 3c04974 | 2014-09-24 18:10:46 +0100 | [diff] [blame] | 321 | // Clears the spill slots taken by loop phis in the `LocationSummary` of the |
| 322 | // suspend check. This is called when the code generator generates code |
| 323 | // for the suspend check at the back edge (instead of where the suspend check |
| 324 | // is, which is the loop entry). At this point, the spill slots for the phis |
| 325 | // have not been written to. |
| 326 | void ClearSpillSlotsFromLoopPhisInStackMap(HSuspendCheck* suspend_check) const; |
| 327 | |
Nicolas Geoffray | 71175b7 | 2014-10-09 22:13:55 +0100 | [diff] [blame] | 328 | bool* GetBlockedCoreRegisters() const { return blocked_core_registers_; } |
Nicolas Geoffray | 102cbed | 2014-10-15 18:31:05 +0100 | [diff] [blame] | 329 | bool* GetBlockedFloatingPointRegisters() const { return blocked_fpu_registers_; } |
Nicolas Geoffray | 71175b7 | 2014-10-09 22:13:55 +0100 | [diff] [blame] | 330 | |
Nicolas Geoffray | 19a19cf | 2014-10-22 16:07:05 +0100 | [diff] [blame] | 331 | // Helper that returns the pointer offset of an index in an object array. |
| 332 | // Note: this method assumes we always have the same pointer size, regardless |
| 333 | // of the architecture. |
| 334 | static size_t GetCacheOffset(uint32_t index); |
Mathieu Chartier | e401d14 | 2015-04-22 13:56:20 -0700 | [diff] [blame] | 335 | // Pointer variant for ArtMethod and ArtField arrays. |
| 336 | size_t GetCachePointerOffset(uint32_t index); |
Nicolas Geoffray | 19a19cf | 2014-10-22 16:07:05 +0100 | [diff] [blame] | 337 | |
Nicolas Geoffray | 9021825 | 2015-04-15 11:56:51 +0100 | [diff] [blame] | 338 | void EmitParallelMoves(Location from1, |
| 339 | Location to1, |
| 340 | Primitive::Type type1, |
| 341 | Location from2, |
| 342 | Location to2, |
| 343 | Primitive::Type type2); |
Nicolas Geoffray | f0e3937 | 2014-11-12 17:50:07 +0000 | [diff] [blame] | 344 | |
Nicolas Geoffray | af07bc1 | 2014-11-12 18:08:09 +0000 | [diff] [blame] | 345 | static bool StoreNeedsWriteBarrier(Primitive::Type type, HInstruction* value) { |
David Brazdil | 522e224 | 2015-03-17 18:48:28 +0000 | [diff] [blame] | 346 | // Check that null value is not represented as an integer constant. |
| 347 | DCHECK(type != Primitive::kPrimNot || !value->IsIntConstant()); |
| 348 | return type == Primitive::kPrimNot && !value->IsNullConstant(); |
Nicolas Geoffray | af07bc1 | 2014-11-12 18:08:09 +0000 | [diff] [blame] | 349 | } |
| 350 | |
Alexandre Rames | 78e3ef6 | 2015-08-12 13:43:29 +0100 | [diff] [blame] | 351 | void ValidateInvokeRuntime(HInstruction* instruction, SlowPathCode* slow_path); |
| 352 | |
Nicolas Geoffray | 9889396 | 2015-01-21 12:32:32 +0000 | [diff] [blame] | 353 | void AddAllocatedRegister(Location location) { |
| 354 | allocated_registers_.Add(location); |
| 355 | } |
| 356 | |
Nicolas Geoffray | 45b83af | 2015-07-06 15:12:53 +0000 | [diff] [blame] | 357 | bool HasAllocatedRegister(bool is_core, int reg) const { |
| 358 | return is_core |
| 359 | ? allocated_registers_.ContainsCoreRegister(reg) |
| 360 | : allocated_registers_.ContainsFloatingPointRegister(reg); |
| 361 | } |
| 362 | |
Nicolas Geoffray | c0572a4 | 2015-02-06 14:35:25 +0000 | [diff] [blame] | 363 | void AllocateLocations(HInstruction* instruction); |
| 364 | |
Roland Levillain | aa9b7c4 | 2015-02-17 15:40:09 +0000 | [diff] [blame] | 365 | // Tells whether the stack frame of the compiled method is |
| 366 | // considered "empty", that is either actually having a size of zero, |
| 367 | // or just containing the saved return address register. |
| 368 | bool HasEmptyFrame() const { |
| 369 | return GetFrameSize() == (CallPushesPC() ? GetWordSize() : 0); |
| 370 | } |
| 371 | |
Nicolas Geoffray | d6138ef | 2015-02-18 14:48:53 +0000 | [diff] [blame] | 372 | static int32_t GetInt32ValueOf(HConstant* constant) { |
| 373 | if (constant->IsIntConstant()) { |
| 374 | return constant->AsIntConstant()->GetValue(); |
| 375 | } else if (constant->IsNullConstant()) { |
| 376 | return 0; |
| 377 | } else { |
| 378 | DCHECK(constant->IsFloatConstant()); |
Roland Levillain | da4d79b | 2015-03-24 14:36:11 +0000 | [diff] [blame] | 379 | return bit_cast<int32_t, float>(constant->AsFloatConstant()->GetValue()); |
Nicolas Geoffray | d6138ef | 2015-02-18 14:48:53 +0000 | [diff] [blame] | 380 | } |
| 381 | } |
| 382 | |
| 383 | static int64_t GetInt64ValueOf(HConstant* constant) { |
| 384 | if (constant->IsIntConstant()) { |
| 385 | return constant->AsIntConstant()->GetValue(); |
| 386 | } else if (constant->IsNullConstant()) { |
| 387 | return 0; |
| 388 | } else if (constant->IsFloatConstant()) { |
Roland Levillain | da4d79b | 2015-03-24 14:36:11 +0000 | [diff] [blame] | 389 | return bit_cast<int32_t, float>(constant->AsFloatConstant()->GetValue()); |
Nicolas Geoffray | d6138ef | 2015-02-18 14:48:53 +0000 | [diff] [blame] | 390 | } else if (constant->IsLongConstant()) { |
| 391 | return constant->AsLongConstant()->GetValue(); |
| 392 | } else { |
| 393 | DCHECK(constant->IsDoubleConstant()); |
Roland Levillain | da4d79b | 2015-03-24 14:36:11 +0000 | [diff] [blame] | 394 | return bit_cast<int64_t, double>(constant->AsDoubleConstant()->GetValue()); |
Nicolas Geoffray | d6138ef | 2015-02-18 14:48:53 +0000 | [diff] [blame] | 395 | } |
| 396 | } |
| 397 | |
Nicolas Geoffray | a8ac913 | 2015-03-13 16:36:36 +0000 | [diff] [blame] | 398 | size_t GetFirstRegisterSlotInSlowPath() const { |
| 399 | return first_register_slot_in_slow_path_; |
| 400 | } |
| 401 | |
| 402 | uint32_t FrameEntrySpillSize() const { |
| 403 | return GetFpuSpillSize() + GetCoreSpillSize(); |
| 404 | } |
| 405 | |
Roland Levillain | ec525fc | 2015-04-28 15:50:20 +0100 | [diff] [blame] | 406 | virtual ParallelMoveResolver* GetMoveResolver() = 0; |
Nicolas Geoffray | a8ac913 | 2015-03-13 16:36:36 +0000 | [diff] [blame] | 407 | |
Nicolas Geoffray | fd88f16 | 2015-06-03 11:23:52 +0100 | [diff] [blame] | 408 | static void CreateCommonInvokeLocationSummary( |
| 409 | HInvoke* invoke, InvokeDexCallingConventionVisitor* visitor); |
| 410 | |
Calin Juravle | 175dc73 | 2015-08-25 15:42:32 +0100 | [diff] [blame] | 411 | void GenerateInvokeUnresolvedRuntimeCall(HInvokeUnresolved* invoke); |
| 412 | |
Calin Juravle | e460d1d | 2015-09-29 04:52:17 +0100 | [diff] [blame] | 413 | void CreateUnresolvedFieldLocationSummary( |
| 414 | HInstruction* field_access, |
| 415 | Primitive::Type field_type, |
| 416 | const FieldAccessCallingConvention& calling_convention); |
| 417 | |
| 418 | void GenerateUnresolvedFieldAccess( |
| 419 | HInstruction* field_access, |
| 420 | Primitive::Type field_type, |
| 421 | uint32_t field_index, |
| 422 | uint32_t dex_pc, |
| 423 | const FieldAccessCallingConvention& calling_convention); |
| 424 | |
Calin Juravle | 98893e1 | 2015-10-02 21:05:03 +0100 | [diff] [blame] | 425 | // TODO: This overlaps a bit with MoveFromReturnRegister. Refactor for a better design. |
| 426 | static void CreateLoadClassLocationSummary(HLoadClass* cls, |
| 427 | Location runtime_type_index_location, |
Roland Levillain | 0d5a281 | 2015-11-13 10:07:31 +0000 | [diff] [blame] | 428 | Location runtime_return_location, |
| 429 | bool code_generator_supports_read_barrier = false); |
Calin Juravle | 98893e1 | 2015-10-02 21:05:03 +0100 | [diff] [blame] | 430 | |
Nicolas Geoffray | 5bd05a5 | 2015-10-13 09:48:30 +0100 | [diff] [blame] | 431 | static void CreateSystemArrayCopyLocationSummary(HInvoke* invoke); |
| 432 | |
Alexandre Rames | eb7b739 | 2015-06-19 14:47:01 +0100 | [diff] [blame] | 433 | void SetDisassemblyInformation(DisassemblyInformation* info) { disasm_info_ = info; } |
| 434 | DisassemblyInformation* GetDisassemblyInformation() const { return disasm_info_; } |
| 435 | |
Calin Juravle | 175dc73 | 2015-08-25 15:42:32 +0100 | [diff] [blame] | 436 | virtual void InvokeRuntime(QuickEntrypointEnum entrypoint, |
| 437 | HInstruction* instruction, |
| 438 | uint32_t dex_pc, |
| 439 | SlowPathCode* slow_path) = 0; |
| 440 | |
Vladimir Marko | dc151b2 | 2015-10-15 18:02:30 +0100 | [diff] [blame] | 441 | // Check if the desired_dispatch_info is supported. If it is, return it, |
| 442 | // otherwise return a fall-back info that should be used instead. |
| 443 | virtual HInvokeStaticOrDirect::DispatchInfo GetSupportedInvokeStaticOrDirectDispatch( |
| 444 | const HInvokeStaticOrDirect::DispatchInfo& desired_dispatch_info, |
| 445 | MethodReference target_method) = 0; |
| 446 | |
Andreas Gampe | 85b62f2 | 2015-09-09 13:15:38 -0700 | [diff] [blame] | 447 | // Generate a call to a static or direct method. |
| 448 | virtual void GenerateStaticOrDirectCall(HInvokeStaticOrDirect* invoke, Location temp) = 0; |
| 449 | // Generate a call to a virtual method. |
| 450 | virtual void GenerateVirtualCall(HInvokeVirtual* invoke, Location temp) = 0; |
| 451 | |
| 452 | // Copy the result of a call into the given target. |
| 453 | virtual void MoveFromReturnRegister(Location trg, Primitive::Type type) = 0; |
| 454 | |
Nicolas Geoffray | 787c307 | 2014-03-17 10:20:19 +0000 | [diff] [blame] | 455 | protected: |
Vladimir Marko | 5815501 | 2015-08-19 12:49:41 +0000 | [diff] [blame] | 456 | // Method patch info used for recording locations of required linker patches and |
| 457 | // target methods. The target method can be used for various purposes, whether for |
| 458 | // patching the address of the method or the code pointer or a PC-relative call. |
| 459 | template <typename LabelType> |
| 460 | struct MethodPatchInfo { |
| 461 | explicit MethodPatchInfo(MethodReference m) : target_method(m), label() { } |
| 462 | |
| 463 | MethodReference target_method; |
| 464 | LabelType label; |
| 465 | }; |
| 466 | |
Nicolas Geoffray | 71175b7 | 2014-10-09 22:13:55 +0100 | [diff] [blame] | 467 | CodeGenerator(HGraph* graph, |
| 468 | size_t number_of_core_registers, |
| 469 | size_t number_of_fpu_registers, |
Calin Juravle | cd6dffe | 2015-01-08 17:35:35 +0000 | [diff] [blame] | 470 | size_t number_of_register_pairs, |
Nicolas Geoffray | 9889396 | 2015-01-21 12:32:32 +0000 | [diff] [blame] | 471 | uint32_t core_callee_save_mask, |
| 472 | uint32_t fpu_callee_save_mask, |
Serban Constantinescu | ecc4366 | 2015-08-13 13:33:12 +0100 | [diff] [blame] | 473 | const CompilerOptions& compiler_options, |
| 474 | OptimizingCompilerStats* stats) |
Nicolas Geoffray | c0572a4 | 2015-02-06 14:35:25 +0000 | [diff] [blame] | 475 | : frame_size_(0), |
Nicolas Geoffray | 4361bef | 2014-08-20 04:59:12 +0100 | [diff] [blame] | 476 | core_spill_mask_(0), |
Nicolas Geoffray | d97dc40 | 2015-01-22 13:50:01 +0000 | [diff] [blame] | 477 | fpu_spill_mask_(0), |
Nicolas Geoffray | 3bca0df | 2014-09-19 11:01:00 +0100 | [diff] [blame] | 478 | first_register_slot_in_slow_path_(0), |
Vladimir Marko | 5233f93 | 2015-09-29 19:01:15 +0100 | [diff] [blame] | 479 | blocked_core_registers_(graph->GetArena()->AllocArray<bool>(number_of_core_registers, |
| 480 | kArenaAllocCodeGenerator)), |
| 481 | blocked_fpu_registers_(graph->GetArena()->AllocArray<bool>(number_of_fpu_registers, |
| 482 | kArenaAllocCodeGenerator)), |
| 483 | blocked_register_pairs_(graph->GetArena()->AllocArray<bool>(number_of_register_pairs, |
| 484 | kArenaAllocCodeGenerator)), |
Nicolas Geoffray | 71175b7 | 2014-10-09 22:13:55 +0100 | [diff] [blame] | 485 | number_of_core_registers_(number_of_core_registers), |
| 486 | number_of_fpu_registers_(number_of_fpu_registers), |
| 487 | number_of_register_pairs_(number_of_register_pairs), |
Nicolas Geoffray | 9889396 | 2015-01-21 12:32:32 +0000 | [diff] [blame] | 488 | core_callee_save_mask_(core_callee_save_mask), |
| 489 | fpu_callee_save_mask_(fpu_callee_save_mask), |
Vladimir Marko | cf93a5c | 2015-06-16 11:33:24 +0000 | [diff] [blame] | 490 | stack_map_stream_(graph->GetArena()), |
| 491 | block_order_(nullptr), |
Roland Levillain | 3e3d733 | 2015-04-28 11:00:54 +0100 | [diff] [blame] | 492 | is_baseline_(false), |
Alexandre Rames | eb7b739 | 2015-06-19 14:47:01 +0100 | [diff] [blame] | 493 | disasm_info_(nullptr), |
Serban Constantinescu | ecc4366 | 2015-08-13 13:33:12 +0100 | [diff] [blame] | 494 | stats_(stats), |
Nicolas Geoffray | 787c307 | 2014-03-17 10:20:19 +0000 | [diff] [blame] | 495 | graph_(graph), |
Calin Juravle | cd6dffe | 2015-01-08 17:35:35 +0000 | [diff] [blame] | 496 | compiler_options_(compiler_options), |
Vladimir Marko | 225b646 | 2015-09-28 12:17:40 +0100 | [diff] [blame] | 497 | slow_paths_(graph->GetArena()->Adapter(kArenaAllocCodeGenerator)), |
Vladimir Marko | 0f7dca4 | 2015-11-02 14:36:43 +0000 | [diff] [blame] | 498 | current_slow_path_(nullptr), |
Nicolas Geoffray | 4c204ba | 2015-02-03 15:12:35 +0000 | [diff] [blame] | 499 | current_block_index_(0), |
Nicolas Geoffray | 3946844 | 2014-09-02 15:17:15 +0100 | [diff] [blame] | 500 | is_leaf_(true), |
Vladimir Marko | 225b646 | 2015-09-28 12:17:40 +0100 | [diff] [blame] | 501 | requires_current_method_(false) { |
| 502 | slow_paths_.reserve(8); |
| 503 | } |
Nicolas Geoffray | d4dd255 | 2014-02-28 10:23:58 +0000 | [diff] [blame] | 504 | |
Nicolas Geoffray | a7aca37 | 2014-04-28 17:47:12 +0100 | [diff] [blame] | 505 | // Register allocation logic. |
| 506 | void AllocateRegistersLocally(HInstruction* instruction) const; |
| 507 | |
| 508 | // Backend specific implementation for allocating a register. |
Nicolas Geoffray | 71175b7 | 2014-10-09 22:13:55 +0100 | [diff] [blame] | 509 | virtual Location AllocateFreeRegister(Primitive::Type type) const = 0; |
Nicolas Geoffray | a7aca37 | 2014-04-28 17:47:12 +0100 | [diff] [blame] | 510 | |
Nicolas Geoffray | 71175b7 | 2014-10-09 22:13:55 +0100 | [diff] [blame] | 511 | static size_t FindFreeEntry(bool* array, size_t length); |
Nicolas Geoffray | 3c03503 | 2014-10-28 10:46:40 +0000 | [diff] [blame] | 512 | static size_t FindTwoFreeConsecutiveAlignedEntries(bool* array, size_t length); |
Nicolas Geoffray | a7aca37 | 2014-04-28 17:47:12 +0100 | [diff] [blame] | 513 | |
Nicolas Geoffray | a7aca37 | 2014-04-28 17:47:12 +0100 | [diff] [blame] | 514 | virtual Location GetStackLocation(HLoadLocal* load) const = 0; |
| 515 | |
Nicolas Geoffray | c0572a4 | 2015-02-06 14:35:25 +0000 | [diff] [blame] | 516 | virtual HGraphVisitor* GetLocationBuilder() = 0; |
| 517 | virtual HGraphVisitor* GetInstructionVisitor() = 0; |
Nicolas Geoffray | f0e3937 | 2014-11-12 17:50:07 +0000 | [diff] [blame] | 518 | |
Nicolas Geoffray | d97dc40 | 2015-01-22 13:50:01 +0000 | [diff] [blame] | 519 | // Returns the location of the first spilled entry for floating point registers, |
| 520 | // relative to the stack pointer. |
| 521 | uint32_t GetFpuSpillStart() const { |
Nicolas Geoffray | d97dc40 | 2015-01-22 13:50:01 +0000 | [diff] [blame] | 522 | return GetFrameSize() - FrameEntrySpillSize(); |
| 523 | } |
| 524 | |
| 525 | uint32_t GetFpuSpillSize() const { |
| 526 | return POPCOUNT(fpu_spill_mask_) * GetFloatingPointSpillSlotSize(); |
| 527 | } |
| 528 | |
| 529 | uint32_t GetCoreSpillSize() const { |
| 530 | return POPCOUNT(core_spill_mask_) * GetWordSize(); |
| 531 | } |
| 532 | |
Nicolas Geoffray | c0572a4 | 2015-02-06 14:35:25 +0000 | [diff] [blame] | 533 | bool HasAllocatedCalleeSaveRegisters() const { |
| 534 | // We check the core registers against 1 because it always comprises the return PC. |
| 535 | return (POPCOUNT(allocated_registers_.GetCoreRegisters() & core_callee_save_mask_) != 1) |
| 536 | || (POPCOUNT(allocated_registers_.GetFloatingPointRegisters() & fpu_callee_save_mask_) != 0); |
| 537 | } |
| 538 | |
| 539 | bool CallPushesPC() const { |
| 540 | InstructionSet instruction_set = GetInstructionSet(); |
| 541 | return instruction_set == kX86 || instruction_set == kX86_64; |
| 542 | } |
| 543 | |
Vladimir Marko | 225b646 | 2015-09-28 12:17:40 +0100 | [diff] [blame] | 544 | // Arm64 has its own type for a label, so we need to templatize these methods |
Nicolas Geoffray | dc23d83 | 2015-02-16 11:15:43 +0000 | [diff] [blame] | 545 | // to share the logic. |
Vladimir Marko | 225b646 | 2015-09-28 12:17:40 +0100 | [diff] [blame] | 546 | |
| 547 | template <typename LabelType> |
| 548 | LabelType* CommonInitializeLabels() { |
Vladimir Marko | b95fb77 | 2015-09-30 13:32:31 +0100 | [diff] [blame] | 549 | // We use raw array allocations instead of ArenaVector<> because Labels are |
| 550 | // non-constructible and non-movable and as such cannot be held in a vector. |
Vladimir Marko | 225b646 | 2015-09-28 12:17:40 +0100 | [diff] [blame] | 551 | size_t size = GetGraph()->GetBlocks().size(); |
| 552 | LabelType* labels = GetGraph()->GetArena()->AllocArray<LabelType>(size, |
| 553 | kArenaAllocCodeGenerator); |
| 554 | for (size_t i = 0; i != size; ++i) { |
| 555 | new(labels + i) LabelType(); |
| 556 | } |
| 557 | return labels; |
| 558 | } |
| 559 | |
Vladimir Marko | 5815501 | 2015-08-19 12:49:41 +0000 | [diff] [blame] | 560 | template <typename LabelType> |
| 561 | LabelType* CommonGetLabelOf(LabelType* raw_pointer_to_labels_array, HBasicBlock* block) const { |
Nicolas Geoffray | dc23d83 | 2015-02-16 11:15:43 +0000 | [diff] [blame] | 562 | block = FirstNonEmptyBlock(block); |
| 563 | return raw_pointer_to_labels_array + block->GetBlockId(); |
| 564 | } |
| 565 | |
Vladimir Marko | 0f7dca4 | 2015-11-02 14:36:43 +0000 | [diff] [blame] | 566 | SlowPathCode* GetCurrentSlowPath() { |
| 567 | return current_slow_path_; |
| 568 | } |
| 569 | |
Nicolas Geoffray | 8ccc3f5 | 2014-03-19 10:34:11 +0000 | [diff] [blame] | 570 | // Frame size required for this method. |
| 571 | uint32_t frame_size_; |
| 572 | uint32_t core_spill_mask_; |
Nicolas Geoffray | d97dc40 | 2015-01-22 13:50:01 +0000 | [diff] [blame] | 573 | uint32_t fpu_spill_mask_; |
Nicolas Geoffray | 3bca0df | 2014-09-19 11:01:00 +0100 | [diff] [blame] | 574 | uint32_t first_register_slot_in_slow_path_; |
Nicolas Geoffray | 8ccc3f5 | 2014-03-19 10:34:11 +0000 | [diff] [blame] | 575 | |
Nicolas Geoffray | 9889396 | 2015-01-21 12:32:32 +0000 | [diff] [blame] | 576 | // Registers that were allocated during linear scan. |
| 577 | RegisterSet allocated_registers_; |
| 578 | |
Nicolas Geoffray | 71175b7 | 2014-10-09 22:13:55 +0100 | [diff] [blame] | 579 | // Arrays used when doing register allocation to know which |
| 580 | // registers we can allocate. `SetupBlockedRegisters` updates the |
| 581 | // arrays. |
| 582 | bool* const blocked_core_registers_; |
| 583 | bool* const blocked_fpu_registers_; |
| 584 | bool* const blocked_register_pairs_; |
| 585 | size_t number_of_core_registers_; |
| 586 | size_t number_of_fpu_registers_; |
| 587 | size_t number_of_register_pairs_; |
Nicolas Geoffray | 9889396 | 2015-01-21 12:32:32 +0000 | [diff] [blame] | 588 | const uint32_t core_callee_save_mask_; |
| 589 | const uint32_t fpu_callee_save_mask_; |
Nicolas Geoffray | 71175b7 | 2014-10-09 22:13:55 +0100 | [diff] [blame] | 590 | |
Vladimir Marko | cf93a5c | 2015-06-16 11:33:24 +0000 | [diff] [blame] | 591 | StackMapStream stack_map_stream_; |
| 592 | |
| 593 | // The order to use for code generation. |
Vladimir Marko | fa6b93c | 2015-09-15 10:15:55 +0100 | [diff] [blame] | 594 | const ArenaVector<HBasicBlock*>* block_order_; |
Vladimir Marko | cf93a5c | 2015-06-16 11:33:24 +0000 | [diff] [blame] | 595 | |
Roland Levillain | 3e3d733 | 2015-04-28 11:00:54 +0100 | [diff] [blame] | 596 | // Whether we are using baseline. |
| 597 | bool is_baseline_; |
| 598 | |
Alexandre Rames | eb7b739 | 2015-06-19 14:47:01 +0100 | [diff] [blame] | 599 | DisassemblyInformation* disasm_info_; |
| 600 | |
Nicolas Geoffray | bab4ed7 | 2014-03-11 17:53:17 +0000 | [diff] [blame] | 601 | private: |
Nicolas Geoffray | c0572a4 | 2015-02-06 14:35:25 +0000 | [diff] [blame] | 602 | void InitLocationsBaseline(HInstruction* instruction); |
Nicolas Geoffray | 3bca0df | 2014-09-19 11:01:00 +0100 | [diff] [blame] | 603 | size_t GetStackOffsetOfSavedRegister(size_t index); |
Alexandre Rames | eb7b739 | 2015-06-19 14:47:01 +0100 | [diff] [blame] | 604 | void GenerateSlowPaths(); |
Nicolas Geoffray | 4c204ba | 2015-02-03 15:12:35 +0000 | [diff] [blame] | 605 | void CompileInternal(CodeAllocator* allocator, bool is_baseline); |
Mark Mendell | 5f87418 | 2015-03-04 15:42:45 -0500 | [diff] [blame] | 606 | void BlockIfInRegister(Location location, bool is_out = false) const; |
Nicolas Geoffray | b1d0f3f | 2015-05-14 12:41:51 +0100 | [diff] [blame] | 607 | void EmitEnvironment(HEnvironment* environment, SlowPathCode* slow_path); |
Nicolas Geoffray | d4dd255 | 2014-02-28 10:23:58 +0000 | [diff] [blame] | 608 | |
Serban Constantinescu | ecc4366 | 2015-08-13 13:33:12 +0100 | [diff] [blame] | 609 | OptimizingCompilerStats* stats_; |
| 610 | |
Nicolas Geoffray | 787c307 | 2014-03-17 10:20:19 +0000 | [diff] [blame] | 611 | HGraph* const graph_; |
Calin Juravle | cd6dffe | 2015-01-08 17:35:35 +0000 | [diff] [blame] | 612 | const CompilerOptions& compiler_options_; |
Nicolas Geoffray | d4dd255 | 2014-02-28 10:23:58 +0000 | [diff] [blame] | 613 | |
Vladimir Marko | 225b646 | 2015-09-28 12:17:40 +0100 | [diff] [blame] | 614 | ArenaVector<SlowPathCode*> slow_paths_; |
Nicolas Geoffray | d4dd255 | 2014-02-28 10:23:58 +0000 | [diff] [blame] | 615 | |
Aart Bik | 42249c3 | 2016-01-07 15:33:50 -0800 | [diff] [blame^] | 616 | // The current slow-path that we're generating code for. |
Vladimir Marko | 0f7dca4 | 2015-11-02 14:36:43 +0000 | [diff] [blame] | 617 | SlowPathCode* current_slow_path_; |
| 618 | |
Nicolas Geoffray | 4c204ba | 2015-02-03 15:12:35 +0000 | [diff] [blame] | 619 | // The current block index in `block_order_` of the block |
| 620 | // we are generating code for. |
| 621 | size_t current_block_index_; |
| 622 | |
Nicolas Geoffray | c0572a4 | 2015-02-06 14:35:25 +0000 | [diff] [blame] | 623 | // Whether the method is a leaf method. |
Nicolas Geoffray | f12feb8 | 2014-07-17 18:32:41 +0100 | [diff] [blame] | 624 | bool is_leaf_; |
| 625 | |
Nicolas Geoffray | c0572a4 | 2015-02-06 14:35:25 +0000 | [diff] [blame] | 626 | // Whether an instruction in the graph accesses the current method. |
| 627 | bool requires_current_method_; |
| 628 | |
David Srbecky | c6b4dd8 | 2015-04-07 20:32:43 +0100 | [diff] [blame] | 629 | friend class OptimizingCFITest; |
| 630 | |
Nicolas Geoffray | d4dd255 | 2014-02-28 10:23:58 +0000 | [diff] [blame] | 631 | DISALLOW_COPY_AND_ASSIGN(CodeGenerator); |
| 632 | }; |
| 633 | |
Nicolas Geoffray | 7fb49da | 2014-10-06 09:12:41 +0100 | [diff] [blame] | 634 | template <typename C, typename F> |
Nicolas Geoffray | 4a34a42 | 2014-04-03 10:38:37 +0100 | [diff] [blame] | 635 | class CallingConvention { |
| 636 | public: |
Nicolas Geoffray | 7fb49da | 2014-10-06 09:12:41 +0100 | [diff] [blame] | 637 | CallingConvention(const C* registers, |
| 638 | size_t number_of_registers, |
| 639 | const F* fpu_registers, |
Mathieu Chartier | e401d14 | 2015-04-22 13:56:20 -0700 | [diff] [blame] | 640 | size_t number_of_fpu_registers, |
| 641 | size_t pointer_size) |
Nicolas Geoffray | 7fb49da | 2014-10-06 09:12:41 +0100 | [diff] [blame] | 642 | : registers_(registers), |
| 643 | number_of_registers_(number_of_registers), |
| 644 | fpu_registers_(fpu_registers), |
Mathieu Chartier | e401d14 | 2015-04-22 13:56:20 -0700 | [diff] [blame] | 645 | number_of_fpu_registers_(number_of_fpu_registers), |
| 646 | pointer_size_(pointer_size) {} |
Nicolas Geoffray | 4a34a42 | 2014-04-03 10:38:37 +0100 | [diff] [blame] | 647 | |
| 648 | size_t GetNumberOfRegisters() const { return number_of_registers_; } |
Nicolas Geoffray | 7fb49da | 2014-10-06 09:12:41 +0100 | [diff] [blame] | 649 | size_t GetNumberOfFpuRegisters() const { return number_of_fpu_registers_; } |
Nicolas Geoffray | 4a34a42 | 2014-04-03 10:38:37 +0100 | [diff] [blame] | 650 | |
Nicolas Geoffray | 7fb49da | 2014-10-06 09:12:41 +0100 | [diff] [blame] | 651 | C GetRegisterAt(size_t index) const { |
Nicolas Geoffray | 4a34a42 | 2014-04-03 10:38:37 +0100 | [diff] [blame] | 652 | DCHECK_LT(index, number_of_registers_); |
| 653 | return registers_[index]; |
| 654 | } |
| 655 | |
Nicolas Geoffray | 7fb49da | 2014-10-06 09:12:41 +0100 | [diff] [blame] | 656 | F GetFpuRegisterAt(size_t index) const { |
| 657 | DCHECK_LT(index, number_of_fpu_registers_); |
| 658 | return fpu_registers_[index]; |
| 659 | } |
| 660 | |
| 661 | size_t GetStackOffsetOf(size_t index) const { |
Nicolas Geoffray | 4a34a42 | 2014-04-03 10:38:37 +0100 | [diff] [blame] | 662 | // We still reserve the space for parameters passed by registers. |
Mathieu Chartier | e401d14 | 2015-04-22 13:56:20 -0700 | [diff] [blame] | 663 | // Add space for the method pointer. |
| 664 | return pointer_size_ + index * kVRegSize; |
Nicolas Geoffray | 4a34a42 | 2014-04-03 10:38:37 +0100 | [diff] [blame] | 665 | } |
| 666 | |
| 667 | private: |
Nicolas Geoffray | 7fb49da | 2014-10-06 09:12:41 +0100 | [diff] [blame] | 668 | const C* registers_; |
Nicolas Geoffray | 4a34a42 | 2014-04-03 10:38:37 +0100 | [diff] [blame] | 669 | const size_t number_of_registers_; |
Nicolas Geoffray | 7fb49da | 2014-10-06 09:12:41 +0100 | [diff] [blame] | 670 | const F* fpu_registers_; |
| 671 | const size_t number_of_fpu_registers_; |
Mathieu Chartier | e401d14 | 2015-04-22 13:56:20 -0700 | [diff] [blame] | 672 | const size_t pointer_size_; |
Nicolas Geoffray | 4a34a42 | 2014-04-03 10:38:37 +0100 | [diff] [blame] | 673 | |
| 674 | DISALLOW_COPY_AND_ASSIGN(CallingConvention); |
| 675 | }; |
| 676 | |
Aart Bik | 42249c3 | 2016-01-07 15:33:50 -0800 | [diff] [blame^] | 677 | /** |
| 678 | * A templated class SlowPathGenerator with a templated method NewSlowPath() |
| 679 | * that can be used by any code generator to share equivalent slow-paths with |
| 680 | * the objective of reducing generated code size. |
| 681 | * |
| 682 | * InstructionType: instruction that requires SlowPathCodeType |
| 683 | * SlowPathCodeType: subclass of SlowPathCode, with constructor SlowPathCodeType(InstructionType *) |
| 684 | */ |
| 685 | template <typename InstructionType> |
| 686 | class SlowPathGenerator { |
| 687 | static_assert(std::is_base_of<HInstruction, InstructionType>::value, |
| 688 | "InstructionType is not a subclass of art::HInstruction"); |
| 689 | |
| 690 | public: |
| 691 | SlowPathGenerator(HGraph* graph, CodeGenerator* codegen) |
| 692 | : graph_(graph), |
| 693 | codegen_(codegen), |
| 694 | slow_path_map_(std::less<uint32_t>(), graph->GetArena()->Adapter(kArenaAllocSlowPaths)) {} |
| 695 | |
| 696 | // Creates and adds a new slow-path, if needed, or returns existing one otherwise. |
| 697 | // Templating the method (rather than the whole class) on the slow-path type enables |
| 698 | // keeping this code at a generic, non architecture-specific place. |
| 699 | // |
| 700 | // NOTE: This approach assumes each InstructionType only generates one SlowPathCodeType. |
| 701 | // To relax this requirement, we would need some RTTI on the stored slow-paths, |
| 702 | // or template the class as a whole on SlowPathType. |
| 703 | template <typename SlowPathCodeType> |
| 704 | SlowPathCodeType* NewSlowPath(InstructionType* instruction) { |
| 705 | static_assert(std::is_base_of<SlowPathCode, SlowPathCodeType>::value, |
| 706 | "SlowPathCodeType is not a subclass of art::SlowPathCode"); |
| 707 | static_assert(std::is_constructible<SlowPathCodeType, InstructionType*>::value, |
| 708 | "SlowPathCodeType is not constructible from InstructionType*"); |
| 709 | // Iterate over potential candidates for sharing. Currently, only same-typed |
| 710 | // slow-paths with exactly the same dex-pc are viable candidates. |
| 711 | // TODO: pass dex-pc/slow-path-type to run-time to allow even more sharing? |
| 712 | const uint32_t dex_pc = instruction->GetDexPc(); |
| 713 | auto iter = slow_path_map_.find(dex_pc); |
| 714 | if (iter != slow_path_map_.end()) { |
| 715 | auto candidates = iter->second; |
| 716 | for (const auto& it : candidates) { |
| 717 | InstructionType* other_instruction = it.first; |
| 718 | SlowPathCodeType* other_slow_path = down_cast<SlowPathCodeType*>(it.second); |
| 719 | // Determine if the instructions allow for slow-path sharing. |
| 720 | if (HaveSameLiveRegisters(instruction, other_instruction) && |
| 721 | HaveSameStackMap(instruction, other_instruction)) { |
| 722 | // Can share: reuse existing one. |
| 723 | return other_slow_path; |
| 724 | } |
| 725 | } |
| 726 | } else { |
| 727 | // First time this dex-pc is seen. |
| 728 | iter = slow_path_map_.Put(dex_pc, {{}, {graph_->GetArena()->Adapter(kArenaAllocSlowPaths)}}); |
| 729 | } |
| 730 | // Cannot share: create and add new slow-path for this particular dex-pc. |
| 731 | SlowPathCodeType* slow_path = new (graph_->GetArena()) SlowPathCodeType(instruction); |
| 732 | iter->second.emplace_back(std::make_pair(instruction, slow_path)); |
| 733 | codegen_->AddSlowPath(slow_path); |
| 734 | return slow_path; |
| 735 | } |
| 736 | |
| 737 | private: |
| 738 | // Tests if both instructions have same set of live physical registers. This ensures |
| 739 | // the slow-path has exactly the same preamble on saving these registers to stack. |
| 740 | bool HaveSameLiveRegisters(const InstructionType* i1, const InstructionType* i2) const { |
| 741 | const uint32_t core_spill = ~codegen_->GetCoreSpillMask(); |
| 742 | const uint32_t fpu_spill = ~codegen_->GetFpuSpillMask(); |
| 743 | RegisterSet* live1 = i1->GetLocations()->GetLiveRegisters(); |
| 744 | RegisterSet* live2 = i2->GetLocations()->GetLiveRegisters(); |
| 745 | return (((live1->GetCoreRegisters() & core_spill) == |
| 746 | (live2->GetCoreRegisters() & core_spill)) && |
| 747 | ((live1->GetFloatingPointRegisters() & fpu_spill) == |
| 748 | (live2->GetFloatingPointRegisters() & fpu_spill))); |
| 749 | } |
| 750 | |
| 751 | // Tests if both instructions have the same stack map. This ensures the interpreter |
| 752 | // will find exactly the same dex-registers at the same entries. |
| 753 | bool HaveSameStackMap(const InstructionType* i1, const InstructionType* i2) const { |
| 754 | DCHECK(i1->HasEnvironment()); |
| 755 | DCHECK(i2->HasEnvironment()); |
| 756 | // We conservatively test if the two instructions find exactly the same instructions |
| 757 | // and location in each dex-register. This guarantees they will have the same stack map. |
| 758 | HEnvironment* e1 = i1->GetEnvironment(); |
| 759 | HEnvironment* e2 = i2->GetEnvironment(); |
| 760 | if (e1->GetParent() != e2->GetParent() || e1->Size() != e2->Size()) { |
| 761 | return false; |
| 762 | } |
| 763 | for (size_t i = 0, sz = e1->Size(); i < sz; ++i) { |
| 764 | if (e1->GetInstructionAt(i) != e2->GetInstructionAt(i) || |
| 765 | !e1->GetLocationAt(i).Equals(e2->GetLocationAt(i))) { |
| 766 | return false; |
| 767 | } |
| 768 | } |
| 769 | return true; |
| 770 | } |
| 771 | |
| 772 | HGraph* const graph_; |
| 773 | CodeGenerator* const codegen_; |
| 774 | |
| 775 | // Map from dex-pc to vector of already existing instruction/slow-path pairs. |
| 776 | ArenaSafeMap<uint32_t, ArenaVector<std::pair<InstructionType*, SlowPathCode*>>> slow_path_map_; |
| 777 | |
| 778 | DISALLOW_COPY_AND_ASSIGN(SlowPathGenerator); |
| 779 | }; |
| 780 | |
| 781 | class InstructionCodeGenerator : public HGraphVisitor { |
| 782 | public: |
| 783 | InstructionCodeGenerator(HGraph* graph, CodeGenerator* codegen) |
| 784 | : HGraphVisitor(graph), |
| 785 | deopt_slow_paths_(graph, codegen) {} |
| 786 | |
| 787 | protected: |
| 788 | // Add slow-path generator for each instruction/slow-path combination that desires sharing. |
| 789 | // TODO: under current regime, only deopt sharing make sense; extend later. |
| 790 | SlowPathGenerator<HDeoptimize> deopt_slow_paths_; |
| 791 | }; |
| 792 | |
Nicolas Geoffray | d4dd255 | 2014-02-28 10:23:58 +0000 | [diff] [blame] | 793 | } // namespace art |
| 794 | |
| 795 | #endif // ART_COMPILER_OPTIMIZING_CODE_GENERATOR_H_ |