blob: 5958cd89bc16cc633e1fdd7d3a4143cdb17f817e [file] [log] [blame]
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +00001/*
2 * Copyright (C) 2014 The Android Open Source Project
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 * http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
16
17#ifndef ART_COMPILER_OPTIMIZING_CODE_GENERATOR_H_
18#define ART_COMPILER_OPTIMIZING_CODE_GENERATOR_H_
19
Ian Rogersd582fa42014-11-05 23:46:43 -080020#include "arch/instruction_set.h"
Calin Juravle34166012014-12-19 17:22:29 +000021#include "arch/instruction_set_features.h"
Vladimir Markof9f64412015-09-02 14:05:49 +010022#include "base/arena_containers.h"
23#include "base/arena_object.h"
Nicolas Geoffray01bc96d2014-04-11 17:43:50 +010024#include "base/bit_field.h"
Nicolas Geoffrayd28b9692015-11-04 14:36:55 +000025#include "compiled_method.h"
Calin Juravlecd6dffe2015-01-08 17:35:35 +000026#include "driver/compiler_options.h"
Nicolas Geoffraybab4ed72014-03-11 17:53:17 +000027#include "globals.h"
Alexandre Rameseb7b7392015-06-19 14:47:01 +010028#include "graph_visualizer.h"
Nicolas Geoffray4e3d23a2014-05-22 18:32:45 +010029#include "locations.h"
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +000030#include "memory_region.h"
31#include "nodes.h"
Serban Constantinescuecc43662015-08-13 13:33:12 +010032#include "optimizing_compiler_stats.h"
Nicolas Geoffray39468442014-09-02 15:17:15 +010033#include "stack_map_stream.h"
Andreas Gampe85b62f22015-09-09 13:15:38 -070034#include "utils/label.h"
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +000035
36namespace art {
37
// Binary encoding of 2^32 for type double.
static constexpr int64_t k2Pow32EncodingForDouble = INT64_C(0x41F0000000000000);
// Binary encoding of 2^31 for type double.
static constexpr int64_t k2Pow31EncodingForDouble = INT64_C(0x41E0000000000000);

// Minimum value for a primitive integer. Spelled with the <cstdint> limit
// macro: the literal 0x80000000 is unsigned and does not fit in an int32_t,
// so initializing from it relies on an out-of-range conversion.
static constexpr int32_t kPrimIntMin = INT32_MIN;
// Minimum value for a primitive long (same reasoning as for kPrimIntMin).
static constexpr int64_t kPrimLongMin = INT64_MIN;

// Maximum value for a primitive integer.
static constexpr int32_t kPrimIntMax = INT32_MAX;
// Maximum value for a primitive long.
static constexpr int64_t kPrimLongMax = INT64_MAX;
Roland Levillain3f8f9362014-12-02 17:45:01 +000052
Nicolas Geoffray92a73ae2014-10-16 11:12:52 +010053class Assembler;
Nicolas Geoffraye5038322014-07-04 09:41:32 +010054class CodeGenerator;
Nicolas Geoffrayd28b9692015-11-04 14:36:55 +000055class CompilerDriver;
Vladimir Marko58155012015-08-19 12:49:41 +000056class LinkerPatch;
Nicolas Geoffrayf0e39372014-11-12 17:50:07 +000057class ParallelMoveResolver;
Nicolas Geoffray92cf83e2014-03-18 17:59:20 +000058
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +000059class CodeAllocator {
60 public:
Nicolas Geoffraye5038322014-07-04 09:41:32 +010061 CodeAllocator() {}
62 virtual ~CodeAllocator() {}
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +000063
64 virtual uint8_t* Allocate(size_t size) = 0;
65
66 private:
67 DISALLOW_COPY_AND_ASSIGN(CodeAllocator);
68};
69
Ian Rogers6a3c1fc2014-10-31 00:33:20 -070070class SlowPathCode : public ArenaObject<kArenaAllocSlowPaths> {
Nicolas Geoffraye5038322014-07-04 09:41:32 +010071 public:
Nicolas Geoffrayeeefa122015-03-13 18:52:59 +000072 SlowPathCode() {
73 for (size_t i = 0; i < kMaximumNumberOfExpectedRegisters; ++i) {
74 saved_core_stack_offsets_[i] = kRegisterNotSaved;
75 saved_fpu_stack_offsets_[i] = kRegisterNotSaved;
76 }
77 }
78
Nicolas Geoffraye5038322014-07-04 09:41:32 +010079 virtual ~SlowPathCode() {}
80
Nicolas Geoffraye5038322014-07-04 09:41:32 +010081 virtual void EmitNativeCode(CodeGenerator* codegen) = 0;
82
Zheng Xuda403092015-04-24 17:35:39 +080083 virtual void SaveLiveRegisters(CodeGenerator* codegen, LocationSummary* locations);
84 virtual void RestoreLiveRegisters(CodeGenerator* codegen, LocationSummary* locations);
Nicolas Geoffraya8ac9132015-03-13 16:36:36 +000085
Nicolas Geoffrayeeefa122015-03-13 18:52:59 +000086 bool IsCoreRegisterSaved(int reg) const {
87 return saved_core_stack_offsets_[reg] != kRegisterNotSaved;
88 }
89
90 bool IsFpuRegisterSaved(int reg) const {
91 return saved_fpu_stack_offsets_[reg] != kRegisterNotSaved;
92 }
93
94 uint32_t GetStackOffsetOfCoreRegister(int reg) const {
95 return saved_core_stack_offsets_[reg];
96 }
97
98 uint32_t GetStackOffsetOfFpuRegister(int reg) const {
99 return saved_fpu_stack_offsets_[reg];
100 }
101
Alexandre Rames8158f282015-08-07 10:26:17 +0100102 virtual bool IsFatal() const { return false; }
103
Alexandre Rames9931f312015-06-19 14:47:01 +0100104 virtual const char* GetDescription() const = 0;
105
Andreas Gampe85b62f22015-09-09 13:15:38 -0700106 Label* GetEntryLabel() { return &entry_label_; }
107 Label* GetExitLabel() { return &exit_label_; }
108
Zheng Xuda403092015-04-24 17:35:39 +0800109 protected:
Nicolas Geoffrayeeefa122015-03-13 18:52:59 +0000110 static constexpr size_t kMaximumNumberOfExpectedRegisters = 32;
111 static constexpr uint32_t kRegisterNotSaved = -1;
112 uint32_t saved_core_stack_offsets_[kMaximumNumberOfExpectedRegisters];
113 uint32_t saved_fpu_stack_offsets_[kMaximumNumberOfExpectedRegisters];
Zheng Xuda403092015-04-24 17:35:39 +0800114
115 private:
Andreas Gampe85b62f22015-09-09 13:15:38 -0700116 Label entry_label_;
117 Label exit_label_;
118
Nicolas Geoffraye5038322014-07-04 09:41:32 +0100119 DISALLOW_COPY_AND_ASSIGN(SlowPathCode);
120};
121
Roland Levillain2d27c8e2015-04-28 15:48:45 +0100122class InvokeDexCallingConventionVisitor {
123 public:
124 virtual Location GetNextLocation(Primitive::Type type) = 0;
Nicolas Geoffrayfd88f162015-06-03 11:23:52 +0100125 virtual Location GetReturnLocation(Primitive::Type type) const = 0;
126 virtual Location GetMethodLocation() const = 0;
Roland Levillain2d27c8e2015-04-28 15:48:45 +0100127
128 protected:
129 InvokeDexCallingConventionVisitor() {}
130 virtual ~InvokeDexCallingConventionVisitor() {}
131
132 // The current index for core registers.
133 uint32_t gp_index_ = 0u;
134 // The current index for floating-point registers.
135 uint32_t float_index_ = 0u;
136 // The current stack index.
137 uint32_t stack_index_ = 0u;
138
139 private:
140 DISALLOW_COPY_AND_ASSIGN(InvokeDexCallingConventionVisitor);
141};
142
Calin Juravlee460d1d2015-09-29 04:52:17 +0100143class FieldAccessCallingConvention {
144 public:
145 virtual Location GetObjectLocation() const = 0;
146 virtual Location GetFieldIndexLocation() const = 0;
147 virtual Location GetReturnLocation(Primitive::Type type) const = 0;
148 virtual Location GetSetValueLocation(Primitive::Type type, bool is_instance) const = 0;
149 virtual Location GetFpuLocation(Primitive::Type type) const = 0;
150 virtual ~FieldAccessCallingConvention() {}
151
152 protected:
153 FieldAccessCallingConvention() {}
154
155 private:
156 DISALLOW_COPY_AND_ASSIGN(FieldAccessCallingConvention);
157};
158
Nicolas Geoffray12df9eb2015-01-09 14:53:50 +0000159class CodeGenerator {
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000160 public:
// Compiles the graph to executable instructions. Note that these entry points
// return void, so they do not report to the caller whether compilation succeeded.
Nicolas Geoffray73e80c32014-07-22 17:47:56 +0100163 void CompileBaseline(CodeAllocator* allocator, bool is_leaf = false);
Nicolas Geoffray86dbb9a2014-06-04 11:12:39 +0100164 void CompileOptimized(CodeAllocator* allocator);
Nicolas Geoffray12df9eb2015-01-09 14:53:50 +0000165 static CodeGenerator* Create(HGraph* graph,
Calin Juravle34166012014-12-19 17:22:29 +0000166 InstructionSet instruction_set,
Calin Juravlecd6dffe2015-01-08 17:35:35 +0000167 const InstructionSetFeatures& isa_features,
Serban Constantinescuecc43662015-08-13 13:33:12 +0100168 const CompilerOptions& compiler_options,
169 OptimizingCompilerStats* stats = nullptr);
Nicolas Geoffray12df9eb2015-01-09 14:53:50 +0000170 virtual ~CodeGenerator() {}
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000171
Vladimir Markodc151b22015-10-15 18:02:30 +0100172 // Get the graph. This is the outermost graph, never the graph of a method being inlined.
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000173 HGraph* GetGraph() const { return graph_; }
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000174
Nicolas Geoffraydc23d832015-02-16 11:15:43 +0000175 HBasicBlock* GetNextBlockToEmit() const;
176 HBasicBlock* FirstNonEmptyBlock(HBasicBlock* block) const;
Nicolas Geoffraybab4ed72014-03-11 17:53:17 +0000177 bool GoesToNextBlock(HBasicBlock* current, HBasicBlock* next) const;
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000178
Nicolas Geoffray86dbb9a2014-06-04 11:12:39 +0100179 size_t GetStackSlotOfParameter(HParameterValue* parameter) const {
180 // Note that this follows the current calling convention.
181 return GetFrameSize()
Mathieu Chartiere401d142015-04-22 13:56:20 -0700182 + InstructionSetPointerSize(GetInstructionSet()) // Art method
Nicolas Geoffraye27f31a2014-06-12 17:53:14 +0100183 + parameter->GetIndex() * kVRegSize;
Nicolas Geoffray86dbb9a2014-06-04 11:12:39 +0100184 }
185
Nicolas Geoffray92a73ae2014-10-16 11:12:52 +0100186 virtual void Initialize() = 0;
Serban Constantinescu32f5b4d2014-11-25 20:05:46 +0000187 virtual void Finalize(CodeAllocator* allocator);
Vladimir Marko58155012015-08-19 12:49:41 +0000188 virtual void EmitLinkerPatches(ArenaVector<LinkerPatch>* linker_patches);
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000189 virtual void GenerateFrameEntry() = 0;
190 virtual void GenerateFrameExit() = 0;
Nicolas Geoffray92a73ae2014-10-16 11:12:52 +0100191 virtual void Bind(HBasicBlock* block) = 0;
Nicolas Geoffray4a34a422014-04-03 10:38:37 +0100192 virtual void Move(HInstruction* instruction, Location location, HInstruction* move_for) = 0;
Calin Juravle175dc732015-08-25 15:42:32 +0100193 virtual void MoveConstant(Location destination, int32_t value) = 0;
Calin Juravlee460d1d2015-09-29 04:52:17 +0100194 virtual void MoveLocation(Location dst, Location src, Primitive::Type dst_type) = 0;
195 virtual void AddLocationAsTemp(Location location, LocationSummary* locations) = 0;
196
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000197 virtual Assembler* GetAssembler() = 0;
Alexandre Rameseb7b7392015-06-19 14:47:01 +0100198 virtual const Assembler& GetAssembler() const = 0;
Nicolas Geoffray707c8092014-04-04 10:50:14 +0100199 virtual size_t GetWordSize() const = 0;
Mark Mendellf85a9ca2015-01-13 09:20:58 -0500200 virtual size_t GetFloatingPointSpillSlotSize() const = 0;
Nicolas Geoffrayde58ab22014-11-05 12:46:03 +0000201 virtual uintptr_t GetAddressOf(HBasicBlock* block) const = 0;
Nicolas Geoffray4c204ba2015-02-03 15:12:35 +0000202 void InitializeCodeGeneration(size_t number_of_spill_slots,
203 size_t maximum_number_of_live_core_registers,
Roland Levillain0d5a2812015-11-13 10:07:31 +0000204 size_t maximum_number_of_live_fpu_registers,
Nicolas Geoffray4c204ba2015-02-03 15:12:35 +0000205 size_t number_of_out_slots,
Vladimir Markofa6b93c2015-09-15 10:15:55 +0100206 const ArenaVector<HBasicBlock*>& block_order);
Nicolas Geoffrayab032bc2014-07-15 12:55:21 +0100207 int32_t GetStackSlot(HLocal* local) const;
208 Location GetTemporaryLocation(HTemporary* temp) const;
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000209
210 uint32_t GetFrameSize() const { return frame_size_; }
211 void SetFrameSize(uint32_t size) { frame_size_ = size; }
Nicolas Geoffray8ccc3f52014-03-19 10:34:11 +0000212 uint32_t GetCoreSpillMask() const { return core_spill_mask_; }
Nicolas Geoffrayd97dc402015-01-22 13:50:01 +0000213 uint32_t GetFpuSpillMask() const { return fpu_spill_mask_; }
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000214
Nicolas Geoffray71175b72014-10-09 22:13:55 +0100215 size_t GetNumberOfCoreRegisters() const { return number_of_core_registers_; }
216 size_t GetNumberOfFloatingPointRegisters() const { return number_of_fpu_registers_; }
Nicolas Geoffray98893962015-01-21 12:32:32 +0000217 virtual void SetupBlockedRegisters(bool is_baseline) const = 0;
Nicolas Geoffray71175b72014-10-09 22:13:55 +0100218
Nicolas Geoffray4dee6362015-01-23 18:23:14 +0000219 virtual void ComputeSpillMask() {
220 core_spill_mask_ = allocated_registers_.GetCoreRegisters() & core_callee_save_mask_;
221 DCHECK_NE(core_spill_mask_, 0u) << "At least the return address register must be saved";
222 fpu_spill_mask_ = allocated_registers_.GetFloatingPointRegisters() & fpu_callee_save_mask_;
223 }
224
// Builds a bit mask with bit `registers[i]` set for each of the first `length`
// entries of `registers`. Returns 0 when `length` is 0.
// Every register number must be in [0, 31]. The shift is performed on an
// unsigned 32-bit one so that register 31 does not overflow a signed int.
static uint32_t ComputeRegisterMask(const int* registers, size_t length) {
  uint32_t mask = 0u;
  for (size_t i = 0; i != length; ++i) {
    mask |= UINT32_C(1) << registers[i];
  }
  return mask;
}
232
Nicolas Geoffraya7062e02014-05-22 12:50:17 +0100233 virtual void DumpCoreRegister(std::ostream& stream, int reg) const = 0;
234 virtual void DumpFloatingPointRegister(std::ostream& stream, int reg) const = 0;
Nicolas Geoffray412f10c2014-06-19 10:00:34 +0100235 virtual InstructionSet GetInstructionSet() const = 0;
Calin Juravlecd6dffe2015-01-08 17:35:35 +0000236
237 const CompilerOptions& GetCompilerOptions() const { return compiler_options_; }
238
Serban Constantinescuecc43662015-08-13 13:33:12 +0100239 void MaybeRecordStat(MethodCompilationStat compilation_stat, size_t count = 1) const;
240
Nicolas Geoffray102cbed2014-10-15 18:31:05 +0100241 // Saves the register in the stack. Returns the size taken on stack.
242 virtual size_t SaveCoreRegister(size_t stack_index, uint32_t reg_id) = 0;
243 // Restores the register from the stack. Returns the size taken on stack.
244 virtual size_t RestoreCoreRegister(size_t stack_index, uint32_t reg_id) = 0;
Nicolas Geoffray234d69d2015-03-09 10:28:50 +0000245
246 virtual size_t SaveFloatingPointRegister(size_t stack_index, uint32_t reg_id) = 0;
247 virtual size_t RestoreFloatingPointRegister(size_t stack_index, uint32_t reg_id) = 0;
248
Nicolas Geoffray840e5462015-01-07 16:01:24 +0000249 virtual bool NeedsTwoRegisters(Primitive::Type type) const = 0;
Nicolas Geoffray234d69d2015-03-09 10:28:50 +0000250 // Returns whether we should split long moves in parallel moves.
251 virtual bool ShouldSplitLongMoves() const { return false; }
Nicolas Geoffraya7062e02014-05-22 12:50:17 +0100252
Roland Levillain0d5a2812015-11-13 10:07:31 +0000253 size_t GetNumberOfCoreCalleeSaveRegisters() const {
254 return POPCOUNT(core_callee_save_mask_);
255 }
256
257 size_t GetNumberOfCoreCallerSaveRegisters() const {
258 DCHECK_GE(GetNumberOfCoreRegisters(), GetNumberOfCoreCalleeSaveRegisters());
259 return GetNumberOfCoreRegisters() - GetNumberOfCoreCalleeSaveRegisters();
260 }
261
Nicolas Geoffray98893962015-01-21 12:32:32 +0000262 bool IsCoreCalleeSaveRegister(int reg) const {
263 return (core_callee_save_mask_ & (1 << reg)) != 0;
264 }
265
266 bool IsFloatingPointCalleeSaveRegister(int reg) const {
267 return (fpu_callee_save_mask_ & (1 << reg)) != 0;
268 }
269
Yevgeny Rouban2a7c1ef2015-07-22 18:36:24 +0600270 // Record native to dex mapping for a suspend point. Required by runtime.
Nicolas Geoffrayeeefa122015-03-13 18:52:59 +0000271 void RecordPcInfo(HInstruction* instruction, uint32_t dex_pc, SlowPathCode* slow_path = nullptr);
David Srbeckyb7070a22016-01-08 18:13:53 +0000272 // Check whether we have already recorded mapping at this PC.
273 bool HasStackMapAtCurrentPc();
Yevgeny Rouban2a7c1ef2015-07-22 18:36:24 +0600274
Calin Juravle77520bc2015-01-12 18:45:46 +0000275 bool CanMoveNullCheckToUser(HNullCheck* null_check);
276 void MaybeRecordImplicitNullCheck(HInstruction* instruction);
Nicolas Geoffray8ccc3f52014-03-19 10:34:11 +0000277
David Brazdil77a48ae2015-09-15 12:34:04 +0000278 // Records a stack map which the runtime might use to set catch phi values
279 // during exception delivery.
280 // TODO: Replace with a catch-entering instruction that records the environment.
281 void RecordCatchBlockInfo();
282
283 // Returns true if implicit null checks are allowed in the compiler options
284 // and if the null check is not inside a try block. We currently cannot do
285 // implicit null checks in that case because we need the NullCheckSlowPath to
286 // save live registers, which may be needed by the runtime to set catch phis.
287 bool IsImplicitNullCheckAllowed(HNullCheck* null_check) const;
288
Nicolas Geoffraye5038322014-07-04 09:41:32 +0100289 void AddSlowPath(SlowPathCode* slow_path) {
Vladimir Marko225b6462015-09-28 12:17:40 +0100290 slow_paths_.push_back(slow_path);
Nicolas Geoffraye5038322014-07-04 09:41:32 +0100291 }
292
Vladimir Markof9f64412015-09-02 14:05:49 +0100293 void BuildMappingTable(ArenaVector<uint8_t>* vector) const;
294 void BuildVMapTable(ArenaVector<uint8_t>* vector) const;
Nicolas Geoffray92cf83e2014-03-18 17:59:20 +0000295 void BuildNativeGCMap(
Nicolas Geoffrayd28b9692015-11-04 14:36:55 +0000296 ArenaVector<uint8_t>* vector, const CompilerDriver& compiler_driver) const;
297 void BuildStackMaps(MemoryRegion region);
298 size_t ComputeStackMapsSize();
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000299
Roland Levillain3e3d7332015-04-28 11:00:54 +0100300 bool IsBaseline() const {
301 return is_baseline_;
302 }
303
Nicolas Geoffrayf12feb82014-07-17 18:32:41 +0100304 bool IsLeafMethod() const {
305 return is_leaf_;
306 }
307
308 void MarkNotLeaf() {
309 is_leaf_ = false;
Nicolas Geoffrayc0572a42015-02-06 14:35:25 +0000310 requires_current_method_ = true;
311 }
312
313 void SetRequiresCurrentMethod() {
314 requires_current_method_ = true;
315 }
316
317 bool RequiresCurrentMethod() const {
318 return requires_current_method_;
Nicolas Geoffrayf12feb82014-07-17 18:32:41 +0100319 }
320
Nicolas Geoffray3c049742014-09-24 18:10:46 +0100321 // Clears the spill slots taken by loop phis in the `LocationSummary` of the
322 // suspend check. This is called when the code generator generates code
323 // for the suspend check at the back edge (instead of where the suspend check
324 // is, which is the loop entry). At this point, the spill slots for the phis
325 // have not been written to.
326 void ClearSpillSlotsFromLoopPhisInStackMap(HSuspendCheck* suspend_check) const;
327
Nicolas Geoffray71175b72014-10-09 22:13:55 +0100328 bool* GetBlockedCoreRegisters() const { return blocked_core_registers_; }
Nicolas Geoffray102cbed2014-10-15 18:31:05 +0100329 bool* GetBlockedFloatingPointRegisters() const { return blocked_fpu_registers_; }
Nicolas Geoffray71175b72014-10-09 22:13:55 +0100330
Nicolas Geoffray19a19cf2014-10-22 16:07:05 +0100331 // Helper that returns the pointer offset of an index in an object array.
332 // Note: this method assumes we always have the same pointer size, regardless
333 // of the architecture.
334 static size_t GetCacheOffset(uint32_t index);
Mathieu Chartiere401d142015-04-22 13:56:20 -0700335 // Pointer variant for ArtMethod and ArtField arrays.
336 size_t GetCachePointerOffset(uint32_t index);
Nicolas Geoffray19a19cf2014-10-22 16:07:05 +0100337
Nicolas Geoffray90218252015-04-15 11:56:51 +0100338 void EmitParallelMoves(Location from1,
339 Location to1,
340 Primitive::Type type1,
341 Location from2,
342 Location to2,
343 Primitive::Type type2);
Nicolas Geoffrayf0e39372014-11-12 17:50:07 +0000344
Nicolas Geoffrayaf07bc12014-11-12 18:08:09 +0000345 static bool StoreNeedsWriteBarrier(Primitive::Type type, HInstruction* value) {
David Brazdil522e2242015-03-17 18:48:28 +0000346 // Check that null value is not represented as an integer constant.
347 DCHECK(type != Primitive::kPrimNot || !value->IsIntConstant());
348 return type == Primitive::kPrimNot && !value->IsNullConstant();
Nicolas Geoffrayaf07bc12014-11-12 18:08:09 +0000349 }
350
Alexandre Rames78e3ef62015-08-12 13:43:29 +0100351 void ValidateInvokeRuntime(HInstruction* instruction, SlowPathCode* slow_path);
352
Nicolas Geoffray98893962015-01-21 12:32:32 +0000353 void AddAllocatedRegister(Location location) {
354 allocated_registers_.Add(location);
355 }
356
Nicolas Geoffray45b83af2015-07-06 15:12:53 +0000357 bool HasAllocatedRegister(bool is_core, int reg) const {
358 return is_core
359 ? allocated_registers_.ContainsCoreRegister(reg)
360 : allocated_registers_.ContainsFloatingPointRegister(reg);
361 }
362
Nicolas Geoffrayc0572a42015-02-06 14:35:25 +0000363 void AllocateLocations(HInstruction* instruction);
364
Roland Levillainaa9b7c42015-02-17 15:40:09 +0000365 // Tells whether the stack frame of the compiled method is
366 // considered "empty", that is either actually having a size of zero,
367 // or just containing the saved return address register.
368 bool HasEmptyFrame() const {
369 return GetFrameSize() == (CallPushesPC() ? GetWordSize() : 0);
370 }
371
Nicolas Geoffrayd6138ef2015-02-18 14:48:53 +0000372 static int32_t GetInt32ValueOf(HConstant* constant) {
373 if (constant->IsIntConstant()) {
374 return constant->AsIntConstant()->GetValue();
375 } else if (constant->IsNullConstant()) {
376 return 0;
377 } else {
378 DCHECK(constant->IsFloatConstant());
Roland Levillainda4d79b2015-03-24 14:36:11 +0000379 return bit_cast<int32_t, float>(constant->AsFloatConstant()->GetValue());
Nicolas Geoffrayd6138ef2015-02-18 14:48:53 +0000380 }
381 }
382
383 static int64_t GetInt64ValueOf(HConstant* constant) {
384 if (constant->IsIntConstant()) {
385 return constant->AsIntConstant()->GetValue();
386 } else if (constant->IsNullConstant()) {
387 return 0;
388 } else if (constant->IsFloatConstant()) {
Roland Levillainda4d79b2015-03-24 14:36:11 +0000389 return bit_cast<int32_t, float>(constant->AsFloatConstant()->GetValue());
Nicolas Geoffrayd6138ef2015-02-18 14:48:53 +0000390 } else if (constant->IsLongConstant()) {
391 return constant->AsLongConstant()->GetValue();
392 } else {
393 DCHECK(constant->IsDoubleConstant());
Roland Levillainda4d79b2015-03-24 14:36:11 +0000394 return bit_cast<int64_t, double>(constant->AsDoubleConstant()->GetValue());
Nicolas Geoffrayd6138ef2015-02-18 14:48:53 +0000395 }
396 }
397
Nicolas Geoffraya8ac9132015-03-13 16:36:36 +0000398 size_t GetFirstRegisterSlotInSlowPath() const {
399 return first_register_slot_in_slow_path_;
400 }
401
402 uint32_t FrameEntrySpillSize() const {
403 return GetFpuSpillSize() + GetCoreSpillSize();
404 }
405
Roland Levillainec525fc2015-04-28 15:50:20 +0100406 virtual ParallelMoveResolver* GetMoveResolver() = 0;
Nicolas Geoffraya8ac9132015-03-13 16:36:36 +0000407
Nicolas Geoffrayfd88f162015-06-03 11:23:52 +0100408 static void CreateCommonInvokeLocationSummary(
409 HInvoke* invoke, InvokeDexCallingConventionVisitor* visitor);
410
Calin Juravle175dc732015-08-25 15:42:32 +0100411 void GenerateInvokeUnresolvedRuntimeCall(HInvokeUnresolved* invoke);
412
Calin Juravlee460d1d2015-09-29 04:52:17 +0100413 void CreateUnresolvedFieldLocationSummary(
414 HInstruction* field_access,
415 Primitive::Type field_type,
416 const FieldAccessCallingConvention& calling_convention);
417
418 void GenerateUnresolvedFieldAccess(
419 HInstruction* field_access,
420 Primitive::Type field_type,
421 uint32_t field_index,
422 uint32_t dex_pc,
423 const FieldAccessCallingConvention& calling_convention);
424
Calin Juravle98893e12015-10-02 21:05:03 +0100425 // TODO: This overlaps a bit with MoveFromReturnRegister. Refactor for a better design.
426 static void CreateLoadClassLocationSummary(HLoadClass* cls,
427 Location runtime_type_index_location,
Roland Levillain0d5a2812015-11-13 10:07:31 +0000428 Location runtime_return_location,
429 bool code_generator_supports_read_barrier = false);
Calin Juravle98893e12015-10-02 21:05:03 +0100430
Nicolas Geoffray5bd05a52015-10-13 09:48:30 +0100431 static void CreateSystemArrayCopyLocationSummary(HInvoke* invoke);
432
Alexandre Rameseb7b7392015-06-19 14:47:01 +0100433 void SetDisassemblyInformation(DisassemblyInformation* info) { disasm_info_ = info; }
434 DisassemblyInformation* GetDisassemblyInformation() const { return disasm_info_; }
435
Calin Juravle175dc732015-08-25 15:42:32 +0100436 virtual void InvokeRuntime(QuickEntrypointEnum entrypoint,
437 HInstruction* instruction,
438 uint32_t dex_pc,
439 SlowPathCode* slow_path) = 0;
440
Vladimir Markodc151b22015-10-15 18:02:30 +0100441 // Check if the desired_dispatch_info is supported. If it is, return it,
442 // otherwise return a fall-back info that should be used instead.
443 virtual HInvokeStaticOrDirect::DispatchInfo GetSupportedInvokeStaticOrDirectDispatch(
444 const HInvokeStaticOrDirect::DispatchInfo& desired_dispatch_info,
445 MethodReference target_method) = 0;
446
Andreas Gampe85b62f22015-09-09 13:15:38 -0700447 // Generate a call to a static or direct method.
448 virtual void GenerateStaticOrDirectCall(HInvokeStaticOrDirect* invoke, Location temp) = 0;
449 // Generate a call to a virtual method.
450 virtual void GenerateVirtualCall(HInvokeVirtual* invoke, Location temp) = 0;
451
452 // Copy the result of a call into the given target.
453 virtual void MoveFromReturnRegister(Location trg, Primitive::Type type) = 0;
454
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000455 protected:
Vladimir Marko58155012015-08-19 12:49:41 +0000456 // Method patch info used for recording locations of required linker patches and
457 // target methods. The target method can be used for various purposes, whether for
458 // patching the address of the method or the code pointer or a PC-relative call.
459 template <typename LabelType>
460 struct MethodPatchInfo {
461 explicit MethodPatchInfo(MethodReference m) : target_method(m), label() { }
462
463 MethodReference target_method;
464 LabelType label;
465 };
466
Nicolas Geoffray71175b72014-10-09 22:13:55 +0100467 CodeGenerator(HGraph* graph,
468 size_t number_of_core_registers,
469 size_t number_of_fpu_registers,
Calin Juravlecd6dffe2015-01-08 17:35:35 +0000470 size_t number_of_register_pairs,
Nicolas Geoffray98893962015-01-21 12:32:32 +0000471 uint32_t core_callee_save_mask,
472 uint32_t fpu_callee_save_mask,
Serban Constantinescuecc43662015-08-13 13:33:12 +0100473 const CompilerOptions& compiler_options,
474 OptimizingCompilerStats* stats)
Nicolas Geoffrayc0572a42015-02-06 14:35:25 +0000475 : frame_size_(0),
Nicolas Geoffray4361bef2014-08-20 04:59:12 +0100476 core_spill_mask_(0),
Nicolas Geoffrayd97dc402015-01-22 13:50:01 +0000477 fpu_spill_mask_(0),
Nicolas Geoffray3bca0df2014-09-19 11:01:00 +0100478 first_register_slot_in_slow_path_(0),
Vladimir Marko5233f932015-09-29 19:01:15 +0100479 blocked_core_registers_(graph->GetArena()->AllocArray<bool>(number_of_core_registers,
480 kArenaAllocCodeGenerator)),
481 blocked_fpu_registers_(graph->GetArena()->AllocArray<bool>(number_of_fpu_registers,
482 kArenaAllocCodeGenerator)),
483 blocked_register_pairs_(graph->GetArena()->AllocArray<bool>(number_of_register_pairs,
484 kArenaAllocCodeGenerator)),
Nicolas Geoffray71175b72014-10-09 22:13:55 +0100485 number_of_core_registers_(number_of_core_registers),
486 number_of_fpu_registers_(number_of_fpu_registers),
487 number_of_register_pairs_(number_of_register_pairs),
Nicolas Geoffray98893962015-01-21 12:32:32 +0000488 core_callee_save_mask_(core_callee_save_mask),
489 fpu_callee_save_mask_(fpu_callee_save_mask),
Vladimir Markocf93a5c2015-06-16 11:33:24 +0000490 stack_map_stream_(graph->GetArena()),
491 block_order_(nullptr),
Roland Levillain3e3d7332015-04-28 11:00:54 +0100492 is_baseline_(false),
Alexandre Rameseb7b7392015-06-19 14:47:01 +0100493 disasm_info_(nullptr),
Serban Constantinescuecc43662015-08-13 13:33:12 +0100494 stats_(stats),
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000495 graph_(graph),
Calin Juravlecd6dffe2015-01-08 17:35:35 +0000496 compiler_options_(compiler_options),
Vladimir Marko225b6462015-09-28 12:17:40 +0100497 slow_paths_(graph->GetArena()->Adapter(kArenaAllocCodeGenerator)),
Vladimir Marko0f7dca42015-11-02 14:36:43 +0000498 current_slow_path_(nullptr),
Nicolas Geoffray4c204ba2015-02-03 15:12:35 +0000499 current_block_index_(0),
Nicolas Geoffray39468442014-09-02 15:17:15 +0100500 is_leaf_(true),
Vladimir Marko225b6462015-09-28 12:17:40 +0100501 requires_current_method_(false) {
502 slow_paths_.reserve(8);
503 }
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000504
Nicolas Geoffraya7aca372014-04-28 17:47:12 +0100505 // Register allocation logic.
506 void AllocateRegistersLocally(HInstruction* instruction) const;
507
508 // Backend specific implementation for allocating a register.
Nicolas Geoffray71175b72014-10-09 22:13:55 +0100509 virtual Location AllocateFreeRegister(Primitive::Type type) const = 0;
Nicolas Geoffraya7aca372014-04-28 17:47:12 +0100510
Nicolas Geoffray71175b72014-10-09 22:13:55 +0100511 static size_t FindFreeEntry(bool* array, size_t length);
Nicolas Geoffray3c035032014-10-28 10:46:40 +0000512 static size_t FindTwoFreeConsecutiveAlignedEntries(bool* array, size_t length);
Nicolas Geoffraya7aca372014-04-28 17:47:12 +0100513
Nicolas Geoffraya7aca372014-04-28 17:47:12 +0100514 virtual Location GetStackLocation(HLoadLocal* load) const = 0;
515
Nicolas Geoffrayc0572a42015-02-06 14:35:25 +0000516 virtual HGraphVisitor* GetLocationBuilder() = 0;
517 virtual HGraphVisitor* GetInstructionVisitor() = 0;
Nicolas Geoffrayf0e39372014-11-12 17:50:07 +0000518
Nicolas Geoffrayd97dc402015-01-22 13:50:01 +0000519 // Returns the location of the first spilled entry for floating point registers,
520 // relative to the stack pointer.
521 uint32_t GetFpuSpillStart() const {
Nicolas Geoffrayd97dc402015-01-22 13:50:01 +0000522 return GetFrameSize() - FrameEntrySpillSize();
523 }
524
525 uint32_t GetFpuSpillSize() const {
526 return POPCOUNT(fpu_spill_mask_) * GetFloatingPointSpillSlotSize();
527 }
528
529 uint32_t GetCoreSpillSize() const {
530 return POPCOUNT(core_spill_mask_) * GetWordSize();
531 }
532
Nicolas Geoffrayc0572a42015-02-06 14:35:25 +0000533 bool HasAllocatedCalleeSaveRegisters() const {
534 // We check the core registers against 1 because it always comprises the return PC.
535 return (POPCOUNT(allocated_registers_.GetCoreRegisters() & core_callee_save_mask_) != 1)
536 || (POPCOUNT(allocated_registers_.GetFloatingPointRegisters() & fpu_callee_save_mask_) != 0);
537 }
538
539 bool CallPushesPC() const {
540 InstructionSet instruction_set = GetInstructionSet();
541 return instruction_set == kX86 || instruction_set == kX86_64;
542 }
543
Vladimir Marko225b6462015-09-28 12:17:40 +0100544 // Arm64 has its own type for a label, so we need to templatize these methods
Nicolas Geoffraydc23d832015-02-16 11:15:43 +0000545 // to share the logic.
Vladimir Marko225b6462015-09-28 12:17:40 +0100546
547 template <typename LabelType>
548 LabelType* CommonInitializeLabels() {
Vladimir Markob95fb772015-09-30 13:32:31 +0100549 // We use raw array allocations instead of ArenaVector<> because Labels are
550 // non-constructible and non-movable and as such cannot be held in a vector.
Vladimir Marko225b6462015-09-28 12:17:40 +0100551 size_t size = GetGraph()->GetBlocks().size();
552 LabelType* labels = GetGraph()->GetArena()->AllocArray<LabelType>(size,
553 kArenaAllocCodeGenerator);
554 for (size_t i = 0; i != size; ++i) {
555 new(labels + i) LabelType();
556 }
557 return labels;
558 }
559
Vladimir Marko58155012015-08-19 12:49:41 +0000560 template <typename LabelType>
561 LabelType* CommonGetLabelOf(LabelType* raw_pointer_to_labels_array, HBasicBlock* block) const {
Nicolas Geoffraydc23d832015-02-16 11:15:43 +0000562 block = FirstNonEmptyBlock(block);
563 return raw_pointer_to_labels_array + block->GetBlockId();
564 }
565
Vladimir Marko0f7dca42015-11-02 14:36:43 +0000566 SlowPathCode* GetCurrentSlowPath() {
567 return current_slow_path_;
568 }
569
Nicolas Geoffray8ccc3f52014-03-19 10:34:11 +0000570 // Frame size required for this method.
571 uint32_t frame_size_;
// Bit masks of the spilled core / floating-point registers. The core mask is
// bit-counted and multiplied by the word size by an accessor of this class.
// NOTE(review): presumably one bit per register id - confirm.
572 uint32_t core_spill_mask_;
Nicolas Geoffrayd97dc402015-01-22 13:50:01 +0000573 uint32_t fpu_spill_mask_;
// NOTE(review): presumably the first stack slot used to save live registers in
// slow paths - confirm against the users of this field.
Nicolas Geoffray3bca0df2014-09-19 11:01:00 +0100574 uint32_t first_register_slot_in_slow_path_;
Nicolas Geoffray8ccc3f52014-03-19 10:34:11 +0000575
Nicolas Geoffray98893962015-01-21 12:32:32 +0000576 // Registers that were allocated during linear scan.
577 RegisterSet allocated_registers_;
578
Nicolas Geoffray71175b72014-10-09 22:13:55 +0100579 // Arrays used when doing register allocation to know which
580 // registers we can allocate. `SetupBlockedRegisters` updates the
581 // arrays.
582 bool* const blocked_core_registers_;
583 bool* const blocked_fpu_registers_;
584 bool* const blocked_register_pairs_;
// NOTE(review): presumably the lengths of the three arrays above - confirm in
// the constructor.
585 size_t number_of_core_registers_;
586 size_t number_of_fpu_registers_;
587 size_t number_of_register_pairs_;
// Callee-save register masks; HasAllocatedCalleeSaveRegisters() intersects them
// with the register sets of `allocated_registers_`.
Nicolas Geoffray98893962015-01-21 12:32:32 +0000588 const uint32_t core_callee_save_mask_;
589 const uint32_t fpu_callee_save_mask_;
Nicolas Geoffray71175b72014-10-09 22:13:55 +0100590
Vladimir Markocf93a5c2015-06-16 11:33:24 +0000591 StackMapStream stack_map_stream_;
592
593 // The order to use for code generation.
Vladimir Markofa6b93c2015-09-15 10:15:55 +0100594 const ArenaVector<HBasicBlock*>* block_order_;
Vladimir Markocf93a5c2015-06-16 11:33:24 +0000595
Roland Levillain3e3d7332015-04-28 11:00:54 +0100596 // Whether we are using baseline.
597 bool is_baseline_;
598
// NOTE(review): raw pointer to disassembly information; ownership and nullness
// are not visible from this declaration - confirm against the code that sets it.
Alexandre Rameseb7b7392015-06-19 14:47:01 +0100599 DisassemblyInformation* disasm_info_;
600
Nicolas Geoffraybab4ed72014-03-11 17:53:17 +0000601 private:
// Private helpers; only declared here, their definitions live outside this header section.
Nicolas Geoffrayc0572a42015-02-06 14:35:25 +0000602 void InitLocationsBaseline(HInstruction* instruction);
Nicolas Geoffray3bca0df2014-09-19 11:01:00 +0100603 size_t GetStackOffsetOfSavedRegister(size_t index);
Alexandre Rameseb7b7392015-06-19 14:47:01 +0100604 void GenerateSlowPaths();
Nicolas Geoffray4c204ba2015-02-03 15:12:35 +0000605 void CompileInternal(CodeAllocator* allocator, bool is_baseline);
Mark Mendell5f874182015-03-04 15:42:45 -0500606 void BlockIfInRegister(Location location, bool is_out = false) const;
Nicolas Geoffrayb1d0f3f2015-05-14 12:41:51 +0100607 void EmitEnvironment(HEnvironment* environment, SlowPathCode* slow_path);
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000608
// NOTE(review): compilation statistics sink; whether it may be null is not
// visible from this declaration - confirm.
Serban Constantinescuecc43662015-08-13 13:33:12 +0100609 OptimizingCompilerStats* stats_;
610
// The graph being compiled and the compiler options in effect; neither can be
// re-seated after construction (const pointer / reference member).
Nicolas Geoffray787c3072014-03-17 10:20:19 +0000611 HGraph* const graph_;
Calin Juravlecd6dffe2015-01-08 17:35:35 +0000612 const CompilerOptions& compiler_options_;
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000613
// Slow paths known to this code generator.
// NOTE(review): presumably filled by AddSlowPath() and emitted by
// GenerateSlowPaths() - confirm.
Vladimir Marko225b6462015-09-28 12:17:40 +0100614 ArenaVector<SlowPathCode*> slow_paths_;
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000615
Aart Bik42249c32016-01-07 15:33:50 -0800616 // The current slow-path that we're generating code for.
Vladimir Marko0f7dca42015-11-02 14:36:43 +0000617 SlowPathCode* current_slow_path_;
618
Nicolas Geoffray4c204ba2015-02-03 15:12:35 +0000619 // The current block index in `block_order_` of the block
620 // we are generating code for.
621 size_t current_block_index_;
622
Nicolas Geoffrayc0572a42015-02-06 14:35:25 +0000623 // Whether the method is a leaf method.
Nicolas Geoffrayf12feb82014-07-17 18:32:41 +0100624 bool is_leaf_;
625
Nicolas Geoffrayc0572a42015-02-06 14:35:25 +0000626 // Whether an instruction in the graph accesses the current method.
627 bool requires_current_method_;
628
// Gives the CFI test access to the private members of this class.
David Srbeckyc6b4dd82015-04-07 20:32:43 +0100629 friend class OptimizingCFITest;
630
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000631 DISALLOW_COPY_AND_ASSIGN(CodeGenerator);
632};
633
Nicolas Geoffray7fb49da2014-10-06 09:12:41 +0100634template <typename C, typename F>
Nicolas Geoffray4a34a422014-04-03 10:38:37 +0100635class CallingConvention {
636 public:
Nicolas Geoffray7fb49da2014-10-06 09:12:41 +0100637 CallingConvention(const C* registers,
638 size_t number_of_registers,
639 const F* fpu_registers,
Mathieu Chartiere401d142015-04-22 13:56:20 -0700640 size_t number_of_fpu_registers,
641 size_t pointer_size)
Nicolas Geoffray7fb49da2014-10-06 09:12:41 +0100642 : registers_(registers),
643 number_of_registers_(number_of_registers),
644 fpu_registers_(fpu_registers),
Mathieu Chartiere401d142015-04-22 13:56:20 -0700645 number_of_fpu_registers_(number_of_fpu_registers),
646 pointer_size_(pointer_size) {}
Nicolas Geoffray4a34a422014-04-03 10:38:37 +0100647
648 size_t GetNumberOfRegisters() const { return number_of_registers_; }
Nicolas Geoffray7fb49da2014-10-06 09:12:41 +0100649 size_t GetNumberOfFpuRegisters() const { return number_of_fpu_registers_; }
Nicolas Geoffray4a34a422014-04-03 10:38:37 +0100650
Nicolas Geoffray7fb49da2014-10-06 09:12:41 +0100651 C GetRegisterAt(size_t index) const {
Nicolas Geoffray4a34a422014-04-03 10:38:37 +0100652 DCHECK_LT(index, number_of_registers_);
653 return registers_[index];
654 }
655
Nicolas Geoffray7fb49da2014-10-06 09:12:41 +0100656 F GetFpuRegisterAt(size_t index) const {
657 DCHECK_LT(index, number_of_fpu_registers_);
658 return fpu_registers_[index];
659 }
660
661 size_t GetStackOffsetOf(size_t index) const {
Nicolas Geoffray4a34a422014-04-03 10:38:37 +0100662 // We still reserve the space for parameters passed by registers.
Mathieu Chartiere401d142015-04-22 13:56:20 -0700663 // Add space for the method pointer.
664 return pointer_size_ + index * kVRegSize;
Nicolas Geoffray4a34a422014-04-03 10:38:37 +0100665 }
666
667 private:
Nicolas Geoffray7fb49da2014-10-06 09:12:41 +0100668 const C* registers_;
Nicolas Geoffray4a34a422014-04-03 10:38:37 +0100669 const size_t number_of_registers_;
Nicolas Geoffray7fb49da2014-10-06 09:12:41 +0100670 const F* fpu_registers_;
671 const size_t number_of_fpu_registers_;
Mathieu Chartiere401d142015-04-22 13:56:20 -0700672 const size_t pointer_size_;
Nicolas Geoffray4a34a422014-04-03 10:38:37 +0100673
674 DISALLOW_COPY_AND_ASSIGN(CallingConvention);
675};
676
Aart Bik42249c32016-01-07 15:33:50 -0800677/**
678 * A templated class SlowPathGenerator with a templated method NewSlowPath()
679 * that can be used by any code generator to share equivalent slow-paths with
680 * the objective of reducing generated code size.
681 *
682 * InstructionType: instruction that requires SlowPathCodeType
683 * SlowPathCodeType: subclass of SlowPathCode, with constructor SlowPathCodeType(InstructionType *)
684 */
685template <typename InstructionType>
686class SlowPathGenerator {
687 static_assert(std::is_base_of<HInstruction, InstructionType>::value,
688 "InstructionType is not a subclass of art::HInstruction");
689
690 public:
691 SlowPathGenerator(HGraph* graph, CodeGenerator* codegen)
692 : graph_(graph),
693 codegen_(codegen),
694 slow_path_map_(std::less<uint32_t>(), graph->GetArena()->Adapter(kArenaAllocSlowPaths)) {}
695
696 // Creates and adds a new slow-path, if needed, or returns existing one otherwise.
697 // Templating the method (rather than the whole class) on the slow-path type enables
698 // keeping this code at a generic, non architecture-specific place.
699 //
700 // NOTE: This approach assumes each InstructionType only generates one SlowPathCodeType.
701 // To relax this requirement, we would need some RTTI on the stored slow-paths,
702 // or template the class as a whole on SlowPathType.
703 template <typename SlowPathCodeType>
704 SlowPathCodeType* NewSlowPath(InstructionType* instruction) {
705 static_assert(std::is_base_of<SlowPathCode, SlowPathCodeType>::value,
706 "SlowPathCodeType is not a subclass of art::SlowPathCode");
707 static_assert(std::is_constructible<SlowPathCodeType, InstructionType*>::value,
708 "SlowPathCodeType is not constructible from InstructionType*");
709 // Iterate over potential candidates for sharing. Currently, only same-typed
710 // slow-paths with exactly the same dex-pc are viable candidates.
711 // TODO: pass dex-pc/slow-path-type to run-time to allow even more sharing?
712 const uint32_t dex_pc = instruction->GetDexPc();
713 auto iter = slow_path_map_.find(dex_pc);
714 if (iter != slow_path_map_.end()) {
715 auto candidates = iter->second;
716 for (const auto& it : candidates) {
717 InstructionType* other_instruction = it.first;
718 SlowPathCodeType* other_slow_path = down_cast<SlowPathCodeType*>(it.second);
719 // Determine if the instructions allow for slow-path sharing.
720 if (HaveSameLiveRegisters(instruction, other_instruction) &&
721 HaveSameStackMap(instruction, other_instruction)) {
722 // Can share: reuse existing one.
723 return other_slow_path;
724 }
725 }
726 } else {
727 // First time this dex-pc is seen.
728 iter = slow_path_map_.Put(dex_pc, {{}, {graph_->GetArena()->Adapter(kArenaAllocSlowPaths)}});
729 }
730 // Cannot share: create and add new slow-path for this particular dex-pc.
731 SlowPathCodeType* slow_path = new (graph_->GetArena()) SlowPathCodeType(instruction);
732 iter->second.emplace_back(std::make_pair(instruction, slow_path));
733 codegen_->AddSlowPath(slow_path);
734 return slow_path;
735 }
736
737 private:
738 // Tests if both instructions have same set of live physical registers. This ensures
739 // the slow-path has exactly the same preamble on saving these registers to stack.
740 bool HaveSameLiveRegisters(const InstructionType* i1, const InstructionType* i2) const {
741 const uint32_t core_spill = ~codegen_->GetCoreSpillMask();
742 const uint32_t fpu_spill = ~codegen_->GetFpuSpillMask();
743 RegisterSet* live1 = i1->GetLocations()->GetLiveRegisters();
744 RegisterSet* live2 = i2->GetLocations()->GetLiveRegisters();
745 return (((live1->GetCoreRegisters() & core_spill) ==
746 (live2->GetCoreRegisters() & core_spill)) &&
747 ((live1->GetFloatingPointRegisters() & fpu_spill) ==
748 (live2->GetFloatingPointRegisters() & fpu_spill)));
749 }
750
751 // Tests if both instructions have the same stack map. This ensures the interpreter
752 // will find exactly the same dex-registers at the same entries.
753 bool HaveSameStackMap(const InstructionType* i1, const InstructionType* i2) const {
754 DCHECK(i1->HasEnvironment());
755 DCHECK(i2->HasEnvironment());
756 // We conservatively test if the two instructions find exactly the same instructions
757 // and location in each dex-register. This guarantees they will have the same stack map.
758 HEnvironment* e1 = i1->GetEnvironment();
759 HEnvironment* e2 = i2->GetEnvironment();
760 if (e1->GetParent() != e2->GetParent() || e1->Size() != e2->Size()) {
761 return false;
762 }
763 for (size_t i = 0, sz = e1->Size(); i < sz; ++i) {
764 if (e1->GetInstructionAt(i) != e2->GetInstructionAt(i) ||
765 !e1->GetLocationAt(i).Equals(e2->GetLocationAt(i))) {
766 return false;
767 }
768 }
769 return true;
770 }
771
772 HGraph* const graph_;
773 CodeGenerator* const codegen_;
774
775 // Map from dex-pc to vector of already existing instruction/slow-path pairs.
776 ArenaSafeMap<uint32_t, ArenaVector<std::pair<InstructionType*, SlowPathCode*>>> slow_path_map_;
777
778 DISALLOW_COPY_AND_ASSIGN(SlowPathGenerator);
779};
780
781class InstructionCodeGenerator : public HGraphVisitor {
782 public:
783 InstructionCodeGenerator(HGraph* graph, CodeGenerator* codegen)
784 : HGraphVisitor(graph),
785 deopt_slow_paths_(graph, codegen) {}
786
787 protected:
788 // Add slow-path generator for each instruction/slow-path combination that desires sharing.
789 // TODO: under current regime, only deopt sharing make sense; extend later.
790 SlowPathGenerator<HDeoptimize> deopt_slow_paths_;
791};
792
Nicolas Geoffrayd4dd2552014-02-28 10:23:58 +0000793} // namespace art
794
795#endif // ART_COMPILER_OPTIMIZING_CODE_GENERATOR_H_