| /* |
| * Copyright (C) 2011 The Android Open Source Project |
| * |
| * Licensed under the Apache License, Version 2.0 (the "License"); |
| * you may not use this file except in compliance with the License. |
| * You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| |
| #include "codegen_arm64.h" |
| |
| #include <inttypes.h> |
| |
| #include <string> |
| |
| #include "dex/compiler_internals.h" |
| #include "dex/quick/mir_to_lir-inl.h" |
| |
| namespace art { |
| |
| // TODO: rework this when c++11 support allows. |
| static const RegStorage core_regs_arr[] = |
| {rs_r0, rs_r1, rs_r2, rs_r3, rs_rARM_SUSPEND, rs_r5, rs_r6, rs_r7, rs_r8, rs_rARM_SELF, |
| rs_r10, rs_r11, rs_r12, rs_rARM_SP, rs_rARM_LR, rs_rARM_PC}; |
| static const RegStorage sp_regs_arr[] = |
| {rs_fr0, rs_fr1, rs_fr2, rs_fr3, rs_fr4, rs_fr5, rs_fr6, rs_fr7, rs_fr8, rs_fr9, rs_fr10, |
| rs_fr11, rs_fr12, rs_fr13, rs_fr14, rs_fr15, rs_fr16, rs_fr17, rs_fr18, rs_fr19, rs_fr20, |
| rs_fr21, rs_fr22, rs_fr23, rs_fr24, rs_fr25, rs_fr26, rs_fr27, rs_fr28, rs_fr29, rs_fr30, |
| rs_fr31}; |
| static const RegStorage dp_regs_arr[] = |
| {rs_dr0, rs_dr1, rs_dr2, rs_dr3, rs_dr4, rs_dr5, rs_dr6, rs_dr7, rs_dr8, rs_dr9, rs_dr10, |
| rs_dr11, rs_dr12, rs_dr13, rs_dr14, rs_dr15}; |
| static const RegStorage reserved_regs_arr[] = |
| {rs_rARM_SUSPEND, rs_rARM_SELF, rs_rARM_SP, rs_rARM_LR, rs_rARM_PC}; |
| static const RegStorage core_temps_arr[] = {rs_r0, rs_r1, rs_r2, rs_r3, rs_r12}; |
| static const RegStorage sp_temps_arr[] = |
| {rs_fr0, rs_fr1, rs_fr2, rs_fr3, rs_fr4, rs_fr5, rs_fr6, rs_fr7, rs_fr8, rs_fr9, rs_fr10, |
| rs_fr11, rs_fr12, rs_fr13, rs_fr14, rs_fr15}; |
| static const RegStorage dp_temps_arr[] = |
| {rs_dr0, rs_dr1, rs_dr2, rs_dr3, rs_dr4, rs_dr5, rs_dr6, rs_dr7}; |
| |
| static const std::vector<RegStorage> core_regs(core_regs_arr, |
| core_regs_arr + sizeof(core_regs_arr) / sizeof(core_regs_arr[0])); |
| static const std::vector<RegStorage> sp_regs(sp_regs_arr, |
| sp_regs_arr + sizeof(sp_regs_arr) / sizeof(sp_regs_arr[0])); |
| static const std::vector<RegStorage> dp_regs(dp_regs_arr, |
| dp_regs_arr + sizeof(dp_regs_arr) / sizeof(dp_regs_arr[0])); |
| static const std::vector<RegStorage> reserved_regs(reserved_regs_arr, |
| reserved_regs_arr + sizeof(reserved_regs_arr) / sizeof(reserved_regs_arr[0])); |
| static const std::vector<RegStorage> core_temps(core_temps_arr, |
| core_temps_arr + sizeof(core_temps_arr) / sizeof(core_temps_arr[0])); |
| static const std::vector<RegStorage> sp_temps(sp_temps_arr, |
| sp_temps_arr + sizeof(sp_temps_arr) / sizeof(sp_temps_arr[0])); |
| static const std::vector<RegStorage> dp_temps(dp_temps_arr, |
| dp_temps_arr + sizeof(dp_temps_arr) / sizeof(dp_temps_arr[0])); |
| |
| RegLocation Arm64Mir2Lir::LocCReturn() { |
| return arm_loc_c_return; |
| } |
| |
| RegLocation Arm64Mir2Lir::LocCReturnWide() { |
| return arm_loc_c_return_wide; |
| } |
| |
| RegLocation Arm64Mir2Lir::LocCReturnFloat() { |
| return arm_loc_c_return_float; |
| } |
| |
| RegLocation Arm64Mir2Lir::LocCReturnDouble() { |
| return arm_loc_c_return_double; |
| } |
| |
| // Return a target-dependent special register. |
| RegStorage Arm64Mir2Lir::TargetReg(SpecialTargetRegister reg) { |
| RegStorage res_reg = RegStorage::InvalidReg(); |
| switch (reg) { |
| case kSelf: res_reg = rs_rARM_SELF; break; |
| case kSuspend: res_reg = rs_rARM_SUSPEND; break; |
| case kLr: res_reg = rs_rARM_LR; break; |
| case kPc: res_reg = rs_rARM_PC; break; |
| case kSp: res_reg = rs_rARM_SP; break; |
| case kArg0: res_reg = rs_r0; break; |
| case kArg1: res_reg = rs_r1; break; |
| case kArg2: res_reg = rs_r2; break; |
| case kArg3: res_reg = rs_r3; break; |
| case kFArg0: res_reg = rs_r0; break; |
| case kFArg1: res_reg = rs_r1; break; |
| case kFArg2: res_reg = rs_r2; break; |
| case kFArg3: res_reg = rs_r3; break; |
| case kRet0: res_reg = rs_r0; break; |
| case kRet1: res_reg = rs_r1; break; |
| case kInvokeTgt: res_reg = rs_rARM_LR; break; |
| case kHiddenArg: res_reg = rs_r12; break; |
| case kHiddenFpArg: res_reg = RegStorage::InvalidReg(); break; |
| case kCount: res_reg = RegStorage::InvalidReg(); break; |
| } |
| return res_reg; |
| } |
| |
| RegStorage Arm64Mir2Lir::GetArgMappingToPhysicalReg(int arg_num) { |
| // For the 32-bit internal ABI, the first 3 arguments are passed in registers. |
| switch (arg_num) { |
| case 0: |
| return rs_r1; |
| case 1: |
| return rs_r2; |
| case 2: |
| return rs_r3; |
| default: |
| return RegStorage::InvalidReg(); |
| } |
| } |
| |
| /* |
| * Decode the register id. |
| */ |
| uint64_t Arm64Mir2Lir::GetRegMaskCommon(RegStorage reg) { |
| uint64_t seed; |
| int shift; |
| int reg_id = reg.GetRegNum(); |
| /* Each double register is equal to a pair of single-precision FP registers */ |
| if (reg.IsDouble()) { |
| seed = 0x3; |
| reg_id = reg_id << 1; |
| } else { |
| seed = 1; |
| } |
| /* FP register starts at bit position 16 */ |
| shift = reg.IsFloat() ? kArmFPReg0 : 0; |
| /* Expand the double register id into single offset */ |
| shift += reg_id; |
| return (seed << shift); |
| } |
| |
| uint64_t Arm64Mir2Lir::GetPCUseDefEncoding() { |
| return ENCODE_ARM_REG_PC; |
| } |
| |
| // Thumb2 specific setup. TODO: inline?: |
| void Arm64Mir2Lir::SetupTargetResourceMasks(LIR* lir, uint64_t flags) { |
| DCHECK_EQ(cu_->instruction_set, kThumb2); |
| DCHECK(!lir->flags.use_def_invalid); |
| |
| int opcode = lir->opcode; |
| |
| // These flags are somewhat uncommon - bypass if we can. |
| if ((flags & (REG_DEF_SP | REG_USE_SP | REG_DEF_LIST0 | REG_DEF_LIST1 | |
| REG_DEF_FPCS_LIST0 | REG_DEF_FPCS_LIST2 | REG_USE_PC | IS_IT | REG_USE_LIST0 | |
| REG_USE_LIST1 | REG_USE_FPCS_LIST0 | REG_USE_FPCS_LIST2 | REG_DEF_LR)) != 0) { |
| if (flags & REG_DEF_SP) { |
| lir->u.m.def_mask |= ENCODE_ARM_REG_SP; |
| } |
| |
| if (flags & REG_USE_SP) { |
| lir->u.m.use_mask |= ENCODE_ARM_REG_SP; |
| } |
| |
| if (flags & REG_DEF_LIST0) { |
| lir->u.m.def_mask |= ENCODE_ARM_REG_LIST(lir->operands[0]); |
| } |
| |
| if (flags & REG_DEF_LIST1) { |
| lir->u.m.def_mask |= ENCODE_ARM_REG_LIST(lir->operands[1]); |
| } |
| |
| if (flags & REG_DEF_FPCS_LIST0) { |
| lir->u.m.def_mask |= ENCODE_ARM_REG_FPCS_LIST(lir->operands[0]); |
| } |
| |
| if (flags & REG_DEF_FPCS_LIST2) { |
| for (int i = 0; i < lir->operands[2]; i++) { |
| SetupRegMask(&lir->u.m.def_mask, lir->operands[1] + i); |
| } |
| } |
| |
| if (flags & REG_USE_PC) { |
| lir->u.m.use_mask |= ENCODE_ARM_REG_PC; |
| } |
| |
| /* Conservatively treat the IT block */ |
| if (flags & IS_IT) { |
| lir->u.m.def_mask = ENCODE_ALL; |
| } |
| |
| if (flags & REG_USE_LIST0) { |
| lir->u.m.use_mask |= ENCODE_ARM_REG_LIST(lir->operands[0]); |
| } |
| |
| if (flags & REG_USE_LIST1) { |
| lir->u.m.use_mask |= ENCODE_ARM_REG_LIST(lir->operands[1]); |
| } |
| |
| if (flags & REG_USE_FPCS_LIST0) { |
| lir->u.m.use_mask |= ENCODE_ARM_REG_FPCS_LIST(lir->operands[0]); |
| } |
| |
| if (flags & REG_USE_FPCS_LIST2) { |
| for (int i = 0; i < lir->operands[2]; i++) { |
| SetupRegMask(&lir->u.m.use_mask, lir->operands[1] + i); |
| } |
| } |
| /* Fixup for kThumbPush/lr and kThumbPop/pc */ |
| if (opcode == kThumbPush || opcode == kThumbPop) { |
| uint64_t r8Mask = GetRegMaskCommon(rs_r8); |
| if ((opcode == kThumbPush) && (lir->u.m.use_mask & r8Mask)) { |
| lir->u.m.use_mask &= ~r8Mask; |
| lir->u.m.use_mask |= ENCODE_ARM_REG_LR; |
| } else if ((opcode == kThumbPop) && (lir->u.m.def_mask & r8Mask)) { |
| lir->u.m.def_mask &= ~r8Mask; |
| lir->u.m.def_mask |= ENCODE_ARM_REG_PC; |
| } |
| } |
| if (flags & REG_DEF_LR) { |
| lir->u.m.def_mask |= ENCODE_ARM_REG_LR; |
| } |
| } |
| } |
| |
| ArmConditionCode Arm64Mir2Lir::ArmConditionEncoding(ConditionCode ccode) { |
| ArmConditionCode res; |
| switch (ccode) { |
| case kCondEq: res = kArmCondEq; break; |
| case kCondNe: res = kArmCondNe; break; |
| case kCondCs: res = kArmCondCs; break; |
| case kCondCc: res = kArmCondCc; break; |
| case kCondUlt: res = kArmCondCc; break; |
| case kCondUge: res = kArmCondCs; break; |
| case kCondMi: res = kArmCondMi; break; |
| case kCondPl: res = kArmCondPl; break; |
| case kCondVs: res = kArmCondVs; break; |
| case kCondVc: res = kArmCondVc; break; |
| case kCondHi: res = kArmCondHi; break; |
| case kCondLs: res = kArmCondLs; break; |
| case kCondGe: res = kArmCondGe; break; |
| case kCondLt: res = kArmCondLt; break; |
| case kCondGt: res = kArmCondGt; break; |
| case kCondLe: res = kArmCondLe; break; |
| case kCondAl: res = kArmCondAl; break; |
| case kCondNv: res = kArmCondNv; break; |
| default: |
| LOG(FATAL) << "Bad condition code " << ccode; |
| res = static_cast<ArmConditionCode>(0); // Quiet gcc |
| } |
| return res; |
| } |
| |
| static const char* core_reg_names[16] = { |
| "r0", |
| "r1", |
| "r2", |
| "r3", |
| "r4", |
| "r5", |
| "r6", |
| "r7", |
| "r8", |
| "rSELF", |
| "r10", |
| "r11", |
| "r12", |
| "sp", |
| "lr", |
| "pc", |
| }; |
| |
| |
| static const char* shift_names[4] = { |
| "lsl", |
| "lsr", |
| "asr", |
| "ror"}; |
| |
| /* Decode and print a ARM register name */ |
| static char* DecodeRegList(int opcode, int vector, char* buf, size_t buf_size) { |
| int i; |
| bool printed = false; |
| buf[0] = 0; |
| for (i = 0; i < 16; i++, vector >>= 1) { |
| if (vector & 0x1) { |
| int reg_id = i; |
| if (opcode == kThumbPush && i == 8) { |
| reg_id = rs_rARM_LR.GetRegNum(); |
| } else if (opcode == kThumbPop && i == 8) { |
| reg_id = rs_rARM_PC.GetRegNum(); |
| } |
| if (printed) { |
| snprintf(buf + strlen(buf), buf_size - strlen(buf), ", r%d", reg_id); |
| } else { |
| printed = true; |
| snprintf(buf, buf_size, "r%d", reg_id); |
| } |
| } |
| } |
| return buf; |
| } |
| |
| static char* DecodeFPCSRegList(int count, int base, char* buf, size_t buf_size) { |
| snprintf(buf, buf_size, "s%d", base); |
| for (int i = 1; i < count; i++) { |
| snprintf(buf + strlen(buf), buf_size - strlen(buf), ", s%d", base + i); |
| } |
| return buf; |
| } |
| |
| static int32_t ExpandImmediate(int value) { |
| int32_t mode = (value & 0xf00) >> 8; |
| uint32_t bits = value & 0xff; |
| switch (mode) { |
| case 0: |
| return bits; |
| case 1: |
| return (bits << 16) | bits; |
| case 2: |
| return (bits << 24) | (bits << 8); |
| case 3: |
| return (bits << 24) | (bits << 16) | (bits << 8) | bits; |
| default: |
| break; |
| } |
| bits = (bits | 0x80) << 24; |
| return bits >> (((value & 0xf80) >> 7) - 8); |
| } |
| |
| const char* cc_names[] = {"eq", "ne", "cs", "cc", "mi", "pl", "vs", "vc", |
| "hi", "ls", "ge", "lt", "gt", "le", "al", "nv"}; |
| /* |
| * Interpret a format string and build a string no longer than size |
| * See format key in Assemble.c. |
| */ |
| std::string Arm64Mir2Lir::BuildInsnString(const char* fmt, LIR* lir, unsigned char* base_addr) { |
| std::string buf; |
| int i; |
| const char* fmt_end = &fmt[strlen(fmt)]; |
| char tbuf[256]; |
| const char* name; |
| char nc; |
| while (fmt < fmt_end) { |
| int operand; |
| if (*fmt == '!') { |
| fmt++; |
| DCHECK_LT(fmt, fmt_end); |
| nc = *fmt++; |
| if (nc == '!') { |
| strcpy(tbuf, "!"); |
| } else { |
| DCHECK_LT(fmt, fmt_end); |
| DCHECK_LT(static_cast<unsigned>(nc-'0'), 4U); |
| operand = lir->operands[nc-'0']; |
| switch (*fmt++) { |
| case 'H': |
| if (operand != 0) { |
| snprintf(tbuf, arraysize(tbuf), ", %s %d", shift_names[operand & 0x3], operand >> 2); |
| } else { |
| strcpy(tbuf, ""); |
| } |
| break; |
| case 'B': |
| switch (operand) { |
| case kSY: |
| name = "sy"; |
| break; |
| case kST: |
| name = "st"; |
| break; |
| case kISH: |
| name = "ish"; |
| break; |
| case kISHST: |
| name = "ishst"; |
| break; |
| case kNSH: |
| name = "nsh"; |
| break; |
| case kNSHST: |
| name = "shst"; |
| break; |
| default: |
| name = "DecodeError2"; |
| break; |
| } |
| strcpy(tbuf, name); |
| break; |
| case 'b': |
| strcpy(tbuf, "0000"); |
| for (i = 3; i >= 0; i--) { |
| tbuf[i] += operand & 1; |
| operand >>= 1; |
| } |
| break; |
| case 'n': |
| operand = ~ExpandImmediate(operand); |
| snprintf(tbuf, arraysize(tbuf), "%d [%#x]", operand, operand); |
| break; |
| case 'm': |
| operand = ExpandImmediate(operand); |
| snprintf(tbuf, arraysize(tbuf), "%d [%#x]", operand, operand); |
| break; |
| case 's': |
| snprintf(tbuf, arraysize(tbuf), "s%d", RegStorage::RegNum(operand)); |
| break; |
| case 'S': |
| snprintf(tbuf, arraysize(tbuf), "d%d", RegStorage::RegNum(operand)); |
| break; |
| case 'h': |
| snprintf(tbuf, arraysize(tbuf), "%04x", operand); |
| break; |
| case 'M': |
| case 'd': |
| snprintf(tbuf, arraysize(tbuf), "%d", operand); |
| break; |
| case 'C': |
| operand = RegStorage::RegNum(operand); |
| DCHECK_LT(operand, static_cast<int>( |
| sizeof(core_reg_names)/sizeof(core_reg_names[0]))); |
| snprintf(tbuf, arraysize(tbuf), "%s", core_reg_names[operand]); |
| break; |
| case 'E': |
| snprintf(tbuf, arraysize(tbuf), "%d", operand*4); |
| break; |
| case 'F': |
| snprintf(tbuf, arraysize(tbuf), "%d", operand*2); |
| break; |
| case 'c': |
| strcpy(tbuf, cc_names[operand]); |
| break; |
| case 't': |
| snprintf(tbuf, arraysize(tbuf), "0x%08" PRIxPTR " (L%p)", |
| reinterpret_cast<uintptr_t>(base_addr) + lir->offset + 4 + (operand << 1), |
| lir->target); |
| break; |
| case 'u': { |
| int offset_1 = lir->operands[0]; |
| int offset_2 = NEXT_LIR(lir)->operands[0]; |
| uintptr_t target = |
| (((reinterpret_cast<uintptr_t>(base_addr) + lir->offset + 4) & |
| ~3) + (offset_1 << 21 >> 9) + (offset_2 << 1)) & |
| 0xfffffffc; |
| snprintf(tbuf, arraysize(tbuf), "%p", reinterpret_cast<void *>(target)); |
| break; |
| } |
| |
| /* Nothing to print for BLX_2 */ |
| case 'v': |
| strcpy(tbuf, "see above"); |
| break; |
| case 'R': |
| DecodeRegList(lir->opcode, operand, tbuf, arraysize(tbuf)); |
| break; |
| case 'P': |
| DecodeFPCSRegList(operand, 16, tbuf, arraysize(tbuf)); |
| break; |
| case 'Q': |
| DecodeFPCSRegList(operand, 0, tbuf, arraysize(tbuf)); |
| break; |
| default: |
| strcpy(tbuf, "DecodeError1"); |
| break; |
| } |
| buf += tbuf; |
| } |
| } else { |
| buf += *fmt++; |
| } |
| } |
| return buf; |
| } |
| |
| void Arm64Mir2Lir::DumpResourceMask(LIR* arm_lir, uint64_t mask, const char* prefix) { |
| char buf[256]; |
| buf[0] = 0; |
| |
| if (mask == ENCODE_ALL) { |
| strcpy(buf, "all"); |
| } else { |
| char num[8]; |
| int i; |
| |
| for (i = 0; i < kArmRegEnd; i++) { |
| if (mask & (1ULL << i)) { |
| snprintf(num, arraysize(num), "%d ", i); |
| strcat(buf, num); |
| } |
| } |
| |
| if (mask & ENCODE_CCODE) { |
| strcat(buf, "cc "); |
| } |
| if (mask & ENCODE_FP_STATUS) { |
| strcat(buf, "fpcc "); |
| } |
| |
| /* Memory bits */ |
| if (arm_lir && (mask & ENCODE_DALVIK_REG)) { |
| snprintf(buf + strlen(buf), arraysize(buf) - strlen(buf), "dr%d%s", |
| DECODE_ALIAS_INFO_REG(arm_lir->flags.alias_info), |
| DECODE_ALIAS_INFO_WIDE(arm_lir->flags.alias_info) ? "(+1)" : ""); |
| } |
| if (mask & ENCODE_LITERAL) { |
| strcat(buf, "lit "); |
| } |
| |
| if (mask & ENCODE_HEAP_REF) { |
| strcat(buf, "heap "); |
| } |
| if (mask & ENCODE_MUST_NOT_ALIAS) { |
| strcat(buf, "noalias "); |
| } |
| } |
| if (buf[0]) { |
| LOG(INFO) << prefix << ": " << buf; |
| } |
| } |
| |
| bool Arm64Mir2Lir::IsUnconditionalBranch(LIR* lir) { |
| return ((lir->opcode == kThumbBUncond) || (lir->opcode == kThumb2BUncond)); |
| } |
| |
| Arm64Mir2Lir::Arm64Mir2Lir(CompilationUnit* cu, MIRGraph* mir_graph, ArenaAllocator* arena) |
| : Mir2Lir(cu, mir_graph, arena) { |
| // Sanity check - make sure encoding map lines up. |
| for (int i = 0; i < kArmLast; i++) { |
| if (Arm64Mir2Lir::EncodingMap[i].opcode != i) { |
| LOG(FATAL) << "Encoding order for " << Arm64Mir2Lir::EncodingMap[i].name |
| << " is wrong: expecting " << i << ", seeing " |
| << static_cast<int>(Arm64Mir2Lir::EncodingMap[i].opcode); |
| } |
| } |
| } |
| |
| Mir2Lir* ArmCodeGenerator(CompilationUnit* const cu, MIRGraph* const mir_graph, |
| ArenaAllocator* const arena) { |
| return new Arm64Mir2Lir(cu, mir_graph, arena); |
| } |
| |
| // Alloc a pair of core registers, or a double. |
| RegStorage Arm64Mir2Lir::AllocTypedTempWide(bool fp_hint, int reg_class) { |
| if (((reg_class == kAnyReg) && fp_hint) || (reg_class == kFPReg)) { |
| return AllocTempDouble(); |
| } else { |
| RegStorage low_reg = AllocTemp(); |
| RegStorage high_reg = AllocTemp(); |
| return RegStorage::MakeRegPair(low_reg, high_reg); |
| } |
| } |
| |
| RegStorage Arm64Mir2Lir::AllocTypedTemp(bool fp_hint, int reg_class) { |
| if (((reg_class == kAnyReg) && fp_hint) || (reg_class == kFPReg)) |
| return AllocTempSingle(); |
| return AllocTemp(); |
| } |
| |
| void Arm64Mir2Lir::CompilerInitializeRegAlloc() { |
| reg_pool_ = new (arena_) RegisterPool(this, arena_, core_regs, sp_regs, dp_regs, reserved_regs, |
| core_temps, sp_temps, dp_temps); |
| |
| // Target-specific adjustments. |
| |
| // Alias single precision floats to appropriate half of overlapping double. |
| GrowableArray<RegisterInfo*>::Iterator it(®_pool_->sp_regs_); |
| for (RegisterInfo* info = it.Next(); info != nullptr; info = it.Next()) { |
| int sp_reg_num = info->GetReg().GetRegNum(); |
| int dp_reg_num = sp_reg_num >> 1; |
| RegStorage dp_reg = RegStorage::Solo64(RegStorage::kFloatingPoint | dp_reg_num); |
| RegisterInfo* dp_reg_info = GetRegInfo(dp_reg); |
| // Double precision register's master storage should refer to itself. |
| DCHECK_EQ(dp_reg_info, dp_reg_info->Master()); |
| // Redirect single precision's master storage to master. |
| info->SetMaster(dp_reg_info); |
| // Singles should show a single 32-bit mask bit, at first referring to the low half. |
| DCHECK_EQ(info->StorageMask(), 0x1U); |
| if (sp_reg_num & 1) { |
| // For odd singles, change to user the high word of the backing double. |
| info->SetStorageMask(0x2); |
| } |
| } |
| |
| // TODO: re-enable this when we can safely save r4 over the suspension code path. |
| bool no_suspend = NO_SUSPEND; // || !Runtime::Current()->ExplicitSuspendChecks(); |
| if (no_suspend) { |
| GetRegInfo(rs_rARM_SUSPEND)->MarkFree(); |
| } |
| |
| // Don't start allocating temps at r0/s0/d0 or you may clobber return regs in early-exit methods. |
| // TODO: adjust when we roll to hard float calling convention. |
| reg_pool_->next_core_reg_ = 2; |
| reg_pool_->next_sp_reg_ = 0; |
| reg_pool_->next_dp_reg_ = 0; |
| } |
| |
| void Arm64Mir2Lir::FreeRegLocTemps(RegLocation rl_keep, RegLocation rl_free) { |
| DCHECK(rl_keep.wide); |
| DCHECK(rl_free.wide); |
| if ((rl_free.reg.GetLowReg() != rl_keep.reg.GetLowReg()) && |
| (rl_free.reg.GetLowReg() != rl_keep.reg.GetHighReg()) && |
| (rl_free.reg.GetHighReg() != rl_keep.reg.GetLowReg()) && |
| (rl_free.reg.GetHighReg() != rl_keep.reg.GetHighReg())) { |
| // No overlap, free. |
| FreeTemp(rl_free.reg); |
| } |
| } |
| |
| /* |
| * TUNING: is true leaf? Can't just use METHOD_IS_LEAF to determine as some |
| * instructions might call out to C/assembly helper functions. Until |
| * machinery is in place, always spill lr. |
| */ |
| |
| void Arm64Mir2Lir::AdjustSpillMask() { |
| core_spill_mask_ |= (1 << rs_rARM_LR.GetRegNum()); |
| num_core_spills_++; |
| } |
| |
| /* |
| * Mark a callee-save fp register as promoted. Note that |
| * vpush/vpop uses contiguous register lists so we must |
| * include any holes in the mask. Associate holes with |
| * Dalvik register INVALID_VREG (0xFFFFU). |
| */ |
| void Arm64Mir2Lir::MarkPreservedSingle(int v_reg, RegStorage reg) { |
| DCHECK_GE(reg.GetRegNum(), ARM_FP_CALLEE_SAVE_BASE); |
| int adjusted_reg_num = reg.GetRegNum() - ARM_FP_CALLEE_SAVE_BASE; |
| // Ensure fp_vmap_table is large enough |
| int table_size = fp_vmap_table_.size(); |
| for (int i = table_size; i < (adjusted_reg_num + 1); i++) { |
| fp_vmap_table_.push_back(INVALID_VREG); |
| } |
| // Add the current mapping |
| fp_vmap_table_[adjusted_reg_num] = v_reg; |
| // Size of fp_vmap_table is high-water mark, use to set mask |
| num_fp_spills_ = fp_vmap_table_.size(); |
| fp_spill_mask_ = ((1 << num_fp_spills_) - 1) << ARM_FP_CALLEE_SAVE_BASE; |
| } |
| |
| void Arm64Mir2Lir::MarkPreservedDouble(int v_reg, RegStorage reg) { |
| // TEMP: perform as 2 singles. |
| int reg_num = reg.GetRegNum() << 1; |
| RegStorage lo = RegStorage::Solo32(RegStorage::kFloatingPoint | reg_num); |
| RegStorage hi = RegStorage::Solo32(RegStorage::kFloatingPoint | reg_num | 1); |
| MarkPreservedSingle(v_reg, lo); |
| MarkPreservedSingle(v_reg + 1, hi); |
| } |
| |
| /* Clobber all regs that might be used by an external C call */ |
| void Arm64Mir2Lir::ClobberCallerSave() { |
| // TODO: rework this - it's gotten even more ugly. |
| Clobber(rs_r0); |
| Clobber(rs_r1); |
| Clobber(rs_r2); |
| Clobber(rs_r3); |
| Clobber(rs_r12); |
| Clobber(rs_r14lr); |
| Clobber(rs_fr0); |
| Clobber(rs_fr1); |
| Clobber(rs_fr2); |
| Clobber(rs_fr3); |
| Clobber(rs_fr4); |
| Clobber(rs_fr5); |
| Clobber(rs_fr6); |
| Clobber(rs_fr7); |
| Clobber(rs_fr8); |
| Clobber(rs_fr9); |
| Clobber(rs_fr10); |
| Clobber(rs_fr11); |
| Clobber(rs_fr12); |
| Clobber(rs_fr13); |
| Clobber(rs_fr14); |
| Clobber(rs_fr15); |
| Clobber(rs_dr0); |
| Clobber(rs_dr1); |
| Clobber(rs_dr2); |
| Clobber(rs_dr3); |
| Clobber(rs_dr4); |
| Clobber(rs_dr5); |
| Clobber(rs_dr6); |
| Clobber(rs_dr7); |
| } |
| |
| RegLocation Arm64Mir2Lir::GetReturnWideAlt() { |
| RegLocation res = LocCReturnWide(); |
| res.reg.SetLowReg(rs_r2.GetReg()); |
| res.reg.SetHighReg(rs_r3.GetReg()); |
| Clobber(rs_r2); |
| Clobber(rs_r3); |
| MarkInUse(rs_r2); |
| MarkInUse(rs_r3); |
| MarkWide(res.reg); |
| return res; |
| } |
| |
| RegLocation Arm64Mir2Lir::GetReturnAlt() { |
| RegLocation res = LocCReturn(); |
| res.reg.SetReg(rs_r1.GetReg()); |
| Clobber(rs_r1); |
| MarkInUse(rs_r1); |
| return res; |
| } |
| |
| /* To be used when explicitly managing register use */ |
| void Arm64Mir2Lir::LockCallTemps() { |
| LockTemp(rs_r0); |
| LockTemp(rs_r1); |
| LockTemp(rs_r2); |
| LockTemp(rs_r3); |
| } |
| |
| /* To be used when explicitly managing register use */ |
| void Arm64Mir2Lir::FreeCallTemps() { |
| FreeTemp(rs_r0); |
| FreeTemp(rs_r1); |
| FreeTemp(rs_r2); |
| FreeTemp(rs_r3); |
| } |
| |
| RegStorage Arm64Mir2Lir::LoadHelper(ThreadOffset<4> offset) { |
| LoadWordDisp(rs_rARM_SELF, offset.Int32Value(), rs_rARM_LR); |
| return rs_rARM_LR; |
| } |
| |
| LIR* Arm64Mir2Lir::CheckSuspendUsingLoad() { |
| RegStorage tmp = rs_r0; |
| Load32Disp(rs_rARM_SELF, Thread::ThreadSuspendTriggerOffset<4>().Int32Value(), tmp); |
| LIR* load2 = Load32Disp(tmp, 0, tmp); |
| return load2; |
| } |
| |
| uint64_t Arm64Mir2Lir::GetTargetInstFlags(int opcode) { |
| DCHECK(!IsPseudoLirOp(opcode)); |
| return Arm64Mir2Lir::EncodingMap[opcode].flags; |
| } |
| |
| const char* Arm64Mir2Lir::GetTargetInstName(int opcode) { |
| DCHECK(!IsPseudoLirOp(opcode)); |
| return Arm64Mir2Lir::EncodingMap[opcode].name; |
| } |
| |
| const char* Arm64Mir2Lir::GetTargetInstFmt(int opcode) { |
| DCHECK(!IsPseudoLirOp(opcode)); |
| return Arm64Mir2Lir::EncodingMap[opcode].fmt; |
| } |
| |
| /* |
| * Somewhat messy code here. We want to allocate a pair of contiguous |
| * physical single-precision floating point registers starting with |
| * an even numbered reg. It is possible that the paired s_reg (s_reg+1) |
| * has already been allocated - try to fit if possible. Fail to |
| * allocate if we can't meet the requirements for the pair of |
| * s_reg<=sX[even] & (s_reg+1)<= sX+1. |
| */ |
| // TODO: needs rewrite to support non-backed 64-bit float regs. |
| RegStorage Arm64Mir2Lir::AllocPreservedDouble(int s_reg) { |
| RegStorage res; |
| int v_reg = mir_graph_->SRegToVReg(s_reg); |
| int p_map_idx = SRegToPMap(s_reg); |
| if (promotion_map_[p_map_idx+1].fp_location == kLocPhysReg) { |
| // Upper reg is already allocated. Can we fit? |
| int high_reg = promotion_map_[p_map_idx+1].FpReg; |
| if ((high_reg & 1) == 0) { |
| // High reg is even - fail. |
| return res; // Invalid. |
| } |
| // Is the low reg of the pair free? |
| // FIXME: rework. |
| RegisterInfo* p = GetRegInfo(RegStorage::FloatSolo32(high_reg - 1)); |
| if (p->InUse() || p->IsTemp()) { |
| // Already allocated or not preserved - fail. |
| return res; // Invalid. |
| } |
| // OK - good to go. |
| res = RegStorage::FloatSolo64(p->GetReg().GetRegNum() >> 1); |
| p->MarkInUse(); |
| MarkPreservedSingle(v_reg, p->GetReg()); |
| } else { |
| /* |
| * TODO: until runtime support is in, make sure we avoid promoting the same vreg to |
| * different underlying physical registers. |
| */ |
| GrowableArray<RegisterInfo*>::Iterator it(®_pool_->dp_regs_); |
| for (RegisterInfo* info = it.Next(); info != nullptr; info = it.Next()) { |
| if (!info->IsTemp() && !info->InUse()) { |
| res = info->GetReg(); |
| info->MarkInUse(); |
| MarkPreservedDouble(v_reg, info->GetReg()); |
| break; |
| } |
| } |
| } |
| if (res.Valid()) { |
| promotion_map_[p_map_idx].fp_location = kLocPhysReg; |
| promotion_map_[p_map_idx].FpReg = res.DoubleToLowSingle().GetReg(); |
| promotion_map_[p_map_idx+1].fp_location = kLocPhysReg; |
| promotion_map_[p_map_idx+1].FpReg = res.DoubleToHighSingle().GetReg(); |
| } |
| return res; |
| } |
| |
| } // namespace art |