| %def header(): |
| /* |
| * Copyright (C) 2019 The Android Open Source Project |
| * |
| * Licensed under the Apache License, Version 2.0 (the "License"); |
| * you may not use this file except in compliance with the License. |
| * You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| |
| /* |
| * This is a #include, not a %include, because we want the C pre-processor |
| * to expand the macros into assembler assignment statements. |
| */ |
| #include "asm_support.h" |
| #include "arch/x86_64/asm_support_x86_64.S" |
| |
| /** |
| * x86_64 ABI general notes: |
| * |
| * Caller save set: |
| * rax, rdx, rcx, rsi, rdi, r8-r11, st(0)-st(7) |
| * Callee save set: |
| * rbx, rbp, r12-r15 |
| * Return regs: |
| * 32-bit in eax |
| * 64-bit in rax |
| * fp on xmm0 |
| * |
| * First 8 fp parameters came in xmm0-xmm7. |
| * First 6 non-fp parameters came in rdi, rsi, rdx, rcx, r8, r9. |
| * Other parameters passed on stack, pushed right-to-left. On entry to target, first |
| * param is at 8(%esp). |
| * |
| * Stack must be 16-byte aligned to support SSE in native code. |
| */ |
| |
| #define IN_ARG3 %rcx |
| #define IN_ARG2 %rdx |
| #define IN_ARG1 %rsi |
| #define IN_ARG0 %rdi |
| /* Out Args */ |
| #define OUT_ARG3 %rcx |
| #define OUT_ARG2 %rdx |
| #define OUT_ARG1 %rsi |
| #define OUT_ARG0 %rdi |
| #define OUT_32_ARG3 %ecx |
| #define OUT_32_ARG2 %edx |
| #define OUT_32_ARG1 %esi |
| #define OUT_32_ARG0 %edi |
| #define OUT_FP_ARG1 %xmm1 |
| #define OUT_FP_ARG0 %xmm0 |
| |
| /* |
| * single-purpose registers, given names for clarity |
| */ |
| #define rSELF %gs |
| #define rPC %r12 |
| #define CFI_DEX 12 // DWARF register number of the register holding dex-pc (rPC). |
| #define CFI_TMP 5 // DWARF register number of the first argument register (rdi). |
| #define rFP %r13 |
| #define rINST %ebx |
| #define rINSTq %rbx |
| #define rINSTw %bx |
| #define rINSTbh %bh |
| #define rINSTbl %bl |
| #define rIBASE %r14 |
| #define rREFS %r15 |
| #define rREFS32 %r15d |
| #define CFI_REFS 15 // DWARF register number of the reference array (r15). |
| |
| // Temporary registers while setting up a frame. |
| #define rNEW_FP %r8 |
| #define rNEW_REFS %r9 |
| #define rNEW_REFS32 %r9d |
| #define CFI_NEW_REFS 9 |
| |
| /* |
| * Get/set the 32-bit value from a Dalvik register. |
| */ |
| #define VREG_ADDRESS(_vreg) (rFP,_vreg,4) |
| #define VREG_HIGH_ADDRESS(_vreg) 4(rFP,_vreg,4) |
| #define VREG_REF_ADDRESS(_vreg) (rREFS,_vreg,4) |
| #define VREG_REF_HIGH_ADDRESS(_vreg) 4(rREFS,_vreg,4) |
| |
| // Includes the return address implictly pushed on stack by 'call'. |
| #define CALLEE_SAVES_SIZE (6 * 8 + 4 * 8 + 1 * 8) |
| |
| // +8 for the ArtMethod of the caller. |
| #define OFFSET_TO_FIRST_ARGUMENT_IN_STACK (CALLEE_SAVES_SIZE + 8) |
| |
| /* |
| * Refresh rINST. |
| * At enter to handler rINST does not contain the opcode number. |
| * However some utilities require the full value, so this macro |
| * restores the opcode number. |
| */ |
| .macro REFRESH_INST _opnum |
| movb rINSTbl, rINSTbh |
| movb $$\_opnum, rINSTbl |
| .endm |
| |
| /* |
| * Fetch the next instruction from rPC into rINSTw. Does not advance rPC. |
| */ |
| .macro FETCH_INST |
| movzwq (rPC), rINSTq |
| .endm |
| |
| /* |
| * Remove opcode from rINST, compute the address of handler and jump to it. |
| */ |
| .macro GOTO_NEXT |
| movzx rINSTbl,%ecx |
| movzbl rINSTbh,rINST |
| shll MACRO_LITERAL(${handler_size_bits}), %ecx |
| addq rIBASE, %rcx |
| jmp *%rcx |
| .endm |
| |
| /* |
| * Advance rPC by instruction count. |
| */ |
| .macro ADVANCE_PC _count |
| leaq 2*\_count(rPC), rPC |
| .endm |
| |
| /* |
| * Advance rPC by instruction count, fetch instruction and jump to handler. |
| */ |
| .macro ADVANCE_PC_FETCH_AND_GOTO_NEXT _count |
| ADVANCE_PC \_count |
| FETCH_INST |
| GOTO_NEXT |
| .endm |
| |
| .macro GET_VREG _reg _vreg |
| movl VREG_ADDRESS(\_vreg), \_reg |
| .endm |
| |
| .macro GET_VREG_OBJECT _reg _vreg |
| movl VREG_REF_ADDRESS(\_vreg), \_reg |
| .endm |
| |
| /* Read wide value. */ |
| .macro GET_WIDE_VREG _reg _vreg |
| movq VREG_ADDRESS(\_vreg), \_reg |
| .endm |
| |
| .macro SET_VREG _reg _vreg |
| movl \_reg, VREG_ADDRESS(\_vreg) |
| movl MACRO_LITERAL(0), VREG_REF_ADDRESS(\_vreg) |
| .endm |
| |
| /* Write wide value. reg is clobbered. */ |
| .macro SET_WIDE_VREG _reg _vreg |
| movq \_reg, VREG_ADDRESS(\_vreg) |
| xorq \_reg, \_reg |
| movq \_reg, VREG_REF_ADDRESS(\_vreg) |
| .endm |
| |
| .macro SET_VREG_OBJECT _reg _vreg |
| movl \_reg, VREG_ADDRESS(\_vreg) |
| movl \_reg, VREG_REF_ADDRESS(\_vreg) |
| .endm |
| |
| .macro GET_VREG_HIGH _reg _vreg |
| movl VREG_HIGH_ADDRESS(\_vreg), \_reg |
| .endm |
| |
| .macro SET_VREG_HIGH _reg _vreg |
| movl \_reg, VREG_HIGH_ADDRESS(\_vreg) |
| movl MACRO_LITERAL(0), VREG_REF_HIGH_ADDRESS(\_vreg) |
| .endm |
| |
| .macro CLEAR_REF _vreg |
| movl MACRO_LITERAL(0), VREG_REF_ADDRESS(\_vreg) |
| .endm |
| |
| .macro CLEAR_WIDE_REF _vreg |
| movl MACRO_LITERAL(0), VREG_REF_ADDRESS(\_vreg) |
| movl MACRO_LITERAL(0), VREG_REF_HIGH_ADDRESS(\_vreg) |
| .endm |
| |
| .macro GET_VREG_XMMs _xmmreg _vreg |
| movss VREG_ADDRESS(\_vreg), \_xmmreg |
| .endm |
| .macro GET_VREG_XMMd _xmmreg _vreg |
| movsd VREG_ADDRESS(\_vreg), \_xmmreg |
| .endm |
| .macro SET_VREG_XMMs _xmmreg _vreg |
| movss \_xmmreg, VREG_ADDRESS(\_vreg) |
| .endm |
| .macro SET_VREG_XMMd _xmmreg _vreg |
| movsd \_xmmreg, VREG_ADDRESS(\_vreg) |
| .endm |
| |
| // An assembly entry that has a OatQuickMethodHeader prefix. |
| .macro OAT_ENTRY name, end |
| FUNCTION_TYPE(\name) |
| ASM_HIDDEN SYMBOL(\name) |
| .global SYMBOL(\name) |
| .balign 16 |
| .long 0 |
| .long (SYMBOL(\end) - SYMBOL(\name)) |
| SYMBOL(\name): |
| .endm |
| |
| .macro ENTRY name |
| .text |
| ASM_HIDDEN SYMBOL(\name) |
| .global SYMBOL(\name) |
| FUNCTION_TYPE(\name) |
| SYMBOL(\name): |
| .endm |
| |
| .macro END name |
| SIZE(\name) |
| .endm |
| |
| // Macro for defining entrypoints into runtime. We don't need to save registers |
| // (we're not holding references there), but there is no |
| // kDontSave runtime method. So just use the kSaveRefsOnly runtime method. |
| .macro NTERP_TRAMPOLINE name, helper |
| DEFINE_FUNCTION \name |
| SETUP_SAVE_REFS_ONLY_FRAME |
| call \helper |
| RESTORE_SAVE_REFS_ONLY_FRAME |
| RETURN_OR_DELIVER_PENDING_EXCEPTION |
| END_FUNCTION \name |
| .endm |
| |
| .macro CLEAR_VOLATILE_MARKER reg |
| andq MACRO_LITERAL(-2), \reg |
| .endm |
| |
| .macro EXPORT_PC |
| movq rPC, -16(rREFS) |
| .endm |
| |
| |
| .macro BRANCH |
| // Update method counter and do a suspend check if the branch is negative. |
| testq rINSTq, rINSTq |
| js 3f |
| 2: |
| leaq (rPC, rINSTq, 2), rPC |
| FETCH_INST |
| GOTO_NEXT |
| 3: |
| movq (%rsp), %rdi |
| addw $$1, ART_METHOD_HOTNESS_COUNT_OFFSET(%rdi) |
| andw $$(NTERP_HOTNESS_MASK), ART_METHOD_HOTNESS_COUNT_OFFSET(%rdi) |
| // If the counter overflows, handle this in the runtime. |
| jz NterpHandleHotnessOverflow |
| // Otherwise, do a suspend check. |
| testl $$(THREAD_SUSPEND_OR_CHECKPOINT_REQUEST), rSELF:THREAD_FLAGS_OFFSET |
| jz 2b |
| EXPORT_PC |
| call SYMBOL(art_quick_test_suspend) |
| jmp 2b |
| .endm |
| |
| // Expects: |
| // - r10, and r11 to be available. |
| // Outputs: |
| // - \registers contains the dex registers size |
| // - \outs contains the outs size |
| // - if load_ins is 1, \ins contains the ins |
| // - \code_item is replace with a pointer to the instructions |
| .macro FETCH_CODE_ITEM_INFO code_item, registers, outs, ins, load_ins |
| testq MACRO_LITERAL(1), \code_item |
| je 5f |
| andq $$-2, \code_item // Remove the extra bit that marks it's a compact dex file. |
| movzwl COMPACT_CODE_ITEM_FIELDS_OFFSET(\code_item), %r10d |
| movl %r10d, \registers |
| sarl $$COMPACT_CODE_ITEM_REGISTERS_SIZE_SHIFT, \registers |
| andl $$0xf, \registers |
| movl %r10d, \outs |
| sarl $$COMPACT_CODE_ITEM_OUTS_SIZE_SHIFT, \outs |
| andl $$0xf, \outs |
| .if \load_ins |
| movl %r10d, \ins |
| sarl $$COMPACT_CODE_ITEM_INS_SIZE_SHIFT, \ins |
| andl $$0xf, \ins |
| .else |
| movl %r10d, %r11d |
| sarl $$COMPACT_CODE_ITEM_INS_SIZE_SHIFT, %r11d |
| andl $$0xf, %r11d |
| addl %r11d, \registers |
| .endif |
| testw $$COMPACT_CODE_ITEM_REGISTERS_INS_OUTS_FLAGS, COMPACT_CODE_ITEM_FLAGS_OFFSET(\code_item) |
| je 4f |
| movq \code_item, %r11 |
| testw $$COMPACT_CODE_ITEM_INSNS_FLAG, COMPACT_CODE_ITEM_FLAGS_OFFSET(\code_item) |
| je 1f |
| subq $$4, %r11 |
| 1: |
| testw $$COMPACT_CODE_ITEM_REGISTERS_FLAG, COMPACT_CODE_ITEM_FLAGS_OFFSET(\code_item) |
| je 2f |
| subq $$2, %r11 |
| movzwl (%r11), %r10d |
| addl %r10d, \registers |
| 2: |
| testw $$COMPACT_CODE_ITEM_INS_FLAG, COMPACT_CODE_ITEM_FLAGS_OFFSET(\code_item) |
| je 3f |
| subq $$2, %r11 |
| movzwl (%r11), %r10d |
| .if \load_ins |
| addl %r10d, \ins |
| .else |
| addl %r10d, \registers |
| .endif |
| 3: |
| testw $$COMPACT_CODE_ITEM_OUTS_FLAG, COMPACT_CODE_ITEM_FLAGS_OFFSET(\code_item) |
| je 4f |
| subq $$2, %r11 |
| movzwl (%r11), %r10d |
| addl %r10d, \outs |
| 4: |
| .if \load_ins |
| addl \ins, \registers |
| .endif |
| addq $$COMPACT_CODE_ITEM_INSNS_OFFSET, \code_item |
| jmp 6f |
| 5: |
| // Fetch dex register size. |
| movzwl CODE_ITEM_REGISTERS_SIZE_OFFSET(\code_item), \registers |
| // Fetch outs size. |
| movzwl CODE_ITEM_OUTS_SIZE_OFFSET(\code_item), \outs |
| .if \load_ins |
| movzwl CODE_ITEM_INS_SIZE_OFFSET(\code_item), \ins |
| .endif |
| addq $$CODE_ITEM_INSNS_OFFSET, \code_item |
| 6: |
| .endm |
| |
| // Setup the stack to start executing the method. Expects: |
| // - rdi to contain the ArtMethod |
| // - rbx, r10, r11 to be available. |
| // |
| // Outputs |
| // - rbx contains the dex registers size |
| // - r11 contains the old stack pointer. |
| // - \code_item is replace with a pointer to the instructions |
| // - if load_ins is 1, r14 contains the ins |
| .macro SETUP_STACK_FRAME code_item, refs, refs32, fp, cfi_refs, load_ins |
| FETCH_CODE_ITEM_INFO \code_item, %ebx, \refs32, %r14d, \load_ins |
| |
| // Compute required frame size for dex registers: ((2 * ebx) + refs) |
| leaq (\refs, %rbx, 2), %r11 |
| salq $$2, %r11 |
| |
| // Compute new stack pointer in r10: add 24 for saving the previous frame, |
| // pc, and method being executed. |
| leaq -24(%rsp), %r10 |
| subq %r11, %r10 |
| // Alignment |
| // Note: There may be two pieces of alignment but there is no need to align |
| // out args to `kPointerSize` separately before aligning to kStackAlignment. |
| andq $$-16, %r10 |
| |
| // Set reference and dex registers, align to pointer size for previous frame and dex pc. |
| leaq 24 + 4(%r10, \refs, 4), \refs |
| andq LITERAL(-__SIZEOF_POINTER__), \refs |
| leaq (\refs, %rbx, 4), \fp |
| |
| // Now setup the stack pointer. |
| movq %rsp, %r11 |
| CFI_DEF_CFA_REGISTER(r11) |
| movq %r10, %rsp |
| movq %r11, -8(\refs) |
| CFI_DEF_CFA_BREG_PLUS_UCONST \cfi_refs, -8, ((6 + 4 + 1) * 8) |
| |
| // Put nulls in reference frame. |
| testl %ebx, %ebx |
| je 2f |
| movq \refs, %r10 |
| 1: |
| movl $$0, (%r10) |
| addq $$4, %r10 |
| cmpq %r10, \fp |
| jne 1b |
| 2: |
| // Save the ArtMethod. |
| movq %rdi, (%rsp) |
| .endm |
| |
| // Puts the next floating point argument into the expected register, |
| // fetching values based on a non-range invoke. |
| // Uses rax as temporary. |
| // |
| // TODO: We could simplify a lot of code by loading the G argument into |
| // the "inst" register. Given that we enter the handler with "1(rPC)" in |
| // the rINST, we can just add rINST<<16 to the args and we don't even |
| // need to pass "arg_index" around. |
| .macro LOOP_OVER_SHORTY_LOADING_XMMS xmm_reg, inst, shorty, arg_index, finished |
| 1: // LOOP |
| movb (REG_VAR(shorty)), %al // bl := *shorty |
| addq MACRO_LITERAL(1), REG_VAR(shorty) // shorty++ |
| cmpb MACRO_LITERAL(0), %al // if (al == '\0') goto finished |
| je VAR(finished) |
| cmpb MACRO_LITERAL(68), %al // if (al == 'D') goto FOUND_DOUBLE |
| je 2f |
| cmpb MACRO_LITERAL(70), %al // if (al == 'F') goto FOUND_FLOAT |
| je 3f |
| shrq MACRO_LITERAL(4), REG_VAR(inst) |
| addq MACRO_LITERAL(1), REG_VAR(arg_index) |
| // Handle extra argument in arg array taken by a long. |
| cmpb MACRO_LITERAL(74), %al // if (al != 'J') goto LOOP |
| jne 1b |
| shrq MACRO_LITERAL(4), REG_VAR(inst) |
| addq MACRO_LITERAL(1), REG_VAR(arg_index) |
| jmp 1b // goto LOOP |
| 2: // FOUND_DOUBLE |
| subq MACRO_LITERAL(8), %rsp |
| movq REG_VAR(inst), %rax |
| andq MACRO_LITERAL(0xf), %rax |
| GET_VREG %eax, %rax |
| movl %eax, (%rsp) |
| shrq MACRO_LITERAL(4), REG_VAR(inst) |
| addq MACRO_LITERAL(1), REG_VAR(arg_index) |
| cmpq MACRO_LITERAL(4), REG_VAR(arg_index) |
| je 5f |
| movq REG_VAR(inst), %rax |
| andq MACRO_LITERAL(0xf), %rax |
| shrq MACRO_LITERAL(4), REG_VAR(inst) |
| addq MACRO_LITERAL(1), REG_VAR(arg_index) |
| jmp 6f |
| 5: |
| movzbl 1(rPC), %eax |
| andq MACRO_LITERAL(0xf), %rax |
| 6: |
| GET_VREG %eax, %rax |
| movl %eax, 4(%rsp) |
| movsd (%rsp), REG_VAR(xmm_reg) |
| addq MACRO_LITERAL(8), %rsp |
| jmp 4f |
| 3: // FOUND_FLOAT |
| cmpq MACRO_LITERAL(4), REG_VAR(arg_index) |
| je 7f |
| movq REG_VAR(inst), %rax |
| andq MACRO_LITERAL(0xf), %rax |
| shrq MACRO_LITERAL(4), REG_VAR(inst) |
| addq MACRO_LITERAL(1), REG_VAR(arg_index) |
| jmp 8f |
| 7: |
| movzbl 1(rPC), %eax |
| andq MACRO_LITERAL(0xf), %rax |
| 8: |
| GET_VREG_XMMs REG_VAR(xmm_reg), %rax |
| 4: |
| .endm |
| |
| // Puts the next int/long/object argument in the expected register, |
| // fetching values based on a non-range invoke. |
| // Uses rax as temporary. |
| .macro LOOP_OVER_SHORTY_LOADING_GPRS gpr_reg64, gpr_reg32, inst, shorty, arg_index, finished |
| 1: // LOOP |
| movb (REG_VAR(shorty)), %al // al := *shorty |
| addq MACRO_LITERAL(1), REG_VAR(shorty) // shorty++ |
| cmpb MACRO_LITERAL(0), %al // if (al == '\0') goto finished |
| je VAR(finished) |
| cmpb MACRO_LITERAL(74), %al // if (al == 'J') goto FOUND_LONG |
| je 2f |
| cmpb MACRO_LITERAL(70), %al // if (al == 'F') goto SKIP_FLOAT |
| je 3f |
| cmpb MACRO_LITERAL(68), %al // if (al == 'D') goto SKIP_DOUBLE |
| je 4f |
| cmpq MACRO_LITERAL(4), REG_VAR(arg_index) |
| je 7f |
| movq REG_VAR(inst), %rax |
| andq MACRO_LITERAL(0xf), %rax |
| shrq MACRO_LITERAL(4), REG_VAR(inst) |
| addq MACRO_LITERAL(1), REG_VAR(arg_index) |
| jmp 8f |
| 7: |
| movzbl 1(rPC), %eax |
| andq MACRO_LITERAL(0xf), %rax |
| 8: |
| GET_VREG REG_VAR(gpr_reg32), %rax |
| jmp 5f |
| 2: // FOUND_LONG |
| subq MACRO_LITERAL(8), %rsp |
| movq REG_VAR(inst), %rax |
| andq MACRO_LITERAL(0xf), %rax |
| GET_VREG %eax, %rax |
| movl %eax, (%rsp) |
| shrq MACRO_LITERAL(4), REG_VAR(inst) |
| addq MACRO_LITERAL(1), REG_VAR(arg_index) |
| cmpq MACRO_LITERAL(4), REG_VAR(arg_index) |
| je 9f |
| movq REG_VAR(inst), %rax |
| andq MACRO_LITERAL(0xf), %rax |
| shrq MACRO_LITERAL(4), REG_VAR(inst) |
| addq MACRO_LITERAL(1), REG_VAR(arg_index) |
| jmp 10f |
| 9: |
| movzbl 1(rPC), %eax |
| andq MACRO_LITERAL(0xf), %rax |
| 10: |
| GET_VREG %eax, %rax |
| movl %eax, 4(%rsp) |
| movq (%rsp), REG_VAR(gpr_reg64) |
| addq MACRO_LITERAL(8), %rsp |
| jmp 5f |
| 3: // SKIP_FLOAT |
| shrq MACRO_LITERAL(4), REG_VAR(inst) |
| addq MACRO_LITERAL(1), REG_VAR(arg_index) |
| jmp 1b |
| 4: // SKIP_DOUBLE |
| shrq MACRO_LITERAL(4), REG_VAR(inst) |
| addq MACRO_LITERAL(1), REG_VAR(arg_index) |
| cmpq MACRO_LITERAL(4), REG_VAR(arg_index) |
| je 1b |
| shrq MACRO_LITERAL(4), REG_VAR(inst) |
| addq MACRO_LITERAL(1), REG_VAR(arg_index) |
| jmp 1b |
| 5: |
| .endm |
| |
| // Puts the next floating point argument into the expected register, |
| // fetching values based on a range invoke. |
| // Uses rax as temporary. |
| .macro LOOP_RANGE_OVER_SHORTY_LOADING_XMMS xmm_reg, shorty, arg_index, stack_index, finished |
| 1: // LOOP |
| movb (REG_VAR(shorty)), %al // al := *shorty |
| addq MACRO_LITERAL(1), REG_VAR(shorty) // shorty++ |
| cmpb MACRO_LITERAL(0), %al // if (al == '\0') goto finished |
| je VAR(finished) |
| cmpb MACRO_LITERAL(68), %al // if (al == 'D') goto FOUND_DOUBLE |
| je 2f |
| cmpb MACRO_LITERAL(70), %al // if (al == 'F') goto FOUND_FLOAT |
| je 3f |
| addq MACRO_LITERAL(1), REG_VAR(arg_index) |
| addq MACRO_LITERAL(1), REG_VAR(stack_index) |
| // Handle extra argument in arg array taken by a long. |
| cmpb MACRO_LITERAL(74), %al // if (al != 'J') goto LOOP |
| jne 1b |
| addq MACRO_LITERAL(1), REG_VAR(arg_index) |
| addq MACRO_LITERAL(1), REG_VAR(stack_index) |
| jmp 1b // goto LOOP |
| 2: // FOUND_DOUBLE |
| GET_VREG_XMMd REG_VAR(xmm_reg), REG_VAR(arg_index) |
| addq MACRO_LITERAL(2), REG_VAR(arg_index) |
| addq MACRO_LITERAL(2), REG_VAR(stack_index) |
| jmp 4f |
| 3: // FOUND_FLOAT |
| GET_VREG_XMMs REG_VAR(xmm_reg), REG_VAR(arg_index) |
| addq MACRO_LITERAL(1), REG_VAR(arg_index) |
| addq MACRO_LITERAL(1), REG_VAR(stack_index) |
| 4: |
| .endm |
| |
| // Puts the next floating point argument into the expected stack slot, |
| // fetching values based on a range invoke. |
| // Uses rax as temporary. |
| // |
| // TODO: We could just copy all the vregs to the stack slots in a simple loop |
| // (or REP MOVSD) without looking at the shorty at all. (We could also drop |
| // the "stack_index" from the macros for loading registers.) We could also do |
| // that conditionally if argument word count > 6; otherwise we know that all |
| // args fit into registers. |
| .macro LOOP_RANGE_OVER_FPs shorty, arg_index, stack_index, finished |
| 1: // LOOP |
| movb (REG_VAR(shorty)), %al // bl := *shorty |
| addq MACRO_LITERAL(1), REG_VAR(shorty) // shorty++ |
| cmpb MACRO_LITERAL(0), %al // if (al == '\0') goto finished |
| je VAR(finished) |
| cmpb MACRO_LITERAL(68), %al // if (al == 'D') goto FOUND_DOUBLE |
| je 2f |
| cmpb MACRO_LITERAL(70), %al // if (al == 'F') goto FOUND_FLOAT |
| je 3f |
| addq MACRO_LITERAL(1), REG_VAR(arg_index) |
| addq MACRO_LITERAL(1), REG_VAR(stack_index) |
| // Handle extra argument in arg array taken by a long. |
| cmpb MACRO_LITERAL(74), %al // if (al != 'J') goto LOOP |
| jne 1b |
| addq MACRO_LITERAL(1), REG_VAR(arg_index) |
| addq MACRO_LITERAL(1), REG_VAR(stack_index) |
| jmp 1b // goto LOOP |
| 2: // FOUND_DOUBLE |
| movq (rFP, REG_VAR(arg_index), 4), %rax |
| movq %rax, 8(%rsp, REG_VAR(stack_index), 4) |
| addq MACRO_LITERAL(2), REG_VAR(arg_index) |
| addq MACRO_LITERAL(2), REG_VAR(stack_index) |
| jmp 1b |
| 3: // FOUND_FLOAT |
| movl (rFP, REG_VAR(arg_index), 4), %eax |
| movl %eax, 8(%rsp, REG_VAR(stack_index), 4) |
| addq MACRO_LITERAL(1), REG_VAR(arg_index) |
| addq MACRO_LITERAL(1), REG_VAR(stack_index) |
| jmp 1b |
| .endm |
| |
| // Puts the next int/long/object argument in the expected register, |
| // fetching values based on a range invoke. |
| // Uses rax as temporary. |
| .macro LOOP_RANGE_OVER_SHORTY_LOADING_GPRS gpr_reg64, gpr_reg32, shorty, arg_index, stack_index, finished |
| 1: // LOOP |
| movb (REG_VAR(shorty)), %al // al := *shorty |
| addq MACRO_LITERAL(1), REG_VAR(shorty) // shorty++ |
| cmpb MACRO_LITERAL(0), %al // if (al == '\0') goto finished |
| je VAR(finished) |
| cmpb MACRO_LITERAL(74), %al // if (al == 'J') goto FOUND_LONG |
| je 2f |
| cmpb MACRO_LITERAL(70), %al // if (al == 'F') goto SKIP_FLOAT |
| je 3f |
| cmpb MACRO_LITERAL(68), %al // if (al == 'D') goto SKIP_DOUBLE |
| je 4f |
| movl (rFP, REG_VAR(arg_index), 4), REG_VAR(gpr_reg32) |
| addq MACRO_LITERAL(1), REG_VAR(arg_index) |
| addq MACRO_LITERAL(1), REG_VAR(stack_index) |
| jmp 5f |
| 2: // FOUND_LONG |
| movq (rFP, REG_VAR(arg_index), 4), REG_VAR(gpr_reg64) |
| addq MACRO_LITERAL(2), REG_VAR(arg_index) |
| addq MACRO_LITERAL(2), REG_VAR(stack_index) |
| jmp 5f |
| 3: // SKIP_FLOAT |
| addq MACRO_LITERAL(1), REG_VAR(arg_index) |
| addq MACRO_LITERAL(1), REG_VAR(stack_index) |
| jmp 1b |
| 4: // SKIP_DOUBLE |
| addq MACRO_LITERAL(2), REG_VAR(arg_index) |
| addq MACRO_LITERAL(2), REG_VAR(stack_index) |
| jmp 1b |
| 5: |
| .endm |
| |
| // Puts the next int/long/object argument in the expected stack slot, |
| // fetching values based on a range invoke. |
| // Uses rax as temporary. |
| .macro LOOP_RANGE_OVER_INTs shorty, arg_index, stack_index, finished |
| 1: // LOOP |
| movb (REG_VAR(shorty)), %al // al := *shorty |
| addq MACRO_LITERAL(1), REG_VAR(shorty) // shorty++ |
| cmpb MACRO_LITERAL(0), %al // if (al == '\0') goto finished |
| je VAR(finished) |
| cmpb MACRO_LITERAL(74), %al // if (al == 'J') goto FOUND_LONG |
| je 2f |
| cmpb MACRO_LITERAL(70), %al // if (al == 'F') goto SKIP_FLOAT |
| je 3f |
| cmpb MACRO_LITERAL(68), %al // if (al == 'D') goto SKIP_DOUBLE |
| je 4f |
| movl (rFP, REG_VAR(arg_index), 4), %eax |
| movl %eax, 8(%rsp, REG_VAR(stack_index), 4) |
| addq MACRO_LITERAL(1), REG_VAR(arg_index) |
| addq MACRO_LITERAL(1), REG_VAR(stack_index) |
| jmp 1b |
| 2: // FOUND_LONG |
| movq (rFP, REG_VAR(arg_index), 4), %rax |
| movq %rax, 8(%rsp, REG_VAR(stack_index), 4) |
| addq MACRO_LITERAL(2), REG_VAR(arg_index) |
| addq MACRO_LITERAL(2), REG_VAR(stack_index) |
| jmp 1b |
| 3: // SKIP_FLOAT |
| addq MACRO_LITERAL(1), REG_VAR(arg_index) |
| addq MACRO_LITERAL(1), REG_VAR(stack_index) |
| jmp 1b |
| 4: // SKIP_DOUBLE |
| addq MACRO_LITERAL(2), REG_VAR(arg_index) |
| addq MACRO_LITERAL(2), REG_VAR(stack_index) |
| jmp 1b |
| .endm |
| |
| // Puts the next floating point parameter passed in physical register |
| // in the expected dex register array entry. |
| // Uses rax as temporary. |
| .macro LOOP_OVER_SHORTY_STORING_XMMS xmm_reg, shorty, arg_index, fp, finished |
| 1: // LOOP |
| movb (REG_VAR(shorty)), %al // al := *shorty |
| addq MACRO_LITERAL(1), REG_VAR(shorty) // shorty++ |
| cmpb MACRO_LITERAL(0), %al // if (al == '\0') goto finished |
| je VAR(finished) |
| cmpb MACRO_LITERAL(68), %al // if (al == 'D') goto FOUND_DOUBLE |
| je 2f |
| cmpb MACRO_LITERAL(70), %al // if (al == 'F') goto FOUND_FLOAT |
| je 3f |
| addq MACRO_LITERAL(1), REG_VAR(arg_index) |
| // Handle extra argument in arg array taken by a long. |
| cmpb MACRO_LITERAL(74), %al // if (al != 'J') goto LOOP |
| jne 1b |
| addq MACRO_LITERAL(1), REG_VAR(arg_index) |
| jmp 1b // goto LOOP |
| 2: // FOUND_DOUBLE |
| movsd REG_VAR(xmm_reg),(REG_VAR(fp), REG_VAR(arg_index), 4) |
| addq MACRO_LITERAL(2), REG_VAR(arg_index) |
| jmp 4f |
| 3: // FOUND_FLOAT |
| movss REG_VAR(xmm_reg), (REG_VAR(fp), REG_VAR(arg_index), 4) |
| addq MACRO_LITERAL(1), REG_VAR(arg_index) |
| 4: |
| .endm |
| |
| // Puts the next int/long/object parameter passed in physical register |
| // in the expected dex register array entry, and in case of object in the |
| // expected reference array entry. |
| // Uses rax as temporary. |
| .macro LOOP_OVER_SHORTY_STORING_GPRS gpr_reg64, gpr_reg32, shorty, arg_index, regs, refs, finished |
| 1: // LOOP |
| movb (REG_VAR(shorty)), %al // al := *shorty |
| addq MACRO_LITERAL(1), REG_VAR(shorty) // shorty++ |
| cmpb MACRO_LITERAL(0), %al // if (al == '\0') goto finished |
| je VAR(finished) |
| cmpb MACRO_LITERAL(74), %al // if (al == 'J') goto FOUND_LONG |
| je 2f |
| cmpb MACRO_LITERAL(70), %al // if (al == 'F') goto SKIP_FLOAT |
| je 3f |
| cmpb MACRO_LITERAL(68), %al // if (al == 'D') goto SKIP_DOUBLE |
| je 4f |
| movl REG_VAR(gpr_reg32), (REG_VAR(regs), REG_VAR(arg_index), 4) |
| cmpb MACRO_LITERAL(76), %al // if (al != 'L') goto NOT_REFERENCE |
| jne 6f |
| movl REG_VAR(gpr_reg32), (REG_VAR(refs), REG_VAR(arg_index), 4) |
| 6: // NOT_REFERENCE |
| addq MACRO_LITERAL(1), REG_VAR(arg_index) |
| jmp 5f |
| 2: // FOUND_LONG |
| movq REG_VAR(gpr_reg64), (REG_VAR(regs), REG_VAR(arg_index), 4) |
| addq MACRO_LITERAL(2), REG_VAR(arg_index) |
| jmp 5f |
| 3: // SKIP_FLOAT |
| addq MACRO_LITERAL(1), REG_VAR(arg_index) |
| jmp 1b |
| 4: // SKIP_DOUBLE |
| addq MACRO_LITERAL(2), REG_VAR(arg_index) |
| jmp 1b |
| 5: |
| .endm |
| |
| // Puts the next floating point parameter passed in stack |
| // in the expected dex register array entry. |
| // Uses rax as temporary. |
| // |
| // TODO: Or we could just spill regs to the reserved slots in the caller's |
| // frame and copy all regs in a simple loop. This time, however, we would |
| // need to look at the shorty anyway to look for the references. |
| // (The trade-off is different for passing arguments and receiving them.) |
| .macro LOOP_OVER_FPs shorty, arg_index, regs, stack_ptr, finished |
| 1: // LOOP |
| movb (REG_VAR(shorty)), %al // al := *shorty |
| addq MACRO_LITERAL(1), REG_VAR(shorty) // shorty++ |
| cmpb MACRO_LITERAL(0), %al // if (al == '\0') goto finished |
| je VAR(finished) |
| cmpb MACRO_LITERAL(68), %al // if (al == 'D') goto FOUND_DOUBLE |
| je 2f |
| cmpb MACRO_LITERAL(70), %al // if (al == 'F') goto FOUND_FLOAT |
| je 3f |
| addq MACRO_LITERAL(1), REG_VAR(arg_index) |
| // Handle extra argument in arg array taken by a long. |
| cmpb MACRO_LITERAL(74), %al // if (al != 'J') goto LOOP |
| jne 1b |
| addq MACRO_LITERAL(1), REG_VAR(arg_index) |
| jmp 1b // goto LOOP |
| 2: // FOUND_DOUBLE |
| movq OFFSET_TO_FIRST_ARGUMENT_IN_STACK(REG_VAR(stack_ptr), REG_VAR(arg_index), 4), %rax |
| movq %rax, (REG_VAR(regs), REG_VAR(arg_index), 4) |
| addq MACRO_LITERAL(2), REG_VAR(arg_index) |
| jmp 1b |
| 3: // FOUND_FLOAT |
| movl OFFSET_TO_FIRST_ARGUMENT_IN_STACK(REG_VAR(stack_ptr), REG_VAR(arg_index), 4), %eax |
| movl %eax, (REG_VAR(regs), REG_VAR(arg_index), 4) |
| addq MACRO_LITERAL(1), REG_VAR(arg_index) |
| jmp 1b |
| .endm |
| |
| // Puts the next int/long/object parameter passed in stack |
| // in the expected dex register array entry, and in case of object in the |
| // expected reference array entry. |
| // Uses rax as temporary. |
| .macro LOOP_OVER_INTs shorty, arg_index, regs, refs, stack_ptr, finished |
| 1: // LOOP |
| movb (REG_VAR(shorty)), %al // al := *shorty |
| addq MACRO_LITERAL(1), REG_VAR(shorty) // shorty++ |
| cmpb MACRO_LITERAL(0), %al // if (al == '\0') goto finished |
| je VAR(finished) |
| cmpb MACRO_LITERAL(74), %al // if (al == 'J') goto FOUND_LONG |
| je 2f |
| cmpb MACRO_LITERAL(76), %al // if (al == 'L') goto FOUND_REFERENCE |
| je 6f |
| cmpb MACRO_LITERAL(70), %al // if (al == 'F') goto SKIP_FLOAT |
| je 3f |
| cmpb MACRO_LITERAL(68), %al // if (al == 'D') goto SKIP_DOUBLE |
| je 4f |
| movl OFFSET_TO_FIRST_ARGUMENT_IN_STACK(REG_VAR(stack_ptr), REG_VAR(arg_index), 4), %eax |
| movl %eax, (REG_VAR(regs), REG_VAR(arg_index), 4) |
| addq MACRO_LITERAL(1), REG_VAR(arg_index) |
| jmp 1b |
| 6: // FOUND_REFERENCE |
| movl OFFSET_TO_FIRST_ARGUMENT_IN_STACK(REG_VAR(stack_ptr), REG_VAR(arg_index), 4), %eax |
| movl %eax, (REG_VAR(regs), REG_VAR(arg_index), 4) |
| movl %eax, (REG_VAR(refs), REG_VAR(arg_index), 4) |
| addq MACRO_LITERAL(1), REG_VAR(arg_index) |
| jmp 1b |
| 2: // FOUND_LONG |
| movq OFFSET_TO_FIRST_ARGUMENT_IN_STACK(REG_VAR(stack_ptr), REG_VAR(arg_index), 4), %rax |
| movq %rax, (REG_VAR(regs), REG_VAR(arg_index), 4) |
| addq MACRO_LITERAL(2), REG_VAR(arg_index) |
| jmp 1b |
| 3: // SKIP_FLOAT |
| addq MACRO_LITERAL(1), REG_VAR(arg_index) |
| jmp 1b |
| 4: // SKIP_DOUBLE |
| addq MACRO_LITERAL(2), REG_VAR(arg_index) |
| jmp 1b |
| .endm |
| |
| // Increase method hotness and do suspend check before starting executing the method. |
| .macro START_EXECUTING_INSTRUCTIONS |
| movq (%rsp), %rdi |
| addw $$1, ART_METHOD_HOTNESS_COUNT_OFFSET(%rdi) |
| andw $$(NTERP_HOTNESS_MASK), ART_METHOD_HOTNESS_COUNT_OFFSET(%rdi) |
| jz 2f |
| testl $$(THREAD_SUSPEND_OR_CHECKPOINT_REQUEST), rSELF:THREAD_FLAGS_OFFSET |
| jz 1f |
| EXPORT_PC |
| call SYMBOL(art_quick_test_suspend) |
| 1: |
| FETCH_INST |
| GOTO_NEXT |
| 2: |
| movq $$0, %rsi |
| movq rFP, %rdx |
| call nterp_hot_method |
| jmp 1b |
| .endm |
| |
| .macro SPILL_ALL_CALLEE_SAVES |
| PUSH r15 |
| PUSH r14 |
| PUSH r13 |
| PUSH r12 |
| PUSH rbp |
| PUSH rbx |
| SETUP_FP_CALLEE_SAVE_FRAME |
| .endm |
| |
| .macro RESTORE_ALL_CALLEE_SAVES |
| RESTORE_FP_CALLEE_SAVE_FRAME |
| POP rbx |
| POP rbp |
| POP r12 |
| POP r13 |
| POP r14 |
| POP r15 |
| .endm |
| |
| // Helper to setup the stack after doing a nterp to nterp call. This will setup: |
| // - rNEW_FP: the new pointer to dex registers |
| // - rNEW_REFS: the new pointer to references |
| // - rPC: the new PC pointer to execute |
| // - edi: number of arguments |
| // - ecx: first dex register |
| // |
| // This helper expects: |
| // - rax to contain the code item |
| .macro SETUP_STACK_FOR_INVOKE |
| // We do the same stack overflow check as the compiler. See CanMethodUseNterp |
| // in how we limit the maximum nterp frame size. |
| testq %rax, -STACK_OVERFLOW_RESERVED_BYTES(%rsp) |
| |
| // Spill all callee saves to have a consistent stack frame whether we |
| // are called by compiled code or nterp. |
| SPILL_ALL_CALLEE_SAVES |
| |
| // Setup the frame. |
| SETUP_STACK_FRAME %rax, rNEW_REFS, rNEW_REFS32, rNEW_FP, CFI_NEW_REFS, load_ins=0 |
| // Make r11 point to the top of the dex register array. |
| leaq (rNEW_FP, %rbx, 4), %r11 |
| |
| // Fetch instruction information before replacing rPC. |
| movzbl 1(rPC), %edi |
| movzwl 4(rPC), %ecx |
| |
| // Set the dex pc pointer. |
| movq %rax, rPC |
| CFI_DEFINE_DEX_PC_WITH_OFFSET(CFI_TMP, CFI_DEX, 0) |
| .endm |
| |
| // Setup arguments based on a non-range nterp to nterp call, and start executing |
| // the method. We expect: |
| // - rNEW_FP: the new pointer to dex registers |
| // - rNEW_REFS: the new pointer to references |
| // - rPC: the new PC pointer to execute |
| // - edi: number of arguments |
| // - ecx: first dex register |
| // - r11: top of dex register array |
| // - esi: receiver if non-static. |
| .macro SETUP_NON_RANGE_ARGUMENTS_AND_EXECUTE is_static=0, is_string_init=0 |
| // Now all temporary registers (except r11 containing top of registers array) |
| // are available, copy the parameters. |
| // /* op vA, vB, {vC...vG} */ |
| movl %edi, %eax |
| shrl $$4, %eax # Number of arguments |
| jz 6f # shl sets the Z flag |
| movq MACRO_LITERAL(-1), %r10 |
| cmpl MACRO_LITERAL(2), %eax |
| jl 1f |
| je 2f |
| cmpl MACRO_LITERAL(4), %eax |
| jl 3f |
| je 4f |
| |
| // We use a decrementing r10 to store references relative |
| // to rNEW_FP and dex registers relative to r11. |
| // |
| // TODO: We could set up r10 as the number of registers (this can be an additional output from |
| // SETUP_STACK_FOR_INVOKE) and then just decrement it by one before copying each arg to |
| // (rNEW_FP, r10, 4) and (rNEW_REFS, r10, 4). |
| // Maybe even introduce macros NEW_VREG_ADDRESS/NEW_VREG_REF_ADDRESS. |
| 5: |
| andq MACRO_LITERAL(15), %rdi |
| GET_VREG_OBJECT %edx, %rdi |
| movl %edx, (rNEW_FP, %r10, 4) |
| GET_VREG %edx, %rdi |
| movl %edx, (%r11, %r10, 4) |
| subq MACRO_LITERAL(1), %r10 |
| 4: |
| movl %ecx, %eax |
| shrl MACRO_LITERAL(12), %eax |
| GET_VREG_OBJECT %edx, %rax |
| movl %edx, (rNEW_FP, %r10, 4) |
| GET_VREG %edx, %rax |
| movl %edx, (%r11, %r10, 4) |
| subq MACRO_LITERAL(1), %r10 |
| 3: |
| movl %ecx, %eax |
| shrl MACRO_LITERAL(8), %eax |
| andl MACRO_LITERAL(0xf), %eax |
| GET_VREG_OBJECT %edx, %rax |
| movl %edx, (rNEW_FP, %r10, 4) |
| GET_VREG %edx, %rax |
| movl %edx, (%r11, %r10, 4) |
| subq MACRO_LITERAL(1), %r10 |
| 2: |
| movl %ecx, %eax |
| shrl MACRO_LITERAL(4), %eax |
| andl MACRO_LITERAL(0xf), %eax |
| GET_VREG_OBJECT %edx, %rax |
| movl %edx, (rNEW_FP, %r10, 4) |
| GET_VREG %edx, %rax |
| movl %edx, (%r11, %r10, 4) |
| subq MACRO_LITERAL(1), %r10 |
| 1: |
| .if \is_string_init |
| // Ignore the first argument |
| .elseif \is_static |
| movl %ecx, %eax |
| andq MACRO_LITERAL(0x000f), %rax |
| GET_VREG_OBJECT %edx, %rax |
| movl %edx, (rNEW_FP, %r10, 4) |
| GET_VREG %edx, %rax |
| movl %edx, (%r11, %r10, 4) |
| .else |
| movl %esi, (rNEW_FP, %r10, 4) |
| movl %esi, (%r11, %r10, 4) |
| .endif |
| |
| 6: |
| // Start executing the method. |
| movq rNEW_FP, rFP |
| movq rNEW_REFS, rREFS |
| CFI_DEF_CFA_BREG_PLUS_UCONST CFI_REFS, -8, ((6 + 4 + 1) * 8) |
| START_EXECUTING_INSTRUCTIONS |
| .endm |
| |
| // Setup arguments based on a range nterp to nterp call, and start executing |
| // the method. |
| .macro SETUP_RANGE_ARGUMENTS_AND_EXECUTE is_static=0, is_string_init=0 |
| // edi is number of arguments |
| // ecx is first register |
| movq MACRO_LITERAL(-4), %r10 |
| .if \is_string_init |
| // Ignore the first argument |
| subl $$1, %edi |
| addl $$1, %ecx |
| .elseif !\is_static |
| subl $$1, %edi |
| addl $$1, %ecx |
| .endif |
| |
| testl %edi, %edi |
| je 2f |
| leaq (rREFS, %rcx, 4), %rax # pointer to first argument in reference array |
| leaq (%rax, %rdi, 4), %rax # pointer to last argument in reference array |
| leaq (rFP, %rcx, 4), %rcx # pointer to first argument in register array |
| leaq (%rcx, %rdi, 4), %rdi # pointer to last argument in register array |
| // TODO: Same comment for copying arguments as in SETUP_NON_RANGE_ARGUMENTS_AND_EXECUTE. |
| 1: |
| movl -4(%rax), %edx |
| movl %edx, (rNEW_FP, %r10, 1) |
| movl -4(%rdi), %edx |
| movl %edx, (%r11, %r10, 1) |
| subq MACRO_LITERAL(4), %r10 |
| subq MACRO_LITERAL(4), %rax |
| subq MACRO_LITERAL(4), %rdi |
| cmpq %rcx, %rdi |
| jne 1b |
| |
| 2: |
| .if \is_string_init |
| // Ignore first argument |
| .elseif !\is_static |
| movl %esi, (rNEW_FP, %r10, 1) |
| movl %esi, (%r11, %r10, 1) |
| .endif |
| movq rNEW_FP, rFP |
| movq rNEW_REFS, rREFS |
| CFI_DEF_CFA_BREG_PLUS_UCONST CFI_REFS, -8, ((6 + 4 + 1) * 8) |
| START_EXECUTING_INSTRUCTIONS |
| .endm |
| |
| .macro GET_SHORTY dest, is_interface, is_polymorphic, is_custom |
| push %rdi |
| push %rsi |
| .if \is_polymorphic |
| movq 16(%rsp), %rdi |
| movq rPC, %rsi |
| call SYMBOL(NterpGetShortyFromInvokePolymorphic) |
| .elseif \is_custom |
| movq 16(%rsp), %rdi |
| movq rPC, %rsi |
| call SYMBOL(NterpGetShortyFromInvokeCustom) |
| .elseif \is_interface |
| movq 16(%rsp), %rdi |
| movzwl 2(rPC), %esi |
| call SYMBOL(NterpGetShortyFromMethodId) |
| .else |
| call SYMBOL(NterpGetShorty) |
| .endif |
| pop %rsi |
| pop %rdi |
| movq %rax, \dest |
| .endm |
| |
| // Uses r9 as temporary. |
| .macro DO_ENTRY_POINT_CHECK call_compiled_code |
| // On entry, the method is %rdi, the instance is %rsi |
| leaq ExecuteNterpImpl(%rip), %r9 |
| cmpq %r9, ART_METHOD_QUICK_CODE_OFFSET_64(%rdi) |
| jne VAR(call_compiled_code) |
| |
| movq ART_METHOD_DATA_OFFSET_64(%rdi), %rax |
| .endm |
| |
| // Uses r9 and r10 as temporary |
| .macro UPDATE_REGISTERS_FOR_STRING_INIT old_value, new_value |
| movq rREFS, %r9 |
| movq rFP, %r10 |
| 1: |
| cmpl (%r9), \old_value |
| jne 2f |
| movl \new_value, (%r9) |
| movl \new_value, (%r10) |
| 2: |
| addq $$4, %r9 |
| addq $$4, %r10 |
| cmpq %r9, rFP |
| jne 1b |
| .endm |
| |
| .macro COMMON_INVOKE_NON_RANGE is_static=0, is_interface=0, suffix="", is_string_init=0, is_polymorphic=0, is_custom=0 |
| .if \is_polymorphic |
| // We always go to compiled code for polymorphic calls. |
| .elseif \is_custom |
| // We always go to compiled code for custom calls. |
| .else |
| DO_ENTRY_POINT_CHECK .Lcall_compiled_code_\suffix |
| .if \is_string_init |
| call nterp_to_nterp_string_init_non_range |
| .elseif \is_static |
| call nterp_to_nterp_static_non_range |
| .else |
| call nterp_to_nterp_instance_non_range |
| .endif |
| jmp .Ldone_return_\suffix |
| .endif |
| |
| .Lcall_compiled_code_\suffix: |
| .if \is_interface |
| // Save interface method, used for conflict resolution, in a callee-save register. |
| movq %rax, %xmm12 |
| .endif |
| GET_SHORTY rINSTq, \is_interface, \is_polymorphic, \is_custom |
| // From this point: |
| // - rISNTq contains shorty (in callee-save to switch over return value after call). |
| // - rdi contains method |
| // - rsi contains 'this' pointer for instance method. |
| leaq 1(rINSTq), %r9 // shorty + 1 ; ie skip return arg character |
| movzwl 4(rPC), %r11d // arguments |
| .if \is_string_init |
| shrq MACRO_LITERAL(4), %r11 |
| movq $$1, %r10 // ignore first argument |
| .elseif \is_static |
| movq $$0, %r10 // arg_index |
| .else |
| shrq MACRO_LITERAL(4), %r11 |
| movq $$1, %r10 // arg_index |
| .endif |
| LOOP_OVER_SHORTY_LOADING_XMMS xmm0, r11, r9, r10, .Lxmm_setup_finished_\suffix |
| LOOP_OVER_SHORTY_LOADING_XMMS xmm1, r11, r9, r10, .Lxmm_setup_finished_\suffix |
| LOOP_OVER_SHORTY_LOADING_XMMS xmm2, r11, r9, r10, .Lxmm_setup_finished_\suffix |
| LOOP_OVER_SHORTY_LOADING_XMMS xmm3, r11, r9, r10, .Lxmm_setup_finished_\suffix |
| LOOP_OVER_SHORTY_LOADING_XMMS xmm4, r11, r9, r10, .Lxmm_setup_finished_\suffix |
| .Lxmm_setup_finished_\suffix: |
| leaq 1(rINSTq), %r9 // shorty + 1 ; ie skip return arg character |
| movzwl 4(rPC), %r11d // arguments |
| .if \is_string_init |
| movq $$1, %r10 // ignore first argument |
| shrq MACRO_LITERAL(4), %r11 |
| LOOP_OVER_SHORTY_LOADING_GPRS rsi, esi, r11, r9, r10, .Lgpr_setup_finished_\suffix |
| .elseif \is_static |
| movq $$0, %r10 // arg_index |
| LOOP_OVER_SHORTY_LOADING_GPRS rsi, esi, r11, r9, r10, .Lgpr_setup_finished_\suffix |
| .else |
| shrq MACRO_LITERAL(4), %r11 |
| movq $$1, %r10 // arg_index |
| .endif |
| LOOP_OVER_SHORTY_LOADING_GPRS rdx, edx, r11, r9, r10, .Lgpr_setup_finished_\suffix |
| LOOP_OVER_SHORTY_LOADING_GPRS rcx, ecx, r11, r9, r10, .Lgpr_setup_finished_\suffix |
| LOOP_OVER_SHORTY_LOADING_GPRS r8, r8d, r11, r9, r10, .Lgpr_setup_finished_\suffix |
| LOOP_OVER_SHORTY_LOADING_GPRS r9, r9d, r11, r9, r10, .Lgpr_setup_finished_\suffix |
| .Lgpr_setup_finished_\suffix: |
| .if \is_polymorphic |
| call SYMBOL(art_quick_invoke_polymorphic) |
| .elseif \is_custom |
| call SYMBOL(art_quick_invoke_custom) |
| .else |
| .if \is_interface |
| movq %xmm12, %rax |
| .endif |
| call *ART_METHOD_QUICK_CODE_OFFSET_64(%rdi) // Call the method. |
| .endif |
| cmpb LITERAL(68), (rINSTq) // Test if result type char == 'D'. |
| je .Lreturn_double_\suffix |
| cmpb LITERAL(70), (rINSTq) // Test if result type char == 'F'. |
| jne .Ldone_return_\suffix |
| .Lreturn_float_\suffix: |
| movd %xmm0, %eax |
| jmp .Ldone_return_\suffix |
| .Lreturn_double_\suffix: |
| movq %xmm0, %rax |
| .Ldone_return_\suffix: |
| /* resume execution of caller */ |
| .if \is_string_init |
| movzwl 4(rPC), %r11d // arguments |
| andq $$0xf, %r11 |
| GET_VREG %esi, %r11 |
| UPDATE_REGISTERS_FOR_STRING_INIT %esi, %eax |
| .endif |
| |
| .if \is_polymorphic |
| ADVANCE_PC_FETCH_AND_GOTO_NEXT 4 |
| .else |
| ADVANCE_PC_FETCH_AND_GOTO_NEXT 3 |
| .endif |
| .endm |
| |
| .macro COMMON_INVOKE_RANGE is_static=0, is_interface=0, suffix="", is_string_init=0, is_polymorphic=0, is_custom=0 |
| .if \is_polymorphic |
| // We always go to compiled code for polymorphic calls. |
| .elseif \is_custom |
| // We always go to compiled code for custom calls. |
| .else |
| DO_ENTRY_POINT_CHECK .Lcall_compiled_code_range_\suffix |
| .if \is_string_init |
| call nterp_to_nterp_string_init_range |
| .elseif \is_static |
| call nterp_to_nterp_static_range |
| .else |
| call nterp_to_nterp_instance_range |
| .endif |
| jmp .Ldone_return_range_\suffix |
| .endif |
| |
| .Lcall_compiled_code_range_\suffix: |
| .if \is_interface |
| // Save interface method, used for conflict resolution, in a callee-saved register. |
| movq %rax, %xmm12 |
| .endif |
| GET_SHORTY rINSTq, \is_interface, \is_polymorphic, \is_custom |
| // From this point: |
| // - rINSTq contains shorty (in callee-save to switch over return value after call). |
| // - rdi contains method |
| // - rsi contains 'this' pointer for instance method. |
| leaq 1(rINSTq), %r9 // shorty + 1 ; ie skip return arg character |
| movzwl 4(rPC), %r10d // arg start index |
| .if \is_string_init |
| addq $$1, %r10 // arg start index |
| movq $$1, %rbp // index in stack |
| .elseif \is_static |
| movq $$0, %rbp // index in stack |
| .else |
| addq $$1, %r10 // arg start index |
| movq $$1, %rbp // index in stack |
| .endif |
| LOOP_RANGE_OVER_SHORTY_LOADING_XMMS xmm0, r9, r10, rbp, .Lxmm_setup_finished_range_\suffix |
| LOOP_RANGE_OVER_SHORTY_LOADING_XMMS xmm1, r9, r10, rbp, .Lxmm_setup_finished_range_\suffix |
| LOOP_RANGE_OVER_SHORTY_LOADING_XMMS xmm2, r9, r10, rbp, .Lxmm_setup_finished_range_\suffix |
| LOOP_RANGE_OVER_SHORTY_LOADING_XMMS xmm3, r9, r10, rbp, .Lxmm_setup_finished_range_\suffix |
| LOOP_RANGE_OVER_SHORTY_LOADING_XMMS xmm4, r9, r10, rbp, .Lxmm_setup_finished_range_\suffix |
| LOOP_RANGE_OVER_SHORTY_LOADING_XMMS xmm5, r9, r10, rbp, .Lxmm_setup_finished_range_\suffix |
| LOOP_RANGE_OVER_SHORTY_LOADING_XMMS xmm6, r9, r10, rbp, .Lxmm_setup_finished_range_\suffix |
| LOOP_RANGE_OVER_SHORTY_LOADING_XMMS xmm7, r9, r10, rbp, .Lxmm_setup_finished_range_\suffix |
| LOOP_RANGE_OVER_FPs r9, r10, rbp, .Lxmm_setup_finished_range_\suffix |
| .Lxmm_setup_finished_range_\suffix: |
| leaq 1(%rbx), %r11 // shorty + 1 ; ie skip return arg character |
| movzwl 4(rPC), %r10d // arg start index |
| .if \is_string_init |
| addq $$1, %r10 // arg start index |
| movq $$1, %rbp // index in stack |
| LOOP_RANGE_OVER_SHORTY_LOADING_GPRS rsi, esi, r11, r10, rbp, .Lgpr_setup_finished_range_\suffix |
| .elseif \is_static |
| movq $$0, %rbp // index in stack |
| LOOP_RANGE_OVER_SHORTY_LOADING_GPRS rsi, esi, r11, r10, rbp, .Lgpr_setup_finished_range_\suffix |
| .else |
| addq $$1, %r10 // arg start index |
| movq $$1, %rbp // index in stack |
| .endif |
| LOOP_RANGE_OVER_SHORTY_LOADING_GPRS rdx, edx, r11, r10, rbp, .Lgpr_setup_finished_range_\suffix |
| LOOP_RANGE_OVER_SHORTY_LOADING_GPRS rcx, ecx, r11, r10, rbp, .Lgpr_setup_finished_range_\suffix |
| LOOP_RANGE_OVER_SHORTY_LOADING_GPRS r8, r8d, r11, r10, rbp, .Lgpr_setup_finished_range_\suffix |
| LOOP_RANGE_OVER_SHORTY_LOADING_GPRS r9, r9d, r11, r10, rbp, .Lgpr_setup_finished_range_\suffix |
| LOOP_RANGE_OVER_INTs r11, r10, rbp, .Lgpr_setup_finished_range_\suffix |
| |
| .Lgpr_setup_finished_range_\suffix: |
| .if \is_polymorphic |
| call SYMBOL(art_quick_invoke_polymorphic) |
| .elseif \is_custom |
| call SYMBOL(art_quick_invoke_custom) |
| .else |
| .if \is_interface |
| // Set the hidden argument for conflict resolution. |
| movq %xmm12, %rax |
| .endif |
| call *ART_METHOD_QUICK_CODE_OFFSET_64(%rdi) // Call the method. |
| .endif |
| cmpb LITERAL(68), (%rbx) // Test if result type char == 'D'. |
| je .Lreturn_range_double_\suffix |
| cmpb LITERAL(70), (%rbx) // Test if result type char == 'F'. |
| je .Lreturn_range_float_\suffix |
| /* resume execution of caller */ |
| .Ldone_return_range_\suffix: |
| .if \is_string_init |
| movzwl 4(rPC), %r11d // arguments |
| GET_VREG %esi, %r11 |
| UPDATE_REGISTERS_FOR_STRING_INIT %esi, %eax |
| .endif |
| |
| .if \is_polymorphic |
| ADVANCE_PC_FETCH_AND_GOTO_NEXT 4 |
| .else |
| ADVANCE_PC_FETCH_AND_GOTO_NEXT 3 |
| .endif |
| .Lreturn_range_double_\suffix: |
| movq %xmm0, %rax |
| jmp .Ldone_return_range_\suffix |
| .Lreturn_range_float_\suffix: |
| movd %xmm0, %eax |
| jmp .Ldone_return_range_\suffix |
| .endm |
| |
| // Fetch some information from the thread cache. |
| // Uses rax, rdx, rcx as temporaries. |
| .macro FETCH_FROM_THREAD_CACHE dest_reg, slow_path |
| movq rSELF:THREAD_SELF_OFFSET, %rax |
| movq rPC, %rdx |
| salq MACRO_LITERAL(THREAD_INTERPRETER_CACHE_SIZE_SHIFT), %rdx |
| andq MACRO_LITERAL(THREAD_INTERPRETER_CACHE_SIZE_MASK), %rdx |
| cmpq THREAD_INTERPRETER_CACHE_OFFSET(%rax, %rdx, 1), rPC |
| jne \slow_path |
| movq __SIZEOF_POINTER__+THREAD_INTERPRETER_CACHE_OFFSET(%rax, %rdx, 1), \dest_reg |
| .endm |
| |
| // Helper for static field get. |
| .macro OP_SGET load="movl", wide="0" |
| // Fast-path which gets the field from thread-local cache. |
| FETCH_FROM_THREAD_CACHE %rax, 2f |
| 1: |
| movl ART_FIELD_OFFSET_OFFSET(%rax), %edx |
| movl ART_FIELD_DECLARING_CLASS_OFFSET(%rax), %eax |
| cmpq $$0, rSELF:THREAD_READ_BARRIER_MARK_REG00_OFFSET |
| jne 3f |
| 4: |
| .if \wide |
| movq (%eax,%edx,1), %rax |
| SET_WIDE_VREG %rax, rINSTq # fp[A] <- value |
| .else |
| \load (%eax, %edx, 1), %eax |
| SET_VREG %eax, rINSTq # fp[A] <- value |
| .endif |
| ADVANCE_PC_FETCH_AND_GOTO_NEXT 2 |
| 2: |
| EXPORT_PC |
| movq rSELF:THREAD_SELF_OFFSET, %rdi |
| movq 0(%rsp), %rsi |
| movq rPC, %rdx |
| movq $$0, %rcx |
| call nterp_get_static_field |
| // Clear the marker that we put for volatile fields. The x86 memory |
| // model doesn't require a barrier. |
| andq $$-2, %rax |
| jmp 1b |
| 3: |
| call art_quick_read_barrier_mark_reg00 |
| jmp 4b |
| .endm |
| |
| // Helper for static field put. |
| .macro OP_SPUT rINST_reg="rINST", store="movl", wide="0": |
| // Fast-path which gets the field from thread-local cache. |
| FETCH_FROM_THREAD_CACHE %rax, 2f |
| 1: |
| movl ART_FIELD_OFFSET_OFFSET(%rax), %edx |
| movl ART_FIELD_DECLARING_CLASS_OFFSET(%rax), %eax |
| cmpq $$0, rSELF:THREAD_READ_BARRIER_MARK_REG00_OFFSET |
| jne 3f |
| 4: |
| .if \wide |
| GET_WIDE_VREG rINSTq, rINSTq # rINST <- v[A] |
| .else |
| GET_VREG rINST, rINSTq # rINST <- v[A] |
| .endif |
| \store \rINST_reg, (%rax,%rdx,1) |
| ADVANCE_PC_FETCH_AND_GOTO_NEXT 2 |
| 2: |
| EXPORT_PC |
| movq rSELF:THREAD_SELF_OFFSET, %rdi |
| movq 0(%rsp), %rsi |
| movq rPC, %rdx |
| movq $$0, %rcx |
| call nterp_get_static_field |
| testq MACRO_LITERAL(1), %rax |
| je 1b |
| // Clear the marker that we put for volatile fields. The x86 memory |
| // model doesn't require a barrier. |
| CLEAR_VOLATILE_MARKER %rax |
| movl ART_FIELD_OFFSET_OFFSET(%rax), %edx |
| movl ART_FIELD_DECLARING_CLASS_OFFSET(%rax), %eax |
| cmpq $$0, rSELF:THREAD_READ_BARRIER_MARK_REG00_OFFSET |
| jne 6f |
| 5: |
| .if \wide |
| GET_WIDE_VREG rINSTq, rINSTq # rINST <- v[A] |
| .else |
| GET_VREG rINST, rINSTq # rINST <- v[A] |
| .endif |
| \store \rINST_reg, (%rax,%rdx,1) |
| lock addl $$0, (%rsp) |
| ADVANCE_PC_FETCH_AND_GOTO_NEXT 2 |
| 3: |
| call art_quick_read_barrier_mark_reg00 |
| jmp 4b |
| 6: |
| call art_quick_read_barrier_mark_reg00 |
| jmp 5b |
| .endm |
| |
| |
| .macro OP_IPUT_INTERNAL rINST_reg="rINST", store="movl", wide="0": |
| movzbq rINSTbl, %rcx # rcx <- BA |
| sarl $$4, %ecx # ecx <- B |
| GET_VREG %ecx, %rcx # vB (object we're operating on) |
| testl %ecx, %ecx # is object null? |
| je common_errNullObject |
| andb $$0xf, rINSTbl # rINST <- A |
| .if \wide |
| GET_WIDE_VREG rINSTq, rINSTq # rax<- fp[A]/fp[A+1] |
| .else |
| GET_VREG rINST, rINSTq # rINST <- v[A] |
| .endif |
| \store \rINST_reg, (%rcx,%rax,1) |
| .endm |
| |
| // Helper for instance field put. |
| .macro OP_IPUT rINST_reg="rINST", store="movl", wide="0": |
| // Fast-path which gets the field from thread-local cache. |
| FETCH_FROM_THREAD_CACHE %rax, 2f |
| 1: |
| OP_IPUT_INTERNAL \rINST_reg, \store, \wide |
| ADVANCE_PC_FETCH_AND_GOTO_NEXT 2 |
| 2: |
| EXPORT_PC |
| movq rSELF:THREAD_SELF_OFFSET, %rdi |
| movq 0(%rsp), %rsi |
| movq rPC, %rdx |
| movq $$0, %rcx |
| call nterp_get_instance_field_offset |
| testl %eax, %eax |
| jns 1b |
| negl %eax |
| OP_IPUT_INTERNAL \rINST_reg, \store, \wide |
| lock addl $$0, (%rsp) |
| ADVANCE_PC_FETCH_AND_GOTO_NEXT 2 |
| .endm |
| |
| // Helper for instance field get. |
| .macro OP_IGET load="movl", wide="0" |
| // Fast-path which gets the field from thread-local cache. |
| FETCH_FROM_THREAD_CACHE %rax, 2f |
| 1: |
| movl rINST, %ecx # rcx <- BA |
| sarl $$4, %ecx # ecx <- B |
| GET_VREG %ecx, %rcx # vB (object we're operating on) |
| testl %ecx, %ecx # is object null? |
| je common_errNullObject |
| andb $$0xf,rINSTbl # rINST <- A |
| .if \wide |
| movq (%rcx,%rax,1), %rax |
| SET_WIDE_VREG %rax, rINSTq # fp[A] <- value |
| .else |
| \load (%rcx,%rax,1), %eax |
| SET_VREG %eax, rINSTq # fp[A] <- value |
| .endif |
| ADVANCE_PC_FETCH_AND_GOTO_NEXT 2 |
| 2: |
| EXPORT_PC |
| movq rSELF:THREAD_SELF_OFFSET, %rdi |
| movq 0(%rsp), %rsi |
| movq rPC, %rdx |
| movq $$0, %rcx |
| call nterp_get_instance_field_offset |
| testl %eax, %eax |
| jns 1b |
| negl %eax |
| jmp 1b |
| .endm |
| |
| %def entry(): |
| /* |
| * ArtMethod entry point. |
| * |
| * On entry: |
| * rdi ArtMethod* callee |
| * rest method parameters |
| */ |
| |
| OAT_ENTRY ExecuteNterpImpl, EndExecuteNterpImpl |
| .cfi_startproc |
| .cfi_def_cfa rsp, 8 |
| testq %rax, -STACK_OVERFLOW_RESERVED_BYTES(%rsp) |
| /* Spill callee save regs */ |
| SPILL_ALL_CALLEE_SAVES |
| |
| // TODO: Get shorty in a better way and remove below |
| PUSH rdi |
| PUSH rsi |
| PUSH rdx |
| PUSH rcx |
| PUSH r8 |
| PUSH r9 |
| |
| // Save xmm registers + alignment. |
| subq MACRO_LITERAL(8 * 8 + 8), %rsp |
| CFI_ADJUST_CFA_OFFSET(8 * 8 + 8) |
| movq %xmm0, 0(%rsp) |
| movq %xmm1, 8(%rsp) |
| movq %xmm2, 16(%rsp) |
| movq %xmm3, 24(%rsp) |
| movq %xmm4, 32(%rsp) |
| movq %xmm5, 40(%rsp) |
| movq %xmm6, 48(%rsp) |
| movq %xmm7, 56(%rsp) |
| |
| call SYMBOL(NterpGetShorty) |
| // Save shorty in callee-save rbp. |
| movq %rax, %rbp |
| |
| // Restore xmm registers + alignment. |
| movq 0(%rsp), %xmm0 |
| movq 8(%rsp), %xmm1 |
| movq 16(%rsp), %xmm2 |
| movq 24(%rsp), %xmm3 |
| movq 32(%rsp), %xmm4 |
| movq 40(%rsp), %xmm5 |
| movq 48(%rsp), %xmm6 |
| movq 56(%rsp), %xmm7 |
| addq MACRO_LITERAL(8 * 8 + 8), %rsp |
| CFI_ADJUST_CFA_OFFSET(-8 * 8 - 8) |
| |
| POP r9 |
| POP r8 |
| POP rcx |
| POP rdx |
| POP rsi |
| POP rdi |
| // TODO: Get shorty in a better way and remove above |
| |
| movq ART_METHOD_DATA_OFFSET_64(%rdi), rPC |
| |
| // Setup the stack for executing the method. |
| SETUP_STACK_FRAME rPC, rREFS, rREFS32, rFP, CFI_REFS, load_ins=1 |
| |
| // Setup the parameters |
| testl %r14d, %r14d |
| je .Lxmm_setup_finished |
| |
| subq %r14, %rbx |
| salq $$2, %rbx // rbx is now the offset for inputs into the registers array. |
| |
| testl $$ART_METHOD_IS_STATIC_FLAG, ART_METHOD_ACCESS_FLAGS_OFFSET(%rdi) |
| |
| // Available: rdi, r10, r14 |
| // Note the leaq below don't change the flags. |
| leaq 1(%rbp), %r10 // shorty + 1 ; ie skip return arg character |
| leaq (rFP, %rbx, 1), %rdi |
| leaq (rREFS, %rbx, 1), %rbx |
| jne .Lhandle_static_method |
| movl %esi, (%rdi) |
| movl %esi, (%rbx) |
| addq $$4, %rdi |
| addq $$4, %rbx |
| addq $$4, %r11 |
| movq $$0, %r14 |
| jmp .Lcontinue_setup_gprs |
| .Lhandle_static_method: |
| movq $$0, %r14 |
| LOOP_OVER_SHORTY_STORING_GPRS rsi, esi, r10, r14, rdi, rbx, .Lgpr_setup_finished |
| .Lcontinue_setup_gprs: |
| LOOP_OVER_SHORTY_STORING_GPRS rdx, edx, r10, r14, rdi, rbx, .Lgpr_setup_finished |
| LOOP_OVER_SHORTY_STORING_GPRS rcx, ecx, r10, r14, rdi, rbx, .Lgpr_setup_finished |
| LOOP_OVER_SHORTY_STORING_GPRS r8, r8d, r10, r14, rdi, rbx, .Lgpr_setup_finished |
| LOOP_OVER_SHORTY_STORING_GPRS r9, r9d, r10, r14, rdi, rbx, .Lgpr_setup_finished |
| LOOP_OVER_INTs r10, r14, rdi, rbx, r11, .Lgpr_setup_finished |
| .Lgpr_setup_finished: |
| leaq 1(%rbp), %r10 // shorty + 1 ; ie skip return arg character |
| movq $$0, %r14 // reset counter |
| LOOP_OVER_SHORTY_STORING_XMMS xmm0, r10, r14, rdi, .Lxmm_setup_finished |
| LOOP_OVER_SHORTY_STORING_XMMS xmm1, r10, r14, rdi, .Lxmm_setup_finished |
| LOOP_OVER_SHORTY_STORING_XMMS xmm2, r10, r14, rdi, .Lxmm_setup_finished |
| LOOP_OVER_SHORTY_STORING_XMMS xmm3, r10, r14, rdi, .Lxmm_setup_finished |
| LOOP_OVER_SHORTY_STORING_XMMS xmm4, r10, r14, rdi, .Lxmm_setup_finished |
| LOOP_OVER_SHORTY_STORING_XMMS xmm5, r10, r14, rdi, .Lxmm_setup_finished |
| LOOP_OVER_SHORTY_STORING_XMMS xmm6, r10, r14, rdi, .Lxmm_setup_finished |
| LOOP_OVER_SHORTY_STORING_XMMS xmm7, r10, r14, rdi, .Lxmm_setup_finished |
| LOOP_OVER_FPs r10, r14, rdi, r11, .Lxmm_setup_finished |
| .Lxmm_setup_finished: |
| CFI_DEFINE_DEX_PC_WITH_OFFSET(CFI_TMP, CFI_DEX, 0) |
| |
| // Set rIBASE |
| leaq artNterpAsmInstructionStart(%rip), rIBASE |
| /* start executing the instruction at rPC */ |
| START_EXECUTING_INSTRUCTIONS |
| /* NOTE: no fallthrough */ |
| // cfi info continues, and covers the whole nterp implementation. |
| END ExecuteNterpImpl |
| |
| %def opcode_pre(): |
| |
| %def helpers(): |
| |
| %def footer(): |
| /* |
| * =========================================================================== |
| * Common subroutines and data |
| * =========================================================================== |
| */ |
| |
| .text |
| .align 2 |
| |
| // Note: mterp also uses the common_* names below for helpers, but that's OK |
| // as the C compiler compiled each interpreter separately. |
| common_errDivideByZero: |
| EXPORT_PC |
| call art_quick_throw_div_zero |
| |
| // Expect array in edi, index in esi. |
| common_errArrayIndex: |
| EXPORT_PC |
| movl MIRROR_ARRAY_LENGTH_OFFSET(%edi), %eax |
| movl %esi, %edi |
| movl %eax, %esi |
| call art_quick_throw_array_bounds |
| |
| common_errNullObject: |
| EXPORT_PC |
| call art_quick_throw_null_pointer_exception |
| |
| NterpCommonInvokeStatic: |
| COMMON_INVOKE_NON_RANGE is_static=1, is_interface=0, suffix="invokeStatic" |
| |
| NterpCommonInvokeStaticRange: |
| COMMON_INVOKE_RANGE is_static=1, is_interface=0, suffix="invokeStatic" |
| |
| NterpCommonInvokeInstance: |
| COMMON_INVOKE_NON_RANGE is_static=0, is_interface=0, suffix="invokeInstance" |
| |
| NterpCommonInvokeInstanceRange: |
| COMMON_INVOKE_RANGE is_static=0, is_interface=0, suffix="invokeInstance" |
| |
| NterpCommonInvokeInterface: |
| COMMON_INVOKE_NON_RANGE is_static=0, is_interface=1, suffix="invokeInterface" |
| |
| NterpCommonInvokeInterfaceRange: |
| COMMON_INVOKE_RANGE is_static=0, is_interface=1, suffix="invokeInterface" |
| |
| NterpCommonInvokePolymorphic: |
| COMMON_INVOKE_NON_RANGE is_static=0, is_interface=0, is_string_init=0, is_polymorphic=1, suffix="invokePolymorphic" |
| |
| NterpCommonInvokePolymorphicRange: |
| COMMON_INVOKE_RANGE is_static=0, is_interface=0, is_polymorphic=1, suffix="invokePolymorphic" |
| |
| NterpCommonInvokeCustom: |
| COMMON_INVOKE_NON_RANGE is_static=1, is_interface=0, is_string_init=0, is_polymorphic=0, is_custom=1, suffix="invokeCustom" |
| |
| NterpCommonInvokeCustomRange: |
| COMMON_INVOKE_RANGE is_static=1, is_interface=0, is_polymorphic=0, is_custom=1, suffix="invokeCustom" |
| |
| NterpHandleStringInit: |
| COMMON_INVOKE_NON_RANGE is_static=0, is_interface=0, is_string_init=1, suffix="stringInit" |
| |
| NterpHandleStringInitRange: |
| COMMON_INVOKE_RANGE is_static=0, is_interface=0, is_string_init=1, suffix="stringInit" |
| |
| NterpNewInstance: |
| EXPORT_PC |
| // Fast-path which gets the class from thread-local cache. |
| FETCH_FROM_THREAD_CACHE %rdi, 2f |
| cmpq $$0, rSELF:THREAD_READ_BARRIER_MARK_REG00_OFFSET |
| jne 3f |
| 4: |
| callq *rSELF:THREAD_ALLOC_OBJECT_ENTRYPOINT_OFFSET |
| 1: |
| SET_VREG_OBJECT %eax, rINSTq # fp[A] <- value |
| ADVANCE_PC_FETCH_AND_GOTO_NEXT 2 |
| 2: |
| movq rSELF:THREAD_SELF_OFFSET, %rdi |
| movq 0(%rsp), %rsi |
| movq rPC, %rdx |
| call nterp_get_class_or_allocate_object |
| jmp 1b |
| 3: |
| // 07 is %rdi |
| call art_quick_read_barrier_mark_reg07 |
| jmp 4b |
| |
| NterpNewArray: |
| /* new-array vA, vB, class@CCCC */ |
| EXPORT_PC |
| // Fast-path which gets the class from thread-local cache. |
| FETCH_FROM_THREAD_CACHE %rdi, 2f |
| cmpq $$0, rSELF:THREAD_READ_BARRIER_MARK_REG00_OFFSET |
| jne 3f |
| 1: |
| movzbl rINSTbl,%esi |
| sarl $$4,%esi # esi<- B |
| GET_VREG %esi %rsi # esi<- vB (array length) |
| andb $$0xf,rINSTbl # rINST<- A |
| callq *rSELF:THREAD_ALLOC_ARRAY_ENTRYPOINT_OFFSET |
| SET_VREG_OBJECT %eax, rINSTq # fp[A] <- value |
| ADVANCE_PC_FETCH_AND_GOTO_NEXT 2 |
| 2: |
| movq rSELF:THREAD_SELF_OFFSET, %rdi |
| movq 0(%rsp), %rsi |
| movq rPC, %rdx |
| call nterp_get_class_or_allocate_object |
| movq %rax, %rdi |
| jmp 1b |
| 3: |
| // 07 is %rdi |
| call art_quick_read_barrier_mark_reg07 |
| jmp 1b |
| |
| NterpPutObjectInstanceField: |
| movzbq rINSTbl, %rbp # rcx <- BA |
| sarl $$4, %ebp # ebp <- B |
| GET_VREG %ebp, %rbp # vB (object we're operating on) |
| andb $$0xf, rINSTbl # rINST <- A |
| GET_VREG rINST, rINSTq # rINST <- v[A] |
| // Fast-path which gets the field from thread-local cache. |
| FETCH_FROM_THREAD_CACHE %rax, 2f |
| 1: |
| testl %ebp, %ebp # is object null? |
| je common_errNullObject |
| movl rINST, (%rbp,%rax,1) |
| testl rINST, rINST |
| je 4f |
| movq rSELF:THREAD_CARD_TABLE_OFFSET, %rax |
| shrq $$CARD_TABLE_CARD_SHIFT, %rbp |
| movb %al, (%rax, %rbp, 1) |
| 4: |
| ADVANCE_PC_FETCH_AND_GOTO_NEXT 2 |
| 2: |
| EXPORT_PC |
| movq rSELF:THREAD_SELF_OFFSET, %rdi |
| movq 0(%rsp), %rsi |
| movq rPC, %rdx |
| movq rINSTq, %rcx |
| call nterp_get_instance_field_offset |
| testl %eax, %eax |
| jns 1b |
| testl %ebp, %ebp # is object null? |
| je common_errNullObject |
| negl %eax |
| movl rINST, (%rbp,%rax,1) |
| testl rINST, rINST |
| je 5f |
| movq rSELF:THREAD_CARD_TABLE_OFFSET, %rax |
| shrq $$CARD_TABLE_CARD_SHIFT, %rbp |
| movb %al, (%rbp, %rax, 1) |
| 5: |
| lock addl $$0, (%rsp) |
| ADVANCE_PC_FETCH_AND_GOTO_NEXT 2 |
| |
| NterpGetObjectInstanceField: |
| // Fast-path which gets the field from thread-local cache. |
| FETCH_FROM_THREAD_CACHE %rax, 2f |
| 1: |
| movl rINST, %ecx # rcx <- BA |
| sarl $$4, %ecx # ecx <- B |
| GET_VREG %ecx, %rcx # vB (object we're operating on) |
| testl %ecx, %ecx # is object null? |
| je common_errNullObject |
| testb $$READ_BARRIER_TEST_VALUE, GRAY_BYTE_OFFSET(%ecx) |
| movl (%rcx,%rax,1), %eax |
| jnz 3f |
| 4: |
| andb $$0xf,rINSTbl # rINST <- A |
| SET_VREG_OBJECT %eax, rINSTq # fp[A] <- value |
| ADVANCE_PC_FETCH_AND_GOTO_NEXT 2 |
| 2: |
| EXPORT_PC |
| movq rSELF:THREAD_SELF_OFFSET, %rdi |
| movq 0(%rsp), %rsi |
| movq rPC, %rdx |
| movq $$0, %rcx |
| call nterp_get_instance_field_offset |
| testl %eax, %eax |
| jns 1b |
| // For volatile fields, we return a negative offset. Remove the sign |
| // and no need for any barrier thanks to the memory model. |
| negl %eax |
| jmp 1b |
| 3: |
| // reg00 is eax |
| call art_quick_read_barrier_mark_reg00 |
| jmp 4b |
| |
| NterpPutObjectStaticField: |
| GET_VREG %ebp, rINSTq |
| // Fast-path which gets the field from thread-local cache. |
| FETCH_FROM_THREAD_CACHE %rax, 2f |
| 1: |
| movl ART_FIELD_OFFSET_OFFSET(%rax), %edx |
| movl ART_FIELD_DECLARING_CLASS_OFFSET(%rax), %eax |
| cmpq $$0, rSELF:THREAD_READ_BARRIER_MARK_REG00_OFFSET |
| jne 3f |
| 5: |
| movl %ebp, (%eax, %edx, 1) |
| testl %ebp, %ebp |
| je 4f |
| movq rSELF:THREAD_CARD_TABLE_OFFSET, %rcx |
| shrq $$CARD_TABLE_CARD_SHIFT, %rax |
| movb %cl, (%rax, %rcx, 1) |
| 4: |
| ADVANCE_PC_FETCH_AND_GOTO_NEXT 2 |
| 2: |
| EXPORT_PC |
| movq rSELF:THREAD_SELF_OFFSET, %rdi |
| movq 0(%rsp), %rsi |
| movq rPC, %rdx |
| movq %rbp, %rcx |
| call nterp_get_static_field |
| testq MACRO_LITERAL(1), %rax |
| je 1b |
| CLEAR_VOLATILE_MARKER %rax |
| movl ART_FIELD_OFFSET_OFFSET(%rax), %edx |
| movl ART_FIELD_DECLARING_CLASS_OFFSET(%rax), %eax |
| cmpq $$0, rSELF:THREAD_READ_BARRIER_MARK_REG00_OFFSET |
| jne 7f |
| 6: |
| movl %ebp, (%eax, %edx, 1) |
| testl %ebp, %ebp |
| je 8f |
| movq rSELF:THREAD_CARD_TABLE_OFFSET, %rcx |
| shrq $$CARD_TABLE_CARD_SHIFT, %rax |
| movb %cl, (%rax, %rcx, 1) |
| 8: |
| lock addl $$0, (%rsp) |
| ADVANCE_PC_FETCH_AND_GOTO_NEXT 2 |
| 3: |
| call art_quick_read_barrier_mark_reg00 |
| jmp 5b |
| 7: |
| call art_quick_read_barrier_mark_reg00 |
| jmp 6b |
| |
| NterpGetObjectStaticField: |
| // Fast-path which gets the field from thread-local cache. |
| FETCH_FROM_THREAD_CACHE %rax, 2f |
| 1: |
| movl ART_FIELD_OFFSET_OFFSET(%rax), %edx |
| movl ART_FIELD_DECLARING_CLASS_OFFSET(%rax), %eax |
| cmpq $$0, rSELF:THREAD_READ_BARRIER_MARK_REG00_OFFSET |
| jne 5f |
| 6: |
| testb $$READ_BARRIER_TEST_VALUE, GRAY_BYTE_OFFSET(%eax) |
| movl (%eax, %edx, 1), %eax |
| jnz 3f |
| 4: |
| SET_VREG_OBJECT %eax, rINSTq # fp[A] <- value |
| ADVANCE_PC_FETCH_AND_GOTO_NEXT 2 |
| 2: |
| EXPORT_PC |
| movq rSELF:THREAD_SELF_OFFSET, %rdi |
| movq 0(%rsp), %rsi |
| movq rPC, %rdx |
| movq $$0, %rcx |
| call nterp_get_static_field |
| andq $$-2, %rax |
| jmp 1b |
| 3: |
| call art_quick_read_barrier_mark_reg00 |
| jmp 4b |
| 5: |
| call art_quick_read_barrier_mark_reg00 |
| jmp 6b |
| |
| NterpGetBooleanStaticField: |
| OP_SGET load="movsbl", wide=0 |
| |
| NterpGetByteStaticField: |
| OP_SGET load="movsbl", wide=0 |
| |
| NterpGetCharStaticField: |
| OP_SGET load="movzwl", wide=0 |
| |
| NterpGetShortStaticField: |
| OP_SGET load="movswl", wide=0 |
| |
| NterpGetWideStaticField: |
| OP_SGET load="movq", wide=1 |
| |
| NterpGetIntStaticField: |
| OP_SGET load="movl", wide=0 |
| |
| NterpPutStaticField: |
| OP_SPUT rINST_reg=rINST, store="movl", wide=0 |
| |
| NterpPutBooleanStaticField: |
| NterpPutByteStaticField: |
| OP_SPUT rINST_reg=rINSTbl, store="movb", wide=0 |
| |
| NterpPutCharStaticField: |
| NterpPutShortStaticField: |
| OP_SPUT rINST_reg=rINSTw, store="movw", wide=0 |
| |
| NterpPutWideStaticField: |
| OP_SPUT rINST_reg=rINSTq, store="movq", wide=1 |
| |
| NterpPutInstanceField: |
| OP_IPUT rINST_reg=rINST, store="movl", wide=0 |
| |
| NterpPutBooleanInstanceField: |
| NterpPutByteInstanceField: |
| OP_IPUT rINST_reg=rINSTbl, store="movb", wide=0 |
| |
| NterpPutCharInstanceField: |
| NterpPutShortInstanceField: |
| OP_IPUT rINST_reg=rINSTw, store="movw", wide=0 |
| |
| NterpPutWideInstanceField: |
| OP_IPUT rINST_reg=rINSTq, store="movq", wide=1 |
| |
| NterpGetBooleanInstanceField: |
| OP_IGET load="movzbl", wide=0 |
| |
| NterpGetByteInstanceField: |
| OP_IGET load="movsbl", wide=0 |
| |
| NterpGetCharInstanceField: |
| OP_IGET load="movzwl", wide=0 |
| |
| NterpGetShortInstanceField: |
| OP_IGET load="movswl", wide=0 |
| |
| NterpGetWideInstanceField: |
| OP_IGET load="movq", wide=1 |
| |
| NterpGetInstanceField: |
| OP_IGET load="movl", wide=0 |
| |
| NterpInstanceOf: |
| /* instance-of vA, vB, class@CCCC */ |
| // Fast-path which gets the class from thread-local cache. |
| EXPORT_PC |
| FETCH_FROM_THREAD_CACHE %rsi, 2f |
| cmpq $$0, rSELF:THREAD_READ_BARRIER_MARK_REG00_OFFSET |
| jne 5f |
| 1: |
| movzbl rINSTbl,%edi |
| sarl $$4,%edi # edi<- B |
| GET_VREG %edi %rdi # edi<- vB (object) |
| andb $$0xf,rINSTbl # rINST<- A |
| testl %edi, %edi |
| je 3f |
| call art_quick_instance_of |
| SET_VREG %eax, rINSTq # fp[A] <- value |
| 4: |
| ADVANCE_PC_FETCH_AND_GOTO_NEXT 2 |
| 3: |
| SET_VREG %edi, rINSTq # fp[A] <-0 |
| jmp 4b |
| 2: |
| movq rSELF:THREAD_SELF_OFFSET, %rdi |
| movq 0(%rsp), %rsi |
| movq rPC, %rdx |
| call nterp_get_class_or_allocate_object |
| movq %rax, %rsi |
| jmp 1b |
| 5: |
| // 06 is %rsi |
| call art_quick_read_barrier_mark_reg06 |
| jmp 1b |
| |
| NterpCheckCast: |
| // Fast-path which gets the class from thread-local cache. |
| EXPORT_PC |
| FETCH_FROM_THREAD_CACHE %rsi, 3f |
| cmpq $$0, rSELF:THREAD_READ_BARRIER_MARK_REG00_OFFSET |
| jne 4f |
| 1: |
| GET_VREG %edi, rINSTq |
| testl %edi, %edi |
| je 2f |
| call art_quick_check_instance_of |
| 2: |
| ADVANCE_PC_FETCH_AND_GOTO_NEXT 2 |
| 3: |
| movq rSELF:THREAD_SELF_OFFSET, %rdi |
| movq 0(%rsp), %rsi |
| movq rPC, %rdx |
| call nterp_get_class_or_allocate_object |
| movq %rax, %rsi |
| jmp 1b |
| 4: |
| // 06 is %rsi |
| call art_quick_read_barrier_mark_reg06 |
| jmp 1b |
| |
| NterpHandleHotnessOverflow: |
| leaq (rPC, rINSTq, 2), %rsi |
| movq rFP, %rdx |
| call nterp_hot_method |
| testq %rax, %rax |
| jne 1f |
| leaq (rPC, rINSTq, 2), rPC |
| FETCH_INST |
| GOTO_NEXT |
| 1: |
| // Drop the current frame. |
| movq -8(rREFS), %rsp |
| CFI_DEF_CFA(rsp, CALLEE_SAVES_SIZE) |
| |
| // Setup the new frame |
| movq OSR_DATA_FRAME_SIZE(%rax), %rcx |
| // Given stack size contains all callee saved registers, remove them. |
| subq $$CALLEE_SAVES_SIZE, %rcx |
| |
| // Remember CFA. |
| movq %rsp, %rbp |
| CFI_DEF_CFA_REGISTER(rbp) |
| |
| subq %rcx, %rsp |
| movq %rsp, %rdi // rdi := beginning of stack |
| leaq OSR_DATA_MEMORY(%rax), %rsi // rsi := memory to copy |
| rep movsb // while (rcx--) { *rdi++ = *rsi++ } |
| |
| // Fetch the native PC to jump to and save it in a callee-save register. |
| movq OSR_DATA_NATIVE_PC(%rax), %rbx |
| |
| // Free the memory holding OSR Data. |
| movq %rax, %rdi |
| call free |
| |
| // Jump to the compiled code. |
| jmp *%rbx |
| |
| NterpHandleInvokeInterfaceOnObjectMethodRange: |
| shrl $$16, %eax |
| movq MIRROR_CLASS_VTABLE_OFFSET_64(%edx, %eax, 8), %rdi |
| jmp NterpCommonInvokeInstanceRange |
| |
| NterpHandleInvokeInterfaceOnObjectMethod: |
| shrl $$16, %eax |
| movq MIRROR_CLASS_VTABLE_OFFSET_64(%edx, %eax, 8), %rdi |
| jmp NterpCommonInvokeInstance |
| |
| // This is the logical end of ExecuteNterpImpl, where the frame info applies. |
| // EndExecuteNterpImpl includes the methods below as we want the runtime to |
| // see them as part of the Nterp PCs. |
| .cfi_endproc |
| |
| nterp_to_nterp_static_non_range: |
| .cfi_startproc |
| .cfi_def_cfa rsp, 8 |
| SETUP_STACK_FOR_INVOKE |
| SETUP_NON_RANGE_ARGUMENTS_AND_EXECUTE is_static=1, is_string_init=0 |
| .cfi_endproc |
| |
| nterp_to_nterp_string_init_non_range: |
| .cfi_startproc |
| .cfi_def_cfa rsp, 8 |
| SETUP_STACK_FOR_INVOKE |
| SETUP_NON_RANGE_ARGUMENTS_AND_EXECUTE is_static=0, is_string_init=1 |
| .cfi_endproc |
| |
| nterp_to_nterp_instance_non_range: |
| .cfi_startproc |
| .cfi_def_cfa rsp, 8 |
| SETUP_STACK_FOR_INVOKE |
| SETUP_NON_RANGE_ARGUMENTS_AND_EXECUTE is_static=0, is_string_init=0 |
| .cfi_endproc |
| |
| nterp_to_nterp_static_range: |
| .cfi_startproc |
| .cfi_def_cfa rsp, 8 |
| SETUP_STACK_FOR_INVOKE |
| SETUP_RANGE_ARGUMENTS_AND_EXECUTE is_static=1 |
| .cfi_endproc |
| |
| nterp_to_nterp_instance_range: |
| .cfi_startproc |
| .cfi_def_cfa rsp, 8 |
| SETUP_STACK_FOR_INVOKE |
| SETUP_RANGE_ARGUMENTS_AND_EXECUTE is_static=0 |
| .cfi_endproc |
| |
| nterp_to_nterp_string_init_range: |
| .cfi_startproc |
| .cfi_def_cfa rsp, 8 |
| SETUP_STACK_FOR_INVOKE |
| SETUP_RANGE_ARGUMENTS_AND_EXECUTE is_static=0, is_string_init=1 |
| .cfi_endproc |
| |
| // This is the end of PCs contained by the OatQuickMethodHeader created for the interpreter |
| // entry point. |
| FUNCTION_TYPE(EndExecuteNterpImpl) |
| ASM_HIDDEN SYMBOL(EndExecuteNterpImpl) |
| .global SYMBOL(EndExecuteNterpImpl) |
| SYMBOL(EndExecuteNterpImpl): |
| |
| // Entrypoints into runtime. |
| NTERP_TRAMPOLINE nterp_get_static_field, NterpGetStaticField |
| NTERP_TRAMPOLINE nterp_get_instance_field_offset, NterpGetInstanceFieldOffset |
| NTERP_TRAMPOLINE nterp_filled_new_array, NterpFilledNewArray |
| NTERP_TRAMPOLINE nterp_filled_new_array_range, NterpFilledNewArrayRange |
| NTERP_TRAMPOLINE nterp_get_class_or_allocate_object, NterpGetClassOrAllocateObject |
| NTERP_TRAMPOLINE nterp_get_method, NterpGetMethod |
| NTERP_TRAMPOLINE nterp_hot_method, NterpHotMethod |
| NTERP_TRAMPOLINE nterp_load_object, NterpLoadObject |
| |
| // gen_mterp.py will inline the following definitions |
| // within [ExecuteNterpImpl, EndExecuteNterpImpl). |
| %def instruction_end(): |
| |
| FUNCTION_TYPE(artNterpAsmInstructionEnd) |
| ASM_HIDDEN SYMBOL(artNterpAsmInstructionEnd) |
| .global SYMBOL(artNterpAsmInstructionEnd) |
| SYMBOL(artNterpAsmInstructionEnd): |
| // artNterpAsmInstructionEnd is used as landing pad for exception handling. |
| FETCH_INST |
| GOTO_NEXT |
| |
| %def instruction_start(): |
| |
| FUNCTION_TYPE(artNterpAsmInstructionStart) |
| ASM_HIDDEN SYMBOL(artNterpAsmInstructionStart) |
| .global SYMBOL(artNterpAsmInstructionStart) |
| SYMBOL(artNterpAsmInstructionStart) = .L_op_nop |
| .text |
| |
| %def default_helper_prefix(): |
| % return "nterp_" |
| |
| %def opcode_start(): |
| ENTRY nterp_${opcode} |
| %def opcode_end(): |
| END nterp_${opcode} |
| %def helper_start(name): |
| ENTRY ${name} |
| %def helper_end(name): |
| END ${name} |