ARM64: Unify constant register handling in interpreter.

Plus minor optimizations. Simplifications for out-of-tree ARM64EC.
Thanks to Peter Cawley. #1096
This commit is contained in:
Mike Pall 2023-10-08 21:39:40 +02:00
parent 9cc8bbb7ae
commit c5b075eb31

View File

@ -291,8 +291,17 @@
| blo target | blo target
|.endmacro |.endmacro
| |
|.macro init_constants
| movn TISNIL, #0
| movz TISNUM, #(LJ_TISNUM>>1)&0xffff, lsl #48
| movz TISNUMhi, #(LJ_TISNUM>>1)&0xffff, lsl #16
|.endmacro
|
|.macro mov_false, reg; movn reg, #0x8000, lsl #32; .endmacro |.macro mov_false, reg; movn reg, #0x8000, lsl #32; .endmacro
|.macro mov_true, reg; movn reg, #0x0001, lsl #48; .endmacro |.macro mov_true, reg; movn reg, #0x0001, lsl #48; .endmacro
|.macro mov_nil, reg; mov reg, TISNIL; .endmacro
|.macro cmp_nil, reg; cmp reg, TISNIL; .endmacro
|.macro add_TISNUM, dst, src; add dst, src, TISNUM; .endmacro
| |
#define GL_J(field) (GG_G2J + (int)offsetof(jit_State, field)) #define GL_J(field) (GG_G2J + (int)offsetof(jit_State, field))
| |
@ -445,9 +454,7 @@ static void build_subroutines(BuildCtx *ctx)
| add fp, CARG1, # SAVE_FP_LR_ | add fp, CARG1, # SAVE_FP_LR_
| mov sp, CARG1 | mov sp, CARG1
| ldr L, SAVE_L | ldr L, SAVE_L
| movz TISNUM, #(LJ_TISNUM>>1)&0xffff, lsl #48 | init_constants
| movz TISNUMhi, #(LJ_TISNUM>>1)&0xffff, lsl #16
| movn TISNIL, #0
| ldr GL, L->glref // Setup pointer to global state. | ldr GL, L->glref // Setup pointer to global state.
|->vm_unwind_ff_eh: // Landing pad for external unwinder. |->vm_unwind_ff_eh: // Landing pad for external unwinder.
| mov RC, #16 // 2 results: false + error message. | mov RC, #16 // 2 results: false + error message.
@ -512,11 +519,9 @@ static void build_subroutines(BuildCtx *ctx)
| str L, GL->cur_L | str L, GL->cur_L
| mov RA, BASE | mov RA, BASE
| ldp BASE, CARG1, L->base | ldp BASE, CARG1, L->base
| movz TISNUM, #(LJ_TISNUM>>1)&0xffff, lsl #48 | init_constants
| movz TISNUMhi, #(LJ_TISNUM>>1)&0xffff, lsl #16
| ldr PC, [BASE, FRAME_PC] | ldr PC, [BASE, FRAME_PC]
| strb wzr, L->status | strb wzr, L->status
| movn TISNIL, #0
| sub RC, CARG1, BASE | sub RC, CARG1, BASE
| ands CARG1, PC, #FRAME_TYPE | ands CARG1, PC, #FRAME_TYPE
| add RC, RC, #8 | add RC, RC, #8
@ -552,10 +557,8 @@ static void build_subroutines(BuildCtx *ctx)
|3: // Entry point for vm_cpcall/vm_resume (BASE = base, PC = ftype). |3: // Entry point for vm_cpcall/vm_resume (BASE = base, PC = ftype).
| str L, GL->cur_L | str L, GL->cur_L
| ldp RB, CARG1, L->base // RB = old base (for vmeta_call). | ldp RB, CARG1, L->base // RB = old base (for vmeta_call).
| movz TISNUM, #(LJ_TISNUM>>1)&0xffff, lsl #48
| movz TISNUMhi, #(LJ_TISNUM>>1)&0xffff, lsl #16
| add PC, PC, BASE | add PC, PC, BASE
| movn TISNIL, #0 | init_constants
| sub PC, PC, RB // PC = frame delta + frame type | sub PC, PC, RB // PC = frame delta + frame type
| sub NARGS8:RC, CARG1, BASE | sub NARGS8:RC, CARG1, BASE
| st_vmstate ST_INTERP | st_vmstate ST_INTERP
@ -664,7 +667,7 @@ static void build_subroutines(BuildCtx *ctx)
| b >1 | b >1
| |
|->vmeta_tgetb: // RB = table, RC = index |->vmeta_tgetb: // RB = table, RC = index
| add RC, RC, TISNUM | add_TISNUM RC, RC
| add CARG2, BASE, RB, lsl #3 | add CARG2, BASE, RB, lsl #3
| add CARG3, sp, TMPDofs | add CARG3, sp, TMPDofs
| str RC, TMPD | str RC, TMPD
@ -699,7 +702,7 @@ static void build_subroutines(BuildCtx *ctx)
| sxtw CARG2, TMP1w | sxtw CARG2, TMP1w
| bl extern lj_tab_getinth // (GCtab *t, int32_t key) | bl extern lj_tab_getinth // (GCtab *t, int32_t key)
| // Returns cTValue * or NULL. | // Returns cTValue * or NULL.
| mov TMP0, TISNIL | mov_nil TMP0
| cbz CRET1, ->BC_TGETR_Z | cbz CRET1, ->BC_TGETR_Z
| ldr TMP0, [CRET1] | ldr TMP0, [CRET1]
| b ->BC_TGETR_Z | b ->BC_TGETR_Z
@ -722,7 +725,7 @@ static void build_subroutines(BuildCtx *ctx)
| b >1 | b >1
| |
|->vmeta_tsetb: // RB = table, RC = index |->vmeta_tsetb: // RB = table, RC = index
| add RC, RC, TISNUM | add_TISNUM RC, RC
| add CARG2, BASE, RB, lsl #3 | add CARG2, BASE, RB, lsl #3
| add CARG3, sp, TMPDofs | add CARG3, sp, TMPDofs
| str RC, TMPD | str RC, TMPD
@ -1036,7 +1039,7 @@ static void build_subroutines(BuildCtx *ctx)
|1: // Field metatable must be at same offset for GCtab and GCudata! |1: // Field metatable must be at same offset for GCtab and GCudata!
| ldr TAB:RB, TAB:CARG1->metatable | ldr TAB:RB, TAB:CARG1->metatable
|2: |2:
| mov CARG1, TISNIL | mov_nil CARG1
| ldr STR:RC, GL->gcroot[GCROOT_MMNAME+MM_metatable] | ldr STR:RC, GL->gcroot[GCROOT_MMNAME+MM_metatable]
| cbz TAB:RB, ->fff_restv | cbz TAB:RB, ->fff_restv
| ldr TMP1w, TAB:RB->hmask | ldr TMP1w, TAB:RB->hmask
@ -1058,7 +1061,7 @@ static void build_subroutines(BuildCtx *ctx)
| movk CARG1, #(LJ_TTAB>>1)&0xffff, lsl #48 | movk CARG1, #(LJ_TTAB>>1)&0xffff, lsl #48
| b ->fff_restv | b ->fff_restv
|5: |5:
| cmp TMP0, TISNIL | cmp_nil TMP0
| bne ->fff_restv | bne ->fff_restv
| b <4 | b <4
| |
@ -1158,8 +1161,8 @@ static void build_subroutines(BuildCtx *ctx)
| cbnz TAB:CARG2, ->fff_fallback | cbnz TAB:CARG2, ->fff_fallback
#endif #endif
| mov RC, #(3+1)*8 | mov RC, #(3+1)*8
| stp CARG1, TISNIL, [BASE, #-8] | stp CFUNC:CARG4, CARG1, [BASE, #-16]
| str CFUNC:CARG4, [BASE, #-16] | str TISNIL, [BASE]
| b ->fff_res | b ->fff_res
| |
|.ffunc_2 ipairs_aux |.ffunc_2 ipairs_aux
@ -1171,14 +1174,14 @@ static void build_subroutines(BuildCtx *ctx)
| add CARG2w, CARG2w, #1 | add CARG2w, CARG2w, #1
| cmp CARG2w, TMP1w | cmp CARG2w, TMP1w
| ldr PC, [BASE, FRAME_PC] | ldr PC, [BASE, FRAME_PC]
| add TMP2, CARG2, TISNUM | add_TISNUM TMP2, CARG2
| mov RC, #(0+1)*8 | mov RC, #(0+1)*8
| str TMP2, [BASE, #-16] | str TMP2, [BASE, #-16]
| bhs >2 // Not in array part? | bhs >2 // Not in array part?
| ldr TMP0, [CARG3, CARG2, lsl #3] | ldr TMP0, [CARG3, CARG2, lsl #3]
|1: |1:
| mov TMP1, #(2+1)*8 | mov TMP1, #(2+1)*8
| cmp TMP0, TISNIL | cmp_nil TMP0
| str TMP0, [BASE, #-8] | str TMP0, [BASE, #-8]
| csel RC, RC, TMP1, eq | csel RC, RC, TMP1, eq
| b ->fff_res | b ->fff_res
@ -1201,8 +1204,8 @@ static void build_subroutines(BuildCtx *ctx)
| cbnz TAB:CARG2, ->fff_fallback | cbnz TAB:CARG2, ->fff_fallback
#endif #endif
| mov RC, #(3+1)*8 | mov RC, #(3+1)*8
| stp CARG1, TISNUM, [BASE, #-8] | stp CFUNC:CARG4, CARG1, [BASE, #-16]
| str CFUNC:CARG4, [BASE, #-16] | str TISNUM, [BASE]
| b ->fff_res | b ->fff_res
| |
|//-- Base library: catch errors ---------------------------------------- |//-- Base library: catch errors ----------------------------------------
@ -1392,7 +1395,7 @@ static void build_subroutines(BuildCtx *ctx)
| eor CARG2w, CARG1w, CARG1w, asr #31 | eor CARG2w, CARG1w, CARG1w, asr #31
| movz CARG3, #0x41e0, lsl #48 // 2^31. | movz CARG3, #0x41e0, lsl #48 // 2^31.
| subs CARG1w, CARG2w, CARG1w, asr #31 | subs CARG1w, CARG2w, CARG1w, asr #31
| add CARG1, CARG1, TISNUM | add_TISNUM CARG1, CARG1
| csel CARG1, CARG1, CARG3, pl | csel CARG1, CARG1, CARG3, pl
| // Fallthrough. | // Fallthrough.
| |
@ -1483,7 +1486,7 @@ static void build_subroutines(BuildCtx *ctx)
| ldr PC, [BASE, FRAME_PC] | ldr PC, [BASE, FRAME_PC]
| str d0, [BASE, #-16] | str d0, [BASE, #-16]
| mov RC, #(2+1)*8 | mov RC, #(2+1)*8
| add CARG2, CARG2, TISNUM | add_TISNUM CARG2, CARG2
| str CARG2, [BASE, #-8] | str CARG2, [BASE, #-8]
| b ->fff_res | b ->fff_res
| |
@ -1549,7 +1552,7 @@ static void build_subroutines(BuildCtx *ctx)
| bne ->fff_fallback | bne ->fff_fallback
| ldrb TMP0w, STR:CARG1[1] // Access is always ok (NUL at end). | ldrb TMP0w, STR:CARG1[1] // Access is always ok (NUL at end).
| ldr CARG3w, STR:CARG1->len | ldr CARG3w, STR:CARG1->len
| add TMP0, TMP0, TISNUM | add_TISNUM TMP0, TMP0
| str TMP0, [BASE, #-16] | str TMP0, [BASE, #-16]
| mov RC, #(0+1)*8 | mov RC, #(0+1)*8
| cbz CARG3, ->fff_res | cbz CARG3, ->fff_res
@ -1695,17 +1698,17 @@ static void build_subroutines(BuildCtx *ctx)
|.ffunc_bit tobit |.ffunc_bit tobit
| mov TMP0w, CARG1w | mov TMP0w, CARG1w
|9: // Label reused by .ffunc_bit_op users. |9: // Label reused by .ffunc_bit_op users.
| add CARG1, TMP0, TISNUM | add_TISNUM CARG1, TMP0
| b ->fff_restv | b ->fff_restv
| |
|.ffunc_bit bswap |.ffunc_bit bswap
| rev TMP0w, CARG1w | rev TMP0w, CARG1w
| add CARG1, TMP0, TISNUM | add_TISNUM CARG1, TMP0
| b ->fff_restv | b ->fff_restv
| |
|.ffunc_bit bnot |.ffunc_bit bnot
| mvn TMP0w, CARG1w | mvn TMP0w, CARG1w
| add CARG1, TMP0, TISNUM | add_TISNUM CARG1, TMP0
| b ->fff_restv | b ->fff_restv
| |
|.macro .ffunc_bit_sh, name, ins, shmod |.macro .ffunc_bit_sh, name, ins, shmod
@ -1726,7 +1729,7 @@ static void build_subroutines(BuildCtx *ctx)
| checkint CARG1, ->vm_tobit_fb | checkint CARG1, ->vm_tobit_fb
|2: |2:
| ins TMP0w, CARG1w, TMP1w | ins TMP0w, CARG1w, TMP1w
| add CARG1, TMP0, TISNUM | add_TISNUM CARG1, TMP0
| b ->fff_restv | b ->fff_restv
|.endmacro |.endmacro
| |
@ -1915,8 +1918,7 @@ static void build_subroutines(BuildCtx *ctx)
| and CARG3, CARG3, #LJ_GCVMASK | and CARG3, CARG3, #LJ_GCVMASK
| beq >2 | beq >2
|1: // Move results down. |1: // Move results down.
| ldr CARG1, [RA] | ldr CARG1, [RA], #8
| add RA, RA, #8
| subs RB, RB, #8 | subs RB, RB, #8
| str CARG1, [BASE, RC, lsl #3] | str CARG1, [BASE, RC, lsl #3]
| add RC, RC, #1 | add RC, RC, #1
@ -2031,9 +2033,7 @@ static void build_subroutines(BuildCtx *ctx)
|.if JIT |.if JIT
| ldr L, SAVE_L | ldr L, SAVE_L
|1: |1:
| movz TISNUM, #(LJ_TISNUM>>1)&0xffff, lsl #48 | init_constants
| movz TISNUMhi, #(LJ_TISNUM>>1)&0xffff, lsl #16
| movn TISNIL, #0
| cmn CARG1w, #LUA_ERRERR | cmn CARG1w, #LUA_ERRERR
| bhs >9 // Check for error from exit. | bhs >9 // Check for error from exit.
| ldr LFUNC:CARG2, [BASE, FRAME_FUNC] | ldr LFUNC:CARG2, [BASE, FRAME_FUNC]
@ -2212,9 +2212,7 @@ static void build_subroutines(BuildCtx *ctx)
| bl extern lj_ccallback_enter // (CTState *cts, void *cf) | bl extern lj_ccallback_enter // (CTState *cts, void *cf)
| // Returns lua_State *. | // Returns lua_State *.
| ldp BASE, RC, L:CRET1->base | ldp BASE, RC, L:CRET1->base
| movz TISNUM, #(LJ_TISNUM>>1)&0xffff, lsl #48 | init_constants
| movz TISNUMhi, #(LJ_TISNUM>>1)&0xffff, lsl #16
| movn TISNIL, #0
| mov L, CRET1 | mov L, CRET1
| ldr LFUNC:CARG3, [BASE, FRAME_FUNC] | ldr LFUNC:CARG3, [BASE, FRAME_FUNC]
| sub RC, RC, BASE | sub RC, RC, BASE
@ -2593,7 +2591,7 @@ static void build_ins(BuildCtx *ctx, BCOp op, int defop)
| bne >5 | bne >5
| negs TMP0w, TMP0w | negs TMP0w, TMP0w
| movz CARG3, #0x41e0, lsl #48 // 2^31. | movz CARG3, #0x41e0, lsl #48 // 2^31.
| add TMP0, TMP0, TISNUM | add_TISNUM TMP0, TMP0
| csel TMP0, TMP0, CARG3, vc | csel TMP0, TMP0, CARG3, vc
|5: |5:
| str TMP0, [BASE, RA, lsl #3] | str TMP0, [BASE, RA, lsl #3]
@ -2608,7 +2606,7 @@ static void build_ins(BuildCtx *ctx, BCOp op, int defop)
| bne >2 | bne >2
| ldr CARG1w, STR:CARG1->len | ldr CARG1w, STR:CARG1->len
|1: |1:
| add CARG1, CARG1, TISNUM | add_TISNUM CARG1, CARG1
| str CARG1, [BASE, RA, lsl #3] | str CARG1, [BASE, RA, lsl #3]
| ins_next | ins_next
| |
@ -2716,7 +2714,7 @@ static void build_ins(BuildCtx *ctx, BCOp op, int defop)
| intins CARG1w, CARG1w, CARG2w | intins CARG1w, CARG1w, CARG2w
| ins_arithfallback bvs | ins_arithfallback bvs
|.endif |.endif
| add CARG1, CARG1, TISNUM | add_TISNUM CARG1, CARG1
| str CARG1, [BASE, RA, lsl #3] | str CARG1, [BASE, RA, lsl #3]
|4: |4:
| ins_next | ins_next
@ -2809,7 +2807,7 @@ static void build_ins(BuildCtx *ctx, BCOp op, int defop)
case BC_KSHORT: case BC_KSHORT:
| // RA = dst, RC = int16_literal | // RA = dst, RC = int16_literal
| sxth RCw, RCw | sxth RCw, RCw
| add TMP0, RC, TISNUM | add_TISNUM TMP0, RC
| str TMP0, [BASE, RA, lsl #3] | str TMP0, [BASE, RA, lsl #3]
| ins_next | ins_next
break; break;
@ -3032,7 +3030,7 @@ static void build_ins(BuildCtx *ctx, BCOp op, int defop)
| cmp TMP1w, CARG1w // In array part? | cmp TMP1w, CARG1w // In array part?
| bhs ->vmeta_tgetv | bhs ->vmeta_tgetv
| ldr TMP0, [CARG3] | ldr TMP0, [CARG3]
| cmp TMP0, TISNIL | cmp_nil TMP0
| beq >5 | beq >5
|1: |1:
| str TMP0, [BASE, RA, lsl #3] | str TMP0, [BASE, RA, lsl #3]
@ -3075,7 +3073,7 @@ static void build_ins(BuildCtx *ctx, BCOp op, int defop)
| ldr NODE:CARG3, NODE:CARG3->next | ldr NODE:CARG3, NODE:CARG3->next
| cmp CARG1, CARG4 | cmp CARG1, CARG4
| bne >4 | bne >4
| cmp TMP0, TISNIL | cmp_nil TMP0
| beq >5 | beq >5
|3: |3:
| str TMP0, [BASE, RA, lsl #3] | str TMP0, [BASE, RA, lsl #3]
@ -3084,7 +3082,7 @@ static void build_ins(BuildCtx *ctx, BCOp op, int defop)
|4: // Follow hash chain. |4: // Follow hash chain.
| cbnz NODE:CARG3, <1 | cbnz NODE:CARG3, <1
| // End of hash chain: key not found, nil result. | // End of hash chain: key not found, nil result.
| mov TMP0, TISNIL | mov_nil TMP0
| |
|5: // Check for __index if table value is nil. |5: // Check for __index if table value is nil.
| ldr TAB:CARG1, TAB:CARG2->metatable | ldr TAB:CARG1, TAB:CARG2->metatable
@ -3105,7 +3103,7 @@ static void build_ins(BuildCtx *ctx, BCOp op, int defop)
| cmp RCw, CARG1w // In array part? | cmp RCw, CARG1w // In array part?
| bhs ->vmeta_tgetb | bhs ->vmeta_tgetb
| ldr TMP0, [CARG3] | ldr TMP0, [CARG3]
| cmp TMP0, TISNIL | cmp_nil TMP0
| beq >5 | beq >5
|1: |1:
| str TMP0, [BASE, RA, lsl #3] | str TMP0, [BASE, RA, lsl #3]
@ -3152,7 +3150,7 @@ static void build_ins(BuildCtx *ctx, BCOp op, int defop)
| ldr TMP1, [CARG3] | ldr TMP1, [CARG3]
| ldr TMP0, [BASE, RA, lsl #3] | ldr TMP0, [BASE, RA, lsl #3]
| ldrb TMP2w, TAB:CARG2->marked | ldrb TMP2w, TAB:CARG2->marked
| cmp TMP1, TISNIL // Previous value is nil? | cmp_nil TMP1 // Previous value is nil?
| beq >5 | beq >5
|1: |1:
| str TMP0, [CARG3] | str TMP0, [CARG3]
@ -3204,7 +3202,7 @@ static void build_ins(BuildCtx *ctx, BCOp op, int defop)
| cmp CARG1, CARG4 | cmp CARG1, CARG4
| bne >5 | bne >5
| ldr TMP0, [BASE, RA, lsl #3] | ldr TMP0, [BASE, RA, lsl #3]
| cmp TMP1, TISNIL // Previous value is nil? | cmp_nil TMP1 // Previous value is nil?
| beq >4 | beq >4
|2: |2:
| str TMP0, NODE:CARG3->val | str TMP0, NODE:CARG3->val
@ -3263,7 +3261,7 @@ static void build_ins(BuildCtx *ctx, BCOp op, int defop)
| ldr TMP1, [CARG3] | ldr TMP1, [CARG3]
| ldr TMP0, [BASE, RA, lsl #3] | ldr TMP0, [BASE, RA, lsl #3]
| ldrb TMP2w, TAB:CARG2->marked | ldrb TMP2w, TAB:CARG2->marked
| cmp TMP1, TISNIL // Previous value is nil? | cmp_nil TMP1 // Previous value is nil?
| beq >5 | beq >5
|1: |1:
| str TMP0, [CARG3] | str TMP0, [CARG3]
@ -3362,9 +3360,8 @@ static void build_ins(BuildCtx *ctx, BCOp op, int defop)
|->BC_CALL_Z: |->BC_CALL_Z:
| mov RB, BASE // Save old BASE for vmeta_call. | mov RB, BASE // Save old BASE for vmeta_call.
| add BASE, BASE, RA, lsl #3 | add BASE, BASE, RA, lsl #3
| ldr CARG3, [BASE] | ldr CARG3, [BASE], #16
| sub NARGS8:RC, NARGS8:RC, #8 | sub NARGS8:RC, NARGS8:RC, #8
| add BASE, BASE, #16
| checkfunc CARG3, ->vmeta_call | checkfunc CARG3, ->vmeta_call
| ins_call | ins_call
break; break;
@ -3380,9 +3377,8 @@ static void build_ins(BuildCtx *ctx, BCOp op, int defop)
| // RA = base, (RB = 0,) RC = (nargs+1)*8 | // RA = base, (RB = 0,) RC = (nargs+1)*8
|->BC_CALLT1_Z: |->BC_CALLT1_Z:
| add RA, BASE, RA, lsl #3 | add RA, BASE, RA, lsl #3
| ldr TMP1, [RA] | ldr TMP1, [RA], #16
| sub NARGS8:RC, NARGS8:RC, #8 | sub NARGS8:RC, NARGS8:RC, #8
| add RA, RA, #16
| checktp CARG3, TMP1, LJ_TFUNC, ->vmeta_callt | checktp CARG3, TMP1, LJ_TFUNC, ->vmeta_callt
| ldr PC, [BASE, FRAME_PC] | ldr PC, [BASE, FRAME_PC]
|->BC_CALLT2_Z: |->BC_CALLT2_Z:
@ -3462,10 +3458,10 @@ static void build_ins(BuildCtx *ctx, BCOp op, int defop)
| add CARG3, CARG2, CARG1, lsl #3 | add CARG3, CARG2, CARG1, lsl #3
| bhs >5 // Index points after array part? | bhs >5 // Index points after array part?
| ldr TMP0, [CARG3] | ldr TMP0, [CARG3]
| cmp TMP0, TISNIL | cmp_nil TMP0
| cinc CARG1, CARG1, eq // Skip holes in array part. | cinc CARG1, CARG1, eq // Skip holes in array part.
| beq <1 | beq <1
| add CARG1, CARG1, TISNUM | add_TISNUM CARG1, CARG1
| stp CARG1, TMP0, [RA] | stp CARG1, TMP0, [RA]
| add CARG1, CARG1, #1 | add CARG1, CARG1, #1
|3: |3:
@ -3483,7 +3479,7 @@ static void build_ins(BuildCtx *ctx, BCOp op, int defop)
| add NODE:CARG3, NODE:RB, CARG1, lsl #3 // node = tab->node + idx*3*8 | add NODE:CARG3, NODE:RB, CARG1, lsl #3 // node = tab->node + idx*3*8
| bhi <4 | bhi <4
| ldp TMP0, CARG1, NODE:CARG3->val | ldp TMP0, CARG1, NODE:CARG3->val
| cmp TMP0, TISNIL | cmp_nil TMP0
| add RC, RC, #1 | add RC, RC, #1
| beq <6 // Skip holes in hash part. | beq <6 // Skip holes in hash part.
| stp CARG1, TMP0, [RA] | stp CARG1, TMP0, [RA]
@ -3501,8 +3497,8 @@ static void build_ins(BuildCtx *ctx, BCOp op, int defop)
| checkfunc CFUNC:CARG1, >5 | checkfunc CFUNC:CARG1, >5
| asr TMP0, TAB:CARG3, #47 | asr TMP0, TAB:CARG3, #47
| ldrb TMP1w, CFUNC:CARG1->ffid | ldrb TMP1w, CFUNC:CARG1->ffid
| cmn TMP0, #-LJ_TTAB | cmp_nil CARG4
| ccmp CARG4, TISNIL, #0, eq | ccmn TMP0, #-LJ_TTAB, #0, eq
| ccmp TMP1w, #FF_next_N, #0, eq | ccmp TMP1w, #FF_next_N, #0, eq
| bne >5 | bne >5
| mov TMP0w, #0xfffe7fff // LJ_KEYINDEX | mov TMP0w, #0xfffe7fff // LJ_KEYINDEX
@ -3542,51 +3538,51 @@ static void build_ins(BuildCtx *ctx, BCOp op, int defop)
| and RC, RC, #255 | and RC, RC, #255
| // RA = base, RB = (nresults+1), RC = numparams | // RA = base, RB = (nresults+1), RC = numparams
| ldr TMP1, [BASE, FRAME_PC] | ldr TMP1, [BASE, FRAME_PC]
| add RC, BASE, RC, lsl #3 | add TMP0, BASE, RC, lsl #3
| add RA, BASE, RA, lsl #3 | add RC, BASE, RA, lsl #3 // RC = destination
| add RC, RC, #FRAME_VARG | add TMP0, TMP0, #FRAME_VARG
| add TMP2, RA, RB, lsl #3 | add TMP2, RC, RB, lsl #3
| sub RC, RC, TMP1 // RC = vbase | sub RA, TMP0, TMP1 // RA = vbase
| // Note: RC may now be even _above_ BASE if nargs was < numparams. | // Note: RA may now be even _above_ BASE if nargs was < numparams.
| sub TMP3, BASE, #16 // TMP3 = vtop | sub TMP3, BASE, #16 // TMP3 = vtop
| cbz RB, >5 | cbz RB, >5
| sub TMP2, TMP2, #16 | sub TMP2, TMP2, #16
|1: // Copy vararg slots to destination slots. |1: // Copy vararg slots to destination slots.
| cmp RC, TMP3 | cmp RA, TMP3
| ldr TMP0, [RC], #8 | ldr TMP0, [RA], #8
| csel TMP0, TMP0, TISNIL, lo | csinv TMP0, TMP0, xzr, lo // TISNIL = ~xzr
| cmp RA, TMP2 | cmp RC, TMP2
| str TMP0, [RA], #8 | str TMP0, [RC], #8
| blo <1 | blo <1
|2: |2:
| ins_next | ins_next
| |
|5: // Copy all varargs. |5: // Copy all varargs.
| ldr TMP0, L->maxstack | ldr TMP0, L->maxstack
| subs TMP2, TMP3, RC | subs TMP2, TMP3, RA
| csel RB, xzr, TMP2, le // MULTRES = (max(vtop-vbase,0)+1)*8 | csel RB, xzr, TMP2, le // MULTRES = (max(vtop-vbase,0)+1)*8
| add RB, RB, #8 | add RB, RB, #8
| add TMP1, RA, TMP2 | add TMP1, RC, TMP2
| str RBw, SAVE_MULTRES | str RBw, SAVE_MULTRES
| ble <2 // Nothing to copy. | ble <2 // Nothing to copy.
| cmp TMP1, TMP0 | cmp TMP1, TMP0
| bhi >7 | bhi >7
|6: |6:
| ldr TMP0, [RC], #8 | ldr TMP0, [RA], #8
| str TMP0, [RA], #8 | str TMP0, [RC], #8
| cmp RC, TMP3 | cmp RA, TMP3
| blo <6 | blo <6
| b <2 | b <2
| |
|7: // Grow stack for varargs. |7: // Grow stack for varargs.
| lsr CARG2, TMP2, #3 | lsr CARG2, TMP2, #3
| stp BASE, RA, L->base | stp BASE, RC, L->base
| mov CARG1, L | mov CARG1, L
| sub RC, RC, BASE // Need delta, because BASE may change. | sub RA, RA, BASE // Need delta, because BASE may change.
| str PC, SAVE_PC | str PC, SAVE_PC
| bl extern lj_state_growstack // (lua_State *L, int n) | bl extern lj_state_growstack // (lua_State *L, int n)
| ldp BASE, RA, L->base | ldp BASE, RC, L->base
| add RC, BASE, RC | add RA, BASE, RA
| sub TMP3, BASE, #16 | sub TMP3, BASE, #16
| b <6 | b <6
break; break;
@ -3730,7 +3726,7 @@ static void build_ins(BuildCtx *ctx, BCOp op, int defop)
} else { } else {
| adds CARG1w, CARG1w, CARG3w | adds CARG1w, CARG1w, CARG3w
| bvs >2 | bvs >2
| add TMP0, CARG1, TISNUM | add_TISNUM TMP0, CARG1
| tbnz CARG3w, #31, >4 | tbnz CARG3w, #31, >4
| cmp CARG1w, CARG2w | cmp CARG1w, CARG2w
} }
@ -3809,7 +3805,7 @@ static void build_ins(BuildCtx *ctx, BCOp op, int defop)
| // RA = base, RC = target | // RA = base, RC = target
| ldr CARG1, [BASE, RA, lsl #3] | ldr CARG1, [BASE, RA, lsl #3]
| add TMP1, BASE, RA, lsl #3 | add TMP1, BASE, RA, lsl #3
| cmp CARG1, TISNIL | cmp_nil CARG1
| beq >1 // Stop if iterator returned nil. | beq >1 // Stop if iterator returned nil.
if (op == BC_JITERL) { if (op == BC_JITERL) {
| str CARG1, [TMP1, #-8] | str CARG1, [TMP1, #-8]