From mboxrd@z Thu Jan 1 00:00:00 1970 Return-Path: Received: by sourceware.org (Postfix, from userid 1944) id 66AEF3857409; Fri, 5 Aug 2022 19:38:07 +0000 (GMT) DKIM-Filter: OpenDKIM Filter v2.11.0 sourceware.org 66AEF3857409 Content-Type: text/plain; charset="us-ascii" MIME-Version: 1.0 Content-Transfer-Encoding: 7bit From: Szabolcs Nagy To: glibc-cvs@sourceware.org Subject: [glibc/arm/morello/main] TODO(audit): aarch64: morello: add _dl_runtime_profile entry X-Act-Checkin: glibc X-Git-Author: Szabolcs Nagy X-Git-Refname: refs/heads/arm/morello/main X-Git-Oldrev: 7f9c78bc3a0eaa7bc5f04a585bdaf672c6578e9a X-Git-Newrev: a8989aef06cc29468d42f6efc21a06a46a32b249 Message-Id: <20220805193807.66AEF3857409@sourceware.org> Date: Fri, 5 Aug 2022 19:38:07 +0000 (GMT) X-BeenThere: glibc-cvs@sourceware.org X-Mailman-Version: 2.1.29 Precedence: list List-Id: Glibc-cvs mailing list List-Unsubscribe: , List-Archive: List-Help: List-Subscribe: , X-List-Received-Date: Fri, 05 Aug 2022 19:38:07 -0000 https://sourceware.org/git/gitweb.cgi?p=glibc.git;h=a8989aef06cc29468d42f6efc21a06a46a32b249 commit a8989aef06cc29468d42f6efc21a06a46a32b249 Author: Szabolcs Nagy Date: Wed Jul 13 16:01:24 2022 +0100 TODO(audit): aarch64: morello: add _dl_runtime_profile entry Required for LD_AUDIT PLT hooks and shared library profiling. incomplete, untested. TODO: needs La_aarch64* layout definition for morello TODO: needs to save c9 for vararg abi Diff: --- sysdeps/aarch64/bits/link.h | 19 ++++ sysdeps/aarch64/morello/dl-trampoline.S | 179 +++++++++++++++++++++++++++++++- 2 files changed, 194 insertions(+), 4 deletions(-) diff --git a/sysdeps/aarch64/bits/link.h b/sysdeps/aarch64/bits/link.h index 2479abc4fb..ca0e59f36c 100644 --- a/sysdeps/aarch64/bits/link.h +++ b/sysdeps/aarch64/bits/link.h @@ -28,6 +28,7 @@ typedef union } La_aarch64_vector; /* Registers for entry into PLT on AArch64. */ +#ifndef __CHERI_PURE_CAPABILITY__ typedef struct La_aarch64_regs { uint64_t lr_xreg[9]; @@ -46,6 +47,24 @@ typedef struct La_aarch64_retval La_aarch64_vector lrv_vreg[8]; void *lrv_vpcs; } La_aarch64_retval; +#else +typedef struct La_aarch64_regs +{ + uintptr_t lr_xreg[9]; + La_aarch64_vector lr_vreg[8]; + uintptr_t lr_sp; + uintptr_t lr_lr; + void *lr_vpcs; +} La_aarch64_regs; + +typedef struct La_aarch64_retval +{ + uintptr_t lrv_xreg[8]; + La_aarch64_vector lrv_vreg[8]; + void *lrv_vpcs; +} La_aarch64_retval; +#endif + __BEGIN_DECLS extern ElfW(Addr) diff --git a/sysdeps/aarch64/morello/dl-trampoline.S b/sysdeps/aarch64/morello/dl-trampoline.S index dcd61d66fe..c34fb91e75 100644 --- a/sysdeps/aarch64/morello/dl-trampoline.S +++ b/sysdeps/aarch64/morello/dl-trampoline.S @@ -125,10 +125,181 @@ _dl_runtime_resolve: .align 2 _dl_runtime_profile: - /* TODO: requires definition of La_aarch64_* layout - and register state saved correctly for varargs ABI. */ - mov c0, 0 - ldr c0, [c0] + /* Morello we get called with: + ip0 &PLTGOT[2] + ip1 temp(dl resolver entry point) + [csp, #16] lr + [csp, #0] &PLTGOT[n] + + Stack frame layout: + [csp, #...] lr + [csp, #...] &PLTGOT[n] + [csp, #192] La_aarch64_regs + [csp, #96] La_aarch64_retval + [csp, #80] frame size return from pltenter + [csp, #64] dl_profile_call saved c1 + [csp, #48] dl_profile_call saved c0 + [csp, #32] t1 + [csp, #0] c29, lr <- c29 + */ + +# define OFFSET_T1 32 +# define OFFSET_SAVED_CALL_X0 OFFSET_T1 + 16 +# define OFFSET_FS OFFSET_SAVED_CALL_X0 + 32 +# define OFFSET_RV OFFSET_FS + 16 +# define OFFSET_RG OFFSET_RV + DL_SIZEOF_RV + +# define SF_SIZE OFFSET_RG + DL_SIZEOF_RG + +# define OFFSET_PLTGOTN SF_SIZE +# define OFFSET_LR OFFSET_PLTGOTN + 16 + + /* Save arguments. */ + mov c11, csp + sub x11, x11, #SF_SIZE + scvalue csp, csp, x11 + cfi_adjust_cfa_offset (SF_SIZE) + stp c29, c30, [csp, #0] + mov c29, csp + cfi_def_cfa_register (c29) + cfi_rel_offset (c29, 0) + cfi_rel_offset (lr, 8) + + stp c0, c1, [c29, #OFFSET_RG + DL_OFFSET_RG_X0 + 32*0] + cfi_rel_offset (c0, OFFSET_RG + DL_OFFSET_RG_X0 + 32*0 + 0) + cfi_rel_offset (c1, OFFSET_RG + DL_OFFSET_RG_X0 + 32*0 + 16) + stp c2, c3, [c29, #OFFSET_RG + DL_OFFSET_RG_X0 + 32*1] + cfi_rel_offset (c2, OFFSET_RG + DL_OFFSET_RG_X0 + 32*1 + 0) + cfi_rel_offset (c3, OFFSET_RG + DL_OFFSET_RG_X0 + 32*1 + 16) + stp c4, c5, [c29, #OFFSET_RG + DL_OFFSET_RG_X0 + 32*2] + cfi_rel_offset (c4, OFFSET_RG + DL_OFFSET_RG_X0 + 32*2 + 0) + cfi_rel_offset (c5, OFFSET_RG + DL_OFFSET_RG_X0 + 32*2 + 16) + stp c6, c7, [c29, #OFFSET_RG + DL_OFFSET_RG_X0 + 32*3] + cfi_rel_offset (c6, OFFSET_RG + DL_OFFSET_RG_X0 + 32*3 + 0) + cfi_rel_offset (c7, OFFSET_RG + DL_OFFSET_RG_X0 + 32*3 + 16) + + stp q0, q1, [c29, #OFFSET_RG + DL_OFFSET_RG_V0 + 32*0] + cfi_rel_offset (q0, OFFSET_RG + DL_OFFSET_RG_V0 + 32*0) + cfi_rel_offset (q1, OFFSET_RG + DL_OFFSET_RG_V0 + 32*0 + 16) + stp q2, q3, [c29, #OFFSET_RG+ DL_OFFSET_RG_V0 + 32*1] + cfi_rel_offset (q2, OFFSET_RG + DL_OFFSET_RG_V0 + 32*1 + 0) + cfi_rel_offset (q3, OFFSET_RG + DL_OFFSET_RG_V0 + 32*1 + 16) + stp q4, q5, [c29, #OFFSET_RG + DL_OFFSET_RG_V0 + 32*2] + cfi_rel_offset (q4, OFFSET_RG + DL_OFFSET_RG_V0 + 32*2 + 0) + cfi_rel_offset (q5, OFFSET_RG + DL_OFFSET_RG_V0 + 32*2 + 16) + stp q6, q7, [c29, #OFFSET_RG + DL_OFFSET_RG_V0 + 32*3] + cfi_rel_offset (q6, OFFSET_RG + DL_OFFSET_RG_V0 + 32*3 + 0) + cfi_rel_offset (q7, OFFSET_RG + DL_OFFSET_RG_V0 + 32*3 + 16) + + add c0, c29, #SF_SIZE + 32 + ldr c1, [c29, #OFFSET_LR] + stp c0, c1, [c29, #OFFSET_RG + DL_OFFSET_RG_SP] + + /* Get pointer to linker struct. */ + ldr c0, [ip0, #-PTR_SIZE] + + /* Prepare to call _dl_profile_fixup(). */ + ldr c1, [c29, OFFSET_PLTGOTN] /* Recover &PLTGOT[n] */ + + mov c11, c1 + sub x1, x1, x16 + add x1, x1, x1, lsl #1 + lsl x1, x1, #3 + sub x1, x1, #(RELA_SIZE<<3) + lsr x1, x1, #3 + scvalue c1, c11, x1 + + stp c0, c1, [c29, #OFFSET_SAVED_CALL_X0] + + /* Set up extra args for _dl_profile_fixup */ + ldr c2, [c29, #OFFSET_LR] /* load saved LR */ + add c3, c29, #OFFSET_RG /* address of La_aarch64_reg */ + add c4, c29, #OFFSET_FS /* address of framesize */ + bl _dl_profile_fixup + + ldr ip0l, [c29, #OFFSET_FS] /* framesize == 0 */ + cmp x16, #0 + bge 1f + cfi_remember_state + + /* Save the return. */ + mov ip0, c0 + + /* Get arguments and return address back. */ + ldp c0, c1, [c29, #OFFSET_RG + DL_OFFSET_RG_X0 + 32*0] + ldp c2, c3, [c29, #OFFSET_RG + DL_OFFSET_RG_X0 + 32*1] + ldp c4, c5, [c29, #OFFSET_RG + DL_OFFSET_RG_X0 + 32*2] + ldp c6, c7, [c29, #OFFSET_RG + DL_OFFSET_RG_X0 + 32*3] + ldp q0, q1, [c29, #OFFSET_RG + DL_OFFSET_RG_V0 + 32*0] + ldp q2, q3, [c29, #OFFSET_RG + DL_OFFSET_RG_V0 + 32*1] + ldp q4, q5, [c29, #OFFSET_RG + DL_OFFSET_RG_V0 + 32*2] + ldp q6, q7, [c29, #OFFSET_RG + DL_OFFSET_RG_V0 + 32*3] + + cfi_def_cfa_register (csp) + ldp c29, c30, [c29, #0] + cfi_restore(c29) + cfi_restore(c30) + + add csp, csp, SF_SIZE + 16 + cfi_adjust_cfa_offset (- SF_SIZE - 32) + + /* Jump to the newly found address. */ + br ip0 + + cfi_restore_state +1: + /* The new frame size is in ip0. */ + + mov c11, c1 + sub x1, x29, x16 + and x12, x1, #0xfffffffffffffff0 + scvalue csp, csp, x12 + scvalue c1, c11, x1 + + str c0, [c29, #OFFSET_T1] + + mov c0, csp + add c1, c29, #SF_SIZE + 16 + mov c2, ip0 + bl memcpy + + ldr ip0, [c29, #OFFSET_T1] + + /* Call the function. */ + ldp c0, c1, [c29, #OFFSET_RG + DL_OFFSET_RG_X0 + 32*0] + ldp c2, c3, [c29, #OFFSET_RG + DL_OFFSET_RG_X0 + 32*1] + ldp c4, c5, [c29, #OFFSET_RG + DL_OFFSET_RG_X0 + 32*2] + ldp c6, c7, [c29, #OFFSET_RG + DL_OFFSET_RG_X0 + 32*3] + ldp q0, q1, [c29, #OFFSET_RG + DL_OFFSET_RG_V0 + 32*0] + ldp q2, q3, [c29, #OFFSET_RG + DL_OFFSET_RG_V0 + 32*1] + ldp q4, q5, [c29, #OFFSET_RG + DL_OFFSET_RG_V0 + 32*2] + ldp q6, q7, [c29, #OFFSET_RG + DL_OFFSET_RG_V0 + 32*3] + blr ip0 + stp c0, c1, [c29, #OFFSET_RV + DL_OFFSET_RV_X0] + stp q0, q1, [c29, #OFFSET_RV + DL_OFFSET_RV_V0 + 32*0] + stp q2, q3, [c29, #OFFSET_RV + DL_OFFSET_RV_V0 + 32*1] + + /* Setup call to pltexit */ + ldp c0, c1, [c29, #OFFSET_SAVED_CALL_X0] + add c2, c29, #OFFSET_RG + add c3, c29, #OFFSET_RV + bl _dl_audit_pltexit + + ldp c0, c1, [c29, #OFFSET_RV + DL_OFFSET_RV_X0] + ldp d0, d1, [c29, #OFFSET_RV + DL_OFFSET_RV_V0 + 32*0] + ldp d2, d3, [c29, #OFFSET_RV + DL_OFFSET_RV_V0 + 32*1] + /* LR from within La_aarch64_reg */ + ldr lr, [c29, #OFFSET_RG + DL_OFFSET_RG_LR] + cfi_restore(lr) + + mov csp, c29 + cfi_def_cfa_register (csp) + ldr c29, [c29, #0] + cfi_restore(c29) + add csp, csp, SF_SIZE + 32 + cfi_adjust_cfa_offset (- SF_SIZE - 32) + + br lr cfi_endproc .size _dl_runtime_profile, .-_dl_runtime_profile