mirror of
https://sourceware.org/git/glibc.git
synced 2025-09-11 12:10:50 +03:00
There is no functional change in this patch. We remove stores and loads to stack, return address signing, and redundant CFI directives before and after call to __libc_arm_za_disable(). The __libc_arm_za_disable implementation follows special calling convention that allows to avoid most of the operations that would be necessary for a call to a normal function (see [1] for details). First, we rely on __libc_arm_za_disable() not clobbering certain registers, and we put return address into one of these registers. Now we don't need to store it on stack, so we don't need to sign return address using PAC. Second, as a result of the above, we don't need to update the CFI offset. This patch provides small optimisation avoiding unnecessary store and load on stack also simplifies assembly code and CFI directives. [1]: https://github.com/ARM-software/abi-aa/blob/main/aapcs64/aapcs64.rst Reviewed-by: Adhemerval Zanella <adhemerval.zanella@linaro.org>
160 lines
4.4 KiB
ArmAsm
160 lines
4.4 KiB
ArmAsm
/* Copyright (C) 1997-2025 Free Software Foundation, Inc.
|
|
|
|
This file is part of the GNU C Library.
|
|
|
|
The GNU C Library is free software; you can redistribute it and/or
|
|
modify it under the terms of the GNU Lesser General Public License as
|
|
published by the Free Software Foundation; either version 2.1 of the
|
|
License, or (at your option) any later version.
|
|
|
|
The GNU C Library is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
Lesser General Public License for more details.
|
|
|
|
You should have received a copy of the GNU Lesser General Public
|
|
License along with the GNU C Library. If not, see
|
|
<https://www.gnu.org/licenses/>. */
|
|
|
|
#include <sysdep.h>
|
|
#include <pointer_guard.h>
|
|
#include <jmpbuf-offsets.h>
|
|
#include <stap-probe.h>
|
|
|
|
/* __longjmp(jmpbuf, val) */
|
|
|
|
ENTRY (__longjmp)
|
|
|
|
#if IS_IN(libc)
|
|
/* Disable ZA state of SME in libc.a and libc.so, but not in ld.so.
|
|
The calling convention of __libc_arm_za_disable allows to do
|
|
this thus allowing to avoid saving to and reading from stack.
|
|
As a result we also don't need to sign the return address and
|
|
check it after returning because it is not stored to stack. */
|
|
mov x13, x30
|
|
cfi_register (x30, x13)
|
|
bl __libc_arm_za_disable
|
|
mov x30, x13
|
|
cfi_register (x13, x30)
|
|
#endif
|
|
|
|
cfi_def_cfa (x0, 0)
|
|
cfi_offset (x19, JB_X19<<3)
|
|
cfi_offset (x20, JB_X20<<3)
|
|
cfi_offset (x21, JB_X21<<3)
|
|
cfi_offset (x22, JB_X22<<3)
|
|
cfi_offset (x23, JB_X23<<3)
|
|
cfi_offset (x24, JB_X24<<3)
|
|
cfi_offset (x25, JB_X25<<3)
|
|
cfi_offset (x26, JB_X26<<3)
|
|
cfi_offset (x27, JB_X27<<3)
|
|
cfi_offset (x28, JB_X28<<3)
|
|
cfi_offset (x29, JB_X29<<3)
|
|
cfi_offset (x30, JB_LR<<3)
|
|
|
|
cfi_offset ( d8, JB_D8<<3)
|
|
cfi_offset ( d9, JB_D9<<3)
|
|
cfi_offset (d10, JB_D10<<3)
|
|
cfi_offset (d11, JB_D11<<3)
|
|
cfi_offset (d12, JB_D12<<3)
|
|
cfi_offset (d13, JB_D13<<3)
|
|
cfi_offset (d14, JB_D14<<3)
|
|
cfi_offset (d15, JB_D15<<3)
|
|
|
|
ldp x19, x20, [x0, #JB_X19<<3]
|
|
ldp x21, x22, [x0, #JB_X21<<3]
|
|
ldp x23, x24, [x0, #JB_X23<<3]
|
|
ldp x25, x26, [x0, #JB_X25<<3]
|
|
ldp x27, x28, [x0, #JB_X27<<3]
|
|
ldp x29, x30, [x0, #JB_X29<<3]
|
|
#ifdef PTR_DEMANGLE
|
|
PTR_DEMANGLE (x30, x30, x3)
|
|
#endif
|
|
/* longjmp probe takes 3 arguments, address of jump buffer as
|
|
first argument (8@x0), return value as second argument (-4@x1),
|
|
and target address (8@x30), respectively. */
|
|
LIBC_PROBE (longjmp, 3, 8@x0, -4@x1, 8@x30)
|
|
ldp d8, d9, [x0, #JB_D8<<3]
|
|
ldp d10, d11, [x0, #JB_D10<<3]
|
|
ldp d12, d13, [x0, #JB_D12<<3]
|
|
ldp d14, d15, [x0, #JB_D14<<3]
|
|
|
|
/* GCS support. */
|
|
mov x16, 1
|
|
CHKFEAT_X16
|
|
tbnz x16, 0, L(gcs_done)
|
|
MRS_GCSPR (x2)
|
|
ldr x3, [x0, #JB_GCSPR]
|
|
mov x4, x3
|
|
/* x2: GCSPR now. x3, x4: target GCSPR. x5, x6: tmp regs. */
|
|
L(gcs_scan):
|
|
cmp x2, x4
|
|
b.eq L(gcs_pop)
|
|
sub x4, x4, 8
|
|
/* Check for a cap token. */
|
|
ldr x5, [x4]
|
|
and x6, x4, 0xfffffffffffff000
|
|
orr x6, x6, 1
|
|
cmp x5, x6
|
|
b.ne L(gcs_scan)
|
|
L(gcs_switch):
|
|
add x2, x4, 8
|
|
GCSSS1 (x4)
|
|
GCSSS2 (xzr)
|
|
L(gcs_pop):
|
|
cmp x2, x3
|
|
b.eq L(gcs_done)
|
|
GCSPOPM (xzr)
|
|
add x2, x2, 8
|
|
b L(gcs_pop)
|
|
L(gcs_done):
|
|
|
|
/* Originally this was implemented with a series of
|
|
.cfi_restore() directives.
|
|
|
|
The theory was that cfi_restore should revert to previous
|
|
frame value is the same as the current value. In practice
|
|
this doesn't work, even after cfi_restore() gdb continues
|
|
to try to recover a previous frame value offset from x0,
|
|
which gets stuffed after a few more instructions. The
|
|
cfi_same_value() mechanism appears to work fine. */
|
|
|
|
cfi_same_value(x19)
|
|
cfi_same_value(x20)
|
|
cfi_same_value(x21)
|
|
cfi_same_value(x22)
|
|
cfi_same_value(x23)
|
|
cfi_same_value(x24)
|
|
cfi_same_value(x25)
|
|
cfi_same_value(x26)
|
|
cfi_same_value(x27)
|
|
cfi_same_value(x28)
|
|
cfi_same_value(x29)
|
|
cfi_same_value(x30)
|
|
cfi_same_value(d8)
|
|
cfi_same_value(d9)
|
|
cfi_same_value(d10)
|
|
cfi_same_value(d11)
|
|
cfi_same_value(d12)
|
|
cfi_same_value(d13)
|
|
cfi_same_value(d14)
|
|
cfi_same_value(d15)
|
|
|
|
ldr x4, [x0, #JB_SP<<3]
|
|
#ifdef PTR_DEMANGLE
|
|
PTR_DEMANGLE (x4, x4, x3)
|
|
#endif
|
|
mov sp, x4
|
|
|
|
/* longjmp_target probe takes 3 arguments, address of jump buffer
|
|
as first argument (8@x0), return value as second argument (-4@x1),
|
|
and target address (8@x30), respectively. */
|
|
LIBC_PROBE (longjmp_target, 3, 8@x0, -4@x1, 8@x30)
|
|
|
|
cmp x1, 0
|
|
cinc x0, x1, eq
|
|
|
|
/* Use br instead of ret because ret is guaranteed to mispredict */
|
|
br x30
|
|
END (__longjmp)
|