1
0
mirror of https://sourceware.org/git/glibc.git synced 2025-09-11 12:10:50 +03:00
Files
glibc/sysdeps/aarch64/__longjmp.S
Yury Khrustalev c0f0db2d59 aarch64: simplify calls to __libc_arm_za_disable in assembly
There is no functional change in this patch.

We remove stores and loads to stack, return address signing, and redundant
CFI directives before and after call to __libc_arm_za_disable().

The __libc_arm_za_disable implementation follows special calling convention
that allows to avoid most of the operations that would be necessary for a
call to a normal function (see [1] for details).

First, we rely on __libc_arm_za_disable() not clobbering certain registers,
and we put return address into one of these registers. Now we don't need
to store it on stack, so we don't need to sign return address using PAC.

Second, as a result of the above, we don't need to update the CFI offset.

This patch provides small optimisation avoiding unnecessary store and load
on stack also simplifies assembly code and CFI directives.

[1]: https://github.com/ARM-software/abi-aa/blob/main/aapcs64/aapcs64.rst

Reviewed-by: Adhemerval Zanella  <adhemerval.zanella@linaro.org>
2025-06-18 09:42:33 +01:00

160 lines
4.4 KiB
ArmAsm

/* Copyright (C) 1997-2025 Free Software Foundation, Inc.
This file is part of the GNU C Library.
The GNU C Library is free software; you can redistribute it and/or
modify it under the terms of the GNU Lesser General Public License as
published by the Free Software Foundation; either version 2.1 of the
License, or (at your option) any later version.
The GNU C Library is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
Lesser General Public License for more details.
You should have received a copy of the GNU Lesser General Public
License along with the GNU C Library. If not, see
<https://www.gnu.org/licenses/>. */
#include <sysdep.h>
#include <pointer_guard.h>
#include <jmpbuf-offsets.h>
#include <stap-probe.h>
/* __longjmp(jmpbuf, val) */
ENTRY (__longjmp)
#if IS_IN(libc)
/* Disable ZA state of SME in libc.a and libc.so, but not in ld.so.
The calling convention of __libc_arm_za_disable allows to do
this thus allowing to avoid saving to and reading from stack.
As a result we also don't need to sign the return address and
check it after returning because it is not stored to stack. */
mov x13, x30
cfi_register (x30, x13)
bl __libc_arm_za_disable
mov x30, x13
cfi_register (x13, x30)
#endif
cfi_def_cfa (x0, 0)
cfi_offset (x19, JB_X19<<3)
cfi_offset (x20, JB_X20<<3)
cfi_offset (x21, JB_X21<<3)
cfi_offset (x22, JB_X22<<3)
cfi_offset (x23, JB_X23<<3)
cfi_offset (x24, JB_X24<<3)
cfi_offset (x25, JB_X25<<3)
cfi_offset (x26, JB_X26<<3)
cfi_offset (x27, JB_X27<<3)
cfi_offset (x28, JB_X28<<3)
cfi_offset (x29, JB_X29<<3)
cfi_offset (x30, JB_LR<<3)
cfi_offset ( d8, JB_D8<<3)
cfi_offset ( d9, JB_D9<<3)
cfi_offset (d10, JB_D10<<3)
cfi_offset (d11, JB_D11<<3)
cfi_offset (d12, JB_D12<<3)
cfi_offset (d13, JB_D13<<3)
cfi_offset (d14, JB_D14<<3)
cfi_offset (d15, JB_D15<<3)
ldp x19, x20, [x0, #JB_X19<<3]
ldp x21, x22, [x0, #JB_X21<<3]
ldp x23, x24, [x0, #JB_X23<<3]
ldp x25, x26, [x0, #JB_X25<<3]
ldp x27, x28, [x0, #JB_X27<<3]
ldp x29, x30, [x0, #JB_X29<<3]
#ifdef PTR_DEMANGLE
PTR_DEMANGLE (x30, x30, x3)
#endif
/* longjmp probe takes 3 arguments, address of jump buffer as
first argument (8@x0), return value as second argument (-4@x1),
and target address (8@x30), respectively. */
LIBC_PROBE (longjmp, 3, 8@x0, -4@x1, 8@x30)
ldp d8, d9, [x0, #JB_D8<<3]
ldp d10, d11, [x0, #JB_D10<<3]
ldp d12, d13, [x0, #JB_D12<<3]
ldp d14, d15, [x0, #JB_D14<<3]
/* GCS support. */
mov x16, 1
CHKFEAT_X16
tbnz x16, 0, L(gcs_done)
MRS_GCSPR (x2)
ldr x3, [x0, #JB_GCSPR]
mov x4, x3
/* x2: GCSPR now. x3, x4: target GCSPR. x5, x6: tmp regs. */
L(gcs_scan):
cmp x2, x4
b.eq L(gcs_pop)
sub x4, x4, 8
/* Check for a cap token. */
ldr x5, [x4]
and x6, x4, 0xfffffffffffff000
orr x6, x6, 1
cmp x5, x6
b.ne L(gcs_scan)
L(gcs_switch):
add x2, x4, 8
GCSSS1 (x4)
GCSSS2 (xzr)
L(gcs_pop):
cmp x2, x3
b.eq L(gcs_done)
GCSPOPM (xzr)
add x2, x2, 8
b L(gcs_pop)
L(gcs_done):
/* Originally this was implemented with a series of
.cfi_restore() directives.
The theory was that cfi_restore should revert to previous
frame value is the same as the current value. In practice
this doesn't work, even after cfi_restore() gdb continues
to try to recover a previous frame value offset from x0,
which gets stuffed after a few more instructions. The
cfi_same_value() mechanism appears to work fine. */
cfi_same_value(x19)
cfi_same_value(x20)
cfi_same_value(x21)
cfi_same_value(x22)
cfi_same_value(x23)
cfi_same_value(x24)
cfi_same_value(x25)
cfi_same_value(x26)
cfi_same_value(x27)
cfi_same_value(x28)
cfi_same_value(x29)
cfi_same_value(x30)
cfi_same_value(d8)
cfi_same_value(d9)
cfi_same_value(d10)
cfi_same_value(d11)
cfi_same_value(d12)
cfi_same_value(d13)
cfi_same_value(d14)
cfi_same_value(d15)
ldr x4, [x0, #JB_SP<<3]
#ifdef PTR_DEMANGLE
PTR_DEMANGLE (x4, x4, x3)
#endif
mov sp, x4
/* longjmp_target probe takes 3 arguments, address of jump buffer
as first argument (8@x0), return value as second argument (-4@x1),
and target address (8@x30), respectively. */
LIBC_PROBE (longjmp_target, 3, 8@x0, -4@x1, 8@x30)
cmp x1, 0
cinc x0, x1, eq
/* Use br instead of ret because ret is guaranteed to mispredict */
br x30
END (__longjmp)