mirror of
https://sourceware.org/git/glibc.git
synced 2025-10-28 23:34:53 +03:00
The current racy approach is to enable asynchronous cancellation
before making the syscall and restore the previous cancellation
type once the syscall returns, and check if cancellation has happen
during the cancellation entrypoint.
As described in BZ#12683, this approach shows 2 problems:
1. Cancellation can act after the syscall has returned from the
kernel, but before userspace saves the return value. It might
result in a resource leak if the syscall allocated a resource or a
side effect (partial read/write), and there is no way to program
handle it with cancellation handlers.
2. If a signal is handled while the thread is blocked at a cancellable
syscall, the entire signal handler runs with asynchronous
cancellation enabled. This can lead to issues if the signal
handler call functions which are async-signal-safe but not
async-cancel-safe.
For the cancellation to work correctly, there are 5 points at which the
cancellation signal could arrive:
[ ... )[ ... )[ syscall ]( ...
1 2 3 4 5
1. Before initial testcancel, e.g. [*... testcancel)
2. Between testcancel and syscall start, e.g. [testcancel...syscall start)
3. While syscall is blocked and no side effects have yet taken
place, e.g. [ syscall ]
4. Same as 3 but with side-effects having occurred (e.g. a partial
read or write).
5. After syscall end e.g. (syscall end...*]
And libc wants to act on cancellation in cases 1, 2, and 3 but not
in cases 4 or 5. For the 4 and 5 cases, the cancellation will eventually
happen in the next cancellable entrypoint without any further external
event.
The proposed solution for each case is:
1. Do a conditional branch based on whether the thread has received
a cancellation request;
2. It can be caught by the signal handler determining that the saved
program counter (from the ucontext_t) is in some address range
beginning just before the "testcancel" and ending with the
syscall instruction.
3. SIGCANCEL can be caught by the signal handler and determine that
the saved program counter (from the ucontext_t) is in the address
range beginning just before "testcancel" and ending with the first
uninterruptable (via a signal) syscall instruction that enters the
kernel.
4. In this case, except for certain syscalls that ALWAYS fail with
EINTR even for non-interrupting signals, the kernel will reset
the program counter to point at the syscall instruction during
signal handling, so that the syscall is restarted when the signal
handler returns. So, from the signal handler's standpoint, this
looks the same as case 2, and thus it's taken care of.
5. For syscalls with side-effects, the kernel cannot restart the
syscall; when it's interrupted by a signal, the kernel must cause
the syscall to return with whatever partial result is obtained
(e.g. partial read or write).
6. The saved program counter points just after the syscall
instruction, so the signal handler won't act on cancellation.
This is similar to 4. since the program counter is past the syscall
instruction.
So The proposed fixes are:
1. Remove the enable_asynccancel/disable_asynccancel function usage in
cancellable syscall definition and instead make them call a common
symbol that will check if cancellation is enabled (__syscall_cancel
at nptl/cancellation.c), call the arch-specific cancellable
entry-point (__syscall_cancel_arch), and cancel the thread when
required.
2. Provide an arch-specific generic system call wrapper function
that contains global markers. These markers will be used in
SIGCANCEL signal handler to check if the interruption has been
called in a valid syscall and if the syscalls has side-effects.
A reference implementation sysdeps/unix/sysv/linux/syscall_cancel.c
is provided. However, the markers may not be set on correct
expected places depending on how INTERNAL_SYSCALL_NCS is
implemented by the architecture. It is expected that all
architectures add an arch-specific implementation.
3. Rewrite SIGCANCEL asynchronous handler to check for both canceling
type and if current IP from signal handler falls between the global
markers and act accordingly.
4. Adjust libc code to replace LIBC_CANCEL_ASYNC/LIBC_CANCEL_RESET to
use the appropriate cancelable syscalls.
5. Adjust 'lowlevellock-futex.h' arch-specific implementations to
provide cancelable futex calls.
Some architectures require specific support on syscall handling:
* On i386 the syscall cancel bridge needs to use the old int80
instruction because the optimized vDSO symbol the resulting PC value
for an interrupted syscall points to an address outside the expected
markers in __syscall_cancel_arch. It has been discussed in LKML [1]
on how kernel could help userland to accomplish it, but afaik
discussion has stalled.
Also, sysenter should not be used directly by libc since its calling
convention is set by the kernel depending of the underlying x86 chip
(check kernel commit 30bfa7b3488bfb1bb75c9f50a5fcac1832970c60).
* mips o32 is the only kABI that requires 7 argument syscall, and to
avoid add a requirement on all architectures to support it, mips
support is added with extra internal defines.
Checked on aarch64-linux-gnu, arm-linux-gnueabihf, powerpc-linux-gnu,
powerpc64-linux-gnu, powerpc64le-linux-gnu, i686-linux-gnu, and
x86_64-linux-gnu.
[1] https://lkml.org/lkml/2016/3/8/1105
Reviewed-by: Carlos O'Donell <carlos@redhat.com>
199 lines
5.4 KiB
C
199 lines
5.4 KiB
C
/* Assembly macros for 32-bit PowerPC.
|
|
Copyright (C) 1999-2024 Free Software Foundation, Inc.
|
|
This file is part of the GNU C Library.
|
|
|
|
The GNU C Library is free software; you can redistribute it and/or
|
|
modify it under the terms of the GNU Lesser General Public
|
|
License as published by the Free Software Foundation; either
|
|
version 2.1 of the License, or (at your option) any later version.
|
|
|
|
The GNU C Library is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
Lesser General Public License for more details.
|
|
|
|
You should have received a copy of the GNU Lesser General Public
|
|
License along with the GNU C Library; if not, see
|
|
<https://www.gnu.org/licenses/>. */
|
|
|
|
#include <sysdeps/powerpc/sysdep.h>
|
|
|
|
#ifdef __ASSEMBLER__
|
|
|
|
/* If compiled for profiling, call `_mcount' at the start of each
|
|
function. */
|
|
#ifdef PROF
|
|
/* The mcount code relies on a the return address being on the stack
|
|
to locate our caller and so it can restore it; so store one just
|
|
for its benefit. */
|
|
# define CALL_MCOUNT \
|
|
mflr r0; \
|
|
stw r0,4(r1); \
|
|
cfi_offset (lr, 4); \
|
|
bl JUMPTARGET(_mcount);
|
|
#else /* PROF */
|
|
# define CALL_MCOUNT /* Do nothing. */
|
|
#endif /* PROF */
|
|
|
|
#define ENTRY(name) \
|
|
.globl C_SYMBOL_NAME(name); \
|
|
.type C_SYMBOL_NAME(name),@function; \
|
|
.align ALIGNARG(2); \
|
|
C_LABEL(name) \
|
|
cfi_startproc; \
|
|
CALL_MCOUNT
|
|
|
|
#define ENTRY_TOCLESS(name) ENTRY(name)
|
|
|
|
/* helper macro for accessing the 32-bit powerpc GOT. */
|
|
|
|
#define SETUP_GOT_ACCESS(regname,GOT_LABEL) \
|
|
bcl 20,31,GOT_LABEL ; \
|
|
GOT_LABEL: ; \
|
|
mflr (regname)
|
|
|
|
#define EALIGN_W_0 /* No words to insert. */
|
|
#define EALIGN_W_1 nop
|
|
#define EALIGN_W_2 nop;nop
|
|
#define EALIGN_W_3 nop;nop;nop
|
|
#define EALIGN_W_4 EALIGN_W_3;nop
|
|
#define EALIGN_W_5 EALIGN_W_4;nop
|
|
#define EALIGN_W_6 EALIGN_W_5;nop
|
|
#define EALIGN_W_7 EALIGN_W_6;nop
|
|
|
|
/* EALIGN is like ENTRY, but does alignment to 'words'*4 bytes
|
|
past a 2^align boundary. */
|
|
#ifdef PROF
|
|
# define EALIGN(name, alignt, words) \
|
|
.globl C_SYMBOL_NAME(name); \
|
|
.type C_SYMBOL_NAME(name),@function; \
|
|
.align ALIGNARG(2); \
|
|
C_LABEL(name) \
|
|
cfi_startproc; \
|
|
CALL_MCOUNT \
|
|
b 0f; \
|
|
.align ALIGNARG(alignt); \
|
|
EALIGN_W_##words; \
|
|
0:
|
|
#else /* PROF */
|
|
# define EALIGN(name, alignt, words) \
|
|
.globl C_SYMBOL_NAME(name); \
|
|
.type C_SYMBOL_NAME(name),@function; \
|
|
.align ALIGNARG(alignt); \
|
|
EALIGN_W_##words; \
|
|
C_LABEL(name) \
|
|
cfi_startproc;
|
|
#endif
|
|
|
|
#undef END
|
|
#define END(name) \
|
|
cfi_endproc; \
|
|
ASM_SIZE_DIRECTIVE(name)
|
|
|
|
#define DO_CALL(syscall) \
|
|
li 0,syscall; \
|
|
DO_CALL_SC
|
|
|
|
#define DO_CALL_SC \
|
|
sc
|
|
|
|
#undef JUMPTARGET
|
|
#ifdef PIC
|
|
# define JUMPTARGET(name) name##@plt
|
|
#else
|
|
# define JUMPTARGET(name) name
|
|
#endif
|
|
|
|
#define TAIL_CALL_NO_RETURN(__func) \
|
|
b __func@local
|
|
|
|
#if defined SHARED && defined PIC && !defined NO_HIDDEN
|
|
# undef HIDDEN_JUMPTARGET
|
|
# define HIDDEN_JUMPTARGET(name) __GI_##name##@local
|
|
#endif
|
|
|
|
#define TAIL_CALL_SYSCALL_ERROR \
|
|
b __syscall_error@local
|
|
|
|
#define PSEUDO(name, syscall_name, args) \
|
|
.section ".text"; \
|
|
ENTRY (name) \
|
|
DO_CALL (SYS_ify (syscall_name));
|
|
|
|
#define RET_SC \
|
|
bnslr+;
|
|
|
|
#define PSEUDO_RET \
|
|
RET_SC; \
|
|
TAIL_CALL_SYSCALL_ERROR
|
|
#define ret PSEUDO_RET
|
|
|
|
#undef PSEUDO_END
|
|
#define PSEUDO_END(name) \
|
|
END (name)
|
|
|
|
#define PSEUDO_NOERRNO(name, syscall_name, args) \
|
|
.section ".text"; \
|
|
ENTRY (name) \
|
|
DO_CALL (SYS_ify (syscall_name));
|
|
|
|
#define PSEUDO_RET_NOERRNO \
|
|
blr
|
|
#define ret_NOERRNO PSEUDO_RET_NOERRNO
|
|
|
|
#undef PSEUDO_END_NOERRNO
|
|
#define PSEUDO_END_NOERRNO(name) \
|
|
END (name)
|
|
|
|
#define PSEUDO_ERRVAL(name, syscall_name, args) \
|
|
.section ".text"; \
|
|
ENTRY (name) \
|
|
DO_CALL (SYS_ify (syscall_name));
|
|
|
|
#define PSEUDO_RET_ERRVAL \
|
|
blr
|
|
#define ret_ERRVAL PSEUDO_RET_ERRVAL
|
|
|
|
#undef PSEUDO_END_ERRVAL
|
|
#define PSEUDO_END_ERRVAL(name) \
|
|
END (name)
|
|
|
|
/* Local labels stripped out by the linker. */
|
|
#undef L
|
|
#define L(x) .L##x
|
|
|
|
#define XGLUE(a,b) a##b
|
|
#define GLUE(a,b) XGLUE (a,b)
|
|
#define GENERATE_GOT_LABEL(name) GLUE (.got_label, name)
|
|
|
|
/* Label in text section. */
|
|
#define C_TEXT(name) name
|
|
|
|
/* Read the value of member from rtld_global_ro. */
|
|
#ifdef PIC
|
|
# ifdef SHARED
|
|
# if IS_IN (rtld)
|
|
/* Inside ld.so we use the local alias to avoid runtime GOT
|
|
relocations. */
|
|
# define __GLRO(rOUT, rGOT, member, offset) \
|
|
lwz rOUT,_rtld_local_ro@got(rGOT); \
|
|
lwz rOUT,offset(rOUT)
|
|
# else
|
|
# define __GLRO(rOUT, rGOT, member, offset) \
|
|
lwz rOUT,_rtld_global_ro@got(rGOT); \
|
|
lwz rOUT,offset(rOUT)
|
|
# endif
|
|
# else
|
|
# define __GLRO(rOUT, rGOT, member, offset) \
|
|
lwz rOUT,member@got(rGOT); \
|
|
lwz rOUT,0(rOUT)
|
|
# endif
|
|
#else
|
|
/* Position-dependent code does not require access to the GOT. */
|
|
# define __GLRO(rOUT, rGOT, member, offset) \
|
|
lis rOUT,(member)@ha; \
|
|
lwz rOUT,(member)@l(rOUT)
|
|
#endif /* PIC */
|
|
|
|
#endif /* __ASSEMBLER__ */
|