forked from rpms/glibc
1a997221e3
Upstream commit: 5d070d12b3a52bc44dd1b71743abc4b6243862ae
Related: RHEL-25850
- x86: Expand the comment on when REP STOSB is used on memset
- x86: Do not prefer ERMS for memset on Zen3+
- x86: Fix Zen3/Zen4 ERMS selection (BZ 30994)
Resolves: RHEL-25530
- Add tst-gnu2-tls2mod1 to test-internal-extras
- elf: Enable TLS descriptor tests on aarch64
- arm: Update _dl_tlsdesc_dynamic to preserve caller-saved registers (BZ 31372)
- Ignore undefined symbols for -mtls-dialect=gnu2
- x86-64: Allocate state buffer space for RDI, RSI and RBX
- x86-64: Update _dl_tlsdesc_dynamic to preserve AMX registers
- x86: Update _dl_tlsdesc_dynamic to preserve caller-saved registers
Resolves: RHEL-29179
- x86-64: Save APX registers in ld.so trampoline
Resolves: RHEL-25045
- LoongArch: Correct {__ieee754, _}_scalb -> {__ieee754, _}_scalbf
- powerpc: Placeholder and infrastructure/build support to add Power11 related changes.
- powerpc: Add HWCAP3/HWCAP4 data to TCB for Power Architecture.
Resolves: RHEL-24761
Fedora 40 commit: 24af28d49b
81 lines
2.8 KiB
Diff
81 lines
2.8 KiB
Diff
commit 7fc8242bf87828c935ac5df5cafb9dc7ab635fd9
|
|
Author: H.J. Lu <hjl.tools@gmail.com>
|
|
Date: Fri Feb 16 07:17:10 2024 -0800
|
|
|
|
x86-64: Save APX registers in ld.so trampoline
|
|
|
|
Add APX registers to STATE_SAVE_MASK so that APX registers are saved in
|
|
ld.so trampoline. This fixes BZ #31371.
|
|
|
|
Also update STATE_SAVE_OFFSET and STATE_SAVE_MASK for i386 which will
|
|
be used by i386 _dl_tlsdesc_dynamic.
|
|
Reviewed-by: Noah Goldstein <goldstein.w.n@gmail.com>
|
|
|
|
(cherry picked from commit dfb05f8e704edac70db38c4c8ee700769d91a413)
|
|
|
|
diff --git a/sysdeps/x86/sysdep.h b/sysdeps/x86/sysdep.h
|
|
index 85d0a8c943cbb218..837fd28734914a1c 100644
|
|
--- a/sysdeps/x86/sysdep.h
|
|
+++ b/sysdeps/x86/sysdep.h
|
|
@@ -21,14 +21,54 @@
|
|
|
|
#include <sysdeps/generic/sysdep.h>
|
|
|
|
+/* The extended state feature IDs in the state component bitmap. */
|
|
+#define X86_XSTATE_X87_ID 0
|
|
+#define X86_XSTATE_SSE_ID 1
|
|
+#define X86_XSTATE_AVX_ID 2
|
|
+#define X86_XSTATE_BNDREGS_ID 3
|
|
+#define X86_XSTATE_BNDCFG_ID 4
|
|
+#define X86_XSTATE_K_ID 5
|
|
+#define X86_XSTATE_ZMM_H_ID 6
|
|
+#define X86_XSTATE_ZMM_ID 7
|
|
+#define X86_XSTATE_PKRU_ID 9
|
|
+#define X86_XSTATE_TILECFG_ID 17
|
|
+#define X86_XSTATE_TILEDATA_ID 18
|
|
+#define X86_XSTATE_APX_F_ID 19
|
|
+
|
|
+#ifdef __x86_64__
|
|
/* Offset for fxsave/xsave area used by _dl_runtime_resolve. Also need
|
|
space to preserve RCX, RDX, RSI, RDI, R8, R9 and RAX. It must be
|
|
- aligned to 16 bytes for fxsave and 64 bytes for xsave. */
|
|
-#define STATE_SAVE_OFFSET (8 * 7 + 8)
|
|
-
|
|
-/* Save SSE, AVX, AVX512, mask and bound registers. */
|
|
-#define STATE_SAVE_MASK \
|
|
- ((1 << 1) | (1 << 2) | (1 << 3) | (1 << 5) | (1 << 6) | (1 << 7))
|
|
+ aligned to 16 bytes for fxsave and 64 bytes for xsave.
|
|
+
|
|
+ NB: It is non-zero because of the 128-byte red-zone. Some registers
|
|
+ are saved on stack without adjusting stack pointer first. When we
|
|
+ update stack pointer to allocate more space, we need to take the
|
|
+ red-zone into account. */
|
|
+# define STATE_SAVE_OFFSET (8 * 7 + 8)
|
|
+
|
|
+/* Save SSE, AVX, AVX512, mask, bound and APX registers. Bound and APX
|
|
+ registers are mutually exclusive. */
|
|
+# define STATE_SAVE_MASK \
|
|
+ ((1 << X86_XSTATE_SSE_ID) \
|
|
+ | (1 << X86_XSTATE_AVX_ID) \
|
|
+ | (1 << X86_XSTATE_BNDREGS_ID) \
|
|
+ | (1 << X86_XSTATE_K_ID) \
|
|
+ | (1 << X86_XSTATE_ZMM_H_ID) \
|
|
+ | (1 << X86_XSTATE_ZMM_ID) \
|
|
+ | (1 << X86_XSTATE_APX_F_ID))
|
|
+#else
|
|
+/* Offset for fxsave/xsave area used by _dl_tlsdesc_dynamic. Since i386
|
|
+ doesn't have red-zone, use 0 here. */
|
|
+# define STATE_SAVE_OFFSET 0
|
|
+
|
|
+/* Save SSE, AVX, AVX512, mask and bound registers. */
|
|
+# define STATE_SAVE_MASK \
|
|
+ ((1 << X86_XSTATE_SSE_ID) \
|
|
+ | (1 << X86_XSTATE_AVX_ID) \
|
|
+ | (1 << X86_XSTATE_BNDREGS_ID) \
|
|
+ | (1 << X86_XSTATE_K_ID) \
|
|
+ | (1 << X86_XSTATE_ZMM_H_ID))
|
|
+#endif
|
|
|
|
/* Constants for bits in __x86_string_control: */
|
|
|