|
|
307c0f |
From FEDORA_PATCHES Mon Sep 17 00:00:00 2001
|
|
|
307c0f |
From: Tom de Vries <tdevries@suse.de>
|
|
|
307c0f |
Date: Mon, 6 Dec 2021 15:39:03 -0500
|
|
|
307c0f |
Subject: gdb-rhbz2019936-gdbserver-avx512-m32.patch
|
|
|
307c0f |
|
|
|
307c0f |
;; Backport "Fix avx512 -m32 support in gdbserver"
|
|
|
307c0f |
;; (Tom de Vries, RHBZ 2019936)
|
|
|
307c0f |
|
|
|
307c0f |
PR27257 reports a problem that can be reproduced as follows:
|
|
|
307c0f |
- use x86_64 machine with avx512 support
|
|
|
307c0f |
- compile a hello world with -m32 to a.out
|
|
|
307c0f |
- start a gdbserver session with a.out
|
|
|
307c0f |
- use gdb to connect to the gdbserver session
|
|
|
307c0f |
|
|
|
307c0f |
This makes us run into:
|
|
|
307c0f |
...
|
|
|
307c0f |
Listening on port 2346
|
|
|
307c0f |
Remote debugging from host ::1, port 34940
|
|
|
307c0f |
src/gdbserver/regcache.cc:257: \
|
|
|
307c0f |
A problem internal to GDBserver has been detected.
|
|
|
307c0f |
Unknown register zmm16h requested
|
|
|
307c0f |
...
|
|
|
307c0f |
|
|
|
307c0f |
The problem is that i387_xsave_to_cache in gdbserver/i387-fp.cc can't find a
|
|
|
307c0f |
register zmm16h in the register cache.
|
|
|
307c0f |
|
|
|
307c0f |
To understand how this happens, first some background.
|
|
|
307c0f |
|
|
|
307c0f |
SSE has 16 128-bit wide xmm registers.
|
|
|
307c0f |
|
|
|
307c0f |
AVX extends the SSE register set as follows:
|
|
|
307c0f |
- it extends the 16 existing 128-bit wide xmm registers to 256-bit wide ymm
|
|
|
307c0f |
registers.
|
|
|
307c0f |
|
|
|
307c0f |
AVX512 extends the AVX register set as follows:
|
|
|
307c0f |
- it extends the 16 existing 256-bit wide ymm registers to 512-bit wide zmm
|
|
|
307c0f |
registers.
|
|
|
307c0f |
- it adds 16 additional 512-bit wide zmm registers (with corresponding ymm and
|
|
|
307c0f |
xmm subregisters added as well)
|
|
|
307c0f |
|
|
|
307c0f |
However, in 32-bit mode, there are only 8 xmm/ymm/zmm registers.
|
|
|
307c0f |
|
|
|
307c0f |
The problem we're running into is that gdbserver/i387-fp.cc uses these
|
|
|
307c0f |
constants to describe the size of the register file:
|
|
|
307c0f |
...
|
|
|
307c0f |
static const int num_avx512_zmmh_low_registers = 16;
|
|
|
307c0f |
static const int num_avx512_zmmh_high_registers = 16;
|
|
|
307c0f |
static const int num_avx512_ymmh_registers = 16;
|
|
|
307c0f |
static const int num_avx512_xmm_registers = 16;
|
|
|
307c0f |
...
|
|
|
307c0f |
which are all incorrect for the 32-bit case.
|
|
|
307c0f |
|
|
|
307c0f |
Fix this by replacing the constants with variables that have the appropriate
|
|
|
307c0f |
values in 64-bit and 32-bit mode.
|
|
|
307c0f |
|
|
|
307c0f |
Tested on x86_64-linux with native and unix/-m32.
|
|
|
307c0f |
|
|
|
307c0f |
diff --git a/gdbserver/i387-fp.cc b/gdbserver/i387-fp.cc
|
|
|
307c0f |
--- a/gdbserver/i387-fp.cc
|
|
|
307c0f |
+++ b/gdbserver/i387-fp.cc
|
|
|
307c0f |
@@ -23,10 +23,6 @@
|
|
|
307c0f |
static const int num_mpx_bnd_registers = 4;
|
|
|
307c0f |
static const int num_mpx_cfg_registers = 2;
|
|
|
307c0f |
static const int num_avx512_k_registers = 8;
|
|
|
307c0f |
-static const int num_avx512_zmmh_low_registers = 16;
|
|
|
307c0f |
-static const int num_avx512_zmmh_high_registers = 16;
|
|
|
307c0f |
-static const int num_avx512_ymmh_registers = 16;
|
|
|
307c0f |
-static const int num_avx512_xmm_registers = 16;
|
|
|
307c0f |
static const int num_pkeys_registers = 1;
|
|
|
307c0f |
|
|
|
307c0f |
/* Note: These functions preserve the reserved bits in control registers.
|
|
|
307c0f |
@@ -256,14 +252,22 @@ void
|
|
|
307c0f |
i387_cache_to_xsave (struct regcache *regcache, void *buf)
|
|
|
307c0f |
{
|
|
|
307c0f |
struct i387_xsave *fp = (struct i387_xsave *) buf;
|
|
|
307c0f |
+ bool amd64 = register_size (regcache->tdesc, 0) == 8;
|
|
|
307c0f |
int i;
|
|
|
307c0f |
unsigned long val, val2;
|
|
|
307c0f |
unsigned long long xstate_bv = 0;
|
|
|
307c0f |
unsigned long long clear_bv = 0;
|
|
|
307c0f |
char raw[64];
|
|
|
307c0f |
char *p;
|
|
|
307c0f |
+
|
|
|
307c0f |
/* Amd64 has 16 xmm regs; I386 has 8 xmm regs. */
|
|
|
307c0f |
- int num_xmm_registers = register_size (regcache->tdesc, 0) == 8 ? 16 : 8;
|
|
|
307c0f |
+ int num_xmm_registers = amd64 ? 16 : 8;
|
|
|
307c0f |
+ /* AVX512 extends the existing xmm/ymm registers to a wider mode: zmm. */
|
|
|
307c0f |
+ int num_avx512_zmmh_low_registers = num_xmm_registers;
|
|
|
307c0f |
+ /* AVX512 adds 16 extra regs in Amd64 mode, but none in I386 mode.*/
|
|
|
307c0f |
+ int num_avx512_zmmh_high_registers = amd64 ? 16 : 0;
|
|
|
307c0f |
+ int num_avx512_ymmh_registers = amd64 ? 16 : 0;
|
|
|
307c0f |
+ int num_avx512_xmm_registers = amd64 ? 16 : 0;
|
|
|
307c0f |
|
|
|
307c0f |
/* The supported bits in `xstat_bv' are 8 bytes. Clear part in
|
|
|
307c0f |
vector registers if its bit in xstat_bv is zero. */
|
|
|
307c0f |
@@ -452,7 +456,9 @@ i387_cache_to_xsave (struct regcache *regcache, void *buf)
|
|
|
307c0f |
/* Check if any of ZMM16H-ZMM31H registers are changed. */
|
|
|
307c0f |
if ((x86_xcr0 & X86_XSTATE_ZMM))
|
|
|
307c0f |
{
|
|
|
307c0f |
- int zmm16h_regnum = find_regno (regcache->tdesc, "zmm16h");
|
|
|
307c0f |
+ int zmm16h_regnum = (num_avx512_zmmh_high_registers == 0
|
|
|
307c0f |
+ ? -1
|
|
|
307c0f |
+ : find_regno (regcache->tdesc, "zmm16h"));
|
|
|
307c0f |
|
|
|
307c0f |
for (i = 0; i < num_avx512_zmmh_high_registers; i++)
|
|
|
307c0f |
{
|
|
|
307c0f |
@@ -469,7 +475,9 @@ i387_cache_to_xsave (struct regcache *regcache, void *buf)
|
|
|
307c0f |
/* Check if any XMM_AVX512 registers are changed. */
|
|
|
307c0f |
if ((x86_xcr0 & X86_XSTATE_ZMM))
|
|
|
307c0f |
{
|
|
|
307c0f |
- int xmm_avx512_regnum = find_regno (regcache->tdesc, "xmm16");
|
|
|
307c0f |
+ int xmm_avx512_regnum = (num_avx512_xmm_registers == 0
|
|
|
307c0f |
+ ? -1
|
|
|
307c0f |
+ : find_regno (regcache->tdesc, "xmm16"));
|
|
|
307c0f |
|
|
|
307c0f |
for (i = 0; i < num_avx512_xmm_registers; i++)
|
|
|
307c0f |
{
|
|
|
307c0f |
@@ -486,7 +494,9 @@ i387_cache_to_xsave (struct regcache *regcache, void *buf)
|
|
|
307c0f |
/* Check if any YMMH_AVX512 registers are changed. */
|
|
|
307c0f |
if ((x86_xcr0 & X86_XSTATE_ZMM))
|
|
|
307c0f |
{
|
|
|
307c0f |
- int ymmh_avx512_regnum = find_regno (regcache->tdesc, "ymm16h");
|
|
|
307c0f |
+ int ymmh_avx512_regnum = (num_avx512_ymmh_registers == 0
|
|
|
307c0f |
+ ? -1
|
|
|
307c0f |
+ : find_regno (regcache->tdesc, "ymm16h"));
|
|
|
307c0f |
|
|
|
307c0f |
for (i = 0; i < num_avx512_ymmh_registers; i++)
|
|
|
307c0f |
{
|
|
|
307c0f |
@@ -710,12 +720,20 @@ i387_xsave_to_cache (struct regcache *regcache, const void *buf)
|
|
|
307c0f |
{
|
|
|
307c0f |
struct i387_xsave *fp = (struct i387_xsave *) buf;
|
|
|
307c0f |
struct i387_fxsave *fxp = (struct i387_fxsave *) buf;
|
|
|
307c0f |
+ bool amd64 = register_size (regcache->tdesc, 0) == 8;
|
|
|
307c0f |
int i, top;
|
|
|
307c0f |
unsigned long val;
|
|
|
307c0f |
unsigned long long clear_bv;
|
|
|
307c0f |
gdb_byte *p;
|
|
|
307c0f |
- /* Amd64 has 16 xmm regs; I386 has 8 xmm regs. */
|
|
|
307c0f |
- int num_xmm_registers = register_size (regcache->tdesc, 0) == 8 ? 16 : 8;
|
|
|
307c0f |
+
|
|
|
307c0f |
+ /* Amd64 has 16 xmm regs; I386 has 8 xmm regs. */
|
|
|
307c0f |
+ int num_xmm_registers = amd64 ? 16 : 8;
|
|
|
307c0f |
+ /* AVX512 extends the existing xmm/ymm registers to a wider mode: zmm. */
|
|
|
307c0f |
+ int num_avx512_zmmh_low_registers = num_xmm_registers;
|
|
|
307c0f |
+ /* AVX512 adds 16 extra regs in Amd64 mode, but none in I386 mode.*/
|
|
|
307c0f |
+ int num_avx512_zmmh_high_registers = amd64 ? 16 : 0;
|
|
|
307c0f |
+ int num_avx512_ymmh_registers = amd64 ? 16 : 0;
|
|
|
307c0f |
+ int num_avx512_xmm_registers = amd64 ? 16 : 0;
|
|
|
307c0f |
|
|
|
307c0f |
/* The supported bits in `xstat_bv' are 8 bytes. Clear part in
|
|
|
307c0f |
vector registers if its bit in xstat_bv is zero. */
|
|
|
307c0f |
@@ -845,9 +863,15 @@ i387_xsave_to_cache (struct regcache *regcache, const void *buf)
|
|
|
307c0f |
|
|
|
307c0f |
if ((x86_xcr0 & X86_XSTATE_ZMM) != 0)
|
|
|
307c0f |
{
|
|
|
307c0f |
- int zmm16h_regnum = find_regno (regcache->tdesc, "zmm16h");
|
|
|
307c0f |
- int ymm16h_regnum = find_regno (regcache->tdesc, "ymm16h");
|
|
|
307c0f |
- int xmm16_regnum = find_regno (regcache->tdesc, "xmm16");
|
|
|
307c0f |
+ int zmm16h_regnum = (num_avx512_zmmh_high_registers == 0
|
|
|
307c0f |
+ ? -1
|
|
|
307c0f |
+ : find_regno (regcache->tdesc, "zmm16h"));
|
|
|
307c0f |
+ int ymm16h_regnum = (num_avx512_ymmh_registers == 0
|
|
|
307c0f |
+ ? -1
|
|
|
307c0f |
+ : find_regno (regcache->tdesc, "ymm16h"));
|
|
|
307c0f |
+ int xmm16_regnum = (num_avx512_xmm_registers == 0
|
|
|
307c0f |
+ ? -1
|
|
|
307c0f |
+ : find_regno (regcache->tdesc, "xmm16"));
|
|
|
307c0f |
|
|
|
307c0f |
if ((clear_bv & X86_XSTATE_ZMM) != 0)
|
|
|
307c0f |
{
|