|
|
3db796 |
|
|
|
3db796 |
PR target/84128
|
|
|
3db796 |
* config/i386/i386.c (release_scratch_register_on_entry): Add new
|
|
|
3db796 |
OFFSET and RELEASE_VIA_POP arguments. Use SP+OFFSET to restore
|
|
|
3db796 |
the scratch if RELEASE_VIA_POP is false.
|
|
|
3db796 |
(ix86_adjust_stack_and_probe_stack_clash): Un-constify SIZE.
|
|
|
3db796 |
If we have to save a temporary register, decrement SIZE appropriately.
|
|
|
3db796 |
Pass new arguments to release_scratch_register_on_entry.
|
|
|
3db796 |
(ix86_adjust_stack_and_probe): Likewise.
|
|
|
3db796 |
(ix86_emit_probe_stack_range): Pass new arguments to
|
|
|
3db796 |
release_scratch_register_on_entry.
|
|
|
3db796 |
|
|
|
3db796 |
PR target/84128
|
|
|
3db796 |
* gcc.target/i386/pr84128.c: New test.
|
|
|
3db796 |
|
|
|
3db796 |
diff --git a/gcc/config/i386/i386.c b/gcc/config/i386/i386.c
|
|
|
3db796 |
index fef34a1..3196ac4 100644
|
|
|
3db796 |
--- gcc/config/i386/i386.c
|
|
|
3db796 |
+++ gcc/config/i386/i386.c
|
|
|
3db796 |
@@ -12567,22 +12567,39 @@ get_scratch_register_on_entry (struct scratch_reg *sr)
|
|
|
3db796 |
}
|
|
|
3db796 |
}
|
|
|
3db796 |
|
|
|
3db796 |
-/* Release a scratch register obtained from the preceding function. */
|
|
|
3db796 |
+/* Release a scratch register obtained from the preceding function.
|
|
|
3db796 |
+
|
|
|
3db796 |
+ If RELEASE_VIA_POP is true, we just pop the register off the stack
|
|
|
3db796 |
+ to release it. This is what non-Linux systems use with -fstack-check.
|
|
|
3db796 |
+
|
|
|
3db796 |
+ Otherwise we use OFFSET to locate the saved register and the
|
|
|
3db796 |
+ allocated stack space becomes part of the local frame and is
|
|
|
3db796 |
+ deallocated by the epilogue. */
|
|
|
3db796 |
|
|
|
3db796 |
static void
|
|
|
3db796 |
-release_scratch_register_on_entry (struct scratch_reg *sr)
|
|
|
3db796 |
+release_scratch_register_on_entry (struct scratch_reg *sr, HOST_WIDE_INT offset,
|
|
|
3db796 |
+ bool release_via_pop)
|
|
|
3db796 |
{
|
|
|
3db796 |
if (sr->saved)
|
|
|
3db796 |
{
|
|
|
3db796 |
- struct machine_function *m = cfun->machine;
|
|
|
3db796 |
- rtx x, insn = emit_insn (gen_pop (sr->reg));
|
|
|
3db796 |
+ if (release_via_pop)
|
|
|
3db796 |
+ {
|
|
|
3db796 |
+ struct machine_function *m = cfun->machine;
|
|
|
3db796 |
+ rtx x, insn = emit_insn (gen_pop (sr->reg));
|
|
|
3db796 |
|
|
|
3db796 |
- /* The RTX_FRAME_RELATED_P mechanism doesn't know about pop. */
|
|
|
3db796 |
- RTX_FRAME_RELATED_P (insn) = 1;
|
|
|
3db796 |
- x = gen_rtx_PLUS (Pmode, stack_pointer_rtx, GEN_INT (UNITS_PER_WORD));
|
|
|
3db796 |
- x = gen_rtx_SET (stack_pointer_rtx, x);
|
|
|
3db796 |
- add_reg_note (insn, REG_FRAME_RELATED_EXPR, x);
|
|
|
3db796 |
- m->fs.sp_offset -= UNITS_PER_WORD;
|
|
|
3db796 |
+ /* The RTX_FRAME_RELATED_P mechanism doesn't know about pop. */
|
|
|
3db796 |
+ RTX_FRAME_RELATED_P (insn) = 1;
|
|
|
3db796 |
+ x = gen_rtx_PLUS (Pmode, stack_pointer_rtx, GEN_INT (UNITS_PER_WORD));
|
|
|
3db796 |
+ x = gen_rtx_SET (stack_pointer_rtx, x);
|
|
|
3db796 |
+ add_reg_note (insn, REG_FRAME_RELATED_EXPR, x);
|
|
|
3db796 |
+ m->fs.sp_offset -= UNITS_PER_WORD;
|
|
|
3db796 |
+ }
|
|
|
3db796 |
+ else
|
|
|
3db796 |
+ {
|
|
|
3db796 |
+ rtx x = gen_rtx_PLUS (Pmode, stack_pointer_rtx, GEN_INT (offset));
|
|
|
3db796 |
+ x = gen_rtx_SET (sr->reg, gen_rtx_MEM (word_mode, x));
|
|
|
3db796 |
+ emit_insn (x);
|
|
|
3db796 |
+ }
|
|
|
3db796 |
}
|
|
|
3db796 |
}
|
|
|
3db796 |
|
|
|
3db796 |
@@ -12597,7 +12614,7 @@ release_scratch_register_on_entry (struct scratch_reg *sr)
|
|
|
3db796 |
pushed on the stack. */
|
|
|
3db796 |
|
|
|
3db796 |
static void
|
|
|
3db796 |
-ix86_adjust_stack_and_probe_stack_clash (const HOST_WIDE_INT size,
|
|
|
3db796 |
+ix86_adjust_stack_and_probe_stack_clash (HOST_WIDE_INT size,
|
|
|
3db796 |
const bool int_registers_saved)
|
|
|
3db796 |
{
|
|
|
3db796 |
struct machine_function *m = cfun->machine;
|
|
|
3db796 |
@@ -12713,6 +12730,12 @@ ix86_adjust_stack_and_probe_stack_clash (const HOST_WIDE_INT size,
|
|
|
3db796 |
struct scratch_reg sr;
|
|
|
3db796 |
get_scratch_register_on_entry (&sr);
|
|
|
3db796 |
|
|
|
3db796 |
+ /* If we needed to save a register, then account for any space
|
|
|
3db796 |
+ that was pushed (we are not going to pop the register when
|
|
|
3db796 |
+ we do the restore). */
|
|
|
3db796 |
+ if (sr.saved)
|
|
|
3db796 |
+ size -= UNITS_PER_WORD;
|
|
|
3db796 |
+
|
|
|
3db796 |
/* Step 1: round SIZE down to a multiple of the interval. */
|
|
|
3db796 |
HOST_WIDE_INT rounded_size = size & -probe_interval;
|
|
|
3db796 |
|
|
|
3db796 |
@@ -12761,7 +12784,9 @@ ix86_adjust_stack_and_probe_stack_clash (const HOST_WIDE_INT size,
|
|
|
3db796 |
m->fs.cfa_reg == stack_pointer_rtx);
|
|
|
3db796 |
dump_stack_clash_frame_info (PROBE_LOOP, size != rounded_size);
|
|
|
3db796 |
|
|
|
3db796 |
- release_scratch_register_on_entry (&sr);
|
|
|
3db796 |
+ /* This does not deallocate the space reserved for the scratch
|
|
|
3db796 |
+ register. That will be deallocated in the epilogue. */
|
|
|
3db796 |
+ release_scratch_register_on_entry (&sr, size, false);
|
|
|
3db796 |
}
|
|
|
3db796 |
|
|
|
3db796 |
/* Make sure nothing is scheduled before we are done. */
|
|
|
3db796 |
@@ -12774,7 +12799,7 @@ ix86_adjust_stack_and_probe_stack_clash (const HOST_WIDE_INT size,
|
|
|
3db796 |
pushed on the stack. */
|
|
|
3db796 |
|
|
|
3db796 |
static void
|
|
|
3db796 |
-ix86_adjust_stack_and_probe (const HOST_WIDE_INT size,
|
|
|
3db796 |
+ix86_adjust_stack_and_probe (HOST_WIDE_INT size,
|
|
|
3db796 |
const bool int_registers_saved)
|
|
|
3db796 |
{
|
|
|
3db796 |
/* We skip the probe for the first interval + a small dope of 4 words and
|
|
|
3db796 |
@@ -12847,6 +12872,11 @@ ix86_adjust_stack_and_probe (const HOST_WIDE_INT size,
|
|
|
3db796 |
|
|
|
3db796 |
get_scratch_register_on_entry (&sr);
|
|
|
3db796 |
|
|
|
3db796 |
+ /* If we needed to save a register, then account for any space
|
|
|
3db796 |
+ that was pushed (we are not going to pop the register when
|
|
|
3db796 |
+ we do the restore). */
|
|
|
3db796 |
+ if (sr.saved)
|
|
|
3db796 |
+ size -= UNITS_PER_WORD;
|
|
|
3db796 |
|
|
|
3db796 |
/* Step 1: round SIZE to the previous multiple of the interval. */
|
|
|
3db796 |
|
|
|
3db796 |
@@ -12906,7 +12936,9 @@ ix86_adjust_stack_and_probe (const HOST_WIDE_INT size,
|
|
|
3db796 |
(get_probe_interval ()
|
|
|
3db796 |
+ dope))));
|
|
|
3db796 |
|
|
|
3db796 |
- release_scratch_register_on_entry (&sr);
|
|
|
3db796 |
+ /* This does not deallocate the space reserved for the scratch
|
|
|
3db796 |
+ register. That will be deallocated in the epilogue. */
|
|
|
3db796 |
+ release_scratch_register_on_entry (&sr, size, false);
|
|
|
3db796 |
}
|
|
|
3db796 |
|
|
|
3db796 |
/* Even if the stack pointer isn't the CFA register, we need to correctly
|
|
|
3db796 |
@@ -13055,7 +13087,7 @@ ix86_emit_probe_stack_range (HOST_WIDE_INT first, HOST_WIDE_INT size,
|
|
|
3db796 |
sr.reg),
|
|
|
3db796 |
rounded_size - size));
|
|
|
3db796 |
|
|
|
3db796 |
- release_scratch_register_on_entry (&sr);
|
|
|
3db796 |
+ release_scratch_register_on_entry (&sr, size, true);
|
|
|
3db796 |
}
|
|
|
3db796 |
|
|
|
3db796 |
/* Make sure nothing is scheduled before we are done. */
|
|
|
3db796 |
|
|
|
3db796 |
diff --git a/gcc/testsuite/gcc.target/i386/pr84128.c b/gcc/testsuite/gcc.target/i386/pr84128.c
|
|
|
3db796 |
new file mode 100644
|
|
|
3db796 |
index 0000000..a8323fd6
|
|
|
3db796 |
--- /dev/null
|
|
|
3db796 |
+++ gcc/testsuite/gcc.target/i386/pr84128.c
|
|
|
3db796 |
@@ -0,0 +1,30 @@
|
|
|
3db796 |
+/* { dg-do run } */
|
|
|
3db796 |
+/* { dg-options "-O2 -march=i686 -mtune=generic -fstack-clash-protection" } */
|
|
|
3db796 |
+/* { dg-require-effective-target ia32 } */
|
|
|
3db796 |
+
|
|
|
3db796 |
+__attribute__ ((noinline, noclone, weak, regparm (3)))
|
|
|
3db796 |
+int
|
|
|
3db796 |
+f1 (long arg0, int (*pf) (long, void *))
|
|
|
3db796 |
+{
|
|
|
3db796 |
+ unsigned char buf[32768];
|
|
|
3db796 |
+ return pf (arg0, buf);
|
|
|
3db796 |
+}
|
|
|
3db796 |
+
|
|
|
3db796 |
+__attribute__ ((noinline, noclone, weak))
|
|
|
3db796 |
+int
|
|
|
3db796 |
+f2 (long arg0, void *ignored)
|
|
|
3db796 |
+{
|
|
|
3db796 |
+ if (arg0 != 17)
|
|
|
3db796 |
+ __builtin_abort ();
|
|
|
3db796 |
+ return 19;
|
|
|
3db796 |
+}
|
|
|
3db796 |
+
|
|
|
3db796 |
+int
|
|
|
3db796 |
+main (void)
|
|
|
3db796 |
+{
|
|
|
3db796 |
+ if (f1 (17, f2) != 19)
|
|
|
3db796 |
+ __builtin_abort ();
|
|
|
3db796 |
+ return 0;
|
|
|
3db796 |
+}
|
|
|
3db796 |
+
|
|
|
3db796 |
+
|