|
|
13f101 |
commit 27d2a2d27f3e0060ade9a1a82ce2292aad6c6931
|
|
|
13f101 |
Author: law <law@138bc75d-0d04-0410-961f-82ee72b054a4>
|
|
|
13f101 |
Date: Mon Sep 25 23:13:55 2017 +0000
|
|
|
13f101 |
|
|
|
13f101 |
* config/rs6000/rs6000-protos.h (output_probe_stack_range): Update
|
|
|
13f101 |
prototype for new argument.
|
|
|
13f101 |
* config/rs6000/rs6000.c (rs6000_emit_allocate_stack_1): New function,
|
|
|
13f101 |
mostly extracted from rs6000_emit_allocate_stack.
|
|
|
13f101 |
(rs6000_emit_probe_stack_range_stack_clash): New function.
|
|
|
13f101 |
(rs6000_emit_allocate_stack): Call
|
|
|
13f101 |
rs6000_emit_probe_stack_range_stack_clash as needed.
|
|
|
13f101 |
(rs6000_emit_probe_stack_range): Add additional argument
|
|
|
13f101 |
to call to gen_probe_stack_range{si,di}.
|
|
|
13f101 |
(output_probe_stack_range): New.
|
|
|
13f101 |
(output_probe_stack_range_1): Renamed from output_probe_stack_range.
|
|
|
13f101 |
(output_probe_stack_range_stack_clash): New.
|
|
|
13f101 |
(rs6000_emit_prologue): Emit notes into dump file as requested.
|
|
|
13f101 |
* rs6000.md (allocate_stack): Handle -fstack-clash-protection.
|
|
|
13f101 |
(probe_stack_range<P:mode>): Operand 0 is now early-clobbered.
|
|
|
13f101 |
Add additional operand and pass it to output_probe_stack_range.
|
|
|
13f101 |
|
|
|
13f101 |
* lib/target-supports.exp
|
|
|
13f101 |
(check_effective_target_supports_stack_clash_protection): Enable for
|
|
|
13f101 |
rs6000 and powerpc targets.
|
|
|
13f101 |
|
|
|
13f101 |
git-svn-id: svn+ssh://gcc.gnu.org/svn/gcc/trunk@253179 138bc75d-0d04-0410-961f-82ee72b054a4
|
|
|
13f101 |
|
|
|
13f101 |
diff --git a/gcc/config/rs6000/rs6000-protos.h b/gcc/config/rs6000/rs6000-protos.h
|
|
|
13f101 |
index d4b93d9970d..cfb23ab80cc 100644
|
|
|
13f101 |
--- a/gcc/config/rs6000/rs6000-protos.h
|
|
|
13f101 |
+++ b/gcc/config/rs6000/rs6000-protos.h
|
|
|
13f101 |
@@ -114,7 +114,7 @@ extern void rs6000_emit_sCOND (enum machine_mode, rtx[]);
|
|
|
13f101 |
extern void rs6000_emit_cbranch (enum machine_mode, rtx[]);
|
|
|
13f101 |
extern char * output_cbranch (rtx, const char *, int, rtx);
|
|
|
13f101 |
extern char * output_e500_flip_gt_bit (rtx, rtx);
|
|
|
13f101 |
-extern const char * output_probe_stack_range (rtx, rtx);
|
|
|
13f101 |
+extern const char * output_probe_stack_range (rtx, rtx, rtx);
|
|
|
13f101 |
extern rtx rs6000_emit_set_const (rtx, enum machine_mode, rtx, int);
|
|
|
13f101 |
extern int rs6000_emit_cmove (rtx, rtx, rtx, rtx);
|
|
|
13f101 |
extern int rs6000_emit_vector_cond_expr (rtx, rtx, rtx, rtx, rtx, rtx);
|
|
|
13f101 |
diff --git a/gcc/config/rs6000/rs6000.c b/gcc/config/rs6000/rs6000.c
|
|
|
13f101 |
index a9052c6becf..c5d9988c1d9 100644
|
|
|
13f101 |
--- a/gcc/config/rs6000/rs6000.c
|
|
|
13f101 |
+++ b/gcc/config/rs6000/rs6000.c
|
|
|
13f101 |
@@ -22320,6 +22320,220 @@ rs6000_emit_stack_tie (rtx fp, bool hard_frame_needed)
|
|
|
13f101 |
emit_insn (gen_stack_tie (gen_rtx_PARALLEL (VOIDmode, p)));
|
|
|
13f101 |
}
|
|
|
13f101 |
|
|
|
13f101 |
+/* Allocate SIZE_INT bytes on the stack using a store with update style insn
|
|
|
13f101 |
+ and set the appropriate attributes for the generated insn. Return the
|
|
|
13f101 |
+ first insn which adjusts the stack pointer or the last insn before
|
|
|
13f101 |
+ the stack adjustment loop.
|
|
|
13f101 |
+
|
|
|
13f101 |
+ SIZE_INT is used to create the CFI note for the allocation.
|
|
|
13f101 |
+
|
|
|
13f101 |
+ SIZE_RTX is a local rtx holding the size of the adjustment. Note that
|
|
|
13f101 |
+ since stacks grow to lower addresses its runtime value is -SIZE_INT.
|
|
|
13f101 |
+
|
|
|
13f101 |
+ ORIG_SP contains the backchain value that must be stored at *sp. */
|
|
|
13f101 |
+
|
|
|
13f101 |
+static rtx
|
|
|
13f101 |
+rs6000_emit_allocate_stack_1 (HOST_WIDE_INT size_int, rtx orig_sp)
|
|
|
13f101 |
+{
|
|
|
13f101 |
+ rtx insn;
|
|
|
13f101 |
+
|
|
|
13f101 |
+ rtx size_rtx = GEN_INT (-size_int);
|
|
|
13f101 |
+ if (size_int > 32767)
|
|
|
13f101 |
+ {
|
|
|
13f101 |
+ rtx tmp_reg = gen_rtx_REG (Pmode, 0);
|
|
|
13f101 |
+ /* Need a note here so that try_split doesn't get confused. */
|
|
|
13f101 |
+ if (get_last_insn () == NULL_RTX)
|
|
|
13f101 |
+ emit_note (NOTE_INSN_DELETED);
|
|
|
13f101 |
+ insn = emit_move_insn (tmp_reg, size_rtx);
|
|
|
13f101 |
+ try_split (PATTERN (insn), insn, 0);
|
|
|
13f101 |
+ size_rtx = tmp_reg;
|
|
|
13f101 |
+ }
|
|
|
13f101 |
+
|
|
|
13f101 |
+ if (Pmode == SImode)
|
|
|
13f101 |
+ insn = emit_insn (gen_movsi_update_stack (stack_pointer_rtx,
|
|
|
13f101 |
+ stack_pointer_rtx,
|
|
|
13f101 |
+ size_rtx,
|
|
|
13f101 |
+ orig_sp));
|
|
|
13f101 |
+ else
|
|
|
13f101 |
+ insn = emit_insn (gen_movdi_di_update_stack (stack_pointer_rtx,
|
|
|
13f101 |
+ stack_pointer_rtx,
|
|
|
13f101 |
+ size_rtx,
|
|
|
13f101 |
+ orig_sp));
|
|
|
13f101 |
+ rtx par = PATTERN (insn);
|
|
|
13f101 |
+ gcc_assert (GET_CODE (par) == PARALLEL);
|
|
|
13f101 |
+ rtx set = XVECEXP (par, 0, 0);
|
|
|
13f101 |
+ gcc_assert (GET_CODE (set) == SET);
|
|
|
13f101 |
+ rtx mem = SET_DEST (set);
|
|
|
13f101 |
+ gcc_assert (MEM_P (mem));
|
|
|
13f101 |
+ MEM_NOTRAP_P (mem) = 1;
|
|
|
13f101 |
+ set_mem_alias_set (mem, get_frame_alias_set ());
|
|
|
13f101 |
+
|
|
|
13f101 |
+ RTX_FRAME_RELATED_P (insn) = 1;
|
|
|
13f101 |
+ add_reg_note (insn, REG_FRAME_RELATED_EXPR,
|
|
|
13f101 |
+ gen_rtx_SET (VOIDmode, stack_pointer_rtx,
|
|
|
13f101 |
+ gen_rtx_PLUS (Pmode,
|
|
|
13f101 |
+ stack_pointer_rtx,
|
|
|
13f101 |
+ GEN_INT (-size_int))));
|
|
|
13f101 |
+
|
|
|
13f101 |
+ /* Emit a blockage to ensure the allocation/probing insns are
|
|
|
13f101 |
+ not optimized, combined, removed, etc. Add REG_STACK_CHECK
|
|
|
13f101 |
+ note for similar reasons. */
|
|
|
13f101 |
+ if (flag_stack_clash_protection)
|
|
|
13f101 |
+ {
|
|
|
13f101 |
+ add_reg_note (insn, REG_STACK_CHECK, const0_rtx);
|
|
|
13f101 |
+ emit_insn (gen_blockage ());
|
|
|
13f101 |
+ }
|
|
|
13f101 |
+
|
|
|
13f101 |
+ return insn;
|
|
|
13f101 |
+}
|
|
|
13f101 |
+
|
|
|
13f101 |
+static HOST_WIDE_INT
|
|
|
13f101 |
+get_stack_clash_protection_probe_interval (void)
|
|
|
13f101 |
+{
|
|
|
13f101 |
+ return (HOST_WIDE_INT_1U
|
|
|
13f101 |
+ << PARAM_VALUE (PARAM_STACK_CLASH_PROTECTION_PROBE_INTERVAL));
|
|
|
13f101 |
+}
|
|
|
13f101 |
+
|
|
|
13f101 |
+static HOST_WIDE_INT
|
|
|
13f101 |
+get_stack_clash_protection_guard_size (void)
|
|
|
13f101 |
+{
|
|
|
13f101 |
+ return (HOST_WIDE_INT_1U
|
|
|
13f101 |
+ << PARAM_VALUE (PARAM_STACK_CLASH_PROTECTION_GUARD_SIZE));
|
|
|
13f101 |
+}
|
|
|
13f101 |
+
|
|
|
13f101 |
+/* Allocate ORIG_SIZE bytes on the stack and probe the newly
|
|
|
13f101 |
+ allocated space every STACK_CLASH_PROTECTION_PROBE_INTERVAL bytes.
|
|
|
13f101 |
+
|
|
|
13f101 |
+ COPY_REG, if non-null, should contain a copy of the original
|
|
|
13f101 |
+ stack pointer at exit from this function.
|
|
|
13f101 |
+
|
|
|
13f101 |
+ This is subtly different than the Ada probing in that it tries hard to
|
|
|
13f101 |
+ prevent attacks that jump the stack guard. Thus it is never allowed to
|
|
|
13f101 |
+ allocate more than STACK_CLASH_PROTECTION_PROBE_INTERVAL bytes of stack
|
|
|
13f101 |
+ space without a suitable probe. */
|
|
|
13f101 |
+static rtx
|
|
|
13f101 |
+rs6000_emit_probe_stack_range_stack_clash (HOST_WIDE_INT orig_size,
|
|
|
13f101 |
+ rtx copy_reg)
|
|
|
13f101 |
+{
|
|
|
13f101 |
+ rtx orig_sp = copy_reg;
|
|
|
13f101 |
+
|
|
|
13f101 |
+ HOST_WIDE_INT probe_interval = get_stack_clash_protection_probe_interval ();
|
|
|
13f101 |
+
|
|
|
13f101 |
+ /* Round the size down to a multiple of PROBE_INTERVAL. */
|
|
|
13f101 |
+ HOST_WIDE_INT rounded_size = ROUND_DOWN (orig_size, probe_interval);
|
|
|
13f101 |
+
|
|
|
13f101 |
+ /* If explicitly requested,
|
|
|
13f101 |
+ or the rounded size is not the same as the original size
|
|
|
13f101 |
+ or the rounded size is greater than a page,
|
|
|
13f101 |
+ then we will need a copy of the original stack pointer. */
|
|
|
13f101 |
+ if (rounded_size != orig_size
|
|
|
13f101 |
+ || rounded_size > probe_interval
|
|
|
13f101 |
+ || copy_reg)
|
|
|
13f101 |
+ {
|
|
|
13f101 |
+ /* If the caller did not request a copy of the incoming stack
|
|
|
13f101 |
+ pointer, then we use r0 to hold the copy. */
|
|
|
13f101 |
+ if (!copy_reg)
|
|
|
13f101 |
+ orig_sp = gen_rtx_REG (Pmode, 0);
|
|
|
13f101 |
+ emit_move_insn (orig_sp, stack_pointer_rtx);
|
|
|
13f101 |
+ }
|
|
|
13f101 |
+
|
|
|
13f101 |
+ /* There are three cases here.
|
|
|
13f101 |
+
|
|
|
13f101 |
+ One is a single probe which is the most common and most efficiently
|
|
|
13f101 |
+ implemented as it does not have to have a copy of the original
|
|
|
13f101 |
+ stack pointer if there are no residuals.
|
|
|
13f101 |
+
|
|
|
13f101 |
+ Second is unrolled allocation/probes which we use if there's just
|
|
|
13f101 |
+ a few of them. It needs to save the original stack pointer into a
|
|
|
13f101 |
+ temporary for use as a source register in the allocation/probe.
|
|
|
13f101 |
+
|
|
|
13f101 |
+ Last is a loop. This is the most uncommon case and least efficient. */
|
|
|
13f101 |
+ rtx retval = NULL;
|
|
|
13f101 |
+ if (rounded_size == probe_interval)
|
|
|
13f101 |
+ {
|
|
|
13f101 |
+ retval = rs6000_emit_allocate_stack_1 (probe_interval, stack_pointer_rtx);
|
|
|
13f101 |
+
|
|
|
13f101 |
+ dump_stack_clash_frame_info (PROBE_INLINE, rounded_size != orig_size);
|
|
|
13f101 |
+ }
|
|
|
13f101 |
+ else if (rounded_size <= 8 * probe_interval)
|
|
|
13f101 |
+ {
|
|
|
13f101 |
+ /* The ABI requires using the store with update insns to allocate
|
|
|
13f101 |
+ space and store the backchain into the stack
|
|
|
13f101 |
+
|
|
|
13f101 |
+ So we save the current stack pointer into a temporary, then
|
|
|
13f101 |
+ emit the store-with-update insns to store the saved stack pointer
|
|
|
13f101 |
+ into the right location in each new page. */
|
|
|
13f101 |
+ for (int i = 0; i < rounded_size; i += probe_interval)
|
|
|
13f101 |
+ {
|
|
|
13f101 |
+ rtx insn = rs6000_emit_allocate_stack_1 (probe_interval, orig_sp);
|
|
|
13f101 |
+
|
|
|
13f101 |
+ /* Save the first stack adjustment in RETVAL. */
|
|
|
13f101 |
+ if (i == 0)
|
|
|
13f101 |
+ retval = insn;
|
|
|
13f101 |
+ }
|
|
|
13f101 |
+
|
|
|
13f101 |
+ dump_stack_clash_frame_info (PROBE_INLINE, rounded_size != orig_size);
|
|
|
13f101 |
+ }
|
|
|
13f101 |
+ else
|
|
|
13f101 |
+ {
|
|
|
13f101 |
+ /* Compute the ending address. */
|
|
|
13f101 |
+ rtx end_addr
|
|
|
13f101 |
+ = copy_reg ? gen_rtx_REG (Pmode, 0) : gen_rtx_REG (Pmode, 12);
|
|
|
13f101 |
+ rtx rs = GEN_INT (-rounded_size);
|
|
|
13f101 |
+ rtx insn;
|
|
|
13f101 |
+ if (add_operand (rs, Pmode))
|
|
|
13f101 |
+ insn = emit_insn (gen_add3_insn (end_addr, stack_pointer_rtx, rs));
|
|
|
13f101 |
+ else
|
|
|
13f101 |
+ {
|
|
|
13f101 |
+ emit_move_insn (end_addr, GEN_INT (-rounded_size));
|
|
|
13f101 |
+ insn = emit_insn (gen_add3_insn (end_addr, end_addr,
|
|
|
13f101 |
+ stack_pointer_rtx));
|
|
|
13f101 |
+ /* Describe the effect of INSN to the CFI engine. */
|
|
|
13f101 |
+ add_reg_note (insn, REG_FRAME_RELATED_EXPR,
|
|
|
13f101 |
+ gen_rtx_SET (VOIDmode, end_addr,
|
|
|
13f101 |
+ gen_rtx_PLUS (Pmode, stack_pointer_rtx,
|
|
|
13f101 |
+ rs)));
|
|
|
13f101 |
+ }
|
|
|
13f101 |
+ RTX_FRAME_RELATED_P (insn) = 1;
|
|
|
13f101 |
+
|
|
|
13f101 |
+ /* Emit the loop. */
|
|
|
13f101 |
+ if (TARGET_64BIT)
|
|
|
13f101 |
+ retval = emit_insn (gen_probe_stack_rangedi (stack_pointer_rtx,
|
|
|
13f101 |
+ stack_pointer_rtx, orig_sp,
|
|
|
13f101 |
+ end_addr));
|
|
|
13f101 |
+ else
|
|
|
13f101 |
+ retval = emit_insn (gen_probe_stack_rangesi (stack_pointer_rtx,
|
|
|
13f101 |
+ stack_pointer_rtx, orig_sp,
|
|
|
13f101 |
+ end_addr));
|
|
|
13f101 |
+ RTX_FRAME_RELATED_P (retval) = 1;
|
|
|
13f101 |
+ /* Describe the effect of INSN to the CFI engine. */
|
|
|
13f101 |
+ add_reg_note (retval, REG_FRAME_RELATED_EXPR,
|
|
|
13f101 |
+ gen_rtx_SET (VOIDmode, stack_pointer_rtx, end_addr));
|
|
|
13f101 |
+
|
|
|
13f101 |
+ /* Emit a blockage to ensure the allocation/probing insns are
|
|
|
13f101 |
+ not optimized, combined, removed, etc. Other cases handle this
|
|
|
13f101 |
+ within their call to rs6000_emit_allocate_stack_1. */
|
|
|
13f101 |
+ emit_insn (gen_blockage ());
|
|
|
13f101 |
+
|
|
|
13f101 |
+ dump_stack_clash_frame_info (PROBE_LOOP, rounded_size != orig_size);
|
|
|
13f101 |
+ }
|
|
|
13f101 |
+
|
|
|
13f101 |
+ if (orig_size != rounded_size)
|
|
|
13f101 |
+ {
|
|
|
13f101 |
+ /* Allocate (and implicitly probe) any residual space. */
|
|
|
13f101 |
+ HOST_WIDE_INT residual = orig_size - rounded_size;
|
|
|
13f101 |
+
|
|
|
13f101 |
+ rtx insn = rs6000_emit_allocate_stack_1 (residual, orig_sp);
|
|
|
13f101 |
+
|
|
|
13f101 |
+ /* If the residual was the only allocation, then we can return the
|
|
|
13f101 |
+ allocating insn. */
|
|
|
13f101 |
+ if (!retval)
|
|
|
13f101 |
+ retval = insn;
|
|
|
13f101 |
+ }
|
|
|
13f101 |
+
|
|
|
13f101 |
+ return retval;
|
|
|
13f101 |
+}
|
|
|
13f101 |
+
|
|
|
13f101 |
/* Emit the correct code for allocating stack space, as insns.
|
|
|
13f101 |
If COPY_REG, make sure a copy of the old frame is left there.
|
|
|
13f101 |
The generated code may use hard register 0 as a temporary. */
|
|
|
13f101 |
@@ -22331,7 +22545,6 @@ rs6000_emit_allocate_stack (HOST_WIDE_INT size, rtx copy_reg, int copy_off)
|
|
|
13f101 |
rtx stack_reg = gen_rtx_REG (Pmode, STACK_POINTER_REGNUM);
|
|
|
13f101 |
rtx tmp_reg = gen_rtx_REG (Pmode, 0);
|
|
|
13f101 |
rtx todec = gen_int_mode (-size, Pmode);
|
|
|
13f101 |
- rtx par, set, mem;
|
|
|
13f101 |
|
|
|
13f101 |
if (INTVAL (todec) != -size)
|
|
|
13f101 |
{
|
|
|
13f101 |
@@ -22368,6 +22581,22 @@ rs6000_emit_allocate_stack (HOST_WIDE_INT size, rtx copy_reg, int copy_off)
|
|
|
13f101 |
warning (0, "stack limit expression is not supported");
|
|
|
13f101 |
}
|
|
|
13f101 |
|
|
|
13f101 |
+ if (flag_stack_clash_protection)
|
|
|
13f101 |
+ {
|
|
|
13f101 |
+ if (size < get_stack_clash_protection_guard_size ())
|
|
|
13f101 |
+ dump_stack_clash_frame_info (NO_PROBE_SMALL_FRAME, true);
|
|
|
13f101 |
+ else
|
|
|
13f101 |
+ {
|
|
|
13f101 |
+ rtx insn = rs6000_emit_probe_stack_range_stack_clash (size, copy_reg);
|
|
|
13f101 |
+
|
|
|
13f101 |
+ /* If we asked for a copy with an offset, then we still need to add in
|
|
|
13f101 |
+ the offset. */
|
|
|
13f101 |
+ if (copy_reg && copy_off)
|
|
|
13f101 |
+ emit_insn (gen_add3_insn (copy_reg, copy_reg, GEN_INT (copy_off)));
|
|
|
13f101 |
+ return;
|
|
|
13f101 |
+ }
|
|
|
13f101 |
+ }
|
|
|
13f101 |
+
|
|
|
13f101 |
if (copy_reg)
|
|
|
13f101 |
{
|
|
|
13f101 |
if (copy_off != 0)
|
|
|
13f101 |
@@ -22376,39 +22605,12 @@ rs6000_emit_allocate_stack (HOST_WIDE_INT size, rtx copy_reg, int copy_off)
|
|
|
13f101 |
emit_move_insn (copy_reg, stack_reg);
|
|
|
13f101 |
}
|
|
|
13f101 |
|
|
|
13f101 |
- if (size > 32767)
|
|
|
13f101 |
- {
|
|
|
13f101 |
- /* Need a note here so that try_split doesn't get confused. */
|
|
|
13f101 |
- if (get_last_insn () == NULL_RTX)
|
|
|
13f101 |
- emit_note (NOTE_INSN_DELETED);
|
|
|
13f101 |
- insn = emit_move_insn (tmp_reg, todec);
|
|
|
13f101 |
- try_split (PATTERN (insn), insn, 0);
|
|
|
13f101 |
- todec = tmp_reg;
|
|
|
13f101 |
- }
|
|
|
13f101 |
-
|
|
|
13f101 |
- insn = emit_insn (TARGET_32BIT
|
|
|
13f101 |
- ? gen_movsi_update_stack (stack_reg, stack_reg,
|
|
|
13f101 |
- todec, stack_reg)
|
|
|
13f101 |
- : gen_movdi_di_update_stack (stack_reg, stack_reg,
|
|
|
13f101 |
- todec, stack_reg));
|
|
|
13f101 |
/* Since we didn't use gen_frame_mem to generate the MEM, grab
|
|
|
13f101 |
it now and set the alias set/attributes. The above gen_*_update
|
|
|
13f101 |
calls will generate a PARALLEL with the MEM set being the first
|
|
|
13f101 |
operation. */
|
|
|
13f101 |
- par = PATTERN (insn);
|
|
|
13f101 |
- gcc_assert (GET_CODE (par) == PARALLEL);
|
|
|
13f101 |
- set = XVECEXP (par, 0, 0);
|
|
|
13f101 |
- gcc_assert (GET_CODE (set) == SET);
|
|
|
13f101 |
- mem = SET_DEST (set);
|
|
|
13f101 |
- gcc_assert (MEM_P (mem));
|
|
|
13f101 |
- MEM_NOTRAP_P (mem) = 1;
|
|
|
13f101 |
- set_mem_alias_set (mem, get_frame_alias_set ());
|
|
|
13f101 |
-
|
|
|
13f101 |
- RTX_FRAME_RELATED_P (insn) = 1;
|
|
|
13f101 |
- add_reg_note (insn, REG_FRAME_RELATED_EXPR,
|
|
|
13f101 |
- gen_rtx_SET (VOIDmode, stack_reg,
|
|
|
13f101 |
- gen_rtx_PLUS (Pmode, stack_reg,
|
|
|
13f101 |
- GEN_INT (-size))));
|
|
|
13f101 |
+ insn = rs6000_emit_allocate_stack_1 (size, stack_reg);
|
|
|
13f101 |
+ return;
|
|
|
13f101 |
}
|
|
|
13f101 |
|
|
|
13f101 |
#define PROBE_INTERVAL (1 << STACK_CHECK_PROBE_INTERVAL_EXP)
|
|
|
13f101 |
@@ -22490,9 +22692,9 @@ rs6000_emit_probe_stack_range (HOST_WIDE_INT first, HOST_WIDE_INT size)
|
|
|
13f101 |
until it is equal to ROUNDED_SIZE. */
|
|
|
13f101 |
|
|
|
13f101 |
if (TARGET_64BIT)
|
|
|
13f101 |
- emit_insn (gen_probe_stack_rangedi (r12, r12, r0));
|
|
|
13f101 |
+ emit_insn (gen_probe_stack_rangedi (r12, r12, stack_pointer_rtx, r0));
|
|
|
13f101 |
else
|
|
|
13f101 |
- emit_insn (gen_probe_stack_rangesi (r12, r12, r0));
|
|
|
13f101 |
+ emit_insn (gen_probe_stack_rangesi (r12, r12, stack_pointer_rtx, r0));
|
|
|
13f101 |
|
|
|
13f101 |
|
|
|
13f101 |
/* Step 4: probe at FIRST + SIZE if we cannot assert at compile-time
|
|
|
13f101 |
@@ -22504,10 +22706,10 @@ rs6000_emit_probe_stack_range (HOST_WIDE_INT first, HOST_WIDE_INT size)
|
|
|
13f101 |
}
|
|
|
13f101 |
|
|
|
13f101 |
/* Probe a range of stack addresses from REG1 to REG2 inclusive. These are
|
|
|
13f101 |
- absolute addresses. */
|
|
|
13f101 |
+ addresses, not offsets. */
|
|
|
13f101 |
|
|
|
13f101 |
-const char *
|
|
|
13f101 |
-output_probe_stack_range (rtx reg1, rtx reg2)
|
|
|
13f101 |
+static const char *
|
|
|
13f101 |
+output_probe_stack_range_1 (rtx reg1, rtx reg2)
|
|
|
13f101 |
{
|
|
|
13f101 |
static int labelno = 0;
|
|
|
13f101 |
char loop_lab[32], end_lab[32];
|
|
|
13f101 |
@@ -22546,6 +22748,63 @@ output_probe_stack_range (rtx reg1, rtx reg2)
|
|
|
13f101 |
return "";
|
|
|
13f101 |
}
|
|
|
13f101 |
|
|
|
13f101 |
+/* Probe a range of stack addresses from REG1 to REG3 inclusive. These are
|
|
|
13f101 |
+ addresses, not offsets.
|
|
|
13f101 |
+
|
|
|
13f101 |
+ REG2 contains the backchain that must be stored into *sp at each allocation.
|
|
|
13f101 |
+
|
|
|
13f101 |
+ This is subtly different than the Ada probing above in that it tries hard
|
|
|
13f101 |
+ to prevent attacks that jump the stack guard. Thus, it is never allowed
|
|
|
13f101 |
+ to allocate more than PROBE_INTERVAL bytes of stack space without a
|
|
|
13f101 |
+ suitable probe. */
|
|
|
13f101 |
+
|
|
|
13f101 |
+static const char *
|
|
|
13f101 |
+output_probe_stack_range_stack_clash (rtx reg1, rtx reg2, rtx reg3)
|
|
|
13f101 |
+{
|
|
|
13f101 |
+ static int labelno = 0;
|
|
|
13f101 |
+ char loop_lab[32];
|
|
|
13f101 |
+ rtx xops[3];
|
|
|
13f101 |
+
|
|
|
13f101 |
+ HOST_WIDE_INT probe_interval = get_stack_clash_protection_probe_interval ();
|
|
|
13f101 |
+
|
|
|
13f101 |
+ ASM_GENERATE_INTERNAL_LABEL (loop_lab, "LPSRL", labelno++);
|
|
|
13f101 |
+
|
|
|
13f101 |
+ ASM_OUTPUT_INTERNAL_LABEL (asm_out_file, loop_lab);
|
|
|
13f101 |
+
|
|
|
13f101 |
+ /* This allocates and probes. */
|
|
|
13f101 |
+ xops[0] = reg1;
|
|
|
13f101 |
+ xops[1] = reg2;
|
|
|
13f101 |
+ xops[2] = GEN_INT (-probe_interval);
|
|
|
13f101 |
+ if (TARGET_64BIT)
|
|
|
13f101 |
+ output_asm_insn ("stdu %1,%2(%0)", xops);
|
|
|
13f101 |
+ else
|
|
|
13f101 |
+ output_asm_insn ("stwu %1,%2(%0)", xops);
|
|
|
13f101 |
+
|
|
|
13f101 |
+ /* Jump to LOOP_LAB if REG1 != REG3. */
|
|
|
13f101 |
+ xops[0] = reg1;
|
|
|
13f101 |
+ xops[1] = reg3;
|
|
|
13f101 |
+ if (TARGET_64BIT)
|
|
|
13f101 |
+ output_asm_insn ("cmpd 0,%0,%1", xops);
|
|
|
13f101 |
+ else
|
|
|
13f101 |
+ output_asm_insn ("cmpw 0,%0,%1", xops);
|
|
|
13f101 |
+
|
|
|
13f101 |
+ fputs ("\tbne 0,", asm_out_file);
|
|
|
13f101 |
+ assemble_name_raw (asm_out_file, loop_lab);
|
|
|
13f101 |
+ fputc ('\n', asm_out_file);
|
|
|
13f101 |
+
|
|
|
13f101 |
+ return "";
|
|
|
13f101 |
+}
|
|
|
13f101 |
+
|
|
|
13f101 |
+/* Wrapper around the output_probe_stack_range routines. */
|
|
|
13f101 |
+const char *
|
|
|
13f101 |
+output_probe_stack_range (rtx reg1, rtx reg2, rtx reg3)
|
|
|
13f101 |
+{
|
|
|
13f101 |
+ if (flag_stack_clash_protection)
|
|
|
13f101 |
+ return output_probe_stack_range_stack_clash (reg1, reg2, reg3);
|
|
|
13f101 |
+ else
|
|
|
13f101 |
+ return output_probe_stack_range_1 (reg1, reg3);
|
|
|
13f101 |
+}
|
|
|
13f101 |
+
|
|
|
13f101 |
/* Add to 'insn' a note which is PATTERN (INSN) but with REG replaced
|
|
|
13f101 |
with (plus:P (reg 1) VAL), and with REG2 replaced with RREG if REG2
|
|
|
13f101 |
is not NULL. It would be nice if dwarf2out_frame_debug_expr could
|
|
|
13f101 |
@@ -23857,6 +24116,13 @@ rs6000_emit_prologue (void)
|
|
|
13f101 |
}
|
|
|
13f101 |
}
|
|
|
13f101 |
|
|
|
13f101 |
+ /* If we are emitting stack probes, but allocate no stack, then
|
|
|
13f101 |
+ just note that in the dump file. */
|
|
|
13f101 |
+ if (flag_stack_clash_protection
|
|
|
13f101 |
+ && dump_file
|
|
|
13f101 |
+ && !info->push_p)
|
|
|
13f101 |
+ dump_stack_clash_frame_info (NO_PROBE_NO_FRAME, false);
|
|
|
13f101 |
+
|
|
|
13f101 |
/* Update stack and set back pointer unless this is V.4,
|
|
|
13f101 |
for which it was done previously. */
|
|
|
13f101 |
if (!WORLD_SAVE_P (info) && info->push_p
|
|
|
13f101 |
diff --git a/gcc/config/rs6000/rs6000.md b/gcc/config/rs6000/rs6000.md
|
|
|
13f101 |
index cd197213480..3cd70e592c1 100644
|
|
|
13f101 |
--- a/gcc/config/rs6000/rs6000.md
|
|
|
13f101 |
+++ b/gcc/config/rs6000/rs6000.md
|
|
|
13f101 |
@@ -11822,10 +11822,20 @@
|
|
|
13f101 |
;;
|
|
|
13f101 |
;; First, an insn to allocate new stack space for dynamic use (e.g., alloca).
|
|
|
13f101 |
;; We move the back-chain and decrement the stack pointer.
|
|
|
13f101 |
-
|
|
|
13f101 |
+;;
|
|
|
13f101 |
+;; Operand1 is more naturally reg_or_short_operand. However, for a large
|
|
|
13f101 |
+;; constant alloca, using that predicate will force the generic code to put
|
|
|
13f101 |
+;; the constant size into a register before calling the expander.
|
|
|
13f101 |
+;;
|
|
|
13f101 |
+;; As a result the expander would not have the constant size information
|
|
|
13f101 |
+;; in those cases and would have to generate less efficient code.
|
|
|
13f101 |
+;;
|
|
|
13f101 |
+;; Thus we allow reg_or_cint_operand instead so that the expander can see
|
|
|
13f101 |
+;; the constant size. The value is forced into a register if necessary.
|
|
|
13f101 |
+;;
|
|
|
13f101 |
(define_expand "allocate_stack"
|
|
|
13f101 |
[(set (match_operand 0 "gpc_reg_operand" "")
|
|
|
13f101 |
- (minus (reg 1) (match_operand 1 "reg_or_short_operand" "")))
|
|
|
13f101 |
+ (minus (reg 1) (match_operand 1 "reg_or_cint_operand" "")))
|
|
|
13f101 |
(set (reg 1)
|
|
|
13f101 |
(minus (reg 1) (match_dup 1)))]
|
|
|
13f101 |
""
|
|
|
13f101 |
@@ -11835,6 +11845,15 @@
|
|
|
13f101 |
rtx neg_op0;
|
|
|
13f101 |
rtx insn, par, set, mem;
|
|
|
13f101 |
|
|
|
13f101 |
+ /* By allowing reg_or_cint_operand as the predicate we can get
|
|
|
13f101 |
+ better code for stack-clash-protection because we do not lose
|
|
|
13f101 |
+ size information. But the rest of the code expects the operand
|
|
|
13f101 |
+ to be reg_or_short_operand. If it isn't, then force it into
|
|
|
13f101 |
+ a register. */
|
|
|
13f101 |
+ rtx orig_op1 = operands[1];
|
|
|
13f101 |
+ if (!reg_or_short_operand (operands[1], Pmode))
|
|
|
13f101 |
+ operands[1] = force_reg (Pmode, operands[1]);
|
|
|
13f101 |
+
|
|
|
13f101 |
emit_move_insn (chain, stack_bot);
|
|
|
13f101 |
|
|
|
13f101 |
/* Check stack bounds if necessary. */
|
|
|
13f101 |
@@ -11847,6 +11866,51 @@
|
|
|
13f101 |
emit_insn (gen_cond_trap (LTU, available, operands[1], const0_rtx));
|
|
|
13f101 |
}
|
|
|
13f101 |
|
|
|
13f101 |
+ /* Allocate and probe if requested.
|
|
|
13f101 |
+ This may look similar to the loop we use for prologue allocations,
|
|
|
13f101 |
+ but it is critically different. For the former we know the loop
|
|
|
13f101 |
+ will iterate, but do not know that generally here. The former
|
|
|
13f101 |
+ uses that knowledge to rotate the loop. Combining them would be
|
|
|
13f101 |
+ possible with some performance cost. */
|
|
|
13f101 |
+ if (flag_stack_clash_protection)
|
|
|
13f101 |
+ {
|
|
|
13f101 |
+ rtx rounded_size, last_addr, residual;
|
|
|
13f101 |
+ HOST_WIDE_INT probe_interval;
|
|
|
13f101 |
+ compute_stack_clash_protection_loop_data (&rounded_size, &last_addr,
|
|
|
13f101 |
+ &residual, &probe_interval,
|
|
|
13f101 |
+ orig_op1);
|
|
|
13f101 |
+
|
|
|
13f101 |
+ /* We do occasionally get in here with constant sizes, we might
|
|
|
13f101 |
+ as well do a reasonable job when we obviously can. */
|
|
|
13f101 |
+ if (rounded_size != const0_rtx)
|
|
|
13f101 |
+ {
|
|
|
13f101 |
+ rtx loop_lab, end_loop;
|
|
|
13f101 |
+ bool rotated = CONST_INT_P (rounded_size);
|
|
|
13f101 |
+
|
|
|
13f101 |
+ emit_stack_clash_protection_probe_loop_start (&loop_lab, &end_loop,
|
|
|
13f101 |
+ last_addr, rotated);
|
|
|
13f101 |
+
|
|
|
13f101 |
+ if (Pmode == SImode)
|
|
|
13f101 |
+ emit_insn (gen_movsi_update_stack (stack_pointer_rtx,
|
|
|
13f101 |
+ stack_pointer_rtx,
|
|
|
13f101 |
+ GEN_INT (-probe_interval),
|
|
|
13f101 |
+ chain));
|
|
|
13f101 |
+ else
|
|
|
13f101 |
+ emit_insn (gen_movdi_di_update_stack (stack_pointer_rtx,
|
|
|
13f101 |
+ stack_pointer_rtx,
|
|
|
13f101 |
+ GEN_INT (-probe_interval),
|
|
|
13f101 |
+ chain));
|
|
|
13f101 |
+ emit_stack_clash_protection_probe_loop_end (loop_lab, end_loop,
|
|
|
13f101 |
+ last_addr, rotated);
|
|
|
13f101 |
+ }
|
|
|
13f101 |
+
|
|
|
13f101 |
+ /* Now handle residuals. We just have to set operands[1] correctly
|
|
|
13f101 |
+ and let the rest of the expander run. */
|
|
|
13f101 |
+ operands[1] = residual;
|
|
|
13f101 |
+ if (!CONST_INT_P (residual))
|
|
|
13f101 |
+ operands[1] = force_reg (Pmode, operands[1]);
|
|
|
13f101 |
+ }
|
|
|
13f101 |
+
|
|
|
13f101 |
if (GET_CODE (operands[1]) != CONST_INT
|
|
|
13f101 |
|| INTVAL (operands[1]) < -32767
|
|
|
13f101 |
|| INTVAL (operands[1]) > 32768)
|
|
|
13f101 |
@@ -12994,12 +13058,13 @@
|
|
|
13f101 |
(set_attr "length" "4")])
|
|
|
13f101 |
|
|
|
13f101 |
(define_insn "probe_stack_range<P:mode>"
|
|
|
13f101 |
- [(set (match_operand:P 0 "register_operand" "=r")
|
|
|
13f101 |
+ [(set (match_operand:P 0 "register_operand" "=&r")
|
|
|
13f101 |
(unspec_volatile:P [(match_operand:P 1 "register_operand" "0")
|
|
|
13f101 |
- (match_operand:P 2 "register_operand" "r")]
|
|
|
13f101 |
+ (match_operand:P 2 "register_operand" "r")
|
|
|
13f101 |
+ (match_operand:P 3 "register_operand" "r")]
|
|
|
13f101 |
UNSPECV_PROBE_STACK_RANGE))]
|
|
|
13f101 |
""
|
|
|
13f101 |
- "* return output_probe_stack_range (operands[0], operands[2]);"
|
|
|
13f101 |
+ "* return output_probe_stack_range (operands[0], operands[2], operands[3]);"
|
|
|
13f101 |
[(set_attr "type" "three")])
|
|
|
13f101 |
|
|
|
13f101 |
;; Compare insns are next. Note that the RS/6000 has two types of compares,
|
|
|
13f101 |
diff --git a/gcc/testsuite/lib/target-supports.exp b/gcc/testsuite/lib/target-supports.exp
|
|
|
13f101 |
index 7c126e4122b..aba99513ed0 100644
|
|
|
13f101 |
--- a/gcc/testsuite/lib/target-supports.exp
|
|
|
13f101 |
+++ b/gcc/testsuite/lib/target-supports.exp
|
|
|
13f101 |
@@ -5421,12 +5421,12 @@ proc check_effective_target_autoincdec { } {
|
|
|
13f101 |
proc check_effective_target_supports_stack_clash_protection { } {
|
|
|
13f101 |
|
|
|
13f101 |
# Temporary until the target bits are fully ACK'd.
|
|
|
13f101 |
-# if { [istarget aarch*-*-*]
|
|
|
13f101 |
-# || [istarget powerpc*-*-*] || [istarget rs6000*-*-*] } {
|
|
|
13f101 |
+# if { [istarget aarch*-*-*] } {
|
|
|
13f101 |
# return 1
|
|
|
13f101 |
# }
|
|
|
13f101 |
|
|
|
13f101 |
if { [istarget x86_64-*-*] || [istarget i?86-*-*]
|
|
|
13f101 |
+ || [istarget powerpc*-*-*] || [istarget rs6000*-*-*]
|
|
|
13f101 |
|| [istarget s390*-*-*] } {
|
|
|
13f101 |
return 1
|
|
|
13f101 |
}
|