Blame SOURCES/gcc48-rh1469697-9.patch

85359c
commit b49f8fb8a97e9af8e6ba2b65d18195099cd1bb79
85359c
Author: law <law@138bc75d-0d04-0410-961f-82ee72b054a4>
85359c
Date:   Thu Sep 21 04:30:16 2017 +0000
85359c
85359c
            * config/s390/s390.c (MIN_UNROLL_PROBES): Define.
85359c
            (allocate_stack_space): New function, partially extracted from
85359c
            s390_emit_prologue.
85359c
            (s390_emit_prologue): Track offset to most recent stack probe.
85359c
            Code to allocate space moved into allocate_stack_space.
85359c
            Dump actions when no stack is allocated.
85359c
            (s390_prologue_plus_offset): New function.
85359c
            (s390_emit_stack_probe): Likewise.
85359c
    
85359c
            * gcc.dg/stack-check-5.c:  Add argument for s390.
85359c
            * lib/target-supports.exp:
85359c
            (check_effective_target_supports_stack_clash_protection): Enable for
85359c
            s390/s390x targets.
85359c
    
85359c
    git-svn-id: svn+ssh://gcc.gnu.org/svn/gcc/trunk@253049 138bc75d-0d04-0410-961f-82ee72b054a4
85359c
85359c
diff --git a/gcc/config/s390/s390.c b/gcc/config/s390/s390.c
85359c
index 3c04781f947..45998bc7516 100644
85359c
--- a/gcc/config/s390/s390.c
85359c
+++ b/gcc/config/s390/s390.c
85359c
@@ -10350,6 +10350,184 @@ s390_emit_stack_tie (void)
85359c
   emit_insn (gen_stack_tie (mem));
85359c
 }
85359c
 
85359c
+/* Calculate TARGET = REG + OFFSET as s390_emit_prologue would do it.
85359c
+   - push too big immediates to the literal pool and annotate the refs
85359c
+   - emit frame related notes for stack pointer changes.  */
85359c
+
85359c
+static rtx
85359c
+s390_prologue_plus_offset (rtx target, rtx reg, rtx offset, bool frame_related_p)
85359c
+{
85359c
+  rtx insn;
85359c
+  rtx orig_offset = offset;
85359c
+
85359c
+  gcc_assert (REG_P (target));
85359c
+  gcc_assert (REG_P (reg));
85359c
+  gcc_assert (CONST_INT_P (offset));
85359c
+
85359c
+  if (offset == const0_rtx)                               /* lr/lgr */
85359c
+    {
85359c
+      insn = emit_move_insn (target, reg);
85359c
+    }
85359c
+  else if (DISP_IN_RANGE (INTVAL (offset)))               /* la */
85359c
+    {
85359c
+      insn = emit_move_insn (target, gen_rtx_PLUS (Pmode, reg,
85359c
+						   offset));
85359c
+    }
85359c
+  else
85359c
+    {
85359c
+      if (!satisfies_constraint_K (offset)                /* ahi/aghi */
85359c
+	  && (!TARGET_EXTIMM
85359c
+	      || (!satisfies_constraint_Op (offset)       /* alfi/algfi */
85359c
+		  && !satisfies_constraint_On (offset)))) /* slfi/slgfi */
85359c
+	offset = force_const_mem (Pmode, offset);
85359c
+
85359c
+      if (target != reg)
85359c
+	{
85359c
+	  insn = emit_move_insn (target, reg);
85359c
+	  RTX_FRAME_RELATED_P (insn) = frame_related_p ? 1 : 0;
85359c
+	}
85359c
+
85359c
+      insn = emit_insn (gen_add2_insn (target, offset));
85359c
+
85359c
+      if (!CONST_INT_P (offset))
85359c
+	{
85359c
+	  annotate_constant_pool_refs (&PATTERN (insn));
85359c
+
85359c
+	  if (frame_related_p)
85359c
+	    add_reg_note (insn, REG_FRAME_RELATED_EXPR,
85359c
+			  gen_rtx_SET (VOIDmode, target,
85359c
+				       gen_rtx_PLUS (Pmode, target,
85359c
+						     orig_offset)));
85359c
+	}
85359c
+    }
85359c
+
85359c
+  RTX_FRAME_RELATED_P (insn) = frame_related_p ? 1 : 0;
85359c
+
85359c
+  /* If this is a stack adjustment and we are generating a stack clash
85359c
+     prologue, then add a REG_STACK_CHECK note to signal that this insn
85359c
+     should be left alone.  */
85359c
+  if (flag_stack_clash_protection && target == stack_pointer_rtx)
85359c
+    add_reg_note (insn, REG_STACK_CHECK, const0_rtx);
85359c
+
85359c
+  return insn;
85359c
+}
85359c
+
85359c
+/* Emit a compare instruction with a volatile memory access as stack
85359c
+   probe.  It does not waste store tags and does not clobber any
85359c
+   registers apart from the condition code.  */
85359c
+static void
85359c
+s390_emit_stack_probe (rtx addr)
85359c
+{
85359c
+  rtx tmp = gen_rtx_MEM (Pmode, addr);
85359c
+  MEM_VOLATILE_P (tmp) = 1;
85359c
+  s390_emit_compare (EQ, gen_rtx_REG (Pmode, 0), tmp);
85359c
+  emit_insn (gen_blockage ());
85359c
+}
85359c
+
85359c
+/* Use a runtime loop if we have to emit more probes than this.  */
85359c
+#define MIN_UNROLL_PROBES 3
85359c
+
85359c
+/* Allocate SIZE bytes of stack space, using TEMP_REG as a temporary
85359c
+   if necessary.  LAST_PROBE_OFFSET contains the offset of the closest
85359c
+   probe relative to the stack pointer.
85359c
+
85359c
+   Note that SIZE is negative.
85359c
+
85359c
+   The return value is true if TEMP_REG has been clobbered.  */
85359c
+static bool
85359c
+allocate_stack_space (rtx size, HOST_WIDE_INT last_probe_offset,
85359c
+		      rtx temp_reg)
85359c
+{
85359c
+  bool temp_reg_clobbered_p = false;
85359c
+  HOST_WIDE_INT probe_interval
85359c
+    = 1 << PARAM_VALUE (PARAM_STACK_CLASH_PROTECTION_PROBE_INTERVAL);
85359c
+  HOST_WIDE_INT guard_size
85359c
+    = 1 << PARAM_VALUE (PARAM_STACK_CLASH_PROTECTION_GUARD_SIZE);
85359c
+
85359c
+  if (flag_stack_clash_protection)
85359c
+    {
85359c
+      if (last_probe_offset + -INTVAL (size) < guard_size)
85359c
+	dump_stack_clash_frame_info (NO_PROBE_SMALL_FRAME, true);
85359c
+      else
85359c
+	{
85359c
+	  rtx offset = GEN_INT (probe_interval - UNITS_PER_LONG);
85359c
+	  HOST_WIDE_INT rounded_size = -INTVAL (size) & -probe_interval;
85359c
+	  HOST_WIDE_INT num_probes = rounded_size / probe_interval;
85359c
+	  HOST_WIDE_INT residual = -INTVAL (size) - rounded_size;
85359c
+
85359c
+	  if (num_probes < MIN_UNROLL_PROBES)
85359c
+	    {
85359c
+	      /* Emit unrolled probe statements.  */
85359c
+
85359c
+	      for (unsigned int i = 0; i < num_probes; i++)
85359c
+		{
85359c
+		  s390_prologue_plus_offset (stack_pointer_rtx,
85359c
+					     stack_pointer_rtx,
85359c
+					     GEN_INT (-probe_interval), true);
85359c
+		  s390_emit_stack_probe (gen_rtx_PLUS (Pmode,
85359c
+						       stack_pointer_rtx,
85359c
+						       offset));
85359c
+		}
85359c
+	      dump_stack_clash_frame_info (PROBE_INLINE, residual != 0);
85359c
+	    }
85359c
+	  else
85359c
+	    {
85359c
+	      /* Emit a loop probing the pages.  */
85359c
+
85359c
+	      rtx loop_start_label = gen_label_rtx ();
85359c
+
85359c
+	      /* From now on temp_reg will be the CFA register.  */
85359c
+	      s390_prologue_plus_offset (temp_reg, stack_pointer_rtx,
85359c
+					 GEN_INT (-rounded_size), true);
85359c
+	      emit_label (loop_start_label);
85359c
+
85359c
+	      s390_prologue_plus_offset (stack_pointer_rtx,
85359c
+					 stack_pointer_rtx,
85359c
+					 GEN_INT (-probe_interval), false);
85359c
+	      s390_emit_stack_probe (gen_rtx_PLUS (Pmode,
85359c
+						   stack_pointer_rtx,
85359c
+						   offset));
85359c
+	      emit_cmp_and_jump_insns (stack_pointer_rtx, temp_reg,
85359c
+				       GT, NULL_RTX,
85359c
+				       Pmode, 1, loop_start_label);
85359c
+
85359c
+	      /* Without this make_edges ICEs.  */
85359c
+	      JUMP_LABEL (get_last_insn ()) = loop_start_label;
85359c
+	      LABEL_NUSES (loop_start_label) = 1;
85359c
+
85359c
+	      /* That's going to be a NOP since stack pointer and
85359c
+		 temp_reg are supposed to be the same here.  We just
85359c
+		 emit it to set the CFA reg back to r15.  */
85359c
+	      s390_prologue_plus_offset (stack_pointer_rtx, temp_reg,
85359c
+					 const0_rtx, true);
85359c
+	      temp_reg_clobbered_p = true;
85359c
+	      dump_stack_clash_frame_info (PROBE_LOOP, residual != 0);
85359c
+	    }
85359c
+
85359c
+	  /* Handle any residual allocation request.  */
85359c
+	  s390_prologue_plus_offset (stack_pointer_rtx,
85359c
+				     stack_pointer_rtx,
85359c
+				     GEN_INT (-residual), true);
85359c
+	  last_probe_offset += residual;
85359c
+	  if (last_probe_offset >= probe_interval)
85359c
+	    s390_emit_stack_probe (gen_rtx_PLUS (Pmode,
85359c
+						 stack_pointer_rtx,
85359c
+						 GEN_INT (residual
85359c
+							  - UNITS_PER_LONG)));
85359c
+
85359c
+	  return temp_reg_clobbered_p;
85359c
+	}
85359c
+    }
85359c
+
85359c
+  /* Subtract frame size from stack pointer.  */
85359c
+  s390_prologue_plus_offset (stack_pointer_rtx,
85359c
+			     stack_pointer_rtx,
85359c
+			     size, true);
85359c
+
85359c
+  return temp_reg_clobbered_p;
85359c
+}
85359c
+
85359c
+
85359c
 /* Expand the prologue into a bunch of separate insns.  */
85359c
 
85359c
 void
85359c
@@ -10391,6 +10569,19 @@ s390_emit_prologue (void)
85359c
   else
85359c
     temp_reg = gen_rtx_REG (Pmode, 1);
85359c
 
85359c
+  /* When probing for stack-clash mitigation, we have to track the distance
85359c
+     between the stack pointer and closest known reference.
85359c
+
85359c
+     Most of the time we have to make a worst case assumption.  The
85359c
+     only exception is when TARGET_BACKCHAIN is active, in which case
85359c
+     we know *sp (offset 0) was written.  */
85359c
+  HOST_WIDE_INT probe_interval
85359c
+    = 1 << PARAM_VALUE (PARAM_STACK_CLASH_PROTECTION_PROBE_INTERVAL);
85359c
+  HOST_WIDE_INT last_probe_offset
85359c
+    = (TARGET_BACKCHAIN
85359c
+       ? (TARGET_PACKED_STACK ? STACK_POINTER_OFFSET - UNITS_PER_LONG : 0)
85359c
+       : probe_interval - (STACK_BOUNDARY / UNITS_PER_WORD));
85359c
+
85359c
   /* Save call saved gprs.  */
85359c
   if (cfun_frame_layout.first_save_gpr != -1)
85359c
     {
85359c
@@ -10400,6 +10591,14 @@ s390_emit_prologue (void)
85359c
 					  - cfun_frame_layout.first_save_gpr_slot),
85359c
 			cfun_frame_layout.first_save_gpr,
85359c
 			cfun_frame_layout.last_save_gpr);
85359c
+
85359c
+      /* This is not 100% correct.  If we have more than one register saved,
85359c
+	 then LAST_PROBE_OFFSET can move even closer to sp.  */
85359c
+      last_probe_offset
85359c
+	= (cfun_frame_layout.gprs_offset +
85359c
+	   UNITS_PER_LONG * (cfun_frame_layout.first_save_gpr
85359c
+			     - cfun_frame_layout.first_save_gpr_slot));
85359c
+
85359c
       emit_insn (insn);
85359c
     }
85359c
 
85359c
@@ -10416,6 +10615,8 @@ s390_emit_prologue (void)
85359c
       if (cfun_fpr_bit_p (i))
85359c
 	{
85359c
 	  save_fpr (stack_pointer_rtx, offset, i + 16);
85359c
+	  if (offset < last_probe_offset)
85359c
+	    last_probe_offset = offset;
85359c
 	  offset += 8;
85359c
 	}
85359c
       else if (!TARGET_PACKED_STACK)
85359c
@@ -10429,6 +10630,8 @@ s390_emit_prologue (void)
85359c
       if (cfun_fpr_bit_p (i))
85359c
 	{
85359c
 	  insn = save_fpr (stack_pointer_rtx, offset, i + 16);
85359c
+	  if (offset < last_probe_offset)
85359c
+	    last_probe_offset = offset;
85359c
 	  offset += 8;
85359c
 
85359c
 	  /* If f4 and f6 are call clobbered they are saved due to stdargs and
85359c
@@ -10451,6 +10654,8 @@ s390_emit_prologue (void)
85359c
 	if (cfun_fpr_bit_p (i))
85359c
 	  {
85359c
 	    insn = save_fpr (stack_pointer_rtx, offset, i + 16);
85359c
+	    if (offset < last_probe_offset)
85359c
+	      last_probe_offset = offset;
85359c
 
85359c
 	    RTX_FRAME_RELATED_P (insn) = 1;
85359c
 	    offset -= 8;
85359c
@@ -10470,10 +10675,11 @@ s390_emit_prologue (void)
85359c
   if (cfun_frame_layout.frame_size > 0)
85359c
     {
85359c
       rtx frame_off = GEN_INT (-cfun_frame_layout.frame_size);
85359c
-      rtx real_frame_off;
85359c
+      rtx stack_pointer_backup_loc;
85359c
+      bool temp_reg_clobbered_p;
85359c
 
85359c
       if (s390_stack_size)
85359c
-  	{
85359c
+	{
85359c
 	  HOST_WIDE_INT stack_guard;
85359c
 
85359c
 	  if (s390_stack_guard)
85359c
@@ -10538,35 +10744,36 @@ s390_emit_prologue (void)
85359c
       if (s390_warn_dynamicstack_p && cfun->calls_alloca)
85359c
 	warning (0, "%qs uses dynamic stack allocation", current_function_name ());
85359c
 
85359c
-      /* Save incoming stack pointer into temp reg.  */
85359c
-      if (TARGET_BACKCHAIN || next_fpr)
85359c
-	insn = emit_insn (gen_move_insn (temp_reg, stack_pointer_rtx));
85359c
+      /* Save the location where we could backup the incoming stack
85359c
+	 pointer.  */
85359c
+      stack_pointer_backup_loc = get_last_insn ();
85359c
 
85359c
-      /* Subtract frame size from stack pointer.  */
85359c
+      temp_reg_clobbered_p = allocate_stack_space (frame_off, last_probe_offset,
85359c
+						   temp_reg);
85359c
 
85359c
-      if (DISP_IN_RANGE (INTVAL (frame_off)))
85359c
-	{
85359c
-	  insn = gen_rtx_SET (VOIDmode, stack_pointer_rtx,
85359c
-			      gen_rtx_PLUS (Pmode, stack_pointer_rtx,
85359c
-					    frame_off));
85359c
-	  insn = emit_insn (insn);
85359c
-	}
85359c
-      else
85359c
+      if (TARGET_BACKCHAIN || next_fpr)
85359c
 	{
85359c
-	  if (!CONST_OK_FOR_K (INTVAL (frame_off)))
85359c
-	    frame_off = force_const_mem (Pmode, frame_off);
85359c
-
85359c
-          insn = emit_insn (gen_add2_insn (stack_pointer_rtx, frame_off));
85359c
-	  annotate_constant_pool_refs (&PATTERN (insn));
85359c
+	  if (temp_reg_clobbered_p)
85359c
+	    {
85359c
+	      /* allocate_stack_space had to make use of temp_reg and
85359c
+		 we need it to hold a backup of the incoming stack
85359c
+		 pointer.  Calculate back that value from the current
85359c
+		 stack pointer.  */
85359c
+	      s390_prologue_plus_offset (temp_reg, stack_pointer_rtx,
85359c
+					 GEN_INT (cfun_frame_layout.frame_size),
85359c
+					 false);
85359c
+	    }
85359c
+	  else
85359c
+	    {
85359c
+	      /* allocate_stack_space didn't actually require
85359c
+		 temp_reg.  Insert the stack pointer backup insn
85359c
+		 before the stack pointer decrement code - knowing now
85359c
+		 that the value will survive.  */
85359c
+	      emit_insn_after (gen_move_insn (temp_reg, stack_pointer_rtx),
85359c
+			       stack_pointer_backup_loc);
85359c
+	    }
85359c
 	}
85359c
 
85359c
-      RTX_FRAME_RELATED_P (insn) = 1;
85359c
-      real_frame_off = GEN_INT (-cfun_frame_layout.frame_size);
85359c
-      add_reg_note (insn, REG_FRAME_RELATED_EXPR,
85359c
-		    gen_rtx_SET (VOIDmode, stack_pointer_rtx,
85359c
-				 gen_rtx_PLUS (Pmode, stack_pointer_rtx,
85359c
-					       real_frame_off)));
85359c
-
85359c
       /* Set backchain.  */
85359c
 
85359c
       if (TARGET_BACKCHAIN)
85359c
@@ -10590,6 +10797,8 @@ s390_emit_prologue (void)
85359c
 	  emit_clobber (addr);
85359c
 	}
85359c
     }
85359c
+  else if (flag_stack_clash_protection)
85359c
+    dump_stack_clash_frame_info (NO_PROBE_NO_FRAME, false);
85359c
 
85359c
   /* Save fprs 8 - 15 (64 bit ABI).  */
85359c
 
85359c
diff --git a/gcc/testsuite/gcc.dg/stack-check-5.c b/gcc/testsuite/gcc.dg/stack-check-5.c
85359c
index 2171d9b6c23..3178f5d8ce5 100644
85359c
--- a/gcc/testsuite/gcc.dg/stack-check-5.c
85359c
+++ b/gcc/testsuite/gcc.dg/stack-check-5.c
85359c
@@ -3,6 +3,10 @@
85359c
 /* { dg-require-effective-target supports_stack_clash_protection } */
85359c
 
85359c
 
85359c
+/* Otherwise the S/390 back-end might save the stack pointer in f2 ()
85359c
+   into an FPR.  */
85359c
+/* { dg-additional-options "-msoft-float" { target { s390x-*-* } } } */
85359c
+
85359c
 extern void foo (char *);
85359c
 extern void bar (void);
85359c
 
85359c
diff --git a/gcc/testsuite/lib/target-supports.exp b/gcc/testsuite/lib/target-supports.exp
85359c
index 2c669a9822f..f24c5c6e0ac 100644
85359c
--- a/gcc/testsuite/lib/target-supports.exp
85359c
+++ b/gcc/testsuite/lib/target-supports.exp
85359c
@@ -5422,12 +5422,12 @@ proc check_effective_target_supports_stack_clash_protection { } {
85359c
 
85359c
    # Temporary until the target bits are fully ACK'd.
85359c
 #  if { [istarget aarch*-*-*]
85359c
-#       || [istarget s390*-*-*]
85359c
 #       || [istarget powerpc*-*-*] || [istarget rs6000*-*-*] } {
85359c
 #	return 1
85359c
 #  }
85359c
 
85359c
-    if { [istarget x86_64-*-*] || [istarget i?86-*-*] } {
85359c
+    if { [istarget x86_64-*-*] || [istarget i?86-*-*] 
85359c
+	  || [istarget s390*-*-*] } {
85359c
 	return 1
85359c
     }
85359c
   return 0