Blame SOURCES/gcc48-rh1304449.patch

25c7f1
2015-12-24  Kirill Yukhin  <kirill.yukhin@intel.com>
25c7f1
25c7f1
	* common/config/i386/i386-common.c (OPTION_MASK_ISA_PKU_SET): New.
25c7f1
	(OPTION_MASK_ISA_PKU_UNSET): Ditto.
25c7f1
	(ix86_handle_option): Handle OPT_mpku.
25c7f1
	* config.gcc: Add pkuintrin.h to i[34567]86-*-* and x86_64-*-*
25c7f1
	targets.
25c7f1
	* config/i386/cpuid.h (host_detect_local_cpu): Detect PKU feature.
25c7f1
	* config/i386/i386-c.c (ix86_target_macros_internal): Handle PKU ISA
25c7f1
	flag.
25c7f1
	* config/i386/i386.c (ix86_target_string): Add "-mpku" to
25c7f1
	ix86_target_opts.
25c7f1
	(ix86_option_override_internal): Define PTA_PKU, mention new key
25c7f1
	in skylake-avx512. Handle new ISA bits.
25c7f1
	(ix86_valid_target_attribute_inner_p): Add "pku".
25c7f1
	(enum ix86_builtins): Add IX86_BUILTIN_RDPKRU and IX86_BUILTIN_WRPKRU.
25c7f1
	(builtin_description bdesc_special_args[]): Add new built-ins.
25c7f1
	* config/i386/i386.h (define TARGET_PKU): New.
25c7f1
	(define TARGET_PKU_P): Ditto.
25c7f1
	* config/i386/i386.md (define_c_enum "unspecv"): Add UNSPEC_PKU.
25c7f1
	(define_expand "rdpkru"): New.
25c7f1
	(define_insn "*rdpkru"): Ditto.
25c7f1
	(define_expand "wrpkru"): Ditto.
25c7f1
	(define_insn "*wrpkru"): Ditto.
25c7f1
	* config/i386/i386.opt (mpku): Ditto.
25c7f1
	* config/i386/pkuintrin.h: New file.
25c7f1
	* config/i386/x86intrin.h: Include pkuintrin.h
25c7f1
	* doc/extend.texi: Describe new built-ins.
25c7f1
	* doc/invoke.texi: Describe new switches.
25c7f1
25c7f1
	* g++.dg/other/i386-2.C: Add -mpku.
25c7f1
	* g++.dg/other/i386-3.C: Ditto.
25c7f1
	* gcc.target/i386/rdpku-1.c: New test.
25c7f1
	* gcc.target/i386/sse-12.c: Add -mpku.
25c7f1
	* gcc.target/i386/sse-13.c: Ditto.
25c7f1
	* gcc.target/i386/sse-22.c: Ditto.
25c7f1
	* gcc.target/i386/sse-33.c: Ditto.
25c7f1
	* gcc.target/i386/wrpku-1.c: New test.
25c7f1
25c7f1
--- gcc/config.gcc	(revision 231943)
25c7f1
+++ gcc/config.gcc	(revision 231945)
25c7f1
@@ -368,7 +368,7 @@ i[34567]86-*-*)
25c7f1
 		       lzcntintrin.h bmiintrin.h bmi2intrin.h tbmintrin.h
25c7f1
 		       avx2intrin.h fmaintrin.h f16cintrin.h rtmintrin.h
25c7f1
 		       xtestintrin.h rdseedintrin.h prfchwintrin.h adxintrin.h
25c7f1
-		       fxsrintrin.h xsaveintrin.h xsaveoptintrin.h"
25c7f1
+		       fxsrintrin.h xsaveintrin.h xsaveoptintrin.h pkuintrin.h"
25c7f1
 	;;
25c7f1
 x86_64-*-*)
25c7f1
 	cpu_type=i386
25c7f1
@@ -383,7 +383,7 @@ x86_64-*-*)
25c7f1
 		       lzcntintrin.h bmiintrin.h tbmintrin.h bmi2intrin.h
25c7f1
 		       avx2intrin.h fmaintrin.h f16cintrin.h rtmintrin.h
25c7f1
 		       xtestintrin.h rdseedintrin.h prfchwintrin.h adxintrin.h
25c7f1
-		       fxsrintrin.h xsaveintrin.h xsaveoptintrin.h"
25c7f1
+		       fxsrintrin.h xsaveintrin.h xsaveoptintrin.h pkuintrin.h"
25c7f1
 	need_64bit_hwint=yes
25c7f1
 	;;
25c7f1
 ia64-*-*)
25c7f1
--- gcc/common/config/i386/i386-common.c	(revision 231943)
25c7f1
+++ gcc/common/config/i386/i386-common.c	(revision 231945)
25c7f1
@@ -98,6 +98,7 @@ along with GCC; see the file COPYING3.
25c7f1
 #define OPTION_MASK_ISA_RDRND_SET OPTION_MASK_ISA_RDRND
25c7f1
 #define OPTION_MASK_ISA_F16C_SET \
25c7f1
   (OPTION_MASK_ISA_F16C | OPTION_MASK_ISA_AVX_SET)
25c7f1
+#define OPTION_MASK_ISA_PKU_SET OPTION_MASK_ISA_PKU
25c7f1
 
25c7f1
 /* Define a set of ISAs which aren't available when a given ISA is
25c7f1
    disabled.  MMX and SSE ISAs are handled separately.  */
25c7f1
@@ -164,6 +165,7 @@ along with GCC; see the file COPYING3.
25c7f1
 #define OPTION_MASK_ISA_FSGSBASE_UNSET OPTION_MASK_ISA_FSGSBASE
25c7f1
 #define OPTION_MASK_ISA_RDRND_UNSET OPTION_MASK_ISA_RDRND
25c7f1
 #define OPTION_MASK_ISA_F16C_UNSET OPTION_MASK_ISA_F16C
25c7f1
+#define OPTION_MASK_ISA_PKU_UNSET OPTION_MASK_ISA_PKU
25c7f1
 
25c7f1
 /* Implement TARGET_HANDLE_OPTION.  */
25c7f1
 
25c7f1
@@ -659,6 +661,19 @@ ix86_handle_option (struct gcc_options *
25c7f1
 	}
25c7f1
       return true;
25c7f1
 
25c7f1
+    case OPT_mpku:
25c7f1
+      if (value)
25c7f1
+	{
25c7f1
+	  opts->x_ix86_isa_flags |= OPTION_MASK_ISA_PKU_SET;
25c7f1
+	  opts->x_ix86_isa_flags_explicit |= OPTION_MASK_ISA_PKU_SET;
25c7f1
+	}
25c7f1
+      else
25c7f1
+	{
25c7f1
+	  opts->x_ix86_isa_flags &= ~OPTION_MASK_ISA_PKU_UNSET;
25c7f1
+	  opts->x_ix86_isa_flags_explicit |= OPTION_MASK_ISA_PKU_UNSET;
25c7f1
+	}
25c7f1
+      return true;
25c7f1
+
25c7f1
   /* Comes from final.c -- no real reason to change it.  */
25c7f1
 #define MAX_CODE_ALIGN 16
25c7f1
 
25c7f1
--- gcc/config/i386/i386.h	(revision 231943)
25c7f1
+++ gcc/config/i386/i386.h	(revision 231945)
25c7f1
@@ -80,6 +80,7 @@ see the files COPYING3 and COPYING.RUNTI
25c7f1
 #define TARGET_FXSR	TARGET_ISA_FXSR
25c7f1
 #define TARGET_XSAVE	TARGET_ISA_XSAVE
25c7f1
 #define TARGET_XSAVEOPT	TARGET_ISA_XSAVEOPT
25c7f1
+#define TARGET_PKU	TARGET_ISA_PKU
25c7f1
 
25c7f1
 #define TARGET_LP64	TARGET_ABI_64
25c7f1
 #define TARGET_X32	TARGET_ABI_X32
25c7f1
--- gcc/config/i386/i386.md	(revision 231943)
25c7f1
+++ gcc/config/i386/i386.md	(revision 231945)
25c7f1
@@ -224,6 +224,9 @@ (define_c_enum "unspecv" [
25c7f1
   UNSPECV_XTEST
25c7f1
 
25c7f1
   UNSPECV_NLGR
25c7f1
+
25c7f1
+  ;; For RDPKRU and WRPKRU support
25c7f1
+  UNSPECV_PKU
25c7f1
 ])
25c7f1
 
25c7f1
 ;; Constants to represent rounding modes in the ROUND instruction
25c7f1
@@ -18289,6 +18292,48 @@ (define_insn "xtest_1"
25c7f1
   [(set_attr "type" "other")
25c7f1
    (set_attr "length" "3")])
25c7f1
 
25c7f1
+;; RDPKRU and WRPKRU
25c7f1
+
25c7f1
+(define_expand "rdpkru"
25c7f1
+  [(parallel
25c7f1
+     [(set (match_operand:SI 0 "register_operand")
25c7f1
+	   (unspec_volatile:SI [(match_dup 1)] UNSPECV_PKU))
25c7f1
+      (set (match_dup 2) (const_int 0))])]
25c7f1
+  "TARGET_PKU"
25c7f1
+{
25c7f1
+  operands[1] = force_reg (SImode, const0_rtx);
25c7f1
+  operands[2] = gen_reg_rtx (SImode);
25c7f1
+})
25c7f1
+
25c7f1
+(define_insn "*rdpkru"
25c7f1
+  [(set (match_operand:SI 0 "register_operand" "=a")
25c7f1
+	(unspec_volatile:SI [(match_operand:SI 2 "register_operand" "c")]
25c7f1
+			    UNSPECV_PKU))
25c7f1
+   (set (match_operand:SI 1 "register_operand" "=d")
25c7f1
+	(const_int 0))]
25c7f1
+  "TARGET_PKU"
25c7f1
+  "rdpkru"
25c7f1
+  [(set_attr "type" "other")])
25c7f1
+
25c7f1
+(define_expand "wrpkru"
25c7f1
+  [(unspec_volatile:SI
25c7f1
+     [(match_operand:SI 0 "register_operand")
25c7f1
+      (match_dup 1) (match_dup 2)] UNSPECV_PKU)]
25c7f1
+  "TARGET_PKU"
25c7f1
+{
25c7f1
+  operands[1] = force_reg (SImode, const0_rtx);
25c7f1
+  operands[2] = force_reg (SImode, const0_rtx);
25c7f1
+})
25c7f1
+
25c7f1
+(define_insn "*wrpkru"
25c7f1
+  [(unspec_volatile:SI
25c7f1
+     [(match_operand:SI 0 "register_operand" "a")
25c7f1
+      (match_operand:SI 1 "register_operand" "d")
25c7f1
+      (match_operand:SI 2 "register_operand" "c")] UNSPECV_PKU)]
25c7f1
+  "TARGET_PKU"
25c7f1
+  "wrpkru"
25c7f1
+  [(set_attr "type" "other")])
25c7f1
+
25c7f1
 (include "mmx.md")
25c7f1
 (include "sse.md")
25c7f1
 (include "sync.md")
25c7f1
--- gcc/config/i386/pkuintrin.h	(revision 0)
25c7f1
+++ gcc/config/i386/pkuintrin.h	(revision 231945)
25c7f1
@@ -0,0 +1,45 @@
25c7f1
+/* Copyright (C) 2015 Free Software Foundation, Inc.
25c7f1
+
25c7f1
+   This file is part of GCC.
25c7f1
+
25c7f1
+   GCC is free software; you can redistribute it and/or modify
25c7f1
+   it under the terms of the GNU General Public License as published by
25c7f1
+   the Free Software Foundation; either version 3, or (at your option)
25c7f1
+   any later version.
25c7f1
+
25c7f1
+   GCC is distributed in the hope that it will be useful,
25c7f1
+   but WITHOUT ANY WARRANTY; without even the implied warranty of
25c7f1
+   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
25c7f1
+   GNU General Public License for more details.
25c7f1
+
25c7f1
+   Under Section 7 of GPL version 3, you are granted additional
25c7f1
+   permissions described in the GCC Runtime Library Exception, version
25c7f1
+   3.1, as published by the Free Software Foundation.
25c7f1
+
25c7f1
+   You should have received a copy of the GNU General Public License and
25c7f1
+   a copy of the GCC Runtime Library Exception along with this program;
25c7f1
+   see the files COPYING3 and COPYING.RUNTIME respectively.  If not, see
25c7f1
+   <http://www.gnu.org/licenses/>.  */
25c7f1
+
25c7f1
+#if !defined _X86INTRIN_H_INCLUDED
25c7f1
+# error "Never use <pkuintrin.h> directly; include <x86intrin.h> instead."
25c7f1
+#endif
25c7f1
+
25c7f1
+#ifndef _PKUINTRIN_H_INCLUDED
25c7f1
+#define _PKUINTRIN_H_INCLUDED
25c7f1
+
25c7f1
+extern __inline unsigned int
25c7f1
+__attribute__((__gnu_inline__, __always_inline__, __artificial__))
25c7f1
+_rdpkru_u32(void)
25c7f1
+{
25c7f1
+  return __builtin_ia32_rdpkru ();
25c7f1
+}
25c7f1
+
25c7f1
+extern __inline void
25c7f1
+__attribute__((__gnu_inline__, __always_inline__, __artificial__))
25c7f1
+_wrpkru(unsigned int key)
25c7f1
+{
25c7f1
+  return __builtin_ia32_wrpkru (key);
25c7f1
+}
25c7f1
+
25c7f1
+#endif /* _PKUINTRIN_H_INCLUDED */
25c7f1
--- gcc/config/i386/cpuid.h	(revision 231943)
25c7f1
+++ gcc/config/i386/cpuid.h	(revision 231945)
25c7f1
@@ -74,6 +74,10 @@
25c7f1
 #define bit_RDSEED	(1 << 18)
25c7f1
 #define bit_ADX	(1 << 19)
25c7f1
 
25c7f1
+/* %ecx */
25c7f1
+#define bit_PKU	(1 << 3)
25c7f1
+#define bit_OSPKE	(1 << 4)
25c7f1
+ 
25c7f1
 /* Extended State Enumeration Sub-leaf (%eax == 13, %ecx == 1) */
25c7f1
 #define bit_XSAVEOPT	(1 << 0)
25c7f1
 
25c7f1
--- gcc/config/i386/x86intrin.h	(revision 231943)
25c7f1
+++ gcc/config/i386/x86intrin.h	(revision 231945)
25c7f1
@@ -119,4 +119,8 @@
25c7f1
 
25c7f1
 #include <adxintrin.h>
25c7f1
 
25c7f1
+#ifdef __PKU__
25c7f1
+#include <pkuintrin.h>
25c7f1
+#endif
25c7f1
+
25c7f1
 #endif /* _X86INTRIN_H_INCLUDED */
25c7f1
--- gcc/config/i386/i386-c.c	(revision 231943)
25c7f1
+++ gcc/config/i386/i386-c.c	(revision 231945)
25c7f1
@@ -348,6 +348,8 @@ ix86_target_macros_internal (HOST_WIDE_I
25c7f1
     def_or_undef (parse_in, "__XSAVE__");
25c7f1
   if (isa_flag & OPTION_MASK_ISA_XSAVEOPT)
25c7f1
     def_or_undef (parse_in, "__XSAVEOPT__");
25c7f1
+  if (isa_flag & OPTION_MASK_ISA_PKU)
25c7f1
+    def_or_undef (parse_in, "__PKU__");
25c7f1
   if ((fpmath & FPMATH_SSE) && (isa_flag & OPTION_MASK_ISA_SSE))
25c7f1
     def_or_undef (parse_in, "__SSE_MATH__");
25c7f1
   if ((fpmath & FPMATH_SSE) && (isa_flag & OPTION_MASK_ISA_SSE2))
25c7f1
--- gcc/config/i386/i386.opt	(revision 231943)
25c7f1
+++ gcc/config/i386/i386.opt	(revision 231945)
25c7f1
@@ -626,3 +626,7 @@ Split 32-byte AVX unaligned store
25c7f1
 mrtm
25c7f1
 Target Report Mask(ISA_RTM) Var(ix86_isa_flags) Save
25c7f1
 Support RTM built-in functions and code generation
25c7f1
+
25c7f1
+mpku
25c7f1
+Target Report Mask(ISA_PKU) Var(ix86_isa_flags) Save
25c7f1
+Support PKU built-in functions and code generation
25c7f1
--- gcc/config/i386/driver-i386.c	(revision 231943)
25c7f1
+++ gcc/config/i386/driver-i386.c	(revision 231945)
25c7f1
@@ -408,6 +408,7 @@ const char *host_detect_local_cpu (int a
25c7f1
   unsigned int has_rdrnd = 0, has_f16c = 0, has_fsgsbase = 0;
25c7f1
   unsigned int has_rdseed = 0, has_prfchw = 0, has_adx = 0;
25c7f1
   unsigned int has_osxsave = 0, has_fxsr = 0, has_xsave = 0, has_xsaveopt = 0;
25c7f1
+  unsigned int has_pku = 0;
25c7f1
 
25c7f1
   bool arch;
25c7f1
 
25c7f1
@@ -479,6 +480,8 @@ const char *host_detect_local_cpu (int a
25c7f1
       has_fsgsbase = ebx & bit_FSGSBASE;
25c7f1
       has_rdseed = ebx & bit_RDSEED;
25c7f1
       has_adx = ebx & bit_ADX;
25c7f1
+
25c7f1
+      has_pku = ecx & bit_OSPKE;
25c7f1
     }
25c7f1
 
25c7f1
   if (max_level >= 13)
25c7f1
@@ -855,12 +858,13 @@ const char *host_detect_local_cpu (int a
25c7f1
       const char *fxsr = has_fxsr ? " -mfxsr" : " -mno-fxsr";
25c7f1
       const char *xsave = has_xsave ? " -mxsave" : " -mno-xsave";
25c7f1
       const char *xsaveopt = has_xsaveopt ? " -mxsaveopt" : " -mno-xsaveopt";
25c7f1
+      const char *pku = has_pku ? " -mpku" : " -mno-pku";
25c7f1
 
25c7f1
       options = concat (options, cx16, sahf, movbe, ase, pclmul,
25c7f1
 			popcnt, abm, lwp, fma, fma4, xop, bmi, bmi2,
25c7f1
 			tbm, avx, avx2, sse4_2, sse4_1, lzcnt, rtm,
25c7f1
 			hle, rdrnd, f16c, fsgsbase, rdseed, prfchw, adx,
25c7f1
-			fxsr, xsave, xsaveopt, NULL);
25c7f1
+			fxsr, xsave, xsaveopt, pku, NULL);
25c7f1
     }
25c7f1
 
25c7f1
 done:
25c7f1
--- gcc/config/i386/i386.c	(revision 231943)
25c7f1
+++ gcc/config/i386/i386.c	(revision 231945)
25c7f1
@@ -2632,6 +2632,7 @@ ix86_target_string (HOST_WIDE_INT isa, i
25c7f1
     { "-mrtm",		OPTION_MASK_ISA_RTM },
25c7f1
     { "-mxsave",	OPTION_MASK_ISA_XSAVE },
25c7f1
     { "-mxsaveopt",	OPTION_MASK_ISA_XSAVEOPT },
25c7f1
+    { "-mpku",		OPTION_MASK_ISA_PKU },
25c7f1
   };
25c7f1
 
25c7f1
   /* Flag options.  */
25c7f1
@@ -2905,6 +2906,7 @@ ix86_option_override_internal (bool main
25c7f1
 #define PTA_FXSR		(HOST_WIDE_INT_1 << 37)
25c7f1
 #define PTA_XSAVE		(HOST_WIDE_INT_1 << 38)
25c7f1
 #define PTA_XSAVEOPT		(HOST_WIDE_INT_1 << 39)
25c7f1
+#define PTA_PKU			(HOST_WIDE_INT_1 << 60)
25c7f1
 
25c7f1
 /* if this reaches 64, need to widen struct pta flags below */
25c7f1
 
25c7f1
@@ -3429,6 +3431,9 @@ ix86_option_override_internal (bool main
25c7f1
 	if (processor_alias_table[i].flags & PTA_XSAVEOPT
25c7f1
 	    && !(ix86_isa_flags_explicit & OPTION_MASK_ISA_XSAVEOPT))
25c7f1
 	  ix86_isa_flags |= OPTION_MASK_ISA_XSAVEOPT;
25c7f1
+	if (processor_alias_table[i].flags & PTA_PKU
25c7f1
+	    && !(ix86_isa_flags_explicit & OPTION_MASK_ISA_PKU))
25c7f1
+	  ix86_isa_flags |= OPTION_MASK_ISA_PKU;
25c7f1
 	if (processor_alias_table[i].flags & (PTA_PREFETCH_SSE | PTA_SSE))
25c7f1
 	  x86_prefetch_sse = true;
25c7f1
 
25c7f1
@@ -4220,6 +4225,7 @@ ix86_valid_target_attribute_inner_p (tre
25c7f1
     IX86_ATTR_ISA ("fxsr",	OPT_mfxsr),
25c7f1
     IX86_ATTR_ISA ("xsave",	OPT_mxsave),
25c7f1
     IX86_ATTR_ISA ("xsaveopt",	OPT_mxsaveopt),
25c7f1
+    IX86_ATTR_ISA ("pku",	OPT_mpku),
25c7f1
 
25c7f1
     /* enum options */
25c7f1
     IX86_ATTR_ENUM ("fpmath=",	OPT_mfpmath_),
25c7f1
@@ -27042,6 +27048,10 @@ enum ix86_builtins
25c7f1
   IX86_BUILTIN_CPU_IS,
25c7f1
   IX86_BUILTIN_CPU_SUPPORTS,
25c7f1
 
25c7f1
+  /* PKU instructions.  */
25c7f1
+  IX86_BUILTIN_RDPKRU,
25c7f1
+  IX86_BUILTIN_WRPKRU,
25c7f1
+
25c7f1
   IX86_BUILTIN_MAX
25c7f1
 };
25c7f1
 
25c7f1
@@ -27357,6 +27367,10 @@ static const struct builtin_description
25c7f1
   { OPTION_MASK_ISA_RTM, CODE_FOR_xbegin, "__builtin_ia32_xbegin", IX86_BUILTIN_XBEGIN, UNKNOWN, (int) UNSIGNED_FTYPE_VOID },
25c7f1
   { OPTION_MASK_ISA_RTM, CODE_FOR_xend, "__builtin_ia32_xend", IX86_BUILTIN_XEND, UNKNOWN, (int) VOID_FTYPE_VOID },
25c7f1
   { OPTION_MASK_ISA_RTM, CODE_FOR_xtest, "__builtin_ia32_xtest", IX86_BUILTIN_XTEST, UNKNOWN, (int) INT_FTYPE_VOID },
25c7f1
+
25c7f1
+  /* RDPKRU and WRPKRU.  */
25c7f1
+  { OPTION_MASK_ISA_PKU, CODE_FOR_rdpkru, "__builtin_ia32_rdpkru", IX86_BUILTIN_RDPKRU, UNKNOWN, (int) UNSIGNED_FTYPE_VOID },
25c7f1
+  { OPTION_MASK_ISA_PKU, CODE_FOR_wrpkru, "__builtin_ia32_wrpkru", IX86_BUILTIN_WRPKRU, UNKNOWN, (int) VOID_FTYPE_UNSIGNED },
25c7f1
 };
25c7f1
 
25c7f1
 /* Builtins with variable number of arguments.  */
25c7f1
--- gcc/doc/extend.texi	(revision 231943)
25c7f1
+++ gcc/doc/extend.texi	(revision 231945)
25c7f1
@@ -10996,6 +10996,13 @@ void __builtin_ia32_xabort (status)
25c7f1
 int __builtin_ia32_xtest ()
25c7f1
 @end smallexample
25c7f1
 
25c7f1
+The following built-in functions are available when @option{-mpku} is used.
25c7f1
+They generate reads and writes to PKRU.
25c7f1
+@smallexample
25c7f1
+void __builtin_ia32_wrpkru (unsigned int)
25c7f1
+unsigned int __builtin_ia32_rdpkru ()
25c7f1
+@end smallexample
25c7f1
+
25c7f1
 @node X86 transactional memory intrinsics
25c7f1
 @subsection X86 transaction memory intrinsics
25c7f1
 
25c7f1
--- gcc/doc/invoke.texi	(revision 231943)
25c7f1
+++ gcc/doc/invoke.texi	(revision 231945)
25c7f1
@@ -645,7 +645,7 @@ Objective-C and Objective-C++ Dialects}.
25c7f1
 -mmmx  -msse  -msse2 -msse3 -mssse3 -msse4.1 -msse4.2 -msse4 -mavx @gol
25c7f1
 -mavx2 -maes -mpclmul -mfsgsbase -mrdrnd -mf16c -mfma @gol
25c7f1
 -msse4a -m3dnow -mpopcnt -mabm -mbmi -mtbm -mfma4 -mxop -mlzcnt @gol
25c7f1
--mbmi2 -mrtm -mlwp -mthreads @gol
25c7f1
+-mbmi2 -mrtm -mlwp -mpku -mthreads @gol
25c7f1
 -mno-align-stringops  -minline-all-stringops @gol
25c7f1
 -minline-stringops-dynamically -mstringop-strategy=@var{alg} @gol
25c7f1
 -mpush-args  -maccumulate-outgoing-args  -m128bit-long-double @gol
25c7f1
@@ -14326,6 +14326,8 @@ preferred alignment to @option{-mpreferr
25c7f1
 @itemx -mlzcnt
25c7f1
 @itemx -mno-lzcnt
25c7f1
 @itemx -mrtm
25c7f1
+@itemx -mpku
25c7f1
+@itemx -mno-pku
25c7f1
 @itemx -mtbm
25c7f1
 @itemx -mno-tbm
25c7f1
 @opindex mmmx
25c7f1
@@ -14336,7 +14338,7 @@ preferred alignment to @option{-mpreferr
25c7f1
 @opindex mno-3dnow
25c7f1
 These switches enable or disable the use of instructions in the MMX, SSE,
25c7f1
 SSE2, SSE3, SSSE3, SSE4.1, AVX, AVX2, AES, PCLMUL, FSGSBASE, RDRND, F16C,
25c7f1
-FMA, SSE4A, FMA4, XOP, LWP, ABM, BMI, BMI2, LZCNT, RTM or 3DNow!@:
25c7f1
+FMA, SSE4A, FMA4, XOP, LWP, ABM, BMI, BMI2, LZCNT, RTM, PKU or 3DNow!@:
25c7f1
 extended instruction sets.
25c7f1
 These extensions are also available as built-in functions: see
25c7f1
 @ref{X86 Built-in Functions}, for details of the functions enabled and
25c7f1
--- gcc/testsuite/gcc.target/i386/sse-12.c	(revision 231943)
25c7f1
+++ gcc/testsuite/gcc.target/i386/sse-12.c	(revision 231945)
25c7f1
@@ -3,7 +3,7 @@
25c7f1
    popcntintrin.h and mm_malloc.h are usable
25c7f1
    with -O -std=c89 -pedantic-errors.  */
25c7f1
 /* { dg-do compile } */
25c7f1
-/* { dg-options "-O -std=c89 -pedantic-errors -march=k8 -msse4a -m3dnow -mavx -mavx2 -mfma4 -mxop -maes -mpclmul -mpopcnt -mabm -mlzcnt -mbmi -mbmi2 -mtbm -mlwp -mfsgsbase -mrdrnd -mf16c -mfma -mrtm -mrdseed -mprfchw -madx -mfxsr -mxsaveopt" } */
25c7f1
+/* { dg-options "-O -std=c89 -pedantic-errors -march=k8 -msse4a -m3dnow -mavx -mavx2 -mfma4 -mxop -maes -mpclmul -mpopcnt -mabm -mlzcnt -mbmi -mbmi2 -mtbm -mlwp -mfsgsbase -mrdrnd -mf16c -mfma -mrtm -mrdseed -mprfchw -madx -mfxsr -mxsaveopt -mpku" } */
25c7f1
 
25c7f1
 #include <x86intrin.h>
25c7f1
 
25c7f1
--- gcc/testsuite/gcc.target/i386/sse-13.c	(revision 231943)
25c7f1
+++ gcc/testsuite/gcc.target/i386/sse-13.c	(revision 231945)
25c7f1
@@ -1,5 +1,5 @@
25c7f1
 /* { dg-do compile } */
25c7f1
-/* { dg-options "-O2 -Werror-implicit-function-declaration -march=k8 -msse4a -m3dnow -mavx -mavx2 -mfma4 -mxop -maes -mpclmul -mpopcnt -mabm -mlzcnt -mbmi -mbmi2 -mtbm -mlwp -mfsgsbase -mrdrnd -mf16c -mfma -mrtm -mrdseed -mprfchw -madx -mfxsr -mxsaveopt" } */
25c7f1
+/* { dg-options "-O2 -Werror-implicit-function-declaration -march=k8 -msse4a -m3dnow -mavx -mavx2 -mfma4 -mxop -maes -mpclmul -mpopcnt -mabm -mlzcnt -mbmi -mbmi2 -mtbm -mlwp -mfsgsbase -mrdrnd -mf16c -mfma -mrtm -mrdseed -mprfchw -madx -mfxsr -mxsaveopt -mpku" } */
25c7f1
 
25c7f1
 #include <mm_malloc.h>
25c7f1
 
25c7f1
--- gcc/testsuite/gcc.target/i386/sse-22.c	(revision 231943)
25c7f1
+++ gcc/testsuite/gcc.target/i386/sse-22.c	(revision 231945)
25c7f1
@@ -268,7 +268,7 @@ test_2 (_mm_clmulepi64_si128, __m128i, _
25c7f1
 
25c7f1
 /* x86intrin.h (FMA4/XOP/LWP/BMI/BMI2/TBM/LZCNT/FMA). */
25c7f1
 #ifdef DIFFERENT_PRAGMAS
25c7f1
-#pragma GCC target ("fma4,xop,lwp,bmi,bmi2,tbm,lzcnt,fma,rdseed,prfchw,adx,fxsr,xsaveopt")
25c7f1
+#pragma GCC target ("fma4,xop,lwp,bmi,bmi2,tbm,lzcnt,fma,rdseed,prfchw,adx,fxsr,xsaveopt,pku")
25c7f1
 #endif
25c7f1
 #include <x86intrin.h>
25c7f1
 /* xopintrin.h */
25c7f1
--- gcc/testsuite/gcc.target/i386/sse-23.c	(revision 231943)
25c7f1
+++ gcc/testsuite/gcc.target/i386/sse-23.c	(revision 231945)
25c7f1
@@ -183,7 +183,7 @@
25c7f1
 /* rtmintrin.h */
25c7f1
 #define __builtin_ia32_xabort(M) __builtin_ia32_xabort(1)
25c7f1
 
25c7f1
-#pragma GCC target ("sse4a,3dnow,avx,avx2,fma4,xop,aes,pclmul,popcnt,abm,lzcnt,bmi,bmi2,tbm,lwp,fsgsbase,rdrnd,f16c,fma,rtm,rdseed,prfchw,adx,fxsr,xsaveopt")
25c7f1
+#pragma GCC target ("sse4a,3dnow,avx,avx2,fma4,xop,aes,pclmul,popcnt,abm,lzcnt,bmi,bmi2,tbm,lwp,fsgsbase,rdrnd,f16c,fma,rtm,rdseed,prfchw,adx,fxsr,xsaveopt,pku")
25c7f1
 #include <wmmintrin.h>
25c7f1
 #include <smmintrin.h>
25c7f1
 #include <mm3dnow.h>
25c7f1
--- gcc/testsuite/gcc.target/i386/rdpku-1.c	(revision 0)
25c7f1
+++ gcc/testsuite/gcc.target/i386/rdpku-1.c	(revision 231945)
25c7f1
@@ -0,0 +1,11 @@
25c7f1
+/* { dg-do compile } */
25c7f1
+/* { dg-options "-mpku -O2" } */
25c7f1
+/* { dg-final { scan-assembler "rdpkru\n" } } */
25c7f1
+
25c7f1
+#include <x86intrin.h>
25c7f1
+
25c7f1
+unsigned extern
25c7f1
+rdpku_test (void)
25c7f1
+{
25c7f1
+  return _rdpkru_u32 ();
25c7f1
+}
25c7f1
--- gcc/testsuite/gcc.target/i386/wrpku-1.c	(revision 0)
25c7f1
+++ gcc/testsuite/gcc.target/i386/wrpku-1.c	(revision 231945)
25c7f1
@@ -0,0 +1,11 @@
25c7f1
+/* { dg-do compile } */
25c7f1
+/* { dg-options "-mpku -O2" } */
25c7f1
+/* { dg-final { scan-assembler "wrpkru\n" } } */
25c7f1
+
25c7f1
+#include <x86intrin.h>
25c7f1
+
25c7f1
+void extern
25c7f1
+wrpku_test (unsigned int key)
25c7f1
+{
25c7f1
+  _wrpkru (key);
25c7f1
+}
25c7f1
--- gcc/testsuite/g++.dg/other/i386-2.C	(revision 231943)
25c7f1
+++ gcc/testsuite/g++.dg/other/i386-2.C	(revision 231945)
25c7f1
@@ -1,9 +1,9 @@
25c7f1
 /* { dg-do compile { target i?86-*-* x86_64-*-* } } */
25c7f1
-/* { dg-options "-O -pedantic-errors -march=k8 -msse4a -m3dnow -mavx -mavx2 -mfma4 -mxop -maes -mpclmul -mpopcnt -mabm -mlzcnt -mbmi -mbmi2 -mtbm -mlwp -mfsgsbase -mrdrnd -mf16c -mfma -mrtm -mrdseed -mprfchw -madx -mfxsr -mxsaveopt" } */
25c7f1
+/* { dg-options "-O -pedantic-errors -march=k8 -msse4a -m3dnow -mavx -mavx2 -mfma4 -mxop -maes -mpclmul -mpopcnt -mabm -mlzcnt -mbmi -mbmi2 -mtbm -mlwp -mfsgsbase -mrdrnd -mf16c -mfma -mrtm -mrdseed -mprfchw -madx -mfxsr -mxsaveopt -mpku" } */
25c7f1
 
25c7f1
 /* Test that {,x,e,p,t,s,w,a,b,i}mmintrin.h, mm3dnow.h, fma4intrin.h,
25c7f1
    xopintrin.h, abmintrin.h, bmiintrin.h, tbmintrin.h, lwpintrin.h,
25c7f1
-   popcntintrin.h, fmaintrin.h and mm_malloc.h.h are usable with 
25c7f1
+   popcntintrin.h, fmaintrin.h, pkuintrin.h and mm_malloc.h.h are usable with 
25c7f1
    -O -pedantic-errors.  */
25c7f1
 
25c7f1
 #include <x86intrin.h>
25c7f1
--- gcc/testsuite/g++.dg/other/i386-3.C	(revision 231943)
25c7f1
+++ gcc/testsuite/g++.dg/other/i386-3.C	(revision 231945)
25c7f1
@@ -1,9 +1,9 @@
25c7f1
 /* { dg-do compile { target i?86-*-* x86_64-*-* } } */
25c7f1
-/* { dg-options "-O -fkeep-inline-functions -march=k8 -msse4a -m3dnow -mavx -mavx2 -mfma4 -mxop -maes -mpclmul -mpopcnt -mabm -mlzcnt -mbmi -mbmi2 -mtbm -mlwp -mfsgsbase -mrdrnd -mf16c -mfma -mrtm -mrdseed -mprfchw -madx -mfxsr -mxsaveopt" } */
25c7f1
+/* { dg-options "-O -fkeep-inline-functions -march=k8 -msse4a -m3dnow -mavx -mavx2 -mfma4 -mxop -maes -mpclmul -mpopcnt -mabm -mlzcnt -mbmi -mbmi2 -mtbm -mlwp -mfsgsbase -mrdrnd -mf16c -mfma -mrtm -mrdseed -mprfchw -madx -mfxsr -mxsaveopt -mpku" } */
25c7f1
 
25c7f1
 /* Test that {,x,e,p,t,s,w,a,b,i}mmintrin.h, mm3dnow.h, fma4intrin.h,
25c7f1
    xopintrin.h, abmintrin.h, bmiintrin.h, tbmintrin.h, lwpintrin.h,
25c7f1
-   popcntintrin.h, fmaintrin.h and mm_malloc.h are usable with
25c7f1
+   popcntintrin.h, fmaintrin.h, pkuintrin.h and mm_malloc.h are usable with
25c7f1
    -O -fkeep-inline-functions.  */
25c7f1
 
25c7f1
 #include <x86intrin.h>