e354a5
commit f2c679d4b2c73a95f437c705f960a4af1fa23498
e354a5
Author: H.J. Lu <hjl.tools@gmail.com>
e354a5
Date:   Tue Sep 15 05:49:27 2020 -0700
e354a5
e354a5
    <sys/platform/x86.h>: Add Intel Key Locker support
e354a5
    
e354a5
    Add Intel Key Locker:
e354a5
    
e354a5
    https://software.intel.com/content/www/us/en/develop/download/intel-key-locker-specification.html
e354a5
    
e354a5
    support to <sys/platform/x86.h>.  Intel Key Locker defines three features:
e354a5
    
e354a5
    1. KL: AES Key Locker instructions.
e354a5
    2. WIDE_KL: AES wide Key Locker instructions.
e354a5
    3. AESKLE: AES Key Locker instructions are enabled by OS.
e354a5
    
e354a5
    Applications should use
e354a5
    
e354a5
    if (CPU_FEATURE_USABLE (KL))
e354a5
    
e354a5
    and
e354a5
    
e354a5
    if (CPU_FEATURE_USABLE (WIDE_KL))
e354a5
    
e354a5
    to check whether AES Key Locker instructions and AES wide Key Locker
e354a5
    instructions, respectively, are usable.
e354a5
e354a5
diff --git a/manual/platform.texi b/manual/platform.texi
e354a5
index 2c145acdc3564cbb..95b0ed0642c9f8a9 100644
e354a5
--- a/manual/platform.texi
e354a5
+++ b/manual/platform.texi
e354a5
@@ -177,6 +177,9 @@ The supported processor features are:
e354a5
 @item
e354a5
 @code{AES} -- The AES instruction extensions.
e354a5
 
e354a5
+@item
e354a5
+@code{AESKLE} -- AES Key Locker instructions are enabled by OS.
e354a5
+
e354a5
 @item
e354a5
 @code{AMX_BF16} -- Tile computational operations on bfloat16 numbers.
e354a5
 
e354a5
@@ -353,6 +356,9 @@ the indirect branch predictor barrier (IBPB).
e354a5
 @item
e354a5
 @code{INVPCID} -- INVPCID instruction.
e354a5
 
e354a5
+@item
e354a5
+@code{KL} -- AES Key Locker instructions.
e354a5
+
e354a5
 @item
e354a5
 @code{L1D_FLUSH} -- IA32_FLUSH_CMD MSR.
e354a5
 
e354a5
@@ -598,6 +604,9 @@ using a TSC deadline value.
e354a5
 @item
e354a5
 @code{WBNOINVD} -- WBINVD/WBNOINVD instructions.
e354a5
 
e354a5
+@item
e354a5
+@code{WIDE_KL} -- AES wide Key Locker instructions.
e354a5
+
e354a5
 @item
e354a5
 @code{X2APIC} -- x2APIC.
e354a5
 
e354a5
diff --git a/sysdeps/x86/cpu-features.c b/sysdeps/x86/cpu-features.c
e354a5
index 6954728c47d0126b..77a596a15404b575 100644
e354a5
--- a/sysdeps/x86/cpu-features.c
e354a5
+++ b/sysdeps/x86/cpu-features.c
e354a5
@@ -269,6 +269,14 @@ update_usable (struct cpu_features *cpu_features)
e354a5
   /* Determine if PKU is usable.  */
e354a5
   if (CPU_FEATURES_CPU_P (cpu_features, OSPKE))
e354a5
     CPU_FEATURE_SET (cpu_features, PKU);
e354a5
+
e354a5
+  /* Determine if Key Locker instructions are usable.  */
e354a5
+  if (CPU_FEATURES_CPU_P (cpu_features, AESKLE))
e354a5
+    {
e354a5
+      CPU_FEATURE_SET (cpu_features, AESKLE);
e354a5
+      CPU_FEATURE_SET_USABLE (cpu_features, KL);
e354a5
+      CPU_FEATURE_SET_USABLE (cpu_features, WIDE_KL);
e354a5
+    }
e354a5
 }
e354a5
 
e354a5
 static void
e354a5
@@ -341,6 +349,12 @@ get_common_indices (struct cpu_features *cpu_features,
e354a5
 		   cpu_features->features[COMMON_CPUID_INDEX_D_ECX_1].cpuid.ecx,
e354a5
 		   cpu_features->features[COMMON_CPUID_INDEX_D_ECX_1].cpuid.edx);
e354a5
 
e354a5
+  if (cpu_features->basic.max_cpuid >= 0x19)
e354a5
+    __cpuid_count (0x19, 0,
e354a5
+		   cpu_features->features[COMMON_CPUID_INDEX_19].cpuid.eax,
e354a5
+		   cpu_features->features[COMMON_CPUID_INDEX_19].cpuid.ebx,
e354a5
+		   cpu_features->features[COMMON_CPUID_INDEX_19].cpuid.ecx,
e354a5
+		   cpu_features->features[COMMON_CPUID_INDEX_19].cpuid.edx);
e354a5
 }
e354a5
 
e354a5
 _Static_assert (((index_arch_Fast_Unaligned_Load
e354a5
diff --git a/sysdeps/x86/sys/platform/x86.h b/sysdeps/x86/sys/platform/x86.h
e354a5
index ebc5f6fc16cb8104..bcc81ab5f8ac8265 100644
e354a5
--- a/sysdeps/x86/sys/platform/x86.h
e354a5
+++ b/sysdeps/x86/sys/platform/x86.h
e354a5
@@ -28,6 +28,7 @@ enum
e354a5
   COMMON_CPUID_INDEX_80000007,
e354a5
   COMMON_CPUID_INDEX_80000008,
e354a5
   COMMON_CPUID_INDEX_7_ECX_1,
e354a5
+  COMMON_CPUID_INDEX_19,
e354a5
   /* Keep the following line at the end.  */
e354a5
   COMMON_CPUID_INDEX_MAX
e354a5
 };
e354a5
@@ -224,7 +225,7 @@ extern const struct cpu_features *__x86_get_cpu_features (unsigned int)
e354a5
 /* Note: Bits 17-21: The value of MAWAU used by the BNDLDX and BNDSTX
e354a5
    instructions in 64-bit mode.  */
e354a5
 #define bit_cpu_RDPID		(1u << 22)
e354a5
-#define bit_cpu_INDEX_7_ECX_23	(1u << 23)
e354a5
+#define bit_cpu_KL		(1u << 23)
e354a5
 #define bit_cpu_INDEX_7_ECX_24	(1u << 24)
e354a5
 #define bit_cpu_CLDEMOTE	(1u << 25)
e354a5
 #define bit_cpu_INDEX_7_ECX_26	(1u << 26)
e354a5
@@ -312,6 +313,12 @@ extern const struct cpu_features *__x86_get_cpu_features (unsigned int)
e354a5
 /* EAX.  */
e354a5
 #define bit_cpu_AVX512_BF16	(1u << 5)
e354a5
 
e354a5
+/* COMMON_CPUID_INDEX_19.  */
e354a5
+
e354a5
+/* EBX.  */
e354a5
+#define bit_cpu_AESKLE		(1u << 0)
e354a5
+#define bit_cpu_WIDE_KL		(1u << 2)
e354a5
+
e354a5
 /* COMMON_CPUID_INDEX_1.  */
e354a5
 
e354a5
 /* ECX.  */
e354a5
@@ -437,7 +444,7 @@ extern const struct cpu_features *__x86_get_cpu_features (unsigned int)
e354a5
 #define index_cpu_INDEX_7_ECX_15 COMMON_CPUID_INDEX_7
e354a5
 #define index_cpu_INDEX_7_ECX_16 COMMON_CPUID_INDEX_7
e354a5
 #define index_cpu_RDPID		COMMON_CPUID_INDEX_7
e354a5
-#define index_cpu_INDEX_7_ECX_23 COMMON_CPUID_INDEX_7
e354a5
+#define index_cpu_KL		COMMON_CPUID_INDEX_7
e354a5
 #define index_cpu_INDEX_7_ECX_24 COMMON_CPUID_INDEX_7
e354a5
 #define index_cpu_CLDEMOTE	COMMON_CPUID_INDEX_7
e354a5
 #define index_cpu_INDEX_7_ECX_26 COMMON_CPUID_INDEX_7
e354a5
@@ -525,6 +532,12 @@ extern const struct cpu_features *__x86_get_cpu_features (unsigned int)
e354a5
 /* EAX.  */
e354a5
 #define index_cpu_AVX512_BF16	COMMON_CPUID_INDEX_7_ECX_1
e354a5
 
e354a5
+/* COMMON_CPUID_INDEX_19.  */
e354a5
+
e354a5
+/* EBX.  */
e354a5
+#define index_cpu_AESKLE	COMMON_CPUID_INDEX_19
e354a5
+#define index_cpu_WIDE_KL	COMMON_CPUID_INDEX_19
e354a5
+
e354a5
 /* COMMON_CPUID_INDEX_1.  */
e354a5
 
e354a5
 /* ECX.  */
e354a5
@@ -650,7 +663,7 @@ extern const struct cpu_features *__x86_get_cpu_features (unsigned int)
e354a5
 #define reg_INDEX_7_ECX_15	ecx
e354a5
 #define reg_INDEX_7_ECX_16	ecx
e354a5
 #define reg_RDPID		ecx
e354a5
-#define reg_INDEX_7_ECX_23	ecx
e354a5
+#define reg_KL			ecx
e354a5
 #define reg_INDEX_7_ECX_24	ecx
e354a5
 #define reg_CLDEMOTE		ecx
e354a5
 #define reg_INDEX_7_ECX_26	ecx
e354a5
@@ -738,4 +751,10 @@ extern const struct cpu_features *__x86_get_cpu_features (unsigned int)
e354a5
 /* EAX.  */
e354a5
 #define reg_AVX512_BF16		eax
e354a5
 
e354a5
+/* COMMON_CPUID_INDEX_19.  */
e354a5
+
e354a5
+/* EBX.  */
e354a5
+#define reg_AESKLE		ebx
e354a5
+#define reg_WIDE_KL		ebx
e354a5
+
e354a5
 #endif  /* _SYS_PLATFORM_X86_H */
e354a5
diff --git a/sysdeps/x86/tst-get-cpu-features.c b/sysdeps/x86/tst-get-cpu-features.c
e354a5
index 95e0d33f6c7eeace..c01d701b52090983 100644
e354a5
--- a/sysdeps/x86/tst-get-cpu-features.c
e354a5
+++ b/sysdeps/x86/tst-get-cpu-features.c
e354a5
@@ -170,6 +170,7 @@ do_test (void)
e354a5
   CHECK_CPU_FEATURE (AVX512_BITALG);
e354a5
   CHECK_CPU_FEATURE (AVX512_VPOPCNTDQ);
e354a5
   CHECK_CPU_FEATURE (RDPID);
e354a5
+  CHECK_CPU_FEATURE (KL);
e354a5
   CHECK_CPU_FEATURE (CLDEMOTE);
e354a5
   CHECK_CPU_FEATURE (MOVDIRI);
e354a5
   CHECK_CPU_FEATURE (MOVDIR64B);
e354a5
@@ -217,6 +218,8 @@ do_test (void)
e354a5
   CHECK_CPU_FEATURE (INVARIANT_TSC);
e354a5
   CHECK_CPU_FEATURE (WBNOINVD);
e354a5
   CHECK_CPU_FEATURE (AVX512_BF16);
e354a5
+  CHECK_CPU_FEATURE (AESKLE);
e354a5
+  CHECK_CPU_FEATURE (WIDE_KL);
e354a5
 
e354a5
   printf ("Usable CPU features:\n");
e354a5
   CHECK_CPU_FEATURE_USABLE (SSE3);
e354a5
@@ -323,6 +326,7 @@ do_test (void)
e354a5
   CHECK_CPU_FEATURE_USABLE (AVX512_BITALG);
e354a5
   CHECK_CPU_FEATURE_USABLE (AVX512_VPOPCNTDQ);
e354a5
   CHECK_CPU_FEATURE_USABLE (RDPID);
e354a5
+  CHECK_CPU_FEATURE_USABLE (KL);
e354a5
   CHECK_CPU_FEATURE_USABLE (CLDEMOTE);
e354a5
   CHECK_CPU_FEATURE_USABLE (MOVDIRI);
e354a5
   CHECK_CPU_FEATURE_USABLE (MOVDIR64B);
e354a5
@@ -370,6 +374,8 @@ do_test (void)
e354a5
   CHECK_CPU_FEATURE_USABLE (INVARIANT_TSC);
e354a5
   CHECK_CPU_FEATURE_USABLE (WBNOINVD);
e354a5
   CHECK_CPU_FEATURE_USABLE (AVX512_BF16);
e354a5
+  CHECK_CPU_FEATURE_USABLE (AESKLE);
e354a5
+  CHECK_CPU_FEATURE_USABLE (WIDE_KL);
e354a5
 
e354a5
   return 0;
e354a5
 }