|
|
e354a5 |
commit ebe454bcca6a5421512ad228595a5391506e990a
|
|
|
e354a5 |
Author: H.J. Lu <hjl.tools@gmail.com>
|
|
|
e354a5 |
Date: Thu Oct 8 08:24:47 2020 -0700
|
|
|
e354a5 |
|
|
|
e354a5 |
<sys/platform/x86.h>: Add AVX512_FP16 support
|
|
|
e354a5 |
|
|
|
e354a5 |
Add AVX512_FP16 support to <sys/platform/x86.h>, replacing the INDEX_7_EDX_23 placeholder (CPUID index 7, EDX bit 23).
|
|
|
e354a5 |
|
|
|
e354a5 |
diff --git a/manual/platform.texi b/manual/platform.texi
|
|
|
e354a5 |
index 0dd12a4353a93bf2..4f5fdff9d9ef16fd 100644
|
|
|
e354a5 |
--- a/manual/platform.texi
|
|
|
e354a5 |
+++ b/manual/platform.texi
|
|
|
e354a5 |
@@ -210,6 +210,9 @@ The supported processor features are:
|
|
|
e354a5 |
@item
|
|
|
e354a5 |
@code{AVX512_BITALG} -- The AVX512_BITALG instruction extensions.
|
|
|
e354a5 |
|
|
|
e354a5 |
+@item
|
|
|
e354a5 |
+@code{AVX512_FP16} -- The AVX512_FP16 instruction extensions.
|
|
|
e354a5 |
+
|
|
|
e354a5 |
@item
|
|
|
e354a5 |
@code{AVX512_IFMA} -- The AVX512_IFMA instruction extensions.
|
|
|
e354a5 |
|
|
|
e354a5 |
diff --git a/sysdeps/x86/cpu-features.c b/sysdeps/x86/cpu-features.c
|
|
|
e354a5 |
index 7f2ff00f2b4b45f2..67f137259fccf4ad 100644
|
|
|
e354a5 |
--- a/sysdeps/x86/cpu-features.c
|
|
|
e354a5 |
+++ b/sysdeps/x86/cpu-features.c
|
|
|
e354a5 |
@@ -175,6 +175,8 @@ update_usable (struct cpu_features *cpu_features)
|
|
|
e354a5 |
AVX512_VP2INTERSECT);
|
|
|
e354a5 |
/* Determine if AVX512_BF16 is usable. */
|
|
|
e354a5 |
CPU_FEATURE_SET_USABLE (cpu_features, AVX512_BF16);
|
|
|
e354a5 |
+ /* Determine if AVX512_FP16 is usable. */
|
|
|
e354a5 |
+ CPU_FEATURE_SET_USABLE (cpu_features, AVX512_FP16);
|
|
|
e354a5 |
}
|
|
|
e354a5 |
}
|
|
|
e354a5 |
}
|
|
|
e354a5 |
diff --git a/sysdeps/x86/sys/platform/x86.h b/sysdeps/x86/sys/platform/x86.h
|
|
|
e354a5 |
index 2760b81a56e6c7d7..0b18257e20105ea4 100644
|
|
|
e354a5 |
--- a/sysdeps/x86/sys/platform/x86.h
|
|
|
e354a5 |
+++ b/sysdeps/x86/sys/platform/x86.h
|
|
|
e354a5 |
@@ -259,7 +259,7 @@ extern const struct cpu_features *__x86_get_cpu_features (unsigned int)
|
|
|
e354a5 |
#define bit_cpu_IBT (1u << 20)
|
|
|
e354a5 |
#define bit_cpu_INDEX_7_EDX_21 (1u << 21)
|
|
|
e354a5 |
#define bit_cpu_AMX_BF16 (1u << 22)
|
|
|
e354a5 |
-#define bit_cpu_INDEX_7_EDX_23 (1u << 23)
|
|
|
e354a5 |
+#define bit_cpu_AVX512_FP16 (1u << 23)
|
|
|
e354a5 |
#define bit_cpu_AMX_TILE (1u << 24)
|
|
|
e354a5 |
#define bit_cpu_AMX_INT8 (1u << 25)
|
|
|
e354a5 |
#define bit_cpu_IBRS_IBPB (1u << 26)
|
|
|
e354a5 |
@@ -478,7 +478,7 @@ extern const struct cpu_features *__x86_get_cpu_features (unsigned int)
|
|
|
e354a5 |
#define index_cpu_IBT COMMON_CPUID_INDEX_7
|
|
|
e354a5 |
#define index_cpu_INDEX_7_EDX_21 COMMON_CPUID_INDEX_7
|
|
|
e354a5 |
#define index_cpu_AMX_BF16 COMMON_CPUID_INDEX_7
|
|
|
e354a5 |
-#define index_cpu_INDEX_7_EDX_23 COMMON_CPUID_INDEX_7
|
|
|
e354a5 |
+#define index_cpu_AVX512_FP16 COMMON_CPUID_INDEX_7
|
|
|
e354a5 |
#define index_cpu_AMX_TILE COMMON_CPUID_INDEX_7
|
|
|
e354a5 |
#define index_cpu_AMX_INT8 COMMON_CPUID_INDEX_7
|
|
|
e354a5 |
#define index_cpu_IBRS_IBPB COMMON_CPUID_INDEX_7
|
|
|
e354a5 |
@@ -697,7 +697,7 @@ extern const struct cpu_features *__x86_get_cpu_features (unsigned int)
|
|
|
e354a5 |
#define reg_IBT edx
|
|
|
e354a5 |
#define reg_INDEX_7_EDX_21 edx
|
|
|
e354a5 |
#define reg_AMX_BF16 edx
|
|
|
e354a5 |
-#define reg_INDEX_7_EDX_23 edx
|
|
|
e354a5 |
+#define reg_AVX512_FP16 edx
|
|
|
e354a5 |
#define reg_AMX_TILE edx
|
|
|
e354a5 |
#define reg_AMX_INT8 edx
|
|
|
e354a5 |
#define reg_IBRS_IBPB edx
|
|
|
e354a5 |
diff --git a/sysdeps/x86/tst-get-cpu-features.c b/sysdeps/x86/tst-get-cpu-features.c
|
|
|
e354a5 |
index 6fa092a8c10486a0..bcdeb243a82c4adc 100644
|
|
|
e354a5 |
--- a/sysdeps/x86/tst-get-cpu-features.c
|
|
|
e354a5 |
+++ b/sysdeps/x86/tst-get-cpu-features.c
|
|
|
e354a5 |
@@ -189,6 +189,7 @@ do_test (void)
|
|
|
e354a5 |
CHECK_CPU_FEATURE (PCONFIG);
|
|
|
e354a5 |
CHECK_CPU_FEATURE (IBT);
|
|
|
e354a5 |
CHECK_CPU_FEATURE (AMX_BF16);
|
|
|
e354a5 |
+ CHECK_CPU_FEATURE (AVX512_FP16);
|
|
|
e354a5 |
CHECK_CPU_FEATURE (AMX_TILE);
|
|
|
e354a5 |
CHECK_CPU_FEATURE (AMX_INT8);
|
|
|
e354a5 |
CHECK_CPU_FEATURE (IBRS_IBPB);
|
|
|
e354a5 |
@@ -343,6 +344,7 @@ do_test (void)
|
|
|
e354a5 |
CHECK_CPU_FEATURE_USABLE (TSXLDTRK);
|
|
|
e354a5 |
CHECK_CPU_FEATURE_USABLE (PCONFIG);
|
|
|
e354a5 |
CHECK_CPU_FEATURE_USABLE (AMX_BF16);
|
|
|
e354a5 |
+ CHECK_CPU_FEATURE_USABLE (AVX512_FP16);
|
|
|
e354a5 |
CHECK_CPU_FEATURE_USABLE (AMX_TILE);
|
|
|
e354a5 |
CHECK_CPU_FEATURE_USABLE (AMX_INT8);
|
|
|
e354a5 |
CHECK_CPU_FEATURE_USABLE (IBRS_IBPB);
|