about summary refs log tree commit diff
diff options
context:
space:
mode:
author H.J. Lu <hjl.tools@gmail.com> 2023-04-05 09:21:43 -0700
committer H.J. Lu <hjl.tools@gmail.com> 2023-04-05 14:46:10 -0700
commit b05521c916790dbaeb953fca7b979a889d868db2 (patch)
tree e88709b11e820a138de792a257263b81d399c8f8
parent 609b7b2d3c0c44f4e42a235f8d7c207c903a6bb1 (diff)
download glibc-b05521c916790dbaeb953fca7b979a889d868db2.zip
glibc-b05521c916790dbaeb953fca7b979a889d868db2.tar.gz
glibc-b05521c916790dbaeb953fca7b979a889d868db2.tar.bz2
<sys/platform/x86.h>: Add AMX-COMPLEX support
Add AMX-COMPLEX support to <sys/platform/x86.h>.

Reviewed-by: Noah Goldstein <goldstein.w.n@gmail.com>
-rw-r--r-- manual/platform.texi 3
-rw-r--r-- sysdeps/x86/bits/platform/x86.h 1
-rw-r--r-- sysdeps/x86/cpu-features.c 2
-rw-r--r-- sysdeps/x86/include/cpu-features.h 3
-rw-r--r-- sysdeps/x86/tst-get-cpu-features.c 2
5 files changed, 11 insertions, 0 deletions
diff --git a/manual/platform.texi b/manual/platform.texi
index 1e12099..e7448ff 100644
--- a/manual/platform.texi
+++ b/manual/platform.texi
@@ -198,6 +198,9 @@ The supported processor features are:
@code{AMX_BF16} -- Tile computational operations on bfloat16 numbers.
@item
+@code{AMX_COMPLEX} -- Tile computational operations on complex FP16 numbers.
+
+@item
@code{AMX_INT8} -- Tile computational operations on 8-bit numbers.
@item
diff --git a/sysdeps/x86/bits/platform/x86.h b/sysdeps/x86/bits/platform/x86.h
index d8ba33b..96eb4c0 100644
--- a/sysdeps/x86/bits/platform/x86.h
+++ b/sysdeps/x86/bits/platform/x86.h
@@ -310,6 +310,7 @@ enum
x86_cpu_AVX_VNNI_INT8 = x86_cpu_index_7_ecx_1_edx + 4,
x86_cpu_AVX_NE_CONVERT = x86_cpu_index_7_ecx_1_edx + 5,
+ x86_cpu_AMX_COMPLEX = x86_cpu_index_7_ecx_1_edx + 8,
x86_cpu_index_19_ebx
= (CPUID_INDEX_19 * 8 * 4 * sizeof (unsigned int)
diff --git a/sysdeps/x86/cpu-features.c b/sysdeps/x86/cpu-features.c
index dfd1b85..c2bea6a 100644
--- a/sysdeps/x86/cpu-features.c
+++ b/sysdeps/x86/cpu-features.c
@@ -221,6 +221,8 @@ update_active (struct cpu_features *cpu_features)
CPU_FEATURE_SET_ACTIVE (cpu_features, AMX_INT8);
/* Determine if AMX_FP16 is usable. */
CPU_FEATURE_SET_ACTIVE (cpu_features, AMX_FP16);
+ /* Determine if AMX_COMPLEX is usable. */
+ CPU_FEATURE_SET_ACTIVE (cpu_features, AMX_COMPLEX);
}
/* These features are usable only when OSXSAVE is enabled. */
diff --git a/sysdeps/x86/include/cpu-features.h b/sysdeps/x86/include/cpu-features.h
index 673cf8c..f14c107 100644
--- a/sysdeps/x86/include/cpu-features.h
+++ b/sysdeps/x86/include/cpu-features.h
@@ -317,6 +317,7 @@ enum
/* EDX. */
#define bit_cpu_AVX_VNNI_INT8 (1u << 4)
#define bit_cpu_AVX_NE_CONVERT (1u << 5)
+#define bit_cpu_AMX_COMPLEX (1u << 8)
/* CPUID_INDEX_19. */
@@ -558,6 +559,7 @@ enum
#define index_cpu_LAM CPUID_INDEX_7_ECX_1
#define index_cpu_AVX_VNNI_INT8 CPUID_INDEX_7_ECX_1
#define index_cpu_AVX_NE_CONVERT CPUID_INDEX_7_ECX_1
+#define index_cpu_AMX_COMPLEX CPUID_INDEX_7_ECX_1
/* CPUID_INDEX_19. */
@@ -801,6 +803,7 @@ enum
/* EDX. */
#define reg_AVX_VNNI_INT8 edx
#define reg_AVX_NE_CONVERT edx
+#define reg_AMX_COMPLEX edx
/* CPUID_INDEX_19. */
diff --git a/sysdeps/x86/tst-get-cpu-features.c b/sysdeps/x86/tst-get-cpu-features.c
index bb1b67f..87fe273 100644
--- a/sysdeps/x86/tst-get-cpu-features.c
+++ b/sysdeps/x86/tst-get-cpu-features.c
@@ -217,6 +217,7 @@ do_test (void)
CHECK_CPU_FEATURE_PRESENT (MSRLIST);
CHECK_CPU_FEATURE_PRESENT (AVX_VNNI_INT8);
CHECK_CPU_FEATURE_PRESENT (AVX_NE_CONVERT);
+ CHECK_CPU_FEATURE_PRESENT (AMX_COMPLEX);
CHECK_CPU_FEATURE_PRESENT (AESKLE);
CHECK_CPU_FEATURE_PRESENT (WIDE_KL);
CHECK_CPU_FEATURE_PRESENT (PTWRITE);
@@ -386,6 +387,7 @@ do_test (void)
CHECK_CPU_FEATURE_ACTIVE (AVX_IFMA);
CHECK_CPU_FEATURE_ACTIVE (AVX_VNNI_INT8);
CHECK_CPU_FEATURE_ACTIVE (AVX_NE_CONVERT);
+ CHECK_CPU_FEATURE_ACTIVE (AMX_COMPLEX);
CHECK_CPU_FEATURE_ACTIVE (AESKLE);
CHECK_CPU_FEATURE_ACTIVE (WIDE_KL);
CHECK_CPU_FEATURE_ACTIVE (PTWRITE);