about | summary | refs | log | tree | commit | diff
path: root/gcc
diff options
context:
space:
mode:
author: dianhong xu <dianhong.xu@intel.com> 2021-10-09 18:23:35 +0800
committer: Hongyu Wang <hongyu.wang@intel.com> 2021-10-19 14:48:21 +0800
commit: 38f6ee6bfc4633175ca6f6d29e597d379ccae820 (patch)
tree: a55886fa80906d79deb2dfe288703fbb2bc2d867 /gcc
parent: ce4d1f632ff3f680550d3b186b60176022f41190 (diff)
download: gcc-38f6ee6bfc4633175ca6f6d29e597d379ccae820.zip
          gcc-38f6ee6bfc4633175ca6f6d29e597d379ccae820.tar.gz
          gcc-38f6ee6bfc4633175ca6f6d29e597d379ccae820.tar.bz2
AVX512FP16: Add *_set1_pch intrinsics.
Add *_set1_pch (_Float16 _Complex A) intrinsics.

gcc/ChangeLog:

	* config/i386/avx512fp16intrin.h: (_mm512_set1_pch): New intrinsic.
	* config/i386/avx512fp16vlintrin.h: (_mm256_set1_pch): New intrinsic.
	(_mm_set1_pch): Ditto.

gcc/testsuite/ChangeLog:

	* gcc.target/i386/avx512fp16-set1-pch-1a.c: New test.
	* gcc.target/i386/avx512fp16-set1-pch-1b.c: New test.
	* gcc.target/i386/avx512fp16vl-set1-pch-1a.c: New test.
	* gcc.target/i386/avx512fp16vl-set1-pch-1b.c: New test.
Diffstat (limited to 'gcc')
-rw-r--r-- gcc/config/i386/avx512fp16intrin.h | 13
-rw-r--r-- gcc/config/i386/avx512fp16vlintrin.h | 26
-rw-r--r-- gcc/testsuite/gcc.target/i386/avx512fp16-set1-pch-1a.c | 13
-rw-r--r-- gcc/testsuite/gcc.target/i386/avx512fp16-set1-pch-1b.c | 42
-rw-r--r-- gcc/testsuite/gcc.target/i386/avx512fp16vl-set1-pch-1a.c | 20
-rw-r--r-- gcc/testsuite/gcc.target/i386/avx512fp16vl-set1-pch-1b.c | 57
6 files changed, 171 insertions, 0 deletions
diff --git a/gcc/config/i386/avx512fp16intrin.h b/gcc/config/i386/avx512fp16intrin.h
index 5e49447..44c5e24 100644
--- a/gcc/config/i386/avx512fp16intrin.h
+++ b/gcc/config/i386/avx512fp16intrin.h
@@ -7149,6 +7149,19 @@ _mm512_permutexvar_ph (__m512i __A, __m512h __B)
(__mmask32)-1);
}
+extern __inline __m512h
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
+_mm512_set1_pch (_Float16 _Complex __A)
+{
+ union
+ {
+ _Float16 _Complex a;
+ float b;
+ } u = { .a = __A};
+
+ return (__m512h) _mm512_set1_ps (u.b);
+}
+
#ifdef __DISABLE_AVX512FP16__
#undef __DISABLE_AVX512FP16__
#pragma GCC pop_options
diff --git a/gcc/config/i386/avx512fp16vlintrin.h b/gcc/config/i386/avx512fp16vlintrin.h
index 0b1f1cb..11f34bb 100644
--- a/gcc/config/i386/avx512fp16vlintrin.h
+++ b/gcc/config/i386/avx512fp16vlintrin.h
@@ -3311,6 +3311,32 @@ _mm_permutexvar_ph (__m128i __A, __m128h __B)
(__mmask8)-1);
}
+extern __inline __m256h
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
+_mm256_set1_pch (_Float16 _Complex __A)
+{
+ union
+ {
+ _Float16 _Complex a;
+ float b;
+ } u = { .a = __A };
+
+ return (__m256h) _mm256_set1_ps (u.b);
+}
+
+extern __inline __m128h
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
+_mm_set1_pch (_Float16 _Complex __A)
+{
+ union
+ {
+ _Float16 _Complex a;
+ float b;
+ } u = { .a = __A };
+
+ return (__m128h) _mm_set1_ps (u.b);
+}
+
#ifdef __DISABLE_AVX512FP16VL__
#undef __DISABLE_AVX512FP16VL__
#pragma GCC pop_options
diff --git a/gcc/testsuite/gcc.target/i386/avx512fp16-set1-pch-1a.c b/gcc/testsuite/gcc.target/i386/avx512fp16-set1-pch-1a.c
new file mode 100644
index 0000000..0055193
--- /dev/null
+++ b/gcc/testsuite/gcc.target/i386/avx512fp16-set1-pch-1a.c
@@ -0,0 +1,13 @@
+/* { dg-do compile} */
+/* { dg-options "-O2 -mavx512fp16" } */
+
+#include <immintrin.h>
+
+__m512h
+__attribute__ ((noinline, noclone))
+test_mm512_set1_pch (_Float16 _Complex A)
+{
+ return _mm512_set1_pch(A);
+}
+
+/* { dg-final { scan-assembler "vbroadcastss\[ \\t\]+\[^\n\r\]*%zmm\[01\]" } } */
diff --git a/gcc/testsuite/gcc.target/i386/avx512fp16-set1-pch-1b.c b/gcc/testsuite/gcc.target/i386/avx512fp16-set1-pch-1b.c
new file mode 100644
index 0000000..450d7e3
--- /dev/null
+++ b/gcc/testsuite/gcc.target/i386/avx512fp16-set1-pch-1b.c
@@ -0,0 +1,42 @@
+/* { dg-do run { target avx512fp16 } } */
+/* { dg-options "-O2 -mavx512fp16" } */
+
+#include<stdio.h>
+#include <math.h>
+#include <complex.h>
+
+static void do_test (void);
+
+#define DO_TEST do_test
+#define AVX512FP16
+
+#include <immintrin.h>
+#include "avx512-check.h"
+
+static void
+do_test (void)
+{
+ _Float16 _Complex fc = 1.0 + 1.0*I;
+ union
+ {
+ _Float16 _Complex a;
+ float b;
+ } u = { .a = fc };
+ float ff= u.b;
+
+ typedef union
+ {
+ float fp[16];
+ __m512h m512h;
+ } u1;
+
+ __m512h test512 = _mm512_set1_pch(fc);
+
+ u1 test;
+ test.m512h = test512;
+ for (int i = 0; i<16; i++)
+ {
+ if (test.fp[i] != ff) abort();
+ }
+
+}
diff --git a/gcc/testsuite/gcc.target/i386/avx512fp16vl-set1-pch-1a.c b/gcc/testsuite/gcc.target/i386/avx512fp16vl-set1-pch-1a.c
new file mode 100644
index 0000000..4c5624f
--- /dev/null
+++ b/gcc/testsuite/gcc.target/i386/avx512fp16vl-set1-pch-1a.c
@@ -0,0 +1,20 @@
+/* { dg-do compile} */
+/* { dg-options "-O2 -mavx512fp16 -mavx512vl" } */
+
+#include <immintrin.h>
+
+__m256h
+__attribute__ ((noinline, noclone))
+test_mm256_set1_pch (_Float16 _Complex A)
+{
+ return _mm256_set1_pch(A);
+}
+
+__m128h
+__attribute__ ((noinline, noclone))
+test_mm_set1_pch (_Float16 _Complex A)
+{
+ return _mm_set1_pch(A);
+}
+
+/* { dg-final { scan-assembler-times "vbroadcastss" 2 } } */
diff --git a/gcc/testsuite/gcc.target/i386/avx512fp16vl-set1-pch-1b.c b/gcc/testsuite/gcc.target/i386/avx512fp16vl-set1-pch-1b.c
new file mode 100644
index 0000000..aebff14
--- /dev/null
+++ b/gcc/testsuite/gcc.target/i386/avx512fp16vl-set1-pch-1b.c
@@ -0,0 +1,57 @@
+/* { dg-do run { target avx512fp16 } } */
+/* { dg-options "-O2 -mavx512fp16 -mavx512vl" } */
+
+#include<stdio.h>
+#include <math.h>
+#include <complex.h>
+
+static void do_test (void);
+
+#define DO_TEST do_test
+#define AVX512FP16
+
+#include <immintrin.h>
+#include "avx512-check.h"
+
+static void
+do_test (void)
+{
+ _Float16 _Complex fc = 1.0 + 1.0*I;
+ union
+ {
+ _Float16 _Complex a;
+ float b;
+ } u = { .a = fc };
+ float ff= u.b;
+
+ typedef union
+ {
+ float fp[8];
+ __m256h m256h;
+ } u1;
+
+ __m256h test256 = _mm256_set1_pch(fc);
+
+ u1 test1;
+ test1.m256h = test256;
+ for (int i = 0; i<8; i++)
+ {
+ if (test1.fp[i] != ff) abort();
+ }
+
+ typedef union
+ {
+ float fp[4];
+ __m128h m128h;
+ } u2;
+
+ __m128h test128 = _mm_set1_pch(fc);
+
+ u2 test2;
+ test2.m128h = test128;
+ for (int i = 0; i<4; i++)
+ {
+ if (test2.fp[i] != ff) abort();
+ }
+
+}