about | summary | refs | log | tree | commit | diff
path: root/gcc/testsuite
diff options
context:
space:
mode:
author: Ilya Verbin <ilya.verbin@intel.com> 2016-06-21 14:38:02 +0000
committer: Ilya Verbin <iverbin@gcc.gnu.org> 2016-06-21 14:38:02 +0000
commit: 3b9bc511ee48c7c2e868baaa48f02e7e7e115ce7 (patch)
tree: 472112598083fd9265e7e97a3fe19079b8d23fcb /gcc/testsuite
parent: 21db1c786740b7de9e375f0dd54f78eaa4aa2339 (diff)
download: gcc-3b9bc511ee48c7c2e868baaa48f02e7e7e115ce7.zip
gcc-3b9bc511ee48c7c2e868baaa48f02e7e7e115ce7.tar.gz
gcc-3b9bc511ee48c7c2e868baaa48f02e7e7e115ce7.tar.bz2
[AVX-512ER] vrsqrt28ps auto generation
gcc/
	* config/i386/i386.c (ix86_emit_swsqrtsf): Emit vrsqrt28ps.
	* config/i386/sse.md (define_expand "rsqrtv16sf2"): New.

gcc/testsuite/
	* gcc.target/i386/avx512er-vrsqrt28ps-3.c: New test.
	* gcc.target/i386/avx512er-vrsqrt28ps-4.c: New test.
	* gcc.target/i386/avx512er-vrsqrt28ps-5.c: New test.
	* gcc.target/i386/avx512er-vrsqrt28ps-6.c: New test.

From-SVN: r237649
Diffstat (limited to 'gcc/testsuite')
-rw-r--r-- gcc/testsuite/ChangeLog | 7
-rw-r--r-- gcc/testsuite/gcc.target/i386/avx512er-vrsqrt28ps-3.c | 47
-rw-r--r-- gcc/testsuite/gcc.target/i386/avx512er-vrsqrt28ps-4.c | 7
-rw-r--r-- gcc/testsuite/gcc.target/i386/avx512er-vrsqrt28ps-5.c | 47
-rw-r--r-- gcc/testsuite/gcc.target/i386/avx512er-vrsqrt28ps-6.c | 7
5 files changed, 115 insertions, 0 deletions
diff --git a/gcc/testsuite/ChangeLog b/gcc/testsuite/ChangeLog
index cff25cc..461665e 100644
--- a/gcc/testsuite/ChangeLog
+++ b/gcc/testsuite/ChangeLog
@@ -1,5 +1,12 @@
2016-06-21 Ilya Verbin <ilya.verbin@intel.com>
+ * gcc.target/i386/avx512er-vrsqrt28ps-3.c: New test.
+ * gcc.target/i386/avx512er-vrsqrt28ps-4.c: New test.
+ * gcc.target/i386/avx512er-vrsqrt28ps-5.c: New test.
+ * gcc.target/i386/avx512er-vrsqrt28ps-6.c: New test.
+
+2016-06-21 Ilya Verbin <ilya.verbin@intel.com>
+
* gcc.target/i386/avx512er-vrcp28ps-3.c: New test.
* gcc.target/i386/avx512er-vrcp28ps-4.c: New test.
diff --git a/gcc/testsuite/gcc.target/i386/avx512er-vrsqrt28ps-3.c b/gcc/testsuite/gcc.target/i386/avx512er-vrsqrt28ps-3.c
new file mode 100644
index 0000000..1ba8172
--- /dev/null
+++ b/gcc/testsuite/gcc.target/i386/avx512er-vrsqrt28ps-3.c
@@ -0,0 +1,47 @@
+/* { dg-do run } */
+/* { dg-require-effective-target avx512er } */
+/* { dg-options "-O2 -ffast-math -ftree-vectorize -mavx512er" } */
+
+#include <math.h>
+#include "avx512er-check.h"
+
+#define MAX 1000
+#define EPS 0.00001
+
+__attribute__ ((noinline, optimize (1)))
+void static
+compute_rsqrt_ref (float *a, float *r)
+{
+ for (int i = 0; i < MAX; i++)
+ r[i] = 1.0 / sqrtf (a[i]);
+}
+
+__attribute__ ((noinline))
+void static
+compute_rsqrt_exp (float *a, float *r)
+{
+ for (int i = 0; i < MAX; i++)
+ r[i] = 1.0 / sqrtf (a[i]);
+}
+
+void static
+avx512er_test (void)
+{
+ float in[MAX];
+ float ref[MAX];
+ float exp[MAX];
+
+ for (int i = 0; i < MAX; i++)
+ in[i] = 8765.987 - 8.6756 * i;
+
+ compute_rsqrt_ref (in, ref);
+ compute_rsqrt_exp (in, exp);
+
+ for (int i = 0; i < MAX; i++)
+ {
+ float rel_err = (ref[i] - exp[i]) / ref[i];
+ rel_err = rel_err > 0.0 ? rel_err : -rel_err;
+ if (rel_err > EPS)
+ abort ();
+ }
+}
diff --git a/gcc/testsuite/gcc.target/i386/avx512er-vrsqrt28ps-4.c b/gcc/testsuite/gcc.target/i386/avx512er-vrsqrt28ps-4.c
new file mode 100644
index 0000000..2f5f73f
--- /dev/null
+++ b/gcc/testsuite/gcc.target/i386/avx512er-vrsqrt28ps-4.c
@@ -0,0 +1,7 @@
+/* { dg-do compile } */
+/* { dg-options "-O2 -ffast-math -ftree-vectorize -mavx512er" } */
+
+#include "avx512er-vrsqrt28ps-3.c"
+
+/* { dg-final { scan-assembler-times "vrsqrt28ps\[^\n\r\]*zmm\[0-9\]+(?:\n|\[ \\t\]+#)" 1 } } */
+/* { dg-final { scan-assembler-not "vrcp28ps\[^\n\r\]*zmm\[0-9\]+(?:\n|\[ \\t\]+#)" } } */
diff --git a/gcc/testsuite/gcc.target/i386/avx512er-vrsqrt28ps-5.c b/gcc/testsuite/gcc.target/i386/avx512er-vrsqrt28ps-5.c
new file mode 100644
index 0000000..e067a81
--- /dev/null
+++ b/gcc/testsuite/gcc.target/i386/avx512er-vrsqrt28ps-5.c
@@ -0,0 +1,47 @@
+/* { dg-do run } */
+/* { dg-require-effective-target avx512er } */
+/* { dg-options "-O2 -ffast-math -ftree-vectorize -mavx512er" } */
+
+#include <math.h>
+#include "avx512er-check.h"
+
+#define MAX 1000
+#define EPS 0.00001
+
+__attribute__ ((noinline, optimize (1)))
+void static
+compute_sqrt_ref (float *a, float *r)
+{
+ for (int i = 0; i < MAX; i++)
+ r[i] = sqrtf (a[i]);
+}
+
+__attribute__ ((noinline))
+void static
+compute_sqrt_exp (float *a, float *r)
+{
+ for (int i = 0; i < MAX; i++)
+ r[i] = sqrtf (a[i]);
+}
+
+void static
+avx512er_test (void)
+{
+ float in[MAX];
+ float ref[MAX];
+ float exp[MAX];
+
+ for (int i = 0; i < MAX; i++)
+ in[i] = 8765.987 - 8.6756 * i;
+
+ compute_sqrt_ref (in, ref);
+ compute_sqrt_exp (in, exp);
+
+ for (int i = 0; i < MAX; i++)
+ {
+ float rel_err = (ref[i] - exp[i]) / ref[i];
+ rel_err = rel_err > 0.0 ? rel_err : -rel_err;
+ if (rel_err > EPS)
+ abort ();
+ }
+}
diff --git a/gcc/testsuite/gcc.target/i386/avx512er-vrsqrt28ps-6.c b/gcc/testsuite/gcc.target/i386/avx512er-vrsqrt28ps-6.c
new file mode 100644
index 0000000..77c5cba
--- /dev/null
+++ b/gcc/testsuite/gcc.target/i386/avx512er-vrsqrt28ps-6.c
@@ -0,0 +1,7 @@
+/* { dg-do compile } */
+/* { dg-options "-O2 -ffast-math -ftree-vectorize -mavx512er" } */
+
+#include "avx512er-vrsqrt28ps-5.c"
+
+/* { dg-final { scan-assembler-times "vrsqrt28ps\[^\n\r\]*zmm\[0-9\]+(?:\n|\[ \\t\]+#)" 1 } } */
+/* { dg-final { scan-assembler-times "vrcp28ps\[^\n\r\]*zmm\[0-9\]+(?:\n|\[ \\t\]+#)" 1 } } */