/* { dg-do run } */
/* { dg-require-effective-target avx512er } */
/* { dg-options "-O2 -mavx512er" } */

#include "avx512er-check.h"
#include "avx512f-mask-type.h"
#include "avx512f-helper.h"
#include <math.h>

/* Write-mask constant handed to every masked intrinsic variant below.  */
#define IMM 0x23

/* Run-time check of the scalar single-precision rsqrt28 intrinsics.

   Builds two 4-float inputs, computes a reference whose element 0 is
   1 / sqrt (src2[0]) and whose remaining elements are copied from src1,
   then compares that reference against the plain, merge-masked and
   zero-masked intrinsic variants.  Any mismatch reported by checkVf
   terminates the test through abort ().

   Takes no arguments and returns nothing; presumably invoked by the
   driver in avx512er-check.h (not visible from this file).  */
static void
avx512er_test (void)
{
  union128 src1, src2, res, res1, res2, res3, res4;
  float res_ref[4];
  MASK_TYPE mask = MASK_VALUE;
  int i;

  /* Fill both inputs; the reference starts out as a copy of src1.  */
  for (i = 0; i < 4; i++)
    {
      src1.a[i] = 179.345 - 6.5645 * i;
      src2.a[i] = 179221345 + 6.5645 * i;
      res_ref[i] = src1.a[i];
    }

  /* Only element 0 carries the computed reciprocal square root.  */
  res_ref[0] = 1.0 / sqrt (src2.a[0]);

  /* Unmasked variant with an explicit rounding/exception argument.  */
  res.x = _mm_rsqrt28_round_ss (src1.x, src2.x, _MM_FROUND_NO_EXC);

  /* Merge-masking variants, with src1 as the pass-through operand.  */
  res1.x = _mm_mask_rsqrt28_ss (src1.x, IMM, src1.x, src2.x);
  res2.x = _mm_mask_rsqrt28_round_ss (src1.x, IMM, src1.x, src2.x,
				      _MM_FROUND_TO_NEAREST_INT
				      | _MM_FROUND_NO_EXC);

  /* Zero-masking variants.  */
  res3.x = _mm_maskz_rsqrt28_ss (IMM, src1.x, src2.x);
  res4.x = _mm_maskz_rsqrt28_round_ss (IMM, src1.x, src2.x,
				       _MM_FROUND_TO_NEAREST_INT
				       | _MM_FROUND_NO_EXC);

  /* The unmasked result is compared over all four elements.  */
  if (checkVf (res.a, res_ref, 4))
    abort ();

  /* NOTE(review): the intrinsics above are masked with IMM, while the
     reference is adjusted with `mask' (MASK_VALUE, defined in a header
     not visible here).  The comparisons below are only meaningful if
     the two agree on the mask bit(s) the scalar operation consults --
     confirm against avx512f-mask-type.h.  */

  /* MASK_MERGE () presumably expands to the float merge-masking helper
     from avx512f-helper.h; it is applied to the first element only.  */
  MASK_MERGE () (res_ref, mask, 1);

  if (checkVf (res1.a, res_ref, 2))
    abort ();

  if (checkVf (res2.a, res_ref, 2))
    abort ();

  /* Likewise for the zero-masking helper.  */
  MASK_ZERO () (res_ref, mask, 1);

  if (checkVf (res3.a, res_ref, 2))
    abort ();

  if (checkVf (res4.a, res_ref, 2))
    abort ();
}