diff options
author | Matthias Kretz <m.kretz@gsi.de> | 2024-03-27 08:49:43 +0100 |
---|---|---|
committer | Matthias Kretz <m.kretz@gsi.de> | 2024-05-10 16:06:51 +0200 |
commit | f0b7583dab56c78824344e00eb6230eaaeb09a44 (patch) | |
tree | 5066aa5619b4e333bfc53607fe2dfb2b9d026de0 | |
parent | 4190a95cb837c5d221d9c5677f49f3c7d4d5576f (diff) | |
download | gcc-f0b7583dab56c78824344e00eb6230eaaeb09a44.zip gcc-f0b7583dab56c78824344e00eb6230eaaeb09a44.tar.gz gcc-f0b7583dab56c78824344e00eb6230eaaeb09a44.tar.bz2 |
libstdc++: Fix call signature of builtins from masked ++/--
This resolves failures in the "expensive" where-* test of check-simd
when targeting AVX-512.
Signed-off-by: Matthias Kretz <m.kretz@gsi.de>
libstdc++-v3/ChangeLog:
* include/experimental/bits/simd_x86.h (_S_masked_unary): Call
the 128- and 256-bit variants of __builtin_ia32_subp[ds] (4- and 8-byte
elements) without a rounding direction argument; only the 512-bit variants take one.
(cherry picked from commit 0ac2c0f0687b321ab54de271d788b4e0a287b4e2)
-rw-r--r-- | libstdc++-v3/include/experimental/bits/simd_x86.h | 12 |
1 file changed, 9 insertions, 3 deletions
diff --git a/libstdc++-v3/include/experimental/bits/simd_x86.h b/libstdc++-v3/include/experimental/bits/simd_x86.h index 2e7ea23..fb0d697 100644 --- a/libstdc++-v3/include/experimental/bits/simd_x86.h +++ b/libstdc++-v3/include/experimental/bits/simd_x86.h @@ -3537,17 +3537,23 @@ template <typename _Abi> } else { -#define _GLIBCXX_SIMD_MASK_SUB(_Sizeof, _Width, _Instr) \ +#define _GLIBCXX_SIMD_MASK_SUB_512(_Sizeof, _Width, _Instr) \ if constexpr (sizeof(_Tp) == _Sizeof && sizeof(__v) == _Width) \ return __builtin_ia32_##_Instr##_mask( \ __v._M_data, __vector_broadcast<_Np>(_Tp(__pm_one)), __v._M_data, \ __k._M_data, _MM_FROUND_CUR_DIRECTION) - _GLIBCXX_SIMD_MASK_SUB(4, 64, subps512); +#define _GLIBCXX_SIMD_MASK_SUB(_Sizeof, _Width, _Instr) \ + if constexpr (sizeof(_Tp) == _Sizeof && sizeof(__v) == _Width) \ + return __builtin_ia32_##_Instr##_mask( \ + __v._M_data, __vector_broadcast<_Np>(_Tp(__pm_one)), __v._M_data, \ + __k._M_data) + _GLIBCXX_SIMD_MASK_SUB_512(4, 64, subps512); _GLIBCXX_SIMD_MASK_SUB(4, 32, subps256); _GLIBCXX_SIMD_MASK_SUB(4, 16, subps128); - _GLIBCXX_SIMD_MASK_SUB(8, 64, subpd512); + _GLIBCXX_SIMD_MASK_SUB_512(8, 64, subpd512); _GLIBCXX_SIMD_MASK_SUB(8, 32, subpd256); _GLIBCXX_SIMD_MASK_SUB(8, 16, subpd128); +#undef _GLIBCXX_SIMD_MASK_SUB_512 #undef _GLIBCXX_SIMD_MASK_SUB } #endif // __clang__ |