aboutsummaryrefslogtreecommitdiff
path: root/gcc
diff options
context:
space:
mode:
author: Jonathan Wright <jonathan.wright@arm.com>, 2021-11-08 17:31:30 +0000
committer: Jonathan Wright <jonathan.wright@arm.com>, 2021-11-11 15:34:49 +0000
commit: a2590b545ee76867f3843749e38233f2887ce3ad (patch)
tree: 2208c23ef9c296bec56f855a9fcd03b475b31a49 /gcc
parent: 515ef83098325e9e3b9f7e74b11911fb9ef6daf2 (diff)
downloadgcc-a2590b545ee76867f3843749e38233f2887ce3ad.zip
gcc-a2590b545ee76867f3843749e38233f2887ce3ad.tar.gz
gcc-a2590b545ee76867f3843749e38233f2887ce3ad.tar.bz2
aarch64: Use type-qualified builtins for PMUL[L] Neon intrinsics
Declare poly type-qualified builtins and use them for PMUL[L] Neon
intrinsics. This removes the need for casts in arm_neon.h.

gcc/ChangeLog:

2021-11-08  Jonathan Wright  <jonathan.wright@arm.com>

	* config/aarch64/aarch64-simd-builtins.def: Use poly type
	qualifier in builtin generator macros.
	* config/aarch64/arm_neon.h (vmul_p8): Use type-qualified
	builtin and remove casts.
	(vmulq_p8): Likewise.
	(vmull_high_p8): Likewise.
	(vmull_p8): Likewise.
Diffstat (limited to 'gcc')
-rw-r--r--  gcc/config/aarch64/aarch64-simd-builtins.def  6
-rw-r--r--  gcc/config/aarch64/arm_neon.h  12
2 files changed, 7 insertions, 11 deletions
diff --git a/gcc/config/aarch64/aarch64-simd-builtins.def b/gcc/config/aarch64/aarch64-simd-builtins.def
index c39f172..4e298de 100644
--- a/gcc/config/aarch64/aarch64-simd-builtins.def
+++ b/gcc/config/aarch64/aarch64-simd-builtins.def
@@ -45,9 +45,9 @@
BUILTIN_VDC (COMBINE, combine, 0, AUTO_FP)
VAR1 (COMBINEP, combine, 0, NONE, di)
- BUILTIN_VB (BINOP, pmul, 0, NONE)
- VAR1 (BINOP, pmull, 0, NONE, v8qi)
- VAR1 (BINOP, pmull_hi, 0, NONE, v16qi)
+ BUILTIN_VB (BINOPP, pmul, 0, NONE)
+ VAR1 (BINOPP, pmull, 0, NONE, v8qi)
+ VAR1 (BINOPP, pmull_hi, 0, NONE, v16qi)
BUILTIN_VHSDF_HSDF (BINOP, fmulx, 0, FP)
BUILTIN_VHSDF_DF (UNOP, sqrt, 2, FP)
BUILTIN_VDQ_I (BINOP, addp, 0, NONE)
diff --git a/gcc/config/aarch64/arm_neon.h b/gcc/config/aarch64/arm_neon.h
index 538fc3c..2363587 100644
--- a/gcc/config/aarch64/arm_neon.h
+++ b/gcc/config/aarch64/arm_neon.h
@@ -1007,8 +1007,7 @@ __extension__ extern __inline poly8x8_t
__attribute__ ((__always_inline__, __gnu_inline__, __artificial__))
vmul_p8 (poly8x8_t __a, poly8x8_t __b)
{
- return (poly8x8_t) __builtin_aarch64_pmulv8qi ((int8x8_t) __a,
- (int8x8_t) __b);
+ return __builtin_aarch64_pmulv8qi_ppp (__a, __b);
}
__extension__ extern __inline int8x16_t
@@ -1071,8 +1070,7 @@ __extension__ extern __inline poly8x16_t
__attribute__ ((__always_inline__, __gnu_inline__, __artificial__))
vmulq_p8 (poly8x16_t __a, poly8x16_t __b)
{
- return (poly8x16_t) __builtin_aarch64_pmulv16qi ((int8x16_t) __a,
- (int8x16_t) __b);
+ return __builtin_aarch64_pmulv16qi_ppp (__a, __b);
}
__extension__ extern __inline int8x8_t
@@ -7716,8 +7714,7 @@ __extension__ extern __inline poly16x8_t
__attribute__ ((__always_inline__, __gnu_inline__, __artificial__))
vmull_high_p8 (poly8x16_t __a, poly8x16_t __b)
{
- return (poly16x8_t) __builtin_aarch64_pmull_hiv16qi ((int8x16_t) __a,
- (int8x16_t) __b);
+ return __builtin_aarch64_pmull_hiv16qi_ppp (__a, __b);
}
__extension__ extern __inline int16x8_t
@@ -7850,8 +7847,7 @@ __extension__ extern __inline poly16x8_t
__attribute__ ((__always_inline__, __gnu_inline__, __artificial__))
vmull_p8 (poly8x8_t __a, poly8x8_t __b)
{
- return (poly16x8_t) __builtin_aarch64_pmullv8qi ((int8x8_t) __a,
- (int8x8_t) __b);
+ return __builtin_aarch64_pmullv8qi_ppp (__a, __b);
}
__extension__ extern __inline int16x8_t