aboutsummaryrefslogtreecommitdiff
path: root/gcc
diff options
context:
space:
mode:
author Ayan Shafqat <ayan.x.shafqat@gmail.com> 2025-05-01 06:17:30 -0700
committer Kyrylo Tkachov <ktkachov@nvidia.com> 2025-05-01 15:44:28 +0200
commit 05df554536a8d33f4c438cfc7b006b3b2083246a (patch)
tree 9516f4d5607fe338a68352d1a0ed92d6aecf1a12 /gcc
parent 5c917a585d765b0878afd9435e3b3eece9f820f9 (diff)
download gcc-05df554536a8d33f4c438cfc7b006b3b2083246a.zip
gcc-05df554536a8d33f4c438cfc7b006b3b2083246a.tar.gz
gcc-05df554536a8d33f4c438cfc7b006b3b2083246a.tar.bz2
Aarch64: Add __sqrt and __sqrtf intrinsics and corresponding tests
This patch introduces two new inline functions, __sqrt and __sqrtf, in arm_acle.h for AArch64 targets. These functions wrap the new builtins __builtin_aarch64_sqrtdf and __builtin_aarch64_sqrtsf, respectively, providing direct access to hardware instructions without relying on the standard math library or optimization levels.

This patch also introduces acle_sqrt.c in the AArch64 testsuite, verifying that the new __sqrt and __sqrtf intrinsics emit the expected fsqrt instructions for double and float arguments.

Coverage for new intrinsics ensures that __sqrt and __sqrtf are correctly expanded to hardware instructions and do not fall back to library calls, regardless of optimization levels.

gcc/ChangeLog:

* config/aarch64/arm_acle.h (__sqrt, __sqrtf): New functions.

gcc/testsuite/ChangeLog:

* gcc.target/aarch64/acle/acle_sqrt.c: New test.

Signed-off-by: Ayan Shafqat <ayan.x.shafqat@gmail.com>
Diffstat (limited to 'gcc')
-rw-r--r-- gcc/config/aarch64/arm_acle.h | 14
-rw-r--r-- gcc/testsuite/gcc.target/aarch64/acle/acle_sqrt.c | 19
2 files changed, 33 insertions, 0 deletions
diff --git a/gcc/config/aarch64/arm_acle.h b/gcc/config/aarch64/arm_acle.h
index d9e2401..507b6e7 100644
--- a/gcc/config/aarch64/arm_acle.h
+++ b/gcc/config/aarch64/arm_acle.h
@@ -118,6 +118,20 @@ __revl (unsigned long __value)
return __rev (__value);
}
+__extension__ extern __inline double
+__attribute__ ((__always_inline__, __gnu_inline__, __artificial__))
+__sqrt (double __x)
+{
+ return __builtin_aarch64_sqrtdf (__x);
+}
+
+__extension__ extern __inline float
+__attribute__ ((__always_inline__, __gnu_inline__, __artificial__))
+__sqrtf (float __x)
+{
+ return __builtin_aarch64_sqrtsf (__x);
+}
+
#pragma GCC push_options
#pragma GCC target ("+nothing+jscvt")
__extension__ extern __inline int32_t
diff --git a/gcc/testsuite/gcc.target/aarch64/acle/acle_sqrt.c b/gcc/testsuite/gcc.target/aarch64/acle/acle_sqrt.c
new file mode 100644
index 0000000..482351f
--- /dev/null
+++ b/gcc/testsuite/gcc.target/aarch64/acle/acle_sqrt.c
@@ -0,0 +1,19 @@
+/* { dg-do compile } */
+/* { dg-options "-O2" } */
+
+#include "arm_acle.h"
+
+double
+test_acle_sqrt (double x)
+{
+ return __sqrt (x);
+}
+
+float
+test_acle_sqrtf (float x)
+{
+ return __sqrtf (x);
+}
+
+/* { dg-final { scan-assembler-times "fsqrt\td\[0-9\]" 1 } } */
+/* { dg-final { scan-assembler-times "fsqrt\ts\[0-9\]" 1 } } */