aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorKyrylo Tkachov <kyrylo.tkachov@arm.com>2023-04-23 14:44:13 +0100
committerKyrylo Tkachov <kyrylo.tkachov@arm.com>2023-04-23 14:44:13 +0100
commit7e26fd6bcd39f53bc917f55f8cce6101180c1dcd (patch)
tree2f05b9206b2a8d47ec5965239c07be5235aef965
parent3b13c59c835f92b353ef318398e39907cdeec4fa (diff)
downloadgcc-7e26fd6bcd39f53bc917f55f8cce6101180c1dcd.zip
gcc-7e26fd6bcd39f53bc917f55f8cce6101180c1dcd.tar.gz
gcc-7e26fd6bcd39f53bc917f55f8cce6101180c1dcd.tar.bz2
aarch64: Annotate fcvtn pattern for vec_concat with zeroes
Using the define_substs in aarch64-simd.md this is a straightforward annotation to remove a redundant fmov insn. So the codegen goes from: foo_d: fcvtn v0.2s, v0.2d fmov d0, d0 ret to the simple: foo_d: fcvtn v0.2s, v0.2d ret Bootstrapped and tested on aarch64-none-linux-gnu. gcc/ChangeLog: * config/aarch64/aarch64-simd.md (aarch64_float_truncate_lo_): Rename to... (aarch64_float_truncate_lo_<mode><vczle><vczbe>): ... This. gcc/testsuite/ChangeLog: * gcc.target/aarch64/float_truncate_zero.c: New test.
-rw-r--r--gcc/config/aarch64/aarch64-simd.md2
-rw-r--r--gcc/testsuite/gcc.target/aarch64/float_truncate_zero.c32
2 files changed, 33 insertions, 1 deletions
diff --git a/gcc/config/aarch64/aarch64-simd.md b/gcc/config/aarch64/aarch64-simd.md
index 4a1ec71..7bd4362 100644
--- a/gcc/config/aarch64/aarch64-simd.md
+++ b/gcc/config/aarch64/aarch64-simd.md
@@ -3331,7 +3331,7 @@
}
)
-(define_insn "aarch64_float_truncate_lo_<mode>"
+(define_insn "aarch64_float_truncate_lo_<mode><vczle><vczbe>"
[(set (match_operand:VDF 0 "register_operand" "=w")
(float_truncate:VDF
(match_operand:<VWIDE> 1 "register_operand" "w")))]
diff --git a/gcc/testsuite/gcc.target/aarch64/float_truncate_zero.c b/gcc/testsuite/gcc.target/aarch64/float_truncate_zero.c
new file mode 100644
index 0000000..41775d1
--- /dev/null
+++ b/gcc/testsuite/gcc.target/aarch64/float_truncate_zero.c
@@ -0,0 +1,32 @@
+/* { dg-do compile } */
+/* { dg-additional-options "--save-temps -O1" } */
+/* { dg-final { check-function-bodies "**" "" "" } } */
+
+#include <arm_neon.h>
+
+/*
+** foo:
+** fcvtn v0.4h, v0.4s
+** ret
+*/
+
+float16x8_t
+foo (float32x4_t a)
+{
+ float16x4_t b = vcvt_f16_f32 (a);
+ return vcombine_f16 (b, vdup_n_f16 (0.0));
+}
+
+/*
+** foo_d:
+** fcvtn v0.2s, v0.2d
+** ret
+*/
+
+float32x4_t
+foo_d (float64x2_t a)
+{
+ float32x2_t b = vcvt_f32_f64 (a);
+ return vcombine_f32 (b, vdup_n_f32 (0.0));
+}
+