aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorKyrylo Tkachov <kyrylo.tkachov@arm.com>2017-06-02 15:03:54 +0000
committerKyrylo Tkachov <ktkachov@gcc.gnu.org>2017-06-02 15:03:54 +0000
commitb160939bf3cd072e1c7a05bbbe221040f7670df2 (patch)
treef3303171cd508a8bbc26bdd003e6c0b98368b77f
parentd65d1bd970c3008e70a6418d2fdaace3f4f2e581 (diff)
downloadgcc-b160939bf3cd072e1c7a05bbbe221040f7670df2.zip
gcc-b160939bf3cd072e1c7a05bbbe221040f7670df2.tar.gz
gcc-b160939bf3cd072e1c7a05bbbe221040f7670df2.tar.bz2
[AArch64] Add HF vector modes to lane-to-lane INS pattern
* config/aarch64/aarch64-simd.md (*aarch64_simd_vec_copy_lane<mode>): Use VALL_F16 iterator rather than VALL. * gcc.target/aarch64/hfmode_ins_1.c: New test. From-SVN: r248835
-rw-r--r--gcc/ChangeLog5
-rw-r--r--gcc/config/aarch64/aarch64-simd.md10
-rw-r--r--gcc/testsuite/ChangeLog4
-rw-r--r--gcc/testsuite/gcc.target/aarch64/hfmode_ins_1.c21
4 files changed, 35 insertions, 5 deletions
diff --git a/gcc/ChangeLog b/gcc/ChangeLog
index 345c3ec..079f1fd 100644
--- a/gcc/ChangeLog
+++ b/gcc/ChangeLog
@@ -10,6 +10,11 @@
2017-06-02 Kyrylo Tkachov <kyrylo.tkachov@arm.com>
+ * config/aarch64/aarch64-simd.md (*aarch64_simd_vec_copy_lane<mode>):
+ Use VALL_F16 iterator rather than VALL.
+
+2017-06-02 Kyrylo Tkachov <kyrylo.tkachov@arm.com>
+
* config/aarch64/aarch64.c (aarch64_split_compare_and_swap):
Emit CBNZ inside loop when doing a strong exchange and comparing
against zero. Generate the CC flags after the loop.
diff --git a/gcc/config/aarch64/aarch64-simd.md b/gcc/config/aarch64/aarch64-simd.md
index 6852f39..693b476 100644
--- a/gcc/config/aarch64/aarch64-simd.md
+++ b/gcc/config/aarch64/aarch64-simd.md
@@ -565,14 +565,14 @@
)
(define_insn "*aarch64_simd_vec_copy_lane<mode>"
- [(set (match_operand:VALL 0 "register_operand" "=w")
- (vec_merge:VALL
- (vec_duplicate:VALL
+ [(set (match_operand:VALL_F16 0 "register_operand" "=w")
+ (vec_merge:VALL_F16
+ (vec_duplicate:VALL_F16
(vec_select:<VEL>
- (match_operand:VALL 3 "register_operand" "w")
+ (match_operand:VALL_F16 3 "register_operand" "w")
(parallel
[(match_operand:SI 4 "immediate_operand" "i")])))
- (match_operand:VALL 1 "register_operand" "0")
+ (match_operand:VALL_F16 1 "register_operand" "0")
(match_operand:SI 2 "immediate_operand" "i")))]
"TARGET_SIMD"
{
diff --git a/gcc/testsuite/ChangeLog b/gcc/testsuite/ChangeLog
index fdd4a90..70a8335 100644
--- a/gcc/testsuite/ChangeLog
+++ b/gcc/testsuite/ChangeLog
@@ -8,6 +8,10 @@
2017-06-02 Kyrylo Tkachov <kyrylo.tkachov@arm.com>
+ * gcc.target/aarch64/hfmode_ins_1.c: New test.
+
+2017-06-02 Kyrylo Tkachov <kyrylo.tkachov@arm.com>
+
* gcc.target/aarch64/atomic_cmp_exchange_zero_strong_1.c: New test.
2017-06-02 Will Schmidt <will_schmidt@vnet.ibm.com>
diff --git a/gcc/testsuite/gcc.target/aarch64/hfmode_ins_1.c b/gcc/testsuite/gcc.target/aarch64/hfmode_ins_1.c
new file mode 100644
index 0000000..7fafe92
--- /dev/null
+++ b/gcc/testsuite/gcc.target/aarch64/hfmode_ins_1.c
@@ -0,0 +1,21 @@
+/* { dg-do compile } */
+/* { dg-options "-O2" } */
+
+/* Check that we can perform this in a single INS without doing any DUPs. */
+
+#include <arm_neon.h>
+
+float16x8_t
+foo (float16x8_t a, float16x8_t b)
+{
+ return vsetq_lane_f16 (vgetq_lane_f16 (b, 2), a, 3);
+}
+
+float16x4_t
+bar (float16x4_t a, float16x4_t b)
+{
+ return vset_lane_f16 (vget_lane_f16 (b, 2), a, 3);
+}
+
+/* { dg-final { scan-assembler-times "ins\\t" 2 } } */
+/* { dg-final { scan-assembler-not "dup\\t" } } */