diff options
author | Sam Tebbs <sam.tebbs@arm.com> | 2018-08-01 10:10:28 +0000 |
---|---|---|
committer | Sudakshina Das <sudi@gcc.gnu.org> | 2018-08-01 10:10:28 +0000 |
commit | 00d29b97d9ed9af957f896b8279ae85d2e16deb4 (patch) | |
tree | ff15f38944d8bdba046eb54e983eb995d16e0557 | |
parent | 5922dcb5cc82f48862cd42bd84e3c85733cac0ce (diff) | |
download | gcc-00d29b97d9ed9af957f896b8279ae85d2e16deb4.zip gcc-00d29b97d9ed9af957f896b8279ae85d2e16deb4.tar.gz gcc-00d29b97d9ed9af957f896b8279ae85d2e16deb4.tar.bz2 |
[PATCH][AArch64] Stop redundant zero-extension after UMOV when in DI mode
This patch extends the aarch64_get_lane_zero_extendsi instruction
definition to also cover DI mode. This prevents a redundant AND
instruction from being generated due to the pattern failing to be matched.
Committed on behalf of Sam Tebbs.
gcc/
2018-08-01 Sam Tebbs <sam.tebbs@arm.com>
* config/aarch64/aarch64-simd.md
(*aarch64_get_lane_zero_extendsi<mode>): Rename to...
(*aarch64_get_lane_zero_extend<GPI:mode><VDQQH:mode>): ... This and
use GPI iterator instead of SI mode.
gcc/testsuite
2018-08-01 Sam Tebbs <sam.tebbs@arm.com>
* gcc.target/aarch64/extract_zero_extend.c: New file.
From-SVN: r263200
-rw-r--r-- | gcc/ChangeLog | 7 | ||||
-rw-r--r-- | gcc/config/aarch64/aarch64-simd.md | 31 | ||||
-rw-r--r-- | gcc/testsuite/ChangeLog | 4 | ||||
-rw-r--r-- | gcc/testsuite/gcc.target/aarch64/extract_zero_extend.c | 81 |
4 files changed, 108 insertions, 15 deletions
diff --git a/gcc/ChangeLog b/gcc/ChangeLog index 54cd8f9..b8152e3 100644 --- a/gcc/ChangeLog +++ b/gcc/ChangeLog @@ -1,3 +1,10 @@ +2018-08-01 Sam Tebbs <sam.tebbs@arm.com> + + * config/aarch64/aarch64-simd.md + (*aarch64_get_lane_zero_extendsi<mode>): Rename to... + (*aarch64_get_lane_zero_extend<GPI:mode><VDQQH:mode>): ... This and + use GPI iterator instead of SI mode. + 2018-08-01 Richard Earnshaw <rearnsha@arm.com> * config/rs6000/rs6000.md (speculation_barrier): Renamed from diff --git a/gcc/config/aarch64/aarch64-simd.md b/gcc/config/aarch64/aarch64-simd.md index 9ee9bbe..1d574cd 100644 --- a/gcc/config/aarch64/aarch64-simd.md +++ b/gcc/config/aarch64/aarch64-simd.md @@ -3030,21 +3030,22 @@ operands[2] = aarch64_endian_lane_rtx (<MODE>mode, INTVAL (operands[2])); return "smov\\t%<GPI:w>0, %1.<VDQQH:Vetype>[%2]"; } - [(set_attr "type" "neon_to_gp<q>")] -) - -(define_insn "*aarch64_get_lane_zero_extendsi<mode>" - [(set (match_operand:SI 0 "register_operand" "=r") - (zero_extend:SI - (vec_select:<VEL> - (match_operand:VDQQH 1 "register_operand" "w") - (parallel [(match_operand:SI 2 "immediate_operand" "i")]))))] - "TARGET_SIMD" - { - operands[2] = aarch64_endian_lane_rtx (<MODE>mode, INTVAL (operands[2])); - return "umov\\t%w0, %1.<Vetype>[%2]"; - } - [(set_attr "type" "neon_to_gp<q>")] + [(set_attr "type" "neon_to_gp<q>")]
+)
+
+(define_insn "*aarch64_get_lane_zero_extend<GPI:mode><VDQQH:mode>"
+ [(set (match_operand:GPI 0 "register_operand" "=r")
+ (zero_extend:GPI
+ (vec_select:<VEL>
+ (match_operand:VDQQH 1 "register_operand" "w")
+ (parallel [(match_operand:SI 2 "immediate_operand" "i")]))))]
+ "TARGET_SIMD"
+ {
+ operands[2] = aarch64_endian_lane_rtx (<VDQQH:MODE>mode,
+ INTVAL (operands[2]));
+ return "umov\\t%w0, %1.<Vetype>[%2]";
+ }
+ [(set_attr "type" "neon_to_gp<q>")]
) ;; Lane extraction of a value, neither sign nor zero extension diff --git a/gcc/testsuite/ChangeLog b/gcc/testsuite/ChangeLog index c4561cd..f9448b9 100644 --- a/gcc/testsuite/ChangeLog +++ b/gcc/testsuite/ChangeLog @@ -1,3 +1,7 @@ +2018-08-01 Sam Tebbs <sam.tebbs@arm.com> + + * gcc.target/aarch64/extract_zero_extend.c: New file. + 2018-08-01 Jakub Jelinek <jakub@redhat.com> PR c/85704 diff --git a/gcc/testsuite/gcc.target/aarch64/extract_zero_extend.c b/gcc/testsuite/gcc.target/aarch64/extract_zero_extend.c new file mode 100644 index 0000000..0209305 --- /dev/null +++ b/gcc/testsuite/gcc.target/aarch64/extract_zero_extend.c @@ -0,0 +1,81 @@ +/* { dg-do compile } */
+/* { dg-options "-O3 -fdump-rtl-final" } */
+
+/* Tests div16qi. */
+typedef unsigned char div16qi __attribute__ ((vector_size (16)));
+/* Tests div8qi. */
+typedef unsigned char div8qi __attribute__ ((vector_size (8)));
+/* Tests div8hi. */
+typedef unsigned short div8hi __attribute__ ((vector_size (16)));
+/* Tests div4hi. */
+typedef unsigned short div4hi __attribute__ ((vector_size (8)));
+
+/* Tests siv16qi. */
+typedef unsigned char siv16qi __attribute__ ((vector_size (16)));
+/* Tests siv8qi. */
+typedef unsigned char siv8qi __attribute__ ((vector_size (8)));
+/* Tests siv8hi. */
+typedef unsigned short siv8hi __attribute__ ((vector_size (16)));
+/* Tests siv4hi. */
+typedef unsigned short siv4hi __attribute__ ((vector_size (8)));
+
+
+unsigned long long
+foo_div16qi (div16qi a)
+{
+ return a[0];
+}
+
+unsigned long long
+foo_div8qi (div8qi a)
+{
+ return a[0];
+}
+
+unsigned long long
+foo_div8hi (div8hi a)
+{
+ return a[0];
+}
+
+unsigned long long
+foo_div4hi (div4hi a)
+{
+ return a[0];
+}
+
+unsigned int
+foo_siv16qi (siv16qi a)
+{
+ return a[0];
+}
+
+unsigned int
+foo_siv8qi (siv8qi a)
+{
+ return a[0];
+}
+
+unsigned int
+foo_siv8hi (siv8hi a)
+{
+ return a[0];
+}
+
+unsigned int
+foo_siv4hi (siv4hi a)
+{
+ return a[0];
+}
+
+/* { dg-final { scan-assembler-times "umov\\t" 8 } } */
+/* { dg-final { scan-assembler-not "and\\t" } } */
+
+/* { dg-final { scan-rtl-dump "aarch64_get_lane_zero_extenddiv16qi" "final" } } */
+/* { dg-final { scan-rtl-dump "aarch64_get_lane_zero_extenddiv8qi" "final" } } */
+/* { dg-final { scan-rtl-dump "aarch64_get_lane_zero_extenddiv8hi" "final" } } */
+/* { dg-final { scan-rtl-dump "aarch64_get_lane_zero_extenddiv4hi" "final" } } */
+/* { dg-final { scan-rtl-dump "aarch64_get_lane_zero_extendsiv16qi" "final" } } */
+/* { dg-final { scan-rtl-dump "aarch64_get_lane_zero_extendsiv8qi" "final" } } */
+/* { dg-final { scan-rtl-dump "aarch64_get_lane_zero_extendsiv8hi" "final" } } */
+/* { dg-final { scan-rtl-dump "aarch64_get_lane_zero_extendsiv4hi" "final" } } */
|