aboutsummaryrefslogtreecommitdiff
path: root/gcc
diff options
context:
space:
mode:
authorVladimir N. Makarov <vmakarov@redhat.com>2023-03-09 08:41:09 -0500
committerVladimir N. Makarov <vmakarov@redhat.com>2023-03-09 08:45:04 -0500
commita6457974a1f443ab58d2334c02260299616c78b8 (patch)
treefedf12457c84e0a14552be2793f694b192961855 /gcc
parentace65db9215882b95e2ead1bb0dc8c54c2ea69be (diff)
downloadgcc-a6457974a1f443ab58d2334c02260299616c78b8.zip
gcc-a6457974a1f443ab58d2334c02260299616c78b8.tar.gz
gcc-a6457974a1f443ab58d2334c02260299616c78b8.tar.bz2
LRA: For clobbered regs use operand mode instead of the biggest mode
LRA is too conservative in calculation of conflicts with clobbered regs by using the biggest access mode. This results in failure of possible reg coalescing and worse code. This patch solves the problem. PR rtl-optimization/108999 gcc/ChangeLog: * lra-constraints.cc (process_alt_operands): Use operand modes for clobbered regs instead of the biggest access mode. gcc/testsuite/ChangeLog: * gcc.target/aarch64/pr108999.c: New.
Diffstat (limited to 'gcc')
-rw-r--r--gcc/lra-constraints.cc3
-rw-r--r--gcc/testsuite/gcc.target/aarch64/pr108999.c21
2 files changed, 23 insertions, 1 deletions
diff --git a/gcc/lra-constraints.cc b/gcc/lra-constraints.cc
index dbfaf04..c38566a 100644
--- a/gcc/lra-constraints.cc
+++ b/gcc/lra-constraints.cc
@@ -3108,7 +3108,8 @@ process_alt_operands (int only_alternative)
lra_assert (operand_reg[i] != NULL_RTX);
clobbered_hard_regno = hard_regno[i];
CLEAR_HARD_REG_SET (temp_set);
- add_to_hard_reg_set (&temp_set, biggest_mode[i], clobbered_hard_regno);
+ add_to_hard_reg_set (&temp_set, GET_MODE (*curr_id->operand_loc[i]),
+ clobbered_hard_regno);
first_conflict_j = last_conflict_j = -1;
for (j = 0; j < n_operands; j++)
if (j == i
diff --git a/gcc/testsuite/gcc.target/aarch64/pr108999.c b/gcc/testsuite/gcc.target/aarch64/pr108999.c
new file mode 100644
index 0000000..a34db85
--- /dev/null
+++ b/gcc/testsuite/gcc.target/aarch64/pr108999.c
@@ -0,0 +1,21 @@
+/* { dg-do compile } */
+/* { dg-options "-O3 -march=armv8.2-a+sve" } */
+#include <arm_sve.h>
+
+void subreg_coalesce5 (
+ svbool_t pg, int64_t* base, int n,
+ int64_t *in1, int64_t *in2, int64_t*out
+)
+{
+ svint64x2_t result = svld2_s64 (pg, base);
+
+ for (int i = 0; i < n; i += 1) {
+ svint64_t v18 = svld1_s64(pg, in1 + i);
+ svint64_t v19 = svld1_s64(pg, in2 + i);
+ result.__val[0] = svmad_s64_z(pg, v18, v19, result.__val[0]);
+ result.__val[1] = svmad_s64_z(pg, v18, v19, result.__val[1]);
+ }
+ svst2_s64(pg, out, result);
+}
+
+/* { dg-final { scan-assembler-not {[ \t]*mov[ \t]*z[0-9]+\.d} } } */