aboutsummaryrefslogtreecommitdiff
path: root/gcc
diff options
context:
space:
mode:
authorEric Botcazou <ebotcazou@adacore.com>2018-11-20 08:59:30 +0000
committerEric Botcazou <ebotcazou@gcc.gnu.org>2018-11-20 08:59:30 +0000
commit643427d70f7a547a1db8a8492a6a124ff22c0d3a (patch)
treee254592484859d6e99362a4041f1d06658035748 /gcc
parent07b9f1de1ea532a66d8ac103f3a9827521d780f9 (diff)
downloadgcc-643427d70f7a547a1db8a8492a6a124ff22c0d3a.zip
gcc-643427d70f7a547a1db8a8492a6a124ff22c0d3a.tar.gz
gcc-643427d70f7a547a1db8a8492a6a124ff22c0d3a.tar.bz2
re PR rtl-optimization/85925 (compilation of masking with 257 goes wrong in combine at -O2)
PR rtl-optimization/85925 * rtl.h (word_register_operation_p): New predicate. * combine.c (record_dead_and_set_regs_1): Only apply specific handling for WORD_REGISTER_OPERATIONS targets to word_register_operation_p RTX. * rtlanal.c (nonzero_bits1): Likewise. Adjust couple of comments. (num_sign_bit_copies1): Likewise. From-SVN: r266302
Diffstat (limited to 'gcc')
-rw-r--r--gcc/ChangeLog9
-rw-r--r--gcc/combine.c1
-rw-r--r--gcc/rtl.h19
-rw-r--r--gcc/rtlanal.c29
-rw-r--r--gcc/testsuite/ChangeLog4
-rw-r--r--gcc/testsuite/gcc.c-torture/execute/20181120-1.c26
6 files changed, 74 insertions, 14 deletions
diff --git a/gcc/ChangeLog b/gcc/ChangeLog
index 0c357fb..affdfd6 100644
--- a/gcc/ChangeLog
+++ b/gcc/ChangeLog
@@ -130,6 +130,15 @@
* dwarf2out.c (dwarf2out_early_global_decl): For
decl_function_context recurse instead of calling dwarf2out_decl.
+2018-11-20 Eric Botcazou <ebotcazou@adacore.com>
+
+ PR rtl-optimization/85925
+ * rtl.h (word_register_operation_p): New predicate.
+ * combine.c (record_dead_and_set_regs_1): Only apply specific handling
+ for WORD_REGISTER_OPERATIONS targets to word_register_operation_p RTX.
+ * rtlanal.c (nonzero_bits1): Likewise. Adjust couple of comments.
+ (num_sign_bit_copies1): Likewise.
+
2018-11-19 Richard Biener <rguenther@suse.de>
PR lto/87229
diff --git a/gcc/combine.c b/gcc/combine.c
index 945eca3..ecc83f8 100644
--- a/gcc/combine.c
+++ b/gcc/combine.c
@@ -13331,6 +13331,7 @@ record_dead_and_set_regs_1 (rtx dest, const_rtx setter, void *data)
&& subreg_lowpart_p (SET_DEST (setter)))
record_value_for_reg (dest, record_dead_insn,
WORD_REGISTER_OPERATIONS
+ && word_register_operation_p (SET_SRC (setter))
&& paradoxical_subreg_p (SET_DEST (setter))
? SET_SRC (setter)
: gen_lowpart (GET_MODE (dest),
diff --git a/gcc/rtl.h b/gcc/rtl.h
index 68d3cea..4114cd0 100644
--- a/gcc/rtl.h
+++ b/gcc/rtl.h
@@ -4374,6 +4374,25 @@ strip_offset_and_add (rtx x, poly_int64_pod *offset)
return x;
}
+/* Return true if X is an operation that always operates on the full
+ registers for WORD_REGISTER_OPERATIONS architectures.
+
+ Only the RTX code of X (as given by GET_CODE) is inspected: ROTATE,
+ ROTATERT, SIGN_EXTRACT and ZERO_EXTRACT yield false, and every other
+ code yields true. */
+
+inline bool
+word_register_operation_p (const_rtx x)
+{
+ switch (GET_CODE (x))
+ {
+ case ROTATE:
+ case ROTATERT:
+ case SIGN_EXTRACT:
+ case ZERO_EXTRACT:
+ return false;
+
+ default:
+ return true;
+ }
+}
+
/* gtype-desc.c. */
extern void gt_ggc_mx (rtx &);
extern void gt_pch_nx (rtx &);
diff --git a/gcc/rtlanal.c b/gcc/rtlanal.c
index e8b6b9c..9220cbf 100644
--- a/gcc/rtlanal.c
+++ b/gcc/rtlanal.c
@@ -4485,12 +4485,12 @@ nonzero_bits1 (const_rtx x, scalar_int_mode mode, const_rtx known_x,
might be nonzero in its own mode, taking into account the fact that, on
CISC machines, accessing an object in a wider mode generally causes the
high-order bits to become undefined, so they are not known to be zero.
- We extend this reasoning to RISC machines for rotate operations since the
- semantics of the operations in the larger mode is not well defined. */
+ We extend this reasoning to RISC machines for operations that might not
+ operate on the full registers. */
if (mode_width > xmode_width
&& xmode_width <= BITS_PER_WORD
&& xmode_width <= HOST_BITS_PER_WIDE_INT
- && (!WORD_REGISTER_OPERATIONS || code == ROTATE || code == ROTATERT))
+ && !(WORD_REGISTER_OPERATIONS && word_register_operation_p (x)))
{
nonzero &= cached_nonzero_bits (x, xmode,
known_x, known_mode, known_ret);
@@ -4758,13 +4758,16 @@ nonzero_bits1 (const_rtx x, scalar_int_mode mode, const_rtx known_x,
nonzero &= cached_nonzero_bits (SUBREG_REG (x), mode,
known_x, known_mode, known_ret);
- /* On many CISC machines, accessing an object in a wider mode
+ /* On a typical CISC machine, accessing an object in a wider mode
causes the high-order bits to become undefined. So they are
- not known to be zero. */
+ not known to be zero.
+
+ On a typical RISC machine, we only have to worry about the way
+ loads are extended. Otherwise, if we get a reload for the inner
+ part, it may be loaded from the stack, and then we may lose all
+ the zero bits that existed before the store to the stack. */
rtx_code extend_op;
if ((!WORD_REGISTER_OPERATIONS
- /* If this is a typical RISC machine, we only have to worry
- about the way loads are extended. */
|| ((extend_op = load_extend_op (inner_mode)) == SIGN_EXTEND
? val_signbit_known_set_p (inner_mode, nonzero)
: extend_op != ZERO_EXTEND)
@@ -5025,10 +5028,9 @@ num_sign_bit_copies1 (const_rtx x, scalar_int_mode mode, const_rtx known_x,
{
/* If this machine does not do all register operations on the entire
register and MODE is wider than the mode of X, we can say nothing
- at all about the high-order bits. We extend this reasoning to every
- machine for rotate operations since the semantics of the operations
- in the larger mode is not well defined. */
- if (!WORD_REGISTER_OPERATIONS || code == ROTATE || code == ROTATERT)
+ at all about the high-order bits. We extend this reasoning to RISC
+ machines for operations that might not operate on full registers. */
+ if (!(WORD_REGISTER_OPERATIONS && word_register_operation_p (x)))
return 1;
/* Likewise on machines that do, if the mode of the object is smaller
@@ -5107,13 +5109,12 @@ num_sign_bit_copies1 (const_rtx x, scalar_int_mode mode, const_rtx known_x,
/* For paradoxical SUBREGs on machines where all register operations
affect the entire register, just look inside. Note that we are
passing MODE to the recursive call, so the number of sign bit
- copies will remain relative to that mode, not the inner mode. */
+ copies will remain relative to that mode, not the inner mode.
- /* This works only if loads sign extend. Otherwise, if we get a
+ This works only if loads sign extend. Otherwise, if we get a
reload for the inner part, it may be loaded from the stack, and
then we lose all sign bit copies that existed before the store
to the stack. */
-
if (WORD_REGISTER_OPERATIONS
&& load_extend_op (inner_mode) == SIGN_EXTEND
&& paradoxical_subreg_p (x)
diff --git a/gcc/testsuite/ChangeLog b/gcc/testsuite/ChangeLog
index 4284ce2..e378047 100644
--- a/gcc/testsuite/ChangeLog
+++ b/gcc/testsuite/ChangeLog
@@ -1,3 +1,7 @@
+2018-11-20 Eric Botcazou <ebotcazou@adacore.com>
+
+ * gcc.c-torture/execute/20181120-1.c: New test.
+
2018-11-20 Richard Biener <rguenther@suse.de>
PR tree-optimization/88087
diff --git a/gcc/testsuite/gcc.c-torture/execute/20181120-1.c b/gcc/testsuite/gcc.c-torture/execute/20181120-1.c
new file mode 100644
index 0000000..21e5f7a
--- /dev/null
+++ b/gcc/testsuite/gcc.c-torture/execute/20181120-1.c
@@ -0,0 +1,26 @@
+/* PR rtl-optimization/85925 */
+/* Testcase by <sudi@gcc.gnu.org>
+
+ main executes the loop body for c == 0 and c == 1. Each iteration
+ initializes a union U1 through its first member f0 with 0x10101, reads
+ the 15-bit bit-field f1 and stores the result into d through the
+ pointer e. The program aborts unless d is 0x101 afterwards.
+
+ NOTE(review): the expected 0x101 presumably relies on f1 overlaying the
+ low-order 15 bits of f0 -- confirm for big-endian targets. */
+
+int a, c, d;
+volatile int b;
+int *e = &d;
+
+union U1 {
+ unsigned f0;
+ unsigned f1 : 15;
+};
+
+int main (void)
+{
+ for (c = 0; c <= 1; c++) {
+ union U1 f = {0x10101};
+ if (c == 1)
+ b; /* Read of the volatile b; the value is discarded. */
+ *e = f.f1; /* e points to d, so this assigns d. */
+ }
+
+ if (d != 0x101)
+ __builtin_abort ();
+
+ return 0;
+}