diff options
author | Richard Earnshaw <rearnsha@arm.com> | 2024-02-22 16:47:20 +0000 |
---|---|---|
committer | Richard Earnshaw <rearnsha@arm.com> | 2024-02-23 11:39:28 +0000 |
commit | 016c4eed368b80a97101f6156ed99e4c5474fbb7 (patch) | |
tree | e0a979e780b28d5b4311f07e00fe93ffa302827f /gcc | |
parent | 22121546e0315d25ee419d2389022e3974750885 (diff) | |
download | gcc-016c4eed368b80a97101f6156ed99e4c5474fbb7.zip gcc-016c4eed368b80a97101f6156ed99e4c5474fbb7.tar.gz gcc-016c4eed368b80a97101f6156ed99e4c5474fbb7.tar.bz2 |
arm: fix ICE with vectorized reciprocal division [PR108120]
The expand pattern for reciprocal division was enabled for all math
optimization modes, but the patterns it was generating were not
enabled unless -funsafe-math-optimizations were enabled, this leads to
an ICE when the pattern we generate cannot be recognized.
Fixed by only enabling vector division when doing unsafe math.
gcc:
PR target/108120
* config/arm/neon.md (div<VCVTF:mode>3): Rename from div<mode>3.
Gate with ARM_HAVE_NEON_<MODE>_ARITH.
gcc/testsuite:
PR target/108120
* gcc.target/arm/neon-recip-div-1.c: New file.
Diffstat (limited to 'gcc')
-rw-r--r-- | gcc/config/arm/neon.md | 4 | ||||
-rw-r--r-- | gcc/testsuite/gcc.target/arm/neon-recip-div-1.c | 16 |
2 files changed, 18 insertions, 2 deletions
diff --git a/gcc/config/arm/neon.md b/gcc/config/arm/neon.md index 17c90f4..fa4a7ae 100644 --- a/gcc/config/arm/neon.md +++ b/gcc/config/arm/neon.md @@ -553,11 +553,11 @@ Enabled with -funsafe-math-optimizations -freciprocal-math and disabled for -Os since it increases code size . */ -(define_expand "div<mode>3" +(define_expand "div<VCVTF:mode>3" [(set (match_operand:VCVTF 0 "s_register_operand") (div:VCVTF (match_operand:VCVTF 1 "s_register_operand") (match_operand:VCVTF 2 "s_register_operand")))] - "TARGET_NEON && !optimize_size + "ARM_HAVE_NEON_<MODE>_ARITH && !optimize_size && flag_reciprocal_math" { rtx rec = gen_reg_rtx (<MODE>mode); diff --git a/gcc/testsuite/gcc.target/arm/neon-recip-div-1.c b/gcc/testsuite/gcc.target/arm/neon-recip-div-1.c new file mode 100644 index 0000000..e15c3ca --- /dev/null +++ b/gcc/testsuite/gcc.target/arm/neon-recip-div-1.c @@ -0,0 +1,16 @@ +/* { dg-do compile } */ +/* { dg-require-effective-target arm_neon_ok } */ +/* { dg-options "-O3 -freciprocal-math -fno-unsafe-math-optimizations -save-temps" } */ +/* { dg-add-options arm_neon } */ + +int *a; +int n; +void b() { + int c; + for (c = 0; c < 100000; c++) + a[c] = (float)c / n; +} +/* We should not ICE, or get a vectorized reciprocal instruction when unsafe + math optimizations are disabled. */ +/* { dg-final { scan-assembler-not "vrecpe\\.f32\\t\[qd\].*" } } */ +/* { dg-final { scan-assembler-not "vrecps\\.f32\\t\[qd\].*" } } */ |