aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorXionghu Luo <luoxhu@linux.ibm.com>2020-07-12 20:22:56 -0500
committerXionghu Luo <luoxhu@linux.ibm.com>2020-07-12 20:22:56 -0500
commit56d78c58c233a358c780571ad6fecbabdcff2407 (patch)
treefd0a9f62e59f360a0385d50104235e997814a3b7
parent466dd1629c699599050f68d2bfee58be9db40aab (diff)
downloadgcc-56d78c58c233a358c780571ad6fecbabdcff2407.zip
gcc-56d78c58c233a358c780571ad6fecbabdcff2407.tar.gz
gcc-56d78c58c233a358c780571ad6fecbabdcff2407.tar.bz2
rs6000: Define define_insn_and_split to split unspec sldi+or to rldimi
Combine pass could recognize the pattern defined and split it in split1, this patch could optimize: 21: r130:DI=r133:DI<<0x20 11: {r129:DI=zero_extend(unspec[[r145:DI]] 87);clobber scratch;} 22: r134:DI=r130:DI|r129:DI to 21: {r149:DI=zero_extend(unspec[[r145:DI]] 87);clobber scratch;} 22: r134:DI=r149:DI&0xffffffff|r133:DI<<0x20 rldimi is generated instead of sldi+or. gcc/ChangeLog: 2020-07-13 Xionghu Luo <luoxhu@linux.ibm.com> * config/rs6000/rs6000.md (rotl_unspec): New define_insn_and_split. gcc/testsuite/ChangeLog: 2020-07-13 Xionghu Luo <luoxhu@linux.ibm.com> * gcc.target/powerpc/vector_float.c: New test.
-rw-r--r--gcc/config/rs6000/rs6000.md26
-rw-r--r--gcc/testsuite/gcc.target/powerpc/vector_float.c15
2 files changed, 41 insertions, 0 deletions
diff --git a/gcc/config/rs6000/rs6000.md b/gcc/config/rs6000/rs6000.md
index 7baaa61..e608a17 100644
--- a/gcc/config/rs6000/rs6000.md
+++ b/gcc/config/rs6000/rs6000.md
@@ -4240,6 +4240,32 @@
operands[5] = GEN_INT ((HOST_WIDE_INT_1U << <bits>) - 1);
})
+; rldimi with UNSPEC_SI_FROM_SF.
+(define_insn_and_split "*rotldi3_insert_sf"
+ [(set (match_operand:DI 0 "gpc_reg_operand")
+ (ior:DI
+ (ashift:DI (match_operand:DI 1 "gpc_reg_operand")
+ (match_operand:SI 2 "const_int_operand"))
+ (zero_extend:DI
+ (unspec:QHSI
+ [(match_operand:SF 3 "memory_operand")]
+ UNSPEC_SI_FROM_SF))))
+ (clobber (match_scratch:V4SF 4))]
+ "INTVAL (operands[2]) == <bits>"
+ "#"
+ ""
+ [(parallel [(set (match_dup 5)
+ (zero_extend:DI (unspec:QHSI [(match_dup 3)] UNSPEC_SI_FROM_SF)))
+ (clobber (match_dup 4))])
+ (set (match_dup 0)
+ (ior:DI
+ (and:DI (match_dup 5) (match_dup 6))
+ (ashift:DI (match_dup 1) (match_dup 2))))]
+{
+ operands[5] = gen_reg_rtx (DImode);
+ operands[6] = GEN_INT ((HOST_WIDE_INT_1U << <bits>) - 1);
+})
+
; rlwimi, too.
(define_split
[(set (match_operand:SI 0 "gpc_reg_operand")
diff --git a/gcc/testsuite/gcc.target/powerpc/vector_float.c b/gcc/testsuite/gcc.target/powerpc/vector_float.c
new file mode 100644
index 0000000..e6946da
--- /dev/null
+++ b/gcc/testsuite/gcc.target/powerpc/vector_float.c
@@ -0,0 +1,15 @@
+/* { dg-do compile } */
+/* { dg-require-effective-target powerpc_p9vector_ok } */
+/* { dg-options "-O2 -mdejagnu-cpu=power9" } */
+
+vector float
+test (float *a, float *b, float *c, float *d)
+{
+ return (vector float){*a, *b, *c, *d};
+}
+
+/* { dg-final { scan-assembler-not {\mlxssp} } } */
+/* { dg-final { scan-assembler-not {\mlfs} } } */
+/* { dg-final { scan-assembler-times {\mlwz\M} 4 } } */
+/* { dg-final { scan-assembler-times {\mrldimi\M} 2 } } */
+/* { dg-final { scan-assembler-times {\mmtvsrdd\M} 1 } } */