aboutsummaryrefslogtreecommitdiff
path: root/gcc
diff options
context:
space:
mode:
author: H.J. Lu <hongjiu.lu@intel.com> 2010-10-20 11:21:19 +0000
committer: H.J. Lu <hjl@gcc.gnu.org> 2010-10-20 04:21:19 -0700
commit: b9121f42a1086a219ab6312b76e920639a0de260 (patch)
tree: c60b901039bd33fa1ae88c7bec5ea5466cb3f2e0 /gcc
parent: 742d143c1be9352d388e37bb24ff82c81aca8340 (diff)
download: gcc-b9121f42a1086a219ab6312b76e920639a0de260.zip
          gcc-b9121f42a1086a219ab6312b76e920639a0de260.tar.gz
          gcc-b9121f42a1086a219ab6312b76e920639a0de260.tar.bz2
Correct reduc_splus_v8sf and reduc_splus_v4df.
gcc/

2010-10-20  H.J. Lu  <hongjiu.lu@intel.com>

    PR target/46085
    * config/i386/sse.md (reduc_splus_v8sf): Updated.
    (reduc_splus_v4df): Likewise.

gcc/testsuite/

2010-10-20  H.J. Lu  <hongjiu.lu@intel.com>

    PR target/46085
    * gcc.target/i386/pr46085-1.c: New.
    * gcc.target/i386/pr46085-2.c: Likewise.

From-SVN: r165719
Diffstat (limited to 'gcc')
-rw-r--r--  gcc/ChangeLog  6
-rw-r--r--  gcc/config/i386/sse.md  9
-rw-r--r--  gcc/testsuite/ChangeLog  6
-rw-r--r--  gcc/testsuite/gcc.target/i386/pr46085-1.c  47
-rw-r--r--  gcc/testsuite/gcc.target/i386/pr46085-2.c  47
5 files changed, 112 insertions, 3 deletions
diff --git a/gcc/ChangeLog b/gcc/ChangeLog
index 4afbaec..686b591 100644
--- a/gcc/ChangeLog
+++ b/gcc/ChangeLog
@@ -1,3 +1,9 @@
+2010-10-20 H.J. Lu <hongjiu.lu@intel.com>
+
+ PR target/46085
+ * config/i386/sse.md (reduc_splus_v8sf): Updated.
+ (reduc_splus_v4df): Likewise.
+
2010-10-20 Richard Guenther <rguenther@suse.de>
PR tree-optimization/45860
diff --git a/gcc/config/i386/sse.md b/gcc/config/i386/sse.md
index 2402c70..bff74d5 100644
--- a/gcc/config/i386/sse.md
+++ b/gcc/config/i386/sse.md
@@ -1388,8 +1388,9 @@
rtx tmp = gen_reg_rtx (V8SFmode);
rtx tmp2 = gen_reg_rtx (V8SFmode);
emit_insn (gen_avx_haddv8sf3 (tmp, operands[1], operands[1]));
- emit_insn (gen_avx_haddv8sf3 (tmp2, operands[1], operands[1]));
- emit_insn (gen_avx_haddv8sf3 (operands[0], tmp2, tmp2));
+ emit_insn (gen_avx_haddv8sf3 (tmp2, tmp, tmp));
+ emit_insn (gen_avx_vperm2f128v8sf3 (tmp, tmp2, tmp2, GEN_INT (1)));
+ emit_insn (gen_addv8sf3 (operands[0], tmp, tmp2));
DONE;
})
@@ -1415,8 +1416,10 @@
"TARGET_AVX"
{
rtx tmp = gen_reg_rtx (V4DFmode);
+ rtx tmp2 = gen_reg_rtx (V4DFmode);
emit_insn (gen_avx_haddv4df3 (tmp, operands[1], operands[1]));
- emit_insn (gen_avx_haddv4df3 (operands[0], tmp, tmp));
+ emit_insn (gen_avx_vperm2f128v4df3 (tmp2, tmp, tmp, GEN_INT (1)));
+ emit_insn (gen_addv4df3 (operands[0], tmp, tmp2));
DONE;
})
diff --git a/gcc/testsuite/ChangeLog b/gcc/testsuite/ChangeLog
index 25fd703..fe74a3f 100644
--- a/gcc/testsuite/ChangeLog
+++ b/gcc/testsuite/ChangeLog
@@ -1,3 +1,9 @@
+2010-10-20 H.J. Lu <hongjiu.lu@intel.com>
+
+ PR target/46085
+ * gcc.target/i386/pr46085-1.c: New.
+ * gcc.target/i386/pr46085-2.c: Likewise.
+
2010-10-20 Richard Guenther <rguenther@suse.de>
PR tree-optimization/45860
diff --git a/gcc/testsuite/gcc.target/i386/pr46085-1.c b/gcc/testsuite/gcc.target/i386/pr46085-1.c
new file mode 100644
index 0000000..0251556
--- /dev/null
+++ b/gcc/testsuite/gcc.target/i386/pr46085-1.c
@@ -0,0 +1,47 @@
+/* { dg-do run } */
+/* { dg-require-effective-target avx } */
+/* { dg-options "-O2 -ftree-vectorize -mavx -mtune=generic -ffast-math" } */
+
+#include "avx-check.h"
+
+#define N 16
+#define DIFF 242
+
+float b[N] = {0,3,6,9,12,15,18,21,24,27,30,33,36,39,42,45};
+float c[N] = {0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15};
+
+void
+main1 (float x, float max_result)
+{
+ int i;
+ float diff = 2;
+ float max = x;
+ float min = 10;
+
+ for (i = 0; i < N; i++) {
+ diff += (b[i] - c[i]);
+ }
+
+ for (i = 0; i < N; i++) {
+ max = max < c[i] ? c[i] : max;
+ }
+
+ for (i = 0; i < N; i++) {
+ min = min > c[i] ? c[i] : min;
+ }
+
+ /* check results: */
+ if (diff != DIFF)
+ abort ();
+ if (max != max_result)
+ abort ();
+ if (min != 0)
+ abort ();
+}
+
+static void
+avx_test (void)
+{
+ main1 (100, 100);
+ main1 (0, 15);
+}
diff --git a/gcc/testsuite/gcc.target/i386/pr46085-2.c b/gcc/testsuite/gcc.target/i386/pr46085-2.c
new file mode 100644
index 0000000..568cdd9
--- /dev/null
+++ b/gcc/testsuite/gcc.target/i386/pr46085-2.c
@@ -0,0 +1,47 @@
+/* { dg-do run } */
+/* { dg-require-effective-target avx } */
+/* { dg-options "-O2 -ftree-vectorize -mavx -mtune=generic -ffast-math" } */
+
+#include "avx-check.h"
+
+#define N 16
+#define DIFF 242
+
+double b[N] = {0,3,6,9,12,15,18,21,24,27,30,33,36,39,42,45};
+double c[N] = {0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15};
+
+void
+main1 (double x, double max_result)
+{
+ int i;
+ double diff = 2;
+ double max = x;
+ double min = 10;
+
+ for (i = 0; i < N; i++) {
+ diff += (b[i] - c[i]);
+ }
+
+ for (i = 0; i < N; i++) {
+ max = max < c[i] ? c[i] : max;
+ }
+
+ for (i = 0; i < N; i++) {
+ min = min > c[i] ? c[i] : min;
+ }
+
+ /* check results: */
+ if (diff != DIFF)
+ abort ();
+ if (max != max_result)
+ abort ();
+ if (min != 0)
+ abort ();
+}
+
+static void
+avx_test (void)
+{
+ main1 (100, 100);
+ main1 (0, 15);
+}