diff options
author | H.J. Lu <hongjiu.lu@intel.com> | 2010-10-20 11:21:19 +0000 |
---|---|---|
committer | H.J. Lu <hjl@gcc.gnu.org> | 2010-10-20 04:21:19 -0700 |
commit | b9121f42a1086a219ab6312b76e920639a0de260 (patch) | |
tree | c60b901039bd33fa1ae88c7bec5ea5466cb3f2e0 /gcc | |
parent | 742d143c1be9352d388e37bb24ff82c81aca8340 (diff) | |
download | gcc-b9121f42a1086a219ab6312b76e920639a0de260.zip gcc-b9121f42a1086a219ab6312b76e920639a0de260.tar.gz gcc-b9121f42a1086a219ab6312b76e920639a0de260.tar.bz2 |
Correct reduc_splus_v8sf and reduc_splus_v4df.
gcc/
2010-10-20 H.J. Lu <hongjiu.lu@intel.com>
PR target/46085
* config/i386/sse.md (reduc_splus_v8sf): Updated.
(reduc_splus_v4df): Likewise.
gcc/testsuite/
2010-10-20 H.J. Lu <hongjiu.lu@intel.com>
PR target/46085
* gcc.target/i386/pr46085-1.c: New.
* gcc.target/i386/pr46085-2.c: Likewise.
From-SVN: r165719
Diffstat (limited to 'gcc')
-rw-r--r-- | gcc/ChangeLog | 6 |
-rw-r--r-- | gcc/config/i386/sse.md | 9 |
-rw-r--r-- | gcc/testsuite/ChangeLog | 6 |
-rw-r--r-- | gcc/testsuite/gcc.target/i386/pr46085-1.c | 47 |
-rw-r--r-- | gcc/testsuite/gcc.target/i386/pr46085-2.c | 47 |
5 files changed, 112 insertions, 3 deletions
diff --git a/gcc/ChangeLog b/gcc/ChangeLog index 4afbaec..686b591 100644 --- a/gcc/ChangeLog +++ b/gcc/ChangeLog @@ -1,3 +1,9 @@ +2010-10-20 H.J. Lu <hongjiu.lu@intel.com> + + PR target/46085 + * config/i386/sse.md (reduc_splus_v8sf): Updated. + (reduc_splus_v4df): Likewise. + 2010-10-20 Richard Guenther <rguenther@suse.de> PR tree-optimization/45860 diff --git a/gcc/config/i386/sse.md b/gcc/config/i386/sse.md index 2402c70..bff74d5 100644 --- a/gcc/config/i386/sse.md +++ b/gcc/config/i386/sse.md @@ -1388,8 +1388,9 @@ rtx tmp = gen_reg_rtx (V8SFmode); rtx tmp2 = gen_reg_rtx (V8SFmode); emit_insn (gen_avx_haddv8sf3 (tmp, operands[1], operands[1])); - emit_insn (gen_avx_haddv8sf3 (tmp2, operands[1], operands[1])); - emit_insn (gen_avx_haddv8sf3 (operands[0], tmp2, tmp2)); + emit_insn (gen_avx_haddv8sf3 (tmp2, tmp, tmp)); + emit_insn (gen_avx_vperm2f128v8sf3 (tmp, tmp2, tmp2, GEN_INT (1))); + emit_insn (gen_addv8sf3 (operands[0], tmp, tmp2)); DONE; }) @@ -1415,8 +1416,10 @@ "TARGET_AVX" { rtx tmp = gen_reg_rtx (V4DFmode); + rtx tmp2 = gen_reg_rtx (V4DFmode); emit_insn (gen_avx_haddv4df3 (tmp, operands[1], operands[1])); - emit_insn (gen_avx_haddv4df3 (operands[0], tmp, tmp)); + emit_insn (gen_avx_vperm2f128v4df3 (tmp2, tmp, tmp, GEN_INT (1))); + emit_insn (gen_addv4df3 (operands[0], tmp, tmp2)); DONE; }) diff --git a/gcc/testsuite/ChangeLog b/gcc/testsuite/ChangeLog index 25fd703..fe74a3f 100644 --- a/gcc/testsuite/ChangeLog +++ b/gcc/testsuite/ChangeLog @@ -1,3 +1,9 @@ +2010-10-20 H.J. Lu <hongjiu.lu@intel.com> + + PR target/46085 + * gcc.target/i386/pr46085-1.c: New. + * gcc.target/i386/pr46085-2.c: Likewise. 
+ 2010-10-20 Richard Guenther <rguenther@suse.de> PR tree-optimization/45860 diff --git a/gcc/testsuite/gcc.target/i386/pr46085-1.c b/gcc/testsuite/gcc.target/i386/pr46085-1.c new file mode 100644 index 0000000..0251556 --- /dev/null +++ b/gcc/testsuite/gcc.target/i386/pr46085-1.c @@ -0,0 +1,47 @@ +/* { dg-do run } */ +/* { dg-require-effective-target avx } */ +/* { dg-options "-O2 -ftree-vectorize -mavx -mtune=generic -ffast-math" } */ + +#include "avx-check.h" + +#define N 16 +#define DIFF 242 + +float b[N] = {0,3,6,9,12,15,18,21,24,27,30,33,36,39,42,45}; +float c[N] = {0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15}; + +void +main1 (float x, float max_result) +{ + int i; + float diff = 2; + float max = x; + float min = 10; + + for (i = 0; i < N; i++) { + diff += (b[i] - c[i]); + } + + for (i = 0; i < N; i++) { + max = max < c[i] ? c[i] : max; + } + + for (i = 0; i < N; i++) { + min = min > c[i] ? c[i] : min; + } + + /* check results: */ + if (diff != DIFF) + abort (); + if (max != max_result) + abort (); + if (min != 0) + abort (); +} + +static void +avx_test (void) +{ + main1 (100, 100); + main1 (0, 15); +} diff --git a/gcc/testsuite/gcc.target/i386/pr46085-2.c b/gcc/testsuite/gcc.target/i386/pr46085-2.c new file mode 100644 index 0000000..568cdd9 --- /dev/null +++ b/gcc/testsuite/gcc.target/i386/pr46085-2.c @@ -0,0 +1,47 @@ +/* { dg-do run } */ +/* { dg-require-effective-target avx } */ +/* { dg-options "-O2 -ftree-vectorize -mavx -mtune=generic -ffast-math" } */ + +#include "avx-check.h" + +#define N 16 +#define DIFF 242 + +double b[N] = {0,3,6,9,12,15,18,21,24,27,30,33,36,39,42,45}; +double c[N] = {0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15}; + +void +main1 (double x, double max_result) +{ + int i; + double diff = 2; + double max = x; + double min = 10; + + for (i = 0; i < N; i++) { + diff += (b[i] - c[i]); + } + + for (i = 0; i < N; i++) { + max = max < c[i] ? c[i] : max; + } + + for (i = 0; i < N; i++) { + min = min > c[i] ? 
c[i] : min; + } + + /* check results: */ + if (diff != DIFF) + abort (); + if (max != max_result) + abort (); + if (min != 0) + abort (); +} + +static void +avx_test (void) +{ + main1 (100, 100); + main1 (0, 15); +} |