diff options
author | H.J. Lu <hongjiu.lu@intel.com> | 2010-11-03 12:02:06 +0000 |
---|---|---|
committer | H.J. Lu <hjl@gcc.gnu.org> | 2010-11-03 05:02:06 -0700 |
commit | 72fdf9e9c4c469d8ca5abf63c7ace0c6a7569f49 (patch) | |
tree | aad9e40071886d44c2ff1c643b1a701ff1b1a854 /gcc | |
parent | 02ff830b5812b80a0bdd747cb0bb85e0ee0253b6 (diff) | |
download | gcc-72fdf9e9c4c469d8ca5abf63c7ace0c6a7569f49.zip gcc-72fdf9e9c4c469d8ca5abf63c7ace0c6a7569f49.tar.gz gcc-72fdf9e9c4c469d8ca5abf63c7ace0c6a7569f49.tar.bz2 |
Generate avx_vzeroupper after reload is completed.
gcc/
2010-11-03 H.J. Lu <hongjiu.lu@intel.com>
PR target/46285
* config/i386/i386.c (ix86_expand_call): Conditionally decorate
calls with UNSPEC_CALL_NEEDS_VZEROUPPER unspec before reload
is completed.
gcc/testsuite/
2010-11-03 H.J. Lu <hongjiu.lu@intel.com>
PR target/46285
* gcc.target/i386/pr46285.c: New test.
From-SVN: r166240
Diffstat (limited to 'gcc')
-rw-r--r-- | gcc/ChangeLog | 7 | ||||
-rw-r--r-- | gcc/config/i386/i386.c | 14 | ||||
-rw-r--r-- | gcc/testsuite/ChangeLog | 5 | ||||
-rw-r--r-- | gcc/testsuite/gcc.target/i386/pr46285.c | 5 |
4 files changed, 27 insertions, 4 deletions
```diff
diff --git a/gcc/ChangeLog b/gcc/ChangeLog
index 76ebd7e..55b233d 100644
--- a/gcc/ChangeLog
+++ b/gcc/ChangeLog
@@ -1,3 +1,10 @@
+2010-11-03 H.J. Lu <hongjiu.lu@intel.com>
+
+	PR target/46285
+	* config/i386/i386.c (ix86_expand_call): Conditionally decorate
+	calls with UNSPEC_CALL_NEEDS_VZEROUPPER unspec before reload
+	is completed.
+
 2010-11-03 Richard Guenther <rguenther@suse.de>
 
 	PR tree-optimization/46217
diff --git a/gcc/config/i386/i386.c b/gcc/config/i386/i386.c
index afecc89..ba1e4fc 100644
--- a/gcc/config/i386/i386.c
+++ b/gcc/config/i386/i386.c
@@ -21540,10 +21540,16 @@ ix86_expand_call (rtx retval, rtx fnaddr, rtx callarg1,
       else
         avx256 = call_no_avx256;
 
-      unspec = gen_rtx_UNSPEC (VOIDmode,
-                               gen_rtvec (1, GEN_INT (avx256)),
-                               UNSPEC_CALL_NEEDS_VZEROUPPER);
-      call = gen_rtx_PARALLEL (VOIDmode, gen_rtvec (2, call, unspec));
+      if (reload_completed)
+        emit_insn (gen_avx_vzeroupper (GEN_INT (avx256)));
+      else
+        {
+          unspec = gen_rtx_UNSPEC (VOIDmode,
+                                   gen_rtvec (1, GEN_INT (avx256)),
+                                   UNSPEC_CALL_NEEDS_VZEROUPPER);
+          call = gen_rtx_PARALLEL (VOIDmode,
+                                   gen_rtvec (2, call, unspec));
+        }
     }
 
   call = emit_call_insn (call);
diff --git a/gcc/testsuite/ChangeLog b/gcc/testsuite/ChangeLog
index 86ff763..29f4dc3 100644
--- a/gcc/testsuite/ChangeLog
+++ b/gcc/testsuite/ChangeLog
@@ -1,3 +1,8 @@
+2010-11-03 H.J. Lu <hongjiu.lu@intel.com>
+
+	PR target/46285
+	* gcc.target/i386/pr46285.c.
+
 2010-11-03 Richard Guenther <rguenther@suse.de>
 
 	PR tree-optimization/46217
diff --git a/gcc/testsuite/gcc.target/i386/pr46285.c b/gcc/testsuite/gcc.target/i386/pr46285.c
new file mode 100644
index 0000000..8b8cbcf
--- /dev/null
+++ b/gcc/testsuite/gcc.target/i386/pr46285.c
@@ -0,0 +1,5 @@
+/* { dg-do compile } */
+/* { dg-options "-mavx -fsplit-stack -mtune=generic" } */
+
+typedef char __m256 __attribute__ ((__vector_size__ (32)));
+void foo (__m256 x) {}
```