diff options
author | Hongyu Wang <hongyu.wang@intel.com> | 2022-12-06 09:53:35 +0800 |
---|---|---|
committer | Hongyu Wang <hongyu.wang@intel.com> | 2022-12-07 16:44:14 +0800 |
commit | 3a1a141f79c83ad38f7db3a21d8a4dcfe625c176 (patch) | |
tree | 9ee231a5a32b4b51228a2907ace77bc3cd29e526 | |
parent | cb6922f490d3133e4ccbc1190b555d16695fc9c3 (diff) | |
download | gcc-3a1a141f79c83ad38f7db3a21d8a4dcfe625c176.zip gcc-3a1a141f79c83ad38f7db3a21d8a4dcfe625c176.tar.gz gcc-3a1a141f79c83ad38f7db3a21d8a4dcfe625c176.tar.bz2 |
i386: Avoid fma_chain for -march=alderlake and sapphirerapids.
Alderlake has an issue similar to PR 81616, so enabling
avoid_fma256_chains also benefits the latest Intel platforms,
Alderlake and Sapphire Rapids.
gcc/ChangeLog:
* config/i386/x86-tune.def (X86_TUNE_AVOID_256FMA_CHAINS): Add
m_SAPPHIRERAPIDS, m_ALDERLAKE and m_CORE_ATOM.
-rw-r--r-- | gcc/config/i386/x86-tune.def | 3 |
1 files changed, 2 insertions, 1 deletions
diff --git a/gcc/config/i386/x86-tune.def b/gcc/config/i386/x86-tune.def
index cd66f33..db85de2 100644
--- a/gcc/config/i386/x86-tune.def
+++ b/gcc/config/i386/x86-tune.def
@@ -499,7 +499,8 @@ DEF_TUNE (X86_TUNE_AVOID_128FMA_CHAINS, "avoid_fma_chains", m_ZNVER)
 
 /* X86_TUNE_AVOID_256FMA_CHAINS: Avoid creating loops with tight 256bit or
    smaller FMA chain.  */
-DEF_TUNE (X86_TUNE_AVOID_256FMA_CHAINS, "avoid_fma256_chains", m_ZNVER2 | m_ZNVER3)
+DEF_TUNE (X86_TUNE_AVOID_256FMA_CHAINS, "avoid_fma256_chains", m_ZNVER2 | m_ZNVER3
+	  | m_ALDERLAKE | m_SAPPHIRERAPIDS | m_CORE_ATOM)
 
 /* X86_TUNE_V2DF_REDUCTION_PREFER_PHADDPD: Prefer haddpd
    for v2df vector reduction.  */