diff options
author | Juzhe-Zhong <juzhe.zhong@rivai.ai> | 2023-09-10 10:33:04 +0800 |
---|---|---|
committer | Pan Li <pan2.li@intel.com> | 2023-09-11 07:14:16 +0800 |
commit | 108779056eb4b56e715a094fac48a699d2dc91b3 (patch) | |
tree | a7c8f4a51e46b1202ecaead7bed6bc017de64d2a | |
parent | e390872aebcfebb7c9bc95d8fb7e44f2bec996d3 (diff) | |
download | gcc-108779056eb4b56e715a094fac48a699d2dc91b3.zip gcc-108779056eb4b56e715a094fac48a699d2dc91b3.tar.gz gcc-108779056eb4b56e715a094fac48a699d2dc91b3.tar.bz2 |
RISC-V: Expand fixed-vlmax/vls vector permutation in targethook
When debugging FAIL: gcc.dg/pr92301.c execution test.
Realize a vls vector permutation situation failed to vectorize since early return false:
- /* For constant size indices, we dont't need to handle it here.
- Just leave it to vec_perm<mode>. */
- if (d->perm.length ().is_constant ())
- return false;
To avoid more potential failed vectorization case. Now expand it in targethook.
gcc/ChangeLog:
* config/riscv/riscv-v.cc (shuffle_generic_patterns): Expand
fixed-vlmax/vls vector permutation.
-rw-r--r-- | gcc/config/riscv/riscv-v.cc | 14 |
1 files changed, 7 insertions, 7 deletions
diff --git a/gcc/config/riscv/riscv-v.cc b/gcc/config/riscv/riscv-v.cc index 8a548f5..847bc24 100644 --- a/gcc/config/riscv/riscv-v.cc +++ b/gcc/config/riscv/riscv-v.cc @@ -2793,14 +2793,9 @@ shuffle_generic_patterns (struct expand_vec_perm_d *d) if (!pow2p_hwi (d->perm.encoding().npatterns ())) return false; - /* For constant size indices, we dont't need to handle it here. - Just leave it to vec_perm<mode>. */ - if (d->perm.length ().is_constant ()) - return false; - /* Permuting two SEW8 variable-length vectors need vrgatherei16.vv. Otherwise, it could overflow the index range. */ - if (GET_MODE_INNER (d->vmode) == QImode + if (!nunits.is_constant () && GET_MODE_INNER (d->vmode) == QImode && !get_vector_mode (HImode, nunits).exists (&sel_mode)) return false; @@ -2809,7 +2804,12 @@ shuffle_generic_patterns (struct expand_vec_perm_d *d) return true; rtx sel = vec_perm_indices_to_rtx (sel_mode, d->perm); - expand_vec_perm (d->target, d->op0, d->op1, force_reg (sel_mode, sel)); + /* 'mov<mode>' generte interleave vector. */ + if (!nunits.is_constant ()) + sel = force_reg (sel_mode, sel); + /* Some FIXED-VLMAX/VLS vector permutation situations call targethook + instead of expand vec_perm<mode>, we handle it directly. */ + expand_vec_perm (d->target, d->op0, d->op1, sel); return true; } |