aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorRichard Biener <rguenther@suse.de>2024-05-02 13:55:15 +0200
committerRichard Biener <rguenther@suse.de>2024-05-03 08:19:51 +0200
commit87e35da16df74cd1c4729a55d94e7bc592487f48 (patch)
tree9480fb06a30c630224da93291ebe4b9a139fcdb3
parentf04dc89a991ddc6c08ac92c8ad29c6915c4ecafa (diff)
downloadgcc-87e35da16df74cd1c4729a55d94e7bc592487f48.zip
gcc-87e35da16df74cd1c4729a55d94e7bc592487f48.tar.gz
gcc-87e35da16df74cd1c4729a55d94e7bc592487f48.tar.bz2
tree-optimization/114921 - _Float16 -> __bf16 isn't noop
The vectorizer handles a _Float16 to __bf16 conversion through vectorizable_assignment, thinking it's a noop. The following fixes this by requiring the same vector component mode when checking for CONVERT_EXPR_CODE_P, being stricter than for VIEW_CONVERT_EXPR.

PR tree-optimization/114921

* tree-vect-stmts.cc (vectorizable_assignment): Require same vector component modes for input and output for CONVERT_EXPR_CODE_P.
-rw-r--r--gcc/tree-vect-stmts.cc19
1 files changed, 11 insertions, 8 deletions
diff --git a/gcc/tree-vect-stmts.cc b/gcc/tree-vect-stmts.cc
index f8d8636..7e57196 100644
--- a/gcc/tree-vect-stmts.cc
+++ b/gcc/tree-vect-stmts.cc
@@ -5955,14 +5955,17 @@ vectorizable_assignment (vec_info *vinfo,
if (!vectype_in)
vectype_in = get_vectype_for_scalar_type (vinfo, TREE_TYPE (op), slp_node);
- /* We can handle NOP_EXPR conversions that do not change the number
- of elements or the vector size. */
- if ((CONVERT_EXPR_CODE_P (code)
- || code == VIEW_CONVERT_EXPR)
- && (!vectype_in
- || maybe_ne (TYPE_VECTOR_SUBPARTS (vectype_in), nunits)
- || maybe_ne (GET_MODE_SIZE (TYPE_MODE (vectype)),
- GET_MODE_SIZE (TYPE_MODE (vectype_in)))))
+ /* We can handle VIEW_CONVERT conversions that do not change the number
+ of elements or the vector size, or other conversions when the component
+ mode stays the same. */
+ if (!vectype_in
+ || maybe_ne (TYPE_VECTOR_SUBPARTS (vectype_in), nunits)
+ || (code == VIEW_CONVERT_EXPR
+ && maybe_ne (GET_MODE_SIZE (TYPE_MODE (vectype)),
+ GET_MODE_SIZE (TYPE_MODE (vectype_in))))
+ || (CONVERT_EXPR_CODE_P (code)
+ && (TYPE_MODE (TREE_TYPE (vectype))
+ != TYPE_MODE (TREE_TYPE (vectype_in)))))
return false;
if (VECTOR_BOOLEAN_TYPE_P (vectype) != VECTOR_BOOLEAN_TYPE_P (vectype_in))