about | summary | refs | log | tree | commit | diff
diff options
context:
space:
mode:
authorRichard Sandiford <richard.sandiford@linaro.org>2018-02-01 11:03:17 +0000
committerRichard Sandiford <rsandifo@gcc.gnu.org>2018-02-01 11:03:17 +0000
commitf9093f23517498f99768816fb11849b798db85e9 (patch)
tree0656a9cae26eb657f0061400eb9cb763158487c5
parent9a1b9cb4d6fcf88d68f55b97c7d9d09c5606fed7 (diff)
downloadgcc-f9093f23517498f99768816fb11849b798db85e9.zip
gcc-f9093f23517498f99768816fb11849b798db85e9.tar.gz
gcc-f9093f23517498f99768816fb11849b798db85e9.tar.bz2
[AArch64] Generalise aarch64_simd_valid_immediate for SVE
The current aarch64_simd_valid_immediate code predates the move to the new
CONST_VECTOR representation, so for variable-length SVE it only handles
duplicates of single elements, rather than duplicates of repeating patterns.

This patch removes the restriction. It means that the validity of a
duplicated constant depends only on the bit pattern, not on the mode used to
represent it. The patch is needed by a later big-endian fix.

2018-02-01  Richard Sandiford  <richard.sandiford@linaro.org>

gcc/
	* config/aarch64/aarch64.c (aarch64_simd_valid_immediate): Handle
	all CONST_VECTOR_DUPLICATE_P vectors, not just those with a single
	duplicated element.

Reviewed-by: James Greenhalgh <james.greenhalgh@arm.com>

From-SVN: r257286
-rw-r--r--gcc/ChangeLog6
-rw-r--r--gcc/config/aarch64/aarch64.c34
2 files changed, 25 insertions, 15 deletions
diff --git a/gcc/ChangeLog b/gcc/ChangeLog
index adaec48..d665f3d 100644
--- a/gcc/ChangeLog
+++ b/gcc/ChangeLog
@@ -1,5 +1,11 @@
2018-02-01 Richard Sandiford <richard.sandiford@linaro.org>
+ * config/aarch64/aarch64.c (aarch64_simd_valid_immediate): Handle
+ all CONST_VECTOR_DUPLICATE_P vectors, not just those with a single
+ duplicated element.
+
+2018-02-01 Richard Sandiford <richard.sandiford@linaro.org>
+
	PR target/83845
* config/aarch64/aarch64.c (aarch64_secondary_reload): Tighten
check for operands that need to go through aarch64_sve_reload_be.
diff --git a/gcc/config/aarch64/aarch64.c b/gcc/config/aarch64/aarch64.c
index 656dd76..1278f83 100644
--- a/gcc/config/aarch64/aarch64.c
+++ b/gcc/config/aarch64/aarch64.c
@@ -13164,10 +13164,11 @@ aarch64_simd_valid_immediate (rtx op, simd_immediate_info *info,
return false;
scalar_mode elt_mode = GET_MODE_INNER (mode);
- rtx elt = NULL, base, step;
+ rtx base, step;
unsigned int n_elts;
- if (const_vec_duplicate_p (op, &elt))
- n_elts = 1;
+ if (GET_CODE (op) == CONST_VECTOR
+ && CONST_VECTOR_DUPLICATE_P (op))
+ n_elts = CONST_VECTOR_NPATTERNS (op);
else if ((vec_flags & VEC_SVE_DATA)
&& const_vec_series_p (op, &base, &step))
{
@@ -13192,14 +13193,17 @@ aarch64_simd_valid_immediate (rtx op, simd_immediate_info *info,
|| op == CONSTM1_RTX (mode));
scalar_float_mode elt_float_mode;
- if (elt
- && is_a <scalar_float_mode> (elt_mode, &elt_float_mode)
- && (aarch64_float_const_zero_rtx_p (elt)
- || aarch64_float_const_representable_p (elt)))
+ if (n_elts == 1
+ && is_a <scalar_float_mode> (elt_mode, &elt_float_mode))
{
- if (info)
- *info = simd_immediate_info (elt_float_mode, elt);
- return true;
+ rtx elt = CONST_VECTOR_ENCODED_ELT (op, 0);
+ if (aarch64_float_const_zero_rtx_p (elt)
+ || aarch64_float_const_representable_p (elt))
+ {
+ if (info)
+ *info = simd_immediate_info (elt_float_mode, elt);
+ return true;
+ }
}
unsigned int elt_size = GET_MODE_SIZE (elt_mode);
@@ -13214,11 +13218,11 @@ aarch64_simd_valid_immediate (rtx op, simd_immediate_info *info,
bytes.reserve (n_elts * elt_size);
for (unsigned int i = 0; i < n_elts; i++)
{
- if (!elt || n_elts != 1)
- /* The vector is provided in gcc endian-neutral fashion.
- For aarch64_be, it must be laid out in the vector register
- in reverse order. */
- elt = CONST_VECTOR_ELT (op, BYTES_BIG_ENDIAN ? (n_elts - 1 - i) : i);
+ /* The vector is provided in gcc endian-neutral fashion.
+ For aarch64_be Advanced SIMD, it must be laid out in the vector
+ register in reverse order. */
+ bool swap_p = ((vec_flags & VEC_ADVSIMD) != 0 && BYTES_BIG_ENDIAN);
+ rtx elt = CONST_VECTOR_ELT (op, swap_p ? (n_elts - 1 - i) : i);
if (elt_mode != elt_int_mode)
elt = gen_lowpart (elt_int_mode, elt);