1 files changed, 363 insertions, 0 deletions
diff --git a/stdio-common/tst-scanf-format-real.h b/stdio-common/tst-scanf-format-real.h
new file mode 100644
index 0000000..639ac74
--- /dev/null
+++ b/stdio-common/tst-scanf-format-real.h
@@ -0,0 +1,363 @@
+/* Test feature wrapper for formatted real input.
+   Copyright (C) 2025 Free Software Foundation, Inc.
+   This file is part of the GNU C Library.
+
+   The GNU C Library is free software; you can redistribute it and/or
+   modify it under the terms of the GNU Lesser General Public
+   License as published by the Free Software Foundation; either
+   version 2.1 of the License, or (at your option) any later version.
+
+   The GNU C Library is distributed in the hope that it will be useful,
+   but WITHOUT ANY WARRANTY; without even the implied warranty of
+   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
+   Lesser General Public License for more details.
+
+   You should have received a copy of the GNU Lesser General Public
+   License along with the GNU C Library; if not, see
+   <https://www.gnu.org/licenses/>.  */
+
+#include <ctype.h>
+#include <errno.h>
+#include <float.h>
+#include <tgmath.h>
+#include <stdbool.h>
+#include <stddef.h>
+#include <stdlib.h>
+#include <string.h>
+
+#include <support/support.h>
+
+/* Reference data is a case-inensitive signed datum, which is either a
+   hexadecimal floating constant or a literal representing infinity or
+   NaN data in any of the forms accepted by 'strtod' family functions,
+   whose binary representation is to match against byte-wise.
+
+   We need to be careful with parsing reference data in the handling of
+   the sign as with the IBM long double binary format unary negation
+   of a positive value whose lower-magnitude part is zero produces a
+   bit pattern that is different from one produced by initialization or
+   conversions made by functions such as 'scanf' or 'strtod' from the
+   complementing negative value.  The difference is in the sign of zero
+   held in the lower-magnitude part and therefore the bit patterns are
+   arithmetically equivalent, but they do not match byte-wise.
+
+   Therefore we set the sign with the initial value of the significand,
+   either -0.0 or 0.0, which sets the sign of both parts according to
+   what 'scanf' does, and never negate it afterwards.
+
+   Additionally the Intel long double binary format uses only 80 bits
+   out of 96 that the data type occupies.  Therefore preinitialize the
+   reference value with the same 0xa5 bit pattern that the value under
+   test has been so that the byte-wise comparison matches as well for
+   the unused parts of the two data pieces.
+
+   We use 'ldexp' to assemble the significand with the exponent, which
+   does not compromise verification, because internally this exercises
+   a code path different from one used by 'scanf' family functions for
+   this purpose.  Specifically 'ldexp' uses 'scalbn', whereas 'scanf'
+   defers to 'strtod' which uses '__mpn_construct_double'.  Analogously
+   for the remaining floating-point data types.  */
+
+#define nan(v, x)							\
+  _Generic((v), float: nanf, double: nan, long double: nanl) (x)
+
+#define pointer_to_value(val) (&(val))
+
+#define initialize_value(val)						\
+  memset (&val, 0xa5, sizeof (val))
+
+#define compare_real(x, y)						\
+  (memcmp (&(x), &(y), sizeof (y)) == 0)
+
+#define verify_input(f, val, count, errp)				\
+({									\
+  __label__ out;							\
+  bool match = true;							\
+  int err = 0;								\
+  type_t v;								\
+									\
+  initialize_value (v);							\
+  /* Make sure it's been committed.  */					\
+  __asm__ ("" : : : "memory");						\
+  v = read_real (&err);							\
+  if (err < 0)								\
+    goto out;								\
+  match = compare_real (val, v);					\
+									\
+out:									\
+  if (err || !match)							\
+    {									\
+      union								\
+	{								\
+	  type_t v;							\
+	  unsigned char x[sizeof (type_t)];				\
+	}								\
+      uv = { .v = v }, ui = { .v = val };				\
+									\
+      printf ("error: %s:%d: input buffer: `", __FILE__, __LINE__);	\
+      for (size_t j = 0; j < sizeof (ui.x); j++)			\
+	printf ("%02hhx", ui.x[j]);					\
+      printf ("'\n");							\
+      printf ("error: %s:%d: value buffer: `", __FILE__, __LINE__);	\
+      for (size_t j = 0; j < sizeof (uv.x); j++)			\
+	printf ("%02hhx", uv.x[j]);					\
+      printf ("'\n");							\
+    }									\
+									\
+  *errp = err;								\
+  match;								\
+})
+
+#define read_real(errp)							\
+({									\
+  __label__ out;							\
+  bool m = false;							\
+  int err = 0;								\
+  type_t v;								\
+  int ch;								\
+									\
+  ch = read_input ();							\
+  if (ch == '-' || ch == '+')						\
+    {									\
+      m = ch == '-';							\
+      ch = read_input ();						\
+    }									\
+									\
+  switch (ch)								\
+    {									\
+    case '0':								\
+      break;								\
+    case 'I':								\
+    case 'i':								\
+      {									\
+	static const char unf[] = { 'N', 'F' };				\
+	static const char lnf[] = { 'n', 'f' };				\
+	size_t i;							\
+									\
+	for (i = 0; i < sizeof (unf); i++)				\
+	  {								\
+	    ch = read_input ();						\
+	    if (ch != unf[i] && ch != lnf[i])				\
+	      {								\
+		err = ch < 0 ? ch : INPUT_FORMAT;			\
+		v = NAN;						\
+		goto out;						\
+	      }								\
+	  }								\
+									\
+	ch = read_input ();						\
+	if (ch == ':')							\
+	  {								\
+	    v = m ? -INFINITY : +INFINITY;				\
+	    goto out;							\
+	  }								\
+									\
+	static const char uinity[] = { 'I', 'N', 'I', 'T', 'Y' };	\
+	static const char linity[] = { 'i', 'n', 'i', 't', 'y' };	\
+									\
+	for (i = 0; i < sizeof (uinity); i++)				\
+	  {								\
+	    if (ch != uinity[i] && ch != linity[i])			\
+	      {								\
+		err = ch < 0 ? ch : INPUT_FORMAT;			\
+		v = NAN;						\
+		goto out;						\
+	      }								\
+	    ch = read_input ();						\
+	  }								\
+	if (ch == ':')							\
+	  {								\
+	    v = m ? -INFINITY : +INFINITY;				\
+	    goto out;							\
+	  }								\
+      }									\
+      err = ch < 0 ? ch : INPUT_FORMAT;					\
+      v = NAN;								\
+      goto out;								\
+									\
+    case 'N':								\
+    case 'n':								\
+      {									\
+	static const char uan[] = { 'A', 'N' };				\
+	static const char lan[] = { 'a', 'n' };				\
+	size_t i;							\
+									\
+	for (i = 0; i < sizeof (uan); i++)				\
+	  {								\
+	    ch = read_input ();						\
+	    if (ch != uan[i] && ch != lan[i])				\
+	      {								\
+		err = ch < 0 ? ch : INPUT_FORMAT;			\
+		v = NAN;						\
+		goto out;						\
+	      }								\
+	  }								\
+									\
+	ch = read_input ();						\
+	if (ch == ':')							\
+	  {								\
+	    v = m ? -nan (v, ".") : nan (v, ".");			\
+	    goto out;							\
+	  }								\
+									\
+	size_t seq_size = 0;						\
+	char *seq = NULL;						\
+	i = 0;								\
+	if (ch == '(')							\
+	  while (1)							\
+	    {								\
+	      ch = read_input ();					\
+	      if (ch == ')')						\
+		break;							\
+	      if (ch != '_' && !isdigit (ch)				\
+		  && !(ch >= 'A' && ch <= 'Z')				\
+		  && !(ch >= 'a' && ch <= 'z'))				\
+		{							\
+		  free (seq);						\
+		  err = ch < 0 ? ch : INPUT_FORMAT;			\
+		  v = NAN;						\
+		  goto out;						\
+		}							\
+	      if (i == seq_size)					\
+		{							\
+		  seq_size += SIZE_CHUNK;				\
+		  seq = xrealloc (seq, seq_size);			\
+		}							\
+	      seq[i++] = ch;						\
+	    }								\
+	seq[i] = '\0';							\
+									\
+	ch = read_input ();						\
+	if (ch == ':')							\
+	  {								\
+	    v = m ? -nan (v, seq) : nan (v, seq);			\
+	    free (seq);							\
+	    goto out;							\
+	  }								\
+	free (seq);							\
+      }									\
+      err = ch < 0 ? ch : INPUT_FORMAT;					\
+      v = NAN;								\
+      goto out;								\
+									\
+    default:								\
+      err = ch < 0 ? ch : INPUT_FORMAT;					\
+      v = NAN;								\
+      goto out;								\
+    }									\
+									\
+  ch = read_input ();							\
+  if (ch != 'X' && ch != 'x')						\
+    {									\
+      err = ch < 0 ? ch : INPUT_FORMAT;					\
+      v = NAN;								\
+      goto out;								\
+    }									\
+									\
+  type_t f = m ? -1.0 : 1.0;						\
+  v = m ? -0.0 : 0.0;							\
+  int i = 0;								\
+  do									\
+    {									\
+      int d = 0;							\
+									\
+      ch = read_input ();						\
+									\
+      if (i == 1)							\
+	switch (ch)							\
+	  {								\
+	  case '.':							\
+	    i++;							\
+	    continue;							\
+									\
+	  case ':':							\
+	  case 'P':							\
+	  case 'p':							\
+	    break;							\
+									\
+	  default:							\
+	    err = ch < 0 ? ch : INPUT_FORMAT;				\
+	    v = NAN;							\
+	    goto out;							\
+	  }								\
+									\
+      switch (ch)							\
+	{								\
+	case '0':							\
+	case '1':							\
+	case '2':							\
+	case '3':							\
+	case '4':							\
+	case '5':							\
+	case '6':							\
+	case '7':							\
+	case '8':							\
+	case '9':							\
+	  d = ch - '0';							\
+	  break;							\
+									\
+	case 'A':							\
+	case 'B':							\
+	case 'C':							\
+	case 'D':							\
+	case 'E':							\
+	case 'F':							\
+	  d = ch - 'A' + 10;						\
+	  break;							\
+									\
+	case 'a':							\
+	case 'b':							\
+	case 'c':							\
+	case 'd':							\
+	case 'e':							\
+	case 'f':							\
+	  d = ch - 'a' + 10;						\
+	  break;							\
+									\
+	case ':':							\
+	case 'P':							\
+	case 'p':							\
+	  if (i == 0)							\
+	    {								\
+	      err = INPUT_FORMAT;					\
+	      v = NAN;							\
+	      goto out;							\
+	    }								\
+	  break;							\
+									\
+	default:							\
+	  err = ch < 0 ? ch : INPUT_FORMAT;				\
+	  v = NAN;							\
+	  goto out;							\
+	}								\
+									\
+      v += f * d;							\
+      f /= 16.0l;							\
+      i++;								\
+    }									\
+  while (ch != ':' && ch != 'P' && ch != 'p');				\
+									\
+  long long exp = 0;							\
+  if (ch == 'P' || ch == 'p')						\
+    {									\
+      exp = read_integer (&err);					\
+      if (err)								\
+	{								\
+	  v = NAN;							\
+	  goto out;							\
+	}								\
+    }									\
+									\
+  errno = 0;								\
+  v = ldexp (v, exp);							\
+  if ((v == HUGE_VALL || v == -HUGE_VALL) && errno != 0)		\
+    {									\
+      err = INPUT_OVERFLOW;						\
+      v = NAN;								\
+      goto out;								\
+    }									\
+									\
+out:									\
+  *errp = err;								\
+  v;									\
+})