mirror of
				https://sourceware.org/git/glibc.git
				synced 2025-10-26 00:57:39 +03:00 
			
		
		
		
	The use of the same name for a local variable combined with passing a pointer to it to a nested macro call causes the wrong 'err' variable to be updated in 'read_real', because '&err' is only expanded at '*errp' evaluation. Consequently the variable defined in 'read_real' is set rather than one in its 'verify_input' caller as it would be the case should 'read_real' be a function, leading to invalid input such as: %a:nan:1:3:nan(: to be accepted. Address the issue by renaming the 'err' variable in 'verify_input' to 'errx', causing such input to be correctly rejected: error: ./tst-scanf-format-skeleton.c:242: input line 1: input data format error No test case added as it's a test case issue in the first place. Reviewed-by: Adhemerval Zanella <adhemerval.zanella@linaro.org>
		
			
				
	
	
		
			364 lines
		
	
	
		
			9.8 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			364 lines
		
	
	
		
			9.8 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
| /* Test feature wrapper for formatted real input.
 | |
|    Copyright (C) 2025 Free Software Foundation, Inc.
 | |
|    This file is part of the GNU C Library.
 | |
| 
 | |
|    The GNU C Library is free software; you can redistribute it and/or
 | |
|    modify it under the terms of the GNU Lesser General Public
 | |
|    License as published by the Free Software Foundation; either
 | |
|    version 2.1 of the License, or (at your option) any later version.
 | |
| 
 | |
|    The GNU C Library is distributed in the hope that it will be useful,
 | |
|    but WITHOUT ANY WARRANTY; without even the implied warranty of
 | |
|    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 | |
|    Lesser General Public License for more details.
 | |
| 
 | |
|    You should have received a copy of the GNU Lesser General Public
 | |
|    License along with the GNU C Library; if not, see
 | |
|    <https://www.gnu.org/licenses/>.  */
 | |
| 
 | |
| #include <ctype.h>
 | |
| #include <errno.h>
 | |
| #include <float.h>
 | |
| #include <tgmath.h>
 | |
| #include <stdbool.h>
 | |
| #include <stddef.h>
 | |
| #include <stdlib.h>
 | |
| #include <string.h>
 | |
| 
 | |
| #include <support/support.h>
 | |
| 
 | |
| /* Reference data is a case-inensitive signed datum, which is either a
 | |
|    hexadecimal floating constant or a literal representing infinity or
 | |
|    NaN data in any of the forms accepted by 'strtod' family functions,
 | |
|    whose binary representation is to match against byte-wise.
 | |
| 
 | |
|    We need to be careful with parsing reference data in the handling of
 | |
|    the sign as with the IBM long double binary format unary negation
 | |
|    of a positive value whose lower-magnitude part is zero produces a
 | |
|    bit pattern that is different from one produced by initialization or
 | |
|    conversions made by functions such as 'scanf' or 'strtod' from the
 | |
|    complementing negative value.  The difference is in the sign of zero
 | |
|    held in the lower-magnitude part and therefore the bit patterns are
 | |
|    arithmetically equivalent, but they do not match byte-wise.
 | |
| 
 | |
|    Therefore we set the sign with the initial value of the significand,
 | |
|    either -0.0 or 0.0, which sets the sign of both parts according to
 | |
|    what 'scanf' does, and never negate it afterwards.
 | |
| 
 | |
|    Additionally the Intel long double binary format uses only 80 bits
 | |
|    out of 96 that the data type occupies.  Therefore preinitialize the
 | |
|    reference value with the same 0xa5 bit pattern that the value under
 | |
|    test has been so that the byte-wise comparison matches as well for
 | |
|    the unused parts of the two data pieces.
 | |
| 
 | |
|    We use 'ldexp' to assemble the significand with the exponent, which
 | |
|    does not compromise verification, because internally this exercises
 | |
|    a code path different from one used by 'scanf' family functions for
 | |
|    this purpose.  Specifically 'ldexp' uses 'scalbn', whereas 'scanf'
 | |
|    defers to 'strtod' which uses '__mpn_construct_double'.  Analogously
 | |
|    for the remaining floating-point data types.  */
 | |
| 
 | |
| #define nan(v, x)							\
 | |
|   _Generic((v), float: nanf, double: nan, long double: nanl) (x)
 | |
| 
 | |
| #define pointer_to_value(val) (&(val))
 | |
| 
 | |
| #define initialize_value(val)						\
 | |
|   memset (&val, 0xa5, sizeof (val))
 | |
| 
 | |
| #define compare_real(x, y)						\
 | |
|   (memcmp (&(x), &(y), sizeof (y)) == 0)
 | |
| 
 | |
| #define verify_input(f, val, count, errp)				\
 | |
| ({									\
 | |
|   __label__ out;							\
 | |
|   bool match = true;							\
 | |
|   int errx = 0;								\
 | |
|   type_t v;								\
 | |
| 									\
 | |
|   initialize_value (v);							\
 | |
|   /* Make sure it's been committed.  */					\
 | |
|   __asm__ ("" : : : "memory");						\
 | |
|   v = read_real (&errx);						\
 | |
|   if (errx < 0)								\
 | |
|     goto out;								\
 | |
|   match = compare_real (val, v);					\
 | |
| 									\
 | |
| out:									\
 | |
|   if (errx || !match)							\
 | |
|     {									\
 | |
|       union								\
 | |
| 	{								\
 | |
| 	  type_t v;							\
 | |
| 	  unsigned char x[sizeof (type_t)];				\
 | |
| 	}								\
 | |
|       uv = { .v = v }, ui = { .v = val };				\
 | |
| 									\
 | |
|       printf ("error: %s:%d: input buffer: `", __FILE__, __LINE__);	\
 | |
|       for (size_t j = 0; j < sizeof (ui.x); j++)			\
 | |
| 	printf ("%02hhx", ui.x[j]);					\
 | |
|       printf ("'\n");							\
 | |
|       printf ("error: %s:%d: value buffer: `", __FILE__, __LINE__);	\
 | |
|       for (size_t j = 0; j < sizeof (uv.x); j++)			\
 | |
| 	printf ("%02hhx", uv.x[j]);					\
 | |
|       printf ("'\n");							\
 | |
|     }									\
 | |
| 									\
 | |
|   *errp = errx;								\
 | |
|   match;								\
 | |
| })
 | |
| 
 | |
| #define read_real(errp)							\
 | |
| ({									\
 | |
|   __label__ out;							\
 | |
|   bool m = false;							\
 | |
|   int err = 0;								\
 | |
|   type_t v;								\
 | |
|   int ch;								\
 | |
| 									\
 | |
|   ch = read_input ();							\
 | |
|   if (ch == '-' || ch == '+')						\
 | |
|     {									\
 | |
|       m = ch == '-';							\
 | |
|       ch = read_input ();						\
 | |
|     }									\
 | |
| 									\
 | |
|   switch (ch)								\
 | |
|     {									\
 | |
|     case '0':								\
 | |
|       break;								\
 | |
|     case 'I':								\
 | |
|     case 'i':								\
 | |
|       {									\
 | |
| 	static const char unf[] = { 'N', 'F' };				\
 | |
| 	static const char lnf[] = { 'n', 'f' };				\
 | |
| 	size_t i;							\
 | |
| 									\
 | |
| 	for (i = 0; i < sizeof (unf); i++)				\
 | |
| 	  {								\
 | |
| 	    ch = read_input ();						\
 | |
| 	    if (ch != unf[i] && ch != lnf[i])				\
 | |
| 	      {								\
 | |
| 		err = ch < 0 ? ch : INPUT_FORMAT;			\
 | |
| 		v = NAN;						\
 | |
| 		goto out;						\
 | |
| 	      }								\
 | |
| 	  }								\
 | |
| 									\
 | |
| 	ch = read_input ();						\
 | |
| 	if (ch == ':')							\
 | |
| 	  {								\
 | |
| 	    v = m ? -INFINITY : +INFINITY;				\
 | |
| 	    goto out;							\
 | |
| 	  }								\
 | |
| 									\
 | |
| 	static const char uinity[] = { 'I', 'N', 'I', 'T', 'Y' };	\
 | |
| 	static const char linity[] = { 'i', 'n', 'i', 't', 'y' };	\
 | |
| 									\
 | |
| 	for (i = 0; i < sizeof (uinity); i++)				\
 | |
| 	  {								\
 | |
| 	    if (ch != uinity[i] && ch != linity[i])			\
 | |
| 	      {								\
 | |
| 		err = ch < 0 ? ch : INPUT_FORMAT;			\
 | |
| 		v = NAN;						\
 | |
| 		goto out;						\
 | |
| 	      }								\
 | |
| 	    ch = read_input ();						\
 | |
| 	  }								\
 | |
| 	if (ch == ':')							\
 | |
| 	  {								\
 | |
| 	    v = m ? -INFINITY : +INFINITY;				\
 | |
| 	    goto out;							\
 | |
| 	  }								\
 | |
|       }									\
 | |
|       err = ch < 0 ? ch : INPUT_FORMAT;					\
 | |
|       v = NAN;								\
 | |
|       goto out;								\
 | |
| 									\
 | |
|     case 'N':								\
 | |
|     case 'n':								\
 | |
|       {									\
 | |
| 	static const char uan[] = { 'A', 'N' };				\
 | |
| 	static const char lan[] = { 'a', 'n' };				\
 | |
| 	size_t i;							\
 | |
| 									\
 | |
| 	for (i = 0; i < sizeof (uan); i++)				\
 | |
| 	  {								\
 | |
| 	    ch = read_input ();						\
 | |
| 	    if (ch != uan[i] && ch != lan[i])				\
 | |
| 	      {								\
 | |
| 		err = ch < 0 ? ch : INPUT_FORMAT;			\
 | |
| 		v = NAN;						\
 | |
| 		goto out;						\
 | |
| 	      }								\
 | |
| 	  }								\
 | |
| 									\
 | |
| 	ch = read_input ();						\
 | |
| 	if (ch == ':')							\
 | |
| 	  {								\
 | |
| 	    v = m ? -nan (v, ".") : nan (v, ".");			\
 | |
| 	    goto out;							\
 | |
| 	  }								\
 | |
| 									\
 | |
| 	size_t seq_size = 0;						\
 | |
| 	char *seq = NULL;						\
 | |
| 	i = 0;								\
 | |
| 	if (ch == '(')							\
 | |
| 	  while (1)							\
 | |
| 	    {								\
 | |
| 	      ch = read_input ();					\
 | |
| 	      if (ch == ')')						\
 | |
| 		break;							\
 | |
| 	      if (ch != '_' && !isdigit (ch)				\
 | |
| 		  && !(ch >= 'A' && ch <= 'Z')				\
 | |
| 		  && !(ch >= 'a' && ch <= 'z'))				\
 | |
| 		{							\
 | |
| 		  free (seq);						\
 | |
| 		  err = ch < 0 ? ch : INPUT_FORMAT;			\
 | |
| 		  v = NAN;						\
 | |
| 		  goto out;						\
 | |
| 		}							\
 | |
| 	      if (i == seq_size)					\
 | |
| 		{							\
 | |
| 		  seq_size += SIZE_CHUNK;				\
 | |
| 		  seq = xrealloc (seq, seq_size);			\
 | |
| 		}							\
 | |
| 	      seq[i++] = ch;						\
 | |
| 	    }								\
 | |
| 	seq[i] = '\0';							\
 | |
| 									\
 | |
| 	ch = read_input ();						\
 | |
| 	if (ch == ':')							\
 | |
| 	  {								\
 | |
| 	    v = m ? -nan (v, seq) : nan (v, seq);			\
 | |
| 	    free (seq);							\
 | |
| 	    goto out;							\
 | |
| 	  }								\
 | |
| 	free (seq);							\
 | |
|       }									\
 | |
|       err = ch < 0 ? ch : INPUT_FORMAT;					\
 | |
|       v = NAN;								\
 | |
|       goto out;								\
 | |
| 									\
 | |
|     default:								\
 | |
|       err = ch < 0 ? ch : INPUT_FORMAT;					\
 | |
|       v = NAN;								\
 | |
|       goto out;								\
 | |
|     }									\
 | |
| 									\
 | |
|   ch = read_input ();							\
 | |
|   if (ch != 'X' && ch != 'x')						\
 | |
|     {									\
 | |
|       err = ch < 0 ? ch : INPUT_FORMAT;					\
 | |
|       v = NAN;								\
 | |
|       goto out;								\
 | |
|     }									\
 | |
| 									\
 | |
|   type_t f = m ? -1.0 : 1.0;						\
 | |
|   v = m ? -0.0 : 0.0;							\
 | |
|   int i = 0;								\
 | |
|   do									\
 | |
|     {									\
 | |
|       int d = 0;							\
 | |
| 									\
 | |
|       ch = read_input ();						\
 | |
| 									\
 | |
|       if (i == 1)							\
 | |
| 	switch (ch)							\
 | |
| 	  {								\
 | |
| 	  case '.':							\
 | |
| 	    i++;							\
 | |
| 	    continue;							\
 | |
| 									\
 | |
| 	  case ':':							\
 | |
| 	  case 'P':							\
 | |
| 	  case 'p':							\
 | |
| 	    break;							\
 | |
| 									\
 | |
| 	  default:							\
 | |
| 	    err = ch < 0 ? ch : INPUT_FORMAT;				\
 | |
| 	    v = NAN;							\
 | |
| 	    goto out;							\
 | |
| 	  }								\
 | |
| 									\
 | |
|       switch (ch)							\
 | |
| 	{								\
 | |
| 	case '0':							\
 | |
| 	case '1':							\
 | |
| 	case '2':							\
 | |
| 	case '3':							\
 | |
| 	case '4':							\
 | |
| 	case '5':							\
 | |
| 	case '6':							\
 | |
| 	case '7':							\
 | |
| 	case '8':							\
 | |
| 	case '9':							\
 | |
| 	  d = ch - '0';							\
 | |
| 	  break;							\
 | |
| 									\
 | |
| 	case 'A':							\
 | |
| 	case 'B':							\
 | |
| 	case 'C':							\
 | |
| 	case 'D':							\
 | |
| 	case 'E':							\
 | |
| 	case 'F':							\
 | |
| 	  d = ch - 'A' + 10;						\
 | |
| 	  break;							\
 | |
| 									\
 | |
| 	case 'a':							\
 | |
| 	case 'b':							\
 | |
| 	case 'c':							\
 | |
| 	case 'd':							\
 | |
| 	case 'e':							\
 | |
| 	case 'f':							\
 | |
| 	  d = ch - 'a' + 10;						\
 | |
| 	  break;							\
 | |
| 									\
 | |
| 	case ':':							\
 | |
| 	case 'P':							\
 | |
| 	case 'p':							\
 | |
| 	  if (i == 0)							\
 | |
| 	    {								\
 | |
| 	      err = INPUT_FORMAT;					\
 | |
| 	      v = NAN;							\
 | |
| 	      goto out;							\
 | |
| 	    }								\
 | |
| 	  break;							\
 | |
| 									\
 | |
| 	default:							\
 | |
| 	  err = ch < 0 ? ch : INPUT_FORMAT;				\
 | |
| 	  v = NAN;							\
 | |
| 	  goto out;							\
 | |
| 	}								\
 | |
| 									\
 | |
|       v += f * d;							\
 | |
|       f /= 16.0l;							\
 | |
|       i++;								\
 | |
|     }									\
 | |
|   while (ch != ':' && ch != 'P' && ch != 'p');				\
 | |
| 									\
 | |
|   long long exp = 0;							\
 | |
|   if (ch == 'P' || ch == 'p')						\
 | |
|     {									\
 | |
|       exp = read_integer (&err);					\
 | |
|       if (err)								\
 | |
| 	{								\
 | |
| 	  v = NAN;							\
 | |
| 	  goto out;							\
 | |
| 	}								\
 | |
|     }									\
 | |
| 									\
 | |
|   errno = 0;								\
 | |
|   v = ldexp (v, exp);							\
 | |
|   if ((v == HUGE_VALL || v == -HUGE_VALL) && errno != 0)		\
 | |
|     {									\
 | |
|       err = INPUT_OVERFLOW;						\
 | |
|       v = NAN;								\
 | |
|       goto out;								\
 | |
|     }									\
 | |
| 									\
 | |
| out:									\
 | |
|   *errp = err;								\
 | |
|   v;									\
 | |
| })
 |