mirror of
https://sourceware.org/git/glibc.git
synced 2025-04-19 01:04:13 +03:00
Add a collection of tests for formatted scanf input specifiers covering the b, d, i, o, u, x, and X integer conversions, the a, A, e, E, f, F, g, and G floating-point conversions, and the [, c, and s character conversions. Also the hh, h, l, and ll length modifiers are covered with the integer conversions as are the l and L length modifier with the floating-point conversions. The tests cover assignment suppressing and the field width as well, verifying the number of assignments made, the number of characters consumed and the value assigned. Add the common test code here as well as test cases for scanf, and then base Makefile infrastructure plus target-agnostic input data, for the character conversions and the `char', `short', and `long long' integer ones, signed and unsigned, with remaining input data and other functions from the scanf family deferred to subsequent additions. Keep input data disabled and referring to BZ #12701 for entries that are currently incorrectly accepted as valid data, such as '0b' or '0x' with the relevant integer conversions or sequences of an insufficient number of characters with the c conversion. Reviewed-by: Joseph Myers <josmyers@redhat.com>
364 lines
9.8 KiB
C
364 lines
9.8 KiB
C
/* Test feature wrapper for formatted real input.
|
|
Copyright (C) 2025 Free Software Foundation, Inc.
|
|
This file is part of the GNU C Library.
|
|
|
|
The GNU C Library is free software; you can redistribute it and/or
|
|
modify it under the terms of the GNU Lesser General Public
|
|
License as published by the Free Software Foundation; either
|
|
version 2.1 of the License, or (at your option) any later version.
|
|
|
|
The GNU C Library is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
Lesser General Public License for more details.
|
|
|
|
You should have received a copy of the GNU Lesser General Public
|
|
License along with the GNU C Library; if not, see
|
|
<https://www.gnu.org/licenses/>. */
|
|
|
|
#include <ctype.h>
|
|
#include <errno.h>
|
|
#include <float.h>
|
|
#include <tgmath.h>
|
|
#include <stdbool.h>
|
|
#include <stddef.h>
|
|
#include <stdlib.h>
|
|
#include <string.h>
|
|
|
|
#include <support/support.h>
|
|
|
|
/* Reference data is a case-inensitive signed datum, which is either a
|
|
hexadecimal floating constant or a literal representing infinity or
|
|
NaN data in any of the forms accepted by 'strtod' family functions,
|
|
whose binary representation is to match against byte-wise.
|
|
|
|
We need to be careful with parsing reference data in the handling of
|
|
the sign as with the IBM long double binary format unary negation
|
|
of a positive value whose lower-magnitude part is zero produces a
|
|
bit pattern that is different from one produced by initialization or
|
|
conversions made by functions such as 'scanf' or 'strtod' from the
|
|
complementing negative value. The difference is in the sign of zero
|
|
held in the lower-magnitude part and therefore the bit patterns are
|
|
arithmetically equivalent, but they do not match byte-wise.
|
|
|
|
Therefore we set the sign with the initial value of the significand,
|
|
either -0.0 or 0.0, which sets the sign of both parts according to
|
|
what 'scanf' does, and never negate it afterwards.
|
|
|
|
Additionally the Intel long double binary format uses only 80 bits
|
|
out of 96 that the data type occupies. Therefore preinitialize the
|
|
reference value with the same 0xa5 bit pattern that the value under
|
|
test has been so that the byte-wise comparison matches as well for
|
|
the unused parts of the two data pieces.
|
|
|
|
We use 'ldexp' to assemble the significand with the exponent, which
|
|
does not compromise verification, because internally this exercises
|
|
a code path different from one used by 'scanf' family functions for
|
|
this purpose. Specifically 'ldexp' uses 'scalbn', whereas 'scanf'
|
|
defers to 'strtod' which uses '__mpn_construct_double'. Analogously
|
|
for the remaining floating-point data types. */
|
|
|
|
#define nan(v, x) \
|
|
_Generic((v), float: nanf, double: nan, long double: nanl) (x)
|
|
|
|
#define pointer_to_value(val) (&(val))
|
|
|
|
#define initialize_value(val) \
|
|
memset (&val, 0xa5, sizeof (val))
|
|
|
|
#define compare_real(x, y) \
|
|
(memcmp (&(x), &(y), sizeof (y)) == 0)
|
|
|
|
#define verify_input(f, val, count, errp) \
|
|
({ \
|
|
__label__ out; \
|
|
bool match = true; \
|
|
int err = 0; \
|
|
type_t v; \
|
|
\
|
|
initialize_value (v); \
|
|
/* Make sure it's been committed. */ \
|
|
__asm__ ("" : : : "memory"); \
|
|
v = read_real (&err); \
|
|
if (err < 0) \
|
|
goto out; \
|
|
match = compare_real (val, v); \
|
|
\
|
|
out: \
|
|
if (err || !match) \
|
|
{ \
|
|
union \
|
|
{ \
|
|
type_t v; \
|
|
unsigned char x[sizeof (type_t)]; \
|
|
} \
|
|
uv = { .v = v }, ui = { .v = val }; \
|
|
\
|
|
printf ("error: %s:%d: input buffer: `", __FILE__, __LINE__); \
|
|
for (size_t j = 0; j < sizeof (ui.x); j++) \
|
|
printf ("%02hhx", ui.x[j]); \
|
|
printf ("'\n"); \
|
|
printf ("error: %s:%d: value buffer: `", __FILE__, __LINE__); \
|
|
for (size_t j = 0; j < sizeof (uv.x); j++) \
|
|
printf ("%02hhx", uv.x[j]); \
|
|
printf ("'\n"); \
|
|
} \
|
|
\
|
|
*errp = err; \
|
|
match; \
|
|
})
|
|
|
|
#define read_real(errp) \
|
|
({ \
|
|
__label__ out; \
|
|
bool m = false; \
|
|
int err = 0; \
|
|
type_t v; \
|
|
int ch; \
|
|
\
|
|
ch = read_input (); \
|
|
if (ch == '-' || ch == '+') \
|
|
{ \
|
|
m = ch == '-'; \
|
|
ch = read_input (); \
|
|
} \
|
|
\
|
|
switch (ch) \
|
|
{ \
|
|
case '0': \
|
|
break; \
|
|
case 'I': \
|
|
case 'i': \
|
|
{ \
|
|
static const char unf[] = { 'N', 'F' }; \
|
|
static const char lnf[] = { 'n', 'f' }; \
|
|
size_t i; \
|
|
\
|
|
for (i = 0; i < sizeof (unf); i++) \
|
|
{ \
|
|
ch = read_input (); \
|
|
if (ch != unf[i] && ch != lnf[i]) \
|
|
{ \
|
|
err = ch < 0 ? ch : INPUT_FORMAT; \
|
|
v = NAN; \
|
|
goto out; \
|
|
} \
|
|
} \
|
|
\
|
|
ch = read_input (); \
|
|
if (ch == ':') \
|
|
{ \
|
|
v = m ? -INFINITY : +INFINITY; \
|
|
goto out; \
|
|
} \
|
|
\
|
|
static const char uinity[] = { 'I', 'N', 'I', 'T', 'Y' }; \
|
|
static const char linity[] = { 'i', 'n', 'i', 't', 'y' }; \
|
|
\
|
|
for (i = 0; i < sizeof (uinity); i++) \
|
|
{ \
|
|
if (ch != uinity[i] && ch != linity[i]) \
|
|
{ \
|
|
err = ch < 0 ? ch : INPUT_FORMAT; \
|
|
v = NAN; \
|
|
goto out; \
|
|
} \
|
|
ch = read_input (); \
|
|
} \
|
|
if (ch == ':') \
|
|
{ \
|
|
v = m ? -INFINITY : +INFINITY; \
|
|
goto out; \
|
|
} \
|
|
} \
|
|
err = ch < 0 ? ch : INPUT_FORMAT; \
|
|
v = NAN; \
|
|
goto out; \
|
|
\
|
|
case 'N': \
|
|
case 'n': \
|
|
{ \
|
|
static const char uan[] = { 'A', 'N' }; \
|
|
static const char lan[] = { 'a', 'n' }; \
|
|
size_t i; \
|
|
\
|
|
for (i = 0; i < sizeof (uan); i++) \
|
|
{ \
|
|
ch = read_input (); \
|
|
if (ch != uan[i] && ch != lan[i]) \
|
|
{ \
|
|
err = ch < 0 ? ch : INPUT_FORMAT; \
|
|
v = NAN; \
|
|
goto out; \
|
|
} \
|
|
} \
|
|
\
|
|
ch = read_input (); \
|
|
if (ch == ':') \
|
|
{ \
|
|
v = m ? -nan (v, ".") : nan (v, "."); \
|
|
goto out; \
|
|
} \
|
|
\
|
|
size_t seq_size = 0; \
|
|
char *seq = NULL; \
|
|
i = 0; \
|
|
if (ch == '(') \
|
|
while (1) \
|
|
{ \
|
|
ch = read_input (); \
|
|
if (ch == ')') \
|
|
break; \
|
|
if (ch != '_' && !isdigit (ch) \
|
|
&& !(ch >= 'A' && ch <= 'Z') \
|
|
&& !(ch >= 'a' && ch <= 'z')) \
|
|
{ \
|
|
free (seq); \
|
|
err = ch < 0 ? ch : INPUT_FORMAT; \
|
|
v = NAN; \
|
|
goto out; \
|
|
} \
|
|
if (i == seq_size) \
|
|
{ \
|
|
seq_size += SIZE_CHUNK; \
|
|
seq = xrealloc (seq, seq_size); \
|
|
} \
|
|
seq[i++] = ch; \
|
|
} \
|
|
seq[i] = '\0'; \
|
|
\
|
|
ch = read_input (); \
|
|
if (ch == ':') \
|
|
{ \
|
|
v = m ? -nan (v, seq) : nan (v, seq); \
|
|
free (seq); \
|
|
goto out; \
|
|
} \
|
|
free (seq); \
|
|
} \
|
|
err = ch < 0 ? ch : INPUT_FORMAT; \
|
|
v = NAN; \
|
|
goto out; \
|
|
\
|
|
default: \
|
|
err = ch < 0 ? ch : INPUT_FORMAT; \
|
|
v = NAN; \
|
|
goto out; \
|
|
} \
|
|
\
|
|
ch = read_input (); \
|
|
if (ch != 'X' && ch != 'x') \
|
|
{ \
|
|
err = ch < 0 ? ch : INPUT_FORMAT; \
|
|
v = NAN; \
|
|
goto out; \
|
|
} \
|
|
\
|
|
type_t f = m ? -1.0 : 1.0; \
|
|
v = m ? -0.0 : 0.0; \
|
|
int i = 0; \
|
|
do \
|
|
{ \
|
|
int d = 0; \
|
|
\
|
|
ch = read_input (); \
|
|
\
|
|
if (i == 1) \
|
|
switch (ch) \
|
|
{ \
|
|
case '.': \
|
|
i++; \
|
|
continue; \
|
|
\
|
|
case ':': \
|
|
case 'P': \
|
|
case 'p': \
|
|
break; \
|
|
\
|
|
default: \
|
|
err = ch < 0 ? ch : INPUT_FORMAT; \
|
|
v = NAN; \
|
|
goto out; \
|
|
} \
|
|
\
|
|
switch (ch) \
|
|
{ \
|
|
case '0': \
|
|
case '1': \
|
|
case '2': \
|
|
case '3': \
|
|
case '4': \
|
|
case '5': \
|
|
case '6': \
|
|
case '7': \
|
|
case '8': \
|
|
case '9': \
|
|
d = ch - '0'; \
|
|
break; \
|
|
\
|
|
case 'A': \
|
|
case 'B': \
|
|
case 'C': \
|
|
case 'D': \
|
|
case 'E': \
|
|
case 'F': \
|
|
d = ch - 'A' + 10; \
|
|
break; \
|
|
\
|
|
case 'a': \
|
|
case 'b': \
|
|
case 'c': \
|
|
case 'd': \
|
|
case 'e': \
|
|
case 'f': \
|
|
d = ch - 'a' + 10; \
|
|
break; \
|
|
\
|
|
case ':': \
|
|
case 'P': \
|
|
case 'p': \
|
|
if (i == 0) \
|
|
{ \
|
|
err = INPUT_FORMAT; \
|
|
v = NAN; \
|
|
goto out; \
|
|
} \
|
|
break; \
|
|
\
|
|
default: \
|
|
err = ch < 0 ? ch : INPUT_FORMAT; \
|
|
v = NAN; \
|
|
goto out; \
|
|
} \
|
|
\
|
|
v += f * d; \
|
|
f /= 16.0l; \
|
|
i++; \
|
|
} \
|
|
while (ch != ':' && ch != 'P' && ch != 'p'); \
|
|
\
|
|
long long exp = 0; \
|
|
if (ch == 'P' || ch == 'p') \
|
|
{ \
|
|
exp = read_integer (&err); \
|
|
if (err) \
|
|
{ \
|
|
v = NAN; \
|
|
goto out; \
|
|
} \
|
|
} \
|
|
\
|
|
errno = 0; \
|
|
v = ldexp (v, exp); \
|
|
if ((v == HUGE_VALL || v == -HUGE_VALL) && errno != 0) \
|
|
{ \
|
|
err = INPUT_OVERFLOW; \
|
|
v = NAN; \
|
|
goto out; \
|
|
} \
|
|
\
|
|
out: \
|
|
*errp = err; \
|
|
v; \
|
|
})
|