glibc/stdio-common/tst-scanf-format-real.h

364 lines
9.8 KiB
C

/* Test feature wrapper for formatted real input.
Copyright (C) 2025 Free Software Foundation, Inc.
This file is part of the GNU C Library.
The GNU C Library is free software; you can redistribute it and/or
modify it under the terms of the GNU Lesser General Public
License as published by the Free Software Foundation; either
version 2.1 of the License, or (at your option) any later version.
The GNU C Library is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
Lesser General Public License for more details.
You should have received a copy of the GNU Lesser General Public
License along with the GNU C Library; if not, see
<https://www.gnu.org/licenses/>. */
#include <ctype.h>
#include <errno.h>
#include <float.h>
#include <tgmath.h>
#include <stdbool.h>
#include <stddef.h>
#include <stdlib.h>
#include <string.h>
#include <support/support.h>
/* Reference data is a case-inensitive signed datum, which is either a
hexadecimal floating constant or a literal representing infinity or
NaN data in any of the forms accepted by 'strtod' family functions,
whose binary representation is to match against byte-wise.
We need to be careful with parsing reference data in the handling of
the sign as with the IBM long double binary format unary negation
of a positive value whose lower-magnitude part is zero produces a
bit pattern that is different from one produced by initialization or
conversions made by functions such as 'scanf' or 'strtod' from the
complementing negative value. The difference is in the sign of zero
held in the lower-magnitude part and therefore the bit patterns are
arithmetically equivalent, but they do not match byte-wise.
Therefore we set the sign with the initial value of the significand,
either -0.0 or 0.0, which sets the sign of both parts according to
what 'scanf' does, and never negate it afterwards.
Additionally the Intel long double binary format uses only 80 bits
out of 96 that the data type occupies. Therefore preinitialize the
reference value with the same 0xa5 bit pattern that the value under
test has been so that the byte-wise comparison matches as well for
the unused parts of the two data pieces.
We use 'ldexp' to assemble the significand with the exponent, which
does not compromise verification, because internally this exercises
a code path different from one used by 'scanf' family functions for
this purpose. Specifically 'ldexp' uses 'scalbn', whereas 'scanf'
defers to 'strtod' which uses '__mpn_construct_double'. Analogously
for the remaining floating-point data types. */
#define nan(v, x) \
_Generic((v), float: nanf, double: nan, long double: nanl) (x)
#define pointer_to_value(val) (&(val))
#define initialize_value(val) \
memset (&val, 0xa5, sizeof (val))
#define compare_real(x, y) \
(memcmp (&(x), &(y), sizeof (y)) == 0)
#define verify_input(f, val, count, errp) \
({ \
__label__ out; \
bool match = true; \
int err = 0; \
type_t v; \
\
initialize_value (v); \
/* Make sure it's been committed. */ \
__asm__ ("" : : : "memory"); \
v = read_real (&err); \
if (err < 0) \
goto out; \
match = compare_real (val, v); \
\
out: \
if (err || !match) \
{ \
union \
{ \
type_t v; \
unsigned char x[sizeof (type_t)]; \
} \
uv = { .v = v }, ui = { .v = val }; \
\
printf ("error: %s:%d: input buffer: `", __FILE__, __LINE__); \
for (size_t j = 0; j < sizeof (ui.x); j++) \
printf ("%02hhx", ui.x[j]); \
printf ("'\n"); \
printf ("error: %s:%d: value buffer: `", __FILE__, __LINE__); \
for (size_t j = 0; j < sizeof (uv.x); j++) \
printf ("%02hhx", uv.x[j]); \
printf ("'\n"); \
} \
\
*errp = err; \
match; \
})
#define read_real(errp) \
({ \
__label__ out; \
bool m = false; \
int err = 0; \
type_t v; \
int ch; \
\
ch = read_input (); \
if (ch == '-' || ch == '+') \
{ \
m = ch == '-'; \
ch = read_input (); \
} \
\
switch (ch) \
{ \
case '0': \
break; \
case 'I': \
case 'i': \
{ \
static const char unf[] = { 'N', 'F' }; \
static const char lnf[] = { 'n', 'f' }; \
size_t i; \
\
for (i = 0; i < sizeof (unf); i++) \
{ \
ch = read_input (); \
if (ch != unf[i] && ch != lnf[i]) \
{ \
err = ch < 0 ? ch : INPUT_FORMAT; \
v = NAN; \
goto out; \
} \
} \
\
ch = read_input (); \
if (ch == ':') \
{ \
v = m ? -INFINITY : +INFINITY; \
goto out; \
} \
\
static const char uinity[] = { 'I', 'N', 'I', 'T', 'Y' }; \
static const char linity[] = { 'i', 'n', 'i', 't', 'y' }; \
\
for (i = 0; i < sizeof (uinity); i++) \
{ \
if (ch != uinity[i] && ch != linity[i]) \
{ \
err = ch < 0 ? ch : INPUT_FORMAT; \
v = NAN; \
goto out; \
} \
ch = read_input (); \
} \
if (ch == ':') \
{ \
v = m ? -INFINITY : +INFINITY; \
goto out; \
} \
} \
err = ch < 0 ? ch : INPUT_FORMAT; \
v = NAN; \
goto out; \
\
case 'N': \
case 'n': \
{ \
static const char uan[] = { 'A', 'N' }; \
static const char lan[] = { 'a', 'n' }; \
size_t i; \
\
for (i = 0; i < sizeof (uan); i++) \
{ \
ch = read_input (); \
if (ch != uan[i] && ch != lan[i]) \
{ \
err = ch < 0 ? ch : INPUT_FORMAT; \
v = NAN; \
goto out; \
} \
} \
\
ch = read_input (); \
if (ch == ':') \
{ \
v = m ? -nan (v, ".") : nan (v, "."); \
goto out; \
} \
\
size_t seq_size = 0; \
char *seq = NULL; \
i = 0; \
if (ch == '(') \
while (1) \
{ \
ch = read_input (); \
if (ch == ')') \
break; \
if (ch != '_' && !isdigit (ch) \
&& !(ch >= 'A' && ch <= 'Z') \
&& !(ch >= 'a' && ch <= 'z')) \
{ \
free (seq); \
err = ch < 0 ? ch : INPUT_FORMAT; \
v = NAN; \
goto out; \
} \
if (i == seq_size) \
{ \
seq_size += SIZE_CHUNK; \
seq = xrealloc (seq, seq_size); \
} \
seq[i++] = ch; \
} \
seq[i] = '\0'; \
\
ch = read_input (); \
if (ch == ':') \
{ \
v = m ? -nan (v, seq) : nan (v, seq); \
free (seq); \
goto out; \
} \
free (seq); \
} \
err = ch < 0 ? ch : INPUT_FORMAT; \
v = NAN; \
goto out; \
\
default: \
err = ch < 0 ? ch : INPUT_FORMAT; \
v = NAN; \
goto out; \
} \
\
ch = read_input (); \
if (ch != 'X' && ch != 'x') \
{ \
err = ch < 0 ? ch : INPUT_FORMAT; \
v = NAN; \
goto out; \
} \
\
type_t f = m ? -1.0 : 1.0; \
v = m ? -0.0 : 0.0; \
int i = 0; \
do \
{ \
int d = 0; \
\
ch = read_input (); \
\
if (i == 1) \
switch (ch) \
{ \
case '.': \
i++; \
continue; \
\
case ':': \
case 'P': \
case 'p': \
break; \
\
default: \
err = ch < 0 ? ch : INPUT_FORMAT; \
v = NAN; \
goto out; \
} \
\
switch (ch) \
{ \
case '0': \
case '1': \
case '2': \
case '3': \
case '4': \
case '5': \
case '6': \
case '7': \
case '8': \
case '9': \
d = ch - '0'; \
break; \
\
case 'A': \
case 'B': \
case 'C': \
case 'D': \
case 'E': \
case 'F': \
d = ch - 'A' + 10; \
break; \
\
case 'a': \
case 'b': \
case 'c': \
case 'd': \
case 'e': \
case 'f': \
d = ch - 'a' + 10; \
break; \
\
case ':': \
case 'P': \
case 'p': \
if (i == 0) \
{ \
err = INPUT_FORMAT; \
v = NAN; \
goto out; \
} \
break; \
\
default: \
err = ch < 0 ? ch : INPUT_FORMAT; \
v = NAN; \
goto out; \
} \
\
v += f * d; \
f /= 16.0l; \
i++; \
} \
while (ch != ':' && ch != 'P' && ch != 'p'); \
\
long long exp = 0; \
if (ch == 'P' || ch == 'p') \
{ \
exp = read_integer (&err); \
if (err) \
{ \
v = NAN; \
goto out; \
} \
} \
\
errno = 0; \
v = ldexp (v, exp); \
if ((v == HUGE_VALL || v == -HUGE_VALL) && errno != 0) \
{ \
err = INPUT_OVERFLOW; \
v = NAN; \
goto out; \
} \
\
out: \
*errp = err; \
v; \
})