mirror of
				https://sourceware.org/git/glibc.git
				synced 2025-10-30 10:45:40 +03:00 
			
		
		
		
	
		
			
				
	
	
		
			372 lines
		
	
	
		
			8.4 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			372 lines
		
	
	
		
			8.4 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
| /* Test program for the wide character stream functions handling larger
 | |
|    amounts of text.
 | |
|    Copyright (C) 2000-2025 Free Software Foundation, Inc.
 | |
|    This file is part of the GNU C Library.
 | |
| 
 | |
|    The GNU C Library is free software; you can redistribute it and/or
 | |
|    modify it under the terms of the GNU Lesser General Public
 | |
|    License as published by the Free Software Foundation; either
 | |
|    version 2.1 of the License, or (at your option) any later version.
 | |
| 
 | |
|    The GNU C Library is distributed in the hope that it will be useful,
 | |
|    but WITHOUT ANY WARRANTY; without even the implied warranty of
 | |
|    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 | |
|    Lesser General Public License for more details.
 | |
| 
 | |
|    You should have received a copy of the GNU Lesser General Public
 | |
|    License along with the GNU C Library; if not, see
 | |
|    <https://www.gnu.org/licenses/>.  */
 | |
| 
 | |
| #include <assert.h>
 | |
| #include <iconv.h>
 | |
| #include <locale.h>
 | |
| #include <stdio.h>
 | |
| #include <stdlib.h>
 | |
| #include <string.h>
 | |
| #include <unistd.h>
 | |
| #include <wchar.h>
 | |
| 
 | |
| /* Approximate size of the file (must be larger).  */
 | |
| #define SIZE 210000
 | |
| 
 | |
| 
 | |
| static int
 | |
| do_test (void)
 | |
| {
 | |
|   char name[] = "/tmp/widetext.out.XXXXXX";
 | |
|   char mbbuf[SIZE];
 | |
|   char mb2buf[SIZE];
 | |
|   wchar_t wcbuf[SIZE];
 | |
|   wchar_t wc2buf[SIZE];
 | |
|   size_t mbsize;
 | |
|   size_t wcsize;
 | |
|   int fd;
 | |
|   FILE *fp;
 | |
|   size_t n;
 | |
|   int res;
 | |
|   int status = 0;
 | |
|   wchar_t *wcp;
 | |
| 
 | |
|   setlocale (LC_ALL, "de_DE.UTF-8");
 | |
|   printf ("locale used: %s\n\n", setlocale (LC_ALL, NULL));
 | |
| 
 | |
|   /* Read the file into memory.  */
 | |
|   mbsize = fread (mbbuf, 1, SIZE, stdin);
 | |
|   if (mbsize == 0)
 | |
|     {
 | |
|       printf ("%u: cannot read input file from standard input: %m\n",
 | |
| 	      __LINE__);
 | |
|       exit (1);
 | |
|     }
 | |
| 
 | |
|    printf ("INFO: input file has %zd bytes\n", mbsize);
 | |
| 
 | |
|   /* First convert the text to wide characters.  We use iconv here.  */
 | |
|   {
 | |
|     iconv_t cd;
 | |
|     char *inbuf = mbbuf;
 | |
|     size_t inleft = mbsize;
 | |
|     char *outbuf = (char *) wcbuf;
 | |
|     size_t outleft = sizeof (wcbuf);
 | |
|     size_t nonr;
 | |
| 
 | |
|     cd = iconv_open ("WCHAR_T", "UTF-8");
 | |
|     if (cd == (iconv_t) -1)
 | |
|       {
 | |
| 	printf ("%u: cannot get iconv descriptor for conversion to UCS4\n",
 | |
| 		__LINE__);
 | |
| 	exit (1);
 | |
|       }
 | |
| 
 | |
|     /* We must need only one call and there must be no losses.  */
 | |
|     nonr = iconv (cd, &inbuf, &inleft, &outbuf, &outleft);
 | |
|     if (nonr != 0 && nonr != (size_t) -1)
 | |
|       {
 | |
| 	printf ("%u: iconv performed %zd nonreversible conversions\n",
 | |
| 		__LINE__, nonr);
 | |
| 	exit (1);
 | |
|       }
 | |
| 
 | |
|     if  (nonr == (size_t) -1)
 | |
|       {
 | |
| 	printf ("\
 | |
| %u: iconv returned with %zd and errno = %m (inleft: %zd, outleft: %zd)\n",
 | |
| 		__LINE__, nonr, inleft, outleft);
 | |
| 	exit (1);
 | |
|       }
 | |
| 
 | |
|     if (inleft != 0)
 | |
|       {
 | |
| 	printf ("%u: iconv didn't convert all input\n", __LINE__);
 | |
| 	exit (1);
 | |
|       }
 | |
| 
 | |
|     iconv_close (cd);
 | |
| 
 | |
|     if ((sizeof (wcbuf) - outleft) % sizeof (wchar_t) != 0)
 | |
|       {
 | |
| 	printf ("%u: iconv converted not complete wchar_t\n", __LINE__);
 | |
| 	exit (1);
 | |
|       }
 | |
| 
 | |
|     wcsize = (sizeof (wcbuf) - outleft) / sizeof (wchar_t);
 | |
|     assert (wcsize + 1 <= SIZE);
 | |
|   }
 | |
| 
 | |
|   /* Now that we finished the preparations, run the first test.  We
 | |
|      are writing the wide char data out and read it back in.  We write
 | |
|      and read single characters.  */
 | |
| 
 | |
|   fd = mkstemp (name);
 | |
|   if (fd == -1)
 | |
|     {
 | |
|       printf ("%u: cannot open temporary file: %m\n", __LINE__);
 | |
|       exit (1);
 | |
|     }
 | |
| 
 | |
|   unlink (name);
 | |
| 
 | |
|   fp = fdopen (dup (fd), "w");
 | |
|   if (fp == NULL)
 | |
|     {
 | |
|       printf ("%u: fdopen of temp file for writing failed: %m\n", __LINE__);
 | |
|       exit (1);
 | |
|     }
 | |
| 
 | |
|   for (n = 0; n < wcsize; ++n)
 | |
|     {
 | |
|       if (fputwc (wcbuf[n], fp) == WEOF)
 | |
| 	{
 | |
| 	  printf ("%u: fputwc failed: %m\n", __LINE__);
 | |
| 	  exit (1);
 | |
| 	}
 | |
|     }
 | |
| 
 | |
|   res = fclose (fp);
 | |
|   if (res != 0)
 | |
|     {
 | |
|       printf ("%u: fclose after single-character writing failed (%d): %m\n",
 | |
| 	      __LINE__, res);
 | |
|       exit (1);
 | |
|     }
 | |
| 
 | |
|   lseek (fd, SEEK_SET, 0);
 | |
|   fp = fdopen (dup (fd), "r");
 | |
|   if (fp == NULL)
 | |
|     {
 | |
|       printf ("%u: fdopen of temp file for reading failed: %m\n", __LINE__);
 | |
|       exit (1);
 | |
|     }
 | |
| 
 | |
|   for (n = 0; n < wcsize; ++n)
 | |
|     {
 | |
|       wint_t wch = fgetwc (fp);
 | |
|       if (wch == WEOF)
 | |
| 	{
 | |
| 	  printf ("%u: fgetwc failed (idx %zd): %m\n", __LINE__, n);
 | |
| 	  exit (1);
 | |
| 	}
 | |
|       wc2buf[n] = wch;
 | |
|     }
 | |
| 
 | |
|   /* There should be nothing else.  */
 | |
|   if (fgetwc (fp) != WEOF)
 | |
|     {
 | |
|       printf ("%u: too many characters available with fgetwc\n", __LINE__);
 | |
|       status = 1;
 | |
|     }
 | |
|   else if (wmemcmp (wcbuf, wc2buf, wcsize) != 0)
 | |
|     {
 | |
|       printf ("%u: buffer read with fgetwc differs\n", __LINE__);
 | |
|       status = 1;
 | |
|     }
 | |
| 
 | |
|   res = fclose (fp);
 | |
|   if (res != 0)
 | |
|     {
 | |
|       printf ("%u: fclose after single-character reading failed (%d): %m\n",
 | |
| 	      __LINE__, res);
 | |
|       exit (1);
 | |
|     }
 | |
| 
 | |
|   /* Just make sure there are no two errors which hide each other, read the
 | |
|      file using the `char' functions.  */
 | |
| 
 | |
|   lseek (fd, SEEK_SET, 0);
 | |
|   fp = fdopen (fd, "r");
 | |
|   if (fp == NULL)
 | |
|     {
 | |
|       printf ("%u: fdopen of temp file for reading failed: %m\n", __LINE__);
 | |
|       exit (1);
 | |
|     }
 | |
| 
 | |
|   if (fread (mb2buf, 1, mbsize, fp) != mbsize)
 | |
|     {
 | |
|       printf ("%u: cannot read all of the temp file\n", __LINE__);
 | |
|       status = 1;
 | |
|     }
 | |
|   else
 | |
|     {
 | |
|       /* Make sure there is nothing left.  */
 | |
|       if (fgetc (fp) != EOF)
 | |
| 	{
 | |
| 	  printf ("%u: more input available\n", __LINE__);
 | |
| 	  status = 1;
 | |
| 	}
 | |
| 
 | |
|       if (memcmp (mb2buf, mbbuf, mbsize) != 0)
 | |
| 	{
 | |
| 	  printf ("%u: buffer written with fputwc differs\n", __LINE__);
 | |
| 	  status = 1;
 | |
| 	}
 | |
|     }
 | |
| 
 | |
|   res = fclose (fp);
 | |
|   if (res != 0)
 | |
|     {
 | |
|       printf ("%u: fclose after single-character reading failed (%d): %m\n",
 | |
| 	      __LINE__, res);
 | |
|       exit (1);
 | |
|     }
 | |
| 
 | |
|   /* Now to reading and writing line-wise.  */
 | |
| 
 | |
|   fd = mkstemp (strcpy (name, "/tmp/widetext.out.XXXXXX"));
 | |
|   if (fd == -1)
 | |
|     {
 | |
|       printf ("%u: cannot open temporary file: %m\n", __LINE__);
 | |
|       exit (1);
 | |
|     }
 | |
| 
 | |
|   unlink (name);
 | |
| 
 | |
|   fp = fdopen (dup (fd), "w");
 | |
|   if (fp == NULL)
 | |
|     {
 | |
|       printf ("%u: fdopen of temp file for writing failed: %m\n", __LINE__);
 | |
|       exit (1);
 | |
|     }
 | |
| 
 | |
|   for (wcp = wcbuf; wcp < &wcbuf[wcsize]; )
 | |
|     {
 | |
|       wchar_t *wendp = wcschr (wcp, L'\n');
 | |
| 
 | |
|       if (wendp != NULL)
 | |
| 	{
 | |
| 	  /* Temporarily NUL terminate the line.  */
 | |
| 	  wchar_t save = wendp[1];
 | |
| 	  wendp[1] = L'\0';
 | |
| 
 | |
| 	  fputws (wcp, fp);
 | |
| 
 | |
| 	  wendp[1] = save;
 | |
| 	  wcp = &wendp[1];
 | |
| 	}
 | |
|       else
 | |
| 	{
 | |
| 	  fputws (wcp, fp);
 | |
| 	  wcp = wcschr (wcp, L'\0');
 | |
| 	  assert (wcp == &wcbuf[wcsize]);
 | |
| 	}
 | |
|     }
 | |
| 
 | |
|   res = fclose (fp);
 | |
|   if (res != 0)
 | |
|     {
 | |
|       printf ("%u: fclose after line-wise writing failed (%d): %m\n",
 | |
| 	      __LINE__, res);
 | |
|       exit (1);
 | |
|     }
 | |
| 
 | |
|   lseek (fd, SEEK_SET, 0);
 | |
|   fp = fdopen (dup (fd), "r");
 | |
|   if (fp == NULL)
 | |
|     {
 | |
|       printf ("%u: fdopen of temp file for reading failed: %m\n", __LINE__);
 | |
|       exit (1);
 | |
|     }
 | |
| 
 | |
|   for (wcp = wc2buf; wcp < &wc2buf[wcsize]; )
 | |
|     {
 | |
|       if (fgetws (wcp, &wc2buf[wcsize] - wcp + 1, fp) == NULL)
 | |
| 	{
 | |
| 	  printf ("%u: short read using fgetws (only %td of %zd)\n",
 | |
| 		  __LINE__, wcp - wc2buf, wcsize);
 | |
| 	  status = 1;
 | |
| 	  break;
 | |
| 	}
 | |
|       wcp = wcschr (wcp, L'\0');
 | |
|     }
 | |
| 
 | |
|   if (wcp > &wc2buf[wcsize])
 | |
|     {
 | |
|       printf ("%u: fgetws read too much\n", __LINE__);
 | |
|       status = 1;
 | |
|     }
 | |
|   else if (fgetwc (fp) != WEOF)
 | |
|     {
 | |
|       /* There should be nothing else.  */
 | |
|       printf ("%u: too many characters available with fgetws\n", __LINE__);
 | |
|       status = 1;
 | |
|     }
 | |
| 
 | |
|   if (wcp >= &wc2buf[wcsize] && wmemcmp (wcbuf, wc2buf, wcsize) != 0)
 | |
|     {
 | |
|       printf ("%u: buffer read with fgetws differs\n", __LINE__);
 | |
|       status = 1;
 | |
|     }
 | |
| 
 | |
|   res = fclose (fp);
 | |
|   if (res != 0)
 | |
|     {
 | |
|       printf ("%u: fclose after single-character reading failed (%d): %m\n",
 | |
| 	      __LINE__, res);
 | |
|       exit (1);
 | |
|     }
 | |
| 
 | |
|   /* Just make sure there are no two errors which hide each other, read the
 | |
|      file using the `char' functions.  */
 | |
| 
 | |
|   lseek (fd, SEEK_SET, 0);
 | |
|   fp = fdopen (fd, "r");
 | |
|   if (fp == NULL)
 | |
|     {
 | |
|       printf ("%u: fdopen of temp file for reading failed: %m\n", __LINE__);
 | |
|       exit (1);
 | |
|     }
 | |
| 
 | |
|   if (fread (mb2buf, 1, mbsize, fp) != mbsize)
 | |
|     {
 | |
|       printf ("%u: cannot read all of the temp file\n", __LINE__);
 | |
|       status = 1;
 | |
|     }
 | |
|   else
 | |
|     {
 | |
|       /* Make sure there is nothing left.  */
 | |
|       if (fgetc (fp) != EOF)
 | |
| 	{
 | |
| 	  printf ("%u: more input available\n", __LINE__);
 | |
| 	  status = 1;
 | |
| 	}
 | |
| 
 | |
|       if (memcmp (mb2buf, mbbuf, mbsize) != 0)
 | |
| 	{
 | |
| 	  printf ("%u: buffer written with fputws differs\n", __LINE__);
 | |
| 	  status = 1;
 | |
| 	}
 | |
|     }
 | |
| 
 | |
|   res = fclose (fp);
 | |
|   if (res != 0)
 | |
|     {
 | |
|       printf ("%u: fclose after single-character reading failed (%d): %m\n",
 | |
| 	      __LINE__, res);
 | |
|       exit (1);
 | |
|     }
 | |
| 
 | |
|   return status;
 | |
| }
 | |
| 
 | |
| #define TEST_FUNCTION do_test ()
 | |
| #include "../test-skeleton.c"
 |