mirror of
https://git.savannah.gnu.org/git/gnulib.git
synced 2025-08-16 01:22:18 +03:00
* build-aux/gendocs.sh (version): * doc/gendocs_template: * doc/gendocs_template_min: * doc/gnulib.texi: * lib/version-etc.c (COPYRIGHT_YEAR): Update copyright dates by hand in templates and the like. * all files: Run 'make update-copyright'.
317 lines
8.9 KiB
C
317 lines
8.9 KiB
C
/* Test of character set conversion.
|
|
Copyright (C) 2007-2017 Free Software Foundation, Inc.
|
|
|
|
This program is free software: you can redistribute it and/or modify
|
|
it under the terms of the GNU General Public License as published by
|
|
the Free Software Foundation; either version 3 of the License, or
|
|
(at your option) any later version.
|
|
|
|
This program is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
GNU General Public License for more details.
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
along with this program. If not, see <http://www.gnu.org/licenses/>. */
|
|
|
|
/* Written by Bruno Haible <bruno@clisp.org>, 2007. */
|
|
|
|
#include <config.h>
|
|
|
|
#if HAVE_ICONV
|
|
# include <iconv.h>
|
|
#endif
|
|
|
|
#include <errno.h>
|
|
#include <string.h>
|
|
|
|
#include "macros.h"
|
|
|
|
/* If compiling on an EBCDIC system, keep the test strings in ASCII. */
|
|
#if defined __IBMC__ && 'A' != 0x41
|
|
# pragma convert("ISO8859-1")
|
|
# define CONVERT_ENABLED
|
|
#endif
|
|
|
|
/* Reference text: "Japanese (日本語) [\U0001D50D\U0001D51E\U0001D52D]",
   i.e. ASCII, three BMP characters (U+65E5 U+672C U+8A9E) and three
   characters outside the BMP (U+1D50D U+1D51E U+1D52D).
   The same text is spelled out below, byte by byte, in five encodings.
   Each literal is split into adjacent pieces (the compiler concatenates
   them) so that every non-ASCII code point is visible as its own group.
   The compiler appends one NUL byte to each array; users of these arrays
   take 'sizeof (array) - 1' as the length of the encoded text.  */

/* UTF-8: 35 bytes.  */
const char test_utf8_string[] =
  "Japanese ("
  "\346\227\245" "\346\234\254" "\350\252\236"
  ") ["
  "\360\235\224\215" "\360\235\224\236" "\360\235\224\255"
  "]";

/* UTF-16, big-endian, no byte order mark: 46 bytes.
   The last three characters are surrogate pairs.  */
const char test_utf16be_string[] =
  "\000J\000a\000p\000a\000n\000e\000s\000e\000 \000("
  "\145\345" "\147\054" "\212\236"
  "\000)\000 \000["
  "\330\065\335\015" "\330\065\335\036" "\330\065\335\055"
  "\000]";

/* UTF-16, little-endian, no byte order mark: 46 bytes.  */
const char test_utf16le_string[] =
  "J\000a\000p\000a\000n\000e\000s\000e\000 \000(\000"
  "\345\145" "\054\147" "\236\212"
  ")\000 \000[\000"
  "\065\330\015\335" "\065\330\036\335" "\065\330\055\335"
  "]\000";

/* UTF-32, big-endian, no byte order mark: 80 bytes.  */
const char test_utf32be_string[] =
  "\000\000\000J\000\000\000a\000\000\000p\000\000\000a"
  "\000\000\000n\000\000\000e\000\000\000s\000\000\000e"
  "\000\000\000 \000\000\000("
  "\000\000\145\345" "\000\000\147\054" "\000\000\212\236"
  "\000\000\000)\000\000\000 \000\000\000["
  "\000\001\325\015" "\000\001\325\036" "\000\001\325\055"
  "\000\000\000]";

/* UTF-32, little-endian, no byte order mark: 80 bytes.  */
const char test_utf32le_string[] =
  "J\000\000\000a\000\000\000p\000\000\000a\000\000\000"
  "n\000\000\000e\000\000\000s\000\000\000e\000\000\000"
  " \000\000\000(\000\000\000"
  "\345\145\000\000" "\054\147\000\000" "\236\212\000\000"
  ")\000\000\000 \000\000\000[\000\000\000"
  "\015\325\001\000" "\036\325\001\000" "\055\325\001\000"
  "]\000\000\000";
|
|
|
|
#ifdef CONVERT_ENABLED
|
|
# pragma convert(pop)
|
|
#endif
|
|
|
|
#if HAVE_ICONV
/* Convert the char array INPUT from encoding FROMCODE to encoding TOCODE
   with a single iconv() call, and verify that
     - the conversion descriptor could be opened,
     - iconv() returned 0 and consumed all of INPUT,
     - exactly as many bytes were produced as EXPECTED contains,
     - the produced bytes are equal to EXPECTED,
     - the conversion descriptor could be closed.

   TOCODE and FROMCODE are encoding names as accepted by iconv_open().
   INPUT and EXPECTED must be char arrays, not pointers: their lengths are
   taken with sizeof, minus 1 for the NUL byte that the compiler appends
   to a string literal.  Both are named more than once in the expansion,
   so they must be free of side effects.

   The output buffer holds 100 bytes; the longest test string in this file
   (UTF-32) needs 80.

   This is a macro rather than a function for two reasons: sizeof must see
   the arrays themselves, and whatever location ASSERT derives from
   __LINE__ then designates the invocation, i.e. the specific conversion
   that failed.

   ICONV_CONST is expected to be provided by <config.h>; the cast adapts
   the call to iconv() declarations whose second parameter is either
   'char **' or 'const char **'.  */
# define TEST_CONVERSION(tocode, fromcode, input, expected) \
  do                                                                     \
    {                                                                    \
      iconv_t cd;                                                        \
      char buf[100];                                                     \
      const char *inptr = (input);                                       \
      size_t inbytesleft = sizeof (input) - 1;                           \
      char *outptr = buf;                                                \
      size_t outbytesleft = sizeof (buf);                                \
      size_t res;                                                        \
                                                                         \
      cd = iconv_open ((tocode), (fromcode));                            \
      ASSERT (cd != (iconv_t)(-1));                                      \
                                                                         \
      res = iconv (cd,                                                   \
                   (ICONV_CONST char **) &inptr, &inbytesleft,           \
                   &outptr, &outbytesleft);                              \
      ASSERT (res == 0 && inbytesleft == 0);                             \
      ASSERT (outptr == buf + (sizeof (expected) - 1));                  \
      ASSERT (memcmp (buf, (expected), sizeof (expected) - 1) == 0);     \
                                                                         \
      ASSERT (iconv_close (cd) == 0);                                    \
    }                                                                    \
  while (0)
#endif

/* Test driver: checks that iconv() converts the reference text between
   UTF-8 and each of UTF-16BE, UTF-16LE, UTF-32BE, UTF-32LE, in both
   directions.  Any failed check goes through ASSERT.  Returns 0 when all
   checks pass, and also when HAVE_ICONV is not set, in which case nothing
   is tested.  */
int
main (void)
{
#if HAVE_ICONV
  /* Assume that iconv() supports at least the encoding UTF-8.  */

  /* Test conversion from UTF-8 to UTF-16BE with no errors.  */
  TEST_CONVERSION ("UTF-16BE", "UTF-8",
                   test_utf8_string, test_utf16be_string);

  /* Test conversion from UTF-8 to UTF-16LE with no errors.  */
  TEST_CONVERSION ("UTF-16LE", "UTF-8",
                   test_utf8_string, test_utf16le_string);

  /* Test conversion from UTF-8 to UTF-32BE with no errors.  */
  TEST_CONVERSION ("UTF-32BE", "UTF-8",
                   test_utf8_string, test_utf32be_string);

  /* Test conversion from UTF-8 to UTF-32LE with no errors.  */
  TEST_CONVERSION ("UTF-32LE", "UTF-8",
                   test_utf8_string, test_utf32le_string);

  /* Test conversion from UTF-16BE to UTF-8 with no errors.  */
  TEST_CONVERSION ("UTF-8", "UTF-16BE",
                   test_utf16be_string, test_utf8_string);

  /* Test conversion from UTF-16LE to UTF-8 with no errors.  */
  TEST_CONVERSION ("UTF-8", "UTF-16LE",
                   test_utf16le_string, test_utf8_string);

  /* Test conversion from UTF-32BE to UTF-8 with no errors.  */
  TEST_CONVERSION ("UTF-8", "UTF-32BE",
                   test_utf32be_string, test_utf8_string);

  /* Test conversion from UTF-32LE to UTF-8 with no errors.  */
  TEST_CONVERSION ("UTF-8", "UTF-32LE",
                   test_utf32le_string, test_utf8_string);
#endif

  return 0;
}
|