/* glibc/wcsmbs/tst-mbrtowc.c -- tests for mbrtowc().  */


/* Copyright (C) 2000, 2001, 2002, 2003 Free Software Foundation, Inc.
This file is part of the GNU C Library.
Contributed by Ulrich Drepper <drepper@redhat.com>, 2000.
The GNU C Library is free software; you can redistribute it and/or
modify it under the terms of the GNU Lesser General Public
License as published by the Free Software Foundation; either
version 2.1 of the License, or (at your option) any later version.
The GNU C Library is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
Lesser General Public License for more details.
You should have received a copy of the GNU Lesser General Public
License along with the GNU C Library; if not, see
<http://www.gnu.org/licenses/>. */
/* We always want assert to be fully defined. */
#undef NDEBUG
#include <assert.h>
#include <locale.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <wchar.h>
static int check_ascii (const char *locname);
/* Exercise mbrtowc() on three-byte UTF-8 sequences that are handed over
   in pieces as well as in one go.  The byte-at-a-time part was
   contributed by Markus Kuhn <mkuhn@acm.org>.  This function does not
   select a locale itself.  It always returns 0; a failed check aborts
   through assert().  */
static int
utf8_test_1 (void)
{
  const size_t incomplete = (size_t) -2;
  wchar_t decoded;
  mbstate_t state;
  size_t rc;

  /* U+2260 (NOT EQUAL TO) is encoded as E2 89 A0; feed one byte per call.  */
  decoded = 42;                       /* Sentinel, arbitrary value.  */
  memset (&state, 0, sizeof state);   /* Initial conversion state.  */

  rc = mbrtowc (&decoded, "\xE2", 1, &state);
  assert (rc == incomplete);          /* First byte consumed.  */
  rc = mbrtowc (&decoded, "\x89", 1, &state);
  assert (rc == incomplete);          /* Second byte consumed.  */
  assert (decoded == 42);             /* Nothing has been stored yet.  */

  rc = mbrtowc (&decoded, "\xA0", 1, &state);
  assert (rc == 1);                   /* Third byte completes the character.  */
  assert (decoded == 0x2260);         /* E2 89 A0 decoded as U+2260.  */

  /* A terminating NUL byte must return 0 and store L'\0'.  */
  rc = mbrtowc (&decoded, "", 1, &state);
  assert (rc == 0);
  assert (decoded == 0);

  /* The following checks are by Al Viro <aviro@redhat.com>: E0 A0 80 is
     U+0800, first split into 1 + 2 bytes and then passed as a whole.  */
  const char u0800[] = "\xe0\xa0\x80";

  decoded = 42;
  memset (&state, 0, sizeof state);
  rc = mbrtowc (&decoded, u0800, 1, &state);
  assert (rc == incomplete);
  rc = mbrtowc (&decoded, u0800 + 1, 2, &state);
  assert (rc == 2);
  assert (decoded == 0x800);

  decoded = 42;
  memset (&state, 0, sizeof state);
  rc = mbrtowc (&decoded, u0800, 3, &state);
  assert (rc == 3);
  assert (decoded == 0x800);

  return 0;
}
/* Test NUL byte processing via the empty string.  The UTF-8 sequence
   E2 89 A0 is fed to mbrtowc() one byte at a time, stopping after 0, 1,
   2 or all 3 bytes, and then a NUL byte is supplied as "" with length 1.
   With no bytes or a complete character before it the NUL is a valid
   terminator (result 0, state initial again); after a partial character
   it must be rejected with (size_t) -1.  Always returns 0; a failed
   check aborts through assert().  */
static int
utf8_test_2 (void)
{
  static const char seq[] = "\xE2\x89\xA0";
  const size_t seq_len = sizeof seq - 1;
  size_t fed;

  for (fed = 0; fed <= seq_len; ++fed)
    {
      wchar_t wc = 42;              /* Arbitrary number.  */
      mbstate_t s;
      size_t pos;
      size_t rc;

      memset (&s, 0, sizeof s);     /* Get s into the initial state.  */

      /* Feed the first FED bytes of the sequence, one per call.  */
      for (pos = 0; pos < fed; ++pos)
        {
          rc = mbrtowc (&wc, &seq[pos], 1, &s);
          if (pos + 1 < seq_len)
            {
              assert (rc == (size_t) -2);   /* Still incomplete.  */
            }
          else
            {
              assert (rc == 1);             /* Last byte completes it.  */
            }
        }

      /* Now the terminator.  */
      rc = mbrtowc (NULL, "", 1, &s);
      if (fed == 0 || fed == seq_len)
        {
          assert (rc == 0);                 /* Valid terminator.  */
          assert (mbsinit (&s));
        }
      else
        {
          assert (rc == (size_t) -1);       /* Invalid terminator.  */
        }
    }

  return 0;
}
/* Test NUL byte processing via a NULL string.  The UTF-8 sequence
   E2 89 A0 is fed to mbrtowc() one byte at a time, stopping after 0, 1,
   2 or all 3 bytes, and then mbrtowc() is called with a NULL string
   pointer.  With no bytes or a complete character before it the call
   must return 0 and leave the state initial; after a partial character
   it must return (size_t) -1.  Always returns 0; a failed check aborts
   through assert().  */
static int
utf8_test_3 (void)
{
  static const char seq[] = "\xE2\x89\xA0";
  const size_t seq_len = sizeof seq - 1;
  size_t fed;

  for (fed = 0; fed <= seq_len; ++fed)
    {
      wchar_t wc = 42;              /* Arbitrary number.  */
      mbstate_t s;
      size_t pos;
      size_t rc;

      memset (&s, 0, sizeof s);     /* Get s into the initial state.  */

      /* Feed the first FED bytes of the sequence, one per call.  */
      for (pos = 0; pos < fed; ++pos)
        {
          rc = mbrtowc (&wc, &seq[pos], 1, &s);
          if (pos + 1 < seq_len)
            {
              assert (rc == (size_t) -2);   /* Still incomplete.  */
            }
          else
            {
              assert (rc == 1);             /* Last byte completes it.  */
            }
        }

      /* Now the terminator, expressed as a NULL string.  */
      rc = mbrtowc (NULL, NULL, 0, &s);
      if (fed == 0 || fed == seq_len)
        {
          assert (rc == 0);                 /* Valid terminator.  */
          assert (mbsinit (&s));
        }
      else
        {
          assert (rc == (size_t) -1);       /* Invalid terminator.  */
        }
    }

  return 0;
}
/* Select the de_DE.UTF-8 locale for LC_CTYPE and run the three UTF-8
   mbrtowc() tests.  If the locale cannot be selected a message is
   written to stderr and the process exits with status 1.  Returns the
   OR of the results of the individual tests.  */
static int
utf8_test (void)
{
  static const char utf8_locale[] = "de_DE.UTF-8";
  int status;

  if (setlocale (LC_CTYPE, utf8_locale) == NULL)
    {
      fprintf (stderr, "locale '%s' not available!\n", utf8_locale);
      exit (1);
    }

  status = utf8_test_1 ();
  status |= utf8_test_2 ();
  status |= utf8_test_3 ();

  return status;
}
/* Check the mapping of the ASCII range for some character sets which
   have ASCII as a subset (C, de_DE.UTF-8, ja_JP.EUC-JP); for those the
   generated wide character must have the same value as the byte.  The
   UTF-8 specific tests run right after the ASCII check of the UTF-8
   locale.  The exit status is the OR of the results of all checks.  */
int
main (void)
{
  static const struct
  {
    const char *name;         /* Locale name passed to setlocale.  */
    int run_utf8_tests;       /* Nonzero: also call utf8_test.  */
  } locales[] =
    {
      { "C", 0 },
      { "de_DE.UTF-8", 1 },
      { "ja_JP.EUC-JP", 0 }
    };
  int status = 0;
  size_t idx;

  for (idx = 0; idx < sizeof locales / sizeof locales[0]; ++idx)
    {
      /* The result of this call is not inspected; check_ascii is given
         whatever locale name the following query reports.  */
      setlocale (LC_ALL, locales[idx].name);
      status |= check_ascii (setlocale (LC_ALL, NULL));

      if (locales[idx].run_utf8_tests)
        status |= utf8_test ();
    }

  return status;
}
/* Convert every ASCII value (0 through 127) with mbrtowc() in the
   currently selected locale, each time starting from the initial
   conversion state, and verify that the result is a wide character of
   the same value: return value 1 (0 for the NUL byte) and wc == c.

   LOCNAME is only used to label the output; this function does not
   change the locale itself.  One diagnostic line is printed per failing
   character, followed by the total error count.

   Returns 0 if every character converted as expected, 1 otherwise.  */
static int
check_ascii (const char *locname)
{
  int c;
  int res = 0;

  printf ("Testing locale \"%s\":\n", locname);

  for (c = 0; c <= 127; ++c)
    {
      char buf[MB_CUR_MAX];
      /* Preset to a value outside the ASCII range so that a conversion
         which stores nothing is caught by the final comparison.  */
      wchar_t wc = 0xffffffff;
      mbstate_t s;
      size_t n, i;

      /* The character under test goes first; the remaining bytes are
         filler so that all MB_CUR_MAX bytes offered to mbrtowc() have
         defined contents.  */
      for (i = 0; i < MB_CUR_MAX; ++i)
        buf[i] = (char) (c + i);

      memset (&s, '\0', sizeof (s));    /* Initial conversion state.  */

      n = mbrtowc (&wc, buf, MB_CUR_MAX, &s);
      if (n == (size_t) -1)
        {
          printf ("%s: '\\x%x': encoding error\n", locname, c);
          ++res;
        }
      else if (n == (size_t) -2)
        {
          printf ("%s: '\\x%x': incomplete character\n", locname, c);
          ++res;
        }
      else if (n == 0 && c != 0)
        {
          printf ("%s: '\\x%x': 0 returned\n", locname, c);
          ++res;
        }
      else if (n != 0 && c == 0)
        {
          printf ("%s: '\\x%x': not 0 returned\n", locname, c);
          ++res;
        }
      else if (c != 0 && n != 1)
        {
          printf ("%s: '\\x%x': not 1 returned\n", locname, c);
          ++res;
        }
      else if (wc != (wchar_t) c)
        {
          printf ("%s: '\\x%x': wc != L'\\x%x'\n", locname, c, c);
          ++res;
        }
    }

  printf (res == 1 ? "%d error\n" : "%d errors\n", res);

  return res != 0;
}