Add regression tests for mblen(), mbtowc(), wctomb(), mbstowcs() and
wcstombs(). These tests have already found two libc bugs.
This commit is contained in:
tjr 2002-11-09 04:33:02 +00:00
parent cbcd393990
commit 5349a8bc12
6 changed files with 580 additions and 1 deletions

View File

@ -5,7 +5,12 @@ TESTS= test-mbrtowc \
test-mbsrtowcs \
test-wcsrtombs \
test-btowc \
test-mbrlen
test-mbrlen \
test-mbtowc \
test-wctomb \
test-mbstowcs \
test-wcstombs \
test-mblen
.PHONY: tests
tests: ${TESTS}

View File

@ -0,0 +1,109 @@
/*-
* Copyright (c) 2002 Tim J. Robbins
* All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
*
* THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
* ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
* OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
* SUCH DAMAGE.
*/
/*
* Test program for mblen(), as specified by IEEE Std. 1003.1-2001 and
* ISO/IEC 9899:1990.
*
* The function is tested with both the "C" ("POSIX") LC_CTYPE setting and
* "ja_JP.eucJP". Other encodings are not tested.
*/
#include <sys/cdefs.h>
__FBSDID("$FreeBSD$");
#include <assert.h>
#include <limits.h>
#include <locale.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
/*
 * Regression test driver for mblen().
 *
 * Every check is an assert(); a failed check aborts the program.  When all
 * checks hold, "PASS mblen()" is printed and 0 is returned.  The command
 * line arguments are not used.
 */
int
main(int argc, char *argv[])
{
	const char *locale;
	char buf[MB_LEN_MAX + 1];

	(void)argc;
	(void)argv;

	/*
	 * C/POSIX locale.
	 */

	assert(MB_CUR_MAX == 1);

	/* No shift states in C locale. */
	assert(mblen(NULL, 0) == 0);

	/* Null wide character. */
	memset(buf, 0xcc, sizeof(buf));
	buf[0] = '\0';
	assert(mblen(buf, 1) == 0);

	/* Latin letter A. */
	buf[0] = 'A';
	assert(mblen(buf, 1) == 1);

	/* Incomplete character sequence (zero bytes available). */
	buf[0] = '\0';
	assert(mblen(buf, 0) == -1);

	/*
	 * Japanese (EUC) locale.
	 */

	/*
	 * setlocale() returns NULL when the locale cannot be selected, so
	 * check the pointer before handing it to strcmp().
	 */
	locale = setlocale(LC_CTYPE, "ja_JP.eucJP");
	assert(locale != NULL && strcmp(locale, "ja_JP.eucJP") == 0);
	assert(MB_CUR_MAX > 1);

	/* No shift states in EUC. */
	assert(mblen(NULL, 0) == 0);

	/* Null wide character. */
	memset(buf, 0xcc, sizeof(buf));
	buf[0] = '\0';
	assert(mblen(buf, 1) == 0);

	/* Latin letter A. */
	buf[0] = 'A';
	assert(mblen(buf, 1) == 1);

	/* Incomplete character sequence (zero bytes available). */
	buf[0] = '\0';
	assert(mblen(buf, 0) == -1);

	/* Incomplete character sequence (truncated double-byte). */
	memset(buf, 0xcc, sizeof(buf));
	buf[0] = (char)0xa3;
	buf[1] = 0x00;
	assert(mblen(buf, 1) == -1);

	/* Same as above, but complete. */
	buf[1] = (char)0xc1;
	assert(mblen(buf, 2) == 2);

	printf("PASS mblen()\n");

	return (0);
}

View File

@ -0,0 +1,110 @@
/*-
* Copyright (c) 2002 Tim J. Robbins
* All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
*
* THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
* ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
* OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
* SUCH DAMAGE.
*/
/*
* Test program for mbstowcs(), as specified by IEEE Std. 1003.1-2001 and
* ISO/IEC 9899:1999.
*
* The function is tested with both the "C" ("POSIX") LC_CTYPE setting and
* "ja_JP.eucJP". Other encodings are not tested.
*/
#include <sys/cdefs.h>
__FBSDID("$FreeBSD$");
#include <assert.h>
#include <errno.h>
#include <limits.h>
#include <locale.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <wchar.h>
/*
 * Regression test driver for mbstowcs().
 *
 * Every check is an assert(); a failed check aborts the program.  When all
 * checks hold, "PASS mbstowcs()" is printed and 0 is returned.  The command
 * line arguments are not used.
 *
 * Buffers are pre-filled with a 0xcc / 0xcccc pattern so that elements the
 * function must not touch can be verified afterwards.
 */
int
main(int argc, char *argv[])
{
	const char *locale;
	char srcbuf[128];
	wchar_t dstbuf[128];

	(void)argc;
	(void)argv;

	/*
	 * C/POSIX locale.
	 */

	/* Simple null terminated string. */
	memset(srcbuf, 0xcc, sizeof(srcbuf));
	strcpy(srcbuf, "hello");
	wmemset(dstbuf, 0xcccc, sizeof(dstbuf) / sizeof(*dstbuf));
	assert(mbstowcs(dstbuf, srcbuf, sizeof(dstbuf) / sizeof(*dstbuf)) == 5);
	assert(wcscmp(dstbuf, L"hello") == 0);
	/* Five characters plus the terminator occupy [0..5]. */
	assert(dstbuf[6] == 0xcccc);

	/* Not enough space in destination buffer. */
	memset(srcbuf, 0xcc, sizeof(srcbuf));
	strcpy(srcbuf, "hello");
	wmemset(dstbuf, 0xcccc, sizeof(dstbuf) / sizeof(*dstbuf));
	assert(mbstowcs(dstbuf, srcbuf, 4) == 4);
	assert(wmemcmp(dstbuf, L"hell", 4) == 0);
	/*
	 * With a limit of 4 only dstbuf[0..3] may be modified, so the
	 * first element past the limit must still hold the fill pattern.
	 */
	assert(dstbuf[4] == 0xcccc);

	/* Null terminated string, internal dest. buffer (XSI extension) */
	memset(srcbuf, 0xcc, sizeof(srcbuf));
	strcpy(srcbuf, "hello");
	assert(mbstowcs(NULL, srcbuf, 0) == 5);

	/* Empty source buffer. */
	memset(srcbuf, 0xcc, sizeof(srcbuf));
	srcbuf[0] = '\0';
	wmemset(dstbuf, 0xcccc, sizeof(dstbuf) / sizeof(*dstbuf));
	assert(mbstowcs(dstbuf, srcbuf, 1) == 0);
	assert(dstbuf[0] == 0);
	assert(dstbuf[1] == 0xcccc);

	/* Zero length destination buffer. */
	memset(srcbuf, 0xcc, sizeof(srcbuf));
	strcpy(srcbuf, "hello");
	wmemset(dstbuf, 0xcccc, sizeof(dstbuf) / sizeof(*dstbuf));
	assert(mbstowcs(dstbuf, srcbuf, 0) == 0);
	assert(dstbuf[0] == 0xcccc);

	/*
	 * Japanese (EUC) locale.
	 */

	/*
	 * setlocale() returns NULL when the locale cannot be selected, so
	 * check the pointer before handing it to strcmp().
	 */
	locale = setlocale(LC_CTYPE, "ja_JP.eucJP");
	assert(locale != NULL && strcmp(locale, "ja_JP.eucJP") == 0);
	assert(MB_CUR_MAX > 1);

	/* Mixed double-byte and single-byte characters. */
	memset(srcbuf, 0xcc, sizeof(srcbuf));
	strcpy(srcbuf, "\xA3\xC1 B \xA3\xC3");
	wmemset(dstbuf, 0xcccc, sizeof(dstbuf) / sizeof(*dstbuf));
	assert(mbstowcs(dstbuf, srcbuf, sizeof(dstbuf) / sizeof(*dstbuf)) == 5);
	assert(dstbuf[0] == 0xA3C1 && dstbuf[1] == 0x20 && dstbuf[2] == 0x42 &&
	    dstbuf[3] == 0x20 && dstbuf[4] == 0xA3C3 && dstbuf[5] == 0);

	printf("PASS mbstowcs()\n");

	return (0);
}

View File

@ -0,0 +1,119 @@
/*-
* Copyright (c) 2002 Tim J. Robbins
* All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
*
* THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
* ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
* OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
* SUCH DAMAGE.
*/
/*
* Test program for mbtowc(), as specified by IEEE Std. 1003.1-2001 and
* ISO/IEC 9899:1990.
*
* The function is tested with both the "C" ("POSIX") LC_CTYPE setting and
* "ja_JP.eucJP". Other encodings are not tested.
*/
#include <sys/cdefs.h>
__FBSDID("$FreeBSD$");
#include <assert.h>
#include <limits.h>
#include <locale.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
/*
 * Regression test driver for mbtowc().
 *
 * Every check is an assert(); a failed check aborts the program.  When all
 * checks hold, "PASS mbtowc()" is printed and 0 is returned.  The command
 * line arguments are not used.
 *
 * Before each failing conversion wc is set to L'z' so the test can verify
 * that the output object was left alone.
 */
int
main(int argc, char *argv[])
{
	const char *locale;
	wchar_t wc;
	char buf[MB_LEN_MAX + 1];

	(void)argc;
	(void)argv;

	/*
	 * C/POSIX locale.
	 */

	assert(MB_CUR_MAX == 1);

	/* No shift states in C locale. */
	assert(mbtowc(NULL, NULL, 0) == 0);

	/* Null wide character. */
	wc = 0xcccc;
	memset(buf, 0, sizeof(buf));
	assert(mbtowc(&wc, buf, 1) == 0);
	assert(wc == 0);

	/* Latin letter A. */
	buf[0] = 'A';
	assert(mbtowc(&wc, buf, 1) == 1);
	assert(wc == L'A');

	/* Incomplete character sequence (zero length). */
	wc = L'z';
	buf[0] = '\0';
	assert(mbtowc(&wc, buf, 0) == -1);
	assert(wc == L'z');

	/*
	 * Japanese (EUC) locale.
	 */

	/*
	 * setlocale() returns NULL when the locale cannot be selected, so
	 * check the pointer before handing it to strcmp().
	 */
	locale = setlocale(LC_CTYPE, "ja_JP.eucJP");
	assert(locale != NULL && strcmp(locale, "ja_JP.eucJP") == 0);
	assert(MB_CUR_MAX > 1);

	/* Null wide character */
	memset(buf, 0xcc, sizeof(buf));
	buf[0] = 0;
	wc = 0xcccc;
	assert(mbtowc(&wc, buf, 1) == 0);
	assert(wc == 0);

	/* Latin letter A. */
	buf[0] = 'A';
	assert(mbtowc(&wc, buf, 1) == 1);
	assert(wc == L'A');

	/* Incomplete character sequence (zero length). */
	wc = L'z';
	buf[0] = '\0';
	assert(mbtowc(&wc, buf, 0) == -1);
	assert(wc == L'z');

	/* Incomplete character sequence (truncated double-byte). */
	memset(buf, 0xcc, sizeof(buf));
	buf[0] = (char)0xa3;
	buf[1] = 0x00;
	wc = L'z';
	assert(mbtowc(&wc, buf, 1) == -1);
	assert(wc == L'z');

	/* Same as above, but complete. */
	buf[1] = (char)0xc1;
	assert(mbtowc(&wc, buf, 2) == 2);
	assert(wc == 0xa3c1);

	printf("PASS mbtowc()\n");

	return (0);
}

View File

@ -0,0 +1,127 @@
/*-
* Copyright (c) 2002 Tim J. Robbins
* All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
*
* THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
* ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
* OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
* SUCH DAMAGE.
*/
/*
* Test program for wcstombs(), as specified by IEEE Std. 1003.1-2001 and
* ISO/IEC 9899:1999.
*
* The function is tested with both the "C" ("POSIX") LC_CTYPE setting and
* "ja_JP.eucJP". Other encodings are not tested.
*/
#include <sys/cdefs.h>
__FBSDID("$FreeBSD$");
#include <assert.h>
#include <errno.h>
#include <limits.h>
#include <locale.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <wchar.h>
/*
 * Regression test driver for wcstombs().
 *
 * Every check is an assert(); a failed check aborts the program.  When all
 * checks hold, "PASS wcstombs()" is printed and 0 is returned.  The command
 * line arguments are not used.
 *
 * Buffers are pre-filled with a 0xcc pattern so that bytes the function
 * must not touch can be verified afterwards.
 */
int
main(int argc, char *argv[])
{
	const char *locale;
	wchar_t srcbuf[128];
	char dstbuf[128];

	(void)argc;
	(void)argv;

	/*
	 * C/POSIX locale.
	 */

	/* Simple null terminated string. */
	wmemset(srcbuf, 0xcc, sizeof(srcbuf) / sizeof(*srcbuf));
	wcscpy(srcbuf, L"hello");
	memset(dstbuf, 0xcc, sizeof(dstbuf));
	assert(wcstombs(dstbuf, srcbuf, sizeof(dstbuf)) == 5);
	assert(strcmp(dstbuf, "hello") == 0);
	/* Five bytes plus the terminator occupy [0..5]. */
	assert((unsigned char)dstbuf[6] == 0xcc);

	/* Not enough space in destination buffer. */
	wmemset(srcbuf, 0xcc, sizeof(srcbuf) / sizeof(*srcbuf));
	wcscpy(srcbuf, L"hello");
	memset(dstbuf, 0xcc, sizeof(dstbuf));
	assert(wcstombs(dstbuf, srcbuf, 4) == 4);
	assert(memcmp(dstbuf, "hell", 4) == 0);
	/*
	 * With a limit of 4 only dstbuf[0..3] may be modified, so the
	 * first byte past the limit must still hold the fill pattern.
	 */
	assert((unsigned char)dstbuf[4] == 0xcc);

	/* Null terminated string, NULL destination (length query). */
	wmemset(srcbuf, 0xcc, sizeof(srcbuf) / sizeof(*srcbuf));
	wcscpy(srcbuf, L"hello");
	assert(wcstombs(NULL, srcbuf, sizeof(dstbuf)) == 5);

	/*
	 * Simple null terminated string, second pass.  wcstombs() is
	 * called with the same three arguments as in the first case.
	 */
	wmemset(srcbuf, 0xcc, sizeof(srcbuf) / sizeof(*srcbuf));
	wcscpy(srcbuf, L"hello");
	memset(dstbuf, 0xcc, sizeof(dstbuf));
	assert(wcstombs(dstbuf, srcbuf, sizeof(dstbuf)) == 5);
	assert(strcmp(dstbuf, "hello") == 0);
	assert((unsigned char)dstbuf[6] == 0xcc);

	/* Null terminated string, NULL destination, zero length limit. */
	wmemset(srcbuf, 0xcc, sizeof(srcbuf) / sizeof(*srcbuf));
	wcscpy(srcbuf, L"hello");
	assert(wcstombs(NULL, srcbuf, 0) == 5);

	/* Empty source buffer. */
	wmemset(srcbuf, 0xcc, sizeof(srcbuf) / sizeof(*srcbuf));
	srcbuf[0] = L'\0';
	memset(dstbuf, 0xcc, sizeof(dstbuf));
	assert(wcstombs(dstbuf, srcbuf, sizeof(dstbuf)) == 0);
	/* dstbuf holds narrow chars, so compare against a narrow NUL. */
	assert(dstbuf[0] == '\0');

	/* Zero length destination buffer. */
	wmemset(srcbuf, 0xcc, sizeof(srcbuf) / sizeof(*srcbuf));
	wcscpy(srcbuf, L"hello");
	memset(dstbuf, 0xcc, sizeof(dstbuf));
	assert(wcstombs(dstbuf, srcbuf, 0) == 0);
	assert((unsigned char)dstbuf[0] == 0xcc);

	/*
	 * Japanese (EUC) locale.
	 */

	/*
	 * setlocale() returns NULL when the locale cannot be selected, so
	 * check the pointer before handing it to strcmp().
	 */
	locale = setlocale(LC_CTYPE, "ja_JP.eucJP");
	assert(locale != NULL && strcmp(locale, "ja_JP.eucJP") == 0);
	assert(MB_CUR_MAX > 1);

	/* Mixed double-byte and single-byte characters. */
	wmemset(srcbuf, 0xcc, sizeof(srcbuf) / sizeof(*srcbuf));
	srcbuf[0] = 0xA3C1;
	srcbuf[1] = 0x0020;
	srcbuf[2] = 0x0042;
	srcbuf[3] = 0x0020;
	srcbuf[4] = 0xA3C3;
	srcbuf[5] = 0x0000;
	memset(dstbuf, 0xcc, sizeof(dstbuf));
	assert(wcstombs(dstbuf, srcbuf, sizeof(dstbuf)) == 7);
	assert(strcmp(dstbuf, "\xA3\xC1 B \xA3\xC3") == 0);
	/* Seven bytes plus the terminator occupy [0..7]. */
	assert((unsigned char)dstbuf[8] == 0xcc);

	printf("PASS wcstombs()\n");

	return (0);
}

View File

@ -0,0 +1,109 @@
/*-
* Copyright (c) 2002 Tim J. Robbins
* All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
*
* THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
* ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
* OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
* SUCH DAMAGE.
*/
/*
* Test program for wctomb(), as specified by IEEE Std. 1003.1-2001 and
* ISO/IEC 9899:1999.
*
* The function is tested with both the "C" ("POSIX") LC_CTYPE setting and
* "ja_JP.eucJP". Other encodings are not tested.
*/
#include <sys/cdefs.h>
__FBSDID("$FreeBSD$");
#include <assert.h>
#include <errno.h>
#include <limits.h>
#include <locale.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
/*
 * Regression test driver for wctomb().
 *
 * Every check is an assert(); a failed check aborts the program.  When all
 * checks hold, "PASS wctomb()" is printed and 0 is returned.  The command
 * line arguments are not used.
 *
 * The output buffer is pre-filled with 0xcc before each conversion so the
 * byte just past the converted character can be verified as untouched.
 */
int
main(int argc, char *argv[])
{
	const char *locale;
	int len;	/* wctomb() returns int; -1 signals an error. */
	char buf[MB_LEN_MAX + 1];

	(void)argc;
	(void)argv;

	/*
	 * C/POSIX locale.
	 */

	assert(MB_CUR_MAX == 1);

	/* No shift states in C locale. */
	assert(wctomb(NULL, L'\0') == 0);

	/* Null wide character. */
	memset(buf, 0xcc, sizeof(buf));
	len = wctomb(buf, L'\0');
	assert(len == 1);
	assert((unsigned char)buf[0] == 0 && (unsigned char)buf[1] == 0xcc);

	/* Latin letter A. */
	memset(buf, 0xcc, sizeof(buf));
	len = wctomb(buf, L'A');
	assert(len == 1);
	assert((unsigned char)buf[0] == 'A' && (unsigned char)buf[1] == 0xcc);

	/* Invalid code. */
	assert(wctomb(buf, UCHAR_MAX + 1) == -1);

	/*
	 * Japanese (EUC) locale.
	 */

	/*
	 * setlocale() returns NULL when the locale cannot be selected, so
	 * check the pointer before handing it to strcmp().
	 */
	locale = setlocale(LC_CTYPE, "ja_JP.eucJP");
	assert(locale != NULL && strcmp(locale, "ja_JP.eucJP") == 0);
	assert(MB_CUR_MAX == 3);

	/* No shift states in EUC encoding. */
	assert(wctomb(NULL, L'\0') == 0);

	/* Null wide character. */
	memset(buf, 0xcc, sizeof(buf));
	len = wctomb(buf, L'\0');
	assert(len == 1);
	assert((unsigned char)buf[0] == 0 && (unsigned char)buf[1] == 0xcc);

	/* Latin letter A. */
	memset(buf, 0xcc, sizeof(buf));
	len = wctomb(buf, L'A');
	assert(len == 1);
	assert((unsigned char)buf[0] == 'A' && (unsigned char)buf[1] == 0xcc);

	/* Full width letter A. */
	memset(buf, 0xcc, sizeof(buf));
	len = wctomb(buf, 0xa3c1);
	assert(len == 2);
	assert((unsigned char)buf[0] == 0xa3 &&
	    (unsigned char)buf[1] == 0xc1 &&
	    (unsigned char)buf[2] == 0xcc);

	printf("PASS wctomb()\n");

	return (0);
}