xref: /freebsd/lib/libc/tests/locale/mbrtowc_test.c (revision d0b2dbfa)
1 /*-
2  * Copyright (c) 2002 Tim J. Robbins
3  * All rights reserved.
4  *
5  * Redistribution and use in source and binary forms, with or without
6  * modification, are permitted provided that the following conditions
7  * are met:
8  * 1. Redistributions of source code must retain the above copyright
9  *    notice, this list of conditions and the following disclaimer.
10  * 2. Redistributions in binary form must reproduce the above copyright
11  *    notice, this list of conditions and the following disclaimer in the
12  *    documentation and/or other materials provided with the distribution.
13  *
14  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
15  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
16  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
17  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
18  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
19  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
20  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
21  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
22  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
23  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
24  * SUCH DAMAGE.
25  */
26 
27 /*
28  * Test program for mbrtowc(), as specified by IEEE Std. 1003.1-2001 and
29  * ISO/IEC 9899:1999.
30  *
31  * The function is tested with both the "C" ("POSIX") LC_CTYPE setting and
32  * "ja_JP.eucJP". Other encodings are not tested.
33  */
34 
35 #include <sys/cdefs.h>
36 #include <errno.h>
37 #include <limits.h>
38 #include <locale.h>
39 #include <stdio.h>
40 #include <stdlib.h>
41 #include <string.h>
42 #include <wchar.h>
43 
44 #include <atf-c.h>
45 
/*
 * mbrtowc_test: exercise mbrtowc() in the "C" locale and then in the
 * "ja_JP.eucJP" locale.
 *
 * Each scenario is run with either the caller-supplied conversion state `s`
 * (zeroed before use) or a NULL state pointer, which makes mbrtowc() use its
 * own internal state.  The cases cover the null character, a single-byte
 * character, zero-length input, a truncated two-byte character, a complete
 * two-byte character, and resuming a two-byte character across two calls.
 */
ATF_TC_WITHOUT_HEAD(mbrtowc_test);
ATF_TC_BODY(mbrtowc_test, tc)
{
	mbstate_t s;
	wchar_t wc;
	char buf[MB_LEN_MAX + 1];
	const char *loc;

	/*
	 * C/POSIX locale.
	 */

	ATF_REQUIRE(MB_CUR_MAX == 1);

	/* Null wide character, internal state. */
	memset(buf, 0xcc, sizeof(buf));
	buf[0] = 0;
	ATF_REQUIRE(mbrtowc(&wc, buf, 1, NULL) == 0);
	ATF_REQUIRE(wc == 0);

	/* Null wide character. */
	memset(&s, 0, sizeof(s));
	ATF_REQUIRE(mbrtowc(&wc, buf, 1, &s) == 0);
	ATF_REQUIRE(wc == 0);

	/* Latin letter A, internal state. */
	ATF_REQUIRE(mbrtowc(NULL, 0, 0, NULL) == 0);
	buf[0] = 'A';
	ATF_REQUIRE(mbrtowc(&wc, buf, 1, NULL) == 1);
	ATF_REQUIRE(wc == L'A');

	/* Latin letter A. */
	memset(&s, 0, sizeof(s));
	ATF_REQUIRE(mbrtowc(&wc, buf, 1, &s) == 1);
	ATF_REQUIRE(wc == L'A');

	/* Incomplete character sequence; wc must keep its sentinel value. */
	wc = L'z';
	memset(&s, 0, sizeof(s));
	ATF_REQUIRE(mbrtowc(&wc, buf, 0, &s) == (size_t)-2);
	ATF_REQUIRE(wc == L'z');

	/*
	 * Check that mbrtowc() doesn't access the buffer when n == 0: the
	 * buffer now starts with a NUL byte, yet the expected result is still
	 * (size_t)-2 rather than 0, and wc must stay untouched.
	 */
	wc = L'z';
	memset(&s, 0, sizeof(s));
	buf[0] = '\0';
	ATF_REQUIRE(mbrtowc(&wc, buf, 0, &s) == (size_t)-2);
	ATF_REQUIRE(wc == L'z');

	/*
	 * Japanese (EUC) locale.
	 */

	/*
	 * setlocale() returns NULL when the locale is unavailable; check for
	 * that before handing the result to strcmp() so the test fails with a
	 * diagnostic instead of dereferencing a null pointer.
	 */
	loc = setlocale(LC_CTYPE, "ja_JP.eucJP");
	ATF_REQUIRE_MSG(loc != NULL,
	    "setlocale(LC_CTYPE, \"ja_JP.eucJP\") failed");
	ATF_REQUIRE(strcmp(loc, "ja_JP.eucJP") == 0);
	ATF_REQUIRE(MB_CUR_MAX > 1);

	/* Null wide character, internal state. */
	ATF_REQUIRE(mbrtowc(NULL, 0, 0, NULL) == 0);
	memset(buf, 0xcc, sizeof(buf));
	buf[0] = 0;
	ATF_REQUIRE(mbrtowc(&wc, buf, 1, NULL) == 0);
	ATF_REQUIRE(wc == 0);

	/* Null wide character. */
	memset(&s, 0, sizeof(s));
	ATF_REQUIRE(mbrtowc(&wc, buf, 1, &s) == 0);
	ATF_REQUIRE(wc == 0);

	/* Latin letter A, internal state. */
	ATF_REQUIRE(mbrtowc(NULL, 0, 0, NULL) == 0);
	buf[0] = 'A';
	ATF_REQUIRE(mbrtowc(&wc, buf, 1, NULL) == 1);
	ATF_REQUIRE(wc == L'A');

	/* Latin letter A. */
	memset(&s, 0, sizeof(s));
	ATF_REQUIRE(mbrtowc(&wc, buf, 1, &s) == 1);
	ATF_REQUIRE(wc == L'A');

	/* Incomplete character sequence (zero length). */
	wc = L'z';
	memset(&s, 0, sizeof(s));
	ATF_REQUIRE(mbrtowc(&wc, buf, 0, &s) == (size_t)-2);
	ATF_REQUIRE(wc == L'z');

	/* Incomplete character sequence (truncated double-byte). */
	memset(buf, 0xcc, sizeof(buf));
	buf[0] = 0xa3;
	buf[1] = 0x00;
	memset(&s, 0, sizeof(s));
	wc = 0;
	ATF_REQUIRE(mbrtowc(&wc, buf, 1, &s) == (size_t)-2);
	/* Same expectation as the identical call in the restart case below. */
	ATF_REQUIRE(wc == 0);

	/* Same as above, but complete. */
	buf[1] = 0xc1;
	memset(&s, 0, sizeof(s));
	wc = 0;
	ATF_REQUIRE(mbrtowc(&wc, buf, 2, &s) == 2);
	ATF_REQUIRE(wc == 0xa3c1);

	/*
	 * Test restarting behaviour: feed the lead byte alone, then supply
	 * the trail byte in a second call that reuses the same state object.
	 */
	memset(buf, 0xcc, sizeof(buf));
	buf[0] = 0xa3;
	memset(&s, 0, sizeof(s));
	wc = 0;
	ATF_REQUIRE(mbrtowc(&wc, buf, 1, &s) == (size_t)-2);
	ATF_REQUIRE(wc == 0);
	buf[0] = 0xc1;
	ATF_REQUIRE(mbrtowc(&wc, buf, 1, &s) == 1);
	ATF_REQUIRE(wc == 0xa3c1);
}
156 
157 ATF_TP_ADD_TCS(tp)
158 {
159 
160 	ATF_TP_ADD_TC(tp, mbrtowc_test);
161 
162 	return (atf_no_error());
163 }
164