xref: /freebsd/lib/libc/tests/locale/mbrtowc_test.c (revision 069ac184)
1 /*-
2  * Copyright (c) 2002 Tim J. Robbins
3  * All rights reserved.
4  *
5  * Redistribution and use in source and binary forms, with or without
6  * modification, are permitted provided that the following conditions
7  * are met:
8  * 1. Redistributions of source code must retain the above copyright
9  *    notice, this list of conditions and the following disclaimer.
10  * 2. Redistributions in binary form must reproduce the above copyright
11  *    notice, this list of conditions and the following disclaimer in the
12  *    documentation and/or other materials provided with the distribution.
13  *
14  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
15  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
16  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
17  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
18  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
19  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
20  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
21  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
22  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
23  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
24  * SUCH DAMAGE.
25  */
26 
27 /*
28  * Test program for mbrtowc(), as specified by IEEE Std. 1003.1-2001 and
29  * ISO/IEC 9899:1999.
30  *
31  * The function is tested with both the "C" ("POSIX") LC_CTYPE setting and
32  * "ja_JP.eucJP". Other encodings are not tested.
33  */
34 
35 #include <errno.h>
36 #include <limits.h>
37 #include <locale.h>
38 #include <stdio.h>
39 #include <stdlib.h>
40 #include <string.h>
41 #include <wchar.h>
42 
43 #include <atf-c.h>
44 
ATF_TC_WITHOUT_HEAD(mbrtowc_test);
/*
 * Exercise mbrtowc() first in the locale in effect on entry (asserted to be
 * single-byte, i.e. C/POSIX) and then in "ja_JP.eucJP".  Each scenario is run
 * against both a caller-supplied mbstate_t and the function's internal state
 * (ps == NULL).
 */
ATF_TC_BODY(mbrtowc_test, tc)
{
	mbstate_t s;
	wchar_t wc;
	char buf[MB_LEN_MAX + 1];
	const char *loc;

	/*
	 * C/POSIX locale.
	 */

	ATF_REQUIRE(MB_CUR_MAX == 1);

	/* Null wide character, internal state. */
	memset(buf, 0xcc, sizeof(buf));
	buf[0] = 0;
	ATF_REQUIRE(mbrtowc(&wc, buf, 1, NULL) == 0);
	ATF_REQUIRE(wc == 0);

	/* Null wide character. */
	memset(&s, 0, sizeof(s));
	ATF_REQUIRE(mbrtowc(&wc, buf, 1, &s) == 0);
	ATF_REQUIRE(wc == 0);

	/* Latin letter A, internal state. */
	/* A null input string resets the internal conversion state. */
	ATF_REQUIRE(mbrtowc(NULL, NULL, 0, NULL) == 0);
	buf[0] = 'A';
	ATF_REQUIRE(mbrtowc(&wc, buf, 1, NULL) == 1);
	ATF_REQUIRE(wc == L'A');

	/* Latin letter A. */
	memset(&s, 0, sizeof(s));
	ATF_REQUIRE(mbrtowc(&wc, buf, 1, &s) == 1);
	ATF_REQUIRE(wc == L'A');

	/* Incomplete character sequence: wc must be left untouched. */
	wc = L'z';
	memset(&s, 0, sizeof(s));
	ATF_REQUIRE(mbrtowc(&wc, buf, 0, &s) == (size_t)-2);
	ATF_REQUIRE(wc == L'z');

	/*
	 * Check that mbrtowc() doesn't access the buffer when n == 0.
	 * If the NUL byte were read, the call would return 0 and store
	 * L'\0' instead of returning (size_t)-2.
	 */
	wc = L'z';
	memset(&s, 0, sizeof(s));
	buf[0] = '\0';
	ATF_REQUIRE(mbrtowc(&wc, buf, 0, &s) == (size_t)-2);
	ATF_REQUIRE(wc == L'z');

	/*
	 * Japanese (EUC) locale.
	 */

	/*
	 * setlocale() returns NULL when the locale is unavailable; check
	 * that before handing the result to strcmp() so that a missing
	 * locale is reported as a test failure rather than a crash.
	 */
	loc = setlocale(LC_CTYPE, "ja_JP.eucJP");
	ATF_REQUIRE_MSG(loc != NULL,
	    "setlocale(LC_CTYPE, \"ja_JP.eucJP\") failed");
	ATF_REQUIRE(strcmp(loc, "ja_JP.eucJP") == 0);
	ATF_REQUIRE(MB_CUR_MAX > 1);

	/* Null wide character, internal state. */
	ATF_REQUIRE(mbrtowc(NULL, NULL, 0, NULL) == 0);
	memset(buf, 0xcc, sizeof(buf));
	buf[0] = 0;
	ATF_REQUIRE(mbrtowc(&wc, buf, 1, NULL) == 0);
	ATF_REQUIRE(wc == 0);

	/* Null wide character. */
	memset(&s, 0, sizeof(s));
	ATF_REQUIRE(mbrtowc(&wc, buf, 1, &s) == 0);
	ATF_REQUIRE(wc == 0);

	/* Latin letter A, internal state. */
	ATF_REQUIRE(mbrtowc(NULL, NULL, 0, NULL) == 0);
	buf[0] = 'A';
	ATF_REQUIRE(mbrtowc(&wc, buf, 1, NULL) == 1);
	ATF_REQUIRE(wc == L'A');

	/* Latin letter A. */
	memset(&s, 0, sizeof(s));
	ATF_REQUIRE(mbrtowc(&wc, buf, 1, &s) == 1);
	ATF_REQUIRE(wc == L'A');

	/* Incomplete character sequence (zero length). */
	wc = L'z';
	memset(&s, 0, sizeof(s));
	ATF_REQUIRE(mbrtowc(&wc, buf, 0, &s) == (size_t)-2);
	ATF_REQUIRE(wc == L'z');

	/* Incomplete character sequence (truncated double-byte). */
	memset(buf, 0xcc, sizeof(buf));
	buf[0] = 0xa3;
	buf[1] = 0x00;
	memset(&s, 0, sizeof(s));
	wc = 0;
	ATF_REQUIRE(mbrtowc(&wc, buf, 1, &s) == (size_t)-2);

	/* Same as above, but complete: 0xa3 0xc1 decodes to 0xa3c1. */
	buf[1] = 0xc1;
	memset(&s, 0, sizeof(s));
	wc = 0;
	ATF_REQUIRE(mbrtowc(&wc, buf, 2, &s) == 2);
	ATF_REQUIRE(wc == 0xa3c1);

	/*
	 * Test restarting behaviour: feed the lead byte alone, then supply
	 * the trail byte in a second call that reuses the same state.
	 */
	memset(buf, 0xcc, sizeof(buf));
	buf[0] = 0xa3;
	memset(&s, 0, sizeof(s));
	wc = 0;
	ATF_REQUIRE(mbrtowc(&wc, buf, 1, &s) == (size_t)-2);
	ATF_REQUIRE(wc == 0);
	buf[0] = 0xc1;
	ATF_REQUIRE(mbrtowc(&wc, buf, 1, &s) == 1);
	ATF_REQUIRE(wc == 0xa3c1);
}
155 
156 ATF_TP_ADD_TCS(tp)
157 {
158 
159 	ATF_TP_ADD_TC(tp, mbrtowc_test);
160 
161 	return (atf_no_error());
162 }
163