1 /*-
2 * Copyright (c) 2002 Tim J. Robbins
3 * All rights reserved.
4 *
 * Copyright (c) 2013 Ed Schouten <ed@FreeBSD.org>
6 * All rights reserved.
7 *
8 * Redistribution and use in source and binary forms, with or without
9 * modification, are permitted provided that the following conditions
10 * are met:
11 * 1. Redistributions of source code must retain the above copyright
12 * notice, this list of conditions and the following disclaimer.
13 * 2. Redistributions in binary form must reproduce the above copyright
14 * notice, this list of conditions and the following disclaimer in the
15 * documentation and/or other materials provided with the distribution.
16 *
17 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
18 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
20 * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
21 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
22 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
23 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
24 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
25 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
26 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
27 * SUCH DAMAGE.
28 */
29 /*
30 * Test program for mbrtoc16() as specified by ISO/IEC 9899:2011.
31 */
32
33 #include <sys/cdefs.h>
34 __FBSDID("$FreeBSD$");
35
36 #include <errno.h>
37 #include <limits.h>
38 #include <locale.h>
39 #include <stdio.h>
40 #include <string.h>
41 #include <uchar.h>
42
43 #include <atf-c.h>
44
/*
 * Switch LC_CTYPE to locale_name for the running test case.
 *
 * The test case is failed when setlocale() returns NULL; otherwise the
 * string it returned is required to compare equal to locale_name.
 */
static void
require_lc_ctype(const char *locale_name)
{
	const char *active = setlocale(LC_CTYPE, locale_name);

	if (active == NULL) {
		atf_tc_fail("setlocale(LC_CTYPE, \"%s\") failed; errno=%d",
		    locale_name, errno);
	}

	ATF_REQUIRE(strcmp(active, locale_name) == 0);
}
57
/* Receives the char16_t value written by mbrtoc16() in every test case. */
static char16_t c16;

/*
 * Explicit conversion state handed to mbrtoc16(); the test cases zero it
 * with memset() before each independent conversion.
 */
static mbstate_t s;
60
61 ATF_TC_WITHOUT_HEAD(mbrtoc16_c_locale_test);
ATF_TC_BODY(mbrtoc16_c_locale_test,tc)62 ATF_TC_BODY(mbrtoc16_c_locale_test, tc)
63 {
64
65 require_lc_ctype("C");
66
67 /* Null wide character, internal state. */
68 ATF_REQUIRE(mbrtoc16(&c16, "", 1, NULL) == 0);
69 ATF_REQUIRE(c16 == 0);
70
71 /* Null wide character. */
72 memset(&s, 0, sizeof(s));
73 ATF_REQUIRE(mbrtoc16(&c16, "", 1, &s) == 0);
74 ATF_REQUIRE(c16 == 0);
75
76 /* Latin letter A, internal state. */
77 ATF_REQUIRE(mbrtoc16(NULL, 0, 0, NULL) == 0);
78 ATF_REQUIRE(mbrtoc16(&c16, "A", 1, NULL) == 1);
79 ATF_REQUIRE(c16 == L'A');
80
81 /* Latin letter A. */
82 memset(&s, 0, sizeof(s));
83 ATF_REQUIRE(mbrtoc16(&c16, "A", 1, &s) == 1);
84 ATF_REQUIRE(c16 == L'A');
85
86 /* Incomplete character sequence. */
87 c16 = L'z';
88 memset(&s, 0, sizeof(s));
89 ATF_REQUIRE(mbrtoc16(&c16, "", 0, &s) == (size_t)-2);
90 ATF_REQUIRE(c16 == L'z');
91
92 /* Check that mbrtoc16() doesn't access the buffer when n == 0. */
93 c16 = L'z';
94 memset(&s, 0, sizeof(s));
95 ATF_REQUIRE(mbrtoc16(&c16, "", 0, &s) == (size_t)-2);
96 ATF_REQUIRE(c16 == L'z');
97
98 /* Check that mbrtoc16() doesn't read ahead too aggressively. */
99 memset(&s, 0, sizeof(s));
100 ATF_REQUIRE(mbrtoc16(&c16, "AB", 2, &s) == 1);
101 ATF_REQUIRE(c16 == L'A');
102 ATF_REQUIRE(mbrtoc16(&c16, "C", 1, &s) == 1);
103 ATF_REQUIRE(c16 == L'C');
104
105 }
106
107 ATF_TC_WITHOUT_HEAD(mbrtoc16_iso_8859_1_test);
ATF_TC_BODY(mbrtoc16_iso_8859_1_test,tc)108 ATF_TC_BODY(mbrtoc16_iso_8859_1_test, tc)
109 {
110
111 require_lc_ctype("en_US.ISO8859-1");
112
113 /* Currency sign. */
114 memset(&s, 0, sizeof(s));
115 ATF_REQUIRE(mbrtoc16(&c16, "\xa4", 1, &s) == 1);
116 ATF_REQUIRE(c16 == 0xa4);
117 }
118
119 ATF_TC_WITHOUT_HEAD(mbrtoc16_iso_8859_15_test);
ATF_TC_BODY(mbrtoc16_iso_8859_15_test,tc)120 ATF_TC_BODY(mbrtoc16_iso_8859_15_test, tc)
121 {
122
123 require_lc_ctype("en_US.ISO8859-15");
124
125 /* Euro sign. */
126 memset(&s, 0, sizeof(s));
127 ATF_REQUIRE(mbrtoc16(&c16, "\xa4", 1, &s) == 1);
128 ATF_REQUIRE(c16 == 0x20ac);
129 }
130
131 ATF_TC_WITHOUT_HEAD(mbrtoc16_utf_8_test);
ATF_TC_BODY(mbrtoc16_utf_8_test,tc)132 ATF_TC_BODY(mbrtoc16_utf_8_test, tc)
133 {
134
135 require_lc_ctype("en_US.UTF-8");
136
137 /* Null wide character, internal state. */
138 ATF_REQUIRE(mbrtoc16(NULL, 0, 0, NULL) == 0);
139 ATF_REQUIRE(mbrtoc16(&c16, "", 1, NULL) == 0);
140 ATF_REQUIRE(c16 == 0);
141
142 /* Null wide character. */
143 memset(&s, 0, sizeof(s));
144 ATF_REQUIRE(mbrtoc16(&c16, "", 1, &s) == 0);
145 ATF_REQUIRE(c16 == 0);
146
147 /* Latin letter A, internal state. */
148 ATF_REQUIRE(mbrtoc16(NULL, 0, 0, NULL) == 0);
149 ATF_REQUIRE(mbrtoc16(&c16, "A", 1, NULL) == 1);
150 ATF_REQUIRE(c16 == L'A');
151
152 /* Latin letter A. */
153 memset(&s, 0, sizeof(s));
154 ATF_REQUIRE(mbrtoc16(&c16, "A", 1, &s) == 1);
155 ATF_REQUIRE(c16 == L'A');
156
157 /* Incomplete character sequence (zero length). */
158 c16 = L'z';
159 memset(&s, 0, sizeof(s));
160 ATF_REQUIRE(mbrtoc16(&c16, "", 0, &s) == (size_t)-2);
161 ATF_REQUIRE(c16 == L'z');
162
163 /* Incomplete character sequence (truncated double-byte). */
164 memset(&s, 0, sizeof(s));
165 c16 = 0;
166 ATF_REQUIRE(mbrtoc16(&c16, "\xc3", 1, &s) == (size_t)-2);
167
168 /* Same as above, but complete. */
169 memset(&s, 0, sizeof(s));
170 c16 = 0;
171 ATF_REQUIRE(mbrtoc16(&c16, "\xc3\x84", 2, &s) == 2);
172 ATF_REQUIRE(c16 == 0xc4);
173
174 /* Test restarting behaviour. */
175 memset(&s, 0, sizeof(s));
176 c16 = 0;
177 ATF_REQUIRE(mbrtoc16(&c16, "\xc3", 1, &s) == (size_t)-2);
178 ATF_REQUIRE(c16 == 0);
179 ATF_REQUIRE(mbrtoc16(&c16, "\xb7", 1, &s) == 1);
180 ATF_REQUIRE(c16 == 0xf7);
181
182 /* Surrogate pair. */
183 memset(&s, 0, sizeof(s));
184 c16 = 0;
185 ATF_REQUIRE(mbrtoc16(&c16, "\xf0\x9f\x92\xa9", 4, &s) == 4);
186 ATF_REQUIRE(c16 == 0xd83d);
187 ATF_REQUIRE(mbrtoc16(&c16, "", 0, &s) == (size_t)-3);
188 ATF_REQUIRE(c16 == 0xdca9);
189
190 /* Letter e with acute, precomposed. */
191 memset(&s, 0, sizeof(s));
192 c16 = 0;
193 ATF_REQUIRE(mbrtoc16(&c16, "\xc3\xa9", 2, &s) == 2);
194 ATF_REQUIRE(c16 == 0xe9);
195
196 /* Letter e with acute, combined. */
197 memset(&s, 0, sizeof(s));
198 c16 = 0;
199 ATF_REQUIRE(mbrtoc16(&c16, "\x65\xcc\x81", 3, &s) == 1);
200 ATF_REQUIRE(c16 == 0x65);
201 ATF_REQUIRE(mbrtoc16(&c16, "\xcc\x81", 2, &s) == 2);
202 ATF_REQUIRE(c16 == 0x301);
203 }
204
ATF_TP_ADD_TCS(tp)205 ATF_TP_ADD_TCS(tp)
206 {
207
208 ATF_TP_ADD_TC(tp, mbrtoc16_c_locale_test);
209 ATF_TP_ADD_TC(tp, mbrtoc16_iso_8859_1_test);
210 ATF_TP_ADD_TC(tp, mbrtoc16_iso_8859_15_test);
211 ATF_TP_ADD_TC(tp, mbrtoc16_utf_8_test);
212
213 return (atf_no_error());
214 }
215