1/* $NetBSD: t_btowc.c,v 1.3 2017/08/10 19:08:43 perseant Exp $ */ 2 3/*- 4 * Copyright (c) 2017 The NetBSD Foundation, Inc. 5 * All rights reserved. 6 * 7 * This code is derived from software contributed to The NetBSD Foundation 8 * by Konrad Schroder. 9 * 10 * Redistribution and use in source and binary forms, with or without 11 * modification, are permitted provided that the following conditions 12 * are met: 13 * 1. Redistributions of source code must retain the above copyright 14 * notice, this list of conditions and the following disclaimer. 15 * 2. Redistributions in binary form must reproduce the above copyright 16 * notice, this list of conditions and the following disclaimer in the 17 * documentation and/or other materials provided with the distribution. 18 * 19 * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS 20 * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED 21 * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR 22 * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS 23 * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR 24 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF 25 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS 26 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN 27 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) 28 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE 29 * POSSIBILITY OF SUCH DAMAGE. 30 */ 31 32#include <sys/cdefs.h> 33__COPYRIGHT("@(#) Copyright (c) 2017\ 34 The NetBSD Foundation, inc. All rights reserved."); 35__RCSID("$NetBSD: t_btowc.c,v 1.3 2017/08/10 19:08:43 perseant Exp $"); 36 37#include <locale.h> 38#include <stdio.h> 39#include <stdlib.h> 40#include <errno.h> 41#include <string.h> 42#include <wchar.h> 43 44#include <atf-c.h> 45 46struct test { 47 const char *locale; 48 const char *illegal; /* Illegal single-byte characters, if any */ 49 const char *legal; /* Legal single-byte characters */ 50 /* The next two are only used if __STDC_ISO_10646__ is defined */ 51 const wchar_t wlegal[8]; /* The same characters, but in ISO-10646 */ 52 const wchar_t willegal[8]; /* ISO-10646 that do not map into charset */ 53} tests[] = { 54 { 55 "en_US.UTF-8", 56 "\200", 57 "ABC123@\t", 58 { 'A', 'B', 'C', '1', '2', '3', '@', '\t' }, 59 { 0xfdd0, 0x10fffe, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0} 60 }, 61 { 62 "ru_RU.KOI8-R", 63 "", /* No illegal characters in KOI8-R */ 64 "A\xc2\xd7\xc7\xc4\xc5\xa3", 65 { 'A', 0x0431, 0x432, 0x0433, 0x0434, 0x0435, 0x0451, 0x0 }, 66 { 0x00c5, 0x00e6, 0x00fe, 0x0630, 0x06fc, 0x56cd, 0x0, 0x0 } 67 }, 68 { 69 NULL, 70 NULL, 71 NULL, 72 { 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0 }, 73 { 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0 } 74 }, 75}; 76 77#ifdef __STDC_ISO_10646__ 78static void 79h_iso10646(struct test *t) 80{ 81 const char *cp; 82 int c, wc; 83 char *str; 84 const wchar_t *wcp; 85 86 ATF_REQUIRE_STREQ(setlocale(LC_ALL, "C"), "C"); 87 printf("Trying locale: %s\n", t->locale); 88 ATF_REQUIRE(setlocale(LC_CTYPE, t->locale) != NULL); 89 ATF_REQUIRE((str = setlocale(LC_ALL, NULL)) != NULL); 90 (void)printf("Using locale: %s\n", str); 91 92 /* These should have valid wchar representations */ 93 for (cp = t->legal, wcp = t->wlegal; *cp != '\0'; ++cp, ++wcp) { 94 c = (int)(unsigned char)*cp; 95 printf("Checking legal character 0x%x\n", c); 96 wc = btowc(c); 97 98 if (errno != 0) 99 printf(" btowc() failed with errno=%d\n", errno); 100 101 /* It should map to the known Unicode equivalent */ 102 printf("btowc(0x%2.2x) = 0x%x, expecting 0x%x\n", 103 c, wc, *wcp); 104 ATF_REQUIRE(btowc(c) == *wcp); 105 } 106 107 /* These are invalid characters in the target set */ 108 for (wcp = t->willegal; *wcp != '\0'; ++wcp) { 109 printf("Checking illegal wide character 0x%lx\n", 110 (unsigned long)*wcp); 111 ATF_REQUIRE_EQ(wctob(*wcp), EOF); 112 } 113} 114#endif 115 116static void 117h_btowc(struct test *t) 118{ 119 const char *cp; 120 unsigned char c; 121 char *str; 122 const wchar_t *wcp; 123 124 ATF_REQUIRE_STREQ(setlocale(LC_ALL, "C"), "C"); 125 printf("Trying locale: %s\n", t->locale); 126 ATF_REQUIRE(setlocale(LC_CTYPE, t->locale) != NULL); 127 ATF_REQUIRE((str = setlocale(LC_ALL, NULL)) != NULL); 128 (void)printf("Using locale: %s\n", str); 129 130 /* btowc(EOF) -> WEOF */ 131 ATF_REQUIRE_EQ(btowc(EOF), WEOF); 132 133 /* wctob(WEOF) -> EOF */ 134 ATF_REQUIRE_EQ(wctob(WEOF), EOF); 135 136 /* Invalid in initial shift state -> WEOF */ 137 for (cp = t->illegal; *cp != '\0'; ++cp) { 138 printf("Checking illegal character 0x%x\n", 139 (unsigned char)*cp); 140 ATF_REQUIRE_EQ(btowc(*cp), WEOF); 141 } 142 143 /* These should have valid wchar representations */ 144 for (cp = t->legal; *cp != '\0'; ++cp) { 145 c = (unsigned char)*cp; 146 printf("Checking legal character 0x%x\n", c); 147 148 /* A legal character never maps to EOF */ 149 ATF_REQUIRE(btowc(c) != WEOF); 150 151 /* And the mapping should be reversible */ 152 printf("0x%x -> wide 0x%x -> 0x%x\n", 153 c, btowc(c), (unsigned char)wctob(btowc(c))); 154 ATF_REQUIRE_EQ(wctob(btowc(c)), c); 155 } 156} 157 158ATF_TC(btowc); 159ATF_TC_HEAD(btowc, tc) 160{ 161 atf_tc_set_md_var(tc, "descr", "Checks btowc(3) and wctob(3)"); 162} 163ATF_TC_BODY(btowc, tc) 164{ 165 struct test *t; 166 167 for (t = tests; t->locale != NULL; ++t) 168 h_btowc(t); 169} 170 171ATF_TC(stdc_iso_10646); 172ATF_TC_HEAD(stdc_iso_10646, tc) 173{ 174 atf_tc_set_md_var(tc, "descr", 175 "Checks btowc(3) conversion to ISO10646"); 176} 177ATF_TC_BODY(stdc_iso_10646, tc) 178{ 179 struct test *t; 180 181#ifdef __STDC_ISO_10646__ 182 for (t = tests; t->locale != NULL; ++t) 183 h_iso10646(t); 184#else /* ! __STDC_ISO_10646__ */ 185 atf_tc_skip("__STDC_ISO_10646__ not defined"); 186#endif /* ! __STDC_ISO_10646__ */ 187} 188 189ATF_TC(btowc_posix); 190ATF_TC_HEAD(btowc_posix, tc) 191{ 192 atf_tc_set_md_var(tc, "descr", "Checks btowc(3) and wctob(3) for POSIX locale"); 193} 194ATF_TC_BODY(btowc_posix, tc) 195{ 196 const char *cp; 197 unsigned char c; 198 char *str; 199 const wchar_t *wcp; 200 int i; 201 202 ATF_REQUIRE_STREQ(setlocale(LC_ALL, "POSIX"), "POSIX"); 203 204 /* btowc(EOF) -> WEOF */ 205 ATF_REQUIRE_EQ(btowc(EOF), WEOF); 206 207 /* wctob(WEOF) -> EOF */ 208 ATF_REQUIRE_EQ(wctob(WEOF), EOF); 209 210 /* All characters from 0 to 255, inclusive, map 211 onto their unsigned char equivalent */ 212 for (i = 0; i <= 255; i++) { 213 ATF_REQUIRE_EQ(btowc(i), (wchar_t)(unsigned char)(i)); 214 ATF_REQUIRE_EQ((unsigned char)wctob(i), (wchar_t)i); 215 } 216} 217 218ATF_TP_ADD_TCS(tp) 219{ 220 ATF_TP_ADD_TC(tp, btowc); 221 ATF_TP_ADD_TC(tp, btowc_posix); 222 ATF_TP_ADD_TC(tp, stdc_iso_10646); 223 224 return atf_no_error(); 225} 226