138333Sphk/*- 2290494Sbapt * Copyright 2013 Garrett D'Amore <garrett@damore.org> 3290494Sbapt * Copyright 2010 Nexenta Systems, Inc. All rights reserved. 4128004Stjr * Copyright (c) 2002-2004 Tim J. Robbins. All rights reserved. 538333Sphk * Copyright (c) 1993 638333Sphk * The Regents of the University of California. All rights reserved. 738333Sphk * 838333Sphk * This code is derived from software contributed to Berkeley by 938333Sphk * Paul Borman at Krystal Technologies. 1038333Sphk * 11227753Stheraven * Copyright (c) 2011 The FreeBSD Foundation 12227753Stheraven * All rights reserved. 13227753Stheraven * Portions of this software were developed by David Chisnall 14227753Stheraven * under sponsorship from the FreeBSD Foundation. 15227753Stheraven * 1638333Sphk * Redistribution and use in source and binary forms, with or without 1738333Sphk * modification, are permitted provided that the following conditions 1838333Sphk * are met: 1938333Sphk * 1. Redistributions of source code must retain the above copyright 2038333Sphk * notice, this list of conditions and the following disclaimer. 2138333Sphk * 2. Redistributions in binary form must reproduce the above copyright 2238333Sphk * notice, this list of conditions and the following disclaimer in the 2338333Sphk * documentation and/or other materials provided with the distribution. 24290494Sbapt * 3. Neither the name of the University nor the names of its contributors 2538333Sphk * may be used to endorse or promote products derived from this software 2638333Sphk * without specific prior written permission. 2738333Sphk * 2838333Sphk * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 2938333Sphk * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 3038333Sphk * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 3138333Sphk * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 3238333Sphk * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 3338333Sphk * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 3438333Sphk * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 3538333Sphk * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 3638333Sphk * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 3738333Sphk * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 3838333Sphk * SUCH DAMAGE. 3938333Sphk */ 4038333Sphk 4138333Sphk#if defined(LIBC_SCCS) && !defined(lint) 4238333Sphkstatic char sccsid[] = "@(#)big5.c 8.1 (Berkeley) 6/4/93"; 4338333Sphk#endif /* LIBC_SCCS and not lint */ 44142654Sphantom#include <sys/cdefs.h> 4592986Sobrien__FBSDID("$FreeBSD$"); 4638333Sphk 47142654Sphantom#include <sys/types.h> 48128155Stjr#include <errno.h> 49121893Stjr#include <runetype.h> 5038333Sphk#include <stdlib.h> 51128004Stjr#include <string.h> 52121893Stjr#include <wchar.h> 53129153Stjr#include "mblocal.h" 5438333Sphk 55172619Sacheextern int __mb_sb_limit; 56172619Sache 57142654Sphantomstatic size_t _BIG5_mbrtowc(wchar_t * __restrict, const char * __restrict, 58142654Sphantom size_t, mbstate_t * __restrict); 59142654Sphantomstatic int _BIG5_mbsinit(const mbstate_t *); 60142654Sphantomstatic size_t _BIG5_wcrtomb(char * __restrict, wchar_t, 61142654Sphantom mbstate_t * __restrict); 62290494Sbaptstatic size_t _BIG5_mbsnrtowcs(wchar_t * __restrict, 63290494Sbapt const char ** __restrict, size_t, size_t, 64290494Sbapt mbstate_t * __restrict); 65290494Sbaptstatic size_t _BIG5_wcsnrtombs(char * __restrict, 66290494Sbapt const wchar_t ** __restrict, size_t, size_t, 67290494Sbapt mbstate_t * __restrict); 68121893Stjr 69128004Stjrtypedef struct { 70129334Stjr wchar_t ch; 71128004Stjr} _BIG5State; 72128004Stjr 7338333Sphkint 74227753Stheraven_BIG5_init(struct xlocale_ctype *l, _RuneLocale *rl) 7538333Sphk{ 76121893Stjr 77227753Stheraven l->__mbrtowc = _BIG5_mbrtowc; 78227753Stheraven l->__wcrtomb = _BIG5_wcrtomb; 79290494Sbapt l->__mbsnrtowcs = _BIG5_mbsnrtowcs; 80290494Sbapt l->__wcsnrtombs = _BIG5_wcsnrtombs; 81227753Stheraven l->__mbsinit = _BIG5_mbsinit; 82227753Stheraven l->runes = rl; 83227753Stheraven l->__mb_cur_max = 2; 84227753Stheraven l->__mb_sb_limit = 128; 8538333Sphk return (0); 8638333Sphk} 8738333Sphk 88142654Sphantomstatic int 89128004Stjr_BIG5_mbsinit(const mbstate_t *ps) 90128004Stjr{ 91128004Stjr 92129334Stjr return (ps == NULL || ((const _BIG5State *)ps)->ch == 0); 93128004Stjr} 94128004Stjr 95121893Stjrstatic __inline int 96121893Stjr_big5_check(u_int c) 9738333Sphk{ 98121893Stjr 9938333Sphk c &= 0xff; 10038333Sphk return ((c >= 0xa1 && c <= 0xfe) ? 2 : 1); 10138333Sphk} 10238333Sphk 103142654Sphantomstatic size_t 104121893Stjr_BIG5_mbrtowc(wchar_t * __restrict pwc, const char * __restrict s, size_t n, 105128004Stjr mbstate_t * __restrict ps) 10638333Sphk{ 107128004Stjr _BIG5State *bs; 108121893Stjr wchar_t wc; 109129334Stjr size_t len; 11038333Sphk 111128004Stjr bs = (_BIG5State *)ps; 112128004Stjr 113129334Stjr if ((bs->ch & ~0xFF) != 0) { 114129334Stjr /* Bad conversion state. */ 115128155Stjr errno = EINVAL; 116128155Stjr return ((size_t)-1); 117128155Stjr } 118128155Stjr 119128004Stjr if (s == NULL) { 120128004Stjr s = ""; 121128004Stjr n = 1; 122128004Stjr pwc = NULL; 123128004Stjr } 124128004Stjr 125129334Stjr if (n == 0) 126121893Stjr /* Incomplete multibyte sequence */ 127121893Stjr return ((size_t)-2); 128129334Stjr 129129334Stjr if (bs->ch != 0) { 130129334Stjr if (*s == '\0') { 131129334Stjr errno = EILSEQ; 132129334Stjr return ((size_t)-1); 133129334Stjr } 134129334Stjr wc = (bs->ch << 8) | (*s & 0xFF); 135129334Stjr if (pwc != NULL) 136129334Stjr *pwc = wc; 137129334Stjr bs->ch = 0; 138129334Stjr return (1); 139129117Stjr } 140129334Stjr 141129334Stjr len = (size_t)_big5_check(*s); 142129334Stjr wc = *s++ & 0xff; 143129334Stjr if (len == 2) { 144129334Stjr if (n < 2) { 145129334Stjr /* Incomplete multibyte sequence */ 146129334Stjr bs->ch = wc; 147129334Stjr return ((size_t)-2); 148129334Stjr } 149129334Stjr if (*s == '\0') { 150129334Stjr errno = EILSEQ; 151129334Stjr return ((size_t)-1); 152129334Stjr } 153129334Stjr wc = (wc << 8) | (*s++ & 0xff); 154129334Stjr if (pwc != NULL) 155129334Stjr *pwc = wc; 156290494Sbapt return (2); 157129334Stjr } else { 158129334Stjr if (pwc != NULL) 159129334Stjr *pwc = wc; 160129334Stjr return (wc == L'\0' ? 0 : 1); 161129334Stjr } 16238333Sphk} 16338333Sphk 164142654Sphantomstatic size_t 165128155Stjr_BIG5_wcrtomb(char * __restrict s, wchar_t wc, mbstate_t * __restrict ps) 16638333Sphk{ 167128155Stjr _BIG5State *bs; 168121893Stjr 169128155Stjr bs = (_BIG5State *)ps; 170128155Stjr 171129334Stjr if (bs->ch != 0) { 172128155Stjr errno = EINVAL; 173128155Stjr return ((size_t)-1); 174128155Stjr } 175128155Stjr 176121893Stjr if (s == NULL) 177121893Stjr /* Reset to initial shift state (no-op) */ 178121893Stjr return (1); 179121893Stjr if (wc & 0x8000) { 180121893Stjr *s++ = (wc >> 8) & 0xff; 181121893Stjr *s = wc & 0xff; 182121893Stjr return (2); 18338333Sphk } 184121893Stjr *s = wc & 0xff; 185121893Stjr return (1); 18638333Sphk} 187290494Sbapt 188290494Sbaptstatic size_t 189290494Sbapt_BIG5_mbsnrtowcs(wchar_t * __restrict dst, const char ** __restrict src, 190290494Sbapt size_t nms, size_t len, mbstate_t * __restrict ps) 191290494Sbapt{ 192290494Sbapt return (__mbsnrtowcs_std(dst, src, nms, len, ps, _BIG5_mbrtowc)); 193290494Sbapt} 194290494Sbapt 195290494Sbaptstatic size_t 196290494Sbapt_BIG5_wcsnrtombs(char * __restrict dst, const wchar_t ** __restrict src, 197290494Sbapt size_t nwc, size_t len, mbstate_t * __restrict ps) 198290494Sbapt{ 199290494Sbapt return (__wcsnrtombs_std(dst, src, nwc, len, ps, _BIG5_wcrtomb)); 200290494Sbapt} 201