/* big5.c revision 129334 */
138333Sphk/*- 2128004Stjr * Copyright (c) 2002-2004 Tim J. Robbins. All rights reserved. 338333Sphk * Copyright (c) 1993 438333Sphk * The Regents of the University of California. All rights reserved. 538333Sphk * 638333Sphk * This code is derived from software contributed to Berkeley by 738333Sphk * Paul Borman at Krystal Technologies. 838333Sphk * 938333Sphk * Redistribution and use in source and binary forms, with or without 1038333Sphk * modification, are permitted provided that the following conditions 1138333Sphk * are met: 1238333Sphk * 1. Redistributions of source code must retain the above copyright 1338333Sphk * notice, this list of conditions and the following disclaimer. 1438333Sphk * 2. Redistributions in binary form must reproduce the above copyright 1538333Sphk * notice, this list of conditions and the following disclaimer in the 1638333Sphk * documentation and/or other materials provided with the distribution. 1738333Sphk * 3. All advertising materials mentioning features or use of this software 1838333Sphk * must display the following acknowledgement: 1938333Sphk * This product includes software developed by the University of 2038333Sphk * California, Berkeley and its contributors. 2138333Sphk * 4. Neither the name of the University nor the names of its contributors 2238333Sphk * may be used to endorse or promote products derived from this software 2338333Sphk * without specific prior written permission. 2438333Sphk * 2538333Sphk * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 2638333Sphk * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 2738333Sphk * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 2838333Sphk * ARE DISCLAIMED. 
IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 2938333Sphk * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 3038333Sphk * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 3138333Sphk * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 3238333Sphk * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 3338333Sphk * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 3438333Sphk * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 3538333Sphk * SUCH DAMAGE. 3638333Sphk */ 3738333Sphk 3838333Sphk#if defined(LIBC_SCCS) && !defined(lint) 3938333Sphkstatic char sccsid[] = "@(#)big5.c 8.1 (Berkeley) 6/4/93"; 4038333Sphk#endif /* LIBC_SCCS and not lint */ 41128004Stjr#include <sys/param.h> 4292986Sobrien__FBSDID("$FreeBSD: head/lib/libc/locale/big5.c 129334 2004-05-17 11:16:14Z tjr $"); 4338333Sphk 44128155Stjr#include <errno.h> 45121893Stjr#include <runetype.h> 4638333Sphk#include <stdlib.h> 47128004Stjr#include <string.h> 48121893Stjr#include <wchar.h> 49129153Stjr#include "mblocal.h" 5038333Sphk 51121893Stjrint _BIG5_init(_RuneLocale *); 52121893Stjrsize_t _BIG5_mbrtowc(wchar_t * __restrict, const char * __restrict, size_t, 53121893Stjr mbstate_t * __restrict); 54128004Stjrint _BIG5_mbsinit(const mbstate_t *); 55121893Stjrsize_t _BIG5_wcrtomb(char * __restrict, wchar_t, mbstate_t * __restrict); 56121893Stjr 57128004Stjrtypedef struct { 58129334Stjr wchar_t ch; 59128004Stjr} _BIG5State; 60128004Stjr 6138333Sphkint 62121893Stjr_BIG5_init(_RuneLocale *rl) 6338333Sphk{ 64121893Stjr 65121893Stjr __mbrtowc = _BIG5_mbrtowc; 66121893Stjr __wcrtomb = _BIG5_wcrtomb; 67128004Stjr __mbsinit = _BIG5_mbsinit; 6838333Sphk _CurrentRuneLocale = rl; 6938333Sphk __mb_cur_max = 2; 7038333Sphk return (0); 7138333Sphk} 7238333Sphk 73128004Stjrint 74128004Stjr_BIG5_mbsinit(const mbstate_t *ps) 75128004Stjr{ 76128004Stjr 77129334Stjr return (ps == NULL 
|| ((const _BIG5State *)ps)->ch == 0); 78128004Stjr} 79128004Stjr 80121893Stjrstatic __inline int 81121893Stjr_big5_check(u_int c) 8238333Sphk{ 83121893Stjr 8438333Sphk c &= 0xff; 8538333Sphk return ((c >= 0xa1 && c <= 0xfe) ? 2 : 1); 8638333Sphk} 8738333Sphk 88121893Stjrsize_t 89121893Stjr_BIG5_mbrtowc(wchar_t * __restrict pwc, const char * __restrict s, size_t n, 90128004Stjr mbstate_t * __restrict ps) 9138333Sphk{ 92128004Stjr _BIG5State *bs; 93121893Stjr wchar_t wc; 94129334Stjr size_t len; 9538333Sphk 96128004Stjr bs = (_BIG5State *)ps; 97128004Stjr 98129334Stjr if ((bs->ch & ~0xFF) != 0) { 99129334Stjr /* Bad conversion state. */ 100128155Stjr errno = EINVAL; 101128155Stjr return ((size_t)-1); 102128155Stjr } 103128155Stjr 104128004Stjr if (s == NULL) { 105128004Stjr s = ""; 106128004Stjr n = 1; 107128004Stjr pwc = NULL; 108128004Stjr } 109128004Stjr 110129334Stjr if (n == 0) 111121893Stjr /* Incomplete multibyte sequence */ 112121893Stjr return ((size_t)-2); 113129334Stjr 114129334Stjr if (bs->ch != 0) { 115129334Stjr if (*s == '\0') { 116129334Stjr errno = EILSEQ; 117129334Stjr return ((size_t)-1); 118129334Stjr } 119129334Stjr wc = (bs->ch << 8) | (*s & 0xFF); 120129334Stjr if (pwc != NULL) 121129334Stjr *pwc = wc; 122129334Stjr bs->ch = 0; 123129334Stjr return (1); 124129117Stjr } 125129334Stjr 126129334Stjr len = (size_t)_big5_check(*s); 127129334Stjr wc = *s++ & 0xff; 128129334Stjr if (len == 2) { 129129334Stjr if (n < 2) { 130129334Stjr /* Incomplete multibyte sequence */ 131129334Stjr bs->ch = wc; 132129334Stjr return ((size_t)-2); 133129334Stjr } 134129334Stjr if (*s == '\0') { 135129334Stjr errno = EILSEQ; 136129334Stjr return ((size_t)-1); 137129334Stjr } 138129334Stjr wc = (wc << 8) | (*s++ & 0xff); 139129334Stjr if (pwc != NULL) 140129334Stjr *pwc = wc; 141129334Stjr return (2); 142129334Stjr } else { 143129334Stjr if (pwc != NULL) 144129334Stjr *pwc = wc; 145129334Stjr return (wc == L'\0' ? 
0 : 1); 146129334Stjr } 14738333Sphk} 14838333Sphk 149121893Stjrsize_t 150128155Stjr_BIG5_wcrtomb(char * __restrict s, wchar_t wc, mbstate_t * __restrict ps) 15138333Sphk{ 152128155Stjr _BIG5State *bs; 153121893Stjr 154128155Stjr bs = (_BIG5State *)ps; 155128155Stjr 156129334Stjr if (bs->ch != 0) { 157128155Stjr errno = EINVAL; 158128155Stjr return ((size_t)-1); 159128155Stjr } 160128155Stjr 161121893Stjr if (s == NULL) 162121893Stjr /* Reset to initial shift state (no-op) */ 163121893Stjr return (1); 164121893Stjr if (wc & 0x8000) { 165121893Stjr *s++ = (wc >> 8) & 0xff; 166121893Stjr *s = wc & 0xff; 167121893Stjr return (2); 16838333Sphk } 169121893Stjr *s = wc & 0xff; 170121893Stjr return (1); 17138333Sphk} 172