big5.c revision 129334
138333Sphk/*-
2128004Stjr * Copyright (c) 2002-2004 Tim J. Robbins. All rights reserved.
338333Sphk * Copyright (c) 1993
438333Sphk *	The Regents of the University of California.  All rights reserved.
538333Sphk *
638333Sphk * This code is derived from software contributed to Berkeley by
738333Sphk * Paul Borman at Krystal Technologies.
838333Sphk *
938333Sphk * Redistribution and use in source and binary forms, with or without
1038333Sphk * modification, are permitted provided that the following conditions
1138333Sphk * are met:
1238333Sphk * 1. Redistributions of source code must retain the above copyright
1338333Sphk *    notice, this list of conditions and the following disclaimer.
1438333Sphk * 2. Redistributions in binary form must reproduce the above copyright
1538333Sphk *    notice, this list of conditions and the following disclaimer in the
1638333Sphk *    documentation and/or other materials provided with the distribution.
1738333Sphk * 3. All advertising materials mentioning features or use of this software
1838333Sphk *    must display the following acknowledgement:
1938333Sphk *	This product includes software developed by the University of
2038333Sphk *	California, Berkeley and its contributors.
2138333Sphk * 4. Neither the name of the University nor the names of its contributors
2238333Sphk *    may be used to endorse or promote products derived from this software
2338333Sphk *    without specific prior written permission.
2438333Sphk *
2538333Sphk * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
2638333Sphk * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
2738333Sphk * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
2838333Sphk * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
2938333Sphk * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
3038333Sphk * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
3138333Sphk * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
3238333Sphk * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
3338333Sphk * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
3438333Sphk * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
3538333Sphk * SUCH DAMAGE.
3638333Sphk */
3738333Sphk
3838333Sphk#if defined(LIBC_SCCS) && !defined(lint)
3938333Sphkstatic char sccsid[] = "@(#)big5.c	8.1 (Berkeley) 6/4/93";
4038333Sphk#endif /* LIBC_SCCS and not lint */
41128004Stjr#include <sys/param.h>
4292986Sobrien__FBSDID("$FreeBSD: head/lib/libc/locale/big5.c 129334 2004-05-17 11:16:14Z tjr $");
4338333Sphk
44128155Stjr#include <errno.h>
45121893Stjr#include <runetype.h>
4638333Sphk#include <stdlib.h>
47128004Stjr#include <string.h>
48121893Stjr#include <wchar.h>
49129153Stjr#include "mblocal.h"
5038333Sphk
51121893Stjrint	_BIG5_init(_RuneLocale *);
52121893Stjrsize_t	_BIG5_mbrtowc(wchar_t * __restrict, const char * __restrict, size_t,
53121893Stjr	    mbstate_t * __restrict);
54128004Stjrint	_BIG5_mbsinit(const mbstate_t *);
55121893Stjrsize_t	_BIG5_wcrtomb(char * __restrict, wchar_t, mbstate_t * __restrict);
56121893Stjr
/*
 * Conversion state kept inside the caller's mbstate_t (the conversion
 * routines cast the mbstate_t pointer to this type).
 *
 * ch is 0 in the initial state.  Otherwise it holds the lead byte of a
 * two-byte character whose trail byte has not been supplied yet.
 */
typedef struct {
	wchar_t	ch;		/* pending lead byte, or 0 if none */
} _BIG5State;
60128004Stjr
6138333Sphkint
62121893Stjr_BIG5_init(_RuneLocale *rl)
6338333Sphk{
64121893Stjr
65121893Stjr	__mbrtowc = _BIG5_mbrtowc;
66121893Stjr	__wcrtomb = _BIG5_wcrtomb;
67128004Stjr	__mbsinit = _BIG5_mbsinit;
6838333Sphk	_CurrentRuneLocale = rl;
6938333Sphk	__mb_cur_max = 2;
7038333Sphk	return (0);
7138333Sphk}
7238333Sphk
73128004Stjrint
74128004Stjr_BIG5_mbsinit(const mbstate_t *ps)
75128004Stjr{
76128004Stjr
77129334Stjr	return (ps == NULL || ((const _BIG5State *)ps)->ch == 0);
78128004Stjr}
79128004Stjr
/*
 * Classify a byte as the start of a one- or two-byte BIG5 character.
 *
 * Only the low 8 bits of c are examined, so a sign-extended char is fine.
 * Returns 2 when that byte lies in 0xa1..0xfe (a lead byte), 1 otherwise.
 */
static __inline int
_big5_check(u_int c)
{
	const u_int byte = c & 0xff;

	if (byte < 0xa1 || byte > 0xfe)
		return (1);
	return (2);
}
8738333Sphk
88121893Stjrsize_t
89121893Stjr_BIG5_mbrtowc(wchar_t * __restrict pwc, const char * __restrict s, size_t n,
90128004Stjr    mbstate_t * __restrict ps)
9138333Sphk{
92128004Stjr	_BIG5State *bs;
93121893Stjr	wchar_t wc;
94129334Stjr	size_t len;
9538333Sphk
96128004Stjr	bs = (_BIG5State *)ps;
97128004Stjr
98129334Stjr	if ((bs->ch & ~0xFF) != 0) {
99129334Stjr		/* Bad conversion state. */
100128155Stjr		errno = EINVAL;
101128155Stjr		return ((size_t)-1);
102128155Stjr	}
103128155Stjr
104128004Stjr	if (s == NULL) {
105128004Stjr		s = "";
106128004Stjr		n = 1;
107128004Stjr		pwc = NULL;
108128004Stjr	}
109128004Stjr
110129334Stjr	if (n == 0)
111121893Stjr		/* Incomplete multibyte sequence */
112121893Stjr		return ((size_t)-2);
113129334Stjr
114129334Stjr	if (bs->ch != 0) {
115129334Stjr		if (*s == '\0') {
116129334Stjr			errno = EILSEQ;
117129334Stjr			return ((size_t)-1);
118129334Stjr		}
119129334Stjr		wc = (bs->ch << 8) | (*s & 0xFF);
120129334Stjr		if (pwc != NULL)
121129334Stjr			*pwc = wc;
122129334Stjr		bs->ch = 0;
123129334Stjr		return (1);
124129117Stjr	}
125129334Stjr
126129334Stjr	len = (size_t)_big5_check(*s);
127129334Stjr	wc = *s++ & 0xff;
128129334Stjr	if (len == 2) {
129129334Stjr		if (n < 2) {
130129334Stjr			/* Incomplete multibyte sequence */
131129334Stjr			bs->ch = wc;
132129334Stjr			return ((size_t)-2);
133129334Stjr		}
134129334Stjr		if (*s == '\0') {
135129334Stjr			errno = EILSEQ;
136129334Stjr			return ((size_t)-1);
137129334Stjr		}
138129334Stjr		wc = (wc << 8) | (*s++ & 0xff);
139129334Stjr		if (pwc != NULL)
140129334Stjr			*pwc = wc;
141129334Stjr                return (2);
142129334Stjr	} else {
143129334Stjr		if (pwc != NULL)
144129334Stjr			*pwc = wc;
145129334Stjr		return (wc == L'\0' ? 0 : 1);
146129334Stjr	}
14738333Sphk}
14838333Sphk
149121893Stjrsize_t
150128155Stjr_BIG5_wcrtomb(char * __restrict s, wchar_t wc, mbstate_t * __restrict ps)
15138333Sphk{
152128155Stjr	_BIG5State *bs;
153121893Stjr
154128155Stjr	bs = (_BIG5State *)ps;
155128155Stjr
156129334Stjr	if (bs->ch != 0) {
157128155Stjr		errno = EINVAL;
158128155Stjr		return ((size_t)-1);
159128155Stjr	}
160128155Stjr
161121893Stjr	if (s == NULL)
162121893Stjr		/* Reset to initial shift state (no-op) */
163121893Stjr		return (1);
164121893Stjr	if (wc & 0x8000) {
165121893Stjr		*s++ = (wc >> 8) & 0xff;
166121893Stjr		*s = wc & 0xff;
167121893Stjr		return (2);
16838333Sphk	}
169121893Stjr	*s = wc & 0xff;
170121893Stjr	return (1);
17138333Sphk}
172