tc.nls.c revision 231990
1/* $Header: /p/tcsh/cvsroot/tcsh/tc.nls.c,v 3.23 2010/02/12 22:17:20 christos Exp $ */
2/*
3 * tc.nls.c: NLS handling
4 */
5/*-
6 * Copyright (c) 1980, 1991 The Regents of the University of California.
7 * All rights reserved.
8 *
9 * Redistribution and use in source and binary forms, with or without
10 * modification, are permitted provided that the following conditions
11 * are met:
12 * 1. Redistributions of source code must retain the above copyright
13 *    notice, this list of conditions and the following disclaimer.
14 * 2. Redistributions in binary form must reproduce the above copyright
15 *    notice, this list of conditions and the following disclaimer in the
16 *    documentation and/or other materials provided with the distribution.
17 * 3. Neither the name of the University nor the names of its contributors
18 *    may be used to endorse or promote products derived from this software
19 *    without specific prior written permission.
20 *
21 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
22 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
23 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
24 * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
25 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
26 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
27 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
28 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
29 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
30 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
31 * SUCH DAMAGE.
32 */
33#include "sh.h"
34
35RCSID("$tcsh: tc.nls.c,v 3.23 2010/02/12 22:17:20 christos Exp $")
36
37
38#ifdef WIDE_STRINGS
39# ifdef HAVE_WCWIDTH
40#  ifdef UTF16_STRINGS
/*
 * xwcwidth: column width of one code point on builds where wide strings
 * hold UTF-16 code units (UTF16_STRINGS).
 *
 * wchar is the code point to measure.
 *
 * Returns the result of wcwidth() for values up to 0xffff, the result of
 * wcswidth() on the equivalent surrogate pair for 0x10000..0x10ffff, and
 * -1 for anything larger, which has no surrogate-pair encoding.
 */
int
xwcwidth (wint_t wchar)
{
  wchar_t ws[2];

  if (wchar <= 0xffff)
    return wcwidth ((wchar_t) wchar);
  /* Only 0x10000..0x10ffff can be written as a surrogate pair.  Larger
     values would overflow the 10-bit high half and yield a malformed
     pair, so report them the way wcwidth reports unprintable input. */
  if (wchar > 0x10ffff)
    return -1;
  /* UTF-16 systems can't handle these values directly in calls to wcwidth.
     However, they can handle them as surrogate pairs in calls to wcswidth.
     What we do here is to convert UTF-32 values >= 0x10000 into surrogate
     pairs and compute the width by calling wcswidth. */
  wchar -= 0x10000;
  ws[0] = (wchar_t) (0xd800 | (wchar >> 10));
  ws[1] = (wchar_t) (0xdc00 | (wchar & 0x3ff));
  return wcswidth (ws, 2);
}
57#  else
/* Without UTF16_STRINGS no surrogate handling is done: xwcwidth is just
   another name for wcwidth. */
#define xwcwidth wcwidth
59#  endif /* !UTF16_STRINGS */
60# endif /* HAVE_WCWIDTH */
61
62int
63NLSWidth(Char c)
64{
65# ifdef HAVE_WCWIDTH
66    int l;
67    if (c & INVALID_BYTE)
68	return 1;
69    l = xwcwidth((wchar_t) c);
70    return l >= 0 ? l : 0;
71# else
72    return iswprint(c) != 0;
73# endif
74}
75
76int
77NLSStringWidth(const Char *s)
78{
79    int w = 0, l;
80    Char c;
81
82    while (*s) {
83	c = *s++;
84#ifdef HAVE_WCWIDTH
85	if ((l = xwcwidth((wchar_t) c)) < 0)
86		l = 2;
87#else
88	l = iswprint(c) != 0;
89#endif
90	w += l;
91    }
92    return w;
93}
94#endif
95
96Char *
97NLSChangeCase(const Char *p, int mode)
98{
99    Char c, *n, c2 = 0;
100    const Char *op = p;
101
102    for (; (c = *p) != 0; p++) {
103        if (mode == 0 && Islower(c)) {
104	    c2 = Toupper(c);
105	    break;
106        } else if (mode && Isupper(c)) {
107	    c2 = Tolower(c);
108	    break;
109	}
110    }
111    if (!*p)
112	return 0;
113    n = Strsave(op);
114    n[p - op] = c2;
115    return n;
116}
117
118int
119NLSClassify(Char c, int nocomb)
120{
121    int w;
122    if (c & INVALID_BYTE)
123	return NLSCLASS_ILLEGAL;
124    w = NLSWidth(c);
125    if ((w > 0 && !(Iscntrl(c) && (c & CHAR) < 0x100)) || (Isprint(c) && !nocomb))
126	return w;
127    if (Iscntrl(c) && (c & CHAR) < 0x100) {
128	if (c == '\n')
129	    return NLSCLASS_NL;
130	if (c == '\t')
131	    return NLSCLASS_TAB;
132	return NLSCLASS_CTRL;
133    }
134#ifdef WIDE_STRINGS
135    if (c >= 0x1000000)
136	return NLSCLASS_ILLEGAL4;
137    if (c >= 0x10000)
138	return NLSCLASS_ILLEGAL3;
139#endif
140    if (c >= 0x100)
141	return NLSCLASS_ILLEGAL2;
142    return NLSCLASS_ILLEGAL;
143}
144