1/*
2 * sh.char.h: Table for spotting special characters quickly
3 * 	      Makes for very obscure but efficient coding.
4 */
5/*-
6 * Copyright (c) 1980, 1991 The Regents of the University of California.
7 * All rights reserved.
8 *
9 * Redistribution and use in source and binary forms, with or without
10 * modification, are permitted provided that the following conditions
11 * are met:
12 * 1. Redistributions of source code must retain the above copyright
13 *    notice, this list of conditions and the following disclaimer.
14 * 2. Redistributions in binary form must reproduce the above copyright
15 *    notice, this list of conditions and the following disclaimer in the
16 *    documentation and/or other materials provided with the distribution.
17 * 3. Neither the name of the University nor the names of its contributors
18 *    may be used to endorse or promote products derived from this software
19 *    without specific prior written permission.
20 *
21 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
22 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
23 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
24 * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
25 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
26 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
27 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
28 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
29 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
30 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
31 * SUCH DAMAGE.
32 */
33#ifndef _h_sh_char
34#define _h_sh_char
35#if defined(NeXT) && defined(NLS)
36# include <appkit/NXCType.h>
37#else
38# include <ctype.h>
39# ifdef WIDE_STRINGS
40#  ifdef HAVE_WCTYPE_H
41#   include <wctype.h>
42#  else
43#   include <wchar.h>
44#  endif
45# endif
46#endif
47
48typedef unsigned char tcshuc;
49#ifdef _MINIX
50# undef _SP
51#endif /* _MINIX */
52extern unsigned short _cmap[];
53#if defined(DSPMBYTE)
54# define CHECK_MBYTEVAR	STRdspmbyte
55#endif
56extern unsigned short _cmap_c[];
57extern unsigned short _cmap_mbyte[];
58extern short _enable_mbdisp;
59extern unsigned short _mbmap[];
60extern unsigned short _mbmap_euc[];
61extern unsigned short _mbmap_sjis[];
62extern unsigned short _mbmap_big5[];
63extern unsigned short _mbmap_utf8[];
64/* VARIABLE Check str */
65/* same compiler require #define even not define DSPMBYTE */
66#undef	_MB1
67#define _MB1	0x0001
68#undef	_MB2
69#define _MB2	0x0002
70
71#ifndef NLS
72extern tcshuc _cmap_lower[], _cmap_upper[];
73
74#endif
75
76#ifndef __QNXNTO__
77#undef	_QF
78#define	_QF	0x0001		/* '" (Forward quotes) */
79#undef	_QB
80#define	_QB	0x0002		/* ` (Backquote) */
81#undef	_SP
82#define	_SP	0x0004		/* space and tab */
83#else
84#undef	_XD
85#define	_XD	0x0001		/* As in <ctype.h> */
86#undef	_UP
87#define	_UP	0x0002		/* As in <ctype.h> */
88#undef	_SP
89#define	_SP	0x0004		/* As in <ctype.h> */
90#endif
91#undef	_NL
92#define	_NL	0x0008		/* \n */
93#undef	_META
94#define	_META	0x0010		/* lex meta characters, sp #'`";&<>()|\t\n */
95#undef	_GLOB
96#define	_GLOB	0x0020		/* glob characters, *?{[` */
97#undef	_ESC
98#define	_ESC	0x0040		/* \ */
99#undef	_DOL
100#define	_DOL	0x0080		/* $ */
101#undef	_DIG
102#define	_DIG  	0x0100		/* 0-9 */
103#undef	_LET
104#define	_LET  	0x0200		/* a-z, A-Z, _, or locale-specific */
105#ifndef __QNXNTO__
106#undef	_UP
107#define	_UP   	0x0400		/* A-Z, or locale-specific */
108#else
109#undef	_QF
110#define	_QF	0x0400		/* '" (Forward quotes) */
111#endif
112#undef	_DOW
113#define	_DOW  	0x0800		/* a-z, or locale-specific */
114#ifndef __QNXNTO__
115#undef	_XD
116#define	_XD 	0x1000		/* 0-9, a-f, A-F */
117#else
118#undef	_QB
119#define	_QB	0x1000		/* 0-9, a-f, A-F */
120#endif
121#undef	_CMD
122#define	_CMD	0x2000		/* lex end of command chars, ;&(|` */
123#undef	_CTR
124#define _CTR	0x4000		/* control */
125#undef	_PUN
126#define _PUN	0x8000		/* punctuation */
127
128#ifdef IS_ASCII
129# define ASC(ch) (ch)
130# define CTL_ESC(ch) (ch)
131#else
132# ifdef _OSD_POSIX
133/* "BS2000 OSD" is a POSIX on a main frame using a EBCDIC char set */
134#   include <ascii_ebcdic.h>
135# else
136/* "OS/390 USS" is a POSIX on a main frame using an IBM1047 char set */
137# endif
138  extern unsigned short _toascii[256];
139  extern unsigned short _toebcdic[256];
140
141/* mainly for comparisons if (ASC(ch)=='\177')... */
142#  define ASC(ch)     _toascii[(tcshuc)(ch)]
143
144/* Literal escapes ('\010') must be mapped to EBCDIC,
145 * for C-Escapes   ('\b'), the compiler already does it.
146 */
147#  define CTL_ESC(ch) _toebcdic[(tcshuc)(ch)]
148#endif /*IS_ASCII*/
149
150#ifdef WIDE_STRINGS
151# define cmap(c, bits)	\
152    (((c) & QUOTE) || (unsigned int)(c) >= 0x0080 ? 0 : \
153	(_cmap[(tcshuc)ASC(c)] & (bits)))
154#elif defined(SHORT_STRINGS) && defined(KANJI)
155#  define cmap(c, bits)	\
156    ((((c) & QUOTE) || ((tcshuc)(ASC(c) & 0x80) && adrof(STRnokanji))) ? \
157	0 : (_cmap[(tcshuc)ASC(c)] & (bits)))
158#else /* SHORT_STRINGS && KANJI */
159# define cmap(c, bits)	\
160    (((c) & QUOTE) ? 0 : (_cmap[(tcshuc)ASC(c)] & (bits)))
161#endif /* SHORT_STRINGS && KANJI */
162
163#define isglob(c)	cmap((c), _GLOB)
164#define isspc(c)	cmap((c), _SP)
165#define ismeta(c)	cmap((c), _META)
166#define iscmdmeta(c)	cmap((c), _CMD)
167#ifdef WIDE_STRINGS
168#define letter(c)	(((c) & QUOTE) ? 0 :  \
169			 (iswalpha((c)) || (c) == '_'))
170#define alnum(c)	(((c) & QUOTE) ? 0 :  \
171		         (iswalnum((c)) || (c) == '_'))
172#else
173#define letter(c)	(((Char)(c) & QUOTE) ? 0 :  \
174			 ((isalpha((c)) && !(cmap((c), _PUN))) \
175			  || (c) == '_'))
176#define alnum(c)	(((Char)(c) & QUOTE) ? 0 :  \
177		         ((isalnum((c)) && !(cmap((c), _PUN))) \
178			  || (c) == '_'))
179
180#endif
181
182#if defined(DSPMBYTE)
183# define IsmbyteU(c)	(Ismbyte1((Char)(c))||(Ismbyte2((Char)(c))&&((c)&0200)))
184#endif
185
186#ifdef NLS
187# ifdef WIDE_STRINGS
188#  define Isspace(c)	(((c) & QUOTE) ? 0 : iswspace(c))
189#  define Isdigit(c)	(((c) & QUOTE) ? 0 : iswdigit(c))
190#  define Isalpha(c)	(((c) & QUOTE) ? 0 : iswalpha(c))
191#  define Islower(c)	(((c) & QUOTE) ? 0 : iswlower(c))
192#  define Isupper(c)	(((c) & QUOTE) ? 0 : iswupper(c))
193#  define Tolower(c) 	(((c) & QUOTE) ? 0 : (wchar_t)towlower(c))
194#  define Toupper(c) 	(((c) & QUOTE) ? 0 : (wchar_t)towupper(c))
195#  define Isxdigit(c)	(((c) & QUOTE) ? 0 : iswxdigit(c))
196#  define Isalnum(c)	(((c) & QUOTE) ? 0 : iswalnum(c))
197#  define Iscntrl(c) 	(((c) & QUOTE) ? 0 : iswcntrl(c))
198#  define Isprint(c) 	(((c) & QUOTE) ? 0 : iswprint(c))
199#  define Ispunct(c) 	(((c) & QUOTE) ? 0 : iswpunct(c))
200# elif defined (NeXT)
201#  define Isspace(c)	(((Char)(c) & QUOTE) ? 0 : NXIsSpace((unsigned) (c)))
202#  define Isdigit(c)	(((Char)(c) & QUOTE) ? 0 : NXIsDigit((unsigned) (c)))
203#  define Isalpha(c)	(((Char)(c) & QUOTE) ? 0 : NXIsAlpha((unsigned) (c)))
204#  define Islower(c)	(((Char)(c) & QUOTE) ? 0 : NXIsLower((unsigned) (c)))
205#  define Isupper(c)	(((Char)(c) & QUOTE) ? 0 : NXIsUpper((unsigned) (c)))
206#  define Tolower(c) 	(((Char)(c) & QUOTE) ? 0 : NXToLower((unsigned) (c)))
207#  define Toupper(c) 	(((Char)(c) & QUOTE) ? 0 : NXToUpper((unsigned) (c)))
208#  define Isxdigit(c)	(((Char)(c) & QUOTE) ? 0 : NXIsXDigit((unsigned) (c)))
209#if defined(DSPMBYTE)
210#  define IscntrlM(c) 	(((Char)(c) & QUOTE) ? 0 : NXIsCntrl((unsigned) (c)))
211#  define Iscntrl(c)	( (IscntrlM(c)) && !(_enable_mbdisp&&(IsmbyteU((c)))) )
212#  define IsprintM(c) 	(((Char)(c) & QUOTE) ? 0 : NXIsPrint((unsigned) (c)))
213#  define Isprint(c)	( (IsprintM(c)) || (_enable_mbdisp&&(IsmbyteU((c)))) )
214#else
215#  define Isalnum(c)	(((Char)(c) & QUOTE) ? 0 : NXIsAlNum((unsigned) (c)))
216#  define Iscntrl(c) 	(((Char)(c) & QUOTE) ? 0 : NXIsCntrl((unsigned) (c)))
217#  define Isprint(c) 	(((Char)(c) & QUOTE) ? 0 : NXIsPrint((unsigned) (c)))
218#endif /* !defined(DSPMBYTE) */
219#  define Ispunct(c) 	(((Char)(c) & QUOTE) ? 0 : NXIsPunct((unsigned) (c)))
220# else /* !NeXT */
221#  ifndef WINNT_NATIVE
222#   define Isspace(c)	(((Char)(c) & QUOTE) ? 0 : isspace((tcshuc) (c)))
223#   define Isdigit(c)	(((Char)(c) & QUOTE) ? 0 : isdigit((tcshuc) (c)))
224#   define Isalpha(c)	(((Char)(c) & QUOTE) ? 0 : isalpha((tcshuc) (c)))
225#   define Islower(c)	(((Char)(c) & QUOTE) ? 0 : islower((tcshuc) (c)))
226#   define Isupper(c)	(((Char)(c) & QUOTE) ? 0 : isupper((tcshuc) (c)))
227#   define Tolower(c) 	(((Char)(c) & QUOTE) ? 0 : tolower((tcshuc) (c)))
228#   define Toupper(c) 	(((Char)(c) & QUOTE) ? 0 : toupper((tcshuc) (c)))
229#   define Isxdigit(c)	(((Char)(c) & QUOTE) ? 0 : isxdigit((tcshuc) (c)))
230#   define Isalnum(c)	(((Char)(c) & QUOTE) ? 0 : isalnum((tcshuc) (c)))
231#if defined(DSPMBYTE)
232#   define IscntrlM(c) 	(((Char)(c) & QUOTE) ? 0 : iscntrl((tcshuc) (c)))
233#   define Iscntrl(c)	( (IscntrlM(c)) && !(_enable_mbdisp&&(IsmbyteU((c)))) )
234#else
235#   define Iscntrl(c) 	(((Char)(c) & QUOTE) ? 0 : iscntrl((tcshuc) (c)))
236#endif /* !defined(DSPMBYTE) */
237#   if SOLARIS2 == 24
238    /*
239     * From <casper@fwi.uva.nl> Casper Dik:
240     * In Solaris 2.4, isprint('\t') returns true after setlocal(LC_ALL,"").
241     * This breaks commandline editing when you include tabs.
242     * (This is in the en_US locale).
243     */
244#if defined(DSPMBYTE)
245#    define IsprintM(c) 	(((Char)(c) & QUOTE) ? 0 : \
246				(isprint((tcshuc) (c)) && (c) != '\t'))
247#else
248#    define Isprint(c) 	(((Char)(c) & QUOTE) ? 0 : \
249				(isprint((tcshuc) (c)) && (c) != '\t'))
250#endif /* !defined(DSPMBYTE) */
251#   else
252#if defined(DSPMBYTE)
253#    define IsprintM(c) (((Char)(c) & QUOTE) ? 0 : isprint((tcshuc) (c)))
254#else
255#    define Isprint(c) 	(((Char)(c) & QUOTE) ? 0 : isprint((tcshuc) (c)))
256#endif /* !defined(DSPMBYTE) */
257#   endif /* SOLARIS2 == 24 */
258#if defined(DSPMBYTE)
259#   define Isprint(c)	( (IsprintM(c)) || (_enable_mbdisp&&(IsmbyteU((c)))) )
260#endif /* !defined(DSPMBYTE) */
261#    define Ispunct(c) 	(((Char)(c) & QUOTE) ? 0 : ispunct((tcshuc) (c)))
262#  else /* WINNT_NATIVE */
263#   define Isspace(c) (((Char)(c) & QUOTE) ? 0 : isspace( oem_it((tcshuc)(c))))
264#   define Isdigit(c) (((Char)(c) & QUOTE) ? 0 : isdigit( oem_it((tcshuc)(c))))
265#   define Isalpha(c) (((Char)(c) & QUOTE) ? 0 : isalpha( oem_it((tcshuc)(c))))
266#   define Islower(c) (((Char)(c) & QUOTE) ? 0 : islower( oem_it((tcshuc)(c))))
267#   define Isupper(c) (((Char)(c) & QUOTE) ? 0 : isupper( oem_it((tcshuc)(c))))
268#   define Tolower(c) (((Char)(c) & QUOTE) ? 0 : tolower( oem_it((tcshuc)(c))))
269#   define Toupper(c) (((Char)(c) & QUOTE) ? 0 : toupper( oem_it((tcshuc)(c))))
270#   define Isxdigit(c)(((Char)(c) & QUOTE) ? 0 : isxdigit(oem_it((tcshuc)(c))))
271#   define Isalnum(c) (((Char)(c) & QUOTE) ? 0 : isalnum( oem_it((tcshuc)(c))))
272#   define Ispunct(c) (((Char)(c) & QUOTE) ? 0 : ispunct( oem_it((tcshuc)(c))))
273#if defined(DSPMBYTE)
274#   define IscntrlM(c) (((Char)(c) & QUOTE) ? 0 : iscntrl( oem_it((tcshuc)(c))))
275#   define Iscntrl(c)	( (IscntrlM(c)) && !(_enable_mbdisp&&(IsmbyteU((c)))) )
276#   define IsprintM(c) (((Char)(c) & QUOTE) ? 0 : isprint( oem_it((tcshuc)(c))))
277#   define Isprint(c)	( (IsprintM(c)) || (_enable_mbdisp&&(IsmbyteU((c)))) )
278#else
279#   define Iscntrl(c) (((Char)(c) & QUOTE) ? 0 : iscntrl( oem_it((tcshuc)(c))))
280#   define Isprint(c) (((Char)(c) & QUOTE) ? 0 : isprint( oem_it((tcshuc)(c))))
281#endif /* !defined(DSPMBYTE) */
282#  endif /* WINNT_NATIVE */
283# endif /* !NeXT */
284#else /* !NLS */
285# define Isspace(c)	cmap((c), _SP|_NL)
286# define Isdigit(c)	cmap((c), _DIG)
287# define Isalpha(c)	(cmap((c),_LET) && !(((c) & META) && AsciiOnly))
288# define Islower(c)	(cmap((c),_DOW) && !(((c) & META) && AsciiOnly))
289# define Isupper(c)	(cmap((c), _UP) && !(((c) & META) && AsciiOnly))
290# define Tolower(c)	(_cmap_lower[ASC(c)])
291# define Toupper(c)	(_cmap_upper[ASC(c)])
292# define Isxdigit(c)	cmap((c), _XD)
293# define Isalnum(c)	(cmap((c), _DIG|_LET) && !(((Char)(c) & META) && AsciiOnly))
294#if defined(DSPMBYTE)
295# define IscntrlM(c)	(cmap((c),_CTR) && !(((c) & META) && AsciiOnly))
296# define Iscntrl(c)	( (IscntrlM(c)) && !(_enable_mbdisp&&(IsmbyteU((c)))) )
297# define IsprintM(c)	(!cmap((c),_CTR) && !(((c) & META) && AsciiOnly))
298# define Isprint(c)	( (IsprintM(c)) || (_enable_mbdisp&&(IsmbyteU((c)))) )
299#else
300# define Iscntrl(c)	(cmap((c),_CTR) && !(((c) & META) && AsciiOnly))
301# define Isprint(c)	(!cmap((c),_CTR) && !(((c) & META) && AsciiOnly))
302#endif /* !defined(DSPMBYTE) */
303# define Ispunct(c)	(cmap((c),_PUN) && !(((c) & META) && AsciiOnly))
304
305#endif /* !NLS */
306
307#if defined(DSPMBYTE)
308# define Ismbyte1(c)	((_mbmap[(c) & 0377] & _MB1) ? 1 : 0)
309# define Ismbyte2(c)	((_mbmap[(c) & 0377] & _MB2) ? 1 : 0)
310#endif
311
312#endif /* _h_sh_char */
313