1/* rlmbutil.h -- utility functions for multibyte characters. */
2
3/* Copyright (C) 2001, 2003 Free Software Foundation, Inc.
4
5   This file is part of the GNU Readline Library, a library for
6   reading lines of text with interactive input and history editing.
7
8   The GNU Readline Library is free software; you can redistribute it
9   and/or modify it under the terms of the GNU General Public License
10   as published by the Free Software Foundation; either version 2, or
11   (at your option) any later version.
12
13   The GNU Readline Library is distributed in the hope that it will be
14   useful, but WITHOUT ANY WARRANTY; without even the implied warranty
15   of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
16   GNU General Public License for more details.
17
18   The GNU General Public License is often shipped with GNU software, and
19   is generally kept in a file called COPYING or LICENSE.  If you do not
20   have a copy of the license, write to the Free Software Foundation,
21   59 Temple Place, Suite 330, Boston, MA 02111 USA. */
22
23#if !defined (_RL_MBUTIL_H_)
24#define _RL_MBUTIL_H_
25
26#include "rlstdc.h"
27
28/************************************************/
29/* check multibyte capability for I18N code     */
30/************************************************/
31
32/* For platforms which support the ISO C amendement 1 functionality we
33   support user defined character classes.
34
35   Some platforms have the multibyte functions such as mbsrtowcs but
36   are lacking the multitype type mbstate_t.  BeOS (unknown version)
37   and HP/UX 11.23 without _XOPEN_SOURCE=500 are like this.
38
39   We really need mbstate_t type to operate properly.  For example, see
40   compute_lcd_of_matches, where two mbstate_t's are active at the same
41   time.  So we require both the functions and the mbstate_t type in
42   order to enable multibyte support.  */
43
44   /* Solaris 2.5 has a bug: <wchar.h> must be included before <wctype.h>.  */
45#if defined (HAVE_WCTYPE_H) && defined (HAVE_WCHAR_H)
46#  include <wchar.h>
47#  include <wctype.h>
48#  if defined (HAVE_MBSTATE_T) && defined (HAVE_MBSRTOWCS) && defined (HAVE_MBRTOWC) && defined (HAVE_MBRLEN) && defined (HAVE_WCWIDTH)
49     /* system is supposed to support XPG5 */
50#    define HANDLE_MULTIBYTE      1
51#  endif
52#endif
53
54/* If we don't want multibyte chars even on a system that supports them, let
55   the configuring user turn multibyte support off. */
56#if defined (NO_MULTIBYTE_SUPPORT)
57#  undef HANDLE_MULTIBYTE
58#endif
59
60/* Some systems, like BeOS, have multibyte encodings but lack mbstate_t.  */
61#if HANDLE_MULTIBYTE && !defined (HAVE_MBSTATE_T)
62#  define wcsrtombs(dest, src, len, ps) (wcsrtombs) (dest, src, len, 0)
63#  define mbsrtowcs(dest, src, len, ps) (mbsrtowcs) (dest, src, len, 0)
64#  define wcrtomb(s, wc, ps) (wcrtomb) (s, wc, 0)
65#  define mbrtowc(pwc, s, n, ps) (mbrtowc) (pwc, s, n, 0)
66#  define mbrlen(s, n, ps) (mbrlen) (s, n, 0)
67#  define mbstate_t int
68#endif
69
70/* Make sure MB_LEN_MAX is at least 16 on systems that claim to be able to
71   handle multibyte chars (some systems define MB_LEN_MAX as 1) */
72#ifdef HANDLE_MULTIBYTE
73#  include <limits.h>
74#  if defined(MB_LEN_MAX) && (MB_LEN_MAX < 16)
75#    undef MB_LEN_MAX
76#  endif
77#  if !defined (MB_LEN_MAX)
78#    define MB_LEN_MAX 16
79#  endif
80#endif
81
82/************************************************/
83/* end of multibyte capability checks for I18N  */
84/************************************************/
85
86/*
87 * Flags for _rl_find_prev_mbchar and _rl_find_next_mbchar:
88 *
89 * MB_FIND_ANY		find any multibyte character
90 * MB_FIND_NONZERO	find a non-zero-width multibyte character
91 */
92
93#define MB_FIND_ANY	0x00
94#define MB_FIND_NONZERO	0x01
95
96extern int _rl_find_prev_mbchar PARAMS((char *, int, int));
97extern int _rl_find_next_mbchar PARAMS((char *, int, int, int));
98
99#ifdef HANDLE_MULTIBYTE
100
101extern int _rl_compare_chars PARAMS((char *, int, mbstate_t *, char *, int, mbstate_t *));
102extern int _rl_get_char_len PARAMS((char *, mbstate_t *));
103extern int _rl_adjust_point PARAMS((char *, int, mbstate_t *));
104
105extern int _rl_read_mbchar PARAMS((char *, int));
106extern int _rl_read_mbstring PARAMS((int, char *, int));
107
108extern int _rl_is_mbchar_matched PARAMS((char *, int, int, char *, int));
109
110extern wchar_t _rl_char_value PARAMS((char *, int));
111extern int _rl_walphabetic PARAMS((wchar_t));
112
113#define _rl_to_wupper(wc)	(iswlower (wc) ? towupper (wc) : (wc))
114#define _rl_to_wlower(wc)	(iswupper (wc) ? towlower (wc) : (wc))
115
116#define MB_NEXTCHAR(b,s,c,f) \
117	((MB_CUR_MAX > 1 && rl_byte_oriented == 0) \
118		? _rl_find_next_mbchar ((b), (s), (c), (f)) \
119		: ((s) + (c)))
120#define MB_PREVCHAR(b,s,f) \
121	((MB_CUR_MAX > 1 && rl_byte_oriented == 0) \
122		? _rl_find_prev_mbchar ((b), (s), (f)) \
123		: ((s) - 1))
124
125#define MB_INVALIDCH(x)		((x) == (size_t)-1 || (x) == (size_t)-2)
126#define MB_NULLWCH(x)		((x) == 0)
127
128#else /* !HANDLE_MULTIBYTE */
129
130#undef MB_LEN_MAX
131#undef MB_CUR_MAX
132
133#define MB_LEN_MAX	1
134#define MB_CUR_MAX	1
135
136#define _rl_find_prev_mbchar(b, i, f)		(((i) == 0) ? (i) : ((i) - 1))
137#define _rl_find_next_mbchar(b, i1, i2, f)	((i1) + (i2))
138
139#define _rl_char_value(buf,ind)	((buf)[(ind)])
140
141#define _rl_walphabetic(c)	(rl_alphabetic (c))
142
143#define _rl_to_wupper(c)	(_rl_to_upper (c))
144#define _rl_to_wlower(c)	(_rl_to_lower (c))
145
146#define MB_NEXTCHAR(b,s,c,f)	((s) + (c))
147#define MB_PREVCHAR(b,s,f)	((s) - 1)
148
149#define MB_INVALIDCH(x)		(0)
150#define MB_NULLWCH(x)		(0)
151
152#endif /* !HANDLE_MULTIBYTE */
153
154extern int rl_byte_oriented;
155
156#endif /* _RL_MBUTIL_H_ */
157