1// std::ctype implementation details, GNU version -*- C++ -*- 2 3// Copyright (C) 2001, 2002, 2003, 2004, 2005 Free Software Foundation, Inc. 4// 5// This file is part of the GNU ISO C++ Library. This library is free 6// software; you can redistribute it and/or modify it under the 7// terms of the GNU General Public License as published by the 8// Free Software Foundation; either version 2, or (at your option) 9// any later version. 10 11// This library is distributed in the hope that it will be useful, 12// but WITHOUT ANY WARRANTY; without even the implied warranty of 13// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the 14// GNU General Public License for more details. 15 16// You should have received a copy of the GNU General Public License along 17// with this library; see the file COPYING. If not, write to the Free 18// Software Foundation, 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, 19// USA. 20 21// As a special exception, you may use this file as part of a free software 22// library without restriction. Specifically, if other files instantiate 23// templates or use macros or inline functions from this file, or you compile 24// this file and link it with other files to produce an executable, this 25// file does not by itself cause the resulting executable to be covered by 26// the GNU General Public License. This exception does not however 27// invalidate any other reasons why the executable file might be covered by 28// the GNU General Public License. 29 30// 31// ISO C++ 14882: 22.2.1.1.2 ctype virtual functions. 32// 33 34// Written by Benjamin Kosnik <bkoz@redhat.com> 35 36#include <locale> 37#include <bits/c++locale_internal.h> 38 39_GLIBCXX_BEGIN_NAMESPACE(std) 40 41 // NB: The other ctype<char> specializations are in src/locale.cc and 42 // various /config/os/* files. 43 template<> 44 ctype_byname<char>::ctype_byname(const char* __s, size_t __refs) 45 : ctype<char>(0, false, __refs) 46 { 47 if (std::strcmp(__s, "C") != 0 && std::strcmp(__s, "POSIX") != 0) 48 { 49 this->_S_destroy_c_locale(this->_M_c_locale_ctype); 50 this->_S_create_c_locale(this->_M_c_locale_ctype, __s); 51 this->_M_toupper = this->_M_c_locale_ctype->__ctype_toupper; 52 this->_M_tolower = this->_M_c_locale_ctype->__ctype_tolower; 53 this->_M_table = this->_M_c_locale_ctype->__ctype_b; 54 } 55 } 56 57#ifdef _GLIBCXX_USE_WCHAR_T 58 ctype<wchar_t>::__wmask_type 59 ctype<wchar_t>::_M_convert_to_wmask(const mask __m) const 60 { 61 __wmask_type __ret; 62 switch (__m) 63 { 64 case space: 65 __ret = __wctype_l("space", _M_c_locale_ctype); 66 break; 67 case print: 68 __ret = __wctype_l("print", _M_c_locale_ctype); 69 break; 70 case cntrl: 71 __ret = __wctype_l("cntrl", _M_c_locale_ctype); 72 break; 73 case upper: 74 __ret = __wctype_l("upper", _M_c_locale_ctype); 75 break; 76 case lower: 77 __ret = __wctype_l("lower", _M_c_locale_ctype); 78 break; 79 case alpha: 80 __ret = __wctype_l("alpha", _M_c_locale_ctype); 81 break; 82 case digit: 83 __ret = __wctype_l("digit", _M_c_locale_ctype); 84 break; 85 case punct: 86 __ret = __wctype_l("punct", _M_c_locale_ctype); 87 break; 88 case xdigit: 89 __ret = __wctype_l("xdigit", _M_c_locale_ctype); 90 break; 91 case alnum: 92 __ret = __wctype_l("alnum", _M_c_locale_ctype); 93 break; 94 case graph: 95 __ret = __wctype_l("graph", _M_c_locale_ctype); 96 break; 97 default: 98 __ret = __wmask_type(); 99 } 100 return __ret; 101 } 102 103 wchar_t 104 ctype<wchar_t>::do_toupper(wchar_t __c) const 105 { return __towupper_l(__c, _M_c_locale_ctype); } 106 107 const wchar_t* 108 ctype<wchar_t>::do_toupper(wchar_t* __lo, const wchar_t* __hi) const 109 { 110 while (__lo < __hi) 111 { 112 *__lo = __towupper_l(*__lo, _M_c_locale_ctype); 113 ++__lo; 114 } 115 return __hi; 116 } 117 118 wchar_t 119 ctype<wchar_t>::do_tolower(wchar_t __c) const 120 { return __towlower_l(__c, _M_c_locale_ctype); } 121 122 const wchar_t* 123 ctype<wchar_t>::do_tolower(wchar_t* __lo, const wchar_t* __hi) const 124 { 125 while (__lo < __hi) 126 { 127 *__lo = __towlower_l(*__lo, _M_c_locale_ctype); 128 ++__lo; 129 } 130 return __hi; 131 } 132 133 bool 134 ctype<wchar_t>:: 135 do_is(mask __m, wchar_t __c) const 136 { 137 // The case of __m == ctype_base::space is particularly important, 138 // due to its use in many istream functions. Therefore we deal with 139 // it first, exploiting the knowledge that on GNU systems _M_bit[5] 140 // is the mask corresponding to ctype_base::space. NB: an encoding 141 // change would not affect correctness! 142 bool __ret = false; 143 if (__m == _M_bit[5]) 144 __ret = __iswctype_l(__c, _M_wmask[5], _M_c_locale_ctype); 145 else 146 { 147 // Highest bitmask in ctype_base == 10, but extra in "C" 148 // library for blank. 149 const size_t __bitmasksize = 11; 150 for (size_t __bitcur = 0; __bitcur <= __bitmasksize; ++__bitcur) 151 if (__m & _M_bit[__bitcur]) 152 { 153 if (__iswctype_l(__c, _M_wmask[__bitcur], _M_c_locale_ctype)) 154 { 155 __ret = true; 156 break; 157 } 158 else if (__m == _M_bit[__bitcur]) 159 break; 160 } 161 } 162 return __ret; 163 } 164 165 const wchar_t* 166 ctype<wchar_t>:: 167 do_is(const wchar_t* __lo, const wchar_t* __hi, mask* __vec) const 168 { 169 for (; __lo < __hi; ++__vec, ++__lo) 170 { 171 // Highest bitmask in ctype_base == 10, but extra in "C" 172 // library for blank. 173 const size_t __bitmasksize = 11; 174 mask __m = 0; 175 for (size_t __bitcur = 0; __bitcur <= __bitmasksize; ++__bitcur) 176 if (__iswctype_l(*__lo, _M_wmask[__bitcur], _M_c_locale_ctype)) 177 __m |= _M_bit[__bitcur]; 178 *__vec = __m; 179 } 180 return __hi; 181 } 182 183 const wchar_t* 184 ctype<wchar_t>:: 185 do_scan_is(mask __m, const wchar_t* __lo, const wchar_t* __hi) const 186 { 187 while (__lo < __hi && !this->do_is(__m, *__lo)) 188 ++__lo; 189 return __lo; 190 } 191 192 const wchar_t* 193 ctype<wchar_t>:: 194 do_scan_not(mask __m, const char_type* __lo, const char_type* __hi) const 195 { 196 while (__lo < __hi && this->do_is(__m, *__lo) != 0) 197 ++__lo; 198 return __lo; 199 } 200 201 wchar_t 202 ctype<wchar_t>:: 203 do_widen(char __c) const 204 { return _M_widen[static_cast<unsigned char>(__c)]; } 205 206 const char* 207 ctype<wchar_t>:: 208 do_widen(const char* __lo, const char* __hi, wchar_t* __dest) const 209 { 210 while (__lo < __hi) 211 { 212 *__dest = _M_widen[static_cast<unsigned char>(*__lo)]; 213 ++__lo; 214 ++__dest; 215 } 216 return __hi; 217 } 218 219 char 220 ctype<wchar_t>:: 221 do_narrow(wchar_t __wc, char __dfault) const 222 { 223 if (__wc >= 0 && __wc < 128 && _M_narrow_ok) 224 return _M_narrow[__wc]; 225#if __GLIBC__ > 2 || (__GLIBC__ == 2 && __GLIBC_MINOR__ > 2) 226 __c_locale __old = __uselocale(_M_c_locale_ctype); 227#endif 228 const int __c = wctob(__wc); 229#if __GLIBC__ > 2 || (__GLIBC__ == 2 && __GLIBC_MINOR__ > 2) 230 __uselocale(__old); 231#endif 232 return (__c == EOF ? __dfault : static_cast<char>(__c)); 233 } 234 235 const wchar_t* 236 ctype<wchar_t>:: 237 do_narrow(const wchar_t* __lo, const wchar_t* __hi, char __dfault, 238 char* __dest) const 239 { 240#if __GLIBC__ > 2 || (__GLIBC__ == 2 && __GLIBC_MINOR__ > 2) 241 __c_locale __old = __uselocale(_M_c_locale_ctype); 242#endif 243 if (_M_narrow_ok) 244 while (__lo < __hi) 245 { 246 if (*__lo >= 0 && *__lo < 128) 247 *__dest = _M_narrow[*__lo]; 248 else 249 { 250 const int __c = wctob(*__lo); 251 *__dest = (__c == EOF ? __dfault : static_cast<char>(__c)); 252 } 253 ++__lo; 254 ++__dest; 255 } 256 else 257 while (__lo < __hi) 258 { 259 const int __c = wctob(*__lo); 260 *__dest = (__c == EOF ? __dfault : static_cast<char>(__c)); 261 ++__lo; 262 ++__dest; 263 } 264#if __GLIBC__ > 2 || (__GLIBC__ == 2 && __GLIBC_MINOR__ > 2) 265 __uselocale(__old); 266#endif 267 return __hi; 268 } 269 270 void 271 ctype<wchar_t>::_M_initialize_ctype() 272 { 273#if __GLIBC__ > 2 || (__GLIBC__ == 2 && __GLIBC_MINOR__ > 2) 274 __c_locale __old = __uselocale(_M_c_locale_ctype); 275#endif 276 wint_t __i; 277 for (__i = 0; __i < 128; ++__i) 278 { 279 const int __c = wctob(__i); 280 if (__c == EOF) 281 break; 282 else 283 _M_narrow[__i] = static_cast<char>(__c); 284 } 285 if (__i == 128) 286 _M_narrow_ok = true; 287 else 288 _M_narrow_ok = false; 289 for (size_t __j = 0; 290 __j < sizeof(_M_widen) / sizeof(wint_t); ++__j) 291 _M_widen[__j] = btowc(__j); 292 293 for (size_t __k = 0; __k <= 11; ++__k) 294 { 295 _M_bit[__k] = static_cast<mask>(_ISbit(__k)); 296 _M_wmask[__k] = _M_convert_to_wmask(_M_bit[__k]); 297 } 298#if __GLIBC__ > 2 || (__GLIBC__ == 2 && __GLIBC_MINOR__ > 2) 299 __uselocale(__old); 300#endif 301 } 302#endif // _GLIBCXX_USE_WCHAR_T 303 304_GLIBCXX_END_NAMESPACE 305