1/* Categories of Unicode characters. 2 Copyright (C) 2002, 2006-2007, 2009-2010 Free Software Foundation, Inc. 3 Written by Bruno Haible <bruno@clisp.org>, 2002. 4 5 This program is free software: you can redistribute it and/or modify it 6 under the terms of the GNU Lesser General Public License as published 7 by the Free Software Foundation; either version 3 of the License, or 8 (at your option) any later version. 9 10 This program is distributed in the hope that it will be useful, 11 but WITHOUT ANY WARRANTY; without even the implied warranty of 12 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU 13 Lesser General Public License for more details. 14 15 You should have received a copy of the GNU Lesser General Public License 16 along with this program. If not, see <http://www.gnu.org/licenses/>. */ 17 18#include <config.h> 19 20/* Specification. */ 21#include "unictype.h" 22 23/* Define u_category table. */ 24#include "categ_of.h" 25 26static inline int 27lookup_withtable (ucs4_t uc) 28{ 29 unsigned int index1 = uc >> category_header_0; 30 if (index1 < category_header_1) 31 { 32 int lookup1 = u_category.level1[index1]; 33 if (lookup1 >= 0) 34 { 35 unsigned int index2 = (uc >> category_header_2) & category_header_3; 36 int lookup2 = u_category.level2[lookup1 + index2]; 37 if (lookup2 >= 0) 38 { 39 unsigned int index3 = ((uc & category_header_4) + lookup2) * 5; 40 /* level3 contains 5-bit values, packed into 16-bit words. */ 41 unsigned int lookup3 = 42 ((u_category.level3[index3>>4] 43 | (u_category.level3[(index3>>4)+1] << 16)) 44 >> (index3 % 16)) 45 & 0x1f; 46 47 return lookup3; 48 } 49 } 50 return 29; /* = log2(UC_CATEGORY_MASK_Cn) */ 51 } 52 return -1; 53} 54 55bool 56uc_is_general_category_withtable (ucs4_t uc, uint32_t bitmask) 57{ 58 int bit = lookup_withtable (uc); 59 60 if (bit >= 0) 61 return ((bitmask >> bit) & 1); 62 else 63 return false; 64} 65 66uc_general_category_t 67uc_general_category (ucs4_t uc) 68{ 69 int bit = lookup_withtable (uc); 70 uc_general_category_t result; 71 72 if (bit >= 0) 73 { 74 result.bitmask = 1 << bit; 75 result.generic = 1; 76 result.lookup.lookup_fn = &uc_is_general_category_withtable; 77 return result; 78 } 79 else 80 return _UC_CATEGORY_NONE; 81} 82