1 /* Categories of Unicode characters.
2 Copyright (C) 2002, 2006-2007, 2009-2013 Free Software Foundation, Inc.
3 Written by Bruno Haible <bruno@clisp.org>, 2002.
5 This program is free software: you can redistribute it and/or modify it
6 under the terms of the GNU Lesser General Public License as published
7 by the Free Software Foundation; either version 3 of the License, or
8 (at your option) any later version.
10 This program is distributed in the hope that it will be useful,
11 but WITHOUT ANY WARRANTY; without even the implied warranty of
12 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
13 Lesser General Public License for more details.
15 You should have received a copy of the GNU Lesser General Public License
16 along with this program. If not, see <http://www.gnu.org/licenses/>. */
23 /* Define u_category table. */
/* Look up UC in the multi-level u_category table (level1 -> level2 -> level3)
   and return a small integer for it.
   NOTE(review): the line numbering embedded in this listing is not
   contiguous (27 -> 29, 32 -> 35, 36 -> 39, 43 -> 50), so the return type,
   the braces, any checks on lookup1/lookup2 and the end of the lookup3
   expression are not visible here.  Confirm against the complete file
   before relying on the control flow described below. */
27 lookup_withtable (ucs4_t uc)
/* The bits of UC above category_header_0 select the level1 entry. */
29 unsigned int index1 = uc >> category_header_0;
/* Only index level1 when index1 is below category_header_1. */
30 if (index1 < category_header_1)
32 int lookup1 = u_category.level1[index1];
/* The next group of bits of UC, masked with category_header_3, is added to
   lookup1 to form the position in level2. */
35 unsigned int index2 = (uc >> category_header_2) & category_header_3;
36 int lookup2 = u_category.level2[lookup1 + index2];
/* The bits of UC selected by category_header_4, offset by lookup2, give the
   entry number in level3; multiplying by 5 turns it into a bit offset. */
39 unsigned int index3 = ((uc & category_header_4) + lookup2) * 5;
40 /* level3 contains 5-bit values, packed into 16-bit words. */
/* index3>>4 is the number of the 16-bit word containing bit index3.  That
   word and the following one are combined, the following word shifted up by
   16 bits.  Presumably the result is then shifted and masked down to the
   5-bit entry; that part of the expression is not visible in this listing. */
41 unsigned int lookup3 =
42 ((u_category.level3[index3>>4]
43 | (u_category.level3[(index3>>4)+1] << 16))
/* Constant result 29.  Which paths reach this statement cannot be told from
   the visible lines; presumably it is the fallback when the table has no
   entry for UC -- TODO confirm. */
50 return 29; /* = log2(UC_CATEGORY_MASK_Cn) */
/* Test whether the bit of BITMASK whose number is lookup_withtable (UC) is
   set.  The visible return expression yields 1 if that bit is set and 0
   otherwise.
   NOTE(review): the embedded numbering jumps from 58 to 61, so any check on
   'bit' made before the shift is not visible here -- confirm against the
   complete file. */
56 uc_is_general_category_withtable (ucs4_t uc, uint32_t bitmask)
58 int bit = lookup_withtable (uc);
61 return ((bitmask >> bit) & 1);
/* Build a uc_general_category_t value for UC from the bit number returned by
   lookup_withtable (UC).
   NOTE(review): the embedded numbering is not contiguous (70 -> 74 -> 76 ->
   80), so the return type, the branch that chooses between filling 'result'
   and returning _UC_CATEGORY_NONE, and any other assignments to 'result' are
   not visible here -- confirm against the complete file. */
67 uc_general_category (ucs4_t uc)
69 int bit = lookup_withtable (uc);
70 uc_general_category_t result;
/* The mask has exactly one bit set, the one numbered 'bit'.
   NOTE(review): the constant 1 has type int; if 'bit' can reach 31 this
   shift overflows a 32-bit int.  Confirm the range of lookup_withtable. */
74 result.bitmask = 1 << bit;
/* Membership tests on this value go through the table-based predicate. */
76 result.lookup.lookup_fn = &uc_is_general_category_withtable;
/* Alternative result; the condition selecting it is not visible here. */
80 return _UC_CATEGORY_NONE;