1/*
2 * Copyright (C) 2007 Apple Computer, Inc.
3 *
4 * Portions are Copyright (C) 1998 Netscape Communications Corporation.
5 *
6 * This library is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Lesser General Public
8 * License as published by the Free Software Foundation; either
9 * version 2.1 of the License, or (at your option) any later version.
10 *
11 * This library is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
14 * Lesser General Public License for more details.
15 *
16 * You should have received a copy of the GNU Lesser General Public
17 * License along with this library; if not, write to the Free Software
18 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301  USA
19 *
20 * Alternatively, the contents of this file may be used under the terms
21 * of either the Mozilla Public License Version 1.1, found at
22 * http://www.mozilla.org/MPL/ (the "MPL") or the GNU General Public
23 * License Version 2.0, found at http://www.fsf.org/copyleft/gpl.html
24 * (the "GPL"), in which case the provisions of the MPL or the GPL are
25 * applicable instead of those above.  If you wish to allow use of your
26 * version of this file only under the terms of one of those two
27 * licenses (the MPL or the GPL) and not to allow others to use your
28 * version of this file under the LGPL, indicate your decision by
29 * deletingthe provisions above and replace them with the notice and
30 * other provisions required by the MPL or the GPL, as the case may be.
31 * If you do not delete the provisions above, a recipient may use your
32 * version of this file under any of the LGPL, the MPL or the GPL.
33 */
34
35#ifndef UnicodeRange_H
36#define UnicodeRange_H
37
38#if PLATFORM(HAIKU)
39#include "stdint.h"
40#endif
41
42#include <wtf/unicode/Unicode.h>
43
44namespace WebCore {
45
46// The following constants define unicode subranges
47// values below cRangeNum must be continuous so that we can map to
48// a lang group directly.
49// All ranges we care about should fit within 32 bits.
50
51// Frequently used range definitions
52const unsigned char   cRangeCyrillic =    0;
53const unsigned char   cRangeGreek    =    1;
54const unsigned char   cRangeTurkish  =    2;
55const unsigned char   cRangeHebrew   =    3;
56const unsigned char   cRangeArabic   =    4;
57const unsigned char   cRangeBaltic   =    5;
58const unsigned char   cRangeThai     =    6;
59const unsigned char   cRangeKorean   =    7;
60const unsigned char   cRangeJapanese =    8;
61const unsigned char   cRangeSChinese =    9;
62const unsigned char   cRangeTChinese =   10;
63const unsigned char   cRangeDevanagari = 11;
64const unsigned char   cRangeTamil    =   12;
65const unsigned char   cRangeArmenian =   13;
66const unsigned char   cRangeBengali  =   14;
67const unsigned char   cRangeCanadian =   15;
68const unsigned char   cRangeEthiopic =   16;
69const unsigned char   cRangeGeorgian =   17;
70const unsigned char   cRangeGujarati =   18;
71const unsigned char   cRangeGurmukhi =   19;
72const unsigned char   cRangeKhmer    =   20;
73const unsigned char   cRangeMalayalam =  21;
74
75const unsigned char   cRangeSpecificItemNum = 22;
76
77//range/rangeSet grow to this place 22-29
78
79const unsigned char   cRangeSetStart  =  30;    // range set definition starts from here
80const unsigned char   cRangeSetLatin  =  30;
81const unsigned char   cRangeSetCJK    =  31;
82const unsigned char   cRangeSetEnd    =  31;   // range set definition ends here
83
84// less frequently used range definition
85const unsigned char   cRangeSurrogate            = 32;
86const unsigned char   cRangePrivate              = 33;
87const unsigned char   cRangeMisc                 = 34;
88const unsigned char   cRangeUnassigned           = 35;
89const unsigned char   cRangeSyriac               = 36;
90const unsigned char   cRangeThaana               = 37;
91const unsigned char   cRangeOriya                = 38;
92const unsigned char   cRangeTelugu               = 39;
93const unsigned char   cRangeKannada              = 40;
94const unsigned char   cRangeSinhala              = 41;
95const unsigned char   cRangeLao                  = 42;
96const unsigned char   cRangeTibetan              = 43;
97const unsigned char   cRangeMyanmar              = 44;
98const unsigned char   cRangeCherokee             = 45;
99const unsigned char   cRangeOghamRunic           = 46;
100const unsigned char   cRangeMongolian            = 47;
101const unsigned char   cRangeMathOperators        = 48;
102const unsigned char   cRangeMiscTechnical        = 49;
103const unsigned char   cRangeControlOpticalEnclose = 50;
104const unsigned char   cRangeBoxBlockGeometrics   = 51;
105const unsigned char   cRangeMiscSymbols          = 52;
106const unsigned char   cRangeDingbats             = 53;
107const unsigned char   cRangeBraillePattern       = 54;
108const unsigned char   cRangeYi                   = 55;
109const unsigned char   cRangeCombiningDiacriticalMarks = 56;
110const unsigned char   cRangeSpecials             = 57;
111
112const unsigned char   cRangeTableBase   = 128;    //values over 127 are reserved for internal use only
113const unsigned char   cRangeTertiaryTable  = 145; // leave room for 16 subtable
114                                            // indices (cRangeTableBase + 1 ..
115                                            // cRangeTableBase + 16)
116
117
118
119unsigned int findCharUnicodeRange(UChar32 ch);
120const char* langGroupFromUnicodeRange(unsigned char unicodeRange);
121
122}
123
124#endif // UnicodeRange_H
125