2  * Copyright (C) 2007 Apple Computer, Inc. 
   4  * Portions are Copyright (C) 1998 Netscape Communications Corporation. 
   6  * This library is free software; you can redistribute it and/or 
   7  * modify it under the terms of the GNU Lesser General Public 
   8  * License as published by the Free Software Foundation; either 
   9  * version 2.1 of the License, or (at your option) any later version. 
  11  * This library is distributed in the hope that it will be useful, 
  12  * but WITHOUT ANY WARRANTY; without even the implied warranty of 
  13  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU 
  14  * Lesser General Public License for more details. 
  16  * You should have received a copy of the GNU Lesser General Public 
  17  * License along with this library; if not, write to the Free Software 
  18  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301  USA 
  20  * Alternatively, the contents of this file may be used under the terms 
  21  * of either the Mozilla Public License Version 1.1, found at 
  22  * http://www.mozilla.org/MPL/ (the "MPL") or the GNU General Public 
  23  * License Version 2.0, found at http://www.fsf.org/copyleft/gpl.html 
  24  * (the "GPL"), in which case the provisions of the MPL or the GPL are 
  25  * applicable instead of those above.  If you wish to allow use of your 
  26  * version of this file only under the terms of one of those two 
  27  * licenses (the MPL or the GPL) and not to allow others to use your 
  28  * version of this file under the LGPL, indicate your decision by 
  29  * deletingthe provisions above and replace them with the notice and 
  30  * other provisions required by the MPL or the GPL, as the case may be. 
  31  * If you do not delete the provisions above, a recipient may use your 
  32  * version of this file under any of the LGPL, the MPL or the GPL. 
  35 #ifndef UnicodeRange_H 
  36 #define UnicodeRange_H 
  38 #include <wtf/unicode/Unicode.h> 
  42 // The following constants define unicode subranges 
  43 // values below cRangeNum must be continuous so that we can map to  
  44 // a lang group directly. 
  45 // All ranges we care about should fit within 32 bits. 
  47 // Frequently used range definitions 
  48 const unsigned char   cRangeCyrillic 
=    0; 
  49 const unsigned char   cRangeGreek    
=    1; 
  50 const unsigned char   cRangeTurkish  
=    2; 
  51 const unsigned char   cRangeHebrew   
=    3; 
  52 const unsigned char   cRangeArabic   
=    4; 
  53 const unsigned char   cRangeBaltic   
=    5; 
  54 const unsigned char   cRangeThai     
=    6; 
  55 const unsigned char   cRangeKorean   
=    7; 
  56 const unsigned char   cRangeJapanese 
=    8; 
  57 const unsigned char   cRangeSChinese 
=    9; 
  58 const unsigned char   cRangeTChinese 
=   10; 
  59 const unsigned char   cRangeDevanagari 
= 11; 
  60 const unsigned char   cRangeTamil    
=   12; 
  61 const unsigned char   cRangeArmenian 
=   13; 
  62 const unsigned char   cRangeBengali  
=   14; 
  63 const unsigned char   cRangeCanadian 
=   15; 
  64 const unsigned char   cRangeEthiopic 
=   16; 
  65 const unsigned char   cRangeGeorgian 
=   17; 
  66 const unsigned char   cRangeGujarati 
=   18; 
  67 const unsigned char   cRangeGurmukhi 
=   19; 
  68 const unsigned char   cRangeKhmer    
=   20; 
  69 const unsigned char   cRangeMalayalam 
=  21; 
  71 const unsigned char   cRangeSpecificItemNum 
= 22; 
  73 //range/rangeSet grow to this place 22-29 
  75 const unsigned char   cRangeSetStart  
=  30;    // range set definition starts from here 
  76 const unsigned char   cRangeSetLatin  
=  30; 
  77 const unsigned char   cRangeSetCJK    
=  31; 
  78 const unsigned char   cRangeSetEnd    
=  31;   // range set definition ends here 
  80 // less frequently used range definition 
  81 const unsigned char   cRangeSurrogate            
= 32; 
  82 const unsigned char   cRangePrivate              
= 33; 
  83 const unsigned char   cRangeMisc                 
= 34; 
  84 const unsigned char   cRangeUnassigned           
= 35; 
  85 const unsigned char   cRangeSyriac               
= 36; 
  86 const unsigned char   cRangeThaana               
= 37; 
  87 const unsigned char   cRangeOriya                
= 38; 
  88 const unsigned char   cRangeTelugu               
= 39; 
  89 const unsigned char   cRangeKannada              
= 40; 
  90 const unsigned char   cRangeSinhala              
= 41; 
  91 const unsigned char   cRangeLao                  
= 42; 
  92 const unsigned char   cRangeTibetan              
= 43; 
  93 const unsigned char   cRangeMyanmar              
= 44; 
  94 const unsigned char   cRangeCherokee             
= 45; 
  95 const unsigned char   cRangeOghamRunic           
= 46; 
  96 const unsigned char   cRangeMongolian            
= 47; 
  97 const unsigned char   cRangeMathOperators        
= 48; 
  98 const unsigned char   cRangeMiscTechnical        
= 49; 
  99 const unsigned char   cRangeControlOpticalEnclose 
= 50; 
 100 const unsigned char   cRangeBoxBlockGeometrics   
= 51; 
 101 const unsigned char   cRangeMiscSymbols          
= 52; 
 102 const unsigned char   cRangeDingbats             
= 53; 
 103 const unsigned char   cRangeBraillePattern       
= 54; 
 104 const unsigned char   cRangeYi                   
= 55; 
 105 const unsigned char   cRangeCombiningDiacriticalMarks 
= 56; 
 106 const unsigned char   cRangeSpecials             
= 57; 
 108 const unsigned char   cRangeTableBase   
= 128;    //values over 127 are reserved for internal use only 
 109 const unsigned char   cRangeTertiaryTable  
= 145; // leave room for 16 subtable  
 110                                             // indices (cRangeTableBase + 1 .. 
 111                                             // cRangeTableBase + 16) 
 115 unsigned int findCharUnicodeRange(UChar32 ch
); 
 116 const char* langGroupFromUnicodeRange(unsigned char unicodeRange
); 
 120 #endif // UnicodeRange_H