]>
Commit | Line | Data |
---|---|---|
374ca955 A |
1 | /* |
2 | ******************************************************************************* | |
3 | * | |
73c04bcf | 4 | * Copyright (C) 2004-2005, International Business Machines |
374ca955 A |
5 | * Corporation and others. All Rights Reserved. |
6 | * | |
7 | ******************************************************************************* | |
8 | * file name: gencase.h | |
9 | * encoding: US-ASCII | |
10 | * tab size: 8 (not used) | |
11 | * indentation:4 | |
12 | * | |
13 | * created on: 2004aug28 | |
14 | * created by: Markus W. Scherer | |
15 | */ | |
16 | ||
17 | #ifndef __GENCASE_H__ | |
18 | #define __GENCASE_H__ | |
19 | ||
20 | #include "unicode/utypes.h" | |
21 | #include "utrie.h" | |
22 | #include "ucase.h" | |
23 | ||
24 | U_CDECL_BEGIN | |
25 | ||
73c04bcf A |
26 | /* Unicode versions --------------------------------------------------------- */ |
27 | ||
28 | enum { | |
29 | UNI_1_0, | |
30 | UNI_1_1, | |
31 | UNI_2_0, | |
32 | UNI_3_0, | |
33 | UNI_3_1, | |
34 | UNI_3_2, | |
35 | UNI_4_0, | |
36 | UNI_4_0_1, | |
37 | UNI_4_1, | |
38 | UNI_VER_COUNT | |
39 | }; | |
40 | ||
41 | extern int32_t ucdVersion; | |
42 | ||
374ca955 A |
43 | /* gencase ------------------------------------------------------------------ */ |
44 | ||
45 | #define UGENCASE_EXC_SHIFT 16 | |
46 | #define UGENCASE_EXC_MASK 0xffff0000 | |
47 | ||
73c04bcf A |
48 | /* |
49 | * Values for the ucase.icu unfold[] data array, see store.c. | |
50 | * The values are stored in ucase.icu so that the runtime code will work with | |
51 | * changing values, but they are hardcoded for gencase for simplicity. | |
52 | * They are optimized, that is, provide for minimal table column widths, | |
53 | * for the actual Unicode data, so that the table size is minimized. | |
54 | * Future versions of Unicode may require increases of some of these values. | |
55 | */ | |
56 | enum { | |
57 | UGENCASE_UNFOLD_STRING_WIDTH=3, | |
58 | UGENCASE_UNFOLD_CP_WIDTH=2, | |
59 | UGENCASE_UNFOLD_WIDTH=UGENCASE_UNFOLD_STRING_WIDTH+UGENCASE_UNFOLD_CP_WIDTH, | |
60 | UGENCASE_UNFOLD_MAX_ROWS=250 | |
61 | }; | |
62 | ||
63 | /* Values for additional data stored in pv column 1 */ | |
64 | enum { | |
65 | UGENCASE_IS_MID_LETTER_SHIFT /* bit 0 */ | |
66 | }; | |
67 | ||
374ca955 A |
68 | /* special casing data */ |
69 | typedef struct { | |
70 | UChar32 code; | |
71 | UBool isComplex; | |
72 | UChar lowerCase[32], upperCase[32], titleCase[32]; | |
73 | } SpecialCasing; | |
74 | ||
75 | /* case folding data */ | |
76 | typedef struct { | |
77 | UChar32 code, simple; | |
78 | char status; | |
79 | UChar full[32]; | |
80 | } CaseFolding; | |
81 | ||
82 | /* case mapping properties */ | |
83 | typedef struct { | |
84 | UChar32 code, lowerCase, upperCase, titleCase; | |
73c04bcf | 85 | UChar32 closure[8]; |
374ca955 A |
86 | SpecialCasing *specialCasing; |
87 | CaseFolding *caseFolding; | |
88 | uint8_t gc, cc; | |
89 | } Props; | |
90 | ||
91 | /* global flags */ | |
92 | extern UBool beVerbose, haveCopyright; | |
93 | ||
94 | /* properties vectors in gencase.c */ | |
95 | extern uint32_t *pv; | |
96 | ||
97 | /* prototypes */ | |
98 | U_CFUNC void | |
99 | writeUCDFilename(char *basename, const char *filename, const char *suffix); | |
100 | ||
101 | U_CFUNC UBool | |
102 | isToken(const char *token, const char *s); | |
103 | ||
104 | extern void | |
105 | setUnicodeVersion(const char *v); | |
106 | ||
107 | extern void | |
108 | setProps(Props *p); | |
109 | ||
110 | U_CFUNC uint32_t U_EXPORT2 | |
111 | getFoldedPropsValue(UNewTrie *trie, UChar32 start, int32_t offset); | |
112 | ||
113 | extern void | |
114 | addCaseSensitive(UChar32 first, UChar32 last); | |
115 | ||
116 | extern void | |
117 | makeCaseClosure(void); | |
118 | ||
119 | extern void | |
120 | makeExceptions(void); | |
121 | ||
122 | extern void | |
73c04bcf | 123 | generateData(const char *dataDir, UBool csource); |
374ca955 A |
124 | |
125 | U_CDECL_END | |
126 | ||
127 | #endif |