]>
Commit | Line | Data |
---|---|---|
f3c0d7a5 A |
1 | // © 2016 and later: Unicode, Inc. and others. |
2 | // License & terms of use: http://www.unicode.org/copyright.html | |
46f4442e A |
3 | /* |
4 | ******************************************************************************* | |
2ca993e8 A |
5 | * Copyright (C) 2007-2016, International Business Machines Corporation and |
6 | * others. All Rights Reserved. | |
46f4442e A |
7 | ******************************************************************************* |
8 | * | |
9 | * File DTPTNGEN.H | |
10 | * | |
11 | ******************************************************************************* | |
12 | */ | |
13 | ||
46f4442e A |
14 | #ifndef __DTPTNGEN_IMPL_H__ |
15 | #define __DTPTNGEN_IMPL_H__ | |
16 | ||
2ca993e8 | 17 | #include "unicode/udatpg.h" |
f3c0d7a5 A |
18 | |
19 | #include "unicode/strenum.h" | |
20 | #include "unicode/unistr.h" | |
2ca993e8 A |
21 | #include "uvector.h" |
22 | ||
46f4442e A |
23 | // TODO(claireho): Split off Builder class. |
24 | // TODO(claireho): If splitting off Builder class: As subclass or independent? | |
25 | ||
26 | #define MAX_PATTERN_ENTRIES 52 | |
27 | #define MAX_CLDR_FIELD_LEN 60 | |
28 | #define MAX_DT_TOKEN 50 | |
29 | #define MAX_RESOURCE_FIELD 12 | |
30 | #define MAX_AVAILABLE_FORMATS 12 | |
31 | #define NONE 0 | |
32 | #define EXTRA_FIELD 0x10000 | |
33 | #define MISSING_FIELD 0x1000 | |
34 | #define MAX_STRING_ENUMERATION 200 | |
35 | #define SINGLE_QUOTE ((UChar)0x0027) | |
36 | #define FORWARDSLASH ((UChar)0x002F) | |
37 | #define BACKSLASH ((UChar)0x005C) | |
38 | #define SPACE ((UChar)0x0020) | |
39 | #define QUOTATION_MARK ((UChar)0x0022) | |
40 | #define ASTERISK ((UChar)0x002A) | |
41 | #define PLUSSITN ((UChar)0x002B) | |
42 | #define COMMA ((UChar)0x002C) | |
43 | #define HYPHEN ((UChar)0x002D) | |
44 | #define DOT ((UChar)0x002E) | |
45 | #define COLON ((UChar)0x003A) | |
46 | #define CAP_A ((UChar)0x0041) | |
2ca993e8 | 47 | #define CAP_B ((UChar)0x0042) |
46f4442e A |
48 | #define CAP_C ((UChar)0x0043) |
49 | #define CAP_D ((UChar)0x0044) | |
50 | #define CAP_E ((UChar)0x0045) | |
51 | #define CAP_F ((UChar)0x0046) | |
52 | #define CAP_G ((UChar)0x0047) | |
53 | #define CAP_H ((UChar)0x0048) | |
57a6839d | 54 | #define CAP_J ((UChar)0x004A) |
46f4442e A |
55 | #define CAP_K ((UChar)0x004B) |
56 | #define CAP_L ((UChar)0x004C) | |
57 | #define CAP_M ((UChar)0x004D) | |
58 | #define CAP_O ((UChar)0x004F) | |
59 | #define CAP_Q ((UChar)0x0051) | |
60 | #define CAP_S ((UChar)0x0053) | |
61 | #define CAP_T ((UChar)0x0054) | |
4388f060 | 62 | #define CAP_U ((UChar)0x0055) |
46f4442e A |
63 | #define CAP_V ((UChar)0x0056) |
64 | #define CAP_W ((UChar)0x0057) | |
57a6839d | 65 | #define CAP_X ((UChar)0x0058) |
46f4442e A |
66 | #define CAP_Y ((UChar)0x0059) |
67 | #define CAP_Z ((UChar)0x005A) | |
68 | #define LOWLINE ((UChar)0x005F) | |
69 | #define LOW_A ((UChar)0x0061) | |
2ca993e8 | 70 | #define LOW_B ((UChar)0x0062) |
46f4442e A |
71 | #define LOW_C ((UChar)0x0063) |
72 | #define LOW_D ((UChar)0x0064) | |
73 | #define LOW_E ((UChar)0x0065) | |
74 | #define LOW_F ((UChar)0x0066) | |
75 | #define LOW_G ((UChar)0x0067) | |
76 | #define LOW_H ((UChar)0x0068) | |
77 | #define LOW_I ((UChar)0x0069) | |
78 | #define LOW_J ((UChar)0x006A) | |
79 | #define LOW_K ((UChar)0x006B) | |
80 | #define LOW_L ((UChar)0x006C) | |
81 | #define LOW_M ((UChar)0x006D) | |
82 | #define LOW_N ((UChar)0x006E) | |
83 | #define LOW_O ((UChar)0x006F) | |
84 | #define LOW_P ((UChar)0x0070) | |
85 | #define LOW_Q ((UChar)0x0071) | |
86 | #define LOW_R ((UChar)0x0072) | |
87 | #define LOW_S ((UChar)0x0073) | |
88 | #define LOW_T ((UChar)0x0074) | |
89 | #define LOW_U ((UChar)0x0075) | |
90 | #define LOW_V ((UChar)0x0076) | |
91 | #define LOW_W ((UChar)0x0077) | |
57a6839d | 92 | #define LOW_X ((UChar)0x0078) |
46f4442e A |
93 | #define LOW_Y ((UChar)0x0079) |
94 | #define LOW_Z ((UChar)0x007A) | |
95 | #define DT_SHORT -0x102 | |
96 | #define DT_LONG -0x103 | |
97 | #define DT_NUMERIC 0x100 | |
98 | #define DT_NARROW -0x101 | |
99 | #define DT_DELTA 0x10 | |
100 | ||
101 | U_NAMESPACE_BEGIN | |
102 | ||
103 | const int32_t UDATPG_FRACTIONAL_MASK = 1<<UDATPG_FRACTIONAL_SECOND_FIELD; | |
104 | const int32_t UDATPG_SECOND_AND_FRACTIONAL_MASK = (1<<UDATPG_SECOND_FIELD) | (1<<UDATPG_FRACTIONAL_SECOND_FIELD); | |
105 | ||
106 | typedef enum dtStrEnum { | |
107 | DT_BASESKELETON, | |
108 | DT_SKELETON, | |
109 | DT_PATTERN | |
110 | }dtStrEnum; | |
111 | ||
112 | typedef struct dtTypeElem { | |
113 | UChar patternChar; | |
114 | UDateTimePatternField field; | |
115 | int16_t type; | |
116 | int16_t minLen; | |
117 | int16_t weight; | |
118 | }dtTypeElem; | |
119 | ||
f3c0d7a5 A |
120 | // A compact storage mechanism for skeleton field strings. Several dozen of these will be created |
121 | // for a typical DateTimePatternGenerator instance. | |
122 | class SkeletonFields : public UMemory { | |
123 | public: | |
124 | SkeletonFields(); | |
125 | void clear(); | |
126 | void copyFrom(const SkeletonFields& other); | |
127 | void clearField(int32_t field); | |
128 | UChar getFieldChar(int32_t field) const; | |
129 | int32_t getFieldLength(int32_t field) const; | |
130 | void populate(int32_t field, const UnicodeString& value); | |
131 | void populate(int32_t field, UChar repeatChar, int32_t repeatCount); | |
132 | UBool isFieldEmpty(int32_t field) const; | |
133 | UnicodeString& appendTo(UnicodeString& string) const; | |
134 | UnicodeString& appendFieldTo(int32_t field, UnicodeString& string) const; | |
135 | UChar getFirstChar() const; | |
136 | inline UBool operator==(const SkeletonFields& other) const; | |
137 | inline UBool operator!=(const SkeletonFields& other) const; | |
138 | ||
139 | private: | |
140 | int8_t chars[UDATPG_FIELD_COUNT]; | |
141 | int8_t lengths[UDATPG_FIELD_COUNT]; | |
142 | }; | |
143 | ||
144 | inline UBool SkeletonFields::operator==(const SkeletonFields& other) const { | |
145 | return (uprv_memcmp(chars, other.chars, sizeof(chars)) == 0 | |
146 | && uprv_memcmp(lengths, other.lengths, sizeof(lengths)) == 0); | |
147 | } | |
148 | ||
149 | inline UBool SkeletonFields::operator!=(const SkeletonFields& other) const { | |
150 | return (! operator==(other)); | |
151 | } | |
152 | ||
46f4442e A |
153 | class PtnSkeleton : public UMemory { |
154 | public: | |
155 | int32_t type[UDATPG_FIELD_COUNT]; | |
f3c0d7a5 A |
156 | SkeletonFields original; |
157 | SkeletonFields baseOriginal; | |
46f4442e A |
158 | |
159 | PtnSkeleton(); | |
160 | PtnSkeleton(const PtnSkeleton& other); | |
f3c0d7a5 A |
161 | void copyFrom(const PtnSkeleton& other); |
162 | void clear(); | |
163 | UBool equals(const PtnSkeleton& other) const; | |
164 | UnicodeString getSkeleton() const; | |
165 | UnicodeString getBaseSkeleton() const; | |
166 | UChar getFirstChar() const; | |
167 | ||
168 | // TODO: Why is this virtual, as well as the other destructors in this file? We don't want | |
169 | // vtables when we don't use class objects polymorphically. | |
46f4442e A |
170 | virtual ~PtnSkeleton(); |
171 | }; | |
172 | ||
173 | ||
174 | class PtnElem : public UMemory { | |
175 | public: | |
176 | UnicodeString basePattern; | |
177 | PtnSkeleton *skeleton; | |
178 | UnicodeString pattern; | |
179 | UBool skeletonWasSpecified; // if specified in availableFormats, not derived | |
180 | PtnElem *next; | |
181 | ||
182 | PtnElem(const UnicodeString &basePattern, const UnicodeString &pattern); | |
183 | virtual ~PtnElem(); | |
184 | ||
185 | }; | |
186 | ||
187 | class FormatParser : public UMemory { | |
188 | public: | |
189 | UnicodeString items[MAX_DT_TOKEN]; | |
190 | int32_t itemNumber; | |
191 | ||
192 | FormatParser(); | |
193 | virtual ~FormatParser(); | |
194 | void set(const UnicodeString& patternString); | |
46f4442e | 195 | void getQuoteLiteral(UnicodeString& quote, int32_t *itemIndex); |
46f4442e | 196 | UBool isPatternSeparator(UnicodeString& field); |
2ca993e8 A |
197 | static UBool isQuoteLiteral(const UnicodeString& s); |
198 | static int32_t getCanonicalIndex(const UnicodeString& s) { return getCanonicalIndex(s, TRUE); } | |
199 | static int32_t getCanonicalIndex(const UnicodeString& s, UBool strict); | |
46f4442e A |
200 | |
201 | private: | |
202 | typedef enum TokenStatus { | |
203 | START, | |
204 | ADD_TOKEN, | |
205 | SYNTAX_ERROR, | |
206 | DONE | |
207 | } ToeknStatus; | |
208 | ||
209 | TokenStatus status; | |
210 | virtual TokenStatus setTokens(const UnicodeString& pattern, int32_t startPos, int32_t *len); | |
211 | }; | |
212 | ||
213 | class DistanceInfo : public UMemory { | |
214 | public: | |
215 | int32_t missingFieldMask; | |
216 | int32_t extraFieldMask; | |
217 | ||
4388f060 A |
218 | DistanceInfo() {} |
219 | virtual ~DistanceInfo(); | |
220 | void clear() { missingFieldMask = extraFieldMask = 0; } | |
46f4442e | 221 | void setTo(DistanceInfo& other); |
4388f060 A |
222 | void addMissing(int32_t field) { missingFieldMask |= (1<<field); } |
223 | void addExtra(int32_t field) { extraFieldMask |= (1<<field); } | |
46f4442e A |
224 | }; |
225 | ||
226 | class DateTimeMatcher: public UMemory { | |
227 | public: | |
228 | PtnSkeleton skeleton; | |
229 | ||
f3c0d7a5 | 230 | void getBasePattern(UnicodeString& basePattern); |
46f4442e A |
231 | UnicodeString getPattern(); |
232 | void set(const UnicodeString& pattern, FormatParser* fp); | |
233 | void set(const UnicodeString& pattern, FormatParser* fp, PtnSkeleton& skeleton); | |
234 | void copyFrom(const PtnSkeleton& skeleton); | |
235 | void copyFrom(); | |
236 | PtnSkeleton* getSkeletonPtr(); | |
237 | UBool equals(const DateTimeMatcher* other) const; | |
238 | int32_t getDistance(const DateTimeMatcher& other, int32_t includeMask, DistanceInfo& distanceInfo); | |
239 | DateTimeMatcher(); | |
240 | DateTimeMatcher(const DateTimeMatcher& other); | |
4388f060 | 241 | virtual ~DateTimeMatcher(); |
46f4442e A |
242 | int32_t getFieldMask(); |
243 | }; | |
244 | ||
245 | class PatternMap : public UMemory { | |
246 | public: | |
247 | PtnElem *boot[MAX_PATTERN_ENTRIES]; | |
248 | PatternMap(); | |
249 | virtual ~PatternMap(); | |
250 | void add(const UnicodeString& basePattern, const PtnSkeleton& skeleton, const UnicodeString& value, UBool skeletonWasSpecified, UErrorCode& status); | |
251 | const UnicodeString* getPatternFromBasePattern(UnicodeString& basePattern, UBool& skeletonWasSpecified); | |
252 | const UnicodeString* getPatternFromSkeleton(PtnSkeleton& skeleton, const PtnSkeleton** specifiedSkeletonPtr = 0); | |
253 | void copyFrom(const PatternMap& other, UErrorCode& status); | |
254 | PtnElem* getHeader(UChar baseChar); | |
255 | UBool equals(const PatternMap& other); | |
256 | private: | |
257 | UBool isDupAllowed; | |
258 | PtnElem* getDuplicateElem(const UnicodeString &basePattern, const PtnSkeleton& skeleton, PtnElem *baseElem); | |
259 | }; // end PatternMap | |
260 | ||
261 | class PatternMapIterator : public UMemory { | |
262 | public: | |
263 | PatternMapIterator(); | |
264 | virtual ~PatternMapIterator(); | |
265 | void set(PatternMap& patternMap); | |
266 | PtnSkeleton* getSkeleton(); | |
267 | UBool hasNext(); | |
268 | DateTimeMatcher& next(); | |
269 | private: | |
270 | int32_t bootIndex; | |
271 | PtnElem *nodePtr; | |
272 | DateTimeMatcher *matcher; | |
273 | PatternMap *patternMap; | |
274 | }; | |
275 | ||
276 | class DTSkeletonEnumeration : public StringEnumeration { | |
277 | public: | |
278 | DTSkeletonEnumeration(PatternMap &patternMap, dtStrEnum type, UErrorCode& status); | |
279 | virtual ~DTSkeletonEnumeration(); | |
280 | static UClassID U_EXPORT2 getStaticClassID(void); | |
281 | virtual UClassID getDynamicClassID(void) const; | |
282 | virtual const UnicodeString* snext(UErrorCode& status); | |
283 | virtual void reset(UErrorCode& status); | |
284 | virtual int32_t count(UErrorCode& status) const; | |
285 | private: | |
286 | int32_t pos; | |
287 | UBool isCanonicalItem(const UnicodeString& item); | |
288 | UVector *fSkeletons; | |
289 | }; | |
290 | ||
291 | class DTRedundantEnumeration : public StringEnumeration { | |
292 | public: | |
293 | DTRedundantEnumeration(); | |
294 | virtual ~DTRedundantEnumeration(); | |
295 | static UClassID U_EXPORT2 getStaticClassID(void); | |
296 | virtual UClassID getDynamicClassID(void) const; | |
297 | virtual const UnicodeString* snext(UErrorCode& status); | |
298 | virtual void reset(UErrorCode& status); | |
299 | virtual int32_t count(UErrorCode& status) const; | |
300 | void add(const UnicodeString &pattern, UErrorCode& status); | |
301 | private: | |
302 | int32_t pos; | |
303 | UBool isCanonicalItem(const UnicodeString& item); | |
304 | UVector *fPatterns; | |
305 | }; | |
306 | ||
307 | U_NAMESPACE_END | |
308 | ||
309 | #endif |