]> git.saurik.com Git - apple/icu.git/blame - icuSources/i18n/unicode/smpdtfmt.h
ICU-531.48.tar.gz
[apple/icu.git] / icuSources / i18n / unicode / smpdtfmt.h
CommitLineData
b75a7d8f 1/*
57a6839d 2* Copyright (C) 1997-2014, International Business Machines Corporation and
729e4ab9 3* others. All Rights Reserved.
b75a7d8f
A
4*******************************************************************************
5*
6* File SMPDTFMT.H
7*
8* Modification History:
9*
10* Date Name Description
11* 02/19/97 aliu Converted from java.
12* 07/09/97 helena Make ParsePosition into a class.
13* 07/21/98 stephen Added GMT_PLUS, GMT_MINUS
14* Changed setTwoDigitStartDate to set2DigitYearStart
15* Changed getTwoDigitStartDate to get2DigitYearStart
16* Removed subParseLong
17* Removed getZoneIndex (added in DateFormatSymbols)
18* 06/14/99 stephen Removed fgTimeZoneDataSuffix
19* 10/14/99 aliu Updated class doc to describe 2-digit year parsing
20* {j28 4182066}.
21*******************************************************************************
22*/
23
24#ifndef SMPDTFMT_H
25#define SMPDTFMT_H
26
27#include "unicode/utypes.h"
28
73c04bcf 29/**
729e4ab9 30 * \file
73c04bcf
A
31 * \brief C++ API: Format and parse dates in a language-independent manner.
32 */
729e4ab9 33
b75a7d8f
A
34#if !UCONFIG_NO_FORMATTING
35
36#include "unicode/datefmt.h"
51004dcb 37#include "unicode/udisplaycontext.h"
57a6839d
A
38#include "unicode/tzfmt.h" /* for UTimeZoneFormatTimeType */
39#include "unicode/brkiter.h"
b75a7d8f
A
40
41U_NAMESPACE_BEGIN
42
43class DateFormatSymbols;
44class DateFormat;
46f4442e 45class MessageFormat;
729e4ab9 46class FieldPositionHandler;
4388f060 47class TimeZoneFormat;
b75a7d8f
A
48
49/**
73c04bcf 50 *
b75a7d8f
A
51 * SimpleDateFormat is a concrete class for formatting and parsing dates in a
52 * language-independent manner. It allows for formatting (millis -> text),
53 * parsing (text -> millis), and normalization. Formats/Parses a date or time,
54 * which is the standard milliseconds since 24:00 GMT, Jan 1, 1970.
55 * <P>
56 * Clients are encouraged to create a date-time formatter using DateFormat::getInstance(),
57 * getDateInstance(), getDateInstance(), or getDateTimeInstance() rather than
58 * explicitly constructing an instance of SimpleDateFormat. This way, the client
59 * is guaranteed to get an appropriate formatting pattern for whatever locale the
60 * program is running in. However, if the client needs something more unusual than
61 * the default patterns in the locales, he can construct a SimpleDateFormat directly
62 * and give it an appropriate pattern (or use one of the factory methods on DateFormat
63 * and modify the pattern after the fact with toPattern() and applyPattern().
51004dcb
A
64 *
65 * <p><strong>Date and Time Patterns:</strong></p>
66 *
67 * <p>Date and time formats are specified by <em>date and time pattern</em> strings.
68 * Within date and time pattern strings, all unquoted ASCII letters [A-Za-z] are reserved
69 * as pattern letters representing calendar fields. <code>SimpleDateFormat</code> supports
57a6839d
A
70 * the date and time formatting algorithm and pattern letters defined by
71 * <a href="http://www.unicode.org/reports/tr35/tr35-dates.html#Date_Field_Symbol_Table">UTS#35
72 * Unicode Locale Data Markup Language (LDML)</a> and further documented for ICU in the
73 * <a href="https://sites.google.com/site/icuprojectuserguide/formatparse/datetime?pli=1#TOC-Date-Field-Symbol-Table">ICU
74 * User Guide</a>. The following pattern letters are currently available:</p>
51004dcb
A
75 *
76 * <table border="1">
77 * <tr>
78 * <th>Field</th>
79 * <th style="text-align: center">Sym.</th>
80 * <th style="text-align: center">No.</th>
81 * <th>Example</th>
82 * <th>Description</th>
83 * </tr>
84 * <tr>
85 * <th rowspan="3">era</th>
86 * <td style="text-align: center" rowspan="3">G</td>
87 * <td style="text-align: center">1..3</td>
88 * <td>AD</td>
89 * <td rowspan="3">Era - Replaced with the Era string for the current date. One to three letters for the
90 * abbreviated form, four letters for the long form, five for the narrow form.</td>
91 * </tr>
92 * <tr>
93 * <td style="text-align: center">4</td>
94 * <td>Anno Domini</td>
95 * </tr>
96 * <tr>
97 * <td style="text-align: center">5</td>
98 * <td>A</td>
99 * </tr>
100 * <tr>
101 * <th rowspan="6">year</th>
102 * <td style="text-align: center">y</td>
103 * <td style="text-align: center">1..n</td>
104 * <td>1996</td>
105 * <td>Year. Normally the length specifies the padding, but for two letters it also specifies the maximum
106 * length. Example:<div align="center">
107 * <center>
108 * <table border="1" cellpadding="2" cellspacing="0">
109 * <tr>
110 * <th>Year</th>
111 * <th style="text-align: right">y</th>
112 * <th style="text-align: right">yy</th>
113 * <th style="text-align: right">yyy</th>
114 * <th style="text-align: right">yyyy</th>
115 * <th style="text-align: right">yyyyy</th>
116 * </tr>
117 * <tr>
118 * <td>AD 1</td>
119 * <td style="text-align: right">1</td>
120 * <td style="text-align: right">01</td>
121 * <td style="text-align: right">001</td>
122 * <td style="text-align: right">0001</td>
123 * <td style="text-align: right">00001</td>
124 * </tr>
125 * <tr>
126 * <td>AD 12</td>
127 * <td style="text-align: right">12</td>
128 * <td style="text-align: right">12</td>
129 * <td style="text-align: right">012</td>
130 * <td style="text-align: right">0012</td>
131 * <td style="text-align: right">00012</td>
132 * </tr>
133 * <tr>
134 * <td>AD 123</td>
135 * <td style="text-align: right">123</td>
136 * <td style="text-align: right">23</td>
137 * <td style="text-align: right">123</td>
138 * <td style="text-align: right">0123</td>
139 * <td style="text-align: right">00123</td>
140 * </tr>
141 * <tr>
142 * <td>AD 1234</td>
143 * <td style="text-align: right">1234</td>
144 * <td style="text-align: right">34</td>
145 * <td style="text-align: right">1234</td>
146 * <td style="text-align: right">1234</td>
147 * <td style="text-align: right">01234</td>
148 * </tr>
149 * <tr>
150 * <td>AD 12345</td>
151 * <td style="text-align: right">12345</td>
152 * <td style="text-align: right">45</td>
153 * <td style="text-align: right">12345</td>
154 * <td style="text-align: right">12345</td>
155 * <td style="text-align: right">12345</td>
156 * </tr>
157 * </table>
158 * </center></div>
159 * </td>
160 * </tr>
161 * <tr>
162 * <td style="text-align: center">Y</td>
163 * <td style="text-align: center">1..n</td>
164 * <td>1997</td>
165 * <td>Year (in "Week of Year" based calendars). Normally the length specifies the padding,
166 * but for two letters it also specifies the maximum length. This year designation is used in ISO
167 * year-week calendar as defined by ISO 8601, but can be used in non-Gregorian based calendar systems
168 * where week date processing is desired. May not always be the same value as calendar year.</td>
169 * </tr>
170 * <tr>
171 * <td style="text-align: center">u</td>
172 * <td style="text-align: center">1..n</td>
173 * <td>4601</td>
174 * <td>Extended year. This is a single number designating the year of this calendar system, encompassing
175 * all supra-year fields. For example, for the Julian calendar system, year numbers are positive, with an
176 * era of BCE or CE. An extended year value for the Julian calendar system assigns positive values to CE
177 * years and negative values to BCE years, with 1 BCE being year 0.</td>
178 * </tr>
179 * <tr>
180 * <td style="text-align: center" rowspan="3">U</td>
181 * <td style="text-align: center">1..3</td>
182 * <td>&#30002;&#23376;</td>
183 * <td rowspan="3">Cyclic year name. Calendars such as the Chinese lunar calendar (and related calendars)
184 * and the Hindu calendars use 60-year cycles of year names. Use one through three letters for the abbreviated
185 * name, four for the full name, or five for the narrow name (currently the data only provides abbreviated names,
186 * which will be used for all requested name widths). If the calendar does not provide cyclic year name data,
187 * or if the year value to be formatted is out of the range of years for which cyclic name data is provided,
188 * then numeric formatting is used (behaves like 'y').</td>
189 * </tr>
190 * <tr>
191 * <td style="text-align: center">4</td>
192 * <td>(currently also &#30002;&#23376;)</td>
193 * </tr>
194 * <tr>
195 * <td style="text-align: center">5</td>
196 * <td>(currently also &#30002;&#23376;)</td>
197 * </tr>
198 * <tr>
199 * <th rowspan="6">quarter</th>
200 * <td rowspan="3" style="text-align: center">Q</td>
201 * <td style="text-align: center">1..2</td>
202 * <td>02</td>
203 * <td rowspan="3">Quarter - Use one or two for the numerical quarter, three for the abbreviation, or four
204 * for the full name.</td>
205 * </tr>
206 * <tr>
207 * <td style="text-align: center">3</td>
208 * <td>Q2</td>
209 * </tr>
210 * <tr>
211 * <td style="text-align: center">4</td>
212 * <td>2nd quarter</td>
213 * </tr>
214 * <tr>
215 * <td rowspan="3" style="text-align: center">q</td>
216 * <td style="text-align: center">1..2</td>
217 * <td>02</td>
218 * <td rowspan="3"><b>Stand-Alone</b> Quarter - Use one or two for the numerical quarter, three for the abbreviation,
219 * or four for the full name.</td>
220 * </tr>
221 * <tr>
222 * <td style="text-align: center">3</td>
223 * <td>Q2</td>
224 * </tr>
225 * <tr>
226 * <td style="text-align: center">4</td>
227 * <td>2nd quarter</td>
228 * </tr>
229 * <tr>
230 * <th rowspan="8">month</th>
231 * <td rowspan="4" style="text-align: center">M</td>
232 * <td style="text-align: center">1..2</td>
233 * <td>09</td>
234 * <td rowspan="4">Month - Use one or two for the numerical month, three for the abbreviation, four for
235 * the full name, or five for the narrow name.</td>
236 * </tr>
237 * <tr>
238 * <td style="text-align: center">3</td>
239 * <td>Sept</td>
240 * </tr>
241 * <tr>
242 * <td style="text-align: center">4</td>
243 * <td>September</td>
244 * </tr>
245 * <tr>
246 * <td style="text-align: center">5</td>
247 * <td>S</td>
248 * </tr>
249 * <tr>
250 * <td rowspan="4" style="text-align: center">L</td>
251 * <td style="text-align: center">1..2</td>
252 * <td>09</td>
253 * <td rowspan="4"><b>Stand-Alone</b> Month - Use one or two for the numerical month, three for the abbreviation,
254 * or four for the full name, or 5 for the narrow name.</td>
255 * </tr>
256 * <tr>
257 * <td style="text-align: center">3</td>
258 * <td>Sept</td>
259 * </tr>
260 * <tr>
261 * <td style="text-align: center">4</td>
262 * <td>September</td>
263 * </tr>
264 * <tr>
265 * <td style="text-align: center">5</td>
266 * <td>S</td>
267 * </tr>
268 * <tr>
269 * <th rowspan="2">week</th>
270 * <td style="text-align: center">w</td>
271 * <td style="text-align: center">1..2</td>
272 * <td>27</td>
273 * <td>Week of Year.</td>
274 * </tr>
275 * <tr>
276 * <td style="text-align: center">W</td>
277 * <td style="text-align: center">1</td>
278 * <td>3</td>
279 * <td>Week of Month</td>
280 * </tr>
281 * <tr>
282 * <th rowspan="4">day</th>
283 * <td style="text-align: center">d</td>
284 * <td style="text-align: center">1..2</td>
285 * <td>1</td>
286 * <td>Date - Day of the month</td>
287 * </tr>
288 * <tr>
289 * <td style="text-align: center">D</td>
290 * <td style="text-align: center">1..3</td>
291 * <td>345</td>
292 * <td>Day of year</td>
293 * </tr>
294 * <tr>
295 * <td style="text-align: center">F</td>
296 * <td style="text-align: center">1</td>
297 * <td>2</td>
298 * <td>Day of Week in Month. The example is for the 2nd Wed in July</td>
299 * </tr>
300 * <tr>
301 * <td style="text-align: center">g</td>
302 * <td style="text-align: center">1..n</td>
303 * <td>2451334</td>
304 * <td>Modified Julian day. This is different from the conventional Julian day number in two regards.
305 * First, it demarcates days at local zone midnight, rather than noon GMT. Second, it is a local number;
306 * that is, it depends on the local time zone. It can be thought of as a single number that encompasses
307 * all the date-related fields.</td>
308 * </tr>
309 * <tr>
310 * <th rowspan="14">week<br>
311 * day</th>
312 * <td rowspan="4" style="text-align: center">E</td>
313 * <td style="text-align: center">1..3</td>
314 * <td>Tues</td>
315 * <td rowspan="4">Day of week - Use one through three letters for the short day, or four for the full name,
316 * five for the narrow name, or six for the short name.</td>
317 * </tr>
318 * <tr>
319 * <td style="text-align: center">4</td>
320 * <td>Tuesday</td>
321 * </tr>
322 * <tr>
323 * <td style="text-align: center">5</td>
324 * <td>T</td>
325 * </tr>
326 * <tr>
327 * <td style="text-align: center">6</td>
328 * <td>Tu</td>
329 * </tr>
330 * <tr>
331 * <td rowspan="5" style="text-align: center">e</td>
332 * <td style="text-align: center">1..2</td>
333 * <td>2</td>
334 * <td rowspan="5">Local day of week. Same as E except adds a numeric value that will depend on the local
335 * starting day of the week, using one or two letters. For this example, Monday is the first day of the week.</td>
336 * </tr>
337 * <tr>
338 * <td style="text-align: center">3</td>
339 * <td>Tues</td>
340 * </tr>
341 * <tr>
342 * <td style="text-align: center">4</td>
343 * <td>Tuesday</td>
344 * </tr>
345 * <tr>
346 * <td style="text-align: center">5</td>
347 * <td>T</td>
348 * </tr>
349 * <tr>
350 * <td style="text-align: center">6</td>
351 * <td>Tu</td>
352 * </tr>
353 * <tr>
354 * <td rowspan="5" style="text-align: center">c</td>
355 * <td style="text-align: center">1</td>
356 * <td>2</td>
357 * <td rowspan="5"><b>Stand-Alone</b> local day of week - Use one letter for the local numeric value (same
358 * as 'e'), three for the short day, four for the full name, five for the narrow name, or six for
359 * the short name.</td>
360 * </tr>
361 * <tr>
362 * <td style="text-align: center">3</td>
363 * <td>Tues</td>
364 * </tr>
365 * <tr>
366 * <td style="text-align: center">4</td>
367 * <td>Tuesday</td>
368 * </tr>
369 * <tr>
370 * <td style="text-align: center">5</td>
371 * <td>T</td>
372 * </tr>
373 * <tr>
374 * <td style="text-align: center">6</td>
375 * <td>Tu</td>
376 * </tr>
377 * <tr>
378 * <th>period</th>
379 * <td style="text-align: center">a</td>
380 * <td style="text-align: center">1</td>
381 * <td>AM</td>
382 * <td>AM or PM</td>
383 * </tr>
384 * <tr>
385 * <th rowspan="4">hour</th>
386 * <td style="text-align: center">h</td>
387 * <td style="text-align: center">1..2</td>
388 * <td>11</td>
389 * <td>Hour [1-12]. When used in skeleton data or in a skeleton passed in an API for flexible data pattern
390 * generation, it should match the 12-hour-cycle format preferred by the locale (h or K); it should not match
391 * a 24-hour-cycle format (H or k). Use hh for zero padding.</td>
392 * </tr>
393 * <tr>
394 * <td style="text-align: center">H</td>
395 * <td style="text-align: center">1..2</td>
396 * <td>13</td>
397 * <td>Hour [0-23]. When used in skeleton data or in a skeleton passed in an API for flexible data pattern
398 * generation, it should match the 24-hour-cycle format preferred by the locale (H or k); it should not match a
399 * 12-hour-cycle format (h or K). Use HH for zero padding.</td>
400 * </tr>
401 * <tr>
402 * <td style="text-align: center">K</td>
403 * <td style="text-align: center">1..2</td>
404 * <td>0</td>
405 * <td>Hour [0-11]. When used in a skeleton, only matches K or h, see above. Use KK for zero padding.</td>
406 * </tr>
407 * <tr>
408 * <td style="text-align: center">k</td>
409 * <td style="text-align: center">1..2</td>
410 * <td>24</td>
411 * <td>Hour [1-24]. When used in a skeleton, only matches k or H, see above. Use kk for zero padding.</td>
412 * </tr>
413 * <tr>
414 * <th>minute</th>
415 * <td style="text-align: center">m</td>
416 * <td style="text-align: center">1..2</td>
417 * <td>59</td>
418 * <td>Minute. Use one or two for zero padding.</td>
419 * </tr>
420 * <tr>
421 * <th rowspan="3">second</th>
422 * <td style="text-align: center">s</td>
423 * <td style="text-align: center">1..2</td>
424 * <td>12</td>
425 * <td>Second. Use one or two for zero padding.</td>
426 * </tr>
427 * <tr>
428 * <td style="text-align: center">S</td>
429 * <td style="text-align: center">1..n</td>
430 * <td>3456</td>
431 * <td>Fractional Second - truncates (like other time fields) to the count of letters.
432 * (example shows display using pattern SSSS for seconds value 12.34567)</td>
433 * </tr>
434 * <tr>
435 * <td style="text-align: center">A</td>
436 * <td style="text-align: center">1..n</td>
437 * <td>69540000</td>
438 * <td>Milliseconds in day. This field behaves <i>exactly</i> like a composite of all time-related fields,
439 * not including the zone fields. As such, it also reflects discontinuities of those fields on DST transition
440 * days. On a day of DST onset, it will jump forward. On a day of DST cessation, it will jump backward. This
441 * reflects the fact that is must be combined with the offset field to obtain a unique local time value.</td>
442 * </tr>
443 * <tr>
444 * <th rowspan="23">zone</th>
445 * <td rowspan="2" style="text-align: center">z</td>
446 * <td style="text-align: center">1..3</td>
447 * <td>PDT</td>
448 * <td>The <i>short specific non-location format</i>.
449 * Where that is unavailable, falls back to the <i>short localized GMT format</i> ("O").</td>
450 * </tr>
451 * <tr>
452 * <td style="text-align: center">4</td>
453 * <td>Pacific Daylight Time</td>
454 * <td>The <i>long specific non-location format</i>.
455 * Where that is unavailable, falls back to the <i>long localized GMT format</i> ("OOOO").</td>
456 * </tr>
457 * <tr>
458 * <td rowspan="3" style="text-align: center">Z</td>
459 * <td style="text-align: center">1..3</td>
460 * <td>-0800</td>
461 * <td>The <i>ISO8601 basic format</i> with hours, minutes and optional seconds fields.
462 * The format is equivalent to RFC 822 zone format (when optional seconds field is absent).
463 * This is equivalent to the "xxxx" specifier.</td>
464 * </tr>
465 * <tr>
466 * <td style="text-align: center">4</td>
467 * <td>GMT-8:00</td>
468 * <td>The <i>long localized GMT format</i>.
469 * This is equivalent to the "OOOO" specifier.</td>
470 * </tr>
471 * <tr>
472 * <td style="text-align: center">5</td>
473 * <td>-08:00<br>
474 * -07:52:58</td>
475 * <td>The <i>ISO8601 extended format</i> with hours, minutes and optional seconds fields.
476 * The ISO8601 UTC indicator "Z" is used when local time offset is 0.
477 * This is equivalent to the "XXXXX" specifier.</td>
478 * </tr>
479 * <tr>
480 * <td rowspan="2" style="text-align: center">O</td>
481 * <td style="text-align: center">1</td>
482 * <td>GMT-8</td>
483 * <td>The <i>short localized GMT format</i>.</td>
484 * </tr>
485 * <tr>
486 * <td style="text-align: center">4</td>
487 * <td>GMT-08:00</td>
488 * <td>The <i>long localized GMT format</i>.</td>
489 * </tr>
490 * <tr>
491 * <td rowspan="2" style="text-align: center">v</td>
492 * <td style="text-align: center">1</td>
493 * <td>PT</td>
494 * <td>The <i>short generic non-location format</i>.
495 * Where that is unavailable, falls back to the <i>generic location format</i> ("VVVV"),
496 * then the <i>short localized GMT format</i> as the final fallback.</td>
497 * </tr>
498 * <tr>
499 * <td style="text-align: center">4</td>
500 * <td>Pacific Time</td>
501 * <td>The <i>long generic non-location format</i>.
502 * Where that is unavailable, falls back to <i>generic location format</i> ("VVVV").
503 * </tr>
504 * <tr>
505 * <td rowspan="4" style="text-align: center">V</td>
506 * <td style="text-align: center">1</td>
507 * <td>uslax</td>
508 * <td>The short time zone ID.
509 * Where that is unavailable, the special short time zone ID <i>unk</i> (Unknown Zone) is used.<br>
510 * <i><b>Note</b>: This specifier was originally used for a variant of the short specific non-location format,
511 * but it was deprecated in the later version of the LDML specification. In CLDR 23/ICU 51, the definition of
512 * the specifier was changed to designate a short time zone ID.</i></td>
513 * </tr>
514 * <tr>
515 * <td style="text-align: center">2</td>
516 * <td>America/Los_Angeles</td>
517 * <td>The long time zone ID.</td>
518 * </tr>
519 * <tr>
520 * <td style="text-align: center">3</td>
521 * <td>Los Angeles</td>
522 * <td>The exemplar city (location) for the time zone.
523 * Where that is unavailable, the localized exemplar city name for the special zone <i>Etc/Unknown</i> is used
524 * as the fallback (for example, "Unknown City"). </td>
525 * </tr>
526 * <tr>
527 * <td style="text-align: center">4</td>
528 * <td>Los Angeles Time</td>
529 * <td>The <i>generic location format</i>.
530 * Where that is unavailable, falls back to the <i>long localized GMT format</i> ("OOOO";
531 * Note: Fallback is only necessary with a GMT-style Time Zone ID, like Etc/GMT-830.)<br>
532 * This is especially useful when presenting possible timezone choices for user selection,
533 * since the naming is more uniform than the "v" format.</td>
534 * </tr>
535 * <tr>
536 * <td rowspan="5" style="text-align: center">X</td>
537 * <td style="text-align: center">1</td>
538 * <td>-08<br>
539 * +0530<br>
540 * Z</td>
541 * <td>The <i>ISO8601 basic format</i> with hours field and optional minutes field.
542 * The ISO8601 UTC indicator "Z" is used when local time offset is 0.</td>
543 * </tr>
544 * <tr>
545 * <td style="text-align: center">2</td>
546 * <td>-0800<br>
547 * Z</td>
548 * <td>The <i>ISO8601 basic format</i> with hours and minutes fields.
549 * The ISO8601 UTC indicator "Z" is used when local time offset is 0.</td>
550 * </tr>
551 * <tr>
552 * <td style="text-align: center">3</td>
553 * <td>-08:00<br>
554 * Z</td>
555 * <td>The <i>ISO8601 extended format</i> with hours and minutes fields.
556 * The ISO8601 UTC indicator "Z" is used when local time offset is 0.</td>
557 * </tr>
558 * <tr>
559 * <td style="text-align: center">4</td>
560 * <td>-0800<br>
561 * -075258<br>
562 * Z</td>
563 * <td>The <i>ISO8601 basic format</i> with hours, minutes and optional seconds fields.
564 * (Note: The seconds field is not supported by the ISO8601 specification.)
565 * The ISO8601 UTC indicator "Z" is used when local time offset is 0.</td>
566 * </tr>
567 * <tr>
568 * <td style="text-align: center">5</td>
569 * <td>-08:00<br>
570 * -07:52:58<br>
571 * Z</td>
572 * <td>The <i>ISO8601 extended format</i> with hours, minutes and optional seconds fields.
573 * (Note: The seconds field is not supported by the ISO8601 specification.)
574 * The ISO8601 UTC indicator "Z" is used when local time offset is 0.</td>
575 * </tr>
576 * <tr>
577 * <td rowspan="5" style="text-align: center">x</td>
578 * <td style="text-align: center">1</td>
579 * <td>-08<br>
580 * +0530</td>
581 * <td>The <i>ISO8601 basic format</i> with hours field and optional minutes field.</td>
582 * </tr>
583 * <tr>
584 * <td style="text-align: center">2</td>
585 * <td>-0800</td>
586 * <td>The <i>ISO8601 basic format</i> with hours and minutes fields.</td>
587 * </tr>
588 * <tr>
589 * <td style="text-align: center">3</td>
590 * <td>-08:00</td>
591 * <td>The <i>ISO8601 extended format</i> with hours and minutes fields.</td>
592 * </tr>
593 * <tr>
594 * <td style="text-align: center">4</td>
595 * <td>-0800<br>
596 * -075258</td>
597 * <td>The <i>ISO8601 basic format</i> with hours, minutes and optional seconds fields.
598 * (Note: The seconds field is not supported by the ISO8601 specification.)</td>
599 * </tr>
600 * <tr>
601 * <td style="text-align: center">5</td>
602 * <td>-08:00<br>
603 * -07:52:58</td>
604 * <td>The <i>ISO8601 extended format</i> with hours, minutes and optional seconds fields.
605 * (Note: The seconds field is not supported by the ISO8601 specification.)</td>
606 * </tr>
607 * </table>
608 *
4388f060 609 * <P>
b75a7d8f
A
610 * Any characters in the pattern that are not in the ranges of ['a'..'z'] and
611 * ['A'..'Z'] will be treated as quoted text. For instance, characters
612 * like ':', '.', ' ', '#' and '@' will appear in the resulting time text
613 * even they are not embraced within single quotes.
614 * <P>
615 * A pattern containing any invalid pattern letter will result in a failing
616 * UErrorCode result during formatting or parsing.
617 * <P>
618 * Examples using the US locale:
619 * <pre>
620 * \code
621 * Format Pattern Result
622 * -------------- -------
73c04bcf 623 * "yyyy.MM.dd G 'at' HH:mm:ss vvvv" ->> 1996.07.10 AD at 15:08:56 Pacific Time
b75a7d8f
A
624 * "EEE, MMM d, ''yy" ->> Wed, July 10, '96
625 * "h:mm a" ->> 12:08 PM
626 * "hh 'o''clock' a, zzzz" ->> 12 o'clock PM, Pacific Daylight Time
73c04bcf 627 * "K:mm a, vvv" ->> 0:00 PM, PT
b75a7d8f
A
628 * "yyyyy.MMMMM.dd GGG hh:mm aaa" ->> 1996.July.10 AD 12:08 PM
629 * \endcode
630 * </pre>
631 * Code Sample:
632 * <pre>
633 * \code
634 * UErrorCode success = U_ZERO_ERROR;
635 * SimpleTimeZone* pdt = new SimpleTimeZone(-8 * 60 * 60 * 1000, "PST");
636 * pdt->setStartRule( Calendar::APRIL, 1, Calendar::SUNDAY, 2*60*60*1000);
637 * pdt->setEndRule( Calendar::OCTOBER, -1, Calendar::SUNDAY, 2*60*60*1000);
638 *
639 * // Format the current time.
640 * SimpleDateFormat* formatter
641 * = new SimpleDateFormat ("yyyy.MM.dd G 'at' hh:mm:ss a zzz", success );
642 * GregorianCalendar cal(success);
643 * UDate currentTime_1 = cal.getTime(success);
644 * FieldPosition fp(0);
645 * UnicodeString dateString;
646 * formatter->format( currentTime_1, dateString, fp );
647 * cout << "result: " << dateString << endl;
648 *
649 * // Parse the previous string back into a Date.
650 * ParsePosition pp(0);
651 * UDate currentTime_2 = formatter->parse(dateString, pp );
652 * \endcode
653 * </pre>
654 * In the above example, the time value "currentTime_2" obtained from parsing
655 * will be equal to currentTime_1. However, they may not be equal if the am/pm
656 * marker 'a' is left out from the format pattern while the "hour in am/pm"
657 * pattern symbol is used. This information loss can happen when formatting the
658 * time in PM.
659 *
660 * <p>
661 * When parsing a date string using the abbreviated year pattern ("y" or "yy"),
662 * SimpleDateFormat must interpret the abbreviated year
663 * relative to some century. It does this by adjusting dates to be
664 * within 80 years before and 20 years after the time the SimpleDateFormat
665 * instance is created. For example, using a pattern of "MM/dd/yy" and a
666 * SimpleDateFormat instance created on Jan 1, 1997, the string
667 * "01/11/12" would be interpreted as Jan 11, 2012 while the string "05/04/64"
668 * would be interpreted as May 4, 1964.
669 * During parsing, only strings consisting of exactly two digits, as defined by
670 * <code>Unicode::isDigit()</code>, will be parsed into the default century.
671 * Any other numeric string, such as a one digit string, a three or more digit
672 * string, or a two digit string that isn't all digits (for example, "-1"), is
4388f060
A
673 * interpreted literally. So "01/02/3" or "01/02/003" are parsed (for the
674 * Gregorian calendar), using the same pattern, as Jan 2, 3 AD. Likewise (but
675 * only in lenient parse mode, the default) "01/02/-3" is parsed as Jan 2, 4 BC.
b75a7d8f
A
676 *
677 * <p>
678 * If the year pattern has more than two 'y' characters, the year is
679 * interpreted literally, regardless of the number of digits. So using the
680 * pattern "MM/dd/yyyy", "01/11/12" parses to Jan 11, 12 A.D.
681 *
682 * <p>
683 * When numeric fields abut one another directly, with no intervening delimiter
684 * characters, they constitute a run of abutting numeric fields. Such runs are
685 * parsed specially. For example, the format "HHmmss" parses the input text
686 * "123456" to 12:34:56, parses the input text "12345" to 1:23:45, and fails to
687 * parse "1234". In other words, the leftmost field of the run is flexible,
688 * while the others keep a fixed width. If the parse fails anywhere in the run,
689 * then the leftmost field is shortened by one character, and the entire run is
690 * parsed again. This is repeated until either the parse succeeds or the
691 * leftmost field is one character in length. If the parse still fails at that
692 * point, the parse of the run fails.
693 *
694 * <P>
695 * For time zones that have no names, SimpleDateFormat uses strings GMT+hours:minutes or
696 * GMT-hours:minutes.
697 * <P>
698 * The calendar defines what is the first day of the week, the first week of the
699 * year, whether hours are zero based or not (0 vs 12 or 24), and the timezone.
700 * There is one common number format to handle all the numbers; the digit count
701 * is handled programmatically according to the pattern.
374ca955
A
702 *
703 * <p><em>User subclasses are not supported.</em> While clients may write
704 * subclasses, such code will not necessarily work and will not be
705 * guaranteed to work stably from release to release.
b75a7d8f
A
706 */
707class U_I18N_API SimpleDateFormat: public DateFormat {
708public:
709 /**
710 * Construct a SimpleDateFormat using the default pattern for the default
711 * locale.
712 * <P>
713 * [Note:] Not all locales support SimpleDateFormat; for full generality,
714 * use the factory methods in the DateFormat class.
715 * @param status Output param set to success/failure code.
716 * @stable ICU 2.0
717 */
718 SimpleDateFormat(UErrorCode& status);
719
720 /**
721 * Construct a SimpleDateFormat using the given pattern and the default locale.
722 * The locale is used to obtain the symbols used in formatting (e.g., the
723 * names of the months), but not to provide the pattern.
724 * <P>
725 * [Note:] Not all locales support SimpleDateFormat; for full generality,
726 * use the factory methods in the DateFormat class.
727 * @param pattern the pattern for the format.
728 * @param status Output param set to success/failure code.
729 * @stable ICU 2.0
730 */
731 SimpleDateFormat(const UnicodeString& pattern,
732 UErrorCode& status);
733
729e4ab9
A
734 /**
735 * Construct a SimpleDateFormat using the given pattern, numbering system override, and the default locale.
736 * The locale is used to obtain the symbols used in formatting (e.g., the
737 * names of the months), but not to provide the pattern.
738 * <P>
739 * A numbering system override is a string containing either the name of a known numbering system,
740 * or a set of field and numbering system pairs that specify which fields are to be formattied with
741 * the alternate numbering system. For example, to specify that all numeric fields in the specified
742 * date or time pattern are to be rendered using Thai digits, simply specify the numbering system override
743 * as "thai". To specify that just the year portion of the date be formatted using Hebrew numbering,
744 * use the override string "y=hebrew". Numbering system overrides can be combined using a semi-colon
745 * character in the override string, such as "d=decimal;M=arabic;y=hebrew", etc.
746 *
747 * <P>
748 * [Note:] Not all locales support SimpleDateFormat; for full generality,
749 * use the factory methods in the DateFormat class.
750 * @param pattern the pattern for the format.
751 * @param override the override string.
752 * @param status Output param set to success/failure code.
753 * @stable ICU 4.2
754 */
755 SimpleDateFormat(const UnicodeString& pattern,
756 const UnicodeString& override,
757 UErrorCode& status);
758
b75a7d8f
A
759 /**
760 * Construct a SimpleDateFormat using the given pattern and locale.
761 * The locale is used to obtain the symbols used in formatting (e.g., the
762 * names of the months), but not to provide the pattern.
763 * <P>
764 * [Note:] Not all locales support SimpleDateFormat; for full generality,
765 * use the factory methods in the DateFormat class.
766 * @param pattern the pattern for the format.
767 * @param locale the given locale.
768 * @param status Output param set to success/failure code.
769 * @stable ICU 2.0
770 */
771 SimpleDateFormat(const UnicodeString& pattern,
772 const Locale& locale,
773 UErrorCode& status);
774
729e4ab9
A
775 /**
776 * Construct a SimpleDateFormat using the given pattern, numbering system override, and locale.
777 * The locale is used to obtain the symbols used in formatting (e.g., the
778 * names of the months), but not to provide the pattern.
779 * <P>
780 * A numbering system override is a string containing either the name of a known numbering system,
781 * or a set of field and numbering system pairs that specify which fields are to be formattied with
782 * the alternate numbering system. For example, to specify that all numeric fields in the specified
783 * date or time pattern are to be rendered using Thai digits, simply specify the numbering system override
784 * as "thai". To specify that just the year portion of the date be formatted using Hebrew numbering,
785 * use the override string "y=hebrew". Numbering system overrides can be combined using a semi-colon
786 * character in the override string, such as "d=decimal;M=arabic;y=hebrew", etc.
787 * <P>
788 * [Note:] Not all locales support SimpleDateFormat; for full generality,
789 * use the factory methods in the DateFormat class.
790 * @param pattern the pattern for the format.
791 * @param override the numbering system override.
792 * @param locale the given locale.
793 * @param status Output param set to success/failure code.
794 * @stable ICU 4.2
795 */
796 SimpleDateFormat(const UnicodeString& pattern,
797 const UnicodeString& override,
798 const Locale& locale,
799 UErrorCode& status);
800
b75a7d8f
A
801 /**
802 * Construct a SimpleDateFormat using the given pattern and locale-specific
803 * symbol data. The formatter takes ownership of the DateFormatSymbols object;
804 * the caller is no longer responsible for deleting it.
805 * @param pattern the given pattern for the format.
806 * @param formatDataToAdopt the symbols to be adopted.
807 * @param status Output param set to success/faulure code.
808 * @stable ICU 2.0
809 */
810 SimpleDateFormat(const UnicodeString& pattern,
811 DateFormatSymbols* formatDataToAdopt,
812 UErrorCode& status);
813
814 /**
815 * Construct a SimpleDateFormat using the given pattern and locale-specific
816 * symbol data. The DateFormatSymbols object is NOT adopted; the caller
817 * remains responsible for deleting it.
818 * @param pattern the given pattern for the format.
819 * @param formatData the formatting symbols to be use.
820 * @param status Output param set to success/faulure code.
821 * @stable ICU 2.0
822 */
823 SimpleDateFormat(const UnicodeString& pattern,
824 const DateFormatSymbols& formatData,
825 UErrorCode& status);
826
827 /**
828 * Copy constructor.
829 * @stable ICU 2.0
830 */
831 SimpleDateFormat(const SimpleDateFormat&);
832
833 /**
834 * Assignment operator.
835 * @stable ICU 2.0
836 */
837 SimpleDateFormat& operator=(const SimpleDateFormat&);
838
839 /**
840 * Destructor.
841 * @stable ICU 2.0
842 */
843 virtual ~SimpleDateFormat();
844
845 /**
846 * Clone this Format object polymorphically. The caller owns the result and
847 * should delete it when done.
848 * @return A copy of the object.
849 * @stable ICU 2.0
850 */
851 virtual Format* clone(void) const;
852
853 /**
854 * Return true if the given Format objects are semantically equal. Objects
855 * of different subclasses are considered unequal.
856 * @param other the object to be compared with.
857 * @return true if the given Format objects are semantically equal.
858 * @stable ICU 2.0
859 */
860 virtual UBool operator==(const Format& other) const;
861
729e4ab9
A
862
863 using DateFormat::format;
864
b75a7d8f
A
865 /**
866 * Format a date or time, which is the standard millis since 24:00 GMT, Jan
867 * 1, 1970. Overrides DateFormat pure virtual method.
868 * <P>
869 * Example: using the US locale: "yyyy.MM.dd e 'at' HH:mm:ss zzz" ->>
870 * 1996.07.10 AD at 15:08:56 PDT
871 *
872 * @param cal Calendar set to the date and time to be formatted
873 * into a date/time string.
874 * @param appendTo Output parameter to receive result.
875 * Result is appended to existing contents.
876 * @param pos The formatting position. On input: an alignment field,
877 * if desired. On output: the offsets of the alignment field.
878 * @return Reference to 'appendTo' parameter.
879 * @stable ICU 2.1
880 */
881 virtual UnicodeString& format( Calendar& cal,
882 UnicodeString& appendTo,
883 FieldPosition& pos) const;
884
729e4ab9
A
885 /**
886 * Format a date or time, which is the standard millis since 24:00 GMT, Jan
887 * 1, 1970. Overrides DateFormat pure virtual method.
888 * <P>
889 * Example: using the US locale: "yyyy.MM.dd e 'at' HH:mm:ss zzz" ->>
890 * 1996.07.10 AD at 15:08:56 PDT
891 *
892 * @param cal Calendar set to the date and time to be formatted
893 * into a date/time string.
894 * @param appendTo Output parameter to receive result.
895 * Result is appended to existing contents.
896 * @param posIter On return, can be used to iterate over positions
897 * of fields generated by this format call. Field values
898 * are defined in UDateFormatField.
899 * @param status Input/output param set to success/failure code.
900 * @return Reference to 'appendTo' parameter.
901 * @stable ICU 4.4
902 */
903 virtual UnicodeString& format( Calendar& cal,
904 UnicodeString& appendTo,
905 FieldPositionIterator* posIter,
906 UErrorCode& status) const;
907
57a6839d 908 using DateFormat::parse;
b75a7d8f
A
909
910 /**
911 * Parse a date/time string beginning at the given parse position. For
912 * example, a time text "07/10/96 4:5 PM, PDT" will be parsed into a Date
913 * that is equivalent to Date(837039928046).
914 * <P>
915 * By default, parsing is lenient: If the input is not in the form used by
916 * this object's format method but can still be parsed as a date, then the
917 * parse succeeds. Clients may insist on strict adherence to the format by
918 * calling setLenient(false).
4388f060 919 * @see DateFormat::setLenient(boolean)
b75a7d8f
A
920 *
921 * @param text The date/time string to be parsed
4388f060
A
922 * @param cal A Calendar set on input to the date and time to be used for
923 * missing values in the date/time string being parsed, and set
924 * on output to the parsed date/time. When the calendar type is
925 * different from the internal calendar held by this SimpleDateFormat
926 * instance, the internal calendar will be cloned to a work
927 * calendar set to the same milliseconds and time zone as the
928 * cal parameter, field values will be parsed based on the work
929 * calendar, then the result (milliseconds and time zone) will
930 * be set in this calendar.
b75a7d8f
A
931 * @param pos On input, the position at which to start parsing; on
932 * output, the position at which parsing terminated, or the
933 * start position if the parse failed.
b75a7d8f
A
934 * @stable ICU 2.1
935 */
936 virtual void parse( const UnicodeString& text,
937 Calendar& cal,
938 ParsePosition& pos) const;
939
b75a7d8f
A
940
941 /**
942 * Set the start UDate used to interpret two-digit year strings.
943 * When dates are parsed having 2-digit year strings, they are placed within
944 * a assumed range of 100 years starting on the two digit start date. For
945 * example, the string "24-Jan-17" may be in the year 1817, 1917, 2017, or
946 * some other year. SimpleDateFormat chooses a year so that the resultant
947 * date is on or after the two digit start date and within 100 years of the
948 * two digit start date.
949 * <P>
950 * By default, the two digit start date is set to 80 years before the current
951 * time at which a SimpleDateFormat object is created.
952 * @param d start UDate used to interpret two-digit year strings.
953 * @param status Filled in with U_ZERO_ERROR if the parse was successful, and with
954 * an error value if there was a parse error.
955 * @stable ICU 2.0
956 */
957 virtual void set2DigitYearStart(UDate d, UErrorCode& status);
958
959 /**
960 * Get the start UDate used to interpret two-digit year strings.
961 * When dates are parsed having 2-digit year strings, they are placed within
962 * a assumed range of 100 years starting on the two digit start date. For
963 * example, the string "24-Jan-17" may be in the year 1817, 1917, 2017, or
964 * some other year. SimpleDateFormat chooses a year so that the resultant
965 * date is on or after the two digit start date and within 100 years of the
966 * two digit start date.
967 * <P>
968 * By default, the two digit start date is set to 80 years before the current
969 * time at which a SimpleDateFormat object is created.
970 * @param status Filled in with U_ZERO_ERROR if the parse was successful, and with
971 * an error value if there was a parse error.
972 * @stable ICU 2.0
973 */
974 UDate get2DigitYearStart(UErrorCode& status) const;
975
976 /**
977 * Return a pattern string describing this date format.
978 * @param result Output param to receive the pattern.
979 * @return A reference to 'result'.
980 * @stable ICU 2.0
981 */
982 virtual UnicodeString& toPattern(UnicodeString& result) const;
983
984 /**
985 * Return a localized pattern string describing this date format.
986 * In most cases, this will return the same thing as toPattern(),
987 * but a locale can specify characters to use in pattern descriptions
988 * in place of the ones described in this class's class documentation.
989 * (Presumably, letters that would be more mnemonic in that locale's
990 * language.) This function would produce a pattern using those
991 * letters.
992 *
993 * @param result Receives the localized pattern.
994 * @param status Output param set to success/failure code on
995 * exit. If the pattern is invalid, this will be
996 * set to a failure result.
997 * @return A reference to 'result'.
998 * @stable ICU 2.0
999 */
1000 virtual UnicodeString& toLocalizedPattern(UnicodeString& result,
1001 UErrorCode& status) const;
1002
1003 /**
1004 * Apply the given unlocalized pattern string to this date format.
1005 * (i.e., after this call, this formatter will format dates according to
1006 * the new pattern)
1007 *
1008 * @param pattern The pattern to be applied.
1009 * @stable ICU 2.0
1010 */
1011 virtual void applyPattern(const UnicodeString& pattern);
1012
1013 /**
1014 * Apply the given localized pattern string to this date format.
1015 * (see toLocalizedPattern() for more information on localized patterns.)
1016 *
1017 * @param pattern The localized pattern to be applied.
1018 * @param status Output param set to success/failure code on
1019 * exit. If the pattern is invalid, this will be
1020 * set to a failure result.
1021 * @stable ICU 2.0
1022 */
1023 virtual void applyLocalizedPattern(const UnicodeString& pattern,
1024 UErrorCode& status);
1025
1026 /**
1027 * Gets the date/time formatting symbols (this is an object carrying
1028 * the various strings and other symbols used in formatting: e.g., month
1029 * names and abbreviations, time zone names, AM/PM strings, etc.)
1030 * @return a copy of the date-time formatting data associated
1031 * with this date-time formatter.
1032 * @stable ICU 2.0
1033 */
1034 virtual const DateFormatSymbols* getDateFormatSymbols(void) const;
1035
1036 /**
1037 * Set the date/time formatting symbols. The caller no longer owns the
1038 * DateFormatSymbols object and should not delete it after making this call.
1039 * @param newFormatSymbols the given date-time formatting symbols to copy.
1040 * @stable ICU 2.0
1041 */
1042 virtual void adoptDateFormatSymbols(DateFormatSymbols* newFormatSymbols);
1043
1044 /**
1045 * Set the date/time formatting data.
1046 * @param newFormatSymbols the given date-time formatting symbols to copy.
1047 * @stable ICU 2.0
1048 */
1049 virtual void setDateFormatSymbols(const DateFormatSymbols& newFormatSymbols);
1050
1051 /**
1052 * Return the class ID for this class. This is useful only for comparing to
1053 * a return value from getDynamicClassID(). For example:
1054 * <pre>
1055 * . Base* polymorphic_pointer = createPolymorphicObject();
1056 * . if (polymorphic_pointer->getDynamicClassID() ==
1057 * . erived::getStaticClassID()) ...
1058 * </pre>
1059 * @return The class ID for all objects of this class.
1060 * @stable ICU 2.0
1061 */
374ca955 1062 static UClassID U_EXPORT2 getStaticClassID(void);
b75a7d8f
A
1063
1064 /**
1065 * Returns a unique class ID POLYMORPHICALLY. Pure virtual override. This
1066 * method is to implement a simple version of RTTI, since not all C++
1067 * compilers support genuine RTTI. Polymorphic operator==() and clone()
1068 * methods call this method.
1069 *
1070 * @return The class ID for this object. All objects of a
1071 * given class have the same class ID. Objects of
1072 * other classes have different class IDs.
1073 * @stable ICU 2.0
1074 */
1075 virtual UClassID getDynamicClassID(void) const;
1076
1077 /**
1078 * Set the calendar to be used by this date format. Initially, the default
1079 * calendar for the specified or default locale is used. The caller should
1080 * not delete the Calendar object after it is adopted by this call.
1081 * Adopting a new calendar will change to the default symbols.
1082 *
1083 * @param calendarToAdopt Calendar object to be adopted.
1084 * @stable ICU 2.0
1085 */
1086 virtual void adoptCalendar(Calendar* calendarToAdopt);
1087
51004dcb 1088 /* Cannot use #ifndef U_HIDE_INTERNAL_API for the following methods since they are virtual */
4388f060
A
1089 /**
1090 * Sets the TimeZoneFormat to be used by this date/time formatter.
1091 * The caller should not delete the TimeZoneFormat object after
1092 * it is adopted by this call.
1093 * @param timeZoneFormatToAdopt The TimeZoneFormat object to be adopted.
1094 * @internal ICU 49 technology preview
1095 */
1096 virtual void adoptTimeZoneFormat(TimeZoneFormat* timeZoneFormatToAdopt);
1097
1098 /**
1099 * Sets the TimeZoneFormat to be used by this date/time formatter.
1100 * @param newTimeZoneFormat The TimeZoneFormat object to copy.
1101 * @internal ICU 49 technology preview
1102 */
1103 virtual void setTimeZoneFormat(const TimeZoneFormat& newTimeZoneFormat);
1104
1105 /**
1106 * Gets the time zone format object associated with this date/time formatter.
1107 * @return the time zone format associated with this date/time formatter.
1108 * @internal ICU 49 technology preview
1109 */
1110 virtual const TimeZoneFormat* getTimeZoneFormat(void) const;
4388f060 1111
57a6839d
A
1112 /* Cannot use #ifndef U_HIDE_DRAFT_API for the following draft method since it is virtual */
1113 /**
1114 * Set a particular UDisplayContext value in the formatter, such as
1115 * UDISPCTX_CAPITALIZATION_FOR_STANDALONE. Note: For getContext, see
1116 * DateFormat.
1117 * @param value The UDisplayContext value to set.
1118 * @param status Input/output status. If at entry this indicates a failure
1119 * status, the function will do nothing; otherwise this will be
1120 * updated with any new status from the function.
1121 * @draft ICU 53
1122 */
1123 virtual void setContext(UDisplayContext value, UErrorCode& status);
1124
4388f060 1125#ifndef U_HIDE_INTERNAL_API
46f4442e
A
1126 /**
1127 * This is for ICU internal use only. Please do not use.
1128 * Check whether the 'field' is smaller than all the fields covered in
729e4ab9 1129 * pattern, return TRUE if it is. The sequence of calendar field,
46f4442e
A
1130 * from large to small is: ERA, YEAR, MONTH, DATE, AM_PM, HOUR, MINUTE,...
1131 * @param field the calendar field need to check against
729e4ab9 1132 * @return TRUE if the 'field' is smaller than all the fields
46f4442e
A
1133 * covered in pattern. FALSE otherwise.
1134 * @internal ICU 4.0
1135 */
1136 UBool isFieldUnitIgnored(UCalendarDateFields field) const;
1137
1138
1139 /**
1140 * This is for ICU internal use only. Please do not use.
1141 * Check whether the 'field' is smaller than all the fields covered in
729e4ab9 1142 * pattern, return TRUE if it is. The sequence of calendar field,
46f4442e
A
1143 * from large to small is: ERA, YEAR, MONTH, DATE, AM_PM, HOUR, MINUTE,...
1144 * @param pattern the pattern to check against
1145 * @param field the calendar field need to check against
729e4ab9 1146 * @return TRUE if the 'field' is smaller than all the fields
46f4442e
A
1147 * covered in pattern. FALSE otherwise.
1148 * @internal ICU 4.0
1149 */
729e4ab9 1150 static UBool isFieldUnitIgnored(const UnicodeString& pattern,
46f4442e
A
1151 UCalendarDateFields field);
1152
46f4442e
A
1153 /**
1154 * This is for ICU internal use only. Please do not use.
1155 * Get the locale of this simple date formatter.
1156 * It is used in DateIntervalFormat.
1157 *
1158 * @return locale in this simple date formatter
1159 * @internal ICU 4.0
1160 */
1161 const Locale& getSmpFmtLocale(void) const;
4388f060 1162#endif /* U_HIDE_INTERNAL_API */
46f4442e 1163
b75a7d8f 1164private:
b75a7d8f
A
1165 friend class DateFormat;
1166
1167 void initializeDefaultCentury(void);
1168
57a6839d
A
1169 void initializeBooleanAttributes(void);
1170
b75a7d8f
A
1171 SimpleDateFormat(); // default constructor not implemented
1172
1173 /**
1174 * Used by the DateFormat factory methods to construct a SimpleDateFormat.
1175 * @param timeStyle the time style.
1176 * @param dateStyle the date style.
1177 * @param locale the given locale.
1178 * @param status Output param set to success/failure code on
1179 * exit.
1180 */
1181 SimpleDateFormat(EStyle timeStyle, EStyle dateStyle, const Locale& locale, UErrorCode& status);
1182
1183 /**
1184 * Construct a SimpleDateFormat for the given locale. If no resource data
1185 * is available, create an object of last resort, using hard-coded strings.
1186 * This is an internal method, called by DateFormat. It should never fail.
1187 * @param locale the given locale.
1188 * @param status Output param set to success/failure code on
1189 * exit.
1190 */
1191 SimpleDateFormat(const Locale& locale, UErrorCode& status); // Use default pattern
1192
729e4ab9
A
1193 /**
1194 * Hook called by format(... FieldPosition& ...) and format(...FieldPositionIterator&...)
1195 */
51004dcb 1196 UnicodeString& _format(Calendar& cal, UnicodeString& appendTo, FieldPositionHandler& handler, UErrorCode& status) const;
729e4ab9 1197
b75a7d8f
A
1198 /**
1199 * Called by format() to format a single field.
1200 *
1201 * @param appendTo Output parameter to receive result.
1202 * Result is appended to existing contents.
1203 * @param ch The format character we encountered in the pattern.
1204 * @param count Number of characters in the current pattern symbol (e.g.,
1205 * "yyyy" in the pattern would result in a call to this function
1206 * with ch equal to 'y' and count equal to 4)
4388f060
A
1207 * @param capitalizationContext Capitalization context for this date format.
1208 * @param fieldNum Zero-based numbering of current field within the overall format.
729e4ab9 1209 * @param handler Records information about field positions.
4388f060 1210 * @param cal Calendar to use
b75a7d8f
A
1211 * @param status Receives a status code, which will be U_ZERO_ERROR if the operation
1212 * succeeds.
1213 */
729e4ab9
A
1214 void subFormat(UnicodeString &appendTo,
1215 UChar ch,
1216 int32_t count,
51004dcb 1217 UDisplayContext capitalizationContext,
4388f060 1218 int32_t fieldNum,
729e4ab9
A
1219 FieldPositionHandler& handler,
1220 Calendar& cal,
1221 UErrorCode& status) const; // in case of illegal argument
b75a7d8f
A
1222
1223 /**
1224 * Used by subFormat() to format a numeric value.
1225 * Appends to toAppendTo a string representation of "value"
1226 * having a number of digits between "minDigits" and
1227 * "maxDigits". Uses the DateFormat's NumberFormat.
1228 *
4388f060 1229 * @param currentNumberFormat
b75a7d8f
A
1230 * @param appendTo Output parameter to receive result.
1231 * Formatted number is appended to existing contents.
1232 * @param value Value to format.
1233 * @param minDigits Minimum number of digits the result should have
1234 * @param maxDigits Maximum number of digits the result should have
1235 */
729e4ab9
A
1236 void zeroPaddingNumber(NumberFormat *currentNumberFormat,
1237 UnicodeString &appendTo,
1238 int32_t value,
1239 int32_t minDigits,
51004dcb
A
1240 int32_t maxDigits,
1241 UBool basicNumFmt) const;
b75a7d8f
A
1242
1243 /**
1244 * Return true if the given format character, occuring count
1245 * times, represents a numeric field.
1246 */
1247 static UBool isNumeric(UChar formatChar, int32_t count);
1248
51004dcb
A
1249 /**
1250 * Returns TRUE if the patternOffset is at the start of a numeric field.
1251 */
1252 static UBool isAtNumericField(const UnicodeString &pattern, int32_t patternOffset);
1253
1254 /**
1255 * Returns TRUE if the patternOffset is right after a non-numeric field.
1256 */
1257 static UBool isAfterNonNumericField(const UnicodeString &pattern, int32_t patternOffset);
1258
b75a7d8f
A
1259 /**
1260 * initializes fCalendar from parameters. Returns fCalendar as a convenience.
1261 * @param adoptZone Zone to be adopted, or NULL for TimeZone::createDefault().
1262 * @param locale Locale of the calendar
1263 * @param status Error code
1264 * @return the newly constructed fCalendar
1265 */
1266 Calendar *initializeCalendar(TimeZone* adoptZone, const Locale& locale, UErrorCode& status);
1267
1268 /**
1269 * initializes fSymbols from parameters.
1270 * @param locale Locale of the symbols
1271 * @param calendar Alias to Calendar that will be used.
1272 * @param status Error code
1273 */
1274 void initializeSymbols(const Locale& locale, Calendar* calendar, UErrorCode& status);
1275
1276 /**
1277 * Called by several of the constructors to load pattern data and formatting symbols
1278 * out of a resource bundle and initialize the locale based on it.
1279 * @param timeStyle The time style, as passed to DateFormat::createDateInstance().
1280 * @param dateStyle The date style, as passed to DateFormat::createTimeInstance().
1281 * @param locale The locale to load the patterns from.
1282 * @param status Filled in with an error code if loading the data from the
1283 * resources fails.
1284 */
1285 void construct(EStyle timeStyle, EStyle dateStyle, const Locale& locale, UErrorCode& status);
1286
1287 /**
1288 * Called by construct() and the various constructors to set up the SimpleDateFormat's
1289 * Calendar and NumberFormat objects.
1290 * @param locale The locale for which we want a Calendar and a NumberFormat.
4388f060 1291 * @param status Filled in with an error code if creating either subobject fails.
b75a7d8f
A
1292 */
1293 void initialize(const Locale& locale, UErrorCode& status);
1294
1295 /**
1296 * Private code-size reduction function used by subParse.
1297 * @param text the time text being parsed.
1298 * @param start where to start parsing.
1299 * @param field the date field being parsed.
1300 * @param stringArray the string array to parsed.
1301 * @param stringArrayCount the size of the array.
4388f060 1302 * @param monthPattern pointer to leap month pattern, or NULL if none.
b75a7d8f
A
1303 * @param cal a Calendar set to the date and time to be formatted
1304 * into a date/time string.
1305 * @return the new start position if matching succeeded; a negative number
1306 * indicating matching failure, otherwise.
1307 */
1308 int32_t matchString(const UnicodeString& text, int32_t start, UCalendarDateFields field,
4388f060
A
1309 const UnicodeString* stringArray, int32_t stringArrayCount,
1310 const UnicodeString* monthPattern, Calendar& cal) const;
b75a7d8f 1311
73c04bcf
A
1312 /**
1313 * Private code-size reduction function used by subParse.
1314 * @param text the time text being parsed.
1315 * @param start where to start parsing.
1316 * @param field the date field being parsed.
1317 * @param stringArray the string array to parsed.
1318 * @param stringArrayCount the size of the array.
1319 * @param cal a Calendar set to the date and time to be formatted
1320 * into a date/time string.
1321 * @return the new start position if matching succeeded; a negative number
1322 * indicating matching failure, otherwise.
1323 */
1324 int32_t matchQuarterString(const UnicodeString& text, int32_t start, UCalendarDateFields field,
1325 const UnicodeString* stringArray, int32_t stringArrayCount, Calendar& cal) const;
46f4442e
A
1326
1327 /**
1328 * Private function used by subParse to match literal pattern text.
1329 *
1330 * @param pattern the pattern string
1331 * @param patternOffset the starting offset into the pattern text. On
1332 * outupt will be set the offset of the first non-literal character in the pattern
1333 * @param text the text being parsed
1334 * @param textOffset the starting offset into the text. On output
1335 * will be set to the offset of the character after the match
57a6839d
A
1336 * @param whitespaceLenient <code>TRUE</code> if whitespace parse is lenient, <code>FALSE</code> otherwise.
1337 * @param partialMatchLenient <code>TRUE</code> if partial match parse is lenient, <code>FALSE</code> otherwise.
46f4442e
A
1338 *
1339 * @return <code>TRUE</code> if the literal text could be matched, <code>FALSE</code> otherwise.
1340 */
1341 static UBool matchLiterals(const UnicodeString &pattern, int32_t &patternOffset,
57a6839d
A
1342 const UnicodeString &text, int32_t &textOffset,
1343 UBool whitespaceLenient, UBool partialMatchLenient);
46f4442e 1344
b75a7d8f
A
1345 /**
1346 * Private member function that converts the parsed date strings into
1347 * timeFields. Returns -start (for ParsePosition) if failed.
1348 * @param text the time text to be parsed.
1349 * @param start where to start parsing.
1350 * @param ch the pattern character for the date field text to be parsed.
1351 * @param count the count of a pattern character.
1352 * @param obeyCount if true then the count is strictly obeyed.
4388f060 1353 * @param allowNegative
b75a7d8f 1354 * @param ambiguousYear If true then the two-digit year == the default start year.
729e4ab9 1355 * @param saveHebrewMonth Used to hang onto month until year is known.
b75a7d8f
A
1356 * @param cal a Calendar set to the date and time to be formatted
1357 * into a date/time string.
4388f060
A
1358 * @param patLoc
1359 * @param numericLeapMonthFormatter If non-null, used to parse numeric leap months.
57a6839d
A
1360 * @param tzTimeType the type of parsed time zone - standard, daylight or unknown (output).
1361 * This parameter can be NULL if caller does not need the information.
b75a7d8f
A
1362 * @return the new start position if matching succeeded; a negative number
1363 * indicating matching failure, otherwise.
1364 */
1365 int32_t subParse(const UnicodeString& text, int32_t& start, UChar ch, int32_t count,
729e4ab9 1366 UBool obeyCount, UBool allowNegative, UBool ambiguousYear[], int32_t& saveHebrewMonth, Calendar& cal,
57a6839d 1367 int32_t patLoc, MessageFormat * numericLeapMonthFormatter, UTimeZoneFormatTimeType *tzTimeType) const;
b75a7d8f
A
1368
1369 void parseInt(const UnicodeString& text,
1370 Formattable& number,
1371 ParsePosition& pos,
729e4ab9
A
1372 UBool allowNegative,
1373 NumberFormat *fmt) const;
b75a7d8f 1374
46f4442e
A
1375 void parseInt(const UnicodeString& text,
1376 Formattable& number,
1377 int32_t maxDigits,
1378 ParsePosition& pos,
729e4ab9
A
1379 UBool allowNegative,
1380 NumberFormat *fmt) const;
1381
1382 int32_t checkIntSuffix(const UnicodeString& text, int32_t start,
1383 int32_t patLoc, UBool isNegative) const;
46f4442e 1384
b75a7d8f
A
1385 /**
1386 * Translate a pattern, mapping each character in the from string to the
1387 * corresponding character in the to string. Return an error if the original
1388 * pattern contains an unmapped character, or if a quote is unmatched.
1389 * Quoted (single quotes only) material is not translated.
1390 * @param originalPattern the original pattern.
1391 * @param translatedPattern Output param to receive the translited pattern.
1392 * @param from the characters to be translited from.
1393 * @param to the characters to be translited to.
374ca955 1394 * @param status Receives a status code, which will be U_ZERO_ERROR
b75a7d8f
A
1395 * if the operation succeeds.
1396 */
1397 static void translatePattern(const UnicodeString& originalPattern,
1398 UnicodeString& translatedPattern,
1399 const UnicodeString& from,
1400 const UnicodeString& to,
1401 UErrorCode& status);
1402
1403 /**
1404 * Sets the starting date of the 100-year window that dates with 2-digit years
1405 * are considered to fall within.
1406 * @param startDate the start date
374ca955 1407 * @param status Receives a status code, which will be U_ZERO_ERROR
b75a7d8f
A
1408 * if the operation succeeds.
1409 */
1410 void parseAmbiguousDatesAsAfter(UDate startDate, UErrorCode& status);
729e4ab9
A
1411
1412 /**
1413 * Return the length matched by the given affix, or -1 if none.
1414 * Runs of white space in the affix, match runs of white space in
1415 * the input.
1416 * @param affix pattern string, taken as a literal
1417 * @param input input text
1418 * @param pos offset into input at which to begin matching
1419 * @return length of input that matches, or -1 if match failure
1420 */
1421 int32_t compareSimpleAffix(const UnicodeString& affix,
1422 const UnicodeString& input,
1423 int32_t pos) const;
1424
1425 /**
4388f060 1426 * Skip over a run of zero or more Pattern_White_Space characters at
729e4ab9
A
1427 * pos in text.
1428 */
4388f060 1429 int32_t skipPatternWhiteSpace(const UnicodeString& text, int32_t pos) const;
729e4ab9
A
1430
1431 /**
1432 * Skip over a run of zero or more isUWhiteSpace() characters at pos
1433 * in text.
1434 */
1435 int32_t skipUWhiteSpace(const UnicodeString& text, int32_t pos) const;
1436
729e4ab9
A
1437 /**
1438 * Initialize NumberFormat instances used for numbering system overrides.
1439 */
1440 void initNumberFormatters(const Locale &locale,UErrorCode &status);
1441
1442 /**
1443 * Get the numbering system to be used for a particular field.
1444 */
1445 NumberFormat * getNumberFormatByIndex(UDateFormatField index) const;
1446
1447 /**
1448 * Parse the given override string and set up structures for number formats
1449 */
1450 void processOverrideString(const Locale &locale, const UnicodeString &str, int8_t type, UErrorCode &status);
1451
b75a7d8f
A
1452 /**
1453 * Used to map pattern characters to Calendar field identifiers.
1454 */
1455 static const UCalendarDateFields fgPatternIndexToCalendarField[];
1456
1457 /**
1458 * Map index into pattern character string to DateFormat field number
1459 */
374ca955 1460 static const UDateFormatField fgPatternIndexToDateFormatField[];
b75a7d8f 1461
4388f060
A
1462 /**
1463 * Lazy TimeZoneFormat instantiation, semantically const
1464 */
1465 TimeZoneFormat *tzFormat() const;
1466
46f4442e
A
1467 /**
1468 * Used to map Calendar field to field level.
1469 * The larger the level, the smaller the field unit.
1470 * For example, UCAL_ERA level is 0, UCAL_YEAR level is 10,
1471 * UCAL_MONTH level is 20.
1472 */
1473 static const int32_t fgCalendarFieldToLevel[];
1474 static const int32_t fgPatternCharToLevel[];
1475
b75a7d8f
A
1476 /**
1477 * The formatting pattern for this formatter.
1478 */
1479 UnicodeString fPattern;
1480
729e4ab9
A
1481 /**
1482 * The numbering system override for dates.
1483 */
1484 UnicodeString fDateOverride;
1485
1486 /**
1487 * The numbering system override for times.
1488 */
1489 UnicodeString fTimeOverride;
1490
1491
b75a7d8f
A
1492 /**
1493 * The original locale used (for reloading symbols)
1494 */
1495 Locale fLocale;
1496
1497 /**
1498 * A pointer to an object containing the strings to use in formatting (e.g.,
1499 * month and day names, AM and PM strings, time zone names, etc.)
1500 */
1501 DateFormatSymbols* fSymbols; // Owned
1502
4388f060
A
1503 /**
1504 * The time zone formatter
1505 */
1506 TimeZoneFormat* fTimeZoneFormat;
1507
b75a7d8f
A
1508 /**
1509 * If dates have ambiguous years, we map them into the century starting
1510 * at defaultCenturyStart, which may be any date. If defaultCenturyStart is
1511 * set to SYSTEM_DEFAULT_CENTURY, which it is by default, then the system
1512 * values are used. The instance values defaultCenturyStart and
1513 * defaultCenturyStartYear are only used if explicitly set by the user
1514 * through the API method parseAmbiguousDatesAsAfter().
1515 */
1516 UDate fDefaultCenturyStart;
1517
1518 /**
1519 * See documentation for defaultCenturyStart.
1520 */
1521 /*transient*/ int32_t fDefaultCenturyStartYear;
b75a7d8f 1522
729e4ab9
A
1523 typedef struct NSOverride {
1524 NumberFormat *nf;
1525 int32_t hash;
1526 NSOverride *next;
1527 } NSOverride;
1528
729e4ab9
A
1529 NumberFormat **fNumberFormatters;
1530
1531 NSOverride *fOverrideList;
73c04bcf 1532
374ca955 1533 UBool fHaveDefaultCentury;
4388f060 1534
57a6839d 1535 BreakIterator* fCapitalizationBrkIter;
b75a7d8f
A
1536};
1537
b75a7d8f
A
1538inline UDate
1539SimpleDateFormat::get2DigitYearStart(UErrorCode& /*status*/) const
1540{
1541 return fDefaultCenturyStart;
1542}
1543
b75a7d8f
A
1544U_NAMESPACE_END
1545
1546#endif /* #if !UCONFIG_NO_FORMATTING */
1547
1548#endif // _SMPDTFMT
1549//eof