]>
Commit | Line | Data |
---|---|---|
f3c0d7a5 A |
1 | # Copyright (C) 2016 and later: Unicode, Inc. and others. |
2 | # License & terms of use: http://www.unicode.org/copyright.html | |
b75a7d8f | 3 | # ******************************************************************************* |
374ca955 | 4 | # * Copyright (C) 2001-2003, International Business Machines |
b75a7d8f A |
5 | # * Corporation and others. All Rights Reserved. |
6 | # ******************************************************************************* | |
7 | # | |
8 | # test4.ucm | |
9 | # | |
374ca955 | 10 | # Test file for MBCS conversion with four-byte codepage data. |
b75a7d8f A |
11 | |
12 | <code_set_name> "test4" | |
13 | <mb_cur_max> 4 | |
14 | <mb_cur_min> 1 | |
15 | <uconv_class> "MBCS" | |
374ca955 A |
16 | |
17 | # both subchars are single-byters, which does not make sense | |
18 | # but works - adding subchar1 for tests but don't want to | |
19 | # change old tests for a new subchar -- markus 20031028 | |
20 | <subchar> \xff | |
21 | <subchar1> \xe1 | |
22 | <icu:state> 0, 1:1, 5-9, e1, ff | |
23 | <icu:state> 2:2 | |
24 | <icu:state> 3:3 | |
25 | <icu:state> a-f.p, ff | |
b75a7d8f A |
26 | |
27 | CHARMAP | |
28 | ||
29 | # fromUnicode result is zero byte from other than U+0000 | |
30 | <U20ac> \x00 |0 | |
31 | ||
374ca955 A |
32 | # fallback from non-zero to zero possible with extension table |
33 | <U20ad> \x00 |1 | |
34 | ||
b75a7d8f A |
35 | # nothing special |
36 | <U0005> \x05 |0 | |
37 | ||
38 | # toUnicode result is fallback direct | |
39 | <U0006> \x06 |3 | |
40 | ||
41 | # toUnicode result is direct non-BMP code point | |
42 | <U101234> \x07 |0 | |
43 | <Ufebcd> \x08 |3 | |
44 | ||
45 | #unassigned \x09 | |
46 | ||
47 | # toUnicode result is surrogate pair: test real pair, single unit, unassigned | |
48 | <U23456> \x01\x02\x03\x0a |0 | |
49 | <U000b> \x01\x02\x03\x0b |0 | |
50 | #unassigned \x01\x02\x03\x0c | |
51 | <U34567> \x01\x02\x03\x0d |3 | |
52 | <U000e> \x01\x02\x03\x0e |3 | |
53 | #unassigned \x01\x02\x03\x0f | |
54 | ||
374ca955 A |
55 | # <subchar1> non-mapping |
56 | <U50005> \xe1 |2 | |
57 | # add a mapping that turns the above's Unicode side into a prefix | |
58 | <U50005><U60006> \x06 |1 | |
59 | ||
60 | # many bytes, and bytes per UChar | |
61 | <U30ab><U309a> \x01\x02\x03\x0a\x01\x02\x03\x0b\x01\x02\x03\x0c\x01\x02\x03\x0d\x01\x02\x03\x0e\x01\x02\x03\x0f\x01\x02\x03\x0a\x05\x06\x07 |0 | |
62 | ||
63 | # many UChars, and UChars per byte | |
64 | <U304b><U309a><U304d><U309a><U304f><U309a><U3051><U309a><U3053><U309a><U30ab><U309a><U30ad><U309a><U30af><U309a><U30b1><U309a><U0300> \x08\x09 |0 | |
65 | ||
b75a7d8f | 66 | END CHARMAP |