]> git.saurik.com Git - apple/icu.git/blame - icuSources/test/testdata/test4.ucm
ICU-66108.tar.gz
[apple/icu.git] / icuSources / test / testdata / test4.ucm
CommitLineData
f3c0d7a5
A
1# Copyright (C) 2016 and later: Unicode, Inc. and others.
2# License & terms of use: http://www.unicode.org/copyright.html
b75a7d8f 3# *******************************************************************************
374ca955 4# * Copyright (C) 2001-2003, International Business Machines
b75a7d8f
A
5# * Corporation and others. All Rights Reserved.
6# *******************************************************************************
7#
8# test4.ucm
9#
374ca955 10# Test file for MBCS conversion with four-byte codepage data.
b75a7d8f
A
11
12<code_set_name> "test4"
13<mb_cur_max> 4
14<mb_cur_min> 1
15<uconv_class> "MBCS"
374ca955
A
16
17# both subchars are single bytes, which does not make sense
18# but works - subchar1 was added for tests without wanting to
19# change old tests for a new subchar -- markus 20031028
20<subchar> \xff
21<subchar1> \xe1
22<icu:state> 0, 1:1, 5-9, e1, ff
23<icu:state> 2:2
24<icu:state> 3:3
25<icu:state> a-f.p, ff
b75a7d8f
A
26
27CHARMAP
28
29# fromUnicode result is a zero byte from a code point other than U+0000
30<U20ac> \x00 |0
31
374ca955
A
32# a fallback from a non-zero code point to a zero byte is possible with an extension table
33<U20ad> \x00 |1
34
b75a7d8f
A
35# nothing special
36<U0005> \x05 |0
37
38# toUnicode result is a direct code point reached via a fallback (|3)
39<U0006> \x06 |3
40
41# toUnicode result is direct non-BMP code point
42<U101234> \x07 |0
43<Ufebcd> \x08 |3
44
45#unassigned \x09
46
47# toUnicode result is a surrogate pair: test a real pair, a single unit, and unassigned
48<U23456> \x01\x02\x03\x0a |0
49<U000b> \x01\x02\x03\x0b |0
50#unassigned \x01\x02\x03\x0c
51<U34567> \x01\x02\x03\x0d |3
52<U000e> \x01\x02\x03\x0e |3
53#unassigned \x01\x02\x03\x0f
54
374ca955
A
55# <subchar1> non-mapping
56<U50005> \xe1 |2
57# add a mapping that turns the above's Unicode side into a prefix
58<U50005><U60006> \x06 |1
59
60# many bytes, and bytes per UChar
61<U30ab><U309a> \x01\x02\x03\x0a\x01\x02\x03\x0b\x01\x02\x03\x0c\x01\x02\x03\x0d\x01\x02\x03\x0e\x01\x02\x03\x0f\x01\x02\x03\x0a\x05\x06\x07 |0
62
63# many UChars, and UChars per byte
64<U304b><U309a><U304d><U309a><U304f><U309a><U3051><U309a><U3053><U309a><U30ab><U309a><U30ad><U309a><U30af><U309a><U30b1><U309a><U0300> \x08\x09 |0
65
b75a7d8f 66END CHARMAP