]> git.saurik.com Git - apple/icu.git/blame - icuSources/test/testdata/test4.ucm
ICU-6.2.22.tar.gz
[apple/icu.git] / icuSources / test / testdata / test4.ucm
CommitLineData
b75a7d8f 1# *******************************************************************************
374ca955 2# * Copyright (C) 2001-2003, International Business Machines
b75a7d8f
A
3# * Corporation and others. All Rights Reserved.
4# *******************************************************************************
5#
6# test4.ucm
7#
374ca955 8# Test file for MBCS conversion with four-byte codepage data.
b75a7d8f
A
9
10<code_set_name> "test4"
11<mb_cur_max> 4
12<mb_cur_min> 1
13<uconv_class> "MBCS"
374ca955
A
14
15# Both subchars are single-byte, which does not make sense
16# but works. subchar1 was added for tests, but we did not want to
17# change the old tests to use a new subchar -- markus 20031028
18<subchar> \xff
19<subchar1> \xe1
20<icu:state> 0, 1:1, 5-9, e1, ff
21<icu:state> 2:2
22<icu:state> 3:3
23<icu:state> a-f.p, ff
b75a7d8f
A
24
25CHARMAP
26
27# fromUnicode result is a zero byte from a code point other than U+0000
28<U20ac> \x00 |0
29
374ca955
A
30# a fallback from a non-zero code point to a zero byte is possible with an extension table
31<U20ad> \x00 |1
32
b75a7d8f
A
33# nothing special
34<U0005> \x05 |0
35
36# toUnicode result is fallback direct
37<U0006> \x06 |3
38
39# toUnicode result is direct non-BMP code point
40<U101234> \x07 |0
41<Ufebcd> \x08 |3
42
43#unassigned \x09
44
45# toUnicode result is surrogate pair: test real pair, single unit, unassigned
46<U23456> \x01\x02\x03\x0a |0
47<U000b> \x01\x02\x03\x0b |0
48#unassigned \x01\x02\x03\x0c
49<U34567> \x01\x02\x03\x0d |3
50<U000e> \x01\x02\x03\x0e |3
51#unassigned \x01\x02\x03\x0f
52
374ca955
A
53# <subchar1> non-mapping
54<U50005> \xe1 |2
55# add a mapping that turns the Unicode side of the mapping above (U+50005) into a prefix
56<U50005><U60006> \x06 |1
57
58# many bytes, and many bytes per UChar
59<U30ab><U309a> \x01\x02\x03\x0a\x01\x02\x03\x0b\x01\x02\x03\x0c\x01\x02\x03\x0d\x01\x02\x03\x0e\x01\x02\x03\x0f\x01\x02\x03\x0a\x05\x06\x07 |0
60
61# many UChars, and many UChars per byte
62<U304b><U309a><U304d><U309a><U304f><U309a><U3051><U309a><U3053><U309a><U30ab><U309a><U30ad><U309a><U30af><U309a><U30b1><U309a><U0300> \x08\x09 |0
63
b75a7d8f 64END CHARMAP