]> git.saurik.com Git - apple/icu.git/blame - icuSources/data/unidata/PropertyValueAliases.txt
ICU-3.13.tar.gz
[apple/icu.git] / icuSources / data / unidata / PropertyValueAliases.txt
CommitLineData
b75a7d8f
A
1# PropertyValueAliases-4.0.0.txt
2# Date: 2003-03-12, 23:46:08 GMT [MD]
3#
4# This file contains aliases for property values used in the UCD.
5# These names can be used for XML formats of UCD data, for regular-expression
6# property tests, and other programmatic textual descriptions of Unicode data.
7# For information on which properties are normative, see UCD.html.
8#
9# The names may be translated in appropriate environments, and additional
10# aliases may be useful.
11#
12# FORMAT
13#
14# Each line describes a property value name.
15# This consists of three fields, separated by semicolons.
16#
17# First Field: The first field describes the property for which that
18# property value name is used.
19# There is one special pseudo-property: "qc" stands for any quick-check property.
20#
21# Second Field: The second field is an abbreviated name.
22# If there is no abbreviated name available, the field is marked with "n/a".
23#
24# Third Field: The third field is a long name.
25#
26# In the case of ccc, there are 4 fields. The second field is numeric, third
27# is abbreviated, and fourth is long.
28#
29# With loose matching of property names, the case distinctions, whitespace,
30# and '_' are ignored.
31#
32# NOTE: Currently there is at most one abbreviated name and one long name for
33# each property value. However, in the future additional aliases may be added.
34# In such a case, the first line for the property value would have
35# the preferred alias for output.
36#
37# NOTE: The property value names are NOT unique across properties, especially
38# with loose matches. For example:
39#
40# AL means Arabic Letter for the Bidi_Class property, and
41# AL means Above_Left for the Combining_Class property, and
42# AL means Alphabetic for the Line_Break property.
43#
44# In addition, some property names may be the same as some property value names.
45# For example:
46#
47# cc means Combining_Class property, and
48# cc means the General_Category property value Control (cc)
49#
50# The combination of property value and property name is, however, unique.
51# For more information, see UTR #18: Regular Expression Guidelines
52# ================================================
53
54
55bc ; AL ; Arabic_Letter
56bc ; AN ; Arabic_Number
57bc ; B ; Paragraph_Separator
58bc ; BN ; Boundary_Neutral
59bc ; CS ; Common_Separator
60bc ; EN ; European_Number
61bc ; ES ; European_Separator
62bc ; ET ; European_Terminator
63bc ; L ; Left_To_Right
64bc ; LRE ; Left_To_Right_Embedding
65bc ; LRO ; Left_To_Right_Override
66bc ; NSM ; Nonspacing_Mark
67bc ; ON ; Other_Neutral
68bc ; PDF ; Pop_Directional_Format
69bc ; R ; Right_To_Left
70bc ; RLE ; Right_To_Left_Embedding
71bc ; RLO ; Right_To_Left_Override
72bc ; S ; Segment_Separator
73bc ; WS ; White_Space
74
75blk; n/a ; Aegean_Numbers
76blk; n/a ; Alphabetic_Presentation_Forms
77blk; n/a ; Arabic
78blk; n/a ; Arabic_Presentation_Forms-A
79blk; n/a ; Arabic_Presentation_Forms-B
80blk; n/a ; Armenian
81blk; n/a ; Arrows
82blk; n/a ; Basic_Latin
83blk; n/a ; Bengali
84blk; n/a ; Block_Elements
85blk; n/a ; Bopomofo
86blk; n/a ; Bopomofo_Extended
87blk; n/a ; Box_Drawing
88blk; n/a ; Braille_Patterns
89blk; n/a ; Buhid
90blk; n/a ; Byzantine_Musical_Symbols
91blk; n/a ; Cherokee
92blk; n/a ; CJK_Compatibility
93blk; n/a ; CJK_Compatibility_Forms
94blk; n/a ; CJK_Compatibility_Ideographs
95blk; n/a ; CJK_Compatibility_Ideographs_Supplement
96blk; n/a ; CJK_Radicals_Supplement
97blk; n/a ; CJK_Symbols_and_Punctuation
98blk; n/a ; CJK_Unified_Ideographs
99blk; n/a ; CJK_Unified_Ideographs_Extension_A
100blk; n/a ; CJK_Unified_Ideographs_Extension_B
101blk; n/a ; Combining_Diacritical_Marks
102blk; n/a ; Combining_Diacritical_Marks_for_Symbols
103blk; n/a ; Combining_Half_Marks
104blk; n/a ; Control_Pictures
105blk; n/a ; Currency_Symbols
106blk; n/a ; Cypriot_Syllabary
107blk; n/a ; Cyrillic
108blk; n/a ; Cyrillic_Supplementary
109blk; n/a ; Deseret
110blk; n/a ; Devanagari
111blk; n/a ; Dingbats
112blk; n/a ; Enclosed_Alphanumerics
113blk; n/a ; Enclosed_CJK_Letters_and_Months
114blk; n/a ; Ethiopic
115blk; n/a ; General_Punctuation
116blk; n/a ; Geometric_Shapes
117blk; n/a ; Georgian
118blk; n/a ; Gothic
119blk; n/a ; Greek_and_Coptic
120blk; n/a ; Greek_Extended
121blk; n/a ; Gujarati
122blk; n/a ; Gurmukhi
123blk; n/a ; Halfwidth_and_Fullwidth_Forms
124blk; n/a ; Hangul_Compatibility_Jamo
125blk; n/a ; Hangul_Jamo
126blk; n/a ; Hangul_Syllables
127blk; n/a ; Hanunoo
128blk; n/a ; Hebrew
129blk; n/a ; High_Private_Use_Surrogates
130blk; n/a ; High_Surrogates
131blk; n/a ; Hiragana
132blk; n/a ; Ideographic_Description_Characters
133blk; n/a ; IPA_Extensions
134blk; n/a ; Kanbun
135blk; n/a ; Kangxi_Radicals
136blk; n/a ; Kannada
137blk; n/a ; Katakana
138blk; n/a ; Katakana_Phonetic_Extensions
139blk; n/a ; Khmer
140blk; n/a ; Khmer_Symbols
141blk; n/a ; Lao
142blk; n/a ; Latin_Extended_Additional
143blk; n/a ; Latin_Extended-A
144blk; n/a ; Latin_Extended-B
145blk; n/a ; Latin-1_Supplement
146blk; n/a ; Letterlike_Symbols
147blk; n/a ; Limbu
148blk; n/a ; Linear_B_Ideograms
149blk; n/a ; Linear_B_Syllabary
150blk; n/a ; Low_Surrogates
151blk; n/a ; Malayalam
152blk; n/a ; Mathematical_Alphanumeric_Symbols
153blk; n/a ; Mathematical_Operators
154blk; n/a ; Miscellaneous_Mathematical_Symbols-A
155blk; n/a ; Miscellaneous_Mathematical_Symbols-B
156blk; n/a ; Miscellaneous_Symbols
157blk; n/a ; Miscellaneous_Symbols_and_Arrows
158blk; n/a ; Miscellaneous_Technical
159blk; n/a ; Mongolian
160blk; n/a ; Musical_Symbols
161blk; n/a ; Myanmar
162blk; n/a ; No_Block
163blk; n/a ; Number_Forms
164blk; n/a ; Ogham
165blk; n/a ; Old_Italic
166blk; n/a ; Optical_Character_Recognition
167blk; n/a ; Oriya
168blk; n/a ; Osmanya
169blk; n/a ; Phonetic_Extensions
170blk; n/a ; Private_Use_Area
171blk; n/a ; Runic
172blk; n/a ; Shavian
173blk; n/a ; Sinhala
174blk; n/a ; Small_Form_Variants
175blk; n/a ; Spacing_Modifier_Letters
176blk; n/a ; Specials
177blk; n/a ; Superscripts_and_Subscripts
178blk; n/a ; Supplemental_Arrows-A
179blk; n/a ; Supplemental_Arrows-B
180blk; n/a ; Supplemental_Mathematical_Operators
181blk; n/a ; Supplementary_Private_Use_Area-A
182blk; n/a ; Supplementary_Private_Use_Area-B
183blk; n/a ; Syriac
184blk; n/a ; Tagalog
185blk; n/a ; Tagbanwa
186blk; n/a ; Tags
187blk; n/a ; Tai_Le
188blk; n/a ; Tai_Xuan_Jing_Symbols
189blk; n/a ; Tamil
190blk; n/a ; Telugu
191blk; n/a ; Thaana
192blk; n/a ; Thai
193blk; n/a ; Tibetan
194blk; n/a ; Ugaritic
195blk; n/a ; Unified_Canadian_Aboriginal_Syllabics
196blk; n/a ; Variation_Selectors
197blk; n/a ; Variation_Selectors_Supplement
198blk; n/a ; Yi_Radicals
199blk; n/a ; Yi_Syllables
200blk; n/a ; Yijing_Hexagram_Symbols
201
202ccc; 0; NR ; Not_Reordered
203ccc; 1; OV ; Overlay
204ccc; 202; ATB ; Attached_Below
205ccc; 216; ATAR ; Attached_Above_Right
206ccc; 218; BL ; Below_Left
207ccc; 220; B ; Below
208ccc; 222; BR ; Below_Right
209ccc; 224; L ; Left
210ccc; 226; R ; Right
211ccc; 228; AL ; Above_Left
212ccc; 230; A ; Above
213ccc; 232; AR ; Above_Right
214ccc; 233; DB ; Double_Below
215ccc; 234; DA ; Double_Above
216ccc; 240; IS ; Iota_Subscript
217ccc; 7; NK ; Nukta
218ccc; 8; KV ; Kana_Voicing
219ccc; 9; VR ; Virama
220
221dt ; can ; canonical
222dt ; com ; compat
223dt ; enc ; circle
224dt ; fin ; final
225dt ; font ; font
226dt ; fra ; fraction
227dt ; init ; initial
228dt ; iso ; isolated
229dt ; med ; medial
230dt ; n/a ; none
231dt ; nar ; narrow
232dt ; nb ; noBreak
233dt ; sml ; small
234dt ; sqr ; square
235dt ; sub ; sub
236dt ; sup ; super
237dt ; vert ; vertical
238dt ; wide ; wide
239
240ea ; A ; Ambiguous
241ea ; F ; Fullwidth
242ea ; H ; Halfwidth
243ea ; N ; Neutral
244ea ; Na ; Narrow
245ea ; W ; Wide
246
247gc ; C ; Other # Cc | Cf | Cn | Co | Cs
248gc ; Cc ; Control
249gc ; Cf ; Format
250gc ; Cn ; Unassigned
251gc ; Co ; Private_Use
252gc ; Cs ; Surrogate
253gc ; L ; Letter # Ll | Lm | Lo | Lt | Lu
254gc ; LC ; Cased_Letter # Ll | Lt | Lu
255gc ; Ll ; Lowercase_Letter
256gc ; Lm ; Modifier_Letter
257gc ; Lo ; Other_Letter
258gc ; Lt ; Titlecase_Letter
259gc ; Lu ; Uppercase_Letter
260gc ; M ; Mark # Mc | Me | Mn
261gc ; Mc ; Spacing_Mark
262gc ; Me ; Enclosing_Mark
263gc ; Mn ; Nonspacing_Mark
264gc ; N ; Number # Nd | Nl | No
265gc ; Nd ; Decimal_Number
266gc ; Nl ; Letter_Number
267gc ; No ; Other_Number
268gc ; P ; Punctuation # Pc | Pd | Pe | Pf | Pi | Po | Ps
269gc ; Pc ; Connector_Punctuation
270gc ; Pd ; Dash_Punctuation
271gc ; Pe ; Close_Punctuation
272gc ; Pf ; Final_Punctuation
273gc ; Pi ; Initial_Punctuation
274gc ; Po ; Other_Punctuation
275gc ; Ps ; Open_Punctuation
276gc ; S ; Symbol # Sc | Sk | Sm | So
277gc ; Sc ; Currency_Symbol
278gc ; Sk ; Modifier_Symbol
279gc ; Sm ; Math_Symbol
280gc ; So ; Other_Symbol
281gc ; Z ; Separator # Zl | Zp | Zs
282gc ; Zl ; Line_Separator
283gc ; Zp ; Paragraph_Separator
284gc ; Zs ; Space_Separator
285
286hst; L ; Leading_Jamo
287hst; LV ; LV_Syllable
288hst; LVT ; LVT_Syllable
289hst; NA ; Not_Applicable
290hst; T ; Trailing_Jamo
291hst; V ; Vowel_Jamo
292
293jg ; n/a ; AIN
294jg ; n/a ; ALAPH
295jg ; n/a ; ALEF
296jg ; n/a ; BEH
297jg ; n/a ; BETH
298jg ; n/a ; DAL
299jg ; n/a ; DALATH_RISH
300jg ; n/a ; E
301jg ; n/a ; FE
302jg ; n/a ; FEH
303jg ; n/a ; FINAL_SEMKATH
304jg ; n/a ; GAF
305jg ; n/a ; GAMAL
306jg ; n/a ; HAH
307jg ; n/a ; HAMZA_ON_HEH_GOAL
308jg ; n/a ; HE
309jg ; n/a ; HEH
310jg ; n/a ; HEH_GOAL
311jg ; n/a ; HETH
312jg ; n/a ; KAF
313jg ; n/a ; KAPH
314jg ; n/a ; KHAPH
315jg ; n/a ; KNOTTED_HEH
316jg ; n/a ; LAM
317jg ; n/a ; LAMADH
318jg ; n/a ; MEEM
319jg ; n/a ; MIM
320jg ; n/a ; NO_JOINING_GROUP
321jg ; n/a ; NOON
322jg ; n/a ; NUN
323jg ; n/a ; PE
324jg ; n/a ; QAF
325jg ; n/a ; QAPH
326jg ; n/a ; REH
327jg ; n/a ; REVERSED_PE
328jg ; n/a ; SAD
329jg ; n/a ; SADHE
330jg ; n/a ; SEEN
331jg ; n/a ; SEMKATH
332jg ; n/a ; SHIN
333jg ; n/a ; SWASH_KAF
334jg ; n/a ; SYRIAC_WAW
335jg ; n/a ; TAH
336jg ; n/a ; TAW
337jg ; n/a ; TEH_MARBUTA
338jg ; n/a ; TETH
339jg ; n/a ; WAW
340jg ; n/a ; YEH
341jg ; n/a ; YEH_BARREE
342jg ; n/a ; YEH_WITH_TAIL
343jg ; n/a ; YUDH
344jg ; n/a ; YUDH_HE
345jg ; n/a ; ZAIN
346jg ; n/a ; ZHAIN
347
348jt ; C ; Join_Causing
349jt ; D ; Dual_Joining
350jt ; L ; Left_Joining
351jt ; R ; Right_Joining
352jt ; T ; Transparent
353jt ; U ; Non_Joining
354
355lb ; AI ; Ambiguous
356lb ; AL ; Alphabetic
357lb ; B2 ; Break_Both
358lb ; BA ; Break_After
359lb ; BB ; Break_Before
360lb ; BK ; Mandatory_Break
361lb ; CB ; Contingent_Break
362lb ; CL ; Close_Punctuation
363lb ; CM ; Combining_Mark
364lb ; CR ; Carriage_Return
365lb ; EX ; Exclamation
366lb ; GL ; Glue
367lb ; HY ; Hyphen
368lb ; ID ; Ideographic
369lb ; IN ; Inseperable
370lb ; IS ; Infix_Numeric
371lb ; LF ; Line_Feed
372lb ; NL ; Next_Line
373lb ; NS ; Nonstarter
374lb ; NU ; Numeric
375lb ; OP ; Open_Punctuation
376lb ; PO ; Postfix_Numeric
377lb ; PR ; Prefix_Numeric
378lb ; QU ; Quotation
379lb ; SA ; Complex_Context
380lb ; SG ; Surrogate
381lb ; SP ; Space
382lb ; SY ; Break_Symbols
383lb ; WJ ; Word_Joiner
384lb ; XX ; Unknown
385lb ; ZW ; ZWSpace
386
387nt ; de ; Decimal
388nt ; di ; Digit
389nt ; n/a ; None
390nt ; nu ; Numeric
391
392qc ; M ; Maybe
393qc ; N ; No
394qc ; Y ; Yes
395
396sc ; Arab ; Arabic
397sc ; Armn ; Armenian
398sc ; Beng ; Bengali
399sc ; Bopo ; Bopomofo
400sc ; Brai ; Braille
401sc ; Buhd ; Buhid
402sc ; Cans ; Canadian_Aboriginal
403sc ; Cher ; Cherokee
404sc ; Cprt ; Cypriot
405sc ; Cyrl ; Cyrillic
406sc ; Deva ; Devanagari
407sc ; Dsrt ; Deseret
408sc ; Ethi ; Ethiopic
409sc ; Geor ; Georgian
410sc ; Goth ; Gothic
411sc ; Grek ; Greek
412sc ; Gujr ; Gujarati
413sc ; Guru ; Gurmukhi
414sc ; Hang ; Hangul
415sc ; Hani ; Han
416sc ; Hano ; Hanunoo
417sc ; Hebr ; Hebrew
418sc ; Hira ; Hiragana
419sc ; Ital ; Old_Italic
420sc ; Kana ; Katakana
421sc ; Khmr ; Khmer
422sc ; Knda ; Kannada
423sc ; Laoo ; Lao
424sc ; Latn ; Latin
425sc ; Limb ; Limbu
426sc ; Linb ; Linear_B
427sc ; Mlym ; Malayalam
428sc ; Mong ; Mongolian
429sc ; Mymr ; Myanmar
430sc ; Ogam ; Ogham
431sc ; Orya ; Oriya
432sc ; Osma ; Osmanya
433sc ; Qaai ; Inherited
434sc ; Runr ; Runic
435sc ; Shaw ; Shavian
436sc ; Sinh ; Sinhala
437sc ; Syrc ; Syriac
438sc ; Tagb ; Tagbanwa
439sc ; Tale ; Tai_Le
440sc ; Taml ; Tamil
441sc ; Telu ; Telugu
442sc ; Tglg ; Tagalog
443sc ; Thaa ; Thaana
444sc ; Thai ; Thai
445sc ; Tibt ; Tibetan
446sc ; Ugar ; Ugaritic
447sc ; Yiii ; Yi
448sc ; Zyyy ; Common