1 # PropertyValueAliases-4.0.0.txt
2 # Date: 2003-03-12, 23:46:08 GMT [MD]
4 # This file contains aliases for property values used in the UCD.
5 # These names can be used for XML formats of UCD data, for regular-expression
6 # property tests, and other programmatic textual descriptions of Unicode data.
7 # For information on which properties are normative, see UCD.html.
9 # The names may be translated in appropriate environments, and additional
10 # aliases may be useful.
14 # Each line describes a property value name.
15 # This consists of three fields, separated by semicolons.
17 # First Field: The first field describes the property for which that
18 # property value name is used.
19 # There is one special pseudo-property: "qc" stands for any quick-check property.
21 # Second Field: The second field is an abbreviated name.
22 # If there is no abbreviated name available, the field is marked with "n/a".
24 # Third Field: The third field is a long name.
26 # In the case of ccc, there are 4 fields. The second field is numeric, the third
27 # is abbreviated, and the fourth is long.
29 # With loose matching of property names, the case distinctions, whitespace,
30 # and '_' are ignored.
32 # NOTE: Currently there is at most one abbreviated name and one long name for
33 # each property value. However, in the future additional aliases may be added.
34 # In such a case, the first line for the property value would have
35 # the preferred alias for output.
37 # NOTE: The property value names are NOT unique across properties, especially
38 # with loose matches. For example:
40 # AL means Arabic Letter for the Bidi_Class property, and
41 # AL means Above_Left for the Combining_Class property, and
42 # AL means Alphabetic for the Line_Break property.
44 # In addition, some property names may be the same as some property value names. For example:
47 # cc means the Combining_Class property, and
48 # cc means the General_Category property value Control (cc).
50 # The combination of property value and property name is, however, unique.
51 # For more information, see UTR #18: Regular Expression Guidelines.
52 # ================================================
55 bc ; AL ; Arabic_Letter
56 bc ; AN ; Arabic_Number
57 bc ; B ; Paragraph_Separator
58 bc ; BN ; Boundary_Neutral
59 bc ; CS ; Common_Separator
60 bc ; EN ; European_Number
61 bc ; ES ; European_Separator
62 bc ; ET ; European_Terminator
63 bc ; L ; Left_To_Right
64 bc ; LRE ; Left_To_Right_Embedding
65 bc ; LRO ; Left_To_Right_Override
66 bc ; NSM ; Nonspacing_Mark
67 bc ; ON ; Other_Neutral
68 bc ; PDF ; Pop_Directional_Format
69 bc ; R ; Right_To_Left
70 bc ; RLE ; Right_To_Left_Embedding
71 bc ; RLO ; Right_To_Left_Override
72 bc ; S ; Segment_Separator
75 blk; n/a ; Aegean_Numbers
76 blk; n/a ; Alphabetic_Presentation_Forms
78 blk; n/a ; Arabic_Presentation_Forms-A
79 blk; n/a ; Arabic_Presentation_Forms-B
82 blk; n/a ; Basic_Latin
84 blk; n/a ; Block_Elements
86 blk; n/a ; Bopomofo_Extended
87 blk; n/a ; Box_Drawing
88 blk; n/a ; Braille_Patterns
90 blk; n/a ; Byzantine_Musical_Symbols
92 blk; n/a ; CJK_Compatibility
93 blk; n/a ; CJK_Compatibility_Forms
94 blk; n/a ; CJK_Compatibility_Ideographs
95 blk; n/a ; CJK_Compatibility_Ideographs_Supplement
96 blk; n/a ; CJK_Radicals_Supplement
97 blk; n/a ; CJK_Symbols_and_Punctuation
98 blk; n/a ; CJK_Unified_Ideographs
99 blk; n/a ; CJK_Unified_Ideographs_Extension_A
100 blk; n/a ; CJK_Unified_Ideographs_Extension_B
101 blk; n/a ; Combining_Diacritical_Marks
102 blk; n/a ; Combining_Diacritical_Marks_for_Symbols
103 blk; n/a ; Combining_Half_Marks
104 blk; n/a ; Control_Pictures
105 blk; n/a ; Currency_Symbols
106 blk; n/a ; Cypriot_Syllabary
108 blk; n/a ; Cyrillic_Supplementary
110 blk; n/a ; Devanagari
112 blk; n/a ; Enclosed_Alphanumerics
113 blk; n/a ; Enclosed_CJK_Letters_and_Months
115 blk; n/a ; General_Punctuation
116 blk; n/a ; Geometric_Shapes
119 blk; n/a ; Greek_and_Coptic
120 blk; n/a ; Greek_Extended
123 blk; n/a ; Halfwidth_and_Fullwidth_Forms
124 blk; n/a ; Hangul_Compatibility_Jamo
125 blk; n/a ; Hangul_Jamo
126 blk; n/a ; Hangul_Syllables
129 blk; n/a ; High_Private_Use_Surrogates
130 blk; n/a ; High_Surrogates
132 blk; n/a ; Ideographic_Description_Characters
133 blk; n/a ; IPA_Extensions
135 blk; n/a ; Kangxi_Radicals
138 blk; n/a ; Katakana_Phonetic_Extensions
140 blk; n/a ; Khmer_Symbols
142 blk; n/a ; Latin_Extended_Additional
143 blk; n/a ; Latin_Extended-A
144 blk; n/a ; Latin_Extended-B
145 blk; n/a ; Latin-1_Supplement
146 blk; n/a ; Letterlike_Symbols
148 blk; n/a ; Linear_B_Ideograms
149 blk; n/a ; Linear_B_Syllabary
150 blk; n/a ; Low_Surrogates
152 blk; n/a ; Mathematical_Alphanumeric_Symbols
153 blk; n/a ; Mathematical_Operators
154 blk; n/a ; Miscellaneous_Mathematical_Symbols-A
155 blk; n/a ; Miscellaneous_Mathematical_Symbols-B
156 blk; n/a ; Miscellaneous_Symbols
157 blk; n/a ; Miscellaneous_Symbols_and_Arrows
158 blk; n/a ; Miscellaneous_Technical
160 blk; n/a ; Musical_Symbols
163 blk; n/a ; Number_Forms
165 blk; n/a ; Old_Italic
166 blk; n/a ; Optical_Character_Recognition
169 blk; n/a ; Phonetic_Extensions
170 blk; n/a ; Private_Use_Area
174 blk; n/a ; Small_Form_Variants
175 blk; n/a ; Spacing_Modifier_Letters
177 blk; n/a ; Superscripts_and_Subscripts
178 blk; n/a ; Supplemental_Arrows-A
179 blk; n/a ; Supplemental_Arrows-B
180 blk; n/a ; Supplemental_Mathematical_Operators
181 blk; n/a ; Supplementary_Private_Use_Area-A
182 blk; n/a ; Supplementary_Private_Use_Area-B
188 blk; n/a ; Tai_Xuan_Jing_Symbols
195 blk; n/a ; Unified_Canadian_Aboriginal_Syllabics
196 blk; n/a ; Variation_Selectors
197 blk; n/a ; Variation_Selectors_Supplement
198 blk; n/a ; Yi_Radicals
199 blk; n/a ; Yi_Syllables
200 blk; n/a ; Yijing_Hexagram_Symbols
202 ccc; 0; NR ; Not_Reordered
204 ccc; 202; ATB ; Attached_Below
205 ccc; 216; ATAR ; Attached_Above_Right
206 ccc; 218; BL ; Below_Left
208 ccc; 222; BR ; Below_Right
211 ccc; 228; AL ; Above_Left
213 ccc; 232; AR ; Above_Right
214 ccc; 233; DB ; Double_Below
215 ccc; 234; DA ; Double_Above
216 ccc; 240; IS ; Iota_Subscript
218 ccc; 8; KV ; Kana_Voicing
247 gc ; C ; Other # Cc | Cf | Cn | Co | Cs
251 gc ; Co ; Private_Use
253 gc ; L ; Letter # Ll | Lm | Lo | Lt | Lu
254 gc ; LC ; Cased_Letter # Ll | Lt | Lu
255 gc ; Ll ; Lowercase_Letter
256 gc ; Lm ; Modifier_Letter
257 gc ; Lo ; Other_Letter
258 gc ; Lt ; Titlecase_Letter
259 gc ; Lu ; Uppercase_Letter
260 gc ; M ; Mark # Mc | Me | Mn
261 gc ; Mc ; Spacing_Mark
262 gc ; Me ; Enclosing_Mark
263 gc ; Mn ; Nonspacing_Mark
264 gc ; N ; Number # Nd | Nl | No
265 gc ; Nd ; Decimal_Number
266 gc ; Nl ; Letter_Number
267 gc ; No ; Other_Number
268 gc ; P ; Punctuation # Pc | Pd | Pe | Pf | Pi | Po | Ps
269 gc ; Pc ; Connector_Punctuation
270 gc ; Pd ; Dash_Punctuation
271 gc ; Pe ; Close_Punctuation
272 gc ; Pf ; Final_Punctuation
273 gc ; Pi ; Initial_Punctuation
274 gc ; Po ; Other_Punctuation
275 gc ; Ps ; Open_Punctuation
276 gc ; S ; Symbol # Sc | Sk | Sm | So
277 gc ; Sc ; Currency_Symbol
278 gc ; Sk ; Modifier_Symbol
279 gc ; Sm ; Math_Symbol
280 gc ; So ; Other_Symbol
281 gc ; Z ; Separator # Zl | Zp | Zs
282 gc ; Zl ; Line_Separator
283 gc ; Zp ; Paragraph_Separator
284 gc ; Zs ; Space_Separator
286 hst; L ; Leading_Jamo
287 hst; LV ; LV_Syllable
288 hst; LVT ; LVT_Syllable
289 hst; NA ; Not_Applicable
290 hst; T ; Trailing_Jamo
299 jg ; n/a ; DALATH_RISH
303 jg ; n/a ; FINAL_SEMKATH
307 jg ; n/a ; HAMZA_ON_HEH_GOAL
315 jg ; n/a ; KNOTTED_HEH
320 jg ; n/a ; NO_JOINING_GROUP
327 jg ; n/a ; REVERSED_PE
334 jg ; n/a ; SYRIAC_WAW
337 jg ; n/a ; TEH_MARBUTA
341 jg ; n/a ; YEH_BARREE
342 jg ; n/a ; YEH_WITH_TAIL
348 jt ; C ; Join_Causing
349 jt ; D ; Dual_Joining
350 jt ; L ; Left_Joining
351 jt ; R ; Right_Joining
358 lb ; BA ; Break_After
359 lb ; BB ; Break_Before
360 lb ; BK ; Mandatory_Break
361 lb ; CB ; Contingent_Break
362 lb ; CL ; Close_Punctuation
363 lb ; CM ; Combining_Mark
364 lb ; CR ; Carriage_Return
365 lb ; EX ; Exclamation
368 lb ; ID ; Ideographic
369 lb ; IN ; Inseperable
370 lb ; IS ; Infix_Numeric
375 lb ; OP ; Open_Punctuation
376 lb ; PO ; Postfix_Numeric
377 lb ; PR ; Prefix_Numeric
379 lb ; SA ; Complex_Context
382 lb ; SY ; Break_Symbols
383 lb ; WJ ; Word_Joiner
402 sc ; Cans ; Canadian_Aboriginal
406 sc ; Deva ; Devanagari
419 sc ; Ital ; Old_Italic
427 sc ; Mlym ; Malayalam
428 sc ; Mong ; Mongolian
433 sc ; Qaai ; Inherited