1 # PropertyAliases-13.0.0.txt
2 # Date: 2019-10-23, 03:46:32 GMT
3 # © 2019 Unicode®, Inc.
4 # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries.
5 # For terms of use, see http://www.unicode.org/terms_of_use.html
7 # Unicode Character Database
8 # For documentation, see http://www.unicode.org/reports/tr44/
10 # This file contains aliases for properties used in the UCD.
11 # These names can be used for XML formats of UCD data, for regular-expression
12 # property tests, and other programmatic textual descriptions of Unicode data.
14 # The names may be translated in appropriate environments, and additional
15 # aliases may be useful.
19 # Each line has two or more fields, separated by semicolons.
21 # First Field: The first field is the short name for the property.
22 # It is typically an abbreviation, but in a number of cases it is simply
23 # a duplicate of the "long name" in the second field.
24 # For Unihan database tags, the short name is actually a longer string than
25 # the tag specified in the second field.
27 # Second Field: The second field is the long name for the property,
28 # typically the formal name used in documentation about the property.
30 # The above are the preferred aliases. Other aliases may be listed in additional fields.
32 # Loose matching should be applied to all property names and property values, with
33 # the exception of String Property values. With loose matching of property names and
34 # values, the case distinctions, whitespace, and '_' are ignored. For Numeric Property
35 # values, numeric equivalencies are applied: thus "01.00" is equivalent to "1".
37 # NOTE: Property value names are NOT unique across properties. For example:
39 # AL means Arabic Letter for the Bidi_Class property, and
40 # AL means Above_Left for the Combining_Class property, and
41 # AL means Alphabetic for the Line_Break property.
43 # In addition, some property names may be the same as some property value names.
44 # For example:
46 # sc means the Script property, and
47 # Sc means the General_Category property value Currency_Symbol (Sc)
49 # The combination of property value and property name is, however, unique.
51 # For more information, see UAX #44, Unicode Character Database, and
52 # UTS #18, Unicode Regular Expressions.
53 # ================================================
56 # ================================================
57 # Numeric Properties
58 # ================================================
59 cjkAccountingNumeric ; kAccountingNumeric
60 cjkOtherNumeric ; kOtherNumeric
61 cjkPrimaryNumeric ; kPrimaryNumeric
64 # ================================================
65 # String Properties
66 # ================================================
68 cjkCompatibilityVariant ; kCompatibilityVariant
69 dm ; Decomposition_Mapping
70 FC_NFKC ; FC_NFKC_Closure
71 lc ; Lowercase_Mapping
72 NFKC_CF ; NFKC_Casefold
73 scf ; Simple_Case_Folding ; sfc
74 slc ; Simple_Lowercase_Mapping
75 stc ; Simple_Titlecase_Mapping
76 suc ; Simple_Uppercase_Mapping
77 tc ; Titlecase_Mapping
78 uc ; Uppercase_Mapping
80 # ================================================
81 # Miscellaneous Properties
82 # ================================================
83 bmg ; Bidi_Mirroring_Glyph
84 bpb ; Bidi_Paired_Bracket
86 cjkIRG_GSource ; kIRG_GSource
87 cjkIRG_HSource ; kIRG_HSource
88 cjkIRG_JSource ; kIRG_JSource
89 cjkIRG_KPSource ; kIRG_KPSource
90 cjkIRG_KSource ; kIRG_KSource
91 cjkIRG_MSource ; kIRG_MSource
92 cjkIRG_SSource ; kIRG_SSource
93 cjkIRG_TSource ; kIRG_TSource
94 cjkIRG_UKSource ; kIRG_UKSource
95 cjkIRG_USource ; kIRG_USource
96 cjkIRG_VSource ; kIRG_VSource
97 cjkRSUnicode ; kRSUnicode ; Unicode_Radical_Stroke; URS
98 EqUIdeo ; Equivalent_Unified_Ideograph
100 JSN ; Jamo_Short_Name
103 Name_Alias ; Name_Alias
104 scx ; Script_Extensions
106 # ================================================
107 # Catalog Properties
108 # ================================================
113 # ================================================
114 # Enumerated Properties
115 # ================================================
117 bpt ; Bidi_Paired_Bracket_Type
118 ccc ; Canonical_Combining_Class
119 dt ; Decomposition_Type
120 ea ; East_Asian_Width
121 gc ; General_Category
122 GCB ; Grapheme_Cluster_Break
123 hst ; Hangul_Syllable_Type
124 InPC ; Indic_Positional_Category
125 InSC ; Indic_Syllabic_Category
129 NFC_QC ; NFC_Quick_Check
130 NFD_QC ; NFD_Quick_Check
131 NFKC_QC ; NFKC_Quick_Check
132 NFKD_QC ; NFKD_Quick_Check
135 vo ; Vertical_Orientation
138 # ================================================
139 # Binary Properties
140 # ================================================
141 AHex ; ASCII_Hex_Digit
143 Bidi_C ; Bidi_Control
144 Bidi_M ; Bidi_Mirrored
146 CE ; Composition_Exclusion
148 Comp_Ex ; Full_Composition_Exclusion
149 CWCF ; Changes_When_Casefolded
150 CWCM ; Changes_When_Casemapped
151 CWKCF ; Changes_When_NFKC_Casefolded
152 CWL ; Changes_When_Lowercased
153 CWT ; Changes_When_Titlecased
154 CWU ; Changes_When_Uppercased
157 DI ; Default_Ignorable_Code_Point
159 EBase ; Emoji_Modifier_Base
160 EComp ; Emoji_Component
161 EMod ; Emoji_Modifier
163 EPres ; Emoji_Presentation
165 ExtPict ; Extended_Pictographic
166 Gr_Base ; Grapheme_Base
167 Gr_Ext ; Grapheme_Extend
168 Gr_Link ; Grapheme_Link
174 IDSB ; IDS_Binary_Operator
175 IDST ; IDS_Trinary_Operator
176 Join_C ; Join_Control
177 LOE ; Logical_Order_Exception
180 NChar ; Noncharacter_Code_Point
181 OAlpha ; Other_Alphabetic
182 ODI ; Other_Default_Ignorable_Code_Point
183 OGr_Ext ; Other_Grapheme_Extend
184 OIDC ; Other_ID_Continue
185 OIDS ; Other_ID_Start
186 OLower ; Other_Lowercase
188 OUpper ; Other_Uppercase
189 Pat_Syn ; Pattern_Syntax
190 Pat_WS ; Pattern_White_Space
191 PCM ; Prepended_Concatenation_Mark
192 QMark ; Quotation_Mark
194 RI ; Regional_Indicator
196 STerm ; Sentence_Terminal
197 Term ; Terminal_Punctuation
198 UIdeo ; Unified_Ideograph
200 VS ; Variation_Selector
201 WSpace ; White_Space ; space
204 XO_NFC ; Expands_On_NFC
205 XO_NFD ; Expands_On_NFD
206 XO_NFKC ; Expands_On_NFKC
207 XO_NFKD ; Expands_On_NFKD
209 # ================================================