1 | # PropertyValueAliases-4.1.0.txt
|
---|
2 | # Date: 2005-03-28, 17:21:48 GMT [MD]
|
---|
3 | #
|
---|
4 | # Unicode Character Database
|
---|
5 | # Copyright (c) 1991-2005 Unicode, Inc.
|
---|
6 | # For terms of use, see http://www.unicode.org/terms_of_use.html
|
---|
7 | # For documentation, see UCD.html
|
---|
8 | #
|
---|
9 | # This file contains aliases for property values used in the UCD.
|
---|
10 | # These names can be used for XML formats of UCD data, for regular-expression
|
---|
11 | # property tests, and other programmatic textual descriptions of Unicode data.
|
---|
12 | # For information on which properties are normative, see UCD.html.
|
---|
13 | #
|
---|
14 | # The names may be translated in appropriate environments, and additional
|
---|
15 | # aliases may be useful.
|
---|
16 | #
|
---|
17 | # FORMAT
|
---|
18 | #
|
---|
19 | # Each line describes a property value name.
|
---|
20 | # This consists of three or more fields, separated by semicolons.
|
---|
21 | #
|
---|
22 | # First Field: The first field describes the property for which that
|
---|
23 | # property value name is used.
|
---|
24 | #
|
---|
25 | # Second Field: The second field is an abbreviated name.
|
---|
26 | # If there is no abbreviated name available, the field is marked with "n/a".
|
---|
27 | #
|
---|
28 | # Third Field: The third field is a long name.
|
---|
29 | #
|
---|
30 | # In the case of ccc, there are 4 fields. The second field is numeric, third
|
---|
31 | # is abbreviated, and fourth is long.
|
---|
32 | #
|
---|
33 | # The above are the preferred aliases. Other aliases may be listed in additional fields.
|
---|
34 | #
|
---|
35 | # Loose matching should be applied to all property names and property values, with
|
---|
36 | # the exception of String Property values. With loose matching of property names and
|
---|
37 | # values, the case distinctions, whitespace, and '_' are ignored. For Numeric Property
|
---|
38 | # values, numeric equivalencies are applied: thus "01.00" is equivalent to "1".
|
---|
39 | #
|
---|
40 | # NOTE: Property value names are NOT unique across properties. For example:
|
---|
41 | #
|
---|
42 | # AL means Arabic Letter for the Bidi_Class property, and
|
---|
43 | # AL means Above_Left for the Canonical_Combining_Class property, and
|
---|
44 | # AL means Alphabetic for the Line_Break property.
|
---|
45 | #
|
---|
46 | # In addition, some property names may be the same as some property value names.
|
---|
47 | # For example:
|
---|
48 | #
|
---|
49 | # sc means the Script property, and
|
---|
50 | # Sc means the General_Category property value Currency_Symbol (Sc)
|
---|
51 | #
|
---|
52 | # The combination of property value and property name is, however, unique.
|
---|
53 | #
|
---|
54 | # For more information, see UTS #18: Unicode Regular Expressions
|
---|
55 | # ================================================
|
---|
56 |
|
---|
57 |
|
---|
58 | # Age (age)
|
---|
59 |
|
---|
60 | age; n/a ; 1.1
|
---|
61 | age; n/a ; 2.0
|
---|
62 | age; n/a ; 2.1
|
---|
63 | age; n/a ; 3.0
|
---|
64 | age; n/a ; 3.1
|
---|
65 | age; n/a ; 3.2
|
---|
66 | age; n/a ; 4.0
|
---|
67 | age; n/a ; 4.1
|
---|
68 | age; n/a ; unassigned
|
---|
69 |
|
---|
70 | # Bidi_Class (bc)
|
---|
71 |
|
---|
72 | bc ; AL ; Arabic_Letter
|
---|
73 | bc ; AN ; Arabic_Number
|
---|
74 | bc ; B ; Paragraph_Separator
|
---|
75 | bc ; BN ; Boundary_Neutral
|
---|
76 | bc ; CS ; Common_Separator
|
---|
77 | bc ; EN ; European_Number
|
---|
78 | bc ; ES ; European_Separator
|
---|
79 | bc ; ET ; European_Terminator
|
---|
80 | bc ; L ; Left_To_Right
|
---|
81 | bc ; LRE ; Left_To_Right_Embedding
|
---|
82 | bc ; LRO ; Left_To_Right_Override
|
---|
83 | bc ; NSM ; Nonspacing_Mark
|
---|
84 | bc ; ON ; Other_Neutral
|
---|
85 | bc ; PDF ; Pop_Directional_Format
|
---|
86 | bc ; R ; Right_To_Left
|
---|
87 | bc ; RLE ; Right_To_Left_Embedding
|
---|
88 | bc ; RLO ; Right_To_Left_Override
|
---|
89 | bc ; S ; Segment_Separator
|
---|
90 | bc ; WS ; White_Space
|
---|
91 |
|
---|
92 | # Block (blk)
|
---|
93 |
|
---|
94 | blk; n/a ; Aegean_Numbers
|
---|
95 | blk; n/a ; Alphabetic_Presentation_Forms
|
---|
96 | blk; n/a ; Ancient_Greek_Musical_Notation
|
---|
97 | blk; n/a ; Ancient_Greek_Numbers
|
---|
98 | blk; n/a ; Arabic
|
---|
99 | blk; n/a ; Arabic_Presentation_Forms-A
|
---|
100 | blk; n/a ; Arabic_Presentation_Forms-B
|
---|
101 | blk; n/a ; Arabic_Supplement
|
---|
102 | blk; n/a ; Armenian
|
---|
103 | blk; n/a ; Arrows
|
---|
104 | blk; n/a ; Basic_Latin
|
---|
105 | blk; n/a ; Bengali
|
---|
106 | blk; n/a ; Block_Elements
|
---|
107 | blk; n/a ; Bopomofo
|
---|
108 | blk; n/a ; Bopomofo_Extended
|
---|
109 | blk; n/a ; Box_Drawing
|
---|
110 | blk; n/a ; Braille_Patterns
|
---|
111 | blk; n/a ; Buginese
|
---|
112 | blk; n/a ; Buhid
|
---|
113 | blk; n/a ; Byzantine_Musical_Symbols
|
---|
114 | blk; n/a ; Cherokee
|
---|
115 | blk; n/a ; CJK_Compatibility
|
---|
116 | blk; n/a ; CJK_Compatibility_Forms
|
---|
117 | blk; n/a ; CJK_Compatibility_Ideographs
|
---|
118 | blk; n/a ; CJK_Compatibility_Ideographs_Supplement
|
---|
119 | blk; n/a ; CJK_Radicals_Supplement
|
---|
120 | blk; n/a ; CJK_Strokes
|
---|
121 | blk; n/a ; CJK_Symbols_and_Punctuation
|
---|
122 | blk; n/a ; CJK_Unified_Ideographs
|
---|
123 | blk; n/a ; CJK_Unified_Ideographs_Extension_A
|
---|
124 | blk; n/a ; CJK_Unified_Ideographs_Extension_B
|
---|
125 | blk; n/a ; Combining_Diacritical_Marks
|
---|
126 | blk; n/a ; Combining_Diacritical_Marks_for_Symbols
|
---|
127 | blk; n/a ; Combining_Diacritical_Marks_Supplement
|
---|
128 | blk; n/a ; Combining_Half_Marks
|
---|
129 | blk; n/a ; Control_Pictures
|
---|
130 | blk; n/a ; Coptic
|
---|
131 | blk; n/a ; Currency_Symbols
|
---|
132 | blk; n/a ; Cypriot_Syllabary
|
---|
133 | blk; n/a ; Cyrillic
|
---|
134 | blk; n/a ; Cyrillic_Supplement ; Cyrillic_Supplementary
|
---|
135 | blk; n/a ; Deseret
|
---|
136 | blk; n/a ; Devanagari
|
---|
137 | blk; n/a ; Dingbats
|
---|
138 | blk; n/a ; Enclosed_Alphanumerics
|
---|
139 | blk; n/a ; Enclosed_CJK_Letters_and_Months
|
---|
140 | blk; n/a ; Ethiopic
|
---|
141 | blk; n/a ; Ethiopic_Extended
|
---|
142 | blk; n/a ; Ethiopic_Supplement
|
---|
143 | blk; n/a ; General_Punctuation
|
---|
144 | blk; n/a ; Geometric_Shapes
|
---|
145 | blk; n/a ; Georgian
|
---|
146 | blk; n/a ; Georgian_Supplement
|
---|
147 | blk; n/a ; Glagolitic
|
---|
148 | blk; n/a ; Gothic
|
---|
149 | blk; n/a ; Greek_and_Coptic
|
---|
150 | blk; n/a ; Greek_Extended
|
---|
151 | blk; n/a ; Gujarati
|
---|
152 | blk; n/a ; Gurmukhi
|
---|
153 | blk; n/a ; Halfwidth_and_Fullwidth_Forms
|
---|
154 | blk; n/a ; Hangul_Compatibility_Jamo
|
---|
155 | blk; n/a ; Hangul_Jamo
|
---|
156 | blk; n/a ; Hangul_Syllables
|
---|
157 | blk; n/a ; Hanunoo
|
---|
158 | blk; n/a ; Hebrew
|
---|
159 | blk; n/a ; High_Private_Use_Surrogates
|
---|
160 | blk; n/a ; High_Surrogates
|
---|
161 | blk; n/a ; Hiragana
|
---|
162 | blk; n/a ; Ideographic_Description_Characters
|
---|
163 | blk; n/a ; IPA_Extensions
|
---|
164 | blk; n/a ; Kanbun
|
---|
165 | blk; n/a ; Kangxi_Radicals
|
---|
166 | blk; n/a ; Kannada
|
---|
167 | blk; n/a ; Katakana
|
---|
168 | blk; n/a ; Katakana_Phonetic_Extensions
|
---|
169 | blk; n/a ; Kharoshthi
|
---|
170 | blk; n/a ; Khmer
|
---|
171 | blk; n/a ; Khmer_Symbols
|
---|
172 | blk; n/a ; Lao
|
---|
173 | blk; n/a ; Latin-1_Supplement
|
---|
174 | blk; n/a ; Latin_Extended-A
|
---|
175 | blk; n/a ; Latin_Extended-B
|
---|
176 | blk; n/a ; Latin_Extended_Additional
|
---|
177 | blk; n/a ; Letterlike_Symbols
|
---|
178 | blk; n/a ; Limbu
|
---|
179 | blk; n/a ; Linear_B_Ideograms
|
---|
180 | blk; n/a ; Linear_B_Syllabary
|
---|
181 | blk; n/a ; Low_Surrogates
|
---|
182 | blk; n/a ; Malayalam
|
---|
183 | blk; n/a ; Mathematical_Alphanumeric_Symbols
|
---|
184 | blk; n/a ; Mathematical_Operators
|
---|
185 | blk; n/a ; Miscellaneous_Mathematical_Symbols-A
|
---|
186 | blk; n/a ; Miscellaneous_Mathematical_Symbols-B
|
---|
187 | blk; n/a ; Miscellaneous_Symbols
|
---|
188 | blk; n/a ; Miscellaneous_Symbols_and_Arrows
|
---|
189 | blk; n/a ; Miscellaneous_Technical
|
---|
190 | blk; n/a ; Modifier_Tone_Letters
|
---|
191 | blk; n/a ; Mongolian
|
---|
192 | blk; n/a ; Musical_Symbols
|
---|
193 | blk; n/a ; Myanmar
|
---|
194 | blk; n/a ; New_Tai_Lue
|
---|
195 | blk; n/a ; No_Block
|
---|
196 | blk; n/a ; Number_Forms
|
---|
197 | blk; n/a ; Ogham
|
---|
198 | blk; n/a ; Old_Italic
|
---|
199 | blk; n/a ; Old_Persian
|
---|
200 | blk; n/a ; Optical_Character_Recognition
|
---|
201 | blk; n/a ; Oriya
|
---|
202 | blk; n/a ; Osmanya
|
---|
203 | blk; n/a ; Phonetic_Extensions
|
---|
204 | blk; n/a ; Phonetic_Extensions_Supplement
|
---|
205 | blk; n/a ; Private_Use_Area
|
---|
206 | blk; n/a ; Runic
|
---|
207 | blk; n/a ; Shavian
|
---|
208 | blk; n/a ; Sinhala
|
---|
209 | blk; n/a ; Small_Form_Variants
|
---|
210 | blk; n/a ; Spacing_Modifier_Letters
|
---|
211 | blk; n/a ; Specials
|
---|
212 | blk; n/a ; Superscripts_and_Subscripts
|
---|
213 | blk; n/a ; Supplemental_Arrows-A
|
---|
214 | blk; n/a ; Supplemental_Arrows-B
|
---|
215 | blk; n/a ; Supplemental_Mathematical_Operators
|
---|
216 | blk; n/a ; Supplemental_Punctuation
|
---|
217 | blk; n/a ; Supplementary_Private_Use_Area-A
|
---|
218 | blk; n/a ; Supplementary_Private_Use_Area-B
|
---|
219 | blk; n/a ; Syloti_Nagri
|
---|
220 | blk; n/a ; Syriac
|
---|
221 | blk; n/a ; Tagalog
|
---|
222 | blk; n/a ; Tagbanwa
|
---|
223 | blk; n/a ; Tags
|
---|
224 | blk; n/a ; Tai_Le
|
---|
225 | blk; n/a ; Tai_Xuan_Jing_Symbols
|
---|
226 | blk; n/a ; Tamil
|
---|
227 | blk; n/a ; Telugu
|
---|
228 | blk; n/a ; Thaana
|
---|
229 | blk; n/a ; Thai
|
---|
230 | blk; n/a ; Tibetan
|
---|
231 | blk; n/a ; Tifinagh
|
---|
232 | blk; n/a ; Ugaritic
|
---|
233 | blk; n/a ; Unified_Canadian_Aboriginal_Syllabics
|
---|
234 | blk; n/a ; Variation_Selectors
|
---|
235 | blk; n/a ; Variation_Selectors_Supplement
|
---|
236 | blk; n/a ; Vertical_Forms
|
---|
237 | blk; n/a ; Yi_Radicals
|
---|
238 | blk; n/a ; Yi_Syllables
|
---|
239 | blk; n/a ; Yijing_Hexagram_Symbols
|
---|
240 |
|
---|
241 | # Canonical_Combining_Class (ccc)
|
---|
242 |
|
---|
243 | ccc; 0; NR ; Not_Reordered
|
---|
244 | ccc; 1; OV ; Overlay
|
---|
245 | ccc; 7; NK ; Nukta
|
---|
246 | ccc; 8; KV ; Kana_Voicing
|
---|
247 | ccc; 9; VR ; Virama
|
---|
248 | ccc; 200; ATBL ; Attached_Below_Left
|
---|
249 | ccc; 202; ATB ; Attached_Below
|
---|
250 | ccc; 216; ATAR ; Attached_Above_Right
|
---|
251 | ccc; 218; BL ; Below_Left
|
---|
252 | ccc; 220; B ; Below
|
---|
253 | ccc; 222; BR ; Below_Right
|
---|
254 | ccc; 224; L ; Left
|
---|
255 | ccc; 226; R ; Right
|
---|
256 | ccc; 228; AL ; Above_Left
|
---|
257 | ccc; 230; A ; Above
|
---|
258 | ccc; 232; AR ; Above_Right
|
---|
259 | ccc; 233; DB ; Double_Below
|
---|
260 | ccc; 234; DA ; Double_Above
|
---|
261 | ccc; 240; IS ; Iota_Subscript
|
---|
262 |
|
---|
263 | # Decomposition_Type (dt)
|
---|
264 |
|
---|
265 | dt ; can ; Canonical
|
---|
266 | dt ; com ; Compat
|
---|
267 | dt ; enc ; Circle
|
---|
268 | dt ; fin ; Final
|
---|
269 | dt ; font ; Font
|
---|
270 | dt ; fra ; Fraction
|
---|
271 | dt ; init ; Initial
|
---|
272 | dt ; iso ; Isolated
|
---|
273 | dt ; med ; Medial
|
---|
274 | dt ; nar ; Narrow
|
---|
275 | dt ; nb ; Nobreak
|
---|
276 | dt ; none ; None
|
---|
277 | dt ; sml ; Small
|
---|
278 | dt ; sqr ; Square
|
---|
279 | dt ; sub ; Sub
|
---|
280 | dt ; sup ; Super
|
---|
281 | dt ; vert ; Vertical
|
---|
282 | dt ; wide ; Wide
|
---|
283 |
|
---|
284 | # East_Asian_Width (ea)
|
---|
285 |
|
---|
286 | ea ; A ; Ambiguous
|
---|
287 | ea ; F ; Fullwidth
|
---|
288 | ea ; H ; Halfwidth
|
---|
289 | ea ; N ; Neutral
|
---|
290 | ea ; Na ; Narrow
|
---|
291 | ea ; W ; Wide
|
---|
292 |
|
---|
293 | # General_Category (gc)
|
---|
294 |
|
---|
295 | gc ; C ; Other # Cc | Cf | Cn | Co | Cs
|
---|
296 | gc ; Cc ; Control ; cntrl
|
---|
297 | gc ; Cf ; Format
|
---|
298 | gc ; Cn ; Unassigned
|
---|
299 | gc ; Co ; Private_Use
|
---|
300 | gc ; Cs ; Surrogate
|
---|
301 | gc ; L ; Letter # Ll | Lm | Lo | Lt | Lu
|
---|
302 | gc ; LC ; Cased_Letter # Ll | Lt | Lu
|
---|
303 | gc ; Ll ; Lowercase_Letter
|
---|
304 | gc ; Lm ; Modifier_Letter
|
---|
305 | gc ; Lo ; Other_Letter
|
---|
306 | gc ; Lt ; Titlecase_Letter
|
---|
307 | gc ; Lu ; Uppercase_Letter
|
---|
308 | gc ; M ; Mark # Mc | Me | Mn
|
---|
309 | gc ; Mc ; Spacing_Mark
|
---|
310 | gc ; Me ; Enclosing_Mark
|
---|
311 | gc ; Mn ; Nonspacing_Mark
|
---|
312 | gc ; N ; Number # Nd | Nl | No
|
---|
313 | gc ; Nd ; Decimal_Number ; digit
|
---|
314 | gc ; Nl ; Letter_Number
|
---|
315 | gc ; No ; Other_Number
|
---|
316 | gc ; P ; Punctuation ; punct # Pc | Pd | Pe | Pf | Pi | Po | Ps
|
---|
317 | gc ; Pc ; Connector_Punctuation
|
---|
318 | gc ; Pd ; Dash_Punctuation
|
---|
319 | gc ; Pe ; Close_Punctuation
|
---|
320 | gc ; Pf ; Final_Punctuation
|
---|
321 | gc ; Pi ; Initial_Punctuation
|
---|
322 | gc ; Po ; Other_Punctuation
|
---|
323 | gc ; Ps ; Open_Punctuation
|
---|
324 | gc ; S ; Symbol # Sc | Sk | Sm | So
|
---|
325 | gc ; Sc ; Currency_Symbol
|
---|
326 | gc ; Sk ; Modifier_Symbol
|
---|
327 | gc ; Sm ; Math_Symbol
|
---|
328 | gc ; So ; Other_Symbol
|
---|
329 | gc ; Z ; Separator # Zl | Zp | Zs
|
---|
330 | gc ; Zl ; Line_Separator
|
---|
331 | gc ; Zp ; Paragraph_Separator
|
---|
332 | gc ; Zs ; Space_Separator
|
---|
333 |
|
---|
334 | # Grapheme_Cluster_Break (GCB)
|
---|
335 |
|
---|
336 | GCB; CN ; Control
|
---|
337 | GCB; CR ; CR
|
---|
338 | GCB; EX ; Extend
|
---|
339 | GCB; L ; L
|
---|
340 | GCB; LF ; LF
|
---|
341 | GCB; LV ; LV
|
---|
342 | GCB; LVT ; LVT
|
---|
343 | GCB; T ; T
|
---|
344 | GCB; V ; V
|
---|
345 | GCB; XX ; Other
|
---|
346 |
|
---|
347 | # Hangul_Syllable_Type (hst)
|
---|
348 |
|
---|
349 | hst; L ; Leading_Jamo
|
---|
350 | hst; LV ; LV_Syllable
|
---|
351 | hst; LVT ; LVT_Syllable
|
---|
352 | hst; NA ; Not_Applicable
|
---|
353 | hst; T ; Trailing_Jamo
|
---|
354 | hst; V ; Vowel_Jamo
|
---|
355 |
|
---|
356 | # Joining_Group (jg)
|
---|
357 |
|
---|
358 | jg ; n/a ; Ain
|
---|
359 | jg ; n/a ; Alaph
|
---|
360 | jg ; n/a ; Alef
|
---|
361 | jg ; n/a ; Beh
|
---|
362 | jg ; n/a ; Beth
|
---|
363 | jg ; n/a ; Dal
|
---|
364 | jg ; n/a ; Dalath_Rish
|
---|
365 | jg ; n/a ; E
|
---|
366 | jg ; n/a ; Fe
|
---|
367 | jg ; n/a ; Feh
|
---|
368 | jg ; n/a ; Final_Semkath
|
---|
369 | jg ; n/a ; Gaf
|
---|
370 | jg ; n/a ; Gamal
|
---|
371 | jg ; n/a ; Hah
|
---|
372 | jg ; n/a ; Hamza_On_Heh_Goal
|
---|
373 | jg ; n/a ; He
|
---|
374 | jg ; n/a ; Heh
|
---|
375 | jg ; n/a ; Heh_Goal
|
---|
376 | jg ; n/a ; Heth
|
---|
377 | jg ; n/a ; Kaf
|
---|
378 | jg ; n/a ; Kaph
|
---|
379 | jg ; n/a ; Khaph
|
---|
380 | jg ; n/a ; Knotted_Heh
|
---|
381 | jg ; n/a ; Lam
|
---|
382 | jg ; n/a ; Lamadh
|
---|
383 | jg ; n/a ; Meem
|
---|
384 | jg ; n/a ; Mim
|
---|
385 | jg ; n/a ; No_Joining_Group
|
---|
386 | jg ; n/a ; Noon
|
---|
387 | jg ; n/a ; Nun
|
---|
388 | jg ; n/a ; Pe
|
---|
389 | jg ; n/a ; Qaf
|
---|
390 | jg ; n/a ; Qaph
|
---|
391 | jg ; n/a ; Reh
|
---|
392 | jg ; n/a ; Reversed_Pe
|
---|
393 | jg ; n/a ; Sad
|
---|
394 | jg ; n/a ; Sadhe
|
---|
395 | jg ; n/a ; Seen
|
---|
396 | jg ; n/a ; Semkath
|
---|
397 | jg ; n/a ; Shin
|
---|
398 | jg ; n/a ; Swash_Kaf
|
---|
399 | jg ; n/a ; Syriac_Waw
|
---|
400 | jg ; n/a ; Tah
|
---|
401 | jg ; n/a ; Taw
|
---|
402 | jg ; n/a ; Teh_Marbuta
|
---|
403 | jg ; n/a ; Teth
|
---|
404 | jg ; n/a ; Waw
|
---|
405 | jg ; n/a ; Yeh
|
---|
406 | jg ; n/a ; Yeh_Barree
|
---|
407 | jg ; n/a ; Yeh_With_Tail
|
---|
408 | jg ; n/a ; Yudh
|
---|
409 | jg ; n/a ; Yudh_He
|
---|
410 | jg ; n/a ; Zain
|
---|
411 | jg ; n/a ; Zhain
|
---|
412 |
|
---|
413 | # Joining_Type (jt)
|
---|
414 |
|
---|
415 | jt ; C ; Join_Causing
|
---|
416 | jt ; D ; Dual_Joining
|
---|
417 | jt ; L ; Left_Joining
|
---|
418 | jt ; R ; Right_Joining
|
---|
419 | jt ; T ; Transparent
|
---|
420 | jt ; U ; Non_Joining
|
---|
421 |
|
---|
422 | # Line_Break (lb)
|
---|
423 |
|
---|
424 | lb ; AI ; Ambiguous
|
---|
425 | lb ; AL ; Alphabetic
|
---|
426 | lb ; B2 ; Break_Both
|
---|
427 | lb ; BA ; Break_After
|
---|
428 | lb ; BB ; Break_Before
|
---|
429 | lb ; BK ; Mandatory_Break
|
---|
430 | lb ; CB ; Contingent_Break
|
---|
431 | lb ; CL ; Close_Punctuation
|
---|
432 | lb ; CM ; Combining_Mark
|
---|
433 | lb ; CR ; Carriage_Return
|
---|
434 | lb ; EX ; Exclamation
|
---|
435 | lb ; GL ; Glue
|
---|
436 | lb ; H2 ; H2
|
---|
437 | lb ; H3 ; H3
|
---|
438 | lb ; HY ; Hyphen
|
---|
439 | lb ; ID ; Ideographic
|
---|
440 | lb ; IN ; Inseparable ; Inseperable
|
---|
441 | lb ; IS ; Infix_Numeric
|
---|
442 | lb ; JL ; JL
|
---|
443 | lb ; JT ; JT
|
---|
444 | lb ; JV ; JV
|
---|
445 | lb ; LF ; Line_Feed
|
---|
446 | lb ; NL ; Next_Line
|
---|
447 | lb ; NS ; Nonstarter
|
---|
448 | lb ; NU ; Numeric
|
---|
449 | lb ; OP ; Open_Punctuation
|
---|
450 | lb ; PO ; Postfix_Numeric
|
---|
451 | lb ; PR ; Prefix_Numeric
|
---|
452 | lb ; QU ; Quotation
|
---|
453 | lb ; SA ; Complex_Context
|
---|
454 | lb ; SG ; Surrogate
|
---|
455 | lb ; SP ; Space
|
---|
456 | lb ; SY ; Break_Symbols
|
---|
457 | lb ; WJ ; Word_Joiner
|
---|
458 | lb ; XX ; Unknown
|
---|
459 | lb ; ZW ; ZWSpace
|
---|
460 |
|
---|
461 | # NFC_Quick_Check (NFC_QC)
|
---|
462 |
|
---|
463 | NFC_QC; M ; Maybe
|
---|
464 | NFC_QC; N ; No
|
---|
465 | NFC_QC; Y ; Yes
|
---|
466 |
|
---|
467 | # NFD_Quick_Check (NFD_QC)
|
---|
468 |
|
---|
469 | NFD_QC; N ; No
|
---|
470 | NFD_QC; Y ; Yes
|
---|
471 |
|
---|
472 | # NFKC_Quick_Check (NFKC_QC)
|
---|
473 |
|
---|
474 | NFKC_QC; M ; Maybe
|
---|
475 | NFKC_QC; N ; No
|
---|
476 | NFKC_QC; Y ; Yes
|
---|
477 |
|
---|
478 | # NFKD_Quick_Check (NFKD_QC)
|
---|
479 |
|
---|
480 | NFKD_QC; N ; No
|
---|
481 | NFKD_QC; Y ; Yes
|
---|
482 |
|
---|
483 | # Numeric_Type (nt)
|
---|
484 |
|
---|
485 | nt ; De ; Decimal
|
---|
486 | nt ; Di ; Digit
|
---|
487 | nt ; None ; None
|
---|
488 | nt ; Nu ; Numeric
|
---|
489 |
|
---|
490 | # Script (sc)
|
---|
491 |
|
---|
492 | sc ; Arab ; Arabic
|
---|
493 | sc ; Armn ; Armenian
|
---|
494 | sc ; Beng ; Bengali
|
---|
495 | sc ; Bopo ; Bopomofo
|
---|
496 | sc ; Brai ; Braille
|
---|
497 | sc ; Bugi ; Buginese
|
---|
498 | sc ; Buhd ; Buhid
|
---|
499 | sc ; Cans ; Canadian_Aboriginal
|
---|
500 | sc ; Cher ; Cherokee
|
---|
501 | sc ; Copt ; Coptic ; Qaac
|
---|
502 | sc ; Cprt ; Cypriot
|
---|
503 | sc ; Cyrl ; Cyrillic
|
---|
504 | sc ; Deva ; Devanagari
|
---|
505 | sc ; Dsrt ; Deseret
|
---|
506 | sc ; Ethi ; Ethiopic
|
---|
507 | sc ; Geor ; Georgian
|
---|
508 | sc ; Glag ; Glagolitic
|
---|
509 | sc ; Goth ; Gothic
|
---|
510 | sc ; Grek ; Greek
|
---|
511 | sc ; Gujr ; Gujarati
|
---|
512 | sc ; Guru ; Gurmukhi
|
---|
513 | sc ; Hang ; Hangul
|
---|
514 | sc ; Hani ; Han
|
---|
515 | sc ; Hano ; Hanunoo
|
---|
516 | sc ; Hebr ; Hebrew
|
---|
517 | sc ; Hira ; Hiragana
|
---|
518 | sc ; Hrkt ; Katakana_Or_Hiragana
|
---|
519 | sc ; Ital ; Old_Italic
|
---|
520 | sc ; Kana ; Katakana
|
---|
521 | sc ; Khar ; Kharoshthi
|
---|
522 | sc ; Khmr ; Khmer
|
---|
523 | sc ; Knda ; Kannada
|
---|
524 | sc ; Laoo ; Lao
|
---|
525 | sc ; Latn ; Latin
|
---|
526 | sc ; Limb ; Limbu
|
---|
527 | sc ; Linb ; Linear_B
|
---|
528 | sc ; Mlym ; Malayalam
|
---|
529 | sc ; Mong ; Mongolian
|
---|
530 | sc ; Mymr ; Myanmar
|
---|
531 | sc ; Ogam ; Ogham
|
---|
532 | sc ; Orya ; Oriya
|
---|
533 | sc ; Osma ; Osmanya
|
---|
534 | sc ; Qaai ; Inherited
|
---|
535 | sc ; Runr ; Runic
|
---|
536 | sc ; Shaw ; Shavian
|
---|
537 | sc ; Sinh ; Sinhala
|
---|
538 | sc ; Sylo ; Syloti_Nagri
|
---|
539 | sc ; Syrc ; Syriac
|
---|
540 | sc ; Tagb ; Tagbanwa
|
---|
541 | sc ; Tale ; Tai_Le
|
---|
542 | sc ; Talu ; New_Tai_Lue
|
---|
543 | sc ; Taml ; Tamil
|
---|
544 | sc ; Telu ; Telugu
|
---|
545 | sc ; Tfng ; Tifinagh
|
---|
546 | sc ; Tglg ; Tagalog
|
---|
547 | sc ; Thaa ; Thaana
|
---|
548 | sc ; Thai ; Thai
|
---|
549 | sc ; Tibt ; Tibetan
|
---|
550 | sc ; Ugar ; Ugaritic
|
---|
551 | sc ; Xpeo ; Old_Persian
|
---|
552 | sc ; Yiii ; Yi
|
---|
553 | sc ; Zyyy ; Common
|
---|
554 |
|
---|
555 | # Sentence_Break (SB)
|
---|
556 |
|
---|
557 | SB ; AT ; ATerm
|
---|
558 | SB ; CL ; Close
|
---|
559 | SB ; FO ; Format
|
---|
560 | SB ; LE ; OLetter
|
---|
561 | SB ; LO ; Lower
|
---|
562 | SB ; NU ; Numeric
|
---|
563 | SB ; SE ; Sep
|
---|
564 | SB ; SP ; Sp
|
---|
565 | SB ; ST ; STerm
|
---|
566 | SB ; UP ; Upper
|
---|
567 | SB ; XX ; Other
|
---|
568 |
|
---|
569 | # Word_Break (WB)
|
---|
570 |
|
---|
571 | WB ; EX ; ExtendNumLet
|
---|
572 | WB ; FO ; Format
|
---|
573 | WB ; KA ; Katakana
|
---|
574 | WB ; LE ; ALetter
|
---|
575 | WB ; ML ; MidLetter
|
---|
576 | WB ; MN ; MidNum
|
---|
577 | WB ; NU ; Numeric
|
---|
578 | WB ; XX ; Other
|
---|