1 # PropertyValueAliases-7.0.0.txt
2 # Date: 2014-05-14, 23:55:16 GMT [MD]
4 # Unicode Character Database
5 # Copyright (c) 1991-2014 Unicode, Inc.
6 # For terms of use, see http://www.unicode.org/terms_of_use.html
7 # For documentation, see http://www.unicode.org/reports/tr44/
9 # This file contains aliases for property values used in the UCD.
10 # These names can be used for XML formats of UCD data, for regular-expression
11 # property tests, and other programmatic textual descriptions of Unicode data.
13 # The names may be translated in appropriate environments, and additional
14 # aliases may be useful.
18 # Each line describes a property value name.
19 # This consists of three or more fields, separated by semicolons.
21 # First Field: The first field describes the property for which that
22 # property value name is used.
24 # Second Field: The second field is an abbreviated name.
26 # Third Field: The third field is a long name.
28 # In the case of ccc, there are 4 fields: the second field is the numeric value,
29 # the third is the abbreviated name, and the fourth is the long name.
31 # The above are the preferred aliases. Other aliases may be listed in additional fields.
33 # Loose matching should be applied to all property names and property values, with
34 # the exception of String Property values. With loose matching of property names and
35 # values, the case distinctions, whitespace, hyphens, and '_' are ignored.
36 # For Numeric Property values, numeric equivalence is applied: thus "01.00"
37 # is equivalent to "1".
39 # NOTE: Property value names are NOT unique across properties. For example:
41 # AL means Arabic Letter for the Bidi_Class property, and
42 # AL means Above_Left for the Canonical_Combining_Class property, and
43 # AL means Alphabetic for the Line_Break property.
45 # In addition, some property names may be the same as some property value names. For example:
48 # sc means the Script property, and
49 # Sc means the General_Category property value Currency_Symbol (Sc)
51 # The combination of property value and property name is, however, unique.
53 # For more information, see UTS #18: Unicode Regular Expressions
54 # ================================================
57 # ASCII_Hex_Digit (AHex)
59 AHex; N ; No ; F ; False
60 AHex; Y ; Yes ; T ; True
84 Alpha; N ; No ; F ; False
85 Alpha; Y ; Yes ; T ; True
89 bc ; AL ; Arabic_Letter
90 bc ; AN ; Arabic_Number
91 bc ; B ; Paragraph_Separator
92 bc ; BN ; Boundary_Neutral
93 bc ; CS ; Common_Separator
94 bc ; EN ; European_Number
95 bc ; ES ; European_Separator
96 bc ; ET ; European_Terminator
97 bc ; FSI ; First_Strong_Isolate
98 bc ; L ; Left_To_Right
99 bc ; LRE ; Left_To_Right_Embedding
100 bc ; LRI ; Left_To_Right_Isolate
101 bc ; LRO ; Left_To_Right_Override
102 bc ; NSM ; Nonspacing_Mark
103 bc ; ON ; Other_Neutral
104 bc ; PDF ; Pop_Directional_Format
105 bc ; PDI ; Pop_Directional_Isolate
106 bc ; R ; Right_To_Left
107 bc ; RLE ; Right_To_Left_Embedding
108 bc ; RLI ; Right_To_Left_Isolate
109 bc ; RLO ; Right_To_Left_Override
110 bc ; S ; Segment_Separator
111 bc ; WS ; White_Space
113 # Bidi_Control (Bidi_C)
115 Bidi_C; N ; No ; F ; False
116 Bidi_C; Y ; Yes ; T ; True
118 # Bidi_Mirrored (Bidi_M)
120 Bidi_M; N ; No ; F ; False
121 Bidi_M; Y ; Yes ; T ; True
123 # Bidi_Mirroring_Glyph (bmg)
125 # @missing: 0000..10FFFF; Bidi_Mirroring_Glyph; <none>
127 # Bidi_Paired_Bracket (bpb)
129 # @missing: 0000..10FFFF; Bidi_Paired_Bracket; <none>
131 # Bidi_Paired_Bracket_Type (bpt)
136 # @missing: 0000..10FFFF; Bidi_Paired_Bracket_Type; n
140 blk; Aegean_Numbers ; Aegean_Numbers
141 blk; Alchemical ; Alchemical_Symbols
142 blk; Alphabetic_PF ; Alphabetic_Presentation_Forms
143 blk; Ancient_Greek_Music ; Ancient_Greek_Musical_Notation
144 blk; Ancient_Greek_Numbers ; Ancient_Greek_Numbers
145 blk; Ancient_Symbols ; Ancient_Symbols
147 blk; Arabic_Ext_A ; Arabic_Extended_A
148 blk; Arabic_Math ; Arabic_Mathematical_Alphabetic_Symbols
149 blk; Arabic_PF_A ; Arabic_Presentation_Forms_A ; Arabic_Presentation_Forms-A
150 blk; Arabic_PF_B ; Arabic_Presentation_Forms_B
151 blk; Arabic_Sup ; Arabic_Supplement
152 blk; Armenian ; Armenian
154 blk; ASCII ; Basic_Latin
155 blk; Avestan ; Avestan
156 blk; Balinese ; Balinese
158 blk; Bamum_Sup ; Bamum_Supplement
159 blk; Bassa_Vah ; Bassa_Vah
161 blk; Bengali ; Bengali
162 blk; Block_Elements ; Block_Elements
163 blk; Bopomofo ; Bopomofo
164 blk; Bopomofo_Ext ; Bopomofo_Extended
165 blk; Box_Drawing ; Box_Drawing
167 blk; Braille ; Braille_Patterns
168 blk; Buginese ; Buginese
170 blk; Byzantine_Music ; Byzantine_Musical_Symbols
172 blk; Caucasian_Albanian ; Caucasian_Albanian
175 blk; Cherokee ; Cherokee
176 blk; CJK ; CJK_Unified_Ideographs
177 blk; CJK_Compat ; CJK_Compatibility
178 blk; CJK_Compat_Forms ; CJK_Compatibility_Forms
179 blk; CJK_Compat_Ideographs ; CJK_Compatibility_Ideographs
180 blk; CJK_Compat_Ideographs_Sup ; CJK_Compatibility_Ideographs_Supplement
181 blk; CJK_Ext_A ; CJK_Unified_Ideographs_Extension_A
182 blk; CJK_Ext_B ; CJK_Unified_Ideographs_Extension_B
183 blk; CJK_Ext_C ; CJK_Unified_Ideographs_Extension_C
184 blk; CJK_Ext_D ; CJK_Unified_Ideographs_Extension_D
185 blk; CJK_Radicals_Sup ; CJK_Radicals_Supplement
186 blk; CJK_Strokes ; CJK_Strokes
187 blk; CJK_Symbols ; CJK_Symbols_And_Punctuation
188 blk; Compat_Jamo ; Hangul_Compatibility_Jamo
189 blk; Control_Pictures ; Control_Pictures
191 blk; Coptic_Epact_Numbers ; Coptic_Epact_Numbers
192 blk; Counting_Rod ; Counting_Rod_Numerals
193 blk; Cuneiform ; Cuneiform
194 blk; Cuneiform_Numbers ; Cuneiform_Numbers_And_Punctuation
195 blk; Currency_Symbols ; Currency_Symbols
196 blk; Cypriot_Syllabary ; Cypriot_Syllabary
197 blk; Cyrillic ; Cyrillic
198 blk; Cyrillic_Ext_A ; Cyrillic_Extended_A
199 blk; Cyrillic_Ext_B ; Cyrillic_Extended_B
200 blk; Cyrillic_Sup ; Cyrillic_Supplement ; Cyrillic_Supplementary
201 blk; Deseret ; Deseret
202 blk; Devanagari ; Devanagari
203 blk; Devanagari_Ext ; Devanagari_Extended
204 blk; Diacriticals ; Combining_Diacritical_Marks
205 blk; Diacriticals_Ext ; Combining_Diacritical_Marks_Extended
206 blk; Diacriticals_For_Symbols ; Combining_Diacritical_Marks_For_Symbols; Combining_Marks_For_Symbols
207 blk; Diacriticals_Sup ; Combining_Diacritical_Marks_Supplement
208 blk; Dingbats ; Dingbats
209 blk; Domino ; Domino_Tiles
210 blk; Duployan ; Duployan
211 blk; Egyptian_Hieroglyphs ; Egyptian_Hieroglyphs
212 blk; Elbasan ; Elbasan
213 blk; Emoticons ; Emoticons
214 blk; Enclosed_Alphanum ; Enclosed_Alphanumerics
215 blk; Enclosed_Alphanum_Sup ; Enclosed_Alphanumeric_Supplement
216 blk; Enclosed_CJK ; Enclosed_CJK_Letters_And_Months
217 blk; Enclosed_Ideographic_Sup ; Enclosed_Ideographic_Supplement
218 blk; Ethiopic ; Ethiopic
219 blk; Ethiopic_Ext ; Ethiopic_Extended
220 blk; Ethiopic_Ext_A ; Ethiopic_Extended_A
221 blk; Ethiopic_Sup ; Ethiopic_Supplement
222 blk; Geometric_Shapes ; Geometric_Shapes
223 blk; Geometric_Shapes_Ext ; Geometric_Shapes_Extended
224 blk; Georgian ; Georgian
225 blk; Georgian_Sup ; Georgian_Supplement
226 blk; Glagolitic ; Glagolitic
228 blk; Grantha ; Grantha
229 blk; Greek ; Greek_And_Coptic
230 blk; Greek_Ext ; Greek_Extended
231 blk; Gujarati ; Gujarati
232 blk; Gurmukhi ; Gurmukhi
233 blk; Half_And_Full_Forms ; Halfwidth_And_Fullwidth_Forms
234 blk; Half_Marks ; Combining_Half_Marks
235 blk; Hangul ; Hangul_Syllables
236 blk; Hanunoo ; Hanunoo
238 blk; High_PU_Surrogates ; High_Private_Use_Surrogates
239 blk; High_Surrogates ; High_Surrogates
240 blk; Hiragana ; Hiragana
241 blk; IDC ; Ideographic_Description_Characters
242 blk; Imperial_Aramaic ; Imperial_Aramaic
243 blk; Indic_Number_Forms ; Common_Indic_Number_Forms
244 blk; Inscriptional_Pahlavi ; Inscriptional_Pahlavi
245 blk; Inscriptional_Parthian ; Inscriptional_Parthian
246 blk; IPA_Ext ; IPA_Extensions
247 blk; Jamo ; Hangul_Jamo
248 blk; Jamo_Ext_A ; Hangul_Jamo_Extended_A
249 blk; Jamo_Ext_B ; Hangul_Jamo_Extended_B
250 blk; Javanese ; Javanese
252 blk; Kana_Sup ; Kana_Supplement
254 blk; Kangxi ; Kangxi_Radicals
255 blk; Kannada ; Kannada
256 blk; Katakana ; Katakana
257 blk; Katakana_Ext ; Katakana_Phonetic_Extensions
258 blk; Kayah_Li ; Kayah_Li
259 blk; Kharoshthi ; Kharoshthi
261 blk; Khmer_Symbols ; Khmer_Symbols
263 blk; Khudawadi ; Khudawadi
265 blk; Latin_1_Sup ; Latin_1_Supplement ; Latin_1
266 blk; Latin_Ext_A ; Latin_Extended_A
267 blk; Latin_Ext_Additional ; Latin_Extended_Additional
268 blk; Latin_Ext_B ; Latin_Extended_B
269 blk; Latin_Ext_C ; Latin_Extended_C
270 blk; Latin_Ext_D ; Latin_Extended_D
271 blk; Latin_Ext_E ; Latin_Extended_E
273 blk; Letterlike_Symbols ; Letterlike_Symbols
275 blk; Linear_A ; Linear_A
276 blk; Linear_B_Ideograms ; Linear_B_Ideograms
277 blk; Linear_B_Syllabary ; Linear_B_Syllabary
279 blk; Low_Surrogates ; Low_Surrogates
282 blk; Mahajani ; Mahajani
283 blk; Mahjong ; Mahjong_Tiles
284 blk; Malayalam ; Malayalam
285 blk; Mandaic ; Mandaic
286 blk; Manichaean ; Manichaean
287 blk; Math_Alphanum ; Mathematical_Alphanumeric_Symbols
288 blk; Math_Operators ; Mathematical_Operators
289 blk; Meetei_Mayek ; Meetei_Mayek
290 blk; Meetei_Mayek_Ext ; Meetei_Mayek_Extensions
291 blk; Mende_Kikakui ; Mende_Kikakui
292 blk; Meroitic_Cursive ; Meroitic_Cursive
293 blk; Meroitic_Hieroglyphs ; Meroitic_Hieroglyphs
295 blk; Misc_Arrows ; Miscellaneous_Symbols_And_Arrows
296 blk; Misc_Math_Symbols_A ; Miscellaneous_Mathematical_Symbols_A
297 blk; Misc_Math_Symbols_B ; Miscellaneous_Mathematical_Symbols_B
298 blk; Misc_Pictographs ; Miscellaneous_Symbols_And_Pictographs
299 blk; Misc_Symbols ; Miscellaneous_Symbols
300 blk; Misc_Technical ; Miscellaneous_Technical
302 blk; Modifier_Letters ; Spacing_Modifier_Letters
303 blk; Modifier_Tone_Letters ; Modifier_Tone_Letters
304 blk; Mongolian ; Mongolian
306 blk; Music ; Musical_Symbols
307 blk; Myanmar ; Myanmar
308 blk; Myanmar_Ext_A ; Myanmar_Extended_A
309 blk; Myanmar_Ext_B ; Myanmar_Extended_B
310 blk; Nabataean ; Nabataean
312 blk; New_Tai_Lue ; New_Tai_Lue
314 blk; Number_Forms ; Number_Forms
315 blk; OCR ; Optical_Character_Recognition
317 blk; Ol_Chiki ; Ol_Chiki
318 blk; Old_Italic ; Old_Italic
319 blk; Old_North_Arabian ; Old_North_Arabian
320 blk; Old_Permic ; Old_Permic
321 blk; Old_Persian ; Old_Persian
322 blk; Old_South_Arabian ; Old_South_Arabian
323 blk; Old_Turkic ; Old_Turkic
325 blk; Ornamental_Dingbats ; Ornamental_Dingbats
326 blk; Osmanya ; Osmanya
327 blk; Pahawh_Hmong ; Pahawh_Hmong
328 blk; Palmyrene ; Palmyrene
329 blk; Pau_Cin_Hau ; Pau_Cin_Hau
330 blk; Phags_Pa ; Phags_Pa
331 blk; Phaistos ; Phaistos_Disc
332 blk; Phoenician ; Phoenician
333 blk; Phonetic_Ext ; Phonetic_Extensions
334 blk; Phonetic_Ext_Sup ; Phonetic_Extensions_Supplement
335 blk; Playing_Cards ; Playing_Cards
336 blk; Psalter_Pahlavi ; Psalter_Pahlavi
337 blk; PUA ; Private_Use_Area ; Private_Use
338 blk; Punctuation ; General_Punctuation
340 blk; Rumi ; Rumi_Numeral_Symbols
342 blk; Samaritan ; Samaritan
343 blk; Saurashtra ; Saurashtra
344 blk; Sharada ; Sharada
345 blk; Shavian ; Shavian
346 blk; Shorthand_Format_Controls ; Shorthand_Format_Controls
347 blk; Siddham ; Siddham
348 blk; Sinhala ; Sinhala
349 blk; Sinhala_Archaic_Numbers ; Sinhala_Archaic_Numbers
350 blk; Small_Forms ; Small_Form_Variants
351 blk; Sora_Sompeng ; Sora_Sompeng
352 blk; Specials ; Specials
353 blk; Sundanese ; Sundanese
354 blk; Sundanese_Sup ; Sundanese_Supplement
355 blk; Sup_Arrows_A ; Supplemental_Arrows_A
356 blk; Sup_Arrows_B ; Supplemental_Arrows_B
357 blk; Sup_Arrows_C ; Supplemental_Arrows_C
358 blk; Sup_Math_Operators ; Supplemental_Mathematical_Operators
359 blk; Sup_PUA_A ; Supplementary_Private_Use_Area_A
360 blk; Sup_PUA_B ; Supplementary_Private_Use_Area_B
361 blk; Sup_Punctuation ; Supplemental_Punctuation
362 blk; Super_And_Sub ; Superscripts_And_Subscripts
363 blk; Syloti_Nagri ; Syloti_Nagri
365 blk; Tagalog ; Tagalog
366 blk; Tagbanwa ; Tagbanwa
369 blk; Tai_Tham ; Tai_Tham
370 blk; Tai_Viet ; Tai_Viet
371 blk; Tai_Xuan_Jing ; Tai_Xuan_Jing_Symbols
377 blk; Tibetan ; Tibetan
378 blk; Tifinagh ; Tifinagh
379 blk; Tirhuta ; Tirhuta
380 blk; Transport_And_Map ; Transport_And_Map_Symbols
381 blk; UCAS ; Unified_Canadian_Aboriginal_Syllabics; Canadian_Syllabics
382 blk; UCAS_Ext ; Unified_Canadian_Aboriginal_Syllabics_Extended
383 blk; Ugaritic ; Ugaritic
385 blk; Vedic_Ext ; Vedic_Extensions
386 blk; Vertical_Forms ; Vertical_Forms
387 blk; VS ; Variation_Selectors
388 blk; VS_Sup ; Variation_Selectors_Supplement
389 blk; Warang_Citi ; Warang_Citi
390 blk; Yi_Radicals ; Yi_Radicals
391 blk; Yi_Syllables ; Yi_Syllables
392 blk; Yijing ; Yijing_Hexagram_Symbols
394 # Canonical_Combining_Class (ccc)
396 ccc; 0; NR ; Not_Reordered
399 ccc; 8; KV ; Kana_Voicing
401 ccc; 10; CCC10 ; CCC10
402 ccc; 11; CCC11 ; CCC11
403 ccc; 12; CCC12 ; CCC12
404 ccc; 13; CCC13 ; CCC13
405 ccc; 14; CCC14 ; CCC14
406 ccc; 15; CCC15 ; CCC15
407 ccc; 16; CCC16 ; CCC16
408 ccc; 17; CCC17 ; CCC17
409 ccc; 18; CCC18 ; CCC18
410 ccc; 19; CCC19 ; CCC19
411 ccc; 20; CCC20 ; CCC20
412 ccc; 21; CCC21 ; CCC21
413 ccc; 22; CCC22 ; CCC22
414 ccc; 23; CCC23 ; CCC23
415 ccc; 24; CCC24 ; CCC24
416 ccc; 25; CCC25 ; CCC25
417 ccc; 26; CCC26 ; CCC26
418 ccc; 27; CCC27 ; CCC27
419 ccc; 28; CCC28 ; CCC28
420 ccc; 29; CCC29 ; CCC29
421 ccc; 30; CCC30 ; CCC30
422 ccc; 31; CCC31 ; CCC31
423 ccc; 32; CCC32 ; CCC32
424 ccc; 33; CCC33 ; CCC33
425 ccc; 34; CCC34 ; CCC34
426 ccc; 35; CCC35 ; CCC35
427 ccc; 36; CCC36 ; CCC36
428 ccc; 84; CCC84 ; CCC84
429 ccc; 91; CCC91 ; CCC91
430 ccc; 103; CCC103 ; CCC103
431 ccc; 107; CCC107 ; CCC107
432 ccc; 118; CCC118 ; CCC118
433 ccc; 122; CCC122 ; CCC122
434 ccc; 129; CCC129 ; CCC129
435 ccc; 130; CCC130 ; CCC130
436 ccc; 132; CCC132 ; CCC132
437 ccc; 133; CCC133 ; CCC133 # RESERVED
438 ccc; 200; ATBL ; Attached_Below_Left
439 ccc; 202; ATB ; Attached_Below
440 ccc; 214; ATA ; Attached_Above
441 ccc; 216; ATAR ; Attached_Above_Right
442 ccc; 218; BL ; Below_Left
444 ccc; 222; BR ; Below_Right
447 ccc; 228; AL ; Above_Left
449 ccc; 232; AR ; Above_Right
450 ccc; 233; DB ; Double_Below
451 ccc; 234; DA ; Double_Above
452 ccc; 240; IS ; Iota_Subscript
456 # @missing: 0000..10FFFF; Case_Folding; <code point>
458 # Case_Ignorable (CI)
460 CI ; N ; No ; F ; False
461 CI ; Y ; Yes ; T ; True
465 Cased; N ; No ; F ; False
466 Cased; Y ; Yes ; T ; True
468 # Changes_When_Casefolded (CWCF)
470 CWCF; N ; No ; F ; False
471 CWCF; Y ; Yes ; T ; True
473 # Changes_When_Casemapped (CWCM)
475 CWCM; N ; No ; F ; False
476 CWCM; Y ; Yes ; T ; True
478 # Changes_When_Lowercased (CWL)
480 CWL; N ; No ; F ; False
481 CWL; Y ; Yes ; T ; True
483 # Changes_When_NFKC_Casefolded (CWKCF)
485 CWKCF; N ; No ; F ; False
486 CWKCF; Y ; Yes ; T ; True
488 # Changes_When_Titlecased (CWT)
490 CWT; N ; No ; F ; False
491 CWT; Y ; Yes ; T ; True
493 # Changes_When_Uppercased (CWU)
495 CWU; N ; No ; F ; False
496 CWU; Y ; Yes ; T ; True
498 # Composition_Exclusion (CE)
500 CE ; N ; No ; F ; False
501 CE ; Y ; Yes ; T ; True
505 Dash; N ; No ; F ; False
506 Dash; Y ; Yes ; T ; True
508 # Decomposition_Mapping (dm)
510 # @missing: 0000..10FFFF; Decomposition_Mapping; <code point>
512 # Decomposition_Type (dt)
514 dt ; Can ; Canonical ; can
515 dt ; Com ; Compat ; com
516 dt ; Enc ; Circle ; enc
517 dt ; Fin ; Final ; fin
518 dt ; Font ; Font ; font
519 dt ; Fra ; Fraction ; fra
520 dt ; Init ; Initial ; init
521 dt ; Iso ; Isolated ; iso
522 dt ; Med ; Medial ; med
523 dt ; Nar ; Narrow ; nar
524 dt ; Nb ; Nobreak ; nb
525 dt ; None ; None ; none
526 dt ; Sml ; Small ; sml
527 dt ; Sqr ; Square ; sqr
529 dt ; Sup ; Super ; sup
530 dt ; Vert ; Vertical ; vert
531 dt ; Wide ; Wide ; wide
533 # Default_Ignorable_Code_Point (DI)
535 DI ; N ; No ; F ; False
536 DI ; Y ; Yes ; T ; True
540 Dep; N ; No ; F ; False
541 Dep; Y ; Yes ; T ; True
545 Dia; N ; No ; F ; False
546 Dia; Y ; Yes ; T ; True
548 # East_Asian_Width (ea)
557 # Expands_On_NFC (XO_NFC)
559 XO_NFC; N ; No ; F ; False
560 XO_NFC; Y ; Yes ; T ; True
562 # Expands_On_NFD (XO_NFD)
564 XO_NFD; N ; No ; F ; False
565 XO_NFD; Y ; Yes ; T ; True
567 # Expands_On_NFKC (XO_NFKC)
569 XO_NFKC; N ; No ; F ; False
570 XO_NFKC; Y ; Yes ; T ; True
572 # Expands_On_NFKD (XO_NFKD)
574 XO_NFKD; N ; No ; F ; False
575 XO_NFKD; Y ; Yes ; T ; True
579 Ext; N ; No ; F ; False
580 Ext; Y ; Yes ; T ; True
582 # FC_NFKC_Closure (FC_NFKC)
584 # @missing: 0000..10FFFF; FC_NFKC_Closure; <code point>
586 # Full_Composition_Exclusion (Comp_Ex)
588 Comp_Ex; N ; No ; F ; False
589 Comp_Ex; Y ; Yes ; T ; True
591 # General_Category (gc)
593 gc ; C ; Other # Cc | Cf | Cn | Co | Cs
594 gc ; Cc ; Control ; cntrl
597 gc ; Co ; Private_Use
599 gc ; L ; Letter # Ll | Lm | Lo | Lt | Lu
600 gc ; LC ; Cased_Letter # Ll | Lt | Lu
601 gc ; Ll ; Lowercase_Letter
602 gc ; Lm ; Modifier_Letter
603 gc ; Lo ; Other_Letter
604 gc ; Lt ; Titlecase_Letter
605 gc ; Lu ; Uppercase_Letter
606 gc ; M ; Mark ; Combining_Mark # Mc | Me | Mn
607 gc ; Mc ; Spacing_Mark
608 gc ; Me ; Enclosing_Mark
609 gc ; Mn ; Nonspacing_Mark
610 gc ; N ; Number # Nd | Nl | No
611 gc ; Nd ; Decimal_Number ; digit
612 gc ; Nl ; Letter_Number
613 gc ; No ; Other_Number
614 gc ; P ; Punctuation ; punct # Pc | Pd | Pe | Pf | Pi | Po | Ps
615 gc ; Pc ; Connector_Punctuation
616 gc ; Pd ; Dash_Punctuation
617 gc ; Pe ; Close_Punctuation
618 gc ; Pf ; Final_Punctuation
619 gc ; Pi ; Initial_Punctuation
620 gc ; Po ; Other_Punctuation
621 gc ; Ps ; Open_Punctuation
622 gc ; S ; Symbol # Sc | Sk | Sm | So
623 gc ; Sc ; Currency_Symbol
624 gc ; Sk ; Modifier_Symbol
625 gc ; Sm ; Math_Symbol
626 gc ; So ; Other_Symbol
627 gc ; Z ; Separator # Zl | Zp | Zs
628 gc ; Zl ; Line_Separator
629 gc ; Zp ; Paragraph_Separator
630 gc ; Zs ; Space_Separator
631 # @missing: 0000..10FFFF; General_Category; Unassigned
633 # Grapheme_Base (Gr_Base)
635 Gr_Base; N ; No ; F ; False
636 Gr_Base; Y ; Yes ; T ; True
638 # Grapheme_Cluster_Break (GCB)
648 GCB; RI ; Regional_Indicator
649 GCB; SM ; SpacingMark
654 # Grapheme_Extend (Gr_Ext)
656 Gr_Ext; N ; No ; F ; False
657 Gr_Ext; Y ; Yes ; T ; True
659 # Grapheme_Link (Gr_Link)
661 Gr_Link; N ; No ; F ; False
662 Gr_Link; Y ; Yes ; T ; True
664 # Hangul_Syllable_Type (hst)
666 hst; L ; Leading_Jamo
667 hst; LV ; LV_Syllable
668 hst; LVT ; LVT_Syllable
669 hst; NA ; Not_Applicable
670 hst; T ; Trailing_Jamo
675 Hex; N ; No ; F ; False
676 Hex; Y ; Yes ; T ; True
680 Hyphen; N ; No ; F ; False
681 Hyphen; Y ; Yes ; T ; True
683 # IDS_Binary_Operator (IDSB)
685 IDSB; N ; No ; F ; False
686 IDSB; Y ; Yes ; T ; True
688 # IDS_Trinary_Operator (IDST)
690 IDST; N ; No ; F ; False
691 IDST; Y ; Yes ; T ; True
695 IDC; N ; No ; F ; False
696 IDC; Y ; Yes ; T ; True
700 IDS; N ; No ; F ; False
701 IDS; Y ; Yes ; T ; True
705 # @missing: 0000..10FFFF; ISO_Comment; <none>
709 Ideo; N ; No ; F ; False
710 Ideo; Y ; Yes ; T ; True
712 # Indic_Matra_Category (InMC)
714 InMC; Bottom ; Bottom
715 InMC; Bottom_And_Right ; Bottom_And_Right
717 InMC; Left_And_Right ; Left_And_Right
719 InMC; Overstruck ; Overstruck
722 InMC; Top_And_Bottom ; Top_And_Bottom
723 InMC; Top_And_Bottom_And_Right ; Top_And_Bottom_And_Right
724 InMC; Top_And_Left ; Top_And_Left
725 InMC; Top_And_Left_And_Right ; Top_And_Left_And_Right
726 InMC; Top_And_Right ; Top_And_Right
727 InMC; Visual_Order_Left ; Visual_Order_Left
729 # Indic_Syllabic_Category (InSC)
731 InSC; Avagraha ; Avagraha
733 InSC; Brahmi_Joining_Number ; Brahmi_Joining_Number
734 InSC; Cantillation_Mark ; Cantillation_Mark
735 InSC; Consonant ; Consonant
736 InSC; Consonant_Dead ; Consonant_Dead
737 InSC; Consonant_Final ; Consonant_Final
738 InSC; Consonant_Head_Letter ; Consonant_Head_Letter
739 InSC; Consonant_Medial ; Consonant_Medial
740 InSC; Consonant_Placeholder ; Consonant_Placeholder
741 InSC; Consonant_Preceding_Repha ; Consonant_Preceding_Repha
742 InSC; Consonant_Subjoined ; Consonant_Subjoined
743 InSC; Consonant_Succeeding_Repha ; Consonant_Succeeding_Repha
744 InSC; Gemination_Mark ; Gemination_Mark
745 InSC; Invisible_Stacker ; Invisible_Stacker
746 InSC; Joiner ; Joiner
747 InSC; Modifying_Letter ; Modifying_Letter
748 InSC; Non_Joiner ; Non_Joiner
750 InSC; Number ; Number
751 InSC; Number_Joiner ; Number_Joiner
753 InSC; Pure_Killer ; Pure_Killer
754 InSC; Register_Shifter ; Register_Shifter
755 InSC; Tone_Letter ; Tone_Letter
756 InSC; Tone_Mark ; Tone_Mark
757 InSC; Virama ; Virama
758 InSC; Visarga ; Visarga
760 InSC; Vowel_Dependent ; Vowel_Dependent
761 InSC; Vowel_Independent ; Vowel_Independent
763 # Jamo_Short_Name (JSN)
817 # @missing: 0000..10FFFF; Jamo_Short_Name; <none>
819 # Join_Control (Join_C)
821 Join_C; N ; No ; F ; False
822 Join_C; Y ; Yes ; T ; True
831 jg ; Burushaski_Yeh_Barree ; Burushaski_Yeh_Barree
833 jg ; Dalath_Rish ; Dalath_Rish
835 jg ; Farsi_Yeh ; Farsi_Yeh
838 jg ; Final_Semkath ; Final_Semkath
844 jg ; Heh_Goal ; Heh_Goal
849 jg ; Knotted_Heh ; Knotted_Heh
852 jg ; Manichaean_Aleph ; Manichaean_Aleph
853 jg ; Manichaean_Ayin ; Manichaean_Ayin
854 jg ; Manichaean_Beth ; Manichaean_Beth
855 jg ; Manichaean_Daleth ; Manichaean_Daleth
856 jg ; Manichaean_Dhamedh ; Manichaean_Dhamedh
857 jg ; Manichaean_Five ; Manichaean_Five
858 jg ; Manichaean_Gimel ; Manichaean_Gimel
859 jg ; Manichaean_Heth ; Manichaean_Heth
860 jg ; Manichaean_Hundred ; Manichaean_Hundred
861 jg ; Manichaean_Kaph ; Manichaean_Kaph
862 jg ; Manichaean_Lamedh ; Manichaean_Lamedh
863 jg ; Manichaean_Mem ; Manichaean_Mem
864 jg ; Manichaean_Nun ; Manichaean_Nun
865 jg ; Manichaean_One ; Manichaean_One
866 jg ; Manichaean_Pe ; Manichaean_Pe
867 jg ; Manichaean_Qoph ; Manichaean_Qoph
868 jg ; Manichaean_Resh ; Manichaean_Resh
869 jg ; Manichaean_Sadhe ; Manichaean_Sadhe
870 jg ; Manichaean_Samekh ; Manichaean_Samekh
871 jg ; Manichaean_Taw ; Manichaean_Taw
872 jg ; Manichaean_Ten ; Manichaean_Ten
873 jg ; Manichaean_Teth ; Manichaean_Teth
874 jg ; Manichaean_Thamedh ; Manichaean_Thamedh
875 jg ; Manichaean_Twenty ; Manichaean_Twenty
876 jg ; Manichaean_Waw ; Manichaean_Waw
877 jg ; Manichaean_Yodh ; Manichaean_Yodh
878 jg ; Manichaean_Zayin ; Manichaean_Zayin
881 jg ; No_Joining_Group ; No_Joining_Group
889 jg ; Reversed_Pe ; Reversed_Pe
890 jg ; Rohingya_Yeh ; Rohingya_Yeh
894 jg ; Semkath ; Semkath
896 jg ; Straight_Waw ; Straight_Waw
897 jg ; Swash_Kaf ; Swash_Kaf
898 jg ; Syriac_Waw ; Syriac_Waw
901 jg ; Teh_Marbuta ; Teh_Marbuta
902 jg ; Teh_Marbuta_Goal ; Hamza_On_Heh_Goal
906 jg ; Yeh_Barree ; Yeh_Barree
907 jg ; Yeh_With_Tail ; Yeh_With_Tail
909 jg ; Yudh_He ; Yudh_He
915 jt ; C ; Join_Causing
916 jt ; D ; Dual_Joining
917 jt ; L ; Left_Joining
918 jt ; R ; Right_Joining
927 lb ; BA ; Break_After
928 lb ; BB ; Break_Before
929 lb ; BK ; Mandatory_Break
930 lb ; CB ; Contingent_Break
931 lb ; CJ ; Conditional_Japanese_Starter
932 lb ; CL ; Close_Punctuation
933 lb ; CM ; Combining_Mark
934 lb ; CP ; Close_Parenthesis
935 lb ; CR ; Carriage_Return
936 lb ; EX ; Exclamation
940 lb ; HL ; Hebrew_Letter
942 lb ; ID ; Ideographic
943 lb ; IN ; Inseparable ; Inseperable
944 lb ; IS ; Infix_Numeric
952 lb ; OP ; Open_Punctuation
953 lb ; PO ; Postfix_Numeric
954 lb ; PR ; Prefix_Numeric
956 lb ; RI ; Regional_Indicator
957 lb ; SA ; Complex_Context
960 lb ; SY ; Break_Symbols
961 lb ; WJ ; Word_Joiner
965 # Logical_Order_Exception (LOE)
967 LOE; N ; No ; F ; False
968 LOE; Y ; Yes ; T ; True
972 Lower; N ; No ; F ; False
973 Lower; Y ; Yes ; T ; True
975 # Lowercase_Mapping (lc)
977 # @missing: 0000..10FFFF; Lowercase_Mapping; <code point>
981 Math; N ; No ; F ; False
982 Math; Y ; Yes ; T ; True
984 # NFC_Quick_Check (NFC_QC)
990 # NFD_Quick_Check (NFD_QC)
995 # NFKC_Casefold (NFKC_CF)
997 # @missing: 0000..10FFFF; NFKC_Casefold; <code point>
999 # NFKC_Quick_Check (NFKC_QC)
1005 # NFKD_Quick_Check (NFKD_QC)
1012 # @missing: 0000..10FFFF; Name; <none>
1014 # Name_Alias (Name_Alias)
1016 # @missing: 0000..10FFFF; Name_Alias; <none>
1018 # Noncharacter_Code_Point (NChar)
1020 NChar; N ; No ; F ; False
1021 NChar; Y ; Yes ; T ; True
1030 # Numeric_Value (nv)
1032 # @missing: 0000..10FFFF; Numeric_Value; NaN
1034 # Other_Alphabetic (OAlpha)
1036 OAlpha; N ; No ; F ; False
1037 OAlpha; Y ; Yes ; T ; True
1039 # Other_Default_Ignorable_Code_Point (ODI)
1041 ODI; N ; No ; F ; False
1042 ODI; Y ; Yes ; T ; True
1044 # Other_Grapheme_Extend (OGr_Ext)
1046 OGr_Ext; N ; No ; F ; False
1047 OGr_Ext; Y ; Yes ; T ; True
1049 # Other_ID_Continue (OIDC)
1051 OIDC; N ; No ; F ; False
1052 OIDC; Y ; Yes ; T ; True
1054 # Other_ID_Start (OIDS)
1056 OIDS; N ; No ; F ; False
1057 OIDS; Y ; Yes ; T ; True
1059 # Other_Lowercase (OLower)
1061 OLower; N ; No ; F ; False
1062 OLower; Y ; Yes ; T ; True
1064 # Other_Math (OMath)
1066 OMath; N ; No ; F ; False
1067 OMath; Y ; Yes ; T ; True
1069 # Other_Uppercase (OUpper)
1071 OUpper; N ; No ; F ; False
1072 OUpper; Y ; Yes ; T ; True
1074 # Pattern_Syntax (Pat_Syn)
1076 Pat_Syn; N ; No ; F ; False
1077 Pat_Syn; Y ; Yes ; T ; True
1079 # Pattern_White_Space (Pat_WS)
1081 Pat_WS; N ; No ; F ; False
1082 Pat_WS; Y ; Yes ; T ; True
1084 # Quotation_Mark (QMark)
1086 QMark; N ; No ; F ; False
1087 QMark; Y ; Yes ; T ; True
1091 Radical; N ; No ; F ; False
1092 Radical; Y ; Yes ; T ; True
1096 STerm; N ; No ; F ; False
1097 STerm; Y ; Yes ; T ; True
1101 sc ; Aghb ; Caucasian_Albanian
1103 sc ; Armi ; Imperial_Aramaic
1104 sc ; Armn ; Armenian
1106 sc ; Bali ; Balinese
1108 sc ; Bass ; Bassa_Vah
1111 sc ; Bopo ; Bopomofo
1114 sc ; Bugi ; Buginese
1117 sc ; Cans ; Canadian_Aboriginal
1120 sc ; Cher ; Cherokee
1121 sc ; Copt ; Coptic ; Qaac
1123 sc ; Cyrl ; Cyrillic
1124 sc ; Deva ; Devanagari
1126 sc ; Dupl ; Duployan
1127 sc ; Egyp ; Egyptian_Hieroglyphs
1129 sc ; Ethi ; Ethiopic
1130 sc ; Geor ; Georgian
1131 sc ; Glag ; Glagolitic
1135 sc ; Gujr ; Gujarati
1136 sc ; Guru ; Gurmukhi
1141 sc ; Hira ; Hiragana
1142 sc ; Hmng ; Pahawh_Hmong
1143 sc ; Hrkt ; Katakana_Or_Hiragana
1144 sc ; Ital ; Old_Italic
1145 sc ; Java ; Javanese
1146 sc ; Kali ; Kayah_Li
1147 sc ; Kana ; Katakana
1148 sc ; Khar ; Kharoshthi
1153 sc ; Lana ; Tai_Tham
1158 sc ; Lina ; Linear_A
1159 sc ; Linb ; Linear_B
1163 sc ; Mahj ; Mahajani
1165 sc ; Mani ; Manichaean
1166 sc ; Mend ; Mende_Kikakui
1167 sc ; Merc ; Meroitic_Cursive
1168 sc ; Mero ; Meroitic_Hieroglyphs
1169 sc ; Mlym ; Malayalam
1171 sc ; Mong ; Mongolian
1173 sc ; Mtei ; Meetei_Mayek
1175 sc ; Narb ; Old_North_Arabian
1176 sc ; Nbat ; Nabataean
1179 sc ; Olck ; Ol_Chiki
1180 sc ; Orkh ; Old_Turkic
1183 sc ; Palm ; Palmyrene
1184 sc ; Pauc ; Pau_Cin_Hau
1185 sc ; Perm ; Old_Permic
1186 sc ; Phag ; Phags_Pa
1187 sc ; Phli ; Inscriptional_Pahlavi
1188 sc ; Phlp ; Psalter_Pahlavi
1189 sc ; Phnx ; Phoenician
1191 sc ; Prti ; Inscriptional_Parthian
1194 sc ; Samr ; Samaritan
1195 sc ; Sarb ; Old_South_Arabian
1196 sc ; Saur ; Saurashtra
1200 sc ; Sind ; Khudawadi
1202 sc ; Sora ; Sora_Sompeng
1203 sc ; Sund ; Sundanese
1204 sc ; Sylo ; Syloti_Nagri
1206 sc ; Tagb ; Tagbanwa
1209 sc ; Talu ; New_Tai_Lue
1211 sc ; Tavt ; Tai_Viet
1213 sc ; Tfng ; Tifinagh
1219 sc ; Ugar ; Ugaritic
1221 sc ; Wara ; Warang_Citi
1222 sc ; Xpeo ; Old_Persian
1223 sc ; Xsux ; Cuneiform
1225 sc ; Zinh ; Inherited ; Qaai
1229 # Script_Extensions (scx)
1231 # @missing: 0000..10FFFF; Script_Extensions; <script>
1233 # Sentence_Break (SB)
1251 # Simple_Case_Folding (scf)
1253 # @missing: 0000..10FFFF; Simple_Case_Folding; <code point>
1255 # Simple_Lowercase_Mapping (slc)
1257 # @missing: 0000..10FFFF; Simple_Lowercase_Mapping; <code point>
1259 # Simple_Titlecase_Mapping (stc)
1261 # @missing: 0000..10FFFF; Simple_Titlecase_Mapping; <code point>
1263 # Simple_Uppercase_Mapping (suc)
1265 # @missing: 0000..10FFFF; Simple_Uppercase_Mapping; <code point>
1269 SD ; N ; No ; F ; False
1270 SD ; Y ; Yes ; T ; True
1272 # Terminal_Punctuation (Term)
1274 Term; N ; No ; F ; False
1275 Term; Y ; Yes ; T ; True
1277 # Titlecase_Mapping (tc)
1279 # @missing: 0000..10FFFF; Titlecase_Mapping; <code point>
1281 # Unicode_1_Name (na1)
1283 # @missing: 0000..10FFFF; Unicode_1_Name; <none>
1285 # Unified_Ideograph (UIdeo)
1287 UIdeo; N ; No ; F ; False
1288 UIdeo; Y ; Yes ; T ; True
1292 Upper; N ; No ; F ; False
1293 Upper; Y ; Yes ; T ; True
1295 # Uppercase_Mapping (uc)
1297 # @missing: 0000..10FFFF; Uppercase_Mapping; <code point>
1299 # Variation_Selector (VS)
1301 VS ; N ; No ; F ; False
1302 VS ; Y ; Yes ; T ; True
1304 # White_Space (WSpace)
1306 WSpace; N ; No ; F ; False
1307 WSpace; Y ; Yes ; T ; True
1312 WB ; DQ ; Double_Quote
1313 WB ; EX ; ExtendNumLet
1314 WB ; Extend ; Extend
1316 WB ; HL ; Hebrew_Letter
1325 WB ; RI ; Regional_Indicator
1326 WB ; SQ ; Single_Quote
1329 # XID_Continue (XIDC)
1331 XIDC; N ; No ; F ; False
1332 XIDC; Y ; Yes ; T ; True
1336 XIDS; N ; No ; F ; False
1337 XIDS; Y ; Yes ; T ; True
1339 # cjkAccountingNumeric (cjkAccountingNumeric)
1341 # @missing: 0000..10FFFF; cjkAccountingNumeric; NaN
1343 # cjkCompatibilityVariant (cjkCompatibilityVariant)
1345 # @missing: 0000..10FFFF; cjkCompatibilityVariant; <code point>
1347 # cjkIICore (cjkIICore)
1349 # @missing: 0000..10FFFF; cjkIICore; <none>
1351 # cjkIRG_GSource (cjkIRG_GSource)
1353 # @missing: 0000..10FFFF; cjkIRG_GSource; <none>
1355 # cjkIRG_HSource (cjkIRG_HSource)
1357 # @missing: 0000..10FFFF; cjkIRG_HSource; <none>
1359 # cjkIRG_JSource (cjkIRG_JSource)
1361 # @missing: 0000..10FFFF; cjkIRG_JSource; <none>
1363 # cjkIRG_KPSource (cjkIRG_KPSource)
1365 # @missing: 0000..10FFFF; cjkIRG_KPSource; <none>
1367 # cjkIRG_KSource (cjkIRG_KSource)
1369 # @missing: 0000..10FFFF; cjkIRG_KSource; <none>
1371 # cjkIRG_MSource (cjkIRG_MSource)
1373 # @missing: 0000..10FFFF; cjkIRG_MSource; <none>
1375 # cjkIRG_TSource (cjkIRG_TSource)
1377 # @missing: 0000..10FFFF; cjkIRG_TSource; <none>
1379 # cjkIRG_USource (cjkIRG_USource)
1381 # @missing: 0000..10FFFF; cjkIRG_USource; <none>
1383 # cjkIRG_VSource (cjkIRG_VSource)
1385 # @missing: 0000..10FFFF; cjkIRG_VSource; <none>
1387 # cjkOtherNumeric (cjkOtherNumeric)
1389 # @missing: 0000..10FFFF; cjkOtherNumeric; NaN
1391 # cjkPrimaryNumeric (cjkPrimaryNumeric)
1393 # @missing: 0000..10FFFF; cjkPrimaryNumeric; NaN
1395 # cjkRSUnicode (cjkRSUnicode)
1397 # @missing: 0000..10FFFF; cjkRSUnicode; <none>