This is a live mirror of the Perl 5 development currently hosted at https://github.com/perl/perl5
mktables not run unless needed
[perl5.git] / lib / unicore / PropValueAliases.txt
1 # PropertyValueAliases-5.1.0.txt
2 # Date: 2008-03-03, 21:58:08 GMT [MD]
3 #
4 # Unicode Character Database
5 # Copyright (c) 1991-2008 Unicode, Inc.
6 # For terms of use, see http://www.unicode.org/terms_of_use.html
7 # For documentation, see UCD.html
8 #
9 # This file contains aliases for property values used in the UCD.
10 # These names can be used for XML formats of UCD data, for regular-expression
11 # property tests, and other programmatic textual descriptions of Unicode data.
12 # For information on which properties are normative, see UCD.html.
13 #
14 # The names may be translated in appropriate environments, and additional
15 # aliases may be useful.
16 #
17 # FORMAT
18 #
19 # Each line describes a property value name.
20 # This consists of three or more fields, separated by semicolons.
21 #
22 # First Field: The first field describes the property for which that
23 # property value name is used.
24 #
25 # Second Field: The second field is an abbreviated name.
26 # If there is no abbreviated name available, the field is marked with "n/a".
27 #
28 # Third Field: The third field is a long name.
29 #
30 # In the case of ccc, there are 4 fields. The second field is numeric, third
31 # is abbreviated, and fourth is long.
32 #
33 # The above are the preferred aliases. Other aliases may be listed in additional fields.
34 #
35 # Loose matching should be applied to all property names and property values, with
36 # the exception of String Property values. With loose matching of property names and
37 # values, the case distinctions, whitespace, and '_' are ignored. For Numeric Property
38 # values, numeric equivalencies are applied: thus "01.00" is equivalent to "1".
39 #
40 # NOTE: Property value names are NOT unique across properties. For example:
41 #
42 #   AL means Arabic Letter for the Bidi_Class property, and
43 #   AL means Above_Left for the Canonical_Combining_Class property, and
44 #   AL means Alphabetic for the Line_Break property.
45 #
46 # In addition, some property names may be the same as some property value names.
47 # For example:
48 #
49 #   sc means the Script property, and
50 #   Sc means the General_Category property value Currency_Symbol (Sc)
51 #
52 # The combination of property value and property name is, however, unique.
53 #
54 # For more information, see UTS #18: Regular Expression Guidelines
55 # ================================================
56
57
58 # ASCII_Hex_Digit (AHex)
59
60 AHex; N        ; No                               ; F                                ; False
61 AHex; Y        ; Yes                              ; T                                ; True
62
63 # Age (age)
64
65 age; n/a       ; 1.1
66 age; n/a       ; 2.0
67 age; n/a       ; 2.1
68 age; n/a       ; 3.0
69 age; n/a       ; 3.1
70 age; n/a       ; 3.2
71 age; n/a       ; 4.0
72 age; n/a       ; 4.1
73 age; n/a       ; 5.0
74 age; n/a       ; 5.1
75 age; n/a       ; unassigned
76
77 # Alphabetic (Alpha)
78
79 Alpha; N       ; No                               ; F                                ; False
80 Alpha; Y       ; Yes                              ; T                                ; True
81
82 # Bidi_Class (bc)
83
84 bc ; AL        ; Arabic_Letter
85 bc ; AN        ; Arabic_Number
86 bc ; B         ; Paragraph_Separator
87 bc ; BN        ; Boundary_Neutral
88 bc ; CS        ; Common_Separator
89 bc ; EN        ; European_Number
90 bc ; ES        ; European_Separator
91 bc ; ET        ; European_Terminator
92 bc ; L         ; Left_To_Right
93 bc ; LRE       ; Left_To_Right_Embedding
94 bc ; LRO       ; Left_To_Right_Override
95 bc ; NSM       ; Nonspacing_Mark
96 bc ; ON        ; Other_Neutral
97 bc ; PDF       ; Pop_Directional_Format
98 bc ; R         ; Right_To_Left
99 bc ; RLE       ; Right_To_Left_Embedding
100 bc ; RLO       ; Right_To_Left_Override
101 bc ; S         ; Segment_Separator
102 bc ; WS        ; White_Space
103
104 # Bidi_Control (Bidi_C)
105
106 Bidi_C; N      ; No                               ; F                                ; False
107 Bidi_C; Y      ; Yes                              ; T                                ; True
108
109 # Bidi_Mirrored (Bidi_M)
110
111 Bidi_M; N      ; No                               ; F                                ; False
112 Bidi_M; Y      ; Yes                              ; T                                ; True
113
114 # Bidi_Mirroring_Glyph (bmg)
115
116 # @missing: 0000..10FFFF; Bidi_Mirroring_Glyph; <none>
117
118 # Block (blk)
119
120 blk; n/a       ; Aegean_Numbers
121 blk; n/a       ; Alphabetic_Presentation_Forms
122 blk; n/a       ; Ancient_Greek_Musical_Notation
123 blk; n/a       ; Ancient_Greek_Numbers
124 blk; n/a       ; Ancient_Symbols
125 blk; n/a       ; Arabic
126 blk; n/a       ; Arabic_Presentation_Forms_A      ; Arabic_Presentation_Forms-A
127 blk; n/a       ; Arabic_Presentation_Forms_B
128 blk; n/a       ; Arabic_Supplement
129 blk; n/a       ; Armenian
130 blk; n/a       ; Arrows
131 blk; n/a       ; Balinese
132 blk; n/a       ; Basic_Latin                      ; ASCII
133 blk; n/a       ; Bengali
134 blk; n/a       ; Block_Elements
135 blk; n/a       ; Bopomofo
136 blk; n/a       ; Bopomofo_Extended
137 blk; n/a       ; Box_Drawing
138 blk; n/a       ; Braille_Patterns
139 blk; n/a       ; Buginese
140 blk; n/a       ; Buhid
141 blk; n/a       ; Byzantine_Musical_Symbols
142 blk; n/a       ; Carian
143 blk; n/a       ; Cham
144 blk; n/a       ; Cherokee
145 blk; n/a       ; CJK_Compatibility
146 blk; n/a       ; CJK_Compatibility_Forms
147 blk; n/a       ; CJK_Compatibility_Ideographs
148 blk; n/a       ; CJK_Compatibility_Ideographs_Supplement
149 blk; n/a       ; CJK_Radicals_Supplement
150 blk; n/a       ; CJK_Strokes
151 blk; n/a       ; CJK_Symbols_And_Punctuation
152 blk; n/a       ; CJK_Unified_Ideographs
153 blk; n/a       ; CJK_Unified_Ideographs_Extension_A
154 blk; n/a       ; CJK_Unified_Ideographs_Extension_B
155 blk; n/a       ; Combining_Diacritical_Marks
156 blk; n/a       ; Combining_Diacritical_Marks_For_Symbols; Combining_Marks_For_Symbols
157 blk; n/a       ; Combining_Diacritical_Marks_Supplement
158 blk; n/a       ; Combining_Half_Marks
159 blk; n/a       ; Control_Pictures
160 blk; n/a       ; Coptic
161 blk; n/a       ; Counting_Rod_Numerals
162 blk; n/a       ; Cuneiform
163 blk; n/a       ; Cuneiform_Numbers_And_Punctuation
164 blk; n/a       ; Currency_Symbols
165 blk; n/a       ; Cypriot_Syllabary
166 blk; n/a       ; Cyrillic
167 blk; n/a       ; Cyrillic_Extended_A
168 blk; n/a       ; Cyrillic_Extended_B
169 blk; n/a       ; Cyrillic_Supplement              ; Cyrillic_Supplementary
170 blk; n/a       ; Deseret
171 blk; n/a       ; Devanagari
172 blk; n/a       ; Dingbats
173 blk; n/a       ; Domino_Tiles
174 blk; n/a       ; Enclosed_Alphanumerics
175 blk; n/a       ; Enclosed_CJK_Letters_And_Months
176 blk; n/a       ; Ethiopic
177 blk; n/a       ; Ethiopic_Extended
178 blk; n/a       ; Ethiopic_Supplement
179 blk; n/a       ; General_Punctuation
180 blk; n/a       ; Geometric_Shapes
181 blk; n/a       ; Georgian
182 blk; n/a       ; Georgian_Supplement
183 blk; n/a       ; Glagolitic
184 blk; n/a       ; Gothic
185 blk; n/a       ; Greek_And_Coptic                 ; Greek
186 blk; n/a       ; Greek_Extended
187 blk; n/a       ; Gujarati
188 blk; n/a       ; Gurmukhi
189 blk; n/a       ; Halfwidth_And_Fullwidth_Forms
190 blk; n/a       ; Hangul_Compatibility_Jamo
191 blk; n/a       ; Hangul_Jamo
192 blk; n/a       ; Hangul_Syllables
193 blk; n/a       ; Hanunoo
194 blk; n/a       ; Hebrew
195 blk; n/a       ; High_Private_Use_Surrogates
196 blk; n/a       ; High_Surrogates
197 blk; n/a       ; Hiragana
198 blk; n/a       ; Ideographic_Description_Characters
199 blk; n/a       ; IPA_Extensions
200 blk; n/a       ; Kanbun
201 blk; n/a       ; Kangxi_Radicals
202 blk; n/a       ; Kannada
203 blk; n/a       ; Katakana
204 blk; n/a       ; Katakana_Phonetic_Extensions
205 blk; n/a       ; Kayah_Li
206 blk; n/a       ; Kharoshthi
207 blk; n/a       ; Khmer
208 blk; n/a       ; Khmer_Symbols
209 blk; n/a       ; Lao
210 blk; n/a       ; Latin_1_Supplement               ; Latin_1
211 blk; n/a       ; Latin_Extended_A
212 blk; n/a       ; Latin_Extended_Additional
213 blk; n/a       ; Latin_Extended_B
214 blk; n/a       ; Latin_Extended_C
215 blk; n/a       ; Latin_Extended_D
216 blk; n/a       ; Lepcha
217 blk; n/a       ; Letterlike_Symbols
218 blk; n/a       ; Limbu
219 blk; n/a       ; Linear_B_Ideograms
220 blk; n/a       ; Linear_B_Syllabary
221 blk; n/a       ; Low_Surrogates
222 blk; n/a       ; Lycian
223 blk; n/a       ; Lydian
224 blk; n/a       ; Mahjong_Tiles
225 blk; n/a       ; Malayalam
226 blk; n/a       ; Mathematical_Alphanumeric_Symbols
227 blk; n/a       ; Mathematical_Operators
228 blk; n/a       ; Miscellaneous_Mathematical_Symbols_A
229 blk; n/a       ; Miscellaneous_Mathematical_Symbols_B
230 blk; n/a       ; Miscellaneous_Symbols
231 blk; n/a       ; Miscellaneous_Symbols_And_Arrows
232 blk; n/a       ; Miscellaneous_Technical
233 blk; n/a       ; Modifier_Tone_Letters
234 blk; n/a       ; Mongolian
235 blk; n/a       ; Musical_Symbols
236 blk; n/a       ; Myanmar
237 blk; n/a       ; New_Tai_Lue
238 blk; n/a       ; NKo
239 blk; n/a       ; No_Block
240 blk; n/a       ; Number_Forms
241 blk; n/a       ; Ogham
242 blk; n/a       ; Ol_Chiki
243 blk; n/a       ; Old_Italic
244 blk; n/a       ; Old_Persian
245 blk; n/a       ; Optical_Character_Recognition
246 blk; n/a       ; Oriya
247 blk; n/a       ; Osmanya
248 blk; n/a       ; Phags_Pa
249 blk; n/a       ; Phaistos_Disc
250 blk; n/a       ; Phoenician
251 blk; n/a       ; Phonetic_Extensions
252 blk; n/a       ; Phonetic_Extensions_Supplement
253 blk; n/a       ; Private_Use_Area                 ; Private_Use
254 blk; n/a       ; Rejang
255 blk; n/a       ; Runic
256 blk; n/a       ; Saurashtra
257 blk; n/a       ; Shavian
258 blk; n/a       ; Sinhala
259 blk; n/a       ; Small_Form_Variants
260 blk; n/a       ; Spacing_Modifier_Letters
261 blk; n/a       ; Specials
262 blk; n/a       ; Sundanese
263 blk; n/a       ; Superscripts_And_Subscripts
264 blk; n/a       ; Supplemental_Arrows_A
265 blk; n/a       ; Supplemental_Arrows_B
266 blk; n/a       ; Supplemental_Mathematical_Operators
267 blk; n/a       ; Supplemental_Punctuation
268 blk; n/a       ; Supplementary_Private_Use_Area_A
269 blk; n/a       ; Supplementary_Private_Use_Area_B
270 blk; n/a       ; Syloti_Nagri
271 blk; n/a       ; Syriac
272 blk; n/a       ; Tagalog
273 blk; n/a       ; Tagbanwa
274 blk; n/a       ; Tags
275 blk; n/a       ; Tai_Le
276 blk; n/a       ; Tai_Xuan_Jing_Symbols
277 blk; n/a       ; Tamil
278 blk; n/a       ; Telugu
279 blk; n/a       ; Thaana
280 blk; n/a       ; Thai
281 blk; n/a       ; Tibetan
282 blk; n/a       ; Tifinagh
283 blk; n/a       ; Ugaritic
284 blk; n/a       ; Unified_Canadian_Aboriginal_Syllabics; Canadian_Syllabics
285 blk; n/a       ; Vai
286 blk; n/a       ; Variation_Selectors
287 blk; n/a       ; Variation_Selectors_Supplement
288 blk; n/a       ; Vertical_Forms
289 blk; n/a       ; Yi_Radicals
290 blk; n/a       ; Yi_Syllables
291 blk; n/a       ; Yijing_Hexagram_Symbols
292
293 # Canonical_Combining_Class (ccc)
294
295 ccc;   0; NR   ; Not_Reordered
296 ccc;   1; OV   ; Overlay
297 ccc;   7; NK   ; Nukta
298 ccc;   8; KV   ; Kana_Voicing
299 ccc;   9; VR   ; Virama
300 ccc; 200; ATBL ; Attached_Below_Left
301 ccc; 202; ATB  ; Attached_Below
302 ccc; 216; ATAR ; Attached_Above_Right
303 ccc; 218; BL   ; Below_Left
304 ccc; 220; B    ; Below
305 ccc; 222; BR   ; Below_Right
306 ccc; 224; L    ; Left
307 ccc; 226; R    ; Right
308 ccc; 228; AL   ; Above_Left
309 ccc; 230; A    ; Above
310 ccc; 232; AR   ; Above_Right
311 ccc; 233; DB   ; Double_Below
312 ccc; 234; DA   ; Double_Above
313 ccc; 240; IS   ; Iota_Subscript
314
315 # Case_Folding (cf)
316
317 # @missing: 0000..10FFFF; Case_Folding; <code point>
318
319 # Composition_Exclusion (CE)
320
321 CE ; N         ; No                               ; F                                ; False
322 CE ; Y         ; Yes                              ; T                                ; True
323
324 # Dash (Dash)
325
326 Dash; N        ; No                               ; F                                ; False
327 Dash; Y        ; Yes                              ; T                                ; True
328
329 # Decomposition_Mapping (dm)
330
331 # @missing: 0000..10FFFF; Decomposition_Mapping; <code point>
332
333 # Decomposition_Type (dt)
334
335 dt ; Can       ; Canonical                        ; can
336 dt ; Com       ; Compat                           ; com
337 dt ; Enc       ; Circle                           ; enc
338 dt ; Fin       ; Final                            ; fin
339 dt ; Font      ; font
340 dt ; Fra       ; Fraction                         ; fra
341 dt ; Init      ; Initial                          ; init
342 dt ; Iso       ; Isolated                         ; iso
343 dt ; Med       ; Medial                           ; med
344 dt ; Nar       ; Narrow                           ; nar
345 dt ; Nb        ; Nobreak                          ; nb
346 dt ; None      ; none
347 dt ; Sml       ; Small                            ; sml
348 dt ; Sqr       ; Square                           ; sqr
349 dt ; Sub       ; sub
350 dt ; Sup       ; Super                            ; sup
351 dt ; Vert      ; Vertical                         ; vert
352 dt ; Wide      ; wide
353
354 # Default_Ignorable_Code_Point (DI)
355
356 DI ; N         ; No                               ; F                                ; False
357 DI ; Y         ; Yes                              ; T                                ; True
358
359 # Deprecated (Dep)
360
361 Dep; N         ; No                               ; F                                ; False
362 Dep; Y         ; Yes                              ; T                                ; True
363
364 # Diacritic (Dia)
365
366 Dia; N         ; No                               ; F                                ; False
367 Dia; Y         ; Yes                              ; T                                ; True
368
369 # East_Asian_Width (ea)
370
371 ea ; A         ; Ambiguous
372 ea ; F         ; Fullwidth
373 ea ; H         ; Halfwidth
374 ea ; N         ; Neutral
375 ea ; Na        ; Narrow
376 ea ; W         ; Wide
377
378 # Expands_On_NFC (XO_NFC)
379
380 XO_NFC; N      ; No                               ; F                                ; False
381 XO_NFC; Y      ; Yes                              ; T                                ; True
382
383 # Expands_On_NFD (XO_NFD)
384
385 XO_NFD; N      ; No                               ; F                                ; False
386 XO_NFD; Y      ; Yes                              ; T                                ; True
387
388 # Expands_On_NFKC (XO_NFKC)
389
390 XO_NFKC; N     ; No                               ; F                                ; False
391 XO_NFKC; Y     ; Yes                              ; T                                ; True
392
393 # Expands_On_NFKD (XO_NFKD)
394
395 XO_NFKD; N     ; No                               ; F                                ; False
396 XO_NFKD; Y     ; Yes                              ; T                                ; True
397
398 # Extender (Ext)
399
400 Ext; N         ; No                               ; F                                ; False
401 Ext; Y         ; Yes                              ; T                                ; True
402
403 # FC_NFKC_Closure (FC_NFKC)
404
405 # @missing: 0000..10FFFF; FC_NFKC_Closure; <code point>
406
407 # Full_Composition_Exclusion (Comp_Ex)
408
409 Comp_Ex; N     ; No                               ; F                                ; False
410 Comp_Ex; Y     ; Yes                              ; T                                ; True
411
412 # General_Category (gc)
413
414 gc ; C         ; Other                            # Cc | Cf | Cn | Co | Cs
415 gc ; Cc        ; Control                          ; cntrl
416 gc ; Cf        ; Format
417 gc ; Cn        ; Unassigned
418 gc ; Co        ; Private_Use
419 gc ; Cs        ; Surrogate
420 gc ; L         ; Letter                           # Ll | Lm | Lo | Lt | Lu
421 gc ; LC        ; Cased_Letter                     # Ll | Lt | Lu
422 gc ; Ll        ; Lowercase_Letter
423 gc ; Lm        ; Modifier_Letter
424 gc ; Lo        ; Other_Letter
425 gc ; Lt        ; Titlecase_Letter
426 gc ; Lu        ; Uppercase_Letter
427 gc ; M         ; Mark                             # Mc | Me | Mn
428 gc ; Mc        ; Spacing_Mark
429 gc ; Me        ; Enclosing_Mark
430 gc ; Mn        ; Nonspacing_Mark
431 gc ; N         ; Number                           # Nd | Nl | No
432 gc ; Nd        ; Decimal_Number                   ; digit
433 gc ; Nl        ; Letter_Number
434 gc ; No        ; Other_Number
435 gc ; P         ; Punctuation                      ; punct                            # Pc | Pd | Pe | Pf | Pi | Po | Ps
436 gc ; Pc        ; Connector_Punctuation
437 gc ; Pd        ; Dash_Punctuation
438 gc ; Pe        ; Close_Punctuation
439 gc ; Pf        ; Final_Punctuation
440 gc ; Pi        ; Initial_Punctuation
441 gc ; Po        ; Other_Punctuation
442 gc ; Ps        ; Open_Punctuation
443 gc ; S         ; Symbol                           # Sc | Sk | Sm | So
444 gc ; Sc        ; Currency_Symbol
445 gc ; Sk        ; Modifier_Symbol
446 gc ; Sm        ; Math_Symbol
447 gc ; So        ; Other_Symbol
448 gc ; Z         ; Separator                        # Zl | Zp | Zs
449 gc ; Zl        ; Line_Separator
450 gc ; Zp        ; Paragraph_Separator
451 gc ; Zs        ; Space_Separator
452
453 # Grapheme_Base (Gr_Base)
454
455 Gr_Base; N     ; No                               ; F                                ; False
456 Gr_Base; Y     ; Yes                              ; T                                ; True
457
458 # Grapheme_Cluster_Break (GCB)
459
460 GCB; CN        ; Control
461 GCB; CR        ; CR
462 GCB; EX        ; Extend
463 GCB; L         ; L
464 GCB; LF        ; LF
465 GCB; LV        ; LV
466 GCB; LVT       ; LVT
467 GCB; PP        ; Prepend
468 GCB; SM        ; SpacingMark
469 GCB; T         ; T
470 GCB; V         ; V
471 GCB; XX        ; Other
472
473 # Grapheme_Extend (Gr_Ext)
474
475 Gr_Ext; N      ; No                               ; F                                ; False
476 Gr_Ext; Y      ; Yes                              ; T                                ; True
477
478 # Grapheme_Link (Gr_Link)
479
480 Gr_Link; N     ; No                               ; F                                ; False
481 Gr_Link; Y     ; Yes                              ; T                                ; True
482
483 # Hangul_Syllable_Type (hst)
484
485 hst; L         ; Leading_Jamo
486 hst; LV        ; LV_Syllable
487 hst; LVT       ; LVT_Syllable
488 hst; NA        ; Not_Applicable
489 hst; T         ; Trailing_Jamo
490 hst; V         ; Vowel_Jamo
491
492 # Hex_Digit (Hex)
493
494 Hex; N         ; No                               ; F                                ; False
495 Hex; Y         ; Yes                              ; T                                ; True
496
497 # Hyphen (Hyphen)
498
499 Hyphen; N      ; No                               ; F                                ; False
500 Hyphen; Y      ; Yes                              ; T                                ; True
501
502 # IDS_Binary_Operator (IDSB)
503
504 IDSB; N        ; No                               ; F                                ; False
505 IDSB; Y        ; Yes                              ; T                                ; True
506
507 # IDS_Trinary_Operator (IDST)
508
509 IDST; N        ; No                               ; F                                ; False
510 IDST; Y        ; Yes                              ; T                                ; True
511
512 # ID_Continue (IDC)
513
514 IDC; N         ; No                               ; F                                ; False
515 IDC; Y         ; Yes                              ; T                                ; True
516
517 # ID_Start (IDS)
518
519 IDS; N         ; No                               ; F                                ; False
520 IDS; Y         ; Yes                              ; T                                ; True
521
522 # ISO_Comment (isc)
523
524 # @missing: 0000..10FFFF; ISO_Comment; <none>
525
526 # Ideographic (Ideo)
527
528 Ideo; N        ; No                               ; F                                ; False
529 Ideo; Y        ; Yes                              ; T                                ; True
530
531 # Jamo_Short_Name (JSN)
532
533 # @missing: 0000..10FFFF; Jamo_Short_Name; <none>
534 JSN; A         ; A
535 JSN; AE        ; AE
536 JSN; B         ; B
537 JSN; BB        ; BB
538 JSN; BS        ; BS
539 JSN; C         ; C
540 JSN; D         ; D
541 JSN; DD        ; DD
542 JSN; E         ; E
543 JSN; EO        ; EO
544 JSN; EU        ; EU
545 JSN; G         ; G
546 JSN; GG        ; GG
547 JSN; GS        ; GS
548 JSN; H         ; H
549 JSN; I         ; I
550 JSN; J         ; J
551 JSN; JJ        ; JJ
552 JSN; K         ; K
553 JSN; L         ; L
554 JSN; LB        ; LB
555 JSN; LG        ; LG
556 JSN; LH        ; LH
557 JSN; LM        ; LM
558 JSN; LP        ; LP
559 JSN; LS        ; LS
560 JSN; LT        ; LT
561 JSN; M         ; M
562 JSN; N         ; N
563 JSN; NG        ; NG
564 JSN; NH        ; NH
565 JSN; NJ        ; NJ
566 JSN; O         ; O
567 JSN; OE        ; OE
568 JSN; P         ; P
569 JSN; R         ; R
570 JSN; S         ; S
571 JSN; SS        ; SS
572 JSN; T         ; T
573 JSN; U         ; U
574 JSN; WA        ; WA
575 JSN; WAE       ; WAE
576 JSN; WE        ; WE
577 JSN; WEO       ; WEO
578 JSN; WI        ; WI
579 JSN; YA        ; YA
580 JSN; YAE       ; YAE
581 JSN; YE        ; YE
582 JSN; YEO       ; YEO
583 JSN; YI        ; YI
584 JSN; YO        ; YO
585 JSN; YU        ; YU
586
587 # Join_Control (Join_C)
588
589 Join_C; N      ; No                               ; F                                ; False
590 Join_C; Y      ; Yes                              ; T                                ; True
591
592 # Joining_Group (jg)
593
594 jg ; n/a       ; Ain
595 jg ; n/a       ; Alaph
596 jg ; n/a       ; Alef
597 jg ; n/a       ; Beh
598 jg ; n/a       ; Beth
599 jg ; n/a       ; Burushaski_Yeh_Barree
600 jg ; n/a       ; Dal
601 jg ; n/a       ; Dalath_Rish
602 jg ; n/a       ; E
603 jg ; n/a       ; Fe
604 jg ; n/a       ; Feh
605 jg ; n/a       ; Final_Semkath
606 jg ; n/a       ; Gaf
607 jg ; n/a       ; Gamal
608 jg ; n/a       ; Hah
609 jg ; n/a       ; Hamza_On_Heh_Goal
610 jg ; n/a       ; He
611 jg ; n/a       ; Heh
612 jg ; n/a       ; Heh_Goal
613 jg ; n/a       ; Heth
614 jg ; n/a       ; Kaf
615 jg ; n/a       ; Kaph
616 jg ; n/a       ; Khaph
617 jg ; n/a       ; Knotted_Heh
618 jg ; n/a       ; Lam
619 jg ; n/a       ; Lamadh
620 jg ; n/a       ; Meem
621 jg ; n/a       ; Mim
622 jg ; n/a       ; No_Joining_Group
623 jg ; n/a       ; Noon
624 jg ; n/a       ; Nun
625 jg ; n/a       ; Pe
626 jg ; n/a       ; Qaf
627 jg ; n/a       ; Qaph
628 jg ; n/a       ; Reh
629 jg ; n/a       ; Reversed_Pe
630 jg ; n/a       ; Sad
631 jg ; n/a       ; Sadhe
632 jg ; n/a       ; Seen
633 jg ; n/a       ; Semkath
634 jg ; n/a       ; Shin
635 jg ; n/a       ; Swash_Kaf
636 jg ; n/a       ; Syriac_Waw
637 jg ; n/a       ; Tah
638 jg ; n/a       ; Taw
639 jg ; n/a       ; Teh_Marbuta
640 jg ; n/a       ; Teth
641 jg ; n/a       ; Waw
642 jg ; n/a       ; Yeh
643 jg ; n/a       ; Yeh_Barree
644 jg ; n/a       ; Yeh_With_Tail
645 jg ; n/a       ; Yudh
646 jg ; n/a       ; Yudh_He
647 jg ; n/a       ; Zain
648 jg ; n/a       ; Zhain
649
650 # Joining_Type (jt)
651
652 jt ; C         ; Join_Causing
653 jt ; D         ; Dual_Joining
654 jt ; L         ; Left_Joining
655 jt ; R         ; Right_Joining
656 jt ; T         ; Transparent
657 jt ; U         ; Non_Joining
658
659 # Line_Break (lb)
660
661 lb ; AI        ; Ambiguous
662 lb ; AL        ; Alphabetic
663 lb ; B2        ; Break_Both
664 lb ; BA        ; Break_After
665 lb ; BB        ; Break_Before
666 lb ; BK        ; Mandatory_Break
667 lb ; CB        ; Contingent_Break
668 lb ; CL        ; Close_Punctuation
669 lb ; CM        ; Combining_Mark
670 lb ; CR        ; Carriage_Return
671 lb ; EX        ; Exclamation
672 lb ; GL        ; Glue
673 lb ; H2        ; H2
674 lb ; H3        ; H3
675 lb ; HY        ; Hyphen
676 lb ; ID        ; Ideographic
677 lb ; IN        ; Inseparable                      ; Inseperable
678 lb ; IS        ; Infix_Numeric
679 lb ; JL        ; JL
680 lb ; JT        ; JT
681 lb ; JV        ; JV
682 lb ; LF        ; Line_Feed
683 lb ; NL        ; Next_Line
684 lb ; NS        ; Nonstarter
685 lb ; NU        ; Numeric
686 lb ; OP        ; Open_Punctuation
687 lb ; PO        ; Postfix_Numeric
688 lb ; PR        ; Prefix_Numeric
689 lb ; QU        ; Quotation
690 lb ; SA        ; Complex_Context
691 lb ; SG        ; Surrogate
692 lb ; SP        ; Space
693 lb ; SY        ; Break_Symbols
694 lb ; WJ        ; Word_Joiner
695 lb ; XX        ; Unknown
696 lb ; ZW        ; ZWSpace
697
698 # Logical_Order_Exception (LOE)
699
700 LOE; N         ; No                               ; F                                ; False
701 LOE; Y         ; Yes                              ; T                                ; True
702
703 # Lowercase (Lower)
704
705 Lower; N       ; No                               ; F                                ; False
706 Lower; Y       ; Yes                              ; T                                ; True
707
708 # Lowercase_Mapping (lc)
709
710 # @missing: 0000..10FFFF; Lowercase_Mapping; <code point>
711
712 # Math (Math)
713
714 Math; N        ; No                               ; F                                ; False
715 Math; Y        ; Yes                              ; T                                ; True
716
717 # NFC_Quick_Check (NFC_QC)
718
719 NFC_QC; M      ; Maybe
720 NFC_QC; N      ; No
721 NFC_QC; Y      ; Yes
722
723 # NFD_Quick_Check (NFD_QC)
724
725 NFD_QC; N      ; No
726 NFD_QC; Y      ; Yes
727
728 # NFKC_Quick_Check (NFKC_QC)
729
730 NFKC_QC; M     ; Maybe
731 NFKC_QC; N     ; No
732 NFKC_QC; Y     ; Yes
733
734 # NFKD_Quick_Check (NFKD_QC)
735
736 NFKD_QC; N     ; No
737 NFKD_QC; Y     ; Yes
738
739 # Name (na)
740
741 # @missing: 0000..10FFFF; Name; <none>
742
743 # Noncharacter_Code_Point (NChar)
744
745 NChar; N       ; No                               ; F                                ; False
746 NChar; Y       ; Yes                              ; T                                ; True
747
748 # Numeric_Type (nt)
749
750 nt ; De        ; Decimal
751 nt ; Di        ; Digit
752 nt ; None      ; None
753 nt ; Nu        ; Numeric
754
755 # Numeric_Value (nv)
756
757 # @missing: 0000..10FFFF; Numeric_Value; NaN
758
759 # Other_Alphabetic (OAlpha)
760
761 OAlpha; N      ; No                               ; F                                ; False
762 OAlpha; Y      ; Yes                              ; T                                ; True
763
764 # Other_Default_Ignorable_Code_Point (ODI)
765
766 ODI; N         ; No                               ; F                                ; False
767 ODI; Y         ; Yes                              ; T                                ; True
768
769 # Other_Grapheme_Extend (OGr_Ext)
770
771 OGr_Ext; N     ; No                               ; F                                ; False
772 OGr_Ext; Y     ; Yes                              ; T                                ; True
773
774 # Other_ID_Continue (OIDC)
775
776 OIDC; N        ; No                               ; F                                ; False
777 OIDC; Y        ; Yes                              ; T                                ; True
778
779 # Other_ID_Start (OIDS)
780
781 OIDS; N        ; No                               ; F                                ; False
782 OIDS; Y        ; Yes                              ; T                                ; True
783
784 # Other_Lowercase (OLower)
785
786 OLower; N      ; No                               ; F                                ; False
787 OLower; Y      ; Yes                              ; T                                ; True
788
789 # Other_Math (OMath)
790
791 OMath; N       ; No                               ; F                                ; False
792 OMath; Y       ; Yes                              ; T                                ; True
793
794 # Other_Uppercase (OUpper)
795
796 OUpper; N      ; No                               ; F                                ; False
797 OUpper; Y      ; Yes                              ; T                                ; True
798
799 # Pattern_Syntax (Pat_Syn)
800
801 Pat_Syn; N     ; No                               ; F                                ; False
802 Pat_Syn; Y     ; Yes                              ; T                                ; True
803
804 # Pattern_White_Space (Pat_WS)
805
806 Pat_WS; N      ; No                               ; F                                ; False
807 Pat_WS; Y      ; Yes                              ; T                                ; True
808
809 # Quotation_Mark (QMark)
810
811 QMark; N       ; No                               ; F                                ; False
812 QMark; Y       ; Yes                              ; T                                ; True
813
814 # Radical (Radical)
815
816 Radical; N     ; No                               ; F                                ; False
817 Radical; Y     ; Yes                              ; T                                ; True
818
819 # STerm (STerm)
820
821 STerm; N       ; No                               ; F                                ; False
822 STerm; Y       ; Yes                              ; T                                ; True
823
824 # Script (sc)
825
826 sc ; Arab      ; Arabic
827 sc ; Armn      ; Armenian
828 sc ; Bali      ; Balinese
829 sc ; Beng      ; Bengali
830 sc ; Bopo      ; Bopomofo
831 sc ; Brai      ; Braille
832 sc ; Bugi      ; Buginese
833 sc ; Buhd      ; Buhid
834 sc ; Cans      ; Canadian_Aboriginal
835 sc ; Cari      ; Carian
836 sc ; Cham      ; Cham
837 sc ; Cher      ; Cherokee
838 sc ; Copt      ; Coptic                           ; Qaac
839 sc ; Cprt      ; Cypriot
840 sc ; Cyrl      ; Cyrillic
841 sc ; Deva      ; Devanagari
842 sc ; Dsrt      ; Deseret
843 sc ; Ethi      ; Ethiopic
844 sc ; Geor      ; Georgian
845 sc ; Glag      ; Glagolitic
846 sc ; Goth      ; Gothic
847 sc ; Grek      ; Greek
848 sc ; Gujr      ; Gujarati
849 sc ; Guru      ; Gurmukhi
850 sc ; Hang      ; Hangul
851 sc ; Hani      ; Han
852 sc ; Hano      ; Hanunoo
853 sc ; Hebr      ; Hebrew
854 sc ; Hira      ; Hiragana
855 sc ; Hrkt      ; Katakana_Or_Hiragana
856 sc ; Ital      ; Old_Italic
857 sc ; Kali      ; Kayah_Li
858 sc ; Kana      ; Katakana
859 sc ; Khar      ; Kharoshthi
860 sc ; Khmr      ; Khmer
861 sc ; Knda      ; Kannada
862 sc ; Laoo      ; Lao
863 sc ; Latn      ; Latin
864 sc ; Lepc      ; Lepcha
865 sc ; Limb      ; Limbu
866 sc ; Linb      ; Linear_B
867 sc ; Lyci      ; Lycian
868 sc ; Lydi      ; Lydian
869 sc ; Mlym      ; Malayalam
870 sc ; Mong      ; Mongolian
871 sc ; Mymr      ; Myanmar
872 sc ; Nkoo      ; Nko
873 sc ; Ogam      ; Ogham
874 sc ; Olck      ; Ol_Chiki
875 sc ; Orya      ; Oriya
876 sc ; Osma      ; Osmanya
877 sc ; Phag      ; Phags_Pa
878 sc ; Phnx      ; Phoenician
879 sc ; Qaai      ; Inherited
880 sc ; Rjng      ; Rejang
881 sc ; Runr      ; Runic
882 sc ; Saur      ; Saurashtra
883 sc ; Shaw      ; Shavian
884 sc ; Sinh      ; Sinhala
885 sc ; Sund      ; Sundanese
886 sc ; Sylo      ; Syloti_Nagri
887 sc ; Syrc      ; Syriac
888 sc ; Tagb      ; Tagbanwa
889 sc ; Tale      ; Tai_Le
890 sc ; Talu      ; New_Tai_Lue
891 sc ; Taml      ; Tamil
892 sc ; Telu      ; Telugu
893 sc ; Tfng      ; Tifinagh
894 sc ; Tglg      ; Tagalog
895 sc ; Thaa      ; Thaana
896 sc ; Thai      ; Thai
897 sc ; Tibt      ; Tibetan
898 sc ; Ugar      ; Ugaritic
899 sc ; Vaii      ; Vai
900 sc ; Xpeo      ; Old_Persian
901 sc ; Xsux      ; Cuneiform
902 sc ; Yiii      ; Yi
903 sc ; Zyyy      ; Common
904 sc ; Zzzz      ; Unknown
905
906 # Sentence_Break (SB)
907
908 SB ; AT        ; ATerm
909 SB ; CL        ; Close
910 SB ; CR        ; CR
911 SB ; EX        ; Extend
912 SB ; FO        ; Format
913 SB ; LE        ; OLetter
914 SB ; LF        ; LF
915 SB ; LO        ; Lower
916 SB ; NU        ; Numeric
917 SB ; SC        ; SContinue
918 SB ; SE        ; Sep
919 SB ; SP        ; Sp
920 SB ; ST        ; STerm
921 SB ; UP        ; Upper
922 SB ; XX        ; Other
923
924 # Simple_Case_Folding (scf)
925
926 # @missing: 0000..10FFFF; Simple_Case_Folding; <code point>
927
928 # Simple_Lowercase_Mapping (slc)
929
930 # @missing: 0000..10FFFF; Simple_Lowercase_Mapping; <code point>
931
932 # Simple_Titlecase_Mapping (stc)
933
934 # @missing: 0000..10FFFF; Simple_Titlecase_Mapping; <code point>
935
936 # Simple_Uppercase_Mapping (suc)
937
938 # @missing: 0000..10FFFF; Simple_Uppercase_Mapping; <code point>
939
940 # Soft_Dotted (SD)
941
942 SD ; N         ; No                               ; F                                ; False
943 SD ; Y         ; Yes                              ; T                                ; True
944
945 # Terminal_Punctuation (Term)
946
947 Term; N        ; No                               ; F                                ; False
948 Term; Y        ; Yes                              ; T                                ; True
949
950 # Titlecase_Mapping (tc)
951
952 # @missing: 0000..10FFFF; Titlecase_Mapping; <code point>
953
954 # Unicode_1_Name (na1)
955
956 # @missing: 0000..10FFFF; Unicode_1_Name; <none>
957
958 # Unicode_Radical_Stroke (URS)
959
960 # @missing: 0000..10FFFF; Unicode_Radical_Stroke; <none>
961
962 # Unified_Ideograph (UIdeo)
963
964 UIdeo; N       ; No                               ; F                                ; False
965 UIdeo; Y       ; Yes                              ; T                                ; True
966
967 # Uppercase (Upper)
968
969 Upper; N       ; No                               ; F                                ; False
970 Upper; Y       ; Yes                              ; T                                ; True
971
972 # Uppercase_Mapping (uc)
973
974 # @missing: 0000..10FFFF; Uppercase_Mapping; <code point>
975
976 # Variation_Selector (VS)
977
978 VS ; N         ; No                               ; F                                ; False
979 VS ; Y         ; Yes                              ; T                                ; True
980
981 # White_Space (WSpace)
982
983 WSpace; N      ; No                               ; F                                ; False
984 WSpace; Y      ; Yes                              ; T                                ; True
985
986 # Word_Break (WB)
987
988 WB ; CR        ; CR
989 WB ; EX        ; ExtendNumLet
990 WB ; Extend    ; Extend
991 WB ; FO        ; Format
992 WB ; KA        ; Katakana
993 WB ; LE        ; ALetter
994 WB ; LF        ; LF
995 WB ; MB        ; MidNumLet
996 WB ; ML        ; MidLetter
997 WB ; MN        ; MidNum
998 WB ; NL        ; Newline
999 WB ; NU        ; Numeric
1000 WB ; XX        ; Other
1001
1002 # XID_Continue (XIDC)
1003
1004 XIDC; N        ; No                               ; F                                ; False
1005 XIDC; Y        ; Yes                              ; T                                ; True
1006
1007 # XID_Start (XIDS)
1008
1009 XIDS; N        ; No                               ; F                                ; False
1010 XIDS; Y        ; Yes                              ; T                                ; True
1011
1012 # EOF