summaryrefslogtreecommitdiff
path: root/data/unicode/PropertyValueAliases.txt
diff options
context:
space:
mode:
authorGravatar Jose Colon Rodriguez2024-02-19 09:11:56 -0400
committerGravatar Jose Colon Rodriguez2024-02-19 09:11:56 -0400
commit6013b2ded106521ee9cae6bd77dacbd5254ff763 (patch)
tree990f13cfbe4bfc20a08d2f097c4646984bffb565 /data/unicode/PropertyValueAliases.txt
parentTried SIMD lower/upper string. Slower than linear. (diff)
downloadzg-6013b2ded106521ee9cae6bd77dacbd5254ff763.tar.gz
zg-6013b2ded106521ee9cae6bd77dacbd5254ff763.tar.xz
zg-6013b2ded106521ee9cae6bd77dacbd5254ff763.zip
Cleaned up directory structure
Diffstat (limited to 'data/unicode/PropertyValueAliases.txt')
-rw-r--r--data/unicode/PropertyValueAliases.txt1653
1 files changed, 1653 insertions, 0 deletions
diff --git a/data/unicode/PropertyValueAliases.txt b/data/unicode/PropertyValueAliases.txt
new file mode 100644
index 0000000..240cd28
--- /dev/null
+++ b/data/unicode/PropertyValueAliases.txt
@@ -0,0 +1,1653 @@
1# PropertyValueAliases-15.1.0.txt
2# Date: 2023-08-07, 15:21:34 GMT
3# © 2023 Unicode®, Inc.
4# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries.
5# For terms of use, see https://www.unicode.org/terms_of_use.html
6#
7# Unicode Character Database
8# For documentation, see https://www.unicode.org/reports/tr44/
9#
10# This file contains aliases for property values used in the UCD.
11# These names can be used for XML formats of UCD data, for regular-expression
12# property tests, and other programmatic textual descriptions of Unicode data.
13#
14# The names may be translated in appropriate environments, and additional
15# aliases may be useful.
16#
17# FORMAT
18#
19# Each line describes a property value name.
20# This consists of three or more fields, separated by semicolons.
21#
22# First Field: The first field describes the property for which that
23# property value name is used.
24#
25# Second Field: The second field is the short name for the property value.
26# It is typically an abbreviation, but in a number of cases it is simply
27# a duplicate of the "long name" in the third field.
28#
29# Third Field: The third field is the long name for the property value,
30# typically the formal name used in documentation about the property value.
31#
32# In the case of Canonical_Combining_Class (ccc), there are 4 fields:
33# The second field is numeric, the third is the short name, and the fourth is the long name.
34#
35# The above are the preferred aliases. Other aliases may be listed in additional fields.
36#
37# Loose matching should be applied to all property names and property values, with
38# the exception of String Property values. With loose matching of property names and
39# values, the case distinctions, whitespace, hyphens, and '_' are ignored.
40# For Numeric Property values, numeric equivalence is applied: thus "01.00"
41# is equivalent to "1".
42#
43# NOTE: Property value names are NOT unique across properties. For example:
44#
45# AL means Arabic Letter for the Bidi_Class property, and
46# AL means Above_Left for the Canonical_Combining_Class property, and
47# AL means Alphabetic for the Line_Break property.
48#
49# In addition, some property names may be the same as some property value names.
50# For example:
51#
52# sc means the Script property, and
53# Sc means the General_Category property value Currency_Symbol (Sc)
54#
55# The combination of property value and property name is, however, unique.
56#
57# For more information, see UAX #44, Unicode Character Database, and
58# UTS #18, Unicode Regular Expressions.
59# ================================================
60
61
62# ASCII_Hex_Digit (AHex)
63
64AHex; N ; No ; F ; False
65AHex; Y ; Yes ; T ; True
66
67# Age (age)
68
69age; 1.1 ; V1_1
70age; 2.0 ; V2_0
71age; 2.1 ; V2_1
72age; 3.0 ; V3_0
73age; 3.1 ; V3_1
74age; 3.2 ; V3_2
75age; 4.0 ; V4_0
76age; 4.1 ; V4_1
77age; 5.0 ; V5_0
78age; 5.1 ; V5_1
79age; 5.2 ; V5_2
80age; 6.0 ; V6_0
81age; 6.1 ; V6_1
82age; 6.2 ; V6_2
83age; 6.3 ; V6_3
84age; 7.0 ; V7_0
85age; 8.0 ; V8_0
86age; 9.0 ; V9_0
87age; 10.0 ; V10_0
88age; 11.0 ; V11_0
89age; 12.0 ; V12_0
90age; 12.1 ; V12_1
91age; 13.0 ; V13_0
92age; 14.0 ; V14_0
93age; 15.0 ; V15_0
94age; 15.1 ; V15_1
95age; NA ; Unassigned
96
97# Alphabetic (Alpha)
98
99Alpha; N ; No ; F ; False
100Alpha; Y ; Yes ; T ; True
101
102# Bidi_Class (bc)
103
104bc ; AL ; Arabic_Letter
105bc ; AN ; Arabic_Number
106bc ; B ; Paragraph_Separator
107bc ; BN ; Boundary_Neutral
108bc ; CS ; Common_Separator
109bc ; EN ; European_Number
110bc ; ES ; European_Separator
111bc ; ET ; European_Terminator
112bc ; FSI ; First_Strong_Isolate
113bc ; L ; Left_To_Right
114bc ; LRE ; Left_To_Right_Embedding
115bc ; LRI ; Left_To_Right_Isolate
116bc ; LRO ; Left_To_Right_Override
117bc ; NSM ; Nonspacing_Mark
118bc ; ON ; Other_Neutral
119bc ; PDF ; Pop_Directional_Format
120bc ; PDI ; Pop_Directional_Isolate
121bc ; R ; Right_To_Left
122bc ; RLE ; Right_To_Left_Embedding
123bc ; RLI ; Right_To_Left_Isolate
124bc ; RLO ; Right_To_Left_Override
125bc ; S ; Segment_Separator
126bc ; WS ; White_Space
127
128# Bidi_Control (Bidi_C)
129
130Bidi_C; N ; No ; F ; False
131Bidi_C; Y ; Yes ; T ; True
132
133# Bidi_Mirrored (Bidi_M)
134
135Bidi_M; N ; No ; F ; False
136Bidi_M; Y ; Yes ; T ; True
137
138# Bidi_Mirroring_Glyph (bmg)
139
140
141# Bidi_Paired_Bracket (bpb)
142
143# @missing: 0000..10FFFF; Bidi_Paired_Bracket; <none>
144
145# Bidi_Paired_Bracket_Type (bpt)
146
147bpt; c ; Close
148bpt; n ; None
149bpt; o ; Open
150# @missing: 0000..10FFFF; Bidi_Paired_Bracket_Type; n
151
152# Block (blk)
153
154blk; Adlam ; Adlam
155blk; Aegean_Numbers ; Aegean_Numbers
156blk; Ahom ; Ahom
157blk; Alchemical ; Alchemical_Symbols
158blk; Alphabetic_PF ; Alphabetic_Presentation_Forms
159blk; Anatolian_Hieroglyphs ; Anatolian_Hieroglyphs
160blk; Ancient_Greek_Music ; Ancient_Greek_Musical_Notation
161blk; Ancient_Greek_Numbers ; Ancient_Greek_Numbers
162blk; Ancient_Symbols ; Ancient_Symbols
163blk; Arabic ; Arabic
164blk; Arabic_Ext_A ; Arabic_Extended_A
165blk; Arabic_Ext_B ; Arabic_Extended_B
166blk; Arabic_Ext_C ; Arabic_Extended_C
167blk; Arabic_Math ; Arabic_Mathematical_Alphabetic_Symbols
168blk; Arabic_PF_A ; Arabic_Presentation_Forms_A ; Arabic_Presentation_Forms-A
169blk; Arabic_PF_B ; Arabic_Presentation_Forms_B
170blk; Arabic_Sup ; Arabic_Supplement
171blk; Armenian ; Armenian
172blk; Arrows ; Arrows
173blk; ASCII ; Basic_Latin
174blk; Avestan ; Avestan
175blk; Balinese ; Balinese
176blk; Bamum ; Bamum
177blk; Bamum_Sup ; Bamum_Supplement
178blk; Bassa_Vah ; Bassa_Vah
179blk; Batak ; Batak
180blk; Bengali ; Bengali
181blk; Bhaiksuki ; Bhaiksuki
182blk; Block_Elements ; Block_Elements
183blk; Bopomofo ; Bopomofo
184blk; Bopomofo_Ext ; Bopomofo_Extended
185blk; Box_Drawing ; Box_Drawing
186blk; Brahmi ; Brahmi
187blk; Braille ; Braille_Patterns
188blk; Buginese ; Buginese
189blk; Buhid ; Buhid
190blk; Byzantine_Music ; Byzantine_Musical_Symbols
191blk; Carian ; Carian
192blk; Caucasian_Albanian ; Caucasian_Albanian
193blk; Chakma ; Chakma
194blk; Cham ; Cham
195blk; Cherokee ; Cherokee
196blk; Cherokee_Sup ; Cherokee_Supplement
197blk; Chess_Symbols ; Chess_Symbols
198blk; Chorasmian ; Chorasmian
199blk; CJK ; CJK_Unified_Ideographs
200blk; CJK_Compat ; CJK_Compatibility
201blk; CJK_Compat_Forms ; CJK_Compatibility_Forms
202blk; CJK_Compat_Ideographs ; CJK_Compatibility_Ideographs
203blk; CJK_Compat_Ideographs_Sup ; CJK_Compatibility_Ideographs_Supplement
204blk; CJK_Ext_A ; CJK_Unified_Ideographs_Extension_A
205blk; CJK_Ext_B ; CJK_Unified_Ideographs_Extension_B
206blk; CJK_Ext_C ; CJK_Unified_Ideographs_Extension_C
207blk; CJK_Ext_D ; CJK_Unified_Ideographs_Extension_D
208blk; CJK_Ext_E ; CJK_Unified_Ideographs_Extension_E
209blk; CJK_Ext_F ; CJK_Unified_Ideographs_Extension_F
210blk; CJK_Ext_G ; CJK_Unified_Ideographs_Extension_G
211blk; CJK_Ext_H ; CJK_Unified_Ideographs_Extension_H
212blk; CJK_Ext_I ; CJK_Unified_Ideographs_Extension_I
213blk; CJK_Radicals_Sup ; CJK_Radicals_Supplement
214blk; CJK_Strokes ; CJK_Strokes
215blk; CJK_Symbols ; CJK_Symbols_And_Punctuation
216blk; Compat_Jamo ; Hangul_Compatibility_Jamo
217blk; Control_Pictures ; Control_Pictures
218blk; Coptic ; Coptic
219blk; Coptic_Epact_Numbers ; Coptic_Epact_Numbers
220blk; Counting_Rod ; Counting_Rod_Numerals
221blk; Cuneiform ; Cuneiform
222blk; Cuneiform_Numbers ; Cuneiform_Numbers_And_Punctuation
223blk; Currency_Symbols ; Currency_Symbols
224blk; Cypriot_Syllabary ; Cypriot_Syllabary
225blk; Cypro_Minoan ; Cypro_Minoan
226blk; Cyrillic ; Cyrillic
227blk; Cyrillic_Ext_A ; Cyrillic_Extended_A
228blk; Cyrillic_Ext_B ; Cyrillic_Extended_B
229blk; Cyrillic_Ext_C ; Cyrillic_Extended_C
230blk; Cyrillic_Ext_D ; Cyrillic_Extended_D
231blk; Cyrillic_Sup ; Cyrillic_Supplement ; Cyrillic_Supplementary
232blk; Deseret ; Deseret
233blk; Devanagari ; Devanagari
234blk; Devanagari_Ext ; Devanagari_Extended
235blk; Devanagari_Ext_A ; Devanagari_Extended_A
236blk; Diacriticals ; Combining_Diacritical_Marks
237blk; Diacriticals_Ext ; Combining_Diacritical_Marks_Extended
238blk; Diacriticals_For_Symbols ; Combining_Diacritical_Marks_For_Symbols; Combining_Marks_For_Symbols
239blk; Diacriticals_Sup ; Combining_Diacritical_Marks_Supplement
240blk; Dingbats ; Dingbats
241blk; Dives_Akuru ; Dives_Akuru
242blk; Dogra ; Dogra
243blk; Domino ; Domino_Tiles
244blk; Duployan ; Duployan
245blk; Early_Dynastic_Cuneiform ; Early_Dynastic_Cuneiform
246blk; Egyptian_Hieroglyph_Format_Controls; Egyptian_Hieroglyph_Format_Controls
247blk; Egyptian_Hieroglyphs ; Egyptian_Hieroglyphs
248blk; Elbasan ; Elbasan
249blk; Elymaic ; Elymaic
250blk; Emoticons ; Emoticons
251blk; Enclosed_Alphanum ; Enclosed_Alphanumerics
252blk; Enclosed_Alphanum_Sup ; Enclosed_Alphanumeric_Supplement
253blk; Enclosed_CJK ; Enclosed_CJK_Letters_And_Months
254blk; Enclosed_Ideographic_Sup ; Enclosed_Ideographic_Supplement
255blk; Ethiopic ; Ethiopic
256blk; Ethiopic_Ext ; Ethiopic_Extended
257blk; Ethiopic_Ext_A ; Ethiopic_Extended_A
258blk; Ethiopic_Ext_B ; Ethiopic_Extended_B
259blk; Ethiopic_Sup ; Ethiopic_Supplement
260blk; Geometric_Shapes ; Geometric_Shapes
261blk; Geometric_Shapes_Ext ; Geometric_Shapes_Extended
262blk; Georgian ; Georgian
263blk; Georgian_Ext ; Georgian_Extended
264blk; Georgian_Sup ; Georgian_Supplement
265blk; Glagolitic ; Glagolitic
266blk; Glagolitic_Sup ; Glagolitic_Supplement
267blk; Gothic ; Gothic
268blk; Grantha ; Grantha
269blk; Greek ; Greek_And_Coptic
270blk; Greek_Ext ; Greek_Extended
271blk; Gujarati ; Gujarati
272blk; Gunjala_Gondi ; Gunjala_Gondi
273blk; Gurmukhi ; Gurmukhi
274blk; Half_And_Full_Forms ; Halfwidth_And_Fullwidth_Forms
275blk; Half_Marks ; Combining_Half_Marks
276blk; Hangul ; Hangul_Syllables
277blk; Hanifi_Rohingya ; Hanifi_Rohingya
278blk; Hanunoo ; Hanunoo
279blk; Hatran ; Hatran
280blk; Hebrew ; Hebrew
281blk; High_PU_Surrogates ; High_Private_Use_Surrogates
282blk; High_Surrogates ; High_Surrogates
283blk; Hiragana ; Hiragana
284blk; IDC ; Ideographic_Description_Characters
285blk; Ideographic_Symbols ; Ideographic_Symbols_And_Punctuation
286blk; Imperial_Aramaic ; Imperial_Aramaic
287blk; Indic_Number_Forms ; Common_Indic_Number_Forms
288blk; Indic_Siyaq_Numbers ; Indic_Siyaq_Numbers
289blk; Inscriptional_Pahlavi ; Inscriptional_Pahlavi
290blk; Inscriptional_Parthian ; Inscriptional_Parthian
291blk; IPA_Ext ; IPA_Extensions
292blk; Jamo ; Hangul_Jamo
293blk; Jamo_Ext_A ; Hangul_Jamo_Extended_A
294blk; Jamo_Ext_B ; Hangul_Jamo_Extended_B
295blk; Javanese ; Javanese
296blk; Kaithi ; Kaithi
297blk; Kaktovik_Numerals ; Kaktovik_Numerals
298blk; Kana_Ext_A ; Kana_Extended_A
299blk; Kana_Ext_B ; Kana_Extended_B
300blk; Kana_Sup ; Kana_Supplement
301blk; Kanbun ; Kanbun
302blk; Kangxi ; Kangxi_Radicals
303blk; Kannada ; Kannada
304blk; Katakana ; Katakana
305blk; Katakana_Ext ; Katakana_Phonetic_Extensions
306blk; Kawi ; Kawi
307blk; Kayah_Li ; Kayah_Li
308blk; Kharoshthi ; Kharoshthi
309blk; Khitan_Small_Script ; Khitan_Small_Script
310blk; Khmer ; Khmer
311blk; Khmer_Symbols ; Khmer_Symbols
312blk; Khojki ; Khojki
313blk; Khudawadi ; Khudawadi
314blk; Lao ; Lao
315blk; Latin_1_Sup ; Latin_1_Supplement ; Latin_1
316blk; Latin_Ext_A ; Latin_Extended_A
317blk; Latin_Ext_Additional ; Latin_Extended_Additional
318blk; Latin_Ext_B ; Latin_Extended_B
319blk; Latin_Ext_C ; Latin_Extended_C
320blk; Latin_Ext_D ; Latin_Extended_D
321blk; Latin_Ext_E ; Latin_Extended_E
322blk; Latin_Ext_F ; Latin_Extended_F
323blk; Latin_Ext_G ; Latin_Extended_G
324blk; Lepcha ; Lepcha
325blk; Letterlike_Symbols ; Letterlike_Symbols
326blk; Limbu ; Limbu
327blk; Linear_A ; Linear_A
328blk; Linear_B_Ideograms ; Linear_B_Ideograms
329blk; Linear_B_Syllabary ; Linear_B_Syllabary
330blk; Lisu ; Lisu
331blk; Lisu_Sup ; Lisu_Supplement
332blk; Low_Surrogates ; Low_Surrogates
333blk; Lycian ; Lycian
334blk; Lydian ; Lydian
335blk; Mahajani ; Mahajani
336blk; Mahjong ; Mahjong_Tiles
337blk; Makasar ; Makasar
338blk; Malayalam ; Malayalam
339blk; Mandaic ; Mandaic
340blk; Manichaean ; Manichaean
341blk; Marchen ; Marchen
342blk; Masaram_Gondi ; Masaram_Gondi
343blk; Math_Alphanum ; Mathematical_Alphanumeric_Symbols
344blk; Math_Operators ; Mathematical_Operators
345blk; Mayan_Numerals ; Mayan_Numerals
346blk; Medefaidrin ; Medefaidrin
347blk; Meetei_Mayek ; Meetei_Mayek
348blk; Meetei_Mayek_Ext ; Meetei_Mayek_Extensions
349blk; Mende_Kikakui ; Mende_Kikakui
350blk; Meroitic_Cursive ; Meroitic_Cursive
351blk; Meroitic_Hieroglyphs ; Meroitic_Hieroglyphs
352blk; Miao ; Miao
353blk; Misc_Arrows ; Miscellaneous_Symbols_And_Arrows
354blk; Misc_Math_Symbols_A ; Miscellaneous_Mathematical_Symbols_A
355blk; Misc_Math_Symbols_B ; Miscellaneous_Mathematical_Symbols_B
356blk; Misc_Pictographs ; Miscellaneous_Symbols_And_Pictographs
357blk; Misc_Symbols ; Miscellaneous_Symbols
358blk; Misc_Technical ; Miscellaneous_Technical
359blk; Modi ; Modi
360blk; Modifier_Letters ; Spacing_Modifier_Letters
361blk; Modifier_Tone_Letters ; Modifier_Tone_Letters
362blk; Mongolian ; Mongolian
363blk; Mongolian_Sup ; Mongolian_Supplement
364blk; Mro ; Mro
365blk; Multani ; Multani
366blk; Music ; Musical_Symbols
367blk; Myanmar ; Myanmar
368blk; Myanmar_Ext_A ; Myanmar_Extended_A
369blk; Myanmar_Ext_B ; Myanmar_Extended_B
370blk; Nabataean ; Nabataean
371blk; Nag_Mundari ; Nag_Mundari
372blk; Nandinagari ; Nandinagari
373blk; NB ; No_Block
374blk; New_Tai_Lue ; New_Tai_Lue
375blk; Newa ; Newa
376blk; NKo ; NKo
377blk; Number_Forms ; Number_Forms
378blk; Nushu ; Nushu
379blk; Nyiakeng_Puachue_Hmong ; Nyiakeng_Puachue_Hmong
380blk; OCR ; Optical_Character_Recognition
381blk; Ogham ; Ogham
382blk; Ol_Chiki ; Ol_Chiki
383blk; Old_Hungarian ; Old_Hungarian
384blk; Old_Italic ; Old_Italic
385blk; Old_North_Arabian ; Old_North_Arabian
386blk; Old_Permic ; Old_Permic
387blk; Old_Persian ; Old_Persian
388blk; Old_Sogdian ; Old_Sogdian
389blk; Old_South_Arabian ; Old_South_Arabian
390blk; Old_Turkic ; Old_Turkic
391blk; Old_Uyghur ; Old_Uyghur
392blk; Oriya ; Oriya
393blk; Ornamental_Dingbats ; Ornamental_Dingbats
394blk; Osage ; Osage
395blk; Osmanya ; Osmanya
396blk; Ottoman_Siyaq_Numbers ; Ottoman_Siyaq_Numbers
397blk; Pahawh_Hmong ; Pahawh_Hmong
398blk; Palmyrene ; Palmyrene
399blk; Pau_Cin_Hau ; Pau_Cin_Hau
400blk; Phags_Pa ; Phags_Pa
401blk; Phaistos ; Phaistos_Disc
402blk; Phoenician ; Phoenician
403blk; Phonetic_Ext ; Phonetic_Extensions
404blk; Phonetic_Ext_Sup ; Phonetic_Extensions_Supplement
405blk; Playing_Cards ; Playing_Cards
406blk; Psalter_Pahlavi ; Psalter_Pahlavi
407blk; PUA ; Private_Use_Area ; Private_Use
408blk; Punctuation ; General_Punctuation
409blk; Rejang ; Rejang
410blk; Rumi ; Rumi_Numeral_Symbols
411blk; Runic ; Runic
412blk; Samaritan ; Samaritan
413blk; Saurashtra ; Saurashtra
414blk; Sharada ; Sharada
415blk; Shavian ; Shavian
416blk; Shorthand_Format_Controls ; Shorthand_Format_Controls
417blk; Siddham ; Siddham
418blk; Sinhala ; Sinhala
419blk; Sinhala_Archaic_Numbers ; Sinhala_Archaic_Numbers
420blk; Small_Forms ; Small_Form_Variants
421blk; Small_Kana_Ext ; Small_Kana_Extension
422blk; Sogdian ; Sogdian
423blk; Sora_Sompeng ; Sora_Sompeng
424blk; Soyombo ; Soyombo
425blk; Specials ; Specials
426blk; Sundanese ; Sundanese
427blk; Sundanese_Sup ; Sundanese_Supplement
428blk; Sup_Arrows_A ; Supplemental_Arrows_A
429blk; Sup_Arrows_B ; Supplemental_Arrows_B
430blk; Sup_Arrows_C ; Supplemental_Arrows_C
431blk; Sup_Math_Operators ; Supplemental_Mathematical_Operators
432blk; Sup_PUA_A ; Supplementary_Private_Use_Area_A
433blk; Sup_PUA_B ; Supplementary_Private_Use_Area_B
434blk; Sup_Punctuation ; Supplemental_Punctuation
435blk; Sup_Symbols_And_Pictographs ; Supplemental_Symbols_And_Pictographs
436blk; Super_And_Sub ; Superscripts_And_Subscripts
437blk; Sutton_SignWriting ; Sutton_SignWriting
438blk; Syloti_Nagri ; Syloti_Nagri
439blk; Symbols_And_Pictographs_Ext_A ; Symbols_And_Pictographs_Extended_A
440blk; Symbols_For_Legacy_Computing ; Symbols_For_Legacy_Computing
441blk; Syriac ; Syriac
442blk; Syriac_Sup ; Syriac_Supplement
443blk; Tagalog ; Tagalog
444blk; Tagbanwa ; Tagbanwa
445blk; Tags ; Tags
446blk; Tai_Le ; Tai_Le
447blk; Tai_Tham ; Tai_Tham
448blk; Tai_Viet ; Tai_Viet
449blk; Tai_Xuan_Jing ; Tai_Xuan_Jing_Symbols
450blk; Takri ; Takri
451blk; Tamil ; Tamil
452blk; Tamil_Sup ; Tamil_Supplement
453blk; Tangsa ; Tangsa
454blk; Tangut ; Tangut
455blk; Tangut_Components ; Tangut_Components
456blk; Tangut_Sup ; Tangut_Supplement
457blk; Telugu ; Telugu
458blk; Thaana ; Thaana
459blk; Thai ; Thai
460blk; Tibetan ; Tibetan
461blk; Tifinagh ; Tifinagh
462blk; Tirhuta ; Tirhuta
463blk; Toto ; Toto
464blk; Transport_And_Map ; Transport_And_Map_Symbols
465blk; UCAS ; Unified_Canadian_Aboriginal_Syllabics; Canadian_Syllabics
466blk; UCAS_Ext ; Unified_Canadian_Aboriginal_Syllabics_Extended
467blk; UCAS_Ext_A ; Unified_Canadian_Aboriginal_Syllabics_Extended_A
468blk; Ugaritic ; Ugaritic
469blk; Vai ; Vai
470blk; Vedic_Ext ; Vedic_Extensions
471blk; Vertical_Forms ; Vertical_Forms
472blk; Vithkuqi ; Vithkuqi
473blk; VS ; Variation_Selectors
474blk; VS_Sup ; Variation_Selectors_Supplement
475blk; Wancho ; Wancho
476blk; Warang_Citi ; Warang_Citi
477blk; Yezidi ; Yezidi
478blk; Yi_Radicals ; Yi_Radicals
479blk; Yi_Syllables ; Yi_Syllables
480blk; Yijing ; Yijing_Hexagram_Symbols
481blk; Zanabazar_Square ; Zanabazar_Square
482blk; Znamenny_Music ; Znamenny_Musical_Notation
483
484# Canonical_Combining_Class (ccc)
485
486ccc; 0; NR ; Not_Reordered
487ccc; 1; OV ; Overlay
488ccc; 6; HANR ; Han_Reading
489ccc; 7; NK ; Nukta
490ccc; 8; KV ; Kana_Voicing
491ccc; 9; VR ; Virama
492ccc; 10; CCC10 ; CCC10
493ccc; 11; CCC11 ; CCC11
494ccc; 12; CCC12 ; CCC12
495ccc; 13; CCC13 ; CCC13
496ccc; 14; CCC14 ; CCC14
497ccc; 15; CCC15 ; CCC15
498ccc; 16; CCC16 ; CCC16
499ccc; 17; CCC17 ; CCC17
500ccc; 18; CCC18 ; CCC18
501ccc; 19; CCC19 ; CCC19
502ccc; 20; CCC20 ; CCC20
503ccc; 21; CCC21 ; CCC21
504ccc; 22; CCC22 ; CCC22
505ccc; 23; CCC23 ; CCC23
506ccc; 24; CCC24 ; CCC24
507ccc; 25; CCC25 ; CCC25
508ccc; 26; CCC26 ; CCC26
509ccc; 27; CCC27 ; CCC27
510ccc; 28; CCC28 ; CCC28
511ccc; 29; CCC29 ; CCC29
512ccc; 30; CCC30 ; CCC30
513ccc; 31; CCC31 ; CCC31
514ccc; 32; CCC32 ; CCC32
515ccc; 33; CCC33 ; CCC33
516ccc; 34; CCC34 ; CCC34
517ccc; 35; CCC35 ; CCC35
518ccc; 36; CCC36 ; CCC36
519ccc; 84; CCC84 ; CCC84
520ccc; 91; CCC91 ; CCC91
521ccc; 103; CCC103 ; CCC103
522ccc; 107; CCC107 ; CCC107
523ccc; 118; CCC118 ; CCC118
524ccc; 122; CCC122 ; CCC122
525ccc; 129; CCC129 ; CCC129
526ccc; 130; CCC130 ; CCC130
527ccc; 132; CCC132 ; CCC132
528ccc; 133; CCC133 ; CCC133 # RESERVED
529ccc; 200; ATBL ; Attached_Below_Left
530ccc; 202; ATB ; Attached_Below
531ccc; 214; ATA ; Attached_Above
532ccc; 216; ATAR ; Attached_Above_Right
533ccc; 218; BL ; Below_Left
534ccc; 220; B ; Below
535ccc; 222; BR ; Below_Right
536ccc; 224; L ; Left
537ccc; 226; R ; Right
538ccc; 228; AL ; Above_Left
539ccc; 230; A ; Above
540ccc; 232; AR ; Above_Right
541ccc; 233; DB ; Double_Below
542ccc; 234; DA ; Double_Above
543ccc; 240; IS ; Iota_Subscript
544
545# Case_Folding (cf)
546
547# @missing: 0000..10FFFF; Case_Folding; <code point>
548
549# Case_Ignorable (CI)
550
551CI ; N ; No ; F ; False
552CI ; Y ; Yes ; T ; True
553
554# Cased (Cased)
555
556Cased; N ; No ; F ; False
557Cased; Y ; Yes ; T ; True
558
559# Changes_When_Casefolded (CWCF)
560
561CWCF; N ; No ; F ; False
562CWCF; Y ; Yes ; T ; True
563
564# Changes_When_Casemapped (CWCM)
565
566CWCM; N ; No ; F ; False
567CWCM; Y ; Yes ; T ; True
568
569# Changes_When_Lowercased (CWL)
570
571CWL; N ; No ; F ; False
572CWL; Y ; Yes ; T ; True
573
574# Changes_When_NFKC_Casefolded (CWKCF)
575
576CWKCF; N ; No ; F ; False
577CWKCF; Y ; Yes ; T ; True
578
579# Changes_When_Titlecased (CWT)
580
581CWT; N ; No ; F ; False
582CWT; Y ; Yes ; T ; True
583
584# Changes_When_Uppercased (CWU)
585
586CWU; N ; No ; F ; False
587CWU; Y ; Yes ; T ; True
588
589# Composition_Exclusion (CE)
590
591CE ; N ; No ; F ; False
592CE ; Y ; Yes ; T ; True
593
594# Dash (Dash)
595
596Dash; N ; No ; F ; False
597Dash; Y ; Yes ; T ; True
598
599# Decomposition_Mapping (dm)
600
601# @missing: 0000..10FFFF; Decomposition_Mapping; <code point>
602
603# Decomposition_Type (dt)
604
605dt ; Can ; Canonical ; can
606dt ; Com ; Compat ; com
607dt ; Enc ; Circle ; enc
608dt ; Fin ; Final ; fin
609dt ; Font ; Font ; font
610dt ; Fra ; Fraction ; fra
611dt ; Init ; Initial ; init
612dt ; Iso ; Isolated ; iso
613dt ; Med ; Medial ; med
614dt ; Nar ; Narrow ; nar
615dt ; Nb ; Nobreak ; nb
616dt ; None ; None ; none
617dt ; Sml ; Small ; sml
618dt ; Sqr ; Square ; sqr
619dt ; Sub ; Sub ; sub
620dt ; Sup ; Super ; sup
621dt ; Vert ; Vertical ; vert
622dt ; Wide ; Wide ; wide
623
624# Default_Ignorable_Code_Point (DI)
625
626DI ; N ; No ; F ; False
627DI ; Y ; Yes ; T ; True
628
629# Deprecated (Dep)
630
631Dep; N ; No ; F ; False
632Dep; Y ; Yes ; T ; True
633
634# Diacritic (Dia)
635
636Dia; N ; No ; F ; False
637Dia; Y ; Yes ; T ; True
638
639# East_Asian_Width (ea)
640
641ea ; A ; Ambiguous
642ea ; F ; Fullwidth
643ea ; H ; Halfwidth
644ea ; N ; Neutral
645ea ; Na ; Narrow
646ea ; W ; Wide
647
648# Emoji (Emoji)
649
650Emoji; N ; No ; F ; False
651Emoji; Y ; Yes ; T ; True
652
653# Emoji_Component (EComp)
654
655EComp; N ; No ; F ; False
656EComp; Y ; Yes ; T ; True
657
658# Emoji_Modifier (EMod)
659
660EMod; N ; No ; F ; False
661EMod; Y ; Yes ; T ; True
662
663# Emoji_Modifier_Base (EBase)
664
665EBase; N ; No ; F ; False
666EBase; Y ; Yes ; T ; True
667
668# Emoji_Presentation (EPres)
669
670EPres; N ; No ; F ; False
671EPres; Y ; Yes ; T ; True
672
673# Equivalent_Unified_Ideograph (EqUIdeo)
674
675
676# Expands_On_NFC (XO_NFC)
677
678XO_NFC; N ; No ; F ; False
679XO_NFC; Y ; Yes ; T ; True
680
681# Expands_On_NFD (XO_NFD)
682
683XO_NFD; N ; No ; F ; False
684XO_NFD; Y ; Yes ; T ; True
685
686# Expands_On_NFKC (XO_NFKC)
687
688XO_NFKC; N ; No ; F ; False
689XO_NFKC; Y ; Yes ; T ; True
690
691# Expands_On_NFKD (XO_NFKD)
692
693XO_NFKD; N ; No ; F ; False
694XO_NFKD; Y ; Yes ; T ; True
695
696# Extended_Pictographic (ExtPict)
697
698ExtPict; N ; No ; F ; False
699ExtPict; Y ; Yes ; T ; True
700
701# Extender (Ext)
702
703Ext; N ; No ; F ; False
704Ext; Y ; Yes ; T ; True
705
706# FC_NFKC_Closure (FC_NFKC)
707
708# @missing: 0000..10FFFF; FC_NFKC_Closure; <code point>
709
710# Full_Composition_Exclusion (Comp_Ex)
711
712Comp_Ex; N ; No ; F ; False
713Comp_Ex; Y ; Yes ; T ; True
714
715# General_Category (gc)
716
717gc ; C ; Other # Cc | Cf | Cn | Co | Cs
718gc ; Cc ; Control ; cntrl
719gc ; Cf ; Format
720gc ; Cn ; Unassigned
721gc ; Co ; Private_Use
722gc ; Cs ; Surrogate
723gc ; L ; Letter # Ll | Lm | Lo | Lt | Lu
724gc ; LC ; Cased_Letter # Ll | Lt | Lu
725gc ; Ll ; Lowercase_Letter
726gc ; Lm ; Modifier_Letter
727gc ; Lo ; Other_Letter
728gc ; Lt ; Titlecase_Letter
729gc ; Lu ; Uppercase_Letter
730gc ; M ; Mark ; Combining_Mark # Mc | Me | Mn
731gc ; Mc ; Spacing_Mark
732gc ; Me ; Enclosing_Mark
733gc ; Mn ; Nonspacing_Mark
734gc ; N ; Number # Nd | Nl | No
735gc ; Nd ; Decimal_Number ; digit
736gc ; Nl ; Letter_Number
737gc ; No ; Other_Number
738gc ; P ; Punctuation ; punct # Pc | Pd | Pe | Pf | Pi | Po | Ps
739gc ; Pc ; Connector_Punctuation
740gc ; Pd ; Dash_Punctuation
741gc ; Pe ; Close_Punctuation
742gc ; Pf ; Final_Punctuation
743gc ; Pi ; Initial_Punctuation
744gc ; Po ; Other_Punctuation
745gc ; Ps ; Open_Punctuation
746gc ; S ; Symbol # Sc | Sk | Sm | So
747gc ; Sc ; Currency_Symbol
748gc ; Sk ; Modifier_Symbol
749gc ; Sm ; Math_Symbol
750gc ; So ; Other_Symbol
751gc ; Z ; Separator # Zl | Zp | Zs
752gc ; Zl ; Line_Separator
753gc ; Zp ; Paragraph_Separator
754gc ; Zs ; Space_Separator
755# @missing: 0000..10FFFF; General_Category; Unassigned
756
757# Grapheme_Base (Gr_Base)
758
759Gr_Base; N ; No ; F ; False
760Gr_Base; Y ; Yes ; T ; True
761
762# Grapheme_Cluster_Break (GCB)
763
764GCB; CN ; Control
765GCB; CR ; CR
766GCB; EB ; E_Base
767GCB; EBG ; E_Base_GAZ
768GCB; EM ; E_Modifier
769GCB; EX ; Extend
770GCB; GAZ ; Glue_After_Zwj
771GCB; L ; L
772GCB; LF ; LF
773GCB; LV ; LV
774GCB; LVT ; LVT
775GCB; PP ; Prepend
776GCB; RI ; Regional_Indicator
777GCB; SM ; SpacingMark
778GCB; T ; T
779GCB; V ; V
780GCB; XX ; Other
781GCB; ZWJ ; ZWJ
782
783# Grapheme_Extend (Gr_Ext)
784
785Gr_Ext; N ; No ; F ; False
786Gr_Ext; Y ; Yes ; T ; True
787
788# Grapheme_Link (Gr_Link)
789
790Gr_Link; N ; No ; F ; False
791Gr_Link; Y ; Yes ; T ; True
792
793# Hangul_Syllable_Type (hst)
794
795hst; L ; Leading_Jamo
796hst; LV ; LV_Syllable
797hst; LVT ; LVT_Syllable
798hst; NA ; Not_Applicable
799hst; T ; Trailing_Jamo
800hst; V ; Vowel_Jamo
801
802# Hex_Digit (Hex)
803
804Hex; N ; No ; F ; False
805Hex; Y ; Yes ; T ; True
806
807# Hyphen (Hyphen)
808
809Hyphen; N ; No ; F ; False
810Hyphen; Y ; Yes ; T ; True
811
812# IDS_Binary_Operator (IDSB)
813
814IDSB; N ; No ; F ; False
815IDSB; Y ; Yes ; T ; True
816
817# IDS_Trinary_Operator (IDST)
818
819IDST; N ; No ; F ; False
820IDST; Y ; Yes ; T ; True
821
822# IDS_Unary_Operator (IDSU)
823
824IDSU; N ; No ; F ; False
825IDSU; Y ; Yes ; T ; True
826
827# ID_Compat_Math_Continue (ID_Compat_Math_Continue)
828
829ID_Compat_Math_Continue; N ; No ; F ; False
830ID_Compat_Math_Continue; Y ; Yes ; T ; True
831
832# ID_Compat_Math_Start (ID_Compat_Math_Start)
833
834ID_Compat_Math_Start; N ; No ; F ; False
835ID_Compat_Math_Start; Y ; Yes ; T ; True
836
837# ID_Continue (IDC)
838
839IDC; N ; No ; F ; False
840IDC; Y ; Yes ; T ; True
841
842# ID_Start (IDS)
843
844IDS; N ; No ; F ; False
845IDS; Y ; Yes ; T ; True
846
847# ISO_Comment (isc)
848
849# @missing: 0000..10FFFF; ISO_Comment; <none>
850
851# Ideographic (Ideo)
852
853Ideo; N ; No ; F ; False
854Ideo; Y ; Yes ; T ; True
855
856# Indic_Conjunct_Break (InCB)
857
858InCB; Consonant ; Consonant
859InCB; Extend ; Extend
860InCB; Linker ; Linker
861InCB; None ; None
862
863# Indic_Positional_Category (InPC)
864
865InPC; Bottom ; Bottom
866InPC; Bottom_And_Left ; Bottom_And_Left
867InPC; Bottom_And_Right ; Bottom_And_Right
868InPC; Left ; Left
869InPC; Left_And_Right ; Left_And_Right
870InPC; NA ; NA
871InPC; Overstruck ; Overstruck
872InPC; Right ; Right
873InPC; Top ; Top
874InPC; Top_And_Bottom ; Top_And_Bottom
875InPC; Top_And_Bottom_And_Left ; Top_And_Bottom_And_Left
876InPC; Top_And_Bottom_And_Right ; Top_And_Bottom_And_Right
877InPC; Top_And_Left ; Top_And_Left
878InPC; Top_And_Left_And_Right ; Top_And_Left_And_Right
879InPC; Top_And_Right ; Top_And_Right
880InPC; Visual_Order_Left ; Visual_Order_Left
881
882# Indic_Syllabic_Category (InSC)
883
884InSC; Avagraha ; Avagraha
885InSC; Bindu ; Bindu
886InSC; Brahmi_Joining_Number ; Brahmi_Joining_Number
887InSC; Cantillation_Mark ; Cantillation_Mark
888InSC; Consonant ; Consonant
889InSC; Consonant_Dead ; Consonant_Dead
890InSC; Consonant_Final ; Consonant_Final
891InSC; Consonant_Head_Letter ; Consonant_Head_Letter
892InSC; Consonant_Initial_Postfixed ; Consonant_Initial_Postfixed
893InSC; Consonant_Killer ; Consonant_Killer
894InSC; Consonant_Medial ; Consonant_Medial
895InSC; Consonant_Placeholder ; Consonant_Placeholder
896InSC; Consonant_Preceding_Repha ; Consonant_Preceding_Repha
897InSC; Consonant_Prefixed ; Consonant_Prefixed
898InSC; Consonant_Subjoined ; Consonant_Subjoined
899InSC; Consonant_Succeeding_Repha ; Consonant_Succeeding_Repha
900InSC; Consonant_With_Stacker ; Consonant_With_Stacker
901InSC; Gemination_Mark ; Gemination_Mark
902InSC; Invisible_Stacker ; Invisible_Stacker
903InSC; Joiner ; Joiner
904InSC; Modifying_Letter ; Modifying_Letter
905InSC; Non_Joiner ; Non_Joiner
906InSC; Nukta ; Nukta
907InSC; Number ; Number
908InSC; Number_Joiner ; Number_Joiner
909InSC; Other ; Other
910InSC; Pure_Killer ; Pure_Killer
911InSC; Register_Shifter ; Register_Shifter
912InSC; Syllable_Modifier ; Syllable_Modifier
913InSC; Tone_Letter ; Tone_Letter
914InSC; Tone_Mark ; Tone_Mark
915InSC; Virama ; Virama
916InSC; Visarga ; Visarga
917InSC; Vowel ; Vowel
918InSC; Vowel_Dependent ; Vowel_Dependent
919InSC; Vowel_Independent ; Vowel_Independent
920
921# Jamo_Short_Name (JSN)
922
923JSN; A ; A
924JSN; AE ; AE
925JSN; B ; B
926JSN; BB ; BB
927JSN; BS ; BS
928JSN; C ; C
929JSN; D ; D
930JSN; DD ; DD
931JSN; E ; E
932JSN; EO ; EO
933JSN; EU ; EU
934JSN; G ; G
935JSN; GG ; GG
936JSN; GS ; GS
937JSN; H ; H
938JSN; I ; I
939JSN; J ; J
940JSN; JJ ; JJ
941JSN; K ; K
942JSN; L ; L
943JSN; LB ; LB
944JSN; LG ; LG
945JSN; LH ; LH
946JSN; LM ; LM
947JSN; LP ; LP
948JSN; LS ; LS
949JSN; LT ; LT
950JSN; M ; M
951JSN; N ; N
952JSN; NG ; NG
953JSN; NH ; NH
954JSN; NJ ; NJ
955JSN; O ; O
956JSN; OE ; OE
957JSN; P ; P
958JSN; R ; R
959JSN; S ; S
960JSN; SS ; SS
961JSN; T ; T
962JSN; U ; U
963JSN; WA ; WA
964JSN; WAE ; WAE
965JSN; WE ; WE
966JSN; WEO ; WEO
967JSN; WI ; WI
968JSN; YA ; YA
969JSN; YAE ; YAE
970JSN; YE ; YE
971JSN; YEO ; YEO
972JSN; YI ; YI
973JSN; YO ; YO
974JSN; YU ; YU
975# @missing: 0000..10FFFF; Jamo_Short_Name; <none>
976
977# Join_Control (Join_C)
978
979Join_C; N ; No ; F ; False
980Join_C; Y ; Yes ; T ; True
981
982# Joining_Group (jg)
983
984jg ; African_Feh ; African_Feh
985jg ; African_Noon ; African_Noon
986jg ; African_Qaf ; African_Qaf
987jg ; Ain ; Ain
988jg ; Alaph ; Alaph
989jg ; Alef ; Alef
990jg ; Beh ; Beh
991jg ; Beth ; Beth
992jg ; Burushaski_Yeh_Barree ; Burushaski_Yeh_Barree
993jg ; Dal ; Dal
994jg ; Dalath_Rish ; Dalath_Rish
995jg ; E ; E
996jg ; Farsi_Yeh ; Farsi_Yeh
997jg ; Fe ; Fe
998jg ; Feh ; Feh
999jg ; Final_Semkath ; Final_Semkath
1000jg ; Gaf ; Gaf
1001jg ; Gamal ; Gamal
1002jg ; Hah ; Hah
1003jg ; Hanifi_Rohingya_Kinna_Ya ; Hanifi_Rohingya_Kinna_Ya
1004jg ; Hanifi_Rohingya_Pa ; Hanifi_Rohingya_Pa
1005jg ; He ; He
1006jg ; Heh ; Heh
1007jg ; Heh_Goal ; Heh_Goal
1008jg ; Heth ; Heth
1009jg ; Kaf ; Kaf
1010jg ; Kaph ; Kaph
1011jg ; Khaph ; Khaph
1012jg ; Knotted_Heh ; Knotted_Heh
1013jg ; Lam ; Lam
1014jg ; Lamadh ; Lamadh
1015jg ; Malayalam_Bha ; Malayalam_Bha
1016jg ; Malayalam_Ja ; Malayalam_Ja
1017jg ; Malayalam_Lla ; Malayalam_Lla
1018jg ; Malayalam_Llla ; Malayalam_Llla
1019jg ; Malayalam_Nga ; Malayalam_Nga
1020jg ; Malayalam_Nna ; Malayalam_Nna
1021jg ; Malayalam_Nnna ; Malayalam_Nnna
1022jg ; Malayalam_Nya ; Malayalam_Nya
1023jg ; Malayalam_Ra ; Malayalam_Ra
1024jg ; Malayalam_Ssa ; Malayalam_Ssa
1025jg ; Malayalam_Tta ; Malayalam_Tta
1026jg ; Manichaean_Aleph ; Manichaean_Aleph
1027jg ; Manichaean_Ayin ; Manichaean_Ayin
1028jg ; Manichaean_Beth ; Manichaean_Beth
1029jg ; Manichaean_Daleth ; Manichaean_Daleth
1030jg ; Manichaean_Dhamedh ; Manichaean_Dhamedh
1031jg ; Manichaean_Five ; Manichaean_Five
1032jg ; Manichaean_Gimel ; Manichaean_Gimel
1033jg ; Manichaean_Heth ; Manichaean_Heth
1034jg ; Manichaean_Hundred ; Manichaean_Hundred
1035jg ; Manichaean_Kaph ; Manichaean_Kaph
1036jg ; Manichaean_Lamedh ; Manichaean_Lamedh
1037jg ; Manichaean_Mem ; Manichaean_Mem
1038jg ; Manichaean_Nun ; Manichaean_Nun
1039jg ; Manichaean_One ; Manichaean_One
1040jg ; Manichaean_Pe ; Manichaean_Pe
1041jg ; Manichaean_Qoph ; Manichaean_Qoph
1042jg ; Manichaean_Resh ; Manichaean_Resh
1043jg ; Manichaean_Sadhe ; Manichaean_Sadhe
1044jg ; Manichaean_Samekh ; Manichaean_Samekh
1045jg ; Manichaean_Taw ; Manichaean_Taw
1046jg ; Manichaean_Ten ; Manichaean_Ten
1047jg ; Manichaean_Teth ; Manichaean_Teth
1048jg ; Manichaean_Thamedh ; Manichaean_Thamedh
1049jg ; Manichaean_Twenty ; Manichaean_Twenty
1050jg ; Manichaean_Waw ; Manichaean_Waw
1051jg ; Manichaean_Yodh ; Manichaean_Yodh
1052jg ; Manichaean_Zayin ; Manichaean_Zayin
1053jg ; Meem ; Meem
1054jg ; Mim ; Mim
1055jg ; No_Joining_Group ; No_Joining_Group
1056jg ; Noon ; Noon
1057jg ; Nun ; Nun
1058jg ; Nya ; Nya
1059jg ; Pe ; Pe
1060jg ; Qaf ; Qaf
1061jg ; Qaph ; Qaph
1062jg ; Reh ; Reh
1063jg ; Reversed_Pe ; Reversed_Pe
1064jg ; Rohingya_Yeh ; Rohingya_Yeh
1065jg ; Sad ; Sad
1066jg ; Sadhe ; Sadhe
1067jg ; Seen ; Seen
1068jg ; Semkath ; Semkath
1069jg ; Shin ; Shin
1070jg ; Straight_Waw ; Straight_Waw
1071jg ; Swash_Kaf ; Swash_Kaf
1072jg ; Syriac_Waw ; Syriac_Waw
1073jg ; Tah ; Tah
1074jg ; Taw ; Taw
1075jg ; Teh_Marbuta ; Teh_Marbuta
1076jg ; Teh_Marbuta_Goal ; Hamza_On_Heh_Goal
1077jg ; Teth ; Teth
1078jg ; Thin_Yeh ; Thin_Yeh
1079jg ; Vertical_Tail ; Vertical_Tail
1080jg ; Waw ; Waw
1081jg ; Yeh ; Yeh
1082jg ; Yeh_Barree ; Yeh_Barree
1083jg ; Yeh_With_Tail ; Yeh_With_Tail
1084jg ; Yudh ; Yudh
1085jg ; Yudh_He ; Yudh_He
1086jg ; Zain ; Zain
1087jg ; Zhain ; Zhain
1088
1089# Joining_Type (jt)
1090
1091jt ; C ; Join_Causing
1092jt ; D ; Dual_Joining
1093jt ; L ; Left_Joining
1094jt ; R ; Right_Joining
1095jt ; T ; Transparent
1096jt ; U ; Non_Joining
1097
1098# Line_Break (lb)
1099
1100lb ; AI ; Ambiguous
1101lb ; AK ; Aksara
1102lb ; AL ; Alphabetic
1103lb ; AP ; Aksara_Prebase
1104lb ; AS ; Aksara_Start
1105lb ; B2 ; Break_Both
1106lb ; BA ; Break_After
1107lb ; BB ; Break_Before
1108lb ; BK ; Mandatory_Break
1109lb ; CB ; Contingent_Break
1110lb ; CJ ; Conditional_Japanese_Starter
1111lb ; CL ; Close_Punctuation
1112lb ; CM ; Combining_Mark
1113lb ; CP ; Close_Parenthesis
1114lb ; CR ; Carriage_Return
1115lb ; EB ; E_Base
1116lb ; EM ; E_Modifier
1117lb ; EX ; Exclamation
1118lb ; GL ; Glue
1119lb ; H2 ; H2
1120lb ; H3 ; H3
1121lb ; HL ; Hebrew_Letter
1122lb ; HY ; Hyphen
1123lb ; ID ; Ideographic
1124lb ; IN ; Inseparable ; Inseperable
1125lb ; IS ; Infix_Numeric
1126lb ; JL ; JL
1127lb ; JT ; JT
1128lb ; JV ; JV
1129lb ; LF ; Line_Feed
1130lb ; NL ; Next_Line
1131lb ; NS ; Nonstarter
1132lb ; NU ; Numeric
1133lb ; OP ; Open_Punctuation
1134lb ; PO ; Postfix_Numeric
1135lb ; PR ; Prefix_Numeric
1136lb ; QU ; Quotation
1137lb ; RI ; Regional_Indicator
1138lb ; SA ; Complex_Context
1139lb ; SG ; Surrogate
1140lb ; SP ; Space
1141lb ; SY ; Break_Symbols
1142lb ; VF ; Virama_Final
1143lb ; VI ; Virama
1144lb ; WJ ; Word_Joiner
1145lb ; XX ; Unknown
1146lb ; ZW ; ZWSpace
1147lb ; ZWJ ; ZWJ
1148
1149# Logical_Order_Exception (LOE)
1150
1151LOE; N ; No ; F ; False
1152LOE; Y ; Yes ; T ; True
1153
1154# Lowercase (Lower)
1155
1156Lower; N ; No ; F ; False
1157Lower; Y ; Yes ; T ; True
1158
1159# Lowercase_Mapping (lc)
1160
1161# @missing: 0000..10FFFF; Lowercase_Mapping; <code point>
1162
1163# Math (Math)
1164
1165Math; N ; No ; F ; False
1166Math; Y ; Yes ; T ; True
1167
1168# NFC_Quick_Check (NFC_QC)
1169
1170NFC_QC; M ; Maybe
1171NFC_QC; N ; No
1172NFC_QC; Y ; Yes
1173
1174# NFD_Quick_Check (NFD_QC)
1175
1176NFD_QC; N ; No
1177NFD_QC; Y ; Yes
1178
1179# NFKC_Casefold (NFKC_CF)
1180
1181
1182# NFKC_Quick_Check (NFKC_QC)
1183
1184NFKC_QC; M ; Maybe
1185NFKC_QC; N ; No
1186NFKC_QC; Y ; Yes
1187
1188# NFKC_Simple_Casefold (NFKC_SCF)
1189
1190
1191# NFKD_Quick_Check (NFKD_QC)
1192
1193NFKD_QC; N ; No
1194NFKD_QC; Y ; Yes
1195
1196# Name (na)
1197
1198# @missing: 0000..10FFFF; Name; <none>
1199
1200# Name_Alias (Name_Alias)
1201
1202# @missing: 0000..10FFFF; Name_Alias; <none>
1203
1204# Noncharacter_Code_Point (NChar)
1205
1206NChar; N ; No ; F ; False
1207NChar; Y ; Yes ; T ; True
1208
1209# Numeric_Type (nt)
1210
1211nt ; De ; Decimal
1212nt ; Di ; Digit
1213nt ; None ; None
1214nt ; Nu ; Numeric
1215
1216# Numeric_Value (nv)
1217
1218# @missing: 0000..10FFFF; Numeric_Value; NaN
1219
1220# Other_Alphabetic (OAlpha)
1221
1222OAlpha; N ; No ; F ; False
1223OAlpha; Y ; Yes ; T ; True
1224
1225# Other_Default_Ignorable_Code_Point (ODI)
1226
1227ODI; N ; No ; F ; False
1228ODI; Y ; Yes ; T ; True
1229
1230# Other_Grapheme_Extend (OGr_Ext)
1231
1232OGr_Ext; N ; No ; F ; False
1233OGr_Ext; Y ; Yes ; T ; True
1234
1235# Other_ID_Continue (OIDC)
1236
1237OIDC; N ; No ; F ; False
1238OIDC; Y ; Yes ; T ; True
1239
1240# Other_ID_Start (OIDS)
1241
1242OIDS; N ; No ; F ; False
1243OIDS; Y ; Yes ; T ; True
1244
1245# Other_Lowercase (OLower)
1246
1247OLower; N ; No ; F ; False
1248OLower; Y ; Yes ; T ; True
1249
1250# Other_Math (OMath)
1251
1252OMath; N ; No ; F ; False
1253OMath; Y ; Yes ; T ; True
1254
1255# Other_Uppercase (OUpper)
1256
1257OUpper; N ; No ; F ; False
1258OUpper; Y ; Yes ; T ; True
1259
1260# Pattern_Syntax (Pat_Syn)
1261
1262Pat_Syn; N ; No ; F ; False
1263Pat_Syn; Y ; Yes ; T ; True
1264
1265# Pattern_White_Space (Pat_WS)
1266
1267Pat_WS; N ; No ; F ; False
1268Pat_WS; Y ; Yes ; T ; True
1269
1270# Prepended_Concatenation_Mark (PCM)
1271
1272PCM; N ; No ; F ; False
1273PCM; Y ; Yes ; T ; True
1274
1275# Quotation_Mark (QMark)
1276
1277QMark; N ; No ; F ; False
1278QMark; Y ; Yes ; T ; True
1279
1280# Radical (Radical)
1281
1282Radical; N ; No ; F ; False
1283Radical; Y ; Yes ; T ; True
1284
1285# Regional_Indicator (RI)
1286
1287RI ; N ; No ; F ; False
1288RI ; Y ; Yes ; T ; True
1289
1290# Script (sc)
1291
1292sc ; Adlm ; Adlam
1293sc ; Aghb ; Caucasian_Albanian
1294sc ; Ahom ; Ahom
1295sc ; Arab ; Arabic
1296sc ; Armi ; Imperial_Aramaic
1297sc ; Armn ; Armenian
1298sc ; Avst ; Avestan
1299sc ; Bali ; Balinese
1300sc ; Bamu ; Bamum
1301sc ; Bass ; Bassa_Vah
1302sc ; Batk ; Batak
1303sc ; Beng ; Bengali
1304sc ; Bhks ; Bhaiksuki
1305sc ; Bopo ; Bopomofo
1306sc ; Brah ; Brahmi
1307sc ; Brai ; Braille
1308sc ; Bugi ; Buginese
1309sc ; Buhd ; Buhid
1310sc ; Cakm ; Chakma
1311sc ; Cans ; Canadian_Aboriginal
1312sc ; Cari ; Carian
1313sc ; Cham ; Cham
1314sc ; Cher ; Cherokee
1315sc ; Chrs ; Chorasmian
1316sc ; Copt ; Coptic ; Qaac
1317sc ; Cpmn ; Cypro_Minoan
1318sc ; Cprt ; Cypriot
1319sc ; Cyrl ; Cyrillic
1320sc ; Deva ; Devanagari
1321sc ; Diak ; Dives_Akuru
1322sc ; Dogr ; Dogra
1323sc ; Dsrt ; Deseret
1324sc ; Dupl ; Duployan
1325sc ; Egyp ; Egyptian_Hieroglyphs
1326sc ; Elba ; Elbasan
1327sc ; Elym ; Elymaic
1328sc ; Ethi ; Ethiopic
1329sc ; Geor ; Georgian
1330sc ; Glag ; Glagolitic
1331sc ; Gong ; Gunjala_Gondi
1332sc ; Gonm ; Masaram_Gondi
1333sc ; Goth ; Gothic
1334sc ; Gran ; Grantha
1335sc ; Grek ; Greek
1336sc ; Gujr ; Gujarati
1337sc ; Guru ; Gurmukhi
1338sc ; Hang ; Hangul
1339sc ; Hani ; Han
1340sc ; Hano ; Hanunoo
1341sc ; Hatr ; Hatran
1342sc ; Hebr ; Hebrew
1343sc ; Hira ; Hiragana
1344sc ; Hluw ; Anatolian_Hieroglyphs
1345sc ; Hmng ; Pahawh_Hmong
1346sc ; Hmnp ; Nyiakeng_Puachue_Hmong
1347sc ; Hrkt ; Katakana_Or_Hiragana
1348sc ; Hung ; Old_Hungarian
1349sc ; Ital ; Old_Italic
1350sc ; Java ; Javanese
1351sc ; Kali ; Kayah_Li
1352sc ; Kana ; Katakana
1353sc ; Kawi ; Kawi
1354sc ; Khar ; Kharoshthi
1355sc ; Khmr ; Khmer
1356sc ; Khoj ; Khojki
1357sc ; Kits ; Khitan_Small_Script
1358sc ; Knda ; Kannada
1359sc ; Kthi ; Kaithi
1360sc ; Lana ; Tai_Tham
1361sc ; Laoo ; Lao
1362sc ; Latn ; Latin
1363sc ; Lepc ; Lepcha
1364sc ; Limb ; Limbu
1365sc ; Lina ; Linear_A
1366sc ; Linb ; Linear_B
1367sc ; Lisu ; Lisu
1368sc ; Lyci ; Lycian
1369sc ; Lydi ; Lydian
1370sc ; Mahj ; Mahajani
1371sc ; Maka ; Makasar
1372sc ; Mand ; Mandaic
1373sc ; Mani ; Manichaean
1374sc ; Marc ; Marchen
1375sc ; Medf ; Medefaidrin
1376sc ; Mend ; Mende_Kikakui
1377sc ; Merc ; Meroitic_Cursive
1378sc ; Mero ; Meroitic_Hieroglyphs
1379sc ; Mlym ; Malayalam
1380sc ; Modi ; Modi
1381sc ; Mong ; Mongolian
1382sc ; Mroo ; Mro
1383sc ; Mtei ; Meetei_Mayek
1384sc ; Mult ; Multani
1385sc ; Mymr ; Myanmar
1386sc ; Nagm ; Nag_Mundari
1387sc ; Nand ; Nandinagari
1388sc ; Narb ; Old_North_Arabian
1389sc ; Nbat ; Nabataean
1390sc ; Newa ; Newa
1391sc ; Nkoo ; Nko
1392sc ; Nshu ; Nushu
1393sc ; Ogam ; Ogham
1394sc ; Olck ; Ol_Chiki
1395sc ; Orkh ; Old_Turkic
1396sc ; Orya ; Oriya
1397sc ; Osge ; Osage
1398sc ; Osma ; Osmanya
1399sc ; Ougr ; Old_Uyghur
1400sc ; Palm ; Palmyrene
1401sc ; Pauc ; Pau_Cin_Hau
1402sc ; Perm ; Old_Permic
1403sc ; Phag ; Phags_Pa
1404sc ; Phli ; Inscriptional_Pahlavi
1405sc ; Phlp ; Psalter_Pahlavi
1406sc ; Phnx ; Phoenician
1407sc ; Plrd ; Miao
1408sc ; Prti ; Inscriptional_Parthian
1409sc ; Rjng ; Rejang
1410sc ; Rohg ; Hanifi_Rohingya
1411sc ; Runr ; Runic
1412sc ; Samr ; Samaritan
1413sc ; Sarb ; Old_South_Arabian
1414sc ; Saur ; Saurashtra
1415sc ; Sgnw ; SignWriting
1416sc ; Shaw ; Shavian
1417sc ; Shrd ; Sharada
1418sc ; Sidd ; Siddham
1419sc ; Sind ; Khudawadi
1420sc ; Sinh ; Sinhala
1421sc ; Sogd ; Sogdian
1422sc ; Sogo ; Old_Sogdian
1423sc ; Sora ; Sora_Sompeng
1424sc ; Soyo ; Soyombo
1425sc ; Sund ; Sundanese
1426sc ; Sylo ; Syloti_Nagri
1427sc ; Syrc ; Syriac
1428sc ; Tagb ; Tagbanwa
1429sc ; Takr ; Takri
1430sc ; Tale ; Tai_Le
1431sc ; Talu ; New_Tai_Lue
1432sc ; Taml ; Tamil
1433sc ; Tang ; Tangut
1434sc ; Tavt ; Tai_Viet
1435sc ; Telu ; Telugu
1436sc ; Tfng ; Tifinagh
1437sc ; Tglg ; Tagalog
1438sc ; Thaa ; Thaana
1439sc ; Thai ; Thai
1440sc ; Tibt ; Tibetan
1441sc ; Tirh ; Tirhuta
1442sc ; Tnsa ; Tangsa
1443sc ; Toto ; Toto
1444sc ; Ugar ; Ugaritic
1445sc ; Vaii ; Vai
1446sc ; Vith ; Vithkuqi
1447sc ; Wara ; Warang_Citi
1448sc ; Wcho ; Wancho
1449sc ; Xpeo ; Old_Persian
1450sc ; Xsux ; Cuneiform
1451sc ; Yezi ; Yezidi
1452sc ; Yiii ; Yi
1453sc ; Zanb ; Zanabazar_Square
1454sc ; Zinh ; Inherited ; Qaai
1455sc ; Zyyy ; Common
1456sc ; Zzzz ; Unknown
1457
1458# Script_Extensions (scx)
1459
1460
1461# Sentence_Break (SB)
1462
1463SB ; AT ; ATerm
1464SB ; CL ; Close
1465SB ; CR ; CR
1466SB ; EX ; Extend
1467SB ; FO ; Format
1468SB ; LE ; OLetter
1469SB ; LF ; LF
1470SB ; LO ; Lower
1471SB ; NU ; Numeric
1472SB ; SC ; SContinue
1473SB ; SE ; Sep
1474SB ; SP ; Sp
1475SB ; ST ; STerm
1476SB ; UP ; Upper
1477SB ; XX ; Other
1478
1479# Sentence_Terminal (STerm)
1480
1481STerm; N ; No ; F ; False
1482STerm; Y ; Yes ; T ; True
1483
1484# Simple_Case_Folding (scf)
1485
1486# @missing: 0000..10FFFF; Simple_Case_Folding; <code point>
1487
1488# Simple_Lowercase_Mapping (slc)
1489
1490# @missing: 0000..10FFFF; Simple_Lowercase_Mapping; <code point>
1491
1492# Simple_Titlecase_Mapping (stc)
1493
1494# @missing: 0000..10FFFF; Simple_Titlecase_Mapping; <code point>
1495
1496# Simple_Uppercase_Mapping (suc)
1497
1498# @missing: 0000..10FFFF; Simple_Uppercase_Mapping; <code point>
1499
1500# Soft_Dotted (SD)
1501
1502SD ; N ; No ; F ; False
1503SD ; Y ; Yes ; T ; True
1504
1505# Terminal_Punctuation (Term)
1506
1507Term; N ; No ; F ; False
1508Term; Y ; Yes ; T ; True
1509
1510# Titlecase_Mapping (tc)
1511
1512# @missing: 0000..10FFFF; Titlecase_Mapping; <code point>
1513
1514# Unicode_1_Name (na1)
1515
1516# @missing: 0000..10FFFF; Unicode_1_Name; <none>
1517
1518# Unified_Ideograph (UIdeo)
1519
1520UIdeo; N ; No ; F ; False
1521UIdeo; Y ; Yes ; T ; True
1522
1523# Uppercase (Upper)
1524
1525Upper; N ; No ; F ; False
1526Upper; Y ; Yes ; T ; True
1527
1528# Uppercase_Mapping (uc)
1529
1530# @missing: 0000..10FFFF; Uppercase_Mapping; <code point>
1531
1532# Variation_Selector (VS)
1533
1534VS ; N ; No ; F ; False
1535VS ; Y ; Yes ; T ; True
1536
1537# Vertical_Orientation (vo)
1538
1539vo ; R ; Rotated
1540vo ; Tr ; Transformed_Rotated
1541vo ; Tu ; Transformed_Upright
1542vo ; U ; Upright
1543
1544# White_Space (WSpace)
1545
1546WSpace; N ; No ; F ; False
1547WSpace; Y ; Yes ; T ; True
1548
1549# Word_Break (WB)
1550
1551WB ; CR ; CR
1552WB ; DQ ; Double_Quote
1553WB ; EB ; E_Base
1554WB ; EBG ; E_Base_GAZ
1555WB ; EM ; E_Modifier
1556WB ; EX ; ExtendNumLet
1557WB ; Extend ; Extend
1558WB ; FO ; Format
1559WB ; GAZ ; Glue_After_Zwj
1560WB ; HL ; Hebrew_Letter
1561WB ; KA ; Katakana
1562WB ; LE ; ALetter
1563WB ; LF ; LF
1564WB ; MB ; MidNumLet
1565WB ; ML ; MidLetter
1566WB ; MN ; MidNum
1567WB ; NL ; Newline
1568WB ; NU ; Numeric
1569WB ; RI ; Regional_Indicator
1570WB ; SQ ; Single_Quote
1571WB ; WSegSpace ; WSegSpace
1572WB ; XX ; Other
1573WB ; ZWJ ; ZWJ
1574
1575# XID_Continue (XIDC)
1576
1577XIDC; N ; No ; F ; False
1578XIDC; Y ; Yes ; T ; True
1579
1580# XID_Start (XIDS)
1581
1582XIDS; N ; No ; F ; False
1583XIDS; Y ; Yes ; T ; True
1584
1585# cjkAccountingNumeric (cjkAccountingNumeric)
1586
1587# @missing: 0000..10FFFF; cjkAccountingNumeric; NaN
1588
1589# cjkCompatibilityVariant (cjkCompatibilityVariant)
1590
1591# @missing: 0000..10FFFF; cjkCompatibilityVariant; <code point>
1592
1593# cjkIICore (cjkIICore)
1594
1595# @missing: 0000..10FFFF; cjkIICore; <none>
1596
1597# cjkIRG_GSource (cjkIRG_GSource)
1598
1599# @missing: 0000..10FFFF; cjkIRG_GSource; <none>
1600
1601# cjkIRG_HSource (cjkIRG_HSource)
1602
1603# @missing: 0000..10FFFF; cjkIRG_HSource; <none>
1604
1605# cjkIRG_JSource (cjkIRG_JSource)
1606
1607# @missing: 0000..10FFFF; cjkIRG_JSource; <none>
1608
1609# cjkIRG_KPSource (cjkIRG_KPSource)
1610
1611# @missing: 0000..10FFFF; cjkIRG_KPSource; <none>
1612
1613# cjkIRG_KSource (cjkIRG_KSource)
1614
1615# @missing: 0000..10FFFF; cjkIRG_KSource; <none>
1616
1617# cjkIRG_MSource (cjkIRG_MSource)
1618
1619# @missing: 0000..10FFFF; cjkIRG_MSource; <none>
1620
1621# cjkIRG_SSource (cjkIRG_SSource)
1622
1623# @missing: 0000..10FFFF; cjkIRG_SSource; <none>
1624
1625# cjkIRG_TSource (cjkIRG_TSource)
1626
1627# @missing: 0000..10FFFF; cjkIRG_TSource; <none>
1628
1629# cjkIRG_UKSource (cjkIRG_UKSource)
1630
1631# @missing: 0000..10FFFF; cjkIRG_UKSource; <none>
1632
1633# cjkIRG_USource (cjkIRG_USource)
1634
1635# @missing: 0000..10FFFF; cjkIRG_USource; <none>
1636
1637# cjkIRG_VSource (cjkIRG_VSource)
1638
1639# @missing: 0000..10FFFF; cjkIRG_VSource; <none>
1640
1641# cjkOtherNumeric (cjkOtherNumeric)
1642
1643# @missing: 0000..10FFFF; cjkOtherNumeric; NaN
1644
1645# cjkPrimaryNumeric (cjkPrimaryNumeric)
1646
1647# @missing: 0000..10FFFF; cjkPrimaryNumeric; NaN
1648
1649# cjkRSUnicode (cjkRSUnicode)
1650
1651# @missing: 0000..10FFFF; cjkRSUnicode; <none>
1652
1653# EOF