source/data/unidata/PropertyValueAliases.txt - external/github.com/unicode-org/icu - Git at Google

 # PropertyValueAliases-4.0.1.txt
 # Date: 2004-03-02, 19:46:47 GMT [MD]
 #
 # Unicode Character Database
 # Copyright (c) 1991-2004 Unicode, Inc.
 # For terms of use, see http://www.unicode.org/terms_of_use.html
 # For documentation, see UCD.html
 # This file contains aliases for property values used in the UCD.
 # These names can be used for XML formats of UCD data, for regular-expression
 # property tests, and other programmatic textual descriptions of Unicode data.
 # For information on which properties are normative, see UCD.html.
 #
 # The names may be translated in appropriate environments, and additional
 # aliases may be useful.
 #
 # FORMAT
 #
 # Each line describes a property value name.
 # This consists of three or more fields, separated by semicolons.
 #
 # First Field: The first field describes the property for which that
 # property value name is used.
 #
 # Second Field: The second field is an abbreviated name.
 # If there is no abbreviated name available, the field is marked with "n/a".
 #
 # Third Field: The third field is a long name.
 #
 # In the case of ccc, there are 4 fields. The second field is numeric, third
 # is abbreviated, and fourth is long.
 #
 # The above are the preferred aliases. Other aliases may be listed in additional fields.
 #
 # Loose matching should be applied to all property names and property values, with
 # the exception of String Property values. With loose matching of property names and
 # values, the case distinctions, whitespace, and '_' are ignored. For Numeric Property
 # values, numeric equivalencies are applied: thus "01.00" is equivalent to "1".
 #
 # NOTE: Property value names are NOT unique across properties. For example:
 #
 #   AL means Arabic Letter for the Bidi_Class property, and
 #   AL means Above_Left for the Canonical_Combining_Class property, and
 #   AL means Alphabetic for the Line_Break property.
 #
 # In addition, some property names may be the same as some property value names.
 # For example:
 #
 #   sc means the Script property, and
 #   Sc means the General_Category property value Currency_Symbol (Sc)
 #
 # The combination of property value and property name is, however, unique.
 #
 # For more information, see UTS #18: Regular Expression Guidelines
 # ================================================


 # Age (age)

 age; n/a       ; 1.1
 age; n/a       ; 2.0
 age; n/a       ; 2.1
 age; n/a       ; 3.0
 age; n/a       ; 3.1
 age; n/a       ; 3.2
 age; n/a       ; 4.0
 age; n/a       ; unassigned

 # Bidi_Class (bc)

 bc ; AL        ; Arabic_Letter
 bc ; AN        ; Arabic_Number
 bc ; B         ; Paragraph_Separator
 bc ; BN        ; Boundary_Neutral
 bc ; CS        ; Common_Separator
 bc ; EN        ; European_Number
 bc ; ES        ; European_Separator
 bc ; ET        ; European_Terminator
 bc ; L         ; Left_To_Right
 bc ; LRE       ; Left_To_Right_Embedding
 bc ; LRO       ; Left_To_Right_Override
 bc ; NSM       ; Nonspacing_Mark
 bc ; ON        ; Other_Neutral
 bc ; PDF       ; Pop_Directional_Format
 bc ; R         ; Right_To_Left
 bc ; RLE       ; Right_To_Left_Embedding
 bc ; RLO       ; Right_To_Left_Override
 bc ; S         ; Segment_Separator
 bc ; WS        ; White_Space

 # Block (blk)

 blk; n/a       ; Aegean_Numbers
 blk; n/a       ; Alphabetic_Presentation_Forms
 blk; n/a       ; Arabic
 blk; n/a       ; Arabic_Presentation_Forms-A
 blk; n/a       ; Arabic_Presentation_Forms-B
 blk; n/a       ; Armenian
 blk; n/a       ; Arrows
 blk; n/a       ; Basic_Latin
 blk; n/a       ; Bengali
 blk; n/a       ; Block_Elements
 blk; n/a       ; Bopomofo
 blk; n/a       ; Bopomofo_Extended
 blk; n/a       ; Box_Drawing
 blk; n/a       ; Braille_Patterns
 blk; n/a       ; Buhid
 blk; n/a       ; Byzantine_Musical_Symbols
 blk; n/a       ; Cherokee
 blk; n/a       ; CJK_Compatibility
 blk; n/a       ; CJK_Compatibility_Forms
 blk; n/a       ; CJK_Compatibility_Ideographs
 blk; n/a       ; CJK_Compatibility_Ideographs_Supplement
 blk; n/a       ; CJK_Radicals_Supplement
 blk; n/a       ; CJK_Symbols_and_Punctuation
 blk; n/a       ; CJK_Unified_Ideographs
 blk; n/a       ; CJK_Unified_Ideographs_Extension_A
 blk; n/a       ; CJK_Unified_Ideographs_Extension_B
 blk; n/a       ; Combining_Diacritical_Marks
 blk; n/a       ; Combining_Diacritical_Marks_for_Symbols
 blk; n/a       ; Combining_Half_Marks
 blk; n/a       ; Control_Pictures
 blk; n/a       ; Currency_Symbols
 blk; n/a       ; Cypriot_Syllabary
 blk; n/a       ; Cyrillic
 blk; n/a       ; Cyrillic_Supplement              ; Cyrillic_Supplementary
 blk; n/a       ; Deseret
 blk; n/a       ; Devanagari
 blk; n/a       ; Dingbats
 blk; n/a       ; Enclosed_Alphanumerics
 blk; n/a       ; Enclosed_CJK_Letters_and_Months
 blk; n/a       ; Ethiopic
 blk; n/a       ; General_Punctuation
 blk; n/a       ; Geometric_Shapes
 blk; n/a       ; Georgian
 blk; n/a       ; Gothic
 blk; n/a       ; Greek_and_Coptic
 blk; n/a       ; Greek_Extended
 blk; n/a       ; Gujarati
 blk; n/a       ; Gurmukhi
 blk; n/a       ; Halfwidth_and_Fullwidth_Forms
 blk; n/a       ; Hangul_Compatibility_Jamo
 blk; n/a       ; Hangul_Jamo
 blk; n/a       ; Hangul_Syllables
 blk; n/a       ; Hanunoo
 blk; n/a       ; Hebrew
 blk; n/a       ; High_Private_Use_Surrogates
 blk; n/a       ; High_Surrogates
 blk; n/a       ; Hiragana
 blk; n/a       ; Ideographic_Description_Characters
 blk; n/a       ; IPA_Extensions
 blk; n/a       ; Kanbun
 blk; n/a       ; Kangxi_Radicals
 blk; n/a       ; Kannada
 blk; n/a       ; Katakana
 blk; n/a       ; Katakana_Phonetic_Extensions
 blk; n/a       ; Khmer
 blk; n/a       ; Khmer_Symbols
 blk; n/a       ; Lao
 blk; n/a       ; Latin-1_Supplement
 blk; n/a       ; Latin_Extended-A
 blk; n/a       ; Latin_Extended-B
 blk; n/a       ; Latin_Extended_Additional
 blk; n/a       ; Letterlike_Symbols
 blk; n/a       ; Limbu
 blk; n/a       ; Linear_B_Ideograms
 blk; n/a       ; Linear_B_Syllabary
 blk; n/a       ; Low_Surrogates
 blk; n/a       ; Malayalam
 blk; n/a       ; Mathematical_Alphanumeric_Symbols
 blk; n/a       ; Mathematical_Operators
 blk; n/a       ; Miscellaneous_Mathematical_Symbols-A
 blk; n/a       ; Miscellaneous_Mathematical_Symbols-B
 blk; n/a       ; Miscellaneous_Symbols
 blk; n/a       ; Miscellaneous_Symbols_and_Arrows
 blk; n/a       ; Miscellaneous_Technical
 blk; n/a       ; Mongolian
 blk; n/a       ; Musical_Symbols
 blk; n/a       ; Myanmar
 blk; n/a       ; No_Block
 blk; n/a       ; Number_Forms
 blk; n/a       ; Ogham
 blk; n/a       ; Old_Italic
 blk; n/a       ; Optical_Character_Recognition
 blk; n/a       ; Oriya
 blk; n/a       ; Osmanya
 blk; n/a       ; Phonetic_Extensions
 blk; n/a       ; Private_Use_Area
 blk; n/a       ; Runic
 blk; n/a       ; Shavian
 blk; n/a       ; Sinhala
 blk; n/a       ; Small_Form_Variants
 blk; n/a       ; Spacing_Modifier_Letters
 blk; n/a       ; Specials
 blk; n/a       ; Superscripts_and_Subscripts
 blk; n/a       ; Supplemental_Arrows-A
 blk; n/a       ; Supplemental_Arrows-B
 blk; n/a       ; Supplemental_Mathematical_Operators
 blk; n/a       ; Supplementary_Private_Use_Area-A
 blk; n/a       ; Supplementary_Private_Use_Area-B
 blk; n/a       ; Syriac
 blk; n/a       ; Tagalog
 blk; n/a       ; Tagbanwa
 blk; n/a       ; Tags
 blk; n/a       ; Tai_Le
 blk; n/a       ; Tai_Xuan_Jing_Symbols
 blk; n/a       ; Tamil
 blk; n/a       ; Telugu
 blk; n/a       ; Thaana
 blk; n/a       ; Thai
 blk; n/a       ; Tibetan
 blk; n/a       ; Ugaritic
 blk; n/a       ; Unified_Canadian_Aboriginal_Syllabics
 blk; n/a       ; Variation_Selectors
 blk; n/a       ; Variation_Selectors_Supplement
 blk; n/a       ; Yi_Radicals
 blk; n/a       ; Yi_Syllables
 blk; n/a       ; Yijing_Hexagram_Symbols

 # Canonical_Combining_Class (ccc)

 ccc;   0; NR   ; Not_Reordered
 ccc;   1; OV   ; Overlay
 ccc;   7; NK   ; Nukta
 ccc;   8; KV   ; Kana_Voicing
 ccc;   9; VR   ; Virama
 ccc; 200; ATBL ; Attached_Below_Left
 ccc; 202; ATB  ; Attached_Below
 ccc; 216; ATAR ; Attached_Above_Right
 ccc; 218; BL   ; Below_Left
 ccc; 220; B    ; Below
 ccc; 222; BR   ; Below_Right
 ccc; 224; L    ; Left
 ccc; 226; R    ; Right
 ccc; 228; AL   ; Above_Left
 ccc; 230; A    ; Above
 ccc; 232; AR   ; Above_Right
 ccc; 233; DB   ; Double_Below
 ccc; 234; DA   ; Double_Above
 ccc; 240; IS   ; Iota_Subscript

 # Decomposition_Type (dt)

 dt ; can       ; Canonical
 dt ; com       ; Compat
 dt ; enc       ; Circle
 dt ; fin       ; Final
 dt ; font      ; Font
 dt ; fra       ; Fraction
 dt ; init      ; Initial
 dt ; iso       ; Isolated
 dt ; med       ; Medial
 dt ; nar       ; Narrow
 dt ; nb        ; Nobreak
 dt ; none      ; None
 dt ; sml       ; Small
 dt ; sqr       ; Square
 dt ; sub       ; Sub
 dt ; sup       ; Super
 dt ; vert      ; Vertical
 dt ; wide      ; Wide

 # East_Asian_Width (ea)

 ea ; A         ; Ambiguous
 ea ; F         ; Fullwidth
 ea ; H         ; Halfwidth
 ea ; N         ; Neutral
 ea ; Na        ; Narrow
 ea ; W         ; Wide

 # General_Category (gc)

 gc ; C         ; Other                            # Cc | Cf | Cn | Co | Cs
 gc ; Cc        ; Control
 gc ; Cf        ; Format
 gc ; Cn        ; Unassigned
 gc ; Co        ; Private_Use
 gc ; Cs        ; Surrogate
 gc ; L         ; Letter                           # Ll | Lm | Lo | Lt | Lu
 gc ; LC        ; Cased_Letter                     # Ll | Lt | Lu
 gc ; Ll        ; Lowercase_Letter
 gc ; Lm        ; Modifier_Letter
 gc ; Lo        ; Other_Letter
 gc ; Lt        ; Titlecase_Letter
 gc ; Lu        ; Uppercase_Letter
 gc ; M         ; Mark                             # Mc | Me | Mn
 gc ; Mc        ; Spacing_Mark
 gc ; Me        ; Enclosing_Mark
 gc ; Mn        ; Nonspacing_Mark
 gc ; N         ; Number                           # Nd | Nl | No
 gc ; Nd        ; Decimal_Number
 gc ; Nl        ; Letter_Number
 gc ; No        ; Other_Number
 gc ; P         ; Punctuation                      # Pc | Pd | Pe | Pf | Pi | Po | Ps
 gc ; Pc        ; Connector_Punctuation
 gc ; Pd        ; Dash_Punctuation
 gc ; Pe        ; Close_Punctuation
 gc ; Pf        ; Final_Punctuation
 gc ; Pi        ; Initial_Punctuation
 gc ; Po        ; Other_Punctuation
 gc ; Ps        ; Open_Punctuation
 gc ; S         ; Symbol                           # Sc | Sk | Sm | So
 gc ; Sc        ; Currency_Symbol
 gc ; Sk        ; Modifier_Symbol
 gc ; Sm        ; Math_Symbol
 gc ; So        ; Other_Symbol
 gc ; Z         ; Separator                        # Zl | Zp | Zs
 gc ; Zl        ; Line_Separator
 gc ; Zp        ; Paragraph_Separator
 gc ; Zs        ; Space_Separator

 # Hangul_Syllable_Type (hst)

 hst; L         ; Leading_Jamo
 hst; LV        ; LV_Syllable
 hst; LVT       ; LVT_Syllable
 hst; NA        ; Not_Applicable
 hst; T         ; Trailing_Jamo
 hst; V         ; Vowel_Jamo

 # Joining_Group (jg)

 jg ; n/a       ; Ain
 jg ; n/a       ; Alaph
 jg ; n/a       ; Alef
 jg ; n/a       ; Beh
 jg ; n/a       ; Beth
 jg ; n/a       ; Dal
 jg ; n/a       ; Dalath_Rish
 jg ; n/a       ; E
 jg ; n/a       ; Fe
 jg ; n/a       ; Feh
 jg ; n/a       ; Final_Semkath
 jg ; n/a       ; Gaf
 jg ; n/a       ; Gamal
 jg ; n/a       ; Hah
 jg ; n/a       ; Hamza_On_Heh_Goal
 jg ; n/a       ; He
 jg ; n/a       ; Heh
 jg ; n/a       ; Heh_Goal
 jg ; n/a       ; Heth
 jg ; n/a       ; Kaf
 jg ; n/a       ; Kaph
 jg ; n/a       ; Khaph
 jg ; n/a       ; Knotted_Heh
 jg ; n/a       ; Lam
 jg ; n/a       ; Lamadh
 jg ; n/a       ; Meem
 jg ; n/a       ; Mim
 jg ; n/a       ; No_Joining_Group
 jg ; n/a       ; Noon
 jg ; n/a       ; Nun
 jg ; n/a       ; Pe
 jg ; n/a       ; Qaf
 jg ; n/a       ; Qaph
 jg ; n/a       ; Reh
 jg ; n/a       ; Reversed_Pe
 jg ; n/a       ; Sad
 jg ; n/a       ; Sadhe
 jg ; n/a       ; Seen
 jg ; n/a       ; Semkath
 jg ; n/a       ; Shin
 jg ; n/a       ; Swash_Kaf
 jg ; n/a       ; Syriac_Waw
 jg ; n/a       ; Tah
 jg ; n/a       ; Taw
 jg ; n/a       ; Teh_Marbuta
 jg ; n/a       ; Teth
 jg ; n/a       ; Waw
 jg ; n/a       ; Yeh
 jg ; n/a       ; Yeh_Barree
 jg ; n/a       ; Yeh_With_Tail
 jg ; n/a       ; Yudh
 jg ; n/a       ; Yudh_He
 jg ; n/a       ; Zain
 jg ; n/a       ; Zhain

 # Joining_Type (jt)

 jt ; C         ; Join_Causing
 jt ; D         ; Dual_Joining
 jt ; L         ; Left_Joining
 jt ; R         ; Right_Joining
 jt ; T         ; Transparent
 jt ; U         ; Non_Joining

 # Line_Break (lb)

 lb ; AI        ; Ambiguous
 lb ; AL        ; Alphabetic
 lb ; B2        ; Break_Both
 lb ; BA        ; Break_After
 lb ; BB        ; Break_Before
 lb ; BK        ; Mandatory_Break
 lb ; CB        ; Contingent_Break
 lb ; CL        ; Close_Punctuation
 lb ; CM        ; Combining_Mark
 lb ; CR        ; Carriage_Return
 lb ; EX        ; Exclamation
 lb ; GL        ; Glue
 lb ; HY        ; Hyphen
 lb ; ID        ; Ideographic
 lb ; IN        ; Inseparable                      ; Inseperable
 lb ; IS        ; Infix_Numeric
 lb ; LF        ; Line_Feed
 lb ; NL        ; Next_Line
 lb ; NS        ; Nonstarter
 lb ; NU        ; Numeric
 lb ; OP        ; Open_Punctuation
 lb ; PO        ; Postfix_Numeric
 lb ; PR        ; Prefix_Numeric
 lb ; QU        ; Quotation
 lb ; SA        ; Complex_Context
 lb ; SG        ; Surrogate
 lb ; SP        ; Space
 lb ; SY        ; Break_Symbols
 lb ; WJ        ; Word_Joiner
 lb ; XX        ; Unknown
 lb ; ZW        ; ZWSpace

 # NFC_Quick_Check (NFC_QC)

 NFC_QC; M      ; Maybe
 NFC_QC; N      ; No
 NFC_QC; Y      ; Yes

 # NFD_Quick_Check (NFD_QC)

 NFD_QC; N      ; No
 NFD_QC; Y      ; Yes

 # NFKC_Quick_Check (NFKC_QC)

 NFKC_QC; M     ; Maybe
 NFKC_QC; N     ; No
 NFKC_QC; Y     ; Yes

 # NFKD_Quick_Check (NFKD_QC)

 NFKD_QC; N     ; No
 NFKD_QC; Y     ; Yes

 # Numeric_Type (nt)

 nt ; De        ; Decimal
 nt ; Di        ; Digit
 nt ; None      ; None
 nt ; Nu        ; Numeric

 # Script (sc)

 sc ; Arab      ; Arabic
 sc ; Armn      ; Armenian
 sc ; Beng      ; Bengali
 sc ; Bopo      ; Bopomofo
 sc ; Brai      ; Braille
 sc ; Buhd      ; Buhid
 sc ; Cans      ; Canadian_Aboriginal
 sc ; Cher      ; Cherokee
 sc ; Cprt      ; Cypriot
 sc ; Cyrl      ; Cyrillic
 sc ; Deva      ; Devanagari
 sc ; Dsrt      ; Deseret
 sc ; Ethi      ; Ethiopic
 sc ; Geor      ; Georgian
 sc ; Goth      ; Gothic
 sc ; Grek      ; Greek
 sc ; Gujr      ; Gujarati
 sc ; Guru      ; Gurmukhi
 sc ; Hang      ; Hangul
 sc ; Hani      ; Han
 sc ; Hano      ; Hanunoo
 sc ; Hebr      ; Hebrew
 sc ; Hira      ; Hiragana
 sc ; Hrkt      ; Katakana_Or_Hiragana
 sc ; Ital      ; Old_Italic
 sc ; Kana      ; Katakana
 sc ; Khmr      ; Khmer
 sc ; Knda      ; Kannada
 sc ; Laoo      ; Lao
 sc ; Latn      ; Latin
 sc ; Limb      ; Limbu
 sc ; Linb      ; Linear_B
 sc ; Mlym      ; Malayalam
 sc ; Mong      ; Mongolian
 sc ; Mymr      ; Myanmar
 sc ; Ogam      ; Ogham
 sc ; Orya      ; Oriya
 sc ; Osma      ; Osmanya
 sc ; Qaai      ; Inherited
 sc ; Runr      ; Runic
 sc ; Shaw      ; Shavian
 sc ; Sinh      ; Sinhala
 sc ; Syrc      ; Syriac
 sc ; Tagb      ; Tagbanwa
 sc ; Tale      ; Tai_Le
 sc ; Taml      ; Tamil
 sc ; Telu      ; Telugu
 sc ; Tglg      ; Tagalog
 sc ; Thaa      ; Thaana
 sc ; Thai      ; Thai
 sc ; Tibt      ; Tibetan
 sc ; Ugar      ; Ugaritic
 sc ; Yiii      ; Yi
 sc ; Zyyy      ; Common
	# PropertyValueAliases-4.0.1.txt
	# Date: 2004-03-02, 19:46:47 GMT [MD]
	#
	# Unicode Character Database
	# Copyright (c) 1991-2004 Unicode, Inc.
	# For terms of use, see http://www.unicode.org/terms_of_use.html
	# For documentation, see UCD.html
	# This file contains aliases for property values used in the UCD.
	# These names can be used for XML formats of UCD data, for regular-expression
	# property tests, and other programmatic textual descriptions of Unicode data.
	# For information on which properties are normative, see UCD.html.
	#
	# The names may be translated in appropriate environments, and additional
	# aliases may be useful.
	#
	# FORMAT
	#
	# Each line describes a property value name.
	# This consists of three or more fields, separated by semicolons.
	#
	# First Field: The first field describes the property for which that
	# property value name is used.
	#
	# Second Field: The second field is an abbreviated name.
	# If there is no abbreviated name available, the field is marked with "n/a".
	#
	# Third Field: The third field is a long name.
	#
	# In the case of ccc, there are 4 fields. The second field is numeric, third
	# is abbreviated, and fourth is long.
	#
	# The above are the preferred aliases. Other aliases may be listed in additional fields.
	#
	# Loose matching should be applied to all property names and property values, with
	# the exception of String Property values. With loose matching of property names and
	# values, the case distinctions, whitespace, and '_' are ignored. For Numeric Property
	# values, numeric equivalencies are applied: thus "01.00" is equivalent to "1".
	#
	# NOTE: Property value names are NOT unique across properties. For example:
	#
	# AL means Arabic Letter for the Bidi_Class property, and
	# AL means Above_Left for the Canonical_Combining_Class property, and
	# AL means Alphabetic for the Line_Break property.
	#
	# In addition, some property names may be the same as some property value names.
	# For example:
	#
	# sc means the Script property, and
	# Sc means the General_Category property value Currency_Symbol (Sc)
	#
	# The combination of property value and property name is, however, unique.
	#
	# For more information, see UTS #18: Regular Expression Guidelines
	# ================================================


	# Age (age)

	age; n/a ; 1.1
	age; n/a ; 2.0
	age; n/a ; 2.1
	age; n/a ; 3.0
	age; n/a ; 3.1
	age; n/a ; 3.2
	age; n/a ; 4.0
	age; n/a ; unassigned

	# Bidi_Class (bc)

	bc ; AL ; Arabic_Letter
	bc ; AN ; Arabic_Number
	bc ; B ; Paragraph_Separator
	bc ; BN ; Boundary_Neutral
	bc ; CS ; Common_Separator
	bc ; EN ; European_Number
	bc ; ES ; European_Separator
	bc ; ET ; European_Terminator
	bc ; L ; Left_To_Right
	bc ; LRE ; Left_To_Right_Embedding
	bc ; LRO ; Left_To_Right_Override
	bc ; NSM ; Nonspacing_Mark
	bc ; ON ; Other_Neutral
	bc ; PDF ; Pop_Directional_Format
	bc ; R ; Right_To_Left
	bc ; RLE ; Right_To_Left_Embedding
	bc ; RLO ; Right_To_Left_Override
	bc ; S ; Segment_Separator
	bc ; WS ; White_Space

	# Block (blk)

	blk; n/a ; Aegean_Numbers
	blk; n/a ; Alphabetic_Presentation_Forms
	blk; n/a ; Arabic
	blk; n/a ; Arabic_Presentation_Forms-A
	blk; n/a ; Arabic_Presentation_Forms-B
	blk; n/a ; Armenian
	blk; n/a ; Arrows
	blk; n/a ; Basic_Latin
	blk; n/a ; Bengali
	blk; n/a ; Block_Elements
	blk; n/a ; Bopomofo
	blk; n/a ; Bopomofo_Extended
	blk; n/a ; Box_Drawing
	blk; n/a ; Braille_Patterns
	blk; n/a ; Buhid
	blk; n/a ; Byzantine_Musical_Symbols
	blk; n/a ; Cherokee
	blk; n/a ; CJK_Compatibility
	blk; n/a ; CJK_Compatibility_Forms
	blk; n/a ; CJK_Compatibility_Ideographs
	blk; n/a ; CJK_Compatibility_Ideographs_Supplement
	blk; n/a ; CJK_Radicals_Supplement
	blk; n/a ; CJK_Symbols_and_Punctuation
	blk; n/a ; CJK_Unified_Ideographs
	blk; n/a ; CJK_Unified_Ideographs_Extension_A
	blk; n/a ; CJK_Unified_Ideographs_Extension_B
	blk; n/a ; Combining_Diacritical_Marks
	blk; n/a ; Combining_Diacritical_Marks_for_Symbols
	blk; n/a ; Combining_Half_Marks
	blk; n/a ; Control_Pictures
	blk; n/a ; Currency_Symbols
	blk; n/a ; Cypriot_Syllabary
	blk; n/a ; Cyrillic
	blk; n/a ; Cyrillic_Supplement ; Cyrillic_Supplementary
	blk; n/a ; Deseret
	blk; n/a ; Devanagari
	blk; n/a ; Dingbats
	blk; n/a ; Enclosed_Alphanumerics
	blk; n/a ; Enclosed_CJK_Letters_and_Months
	blk; n/a ; Ethiopic
	blk; n/a ; General_Punctuation
	blk; n/a ; Geometric_Shapes
	blk; n/a ; Georgian
	blk; n/a ; Gothic
	blk; n/a ; Greek_and_Coptic
	blk; n/a ; Greek_Extended
	blk; n/a ; Gujarati
	blk; n/a ; Gurmukhi
	blk; n/a ; Halfwidth_and_Fullwidth_Forms
	blk; n/a ; Hangul_Compatibility_Jamo
	blk; n/a ; Hangul_Jamo
	blk; n/a ; Hangul_Syllables
	blk; n/a ; Hanunoo
	blk; n/a ; Hebrew
	blk; n/a ; High_Private_Use_Surrogates
	blk; n/a ; High_Surrogates
	blk; n/a ; Hiragana
	blk; n/a ; Ideographic_Description_Characters
	blk; n/a ; IPA_Extensions
	blk; n/a ; Kanbun
	blk; n/a ; Kangxi_Radicals
	blk; n/a ; Kannada
	blk; n/a ; Katakana
	blk; n/a ; Katakana_Phonetic_Extensions
	blk; n/a ; Khmer
	blk; n/a ; Khmer_Symbols
	blk; n/a ; Lao
	blk; n/a ; Latin-1_Supplement
	blk; n/a ; Latin_Extended-A
	blk; n/a ; Latin_Extended-B
	blk; n/a ; Latin_Extended_Additional
	blk; n/a ; Letterlike_Symbols
	blk; n/a ; Limbu
	blk; n/a ; Linear_B_Ideograms
	blk; n/a ; Linear_B_Syllabary
	blk; n/a ; Low_Surrogates
	blk; n/a ; Malayalam
	blk; n/a ; Mathematical_Alphanumeric_Symbols
	blk; n/a ; Mathematical_Operators
	blk; n/a ; Miscellaneous_Mathematical_Symbols-A
	blk; n/a ; Miscellaneous_Mathematical_Symbols-B
	blk; n/a ; Miscellaneous_Symbols
	blk; n/a ; Miscellaneous_Symbols_and_Arrows
	blk; n/a ; Miscellaneous_Technical
	blk; n/a ; Mongolian
	blk; n/a ; Musical_Symbols
	blk; n/a ; Myanmar
	blk; n/a ; No_Block
	blk; n/a ; Number_Forms
	blk; n/a ; Ogham
	blk; n/a ; Old_Italic
	blk; n/a ; Optical_Character_Recognition
	blk; n/a ; Oriya
	blk; n/a ; Osmanya
	blk; n/a ; Phonetic_Extensions
	blk; n/a ; Private_Use_Area
	blk; n/a ; Runic
	blk; n/a ; Shavian
	blk; n/a ; Sinhala
	blk; n/a ; Small_Form_Variants
	blk; n/a ; Spacing_Modifier_Letters
	blk; n/a ; Specials
	blk; n/a ; Superscripts_and_Subscripts
	blk; n/a ; Supplemental_Arrows-A
	blk; n/a ; Supplemental_Arrows-B
	blk; n/a ; Supplemental_Mathematical_Operators
	blk; n/a ; Supplementary_Private_Use_Area-A
	blk; n/a ; Supplementary_Private_Use_Area-B
	blk; n/a ; Syriac
	blk; n/a ; Tagalog
	blk; n/a ; Tagbanwa
	blk; n/a ; Tags
	blk; n/a ; Tai_Le
	blk; n/a ; Tai_Xuan_Jing_Symbols
	blk; n/a ; Tamil
	blk; n/a ; Telugu
	blk; n/a ; Thaana
	blk; n/a ; Thai
	blk; n/a ; Tibetan
	blk; n/a ; Ugaritic
	blk; n/a ; Unified_Canadian_Aboriginal_Syllabics
	blk; n/a ; Variation_Selectors
	blk; n/a ; Variation_Selectors_Supplement
	blk; n/a ; Yi_Radicals
	blk; n/a ; Yi_Syllables
	blk; n/a ; Yijing_Hexagram_Symbols

	# Canonical_Combining_Class (ccc)

	ccc; 0; NR ; Not_Reordered
	ccc; 1; OV ; Overlay
	ccc; 7; NK ; Nukta
	ccc; 8; KV ; Kana_Voicing
	ccc; 9; VR ; Virama
	ccc; 200; ATBL ; Attached_Below_Left
	ccc; 202; ATB ; Attached_Below
	ccc; 216; ATAR ; Attached_Above_Right
	ccc; 218; BL ; Below_Left
	ccc; 220; B ; Below
	ccc; 222; BR ; Below_Right
	ccc; 224; L ; Left
	ccc; 226; R ; Right
	ccc; 228; AL ; Above_Left
	ccc; 230; A ; Above
	ccc; 232; AR ; Above_Right
	ccc; 233; DB ; Double_Below
	ccc; 234; DA ; Double_Above
	ccc; 240; IS ; Iota_Subscript

	# Decomposition_Type (dt)

	dt ; can ; Canonical
	dt ; com ; Compat
	dt ; enc ; Circle
	dt ; fin ; Final
	dt ; font ; Font
	dt ; fra ; Fraction
	dt ; init ; Initial
	dt ; iso ; Isolated
	dt ; med ; Medial
	dt ; nar ; Narrow
	dt ; nb ; Nobreak
	dt ; none ; None
	dt ; sml ; Small
	dt ; sqr ; Square
	dt ; sub ; Sub
	dt ; sup ; Super
	dt ; vert ; Vertical
	dt ; wide ; Wide

	# East_Asian_Width (ea)

	ea ; A ; Ambiguous
	ea ; F ; Fullwidth
	ea ; H ; Halfwidth
	ea ; N ; Neutral
	ea ; Na ; Narrow
	ea ; W ; Wide

	# General_Category (gc)

	gc ; C ; Other # Cc | Cf | Cn | Co | Cs
	gc ; Cc ; Control
	gc ; Cf ; Format
	gc ; Cn ; Unassigned
	gc ; Co ; Private_Use
	gc ; Cs ; Surrogate
	gc ; L ; Letter # Ll | Lm | Lo | Lt | Lu
	gc ; LC ; Cased_Letter # Ll | Lt | Lu
	gc ; Ll ; Lowercase_Letter
	gc ; Lm ; Modifier_Letter
	gc ; Lo ; Other_Letter
	gc ; Lt ; Titlecase_Letter
	gc ; Lu ; Uppercase_Letter
	gc ; M ; Mark # Mc | Me | Mn
	gc ; Mc ; Spacing_Mark
	gc ; Me ; Enclosing_Mark
	gc ; Mn ; Nonspacing_Mark
	gc ; N ; Number # Nd | Nl | No
	gc ; Nd ; Decimal_Number
	gc ; Nl ; Letter_Number
	gc ; No ; Other_Number
	gc ; P ; Punctuation # Pc | Pd | Pe | Pf | Pi | Po | Ps
	gc ; Pc ; Connector_Punctuation
	gc ; Pd ; Dash_Punctuation
	gc ; Pe ; Close_Punctuation
	gc ; Pf ; Final_Punctuation
	gc ; Pi ; Initial_Punctuation
	gc ; Po ; Other_Punctuation
	gc ; Ps ; Open_Punctuation
	gc ; S ; Symbol # Sc | Sk | Sm | So
	gc ; Sc ; Currency_Symbol
	gc ; Sk ; Modifier_Symbol
	gc ; Sm ; Math_Symbol
	gc ; So ; Other_Symbol
	gc ; Z ; Separator # Zl | Zp | Zs
	gc ; Zl ; Line_Separator
	gc ; Zp ; Paragraph_Separator
	gc ; Zs ; Space_Separator

	# Hangul_Syllable_Type (hst)

	hst; L ; Leading_Jamo
	hst; LV ; LV_Syllable
	hst; LVT ; LVT_Syllable
	hst; NA ; Not_Applicable
	hst; T ; Trailing_Jamo
	hst; V ; Vowel_Jamo

	# Joining_Group (jg)

	jg ; n/a ; Ain
	jg ; n/a ; Alaph
	jg ; n/a ; Alef
	jg ; n/a ; Beh
	jg ; n/a ; Beth
	jg ; n/a ; Dal
	jg ; n/a ; Dalath_Rish
	jg ; n/a ; E
	jg ; n/a ; Fe
	jg ; n/a ; Feh
	jg ; n/a ; Final_Semkath
	jg ; n/a ; Gaf
	jg ; n/a ; Gamal
	jg ; n/a ; Hah
	jg ; n/a ; Hamza_On_Heh_Goal
	jg ; n/a ; He
	jg ; n/a ; Heh
	jg ; n/a ; Heh_Goal
	jg ; n/a ; Heth
	jg ; n/a ; Kaf
	jg ; n/a ; Kaph
	jg ; n/a ; Khaph
	jg ; n/a ; Knotted_Heh
	jg ; n/a ; Lam
	jg ; n/a ; Lamadh
	jg ; n/a ; Meem
	jg ; n/a ; Mim
	jg ; n/a ; No_Joining_Group
	jg ; n/a ; Noon
	jg ; n/a ; Nun
	jg ; n/a ; Pe
	jg ; n/a ; Qaf
	jg ; n/a ; Qaph
	jg ; n/a ; Reh
	jg ; n/a ; Reversed_Pe
	jg ; n/a ; Sad
	jg ; n/a ; Sadhe
	jg ; n/a ; Seen
	jg ; n/a ; Semkath
	jg ; n/a ; Shin
	jg ; n/a ; Swash_Kaf
	jg ; n/a ; Syriac_Waw
	jg ; n/a ; Tah
	jg ; n/a ; Taw
	jg ; n/a ; Teh_Marbuta
	jg ; n/a ; Teth
	jg ; n/a ; Waw
	jg ; n/a ; Yeh
	jg ; n/a ; Yeh_Barree
	jg ; n/a ; Yeh_With_Tail
	jg ; n/a ; Yudh
	jg ; n/a ; Yudh_He
	jg ; n/a ; Zain
	jg ; n/a ; Zhain

	# Joining_Type (jt)

	jt ; C ; Join_Causing
	jt ; D ; Dual_Joining
	jt ; L ; Left_Joining
	jt ; R ; Right_Joining
	jt ; T ; Transparent
	jt ; U ; Non_Joining

	# Line_Break (lb)

	lb ; AI ; Ambiguous
	lb ; AL ; Alphabetic
	lb ; B2 ; Break_Both
	lb ; BA ; Break_After
	lb ; BB ; Break_Before
	lb ; BK ; Mandatory_Break
	lb ; CB ; Contingent_Break
	lb ; CL ; Close_Punctuation
	lb ; CM ; Combining_Mark
	lb ; CR ; Carriage_Return
	lb ; EX ; Exclamation
	lb ; GL ; Glue
	lb ; HY ; Hyphen
	lb ; ID ; Ideographic
	lb ; IN ; Inseparable ; Inseperable
	lb ; IS ; Infix_Numeric
	lb ; LF ; Line_Feed
	lb ; NL ; Next_Line
	lb ; NS ; Nonstarter
	lb ; NU ; Numeric
	lb ; OP ; Open_Punctuation
	lb ; PO ; Postfix_Numeric
	lb ; PR ; Prefix_Numeric
	lb ; QU ; Quotation
	lb ; SA ; Complex_Context
	lb ; SG ; Surrogate
	lb ; SP ; Space
	lb ; SY ; Break_Symbols
	lb ; WJ ; Word_Joiner
	lb ; XX ; Unknown
	lb ; ZW ; ZWSpace

	# NFC_Quick_Check (NFC_QC)

	NFC_QC; M ; Maybe
	NFC_QC; N ; No
	NFC_QC; Y ; Yes

	# NFD_Quick_Check (NFD_QC)

	NFD_QC; N ; No
	NFD_QC; Y ; Yes

	# NFKC_Quick_Check (NFKC_QC)

	NFKC_QC; M ; Maybe
	NFKC_QC; N ; No
	NFKC_QC; Y ; Yes

	# NFKD_Quick_Check (NFKD_QC)

	NFKD_QC; N ; No
	NFKD_QC; Y ; Yes

	# Numeric_Type (nt)

	nt ; De ; Decimal
	nt ; Di ; Digit
	nt ; None ; None
	nt ; Nu ; Numeric

	# Script (sc)

	sc ; Arab ; Arabic
	sc ; Armn ; Armenian
	sc ; Beng ; Bengali
	sc ; Bopo ; Bopomofo
	sc ; Brai ; Braille
	sc ; Buhd ; Buhid
	sc ; Cans ; Canadian_Aboriginal
	sc ; Cher ; Cherokee
	sc ; Cprt ; Cypriot
	sc ; Cyrl ; Cyrillic
	sc ; Deva ; Devanagari
	sc ; Dsrt ; Deseret
	sc ; Ethi ; Ethiopic
	sc ; Geor ; Georgian
	sc ; Goth ; Gothic
	sc ; Grek ; Greek
	sc ; Gujr ; Gujarati
	sc ; Guru ; Gurmukhi
	sc ; Hang ; Hangul
	sc ; Hani ; Han
	sc ; Hano ; Hanunoo
	sc ; Hebr ; Hebrew
	sc ; Hira ; Hiragana
	sc ; Hrkt ; Katakana_Or_Hiragana
	sc ; Ital ; Old_Italic
	sc ; Kana ; Katakana
	sc ; Khmr ; Khmer
	sc ; Knda ; Kannada
	sc ; Laoo ; Lao
	sc ; Latn ; Latin
	sc ; Limb ; Limbu
	sc ; Linb ; Linear_B
	sc ; Mlym ; Malayalam
	sc ; Mong ; Mongolian
	sc ; Mymr ; Myanmar
	sc ; Ogam ; Ogham
	sc ; Orya ; Oriya
	sc ; Osma ; Osmanya
	sc ; Qaai ; Inherited
	sc ; Runr ; Runic
	sc ; Shaw ; Shavian
	sc ; Sinh ; Sinhala
	sc ; Syrc ; Syriac
	sc ; Tagb ; Tagbanwa
	sc ; Tale ; Tai_Le
	sc ; Taml ; Tamil
	sc ; Telu ; Telugu
	sc ; Tglg ; Tagalog
	sc ; Thaa ; Thaana
	sc ; Thai ; Thai
	sc ; Tibt ; Tibetan
	sc ; Ugar ; Ugaritic
	sc ; Yiii ; Yi
	sc ; Zyyy ; Common