home *** CD-ROM | disk | FTP | other *** search
- # PropertyValueAliases-4.0.1.txt
- # Date: 2004-03-02, 19:46:47 GMT [MD]
- #
- # Unicode Character Database
- # Copyright (c) 1991-2004 Unicode, Inc.
- # For terms of use, see http://www.unicode.org/terms_of_use.html
- # For documentation, see UCD.html
- # This file contains aliases for property values used in the UCD.
- # These names can be used for XML formats of UCD data, for regular-expression
- # property tests, and other programmatic textual descriptions of Unicode data.
- # For information on which properties are normative, see UCD.html.
- #
- # The names may be translated in appropriate environments, and additional
- # aliases may be useful.
- #
- # FORMAT
- #
- # Each line describes a property value name.
- # This consists of three or more fields, separated by semicolons.
- #
- # First Field: The first field describes the property for which that
- # property value name is used.
- #
- # Second Field: The second field is an abbreviated name.
- # If there is no abbreviated name available, the field is marked with "n/a".
- #
- # Third Field: The third field is a long name.
- #
- # In the case of ccc, there are 4 fields. The second field is numeric, third
- # is abbreviated, and fourth is long.
- #
- # The above are the preferred aliases. Other aliases may be listed in additional fields.
- #
- # Loose matching should be applied to all property names and property values, with
- # the exception of String Property values. With loose matching of property names and
- # values, the case distinctions, whitespace, and '_' are ignored. For Numeric Property
- # values, numeric equivalencies are applied: thus "01.00" is equivalent to "1".
- #
- # NOTE: Property value names are NOT unique across properties. For example:
- #
- # AL means Arabic Letter for the Bidi_Class property, and
- # AL means Above_Left for the Canonical_Combining_Class property, and
- # AL means Alphabetic for the Line_Break property.
- #
- # In addition, some property names may be the same as some property value names.
- # For example:
- #
- # sc means the Script property, and
- # Sc means the General_Category property value Currency_Symbol (Sc)
- #
- # The combination of property value and property name is, however, unique.
- #
- # For more information, see UTS #18: Regular Expression Guidelines
- # ================================================
-
-
- # Age (age)
-
- age; n/a ; 1.1
- age; n/a ; 2.0
- age; n/a ; 2.1
- age; n/a ; 3.0
- age; n/a ; 3.1
- age; n/a ; 3.2
- age; n/a ; 4.0
- age; n/a ; unassigned
-
- # Bidi_Class (bc)
-
- bc ; AL ; Arabic_Letter
- bc ; AN ; Arabic_Number
- bc ; B ; Paragraph_Separator
- bc ; BN ; Boundary_Neutral
- bc ; CS ; Common_Separator
- bc ; EN ; European_Number
- bc ; ES ; European_Separator
- bc ; ET ; European_Terminator
- bc ; L ; Left_To_Right
- bc ; LRE ; Left_To_Right_Embedding
- bc ; LRO ; Left_To_Right_Override
- bc ; NSM ; Nonspacing_Mark
- bc ; ON ; Other_Neutral
- bc ; PDF ; Pop_Directional_Format
- bc ; R ; Right_To_Left
- bc ; RLE ; Right_To_Left_Embedding
- bc ; RLO ; Right_To_Left_Override
- bc ; S ; Segment_Separator
- bc ; WS ; White_Space
-
- # Block (blk)
-
- blk; n/a ; Aegean_Numbers
- blk; n/a ; Alphabetic_Presentation_Forms
- blk; n/a ; Arabic
- blk; n/a ; Arabic_Presentation_Forms-A
- blk; n/a ; Arabic_Presentation_Forms-B
- blk; n/a ; Armenian
- blk; n/a ; Arrows
- blk; n/a ; Basic_Latin
- blk; n/a ; Bengali
- blk; n/a ; Block_Elements
- blk; n/a ; Bopomofo
- blk; n/a ; Bopomofo_Extended
- blk; n/a ; Box_Drawing
- blk; n/a ; Braille_Patterns
- blk; n/a ; Buhid
- blk; n/a ; Byzantine_Musical_Symbols
- blk; n/a ; Cherokee
- blk; n/a ; CJK_Compatibility
- blk; n/a ; CJK_Compatibility_Forms
- blk; n/a ; CJK_Compatibility_Ideographs
- blk; n/a ; CJK_Compatibility_Ideographs_Supplement
- blk; n/a ; CJK_Radicals_Supplement
- blk; n/a ; CJK_Symbols_and_Punctuation
- blk; n/a ; CJK_Unified_Ideographs
- blk; n/a ; CJK_Unified_Ideographs_Extension_A
- blk; n/a ; CJK_Unified_Ideographs_Extension_B
- blk; n/a ; Combining_Diacritical_Marks
- blk; n/a ; Combining_Diacritical_Marks_for_Symbols
- blk; n/a ; Combining_Half_Marks
- blk; n/a ; Control_Pictures
- blk; n/a ; Currency_Symbols
- blk; n/a ; Cypriot_Syllabary
- blk; n/a ; Cyrillic
- blk; n/a ; Cyrillic_Supplement ; Cyrillic_Supplementary
- blk; n/a ; Deseret
- blk; n/a ; Devanagari
- blk; n/a ; Dingbats
- blk; n/a ; Enclosed_Alphanumerics
- blk; n/a ; Enclosed_CJK_Letters_and_Months
- blk; n/a ; Ethiopic
- blk; n/a ; General_Punctuation
- blk; n/a ; Geometric_Shapes
- blk; n/a ; Georgian
- blk; n/a ; Gothic
- blk; n/a ; Greek_and_Coptic
- blk; n/a ; Greek_Extended
- blk; n/a ; Gujarati
- blk; n/a ; Gurmukhi
- blk; n/a ; Halfwidth_and_Fullwidth_Forms
- blk; n/a ; Hangul_Compatibility_Jamo
- blk; n/a ; Hangul_Jamo
- blk; n/a ; Hangul_Syllables
- blk; n/a ; Hanunoo
- blk; n/a ; Hebrew
- blk; n/a ; High_Private_Use_Surrogates
- blk; n/a ; High_Surrogates
- blk; n/a ; Hiragana
- blk; n/a ; Ideographic_Description_Characters
- blk; n/a ; IPA_Extensions
- blk; n/a ; Kanbun
- blk; n/a ; Kangxi_Radicals
- blk; n/a ; Kannada
- blk; n/a ; Katakana
- blk; n/a ; Katakana_Phonetic_Extensions
- blk; n/a ; Khmer
- blk; n/a ; Khmer_Symbols
- blk; n/a ; Lao
- blk; n/a ; Latin-1_Supplement
- blk; n/a ; Latin_Extended-A
- blk; n/a ; Latin_Extended-B
- blk; n/a ; Latin_Extended_Additional
- blk; n/a ; Letterlike_Symbols
- blk; n/a ; Limbu
- blk; n/a ; Linear_B_Ideograms
- blk; n/a ; Linear_B_Syllabary
- blk; n/a ; Low_Surrogates
- blk; n/a ; Malayalam
- blk; n/a ; Mathematical_Alphanumeric_Symbols
- blk; n/a ; Mathematical_Operators
- blk; n/a ; Miscellaneous_Mathematical_Symbols-A
- blk; n/a ; Miscellaneous_Mathematical_Symbols-B
- blk; n/a ; Miscellaneous_Symbols
- blk; n/a ; Miscellaneous_Symbols_and_Arrows
- blk; n/a ; Miscellaneous_Technical
- blk; n/a ; Mongolian
- blk; n/a ; Musical_Symbols
- blk; n/a ; Myanmar
- blk; n/a ; No_Block
- blk; n/a ; Number_Forms
- blk; n/a ; Ogham
- blk; n/a ; Old_Italic
- blk; n/a ; Optical_Character_Recognition
- blk; n/a ; Oriya
- blk; n/a ; Osmanya
- blk; n/a ; Phonetic_Extensions
- blk; n/a ; Private_Use_Area
- blk; n/a ; Runic
- blk; n/a ; Shavian
- blk; n/a ; Sinhala
- blk; n/a ; Small_Form_Variants
- blk; n/a ; Spacing_Modifier_Letters
- blk; n/a ; Specials
- blk; n/a ; Superscripts_and_Subscripts
- blk; n/a ; Supplemental_Arrows-A
- blk; n/a ; Supplemental_Arrows-B
- blk; n/a ; Supplemental_Mathematical_Operators
- blk; n/a ; Supplementary_Private_Use_Area-A
- blk; n/a ; Supplementary_Private_Use_Area-B
- blk; n/a ; Syriac
- blk; n/a ; Tagalog
- blk; n/a ; Tagbanwa
- blk; n/a ; Tags
- blk; n/a ; Tai_Le
- blk; n/a ; Tai_Xuan_Jing_Symbols
- blk; n/a ; Tamil
- blk; n/a ; Telugu
- blk; n/a ; Thaana
- blk; n/a ; Thai
- blk; n/a ; Tibetan
- blk; n/a ; Ugaritic
- blk; n/a ; Unified_Canadian_Aboriginal_Syllabics
- blk; n/a ; Variation_Selectors
- blk; n/a ; Variation_Selectors_Supplement
- blk; n/a ; Yi_Radicals
- blk; n/a ; Yi_Syllables
- blk; n/a ; Yijing_Hexagram_Symbols
-
- # Canonical_Combining_Class (ccc)
-
- ccc; 0; NR ; Not_Reordered
- ccc; 1; OV ; Overlay
- ccc; 7; NK ; Nukta
- ccc; 8; KV ; Kana_Voicing
- ccc; 9; VR ; Virama
- ccc; 200; ATBL ; Attached_Below_Left
- ccc; 202; ATB ; Attached_Below
- ccc; 216; ATAR ; Attached_Above_Right
- ccc; 218; BL ; Below_Left
- ccc; 220; B ; Below
- ccc; 222; BR ; Below_Right
- ccc; 224; L ; Left
- ccc; 226; R ; Right
- ccc; 228; AL ; Above_Left
- ccc; 230; A ; Above
- ccc; 232; AR ; Above_Right
- ccc; 233; DB ; Double_Below
- ccc; 234; DA ; Double_Above
- ccc; 240; IS ; Iota_Subscript
-
- # Decomposition_Type (dt)
-
- dt ; can ; Canonical
- dt ; com ; Compat
- dt ; enc ; Circle
- dt ; fin ; Final
- dt ; font ; Font
- dt ; fra ; Fraction
- dt ; init ; Initial
- dt ; iso ; Isolated
- dt ; med ; Medial
- dt ; nar ; Narrow
- dt ; nb ; Nobreak
- dt ; none ; None
- dt ; sml ; Small
- dt ; sqr ; Square
- dt ; sub ; Sub
- dt ; sup ; Super
- dt ; vert ; Vertical
- dt ; wide ; Wide
-
- # East_Asian_Width (ea)
-
- ea ; A ; Ambiguous
- ea ; F ; Fullwidth
- ea ; H ; Halfwidth
- ea ; N ; Neutral
- ea ; Na ; Narrow
- ea ; W ; Wide
-
- # General_Category (gc)
-
- gc ; C ; Other # Cc | Cf | Cn | Co | Cs
- gc ; Cc ; Control
- gc ; Cf ; Format
- gc ; Cn ; Unassigned
- gc ; Co ; Private_Use
- gc ; Cs ; Surrogate
- gc ; L ; Letter # Ll | Lm | Lo | Lt | Lu
- gc ; LC ; Cased_Letter # Ll | Lt | Lu
- gc ; Ll ; Lowercase_Letter
- gc ; Lm ; Modifier_Letter
- gc ; Lo ; Other_Letter
- gc ; Lt ; Titlecase_Letter
- gc ; Lu ; Uppercase_Letter
- gc ; M ; Mark # Mc | Me | Mn
- gc ; Mc ; Spacing_Mark
- gc ; Me ; Enclosing_Mark
- gc ; Mn ; Nonspacing_Mark
- gc ; N ; Number # Nd | Nl | No
- gc ; Nd ; Decimal_Number
- gc ; Nl ; Letter_Number
- gc ; No ; Other_Number
- gc ; P ; Punctuation # Pc | Pd | Pe | Pf | Pi | Po | Ps
- gc ; Pc ; Connector_Punctuation
- gc ; Pd ; Dash_Punctuation
- gc ; Pe ; Close_Punctuation
- gc ; Pf ; Final_Punctuation
- gc ; Pi ; Initial_Punctuation
- gc ; Po ; Other_Punctuation
- gc ; Ps ; Open_Punctuation
- gc ; S ; Symbol # Sc | Sk | Sm | So
- gc ; Sc ; Currency_Symbol
- gc ; Sk ; Modifier_Symbol
- gc ; Sm ; Math_Symbol
- gc ; So ; Other_Symbol
- gc ; Z ; Separator # Zl | Zp | Zs
- gc ; Zl ; Line_Separator
- gc ; Zp ; Paragraph_Separator
- gc ; Zs ; Space_Separator
-
- # Hangul_Syllable_Type (hst)
-
- hst; L ; Leading_Jamo
- hst; LV ; LV_Syllable
- hst; LVT ; LVT_Syllable
- hst; NA ; Not_Applicable
- hst; T ; Trailing_Jamo
- hst; V ; Vowel_Jamo
-
- # Joining_Group (jg)
-
- jg ; n/a ; Ain
- jg ; n/a ; Alaph
- jg ; n/a ; Alef
- jg ; n/a ; Beh
- jg ; n/a ; Beth
- jg ; n/a ; Dal
- jg ; n/a ; Dalath_Rish
- jg ; n/a ; E
- jg ; n/a ; Fe
- jg ; n/a ; Feh
- jg ; n/a ; Final_Semkath
- jg ; n/a ; Gaf
- jg ; n/a ; Gamal
- jg ; n/a ; Hah
- jg ; n/a ; Hamza_On_Heh_Goal
- jg ; n/a ; He
- jg ; n/a ; Heh
- jg ; n/a ; Heh_Goal
- jg ; n/a ; Heth
- jg ; n/a ; Kaf
- jg ; n/a ; Kaph
- jg ; n/a ; Khaph
- jg ; n/a ; Knotted_Heh
- jg ; n/a ; Lam
- jg ; n/a ; Lamadh
- jg ; n/a ; Meem
- jg ; n/a ; Mim
- jg ; n/a ; No_Joining_Group
- jg ; n/a ; Noon
- jg ; n/a ; Nun
- jg ; n/a ; Pe
- jg ; n/a ; Qaf
- jg ; n/a ; Qaph
- jg ; n/a ; Reh
- jg ; n/a ; Reversed_Pe
- jg ; n/a ; Sad
- jg ; n/a ; Sadhe
- jg ; n/a ; Seen
- jg ; n/a ; Semkath
- jg ; n/a ; Shin
- jg ; n/a ; Swash_Kaf
- jg ; n/a ; Syriac_Waw
- jg ; n/a ; Tah
- jg ; n/a ; Taw
- jg ; n/a ; Teh_Marbuta
- jg ; n/a ; Teth
- jg ; n/a ; Waw
- jg ; n/a ; Yeh
- jg ; n/a ; Yeh_Barree
- jg ; n/a ; Yeh_With_Tail
- jg ; n/a ; Yudh
- jg ; n/a ; Yudh_He
- jg ; n/a ; Zain
- jg ; n/a ; Zhain
-
- # Joining_Type (jt)
-
- jt ; C ; Join_Causing
- jt ; D ; Dual_Joining
- jt ; L ; Left_Joining
- jt ; R ; Right_Joining
- jt ; T ; Transparent
- jt ; U ; Non_Joining
-
- # Line_Break (lb)
-
- lb ; AI ; Ambiguous
- lb ; AL ; Alphabetic
- lb ; B2 ; Break_Both
- lb ; BA ; Break_After
- lb ; BB ; Break_Before
- lb ; BK ; Mandatory_Break
- lb ; CB ; Contingent_Break
- lb ; CL ; Close_Punctuation
- lb ; CM ; Combining_Mark
- lb ; CR ; Carriage_Return
- lb ; EX ; Exclamation
- lb ; GL ; Glue
- lb ; HY ; Hyphen
- lb ; ID ; Ideographic
- lb ; IN ; Inseparable ; Inseperable
- lb ; IS ; Infix_Numeric
- lb ; LF ; Line_Feed
- lb ; NL ; Next_Line
- lb ; NS ; Nonstarter
- lb ; NU ; Numeric
- lb ; OP ; Open_Punctuation
- lb ; PO ; Postfix_Numeric
- lb ; PR ; Prefix_Numeric
- lb ; QU ; Quotation
- lb ; SA ; Complex_Context
- lb ; SG ; Surrogate
- lb ; SP ; Space
- lb ; SY ; Break_Symbols
- lb ; WJ ; Word_Joiner
- lb ; XX ; Unknown
- lb ; ZW ; ZWSpace
-
- # NFC_Quick_Check (NFC_QC)
-
- NFC_QC; M ; Maybe
- NFC_QC; N ; No
- NFC_QC; Y ; Yes
-
- # NFD_Quick_Check (NFD_QC)
-
- NFD_QC; N ; No
- NFD_QC; Y ; Yes
-
- # NFKC_Quick_Check (NFKC_QC)
-
- NFKC_QC; M ; Maybe
- NFKC_QC; N ; No
- NFKC_QC; Y ; Yes
-
- # NFKD_Quick_Check (NFKD_QC)
-
- NFKD_QC; N ; No
- NFKD_QC; Y ; Yes
-
- # Numeric_Type (nt)
-
- nt ; De ; Decimal
- nt ; Di ; Digit
- nt ; None ; None
- nt ; Nu ; Numeric
-
- # Script (sc)
-
- sc ; Arab ; Arabic
- sc ; Armn ; Armenian
- sc ; Beng ; Bengali
- sc ; Bopo ; Bopomofo
- sc ; Brai ; Braille
- sc ; Buhd ; Buhid
- sc ; Cans ; Canadian_Aboriginal
- sc ; Cher ; Cherokee
- sc ; Cprt ; Cypriot
- sc ; Cyrl ; Cyrillic
- sc ; Deva ; Devanagari
- sc ; Dsrt ; Deseret
- sc ; Ethi ; Ethiopic
- sc ; Geor ; Georgian
- sc ; Goth ; Gothic
- sc ; Grek ; Greek
- sc ; Gujr ; Gujarati
- sc ; Guru ; Gurmukhi
- sc ; Hang ; Hangul
- sc ; Hani ; Han
- sc ; Hano ; Hanunoo
- sc ; Hebr ; Hebrew
- sc ; Hira ; Hiragana
- sc ; Hrkt ; Katakana_Or_Hiragana
- sc ; Ital ; Old_Italic
- sc ; Kana ; Katakana
- sc ; Khmr ; Khmer
- sc ; Knda ; Kannada
- sc ; Laoo ; Lao
- sc ; Latn ; Latin
- sc ; Limb ; Limbu
- sc ; Linb ; Linear_B
- sc ; Mlym ; Malayalam
- sc ; Mong ; Mongolian
- sc ; Mymr ; Myanmar
- sc ; Ogam ; Ogham
- sc ; Orya ; Oriya
- sc ; Osma ; Osmanya
- sc ; Qaai ; Inherited
- sc ; Runr ; Runic
- sc ; Shaw ; Shavian
- sc ; Sinh ; Sinhala
- sc ; Syrc ; Syriac
- sc ; Tagb ; Tagbanwa
- sc ; Tale ; Tai_Le
- sc ; Taml ; Tamil
- sc ; Telu ; Telugu
- sc ; Tglg ; Tagalog
- sc ; Thaa ; Thaana
- sc ; Thai ; Thai
- sc ; Tibt ; Tibetan
- sc ; Ugar ; Ugaritic
- sc ; Yiii ; Yi
- sc ; Zyyy ; Common
-