summary | refs | log | tree | commit | diff
path: root/lib/unicore/PropValueAliases.txt
diff options
context:
space:
mode:
Diffstat (limited to 'lib/unicore/PropValueAliases.txt')
-rw-r--r-- lib/unicore/PropValueAliases.txt 181
1 files changed, 163 insertions, 18 deletions
diff --git a/lib/unicore/PropValueAliases.txt b/lib/unicore/PropValueAliases.txt
index eeb3583188..fe82f23617 100644
--- a/lib/unicore/PropValueAliases.txt
+++ b/lib/unicore/PropValueAliases.txt
@@ -1,12 +1,10 @@
-# PropertyValueAliases-3.2.0.txt
-# Date: 2002-03-19,23:31:21 GMT [MD]
+# PropertyValueAliases-4.0.0.txt
+# Date: 2003-03-12, 23:46:08 GMT [MD]
#
# This file contains aliases for property values used in the UCD.
# These names can be used for XML formats of UCD data, for regular-expression
# property tests, and other programmatic textual descriptions of Unicode data.
-# The names are not normative, except where they correspond to normative property
-# values in the UCD. For information on which properties are normative, see
-# UnicodeCharacterDatabase.html.
+# For information on which properties are normative, see UCD.html.
#
# The names may be translated in appropriate environments, and additional
# aliases may be useful.
@@ -25,32 +23,32 @@
#
# Third Field: The third field is a long name.
#
-# In the case of ccc, their are 4 fields. The second field is numeric, third
+# In the case of ccc, there are 4 fields. The second field is numeric, third
# is abbreviated, and fourth is long.
#
# With loose matching of property names, the case distinctions, whitespace,
# and '_' are ignored.
#
-# NOTE: The Block property values are in Blocks.txt, and not repeated here.
-# For more information on the use of blocks, see UTR #24: Regular Expression Guidelines
-#
# NOTE: Currently there is at most one abbreviated name and one long name for
-# property value. However, in the future additional aliases
-# may be added. In such a case, the first line for the property value
-# would have the preferred alias for output.
+# each property value. However, in the future additional aliases may be added.
+# In such a case, the first line for the property value would have
+# the preferred alias for output.
#
# NOTE: The property value names are NOT unique across properties, especially
-# with loose matches. For example,
+# with loose matches. For example:
+#
# AL means Arabic Letter for the Bidi_Class property, and
# AL means Above_Left for the Combining_Class property, and
# AL means Alphabetic for the Line_Break property.
#
-# In addition, some property names may be the same as some property value names:
-# cc means Combining_Class property, and
-# cc means the General_Category property value Control (cc)
+# In addition, some property names may be the same as some property value names.
+# For example:
+#
+# cc means the Combining_Class property, and
+# cc means the General_Category property value Control (cc)
#
# The combination of property value and property name is, however, unique.
-# For more information, see UTR #24: Regular Expression Guidelines
+# For more information, see UTR #18: Regular Expression Guidelines
# ================================================
@@ -74,9 +72,136 @@ bc ; RLO ; Right_To_Left_Override
bc ; S ; Segment_Separator
bc ; WS ; White_Space
+blk; n/a ; Aegean_Numbers
+blk; n/a ; Alphabetic_Presentation_Forms
+blk; n/a ; Arabic
+blk; n/a ; Arabic_Presentation_Forms-A
+blk; n/a ; Arabic_Presentation_Forms-B
+blk; n/a ; Armenian
+blk; n/a ; Arrows
+blk; n/a ; Basic_Latin
+blk; n/a ; Bengali
+blk; n/a ; Block_Elements
+blk; n/a ; Bopomofo
+blk; n/a ; Bopomofo_Extended
+blk; n/a ; Box_Drawing
+blk; n/a ; Braille_Patterns
+blk; n/a ; Buhid
+blk; n/a ; Byzantine_Musical_Symbols
+blk; n/a ; Cherokee
+blk; n/a ; CJK_Compatibility
+blk; n/a ; CJK_Compatibility_Forms
+blk; n/a ; CJK_Compatibility_Ideographs
+blk; n/a ; CJK_Compatibility_Ideographs_Supplement
+blk; n/a ; CJK_Radicals_Supplement
+blk; n/a ; CJK_Symbols_and_Punctuation
+blk; n/a ; CJK_Unified_Ideographs
+blk; n/a ; CJK_Unified_Ideographs_Extension_A
+blk; n/a ; CJK_Unified_Ideographs_Extension_B
+blk; n/a ; Combining_Diacritical_Marks
+blk; n/a ; Combining_Diacritical_Marks_for_Symbols
+blk; n/a ; Combining_Half_Marks
+blk; n/a ; Control_Pictures
+blk; n/a ; Currency_Symbols
+blk; n/a ; Cypriot_Syllabary
+blk; n/a ; Cyrillic
+blk; n/a ; Cyrillic_Supplementary
+blk; n/a ; Deseret
+blk; n/a ; Devanagari
+blk; n/a ; Dingbats
+blk; n/a ; Enclosed_Alphanumerics
+blk; n/a ; Enclosed_CJK_Letters_and_Months
+blk; n/a ; Ethiopic
+blk; n/a ; General_Punctuation
+blk; n/a ; Geometric_Shapes
+blk; n/a ; Georgian
+blk; n/a ; Gothic
+blk; n/a ; Greek_and_Coptic
+blk; n/a ; Greek_Extended
+blk; n/a ; Gujarati
+blk; n/a ; Gurmukhi
+blk; n/a ; Halfwidth_and_Fullwidth_Forms
+blk; n/a ; Hangul_Compatibility_Jamo
+blk; n/a ; Hangul_Jamo
+blk; n/a ; Hangul_Syllables
+blk; n/a ; Hanunoo
+blk; n/a ; Hebrew
+blk; n/a ; High_Private_Use_Surrogates
+blk; n/a ; High_Surrogates
+blk; n/a ; Hiragana
+blk; n/a ; Ideographic_Description_Characters
+blk; n/a ; IPA_Extensions
+blk; n/a ; Kanbun
+blk; n/a ; Kangxi_Radicals
+blk; n/a ; Kannada
+blk; n/a ; Katakana
+blk; n/a ; Katakana_Phonetic_Extensions
+blk; n/a ; Khmer
+blk; n/a ; Khmer_Symbols
+blk; n/a ; Lao
+blk; n/a ; Latin_Extended_Additional
+blk; n/a ; Latin_Extended-A
+blk; n/a ; Latin_Extended-B
+blk; n/a ; Latin-1_Supplement
+blk; n/a ; Letterlike_Symbols
+blk; n/a ; Limbu
+blk; n/a ; Linear_B_Ideograms
+blk; n/a ; Linear_B_Syllabary
+blk; n/a ; Low_Surrogates
+blk; n/a ; Malayalam
+blk; n/a ; Mathematical_Alphanumeric_Symbols
+blk; n/a ; Mathematical_Operators
+blk; n/a ; Miscellaneous_Mathematical_Symbols-A
+blk; n/a ; Miscellaneous_Mathematical_Symbols-B
+blk; n/a ; Miscellaneous_Symbols
+blk; n/a ; Miscellaneous_Symbols_and_Arrows
+blk; n/a ; Miscellaneous_Technical
+blk; n/a ; Mongolian
+blk; n/a ; Musical_Symbols
+blk; n/a ; Myanmar
+blk; n/a ; No_Block
+blk; n/a ; Number_Forms
+blk; n/a ; Ogham
+blk; n/a ; Old_Italic
+blk; n/a ; Optical_Character_Recognition
+blk; n/a ; Oriya
+blk; n/a ; Osmanya
+blk; n/a ; Phonetic_Extensions
+blk; n/a ; Private_Use_Area
+blk; n/a ; Runic
+blk; n/a ; Shavian
+blk; n/a ; Sinhala
+blk; n/a ; Small_Form_Variants
+blk; n/a ; Spacing_Modifier_Letters
+blk; n/a ; Specials
+blk; n/a ; Superscripts_and_Subscripts
+blk; n/a ; Supplemental_Arrows-A
+blk; n/a ; Supplemental_Arrows-B
+blk; n/a ; Supplemental_Mathematical_Operators
+blk; n/a ; Supplementary_Private_Use_Area-A
+blk; n/a ; Supplementary_Private_Use_Area-B
+blk; n/a ; Syriac
+blk; n/a ; Tagalog
+blk; n/a ; Tagbanwa
+blk; n/a ; Tags
+blk; n/a ; Tai_Le
+blk; n/a ; Tai_Xuan_Jing_Symbols
+blk; n/a ; Tamil
+blk; n/a ; Telugu
+blk; n/a ; Thaana
+blk; n/a ; Thai
+blk; n/a ; Tibetan
+blk; n/a ; Ugaritic
+blk; n/a ; Unified_Canadian_Aboriginal_Syllabics
+blk; n/a ; Variation_Selectors
+blk; n/a ; Variation_Selectors_Supplement
+blk; n/a ; Yi_Radicals
+blk; n/a ; Yi_Syllables
+blk; n/a ; Yijing_Hexagram_Symbols
+
ccc; 0; NR ; Not_Reordered
ccc; 1; OV ; Overlay
-ccc; 202; ATBL ; Attached_Below_Left
+ccc; 202; ATB ; Attached_Below
ccc; 216; ATAR ; Attached_Above_Right
ccc; 218; BL ; Below_Left
ccc; 220; B ; Below
@@ -158,6 +283,13 @@ gc ; Zl ; Line_Separator
gc ; Zp ; Paragraph_Separator
gc ; Zs ; Space_Separator
+hst; L ; Leading_Jamo
+hst; LV ; LV_Syllable
+hst; LVT ; LVT_Syllable
+hst; NA ; Not_Applicable
+hst; T ; Trailing_Jamo
+hst; V ; Vowel_Jamo
+
jg ; n/a ; AIN
jg ; n/a ; ALAPH
jg ; n/a ; ALEF
@@ -166,6 +298,7 @@ jg ; n/a ; BETH
jg ; n/a ; DAL
jg ; n/a ; DALATH_RISH
jg ; n/a ; E
+jg ; n/a ; FE
jg ; n/a ; FEH
jg ; n/a ; FINAL_SEMKATH
jg ; n/a ; GAF
@@ -178,6 +311,7 @@ jg ; n/a ; HEH_GOAL
jg ; n/a ; HETH
jg ; n/a ; KAF
jg ; n/a ; KAPH
+jg ; n/a ; KHAPH
jg ; n/a ; KNOTTED_HEH
jg ; n/a ; LAM
jg ; n/a ; LAMADH
@@ -209,6 +343,7 @@ jg ; n/a ; YEH_WITH_TAIL
jg ; n/a ; YUDH
jg ; n/a ; YUDH_HE
jg ; n/a ; ZAIN
+jg ; n/a ; ZHAIN
jt ; C ; Join_Causing
jt ; D ; Dual_Joining
@@ -234,6 +369,7 @@ lb ; ID ; Ideographic
lb ; IN ; Inseperable
lb ; IS ; Infix_Numeric
lb ; LF ; Line_Feed
+lb ; NL ; Next_Line
lb ; NS ; Nonstarter
lb ; NU ; Numeric
lb ; OP ; Open_Punctuation
@@ -244,6 +380,7 @@ lb ; SA ; Complex_Context
lb ; SG ; Surrogate
lb ; SP ; Space
lb ; SY ; Break_Symbols
+lb ; WJ ; Word_Joiner
lb ; XX ; Unknown
lb ; ZW ; ZWSpace
@@ -260,9 +397,11 @@ sc ; Arab ; Arabic
sc ; Armn ; Armenian
sc ; Beng ; Bengali
sc ; Bopo ; Bopomofo
+sc ; Brai ; Braille
sc ; Buhd ; Buhid
sc ; Cans ; Canadian_Aboriginal
sc ; Cher ; Cherokee
+sc ; Cprt ; Cypriot
sc ; Cyrl ; Cyrillic
sc ; Deva ; Devanagari
sc ; Dsrt ; Deseret
@@ -283,21 +422,27 @@ sc ; Khmr ; Khmer
sc ; Knda ; Kannada
sc ; Laoo ; Lao
sc ; Latn ; Latin
+sc ; Limb ; Limbu
+sc ; Linb ; Linear_B
sc ; Mlym ; Malayalam
sc ; Mong ; Mongolian
sc ; Mymr ; Myanmar
sc ; Ogam ; Ogham
sc ; Orya ; Oriya
+sc ; Osma ; Osmanya
sc ; Qaai ; Inherited
sc ; Runr ; Runic
+sc ; Shaw ; Shavian
sc ; Sinh ; Sinhala
sc ; Syrc ; Syriac
sc ; Tagb ; Tagbanwa
+sc ; Tale ; Tai_Le
sc ; Taml ; Tamil
sc ; Telu ; Telugu
sc ; Tglg ; Tagalog
sc ; Thaa ; Thaana
sc ; Thai ; Thai
sc ; Tibt ; Tibetan
+sc ; Ugar ; Ugaritic
sc ; Yiii ; Yi
sc ; Zyyy ; Common