diff options
author | Jarkko Hietaniemi <jhi@iki.fi> | 2002-03-29 15:36:43 +0000 |
---|---|---|
committer | Jarkko Hietaniemi <jhi@iki.fi> | 2002-03-29 15:36:43 +0000 |
commit | dbe755816e065c14b8ab50957873470db81d7b70 (patch) | |
tree | 627519e2f455f726c7a5e26f2524b417d44e8633 /lib/unicore/PropValueAliases.txt | |
parent | 1f6c91edf2c151ed2193ff9d3b2ac33d4db604fd (diff) | |
download | perl-dbe755816e065c14b8ab50957873470db81d7b70.tar.gz |
Rename for 8.3-friendliness.
p4raw-id: //depot/perl@15605
Diffstat (limited to 'lib/unicore/PropValueAliases.txt')
-rw-r--r-- | lib/unicore/PropValueAliases.txt | 303 |
1 files changed, 303 insertions, 0 deletions
diff --git a/lib/unicore/PropValueAliases.txt b/lib/unicore/PropValueAliases.txt new file mode 100644 index 0000000000..eeb3583188 --- /dev/null +++ b/lib/unicore/PropValueAliases.txt @@ -0,0 +1,303 @@ +# PropertyValueAliases-3.2.0.txt +# Date: 2002-03-19,23:31:21 GMT [MD] +# +# This file contains aliases for property values used in the UCD. +# These names can be used for XML formats of UCD data, for regular-expression +# property tests, and other programmatic textual descriptions of Unicode data. +# The names are not normative, except where they correspond to normative property +# values in the UCD. For information on which properties are normative, see +# UnicodeCharacterDatabase.html. +# +# The names may be translated in appropriate environments, and additional +# aliases may be useful. +# +# FORMAT +# +# Each line describes a property value name. +# This consists of three fields, separated by semicolons. +# +# First Field: The first field describes the property for which that +# property value name is used. +# There is one special pseudo-property: "qc" stands for any quick-check property +# +# Second Field: The second field is an abbreviated name. +# If there is no abbreviated name available, the field is marked with "n/a". +# +# Third Field: The third field is a long name. +# +# In the case of ccc, their are 4 fields. The second field is numeric, third +# is abbreviated, and fourth is long. +# +# With loose matching of property names, the case distinctions, whitespace, +# and '_' are ignored. +# +# NOTE: The Block property values are in Blocks.txt, and not repeated here. +# For more information on the use of blocks, see UTR #24: Regular Expression Guidelines +# +# NOTE: Currently there is at most one abbreviated name and one long name for +# property value. However, in the future additional aliases +# may be added. In such a case, the first line for the property value +# would have the preferred alias for output. +# +# NOTE: The property value names are NOT unique across properties, especially +# with loose matches. For example, +# AL means Arabic Letter for the Bidi_Class property, and +# AL means Alpha_Left for the Combining_Class property, and +# AL means Alphabetic for the Line_Break property. +# +# In addition, some property names may be the same as some property value names: +# cc means Combining_Class property, and +# cc means the General_Category property value Control (cc) +# +# The combination of property value and property name is, however, unique. +# For more information, see UTR #24: Regular Expression Guidelines +# ================================================ + + +bc ; AL ; Arabic_Letter +bc ; AN ; Arabic_Number +bc ; B ; Paragraph_Separator +bc ; BN ; Boundary_Neutral +bc ; CS ; Common_Separator +bc ; EN ; European_Number +bc ; ES ; European_Separator +bc ; ET ; European_Terminator +bc ; L ; Left_To_Right +bc ; LRE ; Left_To_Right_Embedding +bc ; LRO ; Left_To_Right_Override +bc ; NSM ; Nonspacing_Mark +bc ; ON ; Other_Neutral +bc ; PDF ; Pop_Directional_Format +bc ; R ; Right_To_Left +bc ; RLE ; Right_To_Left_Embedding +bc ; RLO ; Right_To_Left_Override +bc ; S ; Segment_Separator +bc ; WS ; White_Space + +ccc; 0; NR ; Not_Reordered +ccc; 1; OV ; Overlay +ccc; 202; ATBL ; Attached_Below_Left +ccc; 216; ATAR ; Attached_Above_Right +ccc; 218; BL ; Below_Left +ccc; 220; B ; Below +ccc; 222; BR ; Below_Right +ccc; 224; L ; Left +ccc; 226; R ; Right +ccc; 228; AL ; Above_Left +ccc; 230; A ; Above +ccc; 232; AR ; Above_Right +ccc; 233; DB ; Double_Below +ccc; 234; DA ; Double_Above +ccc; 240; IS ; Iota_Subscript +ccc; 7; NK ; Nukta +ccc; 8; KV ; Kana_Voicing +ccc; 9; VR ; Virama + +dt ; can ; canonical +dt ; com ; compat +dt ; enc ; circle +dt ; fin ; final +dt ; font ; font +dt ; fra ; fraction +dt ; init ; initial +dt ; iso ; isolated +dt ; med ; medial +dt ; n/a ; none +dt ; nar ; narrow +dt ; nb ; noBreak +dt ; sml ; small +dt ; sqr ; square +dt ; sub ; sub +dt ; sup ; super +dt ; vert ; vertical +dt ; wide ; wide + +ea ; A ; Ambiguous +ea ; F ; Fullwidth +ea ; H ; Halfwidth +ea ; N ; Neutral +ea ; Na ; Narrow +ea ; W ; Wide + +gc ; C ; Other # Cc | Cf | Cn | Co | Cs +gc ; Cc ; Control +gc ; Cf ; Format +gc ; Cn ; Unassigned +gc ; Co ; Private_Use +gc ; Cs ; Surrogate +gc ; L ; Letter # Ll | Lm | Lo | Lt | Lu +gc ; LC ; Cased_Letter # Ll | Lt | Lu +gc ; Ll ; Lowercase_Letter +gc ; Lm ; Modifier_Letter +gc ; Lo ; Other_Letter +gc ; Lt ; Titlecase_Letter +gc ; Lu ; Uppercase_Letter +gc ; M ; Mark # Mc | Me | Mn +gc ; Mc ; Spacing_Mark +gc ; Me ; Enclosing_Mark +gc ; Mn ; Nonspacing_Mark +gc ; N ; Number # Nd | Nl | No +gc ; Nd ; Decimal_Number +gc ; Nl ; Letter_Number +gc ; No ; Other_Number +gc ; P ; Punctuation # Pc | Pd | Pe | Pf | Pi | Po | Ps +gc ; Pc ; Connector_Punctuation +gc ; Pd ; Dash_Punctuation +gc ; Pe ; Close_Punctuation +gc ; Pf ; Final_Punctuation +gc ; Pi ; Initial_Punctuation +gc ; Po ; Other_Punctuation +gc ; Ps ; Open_Punctuation +gc ; S ; Symbol # Sc | Sk | Sm | So +gc ; Sc ; Currency_Symbol +gc ; Sk ; Modifier_Symbol +gc ; Sm ; Math_Symbol +gc ; So ; Other_Symbol +gc ; Z ; Separator # Zl | Zp | Zs +gc ; Zl ; Line_Separator +gc ; Zp ; Paragraph_Separator +gc ; Zs ; Space_Separator + +jg ; n/a ; AIN +jg ; n/a ; ALAPH +jg ; n/a ; ALEF +jg ; n/a ; BEH +jg ; n/a ; BETH +jg ; n/a ; DAL +jg ; n/a ; DALATH_RISH +jg ; n/a ; E +jg ; n/a ; FEH +jg ; n/a ; FINAL_SEMKATH +jg ; n/a ; GAF +jg ; n/a ; GAMAL +jg ; n/a ; HAH +jg ; n/a ; HAMZA_ON_HEH_GOAL +jg ; n/a ; HE +jg ; n/a ; HEH +jg ; n/a ; HEH_GOAL +jg ; n/a ; HETH +jg ; n/a ; KAF +jg ; n/a ; KAPH +jg ; n/a ; KNOTTED_HEH +jg ; n/a ; LAM +jg ; n/a ; LAMADH +jg ; n/a ; MEEM +jg ; n/a ; MIM +jg ; n/a ; NO_JOINING_GROUP +jg ; n/a ; NOON +jg ; n/a ; NUN +jg ; n/a ; PE +jg ; n/a ; QAF +jg ; n/a ; QAPH +jg ; n/a ; REH +jg ; n/a ; REVERSED_PE +jg ; n/a ; SAD +jg ; n/a ; SADHE +jg ; n/a ; SEEN +jg ; n/a ; SEMKATH +jg ; n/a ; SHIN +jg ; n/a ; SWASH_KAF +jg ; n/a ; SYRIAC_WAW +jg ; n/a ; TAH +jg ; n/a ; TAW +jg ; n/a ; TEH_MARBUTA +jg ; n/a ; TETH +jg ; n/a ; WAW +jg ; n/a ; YEH +jg ; n/a ; YEH_BARREE +jg ; n/a ; YEH_WITH_TAIL +jg ; n/a ; YUDH +jg ; n/a ; YUDH_HE +jg ; n/a ; ZAIN + +jt ; C ; Join_Causing +jt ; D ; Dual_Joining +jt ; L ; Left_Joining +jt ; R ; Right_Joining +jt ; T ; Transparent +jt ; U ; Non_Joining + +lb ; AI ; Ambiguous +lb ; AL ; Alphabetic +lb ; B2 ; Break_Both +lb ; BA ; Break_After +lb ; BB ; Break_Before +lb ; BK ; Mandatory_Break +lb ; CB ; Contingent_Break +lb ; CL ; Close_Punctuation +lb ; CM ; Combining_Mark +lb ; CR ; Carriage_Return +lb ; EX ; Exclamation +lb ; GL ; Glue +lb ; HY ; Hyphen +lb ; ID ; Ideographic +lb ; IN ; Inseperable +lb ; IS ; Infix_Numeric +lb ; LF ; Line_Feed +lb ; NS ; Nonstarter +lb ; NU ; Numeric +lb ; OP ; Open_Punctuation +lb ; PO ; Postfix_Numeric +lb ; PR ; Prefix_Numeric +lb ; QU ; Quotation +lb ; SA ; Complex_Context +lb ; SG ; Surrogate +lb ; SP ; Space +lb ; SY ; Break_Symbols +lb ; XX ; Unknown +lb ; ZW ; ZWSpace + +nt ; de ; Decimal +nt ; di ; Digit +nt ; n/a ; None +nt ; nu ; Numeric + +qc ; M ; Maybe +qc ; N ; No +qc ; Y ; Yes + +sc ; Arab ; Arabic +sc ; Armn ; Armenian +sc ; Beng ; Bengali +sc ; Bopo ; Bopomofo +sc ; Buhd ; Buhid +sc ; Cans ; Canadian_Aboriginal +sc ; Cher ; Cherokee +sc ; Cyrl ; Cyrillic +sc ; Deva ; Devanagari +sc ; Dsrt ; Deseret +sc ; Ethi ; Ethiopic +sc ; Geor ; Georgian +sc ; Goth ; Gothic +sc ; Grek ; Greek +sc ; Gujr ; Gujarati +sc ; Guru ; Gurmukhi +sc ; Hang ; Hangul +sc ; Hani ; Han +sc ; Hano ; Hanunoo +sc ; Hebr ; Hebrew +sc ; Hira ; Hiragana +sc ; Ital ; Old_Italic +sc ; Kana ; Katakana +sc ; Khmr ; Khmer +sc ; Knda ; Kannada +sc ; Laoo ; Lao +sc ; Latn ; Latin +sc ; Mlym ; Malayalam +sc ; Mong ; Mongolian +sc ; Mymr ; Myanmar +sc ; Ogam ; Ogham +sc ; Orya ; Oriya +sc ; Qaai ; Inherited +sc ; Runr ; Runic +sc ; Sinh ; Sinhala +sc ; Syrc ; Syriac +sc ; Tagb ; Tagbanwa +sc ; Taml ; Tamil +sc ; Telu ; Telugu +sc ; Tglg ; Tagalog +sc ; Thaa ; Thaana +sc ; Thai ; Thai +sc ; Tibt ; Tibetan +sc ; Yiii ; Yi +sc ; Zyyy ; Common |