blob: 651bc2a77c70af56e616c60e1c2e81c796d36fb6 (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
|
/* -*- buffer-read-only: t -*-
* !!!!!!! DO NOT EDIT THIS FILE !!!!!!!
* This file is built by regen/unicode_constants.pl from Unicode data.
* Any changes made here will be lost!
*/
#ifndef H_UNICODE_CONSTANTS /* Guard against nested #includes */
#define H_UNICODE_CONSTANTS 1
/* This file contains #defines for various Unicode code points. The values
* the macros expand to are the native Unicode code point, or all or portions
* of the UTF-8 encoding for the code point. In the former case, the macro
* name has the suffix "_NATIVE"; otherwise, the suffix "_UTF8".
*
* The macros that have the suffix "_UTF8" may have further suffixes, as
* follows:
* "_FIRST_BYTE" if the value is just the first byte of the UTF-8
* representation; the value will be a numeric constant.
* "_TAIL" if instead it represents all but the first byte. Macros with
* this suffix, and those with no further suffix at all, are string
* constants. */
#if 'A' == 65 /* ASCII/Latin1 */

/* Whole encodings of a code point, as string constants. */
#  define NBSP_UTF8                             "\xC2\xA0"      /* U+00A0 */
#  define LATIN_SMALL_LETTER_LONG_S_UTF8        "\xC5\xBF"      /* U+017F */
#  define COMBINING_GRAVE_ACCENT_UTF8           "\xCC\x80"      /* U+0300 */
#  define GREEK_CAPITAL_LETTER_IOTA_UTF8        "\xCE\x99"      /* U+0399 */
#  define GREEK_SMALL_LETTER_MU_UTF8            "\xCE\xBC"      /* U+03BC */
#  define LATIN_CAPITAL_LETTER_SHARP_S_UTF8     "\xE1\xBA\x9E"  /* U+1E9E */
#  define HYPHEN_UTF8                           "\xE2\x80\x90"  /* U+2010 */
#  define LATIN_SMALL_LIGATURE_LONG_S_T_UTF8    "\xEF\xAC\x85"  /* U+FB05 */
#  define LATIN_SMALL_LIGATURE_ST_UTF8          "\xEF\xAC\x86"  /* U+FB06 */

/* Partial encodings: the first byte as a number, or the remaining bytes as
 * a string constant. */
#  define FIRST_SURROGATE_UTF8_FIRST_BYTE       0xED            /* U+D800 */
#  define BOM_UTF8_FIRST_BYTE                   0xEF            /* U+FEFF */
#  define BOM_UTF8_TAIL                         "\xBB\xBF"      /* U+FEFF */

/* Native code points, as numeric constants. */
#  define LF_NATIVE                                     0x0A    /* U+000A */
#  define CR_NATIVE                                     0x0D    /* U+000D */
#  define DEL_NATIVE                                    0x7F    /* U+007F */
#  define NBSP_NATIVE                                   0xA0    /* U+00A0 */
#  define MICRO_SIGN_NATIVE                             0xB5    /* U+00B5 */
#  define LATIN_CAPITAL_LETTER_A_WITH_RING_ABOVE_NATIVE 0xC5    /* U+00C5 */
#  define LATIN_SMALL_LETTER_SHARP_S_NATIVE             0xDF    /* U+00DF */
#  define LATIN_SMALL_LETTER_A_WITH_RING_ABOVE_NATIVE   0xE5    /* U+00E5 */
#  define LATIN_SMALL_LETTER_Y_WITH_DIAERESIS_NATIVE    0xFF    /* U+00FF */

#endif /* 'A' == 65: ASCII/Latin1 */
/* EBCDIC 1047: selected when 'A' and every punctuation character tested
 * below have exactly these native values. */
#if    'A'  == 193 \
    && '\\' == 224 \
    && '['  == 173 \
    && ']'  == 189 \
    && '{'  == 192 \
    && '}'  == 208 \
    && '^'  ==  95 \
    && '~'  == 161 \
    && '!'  ==  90 \
    && '#'  == 123 \
    && '|'  ==  79 \
    && '$'  ==  91 \
    && '@'  == 124 \
    && '`'  == 121

/* Whole encodings of a code point, as string constants. */
#  define NBSP_UTF8                             "\x80\x41"          /* U+00A0 */
#  define LATIN_SMALL_LETTER_LONG_S_UTF8        "\x8F\x73"          /* U+017F */
#  define COMBINING_GRAVE_ACCENT_UTF8           "\xAF\x41"          /* U+0300 */
#  define GREEK_CAPITAL_LETTER_IOTA_UTF8        "\xB3\x68"          /* U+0399 */
#  define GREEK_SMALL_LETTER_MU_UTF8            "\xB4\x70"          /* U+03BC */
#  define LATIN_CAPITAL_LETTER_SHARP_S_UTF8     "\xBF\x63\x72"      /* U+1E9E */
#  define HYPHEN_UTF8                           "\xCA\x41\x57"      /* U+2010 */
#  define LATIN_SMALL_LIGATURE_LONG_S_T_UTF8    "\xDD\x72\x67\x46"  /* U+FB05 */
#  define LATIN_SMALL_LIGATURE_ST_UTF8          "\xDD\x72\x67\x47"  /* U+FB06 */

/* Partial encodings: the first byte as a number, or the remaining bytes as
 * a string constant. */
#  define FIRST_SURROGATE_UTF8_FIRST_BYTE       0xDD                /* U+D800 */
#  define BOM_UTF8_FIRST_BYTE                   0xDD                /* U+FEFF */
#  define BOM_UTF8_TAIL                         "\x73\x66\x73"      /* U+FEFF */

/* Native code points, as numeric constants. */
#  define LF_NATIVE                                     0x15    /* U+000A */
#  define CR_NATIVE                                     0x0D    /* U+000D */
#  define DEL_NATIVE                                    0x07    /* U+007F */
#  define NBSP_NATIVE                                   0x41    /* U+00A0 */
#  define MICRO_SIGN_NATIVE                             0xA0    /* U+00B5 */
#  define LATIN_CAPITAL_LETTER_A_WITH_RING_ABOVE_NATIVE 0x67    /* U+00C5 */
#  define LATIN_SMALL_LETTER_SHARP_S_NATIVE             0x59    /* U+00DF */
#  define LATIN_SMALL_LETTER_A_WITH_RING_ABOVE_NATIVE   0x47    /* U+00E5 */
#  define LATIN_SMALL_LETTER_Y_WITH_DIAERESIS_NATIVE    0xDF    /* U+00FF */

#endif /* EBCDIC 1047 */
/* EBCDIC 037: selected when 'A' and every punctuation character tested
 * below have exactly these native values. */
#if    'A'  == 193 \
    && '\\' == 224 \
    && '['  == 186 \
    && ']'  == 187 \
    && '{'  == 192 \
    && '}'  == 208 \
    && '^'  == 176 \
    && '~'  == 161 \
    && '!'  ==  90 \
    && '#'  == 123 \
    && '|'  ==  79 \
    && '$'  ==  91 \
    && '@'  == 124 \
    && '`'  == 121

/* Whole encodings of a code point, as string constants. */
#  define NBSP_UTF8                             "\x78\x41"          /* U+00A0 */
#  define LATIN_SMALL_LETTER_LONG_S_UTF8        "\x8E\x72"          /* U+017F */
#  define COMBINING_GRAVE_ACCENT_UTF8           "\xAD\x41"          /* U+0300 */
#  define GREEK_CAPITAL_LETTER_IOTA_UTF8        "\xB2\x67"          /* U+0399 */
#  define GREEK_SMALL_LETTER_MU_UTF8            "\xB3\x6A"          /* U+03BC */
#  define LATIN_CAPITAL_LETTER_SHARP_S_UTF8     "\xBF\x62\x71"      /* U+1E9E */
#  define HYPHEN_UTF8                           "\xCA\x41\x57"      /* U+2010 */
#  define LATIN_SMALL_LIGATURE_LONG_S_T_UTF8    "\xDD\x71\x66\x46"  /* U+FB05 */
#  define LATIN_SMALL_LIGATURE_ST_UTF8          "\xDD\x71\x66\x47"  /* U+FB06 */

/* Partial encodings: the first byte as a number, or the remaining bytes as
 * a string constant. */
#  define FIRST_SURROGATE_UTF8_FIRST_BYTE       0xDD                /* U+D800 */
#  define BOM_UTF8_FIRST_BYTE                   0xDD                /* U+FEFF */
#  define BOM_UTF8_TAIL                         "\x72\x65\x72"      /* U+FEFF */

/* Native code points, as numeric constants. */
#  define LF_NATIVE                                     0x25    /* U+000A */
#  define CR_NATIVE                                     0x0D    /* U+000D */
#  define DEL_NATIVE                                    0x07    /* U+007F */
#  define NBSP_NATIVE                                   0x41    /* U+00A0 */
#  define MICRO_SIGN_NATIVE                             0xA0    /* U+00B5 */
#  define LATIN_CAPITAL_LETTER_A_WITH_RING_ABOVE_NATIVE 0x67    /* U+00C5 */
#  define LATIN_SMALL_LETTER_SHARP_S_NATIVE             0x59    /* U+00DF */
#  define LATIN_SMALL_LETTER_A_WITH_RING_ABOVE_NATIVE   0x47    /* U+00E5 */
#  define LATIN_SMALL_LETTER_Y_WITH_DIAERESIS_NATIVE    0xDF    /* U+00FF */

#endif /* EBCDIC 037 */
/* EBCDIC POSIX-BC: selected when 'A' and every punctuation character tested
 * below have exactly these native values. */
#if    'A'  == 193 \
    && '\\' == 188 \
    && '['  == 187 \
    && ']'  == 189 \
    && '{'  == 251 \
    && '}'  == 253 \
    && '^'  == 106 \
    && '~'  == 255 \
    && '!'  ==  90 \
    && '#'  == 123 \
    && '|'  ==  79 \
    && '$'  ==  91 \
    && '@'  == 124 \
    && '`'  ==  74

/* Whole encodings of a code point, as string constants. */
#  define NBSP_UTF8                             "\x8A\x41"          /* U+00A0 */
#  define LATIN_SMALL_LETTER_LONG_S_UTF8        "\x90\x75"          /* U+017F */
#  define COMBINING_GRAVE_ACCENT_UTF8           "\xAE\x41"          /* U+0300 */
#  define GREEK_CAPITAL_LETTER_IOTA_UTF8        "\xB2\x69"          /* U+0399 */
#  define GREEK_SMALL_LETTER_MU_UTF8            "\xB3\x72"          /* U+03BC */
#  define LATIN_CAPITAL_LETTER_SHARP_S_UTF8     "\xC0\x64\x74"      /* U+1E9E */
#  define HYPHEN_UTF8                           "\xCA\x41\x58"      /* U+2010 */
#  define LATIN_SMALL_LIGATURE_LONG_S_T_UTF8    "\xDC\x74\x68\x46"  /* U+FB05 */
#  define LATIN_SMALL_LIGATURE_ST_UTF8          "\xDC\x74\x68\x47"  /* U+FB06 */

/* Partial encodings: the first byte as a number, or the remaining bytes as
 * a string constant. */
#  define FIRST_SURROGATE_UTF8_FIRST_BYTE       0xDC                /* U+D800 */
#  define BOM_UTF8_FIRST_BYTE                   0xDC                /* U+FEFF */
#  define BOM_UTF8_TAIL                         "\x75\x67\x75"      /* U+FEFF */

/* Native code points, as numeric constants. */
#  define LF_NATIVE                                     0x15    /* U+000A */
#  define CR_NATIVE                                     0x0D    /* U+000D */
#  define DEL_NATIVE                                    0x07    /* U+007F */
#  define NBSP_NATIVE                                   0x41    /* U+00A0 */
#  define MICRO_SIGN_NATIVE                             0xA0    /* U+00B5 */
#  define LATIN_CAPITAL_LETTER_A_WITH_RING_ABOVE_NATIVE 0x67    /* U+00C5 */
#  define LATIN_SMALL_LETTER_SHARP_S_NATIVE             0x59    /* U+00DF */
#  define LATIN_SMALL_LETTER_A_WITH_RING_ABOVE_NATIVE   0x47    /* U+00E5 */
#  define LATIN_SMALL_LETTER_Y_WITH_DIAERESIS_NATIVE    0xDF    /* U+00FF */

#endif /* EBCDIC POSIX-BC */
#endif /* H_UNICODE_CONSTANTS */
/* ex: set ro: */
|