1 /* The table and comments below along with the function xkb_keysym_to_ucs4
2 * are under the public domain and are derived as described below.
3 */
4 /* This module converts keysym values into the corresponding ISO 10646
5 * (UCS, Unicode) values.
6 *
7 * The array keysymtab[] contains pairs of X11 keysym values for graphical
8 * characters and the corresponding Unicode value. The function
9 * keysym2ucs() maps a keysym onto a Unicode value using a binary search,
10 * therefore keysymtab[] must remain SORTED by keysym value.
11 *
12 * The keysym -> UTF-8 conversion will hopefully one day be provided
13 * by Xlib via XmbLookupString() and should ideally not have to be
14 * done in X applications. But we are not there yet.
15 *
16 * We allow to represent any UCS character in the range U-00000000 to
17 * U-00FFFFFF by a keysym value in the range 0x01000000 to 0x01ffffff.
18 * This admittedly does not cover the entire 31-bit space of UCS, but
19 * it does cover all of the characters up to U-10FFFF, which can be
20 * represented by UTF-16, and more, and it is very unlikely that higher
21 * UCS codes will ever be assigned by ISO. So to get Unicode character
22 * U+ABCD you can directly use keysym 0x0100abcd.
23 *
24 * NOTE: The comments in the table below contain the actual character
25 * encoded in UTF-8, so for viewing and editing best use an editor in
26 * UTF-8 mode.
27 *
28 * Author: Markus G. Kuhn <http://www.cl.cam.ac.uk/~mgk25/>,
29 * University of Cambridge, April 2001
30 *
31 * Special thanks to Richard Verhoeven <river@win.tue.nl> for preparing
32 * an initial draft of the mapping table.
33 *
34 * This software is in the public domain. Share and enjoy!
35 *
36 */
37
38 #include "xkbcommon/xkbcommon.h"
39 #include "utils.h"
40 #include "utf8.h"
41
42 /* We don't use the uint32_t types here, to save some space. */
43 struct codepair {
44 uint16_t keysym;
45 uint16_t ucs;
46 };
47
48 static const struct codepair keysymtab[] = {
49 { 0x01a1, 0x0104 }, /* Aogonek Ą LATIN CAPITAL LETTER A WITH OGONEK */
50 { 0x01a2, 0x02d8 }, /* breve ˘ BREVE */
51 { 0x01a3, 0x0141 }, /* Lstroke Ł LATIN CAPITAL LETTER L WITH STROKE */
52 { 0x01a5, 0x013d }, /* Lcaron Ľ LATIN CAPITAL LETTER L WITH CARON */
53 { 0x01a6, 0x015a }, /* Sacute Ś LATIN CAPITAL LETTER S WITH ACUTE */
54 { 0x01a9, 0x0160 }, /* Scaron Š LATIN CAPITAL LETTER S WITH CARON */
55 { 0x01aa, 0x015e }, /* Scedilla Ş LATIN CAPITAL LETTER S WITH CEDILLA */
56 { 0x01ab, 0x0164 }, /* Tcaron Ť LATIN CAPITAL LETTER T WITH CARON */
57 { 0x01ac, 0x0179 }, /* Zacute Ź LATIN CAPITAL LETTER Z WITH ACUTE */
58 { 0x01ae, 0x017d }, /* Zcaron Ž LATIN CAPITAL LETTER Z WITH CARON */
59 { 0x01af, 0x017b }, /* Zabovedot Ż LATIN CAPITAL LETTER Z WITH DOT ABOVE */
60 { 0x01b1, 0x0105 }, /* aogonek ą LATIN SMALL LETTER A WITH OGONEK */
61 { 0x01b2, 0x02db }, /* ogonek ˛ OGONEK */
62 { 0x01b3, 0x0142 }, /* lstroke ł LATIN SMALL LETTER L WITH STROKE */
63 { 0x01b5, 0x013e }, /* lcaron ľ LATIN SMALL LETTER L WITH CARON */
64 { 0x01b6, 0x015b }, /* sacute ś LATIN SMALL LETTER S WITH ACUTE */
65 { 0x01b7, 0x02c7 }, /* caron ˇ CARON */
66 { 0x01b9, 0x0161 }, /* scaron š LATIN SMALL LETTER S WITH CARON */
67 { 0x01ba, 0x015f }, /* scedilla ş LATIN SMALL LETTER S WITH CEDILLA */
68 { 0x01bb, 0x0165 }, /* tcaron ť LATIN SMALL LETTER T WITH CARON */
69 { 0x01bc, 0x017a }, /* zacute ź LATIN SMALL LETTER Z WITH ACUTE */
70 { 0x01bd, 0x02dd }, /* doubleacute ˝ DOUBLE ACUTE ACCENT */
71 { 0x01be, 0x017e }, /* zcaron ž LATIN SMALL LETTER Z WITH CARON */
72 { 0x01bf, 0x017c }, /* zabovedot ż LATIN SMALL LETTER Z WITH DOT ABOVE */
73 { 0x01c0, 0x0154 }, /* Racute Ŕ LATIN CAPITAL LETTER R WITH ACUTE */
74 { 0x01c3, 0x0102 }, /* Abreve Ă LATIN CAPITAL LETTER A WITH BREVE */
75 { 0x01c5, 0x0139 }, /* Lacute Ĺ LATIN CAPITAL LETTER L WITH ACUTE */
76 { 0x01c6, 0x0106 }, /* Cacute Ć LATIN CAPITAL LETTER C WITH ACUTE */
77 { 0x01c8, 0x010c }, /* Ccaron Č LATIN CAPITAL LETTER C WITH CARON */
78 { 0x01ca, 0x0118 }, /* Eogonek Ę LATIN CAPITAL LETTER E WITH OGONEK */
79 { 0x01cc, 0x011a }, /* Ecaron Ě LATIN CAPITAL LETTER E WITH CARON */
80 { 0x01cf, 0x010e }, /* Dcaron Ď LATIN CAPITAL LETTER D WITH CARON */
81 { 0x01d0, 0x0110 }, /* Dstroke Đ LATIN CAPITAL LETTER D WITH STROKE */
82 { 0x01d1, 0x0143 }, /* Nacute Ń LATIN CAPITAL LETTER N WITH ACUTE */
83 { 0x01d2, 0x0147 }, /* Ncaron Ň LATIN CAPITAL LETTER N WITH CARON */
84 { 0x01d5, 0x0150 }, /* Odoubleacute Ő LATIN CAPITAL LETTER O WITH DOUBLE ACUTE */
85 { 0x01d8, 0x0158 }, /* Rcaron Ř LATIN CAPITAL LETTER R WITH CARON */
86 { 0x01d9, 0x016e }, /* Uring Ů LATIN CAPITAL LETTER U WITH RING ABOVE */
87 { 0x01db, 0x0170 }, /* Udoubleacute Ű LATIN CAPITAL LETTER U WITH DOUBLE ACUTE */
88 { 0x01de, 0x0162 }, /* Tcedilla Ţ LATIN CAPITAL LETTER T WITH CEDILLA */
89 { 0x01e0, 0x0155 }, /* racute ŕ LATIN SMALL LETTER R WITH ACUTE */
90 { 0x01e3, 0x0103 }, /* abreve ă LATIN SMALL LETTER A WITH BREVE */
91 { 0x01e5, 0x013a }, /* lacute ĺ LATIN SMALL LETTER L WITH ACUTE */
92 { 0x01e6, 0x0107 }, /* cacute ć LATIN SMALL LETTER C WITH ACUTE */
93 { 0x01e8, 0x010d }, /* ccaron č LATIN SMALL LETTER C WITH CARON */
94 { 0x01ea, 0x0119 }, /* eogonek ę LATIN SMALL LETTER E WITH OGONEK */
95 { 0x01ec, 0x011b }, /* ecaron ě LATIN SMALL LETTER E WITH CARON */
96 { 0x01ef, 0x010f }, /* dcaron ď LATIN SMALL LETTER D WITH CARON */
97 { 0x01f0, 0x0111 }, /* dstroke đ LATIN SMALL LETTER D WITH STROKE */
98 { 0x01f1, 0x0144 }, /* nacute ń LATIN SMALL LETTER N WITH ACUTE */
99 { 0x01f2, 0x0148 }, /* ncaron ň LATIN SMALL LETTER N WITH CARON */
100 { 0x01f5, 0x0151 }, /* odoubleacute ő LATIN SMALL LETTER O WITH DOUBLE ACUTE */
101 { 0x01f8, 0x0159 }, /* rcaron ř LATIN SMALL LETTER R WITH CARON */
102 { 0x01f9, 0x016f }, /* uring ů LATIN SMALL LETTER U WITH RING ABOVE */
103 { 0x01fb, 0x0171 }, /* udoubleacute ű LATIN SMALL LETTER U WITH DOUBLE ACUTE */
104 { 0x01fe, 0x0163 }, /* tcedilla ţ LATIN SMALL LETTER T WITH CEDILLA */
105 { 0x01ff, 0x02d9 }, /* abovedot ˙ DOT ABOVE */
106 { 0x02a1, 0x0126 }, /* Hstroke Ħ LATIN CAPITAL LETTER H WITH STROKE */
107 { 0x02a6, 0x0124 }, /* Hcircumflex Ĥ LATIN CAPITAL LETTER H WITH CIRCUMFLEX */
108 { 0x02a9, 0x0130 }, /* Iabovedot İ LATIN CAPITAL LETTER I WITH DOT ABOVE */
109 { 0x02ab, 0x011e }, /* Gbreve Ğ LATIN CAPITAL LETTER G WITH BREVE */
110 { 0x02ac, 0x0134 }, /* Jcircumflex Ĵ LATIN CAPITAL LETTER J WITH CIRCUMFLEX */
111 { 0x02b1, 0x0127 }, /* hstroke ħ LATIN SMALL LETTER H WITH STROKE */
112 { 0x02b6, 0x0125 }, /* hcircumflex ĥ LATIN SMALL LETTER H WITH CIRCUMFLEX */
113 { 0x02b9, 0x0131 }, /* idotless ı LATIN SMALL LETTER DOTLESS I */
114 { 0x02bb, 0x011f }, /* gbreve ğ LATIN SMALL LETTER G WITH BREVE */
115 { 0x02bc, 0x0135 }, /* jcircumflex ĵ LATIN SMALL LETTER J WITH CIRCUMFLEX */
116 { 0x02c5, 0x010a }, /* Cabovedot Ċ LATIN CAPITAL LETTER C WITH DOT ABOVE */
117 { 0x02c6, 0x0108 }, /* Ccircumflex Ĉ LATIN CAPITAL LETTER C WITH CIRCUMFLEX */
118 { 0x02d5, 0x0120 }, /* Gabovedot Ġ LATIN CAPITAL LETTER G WITH DOT ABOVE */
119 { 0x02d8, 0x011c }, /* Gcircumflex Ĝ LATIN CAPITAL LETTER G WITH CIRCUMFLEX */
120 { 0x02dd, 0x016c }, /* Ubreve Ŭ LATIN CAPITAL LETTER U WITH BREVE */
121 { 0x02de, 0x015c }, /* Scircumflex Ŝ LATIN CAPITAL LETTER S WITH CIRCUMFLEX */
122 { 0x02e5, 0x010b }, /* cabovedot ċ LATIN SMALL LETTER C WITH DOT ABOVE */
123 { 0x02e6, 0x0109 }, /* ccircumflex ĉ LATIN SMALL LETTER C WITH CIRCUMFLEX */
124 { 0x02f5, 0x0121 }, /* gabovedot ġ LATIN SMALL LETTER G WITH DOT ABOVE */
125 { 0x02f8, 0x011d }, /* gcircumflex ĝ LATIN SMALL LETTER G WITH CIRCUMFLEX */
126 { 0x02fd, 0x016d }, /* ubreve ŭ LATIN SMALL LETTER U WITH BREVE */
127 { 0x02fe, 0x015d }, /* scircumflex ŝ LATIN SMALL LETTER S WITH CIRCUMFLEX */
128 { 0x03a2, 0x0138 }, /* kra ĸ LATIN SMALL LETTER KRA */
129 { 0x03a3, 0x0156 }, /* Rcedilla Ŗ LATIN CAPITAL LETTER R WITH CEDILLA */
130 { 0x03a5, 0x0128 }, /* Itilde Ĩ LATIN CAPITAL LETTER I WITH TILDE */
131 { 0x03a6, 0x013b }, /* Lcedilla Ļ LATIN CAPITAL LETTER L WITH CEDILLA */
132 { 0x03aa, 0x0112 }, /* Emacron Ē LATIN CAPITAL LETTER E WITH MACRON */
133 { 0x03ab, 0x0122 }, /* Gcedilla Ģ LATIN CAPITAL LETTER G WITH CEDILLA */
134 { 0x03ac, 0x0166 }, /* Tslash Ŧ LATIN CAPITAL LETTER T WITH STROKE */
135 { 0x03b3, 0x0157 }, /* rcedilla ŗ LATIN SMALL LETTER R WITH CEDILLA */
136 { 0x03b5, 0x0129 }, /* itilde ĩ LATIN SMALL LETTER I WITH TILDE */
137 { 0x03b6, 0x013c }, /* lcedilla ļ LATIN SMALL LETTER L WITH CEDILLA */
138 { 0x03ba, 0x0113 }, /* emacron ē LATIN SMALL LETTER E WITH MACRON */
139 { 0x03bb, 0x0123 }, /* gcedilla ģ LATIN SMALL LETTER G WITH CEDILLA */
140 { 0x03bc, 0x0167 }, /* tslash ŧ LATIN SMALL LETTER T WITH STROKE */
141 { 0x03bd, 0x014a }, /* ENG Ŋ LATIN CAPITAL LETTER ENG */
142 { 0x03bf, 0x014b }, /* eng ŋ LATIN SMALL LETTER ENG */
143 { 0x03c0, 0x0100 }, /* Amacron Ā LATIN CAPITAL LETTER A WITH MACRON */
144 { 0x03c7, 0x012e }, /* Iogonek Į LATIN CAPITAL LETTER I WITH OGONEK */
145 { 0x03cc, 0x0116 }, /* Eabovedot Ė LATIN CAPITAL LETTER E WITH DOT ABOVE */
146 { 0x03cf, 0x012a }, /* Imacron Ī LATIN CAPITAL LETTER I WITH MACRON */
147 { 0x03d1, 0x0145 }, /* Ncedilla Ņ LATIN CAPITAL LETTER N WITH CEDILLA */
148 { 0x03d2, 0x014c }, /* Omacron Ō LATIN CAPITAL LETTER O WITH MACRON */
149 { 0x03d3, 0x0136 }, /* Kcedilla Ķ LATIN CAPITAL LETTER K WITH CEDILLA */
150 { 0x03d9, 0x0172 }, /* Uogonek Ų LATIN CAPITAL LETTER U WITH OGONEK */
151 { 0x03dd, 0x0168 }, /* Utilde Ũ LATIN CAPITAL LETTER U WITH TILDE */
152 { 0x03de, 0x016a }, /* Umacron Ū LATIN CAPITAL LETTER U WITH MACRON */
153 { 0x03e0, 0x0101 }, /* amacron ā LATIN SMALL LETTER A WITH MACRON */
154 { 0x03e7, 0x012f }, /* iogonek į LATIN SMALL LETTER I WITH OGONEK */
155 { 0x03ec, 0x0117 }, /* eabovedot ė LATIN SMALL LETTER E WITH DOT ABOVE */
156 { 0x03ef, 0x012b }, /* imacron ī LATIN SMALL LETTER I WITH MACRON */
157 { 0x03f1, 0x0146 }, /* ncedilla ņ LATIN SMALL LETTER N WITH CEDILLA */
158 { 0x03f2, 0x014d }, /* omacron ō LATIN SMALL LETTER O WITH MACRON */
159 { 0x03f3, 0x0137 }, /* kcedilla ķ LATIN SMALL LETTER K WITH CEDILLA */
160 { 0x03f9, 0x0173 }, /* uogonek ų LATIN SMALL LETTER U WITH OGONEK */
161 { 0x03fd, 0x0169 }, /* utilde ũ LATIN SMALL LETTER U WITH TILDE */
162 { 0x03fe, 0x016b }, /* umacron ū LATIN SMALL LETTER U WITH MACRON */
163 { 0x047e, 0x203e }, /* overline ‾ OVERLINE */
164 { 0x04a1, 0x3002 }, /* kana_fullstop 。 IDEOGRAPHIC FULL STOP */
165 { 0x04a2, 0x300c }, /* kana_openingbracket 「 LEFT CORNER BRACKET */
166 { 0x04a3, 0x300d }, /* kana_closingbracket 」 RIGHT CORNER BRACKET */
167 { 0x04a4, 0x3001 }, /* kana_comma 、 IDEOGRAPHIC COMMA */
168 { 0x04a5, 0x30fb }, /* kana_conjunctive ・ KATAKANA MIDDLE DOT */
169 { 0x04a6, 0x30f2 }, /* kana_WO ヲ KATAKANA LETTER WO */
170 { 0x04a7, 0x30a1 }, /* kana_a ァ KATAKANA LETTER SMALL A */
171 { 0x04a8, 0x30a3 }, /* kana_i ィ KATAKANA LETTER SMALL I */
172 { 0x04a9, 0x30a5 }, /* kana_u ゥ KATAKANA LETTER SMALL U */
173 { 0x04aa, 0x30a7 }, /* kana_e ェ KATAKANA LETTER SMALL E */
174 { 0x04ab, 0x30a9 }, /* kana_o ォ KATAKANA LETTER SMALL O */
175 { 0x04ac, 0x30e3 }, /* kana_ya ャ KATAKANA LETTER SMALL YA */
176 { 0x04ad, 0x30e5 }, /* kana_yu ュ KATAKANA LETTER SMALL YU */
177 { 0x04ae, 0x30e7 }, /* kana_yo ョ KATAKANA LETTER SMALL YO */
178 { 0x04af, 0x30c3 }, /* kana_tsu ッ KATAKANA LETTER SMALL TU */
179 { 0x04b0, 0x30fc }, /* prolongedsound ー KATAKANA-HIRAGANA PROLONGED SOUND MARK */
180 { 0x04b1, 0x30a2 }, /* kana_A ア KATAKANA LETTER A */
181 { 0x04b2, 0x30a4 }, /* kana_I イ KATAKANA LETTER I */
182 { 0x04b3, 0x30a6 }, /* kana_U ウ KATAKANA LETTER U */
183 { 0x04b4, 0x30a8 }, /* kana_E エ KATAKANA LETTER E */
184 { 0x04b5, 0x30aa }, /* kana_O オ KATAKANA LETTER O */
185 { 0x04b6, 0x30ab }, /* kana_KA カ KATAKANA LETTER KA */
186 { 0x04b7, 0x30ad }, /* kana_KI キ KATAKANA LETTER KI */
187 { 0x04b8, 0x30af }, /* kana_KU ク KATAKANA LETTER KU */
188 { 0x04b9, 0x30b1 }, /* kana_KE ケ KATAKANA LETTER KE */
189 { 0x04ba, 0x30b3 }, /* kana_KO コ KATAKANA LETTER KO */
190 { 0x04bb, 0x30b5 }, /* kana_SA サ KATAKANA LETTER SA */
191 { 0x04bc, 0x30b7 }, /* kana_SHI シ KATAKANA LETTER SI */
192 { 0x04bd, 0x30b9 }, /* kana_SU ス KATAKANA LETTER SU */
193 { 0x04be, 0x30bb }, /* kana_SE セ KATAKANA LETTER SE */
194 { 0x04bf, 0x30bd }, /* kana_SO ソ KATAKANA LETTER SO */
195 { 0x04c0, 0x30bf }, /* kana_TA タ KATAKANA LETTER TA */
196 { 0x04c1, 0x30c1 }, /* kana_CHI チ KATAKANA LETTER TI */
197 { 0x04c2, 0x30c4 }, /* kana_TSU ツ KATAKANA LETTER TU */
198 { 0x04c3, 0x30c6 }, /* kana_TE テ KATAKANA LETTER TE */
199 { 0x04c4, 0x30c8 }, /* kana_TO ト KATAKANA LETTER TO */
200 { 0x04c5, 0x30ca }, /* kana_NA ナ KATAKANA LETTER NA */
201 { 0x04c6, 0x30cb }, /* kana_NI ニ KATAKANA LETTER NI */
202 { 0x04c7, 0x30cc }, /* kana_NU ヌ KATAKANA LETTER NU */
203 { 0x04c8, 0x30cd }, /* kana_NE ネ KATAKANA LETTER NE */
204 { 0x04c9, 0x30ce }, /* kana_NO ノ KATAKANA LETTER NO */
205 { 0x04ca, 0x30cf }, /* kana_HA ハ KATAKANA LETTER HA */
206 { 0x04cb, 0x30d2 }, /* kana_HI ヒ KATAKANA LETTER HI */
207 { 0x04cc, 0x30d5 }, /* kana_FU フ KATAKANA LETTER HU */
208 { 0x04cd, 0x30d8 }, /* kana_HE ヘ KATAKANA LETTER HE */
209 { 0x04ce, 0x30db }, /* kana_HO ホ KATAKANA LETTER HO */
210 { 0x04cf, 0x30de }, /* kana_MA マ KATAKANA LETTER MA */
211 { 0x04d0, 0x30df }, /* kana_MI ミ KATAKANA LETTER MI */
212 { 0x04d1, 0x30e0 }, /* kana_MU ム KATAKANA LETTER MU */
213 { 0x04d2, 0x30e1 }, /* kana_ME メ KATAKANA LETTER ME */
214 { 0x04d3, 0x30e2 }, /* kana_MO モ KATAKANA LETTER MO */
215 { 0x04d4, 0x30e4 }, /* kana_YA ヤ KATAKANA LETTER YA */
216 { 0x04d5, 0x30e6 }, /* kana_YU ユ KATAKANA LETTER YU */
217 { 0x04d6, 0x30e8 }, /* kana_YO ヨ KATAKANA LETTER YO */
218 { 0x04d7, 0x30e9 }, /* kana_RA ラ KATAKANA LETTER RA */
219 { 0x04d8, 0x30ea }, /* kana_RI リ KATAKANA LETTER RI */
220 { 0x04d9, 0x30eb }, /* kana_RU ル KATAKANA LETTER RU */
221 { 0x04da, 0x30ec }, /* kana_RE レ KATAKANA LETTER RE */
222 { 0x04db, 0x30ed }, /* kana_RO ロ KATAKANA LETTER RO */
223 { 0x04dc, 0x30ef }, /* kana_WA ワ KATAKANA LETTER WA */
224 { 0x04dd, 0x30f3 }, /* kana_N ン KATAKANA LETTER N */
225 { 0x04de, 0x309b }, /* voicedsound ゛ KATAKANA-HIRAGANA VOICED SOUND MARK */
226 { 0x04df, 0x309c }, /* semivoicedsound ゜ KATAKANA-HIRAGANA SEMI-VOICED SOUND MARK */
227 { 0x05ac, 0x060c }, /* Arabic_comma ، ARABIC COMMA */
228 { 0x05bb, 0x061b }, /* Arabic_semicolon ؛ ARABIC SEMICOLON */
229 { 0x05bf, 0x061f }, /* Arabic_question_mark ؟ ARABIC QUESTION MARK */
230 { 0x05c1, 0x0621 }, /* Arabic_hamza ء ARABIC LETTER HAMZA */
231 { 0x05c2, 0x0622 }, /* Arabic_maddaonalef آ ARABIC LETTER ALEF WITH MADDA ABOVE */
232 { 0x05c3, 0x0623 }, /* Arabic_hamzaonalef أ ARABIC LETTER ALEF WITH HAMZA ABOVE */
233 { 0x05c4, 0x0624 }, /* Arabic_hamzaonwaw ؤ ARABIC LETTER WAW WITH HAMZA ABOVE */
234 { 0x05c5, 0x0625 }, /* Arabic_hamzaunderalef إ ARABIC LETTER ALEF WITH HAMZA BELOW */
235 { 0x05c6, 0x0626 }, /* Arabic_hamzaonyeh ئ ARABIC LETTER YEH WITH HAMZA ABOVE */
236 { 0x05c7, 0x0627 }, /* Arabic_alef ا ARABIC LETTER ALEF */
237 { 0x05c8, 0x0628 }, /* Arabic_beh ب ARABIC LETTER BEH */
238 { 0x05c9, 0x0629 }, /* Arabic_tehmarbuta ة ARABIC LETTER TEH MARBUTA */
239 { 0x05ca, 0x062a }, /* Arabic_teh ت ARABIC LETTER TEH */
240 { 0x05cb, 0x062b }, /* Arabic_theh ث ARABIC LETTER THEH */
241 { 0x05cc, 0x062c }, /* Arabic_jeem ج ARABIC LETTER JEEM */
242 { 0x05cd, 0x062d }, /* Arabic_hah ح ARABIC LETTER HAH */
243 { 0x05ce, 0x062e }, /* Arabic_khah خ ARABIC LETTER KHAH */
244 { 0x05cf, 0x062f }, /* Arabic_dal د ARABIC LETTER DAL */
245 { 0x05d0, 0x0630 }, /* Arabic_thal ذ ARABIC LETTER THAL */
246 { 0x05d1, 0x0631 }, /* Arabic_ra ر ARABIC LETTER REH */
247 { 0x05d2, 0x0632 }, /* Arabic_zain ز ARABIC LETTER ZAIN */
248 { 0x05d3, 0x0633 }, /* Arabic_seen س ARABIC LETTER SEEN */
249 { 0x05d4, 0x0634 }, /* Arabic_sheen ش ARABIC LETTER SHEEN */
250 { 0x05d5, 0x0635 }, /* Arabic_sad ص ARABIC LETTER SAD */
251 { 0x05d6, 0x0636 }, /* Arabic_dad ض ARABIC LETTER DAD */
252 { 0x05d7, 0x0637 }, /* Arabic_tah ط ARABIC LETTER TAH */
253 { 0x05d8, 0x0638 }, /* Arabic_zah ظ ARABIC LETTER ZAH */
254 { 0x05d9, 0x0639 }, /* Arabic_ain ع ARABIC LETTER AIN */
255 { 0x05da, 0x063a }, /* Arabic_ghain غ ARABIC LETTER GHAIN */
256 { 0x05e0, 0x0640 }, /* Arabic_tatweel ـ ARABIC TATWEEL */
257 { 0x05e1, 0x0641 }, /* Arabic_feh ف ARABIC LETTER FEH */
258 { 0x05e2, 0x0642 }, /* Arabic_qaf ق ARABIC LETTER QAF */
259 { 0x05e3, 0x0643 }, /* Arabic_kaf ك ARABIC LETTER KAF */
260 { 0x05e4, 0x0644 }, /* Arabic_lam ل ARABIC LETTER LAM */
261 { 0x05e5, 0x0645 }, /* Arabic_meem م ARABIC LETTER MEEM */
262 { 0x05e6, 0x0646 }, /* Arabic_noon ن ARABIC LETTER NOON */
263 { 0x05e7, 0x0647 }, /* Arabic_ha ه ARABIC LETTER HEH */
264 { 0x05e8, 0x0648 }, /* Arabic_waw و ARABIC LETTER WAW */
265 { 0x05e9, 0x0649 }, /* Arabic_alefmaksura ى ARABIC LETTER ALEF MAKSURA */
266 { 0x05ea, 0x064a }, /* Arabic_yeh ي ARABIC LETTER YEH */
267 { 0x05eb, 0x064b }, /* Arabic_fathatan ً ARABIC FATHATAN */
268 { 0x05ec, 0x064c }, /* Arabic_dammatan ٌ ARABIC DAMMATAN */
269 { 0x05ed, 0x064d }, /* Arabic_kasratan ٍ ARABIC KASRATAN */
270 { 0x05ee, 0x064e }, /* Arabic_fatha َ ARABIC FATHA */
271 { 0x05ef, 0x064f }, /* Arabic_damma ُ ARABIC DAMMA */
272 { 0x05f0, 0x0650 }, /* Arabic_kasra ِ ARABIC KASRA */
273 { 0x05f1, 0x0651 }, /* Arabic_shadda ّ ARABIC SHADDA */
274 { 0x05f2, 0x0652 }, /* Arabic_sukun ْ ARABIC SUKUN */
275 { 0x06a1, 0x0452 }, /* Serbian_dje ђ CYRILLIC SMALL LETTER DJE */
276 { 0x06a2, 0x0453 }, /* Macedonia_gje ѓ CYRILLIC SMALL LETTER GJE */
277 { 0x06a3, 0x0451 }, /* Cyrillic_io ё CYRILLIC SMALL LETTER IO */
278 { 0x06a4, 0x0454 }, /* Ukrainian_ie є CYRILLIC SMALL LETTER UKRAINIAN IE */
279 { 0x06a5, 0x0455 }, /* Macedonia_dse ѕ CYRILLIC SMALL LETTER DZE */
280 { 0x06a6, 0x0456 }, /* Ukrainian_i і CYRILLIC SMALL LETTER BYELORUSSIAN-UKRAINIAN I */
281 { 0x06a7, 0x0457 }, /* Ukrainian_yi ї CYRILLIC SMALL LETTER YI */
282 { 0x06a8, 0x0458 }, /* Cyrillic_je ј CYRILLIC SMALL LETTER JE */
283 { 0x06a9, 0x0459 }, /* Cyrillic_lje љ CYRILLIC SMALL LETTER LJE */
284 { 0x06aa, 0x045a }, /* Cyrillic_nje њ CYRILLIC SMALL LETTER NJE */
285 { 0x06ab, 0x045b }, /* Serbian_tshe ћ CYRILLIC SMALL LETTER TSHE */
286 { 0x06ac, 0x045c }, /* Macedonia_kje ќ CYRILLIC SMALL LETTER KJE */
287 { 0x06ad, 0x0491 }, /* Ukrainian_ghe_with_upturn ґ CYRILLIC SMALL LETTER GHE WITH UPTURN */
288 { 0x06ae, 0x045e }, /* Byelorussian_shortu ў CYRILLIC SMALL LETTER SHORT U */
289 { 0x06af, 0x045f }, /* Cyrillic_dzhe џ CYRILLIC SMALL LETTER DZHE */
290 { 0x06b0, 0x2116 }, /* numerosign № NUMERO SIGN */
291 { 0x06b1, 0x0402 }, /* Serbian_DJE Ђ CYRILLIC CAPITAL LETTER DJE */
292 { 0x06b2, 0x0403 }, /* Macedonia_GJE Ѓ CYRILLIC CAPITAL LETTER GJE */
293 { 0x06b3, 0x0401 }, /* Cyrillic_IO Ё CYRILLIC CAPITAL LETTER IO */
294 { 0x06b4, 0x0404 }, /* Ukrainian_IE Є CYRILLIC CAPITAL LETTER UKRAINIAN IE */
295 { 0x06b5, 0x0405 }, /* Macedonia_DSE Ѕ CYRILLIC CAPITAL LETTER DZE */
296 { 0x06b6, 0x0406 }, /* Ukrainian_I І CYRILLIC CAPITAL LETTER BYELORUSSIAN-UKRAINIAN I */
297 { 0x06b7, 0x0407 }, /* Ukrainian_YI Ї CYRILLIC CAPITAL LETTER YI */
298 { 0x06b8, 0x0408 }, /* Cyrillic_JE Ј CYRILLIC CAPITAL LETTER JE */
299 { 0x06b9, 0x0409 }, /* Cyrillic_LJE Љ CYRILLIC CAPITAL LETTER LJE */
300 { 0x06ba, 0x040a }, /* Cyrillic_NJE Њ CYRILLIC CAPITAL LETTER NJE */
301 { 0x06bb, 0x040b }, /* Serbian_TSHE Ћ CYRILLIC CAPITAL LETTER TSHE */
302 { 0x06bc, 0x040c }, /* Macedonia_KJE Ќ CYRILLIC CAPITAL LETTER KJE */
303 { 0x06bd, 0x0490 }, /* Ukrainian_GHE_WITH_UPTURN Ґ CYRILLIC CAPITAL LETTER GHE WITH UPTURN */
304 { 0x06be, 0x040e }, /* Byelorussian_SHORTU Ў CYRILLIC CAPITAL LETTER SHORT U */
305 { 0x06bf, 0x040f }, /* Cyrillic_DZHE Џ CYRILLIC CAPITAL LETTER DZHE */
306 { 0x06c0, 0x044e }, /* Cyrillic_yu ю CYRILLIC SMALL LETTER YU */
307 { 0x06c1, 0x0430 }, /* Cyrillic_a а CYRILLIC SMALL LETTER A */
308 { 0x06c2, 0x0431 }, /* Cyrillic_be б CYRILLIC SMALL LETTER BE */
309 { 0x06c3, 0x0446 }, /* Cyrillic_tse ц CYRILLIC SMALL LETTER TSE */
310 { 0x06c4, 0x0434 }, /* Cyrillic_de д CYRILLIC SMALL LETTER DE */
311 { 0x06c5, 0x0435 }, /* Cyrillic_ie е CYRILLIC SMALL LETTER IE */
312 { 0x06c6, 0x0444 }, /* Cyrillic_ef ф CYRILLIC SMALL LETTER EF */
313 { 0x06c7, 0x0433 }, /* Cyrillic_ghe г CYRILLIC SMALL LETTER GHE */
314 { 0x06c8, 0x0445 }, /* Cyrillic_ha х CYRILLIC SMALL LETTER HA */
315 { 0x06c9, 0x0438 }, /* Cyrillic_i и CYRILLIC SMALL LETTER I */
316 { 0x06ca, 0x0439 }, /* Cyrillic_shorti й CYRILLIC SMALL LETTER SHORT I */
317 { 0x06cb, 0x043a }, /* Cyrillic_ka к CYRILLIC SMALL LETTER KA */
318 { 0x06cc, 0x043b }, /* Cyrillic_el л CYRILLIC SMALL LETTER EL */
319 { 0x06cd, 0x043c }, /* Cyrillic_em м CYRILLIC SMALL LETTER EM */
320 { 0x06ce, 0x043d }, /* Cyrillic_en н CYRILLIC SMALL LETTER EN */
321 { 0x06cf, 0x043e }, /* Cyrillic_o о CYRILLIC SMALL LETTER O */
322 { 0x06d0, 0x043f }, /* Cyrillic_pe п CYRILLIC SMALL LETTER PE */
323 { 0x06d1, 0x044f }, /* Cyrillic_ya я CYRILLIC SMALL LETTER YA */
324 { 0x06d2, 0x0440 }, /* Cyrillic_er р CYRILLIC SMALL LETTER ER */
325 { 0x06d3, 0x0441 }, /* Cyrillic_es с CYRILLIC SMALL LETTER ES */
326 { 0x06d4, 0x0442 }, /* Cyrillic_te т CYRILLIC SMALL LETTER TE */
327 { 0x06d5, 0x0443 }, /* Cyrillic_u у CYRILLIC SMALL LETTER U */
328 { 0x06d6, 0x0436 }, /* Cyrillic_zhe ж CYRILLIC SMALL LETTER ZHE */
329 { 0x06d7, 0x0432 }, /* Cyrillic_ve в CYRILLIC SMALL LETTER VE */
330 { 0x06d8, 0x044c }, /* Cyrillic_softsign ь CYRILLIC SMALL LETTER SOFT SIGN */
331 { 0x06d9, 0x044b }, /* Cyrillic_yeru ы CYRILLIC SMALL LETTER YERU */
332 { 0x06da, 0x0437 }, /* Cyrillic_ze з CYRILLIC SMALL LETTER ZE */
333 { 0x06db, 0x0448 }, /* Cyrillic_sha ш CYRILLIC SMALL LETTER SHA */
334 { 0x06dc, 0x044d }, /* Cyrillic_e э CYRILLIC SMALL LETTER E */
335 { 0x06dd, 0x0449 }, /* Cyrillic_shcha щ CYRILLIC SMALL LETTER SHCHA */
336 { 0x06de, 0x0447 }, /* Cyrillic_che ч CYRILLIC SMALL LETTER CHE */
337 { 0x06df, 0x044a }, /* Cyrillic_hardsign ъ CYRILLIC SMALL LETTER HARD SIGN */
338 { 0x06e0, 0x042e }, /* Cyrillic_YU Ю CYRILLIC CAPITAL LETTER YU */
339 { 0x06e1, 0x0410 }, /* Cyrillic_A А CYRILLIC CAPITAL LETTER A */
340 { 0x06e2, 0x0411 }, /* Cyrillic_BE Б CYRILLIC CAPITAL LETTER BE */
341 { 0x06e3, 0x0426 }, /* Cyrillic_TSE Ц CYRILLIC CAPITAL LETTER TSE */
342 { 0x06e4, 0x0414 }, /* Cyrillic_DE Д CYRILLIC CAPITAL LETTER DE */
343 { 0x06e5, 0x0415 }, /* Cyrillic_IE Е CYRILLIC CAPITAL LETTER IE */
344 { 0x06e6, 0x0424 }, /* Cyrillic_EF Ф CYRILLIC CAPITAL LETTER EF */
345 { 0x06e7, 0x0413 }, /* Cyrillic_GHE Г CYRILLIC CAPITAL LETTER GHE */
346 { 0x06e8, 0x0425 }, /* Cyrillic_HA Х CYRILLIC CAPITAL LETTER HA */
347 { 0x06e9, 0x0418 }, /* Cyrillic_I И CYRILLIC CAPITAL LETTER I */
348 { 0x06ea, 0x0419 }, /* Cyrillic_SHORTI Й CYRILLIC CAPITAL LETTER SHORT I */
349 { 0x06eb, 0x041a }, /* Cyrillic_KA К CYRILLIC CAPITAL LETTER KA */
350 { 0x06ec, 0x041b }, /* Cyrillic_EL Л CYRILLIC CAPITAL LETTER EL */
351 { 0x06ed, 0x041c }, /* Cyrillic_EM М CYRILLIC CAPITAL LETTER EM */
352 { 0x06ee, 0x041d }, /* Cyrillic_EN Н CYRILLIC CAPITAL LETTER EN */
353 { 0x06ef, 0x041e }, /* Cyrillic_O О CYRILLIC CAPITAL LETTER O */
354 { 0x06f0, 0x041f }, /* Cyrillic_PE П CYRILLIC CAPITAL LETTER PE */
355 { 0x06f1, 0x042f }, /* Cyrillic_YA Я CYRILLIC CAPITAL LETTER YA */
356 { 0x06f2, 0x0420 }, /* Cyrillic_ER Р CYRILLIC CAPITAL LETTER ER */
357 { 0x06f3, 0x0421 }, /* Cyrillic_ES С CYRILLIC CAPITAL LETTER ES */
358 { 0x06f4, 0x0422 }, /* Cyrillic_TE Т CYRILLIC CAPITAL LETTER TE */
359 { 0x06f5, 0x0423 }, /* Cyrillic_U У CYRILLIC CAPITAL LETTER U */
360 { 0x06f6, 0x0416 }, /* Cyrillic_ZHE Ж CYRILLIC CAPITAL LETTER ZHE */
361 { 0x06f7, 0x0412 }, /* Cyrillic_VE В CYRILLIC CAPITAL LETTER VE */
362 { 0x06f8, 0x042c }, /* Cyrillic_SOFTSIGN Ь CYRILLIC CAPITAL LETTER SOFT SIGN */
363 { 0x06f9, 0x042b }, /* Cyrillic_YERU Ы CYRILLIC CAPITAL LETTER YERU */
364 { 0x06fa, 0x0417 }, /* Cyrillic_ZE З CYRILLIC CAPITAL LETTER ZE */
365 { 0x06fb, 0x0428 }, /* Cyrillic_SHA Ш CYRILLIC CAPITAL LETTER SHA */
366 { 0x06fc, 0x042d }, /* Cyrillic_E Э CYRILLIC CAPITAL LETTER E */
367 { 0x06fd, 0x0429 }, /* Cyrillic_SHCHA Щ CYRILLIC CAPITAL LETTER SHCHA */
368 { 0x06fe, 0x0427 }, /* Cyrillic_CHE Ч CYRILLIC CAPITAL LETTER CHE */
369 { 0x06ff, 0x042a }, /* Cyrillic_HARDSIGN Ъ CYRILLIC CAPITAL LETTER HARD SIGN */
370 { 0x07a1, 0x0386 }, /* Greek_ALPHAaccent Ά GREEK CAPITAL LETTER ALPHA WITH TONOS */
371 { 0x07a2, 0x0388 }, /* Greek_EPSILONaccent Έ GREEK CAPITAL LETTER EPSILON WITH TONOS */
372 { 0x07a3, 0x0389 }, /* Greek_ETAaccent Ή GREEK CAPITAL LETTER ETA WITH TONOS */
373 { 0x07a4, 0x038a }, /* Greek_IOTAaccent Ί GREEK CAPITAL LETTER IOTA WITH TONOS */
374 { 0x07a5, 0x03aa }, /* Greek_IOTAdiaeresis Ϊ GREEK CAPITAL LETTER IOTA WITH DIALYTIKA */
375 { 0x07a7, 0x038c }, /* Greek_OMICRONaccent Ό GREEK CAPITAL LETTER OMICRON WITH TONOS */
376 { 0x07a8, 0x038e }, /* Greek_UPSILONaccent Ύ GREEK CAPITAL LETTER UPSILON WITH TONOS */
377 { 0x07a9, 0x03ab }, /* Greek_UPSILONdieresis Ϋ GREEK CAPITAL LETTER UPSILON WITH DIALYTIKA */
378 { 0x07ab, 0x038f }, /* Greek_OMEGAaccent Ώ GREEK CAPITAL LETTER OMEGA WITH TONOS */
379 { 0x07ae, 0x0385 }, /* Greek_accentdieresis ΅ GREEK DIALYTIKA TONOS */
380 { 0x07af, 0x2015 }, /* Greek_horizbar ― HORIZONTAL BAR */
381 { 0x07b1, 0x03ac }, /* Greek_alphaaccent ά GREEK SMALL LETTER ALPHA WITH TONOS */
382 { 0x07b2, 0x03ad }, /* Greek_epsilonaccent έ GREEK SMALL LETTER EPSILON WITH TONOS */
383 { 0x07b3, 0x03ae }, /* Greek_etaaccent ή GREEK SMALL LETTER ETA WITH TONOS */
384 { 0x07b4, 0x03af }, /* Greek_iotaaccent ί GREEK SMALL LETTER IOTA WITH TONOS */
385 { 0x07b5, 0x03ca }, /* Greek_iotadieresis ϊ GREEK SMALL LETTER IOTA WITH DIALYTIKA */
386 { 0x07b6, 0x0390 }, /* Greek_iotaaccentdieresis ΐ GREEK SMALL LETTER IOTA WITH DIALYTIKA AND TONOS */
387 { 0x07b7, 0x03cc }, /* Greek_omicronaccent ό GREEK SMALL LETTER OMICRON WITH TONOS */
388 { 0x07b8, 0x03cd }, /* Greek_upsilonaccent ύ GREEK SMALL LETTER UPSILON WITH TONOS */
389 { 0x07b9, 0x03cb }, /* Greek_upsilondieresis ϋ GREEK SMALL LETTER UPSILON WITH DIALYTIKA */
390 { 0x07ba, 0x03b0 }, /* Greek_upsilonaccentdieresis ΰ GREEK SMALL LETTER UPSILON WITH DIALYTIKA AND TONOS */
391 { 0x07bb, 0x03ce }, /* Greek_omegaaccent ώ GREEK SMALL LETTER OMEGA WITH TONOS */
392 { 0x07c1, 0x0391 }, /* Greek_ALPHA Α GREEK CAPITAL LETTER ALPHA */
393 { 0x07c2, 0x0392 }, /* Greek_BETA Β GREEK CAPITAL LETTER BETA */
394 { 0x07c3, 0x0393 }, /* Greek_GAMMA Γ GREEK CAPITAL LETTER GAMMA */
395 { 0x07c4, 0x0394 }, /* Greek_DELTA Δ GREEK CAPITAL LETTER DELTA */
396 { 0x07c5, 0x0395 }, /* Greek_EPSILON Ε GREEK CAPITAL LETTER EPSILON */
397 { 0x07c6, 0x0396 }, /* Greek_ZETA Ζ GREEK CAPITAL LETTER ZETA */
398 { 0x07c7, 0x0397 }, /* Greek_ETA Η GREEK CAPITAL LETTER ETA */
399 { 0x07c8, 0x0398 }, /* Greek_THETA Θ GREEK CAPITAL LETTER THETA */
400 { 0x07c9, 0x0399 }, /* Greek_IOTA Ι GREEK CAPITAL LETTER IOTA */
401 { 0x07ca, 0x039a }, /* Greek_KAPPA Κ GREEK CAPITAL LETTER KAPPA */
402 { 0x07cb, 0x039b }, /* Greek_LAMBDA Λ GREEK CAPITAL LETTER LAMDA */
403 { 0x07cc, 0x039c }, /* Greek_MU Μ GREEK CAPITAL LETTER MU */
404 { 0x07cd, 0x039d }, /* Greek_NU Ν GREEK CAPITAL LETTER NU */
405 { 0x07ce, 0x039e }, /* Greek_XI Ξ GREEK CAPITAL LETTER XI */
406 { 0x07cf, 0x039f }, /* Greek_OMICRON Ο GREEK CAPITAL LETTER OMICRON */
407 { 0x07d0, 0x03a0 }, /* Greek_PI Π GREEK CAPITAL LETTER PI */
408 { 0x07d1, 0x03a1 }, /* Greek_RHO Ρ GREEK CAPITAL LETTER RHO */
409 { 0x07d2, 0x03a3 }, /* Greek_SIGMA Σ GREEK CAPITAL LETTER SIGMA */
410 { 0x07d4, 0x03a4 }, /* Greek_TAU Τ GREEK CAPITAL LETTER TAU */
411 { 0x07d5, 0x03a5 }, /* Greek_UPSILON Υ GREEK CAPITAL LETTER UPSILON */
412 { 0x07d6, 0x03a6 }, /* Greek_PHI Φ GREEK CAPITAL LETTER PHI */
413 { 0x07d7, 0x03a7 }, /* Greek_CHI Χ GREEK CAPITAL LETTER CHI */
414 { 0x07d8, 0x03a8 }, /* Greek_PSI Ψ GREEK CAPITAL LETTER PSI */
415 { 0x07d9, 0x03a9 }, /* Greek_OMEGA Ω GREEK CAPITAL LETTER OMEGA */
416 { 0x07e1, 0x03b1 }, /* Greek_alpha α GREEK SMALL LETTER ALPHA */
417 { 0x07e2, 0x03b2 }, /* Greek_beta β GREEK SMALL LETTER BETA */
418 { 0x07e3, 0x03b3 }, /* Greek_gamma γ GREEK SMALL LETTER GAMMA */
419 { 0x07e4, 0x03b4 }, /* Greek_delta δ GREEK SMALL LETTER DELTA */
420 { 0x07e5, 0x03b5 }, /* Greek_epsilon ε GREEK SMALL LETTER EPSILON */
421 { 0x07e6, 0x03b6 }, /* Greek_zeta ζ GREEK SMALL LETTER ZETA */
422 { 0x07e7, 0x03b7 }, /* Greek_eta η GREEK SMALL LETTER ETA */
423 { 0x07e8, 0x03b8 }, /* Greek_theta θ GREEK SMALL LETTER THETA */
424 { 0x07e9, 0x03b9 }, /* Greek_iota ι GREEK SMALL LETTER IOTA */
425 { 0x07ea, 0x03ba }, /* Greek_kappa κ GREEK SMALL LETTER KAPPA */
426 { 0x07eb, 0x03bb }, /* Greek_lambda λ GREEK SMALL LETTER LAMDA */
427 { 0x07ec, 0x03bc }, /* Greek_mu μ GREEK SMALL LETTER MU */
428 { 0x07ed, 0x03bd }, /* Greek_nu ν GREEK SMALL LETTER NU */
429 { 0x07ee, 0x03be }, /* Greek_xi ξ GREEK SMALL LETTER XI */
430 { 0x07ef, 0x03bf }, /* Greek_omicron ο GREEK SMALL LETTER OMICRON */
431 { 0x07f0, 0x03c0 }, /* Greek_pi π GREEK SMALL LETTER PI */
432 { 0x07f1, 0x03c1 }, /* Greek_rho ρ GREEK SMALL LETTER RHO */
433 { 0x07f2, 0x03c3 }, /* Greek_sigma σ GREEK SMALL LETTER SIGMA */
434 { 0x07f3, 0x03c2 }, /* Greek_finalsmallsigma ς GREEK SMALL LETTER FINAL SIGMA */
435 { 0x07f4, 0x03c4 }, /* Greek_tau τ GREEK SMALL LETTER TAU */
436 { 0x07f5, 0x03c5 }, /* Greek_upsilon υ GREEK SMALL LETTER UPSILON */
437 { 0x07f6, 0x03c6 }, /* Greek_phi φ GREEK SMALL LETTER PHI */
438 { 0x07f7, 0x03c7 }, /* Greek_chi χ GREEK SMALL LETTER CHI */
439 { 0x07f8, 0x03c8 }, /* Greek_psi ψ GREEK SMALL LETTER PSI */
440 { 0x07f9, 0x03c9 }, /* Greek_omega ω GREEK SMALL LETTER OMEGA */
441 { 0x08a1, 0x23b7 }, /* leftradical ⎷ ??? */
442 { 0x08a2, 0x250c }, /* topleftradical ┌ BOX DRAWINGS LIGHT DOWN AND RIGHT */
443 { 0x08a3, 0x2500 }, /* horizconnector ─ BOX DRAWINGS LIGHT HORIZONTAL */
444 { 0x08a4, 0x2320 }, /* topintegral ⌠ TOP HALF INTEGRAL */
445 { 0x08a5, 0x2321 }, /* botintegral ⌡ BOTTOM HALF INTEGRAL */
446 { 0x08a6, 0x2502 }, /* vertconnector │ BOX DRAWINGS LIGHT VERTICAL */
447 { 0x08a7, 0x23a1 }, /* topleftsqbracket ⎡ ??? */
448 { 0x08a8, 0x23a3 }, /* botleftsqbracket ⎣ ??? */
449 { 0x08a9, 0x23a4 }, /* toprightsqbracket ⎤ ??? */
450 { 0x08aa, 0x23a6 }, /* botrightsqbracket ⎦ ??? */
451 { 0x08ab, 0x239b }, /* topleftparens ⎛ ??? */
452 { 0x08ac, 0x239d }, /* botleftparens ⎝ ??? */
453 { 0x08ad, 0x239e }, /* toprightparens ⎞ ??? */
454 { 0x08ae, 0x23a0 }, /* botrightparens ⎠ ??? */
455 { 0x08af, 0x23a8 }, /* leftmiddlecurlybrace ⎨ ??? */
456 { 0x08b0, 0x23ac }, /* rightmiddlecurlybrace ⎬ ??? */
457 /* 0x08b1 topleftsummation ? ??? */
458 /* 0x08b2 botleftsummation ? ??? */
459 /* 0x08b3 topvertsummationconnector ? ??? */
460 /* 0x08b4 botvertsummationconnector ? ??? */
461 /* 0x08b5 toprightsummation ? ??? */
462 /* 0x08b6 botrightsummation ? ??? */
463 /* 0x08b7 rightmiddlesummation ? ??? */
464 { 0x08bc, 0x2264 }, /* lessthanequal ≤ LESS-THAN OR EQUAL TO */
465 { 0x08bd, 0x2260 }, /* notequal ≠ NOT EQUAL TO */
466 { 0x08be, 0x2265 }, /* greaterthanequal ≥ GREATER-THAN OR EQUAL TO */
467 { 0x08bf, 0x222b }, /* integral ∫ INTEGRAL */
468 { 0x08c0, 0x2234 }, /* therefore ∴ THEREFORE */
469 { 0x08c1, 0x221d }, /* variation ∝ PROPORTIONAL TO */
470 { 0x08c2, 0x221e }, /* infinity ∞ INFINITY */
471 { 0x08c5, 0x2207 }, /* nabla ∇ NABLA */
472 { 0x08c8, 0x223c }, /* approximate ∼ TILDE OPERATOR */
473 { 0x08c9, 0x2243 }, /* similarequal ≃ ASYMPTOTICALLY EQUAL TO */
474 { 0x08cd, 0x21d4 }, /* ifonlyif ⇔ LEFT RIGHT DOUBLE ARROW */
475 { 0x08ce, 0x21d2 }, /* implies ⇒ RIGHTWARDS DOUBLE ARROW */
476 { 0x08cf, 0x2261 }, /* identical ≡ IDENTICAL TO */
477 { 0x08d6, 0x221a }, /* radical √ SQUARE ROOT */
478 { 0x08da, 0x2282 }, /* includedin ⊂ SUBSET OF */
479 { 0x08db, 0x2283 }, /* includes ⊃ SUPERSET OF */
480 { 0x08dc, 0x2229 }, /* intersection ∩ INTERSECTION */
481 { 0x08dd, 0x222a }, /* union ∪ UNION */
482 { 0x08de, 0x2227 }, /* logicaland ∧ LOGICAL AND */
483 { 0x08df, 0x2228 }, /* logicalor ∨ LOGICAL OR */
484 { 0x08ef, 0x2202 }, /* partialderivative ∂ PARTIAL DIFFERENTIAL */
485 { 0x08f6, 0x0192 }, /* function ƒ LATIN SMALL LETTER F WITH HOOK */
486 { 0x08fb, 0x2190 }, /* leftarrow ← LEFTWARDS ARROW */
487 { 0x08fc, 0x2191 }, /* uparrow ↑ UPWARDS ARROW */
488 { 0x08fd, 0x2192 }, /* rightarrow → RIGHTWARDS ARROW */
489 { 0x08fe, 0x2193 }, /* downarrow ↓ DOWNWARDS ARROW */
490 /* 0x09df blank ? ??? */
491 { 0x09e0, 0x25c6 }, /* soliddiamond ◆ BLACK DIAMOND */
492 { 0x09e1, 0x2592 }, /* checkerboard ▒ MEDIUM SHADE */
493 { 0x09e2, 0x2409 }, /* ht ␉ SYMBOL FOR HORIZONTAL TABULATION */
494 { 0x09e3, 0x240c }, /* ff ␌ SYMBOL FOR FORM FEED */
495 { 0x09e4, 0x240d }, /* cr ␍ SYMBOL FOR CARRIAGE RETURN */
496 { 0x09e5, 0x240a }, /* lf ␊ SYMBOL FOR LINE FEED */
497 { 0x09e8, 0x2424 }, /* nl  SYMBOL FOR NEWLINE */
498 { 0x09e9, 0x240b }, /* vt ␋ SYMBOL FOR VERTICAL TABULATION */
499 { 0x09ea, 0x2518 }, /* lowrightcorner ┘ BOX DRAWINGS LIGHT UP AND LEFT */
500 { 0x09eb, 0x2510 }, /* uprightcorner ┐ BOX DRAWINGS LIGHT DOWN AND LEFT */
501 { 0x09ec, 0x250c }, /* upleftcorner ┌ BOX DRAWINGS LIGHT DOWN AND RIGHT */
502 { 0x09ed, 0x2514 }, /* lowleftcorner └ BOX DRAWINGS LIGHT UP AND RIGHT */
503 { 0x09ee, 0x253c }, /* crossinglines ┼ BOX DRAWINGS LIGHT VERTICAL AND HORIZONTAL */
504 { 0x09ef, 0x23ba }, /* horizlinescan1 ⎺ HORIZONTAL SCAN LINE-1 (Unicode 3.2 draft) */
505 { 0x09f0, 0x23bb }, /* horizlinescan3 ⎻ HORIZONTAL SCAN LINE-3 (Unicode 3.2 draft) */
506 { 0x09f1, 0x2500 }, /* horizlinescan5 ─ BOX DRAWINGS LIGHT HORIZONTAL */
507 { 0x09f2, 0x23bc }, /* horizlinescan7 ⎼ HORIZONTAL SCAN LINE-7 (Unicode 3.2 draft) */
508 { 0x09f3, 0x23bd }, /* horizlinescan9 ⎽ HORIZONTAL SCAN LINE-9 (Unicode 3.2 draft) */
509 { 0x09f4, 0x251c }, /* leftt ├ BOX DRAWINGS LIGHT VERTICAL AND RIGHT */
510 { 0x09f5, 0x2524 }, /* rightt ┤ BOX DRAWINGS LIGHT VERTICAL AND LEFT */
511 { 0x09f6, 0x2534 }, /* bott ┴ BOX DRAWINGS LIGHT UP AND HORIZONTAL */
512 { 0x09f7, 0x252c }, /* topt ┬ BOX DRAWINGS LIGHT DOWN AND HORIZONTAL */
513 { 0x09f8, 0x2502 }, /* vertbar │ BOX DRAWINGS LIGHT VERTICAL */
514 { 0x0aa1, 0x2003 }, /* emspace EM SPACE */
515 { 0x0aa2, 0x2002 }, /* enspace EN SPACE */
516 { 0x0aa3, 0x2004 }, /* em3space THREE-PER-EM SPACE */
517 { 0x0aa4, 0x2005 }, /* em4space FOUR-PER-EM SPACE */
518 { 0x0aa5, 0x2007 }, /* digitspace FIGURE SPACE */
519 { 0x0aa6, 0x2008 }, /* punctspace PUNCTUATION SPACE */
520 { 0x0aa7, 0x2009 }, /* thinspace THIN SPACE */
521 { 0x0aa8, 0x200a }, /* hairspace HAIR SPACE */
522 { 0x0aa9, 0x2014 }, /* emdash — EM DASH */
523 { 0x0aaa, 0x2013 }, /* endash – EN DASH */
524 /* 0x0aac signifblank ? ??? */
525 { 0x0aae, 0x2026 }, /* ellipsis … HORIZONTAL ELLIPSIS */
526 { 0x0aaf, 0x2025 }, /* doubbaselinedot ‥ TWO DOT LEADER */
527 { 0x0ab0, 0x2153 }, /* onethird ⅓ VULGAR FRACTION ONE THIRD */
528 { 0x0ab1, 0x2154 }, /* twothirds ⅔ VULGAR FRACTION TWO THIRDS */
529 { 0x0ab2, 0x2155 }, /* onefifth ⅕ VULGAR FRACTION ONE FIFTH */
530 { 0x0ab3, 0x2156 }, /* twofifths ⅖ VULGAR FRACTION TWO FIFTHS */
531 { 0x0ab4, 0x2157 }, /* threefifths ⅗ VULGAR FRACTION THREE FIFTHS */
532 { 0x0ab5, 0x2158 }, /* fourfifths ⅘ VULGAR FRACTION FOUR FIFTHS */
533 { 0x0ab6, 0x2159 }, /* onesixth ⅙ VULGAR FRACTION ONE SIXTH */
534 { 0x0ab7, 0x215a }, /* fivesixths ⅚ VULGAR FRACTION FIVE SIXTHS */
535 { 0x0ab8, 0x2105 }, /* careof ℅ CARE OF */
536 { 0x0abb, 0x2012 }, /* figdash ‒ FIGURE DASH */
537 { 0x0abc, 0x2329 }, /* leftanglebracket 〈 LEFT-POINTING ANGLE BRACKET */
538 { 0x0abd, 0x002e }, /* decimalpoint . FULL STOP */
539 { 0x0abe, 0x232a }, /* rightanglebracket 〉 RIGHT-POINTING ANGLE BRACKET */
540 /* 0x0abf marker ? ??? */
541 { 0x0ac3, 0x215b }, /* oneeighth ⅛ VULGAR FRACTION ONE EIGHTH */
542 { 0x0ac4, 0x215c }, /* threeeighths ⅜ VULGAR FRACTION THREE EIGHTHS */
543 { 0x0ac5, 0x215d }, /* fiveeighths ⅝ VULGAR FRACTION FIVE EIGHTHS */
544 { 0x0ac6, 0x215e }, /* seveneighths ⅞ VULGAR FRACTION SEVEN EIGHTHS */
545 { 0x0ac9, 0x2122 }, /* trademark ™ TRADE MARK SIGN */
546 { 0x0aca, 0x2613 }, /* signaturemark ☓ SALTIRE */
547 /* 0x0acb trademarkincircle ? ??? */
548 { 0x0acc, 0x25c1 }, /* leftopentriangle ◁ WHITE LEFT-POINTING TRIANGLE */
549 { 0x0acd, 0x25b7 }, /* rightopentriangle ▷ WHITE RIGHT-POINTING TRIANGLE */
550 { 0x0ace, 0x25cb }, /* emopencircle ○ WHITE CIRCLE */
551 { 0x0acf, 0x25af }, /* emopenrectangle ▯ WHITE VERTICAL RECTANGLE */
552 { 0x0ad0, 0x2018 }, /* leftsinglequotemark ‘ LEFT SINGLE QUOTATION MARK */
553 { 0x0ad1, 0x2019 }, /* rightsinglequotemark ’ RIGHT SINGLE QUOTATION MARK */
554 { 0x0ad2, 0x201c }, /* leftdoublequotemark “ LEFT DOUBLE QUOTATION MARK */
555 { 0x0ad3, 0x201d }, /* rightdoublequotemark ” RIGHT DOUBLE QUOTATION MARK */
556 { 0x0ad4, 0x211e }, /* prescription ℞ PRESCRIPTION TAKE */
557 { 0x0ad6, 0x2032 }, /* minutes ′ PRIME */
558 { 0x0ad7, 0x2033 }, /* seconds ″ DOUBLE PRIME */
559 { 0x0ad9, 0x271d }, /* latincross ✝ LATIN CROSS */
560 /* 0x0ada hexagram ? ??? */
561 { 0x0adb, 0x25ac }, /* filledrectbullet ▬ BLACK RECTANGLE */
562 { 0x0adc, 0x25c0 }, /* filledlefttribullet ◀ BLACK LEFT-POINTING TRIANGLE */
563 { 0x0add, 0x25b6 }, /* filledrighttribullet ▶ BLACK RIGHT-POINTING TRIANGLE */
564 { 0x0ade, 0x25cf }, /* emfilledcircle ● BLACK CIRCLE */
565 { 0x0adf, 0x25ae }, /* emfilledrect ▮ BLACK VERTICAL RECTANGLE */
566 { 0x0ae0, 0x25e6 }, /* enopencircbullet ◦ WHITE BULLET */
567 { 0x0ae1, 0x25ab }, /* enopensquarebullet ▫ WHITE SMALL SQUARE */
568 { 0x0ae2, 0x25ad }, /* openrectbullet ▭ WHITE RECTANGLE */
569 { 0x0ae3, 0x25b3 }, /* opentribulletup △ WHITE UP-POINTING TRIANGLE */
570 { 0x0ae4, 0x25bd }, /* opentribulletdown ▽ WHITE DOWN-POINTING TRIANGLE */
571 { 0x0ae5, 0x2606 }, /* openstar ☆ WHITE STAR */
572 { 0x0ae6, 0x2022 }, /* enfilledcircbullet • BULLET */
573 { 0x0ae7, 0x25aa }, /* enfilledsqbullet ▪ BLACK SMALL SQUARE */
574 { 0x0ae8, 0x25b2 }, /* filledtribulletup ▲ BLACK UP-POINTING TRIANGLE */
575 { 0x0ae9, 0x25bc }, /* filledtribulletdown ▼ BLACK DOWN-POINTING TRIANGLE */
576 { 0x0aea, 0x261c }, /* leftpointer ☜ WHITE LEFT POINTING INDEX */
577 { 0x0aeb, 0x261e }, /* rightpointer ☞ WHITE RIGHT POINTING INDEX */
578 { 0x0aec, 0x2663 }, /* club ♣ BLACK CLUB SUIT */
579 { 0x0aed, 0x2666 }, /* diamond ♦ BLACK DIAMOND SUIT */
580 { 0x0aee, 0x2665 }, /* heart ♥ BLACK HEART SUIT */
581 { 0x0af0, 0x2720 }, /* maltesecross ✠ MALTESE CROSS */
582 { 0x0af1, 0x2020 }, /* dagger † DAGGER */
583 { 0x0af2, 0x2021 }, /* doubledagger ‡ DOUBLE DAGGER */
584 { 0x0af3, 0x2713 }, /* checkmark ✓ CHECK MARK */
585 { 0x0af4, 0x2717 }, /* ballotcross ✗ BALLOT X */
586 { 0x0af5, 0x266f }, /* musicalsharp ♯ MUSIC SHARP SIGN */
587 { 0x0af6, 0x266d }, /* musicalflat ♭ MUSIC FLAT SIGN */
588 { 0x0af7, 0x2642 }, /* malesymbol ♂ MALE SIGN */
589 { 0x0af8, 0x2640 }, /* femalesymbol ♀ FEMALE SIGN */
590 { 0x0af9, 0x260e }, /* telephone ☎ BLACK TELEPHONE */
591 { 0x0afa, 0x2315 }, /* telephonerecorder ⌕ TELEPHONE RECORDER */
592 { 0x0afb, 0x2117 }, /* phonographcopyright ℗ SOUND RECORDING COPYRIGHT */
593 { 0x0afc, 0x2038 }, /* caret ‸ CARET */
594 { 0x0afd, 0x201a }, /* singlelowquotemark ‚ SINGLE LOW-9 QUOTATION MARK */
595 { 0x0afe, 0x201e }, /* doublelowquotemark „ DOUBLE LOW-9 QUOTATION MARK */
596 /* 0x0aff cursor ? ??? */
597 { 0x0ba3, 0x003c }, /* leftcaret < LESS-THAN SIGN */
598 { 0x0ba6, 0x003e }, /* rightcaret > GREATER-THAN SIGN */
599 { 0x0ba8, 0x2228 }, /* downcaret ∨ LOGICAL OR */
600 { 0x0ba9, 0x2227 }, /* upcaret ∧ LOGICAL AND */
601 { 0x0bc0, 0x00af }, /* overbar ¯ MACRON */
602 { 0x0bc2, 0x22a4 }, /* downtack ⊤ DOWN TACK */
603 { 0x0bc3, 0x2229 }, /* upshoe ∩ INTERSECTION */
604 { 0x0bc4, 0x230a }, /* downstile ⌊ LEFT FLOOR */
605 { 0x0bc6, 0x005f }, /* underbar _ LOW LINE */
606 { 0x0bca, 0x2218 }, /* jot ∘ RING OPERATOR */
607 { 0x0bcc, 0x2395 }, /* quad ⎕ APL FUNCTIONAL SYMBOL QUAD (Unicode 3.0) */
608 { 0x0bce, 0x22a5 }, /* uptack ⊥ UP TACK */
609 { 0x0bcf, 0x25cb }, /* circle ○ WHITE CIRCLE */
610 { 0x0bd3, 0x2308 }, /* upstile ⌈ LEFT CEILING */
611 { 0x0bd6, 0x222a }, /* downshoe ∪ UNION */
612 { 0x0bd8, 0x2283 }, /* rightshoe ⊃ SUPERSET OF */
613 { 0x0bda, 0x2282 }, /* leftshoe ⊂ SUBSET OF */
614 { 0x0bdc, 0x22a2 }, /* lefttack ⊢ RIGHT TACK */
615 { 0x0bfc, 0x22a3 }, /* righttack ⊣ LEFT TACK */
616 { 0x0cdf, 0x2017 }, /* hebrew_doublelowline ‗ DOUBLE LOW LINE */
617 { 0x0ce0, 0x05d0 }, /* hebrew_aleph א HEBREW LETTER ALEF */
618 { 0x0ce1, 0x05d1 }, /* hebrew_bet ב HEBREW LETTER BET */
619 { 0x0ce2, 0x05d2 }, /* hebrew_gimel ג HEBREW LETTER GIMEL */
620 { 0x0ce3, 0x05d3 }, /* hebrew_dalet ד HEBREW LETTER DALET */
621 { 0x0ce4, 0x05d4 }, /* hebrew_he ה HEBREW LETTER HE */
622 { 0x0ce5, 0x05d5 }, /* hebrew_waw ו HEBREW LETTER VAV */
623 { 0x0ce6, 0x05d6 }, /* hebrew_zain ז HEBREW LETTER ZAYIN */
624 { 0x0ce7, 0x05d7 }, /* hebrew_chet ח HEBREW LETTER HET */
625 { 0x0ce8, 0x05d8 }, /* hebrew_tet ט HEBREW LETTER TET */
626 { 0x0ce9, 0x05d9 }, /* hebrew_yod י HEBREW LETTER YOD */
627 { 0x0cea, 0x05da }, /* hebrew_finalkaph ך HEBREW LETTER FINAL KAF */
628 { 0x0ceb, 0x05db }, /* hebrew_kaph כ HEBREW LETTER KAF */
629 { 0x0cec, 0x05dc }, /* hebrew_lamed ל HEBREW LETTER LAMED */
630 { 0x0ced, 0x05dd }, /* hebrew_finalmem ם HEBREW LETTER FINAL MEM */
631 { 0x0cee, 0x05de }, /* hebrew_mem מ HEBREW LETTER MEM */
632 { 0x0cef, 0x05df }, /* hebrew_finalnun ן HEBREW LETTER FINAL NUN */
633 { 0x0cf0, 0x05e0 }, /* hebrew_nun נ HEBREW LETTER NUN */
634 { 0x0cf1, 0x05e1 }, /* hebrew_samech ס HEBREW LETTER SAMEKH */
635 { 0x0cf2, 0x05e2 }, /* hebrew_ayin ע HEBREW LETTER AYIN */
636 { 0x0cf3, 0x05e3 }, /* hebrew_finalpe ף HEBREW LETTER FINAL PE */
637 { 0x0cf4, 0x05e4 }, /* hebrew_pe פ HEBREW LETTER PE */
638 { 0x0cf5, 0x05e5 }, /* hebrew_finalzade ץ HEBREW LETTER FINAL TSADI */
639 { 0x0cf6, 0x05e6 }, /* hebrew_zade צ HEBREW LETTER TSADI */
640 { 0x0cf7, 0x05e7 }, /* hebrew_qoph ק HEBREW LETTER QOF */
641 { 0x0cf8, 0x05e8 }, /* hebrew_resh ר HEBREW LETTER RESH */
642 { 0x0cf9, 0x05e9 }, /* hebrew_shin ש HEBREW LETTER SHIN */
643 { 0x0cfa, 0x05ea }, /* hebrew_taw ת HEBREW LETTER TAV */
644 { 0x0da1, 0x0e01 }, /* Thai_kokai ก THAI CHARACTER KO KAI */
645 { 0x0da2, 0x0e02 }, /* Thai_khokhai ข THAI CHARACTER KHO KHAI */
646 { 0x0da3, 0x0e03 }, /* Thai_khokhuat ฃ THAI CHARACTER KHO KHUAT */
647 { 0x0da4, 0x0e04 }, /* Thai_khokhwai ค THAI CHARACTER KHO KHWAI */
648 { 0x0da5, 0x0e05 }, /* Thai_khokhon ฅ THAI CHARACTER KHO KHON */
649 { 0x0da6, 0x0e06 }, /* Thai_khorakhang ฆ THAI CHARACTER KHO RAKHANG */
650 { 0x0da7, 0x0e07 }, /* Thai_ngongu ง THAI CHARACTER NGO NGU */
651 { 0x0da8, 0x0e08 }, /* Thai_chochan จ THAI CHARACTER CHO CHAN */
652 { 0x0da9, 0x0e09 }, /* Thai_choching ฉ THAI CHARACTER CHO CHING */
653 { 0x0daa, 0x0e0a }, /* Thai_chochang ช THAI CHARACTER CHO CHANG */
654 { 0x0dab, 0x0e0b }, /* Thai_soso ซ THAI CHARACTER SO SO */
655 { 0x0dac, 0x0e0c }, /* Thai_chochoe ฌ THAI CHARACTER CHO CHOE */
656 { 0x0dad, 0x0e0d }, /* Thai_yoying ญ THAI CHARACTER YO YING */
657 { 0x0dae, 0x0e0e }, /* Thai_dochada ฎ THAI CHARACTER DO CHADA */
658 { 0x0daf, 0x0e0f }, /* Thai_topatak ฏ THAI CHARACTER TO PATAK */
659 { 0x0db0, 0x0e10 }, /* Thai_thothan ฐ THAI CHARACTER THO THAN */
660 { 0x0db1, 0x0e11 }, /* Thai_thonangmontho ฑ THAI CHARACTER THO NANGMONTHO */
661 { 0x0db2, 0x0e12 }, /* Thai_thophuthao ฒ THAI CHARACTER THO PHUTHAO */
662 { 0x0db3, 0x0e13 }, /* Thai_nonen ณ THAI CHARACTER NO NEN */
663 { 0x0db4, 0x0e14 }, /* Thai_dodek ด THAI CHARACTER DO DEK */
664 { 0x0db5, 0x0e15 }, /* Thai_totao ต THAI CHARACTER TO TAO */
665 { 0x0db6, 0x0e16 }, /* Thai_thothung ถ THAI CHARACTER THO THUNG */
666 { 0x0db7, 0x0e17 }, /* Thai_thothahan ท THAI CHARACTER THO THAHAN */
667 { 0x0db8, 0x0e18 }, /* Thai_thothong ธ THAI CHARACTER THO THONG */
668 { 0x0db9, 0x0e19 }, /* Thai_nonu น THAI CHARACTER NO NU */
669 { 0x0dba, 0x0e1a }, /* Thai_bobaimai บ THAI CHARACTER BO BAIMAI */
670 { 0x0dbb, 0x0e1b }, /* Thai_popla ป THAI CHARACTER PO PLA */
671 { 0x0dbc, 0x0e1c }, /* Thai_phophung ผ THAI CHARACTER PHO PHUNG */
672 { 0x0dbd, 0x0e1d }, /* Thai_fofa ฝ THAI CHARACTER FO FA */
673 { 0x0dbe, 0x0e1e }, /* Thai_phophan พ THAI CHARACTER PHO PHAN */
674 { 0x0dbf, 0x0e1f }, /* Thai_fofan ฟ THAI CHARACTER FO FAN */
675 { 0x0dc0, 0x0e20 }, /* Thai_phosamphao ภ THAI CHARACTER PHO SAMPHAO */
676 { 0x0dc1, 0x0e21 }, /* Thai_moma ม THAI CHARACTER MO MA */
677 { 0x0dc2, 0x0e22 }, /* Thai_yoyak ย THAI CHARACTER YO YAK */
678 { 0x0dc3, 0x0e23 }, /* Thai_rorua ร THAI CHARACTER RO RUA */
679 { 0x0dc4, 0x0e24 }, /* Thai_ru ฤ THAI CHARACTER RU */
680 { 0x0dc5, 0x0e25 }, /* Thai_loling ล THAI CHARACTER LO LING */
681 { 0x0dc6, 0x0e26 }, /* Thai_lu ฦ THAI CHARACTER LU */
682 { 0x0dc7, 0x0e27 }, /* Thai_wowaen ว THAI CHARACTER WO WAEN */
683 { 0x0dc8, 0x0e28 }, /* Thai_sosala ศ THAI CHARACTER SO SALA */
684 { 0x0dc9, 0x0e29 }, /* Thai_sorusi ษ THAI CHARACTER SO RUSI */
685 { 0x0dca, 0x0e2a }, /* Thai_sosua ส THAI CHARACTER SO SUA */
686 { 0x0dcb, 0x0e2b }, /* Thai_hohip ห THAI CHARACTER HO HIP */
687 { 0x0dcc, 0x0e2c }, /* Thai_lochula ฬ THAI CHARACTER LO CHULA */
688 { 0x0dcd, 0x0e2d }, /* Thai_oang อ THAI CHARACTER O ANG */
689 { 0x0dce, 0x0e2e }, /* Thai_honokhuk ฮ THAI CHARACTER HO NOKHUK */
690 { 0x0dcf, 0x0e2f }, /* Thai_paiyannoi ฯ THAI CHARACTER PAIYANNOI */
691 { 0x0dd0, 0x0e30 }, /* Thai_saraa ะ THAI CHARACTER SARA A */
692 { 0x0dd1, 0x0e31 }, /* Thai_maihanakat ั THAI CHARACTER MAI HAN-AKAT */
693 { 0x0dd2, 0x0e32 }, /* Thai_saraaa า THAI CHARACTER SARA AA */
694 { 0x0dd3, 0x0e33 }, /* Thai_saraam ำ THAI CHARACTER SARA AM */
695 { 0x0dd4, 0x0e34 }, /* Thai_sarai ิ THAI CHARACTER SARA I */
696 { 0x0dd5, 0x0e35 }, /* Thai_saraii ี THAI CHARACTER SARA II */
697 { 0x0dd6, 0x0e36 }, /* Thai_saraue ึ THAI CHARACTER SARA UE */
698 { 0x0dd7, 0x0e37 }, /* Thai_sarauee ื THAI CHARACTER SARA UEE */
699 { 0x0dd8, 0x0e38 }, /* Thai_sarau ุ THAI CHARACTER SARA U */
700 { 0x0dd9, 0x0e39 }, /* Thai_sarauu ู THAI CHARACTER SARA UU */
701 { 0x0dda, 0x0e3a }, /* Thai_phinthu ฺ THAI CHARACTER PHINTHU */
702 { 0x0dde, 0x0e3e }, /* Thai_maihanakat_maitho ??? */
703 { 0x0ddf, 0x0e3f }, /* Thai_baht ฿ THAI CURRENCY SYMBOL BAHT */
704 { 0x0de0, 0x0e40 }, /* Thai_sarae เ THAI CHARACTER SARA E */
705 { 0x0de1, 0x0e41 }, /* Thai_saraae แ THAI CHARACTER SARA AE */
706 { 0x0de2, 0x0e42 }, /* Thai_sarao โ THAI CHARACTER SARA O */
707 { 0x0de3, 0x0e43 }, /* Thai_saraaimaimuan ใ THAI CHARACTER SARA AI MAIMUAN */
708 { 0x0de4, 0x0e44 }, /* Thai_saraaimaimalai ไ THAI CHARACTER SARA AI MAIMALAI */
709 { 0x0de5, 0x0e45 }, /* Thai_lakkhangyao ๅ THAI CHARACTER LAKKHANGYAO */
710 { 0x0de6, 0x0e46 }, /* Thai_maiyamok ๆ THAI CHARACTER MAIYAMOK */
711 { 0x0de7, 0x0e47 }, /* Thai_maitaikhu ็ THAI CHARACTER MAITAIKHU */
712 { 0x0de8, 0x0e48 }, /* Thai_maiek ่ THAI CHARACTER MAI EK */
713 { 0x0de9, 0x0e49 }, /* Thai_maitho ้ THAI CHARACTER MAI THO */
714 { 0x0dea, 0x0e4a }, /* Thai_maitri ๊ THAI CHARACTER MAI TRI */
715 { 0x0deb, 0x0e4b }, /* Thai_maichattawa ๋ THAI CHARACTER MAI CHATTAWA */
716 { 0x0dec, 0x0e4c }, /* Thai_thanthakhat ์ THAI CHARACTER THANTHAKHAT */
717 { 0x0ded, 0x0e4d }, /* Thai_nikhahit ํ THAI CHARACTER NIKHAHIT */
718 { 0x0df0, 0x0e50 }, /* Thai_leksun ๐ THAI DIGIT ZERO */
719 { 0x0df1, 0x0e51 }, /* Thai_leknung ๑ THAI DIGIT ONE */
720 { 0x0df2, 0x0e52 }, /* Thai_leksong ๒ THAI DIGIT TWO */
721 { 0x0df3, 0x0e53 }, /* Thai_leksam ๓ THAI DIGIT THREE */
722 { 0x0df4, 0x0e54 }, /* Thai_leksi ๔ THAI DIGIT FOUR */
723 { 0x0df5, 0x0e55 }, /* Thai_lekha ๕ THAI DIGIT FIVE */
724 { 0x0df6, 0x0e56 }, /* Thai_lekhok ๖ THAI DIGIT SIX */
725 { 0x0df7, 0x0e57 }, /* Thai_lekchet ๗ THAI DIGIT SEVEN */
726 { 0x0df8, 0x0e58 }, /* Thai_lekpaet ๘ THAI DIGIT EIGHT */
727 { 0x0df9, 0x0e59 }, /* Thai_lekkao ๙ THAI DIGIT NINE */
728 { 0x0ea1, 0x3131 }, /* Hangul_Kiyeog ㄱ HANGUL LETTER KIYEOK */
729 { 0x0ea2, 0x3132 }, /* Hangul_SsangKiyeog ㄲ HANGUL LETTER SSANGKIYEOK */
730 { 0x0ea3, 0x3133 }, /* Hangul_KiyeogSios ㄳ HANGUL LETTER KIYEOK-SIOS */
731 { 0x0ea4, 0x3134 }, /* Hangul_Nieun ㄴ HANGUL LETTER NIEUN */
732 { 0x0ea5, 0x3135 }, /* Hangul_NieunJieuj ㄵ HANGUL LETTER NIEUN-CIEUC */
733 { 0x0ea6, 0x3136 }, /* Hangul_NieunHieuh ㄶ HANGUL LETTER NIEUN-HIEUH */
734 { 0x0ea7, 0x3137 }, /* Hangul_Dikeud ㄷ HANGUL LETTER TIKEUT */
735 { 0x0ea8, 0x3138 }, /* Hangul_SsangDikeud ㄸ HANGUL LETTER SSANGTIKEUT */
736 { 0x0ea9, 0x3139 }, /* Hangul_Rieul ㄹ HANGUL LETTER RIEUL */
737 { 0x0eaa, 0x313a }, /* Hangul_RieulKiyeog ㄺ HANGUL LETTER RIEUL-KIYEOK */
738 { 0x0eab, 0x313b }, /* Hangul_RieulMieum ㄻ HANGUL LETTER RIEUL-MIEUM */
739 { 0x0eac, 0x313c }, /* Hangul_RieulPieub ㄼ HANGUL LETTER RIEUL-PIEUP */
740 { 0x0ead, 0x313d }, /* Hangul_RieulSios ㄽ HANGUL LETTER RIEUL-SIOS */
741 { 0x0eae, 0x313e }, /* Hangul_RieulTieut ㄾ HANGUL LETTER RIEUL-THIEUTH */
742 { 0x0eaf, 0x313f }, /* Hangul_RieulPhieuf ㄿ HANGUL LETTER RIEUL-PHIEUPH */
743 { 0x0eb0, 0x3140 }, /* Hangul_RieulHieuh ㅀ HANGUL LETTER RIEUL-HIEUH */
744 { 0x0eb1, 0x3141 }, /* Hangul_Mieum ㅁ HANGUL LETTER MIEUM */
745 { 0x0eb2, 0x3142 }, /* Hangul_Pieub ㅂ HANGUL LETTER PIEUP */
746 { 0x0eb3, 0x3143 }, /* Hangul_SsangPieub ㅃ HANGUL LETTER SSANGPIEUP */
747 { 0x0eb4, 0x3144 }, /* Hangul_PieubSios ㅄ HANGUL LETTER PIEUP-SIOS */
748 { 0x0eb5, 0x3145 }, /* Hangul_Sios ㅅ HANGUL LETTER SIOS */
749 { 0x0eb6, 0x3146 }, /* Hangul_SsangSios ㅆ HANGUL LETTER SSANGSIOS */
750 { 0x0eb7, 0x3147 }, /* Hangul_Ieung ㅇ HANGUL LETTER IEUNG */
751 { 0x0eb8, 0x3148 }, /* Hangul_Jieuj ㅈ HANGUL LETTER CIEUC */
752 { 0x0eb9, 0x3149 }, /* Hangul_SsangJieuj ㅉ HANGUL LETTER SSANGCIEUC */
753 { 0x0eba, 0x314a }, /* Hangul_Cieuc ㅊ HANGUL LETTER CHIEUCH */
754 { 0x0ebb, 0x314b }, /* Hangul_Khieuq ㅋ HANGUL LETTER KHIEUKH */
755 { 0x0ebc, 0x314c }, /* Hangul_Tieut ㅌ HANGUL LETTER THIEUTH */
756 { 0x0ebd, 0x314d }, /* Hangul_Phieuf ㅍ HANGUL LETTER PHIEUPH */
757 { 0x0ebe, 0x314e }, /* Hangul_Hieuh ㅎ HANGUL LETTER HIEUH */
758 { 0x0ebf, 0x314f }, /* Hangul_A ㅏ HANGUL LETTER A */
759 { 0x0ec0, 0x3150 }, /* Hangul_AE ㅐ HANGUL LETTER AE */
760 { 0x0ec1, 0x3151 }, /* Hangul_YA ㅑ HANGUL LETTER YA */
761 { 0x0ec2, 0x3152 }, /* Hangul_YAE ㅒ HANGUL LETTER YAE */
762 { 0x0ec3, 0x3153 }, /* Hangul_EO ㅓ HANGUL LETTER EO */
763 { 0x0ec4, 0x3154 }, /* Hangul_E ㅔ HANGUL LETTER E */
764 { 0x0ec5, 0x3155 }, /* Hangul_YEO ㅕ HANGUL LETTER YEO */
765 { 0x0ec6, 0x3156 }, /* Hangul_YE ㅖ HANGUL LETTER YE */
766 { 0x0ec7, 0x3157 }, /* Hangul_O ㅗ HANGUL LETTER O */
767 { 0x0ec8, 0x3158 }, /* Hangul_WA ㅘ HANGUL LETTER WA */
768 { 0x0ec9, 0x3159 }, /* Hangul_WAE ㅙ HANGUL LETTER WAE */
769 { 0x0eca, 0x315a }, /* Hangul_OE ㅚ HANGUL LETTER OE */
770 { 0x0ecb, 0x315b }, /* Hangul_YO ㅛ HANGUL LETTER YO */
771 { 0x0ecc, 0x315c }, /* Hangul_U ㅜ HANGUL LETTER U */
772 { 0x0ecd, 0x315d }, /* Hangul_WEO ㅝ HANGUL LETTER WEO */
773 { 0x0ece, 0x315e }, /* Hangul_WE ㅞ HANGUL LETTER WE */
774 { 0x0ecf, 0x315f }, /* Hangul_WI ㅟ HANGUL LETTER WI */
775 { 0x0ed0, 0x3160 }, /* Hangul_YU ㅠ HANGUL LETTER YU */
776 { 0x0ed1, 0x3161 }, /* Hangul_EU ㅡ HANGUL LETTER EU */
777 { 0x0ed2, 0x3162 }, /* Hangul_YI ㅢ HANGUL LETTER YI */
778 { 0x0ed3, 0x3163 }, /* Hangul_I ㅣ HANGUL LETTER I */
779 { 0x0ed4, 0x11a8 }, /* Hangul_J_Kiyeog ᆨ HANGUL JONGSEONG KIYEOK */
780 { 0x0ed5, 0x11a9 }, /* Hangul_J_SsangKiyeog ᆩ HANGUL JONGSEONG SSANGKIYEOK */
781 { 0x0ed6, 0x11aa }, /* Hangul_J_KiyeogSios ᆪ HANGUL JONGSEONG KIYEOK-SIOS */
782 { 0x0ed7, 0x11ab }, /* Hangul_J_Nieun ᆫ HANGUL JONGSEONG NIEUN */
783 { 0x0ed8, 0x11ac }, /* Hangul_J_NieunJieuj ᆬ HANGUL JONGSEONG NIEUN-CIEUC */
784 { 0x0ed9, 0x11ad }, /* Hangul_J_NieunHieuh ᆭ HANGUL JONGSEONG NIEUN-HIEUH */
785 { 0x0eda, 0x11ae }, /* Hangul_J_Dikeud ᆮ HANGUL JONGSEONG TIKEUT */
786 { 0x0edb, 0x11af }, /* Hangul_J_Rieul ᆯ HANGUL JONGSEONG RIEUL */
787 { 0x0edc, 0x11b0 }, /* Hangul_J_RieulKiyeog ᆰ HANGUL JONGSEONG RIEUL-KIYEOK */
788 { 0x0edd, 0x11b1 }, /* Hangul_J_RieulMieum ᆱ HANGUL JONGSEONG RIEUL-MIEUM */
789 { 0x0ede, 0x11b2 }, /* Hangul_J_RieulPieub ᆲ HANGUL JONGSEONG RIEUL-PIEUP */
790 { 0x0edf, 0x11b3 }, /* Hangul_J_RieulSios ᆳ HANGUL JONGSEONG RIEUL-SIOS */
791 { 0x0ee0, 0x11b4 }, /* Hangul_J_RieulTieut ᆴ HANGUL JONGSEONG RIEUL-THIEUTH */
792 { 0x0ee1, 0x11b5 }, /* Hangul_J_RieulPhieuf ᆵ HANGUL JONGSEONG RIEUL-PHIEUPH */
793 { 0x0ee2, 0x11b6 }, /* Hangul_J_RieulHieuh ᆶ HANGUL JONGSEONG RIEUL-HIEUH */
794 { 0x0ee3, 0x11b7 }, /* Hangul_J_Mieum ᆷ HANGUL JONGSEONG MIEUM */
795 { 0x0ee4, 0x11b8 }, /* Hangul_J_Pieub ᆸ HANGUL JONGSEONG PIEUP */
796 { 0x0ee5, 0x11b9 }, /* Hangul_J_PieubSios ᆹ HANGUL JONGSEONG PIEUP-SIOS */
797 { 0x0ee6, 0x11ba }, /* Hangul_J_Sios ᆺ HANGUL JONGSEONG SIOS */
798 { 0x0ee7, 0x11bb }, /* Hangul_J_SsangSios ᆻ HANGUL JONGSEONG SSANGSIOS */
799 { 0x0ee8, 0x11bc }, /* Hangul_J_Ieung ᆼ HANGUL JONGSEONG IEUNG */
800 { 0x0ee9, 0x11bd }, /* Hangul_J_Jieuj ᆽ HANGUL JONGSEONG CIEUC */
801 { 0x0eea, 0x11be }, /* Hangul_J_Cieuc ᆾ HANGUL JONGSEONG CHIEUCH */
802 { 0x0eeb, 0x11bf }, /* Hangul_J_Khieuq ᆿ HANGUL JONGSEONG KHIEUKH */
803 { 0x0eec, 0x11c0 }, /* Hangul_J_Tieut ᇀ HANGUL JONGSEONG THIEUTH */
804 { 0x0eed, 0x11c1 }, /* Hangul_J_Phieuf ᇁ HANGUL JONGSEONG PHIEUPH */
805 { 0x0eee, 0x11c2 }, /* Hangul_J_Hieuh ᇂ HANGUL JONGSEONG HIEUH */
806 { 0x0eef, 0x316d }, /* Hangul_RieulYeorinHieuh ㅭ HANGUL LETTER RIEUL-YEORINHIEUH */
807 { 0x0ef0, 0x3171 }, /* Hangul_SunkyeongeumMieum ㅱ HANGUL LETTER KAPYEOUNMIEUM */
808 { 0x0ef1, 0x3178 }, /* Hangul_SunkyeongeumPieub ㅸ HANGUL LETTER KAPYEOUNPIEUP */
809 { 0x0ef2, 0x317f }, /* Hangul_PanSios ㅿ HANGUL LETTER PANSIOS */
810 /* 0x0ef3 Hangul_KkogjiDalrinIeung ? ??? */
811 { 0x0ef4, 0x3184 }, /* Hangul_SunkyeongeumPhieuf ㆄ HANGUL LETTER KAPYEOUNPHIEUPH */
812 { 0x0ef5, 0x3186 }, /* Hangul_YeorinHieuh ㆆ HANGUL LETTER YEORINHIEUH */
813 { 0x0ef6, 0x318d }, /* Hangul_AraeA ㆍ HANGUL LETTER ARAEA */
814 { 0x0ef7, 0x318e }, /* Hangul_AraeAE ㆎ HANGUL LETTER ARAEAE */
815 { 0x0ef8, 0x11eb }, /* Hangul_J_PanSios ᇫ HANGUL JONGSEONG PANSIOS */
816 { 0x0ef9, 0x11f0 }, /* Hangul_J_KkogjiDalrinIeung ᇰ HANGUL JONGSEONG YESIEUNG */
817 { 0x0efa, 0x11f9 }, /* Hangul_J_YeorinHieuh ᇹ HANGUL JONGSEONG YEORINHIEUH */
818 { 0x0eff, 0x20a9 }, /* Korean_Won ₩ WON SIGN */
819 { 0x13a4, 0x20ac }, /* Euro € EURO SIGN */
820 { 0x13bc, 0x0152 }, /* OE Œ LATIN CAPITAL LIGATURE OE */
821 { 0x13bd, 0x0153 }, /* oe œ LATIN SMALL LIGATURE OE */
822 { 0x13be, 0x0178 }, /* Ydiaeresis Ÿ LATIN CAPITAL LETTER Y WITH DIAERESIS */
823 { 0x20a0, 0x20a0 }, /* EcuSign ₠ EURO-CURRENCY SIGN */
824 { 0x20a1, 0x20a1 }, /* ColonSign ₡ COLON SIGN */
825 { 0x20a2, 0x20a2 }, /* CruzeiroSign ₢ CRUZEIRO SIGN */
826 { 0x20a3, 0x20a3 }, /* FFrancSign ₣ FRENCH FRANC SIGN */
827 { 0x20a4, 0x20a4 }, /* LiraSign ₤ LIRA SIGN */
828 { 0x20a5, 0x20a5 }, /* MillSign ₥ MILL SIGN */
829 { 0x20a6, 0x20a6 }, /* NairaSign ₦ NAIRA SIGN */
830 { 0x20a7, 0x20a7 }, /* PesetaSign ₧ PESETA SIGN */
831 { 0x20a8, 0x20a8 }, /* RupeeSign ₨ RUPEE SIGN */
832 { 0x20a9, 0x20a9 }, /* WonSign ₩ WON SIGN */
833 { 0x20aa, 0x20aa }, /* NewSheqelSign ₪ NEW SHEQEL SIGN */
834 { 0x20ab, 0x20ab }, /* DongSign ₫ DONG SIGN */
835 { 0x20ac, 0x20ac }, /* EuroSign € EURO SIGN */
836 };
837
838 /* binary search with range check */
839 static uint32_t
bin_search(const struct codepair * table,size_t length,xkb_keysym_t keysym)840 bin_search(const struct codepair *table, size_t length, xkb_keysym_t keysym)
841 {
842 size_t first = 0;
843 size_t last = length;
844
845 if (keysym < table[0].keysym || keysym > table[length].keysym)
846 return 0;
847
848 /* binary search in table */
849 while (last >= first) {
850 size_t mid = (first + last) / 2;
851 if (table[mid].keysym < keysym)
852 first = mid + 1;
853 else if (table[mid].keysym > keysym)
854 last = mid - 1;
855 else /* found it */
856 return table[mid].ucs;
857 }
858
859 /* no matching Unicode value found in table */
860 return 0;
861 }
862
863 XKB_EXPORT uint32_t
xkb_keysym_to_utf32(xkb_keysym_t keysym)864 xkb_keysym_to_utf32(xkb_keysym_t keysym)
865 {
866 /* first check for Latin-1 characters (1:1 mapping) */
867 if ((keysym >= 0x0020 && keysym <= 0x007e) ||
868 (keysym >= 0x00a0 && keysym <= 0x00ff))
869 return keysym;
870
871 /* patch encoding botch */
872 if (keysym == XKB_KEY_KP_Space)
873 return XKB_KEY_space & 0x7f;
874
875 /* special keysyms */
876 if ((keysym >= XKB_KEY_BackSpace && keysym <= XKB_KEY_Clear) ||
877 (keysym >= XKB_KEY_KP_Multiply && keysym <= XKB_KEY_KP_9) ||
878 keysym == XKB_KEY_Return || keysym == XKB_KEY_Escape ||
879 keysym == XKB_KEY_Delete || keysym == XKB_KEY_KP_Tab ||
880 keysym == XKB_KEY_KP_Enter || keysym == XKB_KEY_KP_Equal)
881 return keysym & 0x7f;
882
883 /* also check for directly encoded 24-bit UCS characters */
884 if ((keysym & 0xff000000) == 0x01000000)
885 return keysym & 0x00ffffff;
886
887 /* search main table */
888 return bin_search(keysymtab, ARRAY_SIZE(keysymtab) - 1, keysym);
889 }
890
891 /*
892 * Copyright © 2012 Intel Corporation
893 *
894 * Permission is hereby granted, free of charge, to any person obtaining a
895 * copy of this software and associated documentation files (the "Software"),
896 * to deal in the Software without restriction, including without limitation
897 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
898 * and/or sell copies of the Software, and to permit persons to whom the
899 * Software is furnished to do so, subject to the following conditions:
900 *
901 * The above copyright notice and this permission notice (including the next
902 * paragraph) shall be included in all copies or substantial portions of the
903 * Software.
904 *
905 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
906 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
907 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
908 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
909 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
910 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
911 * DEALINGS IN THE SOFTWARE.
912 *
913 * Author: Rob Bradford <rob@linux.intel.com>
914 */
915
916 XKB_EXPORT int
xkb_keysym_to_utf8(xkb_keysym_t keysym,char * buffer,size_t size)917 xkb_keysym_to_utf8(xkb_keysym_t keysym, char *buffer, size_t size)
918 {
919 uint32_t codepoint;
920
921 if (size < 7)
922 return -1;
923
924 codepoint = xkb_keysym_to_utf32(keysym);
925
926 if (codepoint == 0)
927 return 0;
928
929 return utf32_to_utf8(codepoint, buffer);
930 }
931