blob: fb45c1524869bf6a79cdfe5e848a50ed5d064a51 [file] [log] [blame]
Bram Moolenaaredf3f972016-08-29 22:49:24 +02001/* vi:set ts=8 sts=4 sw=4 noet:
Bram Moolenaar071d4272004-06-13 20:20:40 +00002 *
3 * VIM - Vi IMproved by Bram Moolenaar
4 *
5 * Do ":help uganda" in Vim to read copying and usage conditions.
6 * Do ":help credits" in Vim to see a list of people who contributed.
7 * See README.txt for an overview of the Vim source code.
8 */
9
10/*
11 * digraph.c: code for digraphs
12 */
13
14#include "vim.h"
15
16#if defined(FEAT_DIGRAPHS) || defined(PROTO)
17
Bram Moolenaar071d4272004-06-13 20:20:40 +000018typedef int result_T;
Bram Moolenaar071d4272004-06-13 20:20:40 +000019
20typedef struct digraph
21{
22 char_u char1;
23 char_u char2;
24 result_T result;
25} digr_T;
26
Bram Moolenaareae8ae12018-12-14 18:53:02 +010027static void printdigraph(digr_T *dp, result_T *previous);
Bram Moolenaar071d4272004-06-13 20:20:40 +000028
Bram Moolenaar5d18efe2019-12-01 21:11:22 +010029// digraphs added by the user
Bram Moolenaar0ab2a882009-05-13 10:51:08 +000030static garray_T user_digraphs = {0, 0, (int)sizeof(digr_T), 10, NULL};
Bram Moolenaar071d4272004-06-13 20:20:40 +000031
32/*
Bram Moolenaare27d6e62022-08-30 15:05:30 +010033 * digraphs for Unicode from RFC1345
34 * (also work for ISO-8859-1 aka latin1)
35 *
Bram Moolenaar071d4272004-06-13 20:20:40 +000036 * Note: Characters marked with XX are not included literally, because some
37 * compilers cannot handle them (Amiga SAS/C is the most picky one).
38 */
Bram Moolenaare27d6e62022-08-30 15:05:30 +010039static digr_T digraphdefault[] = {
Bram Moolenaar5d18efe2019-12-01 21:11:22 +010040 {'N', 'U', 0x0a}, // LF for NUL
Bram Moolenaar071d4272004-06-13 20:20:40 +000041 {'S', 'H', 0x01},
42 {'S', 'X', 0x02},
43 {'E', 'X', 0x03},
44 {'E', 'T', 0x04},
45 {'E', 'Q', 0x05},
46 {'A', 'K', 0x06},
47 {'B', 'L', 0x07},
48 {'B', 'S', 0x08},
49 {'H', 'T', 0x09},
50 {'L', 'F', 0x0a},
51 {'V', 'T', 0x0b},
52 {'F', 'F', 0x0c},
53 {'C', 'R', 0x0d},
54 {'S', 'O', 0x0e},
55 {'S', 'I', 0x0f},
56 {'D', 'L', 0x10},
57 {'D', '1', 0x11},
58 {'D', '2', 0x12},
59 {'D', '3', 0x13},
60 {'D', '4', 0x14},
61 {'N', 'K', 0x15},
62 {'S', 'Y', 0x16},
63 {'E', 'B', 0x17},
64 {'C', 'N', 0x18},
65 {'E', 'M', 0x19},
66 {'S', 'B', 0x1a},
67 {'E', 'C', 0x1b},
68 {'F', 'S', 0x1c},
69 {'G', 'S', 0x1d},
70 {'R', 'S', 0x1e},
71 {'U', 'S', 0x1f},
72 {'S', 'P', 0x20},
73 {'N', 'b', 0x23},
74 {'D', 'O', 0x24},
75 {'A', 't', 0x40},
76 {'<', '(', 0x5b},
77 {'/', '/', 0x5c},
78 {')', '>', 0x5d},
79 {'\'', '>', 0x5e},
80 {'\'', '!', 0x60},
81 {'(', '!', 0x7b},
82 {'!', '!', 0x7c},
83 {'!', ')', 0x7d},
84 {'\'', '?', 0x7e},
85 {'D', 'T', 0x7f},
86 {'P', 'A', 0x80},
87 {'H', 'O', 0x81},
88 {'B', 'H', 0x82},
89 {'N', 'H', 0x83},
90 {'I', 'N', 0x84},
91 {'N', 'L', 0x85},
92 {'S', 'A', 0x86},
93 {'E', 'S', 0x87},
94 {'H', 'S', 0x88},
95 {'H', 'J', 0x89},
96 {'V', 'S', 0x8a},
97 {'P', 'D', 0x8b},
98 {'P', 'U', 0x8c},
99 {'R', 'I', 0x8d},
100 {'S', '2', 0x8e},
101 {'S', '3', 0x8f},
102 {'D', 'C', 0x90},
103 {'P', '1', 0x91},
104 {'P', '2', 0x92},
105 {'T', 'S', 0x93},
106 {'C', 'C', 0x94},
107 {'M', 'W', 0x95},
108 {'S', 'G', 0x96},
109 {'E', 'G', 0x97},
110 {'S', 'S', 0x98},
111 {'G', 'C', 0x99},
112 {'S', 'C', 0x9a},
113 {'C', 'I', 0x9b},
114 {'S', 'T', 0x9c},
115 {'O', 'C', 0x9d},
116 {'P', 'M', 0x9e},
117 {'A', 'C', 0x9f},
118 {'N', 'S', 0xa0},
Bram Moolenaare3f915d2020-07-14 23:02:44 +0200119# define DG_START_LATIN 0xa1
Bram Moolenaar071d4272004-06-13 20:20:40 +0000120 {'!', 'I', 0xa1},
Bram Moolenaar41193092019-08-24 21:53:31 +0200121 {'~', '!', 0xa1}, // ¡ Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000122 {'C', 't', 0xa2},
Bram Moolenaar41193092019-08-24 21:53:31 +0200123 {'c', '|', 0xa2}, // ¢ Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000124 {'P', 'd', 0xa3},
Bram Moolenaar41193092019-08-24 21:53:31 +0200125 {'$', '$', 0xa3}, // £ Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000126 {'C', 'u', 0xa4},
Bram Moolenaar41193092019-08-24 21:53:31 +0200127 {'o', 'x', 0xa4}, // ¤ Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000128 {'Y', 'e', 0xa5},
Bram Moolenaar41193092019-08-24 21:53:31 +0200129 {'Y', '-', 0xa5}, // ¥ Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000130 {'B', 'B', 0xa6},
Bram Moolenaar41193092019-08-24 21:53:31 +0200131 {'|', '|', 0xa6}, // ¦ Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000132 {'S', 'E', 0xa7},
133 {'\'', ':', 0xa8},
134 {'C', 'o', 0xa9},
Bram Moolenaar41193092019-08-24 21:53:31 +0200135 {'c', 'O', 0xa9}, // © Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000136 {'-', 'a', 0xaa},
137 {'<', '<', 0xab},
138 {'N', 'O', 0xac},
Bram Moolenaar41193092019-08-24 21:53:31 +0200139 {'-', ',', 0xac}, // ¬ Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000140 {'-', '-', 0xad},
141 {'R', 'g', 0xae},
142 {'\'', 'm', 0xaf},
Bram Moolenaar41193092019-08-24 21:53:31 +0200143 {'-', '=', 0xaf}, // ¯ Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000144 {'D', 'G', 0xb0},
Bram Moolenaar41193092019-08-24 21:53:31 +0200145 {'~', 'o', 0xb0}, // ° Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000146 {'+', '-', 0xb1},
147 {'2', 'S', 0xb2},
Bram Moolenaar41193092019-08-24 21:53:31 +0200148 {'2', '2', 0xb2}, // ² Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000149 {'3', 'S', 0xb3},
Bram Moolenaar41193092019-08-24 21:53:31 +0200150 {'3', '3', 0xb3}, // ³ Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000151 {'\'', '\'', 0xb4},
152 {'M', 'y', 0xb5},
153 {'P', 'I', 0xb6},
Bram Moolenaar41193092019-08-24 21:53:31 +0200154 {'p', 'p', 0xb6}, // ¶ Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000155 {'.', 'M', 0xb7},
Bram Moolenaar41193092019-08-24 21:53:31 +0200156 {'~', '.', 0xb7}, // · Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000157 {'\'', ',', 0xb8},
158 {'1', 'S', 0xb9},
Bram Moolenaar41193092019-08-24 21:53:31 +0200159 {'1', '1', 0xb9}, // ¹ Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000160 {'-', 'o', 0xba},
161 {'>', '>', 0xbb},
162 {'1', '4', 0xbc},
163 {'1', '2', 0xbd},
164 {'3', '4', 0xbe},
165 {'?', 'I', 0xbf},
Bram Moolenaar41193092019-08-24 21:53:31 +0200166 {'~', '?', 0xbf}, // ¿ Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000167 {'A', '!', 0xc0},
Bram Moolenaar41193092019-08-24 21:53:31 +0200168 {'A', '`', 0xc0}, // À Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000169 {'A', '\'', 0xc1},
170 {'A', '>', 0xc2},
Bram Moolenaar41193092019-08-24 21:53:31 +0200171 {'A', '^', 0xc2}, // Â Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000172 {'A', '?', 0xc3},
Bram Moolenaar41193092019-08-24 21:53:31 +0200173 {'A', '~', 0xc3}, // Ã Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000174 {'A', ':', 0xc4},
Bram Moolenaar41193092019-08-24 21:53:31 +0200175 {'A', '"', 0xc4}, // Ä Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000176 {'A', 'A', 0xc5},
Bram Moolenaar41193092019-08-24 21:53:31 +0200177 {'A', '@', 0xc5}, // Å Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000178 {'A', 'E', 0xc6},
179 {'C', ',', 0xc7},
180 {'E', '!', 0xc8},
Bram Moolenaar41193092019-08-24 21:53:31 +0200181 {'E', '`', 0xc8}, // È Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000182 {'E', '\'', 0xc9},
183 {'E', '>', 0xca},
Bram Moolenaar41193092019-08-24 21:53:31 +0200184 {'E', '^', 0xca}, // Ê Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000185 {'E', ':', 0xcb},
Bram Moolenaar41193092019-08-24 21:53:31 +0200186 {'E', '"', 0xcb}, // Ë Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000187 {'I', '!', 0xcc},
Bram Moolenaar41193092019-08-24 21:53:31 +0200188 {'I', '`', 0xcc}, // Ì Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000189 {'I', '\'', 0xcd},
190 {'I', '>', 0xce},
Bram Moolenaar41193092019-08-24 21:53:31 +0200191 {'I', '^', 0xce}, // Î Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000192 {'I', ':', 0xcf},
Bram Moolenaar41193092019-08-24 21:53:31 +0200193 {'I', '"', 0xcf}, // Ï Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000194 {'D', '-', 0xd0},
195 {'N', '?', 0xd1},
Bram Moolenaar41193092019-08-24 21:53:31 +0200196 {'N', '~', 0xd1}, // Ñ Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000197 {'O', '!', 0xd2},
Bram Moolenaar41193092019-08-24 21:53:31 +0200198 {'O', '`', 0xd2}, // Ò Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000199 {'O', '\'', 0xd3},
200 {'O', '>', 0xd4},
Bram Moolenaar41193092019-08-24 21:53:31 +0200201 {'O', '^', 0xd4}, // Ô Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000202 {'O', '?', 0xd5},
Bram Moolenaar41193092019-08-24 21:53:31 +0200203 {'O', '~', 0xd5}, // Õ Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000204 {'O', ':', 0xd6},
205 {'*', 'X', 0xd7},
Bram Moolenaar41193092019-08-24 21:53:31 +0200206 {'/', '\\', 0xd7}, // × Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000207 {'O', '/', 0xd8},
208 {'U', '!', 0xd9},
Bram Moolenaar41193092019-08-24 21:53:31 +0200209 {'U', '`', 0xd9}, // Ù Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000210 {'U', '\'', 0xda},
211 {'U', '>', 0xdb},
Bram Moolenaar41193092019-08-24 21:53:31 +0200212 {'U', '^', 0xdb}, // Û Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000213 {'U', ':', 0xdc},
214 {'Y', '\'', 0xdd},
215 {'T', 'H', 0xde},
Bram Moolenaar41193092019-08-24 21:53:31 +0200216 {'I', 'p', 0xde}, // Þ Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000217 {'s', 's', 0xdf},
218 {'a', '!', 0xe0},
Bram Moolenaar41193092019-08-24 21:53:31 +0200219 {'a', '`', 0xe0}, // à Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000220 {'a', '\'', 0xe1},
221 {'a', '>', 0xe2},
Bram Moolenaar41193092019-08-24 21:53:31 +0200222 {'a', '^', 0xe2}, // â Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000223 {'a', '?', 0xe3},
Bram Moolenaar41193092019-08-24 21:53:31 +0200224 {'a', '~', 0xe3}, // ã Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000225 {'a', ':', 0xe4},
Bram Moolenaar41193092019-08-24 21:53:31 +0200226 {'a', '"', 0xe4}, // ä Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000227 {'a', 'a', 0xe5},
Bram Moolenaar41193092019-08-24 21:53:31 +0200228 {'a', '@', 0xe5}, // å Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000229 {'a', 'e', 0xe6},
230 {'c', ',', 0xe7},
231 {'e', '!', 0xe8},
Bram Moolenaar41193092019-08-24 21:53:31 +0200232 {'e', '`', 0xe8}, // è Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000233 {'e', '\'', 0xe9},
234 {'e', '>', 0xea},
Bram Moolenaar41193092019-08-24 21:53:31 +0200235 {'e', '^', 0xea}, // ê Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000236 {'e', ':', 0xeb},
Bram Moolenaar41193092019-08-24 21:53:31 +0200237 {'e', '"', 0xeb}, // ë Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000238 {'i', '!', 0xec},
Bram Moolenaar41193092019-08-24 21:53:31 +0200239 {'i', '`', 0xec}, // ì Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000240 {'i', '\'', 0xed},
241 {'i', '>', 0xee},
Bram Moolenaar41193092019-08-24 21:53:31 +0200242 {'i', '^', 0xee}, // î Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000243 {'i', ':', 0xef},
244 {'d', '-', 0xf0},
245 {'n', '?', 0xf1},
Bram Moolenaar41193092019-08-24 21:53:31 +0200246 {'n', '~', 0xf1}, // ñ Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000247 {'o', '!', 0xf2},
Bram Moolenaar41193092019-08-24 21:53:31 +0200248 {'o', '`', 0xf2}, // ò Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000249 {'o', '\'', 0xf3},
250 {'o', '>', 0xf4},
Bram Moolenaar41193092019-08-24 21:53:31 +0200251 {'o', '^', 0xf4}, // ô Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000252 {'o', '?', 0xf5},
Bram Moolenaar41193092019-08-24 21:53:31 +0200253 {'o', '~', 0xf5}, // õ Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000254 {'o', ':', 0xf6},
255 {'-', ':', 0xf7},
256 {'o', '/', 0xf8},
257 {'u', '!', 0xf9},
Bram Moolenaar41193092019-08-24 21:53:31 +0200258 {'u', '`', 0xf9}, // ù Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000259 {'u', '\'', 0xfa},
260 {'u', '>', 0xfb},
Bram Moolenaar41193092019-08-24 21:53:31 +0200261 {'u', '^', 0xfb}, // û Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000262 {'u', ':', 0xfc},
263 {'y', '\'', 0xfd},
264 {'t', 'h', 0xfe},
265 {'y', ':', 0xff},
Bram Moolenaareae8ae12018-12-14 18:53:02 +0100266 {'y', '"', 0xff}, // x XX Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000267
Bram Moolenaare3f915d2020-07-14 23:02:44 +0200268# define USE_UNICODE_DIGRAPHS
Bram Moolenaar071d4272004-06-13 20:20:40 +0000269
270 {'A', '-', 0x0100},
271 {'a', '-', 0x0101},
272 {'A', '(', 0x0102},
273 {'a', '(', 0x0103},
274 {'A', ';', 0x0104},
275 {'a', ';', 0x0105},
276 {'C', '\'', 0x0106},
277 {'c', '\'', 0x0107},
278 {'C', '>', 0x0108},
279 {'c', '>', 0x0109},
280 {'C', '.', 0x010a},
281 {'c', '.', 0x010b},
282 {'C', '<', 0x010c},
283 {'c', '<', 0x010d},
284 {'D', '<', 0x010e},
285 {'d', '<', 0x010f},
286 {'D', '/', 0x0110},
287 {'d', '/', 0x0111},
288 {'E', '-', 0x0112},
289 {'e', '-', 0x0113},
290 {'E', '(', 0x0114},
291 {'e', '(', 0x0115},
292 {'E', '.', 0x0116},
293 {'e', '.', 0x0117},
294 {'E', ';', 0x0118},
295 {'e', ';', 0x0119},
296 {'E', '<', 0x011a},
297 {'e', '<', 0x011b},
298 {'G', '>', 0x011c},
299 {'g', '>', 0x011d},
300 {'G', '(', 0x011e},
301 {'g', '(', 0x011f},
302 {'G', '.', 0x0120},
303 {'g', '.', 0x0121},
304 {'G', ',', 0x0122},
305 {'g', ',', 0x0123},
306 {'H', '>', 0x0124},
307 {'h', '>', 0x0125},
308 {'H', '/', 0x0126},
309 {'h', '/', 0x0127},
310 {'I', '?', 0x0128},
311 {'i', '?', 0x0129},
312 {'I', '-', 0x012a},
313 {'i', '-', 0x012b},
314 {'I', '(', 0x012c},
315 {'i', '(', 0x012d},
316 {'I', ';', 0x012e},
317 {'i', ';', 0x012f},
318 {'I', '.', 0x0130},
319 {'i', '.', 0x0131},
320 {'I', 'J', 0x0132},
321 {'i', 'j', 0x0133},
322 {'J', '>', 0x0134},
323 {'j', '>', 0x0135},
324 {'K', ',', 0x0136},
325 {'k', ',', 0x0137},
326 {'k', 'k', 0x0138},
327 {'L', '\'', 0x0139},
328 {'l', '\'', 0x013a},
329 {'L', ',', 0x013b},
330 {'l', ',', 0x013c},
331 {'L', '<', 0x013d},
332 {'l', '<', 0x013e},
333 {'L', '.', 0x013f},
334 {'l', '.', 0x0140},
335 {'L', '/', 0x0141},
336 {'l', '/', 0x0142},
337 {'N', '\'', 0x0143},
338 {'n', '\'', 0x0144},
339 {'N', ',', 0x0145},
340 {'n', ',', 0x0146},
341 {'N', '<', 0x0147},
342 {'n', '<', 0x0148},
343 {'\'', 'n', 0x0149},
344 {'N', 'G', 0x014a},
345 {'n', 'g', 0x014b},
346 {'O', '-', 0x014c},
347 {'o', '-', 0x014d},
348 {'O', '(', 0x014e},
349 {'o', '(', 0x014f},
350 {'O', '"', 0x0150},
351 {'o', '"', 0x0151},
352 {'O', 'E', 0x0152},
353 {'o', 'e', 0x0153},
354 {'R', '\'', 0x0154},
355 {'r', '\'', 0x0155},
356 {'R', ',', 0x0156},
357 {'r', ',', 0x0157},
358 {'R', '<', 0x0158},
359 {'r', '<', 0x0159},
360 {'S', '\'', 0x015a},
361 {'s', '\'', 0x015b},
362 {'S', '>', 0x015c},
363 {'s', '>', 0x015d},
364 {'S', ',', 0x015e},
365 {'s', ',', 0x015f},
366 {'S', '<', 0x0160},
367 {'s', '<', 0x0161},
368 {'T', ',', 0x0162},
369 {'t', ',', 0x0163},
370 {'T', '<', 0x0164},
371 {'t', '<', 0x0165},
372 {'T', '/', 0x0166},
373 {'t', '/', 0x0167},
374 {'U', '?', 0x0168},
375 {'u', '?', 0x0169},
376 {'U', '-', 0x016a},
377 {'u', '-', 0x016b},
378 {'U', '(', 0x016c},
379 {'u', '(', 0x016d},
380 {'U', '0', 0x016e},
381 {'u', '0', 0x016f},
382 {'U', '"', 0x0170},
383 {'u', '"', 0x0171},
384 {'U', ';', 0x0172},
385 {'u', ';', 0x0173},
386 {'W', '>', 0x0174},
387 {'w', '>', 0x0175},
388 {'Y', '>', 0x0176},
389 {'y', '>', 0x0177},
390 {'Y', ':', 0x0178},
391 {'Z', '\'', 0x0179},
392 {'z', '\'', 0x017a},
393 {'Z', '.', 0x017b},
394 {'z', '.', 0x017c},
395 {'Z', '<', 0x017d},
396 {'z', '<', 0x017e},
397 {'O', '9', 0x01a0},
398 {'o', '9', 0x01a1},
399 {'O', 'I', 0x01a2},
400 {'o', 'i', 0x01a3},
401 {'y', 'r', 0x01a6},
402 {'U', '9', 0x01af},
403 {'u', '9', 0x01b0},
404 {'Z', '/', 0x01b5},
405 {'z', '/', 0x01b6},
406 {'E', 'D', 0x01b7},
407 {'A', '<', 0x01cd},
408 {'a', '<', 0x01ce},
409 {'I', '<', 0x01cf},
410 {'i', '<', 0x01d0},
411 {'O', '<', 0x01d1},
412 {'o', '<', 0x01d2},
413 {'U', '<', 0x01d3},
414 {'u', '<', 0x01d4},
415 {'A', '1', 0x01de},
416 {'a', '1', 0x01df},
417 {'A', '7', 0x01e0},
418 {'a', '7', 0x01e1},
419 {'A', '3', 0x01e2},
420 {'a', '3', 0x01e3},
421 {'G', '/', 0x01e4},
422 {'g', '/', 0x01e5},
423 {'G', '<', 0x01e6},
424 {'g', '<', 0x01e7},
425 {'K', '<', 0x01e8},
426 {'k', '<', 0x01e9},
427 {'O', ';', 0x01ea},
428 {'o', ';', 0x01eb},
429 {'O', '1', 0x01ec},
430 {'o', '1', 0x01ed},
431 {'E', 'Z', 0x01ee},
432 {'e', 'z', 0x01ef},
433 {'j', '<', 0x01f0},
434 {'G', '\'', 0x01f4},
435 {'g', '\'', 0x01f5},
436 {';', 'S', 0x02bf},
437 {'\'', '<', 0x02c7},
438 {'\'', '(', 0x02d8},
439 {'\'', '.', 0x02d9},
440 {'\'', '0', 0x02da},
441 {'\'', ';', 0x02db},
442 {'\'', '"', 0x02dd},
Bram Moolenaare3f915d2020-07-14 23:02:44 +0200443# define DG_START_GREEK 0x0386
Bram Moolenaar071d4272004-06-13 20:20:40 +0000444 {'A', '%', 0x0386},
445 {'E', '%', 0x0388},
446 {'Y', '%', 0x0389},
447 {'I', '%', 0x038a},
448 {'O', '%', 0x038c},
449 {'U', '%', 0x038e},
450 {'W', '%', 0x038f},
451 {'i', '3', 0x0390},
452 {'A', '*', 0x0391},
453 {'B', '*', 0x0392},
454 {'G', '*', 0x0393},
455 {'D', '*', 0x0394},
456 {'E', '*', 0x0395},
457 {'Z', '*', 0x0396},
458 {'Y', '*', 0x0397},
459 {'H', '*', 0x0398},
460 {'I', '*', 0x0399},
461 {'K', '*', 0x039a},
462 {'L', '*', 0x039b},
463 {'M', '*', 0x039c},
464 {'N', '*', 0x039d},
465 {'C', '*', 0x039e},
466 {'O', '*', 0x039f},
467 {'P', '*', 0x03a0},
468 {'R', '*', 0x03a1},
469 {'S', '*', 0x03a3},
470 {'T', '*', 0x03a4},
471 {'U', '*', 0x03a5},
472 {'F', '*', 0x03a6},
473 {'X', '*', 0x03a7},
474 {'Q', '*', 0x03a8},
475 {'W', '*', 0x03a9},
476 {'J', '*', 0x03aa},
477 {'V', '*', 0x03ab},
478 {'a', '%', 0x03ac},
479 {'e', '%', 0x03ad},
480 {'y', '%', 0x03ae},
481 {'i', '%', 0x03af},
482 {'u', '3', 0x03b0},
483 {'a', '*', 0x03b1},
484 {'b', '*', 0x03b2},
485 {'g', '*', 0x03b3},
486 {'d', '*', 0x03b4},
487 {'e', '*', 0x03b5},
488 {'z', '*', 0x03b6},
489 {'y', '*', 0x03b7},
490 {'h', '*', 0x03b8},
491 {'i', '*', 0x03b9},
492 {'k', '*', 0x03ba},
493 {'l', '*', 0x03bb},
494 {'m', '*', 0x03bc},
495 {'n', '*', 0x03bd},
496 {'c', '*', 0x03be},
497 {'o', '*', 0x03bf},
498 {'p', '*', 0x03c0},
499 {'r', '*', 0x03c1},
500 {'*', 's', 0x03c2},
501 {'s', '*', 0x03c3},
502 {'t', '*', 0x03c4},
503 {'u', '*', 0x03c5},
504 {'f', '*', 0x03c6},
505 {'x', '*', 0x03c7},
506 {'q', '*', 0x03c8},
507 {'w', '*', 0x03c9},
508 {'j', '*', 0x03ca},
509 {'v', '*', 0x03cb},
510 {'o', '%', 0x03cc},
511 {'u', '%', 0x03cd},
512 {'w', '%', 0x03ce},
513 {'\'', 'G', 0x03d8},
514 {',', 'G', 0x03d9},
515 {'T', '3', 0x03da},
516 {'t', '3', 0x03db},
517 {'M', '3', 0x03dc},
518 {'m', '3', 0x03dd},
519 {'K', '3', 0x03de},
520 {'k', '3', 0x03df},
521 {'P', '3', 0x03e0},
522 {'p', '3', 0x03e1},
523 {'\'', '%', 0x03f4},
524 {'j', '3', 0x03f5},
Bram Moolenaare3f915d2020-07-14 23:02:44 +0200525# define DG_START_CYRILLIC 0x0401
Bram Moolenaar071d4272004-06-13 20:20:40 +0000526 {'I', 'O', 0x0401},
527 {'D', '%', 0x0402},
528 {'G', '%', 0x0403},
529 {'I', 'E', 0x0404},
530 {'D', 'S', 0x0405},
531 {'I', 'I', 0x0406},
532 {'Y', 'I', 0x0407},
533 {'J', '%', 0x0408},
534 {'L', 'J', 0x0409},
535 {'N', 'J', 0x040a},
536 {'T', 's', 0x040b},
537 {'K', 'J', 0x040c},
538 {'V', '%', 0x040e},
539 {'D', 'Z', 0x040f},
540 {'A', '=', 0x0410},
541 {'B', '=', 0x0411},
542 {'V', '=', 0x0412},
543 {'G', '=', 0x0413},
544 {'D', '=', 0x0414},
545 {'E', '=', 0x0415},
546 {'Z', '%', 0x0416},
547 {'Z', '=', 0x0417},
548 {'I', '=', 0x0418},
549 {'J', '=', 0x0419},
550 {'K', '=', 0x041a},
551 {'L', '=', 0x041b},
552 {'M', '=', 0x041c},
553 {'N', '=', 0x041d},
554 {'O', '=', 0x041e},
555 {'P', '=', 0x041f},
556 {'R', '=', 0x0420},
557 {'S', '=', 0x0421},
558 {'T', '=', 0x0422},
559 {'U', '=', 0x0423},
560 {'F', '=', 0x0424},
561 {'H', '=', 0x0425},
562 {'C', '=', 0x0426},
563 {'C', '%', 0x0427},
564 {'S', '%', 0x0428},
565 {'S', 'c', 0x0429},
566 {'=', '"', 0x042a},
567 {'Y', '=', 0x042b},
568 {'%', '"', 0x042c},
569 {'J', 'E', 0x042d},
570 {'J', 'U', 0x042e},
571 {'J', 'A', 0x042f},
572 {'a', '=', 0x0430},
573 {'b', '=', 0x0431},
574 {'v', '=', 0x0432},
575 {'g', '=', 0x0433},
576 {'d', '=', 0x0434},
577 {'e', '=', 0x0435},
578 {'z', '%', 0x0436},
579 {'z', '=', 0x0437},
580 {'i', '=', 0x0438},
581 {'j', '=', 0x0439},
582 {'k', '=', 0x043a},
583 {'l', '=', 0x043b},
584 {'m', '=', 0x043c},
585 {'n', '=', 0x043d},
586 {'o', '=', 0x043e},
587 {'p', '=', 0x043f},
588 {'r', '=', 0x0440},
589 {'s', '=', 0x0441},
590 {'t', '=', 0x0442},
591 {'u', '=', 0x0443},
592 {'f', '=', 0x0444},
593 {'h', '=', 0x0445},
594 {'c', '=', 0x0446},
595 {'c', '%', 0x0447},
596 {'s', '%', 0x0448},
597 {'s', 'c', 0x0449},
598 {'=', '\'', 0x044a},
599 {'y', '=', 0x044b},
600 {'%', '\'', 0x044c},
601 {'j', 'e', 0x044d},
602 {'j', 'u', 0x044e},
603 {'j', 'a', 0x044f},
604 {'i', 'o', 0x0451},
605 {'d', '%', 0x0452},
606 {'g', '%', 0x0453},
607 {'i', 'e', 0x0454},
608 {'d', 's', 0x0455},
609 {'i', 'i', 0x0456},
610 {'y', 'i', 0x0457},
611 {'j', '%', 0x0458},
612 {'l', 'j', 0x0459},
613 {'n', 'j', 0x045a},
614 {'t', 's', 0x045b},
615 {'k', 'j', 0x045c},
616 {'v', '%', 0x045e},
617 {'d', 'z', 0x045f},
618 {'Y', '3', 0x0462},
619 {'y', '3', 0x0463},
620 {'O', '3', 0x046a},
621 {'o', '3', 0x046b},
622 {'F', '3', 0x0472},
623 {'f', '3', 0x0473},
624 {'V', '3', 0x0474},
625 {'v', '3', 0x0475},
626 {'C', '3', 0x0480},
627 {'c', '3', 0x0481},
628 {'G', '3', 0x0490},
629 {'g', '3', 0x0491},
Bram Moolenaare3f915d2020-07-14 23:02:44 +0200630# define DG_START_HEBREW 0x05d0
Bram Moolenaar071d4272004-06-13 20:20:40 +0000631 {'A', '+', 0x05d0},
632 {'B', '+', 0x05d1},
633 {'G', '+', 0x05d2},
634 {'D', '+', 0x05d3},
635 {'H', '+', 0x05d4},
636 {'W', '+', 0x05d5},
637 {'Z', '+', 0x05d6},
638 {'X', '+', 0x05d7},
639 {'T', 'j', 0x05d8},
640 {'J', '+', 0x05d9},
641 {'K', '%', 0x05da},
642 {'K', '+', 0x05db},
643 {'L', '+', 0x05dc},
644 {'M', '%', 0x05dd},
645 {'M', '+', 0x05de},
646 {'N', '%', 0x05df},
647 {'N', '+', 0x05e0},
648 {'S', '+', 0x05e1},
649 {'E', '+', 0x05e2},
650 {'P', '%', 0x05e3},
651 {'P', '+', 0x05e4},
652 {'Z', 'j', 0x05e5},
653 {'Z', 'J', 0x05e6},
654 {'Q', '+', 0x05e7},
655 {'R', '+', 0x05e8},
656 {'S', 'h', 0x05e9},
657 {'T', '+', 0x05ea},
Bram Moolenaare3f915d2020-07-14 23:02:44 +0200658# define DG_START_ARABIC 0x060c
Bram Moolenaar071d4272004-06-13 20:20:40 +0000659 {',', '+', 0x060c},
660 {';', '+', 0x061b},
661 {'?', '+', 0x061f},
662 {'H', '\'', 0x0621},
663 {'a', 'M', 0x0622},
664 {'a', 'H', 0x0623},
665 {'w', 'H', 0x0624},
666 {'a', 'h', 0x0625},
667 {'y', 'H', 0x0626},
668 {'a', '+', 0x0627},
669 {'b', '+', 0x0628},
670 {'t', 'm', 0x0629},
671 {'t', '+', 0x062a},
672 {'t', 'k', 0x062b},
673 {'g', '+', 0x062c},
674 {'h', 'k', 0x062d},
675 {'x', '+', 0x062e},
676 {'d', '+', 0x062f},
677 {'d', 'k', 0x0630},
678 {'r', '+', 0x0631},
679 {'z', '+', 0x0632},
680 {'s', '+', 0x0633},
681 {'s', 'n', 0x0634},
682 {'c', '+', 0x0635},
683 {'d', 'd', 0x0636},
684 {'t', 'j', 0x0637},
685 {'z', 'H', 0x0638},
686 {'e', '+', 0x0639},
687 {'i', '+', 0x063a},
688 {'+', '+', 0x0640},
689 {'f', '+', 0x0641},
690 {'q', '+', 0x0642},
691 {'k', '+', 0x0643},
692 {'l', '+', 0x0644},
693 {'m', '+', 0x0645},
694 {'n', '+', 0x0646},
695 {'h', '+', 0x0647},
696 {'w', '+', 0x0648},
697 {'j', '+', 0x0649},
698 {'y', '+', 0x064a},
699 {':', '+', 0x064b},
700 {'"', '+', 0x064c},
701 {'=', '+', 0x064d},
702 {'/', '+', 0x064e},
703 {'\'', '+', 0x064f},
704 {'1', '+', 0x0650},
705 {'3', '+', 0x0651},
706 {'0', '+', 0x0652},
707 {'a', 'S', 0x0670},
708 {'p', '+', 0x067e},
709 {'v', '+', 0x06a4},
710 {'g', 'f', 0x06af},
711 {'0', 'a', 0x06f0},
712 {'1', 'a', 0x06f1},
713 {'2', 'a', 0x06f2},
714 {'3', 'a', 0x06f3},
715 {'4', 'a', 0x06f4},
716 {'5', 'a', 0x06f5},
717 {'6', 'a', 0x06f6},
718 {'7', 'a', 0x06f7},
719 {'8', 'a', 0x06f8},
720 {'9', 'a', 0x06f9},
Bram Moolenaare3f915d2020-07-14 23:02:44 +0200721# define DG_START_LATIN_EXTENDED 0x1e02
Bram Moolenaar071d4272004-06-13 20:20:40 +0000722 {'B', '.', 0x1e02},
723 {'b', '.', 0x1e03},
724 {'B', '_', 0x1e06},
725 {'b', '_', 0x1e07},
726 {'D', '.', 0x1e0a},
727 {'d', '.', 0x1e0b},
728 {'D', '_', 0x1e0e},
729 {'d', '_', 0x1e0f},
730 {'D', ',', 0x1e10},
731 {'d', ',', 0x1e11},
732 {'F', '.', 0x1e1e},
733 {'f', '.', 0x1e1f},
734 {'G', '-', 0x1e20},
735 {'g', '-', 0x1e21},
736 {'H', '.', 0x1e22},
737 {'h', '.', 0x1e23},
738 {'H', ':', 0x1e26},
739 {'h', ':', 0x1e27},
740 {'H', ',', 0x1e28},
741 {'h', ',', 0x1e29},
742 {'K', '\'', 0x1e30},
743 {'k', '\'', 0x1e31},
744 {'K', '_', 0x1e34},
745 {'k', '_', 0x1e35},
746 {'L', '_', 0x1e3a},
747 {'l', '_', 0x1e3b},
748 {'M', '\'', 0x1e3e},
749 {'m', '\'', 0x1e3f},
750 {'M', '.', 0x1e40},
751 {'m', '.', 0x1e41},
752 {'N', '.', 0x1e44},
753 {'n', '.', 0x1e45},
754 {'N', '_', 0x1e48},
755 {'n', '_', 0x1e49},
756 {'P', '\'', 0x1e54},
757 {'p', '\'', 0x1e55},
758 {'P', '.', 0x1e56},
759 {'p', '.', 0x1e57},
760 {'R', '.', 0x1e58},
761 {'r', '.', 0x1e59},
762 {'R', '_', 0x1e5e},
763 {'r', '_', 0x1e5f},
764 {'S', '.', 0x1e60},
765 {'s', '.', 0x1e61},
766 {'T', '.', 0x1e6a},
767 {'t', '.', 0x1e6b},
768 {'T', '_', 0x1e6e},
769 {'t', '_', 0x1e6f},
770 {'V', '?', 0x1e7c},
771 {'v', '?', 0x1e7d},
772 {'W', '!', 0x1e80},
Bram Moolenaareae8ae12018-12-14 18:53:02 +0100773 {'W', '`', 0x1e80}, // extra alternative, easier to remember
Bram Moolenaar071d4272004-06-13 20:20:40 +0000774 {'w', '!', 0x1e81},
Bram Moolenaareae8ae12018-12-14 18:53:02 +0100775 {'w', '`', 0x1e81}, // extra alternative, easier to remember
Bram Moolenaar071d4272004-06-13 20:20:40 +0000776 {'W', '\'', 0x1e82},
777 {'w', '\'', 0x1e83},
778 {'W', ':', 0x1e84},
779 {'w', ':', 0x1e85},
780 {'W', '.', 0x1e86},
781 {'w', '.', 0x1e87},
782 {'X', '.', 0x1e8a},
783 {'x', '.', 0x1e8b},
784 {'X', ':', 0x1e8c},
785 {'x', ':', 0x1e8d},
786 {'Y', '.', 0x1e8e},
787 {'y', '.', 0x1e8f},
788 {'Z', '>', 0x1e90},
789 {'z', '>', 0x1e91},
790 {'Z', '_', 0x1e94},
791 {'z', '_', 0x1e95},
792 {'h', '_', 0x1e96},
793 {'t', ':', 0x1e97},
794 {'w', '0', 0x1e98},
795 {'y', '0', 0x1e99},
796 {'A', '2', 0x1ea2},
797 {'a', '2', 0x1ea3},
798 {'E', '2', 0x1eba},
799 {'e', '2', 0x1ebb},
800 {'E', '?', 0x1ebc},
801 {'e', '?', 0x1ebd},
802 {'I', '2', 0x1ec8},
803 {'i', '2', 0x1ec9},
804 {'O', '2', 0x1ece},
805 {'o', '2', 0x1ecf},
806 {'U', '2', 0x1ee6},
807 {'u', '2', 0x1ee7},
808 {'Y', '!', 0x1ef2},
Bram Moolenaareae8ae12018-12-14 18:53:02 +0100809 {'Y', '`', 0x1ef2}, // extra alternative, easier to remember
Bram Moolenaar071d4272004-06-13 20:20:40 +0000810 {'y', '!', 0x1ef3},
Bram Moolenaareae8ae12018-12-14 18:53:02 +0100811 {'y', '`', 0x1ef3}, // extra alternative, easier to remember
Bram Moolenaar071d4272004-06-13 20:20:40 +0000812 {'Y', '2', 0x1ef6},
813 {'y', '2', 0x1ef7},
814 {'Y', '?', 0x1ef8},
815 {'y', '?', 0x1ef9},
Bram Moolenaare3f915d2020-07-14 23:02:44 +0200816# define DG_START_GREEK_EXTENDED 0x1f00
Bram Moolenaar071d4272004-06-13 20:20:40 +0000817 {';', '\'', 0x1f00},
818 {',', '\'', 0x1f01},
819 {';', '!', 0x1f02},
820 {',', '!', 0x1f03},
821 {'?', ';', 0x1f04},
822 {'?', ',', 0x1f05},
823 {'!', ':', 0x1f06},
824 {'?', ':', 0x1f07},
Bram Moolenaare3f915d2020-07-14 23:02:44 +0200825# define DG_START_PUNCTUATION 0x2002
Bram Moolenaar071d4272004-06-13 20:20:40 +0000826 {'1', 'N', 0x2002},
827 {'1', 'M', 0x2003},
828 {'3', 'M', 0x2004},
829 {'4', 'M', 0x2005},
830 {'6', 'M', 0x2006},
831 {'1', 'T', 0x2009},
832 {'1', 'H', 0x200a},
833 {'-', '1', 0x2010},
834 {'-', 'N', 0x2013},
835 {'-', 'M', 0x2014},
836 {'-', '3', 0x2015},
837 {'!', '2', 0x2016},
838 {'=', '2', 0x2017},
839 {'\'', '6', 0x2018},
840 {'\'', '9', 0x2019},
841 {'.', '9', 0x201a},
842 {'9', '\'', 0x201b},
843 {'"', '6', 0x201c},
844 {'"', '9', 0x201d},
845 {':', '9', 0x201e},
846 {'9', '"', 0x201f},
847 {'/', '-', 0x2020},
848 {'/', '=', 0x2021},
Bram Moolenaar57ad94c2020-09-08 19:06:30 +0200849 {'o', 'o', 0x2022},
Bram Moolenaar071d4272004-06-13 20:20:40 +0000850 {'.', '.', 0x2025},
Bram Moolenaar81615512016-11-04 22:17:16 +0100851 {',', '.', 0x2026},
Bram Moolenaar071d4272004-06-13 20:20:40 +0000852 {'%', '0', 0x2030},
853 {'1', '\'', 0x2032},
854 {'2', '\'', 0x2033},
855 {'3', '\'', 0x2034},
856 {'1', '"', 0x2035},
857 {'2', '"', 0x2036},
858 {'3', '"', 0x2037},
859 {'C', 'a', 0x2038},
860 {'<', '1', 0x2039},
861 {'>', '1', 0x203a},
862 {':', 'X', 0x203b},
863 {'\'', '-', 0x203e},
864 {'/', 'f', 0x2044},
Bram Moolenaare3f915d2020-07-14 23:02:44 +0200865# define DG_START_SUB_SUPER 0x2070
Bram Moolenaar071d4272004-06-13 20:20:40 +0000866 {'0', 'S', 0x2070},
867 {'4', 'S', 0x2074},
868 {'5', 'S', 0x2075},
869 {'6', 'S', 0x2076},
870 {'7', 'S', 0x2077},
871 {'8', 'S', 0x2078},
872 {'9', 'S', 0x2079},
873 {'+', 'S', 0x207a},
874 {'-', 'S', 0x207b},
875 {'=', 'S', 0x207c},
876 {'(', 'S', 0x207d},
877 {')', 'S', 0x207e},
878 {'n', 'S', 0x207f},
879 {'0', 's', 0x2080},
880 {'1', 's', 0x2081},
881 {'2', 's', 0x2082},
882 {'3', 's', 0x2083},
883 {'4', 's', 0x2084},
884 {'5', 's', 0x2085},
885 {'6', 's', 0x2086},
886 {'7', 's', 0x2087},
887 {'8', 's', 0x2088},
888 {'9', 's', 0x2089},
889 {'+', 's', 0x208a},
890 {'-', 's', 0x208b},
891 {'=', 's', 0x208c},
892 {'(', 's', 0x208d},
893 {')', 's', 0x208e},
Bram Moolenaare3f915d2020-07-14 23:02:44 +0200894# define DG_START_CURRENCY 0x20a4
Bram Moolenaar071d4272004-06-13 20:20:40 +0000895 {'L', 'i', 0x20a4},
896 {'P', 't', 0x20a7},
897 {'W', '=', 0x20a9},
Bram Moolenaar5d18efe2019-12-01 21:11:22 +0100898 {'=', 'e', 0x20ac}, // euro
899 {'E', 'u', 0x20ac}, // euro
900 {'=', 'R', 0x20bd}, // rouble
901 {'=', 'P', 0x20bd}, // rouble
Bram Moolenaare3f915d2020-07-14 23:02:44 +0200902# define DG_START_OTHER1 0x2103
Bram Moolenaar071d4272004-06-13 20:20:40 +0000903 {'o', 'C', 0x2103},
904 {'c', 'o', 0x2105},
905 {'o', 'F', 0x2109},
906 {'N', '0', 0x2116},
907 {'P', 'O', 0x2117},
908 {'R', 'x', 0x211e},
909 {'S', 'M', 0x2120},
910 {'T', 'M', 0x2122},
911 {'O', 'm', 0x2126},
912 {'A', 'O', 0x212b},
913 {'1', '3', 0x2153},
914 {'2', '3', 0x2154},
915 {'1', '5', 0x2155},
916 {'2', '5', 0x2156},
917 {'3', '5', 0x2157},
918 {'4', '5', 0x2158},
919 {'1', '6', 0x2159},
920 {'5', '6', 0x215a},
921 {'1', '8', 0x215b},
922 {'3', '8', 0x215c},
923 {'5', '8', 0x215d},
924 {'7', '8', 0x215e},
Bram Moolenaare3f915d2020-07-14 23:02:44 +0200925# define DG_START_ROMAN 0x2160
Bram Moolenaar071d4272004-06-13 20:20:40 +0000926 {'1', 'R', 0x2160},
927 {'2', 'R', 0x2161},
928 {'3', 'R', 0x2162},
929 {'4', 'R', 0x2163},
930 {'5', 'R', 0x2164},
931 {'6', 'R', 0x2165},
932 {'7', 'R', 0x2166},
933 {'8', 'R', 0x2167},
934 {'9', 'R', 0x2168},
935 {'a', 'R', 0x2169},
936 {'b', 'R', 0x216a},
937 {'c', 'R', 0x216b},
938 {'1', 'r', 0x2170},
939 {'2', 'r', 0x2171},
940 {'3', 'r', 0x2172},
941 {'4', 'r', 0x2173},
942 {'5', 'r', 0x2174},
943 {'6', 'r', 0x2175},
944 {'7', 'r', 0x2176},
945 {'8', 'r', 0x2177},
946 {'9', 'r', 0x2178},
947 {'a', 'r', 0x2179},
948 {'b', 'r', 0x217a},
949 {'c', 'r', 0x217b},
Bram Moolenaare3f915d2020-07-14 23:02:44 +0200950# define DG_START_ARROWS 0x2190
Bram Moolenaar071d4272004-06-13 20:20:40 +0000951 {'<', '-', 0x2190},
952 {'-', '!', 0x2191},
953 {'-', '>', 0x2192},
954 {'-', 'v', 0x2193},
955 {'<', '>', 0x2194},
956 {'U', 'D', 0x2195},
957 {'<', '=', 0x21d0},
958 {'=', '>', 0x21d2},
959 {'=', '=', 0x21d4},
Bram Moolenaare3f915d2020-07-14 23:02:44 +0200960# define DG_START_MATH 0x2200
Bram Moolenaar071d4272004-06-13 20:20:40 +0000961 {'F', 'A', 0x2200},
962 {'d', 'P', 0x2202},
963 {'T', 'E', 0x2203},
964 {'/', '0', 0x2205},
965 {'D', 'E', 0x2206},
966 {'N', 'B', 0x2207},
967 {'(', '-', 0x2208},
968 {'-', ')', 0x220b},
969 {'*', 'P', 0x220f},
970 {'+', 'Z', 0x2211},
971 {'-', '2', 0x2212},
972 {'-', '+', 0x2213},
973 {'*', '-', 0x2217},
974 {'O', 'b', 0x2218},
975 {'S', 'b', 0x2219},
976 {'R', 'T', 0x221a},
977 {'0', '(', 0x221d},
978 {'0', '0', 0x221e},
979 {'-', 'L', 0x221f},
980 {'-', 'V', 0x2220},
981 {'P', 'P', 0x2225},
982 {'A', 'N', 0x2227},
983 {'O', 'R', 0x2228},
984 {'(', 'U', 0x2229},
985 {')', 'U', 0x222a},
986 {'I', 'n', 0x222b},
987 {'D', 'I', 0x222c},
988 {'I', 'o', 0x222e},
989 {'.', ':', 0x2234},
990 {':', '.', 0x2235},
991 {':', 'R', 0x2236},
992 {':', ':', 0x2237},
993 {'?', '1', 0x223c},
994 {'C', 'G', 0x223e},
995 {'?', '-', 0x2243},
996 {'?', '=', 0x2245},
997 {'?', '2', 0x2248},
998 {'=', '?', 0x224c},
999 {'H', 'I', 0x2253},
1000 {'!', '=', 0x2260},
1001 {'=', '3', 0x2261},
1002 {'=', '<', 0x2264},
1003 {'>', '=', 0x2265},
1004 {'<', '*', 0x226a},
1005 {'*', '>', 0x226b},
1006 {'!', '<', 0x226e},
1007 {'!', '>', 0x226f},
1008 {'(', 'C', 0x2282},
1009 {')', 'C', 0x2283},
1010 {'(', '_', 0x2286},
1011 {')', '_', 0x2287},
1012 {'0', '.', 0x2299},
1013 {'0', '2', 0x229a},
1014 {'-', 'T', 0x22a5},
1015 {'.', 'P', 0x22c5},
1016 {':', '3', 0x22ee},
1017 {'.', '3', 0x22ef},
Bram Moolenaare3f915d2020-07-14 23:02:44 +02001018# define DG_START_TECHNICAL 0x2302
Bram Moolenaar071d4272004-06-13 20:20:40 +00001019 {'E', 'h', 0x2302},
1020 {'<', '7', 0x2308},
1021 {'>', '7', 0x2309},
1022 {'7', '<', 0x230a},
1023 {'7', '>', 0x230b},
1024 {'N', 'I', 0x2310},
1025 {'(', 'A', 0x2312},
1026 {'T', 'R', 0x2315},
1027 {'I', 'u', 0x2320},
1028 {'I', 'l', 0x2321},
1029 {'<', '/', 0x2329},
1030 {'/', '>', 0x232a},
Bram Moolenaare3f915d2020-07-14 23:02:44 +02001031# define DG_START_OTHER2 0x2423
Bram Moolenaar071d4272004-06-13 20:20:40 +00001032 {'V', 's', 0x2423},
1033 {'1', 'h', 0x2440},
1034 {'3', 'h', 0x2441},
1035 {'2', 'h', 0x2442},
1036 {'4', 'h', 0x2443},
1037 {'1', 'j', 0x2446},
1038 {'2', 'j', 0x2447},
1039 {'3', 'j', 0x2448},
1040 {'4', 'j', 0x2449},
1041 {'1', '.', 0x2488},
1042 {'2', '.', 0x2489},
1043 {'3', '.', 0x248a},
1044 {'4', '.', 0x248b},
1045 {'5', '.', 0x248c},
1046 {'6', '.', 0x248d},
1047 {'7', '.', 0x248e},
1048 {'8', '.', 0x248f},
1049 {'9', '.', 0x2490},
Bram Moolenaare3f915d2020-07-14 23:02:44 +02001050# define DG_START_DRAWING 0x2500
Bram Moolenaar071d4272004-06-13 20:20:40 +00001051 {'h', 'h', 0x2500},
1052 {'H', 'H', 0x2501},
1053 {'v', 'v', 0x2502},
1054 {'V', 'V', 0x2503},
1055 {'3', '-', 0x2504},
1056 {'3', '_', 0x2505},
1057 {'3', '!', 0x2506},
1058 {'3', '/', 0x2507},
1059 {'4', '-', 0x2508},
1060 {'4', '_', 0x2509},
1061 {'4', '!', 0x250a},
1062 {'4', '/', 0x250b},
1063 {'d', 'r', 0x250c},
1064 {'d', 'R', 0x250d},
1065 {'D', 'r', 0x250e},
1066 {'D', 'R', 0x250f},
1067 {'d', 'l', 0x2510},
1068 {'d', 'L', 0x2511},
1069 {'D', 'l', 0x2512},
1070 {'L', 'D', 0x2513},
1071 {'u', 'r', 0x2514},
1072 {'u', 'R', 0x2515},
1073 {'U', 'r', 0x2516},
1074 {'U', 'R', 0x2517},
1075 {'u', 'l', 0x2518},
1076 {'u', 'L', 0x2519},
1077 {'U', 'l', 0x251a},
1078 {'U', 'L', 0x251b},
1079 {'v', 'r', 0x251c},
1080 {'v', 'R', 0x251d},
1081 {'V', 'r', 0x2520},
1082 {'V', 'R', 0x2523},
1083 {'v', 'l', 0x2524},
1084 {'v', 'L', 0x2525},
1085 {'V', 'l', 0x2528},
1086 {'V', 'L', 0x252b},
1087 {'d', 'h', 0x252c},
1088 {'d', 'H', 0x252f},
1089 {'D', 'h', 0x2530},
1090 {'D', 'H', 0x2533},
1091 {'u', 'h', 0x2534},
1092 {'u', 'H', 0x2537},
1093 {'U', 'h', 0x2538},
1094 {'U', 'H', 0x253b},
1095 {'v', 'h', 0x253c},
1096 {'v', 'H', 0x253f},
1097 {'V', 'h', 0x2542},
1098 {'V', 'H', 0x254b},
1099 {'F', 'D', 0x2571},
1100 {'B', 'D', 0x2572},
Bram Moolenaare3f915d2020-07-14 23:02:44 +02001101# define DG_START_BLOCK 0x2580
Bram Moolenaar071d4272004-06-13 20:20:40 +00001102 {'T', 'B', 0x2580},
1103 {'L', 'B', 0x2584},
1104 {'F', 'B', 0x2588},
1105 {'l', 'B', 0x258c},
1106 {'R', 'B', 0x2590},
1107 {'.', 'S', 0x2591},
1108 {':', 'S', 0x2592},
1109 {'?', 'S', 0x2593},
Bram Moolenaare3f915d2020-07-14 23:02:44 +02001110# define DG_START_SHAPES 0x25a0
Bram Moolenaar071d4272004-06-13 20:20:40 +00001111 {'f', 'S', 0x25a0},
1112 {'O', 'S', 0x25a1},
1113 {'R', 'O', 0x25a2},
1114 {'R', 'r', 0x25a3},
1115 {'R', 'F', 0x25a4},
1116 {'R', 'Y', 0x25a5},
1117 {'R', 'H', 0x25a6},
1118 {'R', 'Z', 0x25a7},
1119 {'R', 'K', 0x25a8},
1120 {'R', 'X', 0x25a9},
1121 {'s', 'B', 0x25aa},
1122 {'S', 'R', 0x25ac},
1123 {'O', 'r', 0x25ad},
1124 {'U', 'T', 0x25b2},
1125 {'u', 'T', 0x25b3},
1126 {'P', 'R', 0x25b6},
1127 {'T', 'r', 0x25b7},
1128 {'D', 't', 0x25bc},
1129 {'d', 'T', 0x25bd},
1130 {'P', 'L', 0x25c0},
1131 {'T', 'l', 0x25c1},
1132 {'D', 'b', 0x25c6},
1133 {'D', 'w', 0x25c7},
1134 {'L', 'Z', 0x25ca},
1135 {'0', 'm', 0x25cb},
1136 {'0', 'o', 0x25ce},
1137 {'0', 'M', 0x25cf},
1138 {'0', 'L', 0x25d0},
1139 {'0', 'R', 0x25d1},
1140 {'S', 'n', 0x25d8},
1141 {'I', 'c', 0x25d9},
1142 {'F', 'd', 0x25e2},
1143 {'B', 'd', 0x25e3},
Bram Moolenaare3f915d2020-07-14 23:02:44 +02001144# define DG_START_SYMBOLS 0x2605
Bram Moolenaar071d4272004-06-13 20:20:40 +00001145 {'*', '2', 0x2605},
1146 {'*', '1', 0x2606},
1147 {'<', 'H', 0x261c},
1148 {'>', 'H', 0x261e},
1149 {'0', 'u', 0x263a},
1150 {'0', 'U', 0x263b},
1151 {'S', 'U', 0x263c},
1152 {'F', 'm', 0x2640},
1153 {'M', 'l', 0x2642},
1154 {'c', 'S', 0x2660},
1155 {'c', 'H', 0x2661},
1156 {'c', 'D', 0x2662},
1157 {'c', 'C', 0x2663},
1158 {'M', 'd', 0x2669},
1159 {'M', '8', 0x266a},
1160 {'M', '2', 0x266b},
1161 {'M', 'b', 0x266d},
1162 {'M', 'x', 0x266e},
1163 {'M', 'X', 0x266f},
Bram Moolenaare3f915d2020-07-14 23:02:44 +02001164# define DG_START_DINGBATS 0x2713
Bram Moolenaar071d4272004-06-13 20:20:40 +00001165 {'O', 'K', 0x2713},
1166 {'X', 'X', 0x2717},
1167 {'-', 'X', 0x2720},
Bram Moolenaare3f915d2020-07-14 23:02:44 +02001168# define DG_START_CJK_SYMBOLS 0x3000
Bram Moolenaar071d4272004-06-13 20:20:40 +00001169 {'I', 'S', 0x3000},
1170 {',', '_', 0x3001},
1171 {'.', '_', 0x3002},
1172 {'+', '"', 0x3003},
1173 {'+', '_', 0x3004},
1174 {'*', '_', 0x3005},
1175 {';', '_', 0x3006},
1176 {'0', '_', 0x3007},
1177 {'<', '+', 0x300a},
1178 {'>', '+', 0x300b},
1179 {'<', '\'', 0x300c},
1180 {'>', '\'', 0x300d},
1181 {'<', '"', 0x300e},
1182 {'>', '"', 0x300f},
1183 {'(', '"', 0x3010},
1184 {')', '"', 0x3011},
1185 {'=', 'T', 0x3012},
1186 {'=', '_', 0x3013},
1187 {'(', '\'', 0x3014},
1188 {')', '\'', 0x3015},
1189 {'(', 'I', 0x3016},
1190 {')', 'I', 0x3017},
1191 {'-', '?', 0x301c},
Bram Moolenaare3f915d2020-07-14 23:02:44 +02001192# define DG_START_HIRAGANA 0x3041
Bram Moolenaar071d4272004-06-13 20:20:40 +00001193 {'A', '5', 0x3041},
1194 {'a', '5', 0x3042},
1195 {'I', '5', 0x3043},
1196 {'i', '5', 0x3044},
1197 {'U', '5', 0x3045},
1198 {'u', '5', 0x3046},
1199 {'E', '5', 0x3047},
1200 {'e', '5', 0x3048},
1201 {'O', '5', 0x3049},
1202 {'o', '5', 0x304a},
1203 {'k', 'a', 0x304b},
1204 {'g', 'a', 0x304c},
1205 {'k', 'i', 0x304d},
1206 {'g', 'i', 0x304e},
1207 {'k', 'u', 0x304f},
1208 {'g', 'u', 0x3050},
1209 {'k', 'e', 0x3051},
1210 {'g', 'e', 0x3052},
1211 {'k', 'o', 0x3053},
1212 {'g', 'o', 0x3054},
1213 {'s', 'a', 0x3055},
1214 {'z', 'a', 0x3056},
1215 {'s', 'i', 0x3057},
1216 {'z', 'i', 0x3058},
1217 {'s', 'u', 0x3059},
1218 {'z', 'u', 0x305a},
1219 {'s', 'e', 0x305b},
1220 {'z', 'e', 0x305c},
1221 {'s', 'o', 0x305d},
1222 {'z', 'o', 0x305e},
1223 {'t', 'a', 0x305f},
1224 {'d', 'a', 0x3060},
1225 {'t', 'i', 0x3061},
1226 {'d', 'i', 0x3062},
1227 {'t', 'U', 0x3063},
1228 {'t', 'u', 0x3064},
1229 {'d', 'u', 0x3065},
1230 {'t', 'e', 0x3066},
1231 {'d', 'e', 0x3067},
1232 {'t', 'o', 0x3068},
1233 {'d', 'o', 0x3069},
1234 {'n', 'a', 0x306a},
1235 {'n', 'i', 0x306b},
1236 {'n', 'u', 0x306c},
1237 {'n', 'e', 0x306d},
1238 {'n', 'o', 0x306e},
1239 {'h', 'a', 0x306f},
1240 {'b', 'a', 0x3070},
1241 {'p', 'a', 0x3071},
1242 {'h', 'i', 0x3072},
1243 {'b', 'i', 0x3073},
1244 {'p', 'i', 0x3074},
1245 {'h', 'u', 0x3075},
1246 {'b', 'u', 0x3076},
1247 {'p', 'u', 0x3077},
1248 {'h', 'e', 0x3078},
1249 {'b', 'e', 0x3079},
1250 {'p', 'e', 0x307a},
1251 {'h', 'o', 0x307b},
1252 {'b', 'o', 0x307c},
1253 {'p', 'o', 0x307d},
1254 {'m', 'a', 0x307e},
1255 {'m', 'i', 0x307f},
1256 {'m', 'u', 0x3080},
1257 {'m', 'e', 0x3081},
1258 {'m', 'o', 0x3082},
1259 {'y', 'A', 0x3083},
1260 {'y', 'a', 0x3084},
1261 {'y', 'U', 0x3085},
1262 {'y', 'u', 0x3086},
1263 {'y', 'O', 0x3087},
1264 {'y', 'o', 0x3088},
1265 {'r', 'a', 0x3089},
1266 {'r', 'i', 0x308a},
1267 {'r', 'u', 0x308b},
1268 {'r', 'e', 0x308c},
1269 {'r', 'o', 0x308d},
1270 {'w', 'A', 0x308e},
1271 {'w', 'a', 0x308f},
1272 {'w', 'i', 0x3090},
1273 {'w', 'e', 0x3091},
1274 {'w', 'o', 0x3092},
1275 {'n', '5', 0x3093},
1276 {'v', 'u', 0x3094},
1277 {'"', '5', 0x309b},
1278 {'0', '5', 0x309c},
1279 {'*', '5', 0x309d},
1280 {'+', '5', 0x309e},
Bram Moolenaare3f915d2020-07-14 23:02:44 +02001281# define DG_START_KATAKANA 0x30a1
Bram Moolenaar071d4272004-06-13 20:20:40 +00001282 {'a', '6', 0x30a1},
1283 {'A', '6', 0x30a2},
1284 {'i', '6', 0x30a3},
1285 {'I', '6', 0x30a4},
1286 {'u', '6', 0x30a5},
1287 {'U', '6', 0x30a6},
1288 {'e', '6', 0x30a7},
1289 {'E', '6', 0x30a8},
1290 {'o', '6', 0x30a9},
1291 {'O', '6', 0x30aa},
1292 {'K', 'a', 0x30ab},
1293 {'G', 'a', 0x30ac},
1294 {'K', 'i', 0x30ad},
1295 {'G', 'i', 0x30ae},
1296 {'K', 'u', 0x30af},
1297 {'G', 'u', 0x30b0},
1298 {'K', 'e', 0x30b1},
1299 {'G', 'e', 0x30b2},
1300 {'K', 'o', 0x30b3},
1301 {'G', 'o', 0x30b4},
1302 {'S', 'a', 0x30b5},
1303 {'Z', 'a', 0x30b6},
1304 {'S', 'i', 0x30b7},
1305 {'Z', 'i', 0x30b8},
1306 {'S', 'u', 0x30b9},
1307 {'Z', 'u', 0x30ba},
1308 {'S', 'e', 0x30bb},
1309 {'Z', 'e', 0x30bc},
1310 {'S', 'o', 0x30bd},
1311 {'Z', 'o', 0x30be},
1312 {'T', 'a', 0x30bf},
1313 {'D', 'a', 0x30c0},
1314 {'T', 'i', 0x30c1},
1315 {'D', 'i', 0x30c2},
1316 {'T', 'U', 0x30c3},
1317 {'T', 'u', 0x30c4},
1318 {'D', 'u', 0x30c5},
1319 {'T', 'e', 0x30c6},
1320 {'D', 'e', 0x30c7},
1321 {'T', 'o', 0x30c8},
1322 {'D', 'o', 0x30c9},
1323 {'N', 'a', 0x30ca},
1324 {'N', 'i', 0x30cb},
1325 {'N', 'u', 0x30cc},
1326 {'N', 'e', 0x30cd},
1327 {'N', 'o', 0x30ce},
1328 {'H', 'a', 0x30cf},
1329 {'B', 'a', 0x30d0},
1330 {'P', 'a', 0x30d1},
1331 {'H', 'i', 0x30d2},
1332 {'B', 'i', 0x30d3},
1333 {'P', 'i', 0x30d4},
1334 {'H', 'u', 0x30d5},
1335 {'B', 'u', 0x30d6},
1336 {'P', 'u', 0x30d7},
1337 {'H', 'e', 0x30d8},
1338 {'B', 'e', 0x30d9},
1339 {'P', 'e', 0x30da},
1340 {'H', 'o', 0x30db},
1341 {'B', 'o', 0x30dc},
1342 {'P', 'o', 0x30dd},
1343 {'M', 'a', 0x30de},
1344 {'M', 'i', 0x30df},
1345 {'M', 'u', 0x30e0},
1346 {'M', 'e', 0x30e1},
1347 {'M', 'o', 0x30e2},
1348 {'Y', 'A', 0x30e3},
1349 {'Y', 'a', 0x30e4},
1350 {'Y', 'U', 0x30e5},
1351 {'Y', 'u', 0x30e6},
1352 {'Y', 'O', 0x30e7},
1353 {'Y', 'o', 0x30e8},
1354 {'R', 'a', 0x30e9},
1355 {'R', 'i', 0x30ea},
1356 {'R', 'u', 0x30eb},
1357 {'R', 'e', 0x30ec},
1358 {'R', 'o', 0x30ed},
1359 {'W', 'A', 0x30ee},
1360 {'W', 'a', 0x30ef},
1361 {'W', 'i', 0x30f0},
1362 {'W', 'e', 0x30f1},
1363 {'W', 'o', 0x30f2},
1364 {'N', '6', 0x30f3},
1365 {'V', 'u', 0x30f4},
1366 {'K', 'A', 0x30f5},
1367 {'K', 'E', 0x30f6},
1368 {'V', 'a', 0x30f7},
1369 {'V', 'i', 0x30f8},
1370 {'V', 'e', 0x30f9},
1371 {'V', 'o', 0x30fa},
1372 {'.', '6', 0x30fb},
1373 {'-', '6', 0x30fc},
1374 {'*', '6', 0x30fd},
1375 {'+', '6', 0x30fe},
Bram Moolenaare3f915d2020-07-14 23:02:44 +02001376# define DG_START_BOPOMOFO 0x3105
Bram Moolenaar071d4272004-06-13 20:20:40 +00001377 {'b', '4', 0x3105},
1378 {'p', '4', 0x3106},
1379 {'m', '4', 0x3107},
1380 {'f', '4', 0x3108},
1381 {'d', '4', 0x3109},
1382 {'t', '4', 0x310a},
1383 {'n', '4', 0x310b},
1384 {'l', '4', 0x310c},
1385 {'g', '4', 0x310d},
1386 {'k', '4', 0x310e},
1387 {'h', '4', 0x310f},
1388 {'j', '4', 0x3110},
1389 {'q', '4', 0x3111},
1390 {'x', '4', 0x3112},
1391 {'z', 'h', 0x3113},
1392 {'c', 'h', 0x3114},
1393 {'s', 'h', 0x3115},
1394 {'r', '4', 0x3116},
1395 {'z', '4', 0x3117},
1396 {'c', '4', 0x3118},
1397 {'s', '4', 0x3119},
1398 {'a', '4', 0x311a},
1399 {'o', '4', 0x311b},
1400 {'e', '4', 0x311c},
1401 {'a', 'i', 0x311e},
1402 {'e', 'i', 0x311f},
1403 {'a', 'u', 0x3120},
1404 {'o', 'u', 0x3121},
1405 {'a', 'n', 0x3122},
1406 {'e', 'n', 0x3123},
1407 {'a', 'N', 0x3124},
1408 {'e', 'N', 0x3125},
1409 {'e', 'r', 0x3126},
1410 {'i', '4', 0x3127},
1411 {'u', '4', 0x3128},
1412 {'i', 'u', 0x3129},
1413 {'v', '4', 0x312a},
1414 {'n', 'G', 0x312b},
1415 {'g', 'n', 0x312c},
Bram Moolenaare3f915d2020-07-14 23:02:44 +02001416# define DG_START_OTHER3 0x3220
Bram Moolenaar071d4272004-06-13 20:20:40 +00001417 {'1', 'c', 0x3220},
1418 {'2', 'c', 0x3221},
1419 {'3', 'c', 0x3222},
1420 {'4', 'c', 0x3223},
1421 {'5', 'c', 0x3224},
1422 {'6', 'c', 0x3225},
1423 {'7', 'c', 0x3226},
1424 {'8', 'c', 0x3227},
1425 {'9', 'c', 0x3228},
Bram Moolenaar5d18efe2019-12-01 21:11:22 +01001426 // code points 0xe000 - 0xefff excluded, they have no assigned
1427 // characters, only used in proposals.
Bram Moolenaar071d4272004-06-13 20:20:40 +00001428 {'f', 'f', 0xfb00},
1429 {'f', 'i', 0xfb01},
1430 {'f', 'l', 0xfb02},
1431 {'f', 't', 0xfb05},
1432 {'s', 't', 0xfb06},
Bram Moolenaar5f91c0c2008-01-03 16:54:33 +00001433
Bram Moolenaare27d6e62022-08-30 15:05:30 +01001434 {NUL, NUL, NUL} // end marker
1435};
Bram Moolenaar071d4272004-06-13 20:20:40 +00001436
1437/*
1438 * handle digraphs after typing a character
1439 */
1440 int
Bram Moolenaar7454a062016-01-30 15:14:10 +01001441do_digraph(int c)
Bram Moolenaar071d4272004-06-13 20:20:40 +00001442{
Bram Moolenaar5d18efe2019-12-01 21:11:22 +01001443 static int backspaced; // character before K_BS
1444 static int lastchar; // last typed character
Bram Moolenaar071d4272004-06-13 20:20:40 +00001445
Bram Moolenaar5d18efe2019-12-01 21:11:22 +01001446 if (c == -1) // init values
Bram Moolenaar071d4272004-06-13 20:20:40 +00001447 {
1448 backspaced = -1;
1449 }
1450 else if (p_dg)
1451 {
1452 if (backspaced >= 0)
h-east29b85712021-07-26 21:54:04 +02001453 c = digraph_get(backspaced, c, FALSE);
Bram Moolenaar071d4272004-06-13 20:20:40 +00001454 backspaced = -1;
1455 if ((c == K_BS || c == Ctrl_H) && lastchar >= 0)
1456 backspaced = lastchar;
1457 }
1458 lastchar = c;
1459 return c;
1460}
1461
1462/*
Bram Moolenaar5f73ef82018-02-27 21:09:30 +01001463 * Find a digraph for "val". If found return the string to display it.
1464 * If not found return NULL.
1465 */
1466 char_u *
Bram Moolenaarbc5020a2018-06-16 17:25:22 +02001467get_digraph_for_char(int val_arg)
Bram Moolenaar5f73ef82018-02-27 21:09:30 +01001468{
Bram Moolenaarbc5020a2018-06-16 17:25:22 +02001469 int val = val_arg;
Bram Moolenaar5f73ef82018-02-27 21:09:30 +01001470 int i;
1471 int use_defaults;
1472 digr_T *dp;
1473 static char_u r[3];
1474
Bram Moolenaareae8ae12018-12-14 18:53:02 +01001475#if defined(USE_UNICODE_DIGRAPHS)
Bram Moolenaarbc5020a2018-06-16 17:25:22 +02001476 if (!enc_utf8)
1477 {
1478 char_u buf[6], *to;
1479 vimconv_T vc;
1480
1481 // convert the character from 'encoding' to Unicode
1482 i = mb_char2bytes(val, buf);
1483 vc.vc_type = CONV_NONE;
1484 if (convert_setup(&vc, p_enc, (char_u *)"utf-8") == OK)
1485 {
1486 vc.vc_fail = TRUE;
1487 to = string_convert(&vc, buf, &i);
1488 if (to != NULL)
1489 {
1490 val = utf_ptr2char(to);
1491 vim_free(to);
1492 }
1493 (void)convert_setup(&vc, NULL, NULL);
1494 }
1495 }
1496#endif
1497
Bram Moolenaar5f73ef82018-02-27 21:09:30 +01001498 for (use_defaults = 0; use_defaults <= 1; use_defaults++)
1499 {
1500 if (use_defaults == 0)
1501 dp = (digr_T *)user_digraphs.ga_data;
1502 else
1503 dp = digraphdefault;
1504 for (i = 0; use_defaults ? dp->char1 != NUL
1505 : i < user_digraphs.ga_len; ++i)
1506 {
1507 if (dp->result == val)
1508 {
1509 r[0] = dp->char1;
1510 r[1] = dp->char2;
1511 r[2] = NUL;
1512 return r;
1513 }
1514 ++dp;
1515 }
1516 }
1517 return NULL;
1518}
1519
1520/*
Bram Moolenaar071d4272004-06-13 20:20:40 +00001521 * Get a digraph. Used after typing CTRL-K on the command line or in normal
1522 * mode.
1523 * Returns composed character, or NUL when ESC was used.
1524 */
1525 int
Bram Moolenaar7454a062016-01-30 15:14:10 +01001526get_digraph(
Bram Moolenaar5d18efe2019-12-01 21:11:22 +01001527 int cmdline) // TRUE when called from the cmdline
Bram Moolenaar071d4272004-06-13 20:20:40 +00001528{
1529 int c, cc;
1530
1531 ++no_mapping;
1532 ++allow_keys;
Bram Moolenaar61abfd12007-09-13 16:26:47 +00001533 c = plain_vgetc();
Bram Moolenaar071d4272004-06-13 20:20:40 +00001534 --no_mapping;
1535 --allow_keys;
Yegappan Lakshmanan1cfb14a2023-01-09 19:04:23 +00001536
1537 if (c == ESC) // ESC cancels CTRL-K
1538 return NUL;
1539
1540 if (IS_SPECIAL(c)) // insert special key code
1541 return c;
1542 if (cmdline)
Bram Moolenaar071d4272004-06-13 20:20:40 +00001543 {
Yegappan Lakshmanan1cfb14a2023-01-09 19:04:23 +00001544 if (char2cells(c) == 1
Bram Moolenaar071d4272004-06-13 20:20:40 +00001545#if defined(FEAT_CRYPT) || defined(FEAT_EVAL)
Yegappan Lakshmanan1cfb14a2023-01-09 19:04:23 +00001546 && cmdline_star == 0
Bram Moolenaar071d4272004-06-13 20:20:40 +00001547#endif
Yegappan Lakshmanan1cfb14a2023-01-09 19:04:23 +00001548 )
1549 putcmdline(c, TRUE);
Bram Moolenaar071d4272004-06-13 20:20:40 +00001550 }
Yegappan Lakshmanan1cfb14a2023-01-09 19:04:23 +00001551 else
1552 add_to_showcmd(c);
1553 ++no_mapping;
1554 ++allow_keys;
1555 cc = plain_vgetc();
1556 --no_mapping;
1557 --allow_keys;
1558 if (cc != ESC) // ESC cancels CTRL-K
1559 return digraph_get(c, cc, TRUE);
Bram Moolenaar071d4272004-06-13 20:20:40 +00001560 return NUL;
1561}
1562
1563/*
1564 * Lookup the pair "char1", "char2" in the digraph tables.
1565 * If no match, return "char2".
Bram Moolenaar70b2a562012-01-10 22:26:17 +01001566 * If "meta_char" is TRUE and "char1" is a space, return "char2" | 0x80.
Bram Moolenaar071d4272004-06-13 20:20:40 +00001567 */
1568 static int
Bram Moolenaar7454a062016-01-30 15:14:10 +01001569getexactdigraph(int char1, int char2, int meta_char)
Bram Moolenaar071d4272004-06-13 20:20:40 +00001570{
1571 int i;
1572 int retval = 0;
1573 digr_T *dp;
1574
1575 if (IS_SPECIAL(char1) || IS_SPECIAL(char2))
1576 return char2;
1577
1578 /*
1579 * Search user digraphs first.
1580 */
1581 dp = (digr_T *)user_digraphs.ga_data;
1582 for (i = 0; i < user_digraphs.ga_len; ++i)
1583 {
1584 if ((int)dp->char1 == char1 && (int)dp->char2 == char2)
1585 {
1586 retval = dp->result;
1587 break;
1588 }
1589 ++dp;
1590 }
1591
1592 /*
1593 * Search default digraphs.
1594 */
1595 if (retval == 0)
1596 {
1597 dp = digraphdefault;
dundargocb2209f22022-09-24 15:55:27 +01001598 while (dp->char1 != 0)
Bram Moolenaar071d4272004-06-13 20:20:40 +00001599 {
1600 if ((int)dp->char1 == char1 && (int)dp->char2 == char2)
1601 {
1602 retval = dp->result;
1603 break;
1604 }
1605 ++dp;
1606 }
1607 }
Bram Moolenaar13505972019-01-24 15:04:48 +01001608#ifdef USE_UNICODE_DIGRAPHS
Bram Moolenaar071d4272004-06-13 20:20:40 +00001609 if (retval != 0 && !enc_utf8)
1610 {
1611 char_u buf[6], *to;
1612 vimconv_T vc;
1613
1614 /*
1615 * Convert the Unicode digraph to 'encoding'.
1616 */
1617 i = utf_char2bytes(retval, buf);
1618 retval = 0;
1619 vc.vc_type = CONV_NONE;
1620 if (convert_setup(&vc, (char_u *)"utf-8", p_enc) == OK)
1621 {
1622 vc.vc_fail = TRUE;
1623 to = string_convert(&vc, buf, &i);
1624 if (to != NULL)
1625 {
1626 retval = (*mb_ptr2char)(to);
1627 vim_free(to);
1628 }
1629 (void)convert_setup(&vc, NULL, NULL);
1630 }
1631 }
Bram Moolenaar13505972019-01-24 15:04:48 +01001632#endif
Bram Moolenaar071d4272004-06-13 20:20:40 +00001633
Bram Moolenaar5d18efe2019-12-01 21:11:22 +01001634 // Ignore multi-byte characters when not in multi-byte mode.
Bram Moolenaar071d4272004-06-13 20:20:40 +00001635 if (!has_mbyte && retval > 0xff)
1636 retval = 0;
Bram Moolenaar071d4272004-06-13 20:20:40 +00001637
Bram Moolenaar5d18efe2019-12-01 21:11:22 +01001638 if (retval == 0) // digraph deleted or not found
Bram Moolenaar071d4272004-06-13 20:20:40 +00001639 {
Bram Moolenaar5d18efe2019-12-01 21:11:22 +01001640 if (char1 == ' ' && meta_char) // <space> <char> --> meta-char
Bram Moolenaar071d4272004-06-13 20:20:40 +00001641 return (char2 | 0x80);
1642 return char2;
1643 }
1644 return retval;
1645}
1646
1647/*
1648 * Get digraph.
1649 * Allow for both char1-char2 and char2-char1
1650 */
1651 int
h-east29b85712021-07-26 21:54:04 +02001652digraph_get(int char1, int char2, int meta_char)
Bram Moolenaar071d4272004-06-13 20:20:40 +00001653{
1654 int retval;
1655
Bram Moolenaar70b2a562012-01-10 22:26:17 +01001656 if (((retval = getexactdigraph(char1, char2, meta_char)) == char2)
Bram Moolenaar071d4272004-06-13 20:20:40 +00001657 && (char1 != char2)
Bram Moolenaar70b2a562012-01-10 22:26:17 +01001658 && ((retval = getexactdigraph(char2, char1, meta_char)) == char1))
Bram Moolenaar071d4272004-06-13 20:20:40 +00001659 return char2;
1660 return retval;
1661}
1662
1663/*
mityu61065042021-07-19 20:07:21 +02001664 * Add a digraph to the digraph table.
1665 */
1666 static void
1667registerdigraph(int char1, int char2, int n)
1668{
1669 int i;
1670 digr_T *dp;
1671
1672 // If the digraph already exists, replace "result".
1673 dp = (digr_T *)user_digraphs.ga_data;
1674 for (i = 0; i < user_digraphs.ga_len; ++i)
1675 {
1676 if ((int)dp->char1 == char1 && (int)dp->char2 == char2)
1677 {
1678 dp->result = n;
1679 return;
1680 }
1681 ++dp;
1682 }
1683
1684 // Add a new digraph to the table.
Yegappan Lakshmananfadc02a2023-01-27 21:03:12 +00001685 if (ga_grow(&user_digraphs, 1) == FAIL)
Yegappan Lakshmanan465de3a2022-12-26 12:50:04 +00001686 return;
1687
1688 dp = (digr_T *)user_digraphs.ga_data + user_digraphs.ga_len;
1689 dp->char1 = char1;
1690 dp->char2 = char2;
1691 dp->result = n;
1692 ++user_digraphs.ga_len;
mityu61065042021-07-19 20:07:21 +02001693}
1694
1695/*
1696 * Check the characters are valid for a digraph.
1697 * If they are valid, returns TRUE; otherwise, give an error message and
1698 * returns FALSE.
1699 */
Yegappan Lakshmanan8ee52af2021-08-09 19:59:06 +02001700 static int
mityu61065042021-07-19 20:07:21 +02001701check_digraph_chars_valid(int char1, int char2)
1702{
1703 if (char2 == 0)
1704 {
1705 char_u msg[MB_MAXBYTES + 1];
1706
1707 msg[mb_char2bytes(char1, msg)] = NUL;
1708
1709 semsg(_(e_digraph_must_be_just_two_characters_str), msg);
1710 return FALSE;
1711 }
1712 if (char1 == ESC || char2 == ESC)
1713 {
Bram Moolenaare1242042021-12-16 20:56:57 +00001714 emsg(_(e_escape_not_allowed_in_digraph));
mityu61065042021-07-19 20:07:21 +02001715 return FALSE;
1716 }
1717 return TRUE;
1718}
1719
1720
1721
1722/*
Bram Moolenaar071d4272004-06-13 20:20:40 +00001723 * Add the digraphs in the argument to the digraph table.
1724 * format: {c1}{c2} char {c1}{c2} char ...
1725 */
1726 void
Bram Moolenaar7454a062016-01-30 15:14:10 +01001727putdigraph(char_u *str)
Bram Moolenaar071d4272004-06-13 20:20:40 +00001728{
1729 int char1, char2, n;
Bram Moolenaar071d4272004-06-13 20:20:40 +00001730
1731 while (*str != NUL)
1732 {
1733 str = skipwhite(str);
1734 if (*str == NUL)
1735 return;
1736 char1 = *str++;
1737 char2 = *str++;
mityu61065042021-07-19 20:07:21 +02001738
1739 if (!check_digraph_chars_valid(char1, char2))
Bram Moolenaar071d4272004-06-13 20:20:40 +00001740 return;
mityu61065042021-07-19 20:07:21 +02001741
Bram Moolenaar071d4272004-06-13 20:20:40 +00001742 str = skipwhite(str);
1743 if (!VIM_ISDIGIT(*str))
1744 {
Bram Moolenaare29a27f2021-07-20 21:07:36 +02001745 emsg(_(e_number_expected));
Bram Moolenaar071d4272004-06-13 20:20:40 +00001746 return;
1747 }
1748 n = getdigits(&str);
1749
mityu61065042021-07-19 20:07:21 +02001750 registerdigraph(char1, char2, n);
Bram Moolenaar071d4272004-06-13 20:20:40 +00001751 }
1752}
1753
Bram Moolenaareae8ae12018-12-14 18:53:02 +01001754#if defined(USE_UNICODE_DIGRAPHS)
1755 static void
1756digraph_header(char *msg)
1757{
1758 if (msg_col > 0)
1759 msg_putchar('\n');
1760 msg_outtrans_attr((char_u *)msg, HL_ATTR(HLF_CM));
1761 msg_putchar('\n');
1762}
1763#endif
1764
Bram Moolenaar071d4272004-06-13 20:20:40 +00001765 void
Bram Moolenaareae8ae12018-12-14 18:53:02 +01001766listdigraphs(int use_headers)
Bram Moolenaar071d4272004-06-13 20:20:40 +00001767{
1768 int i;
1769 digr_T *dp;
Bram Moolenaareae8ae12018-12-14 18:53:02 +01001770 result_T previous = 0;
Bram Moolenaar071d4272004-06-13 20:20:40 +00001771
1772 msg_putchar('\n');
1773
1774 dp = digraphdefault;
dundargocb2209f22022-09-24 15:55:27 +01001775 while (dp->char1 != NUL && !got_int)
Bram Moolenaar071d4272004-06-13 20:20:40 +00001776 {
Bram Moolenaareae8ae12018-12-14 18:53:02 +01001777#if defined(USE_UNICODE_DIGRAPHS)
Bram Moolenaar071d4272004-06-13 20:20:40 +00001778 digr_T tmp;
1779
Bram Moolenaar5d18efe2019-12-01 21:11:22 +01001780 // May need to convert the result to 'encoding'.
Bram Moolenaar071d4272004-06-13 20:20:40 +00001781 tmp.char1 = dp->char1;
1782 tmp.char2 = dp->char2;
1783 tmp.result = getexactdigraph(tmp.char1, tmp.char2, FALSE);
1784 if (tmp.result != 0 && tmp.result != tmp.char2
1785 && (has_mbyte || tmp.result <= 255))
Bram Moolenaareae8ae12018-12-14 18:53:02 +01001786 printdigraph(&tmp, use_headers ? &previous : NULL);
Bram Moolenaar071d4272004-06-13 20:20:40 +00001787#else
1788
1789 if (getexactdigraph(dp->char1, dp->char2, FALSE) == dp->result
Bram Moolenaar13505972019-01-24 15:04:48 +01001790 && (has_mbyte || dp->result <= 255))
Bram Moolenaareae8ae12018-12-14 18:53:02 +01001791 printdigraph(dp, use_headers ? &previous : NULL);
Bram Moolenaar071d4272004-06-13 20:20:40 +00001792#endif
1793 ++dp;
1794 ui_breakcheck();
1795 }
1796
1797 dp = (digr_T *)user_digraphs.ga_data;
1798 for (i = 0; i < user_digraphs.ga_len && !got_int; ++i)
1799 {
Bram Moolenaareae8ae12018-12-14 18:53:02 +01001800#if defined(USE_UNICODE_DIGRAPHS)
1801 if (previous >= 0 && use_headers)
1802 digraph_header(_("Custom"));
1803 previous = -1;
1804#endif
1805 printdigraph(dp, NULL);
Bram Moolenaar071d4272004-06-13 20:20:40 +00001806 ui_breakcheck();
1807 ++dp;
1808 }
Bram Moolenaara4d158b2022-08-14 14:17:45 +01001809
1810 // clear screen, because some digraphs may be wrong, in which case we
1811 // messed up ScreenLines
Bram Moolenaar471c0fa2022-08-22 15:19:16 +01001812 set_must_redraw(UPD_CLEAR);
Bram Moolenaar071d4272004-06-13 20:20:40 +00001813}
1814
mityu61065042021-07-19 20:07:21 +02001815 static void
h-east29b85712021-07-26 21:54:04 +02001816digraph_getlist_appendpair(digr_T *dp, list_T *l)
mityu61065042021-07-19 20:07:21 +02001817{
1818 char_u buf[30];
1819 char_u *p;
1820 list_T *l2;
1821 listitem_T *li, *li2;
1822
1823
1824 li = listitem_alloc();
1825 if (li == NULL)
1826 return;
1827 list_append(l, li);
1828 li->li_tv.v_type = VAR_LIST;
1829 li->li_tv.v_lock = 0;
1830
1831 l2 = list_alloc();
1832 li->li_tv.vval.v_list = l2;
1833 if (l2 == NULL)
1834 return;
1835 ++l2->lv_refcount;
1836
1837 li2 = listitem_alloc();
1838 if (li2 == NULL)
1839 return;
1840 list_append(l2, li2);
1841 li2->li_tv.v_type = VAR_STRING;
1842 li2->li_tv.v_lock = 0;
1843
1844 buf[0] = dp->char1;
1845 buf[1] = dp->char2;
1846 buf[2] = NUL;
1847 li2->li_tv.vval.v_string = vim_strsave(&buf[0]);
1848
1849 li2 = listitem_alloc();
1850 if (li2 == NULL)
1851 return;
1852 list_append(l2, li2);
1853 li2->li_tv.v_type = VAR_STRING;
1854 li2->li_tv.v_lock = 0;
1855
1856 p = buf;
1857 if (has_mbyte)
1858 p += (*mb_char2bytes)(dp->result, p);
1859 else
1860 *p++ = (char_u)dp->result;
1861 *p = NUL;
1862
1863 li2->li_tv.vval.v_string = vim_strsave(buf);
1864}
1865
Yegappan Lakshmanan8ee52af2021-08-09 19:59:06 +02001866 static void
h-east29b85712021-07-26 21:54:04 +02001867digraph_getlist_common(int list_all, typval_T *rettv)
mityu61065042021-07-19 20:07:21 +02001868{
1869 int i;
1870 digr_T *dp;
1871
1872 if (rettv_list_alloc(rettv) == FAIL)
1873 return;
1874
1875 if (list_all)
1876 {
1877 dp = digraphdefault;
dundargocb2209f22022-09-24 15:55:27 +01001878 while (dp->char1 != NUL && !got_int)
mityu61065042021-07-19 20:07:21 +02001879 {
1880#ifdef USE_UNICODE_DIGRAPHS
1881 digr_T tmp;
1882
1883 tmp.char1 = dp->char1;
1884 tmp.char2 = dp->char2;
1885 tmp.result = getexactdigraph(tmp.char1, tmp.char2, FALSE);
1886 if (tmp.result != 0 && tmp.result != tmp.char2
1887 && (has_mbyte || tmp.result <= 255))
h-east29b85712021-07-26 21:54:04 +02001888 digraph_getlist_appendpair(&tmp, rettv->vval.v_list);
mityu61065042021-07-19 20:07:21 +02001889#else
1890 if (getexactdigraph(dp->char1, dp->char2, FALSE) == dp->result
1891 && (has_mbyte || dp->result <= 255))
h-east29b85712021-07-26 21:54:04 +02001892 digraph_getlist_appendpair(dp, rettv->vval.v_list);
mityu61065042021-07-19 20:07:21 +02001893#endif
1894 ++dp;
1895 }
1896 }
1897
1898 dp = (digr_T *)user_digraphs.ga_data;
1899 for (i = 0; i < user_digraphs.ga_len && !got_int; ++i)
1900 {
h-east29b85712021-07-26 21:54:04 +02001901 digraph_getlist_appendpair(dp, rettv->vval.v_list);
mityu61065042021-07-19 20:07:21 +02001902 ++dp;
1903 }
1904}
1905
Bram Moolenaar5843f5f2019-08-20 20:13:45 +02001906static struct dg_header_entry {
Bram Moolenaareae8ae12018-12-14 18:53:02 +01001907 int dg_start;
1908 char *dg_header;
1909} header_table[] = {
1910 {DG_START_LATIN, N_("Latin supplement")},
1911 {DG_START_GREEK, N_("Greek and Coptic")},
1912 {DG_START_CYRILLIC, N_("Cyrillic")},
1913 {DG_START_HEBREW, N_("Hebrew")},
1914 {DG_START_ARABIC, N_("Arabic")},
1915 {DG_START_LATIN_EXTENDED, N_("Latin extended")},
1916 {DG_START_GREEK_EXTENDED, N_("Greek extended")},
1917 {DG_START_PUNCTUATION, N_("Punctuation")},
1918 {DG_START_SUB_SUPER, N_("Super- and subscripts")},
1919 {DG_START_CURRENCY, N_("Currency")},
1920 {DG_START_OTHER1, N_("Other")},
1921 {DG_START_ROMAN, N_("Roman numbers")},
1922 {DG_START_ARROWS, N_("Arrows")},
1923 {DG_START_MATH, N_("Mathematical operators")},
1924 {DG_START_TECHNICAL, N_("Technical")},
1925 {DG_START_OTHER2, N_("Other")},
1926 {DG_START_DRAWING, N_("Box drawing")},
1927 {DG_START_BLOCK, N_("Block elements")},
1928 {DG_START_SHAPES, N_("Geometric shapes")},
1929 {DG_START_SYMBOLS, N_("Symbols")},
1930 {DG_START_DINGBATS, N_("Dingbats")},
1931 {DG_START_CJK_SYMBOLS, N_("CJK symbols and punctuation")},
1932 {DG_START_HIRAGANA, N_("Hiragana")},
1933 {DG_START_KATAKANA, N_("Katakana")},
1934 {DG_START_BOPOMOFO, N_("Bopomofo")},
1935 {DG_START_OTHER3, N_("Other")},
1936 {0xfffffff, NULL},
1937};
1938
Bram Moolenaar071d4272004-06-13 20:20:40 +00001939 static void
Bram Moolenaareae8ae12018-12-14 18:53:02 +01001940printdigraph(digr_T *dp, result_T *previous)
Bram Moolenaar071d4272004-06-13 20:20:40 +00001941{
1942 char_u buf[30];
1943 char_u *p;
1944
1945 int list_width;
1946
Bram Moolenaar13505972019-01-24 15:04:48 +01001947 if ((dy_flags & DY_UHEX) || has_mbyte)
Bram Moolenaar071d4272004-06-13 20:20:40 +00001948 list_width = 13;
1949 else
1950 list_width = 11;
1951
Yegappan Lakshmanan465de3a2022-12-26 12:50:04 +00001952 if (dp->result == 0)
1953 return;
1954
Bram Moolenaareae8ae12018-12-14 18:53:02 +01001955#if defined(USE_UNICODE_DIGRAPHS)
Yegappan Lakshmanan465de3a2022-12-26 12:50:04 +00001956 if (previous != NULL)
1957 {
1958 int i;
Bram Moolenaareae8ae12018-12-14 18:53:02 +01001959
Yegappan Lakshmanan465de3a2022-12-26 12:50:04 +00001960 for (i = 0; header_table[i].dg_header != NULL; ++i)
1961 if (*previous < header_table[i].dg_start
1962 && dp->result >= header_table[i].dg_start
1963 && dp->result < header_table[i + 1].dg_start)
1964 {
1965 digraph_header(_(header_table[i].dg_header));
1966 break;
1967 }
1968 *previous = dp->result;
Bram Moolenaar071d4272004-06-13 20:20:40 +00001969 }
Yegappan Lakshmanan465de3a2022-12-26 12:50:04 +00001970#endif
1971 if (msg_col > Columns - list_width)
1972 msg_putchar('\n');
1973 if (msg_col)
1974 while (msg_col % list_width != 0)
1975 msg_putchar(' ');
1976
1977 p = buf;
1978 *p++ = dp->char1;
1979 *p++ = dp->char2;
1980 *p++ = ' ';
1981 *p = NUL;
1982 msg_outtrans(buf);
1983 p = buf;
1984 if (has_mbyte)
1985 {
1986 // add a space to draw a composing char on
1987 if (enc_utf8 && utf_iscomposing(dp->result))
1988 *p++ = ' ';
1989 p += (*mb_char2bytes)(dp->result, p);
1990 }
1991 else
1992 *p++ = (char_u)dp->result;
1993 *p = NUL;
1994 msg_outtrans_attr(buf, HL_ATTR(HLF_8));
1995 p = buf;
1996 if (char2cells(dp->result) == 1)
1997 *p++ = ' ';
1998 vim_snprintf((char *)p, sizeof(buf) - (p - buf), " %3d", dp->result);
1999 msg_outtrans(buf);
Bram Moolenaar071d4272004-06-13 20:20:40 +00002000}
2001
mityu61065042021-07-19 20:07:21 +02002002# ifdef FEAT_EVAL
2003/*
2004 * Get the two digraph characters from a typval.
2005 * Return OK or FAIL.
2006 */
2007 static int
2008get_digraph_chars(typval_T *arg, int *char1, int *char2)
2009{
2010 char_u buf_chars[NUMBUFLEN];
2011 char_u *chars = tv_get_string_buf_chk(arg, buf_chars);
2012 char_u *p = chars;
2013
2014 if (p != NULL)
2015 {
2016 if (*p != NUL)
2017 {
2018 *char1 = mb_cptr2char_adv(&p);
2019 if (*p != NUL)
2020 {
2021 *char2 = mb_cptr2char_adv(&p);
2022 if (*p == NUL)
2023 {
2024 if (check_digraph_chars_valid(*char1, *char2))
2025 return OK;
2026 return FAIL;
2027 }
2028 }
2029 }
2030 }
2031 semsg(_(e_digraph_must_be_just_two_characters_str), chars);
2032 return FAIL;
2033}
2034
2035 static int
h-east29b85712021-07-26 21:54:04 +02002036digraph_set_common(typval_T *argchars, typval_T *argdigraph)
mityu61065042021-07-19 20:07:21 +02002037{
2038 int char1, char2;
2039 char_u *digraph;
2040 char_u *p;
2041 char_u buf_digraph[NUMBUFLEN];
2042 varnumber_T n;
2043
2044 if (get_digraph_chars(argchars, &char1, &char2) == FAIL)
2045 return FALSE;
2046
2047 digraph = tv_get_string_buf_chk(argdigraph, buf_digraph);
2048 if (digraph == NULL)
2049 return FALSE;
2050 p = digraph;
2051 n = mb_cptr2char_adv(&p);
2052 if (*p != NUL)
2053 {
2054 semsg(_(e_digraph_argument_must_be_one_character_str), digraph);
2055 return FALSE;
2056 }
2057
2058 registerdigraph(char1, char2, (int)n);
2059 return TRUE;
2060}
2061# endif
2062
Bram Moolenaar5d18efe2019-12-01 21:11:22 +01002063#endif // FEAT_DIGRAPHS
Bram Moolenaar071d4272004-06-13 20:20:40 +00002064
mityu61065042021-07-19 20:07:21 +02002065#if defined(FEAT_EVAL) || defined(PROTO)
2066/*
h-east29b85712021-07-26 21:54:04 +02002067 * "digraph_get()" function
mityu61065042021-07-19 20:07:21 +02002068 */
2069 void
h-east29b85712021-07-26 21:54:04 +02002070f_digraph_get(typval_T *argvars, typval_T *rettv)
mityu61065042021-07-19 20:07:21 +02002071{
2072# ifdef FEAT_DIGRAPHS
2073 int code;
2074 char_u buf[NUMBUFLEN];
2075 char_u *digraphs;
2076
2077 rettv->v_type = VAR_STRING;
2078 rettv->vval.v_string = NULL; // Return empty string for failure
Yegappan Lakshmanan4490ec42021-07-27 22:00:44 +02002079
2080 if (in_vim9script() && check_for_string_arg(argvars, 0) == FAIL)
2081 return;
2082
mityu61065042021-07-19 20:07:21 +02002083 digraphs = tv_get_string_chk(&argvars[0]);
2084
2085 if (digraphs == NULL)
2086 return;
2087 else if (STRLEN(digraphs) != 2)
2088 {
2089 semsg(_(e_digraph_must_be_just_two_characters_str), digraphs);
2090 return;
2091 }
h-east29b85712021-07-26 21:54:04 +02002092 code = digraph_get(digraphs[0], digraphs[1], FALSE);
mityu61065042021-07-19 20:07:21 +02002093
2094 if (has_mbyte)
2095 buf[(*mb_char2bytes)(code, buf)] = NUL;
Bram Moolenaarebfec1c2023-01-22 21:14:53 +00002096 else
2097 {
mityu61065042021-07-19 20:07:21 +02002098 buf[0] = code;
2099 buf[1] = NUL;
2100 }
2101
2102 rettv->vval.v_string = vim_strsave(buf);
2103# else
2104 emsg(_(e_no_digraphs_version));
2105# endif
2106}
2107
2108/*
h-east29b85712021-07-26 21:54:04 +02002109 * "digraph_getlist()" function
mityu61065042021-07-19 20:07:21 +02002110 */
2111 void
h-east29b85712021-07-26 21:54:04 +02002112f_digraph_getlist(typval_T *argvars, typval_T *rettv)
mityu61065042021-07-19 20:07:21 +02002113{
2114# ifdef FEAT_DIGRAPHS
2115 int flag_list_all;
2116
Yegappan Lakshmananfc3b7752021-09-08 14:57:42 +02002117 if (in_vim9script() && check_for_opt_bool_arg(argvars, 0) == FAIL)
Yegappan Lakshmanan4490ec42021-07-27 22:00:44 +02002118 return;
2119
mityu61065042021-07-19 20:07:21 +02002120 if (argvars[0].v_type == VAR_UNKNOWN)
2121 flag_list_all = FALSE;
2122 else
2123 {
Bram Moolenaar6ed545e2022-05-09 20:09:23 +01002124 int error = FALSE;
mityu61065042021-07-19 20:07:21 +02002125 varnumber_T flag = tv_get_number_chk(&argvars[0], &error);
Bram Moolenaar6ed545e2022-05-09 20:09:23 +01002126
mityu61065042021-07-19 20:07:21 +02002127 if (error)
2128 return;
2129 flag_list_all = flag ? TRUE : FALSE;
2130 }
2131
h-east29b85712021-07-26 21:54:04 +02002132 digraph_getlist_common(flag_list_all, rettv);
mityu61065042021-07-19 20:07:21 +02002133# else
2134 emsg(_(e_no_digraphs_version));
2135# endif
2136}
2137
2138/*
h-east29b85712021-07-26 21:54:04 +02002139 * "digraph_set()" function
mityu61065042021-07-19 20:07:21 +02002140 */
2141 void
h-east29b85712021-07-26 21:54:04 +02002142f_digraph_set(typval_T *argvars, typval_T *rettv)
mityu61065042021-07-19 20:07:21 +02002143{
2144# ifdef FEAT_DIGRAPHS
2145 rettv->v_type = VAR_BOOL;
2146 rettv->vval.v_number = VVAL_FALSE;
2147
Yegappan Lakshmanan4490ec42021-07-27 22:00:44 +02002148 if (in_vim9script()
2149 && (check_for_string_arg(argvars, 0) == FAIL
Yegappan Lakshmananfc3b7752021-09-08 14:57:42 +02002150 || check_for_string_arg(argvars, 1) == FAIL))
Yegappan Lakshmanan4490ec42021-07-27 22:00:44 +02002151 return;
2152
h-east29b85712021-07-26 21:54:04 +02002153 if (!digraph_set_common(&argvars[0], &argvars[1]))
mityu61065042021-07-19 20:07:21 +02002154 return;
2155
2156 rettv->vval.v_number = VVAL_TRUE;
2157# else
2158 emsg(_(e_no_digraphs_version));
2159# endif
2160}
2161
2162/*
h-east29b85712021-07-26 21:54:04 +02002163 * "digraph_setlist()" function
mityu61065042021-07-19 20:07:21 +02002164 */
2165 void
h-east29b85712021-07-26 21:54:04 +02002166f_digraph_setlist(typval_T * argvars, typval_T *rettv)
mityu61065042021-07-19 20:07:21 +02002167{
2168# ifdef FEAT_DIGRAPHS
2169 list_T *pl, *l;
2170 listitem_T *pli;
2171
2172 rettv->v_type = VAR_BOOL;
2173 rettv->vval.v_number = VVAL_FALSE;
2174
2175 if (argvars[0].v_type != VAR_LIST)
2176 {
h-east29b85712021-07-26 21:54:04 +02002177 emsg(_(e_digraph_setlist_argument_must_be_list_of_lists_with_two_items));
mityu61065042021-07-19 20:07:21 +02002178 return;
2179 }
2180
2181 pl = argvars[0].vval.v_list;
2182 if (pl == NULL)
2183 {
2184 // Empty list always results in success.
2185 rettv->vval.v_number = VVAL_TRUE;
2186 return;
2187 }
2188
2189 FOR_ALL_LIST_ITEMS(pl, pli)
2190 {
2191 if (pli->li_tv.v_type != VAR_LIST)
2192 {
h-east29b85712021-07-26 21:54:04 +02002193 emsg(_(e_digraph_setlist_argument_must_be_list_of_lists_with_two_items));
mityu61065042021-07-19 20:07:21 +02002194 return;
2195 }
2196
2197 l = pli->li_tv.vval.v_list;
2198 if (l == NULL || l->lv_len != 2)
2199 {
h-east29b85712021-07-26 21:54:04 +02002200 emsg(_(e_digraph_setlist_argument_must_be_list_of_lists_with_two_items));
mityu61065042021-07-19 20:07:21 +02002201 return;
2202 }
2203
h-east29b85712021-07-26 21:54:04 +02002204 if (!digraph_set_common(&l->lv_first->li_tv,
mityu61065042021-07-19 20:07:21 +02002205 &l->lv_first->li_next->li_tv))
2206 return;
2207 }
2208 rettv->vval.v_number = VVAL_TRUE;
2209# else
2210 emsg(_(e_no_digraphs_version));
2211# endif
2212}
2213
2214#endif // FEAT_EVAL
2215
2216
Bram Moolenaar071d4272004-06-13 20:20:40 +00002217#if defined(FEAT_KEYMAP) || defined(PROTO)
2218
Bram Moolenaar5d18efe2019-12-01 21:11:22 +01002219// structure used for b_kmap_ga.ga_data
Bram Moolenaar071d4272004-06-13 20:20:40 +00002220typedef struct
2221{
2222 char_u *from;
2223 char_u *to;
2224} kmap_T;
2225
Bram Moolenaar5d18efe2019-12-01 21:11:22 +01002226#define KMAP_MAXLEN 20 // maximum length of "from" or "to"
Bram Moolenaar071d4272004-06-13 20:20:40 +00002227
Bram Moolenaarf28dbce2016-01-29 22:03:47 +01002228static void keymap_unload(void);
Bram Moolenaar071d4272004-06-13 20:20:40 +00002229
2230/*
Bram Moolenaar0ab2a882009-05-13 10:51:08 +00002231 * Set up key mapping tables for the 'keymap' option.
2232 * Returns NULL if OK, an error message for failure. This only needs to be
2233 * used when setting the option, not later when the value has already been
2234 * checked.
Bram Moolenaar071d4272004-06-13 20:20:40 +00002235 */
Bram Moolenaarf9e3e092019-01-13 23:38:42 +01002236 char *
Bram Moolenaar7454a062016-01-30 15:14:10 +01002237keymap_init(void)
Bram Moolenaar071d4272004-06-13 20:20:40 +00002238{
2239 curbuf->b_kmap_state &= ~KEYMAP_INIT;
2240
2241 if (*curbuf->b_p_keymap == NUL)
2242 {
Bram Moolenaar5d18efe2019-12-01 21:11:22 +01002243 // Stop any active keymap and clear the table. Also remove
2244 // b:keymap_name, as no keymap is active now.
Bram Moolenaar071d4272004-06-13 20:20:40 +00002245 keymap_unload();
Bram Moolenaarbf444172007-07-07 11:58:28 +00002246 do_cmdline_cmd((char_u *)"unlet! b:keymap_name");
Bram Moolenaar071d4272004-06-13 20:20:40 +00002247 }
2248 else
2249 {
2250 char_u *buf;
Bram Moolenaar0ab2a882009-05-13 10:51:08 +00002251 size_t buflen;
Bram Moolenaar071d4272004-06-13 20:20:40 +00002252
Bram Moolenaar5d18efe2019-12-01 21:11:22 +01002253 // Source the keymap file. It will contain a ":loadkeymap" command
2254 // which will call ex_loadkeymap() below.
Bram Moolenaar13505972019-01-24 15:04:48 +01002255 buflen = STRLEN(curbuf->b_p_keymap) + STRLEN(p_enc) + 14;
Bram Moolenaar964b3742019-05-24 18:54:09 +02002256 buf = alloc(buflen);
Bram Moolenaar071d4272004-06-13 20:20:40 +00002257 if (buf == NULL)
Bram Moolenaare29a27f2021-07-20 21:07:36 +02002258 return e_out_of_memory;
Bram Moolenaar071d4272004-06-13 20:20:40 +00002259
Bram Moolenaar5d18efe2019-12-01 21:11:22 +01002260 // try finding "keymap/'keymap'_'encoding'.vim" in 'runtimepath'
Bram Moolenaar0ab2a882009-05-13 10:51:08 +00002261 vim_snprintf((char *)buf, buflen, "keymap/%s_%s.vim",
2262 curbuf->b_p_keymap, p_enc);
Bram Moolenaar7f8989d2016-03-12 22:11:39 +01002263 if (source_runtime(buf, 0) == FAIL)
Bram Moolenaar071d4272004-06-13 20:20:40 +00002264 {
Bram Moolenaar5d18efe2019-12-01 21:11:22 +01002265 // try finding "keymap/'keymap'.vim" in 'runtimepath'
Bram Moolenaar0ab2a882009-05-13 10:51:08 +00002266 vim_snprintf((char *)buf, buflen, "keymap/%s.vim",
2267 curbuf->b_p_keymap);
Bram Moolenaar7f8989d2016-03-12 22:11:39 +01002268 if (source_runtime(buf, 0) == FAIL)
Bram Moolenaar071d4272004-06-13 20:20:40 +00002269 {
2270 vim_free(buf);
Bram Moolenaar1d423ef2022-01-02 21:26:16 +00002271 return N_(e_keymap_file_not_found);
Bram Moolenaar071d4272004-06-13 20:20:40 +00002272 }
2273 }
2274 vim_free(buf);
2275 }
2276
2277 return NULL;
2278}
2279
2280/*
2281 * ":loadkeymap" command: load the following lines as the keymap.
2282 */
2283 void
Bram Moolenaar7454a062016-01-30 15:14:10 +01002284ex_loadkeymap(exarg_T *eap)
Bram Moolenaar071d4272004-06-13 20:20:40 +00002285{
2286 char_u *line;
2287 char_u *p;
2288 char_u *s;
2289 kmap_T *kp;
Bram Moolenaar5d18efe2019-12-01 21:11:22 +01002290#define KMAP_LLEN 200 // max length of "to" and "from" together
Bram Moolenaar071d4272004-06-13 20:20:40 +00002291 char_u buf[KMAP_LLEN + 11];
2292 int i;
2293 char_u *save_cpo = p_cpo;
2294
Yegappan Lakshmanan36a5b682022-03-19 12:56:51 +00002295 if (!sourcing_a_script(eap))
Bram Moolenaar071d4272004-06-13 20:20:40 +00002296 {
Bram Moolenaare1242042021-12-16 20:56:57 +00002297 emsg(_(e_using_loadkeymap_not_in_sourced_file));
Bram Moolenaar071d4272004-06-13 20:20:40 +00002298 return;
2299 }
2300
2301 /*
2302 * Stop any active keymap and clear the table.
2303 */
2304 keymap_unload();
2305
2306 curbuf->b_kmap_state = 0;
Bram Moolenaar04935fb2022-01-08 16:19:22 +00002307 ga_init2(&curbuf->b_kmap_ga, sizeof(kmap_T), 20);
Bram Moolenaar071d4272004-06-13 20:20:40 +00002308
Bram Moolenaar5d18efe2019-12-01 21:11:22 +01002309 // Set 'cpoptions' to "C" to avoid line continuation.
Bram Moolenaar071d4272004-06-13 20:20:40 +00002310 p_cpo = (char_u *)"C";
2311
2312 /*
2313 * Get each line of the sourced file, break at the end.
2314 */
2315 for (;;)
2316 {
Bram Moolenaare96a2492019-06-25 04:12:16 +02002317 line = eap->getline(0, eap->cookie, 0, TRUE);
Bram Moolenaar071d4272004-06-13 20:20:40 +00002318 if (line == NULL)
2319 break;
2320
2321 p = skipwhite(line);
2322 if (*p != '"' && *p != NUL && ga_grow(&curbuf->b_kmap_ga, 1) == OK)
2323 {
2324 kp = (kmap_T *)curbuf->b_kmap_ga.ga_data + curbuf->b_kmap_ga.ga_len;
2325 s = skiptowhite(p);
Bram Moolenaardf44a272020-06-07 20:49:05 +02002326 kp->from = vim_strnsave(p, s - p);
Bram Moolenaar071d4272004-06-13 20:20:40 +00002327 p = skipwhite(s);
2328 s = skiptowhite(p);
Bram Moolenaardf44a272020-06-07 20:49:05 +02002329 kp->to = vim_strnsave(p, s - p);
Bram Moolenaar071d4272004-06-13 20:20:40 +00002330
2331 if (kp->from == NULL || kp->to == NULL
Bram Moolenaar57657d82006-04-21 22:12:41 +00002332 || STRLEN(kp->from) + STRLEN(kp->to) >= KMAP_LLEN
2333 || *kp->from == NUL || *kp->to == NUL)
Bram Moolenaar071d4272004-06-13 20:20:40 +00002334 {
Bram Moolenaar57657d82006-04-21 22:12:41 +00002335 if (kp->to != NULL && *kp->to == NUL)
Bram Moolenaar677658a2022-01-05 16:09:06 +00002336 emsg(_(e_empty_keymap_entry));
Bram Moolenaar071d4272004-06-13 20:20:40 +00002337 vim_free(kp->from);
2338 vim_free(kp->to);
2339 }
2340 else
Bram Moolenaar071d4272004-06-13 20:20:40 +00002341 ++curbuf->b_kmap_ga.ga_len;
Bram Moolenaar071d4272004-06-13 20:20:40 +00002342 }
2343 vim_free(line);
2344 }
2345
2346 /*
2347 * setup ":lnoremap" to map the keys
2348 */
2349 for (i = 0; i < curbuf->b_kmap_ga.ga_len; ++i)
2350 {
Bram Moolenaar555b2802005-05-19 21:08:39 +00002351 vim_snprintf((char *)buf, sizeof(buf), "<buffer> %s %s",
Bram Moolenaar071d4272004-06-13 20:20:40 +00002352 ((kmap_T *)curbuf->b_kmap_ga.ga_data)[i].from,
2353 ((kmap_T *)curbuf->b_kmap_ga.ga_data)[i].to);
zeertzjq44068e92022-06-16 11:14:55 +01002354 (void)do_map(MAPTYPE_NOREMAP, buf, MODE_LANGMAP, FALSE);
Bram Moolenaar071d4272004-06-13 20:20:40 +00002355 }
2356
2357 p_cpo = save_cpo;
2358
2359 curbuf->b_kmap_state |= KEYMAP_LOADED;
Bram Moolenaar071d4272004-06-13 20:20:40 +00002360 status_redraw_curbuf();
Bram Moolenaar071d4272004-06-13 20:20:40 +00002361}
2362
2363/*
2364 * Stop using 'keymap'.
2365 */
2366 static void
Bram Moolenaar7454a062016-01-30 15:14:10 +01002367keymap_unload(void)
Bram Moolenaar071d4272004-06-13 20:20:40 +00002368{
2369 char_u buf[KMAP_MAXLEN + 10];
2370 int i;
2371 char_u *save_cpo = p_cpo;
Bram Moolenaar8c8de832008-06-24 22:58:06 +00002372 kmap_T *kp;
Bram Moolenaar071d4272004-06-13 20:20:40 +00002373
2374 if (!(curbuf->b_kmap_state & KEYMAP_LOADED))
2375 return;
2376
Bram Moolenaar5d18efe2019-12-01 21:11:22 +01002377 // Set 'cpoptions' to "C" to avoid line continuation.
Bram Moolenaar071d4272004-06-13 20:20:40 +00002378 p_cpo = (char_u *)"C";
2379
Bram Moolenaar5d18efe2019-12-01 21:11:22 +01002380 // clear the ":lmap"s
Bram Moolenaar8c8de832008-06-24 22:58:06 +00002381 kp = (kmap_T *)curbuf->b_kmap_ga.ga_data;
Bram Moolenaar071d4272004-06-13 20:20:40 +00002382 for (i = 0; i < curbuf->b_kmap_ga.ga_len; ++i)
2383 {
Bram Moolenaar8c8de832008-06-24 22:58:06 +00002384 vim_snprintf((char *)buf, sizeof(buf), "<buffer> %s", kp[i].from);
zeertzjq44068e92022-06-16 11:14:55 +01002385 (void)do_map(MAPTYPE_UNMAP, buf, MODE_LANGMAP, FALSE);
Bram Moolenaar071d4272004-06-13 20:20:40 +00002386 }
Bram Moolenaar50138322018-01-28 17:05:16 +01002387 keymap_clear(&curbuf->b_kmap_ga);
Bram Moolenaar071d4272004-06-13 20:20:40 +00002388
2389 p_cpo = save_cpo;
2390
2391 ga_clear(&curbuf->b_kmap_ga);
2392 curbuf->b_kmap_state &= ~KEYMAP_LOADED;
Bram Moolenaar071d4272004-06-13 20:20:40 +00002393 status_redraw_curbuf();
Bram Moolenaar071d4272004-06-13 20:20:40 +00002394}
2395
Bram Moolenaar50138322018-01-28 17:05:16 +01002396 void
2397keymap_clear(garray_T *kmap)
2398{
2399 int i;
2400 kmap_T *kp = (kmap_T *)kmap->ga_data;
2401
2402 for (i = 0; i < kmap->ga_len; ++i)
2403 {
2404 vim_free(kp[i].from);
2405 vim_free(kp[i].to);
2406 }
2407}
Bram Moolenaar5d18efe2019-12-01 21:11:22 +01002408#endif // FEAT_KEYMAP