blob: f19e58ec791e7d7136b960025c832273bde9353d [file] [log] [blame]
Bram Moolenaaredf3f972016-08-29 22:49:24 +02001/* vi:set ts=8 sts=4 sw=4 noet:
Bram Moolenaar071d4272004-06-13 20:20:40 +00002 *
3 * VIM - Vi IMproved by Bram Moolenaar
4 *
5 * Do ":help uganda" in Vim to read copying and usage conditions.
6 * Do ":help credits" in Vim to see a list of people who contributed.
7 * See README.txt for an overview of the Vim source code.
8 */
9
10/*
11 * digraph.c: code for digraphs
12 */
13
14#include "vim.h"
15
16#if defined(FEAT_DIGRAPHS) || defined(PROTO)
17
Bram Moolenaar071d4272004-06-13 20:20:40 +000018typedef int result_T;
Bram Moolenaar071d4272004-06-13 20:20:40 +000019
20typedef struct digraph
21{
22 char_u char1;
23 char_u char2;
24 result_T result;
25} digr_T;
26
Bram Moolenaareae8ae12018-12-14 18:53:02 +010027static void printdigraph(digr_T *dp, result_T *previous);
Bram Moolenaar071d4272004-06-13 20:20:40 +000028
Bram Moolenaar5d18efe2019-12-01 21:11:22 +010029// digraphs added by the user
Bram Moolenaar0ab2a882009-05-13 10:51:08 +000030static garray_T user_digraphs = {0, 0, (int)sizeof(digr_T), 10, NULL};
Bram Moolenaar071d4272004-06-13 20:20:40 +000031
32/*
Bram Moolenaare27d6e62022-08-30 15:05:30 +010033 * digraphs for Unicode from RFC1345
34 * (also work for ISO-8859-1 aka latin1)
35 *
Bram Moolenaar071d4272004-06-13 20:20:40 +000036 * Note: Characters marked with XX are not included literally, because some
37 * compilers cannot handle them (Amiga SAS/C is the most picky one).
38 */
Bram Moolenaare27d6e62022-08-30 15:05:30 +010039static digr_T digraphdefault[] = {
Bram Moolenaar5d18efe2019-12-01 21:11:22 +010040 {'N', 'U', 0x0a}, // LF for NUL
Bram Moolenaar071d4272004-06-13 20:20:40 +000041 {'S', 'H', 0x01},
42 {'S', 'X', 0x02},
43 {'E', 'X', 0x03},
44 {'E', 'T', 0x04},
45 {'E', 'Q', 0x05},
46 {'A', 'K', 0x06},
47 {'B', 'L', 0x07},
48 {'B', 'S', 0x08},
49 {'H', 'T', 0x09},
50 {'L', 'F', 0x0a},
51 {'V', 'T', 0x0b},
52 {'F', 'F', 0x0c},
53 {'C', 'R', 0x0d},
54 {'S', 'O', 0x0e},
55 {'S', 'I', 0x0f},
56 {'D', 'L', 0x10},
57 {'D', '1', 0x11},
58 {'D', '2', 0x12},
59 {'D', '3', 0x13},
60 {'D', '4', 0x14},
61 {'N', 'K', 0x15},
62 {'S', 'Y', 0x16},
63 {'E', 'B', 0x17},
64 {'C', 'N', 0x18},
65 {'E', 'M', 0x19},
66 {'S', 'B', 0x1a},
67 {'E', 'C', 0x1b},
68 {'F', 'S', 0x1c},
69 {'G', 'S', 0x1d},
70 {'R', 'S', 0x1e},
71 {'U', 'S', 0x1f},
72 {'S', 'P', 0x20},
73 {'N', 'b', 0x23},
74 {'D', 'O', 0x24},
75 {'A', 't', 0x40},
76 {'<', '(', 0x5b},
77 {'/', '/', 0x5c},
78 {')', '>', 0x5d},
79 {'\'', '>', 0x5e},
80 {'\'', '!', 0x60},
81 {'(', '!', 0x7b},
82 {'!', '!', 0x7c},
83 {'!', ')', 0x7d},
84 {'\'', '?', 0x7e},
85 {'D', 'T', 0x7f},
86 {'P', 'A', 0x80},
87 {'H', 'O', 0x81},
88 {'B', 'H', 0x82},
89 {'N', 'H', 0x83},
90 {'I', 'N', 0x84},
91 {'N', 'L', 0x85},
92 {'S', 'A', 0x86},
93 {'E', 'S', 0x87},
94 {'H', 'S', 0x88},
95 {'H', 'J', 0x89},
96 {'V', 'S', 0x8a},
97 {'P', 'D', 0x8b},
98 {'P', 'U', 0x8c},
99 {'R', 'I', 0x8d},
100 {'S', '2', 0x8e},
101 {'S', '3', 0x8f},
102 {'D', 'C', 0x90},
103 {'P', '1', 0x91},
104 {'P', '2', 0x92},
105 {'T', 'S', 0x93},
106 {'C', 'C', 0x94},
107 {'M', 'W', 0x95},
108 {'S', 'G', 0x96},
109 {'E', 'G', 0x97},
110 {'S', 'S', 0x98},
111 {'G', 'C', 0x99},
112 {'S', 'C', 0x9a},
113 {'C', 'I', 0x9b},
114 {'S', 'T', 0x9c},
115 {'O', 'C', 0x9d},
116 {'P', 'M', 0x9e},
117 {'A', 'C', 0x9f},
118 {'N', 'S', 0xa0},
Bram Moolenaare3f915d2020-07-14 23:02:44 +0200119# define DG_START_LATIN 0xa1
Bram Moolenaar071d4272004-06-13 20:20:40 +0000120 {'!', 'I', 0xa1},
Bram Moolenaar41193092019-08-24 21:53:31 +0200121 {'~', '!', 0xa1}, // ¡ Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000122 {'C', 't', 0xa2},
Bram Moolenaar41193092019-08-24 21:53:31 +0200123 {'c', '|', 0xa2}, // ¢ Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000124 {'P', 'd', 0xa3},
Bram Moolenaar41193092019-08-24 21:53:31 +0200125 {'$', '$', 0xa3}, // £ Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000126 {'C', 'u', 0xa4},
Bram Moolenaar41193092019-08-24 21:53:31 +0200127 {'o', 'x', 0xa4}, // ¤ Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000128 {'Y', 'e', 0xa5},
Bram Moolenaar41193092019-08-24 21:53:31 +0200129 {'Y', '-', 0xa5}, // ¥ Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000130 {'B', 'B', 0xa6},
Bram Moolenaar41193092019-08-24 21:53:31 +0200131 {'|', '|', 0xa6}, // ¦ Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000132 {'S', 'E', 0xa7},
133 {'\'', ':', 0xa8},
134 {'C', 'o', 0xa9},
Bram Moolenaar41193092019-08-24 21:53:31 +0200135 {'c', 'O', 0xa9}, // © Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000136 {'-', 'a', 0xaa},
137 {'<', '<', 0xab},
138 {'N', 'O', 0xac},
Bram Moolenaar41193092019-08-24 21:53:31 +0200139 {'-', ',', 0xac}, // ¬ Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000140 {'-', '-', 0xad},
141 {'R', 'g', 0xae},
142 {'\'', 'm', 0xaf},
Bram Moolenaar41193092019-08-24 21:53:31 +0200143 {'-', '=', 0xaf}, // ¯ Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000144 {'D', 'G', 0xb0},
Bram Moolenaar41193092019-08-24 21:53:31 +0200145 {'~', 'o', 0xb0}, // ° Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000146 {'+', '-', 0xb1},
147 {'2', 'S', 0xb2},
Bram Moolenaar41193092019-08-24 21:53:31 +0200148 {'2', '2', 0xb2}, // ² Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000149 {'3', 'S', 0xb3},
Bram Moolenaar41193092019-08-24 21:53:31 +0200150 {'3', '3', 0xb3}, // ³ Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000151 {'\'', '\'', 0xb4},
152 {'M', 'y', 0xb5},
153 {'P', 'I', 0xb6},
Bram Moolenaar41193092019-08-24 21:53:31 +0200154 {'p', 'p', 0xb6}, // ¶ Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000155 {'.', 'M', 0xb7},
Bram Moolenaar41193092019-08-24 21:53:31 +0200156 {'~', '.', 0xb7}, // · Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000157 {'\'', ',', 0xb8},
158 {'1', 'S', 0xb9},
Bram Moolenaar41193092019-08-24 21:53:31 +0200159 {'1', '1', 0xb9}, // ¹ Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000160 {'-', 'o', 0xba},
161 {'>', '>', 0xbb},
162 {'1', '4', 0xbc},
163 {'1', '2', 0xbd},
164 {'3', '4', 0xbe},
165 {'?', 'I', 0xbf},
Bram Moolenaar41193092019-08-24 21:53:31 +0200166 {'~', '?', 0xbf}, // ¿ Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000167 {'A', '!', 0xc0},
Bram Moolenaar41193092019-08-24 21:53:31 +0200168 {'A', '`', 0xc0}, // À Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000169 {'A', '\'', 0xc1},
170 {'A', '>', 0xc2},
Bram Moolenaar41193092019-08-24 21:53:31 +0200171 {'A', '^', 0xc2}, // Â Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000172 {'A', '?', 0xc3},
Bram Moolenaar41193092019-08-24 21:53:31 +0200173 {'A', '~', 0xc3}, // Ã Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000174 {'A', ':', 0xc4},
Bram Moolenaar41193092019-08-24 21:53:31 +0200175 {'A', '"', 0xc4}, // Ä Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000176 {'A', 'A', 0xc5},
Bram Moolenaar41193092019-08-24 21:53:31 +0200177 {'A', '@', 0xc5}, // Å Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000178 {'A', 'E', 0xc6},
179 {'C', ',', 0xc7},
180 {'E', '!', 0xc8},
Bram Moolenaar41193092019-08-24 21:53:31 +0200181 {'E', '`', 0xc8}, // È Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000182 {'E', '\'', 0xc9},
183 {'E', '>', 0xca},
Bram Moolenaar41193092019-08-24 21:53:31 +0200184 {'E', '^', 0xca}, // Ê Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000185 {'E', ':', 0xcb},
Bram Moolenaar41193092019-08-24 21:53:31 +0200186 {'E', '"', 0xcb}, // Ë Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000187 {'I', '!', 0xcc},
Bram Moolenaar41193092019-08-24 21:53:31 +0200188 {'I', '`', 0xcc}, // Ì Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000189 {'I', '\'', 0xcd},
190 {'I', '>', 0xce},
Bram Moolenaar41193092019-08-24 21:53:31 +0200191 {'I', '^', 0xce}, // Î Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000192 {'I', ':', 0xcf},
Bram Moolenaar41193092019-08-24 21:53:31 +0200193 {'I', '"', 0xcf}, // Ï Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000194 {'D', '-', 0xd0},
195 {'N', '?', 0xd1},
Bram Moolenaar41193092019-08-24 21:53:31 +0200196 {'N', '~', 0xd1}, // Ñ Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000197 {'O', '!', 0xd2},
Bram Moolenaar41193092019-08-24 21:53:31 +0200198 {'O', '`', 0xd2}, // Ò Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000199 {'O', '\'', 0xd3},
200 {'O', '>', 0xd4},
Bram Moolenaar41193092019-08-24 21:53:31 +0200201 {'O', '^', 0xd4}, // Ô Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000202 {'O', '?', 0xd5},
Bram Moolenaar41193092019-08-24 21:53:31 +0200203 {'O', '~', 0xd5}, // Õ Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000204 {'O', ':', 0xd6},
205 {'*', 'X', 0xd7},
Bram Moolenaar41193092019-08-24 21:53:31 +0200206 {'/', '\\', 0xd7}, // × Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000207 {'O', '/', 0xd8},
208 {'U', '!', 0xd9},
Bram Moolenaar41193092019-08-24 21:53:31 +0200209 {'U', '`', 0xd9}, // Ù Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000210 {'U', '\'', 0xda},
211 {'U', '>', 0xdb},
Bram Moolenaar41193092019-08-24 21:53:31 +0200212 {'U', '^', 0xdb}, // Û Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000213 {'U', ':', 0xdc},
214 {'Y', '\'', 0xdd},
215 {'T', 'H', 0xde},
Bram Moolenaar41193092019-08-24 21:53:31 +0200216 {'I', 'p', 0xde}, // Þ Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000217 {'s', 's', 0xdf},
218 {'a', '!', 0xe0},
Bram Moolenaar41193092019-08-24 21:53:31 +0200219 {'a', '`', 0xe0}, // à Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000220 {'a', '\'', 0xe1},
221 {'a', '>', 0xe2},
Bram Moolenaar41193092019-08-24 21:53:31 +0200222 {'a', '^', 0xe2}, // â Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000223 {'a', '?', 0xe3},
Bram Moolenaar41193092019-08-24 21:53:31 +0200224 {'a', '~', 0xe3}, // ã Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000225 {'a', ':', 0xe4},
Bram Moolenaar41193092019-08-24 21:53:31 +0200226 {'a', '"', 0xe4}, // ä Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000227 {'a', 'a', 0xe5},
Bram Moolenaar41193092019-08-24 21:53:31 +0200228 {'a', '@', 0xe5}, // å Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000229 {'a', 'e', 0xe6},
230 {'c', ',', 0xe7},
231 {'e', '!', 0xe8},
Bram Moolenaar41193092019-08-24 21:53:31 +0200232 {'e', '`', 0xe8}, // è Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000233 {'e', '\'', 0xe9},
234 {'e', '>', 0xea},
Bram Moolenaar41193092019-08-24 21:53:31 +0200235 {'e', '^', 0xea}, // ê Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000236 {'e', ':', 0xeb},
Bram Moolenaar41193092019-08-24 21:53:31 +0200237 {'e', '"', 0xeb}, // ë Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000238 {'i', '!', 0xec},
Bram Moolenaar41193092019-08-24 21:53:31 +0200239 {'i', '`', 0xec}, // ì Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000240 {'i', '\'', 0xed},
241 {'i', '>', 0xee},
Bram Moolenaar41193092019-08-24 21:53:31 +0200242 {'i', '^', 0xee}, // î Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000243 {'i', ':', 0xef},
244 {'d', '-', 0xf0},
245 {'n', '?', 0xf1},
Bram Moolenaar41193092019-08-24 21:53:31 +0200246 {'n', '~', 0xf1}, // ñ Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000247 {'o', '!', 0xf2},
Bram Moolenaar41193092019-08-24 21:53:31 +0200248 {'o', '`', 0xf2}, // ò Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000249 {'o', '\'', 0xf3},
250 {'o', '>', 0xf4},
Bram Moolenaar41193092019-08-24 21:53:31 +0200251 {'o', '^', 0xf4}, // ô Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000252 {'o', '?', 0xf5},
Bram Moolenaar41193092019-08-24 21:53:31 +0200253 {'o', '~', 0xf5}, // õ Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000254 {'o', ':', 0xf6},
255 {'-', ':', 0xf7},
256 {'o', '/', 0xf8},
257 {'u', '!', 0xf9},
Bram Moolenaar41193092019-08-24 21:53:31 +0200258 {'u', '`', 0xf9}, // ù Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000259 {'u', '\'', 0xfa},
260 {'u', '>', 0xfb},
Bram Moolenaar41193092019-08-24 21:53:31 +0200261 {'u', '^', 0xfb}, // û Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000262 {'u', ':', 0xfc},
263 {'y', '\'', 0xfd},
264 {'t', 'h', 0xfe},
265 {'y', ':', 0xff},
Bram Moolenaareae8ae12018-12-14 18:53:02 +0100266 {'y', '"', 0xff}, // x XX Vim 5.x compatible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000267
Bram Moolenaare3f915d2020-07-14 23:02:44 +0200268# define USE_UNICODE_DIGRAPHS
Bram Moolenaar071d4272004-06-13 20:20:40 +0000269
270 {'A', '-', 0x0100},
271 {'a', '-', 0x0101},
272 {'A', '(', 0x0102},
273 {'a', '(', 0x0103},
274 {'A', ';', 0x0104},
275 {'a', ';', 0x0105},
276 {'C', '\'', 0x0106},
277 {'c', '\'', 0x0107},
278 {'C', '>', 0x0108},
279 {'c', '>', 0x0109},
280 {'C', '.', 0x010a},
281 {'c', '.', 0x010b},
282 {'C', '<', 0x010c},
283 {'c', '<', 0x010d},
284 {'D', '<', 0x010e},
285 {'d', '<', 0x010f},
286 {'D', '/', 0x0110},
287 {'d', '/', 0x0111},
288 {'E', '-', 0x0112},
289 {'e', '-', 0x0113},
290 {'E', '(', 0x0114},
291 {'e', '(', 0x0115},
292 {'E', '.', 0x0116},
293 {'e', '.', 0x0117},
294 {'E', ';', 0x0118},
295 {'e', ';', 0x0119},
296 {'E', '<', 0x011a},
297 {'e', '<', 0x011b},
298 {'G', '>', 0x011c},
299 {'g', '>', 0x011d},
300 {'G', '(', 0x011e},
301 {'g', '(', 0x011f},
302 {'G', '.', 0x0120},
303 {'g', '.', 0x0121},
304 {'G', ',', 0x0122},
305 {'g', ',', 0x0123},
306 {'H', '>', 0x0124},
307 {'h', '>', 0x0125},
308 {'H', '/', 0x0126},
309 {'h', '/', 0x0127},
310 {'I', '?', 0x0128},
311 {'i', '?', 0x0129},
312 {'I', '-', 0x012a},
313 {'i', '-', 0x012b},
314 {'I', '(', 0x012c},
315 {'i', '(', 0x012d},
316 {'I', ';', 0x012e},
317 {'i', ';', 0x012f},
318 {'I', '.', 0x0130},
319 {'i', '.', 0x0131},
320 {'I', 'J', 0x0132},
321 {'i', 'j', 0x0133},
322 {'J', '>', 0x0134},
323 {'j', '>', 0x0135},
324 {'K', ',', 0x0136},
325 {'k', ',', 0x0137},
326 {'k', 'k', 0x0138},
327 {'L', '\'', 0x0139},
328 {'l', '\'', 0x013a},
329 {'L', ',', 0x013b},
330 {'l', ',', 0x013c},
331 {'L', '<', 0x013d},
332 {'l', '<', 0x013e},
333 {'L', '.', 0x013f},
334 {'l', '.', 0x0140},
335 {'L', '/', 0x0141},
336 {'l', '/', 0x0142},
337 {'N', '\'', 0x0143},
338 {'n', '\'', 0x0144},
339 {'N', ',', 0x0145},
340 {'n', ',', 0x0146},
341 {'N', '<', 0x0147},
342 {'n', '<', 0x0148},
343 {'\'', 'n', 0x0149},
344 {'N', 'G', 0x014a},
345 {'n', 'g', 0x014b},
346 {'O', '-', 0x014c},
347 {'o', '-', 0x014d},
348 {'O', '(', 0x014e},
349 {'o', '(', 0x014f},
350 {'O', '"', 0x0150},
351 {'o', '"', 0x0151},
352 {'O', 'E', 0x0152},
353 {'o', 'e', 0x0153},
354 {'R', '\'', 0x0154},
355 {'r', '\'', 0x0155},
356 {'R', ',', 0x0156},
357 {'r', ',', 0x0157},
358 {'R', '<', 0x0158},
359 {'r', '<', 0x0159},
360 {'S', '\'', 0x015a},
361 {'s', '\'', 0x015b},
362 {'S', '>', 0x015c},
363 {'s', '>', 0x015d},
364 {'S', ',', 0x015e},
365 {'s', ',', 0x015f},
366 {'S', '<', 0x0160},
367 {'s', '<', 0x0161},
368 {'T', ',', 0x0162},
369 {'t', ',', 0x0163},
370 {'T', '<', 0x0164},
371 {'t', '<', 0x0165},
372 {'T', '/', 0x0166},
373 {'t', '/', 0x0167},
374 {'U', '?', 0x0168},
375 {'u', '?', 0x0169},
376 {'U', '-', 0x016a},
377 {'u', '-', 0x016b},
378 {'U', '(', 0x016c},
379 {'u', '(', 0x016d},
380 {'U', '0', 0x016e},
381 {'u', '0', 0x016f},
382 {'U', '"', 0x0170},
383 {'u', '"', 0x0171},
384 {'U', ';', 0x0172},
385 {'u', ';', 0x0173},
386 {'W', '>', 0x0174},
387 {'w', '>', 0x0175},
388 {'Y', '>', 0x0176},
389 {'y', '>', 0x0177},
390 {'Y', ':', 0x0178},
391 {'Z', '\'', 0x0179},
392 {'z', '\'', 0x017a},
393 {'Z', '.', 0x017b},
394 {'z', '.', 0x017c},
395 {'Z', '<', 0x017d},
396 {'z', '<', 0x017e},
397 {'O', '9', 0x01a0},
398 {'o', '9', 0x01a1},
399 {'O', 'I', 0x01a2},
400 {'o', 'i', 0x01a3},
401 {'y', 'r', 0x01a6},
402 {'U', '9', 0x01af},
403 {'u', '9', 0x01b0},
404 {'Z', '/', 0x01b5},
405 {'z', '/', 0x01b6},
406 {'E', 'D', 0x01b7},
407 {'A', '<', 0x01cd},
408 {'a', '<', 0x01ce},
409 {'I', '<', 0x01cf},
410 {'i', '<', 0x01d0},
411 {'O', '<', 0x01d1},
412 {'o', '<', 0x01d2},
413 {'U', '<', 0x01d3},
414 {'u', '<', 0x01d4},
415 {'A', '1', 0x01de},
416 {'a', '1', 0x01df},
417 {'A', '7', 0x01e0},
418 {'a', '7', 0x01e1},
419 {'A', '3', 0x01e2},
420 {'a', '3', 0x01e3},
421 {'G', '/', 0x01e4},
422 {'g', '/', 0x01e5},
423 {'G', '<', 0x01e6},
424 {'g', '<', 0x01e7},
425 {'K', '<', 0x01e8},
426 {'k', '<', 0x01e9},
427 {'O', ';', 0x01ea},
428 {'o', ';', 0x01eb},
429 {'O', '1', 0x01ec},
430 {'o', '1', 0x01ed},
431 {'E', 'Z', 0x01ee},
432 {'e', 'z', 0x01ef},
433 {'j', '<', 0x01f0},
434 {'G', '\'', 0x01f4},
435 {'g', '\'', 0x01f5},
436 {';', 'S', 0x02bf},
437 {'\'', '<', 0x02c7},
438 {'\'', '(', 0x02d8},
439 {'\'', '.', 0x02d9},
440 {'\'', '0', 0x02da},
441 {'\'', ';', 0x02db},
442 {'\'', '"', 0x02dd},
Bram Moolenaare3f915d2020-07-14 23:02:44 +0200443# define DG_START_GREEK 0x0386
Bram Moolenaar071d4272004-06-13 20:20:40 +0000444 {'A', '%', 0x0386},
445 {'E', '%', 0x0388},
446 {'Y', '%', 0x0389},
447 {'I', '%', 0x038a},
448 {'O', '%', 0x038c},
449 {'U', '%', 0x038e},
450 {'W', '%', 0x038f},
451 {'i', '3', 0x0390},
452 {'A', '*', 0x0391},
453 {'B', '*', 0x0392},
454 {'G', '*', 0x0393},
455 {'D', '*', 0x0394},
456 {'E', '*', 0x0395},
457 {'Z', '*', 0x0396},
458 {'Y', '*', 0x0397},
459 {'H', '*', 0x0398},
460 {'I', '*', 0x0399},
461 {'K', '*', 0x039a},
462 {'L', '*', 0x039b},
463 {'M', '*', 0x039c},
464 {'N', '*', 0x039d},
465 {'C', '*', 0x039e},
466 {'O', '*', 0x039f},
467 {'P', '*', 0x03a0},
468 {'R', '*', 0x03a1},
469 {'S', '*', 0x03a3},
470 {'T', '*', 0x03a4},
471 {'U', '*', 0x03a5},
472 {'F', '*', 0x03a6},
473 {'X', '*', 0x03a7},
474 {'Q', '*', 0x03a8},
475 {'W', '*', 0x03a9},
476 {'J', '*', 0x03aa},
477 {'V', '*', 0x03ab},
478 {'a', '%', 0x03ac},
479 {'e', '%', 0x03ad},
480 {'y', '%', 0x03ae},
481 {'i', '%', 0x03af},
482 {'u', '3', 0x03b0},
483 {'a', '*', 0x03b1},
484 {'b', '*', 0x03b2},
485 {'g', '*', 0x03b3},
486 {'d', '*', 0x03b4},
487 {'e', '*', 0x03b5},
488 {'z', '*', 0x03b6},
489 {'y', '*', 0x03b7},
490 {'h', '*', 0x03b8},
491 {'i', '*', 0x03b9},
492 {'k', '*', 0x03ba},
493 {'l', '*', 0x03bb},
494 {'m', '*', 0x03bc},
495 {'n', '*', 0x03bd},
496 {'c', '*', 0x03be},
497 {'o', '*', 0x03bf},
498 {'p', '*', 0x03c0},
499 {'r', '*', 0x03c1},
500 {'*', 's', 0x03c2},
501 {'s', '*', 0x03c3},
502 {'t', '*', 0x03c4},
503 {'u', '*', 0x03c5},
504 {'f', '*', 0x03c6},
505 {'x', '*', 0x03c7},
506 {'q', '*', 0x03c8},
507 {'w', '*', 0x03c9},
508 {'j', '*', 0x03ca},
509 {'v', '*', 0x03cb},
510 {'o', '%', 0x03cc},
511 {'u', '%', 0x03cd},
512 {'w', '%', 0x03ce},
513 {'\'', 'G', 0x03d8},
514 {',', 'G', 0x03d9},
515 {'T', '3', 0x03da},
516 {'t', '3', 0x03db},
517 {'M', '3', 0x03dc},
518 {'m', '3', 0x03dd},
519 {'K', '3', 0x03de},
520 {'k', '3', 0x03df},
521 {'P', '3', 0x03e0},
522 {'p', '3', 0x03e1},
523 {'\'', '%', 0x03f4},
524 {'j', '3', 0x03f5},
Bram Moolenaare3f915d2020-07-14 23:02:44 +0200525# define DG_START_CYRILLIC 0x0401
Bram Moolenaar071d4272004-06-13 20:20:40 +0000526 {'I', 'O', 0x0401},
527 {'D', '%', 0x0402},
528 {'G', '%', 0x0403},
529 {'I', 'E', 0x0404},
530 {'D', 'S', 0x0405},
531 {'I', 'I', 0x0406},
532 {'Y', 'I', 0x0407},
533 {'J', '%', 0x0408},
534 {'L', 'J', 0x0409},
535 {'N', 'J', 0x040a},
536 {'T', 's', 0x040b},
537 {'K', 'J', 0x040c},
538 {'V', '%', 0x040e},
539 {'D', 'Z', 0x040f},
540 {'A', '=', 0x0410},
541 {'B', '=', 0x0411},
542 {'V', '=', 0x0412},
543 {'G', '=', 0x0413},
544 {'D', '=', 0x0414},
545 {'E', '=', 0x0415},
546 {'Z', '%', 0x0416},
547 {'Z', '=', 0x0417},
548 {'I', '=', 0x0418},
549 {'J', '=', 0x0419},
550 {'K', '=', 0x041a},
551 {'L', '=', 0x041b},
552 {'M', '=', 0x041c},
553 {'N', '=', 0x041d},
554 {'O', '=', 0x041e},
555 {'P', '=', 0x041f},
556 {'R', '=', 0x0420},
557 {'S', '=', 0x0421},
558 {'T', '=', 0x0422},
559 {'U', '=', 0x0423},
560 {'F', '=', 0x0424},
561 {'H', '=', 0x0425},
562 {'C', '=', 0x0426},
563 {'C', '%', 0x0427},
564 {'S', '%', 0x0428},
565 {'S', 'c', 0x0429},
566 {'=', '"', 0x042a},
567 {'Y', '=', 0x042b},
568 {'%', '"', 0x042c},
569 {'J', 'E', 0x042d},
570 {'J', 'U', 0x042e},
571 {'J', 'A', 0x042f},
572 {'a', '=', 0x0430},
573 {'b', '=', 0x0431},
574 {'v', '=', 0x0432},
575 {'g', '=', 0x0433},
576 {'d', '=', 0x0434},
577 {'e', '=', 0x0435},
578 {'z', '%', 0x0436},
579 {'z', '=', 0x0437},
580 {'i', '=', 0x0438},
581 {'j', '=', 0x0439},
582 {'k', '=', 0x043a},
583 {'l', '=', 0x043b},
584 {'m', '=', 0x043c},
585 {'n', '=', 0x043d},
586 {'o', '=', 0x043e},
587 {'p', '=', 0x043f},
588 {'r', '=', 0x0440},
589 {'s', '=', 0x0441},
590 {'t', '=', 0x0442},
591 {'u', '=', 0x0443},
592 {'f', '=', 0x0444},
593 {'h', '=', 0x0445},
594 {'c', '=', 0x0446},
595 {'c', '%', 0x0447},
596 {'s', '%', 0x0448},
597 {'s', 'c', 0x0449},
598 {'=', '\'', 0x044a},
599 {'y', '=', 0x044b},
600 {'%', '\'', 0x044c},
601 {'j', 'e', 0x044d},
602 {'j', 'u', 0x044e},
603 {'j', 'a', 0x044f},
604 {'i', 'o', 0x0451},
605 {'d', '%', 0x0452},
606 {'g', '%', 0x0453},
607 {'i', 'e', 0x0454},
608 {'d', 's', 0x0455},
609 {'i', 'i', 0x0456},
610 {'y', 'i', 0x0457},
611 {'j', '%', 0x0458},
612 {'l', 'j', 0x0459},
613 {'n', 'j', 0x045a},
614 {'t', 's', 0x045b},
615 {'k', 'j', 0x045c},
616 {'v', '%', 0x045e},
617 {'d', 'z', 0x045f},
618 {'Y', '3', 0x0462},
619 {'y', '3', 0x0463},
620 {'O', '3', 0x046a},
621 {'o', '3', 0x046b},
622 {'F', '3', 0x0472},
623 {'f', '3', 0x0473},
624 {'V', '3', 0x0474},
625 {'v', '3', 0x0475},
626 {'C', '3', 0x0480},
627 {'c', '3', 0x0481},
628 {'G', '3', 0x0490},
629 {'g', '3', 0x0491},
Bram Moolenaare3f915d2020-07-14 23:02:44 +0200630# define DG_START_HEBREW 0x05d0
Bram Moolenaar071d4272004-06-13 20:20:40 +0000631 {'A', '+', 0x05d0},
632 {'B', '+', 0x05d1},
633 {'G', '+', 0x05d2},
634 {'D', '+', 0x05d3},
635 {'H', '+', 0x05d4},
636 {'W', '+', 0x05d5},
637 {'Z', '+', 0x05d6},
638 {'X', '+', 0x05d7},
639 {'T', 'j', 0x05d8},
640 {'J', '+', 0x05d9},
641 {'K', '%', 0x05da},
642 {'K', '+', 0x05db},
643 {'L', '+', 0x05dc},
644 {'M', '%', 0x05dd},
645 {'M', '+', 0x05de},
646 {'N', '%', 0x05df},
647 {'N', '+', 0x05e0},
648 {'S', '+', 0x05e1},
649 {'E', '+', 0x05e2},
650 {'P', '%', 0x05e3},
651 {'P', '+', 0x05e4},
652 {'Z', 'j', 0x05e5},
653 {'Z', 'J', 0x05e6},
654 {'Q', '+', 0x05e7},
655 {'R', '+', 0x05e8},
656 {'S', 'h', 0x05e9},
657 {'T', '+', 0x05ea},
Bram Moolenaare3f915d2020-07-14 23:02:44 +0200658# define DG_START_ARABIC 0x060c
Bram Moolenaar071d4272004-06-13 20:20:40 +0000659 {',', '+', 0x060c},
660 {';', '+', 0x061b},
661 {'?', '+', 0x061f},
662 {'H', '\'', 0x0621},
663 {'a', 'M', 0x0622},
664 {'a', 'H', 0x0623},
665 {'w', 'H', 0x0624},
666 {'a', 'h', 0x0625},
667 {'y', 'H', 0x0626},
668 {'a', '+', 0x0627},
669 {'b', '+', 0x0628},
670 {'t', 'm', 0x0629},
671 {'t', '+', 0x062a},
672 {'t', 'k', 0x062b},
673 {'g', '+', 0x062c},
674 {'h', 'k', 0x062d},
675 {'x', '+', 0x062e},
676 {'d', '+', 0x062f},
677 {'d', 'k', 0x0630},
678 {'r', '+', 0x0631},
679 {'z', '+', 0x0632},
680 {'s', '+', 0x0633},
681 {'s', 'n', 0x0634},
682 {'c', '+', 0x0635},
683 {'d', 'd', 0x0636},
684 {'t', 'j', 0x0637},
685 {'z', 'H', 0x0638},
686 {'e', '+', 0x0639},
687 {'i', '+', 0x063a},
688 {'+', '+', 0x0640},
689 {'f', '+', 0x0641},
690 {'q', '+', 0x0642},
691 {'k', '+', 0x0643},
692 {'l', '+', 0x0644},
693 {'m', '+', 0x0645},
694 {'n', '+', 0x0646},
695 {'h', '+', 0x0647},
696 {'w', '+', 0x0648},
697 {'j', '+', 0x0649},
698 {'y', '+', 0x064a},
699 {':', '+', 0x064b},
700 {'"', '+', 0x064c},
701 {'=', '+', 0x064d},
702 {'/', '+', 0x064e},
703 {'\'', '+', 0x064f},
704 {'1', '+', 0x0650},
705 {'3', '+', 0x0651},
706 {'0', '+', 0x0652},
707 {'a', 'S', 0x0670},
708 {'p', '+', 0x067e},
709 {'v', '+', 0x06a4},
710 {'g', 'f', 0x06af},
711 {'0', 'a', 0x06f0},
712 {'1', 'a', 0x06f1},
713 {'2', 'a', 0x06f2},
714 {'3', 'a', 0x06f3},
715 {'4', 'a', 0x06f4},
716 {'5', 'a', 0x06f5},
717 {'6', 'a', 0x06f6},
718 {'7', 'a', 0x06f7},
719 {'8', 'a', 0x06f8},
720 {'9', 'a', 0x06f9},
Bram Moolenaare3f915d2020-07-14 23:02:44 +0200721# define DG_START_LATIN_EXTENDED 0x1e02
Bram Moolenaar071d4272004-06-13 20:20:40 +0000722 {'B', '.', 0x1e02},
723 {'b', '.', 0x1e03},
724 {'B', '_', 0x1e06},
725 {'b', '_', 0x1e07},
726 {'D', '.', 0x1e0a},
727 {'d', '.', 0x1e0b},
728 {'D', '_', 0x1e0e},
729 {'d', '_', 0x1e0f},
730 {'D', ',', 0x1e10},
731 {'d', ',', 0x1e11},
732 {'F', '.', 0x1e1e},
733 {'f', '.', 0x1e1f},
734 {'G', '-', 0x1e20},
735 {'g', '-', 0x1e21},
736 {'H', '.', 0x1e22},
737 {'h', '.', 0x1e23},
738 {'H', ':', 0x1e26},
739 {'h', ':', 0x1e27},
740 {'H', ',', 0x1e28},
741 {'h', ',', 0x1e29},
742 {'K', '\'', 0x1e30},
743 {'k', '\'', 0x1e31},
744 {'K', '_', 0x1e34},
745 {'k', '_', 0x1e35},
746 {'L', '_', 0x1e3a},
747 {'l', '_', 0x1e3b},
748 {'M', '\'', 0x1e3e},
749 {'m', '\'', 0x1e3f},
750 {'M', '.', 0x1e40},
751 {'m', '.', 0x1e41},
752 {'N', '.', 0x1e44},
753 {'n', '.', 0x1e45},
754 {'N', '_', 0x1e48},
755 {'n', '_', 0x1e49},
756 {'P', '\'', 0x1e54},
757 {'p', '\'', 0x1e55},
758 {'P', '.', 0x1e56},
759 {'p', '.', 0x1e57},
760 {'R', '.', 0x1e58},
761 {'r', '.', 0x1e59},
762 {'R', '_', 0x1e5e},
763 {'r', '_', 0x1e5f},
764 {'S', '.', 0x1e60},
765 {'s', '.', 0x1e61},
766 {'T', '.', 0x1e6a},
767 {'t', '.', 0x1e6b},
768 {'T', '_', 0x1e6e},
769 {'t', '_', 0x1e6f},
770 {'V', '?', 0x1e7c},
771 {'v', '?', 0x1e7d},
772 {'W', '!', 0x1e80},
Bram Moolenaareae8ae12018-12-14 18:53:02 +0100773 {'W', '`', 0x1e80}, // extra alternative, easier to remember
Bram Moolenaar071d4272004-06-13 20:20:40 +0000774 {'w', '!', 0x1e81},
Bram Moolenaareae8ae12018-12-14 18:53:02 +0100775 {'w', '`', 0x1e81}, // extra alternative, easier to remember
Bram Moolenaar071d4272004-06-13 20:20:40 +0000776 {'W', '\'', 0x1e82},
777 {'w', '\'', 0x1e83},
778 {'W', ':', 0x1e84},
779 {'w', ':', 0x1e85},
780 {'W', '.', 0x1e86},
781 {'w', '.', 0x1e87},
782 {'X', '.', 0x1e8a},
783 {'x', '.', 0x1e8b},
784 {'X', ':', 0x1e8c},
785 {'x', ':', 0x1e8d},
786 {'Y', '.', 0x1e8e},
787 {'y', '.', 0x1e8f},
788 {'Z', '>', 0x1e90},
789 {'z', '>', 0x1e91},
790 {'Z', '_', 0x1e94},
791 {'z', '_', 0x1e95},
792 {'h', '_', 0x1e96},
793 {'t', ':', 0x1e97},
794 {'w', '0', 0x1e98},
795 {'y', '0', 0x1e99},
796 {'A', '2', 0x1ea2},
797 {'a', '2', 0x1ea3},
798 {'E', '2', 0x1eba},
799 {'e', '2', 0x1ebb},
800 {'E', '?', 0x1ebc},
801 {'e', '?', 0x1ebd},
802 {'I', '2', 0x1ec8},
803 {'i', '2', 0x1ec9},
804 {'O', '2', 0x1ece},
805 {'o', '2', 0x1ecf},
806 {'U', '2', 0x1ee6},
807 {'u', '2', 0x1ee7},
808 {'Y', '!', 0x1ef2},
Bram Moolenaareae8ae12018-12-14 18:53:02 +0100809 {'Y', '`', 0x1ef2}, // extra alternative, easier to remember
Bram Moolenaar071d4272004-06-13 20:20:40 +0000810 {'y', '!', 0x1ef3},
Bram Moolenaareae8ae12018-12-14 18:53:02 +0100811 {'y', '`', 0x1ef3}, // extra alternative, easier to remember
Bram Moolenaar071d4272004-06-13 20:20:40 +0000812 {'Y', '2', 0x1ef6},
813 {'y', '2', 0x1ef7},
814 {'Y', '?', 0x1ef8},
815 {'y', '?', 0x1ef9},
Bram Moolenaare3f915d2020-07-14 23:02:44 +0200816# define DG_START_GREEK_EXTENDED 0x1f00
Bram Moolenaar071d4272004-06-13 20:20:40 +0000817 {';', '\'', 0x1f00},
818 {',', '\'', 0x1f01},
819 {';', '!', 0x1f02},
820 {',', '!', 0x1f03},
821 {'?', ';', 0x1f04},
822 {'?', ',', 0x1f05},
823 {'!', ':', 0x1f06},
824 {'?', ':', 0x1f07},
Bram Moolenaare3f915d2020-07-14 23:02:44 +0200825# define DG_START_PUNCTUATION 0x2002
Bram Moolenaar071d4272004-06-13 20:20:40 +0000826 {'1', 'N', 0x2002},
827 {'1', 'M', 0x2003},
828 {'3', 'M', 0x2004},
829 {'4', 'M', 0x2005},
830 {'6', 'M', 0x2006},
831 {'1', 'T', 0x2009},
832 {'1', 'H', 0x200a},
833 {'-', '1', 0x2010},
834 {'-', 'N', 0x2013},
835 {'-', 'M', 0x2014},
836 {'-', '3', 0x2015},
837 {'!', '2', 0x2016},
838 {'=', '2', 0x2017},
839 {'\'', '6', 0x2018},
840 {'\'', '9', 0x2019},
841 {'.', '9', 0x201a},
842 {'9', '\'', 0x201b},
843 {'"', '6', 0x201c},
844 {'"', '9', 0x201d},
845 {':', '9', 0x201e},
846 {'9', '"', 0x201f},
847 {'/', '-', 0x2020},
848 {'/', '=', 0x2021},
Bram Moolenaar57ad94c2020-09-08 19:06:30 +0200849 {'o', 'o', 0x2022},
Bram Moolenaar071d4272004-06-13 20:20:40 +0000850 {'.', '.', 0x2025},
Bram Moolenaar81615512016-11-04 22:17:16 +0100851 {',', '.', 0x2026},
Bram Moolenaar071d4272004-06-13 20:20:40 +0000852 {'%', '0', 0x2030},
853 {'1', '\'', 0x2032},
854 {'2', '\'', 0x2033},
855 {'3', '\'', 0x2034},
Jonathan Wright47416d12023-10-20 12:08:09 +0200856 {'4', '\'', 0x2057},
Bram Moolenaar071d4272004-06-13 20:20:40 +0000857 {'1', '"', 0x2035},
858 {'2', '"', 0x2036},
859 {'3', '"', 0x2037},
860 {'C', 'a', 0x2038},
861 {'<', '1', 0x2039},
862 {'>', '1', 0x203a},
863 {':', 'X', 0x203b},
864 {'\'', '-', 0x203e},
865 {'/', 'f', 0x2044},
Bram Moolenaare3f915d2020-07-14 23:02:44 +0200866# define DG_START_SUB_SUPER 0x2070
Bram Moolenaar071d4272004-06-13 20:20:40 +0000867 {'0', 'S', 0x2070},
868 {'4', 'S', 0x2074},
869 {'5', 'S', 0x2075},
870 {'6', 'S', 0x2076},
871 {'7', 'S', 0x2077},
872 {'8', 'S', 0x2078},
873 {'9', 'S', 0x2079},
874 {'+', 'S', 0x207a},
875 {'-', 'S', 0x207b},
876 {'=', 'S', 0x207c},
877 {'(', 'S', 0x207d},
878 {')', 'S', 0x207e},
879 {'n', 'S', 0x207f},
880 {'0', 's', 0x2080},
881 {'1', 's', 0x2081},
882 {'2', 's', 0x2082},
883 {'3', 's', 0x2083},
884 {'4', 's', 0x2084},
885 {'5', 's', 0x2085},
886 {'6', 's', 0x2086},
887 {'7', 's', 0x2087},
888 {'8', 's', 0x2088},
889 {'9', 's', 0x2089},
890 {'+', 's', 0x208a},
891 {'-', 's', 0x208b},
892 {'=', 's', 0x208c},
893 {'(', 's', 0x208d},
894 {')', 's', 0x208e},
Bram Moolenaare3f915d2020-07-14 23:02:44 +0200895# define DG_START_CURRENCY 0x20a4
Bram Moolenaar071d4272004-06-13 20:20:40 +0000896 {'L', 'i', 0x20a4},
897 {'P', 't', 0x20a7},
898 {'W', '=', 0x20a9},
Bram Moolenaar5d18efe2019-12-01 21:11:22 +0100899 {'=', 'e', 0x20ac}, // euro
900 {'E', 'u', 0x20ac}, // euro
901 {'=', 'R', 0x20bd}, // rouble
902 {'=', 'P', 0x20bd}, // rouble
Bram Moolenaare3f915d2020-07-14 23:02:44 +0200903# define DG_START_OTHER1 0x2103
Bram Moolenaar071d4272004-06-13 20:20:40 +0000904 {'o', 'C', 0x2103},
905 {'c', 'o', 0x2105},
906 {'o', 'F', 0x2109},
907 {'N', '0', 0x2116},
908 {'P', 'O', 0x2117},
909 {'R', 'x', 0x211e},
910 {'S', 'M', 0x2120},
911 {'T', 'M', 0x2122},
912 {'O', 'm', 0x2126},
913 {'A', 'O', 0x212b},
914 {'1', '3', 0x2153},
915 {'2', '3', 0x2154},
916 {'1', '5', 0x2155},
917 {'2', '5', 0x2156},
918 {'3', '5', 0x2157},
919 {'4', '5', 0x2158},
920 {'1', '6', 0x2159},
921 {'5', '6', 0x215a},
922 {'1', '8', 0x215b},
923 {'3', '8', 0x215c},
924 {'5', '8', 0x215d},
925 {'7', '8', 0x215e},
Bram Moolenaare3f915d2020-07-14 23:02:44 +0200926# define DG_START_ROMAN 0x2160
Bram Moolenaar071d4272004-06-13 20:20:40 +0000927 {'1', 'R', 0x2160},
928 {'2', 'R', 0x2161},
929 {'3', 'R', 0x2162},
930 {'4', 'R', 0x2163},
931 {'5', 'R', 0x2164},
932 {'6', 'R', 0x2165},
933 {'7', 'R', 0x2166},
934 {'8', 'R', 0x2167},
935 {'9', 'R', 0x2168},
936 {'a', 'R', 0x2169},
937 {'b', 'R', 0x216a},
938 {'c', 'R', 0x216b},
939 {'1', 'r', 0x2170},
940 {'2', 'r', 0x2171},
941 {'3', 'r', 0x2172},
942 {'4', 'r', 0x2173},
943 {'5', 'r', 0x2174},
944 {'6', 'r', 0x2175},
945 {'7', 'r', 0x2176},
946 {'8', 'r', 0x2177},
947 {'9', 'r', 0x2178},
948 {'a', 'r', 0x2179},
949 {'b', 'r', 0x217a},
950 {'c', 'r', 0x217b},
Bram Moolenaare3f915d2020-07-14 23:02:44 +0200951# define DG_START_ARROWS 0x2190
Bram Moolenaar071d4272004-06-13 20:20:40 +0000952 {'<', '-', 0x2190},
953 {'-', '!', 0x2191},
954 {'-', '>', 0x2192},
955 {'-', 'v', 0x2193},
956 {'<', '>', 0x2194},
957 {'U', 'D', 0x2195},
958 {'<', '=', 0x21d0},
959 {'=', '>', 0x21d2},
960 {'=', '=', 0x21d4},
Bram Moolenaare3f915d2020-07-14 23:02:44 +0200961# define DG_START_MATH 0x2200
Bram Moolenaar071d4272004-06-13 20:20:40 +0000962 {'F', 'A', 0x2200},
963 {'d', 'P', 0x2202},
964 {'T', 'E', 0x2203},
965 {'/', '0', 0x2205},
966 {'D', 'E', 0x2206},
967 {'N', 'B', 0x2207},
968 {'(', '-', 0x2208},
969 {'-', ')', 0x220b},
970 {'*', 'P', 0x220f},
971 {'+', 'Z', 0x2211},
972 {'-', '2', 0x2212},
973 {'-', '+', 0x2213},
974 {'*', '-', 0x2217},
975 {'O', 'b', 0x2218},
976 {'S', 'b', 0x2219},
977 {'R', 'T', 0x221a},
978 {'0', '(', 0x221d},
979 {'0', '0', 0x221e},
980 {'-', 'L', 0x221f},
981 {'-', 'V', 0x2220},
982 {'P', 'P', 0x2225},
983 {'A', 'N', 0x2227},
984 {'O', 'R', 0x2228},
985 {'(', 'U', 0x2229},
986 {')', 'U', 0x222a},
987 {'I', 'n', 0x222b},
988 {'D', 'I', 0x222c},
989 {'I', 'o', 0x222e},
990 {'.', ':', 0x2234},
991 {':', '.', 0x2235},
992 {':', 'R', 0x2236},
993 {':', ':', 0x2237},
994 {'?', '1', 0x223c},
995 {'C', 'G', 0x223e},
996 {'?', '-', 0x2243},
997 {'?', '=', 0x2245},
998 {'?', '2', 0x2248},
999 {'=', '?', 0x224c},
1000 {'H', 'I', 0x2253},
1001 {'!', '=', 0x2260},
1002 {'=', '3', 0x2261},
1003 {'=', '<', 0x2264},
1004 {'>', '=', 0x2265},
1005 {'<', '*', 0x226a},
1006 {'*', '>', 0x226b},
1007 {'!', '<', 0x226e},
1008 {'!', '>', 0x226f},
1009 {'(', 'C', 0x2282},
1010 {')', 'C', 0x2283},
1011 {'(', '_', 0x2286},
1012 {')', '_', 0x2287},
1013 {'0', '.', 0x2299},
1014 {'0', '2', 0x229a},
1015 {'-', 'T', 0x22a5},
1016 {'.', 'P', 0x22c5},
1017 {':', '3', 0x22ee},
1018 {'.', '3', 0x22ef},
Bram Moolenaare3f915d2020-07-14 23:02:44 +02001019# define DG_START_TECHNICAL 0x2302
Bram Moolenaar071d4272004-06-13 20:20:40 +00001020 {'E', 'h', 0x2302},
1021 {'<', '7', 0x2308},
1022 {'>', '7', 0x2309},
1023 {'7', '<', 0x230a},
1024 {'7', '>', 0x230b},
1025 {'N', 'I', 0x2310},
1026 {'(', 'A', 0x2312},
1027 {'T', 'R', 0x2315},
1028 {'I', 'u', 0x2320},
1029 {'I', 'l', 0x2321},
1030 {'<', '/', 0x2329},
1031 {'/', '>', 0x232a},
Bram Moolenaare3f915d2020-07-14 23:02:44 +02001032# define DG_START_OTHER2 0x2423
Bram Moolenaar071d4272004-06-13 20:20:40 +00001033 {'V', 's', 0x2423},
1034 {'1', 'h', 0x2440},
1035 {'3', 'h', 0x2441},
1036 {'2', 'h', 0x2442},
1037 {'4', 'h', 0x2443},
1038 {'1', 'j', 0x2446},
1039 {'2', 'j', 0x2447},
1040 {'3', 'j', 0x2448},
1041 {'4', 'j', 0x2449},
1042 {'1', '.', 0x2488},
1043 {'2', '.', 0x2489},
1044 {'3', '.', 0x248a},
1045 {'4', '.', 0x248b},
1046 {'5', '.', 0x248c},
1047 {'6', '.', 0x248d},
1048 {'7', '.', 0x248e},
1049 {'8', '.', 0x248f},
1050 {'9', '.', 0x2490},
Bram Moolenaare3f915d2020-07-14 23:02:44 +02001051# define DG_START_DRAWING 0x2500
Bram Moolenaar071d4272004-06-13 20:20:40 +00001052 {'h', 'h', 0x2500},
1053 {'H', 'H', 0x2501},
1054 {'v', 'v', 0x2502},
1055 {'V', 'V', 0x2503},
1056 {'3', '-', 0x2504},
1057 {'3', '_', 0x2505},
1058 {'3', '!', 0x2506},
1059 {'3', '/', 0x2507},
1060 {'4', '-', 0x2508},
1061 {'4', '_', 0x2509},
1062 {'4', '!', 0x250a},
1063 {'4', '/', 0x250b},
1064 {'d', 'r', 0x250c},
1065 {'d', 'R', 0x250d},
1066 {'D', 'r', 0x250e},
1067 {'D', 'R', 0x250f},
1068 {'d', 'l', 0x2510},
1069 {'d', 'L', 0x2511},
1070 {'D', 'l', 0x2512},
1071 {'L', 'D', 0x2513},
1072 {'u', 'r', 0x2514},
1073 {'u', 'R', 0x2515},
1074 {'U', 'r', 0x2516},
1075 {'U', 'R', 0x2517},
1076 {'u', 'l', 0x2518},
1077 {'u', 'L', 0x2519},
1078 {'U', 'l', 0x251a},
1079 {'U', 'L', 0x251b},
1080 {'v', 'r', 0x251c},
1081 {'v', 'R', 0x251d},
1082 {'V', 'r', 0x2520},
1083 {'V', 'R', 0x2523},
1084 {'v', 'l', 0x2524},
1085 {'v', 'L', 0x2525},
1086 {'V', 'l', 0x2528},
1087 {'V', 'L', 0x252b},
1088 {'d', 'h', 0x252c},
1089 {'d', 'H', 0x252f},
1090 {'D', 'h', 0x2530},
1091 {'D', 'H', 0x2533},
1092 {'u', 'h', 0x2534},
1093 {'u', 'H', 0x2537},
1094 {'U', 'h', 0x2538},
1095 {'U', 'H', 0x253b},
1096 {'v', 'h', 0x253c},
1097 {'v', 'H', 0x253f},
1098 {'V', 'h', 0x2542},
1099 {'V', 'H', 0x254b},
1100 {'F', 'D', 0x2571},
1101 {'B', 'D', 0x2572},
Bram Moolenaare3f915d2020-07-14 23:02:44 +02001102# define DG_START_BLOCK 0x2580
Bram Moolenaar071d4272004-06-13 20:20:40 +00001103 {'T', 'B', 0x2580},
1104 {'L', 'B', 0x2584},
1105 {'F', 'B', 0x2588},
1106 {'l', 'B', 0x258c},
1107 {'R', 'B', 0x2590},
1108 {'.', 'S', 0x2591},
1109 {':', 'S', 0x2592},
1110 {'?', 'S', 0x2593},
Bram Moolenaare3f915d2020-07-14 23:02:44 +02001111# define DG_START_SHAPES 0x25a0
Bram Moolenaar071d4272004-06-13 20:20:40 +00001112 {'f', 'S', 0x25a0},
1113 {'O', 'S', 0x25a1},
1114 {'R', 'O', 0x25a2},
1115 {'R', 'r', 0x25a3},
1116 {'R', 'F', 0x25a4},
1117 {'R', 'Y', 0x25a5},
1118 {'R', 'H', 0x25a6},
1119 {'R', 'Z', 0x25a7},
1120 {'R', 'K', 0x25a8},
1121 {'R', 'X', 0x25a9},
1122 {'s', 'B', 0x25aa},
1123 {'S', 'R', 0x25ac},
1124 {'O', 'r', 0x25ad},
1125 {'U', 'T', 0x25b2},
1126 {'u', 'T', 0x25b3},
1127 {'P', 'R', 0x25b6},
1128 {'T', 'r', 0x25b7},
1129 {'D', 't', 0x25bc},
1130 {'d', 'T', 0x25bd},
1131 {'P', 'L', 0x25c0},
1132 {'T', 'l', 0x25c1},
1133 {'D', 'b', 0x25c6},
1134 {'D', 'w', 0x25c7},
1135 {'L', 'Z', 0x25ca},
1136 {'0', 'm', 0x25cb},
1137 {'0', 'o', 0x25ce},
1138 {'0', 'M', 0x25cf},
1139 {'0', 'L', 0x25d0},
1140 {'0', 'R', 0x25d1},
1141 {'S', 'n', 0x25d8},
1142 {'I', 'c', 0x25d9},
1143 {'F', 'd', 0x25e2},
1144 {'B', 'd', 0x25e3},
Bram Moolenaare3f915d2020-07-14 23:02:44 +02001145# define DG_START_SYMBOLS 0x2605
Bram Moolenaar071d4272004-06-13 20:20:40 +00001146 {'*', '2', 0x2605},
1147 {'*', '1', 0x2606},
1148 {'<', 'H', 0x261c},
1149 {'>', 'H', 0x261e},
1150 {'0', 'u', 0x263a},
1151 {'0', 'U', 0x263b},
1152 {'S', 'U', 0x263c},
1153 {'F', 'm', 0x2640},
1154 {'M', 'l', 0x2642},
1155 {'c', 'S', 0x2660},
1156 {'c', 'H', 0x2661},
1157 {'c', 'D', 0x2662},
1158 {'c', 'C', 0x2663},
1159 {'M', 'd', 0x2669},
1160 {'M', '8', 0x266a},
1161 {'M', '2', 0x266b},
1162 {'M', 'b', 0x266d},
1163 {'M', 'x', 0x266e},
1164 {'M', 'X', 0x266f},
Bram Moolenaare3f915d2020-07-14 23:02:44 +02001165# define DG_START_DINGBATS 0x2713
Bram Moolenaar071d4272004-06-13 20:20:40 +00001166 {'O', 'K', 0x2713},
1167 {'X', 'X', 0x2717},
1168 {'-', 'X', 0x2720},
Bram Moolenaare3f915d2020-07-14 23:02:44 +02001169# define DG_START_CJK_SYMBOLS 0x3000
Bram Moolenaar071d4272004-06-13 20:20:40 +00001170 {'I', 'S', 0x3000},
1171 {',', '_', 0x3001},
1172 {'.', '_', 0x3002},
1173 {'+', '"', 0x3003},
1174 {'+', '_', 0x3004},
1175 {'*', '_', 0x3005},
1176 {';', '_', 0x3006},
1177 {'0', '_', 0x3007},
1178 {'<', '+', 0x300a},
1179 {'>', '+', 0x300b},
1180 {'<', '\'', 0x300c},
1181 {'>', '\'', 0x300d},
1182 {'<', '"', 0x300e},
1183 {'>', '"', 0x300f},
1184 {'(', '"', 0x3010},
1185 {')', '"', 0x3011},
1186 {'=', 'T', 0x3012},
1187 {'=', '_', 0x3013},
1188 {'(', '\'', 0x3014},
1189 {')', '\'', 0x3015},
1190 {'(', 'I', 0x3016},
1191 {')', 'I', 0x3017},
1192 {'-', '?', 0x301c},
Bram Moolenaare3f915d2020-07-14 23:02:44 +02001193# define DG_START_HIRAGANA 0x3041
Bram Moolenaar071d4272004-06-13 20:20:40 +00001194 {'A', '5', 0x3041},
1195 {'a', '5', 0x3042},
1196 {'I', '5', 0x3043},
1197 {'i', '5', 0x3044},
1198 {'U', '5', 0x3045},
1199 {'u', '5', 0x3046},
1200 {'E', '5', 0x3047},
1201 {'e', '5', 0x3048},
1202 {'O', '5', 0x3049},
1203 {'o', '5', 0x304a},
1204 {'k', 'a', 0x304b},
1205 {'g', 'a', 0x304c},
1206 {'k', 'i', 0x304d},
1207 {'g', 'i', 0x304e},
1208 {'k', 'u', 0x304f},
1209 {'g', 'u', 0x3050},
1210 {'k', 'e', 0x3051},
1211 {'g', 'e', 0x3052},
1212 {'k', 'o', 0x3053},
1213 {'g', 'o', 0x3054},
1214 {'s', 'a', 0x3055},
1215 {'z', 'a', 0x3056},
1216 {'s', 'i', 0x3057},
1217 {'z', 'i', 0x3058},
1218 {'s', 'u', 0x3059},
1219 {'z', 'u', 0x305a},
1220 {'s', 'e', 0x305b},
1221 {'z', 'e', 0x305c},
1222 {'s', 'o', 0x305d},
1223 {'z', 'o', 0x305e},
1224 {'t', 'a', 0x305f},
1225 {'d', 'a', 0x3060},
1226 {'t', 'i', 0x3061},
1227 {'d', 'i', 0x3062},
1228 {'t', 'U', 0x3063},
1229 {'t', 'u', 0x3064},
1230 {'d', 'u', 0x3065},
1231 {'t', 'e', 0x3066},
1232 {'d', 'e', 0x3067},
1233 {'t', 'o', 0x3068},
1234 {'d', 'o', 0x3069},
1235 {'n', 'a', 0x306a},
1236 {'n', 'i', 0x306b},
1237 {'n', 'u', 0x306c},
1238 {'n', 'e', 0x306d},
1239 {'n', 'o', 0x306e},
1240 {'h', 'a', 0x306f},
1241 {'b', 'a', 0x3070},
1242 {'p', 'a', 0x3071},
1243 {'h', 'i', 0x3072},
1244 {'b', 'i', 0x3073},
1245 {'p', 'i', 0x3074},
1246 {'h', 'u', 0x3075},
1247 {'b', 'u', 0x3076},
1248 {'p', 'u', 0x3077},
1249 {'h', 'e', 0x3078},
1250 {'b', 'e', 0x3079},
1251 {'p', 'e', 0x307a},
1252 {'h', 'o', 0x307b},
1253 {'b', 'o', 0x307c},
1254 {'p', 'o', 0x307d},
1255 {'m', 'a', 0x307e},
1256 {'m', 'i', 0x307f},
1257 {'m', 'u', 0x3080},
1258 {'m', 'e', 0x3081},
1259 {'m', 'o', 0x3082},
1260 {'y', 'A', 0x3083},
1261 {'y', 'a', 0x3084},
1262 {'y', 'U', 0x3085},
1263 {'y', 'u', 0x3086},
1264 {'y', 'O', 0x3087},
1265 {'y', 'o', 0x3088},
1266 {'r', 'a', 0x3089},
1267 {'r', 'i', 0x308a},
1268 {'r', 'u', 0x308b},
1269 {'r', 'e', 0x308c},
1270 {'r', 'o', 0x308d},
1271 {'w', 'A', 0x308e},
1272 {'w', 'a', 0x308f},
1273 {'w', 'i', 0x3090},
1274 {'w', 'e', 0x3091},
1275 {'w', 'o', 0x3092},
1276 {'n', '5', 0x3093},
1277 {'v', 'u', 0x3094},
1278 {'"', '5', 0x309b},
1279 {'0', '5', 0x309c},
1280 {'*', '5', 0x309d},
1281 {'+', '5', 0x309e},
Bram Moolenaare3f915d2020-07-14 23:02:44 +02001282# define DG_START_KATAKANA 0x30a1
Bram Moolenaar071d4272004-06-13 20:20:40 +00001283 {'a', '6', 0x30a1},
1284 {'A', '6', 0x30a2},
1285 {'i', '6', 0x30a3},
1286 {'I', '6', 0x30a4},
1287 {'u', '6', 0x30a5},
1288 {'U', '6', 0x30a6},
1289 {'e', '6', 0x30a7},
1290 {'E', '6', 0x30a8},
1291 {'o', '6', 0x30a9},
1292 {'O', '6', 0x30aa},
1293 {'K', 'a', 0x30ab},
1294 {'G', 'a', 0x30ac},
1295 {'K', 'i', 0x30ad},
1296 {'G', 'i', 0x30ae},
1297 {'K', 'u', 0x30af},
1298 {'G', 'u', 0x30b0},
1299 {'K', 'e', 0x30b1},
1300 {'G', 'e', 0x30b2},
1301 {'K', 'o', 0x30b3},
1302 {'G', 'o', 0x30b4},
1303 {'S', 'a', 0x30b5},
1304 {'Z', 'a', 0x30b6},
1305 {'S', 'i', 0x30b7},
1306 {'Z', 'i', 0x30b8},
1307 {'S', 'u', 0x30b9},
1308 {'Z', 'u', 0x30ba},
1309 {'S', 'e', 0x30bb},
1310 {'Z', 'e', 0x30bc},
1311 {'S', 'o', 0x30bd},
1312 {'Z', 'o', 0x30be},
1313 {'T', 'a', 0x30bf},
1314 {'D', 'a', 0x30c0},
1315 {'T', 'i', 0x30c1},
1316 {'D', 'i', 0x30c2},
1317 {'T', 'U', 0x30c3},
1318 {'T', 'u', 0x30c4},
1319 {'D', 'u', 0x30c5},
1320 {'T', 'e', 0x30c6},
1321 {'D', 'e', 0x30c7},
1322 {'T', 'o', 0x30c8},
1323 {'D', 'o', 0x30c9},
1324 {'N', 'a', 0x30ca},
1325 {'N', 'i', 0x30cb},
1326 {'N', 'u', 0x30cc},
1327 {'N', 'e', 0x30cd},
1328 {'N', 'o', 0x30ce},
1329 {'H', 'a', 0x30cf},
1330 {'B', 'a', 0x30d0},
1331 {'P', 'a', 0x30d1},
1332 {'H', 'i', 0x30d2},
1333 {'B', 'i', 0x30d3},
1334 {'P', 'i', 0x30d4},
1335 {'H', 'u', 0x30d5},
1336 {'B', 'u', 0x30d6},
1337 {'P', 'u', 0x30d7},
1338 {'H', 'e', 0x30d8},
1339 {'B', 'e', 0x30d9},
1340 {'P', 'e', 0x30da},
1341 {'H', 'o', 0x30db},
1342 {'B', 'o', 0x30dc},
1343 {'P', 'o', 0x30dd},
1344 {'M', 'a', 0x30de},
1345 {'M', 'i', 0x30df},
1346 {'M', 'u', 0x30e0},
1347 {'M', 'e', 0x30e1},
1348 {'M', 'o', 0x30e2},
1349 {'Y', 'A', 0x30e3},
1350 {'Y', 'a', 0x30e4},
1351 {'Y', 'U', 0x30e5},
1352 {'Y', 'u', 0x30e6},
1353 {'Y', 'O', 0x30e7},
1354 {'Y', 'o', 0x30e8},
1355 {'R', 'a', 0x30e9},
1356 {'R', 'i', 0x30ea},
1357 {'R', 'u', 0x30eb},
1358 {'R', 'e', 0x30ec},
1359 {'R', 'o', 0x30ed},
1360 {'W', 'A', 0x30ee},
1361 {'W', 'a', 0x30ef},
1362 {'W', 'i', 0x30f0},
1363 {'W', 'e', 0x30f1},
1364 {'W', 'o', 0x30f2},
1365 {'N', '6', 0x30f3},
1366 {'V', 'u', 0x30f4},
1367 {'K', 'A', 0x30f5},
1368 {'K', 'E', 0x30f6},
1369 {'V', 'a', 0x30f7},
1370 {'V', 'i', 0x30f8},
1371 {'V', 'e', 0x30f9},
1372 {'V', 'o', 0x30fa},
1373 {'.', '6', 0x30fb},
1374 {'-', '6', 0x30fc},
1375 {'*', '6', 0x30fd},
1376 {'+', '6', 0x30fe},
Bram Moolenaare3f915d2020-07-14 23:02:44 +02001377# define DG_START_BOPOMOFO 0x3105
Bram Moolenaar071d4272004-06-13 20:20:40 +00001378 {'b', '4', 0x3105},
1379 {'p', '4', 0x3106},
1380 {'m', '4', 0x3107},
1381 {'f', '4', 0x3108},
1382 {'d', '4', 0x3109},
1383 {'t', '4', 0x310a},
1384 {'n', '4', 0x310b},
1385 {'l', '4', 0x310c},
1386 {'g', '4', 0x310d},
1387 {'k', '4', 0x310e},
1388 {'h', '4', 0x310f},
1389 {'j', '4', 0x3110},
1390 {'q', '4', 0x3111},
1391 {'x', '4', 0x3112},
1392 {'z', 'h', 0x3113},
1393 {'c', 'h', 0x3114},
1394 {'s', 'h', 0x3115},
1395 {'r', '4', 0x3116},
1396 {'z', '4', 0x3117},
1397 {'c', '4', 0x3118},
1398 {'s', '4', 0x3119},
1399 {'a', '4', 0x311a},
1400 {'o', '4', 0x311b},
1401 {'e', '4', 0x311c},
1402 {'a', 'i', 0x311e},
1403 {'e', 'i', 0x311f},
1404 {'a', 'u', 0x3120},
1405 {'o', 'u', 0x3121},
1406 {'a', 'n', 0x3122},
1407 {'e', 'n', 0x3123},
1408 {'a', 'N', 0x3124},
1409 {'e', 'N', 0x3125},
1410 {'e', 'r', 0x3126},
1411 {'i', '4', 0x3127},
1412 {'u', '4', 0x3128},
1413 {'i', 'u', 0x3129},
1414 {'v', '4', 0x312a},
1415 {'n', 'G', 0x312b},
1416 {'g', 'n', 0x312c},
Bram Moolenaare3f915d2020-07-14 23:02:44 +02001417# define DG_START_OTHER3 0x3220
Bram Moolenaar071d4272004-06-13 20:20:40 +00001418 {'1', 'c', 0x3220},
1419 {'2', 'c', 0x3221},
1420 {'3', 'c', 0x3222},
1421 {'4', 'c', 0x3223},
1422 {'5', 'c', 0x3224},
1423 {'6', 'c', 0x3225},
1424 {'7', 'c', 0x3226},
1425 {'8', 'c', 0x3227},
1426 {'9', 'c', 0x3228},
Bram Moolenaar5d18efe2019-12-01 21:11:22 +01001427 // code points 0xe000 - 0xefff excluded, they have no assigned
1428 // characters, only used in proposals.
Bram Moolenaar071d4272004-06-13 20:20:40 +00001429 {'f', 'f', 0xfb00},
1430 {'f', 'i', 0xfb01},
1431 {'f', 'l', 0xfb02},
1432 {'f', 't', 0xfb05},
1433 {'s', 't', 0xfb06},
Bram Moolenaar5f91c0c2008-01-03 16:54:33 +00001434
Bram Moolenaare27d6e62022-08-30 15:05:30 +01001435 {NUL, NUL, NUL} // end marker
1436};
Bram Moolenaar071d4272004-06-13 20:20:40 +00001437
1438/*
1439 * handle digraphs after typing a character
1440 */
1441 int
Bram Moolenaar7454a062016-01-30 15:14:10 +01001442do_digraph(int c)
Bram Moolenaar071d4272004-06-13 20:20:40 +00001443{
Bram Moolenaar5d18efe2019-12-01 21:11:22 +01001444 static int backspaced; // character before K_BS
1445 static int lastchar; // last typed character
Bram Moolenaar071d4272004-06-13 20:20:40 +00001446
Bram Moolenaar5d18efe2019-12-01 21:11:22 +01001447 if (c == -1) // init values
Bram Moolenaar071d4272004-06-13 20:20:40 +00001448 {
1449 backspaced = -1;
1450 }
1451 else if (p_dg)
1452 {
1453 if (backspaced >= 0)
h-east29b85712021-07-26 21:54:04 +02001454 c = digraph_get(backspaced, c, FALSE);
Bram Moolenaar071d4272004-06-13 20:20:40 +00001455 backspaced = -1;
1456 if ((c == K_BS || c == Ctrl_H) && lastchar >= 0)
1457 backspaced = lastchar;
1458 }
1459 lastchar = c;
1460 return c;
1461}
1462
1463/*
Bram Moolenaar5f73ef82018-02-27 21:09:30 +01001464 * Find a digraph for "val". If found return the string to display it.
1465 * If not found return NULL.
1466 */
1467 char_u *
Bram Moolenaarbc5020a2018-06-16 17:25:22 +02001468get_digraph_for_char(int val_arg)
Bram Moolenaar5f73ef82018-02-27 21:09:30 +01001469{
Bram Moolenaarbc5020a2018-06-16 17:25:22 +02001470 int val = val_arg;
Bram Moolenaar5f73ef82018-02-27 21:09:30 +01001471 int i;
1472 int use_defaults;
1473 digr_T *dp;
1474 static char_u r[3];
1475
Bram Moolenaareae8ae12018-12-14 18:53:02 +01001476#if defined(USE_UNICODE_DIGRAPHS)
Bram Moolenaarbc5020a2018-06-16 17:25:22 +02001477 if (!enc_utf8)
1478 {
1479 char_u buf[6], *to;
1480 vimconv_T vc;
1481
1482 // convert the character from 'encoding' to Unicode
1483 i = mb_char2bytes(val, buf);
1484 vc.vc_type = CONV_NONE;
1485 if (convert_setup(&vc, p_enc, (char_u *)"utf-8") == OK)
1486 {
1487 vc.vc_fail = TRUE;
1488 to = string_convert(&vc, buf, &i);
1489 if (to != NULL)
1490 {
1491 val = utf_ptr2char(to);
1492 vim_free(to);
1493 }
1494 (void)convert_setup(&vc, NULL, NULL);
1495 }
1496 }
1497#endif
1498
Bram Moolenaar5f73ef82018-02-27 21:09:30 +01001499 for (use_defaults = 0; use_defaults <= 1; use_defaults++)
1500 {
1501 if (use_defaults == 0)
1502 dp = (digr_T *)user_digraphs.ga_data;
1503 else
1504 dp = digraphdefault;
1505 for (i = 0; use_defaults ? dp->char1 != NUL
1506 : i < user_digraphs.ga_len; ++i)
1507 {
1508 if (dp->result == val)
1509 {
1510 r[0] = dp->char1;
1511 r[1] = dp->char2;
1512 r[2] = NUL;
1513 return r;
1514 }
1515 ++dp;
1516 }
1517 }
1518 return NULL;
1519}
1520
1521/*
Bram Moolenaar071d4272004-06-13 20:20:40 +00001522 * Get a digraph. Used after typing CTRL-K on the command line or in normal
1523 * mode.
1524 * Returns composed character, or NUL when ESC was used.
1525 */
1526 int
Bram Moolenaar7454a062016-01-30 15:14:10 +01001527get_digraph(
Bram Moolenaar5d18efe2019-12-01 21:11:22 +01001528 int cmdline) // TRUE when called from the cmdline
Bram Moolenaar071d4272004-06-13 20:20:40 +00001529{
1530 int c, cc;
1531
1532 ++no_mapping;
1533 ++allow_keys;
Bram Moolenaar61abfd12007-09-13 16:26:47 +00001534 c = plain_vgetc();
Bram Moolenaar071d4272004-06-13 20:20:40 +00001535 --no_mapping;
1536 --allow_keys;
Yegappan Lakshmanan1cfb14a2023-01-09 19:04:23 +00001537
1538 if (c == ESC) // ESC cancels CTRL-K
1539 return NUL;
1540
1541 if (IS_SPECIAL(c)) // insert special key code
1542 return c;
1543 if (cmdline)
Bram Moolenaar071d4272004-06-13 20:20:40 +00001544 {
Yegappan Lakshmanan1cfb14a2023-01-09 19:04:23 +00001545 if (char2cells(c) == 1
Bram Moolenaar071d4272004-06-13 20:20:40 +00001546#if defined(FEAT_CRYPT) || defined(FEAT_EVAL)
Yegappan Lakshmanan1cfb14a2023-01-09 19:04:23 +00001547 && cmdline_star == 0
Bram Moolenaar071d4272004-06-13 20:20:40 +00001548#endif
Yegappan Lakshmanan1cfb14a2023-01-09 19:04:23 +00001549 )
1550 putcmdline(c, TRUE);
Bram Moolenaar071d4272004-06-13 20:20:40 +00001551 }
Yegappan Lakshmanan1cfb14a2023-01-09 19:04:23 +00001552 else
1553 add_to_showcmd(c);
1554 ++no_mapping;
1555 ++allow_keys;
1556 cc = plain_vgetc();
1557 --no_mapping;
1558 --allow_keys;
1559 if (cc != ESC) // ESC cancels CTRL-K
1560 return digraph_get(c, cc, TRUE);
Bram Moolenaar071d4272004-06-13 20:20:40 +00001561 return NUL;
1562}
1563
1564/*
1565 * Lookup the pair "char1", "char2" in the digraph tables.
1566 * If no match, return "char2".
Bram Moolenaar70b2a562012-01-10 22:26:17 +01001567 * If "meta_char" is TRUE and "char1" is a space, return "char2" | 0x80.
Bram Moolenaar071d4272004-06-13 20:20:40 +00001568 */
1569 static int
Bram Moolenaar7454a062016-01-30 15:14:10 +01001570getexactdigraph(int char1, int char2, int meta_char)
Bram Moolenaar071d4272004-06-13 20:20:40 +00001571{
1572 int i;
1573 int retval = 0;
1574 digr_T *dp;
1575
1576 if (IS_SPECIAL(char1) || IS_SPECIAL(char2))
1577 return char2;
1578
1579 /*
1580 * Search user digraphs first.
1581 */
1582 dp = (digr_T *)user_digraphs.ga_data;
1583 for (i = 0; i < user_digraphs.ga_len; ++i)
1584 {
1585 if ((int)dp->char1 == char1 && (int)dp->char2 == char2)
1586 {
1587 retval = dp->result;
1588 break;
1589 }
1590 ++dp;
1591 }
1592
1593 /*
1594 * Search default digraphs.
1595 */
1596 if (retval == 0)
1597 {
1598 dp = digraphdefault;
dundargocb2209f22022-09-24 15:55:27 +01001599 while (dp->char1 != 0)
Bram Moolenaar071d4272004-06-13 20:20:40 +00001600 {
1601 if ((int)dp->char1 == char1 && (int)dp->char2 == char2)
1602 {
1603 retval = dp->result;
1604 break;
1605 }
1606 ++dp;
1607 }
1608 }
Bram Moolenaar13505972019-01-24 15:04:48 +01001609#ifdef USE_UNICODE_DIGRAPHS
Bram Moolenaar071d4272004-06-13 20:20:40 +00001610 if (retval != 0 && !enc_utf8)
1611 {
1612 char_u buf[6], *to;
1613 vimconv_T vc;
1614
1615 /*
1616 * Convert the Unicode digraph to 'encoding'.
1617 */
1618 i = utf_char2bytes(retval, buf);
1619 retval = 0;
1620 vc.vc_type = CONV_NONE;
1621 if (convert_setup(&vc, (char_u *)"utf-8", p_enc) == OK)
1622 {
1623 vc.vc_fail = TRUE;
1624 to = string_convert(&vc, buf, &i);
1625 if (to != NULL)
1626 {
1627 retval = (*mb_ptr2char)(to);
1628 vim_free(to);
1629 }
1630 (void)convert_setup(&vc, NULL, NULL);
1631 }
1632 }
Bram Moolenaar13505972019-01-24 15:04:48 +01001633#endif
Bram Moolenaar071d4272004-06-13 20:20:40 +00001634
Bram Moolenaar5d18efe2019-12-01 21:11:22 +01001635 // Ignore multi-byte characters when not in multi-byte mode.
Bram Moolenaar071d4272004-06-13 20:20:40 +00001636 if (!has_mbyte && retval > 0xff)
1637 retval = 0;
Bram Moolenaar071d4272004-06-13 20:20:40 +00001638
Bram Moolenaar5d18efe2019-12-01 21:11:22 +01001639 if (retval == 0) // digraph deleted or not found
Bram Moolenaar071d4272004-06-13 20:20:40 +00001640 {
Bram Moolenaar5d18efe2019-12-01 21:11:22 +01001641 if (char1 == ' ' && meta_char) // <space> <char> --> meta-char
Bram Moolenaar071d4272004-06-13 20:20:40 +00001642 return (char2 | 0x80);
1643 return char2;
1644 }
1645 return retval;
1646}
1647
1648/*
1649 * Get digraph.
1650 * Allow for both char1-char2 and char2-char1
1651 */
1652 int
h-east29b85712021-07-26 21:54:04 +02001653digraph_get(int char1, int char2, int meta_char)
Bram Moolenaar071d4272004-06-13 20:20:40 +00001654{
1655 int retval;
1656
Bram Moolenaar70b2a562012-01-10 22:26:17 +01001657 if (((retval = getexactdigraph(char1, char2, meta_char)) == char2)
Bram Moolenaar071d4272004-06-13 20:20:40 +00001658 && (char1 != char2)
Bram Moolenaar70b2a562012-01-10 22:26:17 +01001659 && ((retval = getexactdigraph(char2, char1, meta_char)) == char1))
Bram Moolenaar071d4272004-06-13 20:20:40 +00001660 return char2;
1661 return retval;
1662}
1663
1664/*
mityu61065042021-07-19 20:07:21 +02001665 * Add a digraph to the digraph table.
1666 */
1667 static void
1668registerdigraph(int char1, int char2, int n)
1669{
1670 int i;
1671 digr_T *dp;
1672
1673 // If the digraph already exists, replace "result".
1674 dp = (digr_T *)user_digraphs.ga_data;
1675 for (i = 0; i < user_digraphs.ga_len; ++i)
1676 {
1677 if ((int)dp->char1 == char1 && (int)dp->char2 == char2)
1678 {
1679 dp->result = n;
1680 return;
1681 }
1682 ++dp;
1683 }
1684
1685 // Add a new digraph to the table.
Yegappan Lakshmananfadc02a2023-01-27 21:03:12 +00001686 if (ga_grow(&user_digraphs, 1) == FAIL)
Yegappan Lakshmanan465de3a2022-12-26 12:50:04 +00001687 return;
1688
1689 dp = (digr_T *)user_digraphs.ga_data + user_digraphs.ga_len;
1690 dp->char1 = char1;
1691 dp->char2 = char2;
1692 dp->result = n;
1693 ++user_digraphs.ga_len;
mityu61065042021-07-19 20:07:21 +02001694}
1695
1696/*
1697 * Check the characters are valid for a digraph.
1698 * If they are valid, returns TRUE; otherwise, give an error message and
1699 * returns FALSE.
1700 */
Yegappan Lakshmanan8ee52af2021-08-09 19:59:06 +02001701 static int
mityu61065042021-07-19 20:07:21 +02001702check_digraph_chars_valid(int char1, int char2)
1703{
1704 if (char2 == 0)
1705 {
1706 char_u msg[MB_MAXBYTES + 1];
1707
1708 msg[mb_char2bytes(char1, msg)] = NUL;
1709
1710 semsg(_(e_digraph_must_be_just_two_characters_str), msg);
1711 return FALSE;
1712 }
1713 if (char1 == ESC || char2 == ESC)
1714 {
Bram Moolenaare1242042021-12-16 20:56:57 +00001715 emsg(_(e_escape_not_allowed_in_digraph));
mityu61065042021-07-19 20:07:21 +02001716 return FALSE;
1717 }
1718 return TRUE;
1719}
1720
1721
1722
1723/*
Bram Moolenaar071d4272004-06-13 20:20:40 +00001724 * Add the digraphs in the argument to the digraph table.
1725 * format: {c1}{c2} char {c1}{c2} char ...
1726 */
1727 void
Bram Moolenaar7454a062016-01-30 15:14:10 +01001728putdigraph(char_u *str)
Bram Moolenaar071d4272004-06-13 20:20:40 +00001729{
1730 int char1, char2, n;
Bram Moolenaar071d4272004-06-13 20:20:40 +00001731
1732 while (*str != NUL)
1733 {
1734 str = skipwhite(str);
1735 if (*str == NUL)
1736 return;
1737 char1 = *str++;
1738 char2 = *str++;
mityu61065042021-07-19 20:07:21 +02001739
1740 if (!check_digraph_chars_valid(char1, char2))
Bram Moolenaar071d4272004-06-13 20:20:40 +00001741 return;
mityu61065042021-07-19 20:07:21 +02001742
Bram Moolenaar071d4272004-06-13 20:20:40 +00001743 str = skipwhite(str);
1744 if (!VIM_ISDIGIT(*str))
1745 {
Bram Moolenaare29a27f2021-07-20 21:07:36 +02001746 emsg(_(e_number_expected));
Bram Moolenaar071d4272004-06-13 20:20:40 +00001747 return;
1748 }
1749 n = getdigits(&str);
1750
mityu61065042021-07-19 20:07:21 +02001751 registerdigraph(char1, char2, n);
Bram Moolenaar071d4272004-06-13 20:20:40 +00001752 }
1753}
1754
Bram Moolenaareae8ae12018-12-14 18:53:02 +01001755#if defined(USE_UNICODE_DIGRAPHS)
1756 static void
1757digraph_header(char *msg)
1758{
1759 if (msg_col > 0)
1760 msg_putchar('\n');
1761 msg_outtrans_attr((char_u *)msg, HL_ATTR(HLF_CM));
1762 msg_putchar('\n');
1763}
1764#endif
1765
Bram Moolenaar071d4272004-06-13 20:20:40 +00001766 void
Bram Moolenaareae8ae12018-12-14 18:53:02 +01001767listdigraphs(int use_headers)
Bram Moolenaar071d4272004-06-13 20:20:40 +00001768{
1769 int i;
1770 digr_T *dp;
Bram Moolenaareae8ae12018-12-14 18:53:02 +01001771 result_T previous = 0;
Bram Moolenaar071d4272004-06-13 20:20:40 +00001772
1773 msg_putchar('\n');
1774
1775 dp = digraphdefault;
dundargocb2209f22022-09-24 15:55:27 +01001776 while (dp->char1 != NUL && !got_int)
Bram Moolenaar071d4272004-06-13 20:20:40 +00001777 {
Bram Moolenaareae8ae12018-12-14 18:53:02 +01001778#if defined(USE_UNICODE_DIGRAPHS)
Bram Moolenaar071d4272004-06-13 20:20:40 +00001779 digr_T tmp;
1780
Bram Moolenaar5d18efe2019-12-01 21:11:22 +01001781 // May need to convert the result to 'encoding'.
Bram Moolenaar071d4272004-06-13 20:20:40 +00001782 tmp.char1 = dp->char1;
1783 tmp.char2 = dp->char2;
1784 tmp.result = getexactdigraph(tmp.char1, tmp.char2, FALSE);
1785 if (tmp.result != 0 && tmp.result != tmp.char2
1786 && (has_mbyte || tmp.result <= 255))
Bram Moolenaareae8ae12018-12-14 18:53:02 +01001787 printdigraph(&tmp, use_headers ? &previous : NULL);
Bram Moolenaar071d4272004-06-13 20:20:40 +00001788#else
1789
1790 if (getexactdigraph(dp->char1, dp->char2, FALSE) == dp->result
Bram Moolenaar13505972019-01-24 15:04:48 +01001791 && (has_mbyte || dp->result <= 255))
Bram Moolenaareae8ae12018-12-14 18:53:02 +01001792 printdigraph(dp, use_headers ? &previous : NULL);
Bram Moolenaar071d4272004-06-13 20:20:40 +00001793#endif
1794 ++dp;
1795 ui_breakcheck();
1796 }
1797
1798 dp = (digr_T *)user_digraphs.ga_data;
1799 for (i = 0; i < user_digraphs.ga_len && !got_int; ++i)
1800 {
Bram Moolenaareae8ae12018-12-14 18:53:02 +01001801#if defined(USE_UNICODE_DIGRAPHS)
1802 if (previous >= 0 && use_headers)
1803 digraph_header(_("Custom"));
1804 previous = -1;
1805#endif
1806 printdigraph(dp, NULL);
Bram Moolenaar071d4272004-06-13 20:20:40 +00001807 ui_breakcheck();
1808 ++dp;
1809 }
Bram Moolenaara4d158b2022-08-14 14:17:45 +01001810
1811 // clear screen, because some digraphs may be wrong, in which case we
1812 // messed up ScreenLines
Bram Moolenaar471c0fa2022-08-22 15:19:16 +01001813 set_must_redraw(UPD_CLEAR);
Bram Moolenaar071d4272004-06-13 20:20:40 +00001814}
1815
mityu61065042021-07-19 20:07:21 +02001816 static void
h-east29b85712021-07-26 21:54:04 +02001817digraph_getlist_appendpair(digr_T *dp, list_T *l)
mityu61065042021-07-19 20:07:21 +02001818{
1819 char_u buf[30];
1820 char_u *p;
1821 list_T *l2;
1822 listitem_T *li, *li2;
1823
1824
1825 li = listitem_alloc();
1826 if (li == NULL)
1827 return;
1828 list_append(l, li);
1829 li->li_tv.v_type = VAR_LIST;
1830 li->li_tv.v_lock = 0;
1831
1832 l2 = list_alloc();
1833 li->li_tv.vval.v_list = l2;
1834 if (l2 == NULL)
1835 return;
1836 ++l2->lv_refcount;
1837
1838 li2 = listitem_alloc();
1839 if (li2 == NULL)
1840 return;
1841 list_append(l2, li2);
1842 li2->li_tv.v_type = VAR_STRING;
1843 li2->li_tv.v_lock = 0;
1844
1845 buf[0] = dp->char1;
1846 buf[1] = dp->char2;
1847 buf[2] = NUL;
1848 li2->li_tv.vval.v_string = vim_strsave(&buf[0]);
1849
1850 li2 = listitem_alloc();
1851 if (li2 == NULL)
1852 return;
1853 list_append(l2, li2);
1854 li2->li_tv.v_type = VAR_STRING;
1855 li2->li_tv.v_lock = 0;
1856
1857 p = buf;
1858 if (has_mbyte)
1859 p += (*mb_char2bytes)(dp->result, p);
1860 else
1861 *p++ = (char_u)dp->result;
1862 *p = NUL;
1863
1864 li2->li_tv.vval.v_string = vim_strsave(buf);
1865}
1866
Yegappan Lakshmanan8ee52af2021-08-09 19:59:06 +02001867 static void
h-east29b85712021-07-26 21:54:04 +02001868digraph_getlist_common(int list_all, typval_T *rettv)
mityu61065042021-07-19 20:07:21 +02001869{
1870 int i;
1871 digr_T *dp;
1872
1873 if (rettv_list_alloc(rettv) == FAIL)
1874 return;
1875
1876 if (list_all)
1877 {
1878 dp = digraphdefault;
dundargocb2209f22022-09-24 15:55:27 +01001879 while (dp->char1 != NUL && !got_int)
mityu61065042021-07-19 20:07:21 +02001880 {
1881#ifdef USE_UNICODE_DIGRAPHS
1882 digr_T tmp;
1883
1884 tmp.char1 = dp->char1;
1885 tmp.char2 = dp->char2;
1886 tmp.result = getexactdigraph(tmp.char1, tmp.char2, FALSE);
1887 if (tmp.result != 0 && tmp.result != tmp.char2
1888 && (has_mbyte || tmp.result <= 255))
h-east29b85712021-07-26 21:54:04 +02001889 digraph_getlist_appendpair(&tmp, rettv->vval.v_list);
mityu61065042021-07-19 20:07:21 +02001890#else
1891 if (getexactdigraph(dp->char1, dp->char2, FALSE) == dp->result
1892 && (has_mbyte || dp->result <= 255))
h-east29b85712021-07-26 21:54:04 +02001893 digraph_getlist_appendpair(dp, rettv->vval.v_list);
mityu61065042021-07-19 20:07:21 +02001894#endif
1895 ++dp;
1896 }
1897 }
1898
1899 dp = (digr_T *)user_digraphs.ga_data;
1900 for (i = 0; i < user_digraphs.ga_len && !got_int; ++i)
1901 {
h-east29b85712021-07-26 21:54:04 +02001902 digraph_getlist_appendpair(dp, rettv->vval.v_list);
mityu61065042021-07-19 20:07:21 +02001903 ++dp;
1904 }
1905}
1906
Bram Moolenaar5843f5f2019-08-20 20:13:45 +02001907static struct dg_header_entry {
Bram Moolenaareae8ae12018-12-14 18:53:02 +01001908 int dg_start;
1909 char *dg_header;
1910} header_table[] = {
1911 {DG_START_LATIN, N_("Latin supplement")},
1912 {DG_START_GREEK, N_("Greek and Coptic")},
1913 {DG_START_CYRILLIC, N_("Cyrillic")},
1914 {DG_START_HEBREW, N_("Hebrew")},
1915 {DG_START_ARABIC, N_("Arabic")},
1916 {DG_START_LATIN_EXTENDED, N_("Latin extended")},
1917 {DG_START_GREEK_EXTENDED, N_("Greek extended")},
1918 {DG_START_PUNCTUATION, N_("Punctuation")},
1919 {DG_START_SUB_SUPER, N_("Super- and subscripts")},
1920 {DG_START_CURRENCY, N_("Currency")},
1921 {DG_START_OTHER1, N_("Other")},
1922 {DG_START_ROMAN, N_("Roman numbers")},
1923 {DG_START_ARROWS, N_("Arrows")},
1924 {DG_START_MATH, N_("Mathematical operators")},
1925 {DG_START_TECHNICAL, N_("Technical")},
1926 {DG_START_OTHER2, N_("Other")},
1927 {DG_START_DRAWING, N_("Box drawing")},
1928 {DG_START_BLOCK, N_("Block elements")},
1929 {DG_START_SHAPES, N_("Geometric shapes")},
1930 {DG_START_SYMBOLS, N_("Symbols")},
1931 {DG_START_DINGBATS, N_("Dingbats")},
1932 {DG_START_CJK_SYMBOLS, N_("CJK symbols and punctuation")},
1933 {DG_START_HIRAGANA, N_("Hiragana")},
1934 {DG_START_KATAKANA, N_("Katakana")},
1935 {DG_START_BOPOMOFO, N_("Bopomofo")},
1936 {DG_START_OTHER3, N_("Other")},
1937 {0xfffffff, NULL},
1938};
1939
Bram Moolenaar071d4272004-06-13 20:20:40 +00001940 static void
Bram Moolenaareae8ae12018-12-14 18:53:02 +01001941printdigraph(digr_T *dp, result_T *previous)
Bram Moolenaar071d4272004-06-13 20:20:40 +00001942{
1943 char_u buf[30];
1944 char_u *p;
1945
1946 int list_width;
1947
Bram Moolenaar13505972019-01-24 15:04:48 +01001948 if ((dy_flags & DY_UHEX) || has_mbyte)
Bram Moolenaar071d4272004-06-13 20:20:40 +00001949 list_width = 13;
1950 else
1951 list_width = 11;
1952
Yegappan Lakshmanan465de3a2022-12-26 12:50:04 +00001953 if (dp->result == 0)
1954 return;
1955
Bram Moolenaareae8ae12018-12-14 18:53:02 +01001956#if defined(USE_UNICODE_DIGRAPHS)
Yegappan Lakshmanan465de3a2022-12-26 12:50:04 +00001957 if (previous != NULL)
1958 {
1959 int i;
Bram Moolenaareae8ae12018-12-14 18:53:02 +01001960
Yegappan Lakshmanan465de3a2022-12-26 12:50:04 +00001961 for (i = 0; header_table[i].dg_header != NULL; ++i)
1962 if (*previous < header_table[i].dg_start
1963 && dp->result >= header_table[i].dg_start
1964 && dp->result < header_table[i + 1].dg_start)
1965 {
1966 digraph_header(_(header_table[i].dg_header));
1967 break;
1968 }
1969 *previous = dp->result;
Bram Moolenaar071d4272004-06-13 20:20:40 +00001970 }
Yegappan Lakshmanan465de3a2022-12-26 12:50:04 +00001971#endif
1972 if (msg_col > Columns - list_width)
1973 msg_putchar('\n');
1974 if (msg_col)
1975 while (msg_col % list_width != 0)
1976 msg_putchar(' ');
1977
1978 p = buf;
1979 *p++ = dp->char1;
1980 *p++ = dp->char2;
1981 *p++ = ' ';
1982 *p = NUL;
1983 msg_outtrans(buf);
1984 p = buf;
1985 if (has_mbyte)
1986 {
1987 // add a space to draw a composing char on
1988 if (enc_utf8 && utf_iscomposing(dp->result))
1989 *p++ = ' ';
1990 p += (*mb_char2bytes)(dp->result, p);
1991 }
1992 else
1993 *p++ = (char_u)dp->result;
1994 *p = NUL;
1995 msg_outtrans_attr(buf, HL_ATTR(HLF_8));
1996 p = buf;
1997 if (char2cells(dp->result) == 1)
1998 *p++ = ' ';
1999 vim_snprintf((char *)p, sizeof(buf) - (p - buf), " %3d", dp->result);
2000 msg_outtrans(buf);
Bram Moolenaar071d4272004-06-13 20:20:40 +00002001}
2002
mityu61065042021-07-19 20:07:21 +02002003# ifdef FEAT_EVAL
2004/*
2005 * Get the two digraph characters from a typval.
2006 * Return OK or FAIL.
2007 */
2008 static int
2009get_digraph_chars(typval_T *arg, int *char1, int *char2)
2010{
2011 char_u buf_chars[NUMBUFLEN];
2012 char_u *chars = tv_get_string_buf_chk(arg, buf_chars);
2013 char_u *p = chars;
2014
2015 if (p != NULL)
2016 {
2017 if (*p != NUL)
2018 {
2019 *char1 = mb_cptr2char_adv(&p);
2020 if (*p != NUL)
2021 {
2022 *char2 = mb_cptr2char_adv(&p);
2023 if (*p == NUL)
2024 {
2025 if (check_digraph_chars_valid(*char1, *char2))
2026 return OK;
2027 return FAIL;
2028 }
2029 }
2030 }
2031 }
2032 semsg(_(e_digraph_must_be_just_two_characters_str), chars);
2033 return FAIL;
2034}
2035
2036 static int
h-east29b85712021-07-26 21:54:04 +02002037digraph_set_common(typval_T *argchars, typval_T *argdigraph)
mityu61065042021-07-19 20:07:21 +02002038{
2039 int char1, char2;
2040 char_u *digraph;
2041 char_u *p;
2042 char_u buf_digraph[NUMBUFLEN];
2043 varnumber_T n;
2044
2045 if (get_digraph_chars(argchars, &char1, &char2) == FAIL)
2046 return FALSE;
2047
2048 digraph = tv_get_string_buf_chk(argdigraph, buf_digraph);
2049 if (digraph == NULL)
2050 return FALSE;
2051 p = digraph;
2052 n = mb_cptr2char_adv(&p);
2053 if (*p != NUL)
2054 {
2055 semsg(_(e_digraph_argument_must_be_one_character_str), digraph);
2056 return FALSE;
2057 }
2058
2059 registerdigraph(char1, char2, (int)n);
2060 return TRUE;
2061}
2062# endif
2063
Bram Moolenaar5d18efe2019-12-01 21:11:22 +01002064#endif // FEAT_DIGRAPHS
Bram Moolenaar071d4272004-06-13 20:20:40 +00002065
mityu61065042021-07-19 20:07:21 +02002066#if defined(FEAT_EVAL) || defined(PROTO)
2067/*
h-east29b85712021-07-26 21:54:04 +02002068 * "digraph_get()" function
mityu61065042021-07-19 20:07:21 +02002069 */
2070 void
h-east29b85712021-07-26 21:54:04 +02002071f_digraph_get(typval_T *argvars, typval_T *rettv)
mityu61065042021-07-19 20:07:21 +02002072{
2073# ifdef FEAT_DIGRAPHS
2074 int code;
2075 char_u buf[NUMBUFLEN];
2076 char_u *digraphs;
2077
2078 rettv->v_type = VAR_STRING;
2079 rettv->vval.v_string = NULL; // Return empty string for failure
Yegappan Lakshmanan4490ec42021-07-27 22:00:44 +02002080
2081 if (in_vim9script() && check_for_string_arg(argvars, 0) == FAIL)
2082 return;
2083
mityu61065042021-07-19 20:07:21 +02002084 digraphs = tv_get_string_chk(&argvars[0]);
2085
2086 if (digraphs == NULL)
2087 return;
2088 else if (STRLEN(digraphs) != 2)
2089 {
2090 semsg(_(e_digraph_must_be_just_two_characters_str), digraphs);
2091 return;
2092 }
h-east29b85712021-07-26 21:54:04 +02002093 code = digraph_get(digraphs[0], digraphs[1], FALSE);
mityu61065042021-07-19 20:07:21 +02002094
2095 if (has_mbyte)
2096 buf[(*mb_char2bytes)(code, buf)] = NUL;
Bram Moolenaarebfec1c2023-01-22 21:14:53 +00002097 else
2098 {
mityu61065042021-07-19 20:07:21 +02002099 buf[0] = code;
2100 buf[1] = NUL;
2101 }
2102
2103 rettv->vval.v_string = vim_strsave(buf);
2104# else
2105 emsg(_(e_no_digraphs_version));
2106# endif
2107}
2108
2109/*
h-east29b85712021-07-26 21:54:04 +02002110 * "digraph_getlist()" function
mityu61065042021-07-19 20:07:21 +02002111 */
2112 void
h-east29b85712021-07-26 21:54:04 +02002113f_digraph_getlist(typval_T *argvars, typval_T *rettv)
mityu61065042021-07-19 20:07:21 +02002114{
2115# ifdef FEAT_DIGRAPHS
2116 int flag_list_all;
2117
Yegappan Lakshmananfc3b7752021-09-08 14:57:42 +02002118 if (in_vim9script() && check_for_opt_bool_arg(argvars, 0) == FAIL)
Yegappan Lakshmanan4490ec42021-07-27 22:00:44 +02002119 return;
2120
mityu61065042021-07-19 20:07:21 +02002121 if (argvars[0].v_type == VAR_UNKNOWN)
2122 flag_list_all = FALSE;
2123 else
2124 {
Bram Moolenaar6ed545e2022-05-09 20:09:23 +01002125 int error = FALSE;
mityu61065042021-07-19 20:07:21 +02002126 varnumber_T flag = tv_get_number_chk(&argvars[0], &error);
Bram Moolenaar6ed545e2022-05-09 20:09:23 +01002127
mityu61065042021-07-19 20:07:21 +02002128 if (error)
2129 return;
2130 flag_list_all = flag ? TRUE : FALSE;
2131 }
2132
h-east29b85712021-07-26 21:54:04 +02002133 digraph_getlist_common(flag_list_all, rettv);
mityu61065042021-07-19 20:07:21 +02002134# else
2135 emsg(_(e_no_digraphs_version));
2136# endif
2137}
2138
2139/*
h-east29b85712021-07-26 21:54:04 +02002140 * "digraph_set()" function
mityu61065042021-07-19 20:07:21 +02002141 */
2142 void
h-east29b85712021-07-26 21:54:04 +02002143f_digraph_set(typval_T *argvars, typval_T *rettv)
mityu61065042021-07-19 20:07:21 +02002144{
2145# ifdef FEAT_DIGRAPHS
2146 rettv->v_type = VAR_BOOL;
2147 rettv->vval.v_number = VVAL_FALSE;
2148
Yegappan Lakshmanan4490ec42021-07-27 22:00:44 +02002149 if (in_vim9script()
2150 && (check_for_string_arg(argvars, 0) == FAIL
Yegappan Lakshmananfc3b7752021-09-08 14:57:42 +02002151 || check_for_string_arg(argvars, 1) == FAIL))
Yegappan Lakshmanan4490ec42021-07-27 22:00:44 +02002152 return;
2153
h-east29b85712021-07-26 21:54:04 +02002154 if (!digraph_set_common(&argvars[0], &argvars[1]))
mityu61065042021-07-19 20:07:21 +02002155 return;
2156
2157 rettv->vval.v_number = VVAL_TRUE;
2158# else
2159 emsg(_(e_no_digraphs_version));
2160# endif
2161}
2162
2163/*
h-east29b85712021-07-26 21:54:04 +02002164 * "digraph_setlist()" function
mityu61065042021-07-19 20:07:21 +02002165 */
2166 void
h-east29b85712021-07-26 21:54:04 +02002167f_digraph_setlist(typval_T * argvars, typval_T *rettv)
mityu61065042021-07-19 20:07:21 +02002168{
2169# ifdef FEAT_DIGRAPHS
2170 list_T *pl, *l;
2171 listitem_T *pli;
2172
2173 rettv->v_type = VAR_BOOL;
2174 rettv->vval.v_number = VVAL_FALSE;
2175
2176 if (argvars[0].v_type != VAR_LIST)
2177 {
h-east29b85712021-07-26 21:54:04 +02002178 emsg(_(e_digraph_setlist_argument_must_be_list_of_lists_with_two_items));
mityu61065042021-07-19 20:07:21 +02002179 return;
2180 }
2181
2182 pl = argvars[0].vval.v_list;
2183 if (pl == NULL)
2184 {
2185 // Empty list always results in success.
2186 rettv->vval.v_number = VVAL_TRUE;
2187 return;
2188 }
2189
2190 FOR_ALL_LIST_ITEMS(pl, pli)
2191 {
2192 if (pli->li_tv.v_type != VAR_LIST)
2193 {
h-east29b85712021-07-26 21:54:04 +02002194 emsg(_(e_digraph_setlist_argument_must_be_list_of_lists_with_two_items));
mityu61065042021-07-19 20:07:21 +02002195 return;
2196 }
2197
2198 l = pli->li_tv.vval.v_list;
2199 if (l == NULL || l->lv_len != 2)
2200 {
h-east29b85712021-07-26 21:54:04 +02002201 emsg(_(e_digraph_setlist_argument_must_be_list_of_lists_with_two_items));
mityu61065042021-07-19 20:07:21 +02002202 return;
2203 }
2204
h-east29b85712021-07-26 21:54:04 +02002205 if (!digraph_set_common(&l->lv_first->li_tv,
mityu61065042021-07-19 20:07:21 +02002206 &l->lv_first->li_next->li_tv))
2207 return;
2208 }
2209 rettv->vval.v_number = VVAL_TRUE;
2210# else
2211 emsg(_(e_no_digraphs_version));
2212# endif
2213}
2214
2215#endif // FEAT_EVAL
2216
2217
Bram Moolenaar071d4272004-06-13 20:20:40 +00002218#if defined(FEAT_KEYMAP) || defined(PROTO)
2219
Bram Moolenaar5d18efe2019-12-01 21:11:22 +01002220// structure used for b_kmap_ga.ga_data
Bram Moolenaar071d4272004-06-13 20:20:40 +00002221typedef struct
2222{
2223 char_u *from;
2224 char_u *to;
2225} kmap_T;
2226
Bram Moolenaar5d18efe2019-12-01 21:11:22 +01002227#define KMAP_MAXLEN 20 // maximum length of "from" or "to"
Bram Moolenaar071d4272004-06-13 20:20:40 +00002228
Bram Moolenaarf28dbce2016-01-29 22:03:47 +01002229static void keymap_unload(void);
Bram Moolenaar071d4272004-06-13 20:20:40 +00002230
2231/*
Bram Moolenaar0ab2a882009-05-13 10:51:08 +00002232 * Set up key mapping tables for the 'keymap' option.
2233 * Returns NULL if OK, an error message for failure. This only needs to be
2234 * used when setting the option, not later when the value has already been
2235 * checked.
Bram Moolenaar071d4272004-06-13 20:20:40 +00002236 */
Bram Moolenaarf9e3e092019-01-13 23:38:42 +01002237 char *
Bram Moolenaar7454a062016-01-30 15:14:10 +01002238keymap_init(void)
Bram Moolenaar071d4272004-06-13 20:20:40 +00002239{
2240 curbuf->b_kmap_state &= ~KEYMAP_INIT;
2241
2242 if (*curbuf->b_p_keymap == NUL)
2243 {
Bram Moolenaar5d18efe2019-12-01 21:11:22 +01002244 // Stop any active keymap and clear the table. Also remove
2245 // b:keymap_name, as no keymap is active now.
Bram Moolenaar071d4272004-06-13 20:20:40 +00002246 keymap_unload();
Bram Moolenaarbf444172007-07-07 11:58:28 +00002247 do_cmdline_cmd((char_u *)"unlet! b:keymap_name");
Bram Moolenaar071d4272004-06-13 20:20:40 +00002248 }
2249 else
2250 {
2251 char_u *buf;
Bram Moolenaar0ab2a882009-05-13 10:51:08 +00002252 size_t buflen;
Bram Moolenaar071d4272004-06-13 20:20:40 +00002253
Bram Moolenaar5d18efe2019-12-01 21:11:22 +01002254 // Source the keymap file. It will contain a ":loadkeymap" command
2255 // which will call ex_loadkeymap() below.
Bram Moolenaar13505972019-01-24 15:04:48 +01002256 buflen = STRLEN(curbuf->b_p_keymap) + STRLEN(p_enc) + 14;
Bram Moolenaar964b3742019-05-24 18:54:09 +02002257 buf = alloc(buflen);
Bram Moolenaar071d4272004-06-13 20:20:40 +00002258 if (buf == NULL)
Bram Moolenaare29a27f2021-07-20 21:07:36 +02002259 return e_out_of_memory;
Bram Moolenaar071d4272004-06-13 20:20:40 +00002260
Bram Moolenaar5d18efe2019-12-01 21:11:22 +01002261 // try finding "keymap/'keymap'_'encoding'.vim" in 'runtimepath'
Bram Moolenaar0ab2a882009-05-13 10:51:08 +00002262 vim_snprintf((char *)buf, buflen, "keymap/%s_%s.vim",
2263 curbuf->b_p_keymap, p_enc);
Bram Moolenaar7f8989d2016-03-12 22:11:39 +01002264 if (source_runtime(buf, 0) == FAIL)
Bram Moolenaar071d4272004-06-13 20:20:40 +00002265 {
Bram Moolenaar5d18efe2019-12-01 21:11:22 +01002266 // try finding "keymap/'keymap'.vim" in 'runtimepath'
Bram Moolenaar0ab2a882009-05-13 10:51:08 +00002267 vim_snprintf((char *)buf, buflen, "keymap/%s.vim",
2268 curbuf->b_p_keymap);
Bram Moolenaar7f8989d2016-03-12 22:11:39 +01002269 if (source_runtime(buf, 0) == FAIL)
Bram Moolenaar071d4272004-06-13 20:20:40 +00002270 {
2271 vim_free(buf);
Bram Moolenaar1d423ef2022-01-02 21:26:16 +00002272 return N_(e_keymap_file_not_found);
Bram Moolenaar071d4272004-06-13 20:20:40 +00002273 }
2274 }
2275 vim_free(buf);
2276 }
2277
2278 return NULL;
2279}
2280
2281/*
2282 * ":loadkeymap" command: load the following lines as the keymap.
2283 */
2284 void
Bram Moolenaar7454a062016-01-30 15:14:10 +01002285ex_loadkeymap(exarg_T *eap)
Bram Moolenaar071d4272004-06-13 20:20:40 +00002286{
2287 char_u *line;
2288 char_u *p;
2289 char_u *s;
2290 kmap_T *kp;
Bram Moolenaar5d18efe2019-12-01 21:11:22 +01002291#define KMAP_LLEN 200 // max length of "to" and "from" together
Bram Moolenaar071d4272004-06-13 20:20:40 +00002292 char_u buf[KMAP_LLEN + 11];
2293 int i;
2294 char_u *save_cpo = p_cpo;
2295
Yegappan Lakshmanan36a5b682022-03-19 12:56:51 +00002296 if (!sourcing_a_script(eap))
Bram Moolenaar071d4272004-06-13 20:20:40 +00002297 {
Bram Moolenaare1242042021-12-16 20:56:57 +00002298 emsg(_(e_using_loadkeymap_not_in_sourced_file));
Bram Moolenaar071d4272004-06-13 20:20:40 +00002299 return;
2300 }
2301
2302 /*
2303 * Stop any active keymap and clear the table.
2304 */
2305 keymap_unload();
2306
2307 curbuf->b_kmap_state = 0;
Bram Moolenaar04935fb2022-01-08 16:19:22 +00002308 ga_init2(&curbuf->b_kmap_ga, sizeof(kmap_T), 20);
Bram Moolenaar071d4272004-06-13 20:20:40 +00002309
Bram Moolenaar5d18efe2019-12-01 21:11:22 +01002310 // Set 'cpoptions' to "C" to avoid line continuation.
Bram Moolenaar071d4272004-06-13 20:20:40 +00002311 p_cpo = (char_u *)"C";
2312
2313 /*
2314 * Get each line of the sourced file, break at the end.
2315 */
2316 for (;;)
2317 {
Zoltan Arpadffy6fdb6282023-12-19 20:53:07 +01002318 line = eap->ea_getline(0, eap->cookie, 0, TRUE);
Bram Moolenaar071d4272004-06-13 20:20:40 +00002319 if (line == NULL)
2320 break;
2321
2322 p = skipwhite(line);
2323 if (*p != '"' && *p != NUL && ga_grow(&curbuf->b_kmap_ga, 1) == OK)
2324 {
2325 kp = (kmap_T *)curbuf->b_kmap_ga.ga_data + curbuf->b_kmap_ga.ga_len;
2326 s = skiptowhite(p);
Bram Moolenaardf44a272020-06-07 20:49:05 +02002327 kp->from = vim_strnsave(p, s - p);
Bram Moolenaar071d4272004-06-13 20:20:40 +00002328 p = skipwhite(s);
2329 s = skiptowhite(p);
Bram Moolenaardf44a272020-06-07 20:49:05 +02002330 kp->to = vim_strnsave(p, s - p);
Bram Moolenaar071d4272004-06-13 20:20:40 +00002331
2332 if (kp->from == NULL || kp->to == NULL
Bram Moolenaar57657d82006-04-21 22:12:41 +00002333 || STRLEN(kp->from) + STRLEN(kp->to) >= KMAP_LLEN
2334 || *kp->from == NUL || *kp->to == NUL)
Bram Moolenaar071d4272004-06-13 20:20:40 +00002335 {
Bram Moolenaar57657d82006-04-21 22:12:41 +00002336 if (kp->to != NULL && *kp->to == NUL)
Bram Moolenaar677658a2022-01-05 16:09:06 +00002337 emsg(_(e_empty_keymap_entry));
Bram Moolenaar071d4272004-06-13 20:20:40 +00002338 vim_free(kp->from);
2339 vim_free(kp->to);
2340 }
2341 else
Bram Moolenaar071d4272004-06-13 20:20:40 +00002342 ++curbuf->b_kmap_ga.ga_len;
Bram Moolenaar071d4272004-06-13 20:20:40 +00002343 }
2344 vim_free(line);
2345 }
2346
2347 /*
2348 * setup ":lnoremap" to map the keys
2349 */
2350 for (i = 0; i < curbuf->b_kmap_ga.ga_len; ++i)
2351 {
Bram Moolenaar555b2802005-05-19 21:08:39 +00002352 vim_snprintf((char *)buf, sizeof(buf), "<buffer> %s %s",
Bram Moolenaar071d4272004-06-13 20:20:40 +00002353 ((kmap_T *)curbuf->b_kmap_ga.ga_data)[i].from,
2354 ((kmap_T *)curbuf->b_kmap_ga.ga_data)[i].to);
zeertzjq44068e92022-06-16 11:14:55 +01002355 (void)do_map(MAPTYPE_NOREMAP, buf, MODE_LANGMAP, FALSE);
Bram Moolenaar071d4272004-06-13 20:20:40 +00002356 }
2357
2358 p_cpo = save_cpo;
2359
2360 curbuf->b_kmap_state |= KEYMAP_LOADED;
Bram Moolenaar071d4272004-06-13 20:20:40 +00002361 status_redraw_curbuf();
Bram Moolenaar071d4272004-06-13 20:20:40 +00002362}
2363
2364/*
2365 * Stop using 'keymap'.
2366 */
2367 static void
Bram Moolenaar7454a062016-01-30 15:14:10 +01002368keymap_unload(void)
Bram Moolenaar071d4272004-06-13 20:20:40 +00002369{
2370 char_u buf[KMAP_MAXLEN + 10];
2371 int i;
2372 char_u *save_cpo = p_cpo;
Bram Moolenaar8c8de832008-06-24 22:58:06 +00002373 kmap_T *kp;
Bram Moolenaar071d4272004-06-13 20:20:40 +00002374
2375 if (!(curbuf->b_kmap_state & KEYMAP_LOADED))
2376 return;
2377
Bram Moolenaar5d18efe2019-12-01 21:11:22 +01002378 // Set 'cpoptions' to "C" to avoid line continuation.
Bram Moolenaar071d4272004-06-13 20:20:40 +00002379 p_cpo = (char_u *)"C";
2380
Bram Moolenaar5d18efe2019-12-01 21:11:22 +01002381 // clear the ":lmap"s
Bram Moolenaar8c8de832008-06-24 22:58:06 +00002382 kp = (kmap_T *)curbuf->b_kmap_ga.ga_data;
Bram Moolenaar071d4272004-06-13 20:20:40 +00002383 for (i = 0; i < curbuf->b_kmap_ga.ga_len; ++i)
2384 {
Bram Moolenaar8c8de832008-06-24 22:58:06 +00002385 vim_snprintf((char *)buf, sizeof(buf), "<buffer> %s", kp[i].from);
zeertzjq44068e92022-06-16 11:14:55 +01002386 (void)do_map(MAPTYPE_UNMAP, buf, MODE_LANGMAP, FALSE);
Bram Moolenaar071d4272004-06-13 20:20:40 +00002387 }
Bram Moolenaar50138322018-01-28 17:05:16 +01002388 keymap_clear(&curbuf->b_kmap_ga);
Bram Moolenaar071d4272004-06-13 20:20:40 +00002389
2390 p_cpo = save_cpo;
2391
2392 ga_clear(&curbuf->b_kmap_ga);
2393 curbuf->b_kmap_state &= ~KEYMAP_LOADED;
Bram Moolenaar071d4272004-06-13 20:20:40 +00002394 status_redraw_curbuf();
Bram Moolenaar071d4272004-06-13 20:20:40 +00002395}
2396
Bram Moolenaar50138322018-01-28 17:05:16 +01002397 void
2398keymap_clear(garray_T *kmap)
2399{
2400 int i;
2401 kmap_T *kp = (kmap_T *)kmap->ga_data;
2402
2403 for (i = 0; i < kmap->ga_len; ++i)
2404 {
2405 vim_free(kp[i].from);
2406 vim_free(kp[i].to);
2407 }
2408}
Bram Moolenaar5d18efe2019-12-01 21:11:22 +01002409#endif // FEAT_KEYMAP