blob: 1b30e0fed52b2a248b5fa3b2ffef3be5f4de5b91 [file] [log] [blame]
Bram Moolenaaredf3f972016-08-29 22:49:24 +02001/* vi:set ts=8 sts=4 sw=4 noet:
Bram Moolenaar071d4272004-06-13 20:20:40 +00002 *
3 * VIM - Vi IMproved by Bram Moolenaar
4 *
5 * Do ":help uganda" in Vim to read copying and usage conditions.
6 * Do ":help credits" in Vim to see a list of people who contributed.
7 * See README.txt for an overview of the Vim source code.
8 */
9
10/*
11 * fileio.c: read from and write to a file
12 */
13
Bram Moolenaar071d4272004-06-13 20:20:40 +000014#include "vim.h"
15
Bram Moolenaare3f915d2020-07-14 23:02:44 +020016#if defined(__TANDEM)
Bram Moolenaar217e1b82019-12-01 21:41:28 +010017# include <limits.h> // for SSIZE_MAX
Bram Moolenaar071d4272004-06-13 20:20:40 +000018#endif
Bram Moolenaar82c38fe2021-01-04 10:47:26 +010019#if (defined(UNIX) || defined(VMS)) && defined(FEAT_EVAL)
Bram Moolenaar6c9ba042020-06-01 16:09:41 +020020# include <pwd.h>
21# include <grp.h>
22#endif
Bram Moolenaar82c38fe2021-01-04 10:47:26 +010023#if defined(VMS) && defined(HAVE_XOS_R_H)
24# include <x11/xos_r.h>
25#endif
Bram Moolenaar071d4272004-06-13 20:20:40 +000026
Bram Moolenaar217e1b82019-12-01 21:41:28 +010027// Is there any system that doesn't have access()?
Bram Moolenaar9372a112005-12-06 19:59:18 +000028#define USE_MCH_ACCESS
Bram Moolenaar071d4272004-06-13 20:20:40 +000029
Bram Moolenaar9d8bfae2020-09-02 21:21:35 +020030#if defined(__hpux) && !defined(HAVE_DIRFD)
31# define dirfd(x) ((x)->__dd_fd)
32# define HAVE_DIRFD
33#endif
34
Bram Moolenaarf077db22019-08-13 00:18:24 +020035static char_u *next_fenc(char_u **pp, int *alloced);
Bram Moolenaar13505972019-01-24 15:04:48 +010036#ifdef FEAT_EVAL
Bram Moolenaard25c16e2016-01-29 22:13:30 +010037static char_u *readfile_charconvert(char_u *fname, char_u *fenc, int *fdp);
Bram Moolenaar071d4272004-06-13 20:20:40 +000038#endif
Bram Moolenaar071d4272004-06-13 20:20:40 +000039#ifdef FEAT_CRYPT
Bram Moolenaar8767f522016-07-01 17:17:39 +020040static char_u *check_for_cryptkey(char_u *cryptkey, char_u *ptr, long *sizep, off_T *filesizep, int newfile, char_u *fname, int *did_ask);
Bram Moolenaar071d4272004-06-13 20:20:40 +000041#endif
Bram Moolenaard25c16e2016-01-29 22:13:30 +010042static linenr_T readfile_linenr(linenr_T linecnt, char_u *p, char_u *endp);
Bram Moolenaard25c16e2016-01-29 22:13:30 +010043static char_u *check_for_bom(char_u *p, long size, int *lenp, int flags);
Bram Moolenaarb0bf8582005-12-13 20:02:15 +000044
Bram Moolenaar84cf6bd2020-06-16 20:03:43 +020045#ifdef FEAT_EVAL
46static int readdirex_sort;
47#endif
48
Bram Moolenaar473952e2019-09-28 16:30:04 +020049 void
Bram Moolenaar78c0b7d2016-01-30 15:52:46 +010050filemess(
51 buf_T *buf,
52 char_u *name,
53 char_u *s,
54 int attr)
Bram Moolenaar071d4272004-06-13 20:20:40 +000055{
56 int msg_scroll_save;
Bram Moolenaar473952e2019-09-28 16:30:04 +020057 int prev_msg_col = msg_col;
Bram Moolenaar071d4272004-06-13 20:20:40 +000058
59 if (msg_silent != 0)
60 return;
Bram Moolenaar217e1b82019-12-01 21:41:28 +010061 msg_add_fname(buf, name); // put file name in IObuff with quotes
Bram Moolenaar6378b212020-06-29 21:32:06 +020062
Bram Moolenaar217e1b82019-12-01 21:41:28 +010063 // If it's extremely long, truncate it.
Bram Moolenaar6378b212020-06-29 21:32:06 +020064 if (STRLEN(IObuff) > IOSIZE - 100)
65 IObuff[IOSIZE - 100] = NUL;
66
67 // Avoid an over-long translation to cause trouble.
68 STRNCAT(IObuff, s, 99);
69
Bram Moolenaar071d4272004-06-13 20:20:40 +000070 /*
71 * For the first message may have to start a new line.
72 * For further ones overwrite the previous one, reset msg_scroll before
73 * calling filemess().
74 */
75 msg_scroll_save = msg_scroll;
76 if (shortmess(SHM_OVERALL) && !exiting && p_verbose == 0)
77 msg_scroll = FALSE;
Bram Moolenaar217e1b82019-12-01 21:41:28 +010078 if (!msg_scroll) // wait a bit when overwriting an error msg
Bram Moolenaar071d4272004-06-13 20:20:40 +000079 check_for_delay(FALSE);
80 msg_start();
Bram Moolenaar473952e2019-09-28 16:30:04 +020081 if (prev_msg_col != 0 && msg_col == 0)
82 msg_putchar('\r'); // overwrite any previous message.
Bram Moolenaar071d4272004-06-13 20:20:40 +000083 msg_scroll = msg_scroll_save;
84 msg_scrolled_ign = TRUE;
Bram Moolenaar217e1b82019-12-01 21:41:28 +010085 // may truncate the message to avoid a hit-return prompt
Bram Moolenaar071d4272004-06-13 20:20:40 +000086 msg_outtrans_attr(msg_may_trunc(FALSE, IObuff), attr);
87 msg_clr_eos();
88 out_flush();
89 msg_scrolled_ign = FALSE;
90}
91
/*
 * Read lines from file "fname" into the buffer after line "from".
 *
 * 1. We allocate blocks with lalloc, as big as possible.
 * 2. Each block is filled with characters from the file with a single read().
 * 3. The lines are inserted in the buffer with ml_append().
 *
 * (caller must check that fname != NULL, unless READ_STDIN is used)
 *
 * "lines_to_skip" is the number of lines that must be skipped.
 * "lines_to_read" is the number of lines that are appended.
 * When not recovering, lines_to_skip is 0 and lines_to_read is MAXLNUM.
 *
 * flags:
 * READ_NEW	starting to edit a new buffer
 * READ_FILTER	reading filter output
 * READ_STDIN	read from stdin instead of a file
 * READ_BUFFER	read from curbuf instead of a file (converting after reading
 *		stdin)
 * READ_NOFILE	do not read a file, only trigger BufReadCmd
 * READ_DUMMY	read into a dummy buffer (to check if file contents changed)
 * READ_KEEP_UNDO  don't clear undo info or read it from a file
 * READ_FIFO	read from fifo/socket instead of a file
 *
 * Return FAIL for failure, NOTDONE for directory (failure), or OK.
 */
118 int
Bram Moolenaar78c0b7d2016-01-30 15:52:46 +0100119readfile(
120 char_u *fname,
121 char_u *sfname,
122 linenr_T from,
123 linenr_T lines_to_skip,
124 linenr_T lines_to_read,
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100125 exarg_T *eap, // can be NULL!
Bram Moolenaar78c0b7d2016-01-30 15:52:46 +0100126 int flags)
Bram Moolenaar071d4272004-06-13 20:20:40 +0000127{
128 int fd = 0;
129 int newfile = (flags & READ_NEW);
130 int check_readonly;
131 int filtering = (flags & READ_FILTER);
132 int read_stdin = (flags & READ_STDIN);
133 int read_buffer = (flags & READ_BUFFER);
Bram Moolenaarf71d7b92016-08-09 22:14:05 +0200134 int read_fifo = (flags & READ_FIFO);
Bram Moolenaar690ffc02008-01-04 15:31:21 +0000135 int set_options = newfile || read_buffer
136 || (eap != NULL && eap->read_edit);
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100137 linenr_T read_buf_lnum = 1; // next line to read from curbuf
138 colnr_T read_buf_col = 0; // next char to read from this line
Bram Moolenaar071d4272004-06-13 20:20:40 +0000139 char_u c;
140 linenr_T lnum = from;
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100141 char_u *ptr = NULL; // pointer into read buffer
142 char_u *buffer = NULL; // read buffer
143 char_u *new_buffer = NULL; // init to shut up gcc
144 char_u *line_start = NULL; // init to shut up gcc
145 int wasempty; // buffer was empty before reading
Bram Moolenaar071d4272004-06-13 20:20:40 +0000146 colnr_T len;
147 long size = 0;
148 char_u *p;
Bram Moolenaar8767f522016-07-01 17:17:39 +0200149 off_T filesize = 0;
Bram Moolenaar071d4272004-06-13 20:20:40 +0000150 int skip_read = FALSE;
Christian Brabandtf573c6e2021-06-20 14:02:16 +0200151 off_T filesize_disk = 0; // file size read from disk
152 off_T filesize_count = 0; // counter
Bram Moolenaar071d4272004-06-13 20:20:40 +0000153#ifdef FEAT_CRYPT
154 char_u *cryptkey = NULL;
Bram Moolenaarf50a2532010-05-21 15:36:08 +0200155 int did_ask_for_key = FALSE;
Bram Moolenaar071d4272004-06-13 20:20:40 +0000156#endif
Bram Moolenaar55debbe2010-05-23 23:34:36 +0200157#ifdef FEAT_PERSISTENT_UNDO
158 context_sha256_T sha_ctx;
159 int read_undo_file = FALSE;
160#endif
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100161 int split = 0; // number of split lines
162#define UNKNOWN 0x0fffffff // file size is unknown
Bram Moolenaar071d4272004-06-13 20:20:40 +0000163 linenr_T linecnt;
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100164 int error = FALSE; // errors encountered
165 int ff_error = EOL_UNKNOWN; // file format with errors
166 long linerest = 0; // remaining chars in line
Bram Moolenaar071d4272004-06-13 20:20:40 +0000167#ifdef UNIX
168 int perm = 0;
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100169 int swap_mode = -1; // protection bits for swap file
Bram Moolenaar071d4272004-06-13 20:20:40 +0000170#else
171 int perm;
172#endif
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100173 int fileformat = 0; // end-of-line format
Bram Moolenaar071d4272004-06-13 20:20:40 +0000174 int keep_fileformat = FALSE;
Bram Moolenaar8767f522016-07-01 17:17:39 +0200175 stat_T st;
Bram Moolenaar071d4272004-06-13 20:20:40 +0000176 int file_readonly;
177 linenr_T skip_count = 0;
178 linenr_T read_count = 0;
179 int msg_save = msg_scroll;
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100180 linenr_T read_no_eol_lnum = 0; // non-zero lnum when last line of
181 // last read was missing the eol
Bram Moolenaar7a2699e2017-01-23 21:31:09 +0100182 int try_mac;
183 int try_dos;
184 int try_unix;
Bram Moolenaar071d4272004-06-13 20:20:40 +0000185 int file_rewind = FALSE;
Bram Moolenaar071d4272004-06-13 20:20:40 +0000186 int can_retry;
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100187 linenr_T conv_error = 0; // line nr with conversion error
188 linenr_T illegal_byte = 0; // line nr with illegal byte
189 int keep_dest_enc = FALSE; // don't retry when char doesn't fit
190 // in destination encoding
Bram Moolenaarb0bf8582005-12-13 20:02:15 +0000191 int bad_char_behavior = BAD_REPLACE;
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100192 // BAD_KEEP, BAD_DROP or character to
193 // replace with
194 char_u *tmpname = NULL; // name of 'charconvert' output file
Bram Moolenaar071d4272004-06-13 20:20:40 +0000195 int fio_flags = 0;
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100196 char_u *fenc; // fileencoding to use
197 int fenc_alloced; // fenc_next is in allocated memory
198 char_u *fenc_next = NULL; // next item in 'fencs' or NULL
Bram Moolenaar071d4272004-06-13 20:20:40 +0000199 int advance_fenc = FALSE;
200 long real_size = 0;
Bram Moolenaar13505972019-01-24 15:04:48 +0100201#ifdef USE_ICONV
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100202 iconv_t iconv_fd = (iconv_t)-1; // descriptor for iconv() or -1
Bram Moolenaar13505972019-01-24 15:04:48 +0100203# ifdef FEAT_EVAL
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100204 int did_iconv = FALSE; // TRUE when iconv() failed and trying
205 // 'charconvert' next
Bram Moolenaar071d4272004-06-13 20:20:40 +0000206# endif
Bram Moolenaar13505972019-01-24 15:04:48 +0100207#endif
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100208 int converted = FALSE; // TRUE if conversion done
209 int notconverted = FALSE; // TRUE if conversion wanted but it
210 // wasn't possible
Bram Moolenaar071d4272004-06-13 20:20:40 +0000211 char_u conv_rest[CONV_RESTLEN];
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100212 int conv_restlen = 0; // nr of bytes in conv_rest[]
Bram Moolenaarf4a1d1c2019-11-16 13:50:25 +0100213 pos_T orig_start;
Bram Moolenaarbb3d5dc2010-08-14 14:32:54 +0200214 buf_T *old_curbuf;
215 char_u *old_b_ffname;
216 char_u *old_b_fname;
217 int using_b_ffname;
218 int using_b_fname;
Bram Moolenaarc8fe6452020-10-03 17:04:37 +0200219 static char *msg_is_a_directory = N_("is a directory");
Bram Moolenaar6ed545e2022-05-09 20:09:23 +0100220 int eof;
Bram Moolenaarbb3d5dc2010-08-14 14:32:54 +0200221
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100222 au_did_filetype = FALSE; // reset before triggering any autocommands
Bram Moolenaarc3691332016-04-20 12:49:49 +0200223
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100224 curbuf->b_no_eol_lnum = 0; // in case it was set by the previous read
Bram Moolenaar071d4272004-06-13 20:20:40 +0000225
226 /*
227 * If there is no file name yet, use the one for the read file.
228 * BF_NOTEDITED is set to reflect this.
229 * Don't do this for a read from a filter.
230 * Only do this when 'cpoptions' contains the 'f' flag.
231 */
232 if (curbuf->b_ffname == NULL
233 && !filtering
234 && fname != NULL
235 && vim_strchr(p_cpo, CPO_FNAMER) != NULL
236 && !(flags & READ_DUMMY))
237 {
Bram Moolenaar2d3f4892006-01-20 23:02:51 +0000238 if (set_rw_fname(fname, sfname) == FAIL)
239 return FAIL;
Bram Moolenaar071d4272004-06-13 20:20:40 +0000240 }
241
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100242 // Remember the initial values of curbuf, curbuf->b_ffname and
243 // curbuf->b_fname to detect whether they are altered as a result of
244 // executing nasty autocommands. Also check if "fname" and "sfname"
245 // point to one of these values.
Bram Moolenaarbb3d5dc2010-08-14 14:32:54 +0200246 old_curbuf = curbuf;
247 old_b_ffname = curbuf->b_ffname;
248 old_b_fname = curbuf->b_fname;
249 using_b_ffname = (fname == curbuf->b_ffname)
250 || (sfname == curbuf->b_ffname);
251 using_b_fname = (fname == curbuf->b_fname) || (sfname == curbuf->b_fname);
Bram Moolenaarbb3d5dc2010-08-14 14:32:54 +0200252
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100253 // After reading a file the cursor line changes but we don't want to
254 // display the line.
Bram Moolenaardf177f62005-02-22 08:39:57 +0000255 ex_no_reprint = TRUE;
256
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100257 // don't display the file info for another buffer now
Bram Moolenaar55b7cf82006-09-09 12:52:42 +0000258 need_fileinfo = FALSE;
259
Bram Moolenaar071d4272004-06-13 20:20:40 +0000260 /*
261 * For Unix: Use the short file name whenever possible.
262 * Avoids problems with networks and when directory names are changed.
263 * Don't do this for MS-DOS, a "cd" in a sub-shell may have moved us to
264 * another directory, which we don't detect.
265 */
266 if (sfname == NULL)
267 sfname = fname;
Bram Moolenaara06ecab2016-07-16 14:47:36 +0200268#if defined(UNIX)
Bram Moolenaar071d4272004-06-13 20:20:40 +0000269 fname = sfname;
270#endif
271
Bram Moolenaar071d4272004-06-13 20:20:40 +0000272 /*
273 * The BufReadCmd and FileReadCmd events intercept the reading process by
274 * executing the associated commands instead.
275 */
276 if (!filtering && !read_stdin && !read_buffer)
277 {
Bram Moolenaarf4a1d1c2019-11-16 13:50:25 +0100278 orig_start = curbuf->b_op_start;
Bram Moolenaar071d4272004-06-13 20:20:40 +0000279
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100280 // Set '[ mark to the line above where the lines go (line 1 if zero).
Bram Moolenaar071d4272004-06-13 20:20:40 +0000281 curbuf->b_op_start.lnum = ((from == 0) ? 1 : from);
282 curbuf->b_op_start.col = 0;
283
284 if (newfile)
285 {
286 if (apply_autocmds_exarg(EVENT_BUFREADCMD, NULL, sfname,
287 FALSE, curbuf, eap))
Bram Moolenaar0fff4412020-03-29 16:06:29 +0200288 {
289 int status = OK;
Bram Moolenaar071d4272004-06-13 20:20:40 +0000290#ifdef FEAT_EVAL
Bram Moolenaar0fff4412020-03-29 16:06:29 +0200291 if (aborting())
292 status = FAIL;
Bram Moolenaar071d4272004-06-13 20:20:40 +0000293#endif
Bram Moolenaar0fff4412020-03-29 16:06:29 +0200294 // The BufReadCmd code usually uses ":read" to get the text and
295 // perhaps ":file" to change the buffer name. But we should
296 // consider this to work like ":edit", thus reset the
297 // BF_NOTEDITED flag. Then ":write" will work to overwrite the
298 // same file.
299 if (status == OK)
300 curbuf->b_flags &= ~BF_NOTEDITED;
301 return status;
302 }
Bram Moolenaar071d4272004-06-13 20:20:40 +0000303 }
304 else if (apply_autocmds_exarg(EVENT_FILEREADCMD, sfname, sfname,
305 FALSE, NULL, eap))
306#ifdef FEAT_EVAL
307 return aborting() ? FAIL : OK;
308#else
309 return OK;
310#endif
311
Bram Moolenaarf4a1d1c2019-11-16 13:50:25 +0100312 curbuf->b_op_start = orig_start;
Bram Moolenaarb1d2c812022-08-26 11:55:01 +0100313
314 if (flags & READ_NOFILE)
315 return FAIL;
Bram Moolenaar071d4272004-06-13 20:20:40 +0000316 }
Bram Moolenaar071d4272004-06-13 20:20:40 +0000317
318 if ((shortmess(SHM_OVER) || curbuf->b_help) && p_verbose == 0)
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100319 msg_scroll = FALSE; // overwrite previous file message
Bram Moolenaar071d4272004-06-13 20:20:40 +0000320 else
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100321 msg_scroll = TRUE; // don't overwrite previous file message
Bram Moolenaar071d4272004-06-13 20:20:40 +0000322
Bram Moolenaar15d0a8c2004-09-06 17:44:46 +0000323 if (fname != NULL && *fname != NUL)
Bram Moolenaar071d4272004-06-13 20:20:40 +0000324 {
Bram Moolenaarc8fe6452020-10-03 17:04:37 +0200325 size_t namelen = STRLEN(fname);
326
327 // If the name is too long we might crash further on, quit here.
328 if (namelen >= MAXPATHL)
Bram Moolenaar15d0a8c2004-09-06 17:44:46 +0000329 {
330 filemess(curbuf, fname, (char_u *)_("Illegal file name"), 0);
331 msg_end();
332 msg_scroll = msg_save;
333 return FAIL;
334 }
Bram Moolenaarc8fe6452020-10-03 17:04:37 +0200335
336 // If the name ends in a path separator, we can't open it. Check here,
337 // because reading the file may actually work, but then creating the
338 // swap file may destroy it! Reported on MS-DOS and Win 95.
339 if (after_pathsep(fname, fname + namelen))
340 {
341 filemess(curbuf, fname, (char_u *)_(msg_is_a_directory), 0);
342 msg_end();
343 msg_scroll = msg_save;
Bram Moolenaar40fa12a2021-09-22 14:18:13 +0200344 return NOTDONE;
Bram Moolenaarc8fe6452020-10-03 17:04:37 +0200345 }
Bram Moolenaar071d4272004-06-13 20:20:40 +0000346 }
347
Bram Moolenaarf71d7b92016-08-09 22:14:05 +0200348 if (!read_stdin && !read_buffer && !read_fifo)
Bram Moolenaar071d4272004-06-13 20:20:40 +0000349 {
Bram Moolenaar82c38fe2021-01-04 10:47:26 +0100350#if defined(UNIX) || defined(VMS)
Bram Moolenaar4e4f5292013-08-30 17:07:01 +0200351 /*
352 * On Unix it is possible to read a directory, so we have to
353 * check for it before the mch_open().
354 */
Bram Moolenaar071d4272004-06-13 20:20:40 +0000355 perm = mch_getperm(fname);
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100356 if (perm >= 0 && !S_ISREG(perm) // not a regular file ...
357 && !S_ISFIFO(perm) // ... or fifo
358 && !S_ISSOCK(perm) // ... or socket
Bram Moolenaarfe1c56d2007-07-10 15:10:54 +0000359# ifdef OPEN_CHR_FILES
360 && !(S_ISCHR(perm) && is_dev_fd_file(fname))
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100361 // ... or a character special file named /dev/fd/<n>
Bram Moolenaarfe1c56d2007-07-10 15:10:54 +0000362# endif
Bram Moolenaar071d4272004-06-13 20:20:40 +0000363 )
364 {
Bram Moolenaare13b9af2017-01-13 22:01:02 +0100365 int retval = FAIL;
366
Bram Moolenaar071d4272004-06-13 20:20:40 +0000367 if (S_ISDIR(perm))
Bram Moolenaare13b9af2017-01-13 22:01:02 +0100368 {
Bram Moolenaarc8fe6452020-10-03 17:04:37 +0200369 filemess(curbuf, fname, (char_u *)_(msg_is_a_directory), 0);
Bram Moolenaare13b9af2017-01-13 22:01:02 +0100370 retval = NOTDONE;
371 }
Bram Moolenaar071d4272004-06-13 20:20:40 +0000372 else
373 filemess(curbuf, fname, (char_u *)_("is not a file"), 0);
374 msg_end();
375 msg_scroll = msg_save;
Bram Moolenaare13b9af2017-01-13 22:01:02 +0100376 return retval;
Bram Moolenaar071d4272004-06-13 20:20:40 +0000377 }
Bram Moolenaar4e4f5292013-08-30 17:07:01 +0200378#endif
Bram Moolenaar48e330a2016-02-23 14:53:34 +0100379#if defined(MSWIN)
Bram Moolenaarc67764a2006-10-12 19:14:26 +0000380 /*
381 * MS-Windows allows opening a device, but we will probably get stuck
382 * trying to read it.
383 */
384 if (!p_odev && mch_nodetype(fname) == NODE_WRITABLE)
385 {
Bram Moolenaar5386a122007-06-28 20:02:32 +0000386 filemess(curbuf, fname, (char_u *)_("is a device (disabled with 'opendevice' option)"), 0);
Bram Moolenaarc67764a2006-10-12 19:14:26 +0000387 msg_end();
388 msg_scroll = msg_save;
389 return FAIL;
390 }
Bram Moolenaar043545e2006-10-10 16:44:07 +0000391#endif
Bram Moolenaar4e4f5292013-08-30 17:07:01 +0200392 }
Bram Moolenaar043545e2006-10-10 16:44:07 +0000393
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100394 // Set default or forced 'fileformat' and 'binary'.
Bram Moolenaarad875fb2013-07-24 15:02:03 +0200395 set_file_options(set_options, eap);
Bram Moolenaar071d4272004-06-13 20:20:40 +0000396
397 /*
398 * When opening a new file we take the readonly flag from the file.
399 * Default is r/w, can be set to r/o below.
400 * Don't reset it when in readonly mode
401 * Only set/reset b_p_ro when BF_CHECK_RO is set.
402 */
403 check_readonly = (newfile && (curbuf->b_flags & BF_CHECK_RO));
Bram Moolenaar4399ef42005-02-12 14:29:27 +0000404 if (check_readonly && !readonlymode)
Bram Moolenaar071d4272004-06-13 20:20:40 +0000405 curbuf->b_p_ro = FALSE;
406
Bram Moolenaarf71d7b92016-08-09 22:14:05 +0200407 if (newfile && !read_stdin && !read_buffer && !read_fifo)
Bram Moolenaar071d4272004-06-13 20:20:40 +0000408 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100409 // Remember time of file.
Bram Moolenaar071d4272004-06-13 20:20:40 +0000410 if (mch_stat((char *)fname, &st) >= 0)
411 {
412 buf_store_time(curbuf, &st, fname);
413 curbuf->b_mtime_read = curbuf->b_mtime;
Leah Neukirchen0a7984a2021-10-14 21:27:55 +0100414 curbuf->b_mtime_read_ns = curbuf->b_mtime_ns;
Christian Brabandtf573c6e2021-06-20 14:02:16 +0200415 filesize_disk = st.st_size;
Bram Moolenaar071d4272004-06-13 20:20:40 +0000416#ifdef UNIX
417 /*
418 * Use the protection bits of the original file for the swap file.
419 * This makes it possible for others to read the name of the
420 * edited file from the swapfile, but only if they can read the
421 * edited file.
422 * Remove the "write" and "execute" bits for group and others
423 * (they must not write the swapfile).
424 * Add the "read" and "write" bits for the user, otherwise we may
425 * not be able to write to the file ourselves.
426 * Setting the bits is done below, after creating the swap file.
427 */
428 swap_mode = (st.st_mode & 0644) | 0600;
429#endif
Bram Moolenaar071d4272004-06-13 20:20:40 +0000430#ifdef VMS
431 curbuf->b_fab_rfm = st.st_fab_rfm;
Bram Moolenaard4755bb2004-09-02 19:12:26 +0000432 curbuf->b_fab_rat = st.st_fab_rat;
433 curbuf->b_fab_mrs = st.st_fab_mrs;
Bram Moolenaar071d4272004-06-13 20:20:40 +0000434#endif
435 }
436 else
437 {
438 curbuf->b_mtime = 0;
Leah Neukirchen0a7984a2021-10-14 21:27:55 +0100439 curbuf->b_mtime_ns = 0;
Bram Moolenaar071d4272004-06-13 20:20:40 +0000440 curbuf->b_mtime_read = 0;
Leah Neukirchen0a7984a2021-10-14 21:27:55 +0100441 curbuf->b_mtime_read_ns = 0;
Bram Moolenaar071d4272004-06-13 20:20:40 +0000442 curbuf->b_orig_size = 0;
443 curbuf->b_orig_mode = 0;
444 }
445
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100446 // Reset the "new file" flag. It will be set again below when the
447 // file doesn't exist.
Bram Moolenaar071d4272004-06-13 20:20:40 +0000448 curbuf->b_flags &= ~(BF_NEW | BF_NEW_W);
449 }
450
451/*
452 * for UNIX: check readonly with perm and mch_access()
Bram Moolenaar48e330a2016-02-23 14:53:34 +0100453 * for Amiga: check readonly by trying to open the file for writing
Bram Moolenaar071d4272004-06-13 20:20:40 +0000454 */
455 file_readonly = FALSE;
456 if (read_stdin)
457 {
Bram Moolenaar48e330a2016-02-23 14:53:34 +0100458#if defined(MSWIN)
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100459 // Force binary I/O on stdin to avoid CR-LF -> LF conversion.
Bram Moolenaar071d4272004-06-13 20:20:40 +0000460 setmode(0, O_BINARY);
461#endif
462 }
463 else if (!read_buffer)
464 {
465#ifdef USE_MCH_ACCESS
466 if (
467# ifdef UNIX
468 !(perm & 0222) ||
469# endif
470 mch_access((char *)fname, W_OK))
471 file_readonly = TRUE;
472 fd = mch_open((char *)fname, O_RDONLY | O_EXTRA, 0);
473#else
474 if (!newfile
475 || readonlymode
476 || (fd = mch_open((char *)fname, O_RDWR | O_EXTRA, 0)) < 0)
477 {
478 file_readonly = TRUE;
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100479 // try to open ro
Bram Moolenaar071d4272004-06-13 20:20:40 +0000480 fd = mch_open((char *)fname, O_RDONLY | O_EXTRA, 0);
481 }
482#endif
483 }
484
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100485 if (fd < 0) // cannot open at all
Bram Moolenaar071d4272004-06-13 20:20:40 +0000486 {
487#ifndef UNIX
488 int isdir_f;
489#endif
490 msg_scroll = msg_save;
491#ifndef UNIX
492 /*
Bram Moolenaar48e330a2016-02-23 14:53:34 +0100493 * On Amiga we can't open a directory, check here.
Bram Moolenaar071d4272004-06-13 20:20:40 +0000494 */
495 isdir_f = (mch_isdir(fname));
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100496 perm = mch_getperm(fname); // check if the file exists
Bram Moolenaar071d4272004-06-13 20:20:40 +0000497 if (isdir_f)
498 {
Bram Moolenaarc8fe6452020-10-03 17:04:37 +0200499 filemess(curbuf, sfname, (char_u *)_(msg_is_a_directory), 0);
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100500 curbuf->b_p_ro = TRUE; // must use "w!" now
Bram Moolenaar071d4272004-06-13 20:20:40 +0000501 }
502 else
503#endif
504 if (newfile)
505 {
Bram Moolenaar2efbc662010-05-14 18:56:38 +0200506 if (perm < 0
507#ifdef ENOENT
508 && errno == ENOENT
509#endif
510 )
Bram Moolenaar071d4272004-06-13 20:20:40 +0000511 {
512 /*
513 * Set the 'new-file' flag, so that when the file has
514 * been created by someone else, a ":w" will complain.
515 */
516 curbuf->b_flags |= BF_NEW;
517
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100518 // Create a swap file now, so that other Vims are warned
519 // that we are editing this file. Don't do this for a
520 // "nofile" or "nowrite" buffer type.
Bram Moolenaar071d4272004-06-13 20:20:40 +0000521 if (!bt_dontwrite(curbuf))
Bram Moolenaarbf1b7a72009-03-05 02:15:53 +0000522 {
Bram Moolenaar071d4272004-06-13 20:20:40 +0000523 check_need_swap(newfile);
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100524 // SwapExists autocommand may mess things up
Bram Moolenaarbf1b7a72009-03-05 02:15:53 +0000525 if (curbuf != old_curbuf
526 || (using_b_ffname
527 && (old_b_ffname != curbuf->b_ffname))
528 || (using_b_fname
529 && (old_b_fname != curbuf->b_fname)))
530 {
Bram Moolenaar9d00e4a2022-01-05 17:49:15 +0000531 emsg(_(e_autocommands_changed_buffer_or_buffer_name));
Bram Moolenaarbf1b7a72009-03-05 02:15:53 +0000532 return FAIL;
533 }
Bram Moolenaarbf1b7a72009-03-05 02:15:53 +0000534 }
Bram Moolenaar5b962cf2005-12-12 21:58:40 +0000535 if (dir_of_file_exists(fname))
Bram Moolenaar722e5052020-06-12 22:31:00 +0200536 filemess(curbuf, sfname,
537 (char_u *)new_file_message(), 0);
Bram Moolenaar5b962cf2005-12-12 21:58:40 +0000538 else
539 filemess(curbuf, sfname,
540 (char_u *)_("[New DIRECTORY]"), 0);
Bram Moolenaar071d4272004-06-13 20:20:40 +0000541#ifdef FEAT_VIMINFO
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100542 // Even though this is a new file, it might have been
543 // edited before and deleted. Get the old marks.
Bram Moolenaar071d4272004-06-13 20:20:40 +0000544 check_marks_read();
545#endif
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100546 // Set forced 'fileencoding'.
Bram Moolenaarad875fb2013-07-24 15:02:03 +0200547 if (eap != NULL)
548 set_forced_fenc(eap);
Bram Moolenaar071d4272004-06-13 20:20:40 +0000549 apply_autocmds_exarg(EVENT_BUFNEWFILE, sfname, sfname,
550 FALSE, curbuf, eap);
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100551 // remember the current fileformat
Bram Moolenaar071d4272004-06-13 20:20:40 +0000552 save_file_ff(curbuf);
553
Bram Moolenaarf2bd8ef2018-03-04 18:08:14 +0100554#if defined(FEAT_EVAL)
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100555 if (aborting()) // autocmds may abort script processing
Bram Moolenaar071d4272004-06-13 20:20:40 +0000556 return FAIL;
557#endif
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100558 return OK; // a new file is not an error
Bram Moolenaar071d4272004-06-13 20:20:40 +0000559 }
560 else
561 {
Bram Moolenaar202795b2005-10-11 20:29:39 +0000562 filemess(curbuf, sfname, (char_u *)(
563# ifdef EFBIG
564 (errno == EFBIG) ? _("[File too big]") :
565# endif
Bram Moolenaar2efbc662010-05-14 18:56:38 +0200566# ifdef EOVERFLOW
567 (errno == EOVERFLOW) ? _("[File too big]") :
568# endif
Bram Moolenaar202795b2005-10-11 20:29:39 +0000569 _("[Permission Denied]")), 0);
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100570 curbuf->b_p_ro = TRUE; // must use "w!" now
Bram Moolenaar071d4272004-06-13 20:20:40 +0000571 }
572 }
573
574 return FAIL;
575 }
576
577 /*
578 * Only set the 'ro' flag for readonly files the first time they are
579 * loaded. Help files always get readonly mode
580 */
581 if ((check_readonly && file_readonly) || curbuf->b_help)
582 curbuf->b_p_ro = TRUE;
583
Bram Moolenaar910f66f2006-04-05 20:41:53 +0000584 if (set_options)
Bram Moolenaar071d4272004-06-13 20:20:40 +0000585 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100586 // Don't change 'eol' if reading from buffer as it will already be
587 // correctly set when reading stdin.
Bram Moolenaar690ffc02008-01-04 15:31:21 +0000588 if (!read_buffer)
589 {
590 curbuf->b_p_eol = TRUE;
591 curbuf->b_start_eol = TRUE;
592 }
Bram Moolenaar071d4272004-06-13 20:20:40 +0000593 curbuf->b_p_bomb = FALSE;
Bram Moolenaar83eb8852007-08-12 13:51:26 +0000594 curbuf->b_start_bomb = FALSE;
Bram Moolenaar071d4272004-06-13 20:20:40 +0000595 }
596
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100597 // Create a swap file now, so that other Vims are warned that we are
598 // editing this file.
599 // Don't do this for a "nofile" or "nowrite" buffer type.
Bram Moolenaar071d4272004-06-13 20:20:40 +0000600 if (!bt_dontwrite(curbuf))
Bram Moolenaar071d4272004-06-13 20:20:40 +0000601 {
602 check_need_swap(newfile);
Bram Moolenaarbf1b7a72009-03-05 02:15:53 +0000603 if (!read_stdin && (curbuf != old_curbuf
604 || (using_b_ffname && (old_b_ffname != curbuf->b_ffname))
605 || (using_b_fname && (old_b_fname != curbuf->b_fname))))
606 {
Bram Moolenaar9d00e4a2022-01-05 17:49:15 +0000607 emsg(_(e_autocommands_changed_buffer_or_buffer_name));
Bram Moolenaarbf1b7a72009-03-05 02:15:53 +0000608 if (!read_buffer)
609 close(fd);
610 return FAIL;
611 }
Bram Moolenaar071d4272004-06-13 20:20:40 +0000612#ifdef UNIX
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100613 // Set swap file protection bits after creating it.
Bram Moolenaarf061e0b2009-06-24 15:32:01 +0000614 if (swap_mode > 0 && curbuf->b_ml.ml_mfp != NULL
615 && curbuf->b_ml.ml_mfp->mf_fname != NULL)
Bram Moolenaar5a73e0c2017-11-04 21:35:01 +0100616 {
617 char_u *swap_fname = curbuf->b_ml.ml_mfp->mf_fname;
618
619 /*
620 * If the group-read bit is set but not the world-read bit, then
621 * the group must be equal to the group of the original file. If
622 * we can't make that happen then reset the group-read bit. This
623 * avoids making the swap file readable to more users when the
624 * primary group of the user is too permissive.
625 */
626 if ((swap_mode & 044) == 040)
627 {
628 stat_T swap_st;
629
630 if (mch_stat((char *)swap_fname, &swap_st) >= 0
631 && st.st_gid != swap_st.st_gid
Bram Moolenaar02e802b2018-04-19 21:15:27 +0200632# ifdef HAVE_FCHOWN
Bram Moolenaar5a73e0c2017-11-04 21:35:01 +0100633 && fchown(curbuf->b_ml.ml_mfp->mf_fd, -1, st.st_gid)
Bram Moolenaar02e802b2018-04-19 21:15:27 +0200634 == -1
Bram Moolenaar1f131ae2018-05-21 13:39:40 +0200635# endif
Bram Moolenaar02e802b2018-04-19 21:15:27 +0200636 )
Bram Moolenaar5a73e0c2017-11-04 21:35:01 +0100637 swap_mode &= 0600;
638 }
639
640 (void)mch_setperm(swap_fname, (long)swap_mode);
641 }
Bram Moolenaar071d4272004-06-13 20:20:40 +0000642#endif
643 }
644
Bram Moolenaar67cf86b2019-04-28 22:25:38 +0200645 // If "Quit" selected at ATTENTION dialog, don't load the file
Bram Moolenaar071d4272004-06-13 20:20:40 +0000646 if (swap_exists_action == SEA_QUIT)
647 {
648 if (!read_buffer && !read_stdin)
649 close(fd);
650 return FAIL;
651 }
Bram Moolenaar071d4272004-06-13 20:20:40 +0000652
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100653 ++no_wait_return; // don't wait for return yet
Bram Moolenaar071d4272004-06-13 20:20:40 +0000654
655 /*
656 * Set '[ mark to the line above where the lines go (line 1 if zero).
657 */
Bram Moolenaarf4a1d1c2019-11-16 13:50:25 +0100658 orig_start = curbuf->b_op_start;
Bram Moolenaar071d4272004-06-13 20:20:40 +0000659 curbuf->b_op_start.lnum = ((from == 0) ? 1 : from);
660 curbuf->b_op_start.col = 0;
661
Bram Moolenaar7a2699e2017-01-23 21:31:09 +0100662 try_mac = (vim_strchr(p_ffs, 'm') != NULL);
663 try_dos = (vim_strchr(p_ffs, 'd') != NULL);
664 try_unix = (vim_strchr(p_ffs, 'x') != NULL);
665
Bram Moolenaar071d4272004-06-13 20:20:40 +0000666 if (!read_buffer)
667 {
668 int m = msg_scroll;
669 int n = msg_scrolled;
Bram Moolenaar071d4272004-06-13 20:20:40 +0000670
671 /*
672 * The file must be closed again, the autocommands may want to change
673 * the file before reading it.
674 */
675 if (!read_stdin)
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100676 close(fd); // ignore errors
Bram Moolenaar071d4272004-06-13 20:20:40 +0000677
678 /*
679 * The output from the autocommands should not overwrite anything and
680 * should not be overwritten: Set msg_scroll, restore its value if no
681 * output was done.
682 */
683 msg_scroll = TRUE;
684 if (filtering)
685 apply_autocmds_exarg(EVENT_FILTERREADPRE, NULL, sfname,
686 FALSE, curbuf, eap);
687 else if (read_stdin)
688 apply_autocmds_exarg(EVENT_STDINREADPRE, NULL, sfname,
689 FALSE, curbuf, eap);
690 else if (newfile)
691 apply_autocmds_exarg(EVENT_BUFREADPRE, NULL, sfname,
692 FALSE, curbuf, eap);
693 else
694 apply_autocmds_exarg(EVENT_FILEREADPRE, sfname, sfname,
695 FALSE, NULL, eap);
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100696 // autocommands may have changed it
Bram Moolenaar7a2699e2017-01-23 21:31:09 +0100697 try_mac = (vim_strchr(p_ffs, 'm') != NULL);
698 try_dos = (vim_strchr(p_ffs, 'd') != NULL);
699 try_unix = (vim_strchr(p_ffs, 'x') != NULL);
Bram Moolenaarf4a1d1c2019-11-16 13:50:25 +0100700 curbuf->b_op_start = orig_start;
Bram Moolenaar7a2699e2017-01-23 21:31:09 +0100701
Bram Moolenaar071d4272004-06-13 20:20:40 +0000702 if (msg_scrolled == n)
703 msg_scroll = m;
704
705#ifdef FEAT_EVAL
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100706 if (aborting()) // autocmds may abort script processing
Bram Moolenaar071d4272004-06-13 20:20:40 +0000707 {
708 --no_wait_return;
709 msg_scroll = msg_save;
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100710 curbuf->b_p_ro = TRUE; // must use "w!" now
Bram Moolenaar071d4272004-06-13 20:20:40 +0000711 return FAIL;
712 }
713#endif
714 /*
715 * Don't allow the autocommands to change the current buffer.
716 * Try to re-open the file.
Bram Moolenaarbf1b7a72009-03-05 02:15:53 +0000717 *
718 * Don't allow the autocommands to change the buffer name either
719 * (cd for example) if it invalidates fname or sfname.
Bram Moolenaar071d4272004-06-13 20:20:40 +0000720 */
721 if (!read_stdin && (curbuf != old_curbuf
Bram Moolenaarbf1b7a72009-03-05 02:15:53 +0000722 || (using_b_ffname && (old_b_ffname != curbuf->b_ffname))
723 || (using_b_fname && (old_b_fname != curbuf->b_fname))
Bram Moolenaar071d4272004-06-13 20:20:40 +0000724 || (fd = mch_open((char *)fname, O_RDONLY | O_EXTRA, 0)) < 0))
725 {
726 --no_wait_return;
727 msg_scroll = msg_save;
728 if (fd < 0)
Bram Moolenaar6d057012021-12-31 18:49:43 +0000729 emsg(_(e_readpre_autocommands_made_file_unreadable));
Bram Moolenaar071d4272004-06-13 20:20:40 +0000730 else
Bram Moolenaar6d057012021-12-31 18:49:43 +0000731 emsg(_(e_readpre_autocommands_must_not_change_current_buffer));
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100732 curbuf->b_p_ro = TRUE; // must use "w!" now
Bram Moolenaar071d4272004-06-13 20:20:40 +0000733 return FAIL;
734 }
735 }
Bram Moolenaar071d4272004-06-13 20:20:40 +0000736
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100737 // Autocommands may add lines to the file, need to check if it is empty
Bram Moolenaar071d4272004-06-13 20:20:40 +0000738 wasempty = (curbuf->b_ml.ml_flags & ML_EMPTY);
739
740 if (!recoverymode && !filtering && !(flags & READ_DUMMY))
741 {
742 /*
743 * Show the user that we are busy reading the input. Sometimes this
744 * may take a while. When reading from stdin another program may
745 * still be running, don't move the cursor to the last line, unless
746 * always using the GUI.
747 */
748 if (read_stdin)
749 {
Bram Moolenaar234d1622017-11-18 14:55:23 +0100750 if (!is_not_a_term())
751 {
Bram Moolenaar071d4272004-06-13 20:20:40 +0000752#ifndef ALWAYS_USE_GUI
Bram Moolenaarafde13b2019-04-28 19:46:49 +0200753# ifdef VIMDLL
754 if (!gui.in_use)
755# endif
756 mch_msg(_("Vim: Reading from stdin...\n"));
Bram Moolenaar071d4272004-06-13 20:20:40 +0000757#endif
758#ifdef FEAT_GUI
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100759 // Also write a message in the GUI window, if there is one.
Bram Moolenaar234d1622017-11-18 14:55:23 +0100760 if (gui.in_use && !gui.dying && !gui.starting)
761 {
Amon Sha10197932022-02-21 15:07:12 +0000762 // make a copy, gui_write() may try to change it
763 p = vim_strsave((char_u *)_("Reading from stdin..."));
764 if (p != NULL)
765 {
766 gui_write(p, (int)STRLEN(p));
767 vim_free(p);
768 }
Bram Moolenaar234d1622017-11-18 14:55:23 +0100769 }
Bram Moolenaar071d4272004-06-13 20:20:40 +0000770#endif
Bram Moolenaar234d1622017-11-18 14:55:23 +0100771 }
Bram Moolenaar071d4272004-06-13 20:20:40 +0000772 }
773 else if (!read_buffer)
774 filemess(curbuf, sfname, (char_u *)"", 0);
775 }
776
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100777 msg_scroll = FALSE; // overwrite the file message
Bram Moolenaar071d4272004-06-13 20:20:40 +0000778
779 /*
780 * Set linecnt now, before the "retry" caused by a wrong guess for
781 * fileformat, and after the autocommands, which may change them.
782 */
783 linecnt = curbuf->b_ml.ml_line_count;
784
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100785 // "++bad=" argument.
Bram Moolenaarb0bf8582005-12-13 20:02:15 +0000786 if (eap != NULL && eap->bad_char != 0)
Bram Moolenaar195d6352005-12-19 22:08:24 +0000787 {
Bram Moolenaarb0bf8582005-12-13 20:02:15 +0000788 bad_char_behavior = eap->bad_char;
Bram Moolenaar910f66f2006-04-05 20:41:53 +0000789 if (set_options)
Bram Moolenaar195d6352005-12-19 22:08:24 +0000790 curbuf->b_bad_char = eap->bad_char;
791 }
792 else
793 curbuf->b_bad_char = 0;
Bram Moolenaarb0bf8582005-12-13 20:02:15 +0000794
Bram Moolenaar071d4272004-06-13 20:20:40 +0000795 /*
Bram Moolenaarb0bf8582005-12-13 20:02:15 +0000796 * Decide which 'encoding' to use or use first.
Bram Moolenaar071d4272004-06-13 20:20:40 +0000797 */
798 if (eap != NULL && eap->force_enc != 0)
799 {
800 fenc = enc_canonize(eap->cmd + eap->force_enc);
801 fenc_alloced = TRUE;
Bram Moolenaarb0bf8582005-12-13 20:02:15 +0000802 keep_dest_enc = TRUE;
Bram Moolenaar071d4272004-06-13 20:20:40 +0000803 }
804 else if (curbuf->b_p_bin)
805 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100806 fenc = (char_u *)""; // binary: don't convert
Bram Moolenaar071d4272004-06-13 20:20:40 +0000807 fenc_alloced = FALSE;
808 }
809 else if (curbuf->b_help)
810 {
811 char_u firstline[80];
Bram Moolenaar75c50c42005-06-04 22:06:24 +0000812 int fc;
Bram Moolenaar071d4272004-06-13 20:20:40 +0000813
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100814 // Help files are either utf-8 or latin1. Try utf-8 first, if this
815 // fails it must be latin1.
816 // Always do this when 'encoding' is "utf-8". Otherwise only do
817 // this when needed to avoid [converted] remarks all the time.
818 // It is needed when the first line contains non-ASCII characters.
819 // That is only in *.??x files.
Bram Moolenaar071d4272004-06-13 20:20:40 +0000820 fenc = (char_u *)"latin1";
821 c = enc_utf8;
Bram Moolenaar75c50c42005-06-04 22:06:24 +0000822 if (!c && !read_stdin)
Bram Moolenaar071d4272004-06-13 20:20:40 +0000823 {
Bram Moolenaar75c50c42005-06-04 22:06:24 +0000824 fc = fname[STRLEN(fname) - 1];
825 if (TOLOWER_ASC(fc) == 'x')
826 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100827 // Read the first line (and a bit more). Immediately rewind to
828 // the start of the file. If the read() fails "len" is -1.
Bram Moolenaar540fc6f2010-12-17 16:27:16 +0100829 len = read_eintr(fd, firstline, 80);
Bram Moolenaar8767f522016-07-01 17:17:39 +0200830 vim_lseek(fd, (off_T)0L, SEEK_SET);
Bram Moolenaar75c50c42005-06-04 22:06:24 +0000831 for (p = firstline; p < firstline + len; ++p)
832 if (*p >= 0x80)
833 {
834 c = TRUE;
835 break;
836 }
837 }
Bram Moolenaar071d4272004-06-13 20:20:40 +0000838 }
839
840 if (c)
841 {
842 fenc_next = fenc;
843 fenc = (char_u *)"utf-8";
844
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100845 // When the file is utf-8 but a character doesn't fit in
846 // 'encoding' don't retry. In help text editing utf-8 bytes
847 // doesn't make sense.
Bram Moolenaarf193fff2006-04-27 00:02:13 +0000848 if (!enc_utf8)
849 keep_dest_enc = TRUE;
Bram Moolenaar071d4272004-06-13 20:20:40 +0000850 }
851 fenc_alloced = FALSE;
852 }
853 else if (*p_fencs == NUL)
854 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100855 fenc = curbuf->b_p_fenc; // use format from buffer
Bram Moolenaar071d4272004-06-13 20:20:40 +0000856 fenc_alloced = FALSE;
857 }
858 else
859 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100860 fenc_next = p_fencs; // try items in 'fileencodings'
Bram Moolenaarf077db22019-08-13 00:18:24 +0200861 fenc = next_fenc(&fenc_next, &fenc_alloced);
Bram Moolenaar071d4272004-06-13 20:20:40 +0000862 }
Bram Moolenaar071d4272004-06-13 20:20:40 +0000863
864 /*
865 * Jump back here to retry reading the file in different ways.
866 * Reasons to retry:
867 * - encoding conversion failed: try another one from "fenc_next"
868 * - BOM detected and fenc was set, need to setup conversion
869 * - "fileformat" check failed: try another
870 *
871 * Variables set for special retry actions:
872 * "file_rewind" Rewind the file to start reading it again.
873 * "advance_fenc" Advance "fenc" using "fenc_next".
874 * "skip_read" Re-use already read bytes (BOM detected).
875 * "did_iconv" iconv() conversion failed, try 'charconvert'.
876 * "keep_fileformat" Don't reset "fileformat".
877 *
878 * Other status indicators:
879 * "tmpname" When != NULL did conversion with 'charconvert'.
880 * Output file has to be deleted afterwards.
881 * "iconv_fd" When != -1 did conversion with iconv().
882 */
883retry:
884
885 if (file_rewind)
886 {
887 if (read_buffer)
888 {
889 read_buf_lnum = 1;
890 read_buf_col = 0;
891 }
Bram Moolenaar8767f522016-07-01 17:17:39 +0200892 else if (read_stdin || vim_lseek(fd, (off_T)0L, SEEK_SET) != 0)
Bram Moolenaar071d4272004-06-13 20:20:40 +0000893 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100894 // Can't rewind the file, give up.
Bram Moolenaar071d4272004-06-13 20:20:40 +0000895 error = TRUE;
896 goto failed;
897 }
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100898 // Delete the previously read lines.
Bram Moolenaar071d4272004-06-13 20:20:40 +0000899 while (lnum > from)
Bram Moolenaarca70c072020-05-30 20:30:46 +0200900 ml_delete(lnum--);
Bram Moolenaar071d4272004-06-13 20:20:40 +0000901 file_rewind = FALSE;
Bram Moolenaar910f66f2006-04-05 20:41:53 +0000902 if (set_options)
Bram Moolenaar83eb8852007-08-12 13:51:26 +0000903 {
Bram Moolenaar071d4272004-06-13 20:20:40 +0000904 curbuf->b_p_bomb = FALSE;
Bram Moolenaar83eb8852007-08-12 13:51:26 +0000905 curbuf->b_start_bomb = FALSE;
906 }
Bram Moolenaarb0bf8582005-12-13 20:02:15 +0000907 conv_error = 0;
Bram Moolenaar071d4272004-06-13 20:20:40 +0000908 }
909
910 /*
911 * The first time, and when retrying with another "fenc", "fileformat"
912 * is reset below, unless "keep_fileformat" was set for this retry.
913 */
914 if (keep_fileformat)
915 keep_fileformat = FALSE;
916 else
917 {
918 if (eap != NULL && eap->force_ff != 0)
Bram Moolenaar1c860362008-11-12 15:05:21 +0000919 {
Bram Moolenaar071d4272004-06-13 20:20:40 +0000920 fileformat = get_fileformat_force(curbuf, eap);
Bram Moolenaar1c860362008-11-12 15:05:21 +0000921 try_unix = try_dos = try_mac = FALSE;
922 }
Bram Moolenaar071d4272004-06-13 20:20:40 +0000923 else if (curbuf->b_p_bin)
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100924 fileformat = EOL_UNIX; // binary: use Unix format
Bram Moolenaar071d4272004-06-13 20:20:40 +0000925 else if (*p_ffs == NUL)
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100926 fileformat = get_fileformat(curbuf);// use format from buffer
Bram Moolenaar071d4272004-06-13 20:20:40 +0000927 else
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100928 fileformat = EOL_UNKNOWN; // detect from file
Bram Moolenaar071d4272004-06-13 20:20:40 +0000929 }
930
Bram Moolenaar13505972019-01-24 15:04:48 +0100931#ifdef USE_ICONV
Bram Moolenaar071d4272004-06-13 20:20:40 +0000932 if (iconv_fd != (iconv_t)-1)
933 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100934 // aborted conversion with iconv(), close the descriptor
Bram Moolenaar071d4272004-06-13 20:20:40 +0000935 iconv_close(iconv_fd);
936 iconv_fd = (iconv_t)-1;
937 }
Bram Moolenaar13505972019-01-24 15:04:48 +0100938#endif
Bram Moolenaar071d4272004-06-13 20:20:40 +0000939
940 if (advance_fenc)
941 {
942 /*
943 * Try the next entry in 'fileencodings'.
944 */
945 advance_fenc = FALSE;
946
947 if (eap != NULL && eap->force_enc != 0)
948 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100949 // Conversion given with "++cc=" wasn't possible, read
950 // without conversion.
Bram Moolenaar071d4272004-06-13 20:20:40 +0000951 notconverted = TRUE;
Bram Moolenaarb0bf8582005-12-13 20:02:15 +0000952 conv_error = 0;
Bram Moolenaar071d4272004-06-13 20:20:40 +0000953 if (fenc_alloced)
954 vim_free(fenc);
955 fenc = (char_u *)"";
956 fenc_alloced = FALSE;
957 }
958 else
959 {
960 if (fenc_alloced)
961 vim_free(fenc);
962 if (fenc_next != NULL)
963 {
Bram Moolenaarf077db22019-08-13 00:18:24 +0200964 fenc = next_fenc(&fenc_next, &fenc_alloced);
Bram Moolenaar071d4272004-06-13 20:20:40 +0000965 }
966 else
967 {
968 fenc = (char_u *)"";
969 fenc_alloced = FALSE;
970 }
971 }
972 if (tmpname != NULL)
973 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100974 mch_remove(tmpname); // delete converted file
Bram Moolenaard23a8232018-02-10 18:45:26 +0100975 VIM_CLEAR(tmpname);
Bram Moolenaar071d4272004-06-13 20:20:40 +0000976 }
977 }
978
979 /*
Bram Moolenaarb5cdf2e2009-07-29 16:25:31 +0000980 * Conversion may be required when the encoding of the file is different
981 * from 'encoding' or 'encoding' is UTF-16, UCS-2 or UCS-4.
Bram Moolenaar071d4272004-06-13 20:20:40 +0000982 */
983 fio_flags = 0;
Bram Moolenaarb5cdf2e2009-07-29 16:25:31 +0000984 converted = need_conversion(fenc);
985 if (converted)
Bram Moolenaar071d4272004-06-13 20:20:40 +0000986 {
987
Bram Moolenaar217e1b82019-12-01 21:41:28 +0100988 // "ucs-bom" means we need to check the first bytes of the file
989 // for a BOM.
Bram Moolenaar071d4272004-06-13 20:20:40 +0000990 if (STRCMP(fenc, ENC_UCSBOM) == 0)
991 fio_flags = FIO_UCSBOM;
992
993 /*
994 * Check if UCS-2/4 or Latin1 to UTF-8 conversion needs to be
995 * done. This is handled below after read(). Prepare the
996 * fio_flags to avoid having to parse the string each time.
997 * Also check for Unicode to Latin1 conversion, because iconv()
998 * appears not to handle this correctly. This works just like
999 * conversion to UTF-8 except how the resulting character is put in
1000 * the buffer.
1001 */
1002 else if (enc_utf8 || STRCMP(p_enc, "latin1") == 0)
1003 fio_flags = get_fio_flags(fenc);
1004
Bram Moolenaar4f974752019-02-17 17:44:42 +01001005#ifdef MSWIN
Bram Moolenaar071d4272004-06-13 20:20:40 +00001006 /*
1007 * Conversion from an MS-Windows codepage to UTF-8 or another codepage
1008 * is handled with MultiByteToWideChar().
1009 */
1010 if (fio_flags == 0)
1011 fio_flags = get_win_fio_flags(fenc);
Bram Moolenaar13505972019-01-24 15:04:48 +01001012#endif
Bram Moolenaar071d4272004-06-13 20:20:40 +00001013
Bram Moolenaar13505972019-01-24 15:04:48 +01001014#ifdef MACOS_CONVERT
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001015 // Conversion from Apple MacRoman to latin1 or UTF-8
Bram Moolenaar071d4272004-06-13 20:20:40 +00001016 if (fio_flags == 0)
1017 fio_flags = get_mac_fio_flags(fenc);
Bram Moolenaar13505972019-01-24 15:04:48 +01001018#endif
Bram Moolenaar071d4272004-06-13 20:20:40 +00001019
Bram Moolenaar13505972019-01-24 15:04:48 +01001020#ifdef USE_ICONV
Bram Moolenaar071d4272004-06-13 20:20:40 +00001021 /*
1022 * Try using iconv() if we can't convert internally.
1023 */
1024 if (fio_flags == 0
Bram Moolenaar13505972019-01-24 15:04:48 +01001025# ifdef FEAT_EVAL
Bram Moolenaar071d4272004-06-13 20:20:40 +00001026 && !did_iconv
Bram Moolenaar13505972019-01-24 15:04:48 +01001027# endif
Bram Moolenaar071d4272004-06-13 20:20:40 +00001028 )
1029 iconv_fd = (iconv_t)my_iconv_open(
1030 enc_utf8 ? (char_u *)"utf-8" : p_enc, fenc);
Bram Moolenaar13505972019-01-24 15:04:48 +01001031#endif
Bram Moolenaar071d4272004-06-13 20:20:40 +00001032
Bram Moolenaar13505972019-01-24 15:04:48 +01001033#ifdef FEAT_EVAL
Bram Moolenaar071d4272004-06-13 20:20:40 +00001034 /*
1035 * Use the 'charconvert' expression when conversion is required
1036 * and we can't do it internally or with iconv().
1037 */
1038 if (fio_flags == 0 && !read_stdin && !read_buffer && *p_ccv != NUL
Bram Moolenaarf71d7b92016-08-09 22:14:05 +02001039 && !read_fifo
Bram Moolenaar13505972019-01-24 15:04:48 +01001040# ifdef USE_ICONV
Bram Moolenaar071d4272004-06-13 20:20:40 +00001041 && iconv_fd == (iconv_t)-1
Bram Moolenaar13505972019-01-24 15:04:48 +01001042# endif
Bram Moolenaar071d4272004-06-13 20:20:40 +00001043 )
1044 {
Bram Moolenaar13505972019-01-24 15:04:48 +01001045# ifdef USE_ICONV
Bram Moolenaar071d4272004-06-13 20:20:40 +00001046 did_iconv = FALSE;
Bram Moolenaar13505972019-01-24 15:04:48 +01001047# endif
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001048 // Skip conversion when it's already done (retry for wrong
1049 // "fileformat").
Bram Moolenaar071d4272004-06-13 20:20:40 +00001050 if (tmpname == NULL)
1051 {
1052 tmpname = readfile_charconvert(fname, fenc, &fd);
1053 if (tmpname == NULL)
1054 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001055 // Conversion failed. Try another one.
Bram Moolenaar071d4272004-06-13 20:20:40 +00001056 advance_fenc = TRUE;
1057 if (fd < 0)
1058 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001059 // Re-opening the original file failed!
Bram Moolenaar6d057012021-12-31 18:49:43 +00001060 emsg(_(e_conversion_mad_file_unreadable));
Bram Moolenaar071d4272004-06-13 20:20:40 +00001061 error = TRUE;
1062 goto failed;
1063 }
1064 goto retry;
1065 }
1066 }
1067 }
1068 else
Bram Moolenaar13505972019-01-24 15:04:48 +01001069#endif
Bram Moolenaar071d4272004-06-13 20:20:40 +00001070 {
1071 if (fio_flags == 0
Bram Moolenaar13505972019-01-24 15:04:48 +01001072#ifdef USE_ICONV
Bram Moolenaar071d4272004-06-13 20:20:40 +00001073 && iconv_fd == (iconv_t)-1
Bram Moolenaar13505972019-01-24 15:04:48 +01001074#endif
Bram Moolenaar071d4272004-06-13 20:20:40 +00001075 )
1076 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001077 // Conversion wanted but we can't.
1078 // Try the next conversion in 'fileencodings'
Bram Moolenaar071d4272004-06-13 20:20:40 +00001079 advance_fenc = TRUE;
1080 goto retry;
1081 }
1082 }
1083 }
1084
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001085 // Set "can_retry" when it's possible to rewind the file and try with
1086 // another "fenc" value. It's FALSE when no other "fenc" to try, reading
1087 // stdin or fixed at a specific encoding.
Bram Moolenaarf71d7b92016-08-09 22:14:05 +02001088 can_retry = (*fenc != NUL && !read_stdin && !read_fifo && !keep_dest_enc);
Bram Moolenaar071d4272004-06-13 20:20:40 +00001089
1090 if (!skip_read)
1091 {
1092 linerest = 0;
1093 filesize = 0;
Christian Brabandtf573c6e2021-06-20 14:02:16 +02001094 filesize_count = 0;
Bram Moolenaar071d4272004-06-13 20:20:40 +00001095 skip_count = lines_to_skip;
1096 read_count = lines_to_read;
Bram Moolenaar071d4272004-06-13 20:20:40 +00001097 conv_restlen = 0;
Bram Moolenaar55debbe2010-05-23 23:34:36 +02001098#ifdef FEAT_PERSISTENT_UNDO
Bram Moolenaar59f931e2010-07-24 20:27:03 +02001099 read_undo_file = (newfile && (flags & READ_KEEP_UNDO) == 0
1100 && curbuf->b_ffname != NULL
1101 && curbuf->b_p_udf
1102 && !filtering
Bram Moolenaarf71d7b92016-08-09 22:14:05 +02001103 && !read_fifo
Bram Moolenaar59f931e2010-07-24 20:27:03 +02001104 && !read_stdin
1105 && !read_buffer);
Bram Moolenaar55debbe2010-05-23 23:34:36 +02001106 if (read_undo_file)
1107 sha256_start(&sha_ctx);
1108#endif
Bram Moolenaar8f4ac012014-08-10 13:38:34 +02001109#ifdef FEAT_CRYPT
1110 if (curbuf->b_cryptstate != NULL)
1111 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001112 // Need to free the state, but keep the key, don't want to ask for
1113 // it again.
Bram Moolenaar8f4ac012014-08-10 13:38:34 +02001114 crypt_free_state(curbuf->b_cryptstate);
1115 curbuf->b_cryptstate = NULL;
1116 }
1117#endif
Bram Moolenaar071d4272004-06-13 20:20:40 +00001118 }
1119
1120 while (!error && !got_int)
1121 {
1122 /*
1123 * We allocate as much space for the file as we can get, plus
1124 * space for the old line plus room for one terminating NUL.
1125 * The amount is limited by the fact that read() only can read
Bram Moolenaar05ad5ff2019-11-30 22:48:27 +01001126 * up to max_unsigned characters (and other things).
Bram Moolenaar071d4272004-06-13 20:20:40 +00001127 */
Bram Moolenaar13d3b052018-04-29 13:34:47 +02001128 if (!skip_read)
1129 {
Bram Moolenaar30276f22019-01-24 17:59:39 +01001130#if defined(SSIZE_MAX) && (SSIZE_MAX < 0x10000L)
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001131 size = SSIZE_MAX; // use max I/O size, 52K
Bram Moolenaar30276f22019-01-24 17:59:39 +01001132#else
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001133 // Use buffer >= 64K. Add linerest to double the size if the
1134 // line gets very long, to avoid a lot of copying. But don't
1135 // read more than 1 Mbyte at a time, so we can be interrupted.
Bram Moolenaar13d3b052018-04-29 13:34:47 +02001136 size = 0x10000L + linerest;
1137 if (size > 0x100000L)
1138 size = 0x100000L;
Bram Moolenaar13d3b052018-04-29 13:34:47 +02001139#endif
1140 }
1141
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001142 // Protect against the argument of lalloc() going negative.
Bram Moolenaar30276f22019-01-24 17:59:39 +01001143 if (size < 0 || size + linerest + 1 < 0 || linerest >= MAXCOL)
Bram Moolenaar071d4272004-06-13 20:20:40 +00001144 {
1145 ++split;
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001146 *ptr = NL; // split line by inserting a NL
Bram Moolenaar071d4272004-06-13 20:20:40 +00001147 size = 1;
1148 }
1149 else
Bram Moolenaar071d4272004-06-13 20:20:40 +00001150 {
1151 if (!skip_read)
1152 {
Bram Moolenaarc1e37902006-04-18 21:55:01 +00001153 for ( ; size >= 10; size = (long)((long_u)size >> 1))
Bram Moolenaar071d4272004-06-13 20:20:40 +00001154 {
Bram Moolenaar18a4ba22019-05-24 19:39:03 +02001155 if ((new_buffer = lalloc(size + linerest + 1,
Bram Moolenaar071d4272004-06-13 20:20:40 +00001156 FALSE)) != NULL)
1157 break;
1158 }
1159 if (new_buffer == NULL)
1160 {
1161 do_outofmem_msg((long_u)(size * 2 + linerest + 1));
1162 error = TRUE;
1163 break;
1164 }
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001165 if (linerest) // copy characters from the previous buffer
Bram Moolenaar071d4272004-06-13 20:20:40 +00001166 mch_memmove(new_buffer, ptr - linerest, (size_t)linerest);
1167 vim_free(buffer);
1168 buffer = new_buffer;
1169 ptr = buffer + linerest;
1170 line_start = buffer;
1171
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001172 // May need room to translate into.
1173 // For iconv() we don't really know the required space, use a
1174 // factor ICONV_MULT.
1175 // latin1 to utf-8: 1 byte becomes up to 2 bytes
1176 // utf-16 to utf-8: 2 bytes become up to 3 bytes, 4 bytes
1177 // become up to 4 bytes, size must be multiple of 2
1178 // ucs-2 to utf-8: 2 bytes become up to 3 bytes, size must be
1179 // multiple of 2
1180 // ucs-4 to utf-8: 4 bytes become up to 6 bytes, size must be
1181 // multiple of 4
Bram Moolenaara93fa7e2006-04-17 22:14:47 +00001182 real_size = (int)size;
Bram Moolenaar13505972019-01-24 15:04:48 +01001183#ifdef USE_ICONV
Bram Moolenaar071d4272004-06-13 20:20:40 +00001184 if (iconv_fd != (iconv_t)-1)
1185 size = size / ICONV_MULT;
1186 else
Bram Moolenaar13505972019-01-24 15:04:48 +01001187#endif
Bram Moolenaar071d4272004-06-13 20:20:40 +00001188 if (fio_flags & FIO_LATIN1)
1189 size = size / 2;
1190 else if (fio_flags & (FIO_UCS2 | FIO_UTF16))
1191 size = (size * 2 / 3) & ~1;
1192 else if (fio_flags & FIO_UCS4)
1193 size = (size * 2 / 3) & ~3;
1194 else if (fio_flags == FIO_UCSBOM)
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001195 size = size / ICONV_MULT; // worst case
Bram Moolenaar4f974752019-02-17 17:44:42 +01001196#ifdef MSWIN
Bram Moolenaar071d4272004-06-13 20:20:40 +00001197 else if (fio_flags & FIO_CODEPAGE)
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001198 size = size / ICONV_MULT; // also worst case
Bram Moolenaar13505972019-01-24 15:04:48 +01001199#endif
1200#ifdef MACOS_CONVERT
Bram Moolenaar071d4272004-06-13 20:20:40 +00001201 else if (fio_flags & FIO_MACROMAN)
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001202 size = size / ICONV_MULT; // also worst case
Bram Moolenaar071d4272004-06-13 20:20:40 +00001203#endif
1204
Bram Moolenaar071d4272004-06-13 20:20:40 +00001205 if (conv_restlen > 0)
1206 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001207 // Insert unconverted bytes from previous line.
Bram Moolenaar071d4272004-06-13 20:20:40 +00001208 mch_memmove(ptr, conv_rest, conv_restlen);
1209 ptr += conv_restlen;
1210 size -= conv_restlen;
1211 }
Bram Moolenaar071d4272004-06-13 20:20:40 +00001212
1213 if (read_buffer)
1214 {
1215 /*
1216 * Read bytes from curbuf. Used for converting text read
1217 * from stdin.
1218 */
Christian Brabandt226b28b2021-06-21 21:08:08 +02001219 eof = FALSE;
Bram Moolenaar071d4272004-06-13 20:20:40 +00001220 if (read_buf_lnum > from)
1221 size = 0;
1222 else
1223 {
1224 int n, ni;
1225 long tlen;
1226
1227 tlen = 0;
1228 for (;;)
1229 {
1230 p = ml_get(read_buf_lnum) + read_buf_col;
1231 n = (int)STRLEN(p);
1232 if ((int)tlen + n + 1 > size)
1233 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001234 // Filled up to "size", append partial line.
1235 // Change NL to NUL to reverse the effect done
1236 // below.
Bram Moolenaara93fa7e2006-04-17 22:14:47 +00001237 n = (int)(size - tlen);
Bram Moolenaar071d4272004-06-13 20:20:40 +00001238 for (ni = 0; ni < n; ++ni)
1239 {
1240 if (p[ni] == NL)
1241 ptr[tlen++] = NUL;
1242 else
1243 ptr[tlen++] = p[ni];
1244 }
1245 read_buf_col += n;
1246 break;
1247 }
=?UTF-8?q?Dundar=20G=C3=B6c?=f26c1612022-04-07 13:26:34 +01001248
1249 // Append whole line and new-line. Change NL
1250 // to NUL to reverse the effect done below.
1251 for (ni = 0; ni < n; ++ni)
Bram Moolenaar071d4272004-06-13 20:20:40 +00001252 {
=?UTF-8?q?Dundar=20G=C3=B6c?=f26c1612022-04-07 13:26:34 +01001253 if (p[ni] == NL)
1254 ptr[tlen++] = NUL;
1255 else
1256 ptr[tlen++] = p[ni];
Bram Moolenaar071d4272004-06-13 20:20:40 +00001257 }
=?UTF-8?q?Dundar=20G=C3=B6c?=f26c1612022-04-07 13:26:34 +01001258 ptr[tlen++] = NL;
1259 read_buf_col = 0;
1260 if (++read_buf_lnum > from)
1261 {
1262 // When the last line didn't have an
1263 // end-of-line don't add it now either.
1264 if (!curbuf->b_p_eol)
1265 --tlen;
1266 size = tlen;
1267 eof = TRUE;
1268 break;
1269 }
1270
Bram Moolenaar071d4272004-06-13 20:20:40 +00001271 }
1272 }
1273 }
1274 else
1275 {
1276 /*
1277 * Read bytes from the file.
1278 */
Christian Brabandtf573c6e2021-06-20 14:02:16 +02001279# ifdef FEAT_SODIUM
1280 // Let the crypt layer work with a buffer size of 8192
1281 if (filesize == 0)
1282 // set size to 8K + Sodium Crypt Metadata
Christian Brabandt226b28b2021-06-21 21:08:08 +02001283 size = WRITEBUFSIZE + crypt_get_max_header_len()
Christian Brabandtf573c6e2021-06-20 14:02:16 +02001284 + crypto_secretstream_xchacha20poly1305_HEADERBYTES
1285 + crypto_secretstream_xchacha20poly1305_ABYTES;
1286
1287 else if (filesize > 0 && (curbuf->b_cryptstate != NULL &&
1288 curbuf->b_cryptstate->method_nr == CRYPT_M_SOD))
1289 size = WRITEBUFSIZE + crypto_secretstream_xchacha20poly1305_ABYTES;
1290# endif
1291 eof = size;
Bram Moolenaar540fc6f2010-12-17 16:27:16 +01001292 size = read_eintr(fd, ptr, size);
Christian Brabandtf573c6e2021-06-20 14:02:16 +02001293 filesize_count += size;
1294 // hit end of file
1295 eof = (size < eof || filesize_count == filesize_disk);
Bram Moolenaar071d4272004-06-13 20:20:40 +00001296 }
1297
Bram Moolenaar8f4ac012014-08-10 13:38:34 +02001298#ifdef FEAT_CRYPT
1299 /*
1300 * At start of file: Check for magic number of encryption.
1301 */
1302 if (filesize == 0 && size > 0)
Bram Moolenaar65aee0b2021-06-27 14:08:24 +02001303 {
Bram Moolenaar8f4ac012014-08-10 13:38:34 +02001304 cryptkey = check_for_cryptkey(cryptkey, ptr, &size,
1305 &filesize, newfile, sfname,
1306 &did_ask_for_key);
Bram Moolenaarb4868ed2022-01-19 11:24:40 +00001307# if defined(CRYPT_NOT_INPLACE) && defined(FEAT_PERSISTENT_UNDO)
Bram Moolenaar65aee0b2021-06-27 14:08:24 +02001308 if (curbuf->b_cryptstate != NULL
1309 && !crypt_works_inplace(curbuf->b_cryptstate))
1310 // reading undo file requires crypt_decode_inplace()
1311 read_undo_file = FALSE;
1312# endif
1313 }
Bram Moolenaar8f4ac012014-08-10 13:38:34 +02001314 /*
1315 * Decrypt the read bytes. This is done before checking for
1316 * EOF because the crypt layer may be buffering.
1317 */
Bram Moolenaar829aa642017-08-23 22:32:35 +02001318 if (cryptkey != NULL && curbuf->b_cryptstate != NULL
1319 && size > 0)
Bram Moolenaar8f4ac012014-08-10 13:38:34 +02001320 {
Bram Moolenaar987411d2019-01-18 22:48:34 +01001321# ifdef CRYPT_NOT_INPLACE
Bram Moolenaar8f4ac012014-08-10 13:38:34 +02001322 if (crypt_works_inplace(curbuf->b_cryptstate))
1323 {
Bram Moolenaar987411d2019-01-18 22:48:34 +01001324# endif
Christian Brabandtf573c6e2021-06-20 14:02:16 +02001325 crypt_decode_inplace(curbuf->b_cryptstate, ptr,
1326 size, eof);
Bram Moolenaar987411d2019-01-18 22:48:34 +01001327# ifdef CRYPT_NOT_INPLACE
Bram Moolenaar8f4ac012014-08-10 13:38:34 +02001328 }
1329 else
1330 {
1331 char_u *newptr = NULL;
1332 int decrypted_size;
1333
1334 decrypted_size = crypt_decode_alloc(
Christian Brabandtf573c6e2021-06-20 14:02:16 +02001335 curbuf->b_cryptstate, ptr, size,
1336 &newptr, eof);
Bram Moolenaar8f4ac012014-08-10 13:38:34 +02001337
Christian Brabandtf573c6e2021-06-20 14:02:16 +02001338 if (decrypted_size < 0)
1339 {
1340 // error message already given
1341 error = TRUE;
1342 vim_free(newptr);
1343 break;
1344 }
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001345 // If the crypt layer is buffering, not producing
1346 // anything yet, need to read more.
Bram Moolenaar1c17ffa2018-04-24 15:19:04 +02001347 if (decrypted_size == 0)
Bram Moolenaar8f4ac012014-08-10 13:38:34 +02001348 continue;
1349
1350 if (linerest == 0)
1351 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001352 // Simple case: reuse returned buffer (may be
1353 // NULL, checked later).
Bram Moolenaar8f4ac012014-08-10 13:38:34 +02001354 new_buffer = newptr;
1355 }
1356 else
1357 {
1358 long_u new_size;
1359
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001360 // Need new buffer to add bytes carried over.
Bram Moolenaar8f4ac012014-08-10 13:38:34 +02001361 new_size = (long_u)(decrypted_size + linerest + 1);
1362 new_buffer = lalloc(new_size, FALSE);
1363 if (new_buffer == NULL)
1364 {
1365 do_outofmem_msg(new_size);
1366 error = TRUE;
1367 break;
1368 }
1369
1370 mch_memmove(new_buffer, buffer, linerest);
1371 if (newptr != NULL)
1372 mch_memmove(new_buffer + linerest, newptr,
1373 decrypted_size);
Christian Brabandtf573c6e2021-06-20 14:02:16 +02001374 vim_free(newptr);
Bram Moolenaar8f4ac012014-08-10 13:38:34 +02001375 }
1376
1377 if (new_buffer != NULL)
1378 {
1379 vim_free(buffer);
1380 buffer = new_buffer;
1381 new_buffer = NULL;
1382 line_start = buffer;
1383 ptr = buffer + linerest;
Christian Brabandtf573c6e2021-06-20 14:02:16 +02001384 real_size = size;
Bram Moolenaar8f4ac012014-08-10 13:38:34 +02001385 }
1386 size = decrypted_size;
1387 }
Bram Moolenaar987411d2019-01-18 22:48:34 +01001388# endif
Bram Moolenaar8f4ac012014-08-10 13:38:34 +02001389 }
1390#endif
1391
Bram Moolenaar071d4272004-06-13 20:20:40 +00001392 if (size <= 0)
1393 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001394 if (size < 0) // read error
Bram Moolenaar071d4272004-06-13 20:20:40 +00001395 error = TRUE;
Bram Moolenaar071d4272004-06-13 20:20:40 +00001396 else if (conv_restlen > 0)
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00001397 {
Bram Moolenaarf453d352008-06-04 17:37:34 +00001398 /*
1399 * Reached end-of-file but some trailing bytes could
1400 * not be converted. Truncated file?
1401 */
1402
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001403 // When we did a conversion report an error.
Bram Moolenaarf453d352008-06-04 17:37:34 +00001404 if (fio_flags != 0
Bram Moolenaar13505972019-01-24 15:04:48 +01001405#ifdef USE_ICONV
Bram Moolenaarf453d352008-06-04 17:37:34 +00001406 || iconv_fd != (iconv_t)-1
Bram Moolenaar13505972019-01-24 15:04:48 +01001407#endif
Bram Moolenaarf453d352008-06-04 17:37:34 +00001408 )
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00001409 {
Bram Moolenaare8d95302013-04-24 16:34:02 +02001410 if (can_retry)
1411 goto rewind_retry;
Bram Moolenaarf453d352008-06-04 17:37:34 +00001412 if (conv_error == 0)
1413 conv_error = curbuf->b_ml.ml_line_count
1414 - linecnt + 1;
1415 }
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001416 // Remember the first linenr with an illegal byte
Bram Moolenaarf453d352008-06-04 17:37:34 +00001417 else if (illegal_byte == 0)
1418 illegal_byte = curbuf->b_ml.ml_line_count
1419 - linecnt + 1;
1420 if (bad_char_behavior == BAD_DROP)
1421 {
1422 *(ptr - conv_restlen) = NUL;
1423 conv_restlen = 0;
1424 }
1425 else
1426 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001427 // Replace the trailing bytes with the replacement
1428 // character if we were converting; if we weren't,
1429 // leave the UTF8 checking code to do it, as it
1430 // works slightly differently.
Bram Moolenaarf453d352008-06-04 17:37:34 +00001431 if (bad_char_behavior != BAD_KEEP && (fio_flags != 0
Bram Moolenaar13505972019-01-24 15:04:48 +01001432#ifdef USE_ICONV
Bram Moolenaarf453d352008-06-04 17:37:34 +00001433 || iconv_fd != (iconv_t)-1
Bram Moolenaar13505972019-01-24 15:04:48 +01001434#endif
Bram Moolenaarf453d352008-06-04 17:37:34 +00001435 ))
1436 {
1437 while (conv_restlen > 0)
1438 {
1439 *(--ptr) = bad_char_behavior;
1440 --conv_restlen;
1441 }
1442 }
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001443 fio_flags = 0; // don't convert this
Bram Moolenaar13505972019-01-24 15:04:48 +01001444#ifdef USE_ICONV
Bram Moolenaarb21e5842006-04-16 18:30:08 +00001445 if (iconv_fd != (iconv_t)-1)
1446 {
1447 iconv_close(iconv_fd);
1448 iconv_fd = (iconv_t)-1;
1449 }
Bram Moolenaar13505972019-01-24 15:04:48 +01001450#endif
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00001451 }
1452 }
Bram Moolenaar071d4272004-06-13 20:20:40 +00001453 }
Bram Moolenaar071d4272004-06-13 20:20:40 +00001454 }
1455 skip_read = FALSE;
1456
Bram Moolenaar071d4272004-06-13 20:20:40 +00001457 /*
1458 * At start of file (or after crypt magic number): Check for BOM.
1459 * Also check for a BOM for other Unicode encodings, but not after
1460 * converting with 'charconvert' or when a BOM has already been
1461 * found.
1462 */
1463 if ((filesize == 0
Bram Moolenaar13505972019-01-24 15:04:48 +01001464#ifdef FEAT_CRYPT
Bram Moolenaar8f4ac012014-08-10 13:38:34 +02001465 || (cryptkey != NULL
1466 && filesize == crypt_get_header_len(
1467 crypt_get_method_nr(curbuf)))
Bram Moolenaar13505972019-01-24 15:04:48 +01001468#endif
Bram Moolenaar071d4272004-06-13 20:20:40 +00001469 )
1470 && (fio_flags == FIO_UCSBOM
1471 || (!curbuf->b_p_bomb
1472 && tmpname == NULL
1473 && (*fenc == 'u' || (*fenc == NUL && enc_utf8)))))
1474 {
1475 char_u *ccname;
1476 int blen;
1477
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001478 // no BOM detection in a short file or in binary mode
Bram Moolenaar071d4272004-06-13 20:20:40 +00001479 if (size < 2 || curbuf->b_p_bin)
1480 ccname = NULL;
1481 else
1482 ccname = check_for_bom(ptr, size, &blen,
1483 fio_flags == FIO_UCSBOM ? FIO_ALL : get_fio_flags(fenc));
1484 if (ccname != NULL)
1485 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001486 // Remove BOM from the text
Bram Moolenaar071d4272004-06-13 20:20:40 +00001487 filesize += blen;
1488 size -= blen;
1489 mch_memmove(ptr, ptr + blen, (size_t)size);
Bram Moolenaar910f66f2006-04-05 20:41:53 +00001490 if (set_options)
Bram Moolenaar83eb8852007-08-12 13:51:26 +00001491 {
Bram Moolenaar071d4272004-06-13 20:20:40 +00001492 curbuf->b_p_bomb = TRUE;
Bram Moolenaar83eb8852007-08-12 13:51:26 +00001493 curbuf->b_start_bomb = TRUE;
1494 }
Bram Moolenaar071d4272004-06-13 20:20:40 +00001495 }
1496
1497 if (fio_flags == FIO_UCSBOM)
1498 {
1499 if (ccname == NULL)
1500 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001501 // No BOM detected: retry with next encoding.
Bram Moolenaar071d4272004-06-13 20:20:40 +00001502 advance_fenc = TRUE;
1503 }
1504 else
1505 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001506 // BOM detected: set "fenc" and jump back
Bram Moolenaar071d4272004-06-13 20:20:40 +00001507 if (fenc_alloced)
1508 vim_free(fenc);
1509 fenc = ccname;
1510 fenc_alloced = FALSE;
1511 }
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001512 // retry reading without getting new bytes or rewinding
Bram Moolenaar071d4272004-06-13 20:20:40 +00001513 skip_read = TRUE;
1514 goto retry;
1515 }
1516 }
Bram Moolenaarf453d352008-06-04 17:37:34 +00001517
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001518 // Include not converted bytes.
Bram Moolenaarf453d352008-06-04 17:37:34 +00001519 ptr -= conv_restlen;
1520 size += conv_restlen;
1521 conv_restlen = 0;
Bram Moolenaar071d4272004-06-13 20:20:40 +00001522 /*
1523 * Break here for a read error or end-of-file.
1524 */
1525 if (size <= 0)
1526 break;
1527
Bram Moolenaar071d4272004-06-13 20:20:40 +00001528
Bram Moolenaar13505972019-01-24 15:04:48 +01001529#ifdef USE_ICONV
Bram Moolenaar071d4272004-06-13 20:20:40 +00001530 if (iconv_fd != (iconv_t)-1)
1531 {
1532 /*
1533 * Attempt conversion of the read bytes to 'encoding' using
1534 * iconv().
1535 */
1536 const char *fromp;
1537 char *top;
1538 size_t from_size;
1539 size_t to_size;
1540
1541 fromp = (char *)ptr;
1542 from_size = size;
1543 ptr += size;
1544 top = (char *)ptr;
1545 to_size = real_size - size;
1546
1547 /*
1548 * If there is conversion error or not enough room try using
Bram Moolenaar19a09a12005-03-04 23:39:37 +00001549 * another conversion. Except for when there is no
1550 * alternative (help files).
Bram Moolenaar071d4272004-06-13 20:20:40 +00001551 */
Bram Moolenaar8cd06ca2005-02-28 22:44:58 +00001552 while ((iconv(iconv_fd, (void *)&fromp, &from_size,
1553 &top, &to_size)
Bram Moolenaar071d4272004-06-13 20:20:40 +00001554 == (size_t)-1 && ICONV_ERRNO != ICONV_EINVAL)
1555 || from_size > CONV_RESTLEN)
Bram Moolenaar8cd06ca2005-02-28 22:44:58 +00001556 {
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00001557 if (can_retry)
Bram Moolenaar8cd06ca2005-02-28 22:44:58 +00001558 goto rewind_retry;
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00001559 if (conv_error == 0)
1560 conv_error = readfile_linenr(linecnt,
1561 ptr, (char_u *)top);
Bram Moolenaar42eeac32005-06-29 22:40:58 +00001562
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001563 // Deal with a bad byte and continue with the next.
Bram Moolenaar8cd06ca2005-02-28 22:44:58 +00001564 ++fromp;
1565 --from_size;
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00001566 if (bad_char_behavior == BAD_KEEP)
1567 {
1568 *top++ = *(fromp - 1);
1569 --to_size;
1570 }
1571 else if (bad_char_behavior != BAD_DROP)
1572 {
1573 *top++ = bad_char_behavior;
1574 --to_size;
1575 }
Bram Moolenaar8cd06ca2005-02-28 22:44:58 +00001576 }
Bram Moolenaar071d4272004-06-13 20:20:40 +00001577
1578 if (from_size > 0)
1579 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001580 // Some remaining characters, keep them for the next
1581 // round.
Bram Moolenaar071d4272004-06-13 20:20:40 +00001582 mch_memmove(conv_rest, (char_u *)fromp, from_size);
1583 conv_restlen = (int)from_size;
1584 }
1585
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001586 // move the linerest to before the converted characters
Bram Moolenaar071d4272004-06-13 20:20:40 +00001587 line_start = ptr - linerest;
1588 mch_memmove(line_start, buffer, (size_t)linerest);
1589 size = (long)((char_u *)top - ptr);
1590 }
Bram Moolenaar13505972019-01-24 15:04:48 +01001591#endif
Bram Moolenaar071d4272004-06-13 20:20:40 +00001592
Bram Moolenaar4f974752019-02-17 17:44:42 +01001593#ifdef MSWIN
Bram Moolenaar071d4272004-06-13 20:20:40 +00001594 if (fio_flags & FIO_CODEPAGE)
1595 {
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00001596 char_u *src, *dst;
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00001597 WCHAR ucs2buf[3];
1598 int ucs2len;
1599 int codepage = FIO_GET_CP(fio_flags);
1600 int bytelen;
1601 int found_bad;
1602 char replstr[2];
1603
Bram Moolenaar071d4272004-06-13 20:20:40 +00001604 /*
1605 * Conversion from an MS-Windows codepage or UTF-8 to UTF-8 or
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00001606 * a codepage, using standard MS-Windows functions. This
1607 * requires two steps:
1608 * 1. convert from 'fileencoding' to ucs-2
1609 * 2. convert from ucs-2 to 'encoding'
Bram Moolenaar071d4272004-06-13 20:20:40 +00001610 *
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00001611 * Because there may be illegal bytes AND an incomplete byte
1612 * sequence at the end, we may have to do the conversion one
1613 * character at a time to get it right.
Bram Moolenaar071d4272004-06-13 20:20:40 +00001614 */
Bram Moolenaar071d4272004-06-13 20:20:40 +00001615
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001616 // Replacement string for WideCharToMultiByte().
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00001617 if (bad_char_behavior > 0)
1618 replstr[0] = bad_char_behavior;
Bram Moolenaar071d4272004-06-13 20:20:40 +00001619 else
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00001620 replstr[0] = '?';
1621 replstr[1] = NUL;
Bram Moolenaar071d4272004-06-13 20:20:40 +00001622
1623 /*
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00001624 * Move the bytes to the end of the buffer, so that we have
1625 * room to put the result at the start.
Bram Moolenaar071d4272004-06-13 20:20:40 +00001626 */
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00001627 src = ptr + real_size - size;
1628 mch_memmove(src, ptr, size);
Bram Moolenaar071d4272004-06-13 20:20:40 +00001629
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00001630 /*
1631 * Do the conversion.
1632 */
1633 dst = ptr;
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00001634 while (size > 0)
1635 {
1636 found_bad = FALSE;
1637
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001638# ifdef CP_UTF8 // VC 4.1 doesn't define CP_UTF8
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00001639 if (codepage == CP_UTF8)
1640 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001641 // Handle CP_UTF8 input ourselves to be able to handle
1642 // trailing bytes properly.
1643 // Get one UTF-8 character from src.
Bram Moolenaara93fa7e2006-04-17 22:14:47 +00001644 bytelen = (int)utf_ptr2len_len(src, size);
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00001645 if (bytelen > size)
1646 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001647 // Only got some bytes of a character. Normally
1648 // it's put in "conv_rest", but if it's too long
1649 // deal with it as if they were illegal bytes.
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00001650 if (bytelen <= CONV_RESTLEN)
1651 break;
1652
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001653 // weird overlong byte sequence
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00001654 bytelen = size;
1655 found_bad = TRUE;
1656 }
1657 else
1658 {
Bram Moolenaarc01140a2006-03-24 22:21:52 +00001659 int u8c = utf_ptr2char(src);
1660
Bram Moolenaar86e01082005-12-29 22:45:34 +00001661 if (u8c > 0xffff || (*src >= 0x80 && bytelen == 1))
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00001662 found_bad = TRUE;
1663 ucs2buf[0] = u8c;
1664 ucs2len = 1;
1665 }
1666 }
1667 else
1668# endif
1669 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001670 // We don't know how long the byte sequence is, try
1671 // from one to three bytes.
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00001672 for (bytelen = 1; bytelen <= size && bytelen <= 3;
1673 ++bytelen)
1674 {
1675 ucs2len = MultiByteToWideChar(codepage,
1676 MB_ERR_INVALID_CHARS,
1677 (LPCSTR)src, bytelen,
1678 ucs2buf, 3);
1679 if (ucs2len > 0)
1680 break;
1681 }
1682 if (ucs2len == 0)
1683 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001684 // If we have only one byte then it's probably an
1685 // incomplete byte sequence. Otherwise discard
1686 // one byte as a bad character.
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00001687 if (size == 1)
1688 break;
1689 found_bad = TRUE;
1690 bytelen = 1;
1691 }
1692 }
1693
1694 if (!found_bad)
1695 {
1696 int i;
1697
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001698 // Convert "ucs2buf[ucs2len]" to 'enc' in "dst".
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00001699 if (enc_utf8)
1700 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001701 // From UCS-2 to UTF-8. Cannot fail.
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00001702 for (i = 0; i < ucs2len; ++i)
1703 dst += utf_char2bytes(ucs2buf[i], dst);
1704 }
1705 else
1706 {
1707 BOOL bad = FALSE;
1708 int dstlen;
1709
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001710 // From UCS-2 to "enc_codepage". If the
1711 // conversion uses the default character "?",
1712 // the data doesn't fit in this encoding.
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00001713 dstlen = WideCharToMultiByte(enc_codepage, 0,
1714 (LPCWSTR)ucs2buf, ucs2len,
Bram Moolenaara93fa7e2006-04-17 22:14:47 +00001715 (LPSTR)dst, (int)(src - dst),
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00001716 replstr, &bad);
1717 if (bad)
1718 found_bad = TRUE;
1719 else
1720 dst += dstlen;
1721 }
1722 }
1723
1724 if (found_bad)
1725 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001726 // Deal with bytes we can't convert.
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00001727 if (can_retry)
1728 goto rewind_retry;
1729 if (conv_error == 0)
1730 conv_error = readfile_linenr(linecnt, ptr, dst);
1731 if (bad_char_behavior != BAD_DROP)
1732 {
1733 if (bad_char_behavior == BAD_KEEP)
1734 {
1735 mch_memmove(dst, src, bytelen);
1736 dst += bytelen;
1737 }
1738 else
1739 *dst++ = bad_char_behavior;
1740 }
1741 }
1742
1743 src += bytelen;
1744 size -= bytelen;
Bram Moolenaar071d4272004-06-13 20:20:40 +00001745 }
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00001746
1747 if (size > 0)
1748 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001749 // An incomplete byte sequence remaining.
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00001750 mch_memmove(conv_rest, src, size);
1751 conv_restlen = size;
1752 }
1753
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001754 // The new size is equal to how much "dst" was advanced.
Bram Moolenaara93fa7e2006-04-17 22:14:47 +00001755 size = (long)(dst - ptr);
Bram Moolenaar071d4272004-06-13 20:20:40 +00001756 }
1757 else
Bram Moolenaar13505972019-01-24 15:04:48 +01001758#endif
1759#ifdef MACOS_CONVERT
Bram Moolenaar071d4272004-06-13 20:20:40 +00001760 if (fio_flags & FIO_MACROMAN)
1761 {
1762 /*
1763 * Conversion from Apple MacRoman char encoding to UTF-8 or
Bram Moolenaarab79bcb2004-07-18 21:34:53 +00001764 * latin1. This is in os_mac_conv.c.
Bram Moolenaar071d4272004-06-13 20:20:40 +00001765 */
Bram Moolenaarab79bcb2004-07-18 21:34:53 +00001766 if (macroman2enc(ptr, &size, real_size) == FAIL)
Bram Moolenaar071d4272004-06-13 20:20:40 +00001767 goto rewind_retry;
Bram Moolenaar071d4272004-06-13 20:20:40 +00001768 }
1769 else
Bram Moolenaar13505972019-01-24 15:04:48 +01001770#endif
Bram Moolenaar071d4272004-06-13 20:20:40 +00001771 if (fio_flags != 0)
1772 {
1773 int u8c;
1774 char_u *dest;
1775 char_u *tail = NULL;
1776
1777 /*
1778 * "enc_utf8" set: Convert Unicode or Latin1 to UTF-8.
1779 * "enc_utf8" not set: Convert Unicode to Latin1.
1780 * Go from end to start through the buffer, because the number
1781 * of bytes may increase.
1782 * "dest" points to after where the UTF-8 bytes go, "p" points
1783 * to after the next character to convert.
1784 */
1785 dest = ptr + real_size;
1786 if (fio_flags == FIO_LATIN1 || fio_flags == FIO_UTF8)
1787 {
1788 p = ptr + size;
1789 if (fio_flags == FIO_UTF8)
1790 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001791 // Check for a trailing incomplete UTF-8 sequence
Bram Moolenaar071d4272004-06-13 20:20:40 +00001792 tail = ptr + size - 1;
1793 while (tail > ptr && (*tail & 0xc0) == 0x80)
1794 --tail;
1795 if (tail + utf_byte2len(*tail) <= ptr + size)
1796 tail = NULL;
1797 else
1798 p = tail;
1799 }
1800 }
1801 else if (fio_flags & (FIO_UCS2 | FIO_UTF16))
1802 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001803 // Check for a trailing byte
Bram Moolenaar071d4272004-06-13 20:20:40 +00001804 p = ptr + (size & ~1);
1805 if (size & 1)
1806 tail = p;
1807 if ((fio_flags & FIO_UTF16) && p > ptr)
1808 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001809 // Check for a trailing leading word
Bram Moolenaar071d4272004-06-13 20:20:40 +00001810 if (fio_flags & FIO_ENDIAN_L)
1811 {
1812 u8c = (*--p << 8);
1813 u8c += *--p;
1814 }
1815 else
1816 {
1817 u8c = *--p;
1818 u8c += (*--p << 8);
1819 }
1820 if (u8c >= 0xd800 && u8c <= 0xdbff)
1821 tail = p;
1822 else
1823 p += 2;
1824 }
1825 }
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001826 else // FIO_UCS4
Bram Moolenaar071d4272004-06-13 20:20:40 +00001827 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001828 // Check for trailing 1, 2 or 3 bytes
Bram Moolenaar071d4272004-06-13 20:20:40 +00001829 p = ptr + (size & ~3);
1830 if (size & 3)
1831 tail = p;
1832 }
1833
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001834 // If there is a trailing incomplete sequence move it to
1835 // conv_rest[].
Bram Moolenaar071d4272004-06-13 20:20:40 +00001836 if (tail != NULL)
1837 {
1838 conv_restlen = (int)((ptr + size) - tail);
1839 mch_memmove(conv_rest, (char_u *)tail, conv_restlen);
1840 size -= conv_restlen;
1841 }
1842
1843
1844 while (p > ptr)
1845 {
1846 if (fio_flags & FIO_LATIN1)
1847 u8c = *--p;
1848 else if (fio_flags & (FIO_UCS2 | FIO_UTF16))
1849 {
1850 if (fio_flags & FIO_ENDIAN_L)
1851 {
1852 u8c = (*--p << 8);
1853 u8c += *--p;
1854 }
1855 else
1856 {
1857 u8c = *--p;
1858 u8c += (*--p << 8);
1859 }
1860 if ((fio_flags & FIO_UTF16)
1861 && u8c >= 0xdc00 && u8c <= 0xdfff)
1862 {
1863 int u16c;
1864
1865 if (p == ptr)
1866 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001867 // Missing leading word.
Bram Moolenaar071d4272004-06-13 20:20:40 +00001868 if (can_retry)
1869 goto rewind_retry;
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00001870 if (conv_error == 0)
1871 conv_error = readfile_linenr(linecnt,
1872 ptr, p);
1873 if (bad_char_behavior == BAD_DROP)
1874 continue;
1875 if (bad_char_behavior != BAD_KEEP)
1876 u8c = bad_char_behavior;
Bram Moolenaar071d4272004-06-13 20:20:40 +00001877 }
1878
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001879 // found second word of double-word, get the first
1880 // word and compute the resulting character
Bram Moolenaar071d4272004-06-13 20:20:40 +00001881 if (fio_flags & FIO_ENDIAN_L)
1882 {
1883 u16c = (*--p << 8);
1884 u16c += *--p;
1885 }
1886 else
1887 {
1888 u16c = *--p;
1889 u16c += (*--p << 8);
1890 }
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00001891 u8c = 0x10000 + ((u16c & 0x3ff) << 10)
1892 + (u8c & 0x3ff);
1893
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001894 // Check if the word is indeed a leading word.
Bram Moolenaar071d4272004-06-13 20:20:40 +00001895 if (u16c < 0xd800 || u16c > 0xdbff)
1896 {
1897 if (can_retry)
1898 goto rewind_retry;
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00001899 if (conv_error == 0)
1900 conv_error = readfile_linenr(linecnt,
1901 ptr, p);
1902 if (bad_char_behavior == BAD_DROP)
1903 continue;
1904 if (bad_char_behavior != BAD_KEEP)
1905 u8c = bad_char_behavior;
Bram Moolenaar071d4272004-06-13 20:20:40 +00001906 }
Bram Moolenaar071d4272004-06-13 20:20:40 +00001907 }
1908 }
1909 else if (fio_flags & FIO_UCS4)
1910 {
1911 if (fio_flags & FIO_ENDIAN_L)
1912 {
Bram Moolenaardc1c9812017-10-27 22:15:24 +02001913 u8c = (unsigned)*--p << 24;
1914 u8c += (unsigned)*--p << 16;
1915 u8c += (unsigned)*--p << 8;
Bram Moolenaar071d4272004-06-13 20:20:40 +00001916 u8c += *--p;
1917 }
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001918 else // big endian
Bram Moolenaar071d4272004-06-13 20:20:40 +00001919 {
1920 u8c = *--p;
Bram Moolenaardc1c9812017-10-27 22:15:24 +02001921 u8c += (unsigned)*--p << 8;
1922 u8c += (unsigned)*--p << 16;
1923 u8c += (unsigned)*--p << 24;
Bram Moolenaar071d4272004-06-13 20:20:40 +00001924 }
1925 }
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001926 else // UTF-8
Bram Moolenaar071d4272004-06-13 20:20:40 +00001927 {
1928 if (*--p < 0x80)
1929 u8c = *p;
1930 else
1931 {
1932 len = utf_head_off(ptr, p);
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00001933 p -= len;
1934 u8c = utf_ptr2char(p);
Bram Moolenaar071d4272004-06-13 20:20:40 +00001935 if (len == 0)
1936 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001937 // Not a valid UTF-8 character, retry with
1938 // another fenc when possible, otherwise just
1939 // report the error.
Bram Moolenaar071d4272004-06-13 20:20:40 +00001940 if (can_retry)
1941 goto rewind_retry;
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00001942 if (conv_error == 0)
1943 conv_error = readfile_linenr(linecnt,
1944 ptr, p);
1945 if (bad_char_behavior == BAD_DROP)
1946 continue;
1947 if (bad_char_behavior != BAD_KEEP)
1948 u8c = bad_char_behavior;
Bram Moolenaar071d4272004-06-13 20:20:40 +00001949 }
Bram Moolenaar071d4272004-06-13 20:20:40 +00001950 }
1951 }
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001952 if (enc_utf8) // produce UTF-8
Bram Moolenaar071d4272004-06-13 20:20:40 +00001953 {
1954 dest -= utf_char2len(u8c);
1955 (void)utf_char2bytes(u8c, dest);
1956 }
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001957 else // produce Latin1
Bram Moolenaar071d4272004-06-13 20:20:40 +00001958 {
1959 --dest;
1960 if (u8c >= 0x100)
1961 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001962 // character doesn't fit in latin1, retry with
1963 // another fenc when possible, otherwise just
1964 // report the error.
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00001965 if (can_retry)
Bram Moolenaar071d4272004-06-13 20:20:40 +00001966 goto rewind_retry;
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00001967 if (conv_error == 0)
1968 conv_error = readfile_linenr(linecnt, ptr, p);
1969 if (bad_char_behavior == BAD_DROP)
1970 ++dest;
1971 else if (bad_char_behavior == BAD_KEEP)
1972 *dest = u8c;
1973 else if (eap != NULL && eap->bad_char != 0)
1974 *dest = bad_char_behavior;
1975 else
1976 *dest = 0xBF;
Bram Moolenaar071d4272004-06-13 20:20:40 +00001977 }
1978 else
1979 *dest = u8c;
1980 }
1981 }
1982
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001983 // move the linerest to before the converted characters
Bram Moolenaar071d4272004-06-13 20:20:40 +00001984 line_start = dest - linerest;
1985 mch_memmove(line_start, buffer, (size_t)linerest);
1986 size = (long)((ptr + real_size) - dest);
1987 ptr = dest;
1988 }
Bram Moolenaarf453d352008-06-04 17:37:34 +00001989 else if (enc_utf8 && !curbuf->b_p_bin)
Bram Moolenaar071d4272004-06-13 20:20:40 +00001990 {
Bram Moolenaarf453d352008-06-04 17:37:34 +00001991 int incomplete_tail = FALSE;
1992
Bram Moolenaar217e1b82019-12-01 21:41:28 +01001993 // Reading UTF-8: Check if the bytes are valid UTF-8.
Bram Moolenaarf453d352008-06-04 17:37:34 +00001994 for (p = ptr; ; ++p)
Bram Moolenaar071d4272004-06-13 20:20:40 +00001995 {
Bram Moolenaara93fa7e2006-04-17 22:14:47 +00001996 int todo = (int)((ptr + size) - p);
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00001997 int l;
1998
1999 if (todo <= 0)
2000 break;
Bram Moolenaar071d4272004-06-13 20:20:40 +00002001 if (*p >= 0x80)
2002 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002003 // A length of 1 means it's an illegal byte. Accept
2004 // an incomplete character at the end though, the next
2005 // read() will get the next bytes, we'll check it
2006 // then.
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00002007 l = utf_ptr2len_len(p, todo);
Bram Moolenaarf453d352008-06-04 17:37:34 +00002008 if (l > todo && !incomplete_tail)
Bram Moolenaar071d4272004-06-13 20:20:40 +00002009 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002010 // Avoid retrying with a different encoding when
2011 // a truncated file is more likely, or attempting
2012 // to read the rest of an incomplete sequence when
2013 // we have already done so.
Bram Moolenaarf453d352008-06-04 17:37:34 +00002014 if (p > ptr || filesize > 0)
2015 incomplete_tail = TRUE;
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002016 // Incomplete byte sequence, move it to conv_rest[]
2017 // and try to read the rest of it, unless we've
2018 // already done so.
Bram Moolenaarf453d352008-06-04 17:37:34 +00002019 if (p > ptr)
2020 {
2021 conv_restlen = todo;
2022 mch_memmove(conv_rest, p, conv_restlen);
2023 size -= conv_restlen;
2024 break;
2025 }
Bram Moolenaar071d4272004-06-13 20:20:40 +00002026 }
Bram Moolenaarf453d352008-06-04 17:37:34 +00002027 if (l == 1 || l > todo)
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00002028 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002029 // Illegal byte. If we can try another encoding
2030 // do that, unless at EOF where a truncated
2031 // file is more likely than a conversion error.
Bram Moolenaarf453d352008-06-04 17:37:34 +00002032 if (can_retry && !incomplete_tail)
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00002033 break;
Bram Moolenaar13505972019-01-24 15:04:48 +01002034#ifdef USE_ICONV
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002035 // When we did a conversion report an error.
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00002036 if (iconv_fd != (iconv_t)-1 && conv_error == 0)
2037 conv_error = readfile_linenr(linecnt, ptr, p);
Bram Moolenaar13505972019-01-24 15:04:48 +01002038#endif
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002039 // Remember the first linenr with an illegal byte
Bram Moolenaarf453d352008-06-04 17:37:34 +00002040 if (conv_error == 0 && illegal_byte == 0)
2041 illegal_byte = readfile_linenr(linecnt, ptr, p);
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00002042
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002043 // Drop, keep or replace the bad byte.
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00002044 if (bad_char_behavior == BAD_DROP)
2045 {
Bram Moolenaarf453d352008-06-04 17:37:34 +00002046 mch_memmove(p, p + 1, todo - 1);
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00002047 --p;
2048 --size;
2049 }
2050 else if (bad_char_behavior != BAD_KEEP)
2051 *p = bad_char_behavior;
2052 }
Bram Moolenaarf453d352008-06-04 17:37:34 +00002053 else
2054 p += l - 1;
Bram Moolenaar071d4272004-06-13 20:20:40 +00002055 }
2056 }
Bram Moolenaarf453d352008-06-04 17:37:34 +00002057 if (p < ptr + size && !incomplete_tail)
Bram Moolenaar071d4272004-06-13 20:20:40 +00002058 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002059 // Detected a UTF-8 error.
Bram Moolenaar071d4272004-06-13 20:20:40 +00002060rewind_retry:
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002061 // Retry reading with another conversion.
Bram Moolenaar13505972019-01-24 15:04:48 +01002062#if defined(FEAT_EVAL) && defined(USE_ICONV)
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00002063 if (*p_ccv != NUL && iconv_fd != (iconv_t)-1)
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002064 // iconv() failed, try 'charconvert'
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00002065 did_iconv = TRUE;
Bram Moolenaar071d4272004-06-13 20:20:40 +00002066 else
Bram Moolenaar13505972019-01-24 15:04:48 +01002067#endif
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002068 // use next item from 'fileencodings'
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00002069 advance_fenc = TRUE;
2070 file_rewind = TRUE;
2071 goto retry;
Bram Moolenaar071d4272004-06-13 20:20:40 +00002072 }
2073 }
Bram Moolenaar071d4272004-06-13 20:20:40 +00002074
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002075 // count the number of characters (after conversion!)
Bram Moolenaar071d4272004-06-13 20:20:40 +00002076 filesize += size;
2077
2078 /*
2079 * when reading the first part of a file: guess EOL type
2080 */
2081 if (fileformat == EOL_UNKNOWN)
2082 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002083 // First try finding a NL, for Dos and Unix
Bram Moolenaar071d4272004-06-13 20:20:40 +00002084 if (try_dos || try_unix)
2085 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002086 // Reset the carriage return counter.
Bram Moolenaarc6b72172015-02-27 17:48:09 +01002087 if (try_mac)
2088 try_mac = 1;
2089
Bram Moolenaar071d4272004-06-13 20:20:40 +00002090 for (p = ptr; p < ptr + size; ++p)
2091 {
2092 if (*p == NL)
2093 {
2094 if (!try_unix
2095 || (try_dos && p > ptr && p[-1] == CAR))
2096 fileformat = EOL_DOS;
2097 else
2098 fileformat = EOL_UNIX;
2099 break;
2100 }
Bram Moolenaar05eb6122015-02-17 14:15:19 +01002101 else if (*p == CAR && try_mac)
2102 try_mac++;
Bram Moolenaar071d4272004-06-13 20:20:40 +00002103 }
2104
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002105 // Don't give in to EOL_UNIX if EOL_MAC is more likely
Bram Moolenaar071d4272004-06-13 20:20:40 +00002106 if (fileformat == EOL_UNIX && try_mac)
2107 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002108 // Need to reset the counters when retrying fenc.
Bram Moolenaar071d4272004-06-13 20:20:40 +00002109 try_mac = 1;
2110 try_unix = 1;
2111 for (; p >= ptr && *p != CAR; p--)
2112 ;
2113 if (p >= ptr)
2114 {
2115 for (p = ptr; p < ptr + size; ++p)
2116 {
2117 if (*p == NL)
2118 try_unix++;
2119 else if (*p == CAR)
2120 try_mac++;
2121 }
2122 if (try_mac > try_unix)
2123 fileformat = EOL_MAC;
2124 }
2125 }
Bram Moolenaar05eb6122015-02-17 14:15:19 +01002126 else if (fileformat == EOL_UNKNOWN && try_mac == 1)
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002127 // Looking for CR but found no end-of-line markers at
2128 // all: use the default format.
Bram Moolenaar05eb6122015-02-17 14:15:19 +01002129 fileformat = default_fileformat();
Bram Moolenaar071d4272004-06-13 20:20:40 +00002130 }
2131
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002132 // No NL found: may use Mac format
Bram Moolenaar071d4272004-06-13 20:20:40 +00002133 if (fileformat == EOL_UNKNOWN && try_mac)
2134 fileformat = EOL_MAC;
2135
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002136 // Still nothing found? Use first format in 'ffs'
Bram Moolenaar071d4272004-06-13 20:20:40 +00002137 if (fileformat == EOL_UNKNOWN)
2138 fileformat = default_fileformat();
2139
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002140 // if editing a new file: may set p_tx and p_ff
Bram Moolenaar910f66f2006-04-05 20:41:53 +00002141 if (set_options)
Bram Moolenaar071d4272004-06-13 20:20:40 +00002142 set_fileformat(fileformat, OPT_LOCAL);
2143 }
2144 }
2145
2146 /*
2147 * This loop is executed once for every character read.
2148 * Keep it fast!
2149 */
2150 if (fileformat == EOL_MAC)
2151 {
2152 --ptr;
2153 while (++ptr, --size >= 0)
2154 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002155 // catch most common case first
Bram Moolenaar071d4272004-06-13 20:20:40 +00002156 if ((c = *ptr) != NUL && c != CAR && c != NL)
2157 continue;
2158 if (c == NUL)
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002159 *ptr = NL; // NULs are replaced by newlines!
Bram Moolenaar071d4272004-06-13 20:20:40 +00002160 else if (c == NL)
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002161 *ptr = CAR; // NLs are replaced by CRs!
Bram Moolenaar071d4272004-06-13 20:20:40 +00002162 else
2163 {
2164 if (skip_count == 0)
2165 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002166 *ptr = NUL; // end of line
Bram Moolenaar071d4272004-06-13 20:20:40 +00002167 len = (colnr_T) (ptr - line_start + 1);
2168 if (ml_append(lnum, line_start, len, newfile) == FAIL)
2169 {
2170 error = TRUE;
2171 break;
2172 }
Bram Moolenaar55debbe2010-05-23 23:34:36 +02002173#ifdef FEAT_PERSISTENT_UNDO
2174 if (read_undo_file)
2175 sha256_update(&sha_ctx, line_start, len);
2176#endif
Bram Moolenaar071d4272004-06-13 20:20:40 +00002177 ++lnum;
2178 if (--read_count == 0)
2179 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002180 error = TRUE; // break loop
2181 line_start = ptr; // nothing left to write
Bram Moolenaar071d4272004-06-13 20:20:40 +00002182 break;
2183 }
2184 }
2185 else
2186 --skip_count;
2187 line_start = ptr + 1;
2188 }
2189 }
2190 }
2191 else
2192 {
2193 --ptr;
2194 while (++ptr, --size >= 0)
2195 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002196 if ((c = *ptr) != NUL && c != NL) // catch most common case
Bram Moolenaar071d4272004-06-13 20:20:40 +00002197 continue;
2198 if (c == NUL)
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002199 *ptr = NL; // NULs are replaced by newlines!
Bram Moolenaar071d4272004-06-13 20:20:40 +00002200 else
2201 {
2202 if (skip_count == 0)
2203 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002204 *ptr = NUL; // end of line
Bram Moolenaar071d4272004-06-13 20:20:40 +00002205 len = (colnr_T)(ptr - line_start + 1);
2206 if (fileformat == EOL_DOS)
2207 {
Bram Moolenaar2aa5f692017-01-24 15:46:48 +01002208 if (ptr > line_start && ptr[-1] == CAR)
Bram Moolenaar071d4272004-06-13 20:20:40 +00002209 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002210 // remove CR before NL
Bram Moolenaar071d4272004-06-13 20:20:40 +00002211 ptr[-1] = NUL;
2212 --len;
2213 }
2214 /*
2215 * Reading in Dos format, but no CR-LF found!
2216 * When 'fileformats' includes "unix", delete all
2217 * the lines read so far and start all over again.
2218 * Otherwise give an error message later.
2219 */
2220 else if (ff_error != EOL_DOS)
2221 {
2222 if ( try_unix
2223 && !read_stdin
2224 && (read_buffer
Bram Moolenaar8767f522016-07-01 17:17:39 +02002225 || vim_lseek(fd, (off_T)0L, SEEK_SET)
2226 == 0))
Bram Moolenaar071d4272004-06-13 20:20:40 +00002227 {
2228 fileformat = EOL_UNIX;
Bram Moolenaar910f66f2006-04-05 20:41:53 +00002229 if (set_options)
Bram Moolenaar071d4272004-06-13 20:20:40 +00002230 set_fileformat(EOL_UNIX, OPT_LOCAL);
2231 file_rewind = TRUE;
2232 keep_fileformat = TRUE;
2233 goto retry;
2234 }
2235 ff_error = EOL_DOS;
2236 }
2237 }
2238 if (ml_append(lnum, line_start, len, newfile) == FAIL)
2239 {
2240 error = TRUE;
2241 break;
2242 }
Bram Moolenaar55debbe2010-05-23 23:34:36 +02002243#ifdef FEAT_PERSISTENT_UNDO
2244 if (read_undo_file)
2245 sha256_update(&sha_ctx, line_start, len);
2246#endif
Bram Moolenaar071d4272004-06-13 20:20:40 +00002247 ++lnum;
2248 if (--read_count == 0)
2249 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002250 error = TRUE; // break loop
2251 line_start = ptr; // nothing left to write
Bram Moolenaar071d4272004-06-13 20:20:40 +00002252 break;
2253 }
2254 }
2255 else
2256 --skip_count;
2257 line_start = ptr + 1;
2258 }
2259 }
2260 }
2261 linerest = (long)(ptr - line_start);
2262 ui_breakcheck();
2263 }
2264
2265failed:
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002266 // not an error, max. number of lines reached
Bram Moolenaar071d4272004-06-13 20:20:40 +00002267 if (error && read_count == 0)
2268 error = FALSE;
2269
2270 /*
2271 * If we get EOF in the middle of a line, note the fact and
2272 * complete the line ourselves.
2273 * In Dos format ignore a trailing CTRL-Z, unless 'binary' set.
2274 */
2275 if (!error
2276 && !got_int
2277 && linerest != 0
2278 && !(!curbuf->b_p_bin
2279 && fileformat == EOL_DOS
2280 && *line_start == Ctrl_Z
2281 && ptr == line_start + 1))
2282 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002283 // remember for when writing
Bram Moolenaar910f66f2006-04-05 20:41:53 +00002284 if (set_options)
Bram Moolenaar071d4272004-06-13 20:20:40 +00002285 curbuf->b_p_eol = FALSE;
2286 *ptr = NUL;
Bram Moolenaar55debbe2010-05-23 23:34:36 +02002287 len = (colnr_T)(ptr - line_start + 1);
2288 if (ml_append(lnum, line_start, len, newfile) == FAIL)
Bram Moolenaar071d4272004-06-13 20:20:40 +00002289 error = TRUE;
2290 else
Bram Moolenaar55debbe2010-05-23 23:34:36 +02002291 {
2292#ifdef FEAT_PERSISTENT_UNDO
2293 if (read_undo_file)
2294 sha256_update(&sha_ctx, line_start, len);
2295#endif
Bram Moolenaar071d4272004-06-13 20:20:40 +00002296 read_no_eol_lnum = ++lnum;
Bram Moolenaar55debbe2010-05-23 23:34:36 +02002297 }
Bram Moolenaar071d4272004-06-13 20:20:40 +00002298 }
2299
Bram Moolenaar910f66f2006-04-05 20:41:53 +00002300 if (set_options)
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002301 save_file_ff(curbuf); // remember the current file format
Bram Moolenaar071d4272004-06-13 20:20:40 +00002302
2303#ifdef FEAT_CRYPT
Bram Moolenaar8f4ac012014-08-10 13:38:34 +02002304 if (curbuf->b_cryptstate != NULL)
Bram Moolenaara8ffcbb2010-06-21 06:15:46 +02002305 {
Bram Moolenaar8f4ac012014-08-10 13:38:34 +02002306 crypt_free_state(curbuf->b_cryptstate);
2307 curbuf->b_cryptstate = NULL;
Bram Moolenaara8ffcbb2010-06-21 06:15:46 +02002308 }
Bram Moolenaar8f4ac012014-08-10 13:38:34 +02002309 if (cryptkey != NULL && cryptkey != curbuf->b_p_key)
2310 crypt_free_key(cryptkey);
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002311 // Don't set cryptkey to NULL, it's used below as a flag that
2312 // encryption was used.
Bram Moolenaar071d4272004-06-13 20:20:40 +00002313#endif
2314
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002315 // If editing a new file: set 'fenc' for the current buffer.
2316 // Also for ":read ++edit file".
Bram Moolenaar910f66f2006-04-05 20:41:53 +00002317 if (set_options)
Bram Moolenaar071d4272004-06-13 20:20:40 +00002318 set_string_option_direct((char_u *)"fenc", -1, fenc,
Bram Moolenaar5e3cb7e2006-02-27 23:58:35 +00002319 OPT_FREE|OPT_LOCAL, 0);
Bram Moolenaar071d4272004-06-13 20:20:40 +00002320 if (fenc_alloced)
2321 vim_free(fenc);
Bram Moolenaar13505972019-01-24 15:04:48 +01002322#ifdef USE_ICONV
Bram Moolenaar071d4272004-06-13 20:20:40 +00002323 if (iconv_fd != (iconv_t)-1)
Bram Moolenaar071d4272004-06-13 20:20:40 +00002324 iconv_close(iconv_fd);
Bram Moolenaar071d4272004-06-13 20:20:40 +00002325#endif
2326
2327 if (!read_buffer && !read_stdin)
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002328 close(fd); // errors are ignored
Bram Moolenaarf05da212009-11-17 16:13:15 +00002329#ifdef HAVE_FD_CLOEXEC
2330 else
2331 {
2332 int fdflags = fcntl(fd, F_GETFD);
Bram Moolenaara7251492021-01-02 16:53:13 +01002333
Bram Moolenaarf05da212009-11-17 16:13:15 +00002334 if (fdflags >= 0 && (fdflags & FD_CLOEXEC) == 0)
Bram Moolenaarfbc4b4d2016-02-07 15:14:01 +01002335 (void)fcntl(fd, F_SETFD, fdflags | FD_CLOEXEC);
Bram Moolenaarf05da212009-11-17 16:13:15 +00002336 }
2337#endif
Bram Moolenaar071d4272004-06-13 20:20:40 +00002338 vim_free(buffer);
2339
2340#ifdef HAVE_DUP
2341 if (read_stdin)
2342 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002343 // Use stderr for stdin, makes shell commands work.
Bram Moolenaar071d4272004-06-13 20:20:40 +00002344 close(0);
Bram Moolenaar42335f52018-09-13 15:33:43 +02002345 vim_ignored = dup(2);
Bram Moolenaar071d4272004-06-13 20:20:40 +00002346 }
2347#endif
2348
Bram Moolenaar071d4272004-06-13 20:20:40 +00002349 if (tmpname != NULL)
2350 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002351 mch_remove(tmpname); // delete converted file
Bram Moolenaar071d4272004-06-13 20:20:40 +00002352 vim_free(tmpname);
2353 }
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002354 --no_wait_return; // may wait for return now
Bram Moolenaar071d4272004-06-13 20:20:40 +00002355
2356 /*
2357 * In recovery mode everything but autocommands is skipped.
2358 */
2359 if (!recoverymode)
2360 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002361 // need to delete the last line, which comes from the empty buffer
Bram Moolenaar071d4272004-06-13 20:20:40 +00002362 if (newfile && wasempty && !(curbuf->b_ml.ml_flags & ML_EMPTY))
2363 {
2364#ifdef FEAT_NETBEANS_INTG
2365 netbeansFireChanges = 0;
2366#endif
Bram Moolenaarca70c072020-05-30 20:30:46 +02002367 ml_delete(curbuf->b_ml.ml_line_count);
Bram Moolenaar071d4272004-06-13 20:20:40 +00002368#ifdef FEAT_NETBEANS_INTG
2369 netbeansFireChanges = 1;
2370#endif
2371 --linecnt;
2372 }
2373 linecnt = curbuf->b_ml.ml_line_count - linecnt;
2374 if (filesize == 0)
2375 linecnt = 0;
2376 if (newfile || read_buffer)
Bram Moolenaar7263a772007-05-10 17:35:54 +00002377 {
Bram Moolenaara4d158b2022-08-14 14:17:45 +01002378 redraw_curbuf_later(UPD_NOT_VALID);
Bram Moolenaar7263a772007-05-10 17:35:54 +00002379#ifdef FEAT_DIFF
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002380 // After reading the text into the buffer the diff info needs to
2381 // be updated.
Bram Moolenaar7263a772007-05-10 17:35:54 +00002382 diff_invalidate(curbuf);
2383#endif
2384#ifdef FEAT_FOLDING
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002385 // All folds in the window are invalid now. Mark them for update
2386 // before triggering autocommands.
Bram Moolenaar7263a772007-05-10 17:35:54 +00002387 foldUpdateAll(curwin);
2388#endif
2389 }
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002390 else if (linecnt) // appended at least one line
Bram Moolenaar071d4272004-06-13 20:20:40 +00002391 appended_lines_mark(from, linecnt);
2392
Bram Moolenaar071d4272004-06-13 20:20:40 +00002393#ifndef ALWAYS_USE_GUI
2394 /*
2395 * If we were reading from the same terminal as where messages go,
2396 * the screen will have been messed up.
2397 * Switch on raw mode now and clear the screen.
2398 */
2399 if (read_stdin)
2400 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002401 settmode(TMODE_RAW); // set to raw mode
Bram Moolenaar071d4272004-06-13 20:20:40 +00002402 starttermcap();
2403 screenclear();
2404 }
2405#endif
2406
2407 if (got_int)
2408 {
2409 if (!(flags & READ_DUMMY))
2410 {
Bram Moolenaar436b5ad2021-12-31 22:49:24 +00002411 filemess(curbuf, sfname, (char_u *)_(e_interrupted), 0);
Bram Moolenaar071d4272004-06-13 20:20:40 +00002412 if (newfile)
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002413 curbuf->b_p_ro = TRUE; // must use "w!" now
Bram Moolenaar071d4272004-06-13 20:20:40 +00002414 }
2415 msg_scroll = msg_save;
2416#ifdef FEAT_VIMINFO
2417 check_marks_read();
2418#endif
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002419 return OK; // an interrupt isn't really an error
Bram Moolenaar071d4272004-06-13 20:20:40 +00002420 }
2421
2422 if (!filtering && !(flags & READ_DUMMY))
2423 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002424 msg_add_fname(curbuf, sfname); // fname in IObuff with quotes
Bram Moolenaar071d4272004-06-13 20:20:40 +00002425 c = FALSE;
2426
2427#ifdef UNIX
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002428 if (S_ISFIFO(perm)) // fifo
Bram Moolenaar071d4272004-06-13 20:20:40 +00002429 {
2430 STRCAT(IObuff, _("[fifo]"));
2431 c = TRUE;
2432 }
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002433 if (S_ISSOCK(perm)) // or socket
Bram Moolenaar071d4272004-06-13 20:20:40 +00002434 {
2435 STRCAT(IObuff, _("[socket]"));
2436 c = TRUE;
2437 }
Bram Moolenaarfe1c56d2007-07-10 15:10:54 +00002438# ifdef OPEN_CHR_FILES
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002439 if (S_ISCHR(perm)) // or character special
Bram Moolenaarfe1c56d2007-07-10 15:10:54 +00002440 {
2441 STRCAT(IObuff, _("[character special]"));
2442 c = TRUE;
2443 }
2444# endif
Bram Moolenaar071d4272004-06-13 20:20:40 +00002445#endif
2446 if (curbuf->b_p_ro)
2447 {
2448 STRCAT(IObuff, shortmess(SHM_RO) ? _("[RO]") : _("[readonly]"));
2449 c = TRUE;
2450 }
2451 if (read_no_eol_lnum)
2452 {
2453 msg_add_eol();
2454 c = TRUE;
2455 }
2456 if (ff_error == EOL_DOS)
2457 {
2458 STRCAT(IObuff, _("[CR missing]"));
2459 c = TRUE;
2460 }
Bram Moolenaar071d4272004-06-13 20:20:40 +00002461 if (split)
2462 {
2463 STRCAT(IObuff, _("[long lines split]"));
2464 c = TRUE;
2465 }
Bram Moolenaar071d4272004-06-13 20:20:40 +00002466 if (notconverted)
2467 {
2468 STRCAT(IObuff, _("[NOT converted]"));
2469 c = TRUE;
2470 }
2471 else if (converted)
2472 {
2473 STRCAT(IObuff, _("[converted]"));
2474 c = TRUE;
2475 }
Bram Moolenaar071d4272004-06-13 20:20:40 +00002476#ifdef FEAT_CRYPT
2477 if (cryptkey != NULL)
2478 {
Bram Moolenaar8f4ac012014-08-10 13:38:34 +02002479 crypt_append_msg(curbuf);
Bram Moolenaar071d4272004-06-13 20:20:40 +00002480 c = TRUE;
2481 }
2482#endif
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00002483 if (conv_error != 0)
Bram Moolenaar071d4272004-06-13 20:20:40 +00002484 {
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00002485 sprintf((char *)IObuff + STRLEN(IObuff),
2486 _("[CONVERSION ERROR in line %ld]"), (long)conv_error);
Bram Moolenaar071d4272004-06-13 20:20:40 +00002487 c = TRUE;
2488 }
2489 else if (illegal_byte > 0)
2490 {
2491 sprintf((char *)IObuff + STRLEN(IObuff),
2492 _("[ILLEGAL BYTE in line %ld]"), (long)illegal_byte);
2493 c = TRUE;
2494 }
Bram Moolenaar13505972019-01-24 15:04:48 +01002495 else if (error)
Bram Moolenaar071d4272004-06-13 20:20:40 +00002496 {
2497 STRCAT(IObuff, _("[READ ERRORS]"));
2498 c = TRUE;
2499 }
2500 if (msg_add_fileformat(fileformat))
2501 c = TRUE;
2502#ifdef FEAT_CRYPT
2503 if (cryptkey != NULL)
Bram Moolenaar40e6a712010-05-16 22:32:54 +02002504 msg_add_lines(c, (long)linecnt, filesize
Bram Moolenaar8f4ac012014-08-10 13:38:34 +02002505 - crypt_get_header_len(crypt_get_method_nr(curbuf)));
Bram Moolenaar071d4272004-06-13 20:20:40 +00002506 else
2507#endif
2508 msg_add_lines(c, (long)linecnt, filesize);
2509
Bram Moolenaard23a8232018-02-10 18:45:26 +01002510 VIM_CLEAR(keep_msg);
Bram Moolenaar071d4272004-06-13 20:20:40 +00002511 msg_scrolled_ign = TRUE;
2512#ifdef ALWAYS_USE_GUI
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002513 // Don't show the message when reading stdin, it would end up in a
2514 // message box (which might be shown when exiting!)
Bram Moolenaar071d4272004-06-13 20:20:40 +00002515 if (read_stdin || read_buffer)
2516 p = msg_may_trunc(FALSE, IObuff);
2517 else
2518#endif
Bram Moolenaar473952e2019-09-28 16:30:04 +02002519 {
2520 if (msg_col > 0)
2521 msg_putchar('\r'); // overwrite previous message
Bram Moolenaar32526b32019-01-19 17:43:09 +01002522 p = (char_u *)msg_trunc_attr((char *)IObuff, FALSE, 0);
Bram Moolenaar473952e2019-09-28 16:30:04 +02002523 }
Bram Moolenaar071d4272004-06-13 20:20:40 +00002524 if (read_stdin || read_buffer || restart_edit != 0
Bram Moolenaar1c7715d2005-10-03 22:02:18 +00002525 || (msg_scrolled != 0 && !need_wait_return))
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002526 // Need to repeat the message after redrawing when:
2527 // - When reading from stdin (the screen will be cleared next).
2528 // - When restart_edit is set (otherwise there will be a delay
2529 // before redrawing).
2530 // - When the screen was scrolled but there is no wait-return
2531 // prompt.
Bram Moolenaar8f7fd652006-02-21 22:04:51 +00002532 set_keep_msg(p, 0);
Bram Moolenaar071d4272004-06-13 20:20:40 +00002533 msg_scrolled_ign = FALSE;
2534 }
2535
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002536 // with errors writing the file requires ":w!"
Bram Moolenaar071d4272004-06-13 20:20:40 +00002537 if (newfile && (error
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00002538 || conv_error != 0
Bram Moolenaar13505972019-01-24 15:04:48 +01002539 || (illegal_byte > 0 && bad_char_behavior != BAD_KEEP)))
Bram Moolenaar071d4272004-06-13 20:20:40 +00002540 curbuf->b_p_ro = TRUE;
2541
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002542 u_clearline(); // cannot use "U" command after adding lines
Bram Moolenaar071d4272004-06-13 20:20:40 +00002543
2544 /*
2545 * In Ex mode: cursor at last new line.
2546 * Otherwise: cursor at first new line.
2547 */
2548 if (exmode_active)
2549 curwin->w_cursor.lnum = from + linecnt;
2550 else
2551 curwin->w_cursor.lnum = from + 1;
2552 check_cursor_lnum();
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002553 beginline(BL_WHITE | BL_FIX); // on first non-blank
Bram Moolenaar071d4272004-06-13 20:20:40 +00002554
Bram Moolenaare1004402020-10-24 20:49:43 +02002555 if ((cmdmod.cmod_flags & CMOD_LOCKMARKS) == 0)
Bram Moolenaarf4a1d1c2019-11-16 13:50:25 +01002556 {
2557 // Set '[ and '] marks to the newly read lines.
2558 curbuf->b_op_start.lnum = from + 1;
2559 curbuf->b_op_start.col = 0;
2560 curbuf->b_op_end.lnum = from + linecnt;
2561 curbuf->b_op_end.col = 0;
2562 }
Bram Moolenaar03f48552006-02-28 23:52:23 +00002563
Bram Moolenaar4f974752019-02-17 17:44:42 +01002564#ifdef MSWIN
Bram Moolenaar03f48552006-02-28 23:52:23 +00002565 /*
2566 * Work around a weird problem: When a file has two links (only
2567 * possible on NTFS) and we write through one link, then stat() it
Bram Moolenaarb23a7e82008-06-27 18:42:32 +00002568 * through the other link, the timestamp information may be wrong.
Bram Moolenaar03f48552006-02-28 23:52:23 +00002569 * It's correct again after reading the file, thus reset the timestamp
2570 * here.
2571 */
2572 if (newfile && !read_stdin && !read_buffer
2573 && mch_stat((char *)fname, &st) >= 0)
2574 {
2575 buf_store_time(curbuf, &st, fname);
2576 curbuf->b_mtime_read = curbuf->b_mtime;
Leah Neukirchen0a7984a2021-10-14 21:27:55 +01002577 curbuf->b_mtime_read_ns = curbuf->b_mtime_ns;
Bram Moolenaar03f48552006-02-28 23:52:23 +00002578 }
2579#endif
Bram Moolenaar071d4272004-06-13 20:20:40 +00002580 }
2581 msg_scroll = msg_save;
2582
2583#ifdef FEAT_VIMINFO
2584 /*
2585 * Get the marks before executing autocommands, so they can be used there.
2586 */
2587 check_marks_read();
2588#endif
2589
Bram Moolenaar071d4272004-06-13 20:20:40 +00002590 /*
Bram Moolenaar34d72d42015-07-17 14:18:08 +02002591 * We remember if the last line of the read didn't have
2592 * an eol even when 'binary' is off, to support turning 'fixeol' off,
2593 * or writing the read again with 'binary' on. The latter is required
2594 * for ":autocmd FileReadPost *.gz set bin|'[,']!gunzip" to work.
Bram Moolenaar071d4272004-06-13 20:20:40 +00002595 */
Bram Moolenaarcab35ad2011-02-15 17:39:22 +01002596 curbuf->b_no_eol_lnum = read_no_eol_lnum;
Bram Moolenaar071d4272004-06-13 20:20:40 +00002597
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002598 // When reloading a buffer put the cursor at the first line that is
2599 // different.
Bram Moolenaarf9bb7342010-08-04 14:29:54 +02002600 if (flags & READ_KEEP_UNDO)
2601 u_find_first_changed();
2602
Bram Moolenaar55debbe2010-05-23 23:34:36 +02002603#ifdef FEAT_PERSISTENT_UNDO
2604 /*
2605 * When opening a new file locate undo info and read it.
2606 */
2607 if (read_undo_file)
2608 {
2609 char_u hash[UNDO_HASH_SIZE];
2610
2611 sha256_finish(&sha_ctx, hash);
Bram Moolenaar6ed8ed82010-05-30 20:40:11 +02002612 u_read_undo(NULL, hash, fname);
Bram Moolenaar55debbe2010-05-23 23:34:36 +02002613 }
2614#endif
2615
Bram Moolenaarf71d7b92016-08-09 22:14:05 +02002616 if (!read_stdin && !read_fifo && (!read_buffer || sfname != NULL))
Bram Moolenaar071d4272004-06-13 20:20:40 +00002617 {
2618 int m = msg_scroll;
2619 int n = msg_scrolled;
2620
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002621 // Save the fileformat now, otherwise the buffer will be considered
2622 // modified if the format/encoding was automatically detected.
Bram Moolenaar910f66f2006-04-05 20:41:53 +00002623 if (set_options)
Bram Moolenaar071d4272004-06-13 20:20:40 +00002624 save_file_ff(curbuf);
2625
2626 /*
2627 * The output from the autocommands should not overwrite anything and
2628 * should not be overwritten: Set msg_scroll, restore its value if no
2629 * output was done.
2630 */
2631 msg_scroll = TRUE;
2632 if (filtering)
2633 apply_autocmds_exarg(EVENT_FILTERREADPOST, NULL, sfname,
2634 FALSE, curbuf, eap);
Bram Moolenaarf71d7b92016-08-09 22:14:05 +02002635 else if (newfile || (read_buffer && sfname != NULL))
Bram Moolenaarc3691332016-04-20 12:49:49 +02002636 {
Bram Moolenaar071d4272004-06-13 20:20:40 +00002637 apply_autocmds_exarg(EVENT_BUFREADPOST, NULL, sfname,
2638 FALSE, curbuf, eap);
Bram Moolenaarc3691332016-04-20 12:49:49 +02002639 if (!au_did_filetype && *curbuf->b_p_ft != NUL)
2640 /*
2641 * EVENT_FILETYPE was not triggered but the buffer already has a
2642 * filetype. Trigger EVENT_FILETYPE using the existing filetype.
2643 */
2644 apply_autocmds(EVENT_FILETYPE, curbuf->b_p_ft, curbuf->b_fname,
2645 TRUE, curbuf);
2646 }
Bram Moolenaar071d4272004-06-13 20:20:40 +00002647 else
2648 apply_autocmds_exarg(EVENT_FILEREADPOST, sfname, sfname,
2649 FALSE, NULL, eap);
2650 if (msg_scrolled == n)
2651 msg_scroll = m;
Bram Moolenaarcab35ad2011-02-15 17:39:22 +01002652# ifdef FEAT_EVAL
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002653 if (aborting()) // autocmds may abort script processing
Bram Moolenaar071d4272004-06-13 20:20:40 +00002654 return FAIL;
Bram Moolenaarcab35ad2011-02-15 17:39:22 +01002655# endif
Bram Moolenaar071d4272004-06-13 20:20:40 +00002656 }
Bram Moolenaar071d4272004-06-13 20:20:40 +00002657
2658 if (recoverymode && error)
2659 return FAIL;
2660 return OK;
2661}
2662
#if defined(OPEN_CHR_FILES) || defined(PROTO)
/*
 * Check whether "fname" has the form "/dev/fd/N", where N is a decimal
 * number (pattern "/dev/fd/\d\+").  Such names are used for process
 * substitution output by some shells on some operating systems, e.g., bash
 * on SunOS.
 * "/dev/fd/0", "/dev/fd/1" and "/dev/fd/2" are not accepted, opening these
 * may hang Vim.
 * Returns TRUE when the name is accepted, FALSE otherwise.
 */
    int
is_dev_fd_file(char_u *fname)
{
    // The fixed prefix must be followed by at least one digit.
    if (STRNCMP(fname, "/dev/fd/", 8) != 0 || !VIM_ISDIGIT(fname[8]))
	return FALSE;

    // Nothing but digits may follow until the end of the name.
    if (*skipdigits(fname + 9) != NUL)
	return FALSE;

    // More than one digit: always accepted.
    if (fname[9] != NUL)
	return TRUE;

    // Exactly one digit: refuse 0, 1 and 2.
    return fname[8] != '0' && fname[8] != '1' && fname[8] != '2';
}
#endif
2680
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00002681/*
2682 * From the current line count and characters read after that, estimate the
2683 * line number where we are now.
2684 * Used for error messages that include a line number.
2685 */
2686 static linenr_T
Bram Moolenaar78c0b7d2016-01-30 15:52:46 +01002687readfile_linenr(
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002688 linenr_T linecnt, // line count before reading more bytes
2689 char_u *p, // start of more bytes read
2690 char_u *endp) // end of more bytes read
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00002691{
2692 char_u *s;
2693 linenr_T lnum;
2694
2695 lnum = curbuf->b_ml.ml_line_count - linecnt + 1;
2696 for (s = p; s < endp; ++s)
2697 if (*s == '\n')
2698 ++lnum;
2699 return lnum;
2700}
Bram Moolenaarb0bf8582005-12-13 20:02:15 +00002701
Bram Moolenaar071d4272004-06-13 20:20:40 +00002702/*
Rob Pilling8196e942022-02-11 15:12:10 +00002703 * Fill "*eap" to force the 'fileencoding', 'fileformat' and 'binary' to be
Bram Moolenaar195d6352005-12-19 22:08:24 +00002704 * equal to the buffer "buf". Used for calling readfile().
Bram Moolenaar071d4272004-06-13 20:20:40 +00002705 * Returns OK or FAIL.
2706 */
2707 int
Bram Moolenaar78c0b7d2016-01-30 15:52:46 +01002708prep_exarg(exarg_T *eap, buf_T *buf)
Bram Moolenaar071d4272004-06-13 20:20:40 +00002709{
Bram Moolenaar13505972019-01-24 15:04:48 +01002710 eap->cmd = alloc(15 + (unsigned)STRLEN(buf->b_p_fenc));
Bram Moolenaar071d4272004-06-13 20:20:40 +00002711 if (eap->cmd == NULL)
2712 return FAIL;
2713
Bram Moolenaar333b80a2018-04-04 22:57:29 +02002714 sprintf((char *)eap->cmd, "e ++enc=%s", buf->b_p_fenc);
2715 eap->force_enc = 8;
Bram Moolenaar195d6352005-12-19 22:08:24 +00002716 eap->bad_char = buf->b_bad_char;
Bram Moolenaar333b80a2018-04-04 22:57:29 +02002717 eap->force_ff = *buf->b_p_ff;
Bram Moolenaar195d6352005-12-19 22:08:24 +00002718
2719 eap->force_bin = buf->b_p_bin ? FORCE_BIN : FORCE_NOBIN;
Bram Moolenaar910f66f2006-04-05 20:41:53 +00002720 eap->read_edit = FALSE;
Bram Moolenaar195d6352005-12-19 22:08:24 +00002721 eap->forceit = FALSE;
Bram Moolenaar071d4272004-06-13 20:20:40 +00002722 return OK;
2723}
2724
Bram Moolenaarad875fb2013-07-24 15:02:03 +02002725/*
2726 * Set default or forced 'fileformat' and 'binary'.
2727 */
2728 void
Bram Moolenaar78c0b7d2016-01-30 15:52:46 +01002729set_file_options(int set_options, exarg_T *eap)
Bram Moolenaarad875fb2013-07-24 15:02:03 +02002730{
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002731 // set default 'fileformat'
Bram Moolenaarad875fb2013-07-24 15:02:03 +02002732 if (set_options)
2733 {
2734 if (eap != NULL && eap->force_ff != 0)
2735 set_fileformat(get_fileformat_force(curbuf, eap), OPT_LOCAL);
2736 else if (*p_ffs != NUL)
2737 set_fileformat(default_fileformat(), OPT_LOCAL);
2738 }
2739
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002740 // set or reset 'binary'
Bram Moolenaarad875fb2013-07-24 15:02:03 +02002741 if (eap != NULL && eap->force_bin != 0)
2742 {
2743 int oldval = curbuf->b_p_bin;
2744
2745 curbuf->b_p_bin = (eap->force_bin == FORCE_BIN);
2746 set_options_bin(oldval, curbuf->b_p_bin, OPT_LOCAL);
2747 }
2748}
2749
Bram Moolenaarad875fb2013-07-24 15:02:03 +02002750/*
2751 * Set forced 'fileencoding'.
2752 */
2753 void
Bram Moolenaar78c0b7d2016-01-30 15:52:46 +01002754set_forced_fenc(exarg_T *eap)
Bram Moolenaarad875fb2013-07-24 15:02:03 +02002755{
2756 if (eap->force_enc != 0)
2757 {
2758 char_u *fenc = enc_canonize(eap->cmd + eap->force_enc);
2759
2760 if (fenc != NULL)
2761 set_string_option_direct((char_u *)"fenc", -1,
2762 fenc, OPT_FREE|OPT_LOCAL, 0);
2763 vim_free(fenc);
2764 }
2765}
2766
Bram Moolenaar071d4272004-06-13 20:20:40 +00002767/*
2768 * Find next fileencoding to use from 'fileencodings'.
2769 * "pp" points to fenc_next. It's advanced to the next item.
2770 * When there are no more items, an empty string is returned and *pp is set to
2771 * NULL.
Bram Moolenaarf077db22019-08-13 00:18:24 +02002772 * When *pp is not set to NULL, the result is in allocated memory and "alloced"
2773 * is set to TRUE.
Bram Moolenaar071d4272004-06-13 20:20:40 +00002774 */
2775 static char_u *
Bram Moolenaarf077db22019-08-13 00:18:24 +02002776next_fenc(char_u **pp, int *alloced)
Bram Moolenaar071d4272004-06-13 20:20:40 +00002777{
2778 char_u *p;
2779 char_u *r;
2780
Bram Moolenaarf077db22019-08-13 00:18:24 +02002781 *alloced = FALSE;
Bram Moolenaar071d4272004-06-13 20:20:40 +00002782 if (**pp == NUL)
2783 {
2784 *pp = NULL;
2785 return (char_u *)"";
2786 }
2787 p = vim_strchr(*pp, ',');
2788 if (p == NULL)
2789 {
2790 r = enc_canonize(*pp);
2791 *pp += STRLEN(*pp);
2792 }
2793 else
2794 {
Bram Moolenaar71ccd032020-06-12 22:59:11 +02002795 r = vim_strnsave(*pp, p - *pp);
Bram Moolenaar071d4272004-06-13 20:20:40 +00002796 *pp = p + 1;
2797 if (r != NULL)
2798 {
2799 p = enc_canonize(r);
2800 vim_free(r);
2801 r = p;
2802 }
2803 }
Bram Moolenaarf077db22019-08-13 00:18:24 +02002804 if (r != NULL)
2805 *alloced = TRUE;
2806 else
Bram Moolenaar071d4272004-06-13 20:20:40 +00002807 {
Bram Moolenaarf077db22019-08-13 00:18:24 +02002808 // out of memory
Bram Moolenaar071d4272004-06-13 20:20:40 +00002809 r = (char_u *)"";
2810 *pp = NULL;
2811 }
2812 return r;
2813}
2814
#ifdef FEAT_EVAL
/*
 * Convert file "fname" with the 'charconvert' expression.
 * The file that is being read ("*fdp") is closed, the conversion is done
 * into a temp file and that temp file is opened for reading, with the new
 * file descriptor stored in "*fdp".
 * Returns the name of the converted file in allocated memory (the caller
 * should delete the file after reading it).
 * Returns NULL if the conversion failed.  A message is given then, and if
 * the input file was already closed it is opened again; the caller should
 * check "*fdp" for an error.
 */
    static char_u *
readfile_charconvert(
    char_u	*fname,		// name of input file
    char_u	*fenc,		// converted from
    int		*fdp)		// in/out: file descriptor of file
{
    char	*errmsg = NULL;
    char_u	*tmpname = vim_tempname('r', FALSE);

    if (tmpname == NULL)
	errmsg = _("Can't find temp file for conversion");
    else
    {
	close(*fdp);		// close the input file, ignore errors
	*fdp = -1;
	if (eval_charconvert(fenc, enc_utf8 ? (char_u *)"utf-8" : p_enc,
						      fname, tmpname) == FAIL)
	    errmsg = _("Conversion with 'charconvert' failed");
	else
	{
	    *fdp = mch_open((char *)tmpname, O_RDONLY | O_EXTRA, 0);
	    if (*fdp < 0)
		errmsg = _("can't read output of 'charconvert'");
	}
    }

    if (errmsg != NULL)
    {
	// Don't use emsg(), it breaks mappings, the retry with
	// another type of conversion might still work.
	msg(errmsg);
	if (tmpname != NULL)
	{
	    mch_remove(tmpname);	// delete converted file
	    VIM_CLEAR(tmpname);
	}
    }

    // If the input file is closed, open it (caller should check for error).
    if (*fdp < 0)
	*fdp = mch_open((char *)fname, O_RDONLY | O_EXTRA, 0);

    return tmpname;
}
#endif
2867
#if defined(FEAT_CRYPT) || defined(PROTO)
/*
 * Check if the bytes at "ptr" start with a magic number used for encryption.
 * Applies to the current buffer.
 * If a crypt method is recognized and a key is available, the crypt header
 * is removed from the start of "ptr", "*sizep" is decreased and
 * "*filesizep" is increased by the header length, and the crypt state of
 * the current buffer is created from the header.
 * The buffer is made read-only as soon as a crypt method is recognized.  The
 * previous value of 'readonly' is only restored once the header has been
 * processed; when NULL is returned for a recognized method the buffer stays
 * read-only.
 * Return the (new) encryption key, NULL for no encryption.
 */
    static char_u *
check_for_cryptkey(
    char_u	*cryptkey,	// previous encryption key or NULL
    char_u	*ptr,		// pointer to read bytes
    long	*sizep,		// length of read bytes
    off_T	*filesizep,	// nr of bytes used from file
    int		newfile,	// editing a new buffer
    char_u	*fname,		// file name to display
    int		*did_ask)	// flag: whether already asked for key
{
    int		method = crypt_method_nr_from_magic((char *)ptr, *sizep);
    int		saved_ro = curbuf->b_p_ro;
    int		header_len;

    if (method < 0)
    {
	// When starting to edit a new file which does not have encryption,
	// clear the 'key' option, except when starting up (called with -x
	// argument)
	if (newfile && *curbuf->b_p_key != NUL && !starting)
	    set_option_value_give_err((char_u *)"key", 0L, (char_u *)"",
								   OPT_LOCAL);
	return cryptkey;
    }

    // Mark the buffer as read-only until the decryption has taken place.
    // Avoids accidentally overwriting the file with garbage.
    curbuf->b_p_ro = TRUE;

    // Set the cryptmethod local to the buffer.
    crypt_set_cm_option(curbuf, method);

    if (cryptkey == NULL && !*did_ask)
    {
	if (*curbuf->b_p_key != NUL)
	    cryptkey = curbuf->b_p_key;
	else
	{
	    // When newfile is TRUE, store the typed key in the 'key'
	    // option and don't free it.  bf needs hash of the key saved.
	    // Don't ask for the key again when first time Enter was hit.
	    // Happens when retrying to detect encoding.
	    smsg(_(need_key_msg), fname);
	    msg_scroll = TRUE;
	    crypt_check_method(method);
	    cryptkey = crypt_get_key(newfile, FALSE);
	    *did_ask = TRUE;

	    // An empty key counts as no key.
	    if (cryptkey != NULL && *cryptkey == NUL)
	    {
		if (cryptkey != curbuf->b_p_key)
		    vim_free(cryptkey);
		cryptkey = NULL;
	    }
	}
    }

    // Without a key nothing can be decrypted.
    if (cryptkey == NULL)
	return NULL;

    header_len = crypt_get_header_len(method);
    if (*sizep <= header_len)
	// invalid header, buffer can't be encrypted
	return NULL;

    curbuf->b_cryptstate = crypt_create_from_header(method, cryptkey, ptr);
    crypt_set_cm_option(curbuf, method);

    // Remove cryptmethod specific header from the text.
    *filesizep += header_len;
    *sizep -= header_len;
    mch_memmove(ptr, ptr + header_len, (size_t)*sizep);

    // Restore the read-only flag.
    curbuf->b_p_ro = saved_ro;

    return cryptkey;
}
#endif // FEAT_CRYPT
Bram Moolenaar80794b12010-06-13 05:20:42 +02002952
Bram Moolenaar071d4272004-06-13 20:20:40 +00002953/*
Bram Moolenaar5386a122007-06-28 20:02:32 +00002954 * Return TRUE if a file appears to be read-only from the file permissions.
2955 */
2956 int
Bram Moolenaar78c0b7d2016-01-30 15:52:46 +01002957check_file_readonly(
Bram Moolenaar217e1b82019-12-01 21:41:28 +01002958 char_u *fname, // full path to file
2959 int perm UNUSED) // known permissions on file
Bram Moolenaar5386a122007-06-28 20:02:32 +00002960{
2961#ifndef USE_MCH_ACCESS
2962 int fd = 0;
2963#endif
2964
2965 return (
2966#ifdef USE_MCH_ACCESS
2967# ifdef UNIX
2968 (perm & 0222) == 0 ||
2969# endif
2970 mch_access((char *)fname, W_OK)
2971#else
2972 (fd = mch_open((char *)fname, O_RDWR | O_EXTRA, 0)) < 0
2973 ? TRUE : (close(fd), FALSE)
2974#endif
2975 );
2976}
2977
#if defined(HAVE_FSYNC) || defined(PROTO)
/*
 * Flush file descriptor "fd" with fsync().
 * On MACOS_X fcntl(F_FULLFSYNC) is tried first; fsync() is only used when
 * that does not work or is not supported.
 * Returns zero for success, otherwise the result of fsync().
 */
    int
vim_fsync(int fd)
{
# ifdef MACOS_X
    if (fcntl(fd, F_FULLFSYNC) == 0)
        return 0;
    // F_FULLFSYNC not working or not supported, fall back to fsync().
# endif
    return fsync(fd);
}
#endif
2996
Bram Moolenaar071d4272004-06-13 20:20:40 +00002997/*
Bram Moolenaar2d3f4892006-01-20 23:02:51 +00002998 * Set the name of the current buffer. Use when the buffer doesn't have a
2999 * name and a ":r" or ":w" command with a file name is used.
3000 */
Bram Moolenaar473952e2019-09-28 16:30:04 +02003001 int
Bram Moolenaar78c0b7d2016-01-30 15:52:46 +01003002set_rw_fname(char_u *fname, char_u *sfname)
Bram Moolenaar2d3f4892006-01-20 23:02:51 +00003003{
Bram Moolenaar8b38e242009-06-16 13:35:20 +00003004 buf_T *buf = curbuf;
3005
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003006 // It's like the unnamed buffer is deleted....
Bram Moolenaar2d3f4892006-01-20 23:02:51 +00003007 if (curbuf->b_p_bl)
3008 apply_autocmds(EVENT_BUFDELETE, NULL, NULL, FALSE, curbuf);
3009 apply_autocmds(EVENT_BUFWIPEOUT, NULL, NULL, FALSE, curbuf);
Bram Moolenaarf2bd8ef2018-03-04 18:08:14 +01003010#ifdef FEAT_EVAL
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003011 if (aborting()) // autocmds may abort script processing
Bram Moolenaar2d3f4892006-01-20 23:02:51 +00003012 return FAIL;
Bram Moolenaarf2bd8ef2018-03-04 18:08:14 +01003013#endif
Bram Moolenaar8b38e242009-06-16 13:35:20 +00003014 if (curbuf != buf)
3015 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003016 // We are in another buffer now, don't do the renaming.
Bram Moolenaar9d00e4a2022-01-05 17:49:15 +00003017 emsg(_(e_autocommands_changed_buffer_or_buffer_name));
Bram Moolenaar8b38e242009-06-16 13:35:20 +00003018 return FAIL;
3019 }
Bram Moolenaar2d3f4892006-01-20 23:02:51 +00003020
3021 if (setfname(curbuf, fname, sfname, FALSE) == OK)
3022 curbuf->b_flags |= BF_NOTEDITED;
3023
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003024 // ....and a new named one is created
Bram Moolenaar2d3f4892006-01-20 23:02:51 +00003025 apply_autocmds(EVENT_BUFNEW, NULL, NULL, FALSE, curbuf);
3026 if (curbuf->b_p_bl)
3027 apply_autocmds(EVENT_BUFADD, NULL, NULL, FALSE, curbuf);
Bram Moolenaarf2bd8ef2018-03-04 18:08:14 +01003028#ifdef FEAT_EVAL
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003029 if (aborting()) // autocmds may abort script processing
Bram Moolenaar2d3f4892006-01-20 23:02:51 +00003030 return FAIL;
Bram Moolenaarf2bd8ef2018-03-04 18:08:14 +01003031#endif
Bram Moolenaar2d3f4892006-01-20 23:02:51 +00003032
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003033 // Do filetype detection now if 'filetype' is empty.
Bram Moolenaar2d3f4892006-01-20 23:02:51 +00003034 if (*curbuf->b_p_ft == NUL)
3035 {
Bram Moolenaar910f66f2006-04-05 20:41:53 +00003036 if (au_has_group((char_u *)"filetypedetect"))
Bram Moolenaar1610d052016-06-09 22:53:01 +02003037 (void)do_doautocmd((char_u *)"filetypedetect BufRead", FALSE, NULL);
Bram Moolenaara3227e22006-03-08 21:32:40 +00003038 do_modelines(0);
Bram Moolenaar2d3f4892006-01-20 23:02:51 +00003039 }
Bram Moolenaar2d3f4892006-01-20 23:02:51 +00003040
3041 return OK;
3042}
3043
3044/*
Bram Moolenaar071d4272004-06-13 20:20:40 +00003045 * Put file name into IObuff with quotes.
3046 */
Bram Moolenaar009b2592004-10-24 19:18:58 +00003047 void
Bram Moolenaar78c0b7d2016-01-30 15:52:46 +01003048msg_add_fname(buf_T *buf, char_u *fname)
Bram Moolenaar071d4272004-06-13 20:20:40 +00003049{
3050 if (fname == NULL)
3051 fname = (char_u *)"-stdin-";
3052 home_replace(buf, fname, IObuff + 1, IOSIZE - 4, TRUE);
3053 IObuff[0] = '"';
3054 STRCAT(IObuff, "\" ");
3055}
3056
3057/*
3058 * Append message for text mode to IObuff.
3059 * Return TRUE if something appended.
3060 */
Bram Moolenaar473952e2019-09-28 16:30:04 +02003061 int
Bram Moolenaar78c0b7d2016-01-30 15:52:46 +01003062msg_add_fileformat(int eol_type)
Bram Moolenaar071d4272004-06-13 20:20:40 +00003063{
3064#ifndef USE_CRNL
3065 if (eol_type == EOL_DOS)
3066 {
3067 STRCAT(IObuff, shortmess(SHM_TEXT) ? _("[dos]") : _("[dos format]"));
3068 return TRUE;
3069 }
3070#endif
Bram Moolenaar071d4272004-06-13 20:20:40 +00003071 if (eol_type == EOL_MAC)
3072 {
3073 STRCAT(IObuff, shortmess(SHM_TEXT) ? _("[mac]") : _("[mac format]"));
3074 return TRUE;
3075 }
Bram Moolenaar00590742019-02-15 21:06:09 +01003076#ifdef USE_CRNL
Bram Moolenaar071d4272004-06-13 20:20:40 +00003077 if (eol_type == EOL_UNIX)
3078 {
3079 STRCAT(IObuff, shortmess(SHM_TEXT) ? _("[unix]") : _("[unix format]"));
3080 return TRUE;
3081 }
3082#endif
3083 return FALSE;
3084}
3085
3086/*
3087 * Append line and character count to IObuff.
3088 */
Bram Moolenaar009b2592004-10-24 19:18:58 +00003089 void
Bram Moolenaar78c0b7d2016-01-30 15:52:46 +01003090msg_add_lines(
3091 int insert_space,
3092 long lnum,
Bram Moolenaar8767f522016-07-01 17:17:39 +02003093 off_T nchars)
Bram Moolenaar071d4272004-06-13 20:20:40 +00003094{
3095 char_u *p;
3096
3097 p = IObuff + STRLEN(IObuff);
3098
3099 if (insert_space)
3100 *p++ = ' ';
3101 if (shortmess(SHM_LINES))
Bram Moolenaarbde98102016-07-01 20:03:42 +02003102 vim_snprintf((char *)p, IOSIZE - (p - IObuff),
Bram Moolenaar3f40ce72020-07-05 14:10:13 +02003103 "%ldL, %lldB", lnum, (varnumber_T)nchars);
Bram Moolenaar071d4272004-06-13 20:20:40 +00003104 else
3105 {
Bram Moolenaarda6e8912018-08-21 15:12:14 +02003106 sprintf((char *)p, NGETTEXT("%ld line, ", "%ld lines, ", lnum), lnum);
Bram Moolenaar071d4272004-06-13 20:20:40 +00003107 p += STRLEN(p);
Bram Moolenaarda6e8912018-08-21 15:12:14 +02003108 vim_snprintf((char *)p, IOSIZE - (p - IObuff),
Bram Moolenaar3f40ce72020-07-05 14:10:13 +02003109 NGETTEXT("%lld byte", "%lld bytes", nchars),
Bram Moolenaarf9706e92020-02-22 14:27:04 +01003110 (varnumber_T)nchars);
Bram Moolenaar071d4272004-06-13 20:20:40 +00003111 }
3112}
3113
3114/*
3115 * Append message for missing line separator to IObuff.
3116 */
Bram Moolenaar473952e2019-09-28 16:30:04 +02003117 void
Bram Moolenaar78c0b7d2016-01-30 15:52:46 +01003118msg_add_eol(void)
Bram Moolenaar071d4272004-06-13 20:20:40 +00003119{
3120 STRCAT(IObuff, shortmess(SHM_LAST) ? _("[noeol]") : _("[Incomplete last line]"));
3121}
3122
Bram Moolenaar473952e2019-09-28 16:30:04 +02003123 int
Leah Neukirchen0a7984a2021-10-14 21:27:55 +01003124time_differs(stat_T *st, long mtime, long mtime_ns UNUSED)
Bram Moolenaar071d4272004-06-13 20:20:40 +00003125{
ichizokdef69df2021-10-15 17:23:12 +01003126 return
3127#ifdef ST_MTIM_NSEC
3128 (long)st->ST_MTIM_NSEC != mtime_ns ||
Bram Moolenaar071d4272004-06-13 20:20:40 +00003129#endif
ichizokdef69df2021-10-15 17:23:12 +01003130#if defined(__linux__) || defined(MSWIN)
3131 // On a FAT filesystem, esp. under Linux, there are only 5 bits to store
3132 // the seconds. Since the roundoff is done when flushing the inode, the
3133 // time may change unexpectedly by one second!!!
3134 (long)st->st_mtime - mtime > 1 || mtime - (long)st->st_mtime > 1
3135#else
3136 (long)st->st_mtime != mtime
3137#endif
3138 ;
Bram Moolenaar071d4272004-06-13 20:20:40 +00003139}
3140
3141/*
Bram Moolenaarb5cdf2e2009-07-29 16:25:31 +00003142 * Return TRUE if file encoding "fenc" requires conversion from or to
3143 * 'encoding'.
Bram Moolenaar071d4272004-06-13 20:20:40 +00003144 */
Bram Moolenaar473952e2019-09-28 16:30:04 +02003145 int
Bram Moolenaar78c0b7d2016-01-30 15:52:46 +01003146need_conversion(char_u *fenc)
Bram Moolenaar071d4272004-06-13 20:20:40 +00003147{
Bram Moolenaarb5cdf2e2009-07-29 16:25:31 +00003148 int same_encoding;
3149 int enc_flags;
3150 int fenc_flags;
Bram Moolenaar071d4272004-06-13 20:20:40 +00003151
Bram Moolenaarb5cdf2e2009-07-29 16:25:31 +00003152 if (*fenc == NUL || STRCMP(p_enc, fenc) == 0)
Bram Moolenaar442b4222010-05-24 21:34:22 +02003153 {
Bram Moolenaarb5cdf2e2009-07-29 16:25:31 +00003154 same_encoding = TRUE;
Bram Moolenaar442b4222010-05-24 21:34:22 +02003155 fenc_flags = 0;
3156 }
Bram Moolenaarb5cdf2e2009-07-29 16:25:31 +00003157 else
3158 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003159 // Ignore difference between "ansi" and "latin1", "ucs-4" and
3160 // "ucs-4be", etc.
Bram Moolenaarb5cdf2e2009-07-29 16:25:31 +00003161 enc_flags = get_fio_flags(p_enc);
3162 fenc_flags = get_fio_flags(fenc);
3163 same_encoding = (enc_flags != 0 && fenc_flags == enc_flags);
3164 }
3165 if (same_encoding)
3166 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003167 // Specified encoding matches with 'encoding'. This requires
3168 // conversion when 'encoding' is Unicode but not UTF-8.
Bram Moolenaarb5cdf2e2009-07-29 16:25:31 +00003169 return enc_unicode != 0;
3170 }
3171
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003172 // Encodings differ. However, conversion is not needed when 'enc' is any
3173 // Unicode encoding and the file is UTF-8.
Bram Moolenaarb5cdf2e2009-07-29 16:25:31 +00003174 return !(enc_utf8 && fenc_flags == FIO_UTF8);
Bram Moolenaar071d4272004-06-13 20:20:40 +00003175}
3176
3177/*
3178 * Check "ptr" for a unicode encoding and return the FIO_ flags needed for the
3179 * internal conversion.
3180 * if "ptr" is an empty string, use 'encoding'.
3181 */
Bram Moolenaar473952e2019-09-28 16:30:04 +02003182 int
Bram Moolenaar78c0b7d2016-01-30 15:52:46 +01003183get_fio_flags(char_u *ptr)
Bram Moolenaar071d4272004-06-13 20:20:40 +00003184{
3185 int prop;
3186
3187 if (*ptr == NUL)
3188 ptr = p_enc;
3189
3190 prop = enc_canon_props(ptr);
3191 if (prop & ENC_UNICODE)
3192 {
3193 if (prop & ENC_2BYTE)
3194 {
3195 if (prop & ENC_ENDIAN_L)
3196 return FIO_UCS2 | FIO_ENDIAN_L;
3197 return FIO_UCS2;
3198 }
3199 if (prop & ENC_4BYTE)
3200 {
3201 if (prop & ENC_ENDIAN_L)
3202 return FIO_UCS4 | FIO_ENDIAN_L;
3203 return FIO_UCS4;
3204 }
3205 if (prop & ENC_2WORD)
3206 {
3207 if (prop & ENC_ENDIAN_L)
3208 return FIO_UTF16 | FIO_ENDIAN_L;
3209 return FIO_UTF16;
3210 }
3211 return FIO_UTF8;
3212 }
3213 if (prop & ENC_LATIN1)
3214 return FIO_LATIN1;
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003215 // must be ENC_DBCS, requires iconv()
Bram Moolenaar071d4272004-06-13 20:20:40 +00003216 return 0;
3217}
3218
#if defined(MSWIN) || defined(PROTO)
/*
 * Check "ptr" for a MS-Windows codepage name and return the FIO_ flags needed
 * for the conversion MS-Windows can do for us.  Also accept "utf-8".
 * Used for conversion between 'encoding' and 'fileencoding'.
 * Returns zero when MS-Windows cannot do the conversion.
 */
    int
get_win_fio_flags(char_u *ptr)
{
    int     codepage;

    // Cannot do this when 'encoding' is not utf-8 and not a codepage.
    if (!enc_utf8 && enc_codepage <= 0)
        return 0;

    codepage = encname2codepage(ptr);
    if (codepage == 0)
    {
# ifdef CP_UTF8     // VC 4.1 doesn't define CP_UTF8
        if (STRCMP(ptr, "utf-8") != 0)
            return 0;
        codepage = CP_UTF8;
# else
        return 0;
# endif
    }
    return FIO_PUT_CP(codepage) | FIO_CODEPAGE;
}
#endif
3247
#if defined(MACOS_CONVERT) || defined(PROTO)
/*
 * Check "ptr" for a Carbon supported encoding and return the FIO_ flags
 * needed for the internal conversion to/from utf-8 or latin1.
 * Returns zero when 'encoding' is neither utf-8 nor "latin1", or when "ptr"
 * does not have the ENC_MACROMAN property.
 */
    int
get_mac_fio_flags(char_u *ptr)
{
    if (!enc_utf8 && STRCMP(p_enc, "latin1") != 0)
        return 0;
    if (!(enc_canon_props(ptr) & ENC_MACROMAN))
        return 0;
    return FIO_MACROMAN;
}
#endif
3262
3263/*
3264 * Check for a Unicode BOM (Byte Order Mark) at the start of p[size].
3265 * "size" must be at least 2.
3266 * Return the name of the encoding and set "*lenp" to the length.
3267 * Returns NULL when no BOM found.
3268 */
3269 static char_u *
Bram Moolenaar78c0b7d2016-01-30 15:52:46 +01003270check_for_bom(
3271 char_u *p,
3272 long size,
3273 int *lenp,
3274 int flags)
Bram Moolenaar071d4272004-06-13 20:20:40 +00003275{
3276 char *name = NULL;
3277 int len = 2;
3278
3279 if (p[0] == 0xef && p[1] == 0xbb && size >= 3 && p[2] == 0xbf
Bram Moolenaaree0f5a62008-07-24 20:09:16 +00003280 && (flags == FIO_ALL || flags == FIO_UTF8 || flags == 0))
Bram Moolenaar071d4272004-06-13 20:20:40 +00003281 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003282 name = "utf-8"; // EF BB BF
Bram Moolenaar071d4272004-06-13 20:20:40 +00003283 len = 3;
3284 }
3285 else if (p[0] == 0xff && p[1] == 0xfe)
3286 {
3287 if (size >= 4 && p[2] == 0 && p[3] == 0
3288 && (flags == FIO_ALL || flags == (FIO_UCS4 | FIO_ENDIAN_L)))
3289 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003290 name = "ucs-4le"; // FF FE 00 00
Bram Moolenaar071d4272004-06-13 20:20:40 +00003291 len = 4;
3292 }
Bram Moolenaar223a1892008-11-11 20:57:11 +00003293 else if (flags == (FIO_UCS2 | FIO_ENDIAN_L))
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003294 name = "ucs-2le"; // FF FE
Bram Moolenaar223a1892008-11-11 20:57:11 +00003295 else if (flags == FIO_ALL || flags == (FIO_UTF16 | FIO_ENDIAN_L))
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003296 // utf-16le is preferred, it also works for ucs-2le text
3297 name = "utf-16le"; // FF FE
Bram Moolenaar071d4272004-06-13 20:20:40 +00003298 }
3299 else if (p[0] == 0xfe && p[1] == 0xff
3300 && (flags == FIO_ALL || flags == FIO_UCS2 || flags == FIO_UTF16))
3301 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003302 // Default to utf-16, it works also for ucs-2 text.
Bram Moolenaarffd82c52008-02-20 17:15:26 +00003303 if (flags == FIO_UCS2)
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003304 name = "ucs-2"; // FE FF
Bram Moolenaarffd82c52008-02-20 17:15:26 +00003305 else
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003306 name = "utf-16"; // FE FF
Bram Moolenaar071d4272004-06-13 20:20:40 +00003307 }
3308 else if (size >= 4 && p[0] == 0 && p[1] == 0 && p[2] == 0xfe
3309 && p[3] == 0xff && (flags == FIO_ALL || flags == FIO_UCS4))
3310 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003311 name = "ucs-4"; // 00 00 FE FF
Bram Moolenaar071d4272004-06-13 20:20:40 +00003312 len = 4;
3313 }
3314
3315 *lenp = len;
3316 return (char_u *)name;
3317}
3318
3319/*
Bram Moolenaar071d4272004-06-13 20:20:40 +00003320 * Try to find a shortname by comparing the fullname with the current
3321 * directory.
Bram Moolenaard089d9b2007-09-30 12:02:55 +00003322 * Returns "full_path" or pointer into "full_path" if shortened.
3323 */
3324 char_u *
Bram Moolenaar78c0b7d2016-01-30 15:52:46 +01003325shorten_fname1(char_u *full_path)
Bram Moolenaard089d9b2007-09-30 12:02:55 +00003326{
Bram Moolenaard9462e32011-04-11 21:35:11 +02003327 char_u *dirname;
Bram Moolenaard089d9b2007-09-30 12:02:55 +00003328 char_u *p = full_path;
3329
Bram Moolenaard9462e32011-04-11 21:35:11 +02003330 dirname = alloc(MAXPATHL);
3331 if (dirname == NULL)
3332 return full_path;
Bram Moolenaard089d9b2007-09-30 12:02:55 +00003333 if (mch_dirname(dirname, MAXPATHL) == OK)
3334 {
3335 p = shorten_fname(full_path, dirname);
3336 if (p == NULL || *p == NUL)
3337 p = full_path;
3338 }
Bram Moolenaard9462e32011-04-11 21:35:11 +02003339 vim_free(dirname);
Bram Moolenaard089d9b2007-09-30 12:02:55 +00003340 return p;
3341}
3342
3343/*
3344 * Try to find a shortname by comparing the fullname with the current
3345 * directory.
Bram Moolenaar071d4272004-06-13 20:20:40 +00003346 * Returns NULL if not shorter name possible, pointer into "full_path"
3347 * otherwise.
3348 */
3349 char_u *
Bram Moolenaar78c0b7d2016-01-30 15:52:46 +01003350shorten_fname(char_u *full_path, char_u *dir_name)
Bram Moolenaar071d4272004-06-13 20:20:40 +00003351{
3352 int len;
3353 char_u *p;
3354
3355 if (full_path == NULL)
3356 return NULL;
3357 len = (int)STRLEN(dir_name);
3358 if (fnamencmp(dir_name, full_path, len) == 0)
3359 {
3360 p = full_path + len;
Bram Moolenaar48e330a2016-02-23 14:53:34 +01003361#if defined(MSWIN)
Bram Moolenaar071d4272004-06-13 20:20:40 +00003362 /*
Bram Moolenaar4f974752019-02-17 17:44:42 +01003363 * MS-Windows: when a file is in the root directory, dir_name will end
3364 * in a slash, since C: by itself does not define a specific dir. In
3365 * this case p may already be correct. <negri>
Bram Moolenaar071d4272004-06-13 20:20:40 +00003366 */
3367 if (!((len > 2) && (*(p - 2) == ':')))
3368#endif
3369 {
3370 if (vim_ispathsep(*p))
3371 ++p;
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003372#ifndef VMS // the path separator is always part of the path
Bram Moolenaar071d4272004-06-13 20:20:40 +00003373 else
3374 p = NULL;
3375#endif
3376 }
3377 }
Bram Moolenaar48e330a2016-02-23 14:53:34 +01003378#if defined(MSWIN)
Bram Moolenaar071d4272004-06-13 20:20:40 +00003379 /*
3380 * When using a file in the current drive, remove the drive name:
3381 * "A:\dir\file" -> "\dir\file". This helps when moving a session file on
3382 * a floppy from "A:\dir" to "B:\dir".
3383 */
3384 else if (len > 3
3385 && TOUPPER_LOC(full_path[0]) == TOUPPER_LOC(dir_name[0])
3386 && full_path[1] == ':'
3387 && vim_ispathsep(full_path[2]))
3388 p = full_path + 2;
3389#endif
3390 else
3391 p = NULL;
3392 return p;
3393}
3394
3395/*
Bram Moolenaara796d462018-05-01 14:30:36 +02003396 * Shorten filename of a buffer.
Bram Moolenaar071d4272004-06-13 20:20:40 +00003397 * When "force" is TRUE: Use full path from now on for files currently being
3398 * edited, both for file name and swap file name. Try to shorten the file
3399 * names a bit, if safe to do so.
3400 * When "force" is FALSE: Only try to shorten absolute file names.
3401 * For buffers that have buftype "nofile" or "scratch": never change the file
3402 * name.
3403 */
3404 void
Bram Moolenaara796d462018-05-01 14:30:36 +02003405shorten_buf_fname(buf_T *buf, char_u *dirname, int force)
3406{
3407 char_u *p;
3408
3409 if (buf->b_fname != NULL
Bram Moolenaar26910de2019-06-15 19:37:15 +02003410 && !bt_nofilename(buf)
Bram Moolenaara796d462018-05-01 14:30:36 +02003411 && !path_with_url(buf->b_fname)
3412 && (force
3413 || buf->b_sfname == NULL
3414 || mch_isFullName(buf->b_sfname)))
3415 {
Bram Moolenaar3d6014f2018-10-11 19:27:47 +02003416 if (buf->b_sfname != buf->b_ffname)
3417 VIM_CLEAR(buf->b_sfname);
Bram Moolenaara796d462018-05-01 14:30:36 +02003418 p = shorten_fname(buf->b_ffname, dirname);
3419 if (p != NULL)
3420 {
3421 buf->b_sfname = vim_strsave(p);
3422 buf->b_fname = buf->b_sfname;
3423 }
3424 if (p == NULL || buf->b_fname == NULL)
3425 buf->b_fname = buf->b_ffname;
3426 }
3427}
3428
3429/*
3430 * Shorten filenames for all buffers.
3431 */
3432 void
Bram Moolenaar78c0b7d2016-01-30 15:52:46 +01003433shorten_fnames(int force)
Bram Moolenaar071d4272004-06-13 20:20:40 +00003434{
3435 char_u dirname[MAXPATHL];
3436 buf_T *buf;
Bram Moolenaar071d4272004-06-13 20:20:40 +00003437
3438 mch_dirname(dirname, MAXPATHL);
Bram Moolenaar29323592016-07-24 22:04:11 +02003439 FOR_ALL_BUFFERS(buf)
Bram Moolenaar071d4272004-06-13 20:20:40 +00003440 {
Bram Moolenaara796d462018-05-01 14:30:36 +02003441 shorten_buf_fname(buf, dirname, force);
Bram Moolenaar69a7cb42004-06-20 12:51:53 +00003442
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003443 // Always make the swap file name a full path, a "nofile" buffer may
3444 // also have a swap file.
Bram Moolenaar69a7cb42004-06-20 12:51:53 +00003445 mf_fullname(buf->b_ml.ml_mfp);
Bram Moolenaar071d4272004-06-13 20:20:40 +00003446 }
Bram Moolenaar071d4272004-06-13 20:20:40 +00003447 status_redraw_all();
Bram Moolenaar49d7bf12006-02-17 21:45:41 +00003448 redraw_tabline = TRUE;
Bram Moolenaar5a4c3082019-12-01 15:23:11 +01003449#if defined(FEAT_PROP_POPUP) && defined(FEAT_QUICKFIX)
Bram Moolenaar90f3e7a2019-08-01 22:40:44 +02003450 popup_update_preview_title();
3451#endif
Bram Moolenaar071d4272004-06-13 20:20:40 +00003452}
3453
#if (defined(FEAT_DND) && defined(FEAT_GUI_GTK)) \
        || defined(FEAT_GUI_MSWIN) \
        || defined(FEAT_GUI_HAIKU) \
        || defined(PROTO)
/*
 * Shorten all filenames in "fnames[count]" by current directory.
 * Every entry that can be shortened is freed and replaced by an allocated
 * copy of the short name.  An entry is left unchanged when it cannot be
 * shortened or when the copy cannot be allocated.
 * Does nothing when "fnames" is NULL or "count" is less than one.
 */
    void
shorten_filenames(char_u **fnames, int count)
{
    int     i;
    char_u  dirname[MAXPATHL];

    if (fnames == NULL || count < 1)
        return;
    mch_dirname(dirname, sizeof(dirname));
    for (i = 0; i < count; ++i)
    {
        char_u  *tail = shorten_fname(fnames[i], dirname);
        char_u  *copy;

        if (tail == NULL)
            continue;

        // shorten_fname() returns a pointer into "fnames[i]".  Freeing
        // "fnames[i]" first would make "tail" invalid, thus make the copy
        // before freeing.
        copy = vim_strsave(tail);
        if (copy == NULL)
            // Out of memory: keep the full name instead of losing the entry.
            continue;
        vim_free(fnames[i]);
        fnames[i] = copy;
    }
}
#endif
3485
3486/*
Bram Moolenaarb782ba42018-08-07 21:39:28 +02003487 * Add extension to file name - change path/fo.o.h to path/fo.o.h.ext or
Bram Moolenaar071d4272004-06-13 20:20:40 +00003488 * fo_o_h.ext for MSDOS or when shortname option set.
3489 *
3490 * Assumed that fname is a valid name found in the filesystem we assure that
3491 * the return value is a different name and ends in 'ext'.
3492 * "ext" MUST be at most 4 characters long if it starts with a dot, 3
3493 * characters otherwise.
3494 * Space for the returned name is allocated, must be freed later.
3495 * Returns NULL when out of memory.
3496 */
3497 char_u *
Bram Moolenaar78c0b7d2016-01-30 15:52:46 +01003498modname(
3499 char_u *fname,
3500 char_u *ext,
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003501 int prepend_dot) // may prepend a '.' to file name
Bram Moolenaar071d4272004-06-13 20:20:40 +00003502{
Bram Moolenaar48e330a2016-02-23 14:53:34 +01003503 return buf_modname((curbuf->b_p_sn || curbuf->b_shortname),
Bram Moolenaar071d4272004-06-13 20:20:40 +00003504 fname, ext, prepend_dot);
3505}
3506
3507 char_u *
Bram Moolenaar78c0b7d2016-01-30 15:52:46 +01003508buf_modname(
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003509 int shortname, // use 8.3 file name
Bram Moolenaar78c0b7d2016-01-30 15:52:46 +01003510 char_u *fname,
3511 char_u *ext,
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003512 int prepend_dot) // may prepend a '.' to file name
Bram Moolenaar071d4272004-06-13 20:20:40 +00003513{
3514 char_u *retval;
3515 char_u *s;
3516 char_u *e;
3517 char_u *ptr;
3518 int fnamelen, extlen;
3519
3520 extlen = (int)STRLEN(ext);
3521
3522 /*
3523 * If there is no file name we must get the name of the current directory
3524 * (we need the full path in case :cd is used).
3525 */
3526 if (fname == NULL || *fname == NUL)
3527 {
Bram Moolenaar964b3742019-05-24 18:54:09 +02003528 retval = alloc(MAXPATHL + extlen + 3);
Bram Moolenaar071d4272004-06-13 20:20:40 +00003529 if (retval == NULL)
3530 return NULL;
3531 if (mch_dirname(retval, MAXPATHL) == FAIL ||
3532 (fnamelen = (int)STRLEN(retval)) == 0)
3533 {
3534 vim_free(retval);
3535 return NULL;
3536 }
Bram Moolenaar1cd871b2004-12-19 22:46:22 +00003537 if (!after_pathsep(retval, retval + fnamelen))
Bram Moolenaar071d4272004-06-13 20:20:40 +00003538 {
3539 retval[fnamelen++] = PATHSEP;
3540 retval[fnamelen] = NUL;
3541 }
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003542 prepend_dot = FALSE; // nothing to prepend a dot to
Bram Moolenaar071d4272004-06-13 20:20:40 +00003543 }
3544 else
3545 {
3546 fnamelen = (int)STRLEN(fname);
Bram Moolenaar964b3742019-05-24 18:54:09 +02003547 retval = alloc(fnamelen + extlen + 3);
Bram Moolenaar071d4272004-06-13 20:20:40 +00003548 if (retval == NULL)
3549 return NULL;
3550 STRCPY(retval, fname);
3551#ifdef VMS
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003552 vms_remove_version(retval); // we do not need versions here
Bram Moolenaar071d4272004-06-13 20:20:40 +00003553#endif
3554 }
3555
3556 /*
3557 * search backwards until we hit a '/', '\' or ':' replacing all '.'
3558 * by '_' for MSDOS or when shortname option set and ext starts with a dot.
3559 * Then truncate what is after the '/', '\' or ':' to 8 characters for
3560 * MSDOS and 26 characters for AMIGA, a lot more for UNIX.
3561 */
Bram Moolenaar91acfff2017-03-12 19:22:36 +01003562 for (ptr = retval + fnamelen; ptr > retval; MB_PTR_BACK(retval, ptr))
Bram Moolenaar071d4272004-06-13 20:20:40 +00003563 {
Bram Moolenaar00f148d2019-02-12 22:37:27 +01003564 if (*ext == '.' && shortname)
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003565 if (*ptr == '.') // replace '.' by '_'
Bram Moolenaar071d4272004-06-13 20:20:40 +00003566 *ptr = '_';
Bram Moolenaar071d4272004-06-13 20:20:40 +00003567 if (vim_ispathsep(*ptr))
Bram Moolenaar53180ce2005-07-05 21:48:14 +00003568 {
3569 ++ptr;
Bram Moolenaar071d4272004-06-13 20:20:40 +00003570 break;
Bram Moolenaar53180ce2005-07-05 21:48:14 +00003571 }
Bram Moolenaar071d4272004-06-13 20:20:40 +00003572 }
Bram Moolenaar071d4272004-06-13 20:20:40 +00003573
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003574 // the file name has at most BASENAMELEN characters.
Bram Moolenaar071d4272004-06-13 20:20:40 +00003575 if (STRLEN(ptr) > (unsigned)BASENAMELEN)
3576 ptr[BASENAMELEN] = '\0';
Bram Moolenaar071d4272004-06-13 20:20:40 +00003577
3578 s = ptr + STRLEN(ptr);
3579
3580 /*
3581 * For 8.3 file names we may have to reduce the length.
3582 */
Bram Moolenaar071d4272004-06-13 20:20:40 +00003583 if (shortname)
Bram Moolenaar071d4272004-06-13 20:20:40 +00003584 {
3585 /*
3586 * If there is no file name, or the file name ends in '/', and the
3587 * extension starts with '.', put a '_' before the dot, because just
3588 * ".ext" is invalid.
3589 */
3590 if (fname == NULL || *fname == NUL
3591 || vim_ispathsep(fname[STRLEN(fname) - 1]))
3592 {
Bram Moolenaar071d4272004-06-13 20:20:40 +00003593 if (*ext == '.')
Bram Moolenaar071d4272004-06-13 20:20:40 +00003594 *s++ = '_';
3595 }
3596 /*
3597 * If the extension starts with '.', truncate the base name at 8
3598 * characters
3599 */
Bram Moolenaar071d4272004-06-13 20:20:40 +00003600 else if (*ext == '.')
Bram Moolenaar071d4272004-06-13 20:20:40 +00003601 {
Bram Moolenaar78a15312009-05-15 19:33:18 +00003602 if ((size_t)(s - ptr) > (size_t)8)
Bram Moolenaar071d4272004-06-13 20:20:40 +00003603 {
3604 s = ptr + 8;
3605 *s = '\0';
3606 }
3607 }
3608 /*
3609 * If the extension doesn't start with '.', and the file name
3610 * doesn't have an extension yet, append a '.'
3611 */
Bram Moolenaar071d4272004-06-13 20:20:40 +00003612 else if ((e = vim_strchr(ptr, '.')) == NULL)
3613 *s++ = '.';
Bram Moolenaar071d4272004-06-13 20:20:40 +00003614 /*
3615 * If the extension doesn't start with '.', and there already is an
Bram Moolenaar7263a772007-05-10 17:35:54 +00003616 * extension, it may need to be truncated
Bram Moolenaar071d4272004-06-13 20:20:40 +00003617 */
3618 else if ((int)STRLEN(e) + extlen > 4)
3619 s = e + 4 - extlen;
3620 }
Bram Moolenaar4f974752019-02-17 17:44:42 +01003621#ifdef MSWIN
Bram Moolenaar071d4272004-06-13 20:20:40 +00003622 /*
3623 * If there is no file name, and the extension starts with '.', put a
3624 * '_' before the dot, because just ".ext" may be invalid if it's on a
3625 * FAT partition, and on HPFS it doesn't matter.
3626 */
3627 else if ((fname == NULL || *fname == NUL) && *ext == '.')
3628 *s++ = '_';
3629#endif
3630
3631 /*
Bram Moolenaarb23a7e82008-06-27 18:42:32 +00003632 * Append the extension.
Bram Moolenaar071d4272004-06-13 20:20:40 +00003633 * ext can start with '.' and cannot exceed 3 more characters.
3634 */
3635 STRCPY(s, ext);
3636
Bram Moolenaar071d4272004-06-13 20:20:40 +00003637 /*
3638 * Prepend the dot.
3639 */
Bram Moolenaar00f148d2019-02-12 22:37:27 +01003640 if (prepend_dot && !shortname && *(e = gettail(retval)) != '.')
Bram Moolenaar071d4272004-06-13 20:20:40 +00003641 {
Bram Moolenaar3577c6f2008-06-24 21:16:56 +00003642 STRMOVE(e + 1, e);
Bram Moolenaar071d4272004-06-13 20:20:40 +00003643 *e = '.';
Bram Moolenaar071d4272004-06-13 20:20:40 +00003644 }
Bram Moolenaar071d4272004-06-13 20:20:40 +00003645
3646 /*
3647 * Check that, after appending the extension, the file name is really
3648 * different.
3649 */
3650 if (fname != NULL && STRCMP(fname, retval) == 0)
3651 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003652 // we search for a character that can be replaced by '_'
Bram Moolenaar071d4272004-06-13 20:20:40 +00003653 while (--s >= ptr)
3654 {
3655 if (*s != '_')
3656 {
3657 *s = '_';
3658 break;
3659 }
3660 }
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003661 if (s < ptr) // fname was "________.<ext>", how tricky!
Bram Moolenaar071d4272004-06-13 20:20:40 +00003662 *ptr = 'v';
3663 }
3664 return retval;
3665}
3666
3667/*
3668 * Like fgets(), but if the file line is too long, it is truncated and the
3669 * rest of the line is thrown away. Returns TRUE for end-of-file.
Bram Moolenaar7e1652c2017-12-16 18:27:02 +01003670 * If the line is truncated then buf[size - 2] will not be NUL.
Bram Moolenaar071d4272004-06-13 20:20:40 +00003671 */
3672 int
Bram Moolenaar78c0b7d2016-01-30 15:52:46 +01003673vim_fgets(char_u *buf, int size, FILE *fp)
Bram Moolenaar071d4272004-06-13 20:20:40 +00003674{
3675 char *eof;
3676#define FGETS_SIZE 200
3677 char tbuf[FGETS_SIZE];
3678
3679 buf[size - 2] = NUL;
Bram Moolenaar071d4272004-06-13 20:20:40 +00003680 eof = fgets((char *)buf, size, fp);
Bram Moolenaar071d4272004-06-13 20:20:40 +00003681 if (buf[size - 2] != NUL && buf[size - 2] != '\n')
3682 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003683 buf[size - 1] = NUL; // Truncate the line
Bram Moolenaar071d4272004-06-13 20:20:40 +00003684
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003685 // Now throw away the rest of the line:
Bram Moolenaar071d4272004-06-13 20:20:40 +00003686 do
3687 {
3688 tbuf[FGETS_SIZE - 2] = NUL;
Bram Moolenaar42335f52018-09-13 15:33:43 +02003689 vim_ignoredp = fgets((char *)tbuf, FGETS_SIZE, fp);
Bram Moolenaar071d4272004-06-13 20:20:40 +00003690 } while (tbuf[FGETS_SIZE - 2] != NUL && tbuf[FGETS_SIZE - 2] != '\n');
3691 }
3692 return (eof == NULL);
3693}
3694
Bram Moolenaar071d4272004-06-13 20:20:40 +00003695/*
3696 * rename() only works if both files are on the same file system, this
3697 * function will (attempts to?) copy the file across if rename fails -- webb
3698 * Return -1 for failure, 0 for success.
3699 */
3700 int
Bram Moolenaar78c0b7d2016-01-30 15:52:46 +01003701vim_rename(char_u *from, char_u *to)
Bram Moolenaar071d4272004-06-13 20:20:40 +00003702{
3703 int fd_in;
3704 int fd_out;
3705 int n;
3706 char *errmsg = NULL;
3707 char *buffer;
3708#ifdef AMIGA
3709 BPTR flock;
3710#endif
Bram Moolenaar8767f522016-07-01 17:17:39 +02003711 stat_T st;
Bram Moolenaar9be038d2005-03-08 22:34:32 +00003712 long perm;
Bram Moolenaarcd71fa32005-03-11 22:46:48 +00003713#ifdef HAVE_ACL
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003714 vim_acl_T acl; // ACL from original file
Bram Moolenaarcd71fa32005-03-11 22:46:48 +00003715#endif
Bram Moolenaare0e6f992008-12-31 15:21:32 +00003716 int use_tmp_file = FALSE;
Bram Moolenaar071d4272004-06-13 20:20:40 +00003717
3718 /*
Bram Moolenaare0e6f992008-12-31 15:21:32 +00003719 * When the names are identical, there is nothing to do. When they refer
3720 * to the same file (ignoring case and slash/backslash differences) but
3721 * the file name differs we need to go through a temp file.
Bram Moolenaar071d4272004-06-13 20:20:40 +00003722 */
3723 if (fnamecmp(from, to) == 0)
Bram Moolenaare0e6f992008-12-31 15:21:32 +00003724 {
Bram Moolenaar71afbfe2013-03-19 16:49:16 +01003725 if (p_fic && STRCMP(gettail(from), gettail(to)) != 0)
Bram Moolenaare0e6f992008-12-31 15:21:32 +00003726 use_tmp_file = TRUE;
3727 else
Bram Moolenaare0e6f992008-12-31 15:21:32 +00003728 return 0;
3729 }
Bram Moolenaar071d4272004-06-13 20:20:40 +00003730
3731 /*
3732 * Fail if the "from" file doesn't exist. Avoids that "to" is deleted.
3733 */
3734 if (mch_stat((char *)from, &st) < 0)
3735 return -1;
3736
Bram Moolenaar3576da72008-12-30 15:15:57 +00003737#ifdef UNIX
3738 {
Bram Moolenaar8767f522016-07-01 17:17:39 +02003739 stat_T st_to;
Bram Moolenaar3576da72008-12-30 15:15:57 +00003740
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003741 // It's possible for the source and destination to be the same file.
3742 // This happens when "from" and "to" differ in case and are on a FAT32
3743 // filesystem. In that case go through a temp file name.
Bram Moolenaar3576da72008-12-30 15:15:57 +00003744 if (mch_stat((char *)to, &st_to) >= 0
3745 && st.st_dev == st_to.st_dev
3746 && st.st_ino == st_to.st_ino)
Bram Moolenaare0e6f992008-12-31 15:21:32 +00003747 use_tmp_file = TRUE;
3748 }
3749#endif
Bram Moolenaar4f974752019-02-17 17:44:42 +01003750#ifdef MSWIN
Bram Moolenaar1c32dff2011-05-05 16:41:24 +02003751 {
3752 BY_HANDLE_FILE_INFORMATION info1, info2;
3753
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003754 // It's possible for the source and destination to be the same file.
3755 // In that case go through a temp file name. This makes rename("foo",
3756 // "./foo") a no-op (in a complicated way).
Bram Moolenaar1c32dff2011-05-05 16:41:24 +02003757 if (win32_fileinfo(from, &info1) == FILEINFO_OK
3758 && win32_fileinfo(to, &info2) == FILEINFO_OK
3759 && info1.dwVolumeSerialNumber == info2.dwVolumeSerialNumber
3760 && info1.nFileIndexHigh == info2.nFileIndexHigh
3761 && info1.nFileIndexLow == info2.nFileIndexLow)
3762 use_tmp_file = TRUE;
3763 }
3764#endif
Bram Moolenaare0e6f992008-12-31 15:21:32 +00003765
Bram Moolenaare0e6f992008-12-31 15:21:32 +00003766 if (use_tmp_file)
3767 {
3768 char tempname[MAXPATHL + 1];
3769
3770 /*
3771 * Find a name that doesn't exist and is in the same directory.
3772 * Rename "from" to "tempname" and then rename "tempname" to "to".
3773 */
3774 if (STRLEN(from) >= MAXPATHL - 5)
3775 return -1;
3776 STRCPY(tempname, from);
3777 for (n = 123; n < 99999; ++n)
Bram Moolenaar3576da72008-12-30 15:15:57 +00003778 {
Bram Moolenaare0e6f992008-12-31 15:21:32 +00003779 sprintf((char *)gettail((char_u *)tempname), "%d", n);
3780 if (mch_stat(tempname, &st) < 0)
Bram Moolenaar3576da72008-12-30 15:15:57 +00003781 {
Bram Moolenaare0e6f992008-12-31 15:21:32 +00003782 if (mch_rename((char *)from, tempname) == 0)
Bram Moolenaar3576da72008-12-30 15:15:57 +00003783 {
Bram Moolenaare0e6f992008-12-31 15:21:32 +00003784 if (mch_rename(tempname, (char *)to) == 0)
3785 return 0;
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003786 // Strange, the second step failed. Try moving the
3787 // file back and return failure.
Bram Moolenaar97a6c6a2021-05-03 19:49:51 +02003788 (void)mch_rename(tempname, (char *)from);
Bram Moolenaar3576da72008-12-30 15:15:57 +00003789 return -1;
3790 }
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003791 // If it fails for one temp name it will most likely fail
3792 // for any temp name, give up.
Bram Moolenaare0e6f992008-12-31 15:21:32 +00003793 return -1;
Bram Moolenaar3576da72008-12-30 15:15:57 +00003794 }
Bram Moolenaar3576da72008-12-30 15:15:57 +00003795 }
Bram Moolenaare0e6f992008-12-31 15:21:32 +00003796 return -1;
Bram Moolenaar3576da72008-12-30 15:15:57 +00003797 }
Bram Moolenaar3576da72008-12-30 15:15:57 +00003798
Bram Moolenaar071d4272004-06-13 20:20:40 +00003799 /*
3800 * Delete the "to" file, this is required on some systems to make the
3801 * mch_rename() work, on other systems it makes sure that we don't have
3802 * two files when the mch_rename() fails.
3803 */
3804
3805#ifdef AMIGA
3806 /*
3807 * With MSDOS-compatible filesystems (crossdos, messydos) it is possible
3808 * that the name of the "to" file is the same as the "from" file, even
Bram Moolenaar7263a772007-05-10 17:35:54 +00003809 * though the names are different. To avoid the chance of accidentally
Bram Moolenaar071d4272004-06-13 20:20:40 +00003810 * deleting the "from" file (horror!) we lock it during the remove.
3811 *
3812 * When used for making a backup before writing the file: This should not
3813 * happen with ":w", because startscript() should detect this problem and
3814 * set buf->b_shortname, causing modname() to return a correct ".bak" file
3815 * name. This problem does exist with ":w filename", but then the
3816 * original file will be somewhere else so the backup isn't really
3817 * important. If autoscripting is off the rename may fail.
3818 */
3819 flock = Lock((UBYTE *)from, (long)ACCESS_READ);
3820#endif
3821 mch_remove(to);
3822#ifdef AMIGA
3823 if (flock)
3824 UnLock(flock);
3825#endif
3826
3827 /*
3828 * First try a normal rename, return if it works.
3829 */
3830 if (mch_rename((char *)from, (char *)to) == 0)
3831 return 0;
3832
3833 /*
3834 * Rename() failed, try copying the file.
3835 */
Bram Moolenaar9be038d2005-03-08 22:34:32 +00003836 perm = mch_getperm(from);
Bram Moolenaarcd71fa32005-03-11 22:46:48 +00003837#ifdef HAVE_ACL
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003838 // For systems that support ACL: get the ACL from the original file.
Bram Moolenaarcd71fa32005-03-11 22:46:48 +00003839 acl = mch_get_acl(from);
3840#endif
Bram Moolenaar071d4272004-06-13 20:20:40 +00003841 fd_in = mch_open((char *)from, O_RDONLY|O_EXTRA, 0);
3842 if (fd_in == -1)
Bram Moolenaarb23a7e82008-06-27 18:42:32 +00003843 {
3844#ifdef HAVE_ACL
3845 mch_free_acl(acl);
3846#endif
Bram Moolenaar071d4272004-06-13 20:20:40 +00003847 return -1;
Bram Moolenaarb23a7e82008-06-27 18:42:32 +00003848 }
Bram Moolenaar9be038d2005-03-08 22:34:32 +00003849
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003850 // Create the new file with same permissions as the original.
Bram Moolenaara5792f52005-11-23 21:25:05 +00003851 fd_out = mch_open((char *)to,
3852 O_CREAT|O_EXCL|O_WRONLY|O_EXTRA|O_NOFOLLOW, (int)perm);
Bram Moolenaar071d4272004-06-13 20:20:40 +00003853 if (fd_out == -1)
3854 {
3855 close(fd_in);
Bram Moolenaarb23a7e82008-06-27 18:42:32 +00003856#ifdef HAVE_ACL
3857 mch_free_acl(acl);
3858#endif
Bram Moolenaar071d4272004-06-13 20:20:40 +00003859 return -1;
3860 }
3861
Bram Moolenaar473952e2019-09-28 16:30:04 +02003862 buffer = alloc(WRITEBUFSIZE);
Bram Moolenaar071d4272004-06-13 20:20:40 +00003863 if (buffer == NULL)
3864 {
Bram Moolenaar071d4272004-06-13 20:20:40 +00003865 close(fd_out);
Bram Moolenaarb23a7e82008-06-27 18:42:32 +00003866 close(fd_in);
3867#ifdef HAVE_ACL
3868 mch_free_acl(acl);
3869#endif
Bram Moolenaar071d4272004-06-13 20:20:40 +00003870 return -1;
3871 }
3872
Bram Moolenaar473952e2019-09-28 16:30:04 +02003873 while ((n = read_eintr(fd_in, buffer, WRITEBUFSIZE)) > 0)
Bram Moolenaar540fc6f2010-12-17 16:27:16 +01003874 if (write_eintr(fd_out, buffer, n) != n)
Bram Moolenaar071d4272004-06-13 20:20:40 +00003875 {
Bram Moolenaar6d057012021-12-31 18:49:43 +00003876 errmsg = _(e_error_writing_to_str);
Bram Moolenaar071d4272004-06-13 20:20:40 +00003877 break;
3878 }
3879
3880 vim_free(buffer);
3881 close(fd_in);
3882 if (close(fd_out) < 0)
Bram Moolenaar6d057012021-12-31 18:49:43 +00003883 errmsg = _(e_error_closing_str);
Bram Moolenaar071d4272004-06-13 20:20:40 +00003884 if (n < 0)
3885 {
Bram Moolenaar6d057012021-12-31 18:49:43 +00003886 errmsg = _(e_error_reading_str);
Bram Moolenaar071d4272004-06-13 20:20:40 +00003887 to = from;
3888 }
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003889#ifndef UNIX // for Unix mch_open() already set the permission
Bram Moolenaar9be038d2005-03-08 22:34:32 +00003890 mch_setperm(to, perm);
Bram Moolenaarc6039d82005-12-02 00:44:04 +00003891#endif
Bram Moolenaarcd71fa32005-03-11 22:46:48 +00003892#ifdef HAVE_ACL
3893 mch_set_acl(to, acl);
Bram Moolenaarb23a7e82008-06-27 18:42:32 +00003894 mch_free_acl(acl);
Bram Moolenaarcd71fa32005-03-11 22:46:48 +00003895#endif
Bram Moolenaar5bd32f42014-04-02 14:05:38 +02003896#if defined(HAVE_SELINUX) || defined(HAVE_SMACK)
Bram Moolenaare8747442013-11-12 18:09:29 +01003897 mch_copy_sec(from, to);
Bram Moolenaar0671de32013-11-12 05:12:03 +01003898#endif
Bram Moolenaar071d4272004-06-13 20:20:40 +00003899 if (errmsg != NULL)
3900 {
Bram Moolenaarf9e3e092019-01-13 23:38:42 +01003901 semsg(errmsg, to);
Bram Moolenaar071d4272004-06-13 20:20:40 +00003902 return -1;
3903 }
3904 mch_remove(from);
3905 return 0;
3906}
3907
3908static int already_warned = FALSE;
3909
3910/*
3911 * Check if any not hidden buffer has been changed.
3912 * Postpone the check if there are characters in the stuff buffer, a global
3913 * command is being executed, a mapping is being executed or an autocommand is
3914 * busy.
3915 * Returns TRUE if some message was written (screen should be redrawn and
3916 * cursor positioned).
3917 */
3918 int
Bram Moolenaar78c0b7d2016-01-30 15:52:46 +01003919check_timestamps(
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003920 int focus) // called for GUI focus event
Bram Moolenaar071d4272004-06-13 20:20:40 +00003921{
3922 buf_T *buf;
3923 int didit = 0;
3924 int n;
3925
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003926 // Don't check timestamps while system() or another low-level function may
3927 // cause us to lose and gain focus.
Bram Moolenaar071d4272004-06-13 20:20:40 +00003928 if (no_check_timestamps > 0)
3929 return FALSE;
3930
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003931 // Avoid doing a check twice. The OK/Reload dialog can cause a focus
3932 // event and we would keep on checking if the file is steadily growing.
3933 // Do check again after typing something.
Bram Moolenaar071d4272004-06-13 20:20:40 +00003934 if (focus && did_check_timestamps)
3935 {
3936 need_check_timestamps = TRUE;
3937 return FALSE;
3938 }
3939
3940 if (!stuff_empty() || global_busy || !typebuf_typed()
Bram Moolenaarf2bd8ef2018-03-04 18:08:14 +01003941 || autocmd_busy || curbuf_lock > 0 || allbuf_lock > 0)
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003942 need_check_timestamps = TRUE; // check later
Bram Moolenaar071d4272004-06-13 20:20:40 +00003943 else
3944 {
3945 ++no_wait_return;
3946 did_check_timestamps = TRUE;
3947 already_warned = FALSE;
Bram Moolenaar29323592016-07-24 22:04:11 +02003948 FOR_ALL_BUFFERS(buf)
Bram Moolenaar071d4272004-06-13 20:20:40 +00003949 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003950 // Only check buffers in a window.
Bram Moolenaar071d4272004-06-13 20:20:40 +00003951 if (buf->b_nwindows > 0)
3952 {
Bram Moolenaar7c0a2f32016-07-10 22:11:16 +02003953 bufref_T bufref;
3954
3955 set_bufref(&bufref, buf);
Bram Moolenaar071d4272004-06-13 20:20:40 +00003956 n = buf_check_timestamp(buf, focus);
3957 if (didit < n)
3958 didit = n;
Bram Moolenaar7c0a2f32016-07-10 22:11:16 +02003959 if (n > 0 && !bufref_valid(&bufref))
Bram Moolenaar071d4272004-06-13 20:20:40 +00003960 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003961 // Autocommands have removed the buffer, start at the
3962 // first one again.
Bram Moolenaar071d4272004-06-13 20:20:40 +00003963 buf = firstbuf;
3964 continue;
3965 }
3966 }
Bram Moolenaar071d4272004-06-13 20:20:40 +00003967 }
3968 --no_wait_return;
3969 need_check_timestamps = FALSE;
3970 if (need_wait_return && didit == 2)
3971 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003972 // make sure msg isn't overwritten
Bram Moolenaar32526b32019-01-19 17:43:09 +01003973 msg_puts("\n");
Bram Moolenaar071d4272004-06-13 20:20:40 +00003974 out_flush();
3975 }
3976 }
3977 return didit;
3978}
3979
3980/*
3981 * Move all the lines from buffer "frombuf" to buffer "tobuf".
3982 * Return OK or FAIL. When FAIL "tobuf" is incomplete and/or "frombuf" is not
3983 * empty.
3984 */
3985 static int
Bram Moolenaar78c0b7d2016-01-30 15:52:46 +01003986move_lines(buf_T *frombuf, buf_T *tobuf)
Bram Moolenaar071d4272004-06-13 20:20:40 +00003987{
3988 buf_T *tbuf = curbuf;
3989 int retval = OK;
3990 linenr_T lnum;
3991 char_u *p;
3992
Bram Moolenaar217e1b82019-12-01 21:41:28 +01003993 // Copy the lines in "frombuf" to "tobuf".
Bram Moolenaar071d4272004-06-13 20:20:40 +00003994 curbuf = tobuf;
3995 for (lnum = 1; lnum <= frombuf->b_ml.ml_line_count; ++lnum)
3996 {
3997 p = vim_strsave(ml_get_buf(frombuf, lnum, FALSE));
3998 if (p == NULL || ml_append(lnum - 1, p, 0, FALSE) == FAIL)
3999 {
4000 vim_free(p);
4001 retval = FAIL;
4002 break;
4003 }
4004 vim_free(p);
4005 }
4006
Bram Moolenaar217e1b82019-12-01 21:41:28 +01004007 // Delete all the lines in "frombuf".
Bram Moolenaar071d4272004-06-13 20:20:40 +00004008 if (retval != FAIL)
4009 {
4010 curbuf = frombuf;
Bram Moolenaar9460b9d2007-01-09 14:37:01 +00004011 for (lnum = curbuf->b_ml.ml_line_count; lnum > 0; --lnum)
Bram Moolenaarca70c072020-05-30 20:30:46 +02004012 if (ml_delete(lnum) == FAIL)
Bram Moolenaar071d4272004-06-13 20:20:40 +00004013 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01004014 // Oops! We could try putting back the saved lines, but that
4015 // might fail again...
Bram Moolenaar071d4272004-06-13 20:20:40 +00004016 retval = FAIL;
4017 break;
4018 }
4019 }
4020
4021 curbuf = tbuf;
4022 return retval;
4023}
4024
4025/*
4026 * Check if buffer "buf" has been changed.
4027 * Also check if the file for a new buffer unexpectedly appeared.
4028 * return 1 if a changed buffer was found.
4029 * return 2 if a message has been displayed.
4030 * return 0 otherwise.
4031 */
Bram Moolenaar071d4272004-06-13 20:20:40 +00004032 int
Bram Moolenaar78c0b7d2016-01-30 15:52:46 +01004033buf_check_timestamp(
4034 buf_T *buf,
Bram Moolenaar217e1b82019-12-01 21:41:28 +01004035 int focus UNUSED) // called for GUI focus event
Bram Moolenaar071d4272004-06-13 20:20:40 +00004036{
Bram Moolenaar8767f522016-07-01 17:17:39 +02004037 stat_T st;
Bram Moolenaar071d4272004-06-13 20:20:40 +00004038 int stat_res;
4039 int retval = 0;
4040 char_u *path;
Bram Moolenaarf9e3e092019-01-13 23:38:42 +01004041 char *tbuf;
Bram Moolenaar071d4272004-06-13 20:20:40 +00004042 char *mesg = NULL;
Bram Moolenaar44ecf652005-03-07 23:09:59 +00004043 char *mesg2 = "";
Bram Moolenaar071d4272004-06-13 20:20:40 +00004044 int helpmesg = FALSE;
Rob Pilling8196e942022-02-11 15:12:10 +00004045 enum {
4046 RELOAD_NONE,
4047 RELOAD_NORMAL,
4048 RELOAD_DETECT
4049 } reload = RELOAD_NONE;
Bram Moolenaar7c0a2f32016-07-10 22:11:16 +02004050 char *reason;
Bram Moolenaar071d4272004-06-13 20:20:40 +00004051#if defined(FEAT_CON_DIALOG) || defined(FEAT_GUI_DIALOG)
4052 int can_reload = FALSE;
4053#endif
Bram Moolenaar8767f522016-07-01 17:17:39 +02004054 off_T orig_size = buf->b_orig_size;
Bram Moolenaar071d4272004-06-13 20:20:40 +00004055 int orig_mode = buf->b_orig_mode;
4056#ifdef FEAT_GUI
4057 int save_mouse_correct = need_mouse_correct;
4058#endif
Bram Moolenaar071d4272004-06-13 20:20:40 +00004059 static int busy = FALSE;
Bram Moolenaar19a09a12005-03-04 23:39:37 +00004060 int n;
Bram Moolenaarf2bd8ef2018-03-04 18:08:14 +01004061#ifdef FEAT_EVAL
Bram Moolenaar19a09a12005-03-04 23:39:37 +00004062 char_u *s;
Bram Moolenaarf2bd8ef2018-03-04 18:08:14 +01004063#endif
Bram Moolenaar7c0a2f32016-07-10 22:11:16 +02004064 bufref_T bufref;
4065
4066 set_bufref(&bufref, buf);
Bram Moolenaar071d4272004-06-13 20:20:40 +00004067
Bram Moolenaar217e1b82019-12-01 21:41:28 +01004068 // If there is no file name, the buffer is not loaded, 'buftype' is
4069 // set, we are in the middle of a save or being called recursively: ignore
4070 // this buffer.
Bram Moolenaar071d4272004-06-13 20:20:40 +00004071 if (buf->b_ffname == NULL
4072 || buf->b_ml.ml_mfp == NULL
Bram Moolenaar91335e52018-08-01 17:53:12 +02004073 || !bt_normal(buf)
Bram Moolenaar071d4272004-06-13 20:20:40 +00004074 || buf->b_saving
Bram Moolenaar071d4272004-06-13 20:20:40 +00004075 || busy
Bram Moolenaar009b2592004-10-24 19:18:58 +00004076#ifdef FEAT_NETBEANS_INTG
4077 || isNetbeansBuffer(buf)
4078#endif
Bram Moolenaar8cad9302017-08-12 14:32:32 +02004079#ifdef FEAT_TERMINAL
4080 || buf->b_term != NULL
4081#endif
Bram Moolenaar071d4272004-06-13 20:20:40 +00004082 )
4083 return 0;
4084
4085 if ( !(buf->b_flags & BF_NOTEDITED)
4086 && buf->b_mtime != 0
4087 && ((stat_res = mch_stat((char *)buf->b_ffname, &st)) < 0
Leah Neukirchen0a7984a2021-10-14 21:27:55 +01004088 || time_differs(&st, buf->b_mtime, buf->b_mtime_ns)
Bram Moolenaara7611f62014-05-02 15:46:14 +02004089 || st.st_size != buf->b_orig_size
Bram Moolenaar071d4272004-06-13 20:20:40 +00004090#ifdef HAVE_ST_MODE
4091 || (int)st.st_mode != buf->b_orig_mode
4092#else
4093 || mch_getperm(buf->b_ffname) != buf->b_orig_mode
4094#endif
4095 ))
4096 {
Bram Moolenaar674e2bd2019-07-31 20:21:01 +02004097 long prev_b_mtime = buf->b_mtime;
4098
Bram Moolenaar071d4272004-06-13 20:20:40 +00004099 retval = 1;
4100
Bram Moolenaar386bc822018-07-07 18:34:12 +02004101 // set b_mtime to stop further warnings (e.g., when executing
4102 // FileChangedShell autocmd)
Bram Moolenaar071d4272004-06-13 20:20:40 +00004103 if (stat_res < 0)
4104 {
Bram Moolenaar8239c622019-05-24 16:46:01 +02004105 // Check the file again later to see if it re-appears.
4106 buf->b_mtime = -1;
Bram Moolenaar071d4272004-06-13 20:20:40 +00004107 buf->b_orig_size = 0;
4108 buf->b_orig_mode = 0;
4109 }
4110 else
4111 buf_store_time(buf, &st, buf->b_ffname);
4112
Bram Moolenaar217e1b82019-12-01 21:41:28 +01004113 // Don't do anything for a directory. Might contain the file
4114 // explorer.
Bram Moolenaar071d4272004-06-13 20:20:40 +00004115 if (mch_isdir(buf->b_fname))
4116 ;
4117
4118 /*
4119 * If 'autoread' is set, the buffer has no changes and the file still
4120 * exists, reload the buffer. Use the buffer-local option value if it
4121 * was set, the global option value otherwise.
4122 */
4123 else if ((buf->b_p_ar >= 0 ? buf->b_p_ar : p_ar)
4124 && !bufIsChanged(buf) && stat_res >= 0)
Rob Pilling8196e942022-02-11 15:12:10 +00004125 reload = RELOAD_NORMAL;
Bram Moolenaar071d4272004-06-13 20:20:40 +00004126 else
4127 {
Bram Moolenaar19a09a12005-03-04 23:39:37 +00004128 if (stat_res < 0)
4129 reason = "deleted";
4130 else if (bufIsChanged(buf))
4131 reason = "conflict";
Bram Moolenaar3e460fd2019-01-26 16:21:07 +01004132 /*
4133 * Check if the file contents really changed to avoid giving a
4134 * warning when only the timestamp was set (e.g., checked out of
4135 * CVS). Always warn when the buffer was changed.
4136 */
Bram Moolenaar19a09a12005-03-04 23:39:37 +00004137 else if (orig_size != buf->b_orig_size || buf_contents_changed(buf))
4138 reason = "changed";
4139 else if (orig_mode != buf->b_orig_mode)
4140 reason = "mode";
4141 else
4142 reason = "time";
Bram Moolenaar071d4272004-06-13 20:20:40 +00004143
4144 /*
4145 * Only give the warning if there are no FileChangedShell
4146 * autocommands.
4147 * Avoid being called recursively by setting "busy".
4148 */
4149 busy = TRUE;
Bram Moolenaarf2bd8ef2018-03-04 18:08:14 +01004150#ifdef FEAT_EVAL
Bram Moolenaar19a09a12005-03-04 23:39:37 +00004151 set_vim_var_string(VV_FCS_REASON, (char_u *)reason, -1);
4152 set_vim_var_string(VV_FCS_CHOICE, (char_u *)"", -1);
Bram Moolenaarf2bd8ef2018-03-04 18:08:14 +01004153#endif
Bram Moolenaarbf1b7a72009-03-05 02:15:53 +00004154 ++allbuf_lock;
Bram Moolenaar071d4272004-06-13 20:20:40 +00004155 n = apply_autocmds(EVENT_FILECHANGEDSHELL,
4156 buf->b_fname, buf->b_fname, FALSE, buf);
Bram Moolenaarbf1b7a72009-03-05 02:15:53 +00004157 --allbuf_lock;
Bram Moolenaar071d4272004-06-13 20:20:40 +00004158 busy = FALSE;
4159 if (n)
4160 {
Bram Moolenaar7c0a2f32016-07-10 22:11:16 +02004161 if (!bufref_valid(&bufref))
Bram Moolenaarcbadefe2022-01-01 19:33:50 +00004162 emsg(_(e_filechangedshell_autocommand_deleted_buffer));
Bram Moolenaarf2bd8ef2018-03-04 18:08:14 +01004163#ifdef FEAT_EVAL
Bram Moolenaar19a09a12005-03-04 23:39:37 +00004164 s = get_vim_var_str(VV_FCS_CHOICE);
4165 if (STRCMP(s, "reload") == 0 && *reason != 'd')
Rob Pilling8196e942022-02-11 15:12:10 +00004166 reload = RELOAD_NORMAL;
4167 else if (STRCMP(s, "edit") == 0)
4168 reload = RELOAD_DETECT;
Bram Moolenaar19a09a12005-03-04 23:39:37 +00004169 else if (STRCMP(s, "ask") == 0)
4170 n = FALSE;
4171 else
Bram Moolenaarf2bd8ef2018-03-04 18:08:14 +01004172#endif
Bram Moolenaar19a09a12005-03-04 23:39:37 +00004173 return 2;
Bram Moolenaar071d4272004-06-13 20:20:40 +00004174 }
Bram Moolenaar19a09a12005-03-04 23:39:37 +00004175 if (!n)
Bram Moolenaar071d4272004-06-13 20:20:40 +00004176 {
Bram Moolenaar19a09a12005-03-04 23:39:37 +00004177 if (*reason == 'd')
Bram Moolenaar674e2bd2019-07-31 20:21:01 +02004178 {
4179 // Only give the message once.
4180 if (prev_b_mtime != -1)
Bram Moolenaar6d057012021-12-31 18:49:43 +00004181 mesg = _(e_file_str_no_longer_available);
Bram Moolenaar674e2bd2019-07-31 20:21:01 +02004182 }
Bram Moolenaar071d4272004-06-13 20:20:40 +00004183 else
4184 {
4185 helpmesg = TRUE;
4186#if defined(FEAT_CON_DIALOG) || defined(FEAT_GUI_DIALOG)
4187 can_reload = TRUE;
4188#endif
Bram Moolenaar19a09a12005-03-04 23:39:37 +00004189 if (reason[2] == 'n')
4190 {
Bram Moolenaar071d4272004-06-13 20:20:40 +00004191 mesg = _("W12: Warning: File \"%s\" has changed and the buffer was changed in Vim as well");
Bram Moolenaar19a09a12005-03-04 23:39:37 +00004192 mesg2 = _("See \":help W12\" for more info.");
4193 }
4194 else if (reason[1] == 'h')
4195 {
Bram Moolenaar071d4272004-06-13 20:20:40 +00004196 mesg = _("W11: Warning: File \"%s\" has changed since editing started");
Bram Moolenaar19a09a12005-03-04 23:39:37 +00004197 mesg2 = _("See \":help W11\" for more info.");
4198 }
4199 else if (*reason == 'm')
4200 {
Bram Moolenaar071d4272004-06-13 20:20:40 +00004201 mesg = _("W16: Warning: Mode of file \"%s\" has changed since editing started");
Bram Moolenaar19a09a12005-03-04 23:39:37 +00004202 mesg2 = _("See \":help W16\" for more info.");
4203 }
Bram Moolenaar85388b52009-06-24 09:58:32 +00004204 else
Leah Neukirchen0a7984a2021-10-14 21:27:55 +01004205 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01004206 // Only timestamp changed, store it to avoid a warning
4207 // in check_mtime() later.
Bram Moolenaar85388b52009-06-24 09:58:32 +00004208 buf->b_mtime_read = buf->b_mtime;
Leah Neukirchen0a7984a2021-10-14 21:27:55 +01004209 buf->b_mtime_read_ns = buf->b_mtime_ns;
4210 }
Bram Moolenaar071d4272004-06-13 20:20:40 +00004211 }
4212 }
4213 }
4214
4215 }
4216 else if ((buf->b_flags & BF_NEW) && !(buf->b_flags & BF_NEW_W)
4217 && vim_fexists(buf->b_ffname))
4218 {
4219 retval = 1;
4220 mesg = _("W13: Warning: File \"%s\" has been created after editing started");
4221 buf->b_flags |= BF_NEW_W;
4222#if defined(FEAT_CON_DIALOG) || defined(FEAT_GUI_DIALOG)
4223 can_reload = TRUE;
4224#endif
4225 }
4226
4227 if (mesg != NULL)
4228 {
4229 path = home_replace_save(buf, buf->b_fname);
4230 if (path != NULL)
4231 {
Bram Moolenaar19a09a12005-03-04 23:39:37 +00004232 if (!helpmesg)
Bram Moolenaar071d4272004-06-13 20:20:40 +00004233 mesg2 = "";
Bram Moolenaarc799fe22019-05-28 23:08:19 +02004234 tbuf = alloc(STRLEN(path) + STRLEN(mesg) + STRLEN(mesg2) + 2);
Bram Moolenaarf9e3e092019-01-13 23:38:42 +01004235 sprintf(tbuf, mesg, path);
Bram Moolenaar496c5262009-03-18 14:42:00 +00004236#ifdef FEAT_EVAL
Bram Moolenaar217e1b82019-12-01 21:41:28 +01004237 // Set warningmsg here, before the unimportant and output-specific
4238 // mesg2 has been appended.
Bram Moolenaarf9e3e092019-01-13 23:38:42 +01004239 set_vim_var_string(VV_WARNINGMSG, (char_u *)tbuf, -1);
Bram Moolenaar496c5262009-03-18 14:42:00 +00004240#endif
Bram Moolenaar071d4272004-06-13 20:20:40 +00004241#if defined(FEAT_CON_DIALOG) || defined(FEAT_GUI_DIALOG)
4242 if (can_reload)
4243 {
4244 if (*mesg2 != NUL)
4245 {
4246 STRCAT(tbuf, "\n");
4247 STRCAT(tbuf, mesg2);
4248 }
Rob Pilling8196e942022-02-11 15:12:10 +00004249 switch (do_dialog(VIM_WARNING, (char_u *)_("Warning"),
4250 (char_u *)tbuf,
4251 (char_u *)_("&OK\n&Load File\nLoad File &and Options"),
4252 1, NULL, TRUE))
4253 {
4254 case 2:
4255 reload = RELOAD_NORMAL;
4256 break;
4257 case 3:
4258 reload = RELOAD_DETECT;
4259 break;
4260 }
Bram Moolenaar071d4272004-06-13 20:20:40 +00004261 }
4262 else
4263#endif
Bram Moolenaar24959102022-05-07 20:01:16 +01004264 if (State > MODE_NORMAL_BUSY || (State & MODE_CMDLINE)
4265 || already_warned)
Bram Moolenaar071d4272004-06-13 20:20:40 +00004266 {
4267 if (*mesg2 != NUL)
4268 {
4269 STRCAT(tbuf, "; ");
4270 STRCAT(tbuf, mesg2);
4271 }
Bram Moolenaarf9e3e092019-01-13 23:38:42 +01004272 emsg(tbuf);
Bram Moolenaar071d4272004-06-13 20:20:40 +00004273 retval = 2;
4274 }
4275 else
4276 {
Bram Moolenaar071d4272004-06-13 20:20:40 +00004277 if (!autocmd_busy)
Bram Moolenaar071d4272004-06-13 20:20:40 +00004278 {
4279 msg_start();
Bram Moolenaar32526b32019-01-19 17:43:09 +01004280 msg_puts_attr(tbuf, HL_ATTR(HLF_E) + MSG_HIST);
Bram Moolenaar071d4272004-06-13 20:20:40 +00004281 if (*mesg2 != NUL)
Bram Moolenaar32526b32019-01-19 17:43:09 +01004282 msg_puts_attr(mesg2, HL_ATTR(HLF_W) + MSG_HIST);
Bram Moolenaar071d4272004-06-13 20:20:40 +00004283 msg_clr_eos();
4284 (void)msg_end();
Bram Moolenaar28ee8922020-10-28 20:20:00 +01004285 if (emsg_silent == 0 && !in_assert_fails)
Bram Moolenaar071d4272004-06-13 20:20:40 +00004286 {
4287 out_flush();
Bram Moolenaarf2bd8ef2018-03-04 18:08:14 +01004288#ifdef FEAT_GUI
Bram Moolenaar071d4272004-06-13 20:20:40 +00004289 if (!focus)
Bram Moolenaarf2bd8ef2018-03-04 18:08:14 +01004290#endif
Bram Moolenaar217e1b82019-12-01 21:41:28 +01004291 // give the user some time to think about it
Bram Moolenaareda1da02019-11-17 17:06:33 +01004292 ui_delay(1004L, TRUE);
Bram Moolenaar071d4272004-06-13 20:20:40 +00004293
Bram Moolenaar217e1b82019-12-01 21:41:28 +01004294 // don't redraw and erase the message
Bram Moolenaar071d4272004-06-13 20:20:40 +00004295 redraw_cmdline = FALSE;
4296 }
4297 }
4298 already_warned = TRUE;
Bram Moolenaar071d4272004-06-13 20:20:40 +00004299 }
4300
4301 vim_free(path);
4302 vim_free(tbuf);
4303 }
4304 }
4305
Rob Pilling8196e942022-02-11 15:12:10 +00004306 if (reload != RELOAD_NONE)
Bram Moolenaar465748e2012-08-29 18:50:54 +02004307 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01004308 // Reload the buffer.
Rob Pilling8196e942022-02-11 15:12:10 +00004309 buf_reload(buf, orig_mode, reload == RELOAD_DETECT);
Bram Moolenaar465748e2012-08-29 18:50:54 +02004310#ifdef FEAT_PERSISTENT_UNDO
4311 if (buf->b_p_udf && buf->b_ffname != NULL)
4312 {
4313 char_u hash[UNDO_HASH_SIZE];
4314 buf_T *save_curbuf = curbuf;
4315
Bram Moolenaar217e1b82019-12-01 21:41:28 +01004316 // Any existing undo file is unusable, write it now.
Bram Moolenaar465748e2012-08-29 18:50:54 +02004317 curbuf = buf;
4318 u_compute_hash(hash);
4319 u_write_undo(NULL, FALSE, buf, hash);
4320 curbuf = save_curbuf;
4321 }
4322#endif
4323 }
Bram Moolenaar071d4272004-06-13 20:20:40 +00004324
Bram Moolenaar217e1b82019-12-01 21:41:28 +01004325 // Trigger FileChangedShell when the file was changed in any way.
Bram Moolenaar7c0a2f32016-07-10 22:11:16 +02004326 if (bufref_valid(&bufref) && retval != 0)
Bram Moolenaar56718732006-03-15 22:53:57 +00004327 (void)apply_autocmds(EVENT_FILECHANGEDSHELLPOST,
4328 buf->b_fname, buf->b_fname, FALSE, buf);
Bram Moolenaar071d4272004-06-13 20:20:40 +00004329#ifdef FEAT_GUI
Bram Moolenaar217e1b82019-12-01 21:41:28 +01004330 // restore this in case an autocommand has set it; it would break
4331 // 'mousefocus'
Bram Moolenaar071d4272004-06-13 20:20:40 +00004332 need_mouse_correct = save_mouse_correct;
4333#endif
4334
4335 return retval;
4336}
4337
Bram Moolenaar631d6f62005-06-07 21:02:10 +00004338/*
4339 * Reload a buffer that is already loaded.
4340 * Used when the file was changed outside of Vim.
Bram Moolenaar316059c2006-01-14 21:18:42 +00004341 * "orig_mode" is buf->b_orig_mode before the need for reloading was detected.
4342 * buf->b_orig_mode may have been reset already.
Bram Moolenaar631d6f62005-06-07 21:02:10 +00004343 */
4344 void
Rob Pilling8196e942022-02-11 15:12:10 +00004345buf_reload(buf_T *buf, int orig_mode, int reload_options)
Bram Moolenaar631d6f62005-06-07 21:02:10 +00004346{
4347 exarg_T ea;
4348 pos_T old_cursor;
4349 linenr_T old_topline;
4350 int old_ro = buf->b_p_ro;
Bram Moolenaar631d6f62005-06-07 21:02:10 +00004351 buf_T *savebuf;
Bram Moolenaar7c0a2f32016-07-10 22:11:16 +02004352 bufref_T bufref;
Bram Moolenaar631d6f62005-06-07 21:02:10 +00004353 int saved = OK;
Bram Moolenaar631d6f62005-06-07 21:02:10 +00004354 aco_save_T aco;
Bram Moolenaar59f931e2010-07-24 20:27:03 +02004355 int flags = READ_NEW;
Rob Pilling8196e942022-02-11 15:12:10 +00004356 int prepped = OK;
Bram Moolenaar631d6f62005-06-07 21:02:10 +00004357
Bram Moolenaar217e1b82019-12-01 21:41:28 +01004358 // set curwin/curbuf for "buf" and save some things
Bram Moolenaar631d6f62005-06-07 21:02:10 +00004359 aucmd_prepbuf(&aco, buf);
Bram Moolenaar631d6f62005-06-07 21:02:10 +00004360
Rob Pilling8196e942022-02-11 15:12:10 +00004361 // Unless reload_options is set, we only want to read the text from the
4362 // file, not reset the syntax highlighting, clear marks, diff status, etc.
4363 // Force the fileformat and encoding to be the same.
4364 if (reload_options)
4365 memset(&ea, 0, sizeof(ea));
4366 else
4367 prepped = prep_exarg(&ea, buf);
4368
4369 if (prepped == OK)
Bram Moolenaar631d6f62005-06-07 21:02:10 +00004370 {
4371 old_cursor = curwin->w_cursor;
4372 old_topline = curwin->w_topline;
4373
Bram Moolenaarf9bb7342010-08-04 14:29:54 +02004374 if (p_ur < 0 || curbuf->b_ml.ml_line_count <= p_ur)
Bram Moolenaar59f931e2010-07-24 20:27:03 +02004375 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01004376 // Save all the text, so that the reload can be undone.
4377 // Sync first so that this is a separate undo-able action.
Bram Moolenaar59f931e2010-07-24 20:27:03 +02004378 u_sync(FALSE);
4379 saved = u_savecommon(0, curbuf->b_ml.ml_line_count + 1, 0, TRUE);
4380 flags |= READ_KEEP_UNDO;
4381 }
4382
Bram Moolenaar631d6f62005-06-07 21:02:10 +00004383 /*
4384 * To behave like when a new file is edited (matters for
4385 * BufReadPost autocommands) we first need to delete the current
4386 * buffer contents. But if reading the file fails we should keep
4387 * the old contents. Can't use memory only, the file might be
4388 * too big. Use a hidden buffer to move the buffer contents to.
4389 */
Bram Moolenaarb5aedf32017-03-12 18:23:53 +01004390 if (BUFEMPTY() || saved == FAIL)
Bram Moolenaar631d6f62005-06-07 21:02:10 +00004391 savebuf = NULL;
4392 else
4393 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01004394 // Allocate a buffer without putting it in the buffer list.
Bram Moolenaar631d6f62005-06-07 21:02:10 +00004395 savebuf = buflist_new(NULL, NULL, (linenr_T)1, BLN_DUMMY);
Bram Moolenaar7c0a2f32016-07-10 22:11:16 +02004396 set_bufref(&bufref, savebuf);
Bram Moolenaar8424a622006-04-19 21:23:36 +00004397 if (savebuf != NULL && buf == curbuf)
Bram Moolenaar631d6f62005-06-07 21:02:10 +00004398 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01004399 // Open the memline.
Bram Moolenaar631d6f62005-06-07 21:02:10 +00004400 curbuf = savebuf;
4401 curwin->w_buffer = savebuf;
Bram Moolenaar4770d092006-01-12 23:22:24 +00004402 saved = ml_open(curbuf);
Bram Moolenaar631d6f62005-06-07 21:02:10 +00004403 curbuf = buf;
4404 curwin->w_buffer = buf;
4405 }
Bram Moolenaar8424a622006-04-19 21:23:36 +00004406 if (savebuf == NULL || saved == FAIL || buf != curbuf
Bram Moolenaar631d6f62005-06-07 21:02:10 +00004407 || move_lines(buf, savebuf) == FAIL)
4408 {
Bram Moolenaarb09feaa2022-01-02 20:20:45 +00004409 semsg(_(e_could_not_prepare_for_reloading_str), buf->b_fname);
Bram Moolenaar631d6f62005-06-07 21:02:10 +00004410 saved = FAIL;
4411 }
4412 }
4413
4414 if (saved == OK)
4415 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01004416 curbuf->b_flags |= BF_CHECK_RO; // check for RO again
4417 keep_filetype = TRUE; // don't detect 'filetype'
Bram Moolenaar631d6f62005-06-07 21:02:10 +00004418 if (readfile(buf->b_ffname, buf->b_fname, (linenr_T)0,
4419 (linenr_T)0,
Bram Moolenaare13b9af2017-01-13 22:01:02 +01004420 (linenr_T)MAXLNUM, &ea, flags) != OK)
Bram Moolenaar631d6f62005-06-07 21:02:10 +00004421 {
Bram Moolenaarf2bd8ef2018-03-04 18:08:14 +01004422#if defined(FEAT_EVAL)
Bram Moolenaar631d6f62005-06-07 21:02:10 +00004423 if (!aborting())
4424#endif
Bram Moolenaareaaac012022-01-02 17:00:40 +00004425 semsg(_(e_could_not_reload_str), buf->b_fname);
Bram Moolenaar7c0a2f32016-07-10 22:11:16 +02004426 if (savebuf != NULL && bufref_valid(&bufref) && buf == curbuf)
Bram Moolenaar631d6f62005-06-07 21:02:10 +00004427 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01004428 // Put the text back from the save buffer. First
4429 // delete any lines that readfile() added.
Bram Moolenaarb5aedf32017-03-12 18:23:53 +01004430 while (!BUFEMPTY())
Bram Moolenaarca70c072020-05-30 20:30:46 +02004431 if (ml_delete(buf->b_ml.ml_line_count) == FAIL)
Bram Moolenaar631d6f62005-06-07 21:02:10 +00004432 break;
4433 (void)move_lines(savebuf, buf);
4434 }
4435 }
Bram Moolenaar217e1b82019-12-01 21:41:28 +01004436 else if (buf == curbuf) // "buf" still valid
Bram Moolenaar631d6f62005-06-07 21:02:10 +00004437 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01004438 // Mark the buffer as unmodified and free undo info.
Bram Moolenaarc024b462019-06-08 18:07:21 +02004439 unchanged(buf, TRUE, TRUE);
Bram Moolenaar59f931e2010-07-24 20:27:03 +02004440 if ((flags & READ_KEEP_UNDO) == 0)
4441 {
4442 u_blockfree(buf);
4443 u_clearall(buf);
4444 }
4445 else
Bram Moolenaarf9bb7342010-08-04 14:29:54 +02004446 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01004447 // Mark all undo states as changed.
Bram Moolenaar59f931e2010-07-24 20:27:03 +02004448 u_unchanged(curbuf);
Bram Moolenaarf9bb7342010-08-04 14:29:54 +02004449 }
Bram Moolenaar631d6f62005-06-07 21:02:10 +00004450 }
4451 }
4452 vim_free(ea.cmd);
4453
Bram Moolenaar7c0a2f32016-07-10 22:11:16 +02004454 if (savebuf != NULL && bufref_valid(&bufref))
Bram Moolenaar631d6f62005-06-07 21:02:10 +00004455 wipe_buffer(savebuf, FALSE);
4456
4457#ifdef FEAT_DIFF
Bram Moolenaar217e1b82019-12-01 21:41:28 +01004458 // Invalidate diff info if necessary.
Bram Moolenaar8424a622006-04-19 21:23:36 +00004459 diff_invalidate(curbuf);
Bram Moolenaar631d6f62005-06-07 21:02:10 +00004460#endif
4461
Bram Moolenaar217e1b82019-12-01 21:41:28 +01004462 // Restore the topline and cursor position and check it (lines may
4463 // have been removed).
Bram Moolenaar631d6f62005-06-07 21:02:10 +00004464 if (old_topline > curbuf->b_ml.ml_line_count)
4465 curwin->w_topline = curbuf->b_ml.ml_line_count;
4466 else
4467 curwin->w_topline = old_topline;
4468 curwin->w_cursor = old_cursor;
4469 check_cursor();
4470 update_topline();
Bram Moolenaar631d6f62005-06-07 21:02:10 +00004471 keep_filetype = FALSE;
Bram Moolenaar631d6f62005-06-07 21:02:10 +00004472#ifdef FEAT_FOLDING
4473 {
Bram Moolenaarbd1e5d22009-04-29 09:02:44 +00004474 win_T *wp;
4475 tabpage_T *tp;
Bram Moolenaar631d6f62005-06-07 21:02:10 +00004476
Bram Moolenaar217e1b82019-12-01 21:41:28 +01004477 // Update folds unless they are defined manually.
Bram Moolenaarbd1e5d22009-04-29 09:02:44 +00004478 FOR_ALL_TAB_WINDOWS(tp, wp)
Bram Moolenaar631d6f62005-06-07 21:02:10 +00004479 if (wp->w_buffer == curwin->w_buffer
4480 && !foldmethodIsManual(wp))
4481 foldUpdateAll(wp);
4482 }
4483#endif
Bram Moolenaar217e1b82019-12-01 21:41:28 +01004484 // If the mode didn't change and 'readonly' was set, keep the old
4485 // value; the user probably used the ":view" command. But don't
4486 // reset it, might have had a read error.
Bram Moolenaar631d6f62005-06-07 21:02:10 +00004487 if (orig_mode == curbuf->b_orig_mode)
4488 curbuf->b_p_ro |= old_ro;
Bram Moolenaar52f85b72013-01-30 14:13:56 +01004489
Bram Moolenaar217e1b82019-12-01 21:41:28 +01004490 // Modelines must override settings done by autocommands.
Bram Moolenaar52f85b72013-01-30 14:13:56 +01004491 do_modelines(0);
Bram Moolenaar631d6f62005-06-07 21:02:10 +00004492 }
4493
Bram Moolenaar217e1b82019-12-01 21:41:28 +01004494 // restore curwin/curbuf and a few other things
Bram Moolenaar631d6f62005-06-07 21:02:10 +00004495 aucmd_restbuf(&aco);
Bram Moolenaar217e1b82019-12-01 21:41:28 +01004496 // Careful: autocommands may have made "buf" invalid!
Bram Moolenaar631d6f62005-06-07 21:02:10 +00004497}
4498
Bram Moolenaar071d4272004-06-13 20:20:40 +00004499 void
Bram Moolenaar8767f522016-07-01 17:17:39 +02004500buf_store_time(buf_T *buf, stat_T *st, char_u *fname UNUSED)
Bram Moolenaar071d4272004-06-13 20:20:40 +00004501{
4502 buf->b_mtime = (long)st->st_mtime;
Leah Neukirchen0a7984a2021-10-14 21:27:55 +01004503#ifdef ST_MTIM_NSEC
4504 buf->b_mtime_ns = (long)st->ST_MTIM_NSEC;
4505#else
4506 buf->b_mtime_ns = 0;
4507#endif
Bram Moolenaar914703b2010-05-31 21:59:46 +02004508 buf->b_orig_size = st->st_size;
Bram Moolenaar071d4272004-06-13 20:20:40 +00004509#ifdef HAVE_ST_MODE
4510 buf->b_orig_mode = (int)st->st_mode;
4511#else
4512 buf->b_orig_mode = mch_getperm(fname);
4513#endif
4514}
4515
4516/*
4517 * Adjust the line with missing eol, used for the next write.
4518 * Used for do_filter(), when the input lines for the filter are deleted.
4519 */
4520 void
Bram Moolenaar78c0b7d2016-01-30 15:52:46 +01004521write_lnum_adjust(linenr_T offset)
Bram Moolenaar071d4272004-06-13 20:20:40 +00004522{
Bram Moolenaar217e1b82019-12-01 21:41:28 +01004523 if (curbuf->b_no_eol_lnum != 0) // only if there is a missing eol
Bram Moolenaarcab35ad2011-02-15 17:39:22 +01004524 curbuf->b_no_eol_lnum += offset;
Bram Moolenaar071d4272004-06-13 20:20:40 +00004525}
4526
// Subfunctions for readdirex()
4528#ifdef FEAT_EVAL
4529# ifdef MSWIN
4530 static char_u *
4531getfpermwfd(WIN32_FIND_DATAW *wfd, char_u *perm)
4532{
4533 stat_T st;
4534 unsigned short st_mode;
4535 DWORD flag = wfd->dwFileAttributes;
4536 WCHAR *wp;
4537
4538 st_mode = (flag & FILE_ATTRIBUTE_DIRECTORY)
4539 ? (_S_IFDIR | _S_IEXEC) : _S_IFREG;
4540 st_mode |= (flag & FILE_ATTRIBUTE_READONLY)
4541 ? _S_IREAD : (_S_IREAD | _S_IWRITE);
4542
4543 wp = wcsrchr(wfd->cFileName, L'.');
4544 if (wp != NULL)
4545 {
4546 if (_wcsicmp(wp, L".exe") == 0 ||
4547 _wcsicmp(wp, L".com") == 0 ||
4548 _wcsicmp(wp, L".cmd") == 0 ||
4549 _wcsicmp(wp, L".bat") == 0)
4550 st_mode |= _S_IEXEC;
4551 }
4552
4553 // Copy user bits to group/other.
4554 st_mode |= (st_mode & 0700) >> 3;
4555 st_mode |= (st_mode & 0700) >> 6;
4556
4557 st.st_mode = st_mode;
4558 return getfpermst(&st, perm);
4559}
4560
4561 static char_u *
4562getftypewfd(WIN32_FIND_DATAW *wfd)
4563{
4564 DWORD flag = wfd->dwFileAttributes;
4565 DWORD tag = wfd->dwReserved0;
4566
4567 if (flag & FILE_ATTRIBUTE_REPARSE_POINT)
4568 {
4569 if (tag == IO_REPARSE_TAG_MOUNT_POINT)
4570 return (char_u*)"junction";
4571 else if (tag == IO_REPARSE_TAG_SYMLINK)
4572 {
4573 if (flag & FILE_ATTRIBUTE_DIRECTORY)
4574 return (char_u*)"linkd";
4575 else
4576 return (char_u*)"link";
4577 }
4578 return (char_u*)"reparse"; // unknown reparse point type
4579 }
4580 if (flag & FILE_ATTRIBUTE_DIRECTORY)
4581 return (char_u*)"dir";
4582 else
4583 return (char_u*)"file";
4584}
4585
4586 static dict_T *
4587create_readdirex_item(WIN32_FIND_DATAW *wfd)
4588{
4589 dict_T *item;
4590 char_u *p;
4591 varnumber_T size, time;
4592 char_u permbuf[] = "---------";
4593
4594 item = dict_alloc();
4595 if (item == NULL)
4596 return NULL;
4597 item->dv_refcount++;
4598
4599 p = utf16_to_enc(wfd->cFileName, NULL);
4600 if (p == NULL)
4601 goto theend;
4602 if (dict_add_string(item, "name", p) == FAIL)
4603 {
4604 vim_free(p);
4605 goto theend;
4606 }
4607 vim_free(p);
4608
4609 size = (((varnumber_T)wfd->nFileSizeHigh) << 32) | wfd->nFileSizeLow;
4610 if (dict_add_number(item, "size", size) == FAIL)
4611 goto theend;
4612
4613 // Convert FILETIME to unix time.
4614 time = (((((varnumber_T)wfd->ftLastWriteTime.dwHighDateTime) << 32) |
4615 wfd->ftLastWriteTime.dwLowDateTime)
4616 - 116444736000000000) / 10000000;
4617 if (dict_add_number(item, "time", time) == FAIL)
4618 goto theend;
4619
4620 if (dict_add_string(item, "type", getftypewfd(wfd)) == FAIL)
4621 goto theend;
4622 if (dict_add_string(item, "perm", getfpermwfd(wfd, permbuf)) == FAIL)
4623 goto theend;
4624
4625 if (dict_add_string(item, "user", (char_u*)"") == FAIL)
4626 goto theend;
4627 if (dict_add_string(item, "group", (char_u*)"") == FAIL)
4628 goto theend;
4629
4630 return item;
4631
4632theend:
4633 dict_unref(item);
4634 return NULL;
4635}
4636# else
4637 static dict_T *
4638create_readdirex_item(char_u *path, char_u *name)
4639{
4640 dict_T *item;
4641 char *p;
4642 size_t len;
4643 stat_T st;
4644 int ret, link = FALSE;
4645 varnumber_T size;
4646 char_u permbuf[] = "---------";
Bram Moolenaarab540322020-06-10 15:55:36 +02004647 char_u *q = NULL;
Bram Moolenaar6c9ba042020-06-01 16:09:41 +02004648 struct passwd *pw;
4649 struct group *gr;
4650
4651 item = dict_alloc();
4652 if (item == NULL)
4653 return NULL;
4654 item->dv_refcount++;
4655
4656 len = STRLEN(path) + 1 + STRLEN(name) + 1;
4657 p = alloc(len);
4658 if (p == NULL)
4659 goto theend;
4660 vim_snprintf(p, len, "%s/%s", path, name);
4661 ret = mch_lstat(p, &st);
4662 if (ret >= 0 && S_ISLNK(st.st_mode))
4663 {
4664 link = TRUE;
4665 ret = mch_stat(p, &st);
Bram Moolenaarab540322020-06-10 15:55:36 +02004666 if (ret < 0)
4667 q = (char_u*)"link";
4668
Bram Moolenaar6c9ba042020-06-01 16:09:41 +02004669 }
4670 vim_free(p);
4671
4672 if (dict_add_string(item, "name", name) == FAIL)
4673 goto theend;
4674
4675 if (ret >= 0)
4676 {
4677 size = (varnumber_T)st.st_size;
4678 if (S_ISDIR(st.st_mode))
4679 size = 0;
4680 // non-perfect check for overflow
Bram Moolenaar441d60e2020-06-02 22:19:50 +02004681 else if ((off_T)size != (off_T)st.st_size)
Bram Moolenaar6c9ba042020-06-01 16:09:41 +02004682 size = -2;
4683 if (dict_add_number(item, "size", size) == FAIL)
4684 goto theend;
4685 if (dict_add_number(item, "time", (varnumber_T)st.st_mtime) == FAIL)
4686 goto theend;
4687
4688 if (link)
4689 {
4690 if (S_ISDIR(st.st_mode))
4691 q = (char_u*)"linkd";
4692 else
4693 q = (char_u*)"link";
4694 }
4695 else
4696 q = getftypest(&st);
4697 if (dict_add_string(item, "type", q) == FAIL)
4698 goto theend;
4699 if (dict_add_string(item, "perm", getfpermst(&st, permbuf)) == FAIL)
4700 goto theend;
4701
4702 pw = getpwuid(st.st_uid);
4703 if (pw == NULL)
4704 q = (char_u*)"";
4705 else
4706 q = (char_u*)pw->pw_name;
4707 if (dict_add_string(item, "user", q) == FAIL)
4708 goto theend;
Bram Moolenaar82c38fe2021-01-04 10:47:26 +01004709# if !defined(VMS) || (defined(VMS) && defined(HAVE_XOS_R_H))
Bram Moolenaar6c9ba042020-06-01 16:09:41 +02004710 gr = getgrgid(st.st_gid);
4711 if (gr == NULL)
4712 q = (char_u*)"";
4713 else
4714 q = (char_u*)gr->gr_name;
Bram Moolenaar82c38fe2021-01-04 10:47:26 +01004715# endif
Bram Moolenaar6c9ba042020-06-01 16:09:41 +02004716 if (dict_add_string(item, "group", q) == FAIL)
4717 goto theend;
4718 }
4719 else
4720 {
4721 if (dict_add_number(item, "size", -1) == FAIL)
4722 goto theend;
4723 if (dict_add_number(item, "time", -1) == FAIL)
4724 goto theend;
Bram Moolenaarab540322020-06-10 15:55:36 +02004725 if (dict_add_string(item, "type", q == NULL ? (char_u*)"" : q) == FAIL)
Bram Moolenaar6c9ba042020-06-01 16:09:41 +02004726 goto theend;
4727 if (dict_add_string(item, "perm", (char_u*)"") == FAIL)
4728 goto theend;
4729 if (dict_add_string(item, "user", (char_u*)"") == FAIL)
4730 goto theend;
4731 if (dict_add_string(item, "group", (char_u*)"") == FAIL)
4732 goto theend;
4733 }
4734 return item;
4735
4736theend:
4737 dict_unref(item);
4738 return NULL;
4739}
4740# endif
4741
4742 static int
4743compare_readdirex_item(const void *p1, const void *p2)
4744{
4745 char_u *name1, *name2;
4746
Bram Moolenaard61efa52022-07-23 09:52:04 +01004747 name1 = dict_get_string(*(dict_T**)p1, "name", FALSE);
4748 name2 = dict_get_string(*(dict_T**)p2, "name", FALSE);
Bram Moolenaar84cf6bd2020-06-16 20:03:43 +02004749 if (readdirex_sort == READDIR_SORT_BYTE)
4750 return STRCMP(name1, name2);
4751 else if (readdirex_sort == READDIR_SORT_IC)
4752 return STRICMP(name1, name2);
4753 else
4754 return STRCOLL(name1, name2);
4755}
4756
4757 static int
4758compare_readdir_item(const void *s1, const void *s2)
4759{
4760 if (readdirex_sort == READDIR_SORT_BYTE)
4761 return STRCMP(*(char **)s1, *(char **)s2);
4762 else if (readdirex_sort == READDIR_SORT_IC)
4763 return STRICMP(*(char **)s1, *(char **)s2);
4764 else
4765 return STRCOLL(*(char **)s1, *(char **)s2);
Bram Moolenaar6c9ba042020-06-01 16:09:41 +02004766}
4767#endif
4768
Bram Moolenaarda440d22016-01-16 21:27:23 +01004769#if defined(TEMPDIRNAMES) || defined(FEAT_EVAL) || defined(PROTO)
4770/*
Bram Moolenaar6c9ba042020-06-01 16:09:41 +02004771 * Core part of "readdir()" and "readdirex()" function.
Bram Moolenaar701ff0a2019-05-24 14:14:14 +02004772 * Retrieve the list of files/directories of "path" into "gap".
Bram Moolenaar6c9ba042020-06-01 16:09:41 +02004773 * If "withattr" is TRUE, retrieve the names and their attributes.
4774 * If "withattr" is FALSE, retrieve the names only.
Bram Moolenaar701ff0a2019-05-24 14:14:14 +02004775 * Return OK for success, FAIL for failure.
4776 */
4777 int
4778readdir_core(
4779 garray_T *gap,
4780 char_u *path,
Bram Moolenaar6c9ba042020-06-01 16:09:41 +02004781 int withattr UNUSED,
Bram Moolenaar701ff0a2019-05-24 14:14:14 +02004782 void *context,
Bram Moolenaar84cf6bd2020-06-16 20:03:43 +02004783 int (*checkitem)(void *context, void *item),
Bram Moolenaar6ed545e2022-05-09 20:09:23 +01004784 int sort)
Bram Moolenaar701ff0a2019-05-24 14:14:14 +02004785{
Bram Moolenaar6c9ba042020-06-01 16:09:41 +02004786 int failed = FALSE;
4787 char_u *p;
Bram Moolenaar80147dd2020-02-04 22:32:59 +01004788# ifdef MSWIN
Bram Moolenaar6c9ba042020-06-01 16:09:41 +02004789 char_u *buf;
4790 int ok;
4791 HANDLE hFind = INVALID_HANDLE_VALUE;
4792 WIN32_FIND_DATAW wfd;
4793 WCHAR *wn = NULL; // UTF-16 name, NULL when not used.
Bram Moolenaar80147dd2020-02-04 22:32:59 +01004794# else
Bram Moolenaar6c9ba042020-06-01 16:09:41 +02004795 DIR *dirp;
4796 struct dirent *dp;
Bram Moolenaar80147dd2020-02-04 22:32:59 +01004797# endif
Bram Moolenaar701ff0a2019-05-24 14:14:14 +02004798
Bram Moolenaar04935fb2022-01-08 16:19:22 +00004799 ga_init2(gap, sizeof(void *), 20);
Bram Moolenaar6c9ba042020-06-01 16:09:41 +02004800
4801# ifdef FEAT_EVAL
4802# define FREE_ITEM(item) do { \
4803 if (withattr) \
kylo252ae6f1d82022-02-16 19:24:07 +00004804 dict_unref((dict_T*)(item)); \
Bram Moolenaar6c9ba042020-06-01 16:09:41 +02004805 else \
4806 vim_free(item); \
4807 } while (0)
Bram Moolenaar84cf6bd2020-06-16 20:03:43 +02004808
4809 readdirex_sort = READDIR_SORT_BYTE;
Bram Moolenaar6c9ba042020-06-01 16:09:41 +02004810# else
4811# define FREE_ITEM(item) vim_free(item)
4812# endif
4813
4814# ifdef MSWIN
4815 buf = alloc(MAXPATHL);
4816 if (buf == NULL)
4817 return FAIL;
4818 STRNCPY(buf, path, MAXPATHL-5);
4819 p = buf + STRLEN(buf);
4820 MB_PTR_BACK(buf, p);
4821 if (*p == '\\' || *p == '/')
4822 *p = NUL;
4823 STRCAT(p, "\\*");
4824
4825 wn = enc_to_utf16(buf, NULL);
4826 if (wn != NULL)
4827 hFind = FindFirstFileW(wn, &wfd);
4828 ok = (hFind != INVALID_HANDLE_VALUE);
4829 if (!ok)
4830 {
4831 failed = TRUE;
Bram Moolenaar460ae5d2022-01-01 14:19:49 +00004832 semsg(_(e_cant_open_file_str), path);
Bram Moolenaar6c9ba042020-06-01 16:09:41 +02004833 }
4834 else
4835 {
4836 while (ok)
4837 {
4838 int ignore;
4839 void *item;
4840 WCHAR *wp;
4841
4842 wp = wfd.cFileName;
4843 ignore = wp[0] == L'.' &&
4844 (wp[1] == NUL ||
4845 (wp[1] == L'.' && wp[2] == NUL));
Bram Moolenaarab540322020-06-10 15:55:36 +02004846 if (ignore)
4847 {
4848 ok = FindNextFileW(hFind, &wfd);
4849 continue;
4850 }
Bram Moolenaar6c9ba042020-06-01 16:09:41 +02004851# ifdef FEAT_EVAL
4852 if (withattr)
4853 item = (void*)create_readdirex_item(&wfd);
4854 else
4855# endif
4856 item = (void*)utf16_to_enc(wfd.cFileName, NULL);
4857 if (item == NULL)
4858 {
4859 failed = TRUE;
4860 break;
4861 }
4862
4863 if (!ignore && checkitem != NULL)
4864 {
4865 int r = checkitem(context, item);
4866
4867 if (r < 0)
4868 {
4869 FREE_ITEM(item);
4870 break;
4871 }
4872 if (r == 0)
4873 ignore = TRUE;
4874 }
4875
4876 if (!ignore)
4877 {
4878 if (ga_grow(gap, 1) == OK)
4879 ((void**)gap->ga_data)[gap->ga_len++] = item;
4880 else
4881 {
4882 failed = TRUE;
4883 FREE_ITEM(item);
4884 break;
4885 }
4886 }
4887 else
4888 FREE_ITEM(item);
4889
4890 ok = FindNextFileW(hFind, &wfd);
4891 }
4892 FindClose(hFind);
4893 }
4894
4895 vim_free(buf);
4896 vim_free(wn);
4897# else // MSWIN
4898 dirp = opendir((char *)path);
4899 if (dirp == NULL)
4900 {
4901 failed = TRUE;
Bram Moolenaar460ae5d2022-01-01 14:19:49 +00004902 semsg(_(e_cant_open_file_str), path);
Bram Moolenaar6c9ba042020-06-01 16:09:41 +02004903 }
4904 else
4905 {
4906 for (;;)
4907 {
4908 int ignore;
4909 void *item;
4910
4911 dp = readdir(dirp);
4912 if (dp == NULL)
4913 break;
4914 p = (char_u *)dp->d_name;
4915
4916 ignore = p[0] == '.' &&
4917 (p[1] == NUL ||
4918 (p[1] == '.' && p[2] == NUL));
Bram Moolenaarab540322020-06-10 15:55:36 +02004919 if (ignore)
4920 continue;
Bram Moolenaar6c9ba042020-06-01 16:09:41 +02004921# ifdef FEAT_EVAL
4922 if (withattr)
4923 item = (void*)create_readdirex_item(path, p);
4924 else
4925# endif
4926 item = (void*)vim_strsave(p);
4927 if (item == NULL)
4928 {
4929 failed = TRUE;
4930 break;
4931 }
4932
Bram Moolenaarfe154992022-03-22 20:42:12 +00004933 if (checkitem != NULL)
Bram Moolenaar6c9ba042020-06-01 16:09:41 +02004934 {
4935 int r = checkitem(context, item);
4936
4937 if (r < 0)
4938 {
4939 FREE_ITEM(item);
4940 break;
4941 }
4942 if (r == 0)
4943 ignore = TRUE;
4944 }
4945
4946 if (!ignore)
4947 {
4948 if (ga_grow(gap, 1) == OK)
4949 ((void**)gap->ga_data)[gap->ga_len++] = item;
4950 else
4951 {
4952 failed = TRUE;
4953 FREE_ITEM(item);
4954 break;
4955 }
4956 }
4957 else
4958 FREE_ITEM(item);
4959 }
4960
4961 closedir(dirp);
4962 }
4963# endif // MSWIN
4964
4965# undef FREE_ITEM
4966
Bram Moolenaar84cf6bd2020-06-16 20:03:43 +02004967 if (!failed && gap->ga_len > 0 && sort > READDIR_SORT_NONE)
Bram Moolenaar6c9ba042020-06-01 16:09:41 +02004968 {
4969# ifdef FEAT_EVAL
Bram Moolenaar84cf6bd2020-06-16 20:03:43 +02004970 readdirex_sort = sort;
Bram Moolenaar6c9ba042020-06-01 16:09:41 +02004971 if (withattr)
4972 qsort((void*)gap->ga_data, (size_t)gap->ga_len, sizeof(dict_T*),
4973 compare_readdirex_item);
4974 else
Bram Moolenaar84cf6bd2020-06-16 20:03:43 +02004975 qsort((void*)gap->ga_data, (size_t)gap->ga_len, sizeof(char_u *),
4976 compare_readdir_item);
4977# else
Bram Moolenaar6c9ba042020-06-01 16:09:41 +02004978 sort_strings((char_u **)gap->ga_data, gap->ga_len);
Bram Moolenaar84cf6bd2020-06-16 20:03:43 +02004979# endif
Bram Moolenaar6c9ba042020-06-01 16:09:41 +02004980 }
Bram Moolenaar701ff0a2019-05-24 14:14:14 +02004981
4982 return failed ? FAIL : OK;
4983}
4984
4985/*
Bram Moolenaarda440d22016-01-16 21:27:23 +01004986 * Delete "name" and everything in it, recursively.
Bram Moolenaar701ff0a2019-05-24 14:14:14 +02004987 * return 0 for success, -1 if some file was not deleted.
Bram Moolenaarda440d22016-01-16 21:27:23 +01004988 */
4989 int
4990delete_recursive(char_u *name)
4991{
4992 int result = 0;
Bram Moolenaarda440d22016-01-16 21:27:23 +01004993 int i;
4994 char_u *exp;
Bram Moolenaar701ff0a2019-05-24 14:14:14 +02004995 garray_T ga;
Bram Moolenaarda440d22016-01-16 21:27:23 +01004996
Bram Moolenaar701ff0a2019-05-24 14:14:14 +02004997 // A symbolic link to a directory itself is deleted, not the directory it
4998 // points to.
Bram Moolenaar43a34f92016-01-17 15:56:34 +01004999 if (
Bram Moolenaar4f974752019-02-17 17:44:42 +01005000# if defined(UNIX) || defined(MSWIN)
Bram Moolenaar43a34f92016-01-17 15:56:34 +01005001 mch_isrealdir(name)
Bram Moolenaar203258c2016-01-17 22:15:16 +01005002# else
Bram Moolenaar43a34f92016-01-17 15:56:34 +01005003 mch_isdir(name)
Bram Moolenaar43a34f92016-01-17 15:56:34 +01005004# endif
5005 )
Bram Moolenaarda440d22016-01-16 21:27:23 +01005006 {
Bram Moolenaar701ff0a2019-05-24 14:14:14 +02005007 exp = vim_strsave(name);
Bram Moolenaarda440d22016-01-16 21:27:23 +01005008 if (exp == NULL)
5009 return -1;
Bram Moolenaar84cf6bd2020-06-16 20:03:43 +02005010 if (readdir_core(&ga, exp, FALSE, NULL, NULL, READDIR_SORT_NONE) == OK)
Bram Moolenaarda440d22016-01-16 21:27:23 +01005011 {
Bram Moolenaar701ff0a2019-05-24 14:14:14 +02005012 for (i = 0; i < ga.ga_len; ++i)
5013 {
5014 vim_snprintf((char *)NameBuff, MAXPATHL, "%s/%s", exp,
5015 ((char_u **)ga.ga_data)[i]);
5016 if (delete_recursive(NameBuff) != 0)
zeertzjq47870032022-04-05 15:31:01 +01005017 // Remember the failure but continue deleting any further
5018 // entries.
Bram Moolenaarda440d22016-01-16 21:27:23 +01005019 result = -1;
Bram Moolenaar701ff0a2019-05-24 14:14:14 +02005020 }
5021 ga_clear_strings(&ga);
zeertzjq47870032022-04-05 15:31:01 +01005022 if (mch_rmdir(exp) != 0)
5023 result = -1;
Bram Moolenaarda440d22016-01-16 21:27:23 +01005024 }
5025 else
5026 result = -1;
5027 vim_free(exp);
Bram Moolenaarda440d22016-01-16 21:27:23 +01005028 }
5029 else
5030 result = mch_remove(name) == 0 ? 0 : -1;
5031
5032 return result;
5033}
5034#endif
5035
Bram Moolenaar071d4272004-06-13 20:20:40 +00005036#if defined(TEMPDIRNAMES) || defined(PROTO)
Bram Moolenaar217e1b82019-12-01 21:41:28 +01005037static long temp_count = 0; // Temp filename counter.
Bram Moolenaar071d4272004-06-13 20:20:40 +00005038
Bram Moolenaarb2d0e512020-05-07 18:37:03 +02005039# if defined(UNIX) && defined(HAVE_FLOCK) && defined(HAVE_DIRFD)
5040/*
5041 * Open temporary directory and take file lock to prevent
5042 * to be auto-cleaned.
5043 */
5044 static void
5045vim_opentempdir(void)
5046{
5047 DIR *dp = NULL;
5048
5049 if (vim_tempdir_dp != NULL)
5050 return;
5051
5052 dp = opendir((const char*)vim_tempdir);
5053
5054 if (dp != NULL)
5055 {
5056 vim_tempdir_dp = dp;
5057 flock(dirfd(vim_tempdir_dp), LOCK_SH);
5058 }
5059}
5060
5061/*
5062 * Close temporary directory - it automatically release file lock.
5063 */
5064 static void
5065vim_closetempdir(void)
5066{
5067 if (vim_tempdir_dp != NULL)
5068 {
5069 closedir(vim_tempdir_dp);
5070 vim_tempdir_dp = NULL;
5071 }
5072}
5073# endif
5074
Bram Moolenaar071d4272004-06-13 20:20:40 +00005075/*
5076 * Delete the temp directory and all files it contains.
5077 */
5078 void
Bram Moolenaar78c0b7d2016-01-30 15:52:46 +01005079vim_deltempdir(void)
Bram Moolenaar071d4272004-06-13 20:20:40 +00005080{
Bram Moolenaar071d4272004-06-13 20:20:40 +00005081 if (vim_tempdir != NULL)
5082 {
Bram Moolenaarb2d0e512020-05-07 18:37:03 +02005083# if defined(UNIX) && defined(HAVE_FLOCK) && defined(HAVE_DIRFD)
5084 vim_closetempdir();
5085# endif
Bram Moolenaar217e1b82019-12-01 21:41:28 +01005086 // remove the trailing path separator
Bram Moolenaarda440d22016-01-16 21:27:23 +01005087 gettail(vim_tempdir)[-1] = NUL;
5088 delete_recursive(vim_tempdir);
Bram Moolenaard23a8232018-02-10 18:45:26 +01005089 VIM_CLEAR(vim_tempdir);
Bram Moolenaar071d4272004-06-13 20:20:40 +00005090 }
5091}
Bram Moolenaar071d4272004-06-13 20:20:40 +00005092
5093/*
Bram Moolenaareaf03392009-11-17 11:08:52 +00005094 * Directory "tempdir" was created. Expand this name to a full path and put
5095 * it in "vim_tempdir". This avoids that using ":cd" would confuse us.
5096 * "tempdir" must be no longer than MAXPATHL.
5097 */
5098 static void
Bram Moolenaar78c0b7d2016-01-30 15:52:46 +01005099vim_settempdir(char_u *tempdir)
Bram Moolenaareaf03392009-11-17 11:08:52 +00005100{
5101 char_u *buf;
5102
Bram Moolenaar964b3742019-05-24 18:54:09 +02005103 buf = alloc(MAXPATHL + 2);
Bram Moolenaareaf03392009-11-17 11:08:52 +00005104 if (buf != NULL)
5105 {
5106 if (vim_FullName(tempdir, buf, MAXPATHL, FALSE) == FAIL)
5107 STRCPY(buf, tempdir);
Bram Moolenaara06ecab2016-07-16 14:47:36 +02005108 add_pathsep(buf);
Bram Moolenaareaf03392009-11-17 11:08:52 +00005109 vim_tempdir = vim_strsave(buf);
Bram Moolenaarb2d0e512020-05-07 18:37:03 +02005110# if defined(UNIX) && defined(HAVE_FLOCK) && defined(HAVE_DIRFD)
5111 vim_opentempdir();
5112# endif
Bram Moolenaareaf03392009-11-17 11:08:52 +00005113 vim_free(buf);
5114 }
5115}
Bram Moolenaar4592dee2009-11-18 19:11:58 +00005116#endif
Bram Moolenaareaf03392009-11-17 11:08:52 +00005117
5118/*
Bram Moolenaar071d4272004-06-13 20:20:40 +00005119 * vim_tempname(): Return a unique name that can be used for a temp file.
5120 *
Bram Moolenaar76ae22f2016-06-13 20:00:29 +02005121 * The temp file is NOT guaranteed to be created. If "keep" is FALSE it is
5122 * guaranteed to NOT be created.
Bram Moolenaar071d4272004-06-13 20:20:40 +00005123 *
5124 * The returned pointer is to allocated memory.
5125 * The returned pointer is NULL if no valid name was found.
5126 */
Bram Moolenaar071d4272004-06-13 20:20:40 +00005127 char_u *
Bram Moolenaar78c0b7d2016-01-30 15:52:46 +01005128vim_tempname(
Bram Moolenaar217e1b82019-12-01 21:41:28 +01005129 int extra_char UNUSED, // char to use in the name instead of '?'
Bram Moolenaar78c0b7d2016-01-30 15:52:46 +01005130 int keep UNUSED)
Bram Moolenaar071d4272004-06-13 20:20:40 +00005131{
5132#ifdef USE_TMPNAM
Bram Moolenaar217e1b82019-12-01 21:41:28 +01005133 char_u itmp[L_tmpnam]; // use tmpnam()
Bram Moolenaar4f974752019-02-17 17:44:42 +01005134#elif defined(MSWIN)
Bram Moolenaarec0f50a2019-02-10 23:26:13 +01005135 WCHAR itmp[TEMPNAMELEN];
Bram Moolenaar071d4272004-06-13 20:20:40 +00005136#else
5137 char_u itmp[TEMPNAMELEN];
5138#endif
5139
5140#ifdef TEMPDIRNAMES
5141 static char *(tempdirs[]) = {TEMPDIRNAMES};
5142 int i;
Bram Moolenaar071d4272004-06-13 20:20:40 +00005143# ifndef EEXIST
Bram Moolenaar8767f522016-07-01 17:17:39 +02005144 stat_T st;
Bram Moolenaar071d4272004-06-13 20:20:40 +00005145# endif
5146
5147 /*
5148 * This will create a directory for private use by this instance of Vim.
5149 * This is done once, and the same directory is used for all temp files.
5150 * This method avoids security problems because of symlink attacks et al.
5151 * It's also a bit faster, because we only need to check for an existing
5152 * file when creating the directory and not for each temp file.
5153 */
5154 if (vim_tempdir == NULL)
5155 {
5156 /*
5157 * Try the entries in TEMPDIRNAMES to create the temp directory.
5158 */
K.Takataeeec2542021-06-02 13:28:16 +02005159 for (i = 0; i < (int)ARRAY_LENGTH(tempdirs); ++i)
Bram Moolenaar071d4272004-06-13 20:20:40 +00005160 {
Bram Moolenaareaf03392009-11-17 11:08:52 +00005161# ifndef HAVE_MKDTEMP
Bram Moolenaar2660c0e2010-01-19 14:59:56 +01005162 size_t itmplen;
Bram Moolenaareaf03392009-11-17 11:08:52 +00005163 long nr;
5164 long off;
5165# endif
5166
Bram Moolenaar217e1b82019-12-01 21:41:28 +01005167 // Expand $TMP, leave room for "/v1100000/999999999".
5168 // Skip the directory check if the expansion fails.
Bram Moolenaar071d4272004-06-13 20:20:40 +00005169 expand_env((char_u *)tempdirs[i], itmp, TEMPNAMELEN - 20);
Bram Moolenaare1a61992015-12-03 21:02:27 +01005170 if (itmp[0] != '$' && mch_isdir(itmp))
Bram Moolenaar071d4272004-06-13 20:20:40 +00005171 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01005172 // directory exists
Bram Moolenaara06ecab2016-07-16 14:47:36 +02005173 add_pathsep(itmp);
Bram Moolenaar071d4272004-06-13 20:20:40 +00005174
Bram Moolenaareaf03392009-11-17 11:08:52 +00005175# ifdef HAVE_MKDTEMP
Bram Moolenaar35d88f42016-06-04 14:52:00 +02005176 {
5177# if defined(UNIX) || defined(VMS)
Bram Moolenaar217e1b82019-12-01 21:41:28 +01005178 // Make sure the umask doesn't remove the executable bit.
5179 // "repl" has been reported to use "177".
Bram Moolenaar35d88f42016-06-04 14:52:00 +02005180 mode_t umask_save = umask(077);
5181# endif
Bram Moolenaar217e1b82019-12-01 21:41:28 +01005182 // Leave room for filename
Bram Moolenaar35d88f42016-06-04 14:52:00 +02005183 STRCAT(itmp, "vXXXXXX");
5184 if (mkdtemp((char *)itmp) != NULL)
5185 vim_settempdir(itmp);
5186# if defined(UNIX) || defined(VMS)
5187 (void)umask(umask_save);
5188# endif
5189 }
Bram Moolenaareaf03392009-11-17 11:08:52 +00005190# else
Bram Moolenaar217e1b82019-12-01 21:41:28 +01005191 // Get an arbitrary number of up to 6 digits. When it's
5192 // unlikely that it already exists it will be faster,
5193 // otherwise it doesn't matter. The use of mkdir() avoids any
5194 // security problems because of the predictable number.
Bram Moolenaar071d4272004-06-13 20:20:40 +00005195 nr = (mch_get_pid() + (long)time(NULL)) % 1000000L;
Bram Moolenaar2660c0e2010-01-19 14:59:56 +01005196 itmplen = STRLEN(itmp);
Bram Moolenaar071d4272004-06-13 20:20:40 +00005197
Bram Moolenaar217e1b82019-12-01 21:41:28 +01005198 // Try up to 10000 different values until we find a name that
5199 // doesn't exist.
Bram Moolenaar071d4272004-06-13 20:20:40 +00005200 for (off = 0; off < 10000L; ++off)
5201 {
5202 int r;
Bram Moolenaareaf03392009-11-17 11:08:52 +00005203# if defined(UNIX) || defined(VMS)
Bram Moolenaar071d4272004-06-13 20:20:40 +00005204 mode_t umask_save;
Bram Moolenaareaf03392009-11-17 11:08:52 +00005205# endif
Bram Moolenaar071d4272004-06-13 20:20:40 +00005206
Bram Moolenaareaf03392009-11-17 11:08:52 +00005207 sprintf((char *)itmp + itmplen, "v%ld", nr + off);
5208# ifndef EEXIST
Bram Moolenaar217e1b82019-12-01 21:41:28 +01005209 // If mkdir() does not set errno to EEXIST, check for
5210 // existing file here. There is a race condition then,
5211 // although it's fail-safe.
Bram Moolenaar071d4272004-06-13 20:20:40 +00005212 if (mch_stat((char *)itmp, &st) >= 0)
5213 continue;
Bram Moolenaareaf03392009-11-17 11:08:52 +00005214# endif
5215# if defined(UNIX) || defined(VMS)
Bram Moolenaar217e1b82019-12-01 21:41:28 +01005216 // Make sure the umask doesn't remove the executable bit.
5217 // "repl" has been reported to use "177".
Bram Moolenaar071d4272004-06-13 20:20:40 +00005218 umask_save = umask(077);
Bram Moolenaareaf03392009-11-17 11:08:52 +00005219# endif
Bram Moolenaar071d4272004-06-13 20:20:40 +00005220 r = vim_mkdir(itmp, 0700);
Bram Moolenaareaf03392009-11-17 11:08:52 +00005221# if defined(UNIX) || defined(VMS)
Bram Moolenaar071d4272004-06-13 20:20:40 +00005222 (void)umask(umask_save);
Bram Moolenaareaf03392009-11-17 11:08:52 +00005223# endif
Bram Moolenaar071d4272004-06-13 20:20:40 +00005224 if (r == 0)
5225 {
Bram Moolenaareaf03392009-11-17 11:08:52 +00005226 vim_settempdir(itmp);
Bram Moolenaar071d4272004-06-13 20:20:40 +00005227 break;
5228 }
Bram Moolenaareaf03392009-11-17 11:08:52 +00005229# ifdef EEXIST
Bram Moolenaar217e1b82019-12-01 21:41:28 +01005230 // If the mkdir() didn't fail because the file/dir exists,
5231 // we probably can't create any dir here, try another
5232 // place.
Bram Moolenaar071d4272004-06-13 20:20:40 +00005233 if (errno != EEXIST)
Bram Moolenaareaf03392009-11-17 11:08:52 +00005234# endif
Bram Moolenaar071d4272004-06-13 20:20:40 +00005235 break;
5236 }
Bram Moolenaar217e1b82019-12-01 21:41:28 +01005237# endif // HAVE_MKDTEMP
Bram Moolenaar071d4272004-06-13 20:20:40 +00005238 if (vim_tempdir != NULL)
5239 break;
5240 }
5241 }
5242 }
5243
5244 if (vim_tempdir != NULL)
5245 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01005246 // There is no need to check if the file exists, because we own the
5247 // directory and nobody else creates a file in it.
Bram Moolenaar071d4272004-06-13 20:20:40 +00005248 sprintf((char *)itmp, "%s%ld", vim_tempdir, temp_count++);
5249 return vim_strsave(itmp);
5250 }
5251
5252 return NULL;
5253
Bram Moolenaar217e1b82019-12-01 21:41:28 +01005254#else // TEMPDIRNAMES
Bram Moolenaar071d4272004-06-13 20:20:40 +00005255
Bram Moolenaar4f974752019-02-17 17:44:42 +01005256# ifdef MSWIN
Bram Moolenaarec0f50a2019-02-10 23:26:13 +01005257 WCHAR wszTempFile[_MAX_PATH + 1];
5258 WCHAR buf4[4];
Bram Moolenaar2472a742020-11-26 19:47:28 +01005259 WCHAR *chartab = L"0123456789ABCDEFGHIJKLMNOPQRSTUVWXYZ";
Bram Moolenaar071d4272004-06-13 20:20:40 +00005260 char_u *retval;
5261 char_u *p;
Mike Williamsa3d1b292021-06-30 20:56:00 +02005262 char_u *shname;
Bram Moolenaar2472a742020-11-26 19:47:28 +01005263 long i;
Bram Moolenaar071d4272004-06-13 20:20:40 +00005264
Bram Moolenaarec0f50a2019-02-10 23:26:13 +01005265 wcscpy(itmp, L"");
5266 if (GetTempPathW(_MAX_PATH, wszTempFile) == 0)
Bram Moolenaarb1891912011-02-09 14:47:03 +01005267 {
Bram Moolenaarec0f50a2019-02-10 23:26:13 +01005268 wszTempFile[0] = L'.'; // GetTempPathW() failed, use current dir
Bram Moolenaar2472a742020-11-26 19:47:28 +01005269 wszTempFile[1] = L'\\';
5270 wszTempFile[2] = NUL;
Bram Moolenaarb1891912011-02-09 14:47:03 +01005271 }
Bram Moolenaarec0f50a2019-02-10 23:26:13 +01005272 wcscpy(buf4, L"VIM");
Bram Moolenaar2472a742020-11-26 19:47:28 +01005273
5274 // randomize the name to avoid collisions
5275 i = mch_get_pid() + extra_char;
5276 buf4[1] = chartab[i % 36];
5277 buf4[2] = chartab[101 * i % 36];
Bram Moolenaarec0f50a2019-02-10 23:26:13 +01005278 if (GetTempFileNameW(wszTempFile, buf4, 0, itmp) == 0)
Bram Moolenaar071d4272004-06-13 20:20:40 +00005279 return NULL;
Bram Moolenaare5c421c2015-03-31 13:33:08 +02005280 if (!keep)
Bram Moolenaarec0f50a2019-02-10 23:26:13 +01005281 // GetTempFileName() will create the file, we don't want that
5282 (void)DeleteFileW(itmp);
Bram Moolenaar071d4272004-06-13 20:20:40 +00005283
Bram Moolenaarec0f50a2019-02-10 23:26:13 +01005284 // Backslashes in a temp file name cause problems when filtering with
5285 // "sh". NOTE: This also checks 'shellcmdflag' to help those people who
Mike Williams12795022021-06-28 20:53:58 +02005286 // didn't set 'shellslash' but only if not using PowerShell.
Bram Moolenaarec0f50a2019-02-10 23:26:13 +01005287 retval = utf16_to_enc(itmp, NULL);
Mike Williamsa3d1b292021-06-30 20:56:00 +02005288 shname = gettail(p_sh);
5289 if ((*p_shcf == '-' && !(strstr((char *)shname, "powershell") != NULL
5290 || strstr((char *)shname, "pwsh") != NULL ))
5291 || p_ssl)
Bram Moolenaar071d4272004-06-13 20:20:40 +00005292 for (p = retval; *p; ++p)
5293 if (*p == '\\')
5294 *p = '/';
5295 return retval;
5296
Bram Moolenaar4f974752019-02-17 17:44:42 +01005297# else // MSWIN
Bram Moolenaar071d4272004-06-13 20:20:40 +00005298
5299# ifdef USE_TMPNAM
Bram Moolenaar95474ca2011-02-09 16:44:51 +01005300 char_u *p;
5301
Bram Moolenaar217e1b82019-12-01 21:41:28 +01005302 // tmpnam() will make its own name
Bram Moolenaar95474ca2011-02-09 16:44:51 +01005303 p = tmpnam((char *)itmp);
5304 if (p == NULL || *p == NUL)
Bram Moolenaar071d4272004-06-13 20:20:40 +00005305 return NULL;
5306# else
5307 char_u *p;
5308
5309# ifdef VMS_TEMPNAM
Bram Moolenaar217e1b82019-12-01 21:41:28 +01005310 // mktemp() is not working on VMS. It seems to be
5311 // a do-nothing function. Therefore we use tempnam().
Bram Moolenaar071d4272004-06-13 20:20:40 +00005312 sprintf((char *)itmp, "VIM%c", extra_char);
5313 p = (char_u *)tempnam("tmp:", (char *)itmp);
5314 if (p != NULL)
5315 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01005316 // VMS will use '.LIS' if we don't explicitly specify an extension,
5317 // and VIM will then be unable to find the file later
Bram Moolenaar071d4272004-06-13 20:20:40 +00005318 STRCPY(itmp, p);
5319 STRCAT(itmp, ".txt");
5320 free(p);
5321 }
5322 else
5323 return NULL;
5324# else
5325 STRCPY(itmp, TEMPNAME);
5326 if ((p = vim_strchr(itmp, '?')) != NULL)
5327 *p = extra_char;
5328 if (mktemp((char *)itmp) == NULL)
5329 return NULL;
5330# endif
5331# endif
5332
5333 return vim_strsave(itmp);
Bram Moolenaar4f974752019-02-17 17:44:42 +01005334# endif // MSWIN
Bram Moolenaar217e1b82019-12-01 21:41:28 +01005335#endif // TEMPDIRNAMES
Bram Moolenaar071d4272004-06-13 20:20:40 +00005336}
5337
5338#if defined(BACKSLASH_IN_FILENAME) || defined(PROTO)
5339/*
Bram Moolenaarb4f6a462015-10-13 19:43:17 +02005340 * Convert all backslashes in fname to forward slashes in-place, unless when
5341 * it looks like a URL.
Bram Moolenaar071d4272004-06-13 20:20:40 +00005342 */
5343 void
Bram Moolenaar78c0b7d2016-01-30 15:52:46 +01005344forward_slash(char_u *fname)
Bram Moolenaar071d4272004-06-13 20:20:40 +00005345{
5346 char_u *p;
5347
Bram Moolenaarb4f6a462015-10-13 19:43:17 +02005348 if (path_with_url(fname))
5349 return;
Bram Moolenaar071d4272004-06-13 20:20:40 +00005350 for (p = fname; *p != NUL; ++p)
Bram Moolenaar217e1b82019-12-01 21:41:28 +01005351 // The Big5 encoding can have '\' in the trail byte.
Bram Moolenaar0fa313a2005-08-10 21:07:57 +00005352 if (enc_dbcs != 0 && (*mb_ptr2len)(p) > 1)
Bram Moolenaar071d4272004-06-13 20:20:40 +00005353 ++p;
Bram Moolenaar13505972019-01-24 15:04:48 +01005354 else if (*p == '\\')
Bram Moolenaar071d4272004-06-13 20:20:40 +00005355 *p = '/';
5356}
5357#endif
5358
Bram Moolenaarf30e74c2006-08-16 17:35:00 +00005359/*
Bram Moolenaar748bf032005-02-02 23:04:36 +00005360 * Try matching a filename with a "pattern" ("prog" is NULL), or use the
5361 * precompiled regprog "prog" ("pattern" is NULL). That avoids calling
5362 * vim_regcomp() often.
Bram Moolenaar071d4272004-06-13 20:20:40 +00005363 * Used for autocommands and 'wildignore'.
5364 * Returns TRUE if there is a match, FALSE otherwise.
5365 */
Bram Moolenaar3e460fd2019-01-26 16:21:07 +01005366 int
Bram Moolenaar78c0b7d2016-01-30 15:52:46 +01005367match_file_pat(
Bram Moolenaar217e1b82019-12-01 21:41:28 +01005368 char_u *pattern, // pattern to match with
5369 regprog_T **prog, // pre-compiled regprog or NULL
5370 char_u *fname, // full path of file name
5371 char_u *sfname, // short file name or NULL
5372 char_u *tail, // tail of path
5373 int allow_dirs) // allow matching with dir
Bram Moolenaar071d4272004-06-13 20:20:40 +00005374{
5375 regmatch_T regmatch;
5376 int result = FALSE;
Bram Moolenaar071d4272004-06-13 20:20:40 +00005377
Bram Moolenaar217e1b82019-12-01 21:41:28 +01005378 regmatch.rm_ic = p_fic; // ignore case if 'fileignorecase' is set
Bram Moolenaar49a6ed82015-01-07 14:43:39 +01005379 if (prog != NULL)
5380 regmatch.regprog = *prog;
Bram Moolenaar071d4272004-06-13 20:20:40 +00005381 else
Bram Moolenaar49a6ed82015-01-07 14:43:39 +01005382 regmatch.regprog = vim_regcomp(pattern, RE_MAGIC);
Bram Moolenaar071d4272004-06-13 20:20:40 +00005383
5384 /*
5385 * Try for a match with the pattern with:
5386 * 1. the full file name, when the pattern has a '/'.
5387 * 2. the short file name, when the pattern has a '/'.
5388 * 3. the tail of the file name, when the pattern has no '/'.
5389 */
Bram Moolenaar49a6ed82015-01-07 14:43:39 +01005390 if (regmatch.regprog != NULL
Bram Moolenaar071d4272004-06-13 20:20:40 +00005391 && ((allow_dirs
5392 && (vim_regexec(&regmatch, fname, (colnr_T)0)
5393 || (sfname != NULL
5394 && vim_regexec(&regmatch, sfname, (colnr_T)0))))
Bram Moolenaar49a6ed82015-01-07 14:43:39 +01005395 || (!allow_dirs && vim_regexec(&regmatch, tail, (colnr_T)0))))
Bram Moolenaar071d4272004-06-13 20:20:40 +00005396 result = TRUE;
5397
Bram Moolenaardffa5b82014-11-19 16:38:07 +01005398 if (prog != NULL)
5399 *prog = regmatch.regprog;
5400 else
Bram Moolenaar473de612013-06-08 18:19:48 +02005401 vim_regfree(regmatch.regprog);
Bram Moolenaar071d4272004-06-13 20:20:40 +00005402 return result;
5403}
Bram Moolenaar071d4272004-06-13 20:20:40 +00005404
5405#if defined(FEAT_WILDIGN) || defined(PROTO)
5406/*
5407 * Return TRUE if a file matches with a pattern in "list".
5408 * "list" is a comma-separated list of patterns, like 'wildignore'.
5409 * "sfname" is the short file name or NULL, "ffname" the long file name.
5410 */
5411 int
Bram Moolenaar78c0b7d2016-01-30 15:52:46 +01005412match_file_list(char_u *list, char_u *sfname, char_u *ffname)
Bram Moolenaar071d4272004-06-13 20:20:40 +00005413{
5414 char_u buf[100];
5415 char_u *tail;
5416 char_u *regpat;
5417 char allow_dirs;
5418 int match;
5419 char_u *p;
5420
5421 tail = gettail(sfname);
5422
Bram Moolenaar217e1b82019-12-01 21:41:28 +01005423 // try all patterns in 'wildignore'
Bram Moolenaar071d4272004-06-13 20:20:40 +00005424 p = list;
5425 while (*p)
5426 {
5427 copy_option_part(&p, buf, 100, ",");
5428 regpat = file_pat_to_reg_pat(buf, NULL, &allow_dirs, FALSE);
5429 if (regpat == NULL)
5430 break;
Bram Moolenaar748bf032005-02-02 23:04:36 +00005431 match = match_file_pat(regpat, NULL, ffname, sfname,
5432 tail, (int)allow_dirs);
Bram Moolenaar071d4272004-06-13 20:20:40 +00005433 vim_free(regpat);
5434 if (match)
5435 return TRUE;
5436 }
5437 return FALSE;
5438}
5439#endif
5440
5441/*
5442 * Convert the given pattern "pat" which has shell style wildcards in it, into
5443 * a regular expression, and return the result in allocated memory. If there
5444 * is a directory path separator to be matched, then TRUE is put in
5445 * allow_dirs, otherwise FALSE is put there -- webb.
5446 * Handle backslashes before special characters, like "\*" and "\ ".
5447 *
Bram Moolenaar071d4272004-06-13 20:20:40 +00005448 * Returns NULL when out of memory.
5449 */
Bram Moolenaar071d4272004-06-13 20:20:40 +00005450 char_u *
Bram Moolenaar78c0b7d2016-01-30 15:52:46 +01005451file_pat_to_reg_pat(
5452 char_u *pat,
Bram Moolenaar217e1b82019-12-01 21:41:28 +01005453 char_u *pat_end, // first char after pattern or NULL
5454 char *allow_dirs, // Result passed back out in here
5455 int no_bslash UNUSED) // Don't use a backward slash as pathsep
Bram Moolenaar071d4272004-06-13 20:20:40 +00005456{
Bram Moolenaar217e1b82019-12-01 21:41:28 +01005457 int size = 2; // '^' at start, '$' at end
Bram Moolenaar071d4272004-06-13 20:20:40 +00005458 char_u *endp;
5459 char_u *reg_pat;
5460 char_u *p;
5461 int i;
5462 int nested = 0;
5463 int add_dollar = TRUE;
Bram Moolenaar071d4272004-06-13 20:20:40 +00005464
5465 if (allow_dirs != NULL)
5466 *allow_dirs = FALSE;
5467 if (pat_end == NULL)
5468 pat_end = pat + STRLEN(pat);
5469
Bram Moolenaar071d4272004-06-13 20:20:40 +00005470 for (p = pat; p < pat_end; p++)
5471 {
5472 switch (*p)
5473 {
5474 case '*':
5475 case '.':
5476 case ',':
5477 case '{':
5478 case '}':
5479 case '~':
Bram Moolenaar217e1b82019-12-01 21:41:28 +01005480 size += 2; // extra backslash
Bram Moolenaar071d4272004-06-13 20:20:40 +00005481 break;
5482#ifdef BACKSLASH_IN_FILENAME
5483 case '\\':
5484 case '/':
Bram Moolenaar217e1b82019-12-01 21:41:28 +01005485 size += 4; // could become "[\/]"
Bram Moolenaar071d4272004-06-13 20:20:40 +00005486 break;
5487#endif
5488 default:
5489 size++;
Bram Moolenaar0fa313a2005-08-10 21:07:57 +00005490 if (enc_dbcs != 0 && (*mb_ptr2len)(p) > 1)
Bram Moolenaar071d4272004-06-13 20:20:40 +00005491 {
5492 ++p;
5493 ++size;
5494 }
Bram Moolenaar071d4272004-06-13 20:20:40 +00005495 break;
5496 }
5497 }
5498 reg_pat = alloc(size + 1);
5499 if (reg_pat == NULL)
5500 return NULL;
5501
Bram Moolenaar071d4272004-06-13 20:20:40 +00005502 i = 0;
Bram Moolenaar071d4272004-06-13 20:20:40 +00005503
5504 if (pat[0] == '*')
5505 while (pat[0] == '*' && pat < pat_end - 1)
5506 pat++;
5507 else
5508 reg_pat[i++] = '^';
5509 endp = pat_end - 1;
Bram Moolenaar8fee8782015-08-11 18:45:48 +02005510 if (endp >= pat && *endp == '*')
Bram Moolenaar071d4272004-06-13 20:20:40 +00005511 {
5512 while (endp - pat > 0 && *endp == '*')
5513 endp--;
5514 add_dollar = FALSE;
5515 }
5516 for (p = pat; *p && nested >= 0 && p <= endp; p++)
5517 {
5518 switch (*p)
5519 {
5520 case '*':
5521 reg_pat[i++] = '.';
5522 reg_pat[i++] = '*';
Bram Moolenaar217e1b82019-12-01 21:41:28 +01005523 while (p[1] == '*') // "**" matches like "*"
Bram Moolenaar02743632005-07-25 20:42:36 +00005524 ++p;
Bram Moolenaar071d4272004-06-13 20:20:40 +00005525 break;
5526 case '.':
Bram Moolenaar071d4272004-06-13 20:20:40 +00005527 case '~':
5528 reg_pat[i++] = '\\';
5529 reg_pat[i++] = *p;
5530 break;
5531 case '?':
Bram Moolenaar071d4272004-06-13 20:20:40 +00005532 reg_pat[i++] = '.';
5533 break;
5534 case '\\':
5535 if (p[1] == NUL)
5536 break;
5537#ifdef BACKSLASH_IN_FILENAME
5538 if (!no_bslash)
5539 {
Bram Moolenaar217e1b82019-12-01 21:41:28 +01005540 // translate:
5541 // "\x" to "\\x" e.g., "dir\file"
5542 // "\*" to "\\.*" e.g., "dir\*.c"
5543 // "\?" to "\\." e.g., "dir\??.c"
5544 // "\+" to "\+" e.g., "fileX\+.c"
Bram Moolenaar071d4272004-06-13 20:20:40 +00005545 if ((vim_isfilec(p[1]) || p[1] == '*' || p[1] == '?')
5546 && p[1] != '+')
5547 {
5548 reg_pat[i++] = '[';
5549 reg_pat[i++] = '\\';
5550 reg_pat[i++] = '/';
5551 reg_pat[i++] = ']';
5552 if (allow_dirs != NULL)
5553 *allow_dirs = TRUE;
5554 break;
5555 }
5556 }
5557#endif
Bram Moolenaar217e1b82019-12-01 21:41:28 +01005558 // Undo escaping from ExpandEscape():
5559 // foo\?bar -> foo?bar
5560 // foo\%bar -> foo%bar
5561 // foo\,bar -> foo,bar
5562 // foo\ bar -> foo bar
5563 // Don't unescape \, * and others that are also special in a
5564 // regexp.
5565 // An escaped { must be unescaped since we use magic not
5566 // verymagic. Use "\\\{n,m\}"" to get "\{n,m}".
Bram Moolenaar071d4272004-06-13 20:20:40 +00005567 if (*++p == '?'
5568#ifdef BACKSLASH_IN_FILENAME
5569 && no_bslash
5570#endif
5571 )
5572 reg_pat[i++] = '?';
5573 else
Bram Moolenaarf4e11432013-07-03 16:53:03 +02005574 if (*p == ',' || *p == '%' || *p == '#'
Bram Moolenaar2288afe2015-08-11 16:20:05 +02005575 || vim_isspace(*p) || *p == '{' || *p == '}')
Bram Moolenaar8cd213c2010-06-01 21:57:09 +02005576 reg_pat[i++] = *p;
Bram Moolenaara946afe2013-08-02 15:22:39 +02005577 else if (*p == '\\' && p[1] == '\\' && p[2] == '{')
5578 {
5579 reg_pat[i++] = '\\';
5580 reg_pat[i++] = '{';
5581 p += 2;
5582 }
Bram Moolenaar071d4272004-06-13 20:20:40 +00005583 else
5584 {
5585 if (allow_dirs != NULL && vim_ispathsep(*p)
5586#ifdef BACKSLASH_IN_FILENAME
5587 && (!no_bslash || *p != '\\')
5588#endif
5589 )
5590 *allow_dirs = TRUE;
5591 reg_pat[i++] = '\\';
5592 reg_pat[i++] = *p;
5593 }
5594 break;
5595#ifdef BACKSLASH_IN_FILENAME
5596 case '/':
5597 reg_pat[i++] = '[';
5598 reg_pat[i++] = '\\';
5599 reg_pat[i++] = '/';
5600 reg_pat[i++] = ']';
5601 if (allow_dirs != NULL)
5602 *allow_dirs = TRUE;
5603 break;
5604#endif
5605 case '{':
5606 reg_pat[i++] = '\\';
5607 reg_pat[i++] = '(';
5608 nested++;
5609 break;
5610 case '}':
5611 reg_pat[i++] = '\\';
5612 reg_pat[i++] = ')';
5613 --nested;
5614 break;
5615 case ',':
5616 if (nested)
5617 {
5618 reg_pat[i++] = '\\';
5619 reg_pat[i++] = '|';
5620 }
5621 else
5622 reg_pat[i++] = ',';
5623 break;
5624 default:
Bram Moolenaar0fa313a2005-08-10 21:07:57 +00005625 if (enc_dbcs != 0 && (*mb_ptr2len)(p) > 1)
Bram Moolenaar071d4272004-06-13 20:20:40 +00005626 reg_pat[i++] = *p++;
Bram Moolenaar13505972019-01-24 15:04:48 +01005627 else if (allow_dirs != NULL && vim_ispathsep(*p))
Bram Moolenaar071d4272004-06-13 20:20:40 +00005628 *allow_dirs = TRUE;
5629 reg_pat[i++] = *p;
5630 break;
5631 }
5632 }
5633 if (add_dollar)
5634 reg_pat[i++] = '$';
5635 reg_pat[i] = NUL;
5636 if (nested != 0)
5637 {
5638 if (nested < 0)
Bram Moolenaar6d057012021-12-31 18:49:43 +00005639 emsg(_(e_missing_open_curly));
Bram Moolenaar071d4272004-06-13 20:20:40 +00005640 else
Bram Moolenaar6d057012021-12-31 18:49:43 +00005641 emsg(_(e_missing_close_curly));
Bram Moolenaard23a8232018-02-10 18:45:26 +01005642 VIM_CLEAR(reg_pat);
Bram Moolenaar071d4272004-06-13 20:20:40 +00005643 }
5644 return reg_pat;
5645}
Bram Moolenaar540fc6f2010-12-17 16:27:16 +01005646
5647#if defined(EINTR) || defined(PROTO)
/*
 * Like vim_read(), but try again when the call was interrupted by a signal
 * (errno is EINTR, possibly caused by a SIGWINCH).
 * Returns the result of the last vim_read() call.
 */
    long
read_eintr(int fd, void *buf, size_t bufsize)
{
    long	nread;

    do
	nread = vim_read(fd, buf, bufsize);
    while (nread < 0 && errno == EINTR);

    return nread;
}
5665
/*
 * Like vim_write(), but keep writing until all "bufsize" bytes were written
 * or writing failed.  A write that was interrupted by a signal (errno is
 * EINTR, possibly caused by a SIGWINCH) is tried again.
 * Returns the number of bytes that were written, which is less than "bufsize"
 * when writing failed.
 */
    long
write_eintr(int fd, void *buf, size_t bufsize)
{
    long	written = 0;

    while (written < (long)bufsize)
    {
	long	n = vim_write(fd, (char *)buf + written, bufsize - written);

	if (n >= 0)
	{
	    // Possibly a partial write, continue after what was written.
	    written += n;
	    continue;
	}

	// Give up on a real error, only retry after an interrupt.
	if (errno != EINTR)
	    break;
    }

    return written;
}
5691#endif