Bram Moolenaar | 1d94f9b | 2005-08-04 21:29:45 +0000 | [diff] [blame] | 1 | " Vim script for checking .po files. |
| 2 | " |
Bram Moolenaar | 595f51c | 2008-06-09 12:46:00 +0000 | [diff] [blame] | 3 | " Go through the file and verify that: |
| 4 | " - All %...s items in "msgid" are identical to the ones in "msgstr". |
| 5 | " - An error or warning code in "msgid" matches the one in "msgstr". |
Bram Moolenaar | 1d94f9b | 2005-08-04 21:29:45 +0000 | [diff] [blame] | 6 | |
| 7 | if 1 " Only execute this if the eval feature is available. |
| 8 | |
Bram Moolenaar | 78ee625 | 2023-05-28 18:39:55 +0100 | [diff] [blame] | 9 | " using line continuation |
| 10 | set cpo&vim |
| 11 | |
Bram Moolenaar | 1d94f9b | 2005-08-04 21:29:45 +0000 | [diff] [blame] | 12 | " Function to get a split line at the cursor. |
| 13 | " Used for both msgid and msgstr lines. |
| 14 | " Removes all text except % items and returns the result. |
| 15 | func! GetMline() |
| 16 | let idline = substitute(getline('.'), '"\(.*\)"$', '\1', '') |
| 17 | while line('.') < line('$') |
| 18 | + |
| 19 | let line = getline('.') |
| 20 | if line[0] != '"' |
| 21 | break |
| 22 | endif |
| 23 | let idline .= substitute(line, '"\(.*\)"$', '\1', '') |
| 24 | endwhile |
| 25 | |
Bram Moolenaar | a5792f5 | 2005-11-23 21:25:05 +0000 | [diff] [blame] | 26 | " remove '%', not used for formatting. |
| 27 | let idline = substitute(idline, "'%'", '', 'g') |
Bram Moolenaar | 0b8cf27 | 2020-08-30 19:42:06 +0200 | [diff] [blame] | 28 | let idline = substitute(idline, "%%", '', 'g') |
Bram Moolenaar | a5792f5 | 2005-11-23 21:25:05 +0000 | [diff] [blame] | 29 | |
Bram Moolenaar | 1c6136a | 2009-09-11 11:00:05 +0000 | [diff] [blame] | 30 | " remove '%' used for plural forms. |
| 31 | let idline = substitute(idline, '\\nPlural-Forms: .\+;\\n', '', '') |
| 32 | |
Bram Moolenaar | 1d94f9b | 2005-08-04 21:29:45 +0000 | [diff] [blame] | 33 | " remove everything but % items. |
| 34 | return substitute(idline, '[^%]*\(%[-+ #''.0-9*]*l\=[dsuxXpoc%]\)\=', '\1', 'g') |
| 35 | endfunc |
| 36 | |
Bram Moolenaar | ec42059 | 2016-08-26 15:51:53 +0200 | [diff] [blame] | 37 | " This only works when 'wrapscan' is not set. |
Bram Moolenaar | a411e5d | 2010-08-04 15:47:08 +0200 | [diff] [blame] | 38 | let s:save_wrapscan = &wrapscan |
Bram Moolenaar | ec42059 | 2016-08-26 15:51:53 +0200 | [diff] [blame] | 39 | set nowrapscan |
Bram Moolenaar | a411e5d | 2010-08-04 15:47:08 +0200 | [diff] [blame] | 40 | |
Bram Moolenaar | 1d94f9b | 2005-08-04 21:29:45 +0000 | [diff] [blame] | 41 | " Start at the first "msgid" line. |
Bram Moolenaar | 7f93703 | 2017-07-19 14:34:42 +0200 | [diff] [blame] | 42 | let wsv = winsaveview() |
Bram Moolenaar | 1d94f9b | 2005-08-04 21:29:45 +0000 | [diff] [blame] | 43 | 1 |
Bram Moolenaar | 8a37047 | 2022-05-22 15:28:31 +0100 | [diff] [blame] | 44 | keeppatterns /^msgid\> |
Bram Moolenaar | ec42059 | 2016-08-26 15:51:53 +0200 | [diff] [blame] | 45 | |
| 46 | " When an error is detected this is set to the line number. |
| 47 | " Note: this is used in the Makefile. |
Bram Moolenaar | 1d94f9b | 2005-08-04 21:29:45 +0000 | [diff] [blame] | 48 | let error = 0 |
| 49 | |
| 50 | while 1 |
Bram Moolenaar | e53ec39 | 2019-11-16 18:49:50 +0100 | [diff] [blame] | 51 | let lnum = line('.') |
| 52 | if getline(lnum) =~ 'msgid "Text;.*;"' |
| 53 | if getline(lnum + 1) !~ '^msgstr "\([^;]\+;\)\+"' |
| 54 | echomsg 'Mismatching ; in line ' . (lnum + 1) |
| 55 | echomsg 'Did you forget the trailing semicolon?' |
| 56 | if error == 0 |
| 57 | let error = lnum + 1 |
| 58 | endif |
| 59 | endif |
| 60 | endif |
| 61 | |
Bram Moolenaar | 1d94f9b | 2005-08-04 21:29:45 +0000 | [diff] [blame] | 62 | if getline(line('.') - 1) !~ "no-c-format" |
Bram Moolenaar | ec42059 | 2016-08-26 15:51:53 +0200 | [diff] [blame] | 63 | " go over the "msgid" and "msgid_plural" lines |
| 64 | let prevfromline = 'foobar' |
Bram Moolenaar | 78ee625 | 2023-05-28 18:39:55 +0100 | [diff] [blame] | 65 | let plural = 0 |
Bram Moolenaar | ec42059 | 2016-08-26 15:51:53 +0200 | [diff] [blame] | 66 | while 1 |
Bram Moolenaar | 78ee625 | 2023-05-28 18:39:55 +0100 | [diff] [blame] | 67 | if getline('.') =~ 'msgid_plural' |
| 68 | let plural += 1 |
| 69 | endif |
Bram Moolenaar | ec42059 | 2016-08-26 15:51:53 +0200 | [diff] [blame] | 70 | let fromline = GetMline() |
| 71 | if prevfromline != 'foobar' && prevfromline != fromline |
Bram Moolenaar | 78ee625 | 2023-05-28 18:39:55 +0100 | [diff] [blame] | 72 | \ && (plural != 1 |
| 73 | \ || count(prevfromline, '%') + 1 != count(fromline, '%')) |
Bram Moolenaar | ec42059 | 2016-08-26 15:51:53 +0200 | [diff] [blame] | 74 | echomsg 'Mismatching % in line ' . (line('.') - 1) |
| 75 | echomsg 'msgid: ' . prevfromline |
Bram Moolenaar | 78ee625 | 2023-05-28 18:39:55 +0100 | [diff] [blame] | 76 | echomsg 'msgid: ' . fromline |
Bram Moolenaar | ec42059 | 2016-08-26 15:51:53 +0200 | [diff] [blame] | 77 | if error == 0 |
| 78 | let error = line('.') |
| 79 | endif |
| 80 | endif |
| 81 | if getline('.') !~ 'msgid_plural' |
| 82 | break |
| 83 | endif |
| 84 | let prevfromline = fromline |
| 85 | endwhile |
| 86 | |
Bram Moolenaar | 1d94f9b | 2005-08-04 21:29:45 +0000 | [diff] [blame] | 87 | if getline('.') !~ '^msgstr' |
Bram Moolenaar | ec42059 | 2016-08-26 15:51:53 +0200 | [diff] [blame] | 88 | echomsg 'Missing "msgstr" in line ' . line('.') |
| 89 | if error == 0 |
| 90 | let error = line('.') |
| 91 | endif |
Bram Moolenaar | 1d94f9b | 2005-08-04 21:29:45 +0000 | [diff] [blame] | 92 | endif |
Bram Moolenaar | ec42059 | 2016-08-26 15:51:53 +0200 | [diff] [blame] | 93 | |
| 94 | " check all the 'msgstr' lines |
| 95 | while getline('.') =~ '^msgstr' |
| 96 | let toline = GetMline() |
| 97 | if fromline != toline |
Bram Moolenaar | 78ee625 | 2023-05-28 18:39:55 +0100 | [diff] [blame] | 98 | \ && (plural == 0 || count(fromline, '%') != count(toline, '%') + 1) |
Bram Moolenaar | ec42059 | 2016-08-26 15:51:53 +0200 | [diff] [blame] | 99 | echomsg 'Mismatching % in line ' . (line('.') - 1) |
| 100 | echomsg 'msgid: ' . fromline |
| 101 | echomsg 'msgstr: ' . toline |
| 102 | if error == 0 |
| 103 | let error = line('.') |
| 104 | endif |
| 105 | endif |
| 106 | if line('.') == line('$') |
| 107 | break |
| 108 | endif |
| 109 | endwhile |
Bram Moolenaar | 1d94f9b | 2005-08-04 21:29:45 +0000 | [diff] [blame] | 110 | endif |
| 111 | |
Bram Moolenaar | ec42059 | 2016-08-26 15:51:53 +0200 | [diff] [blame] | 112 | " Find next msgid. Quit when there is no more. |
| 113 | let lnum = line('.') |
Bram Moolenaar | 8a37047 | 2022-05-22 15:28:31 +0100 | [diff] [blame] | 114 | silent! keeppatterns /^msgid\> |
Bram Moolenaar | ec42059 | 2016-08-26 15:51:53 +0200 | [diff] [blame] | 115 | if line('.') == lnum |
Bram Moolenaar | 1d94f9b | 2005-08-04 21:29:45 +0000 | [diff] [blame] | 116 | break |
| 117 | endif |
| 118 | endwhile |
| 119 | |
Bram Moolenaar | 595f51c | 2008-06-09 12:46:00 +0000 | [diff] [blame] | 120 | " Check that error code in msgid matches the one in msgstr. |
| 121 | " |
| 122 | " Examples of mismatches found with msgid "E123: ..." |
| 123 | " - msgstr "E321: ..." error code mismatch |
| 124 | " - msgstr "W123: ..." warning instead of error |
| 125 | " - msgstr "E123 ..." missing colon |
| 126 | " - msgstr "..." missing error code |
| 127 | " |
| 128 | 1 |
| 129 | if search('msgid "\("\n"\)\?\([EW][0-9]\+:\).*\nmsgstr "\("\n"\)\?[^"]\@=\2\@!') > 0 |
Bram Moolenaar | ec42059 | 2016-08-26 15:51:53 +0200 | [diff] [blame] | 130 | echomsg 'Mismatching error/warning code in line ' . line('.') |
| 131 | if error == 0 |
| 132 | let error = line('.') |
| 133 | endif |
Bram Moolenaar | 595f51c | 2008-06-09 12:46:00 +0000 | [diff] [blame] | 134 | endif |
| 135 | |
Bram Moolenaar | 7f93703 | 2017-07-19 14:34:42 +0200 | [diff] [blame] | 136 | func! CountNl(first, last) |
| 137 | let nl = 0 |
| 138 | for lnum in range(a:first, a:last) |
Bram Moolenaar | 9966b21 | 2017-07-28 16:46:57 +0200 | [diff] [blame] | 139 | let nl += count(getline(lnum), "\n") |
Bram Moolenaar | 7f93703 | 2017-07-19 14:34:42 +0200 | [diff] [blame] | 140 | endfor |
| 141 | return nl |
| 142 | endfunc |
| 143 | |
Bram Moolenaar | 9966b21 | 2017-07-28 16:46:57 +0200 | [diff] [blame] | 144 | " Check that the \n at the end of the msgid line is also present in the msgstr |
Bram Moolenaar | 7f93703 | 2017-07-19 14:34:42 +0200 | [diff] [blame] | 145 | " line. Skip over the header. |
Bram Moolenaar | b07bbb0 | 2018-04-30 15:45:17 +0200 | [diff] [blame] | 146 | 1 |
Bram Moolenaar | 8a37047 | 2022-05-22 15:28:31 +0100 | [diff] [blame] | 147 | keeppatterns /^"MIME-Version: |
Bram Moolenaar | 7f93703 | 2017-07-19 14:34:42 +0200 | [diff] [blame] | 148 | while 1 |
| 149 | let lnum = search('^msgid\>') |
| 150 | if lnum <= 0 |
| 151 | break |
| 152 | endif |
| 153 | let strlnum = search('^msgstr\>') |
| 154 | let end = search('^$') |
| 155 | if end <= 0 |
| 156 | let end = line('$') + 1 |
| 157 | endif |
| 158 | let origcount = CountNl(lnum, strlnum - 1) |
| 159 | let transcount = CountNl(strlnum, end - 1) |
| 160 | " Allow for a few more or less line breaks when there are 2 or more |
| 161 | if origcount != transcount && (origcount <= 2 || transcount <= 2) |
Bram Moolenaar | 9966b21 | 2017-07-28 16:46:57 +0200 | [diff] [blame] | 162 | echomsg 'Mismatching "\n" in line ' . line('.') |
Bram Moolenaar | 7f93703 | 2017-07-19 14:34:42 +0200 | [diff] [blame] | 163 | if error == 0 |
| 164 | let error = lnum |
| 165 | endif |
| 166 | endif |
| 167 | endwhile |
| 168 | |
Bram Moolenaar | aaef1ba | 2017-08-01 17:40:23 +0200 | [diff] [blame] | 169 | " Check that the file is well formed according to msgfmts understanding |
| 170 | if executable("msgfmt") |
| 171 | let filename = expand("%") |
Bram Moolenaar | 01164a6 | 2017-11-02 22:58:42 +0100 | [diff] [blame] | 172 | " Newer msgfmt does not take OLD_PO_FILE_INPUT argument, must be in |
| 173 | " environment. |
| 174 | let $OLD_PO_FILE_INPUT = 'yes' |
| 175 | let a = system("msgfmt --statistics " . filename) |
Bram Moolenaar | aaef1ba | 2017-08-01 17:40:23 +0200 | [diff] [blame] | 176 | if v:shell_error != 0 |
| 177 | let error = matchstr(a, filename.':\zs\d\+\ze:')+0 |
| 178 | for line in split(a, '\n') | echomsg line | endfor |
| 179 | endif |
| 180 | endif |
| 181 | |
Bram Moolenaar | 9cfc7d8 | 2018-05-13 22:37:03 +0200 | [diff] [blame] | 182 | " Check that the plural form is properly initialized |
| 183 | 1 |
| 184 | let plural = search('^msgid_plural ', 'n') |
| 185 | if (plural && search('^"Plural-Forms: ', 'n') == 0) || (plural && search('^msgstr\[0\] ".\+"', 'n') != plural + 1) |
| 186 | if search('^"Plural-Forms: ', 'n') == 0 |
| 187 | echomsg "Missing Plural header" |
| 188 | if error == 0 |
| 189 | let error = search('\(^"[A-Za-z-_]\+: .*\\n"\n\)\+\zs', 'n') - 1 |
| 190 | endif |
| 191 | elseif error == 0 |
| 192 | let error = plural |
| 193 | endif |
| 194 | elseif !plural && search('^"Plural-Forms: ', 'n') |
| 195 | " We allow for a stray plural header, msginit adds one. |
| 196 | endif |
| 197 | |
Bram Moolenaar | d1d037e | 2018-06-24 18:04:50 +0200 | [diff] [blame] | 198 | " Check that 8bit encoding is used instead of 8-bit |
| 199 | let cte = search('^"Content-Transfer-Encoding:\s\+8-bit', 'n') |
| 200 | let ctc = search('^"Content-Type:.*;\s\+\<charset=[iI][sS][oO]_', 'n') |
| 201 | let ctu = search('^"Content-Type:.*;\s\+\<charset=utf-8', 'n') |
| 202 | if cte |
| 203 | echomsg "Content-Transfer-Encoding should be 8bit instead of 8-bit" |
| 204 | " TODO: make this an error |
| 205 | " if error == 0 |
| 206 | " let error = cte |
| 207 | " endif |
| 208 | elseif ctc |
| 209 | echomsg "Content-Type charset should be 'ISO-...' instead of 'ISO_...'" |
| 210 | " TODO: make this an error |
| 211 | " if error == 0 |
| 212 | " let error = ct |
| 213 | " endif |
| 214 | elseif ctu |
| 215 | echomsg "Content-Type charset should be 'UTF-8' instead of 'utf-8'" |
| 216 | " TODO: make this an error |
| 217 | " if error == 0 |
| 218 | " let error = ct |
| 219 | " endif |
| 220 | endif |
| 221 | |
Bram Moolenaar | 9cfc7d8 | 2018-05-13 22:37:03 +0200 | [diff] [blame] | 222 | |
Bram Moolenaar | 1d94f9b | 2005-08-04 21:29:45 +0000 | [diff] [blame] | 223 | if error == 0 |
Bram Moolenaar | 7f93703 | 2017-07-19 14:34:42 +0200 | [diff] [blame] | 224 | " If all was OK restore the view. |
| 225 | call winrestview(wsv) |
Bram Moolenaar | ec42059 | 2016-08-26 15:51:53 +0200 | [diff] [blame] | 226 | echomsg "OK" |
| 227 | else |
Bram Moolenaar | d1d037e | 2018-06-24 18:04:50 +0200 | [diff] [blame] | 228 | " Put the cursor on the line with the error. |
Bram Moolenaar | ec42059 | 2016-08-26 15:51:53 +0200 | [diff] [blame] | 229 | exe error |
Bram Moolenaar | 1d94f9b | 2005-08-04 21:29:45 +0000 | [diff] [blame] | 230 | endif |
| 231 | |
Bram Moolenaar | a411e5d | 2010-08-04 15:47:08 +0200 | [diff] [blame] | 232 | let &wrapscan = s:save_wrapscan |
| 233 | unlet s:save_wrapscan |
| 234 | |
Bram Moolenaar | 1d94f9b | 2005-08-04 21:29:45 +0000 | [diff] [blame] | 235 | endif |