Bram Moolenaar | 53180ce | 2005-07-05 21:48:14 +0000 | [diff] [blame] | 1 | Tests for spell checking with 'encoding' set to "utf-8". vim: set ft=vim : |
| 2 | |
| 3 | STARTTEST |
| 4 | :so small.vim |
| 5 | :so mbyte.vim |
| 6 | :" |
Bram Moolenaar | 8d34330 | 2005-07-12 22:46:17 +0000 | [diff] [blame] | 7 | :" Don't want to depend on the locale from the environment. The .aff and .dic |
| 8 | :" text is in latin1, the test text is utf-8. Therefore reload this file with 'enc' set to latin1 before switching to utf-8. |
| 9 | :set enc=latin1 |
| 10 | :e! |
Bram Moolenaar | 53180ce | 2005-07-05 21:48:14 +0000 | [diff] [blame] | 11 | :set enc=utf-8 |
Bram Moolenaar | ac6e65f | 2005-08-29 22:25:38 +0000 | [diff] [blame^] | 12 | :set fenc= |
Bram Moolenaar | 53180ce | 2005-07-05 21:48:14 +0000 | [diff] [blame] | 13 | :" From here on 'enc' is utf-8 and 'fenc' of this buffer is empty. |
Bram Moolenaar | ac6e65f | 2005-08-29 22:25:38 +0000 | [diff] [blame^] | 14 | :" Function to test .aff/.dic with list of good and bad words. "aff" and "dic" are the name prefixes of the {aff}affstart..{aff}affend and {dic}dicstart..{dic}dicend sections in this file; results are appended at the end of the buffer. |
| 15 | :func TestOne(aff, dic) |
| 16 | set spellfile= |
| 17 | $put ='' |
| 18 | $put ='test '. a:aff . '-' . a:dic |
| 19 | " Write the selected sections to Xtest.aff and Xtest.dic and generate a .spl file from them. |
| 20 | exe '1;/^' . a:aff . 'affstart/+1,/^' . a:aff . 'affend/-1w! Xtest.aff' |
| 21 | exe '1;/^' . a:dic . 'dicstart/+1,/^' . a:dic . 'dicend/-1w! Xtest.dic' |
| 22 | mkspell! Xtest Xtest |
| 23 | " use that spell file and switch on spell checking |
| 24 | set spl=Xtest.utf-8.spl spell |
| 25 | " list all valid words: yank the whole :spelldump output, quit that window and append the yanked text followed by a separator line |
| 26 | spelldump |
| 27 | %yank |
| 28 | quit |
| 29 | $put |
| 30 | $put ='-------' |
| 31 | " find all bad words and at most three suggestions for each, starting at the "{aff}good:" line; stop on an empty result, a repeated word or "badend" |
| 32 | exe '1;/^' . a:aff . 'good:' |
| 33 | normal 0f:]s |
| 34 | let prevbad = '' |
| 35 | while 1 |
| 36 | let bad = spellbadword() |
| 37 | if bad == '' || bad == prevbad || bad == 'badend' |
| 38 | break |
| 39 | endif |
| 40 | let prevbad = bad |
| 41 | let lst = spellsuggest(bad, 3) |
| 42 | normal mm |
| 43 | $put =bad |
| 44 | $put =string(lst) |
| 45 | normal `m]s |
| 46 | endwhile |
Bram Moolenaar | 53180ce | 2005-07-05 21:48:14 +0000 | [diff] [blame] | 47 | endfunc |
Bram Moolenaar | ac6e65f | 2005-08-29 22:25:38 +0000 | [diff] [blame^] | 48 | :" Test with the first .aff and .dic sections, then append the soundfold() result for three strings (this .aff has SOFOFROM/SOFOTO items) |
| 49 | :call TestOne('1', '1') |
Bram Moolenaar | 53180ce | 2005-07-05 21:48:14 +0000 | [diff] [blame] | 50 | :$put =soundfold('goobledygoook') |
| 51 | :$put =soundfold('kóopërÿnôven') |
| 52 | :$put =soundfold('oeverloos gezwets edale') |
| 53 | :" |
Bram Moolenaar | ac6e65f | 2005-08-29 22:25:38 +0000 | [diff] [blame^] | 54 | :" |
Bram Moolenaar | 53180ce | 2005-07-05 21:48:14 +0000 | [diff] [blame] | 55 | :" and now with SAL instead of SOFO items: Xtest.aff is overwritten with the affstart_sal section and :mkspell is run again, without setting 'spl' anew; test automatic reloading |
Bram Moolenaar | ac6e65f | 2005-08-29 22:25:38 +0000 | [diff] [blame^] | 56 | gg:/^affstart_sal/+1,/^affend_sal/-1w! Xtest.aff |
Bram Moolenaar | 53180ce | 2005-07-05 21:48:14 +0000 | [diff] [blame] | 57 | :mkspell! Xtest Xtest |
| 58 | :$put =soundfold('goobledygoook') |
| 59 | :$put =soundfold('kóopërÿnôven') |
| 60 | :$put =soundfold('oeverloos gezwets edale') |
| 61 | :" also use an addition file: write the addstart..addend lines to Xtest.utf-8.add, build its .spl file and set 'spellfile' to it; |
| 62 | :" then append the bad words that ]s finds from "test2:" on, first with 'spl' unchanged, then with the _us, _gb, _nz and _ca names |
| 63 | gg:/^addstart/+1,/^addend/-1w! Xtest.utf-8.add |
| 64 | :mkspell! Xtest.utf-8.add.spl Xtest.utf-8.add |
Bram Moolenaar | 53180ce | 2005-07-05 21:48:14 +0000 | [diff] [blame] | 65 | :set spellfile=Xtest.utf-8.add |
| 66 | /^test2: |
| 67 | ]s:let str = spellbadword() |
| 68 | :$put =str |
Bram Moolenaar | bbebc85 | 2005-07-18 21:47:53 +0000 | [diff] [blame] | 69 | :set spl=Xtest_us.utf-8.spl |
Bram Moolenaar | 53180ce | 2005-07-05 21:48:14 +0000 | [diff] [blame] | 70 | /^test2: |
| 71 | ]smm:let str = spellbadword() |
| 72 | :$put =str |
| 73 | `m]s:let str = spellbadword() |
| 74 | :$put =str |
Bram Moolenaar | bbebc85 | 2005-07-18 21:47:53 +0000 | [diff] [blame] | 75 | :set spl=Xtest_gb.utf-8.spl |
Bram Moolenaar | 53180ce | 2005-07-05 21:48:14 +0000 | [diff] [blame] | 76 | /^test2: |
| 77 | ]smm:let str = spellbadword() |
| 78 | :$put =str |
| 79 | `m]s:let str = spellbadword() |
| 80 | :$put =str |
Bram Moolenaar | bbebc85 | 2005-07-18 21:47:53 +0000 | [diff] [blame] | 81 | :set spl=Xtest_nz.utf-8.spl |
Bram Moolenaar | 53180ce | 2005-07-05 21:48:14 +0000 | [diff] [blame] | 82 | /^test2: |
| 83 | ]smm:let str = spellbadword() |
| 84 | :$put =str |
| 85 | `m]s:let str = spellbadword() |
| 86 | :$put =str |
Bram Moolenaar | bbebc85 | 2005-07-18 21:47:53 +0000 | [diff] [blame] | 87 | :set spl=Xtest_ca.utf-8.spl |
Bram Moolenaar | 53180ce | 2005-07-05 21:48:14 +0000 | [diff] [blame] | 88 | /^test2: |
| 89 | ]smm:let str = spellbadword() |
| 90 | :$put =str |
| 91 | `m]s:let str = spellbadword() |
| 92 | :$put =str |
| 93 | :" |
| 94 | :" Postponed prefixes: the 2aff section (which has PFXPOSTPONE) combined with the 1dic section |
Bram Moolenaar | ac6e65f | 2005-08-29 22:25:38 +0000 | [diff] [blame^] | 95 | :call TestOne('2', '1') |
| 96 | :" |
| 97 | :" Compound words: the 3aff/3dic and 4aff/4dic sections |
| 98 | :call TestOne('3', '3') |
| 99 | :call TestOne('4', '4') |
Bram Moolenaar | 53180ce | 2005-07-05 21:48:14 +0000 | [diff] [blame] | 100 | :" Write everything from the "test output:" line to the end of the buffer to test.out and exit |
| 101 | gg:/^test output:/,$wq! test.out |
| 102 | ENDTEST |
| 103 | |
Bram Moolenaar | ac6e65f | 2005-08-29 22:25:38 +0000 | [diff] [blame^] | 104 | 1affstart |
Bram Moolenaar | 53180ce | 2005-07-05 21:48:14 +0000 | [diff] [blame] | 105 | SET ISO8859-1 |
| 106 | TRY esianrtolcdugmphbyfvkwjkqxz-ëéèêïîäàâöüû'ESIANRTOLCDUGMPHBYFVKWJKQXZ |
| 107 | |
| 108 | FOL àáâãäåæçèéêëìíîïðñòóôõöøùúûüýþßÿ |
| 109 | LOW àáâãäåæçèéêëìíîïðñòóôõöøùúûüýþßÿ |
| 110 | UPP ÀÁÂÃÄÅÆÇÈÉÊËÌÍÎÏÐÑÒÓÔÕÖØÙÚÛÜÝÞßÿ |
| 111 | |
| 112 | SOFOFROM abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZàáâãäåæçèéêëìíîïðñòóôõöøùúûüýþßÿÀÁÂÃÄÅÆÇÈÉÊËÌÍÎÏÐÑÒÓÔÕÖØÙÚÛÜÝÞ¿ |
| 113 | SOFOTO ebctefghejklnnepkrstevvkesebctefghejklnnepkrstevvkeseeeeeeeceeeeeeeedneeeeeeeeeeepseeeeeeeeceeeeeeeedneeeeeeeeeeep? |
| 114 | |
| 115 | MIDWORD '- |
| 116 | |
| 117 | KEP = |
| 118 | RAR ? |
| 119 | BAD ! |
| 120 | |
| 121 | NOSPLITSUGS |
| 122 | |
| 123 | PFX I N 1 |
| 124 | PFX I 0 in . |
| 125 | |
| 126 | PFX O Y 1 |
| 127 | PFX O 0 out . |
| 128 | |
| 129 | SFX S Y 2 |
| 130 | SFX S 0 s [^s] |
| 131 | SFX S 0 es s |
| 132 | |
| 133 | SFX N N 3 |
| 134 | SFX N 0 en [^n] |
| 135 | SFX N 0 nen n |
| 136 | SFX N 0 n . |
| 137 | |
| 138 | REP 3 |
| 139 | REP g ch |
| 140 | REP ch g |
| 141 | REP svp s.v.p. |
| 142 | |
| 143 | MAP 9 |
| 144 | MAP aàáâãäå |
| 145 | MAP eèéêë |
| 146 | MAP iìíîï |
| 147 | MAP oòóôõö |
| 148 | MAP uùúûü |
| 149 | MAP nñ |
| 150 | MAP cç |
| 151 | MAP yÿý |
| 152 | MAP sß |
Bram Moolenaar | ac6e65f | 2005-08-29 22:25:38 +0000 | [diff] [blame^] | 153 | 1affend |
Bram Moolenaar | 53180ce | 2005-07-05 21:48:14 +0000 | [diff] [blame] | 154 | |
Bram Moolenaar | ac6e65f | 2005-08-29 22:25:38 +0000 | [diff] [blame^] | 155 | affstart_sal |
Bram Moolenaar | 53180ce | 2005-07-05 21:48:14 +0000 | [diff] [blame] | 156 | SET ISO8859-1 |
| 157 | TRY esianrtolcdugmphbyfvkwjkqxz-ëéèêïîäàâöüû'ESIANRTOLCDUGMPHBYFVKWJKQXZ |
| 158 | |
| 159 | FOL àáâãäåæçèéêëìíîïðñòóôõöøùúûüýþßÿ |
| 160 | LOW àáâãäåæçèéêëìíîïðñòóôõöøùúûüýþßÿ |
| 161 | UPP ÀÁÂÃÄÅÆÇÈÉÊËÌÍÎÏÐÑÒÓÔÕÖØÙÚÛÜÝÞßÿ |
| 162 | |
| 163 | MIDWORD '- |
| 164 | |
| 165 | KEP = |
| 166 | RAR ? |
| 167 | BAD ! |
| 168 | |
| 169 | NOSPLITSUGS |
| 170 | |
| 171 | PFX I N 1 |
| 172 | PFX I 0 in . |
| 173 | |
| 174 | PFX O Y 1 |
| 175 | PFX O 0 out . |
| 176 | |
| 177 | SFX S Y 2 |
| 178 | SFX S 0 s [^s] |
| 179 | SFX S 0 es s |
| 180 | |
| 181 | SFX N N 3 |
| 182 | SFX N 0 en [^n] |
| 183 | SFX N 0 nen n |
| 184 | SFX N 0 n . |
| 185 | |
| 186 | REP 3 |
| 187 | REP g ch |
| 188 | REP ch g |
| 189 | REP svp s.v.p. |
| 190 | |
| 191 | MAP 9 |
| 192 | MAP aàáâãäå |
| 193 | MAP eèéêë |
| 194 | MAP iìíîï |
| 195 | MAP oòóôõö |
| 196 | MAP uùúûü |
| 197 | MAP nñ |
| 198 | MAP cç |
| 199 | MAP yÿý |
| 200 | MAP sß |
| 201 | |
| 202 | SAL AH(AEIOUY)-^ *H |
| 203 | SAL AR(AEIOUY)-^ *R |
| 204 | SAL A(HR)^ * |
| 205 | SAL A^ * |
| 206 | SAL AH(AEIOUY)- H |
| 207 | SAL AR(AEIOUY)- R |
| 208 | SAL A(HR) _ |
| 209 | SAL À^ * |
| 210 | SAL Å^ * |
| 211 | SAL BB- _ |
| 212 | SAL B B |
| 213 | SAL CQ- _ |
| 214 | SAL CIA X |
| 215 | SAL CH X |
| 216 | SAL C(EIY)- S |
| 217 | SAL CK K |
| 218 | SAL COUGH^ KF |
| 219 | SAL CC< C |
| 220 | SAL C K |
| 221 | SAL DG(EIY) K |
| 222 | SAL DD- _ |
| 223 | SAL D T |
| 224 | SAL É< E |
| 225 | SAL EH(AEIOUY)-^ *H |
| 226 | SAL ER(AEIOUY)-^ *R |
| 227 | SAL E(HR)^ * |
| 228 | SAL ENOUGH^$ *NF |
| 229 | SAL E^ * |
| 230 | SAL EH(AEIOUY)- H |
| 231 | SAL ER(AEIOUY)- R |
| 232 | SAL E(HR) _ |
| 233 | SAL FF- _ |
| 234 | SAL F F |
| 235 | SAL GN^ N |
| 236 | SAL GN$ N |
| 237 | SAL GNS$ NS |
| 238 | SAL GNED$ N |
| 239 | SAL GH(AEIOUY)- K |
| 240 | SAL GH _ |
| 241 | SAL GG9 K |
| 242 | SAL G K |
| 243 | SAL H H |
| 244 | SAL IH(AEIOUY)-^ *H |
| 245 | SAL IR(AEIOUY)-^ *R |
| 246 | SAL I(HR)^ * |
| 247 | SAL I^ * |
| 248 | SAL ING6 N |
| 249 | SAL IH(AEIOUY)- H |
| 250 | SAL IR(AEIOUY)- R |
| 251 | SAL I(HR) _ |
| 252 | SAL J K |
| 253 | SAL KN^ N |
| 254 | SAL KK- _ |
| 255 | SAL K K |
| 256 | SAL LAUGH^ LF |
| 257 | SAL LL- _ |
| 258 | SAL L L |
| 259 | SAL MB$ M |
| 260 | SAL MM M |
| 261 | SAL M M |
| 262 | SAL NN- _ |
| 263 | SAL N N |
| 264 | SAL OH(AEIOUY)-^ *H |
| 265 | SAL OR(AEIOUY)-^ *R |
| 266 | SAL O(HR)^ * |
| 267 | SAL O^ * |
| 268 | SAL OH(AEIOUY)- H |
| 269 | SAL OR(AEIOUY)- R |
| 270 | SAL O(HR) _ |
| 271 | SAL PH F |
| 272 | SAL PN^ N |
| 273 | SAL PP- _ |
| 274 | SAL P P |
| 275 | SAL Q K |
| 276 | SAL RH^ R |
| 277 | SAL ROUGH^ RF |
| 278 | SAL RR- _ |
| 279 | SAL R R |
| 280 | SAL SCH(EOU)- SK |
| 281 | SAL SC(IEY)- S |
| 282 | SAL SH X |
| 283 | SAL SI(AO)- X |
| 284 | SAL SS- _ |
| 285 | SAL S S |
| 286 | SAL TI(AO)- X |
| 287 | SAL TH @ |
| 288 | SAL TCH-- _ |
| 289 | SAL TOUGH^ TF |
| 290 | SAL TT- _ |
| 291 | SAL T T |
| 292 | SAL UH(AEIOUY)-^ *H |
| 293 | SAL UR(AEIOUY)-^ *R |
| 294 | SAL U(HR)^ * |
| 295 | SAL U^ * |
| 296 | SAL UH(AEIOUY)- H |
| 297 | SAL UR(AEIOUY)- R |
| 298 | SAL U(HR) _ |
| 299 | SAL V^ W |
| 300 | SAL V F |
| 301 | SAL WR^ R |
| 302 | SAL WH^ W |
| 303 | SAL W(AEIOU)- W |
| 304 | SAL X^ S |
| 305 | SAL X KS |
| 306 | SAL Y(AEIOU)- Y |
| 307 | SAL ZZ- _ |
| 308 | SAL Z S |
Bram Moolenaar | ac6e65f | 2005-08-29 22:25:38 +0000 | [diff] [blame^] | 309 | affend_sal |
Bram Moolenaar | 53180ce | 2005-07-05 21:48:14 +0000 | [diff] [blame] | 310 | |
Bram Moolenaar | ac6e65f | 2005-08-29 22:25:38 +0000 | [diff] [blame^] | 311 | 2affstart |
Bram Moolenaar | 53180ce | 2005-07-05 21:48:14 +0000 | [diff] [blame] | 312 | SET ISO8859-1 |
| 313 | |
| 314 | FOL àáâãäåæçèéêëìíîïðñòóôõöøùúûüýþßÿ |
| 315 | LOW àáâãäåæçèéêëìíîïðñòóôõöøùúûüýþßÿ |
| 316 | UPP ÀÁÂÃÄÅÆÇÈÉÊËÌÍÎÏÐÑÒÓÔÕÖØÙÚÛÜÝÞßÿ |
| 317 | |
| 318 | PFXPOSTPONE |
| 319 | |
| 320 | MIDWORD '- |
| 321 | |
| 322 | KEP = |
| 323 | RAR ? |
| 324 | BAD ! |
| 325 | |
| 326 | NOSPLITSUGS |
| 327 | |
| 328 | PFX I N 1 |
| 329 | PFX I 0 in . |
| 330 | |
| 331 | PFX O Y 1 |
Bram Moolenaar | 78984f5 | 2005-08-01 07:19:10 +0000 | [diff] [blame] | 332 | PFX O 0 out [a-z] |
Bram Moolenaar | 53180ce | 2005-07-05 21:48:14 +0000 | [diff] [blame] | 333 | |
| 334 | SFX S Y 2 |
| 335 | SFX S 0 s [^s] |
| 336 | SFX S 0 es s |
| 337 | |
| 338 | SFX N N 3 |
| 339 | SFX N 0 en [^n] |
| 340 | SFX N 0 nen n |
| 341 | SFX N 0 n . |
| 342 | |
| 343 | REP 3 |
| 344 | REP g ch |
| 345 | REP ch g |
| 346 | REP svp s.v.p. |
| 347 | |
| 348 | MAP 9 |
| 349 | MAP aàáâãäå |
| 350 | MAP eèéêë |
| 351 | MAP iìíîï |
| 352 | MAP oòóôõö |
| 353 | MAP uùúûü |
| 354 | MAP nñ |
| 355 | MAP cç |
| 356 | MAP yÿý |
| 357 | MAP sß |
Bram Moolenaar | ac6e65f | 2005-08-29 22:25:38 +0000 | [diff] [blame^] | 358 | 2affend |
Bram Moolenaar | 53180ce | 2005-07-05 21:48:14 +0000 | [diff] [blame] | 359 | |
Bram Moolenaar | ac6e65f | 2005-08-29 22:25:38 +0000 | [diff] [blame^] | 360 | 1dicstart |
Bram Moolenaar | 53180ce | 2005-07-05 21:48:14 +0000 | [diff] [blame] | 361 | 123456 |
| 362 | test/NO |
| 363 | # comment |
| 364 | wrong |
| 365 | Comment |
| 366 | OK |
| 367 | uk |
| 368 | put/ISO |
| 369 | the end |
| 370 | deol |
| 371 | déôr |
Bram Moolenaar | ac6e65f | 2005-08-29 22:25:38 +0000 | [diff] [blame^] | 372 | 1dicend |
Bram Moolenaar | 53180ce | 2005-07-05 21:48:14 +0000 | [diff] [blame] | 373 | |
| 374 | addstart |
| 375 | /regions=usgbnz |
| 376 | elequint/2 |
| 377 | elekwint/3 |
| 378 | addend |
| 379 | |
Bram Moolenaar | ac6e65f | 2005-08-29 22:25:38 +0000 | [diff] [blame^] | 380 | 1good: wrong OK puts. Test the end |
| 381 | bad: inputs comment ok Ok. test déôl end the |
| 382 | badend |
| 383 | |
| 384 | 2good: puts |
| 385 | bad: inputs comment ok Ok end the. test déôl |
| 386 | badend |
| 387 | |
| 388 | Test rules for compounding. |
| 389 | |
| 390 | 3affstart |
| 391 | SET ISO8859-1 |
| 392 | |
| 393 | COMPOUNDMIN 3 |
| 394 | COMPOUNDFLAGS m* |
| 395 | NEEDCOMPOUND x |
| 396 | 3affend |
| 397 | |
| 398 | 3dicstart |
| 399 | 1234 |
| 400 | foo/m |
| 401 | bar/mx |
| 402 | mï/m |
| 403 | la/mx |
| 404 | 3dicend |
| 405 | |
| 406 | 3good: foo mï foobar foofoobar barfoo barbarfoo |
| 407 | bad: bar la foomï barmï mïfoo mïbar mïmï lala mïla lamï foola labar |
| 408 | badend |
| 409 | |
| 410 | |
| 411 | Tests for compounding. |
| 412 | |
| 413 | 4affstart |
| 414 | SET ISO8859-1 |
| 415 | |
| 416 | FOL àáâãäåæçèéêëìíîïðñòóôõöøùúûüýþßÿ |
| 417 | LOW àáâãäåæçèéêëìíîïðñòóôõöøùúûüýþßÿ |
| 418 | UPP ÀÁÂÃÄÅÆÇÈÉÊËÌÍÎÏÐÑÒÓÔÕÖØÙÚÛÜÝÞßÿ |
| 419 | |
| 420 | COMPOUNDFLAGS m+ |
| 421 | COMPOUNDFLAGS sm*e |
| 422 | COMPOUNDFLAGS sm+ |
| 423 | COMPOUNDMIN 3 |
| 424 | COMPOUNDMAX 3 |
| 425 | |
| 426 | COMPOUNDSYLMAX 5 |
| 427 | SYLLABLE aáeéiíoóöõuúüûy/aa/au/ea/ee/ei/ie/oa/oe/oo/ou/uu/ui |
| 428 | |
| 429 | MAP 9 |
| 430 | MAP aàáâãäå |
| 431 | MAP eèéêë |
| 432 | MAP iìíîï |
| 433 | MAP oòóôõö |
| 434 | MAP uùúûü |
| 435 | MAP nñ |
| 436 | MAP cç |
| 437 | MAP yÿý |
| 438 | MAP sß |
| 439 | |
| 440 | NEEDAFFIX x |
| 441 | |
| 442 | PFXPOSTPONE |
| 443 | |
| 444 | MIDWORD '- |
| 445 | |
| 446 | SFX q N 1 |
| 447 | SFX q 0 -ok . |
| 448 | |
| 449 | SFX a Y 2 |
| 450 | SFX a 0 s . |
| 451 | SFX a 0 ize . nocomp |
| 452 | |
| 453 | PFX p N 1 |
| 454 | PFX p 0 pre . |
| 455 | 4affend |
| 456 | |
| 457 | 4dicstart |
| 458 | 1234 |
| 459 | word/m |
| 460 | util/am |
| 461 | pro/xq |
| 462 | tomato/m |
| 463 | bork/mp |
| 464 | start/s |
| 465 | end/e |
| 466 | 4dicend |
| 467 | |
| 468 | 4good: word util bork prebork start end wordutil wordutils pro-ok |
| 469 | bork borkbork borkborkbork borkborkborkbork borkborkborkborkbork |
| 470 | tomato tomatotomato startend startword startwordword startwordend |
| 471 | startwordwordend startwordwordwordend prebork preborkprebork |
| 472 | preborkborkprebork preborkpreborkbork |
| 473 | bad: wordutilize pro borkborkborkborkborkbork tomatotomatotomato |
| 474 | endstart endend startstart wordend wordstart |
| 475 | startwordwordwordwordend borkpreborkpreborkbork |
| 476 | badend |
Bram Moolenaar | 53180ce | 2005-07-05 21:48:14 +0000 | [diff] [blame] | 477 | |
| 478 | test2: |
| 479 | elequint test elekwint test elekwent asdf |
| 480 | |
Bram Moolenaar | 53180ce | 2005-07-05 21:48:14 +0000 | [diff] [blame] | 481 | test output: |