" Source blob: 6247b30e6c220f328d506a9b7b9e19a118db942b
" Tests for regexp in utf8 encoding
" Nothing below can run without multi-byte support: skip the whole script.
if !has('multi_byte') | finish | endif

" Use UTF-8 at runtime and declare it as the encoding of this script, which
" contains non-ASCII string literals.
set encoding=utf-8
scriptencoding utf-8
7
" Check equivalence classes ([[=x=]]) against a table of letter groups.
" The table is a space-separated list of groups; every group holds a base
" letter followed by its accented variants.  For each character c of each
" group the function asserts that:
"   - [[=c=]] matches every character of c's own group, and
"   - [[=c=]] matches no character of any other group.
" Nothing is returned; failures are recorded by assert_match() and
" assert_equal().  The regexp engine in effect is whatever the caller set.
func s:equivalence_test()
  let upper = "AÀÁÂÃÄÅĀĂĄǍǞǠẢ BḂḆ CÇĆĈĊČ DĎĐḊḎḐ EÈÉÊËĒĔĖĘĚẺẼ F GĜĞĠĢǤǦǴḠ HĤĦḢḦḨ IÌÍÎÏĨĪĬĮİǏỈ JĴ KĶǨḰḴ LĹĻĽĿŁḺ MḾṀ NÑŃŅŇṄṈ OÒÓÔÕÖØŌŎŐƠǑǪǬỎ PṔṖ Q RŔŖŘṘṞ SŚŜŞŠṠ TŢŤŦṪṮ UÙÚÛÜŨŪŬŮŰŲƯǓỦ V WŴẀẂẄẆ XẊẌ YÝŶŸẎỲỶỸ ZŹŻŽƵẐẔ"
  " U+0149 (n preceded by apostrophe) is written as an escape in the 'n'
  " group: text tools tend to decompose it into U+02BC followed by a plain
  " 'n', which silently breaks the group.
  let lower = "aàáâãäåāăąǎǟǡả bḃḇ cçćĉċč dďđḋḏḑ eèéêëēĕėęěẻẽ f gĝğġģǥǧǵḡ hĥħḣḧḩẖ iìíîïĩīĭįǐỉ jĵǰ kķǩḱḵ lĺļľŀłḻ mḿṁ nñńņň\u0149ṅṉ oòóôõöøōŏőơǒǫǭỏ pṕṗ q rŕŗřṙṟ sśŝşšṡ tţťŧṫṯẗ uùúûüũūŭůűųưǔủ v wŵẁẃẅẇẘ xẋẍ yýÿŷẏẙỳỷỹ zźżžƶẑẕ"
  let groups = split(upper . ' ' . lower)
  for group1 in groups
    for c in split(group1, '\zs')
      " next statement confirms that equivalence class matches every
      " character in group
      call assert_match('^[[=' . c . '=]]*$', group1)
      for group2 in groups
        if group2 != group1
          " next statement confirms that equivalence class doesn't match
          " character in any other group
          call assert_equal(-1, match(group2, '[[=' . c . '=]]'))
        endif
      endfor
    endfor
  endfor
endfunc
26
" Run the equivalence class checks with 'regexpengine' forced to 1.
" The previous value is restored afterwards, even when the checks abort with
" an error, so the forced engine does not leak into tests that run later.
func Test_equivalence_re1()
  let save_regexpengine = &regexpengine
  try
    set re=1
    call s:equivalence_test()
  finally
    let &regexpengine = save_regexpengine
  endtry
endfunc
31
" Run the equivalence class checks with 'regexpengine' forced to 2.
" The previous value is restored afterwards, even when the checks abort with
" an error, so the forced engine does not leak into tests that run later.
func Test_equivalence_re2()
  let save_regexpengine = &regexpengine
  try
    set re=2
    call s:equivalence_test()
  finally
    let &regexpengine = save_regexpengine
  endtry
endfunc
" Check which characters the bracket character classes match.
" With 'isprint' set to "@,161-255" the function first asserts that
" [[:print:]]\+ matches the whole of 'Motörhead'.  It then walks the code
" points 1..255, collects the characters matched by [[:alpha:]], [[:lower:]],
" [[:upper:]], [[:alnum:]], [[:print:]], [[:punct:]] and [[:xdigit:]], and
" compares every collection with its expected value.
" Nothing is returned; failures are recorded by assert_equal().  'isprint' is
" restored before returning.  The regexp engine in effect is whatever the
" caller set.
func s:classes_test()
  let save_isprint = &isprint
  try
    set isprint=@,161-255
    call assert_equal('Motörhead', matchstr('Motörhead', '[[:print:]]\+'))

    let alphachars = ''
    let lowerchars = ''
    let upperchars = ''
    let alnumchars = ''
    let printchars = ''
    let punctchars = ''
    let xdigitchars = ''
    for nr in range(1, 255)
      let c = nr2char(nr)
      if c =~ '[[:alpha:]]'
        let alphachars .= c
      endif
      if c =~ '[[:lower:]]'
        let lowerchars .= c
      endif
      if c =~ '[[:upper:]]'
        let upperchars .= c
      endif
      if c =~ '[[:alnum:]]'
        let alnumchars .= c
      endif
      if c =~ '[[:print:]]'
        let printchars .= c
      endif
      if c =~ '[[:punct:]]'
        let punctchars .= c
      endif
      if c =~ '[[:xdigit:]]'
        let xdigitchars .= c
      endif
    endfor

    call assert_equal('ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz', alphachars)
    call assert_equal('abcdefghijklmnopqrstuvwxyzµßàáâãäåæçèéêëìíîïðñòóôõöøùúûüýþÿ', lowerchars)
    call assert_equal('ABCDEFGHIJKLMNOPQRSTUVWXYZÀÁÂÃÄÅÆÇÈÉÊËÌÍÎÏÐÑÒÓÔÕÖØÙÚÛÜÝÞ', upperchars)
    call assert_equal('0123456789ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz', alnumchars)

    " The expected printable set is the ASCII run from space to '~' followed
    " by U+00A0..U+00FF.  It is built from code point ranges instead of a
    " literal because that run contains invisible characters (no-break space,
    " soft hyphen) that are easily damaged by text tools, and a code point
    " above 255 in the literal makes the comparison fail unconditionally.
    let expected_print = join(map(range(32, 126) + range(160, 255), 'nr2char(v:val)'), '')
    call assert_equal(expected_print, printchars)

    call assert_equal('!"#$%&''()*+,-./:;<=>?@[\]^_`{|}~', punctchars)
    call assert_equal('0123456789ABCDEFabcdef', xdigitchars)
  finally
    let &isprint = save_isprint
  endtry
endfunc
83
" Run the character class checks with 'regexpengine' forced to 1.
" The previous value is restored afterwards, even when the checks abort with
" an error, so the forced engine does not leak into tests that run later.
func Test_classes_re1()
  let save_regexpengine = &regexpengine
  try
    set re=1
    call s:classes_test()
  finally
    let &regexpengine = save_regexpengine
  endtry
endfunc
88
" Run the character class checks with 'regexpengine' forced to 2.
" The previous value is restored afterwards, even when the checks abort with
" an error, so the forced engine does not leak into tests that run later.
func Test_classes_re2()
  let save_regexpengine = &regexpengine
  try
    set re=2
    call s:classes_test()
  finally
    let &regexpengine = save_regexpengine
  endtry
endfunc