blob: 81d8f5b04a8e372e39180da5eed44fde8a059f07 [file] [log] [blame]
" Tests for regexp in utf8 encoding
" The tests in this file exercise regexp matching on multi-byte text; stop
" sourcing the script when the multi_byte feature is not available.
if !has('multi_byte') | finish | endif
Bram Moolenaar22e42152016-04-03 14:02:02 +02005
" Check the [[=x=]] equivalence classes with the currently selected regexp
" engine.
"
" "str" holds space-separated groups; every group is one base letter followed
" by the accented variants that belong to the same equivalence class.  For
" every character of every group this verifies that:
"   - its equivalence class matches all characters of its own group, and
"   - its equivalence class matches no character of any other group.
" Failures are reported through assert_match() / assert_equal().
func s:equivalence_test()
  " Note: the "n" group contains U+0149 (ŉ) as a single character; it must not
  " be written in its decomposed form (apostrophe + n), since the group is
  " split into characters below.
  let str = "AÀÁÂÃÄÅĀĂĄǍǞǠẢ BḂḆ CÇĆĈĊČ DĎĐḊḎḐ EÈÉÊËĒĔĖĘĚẺẼ F GĜĞĠĢǤǦǴḠ HĤĦḢḦḨ IÌÍÎÏĨĪĬĮİǏỈ JĴ KĶǨḰḴ LĹĻĽĿŁḺ MḾṀ NÑŃŅŇṄṈ OÒÓÔÕÖØŌŎŐƠǑǪǬỎ PṔṖ Q RŔŖŘṘṞ SŚŜŞŠṠ TŢŤŦṪṮ UÙÚÛÜŨŪŬŮŰŲƯǓỦ V WŴẀẂẄẆ XẊẌ YÝŶŸẎỲỶỸ ZŹŻŽƵẐẔ aàáâãäåāăąǎǟǡả bḃḇ cçćĉċč dďđḋḏḑ eèéêëēĕėęěẻẽ f gĝğġģǥǧǵḡ hĥħḣḧḩẖ iìíîïĩīĭįǐỉ jĵǰ kķǩḱḵ lĺļľŀłḻ mḿṁ nñńņňŉṅṉ oòóôõöøōŏőơǒǫǭỏ pṕṗ q rŕŗřṙṟ sśŝşšṡ tţťŧṫṯẗ uùúûüũūŭůűųưǔủ v wŵẁẃẅẇẘ xẋẍ yýÿŷẏẙỳỷỹ zźżžƶẑẕ"
  let groups = split(str)
  for group1 in groups
    for c in split(group1, '\zs')
      " next statement confirms that equivalence class matches every
      " character in group
      call assert_match('^[[=' . c . '=]]*$', group1)
      for group2 in groups
        " Compare the group strings case sensitively: the upper case and
        " lower case groups are separate entries in the list.
        if group2 !=# group1
          " next statement confirms that equivalence class doesn't match
          " character in any other group
          call assert_equal(-1, match(group2, '[[=' . c . '=]]'))
        endif
      endfor
    endfor
  endfor
endfunc
24
" Run the equivalence class checks with 'regexpengine' set to 1.
func Test_equivalence_re1()
  let save_re = &regexpengine
  set regexpengine=1
  try
    call s:equivalence_test()
  finally
    " Do not leak the forced engine into tests that run after this one.
    let &regexpengine = save_re
  endtry
endfunc
29
" Run the equivalence class checks with 'regexpengine' set to 2.
func Test_equivalence_re2()
  let save_re = &regexpengine
  set regexpengine=2
  try
    call s:equivalence_test()
  finally
    " Do not leak the forced engine into tests that run after this one.
    let &regexpengine = save_re
  endtry
endfunc
Bram Moolenaaraf98a492016-04-24 14:40:12 +020034
" Check the [[:alpha:]], [[:lower:]], [[:upper:]], [[:alnum:]], [[:print:]],
" [[:punct:]] and [[:xdigit:]] character classes with the currently selected
" regexp engine.
"
" Every character with number 1..255 is matched against each class; the
" characters that match are collected per class and compared with the
" expected set.  Failures are reported through assert_equal().
" 'isprint' is set to a fixed value for the duration of the checks and
" restored afterwards.
func s:classes_test()
  let save_isprint = &isprint
  set isprint=@,161-255
  try
    call assert_equal('Motörhead', matchstr('Motörhead', '[[:print:]]\+'))

    let alphachars = ''
    let lowerchars = ''
    let upperchars = ''
    let alnumchars = ''
    let printchars = ''
    let punctchars = ''
    let xdigitchars = ''
    for i in range(1, 255)
      let c = nr2char(i)
      " Use =~# so that 'ignorecase' cannot make [[:lower:]] match upper
      " case characters or the other way around.
      if c =~# '[[:alpha:]]'
        let alphachars .= c
      endif
      if c =~# '[[:lower:]]'
        let lowerchars .= c
      endif
      if c =~# '[[:upper:]]'
        let upperchars .= c
      endif
      if c =~# '[[:alnum:]]'
        let alnumchars .= c
      endif
      if c =~# '[[:print:]]'
        let printchars .= c
      endif
      if c =~# '[[:punct:]]'
        let punctchars .= c
      endif
      if c =~# '[[:xdigit:]]'
        let xdigitchars .= c
      endif
    endfor

    " Expected printable characters: space up to '~' followed by 160 up to
    " 255.  Built from the character numbers because the set contains
    " characters that are invisible in an editor (no-break space 160, soft
    " hyphen 173) and are easily damaged when written as a literal.
    let printexpected = join(map(range(32, 126) + range(160, 255), 'nr2char(v:val)'), '')

    call assert_equal('ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz', alphachars)
    call assert_equal('abcdefghijklmnopqrstuvwxyzµßàáâãäåæçèéêëìíîïðñòóôõöøùúûüýþÿ', lowerchars)
    call assert_equal('ABCDEFGHIJKLMNOPQRSTUVWXYZÀÁÂÃÄÅÆÇÈÉÊËÌÍÎÏÐÑÒÓÔÕÖØÙÚÛÜÝÞ', upperchars)
    call assert_equal('0123456789ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz', alnumchars)
    call assert_equal(printexpected, printchars)
    call assert_equal('!"#$%&''()*+,-./:;<=>?@[\]^_`{|}~', punctchars)
    call assert_equal('0123456789ABCDEFabcdef', xdigitchars)
  finally
    " Do not leak the modified 'isprint' into tests that run after this one.
    let &isprint = save_isprint
  endtry
endfunc
81
" Run the character class checks with 'regexpengine' set to 1.
func Test_classes_re1()
  let save_re = &regexpengine
  set regexpengine=1
  try
    call s:classes_test()
  finally
    " Do not leak the forced engine into tests that run after this one.
    let &regexpengine = save_re
  endtry
endfunc
86
" Run the character class checks with 'regexpengine' set to 2.
func Test_classes_re2()
  let save_re = &regexpengine
  set regexpengine=2
  try
    call s:classes_test()
  finally
    " Do not leak the forced engine into tests that run after this one.
    let &regexpengine = save_re
  endtry
endfunc