forked from aniani/vim
Problem: regex: wrong match when searching multi-byte char
case-insensitive (diffsetter)
Solution: Apply proper case-folding for characters and search-string
This patch does the following 4 things:
1) When the regexp engine compares two utf-8 codepoints case
insensitive it may match an adjacent character, because it assumes
it can step over as many bytes as the pattern contains.
This however is not necessarily true because of case-folding, a
multi-byte UTF-8 character can be considered equal to some
single-byte value.
Let's consider the pattern 'ſ' and the string 's'. When comparing and
ignoring case, the single character 's' matches, and since it matches
Vim will try to step over the match (by the amount of bytes of the
pattern), assuming that since it matches, the length of both strings is
the same.
However in that case, it should only step over the single byte value
's' by 1 byte and try to start matching after it again. So for the
backtracking engine we need to ensure:
* we try to match the correct length for the pattern and the text
* in case of a match, we step over it correctly
There is one tricky thing for the backtracing engine. We also need to
calculate correctly the number of bytes to compare the 2 different
utf-8 strings s1 and s2. So we will count the number of characters in
s1 that the byte len specified. Then we count the number of bytes to
step over the same number of characters in string s2 and then we can
correctly compare the 2 utf-8 strings.
2) A similar thing can happen for the NFA engine, when skipping to the
next character to test for a match. We are skipping over the regstart
pointer, however we do not consider the case that because of
case-folding we may need to adjust the number of bytes to skip over.
So this needs to be adjusted in find_match_text() as well.
3) A related issue turned out, when prog->match_text is actually empty.
In that case we should try to find the next match and skip this
condition.
4) When comparing characters using collections, we must also apply case
folding to each character in the collection and not just to the
current character from the search string. This doesn't apply to the
NFA engine, because internally it converts collections to branches
[abc] -> a\|b\|c
fixes: #14294
closes: #14756
Signed-off-by: Christian Brabandt <cb@256bit.org>
623 lines
23 KiB
VimL
623 lines
23 KiB
VimL
" Tests for regexp in utf8 encoding
|
||
|
||
source shared.vim
|
||
|
||
func s:equivalence_test()
|
||
let str = "A<><41><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>ゾ<EFBFBD><E382BE><EFBFBD>廎<EFBFBD>廕<EFBFBD>滯廕戶漲廕兕漯廕矜漁廕唸熔廕氮熄 B<><42>廎<EFBFBD><E5BB8E>廎<EFBFBD> C<><43><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>廎<EFBFBD><E5BB8E> D<><44><EFBFBD>廎𢈈<E5BB8E>廎墰<E5BB8E>廎<EFBFBD> E<><45><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>廎竢<E5BB8E>廎嘣<E5BB8E>廎𦸇爾廕筵獐廕擔<E5BB95>廙<EFBFBD><E5BB99>廙<EFBFBD> F<>廎嵴<E5BB8E> G<><47><EFBFBD>罌<EFBFBD>エオジ廎𥻗<E5BB8E> H臚藻<E8879A>廎S舅廎艮落廎芬惕 I<><49><EFBFBD><EFBFBD>蘑蘆蘇蠔襤<E8A094><E8A5A4><EFBFBD><EFBFBD>廎矜葬廙<E891AC><E5BB99> J譬<4A> K譯<4B>ガ廎唸葡廎氯惟<E6B0AF><E6839F> L贏躉躅醴<E8BA85><E986B4>廎嗤虜廎筵蜈漹<E89C88> M廎擔<E5BB8E>廜<EFBFBD> N<><4E><EFBFBD><EFBFBD>ゼ廜<E382BC><E5BB9C>廜<EFBFBD><E5BB9C><EFBFBD><EFBFBD> O<><4F><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>ギグヂ<E382B0><E38382><EFBFBD><EFBFBD><EFBFBD><EFBFBD>廜𣉖<E5BB9C>廜靟<E5BB9C>廙𣉖<E5BB99>廙靟<E5BB99>廙竢<E5BB99>廙嘣<E5BB99>廙𦸇<E5BB99>廙<EFBFBD>誥 P④廜竢<E5BB9C>漹<EFBFBD> Q<> R<><52><EFBFBD><EFBFBD><EFBFBD><EFBFBD>廜嘣<E5BB9C>廜𦸇<E5BB9C>漹曰𩵼 S<><53><EFBFBD><EFBFBD><EFBFBD>廜<EFBFBD>飾廜戶髡廜兩掛<E585A9><E68E9B> T籠聾臟⑵⑷<E291B5><E291B7>廜花僧廜桑僭 U<><55><EFBFBD><EFBFBD>襯讀贗躓酈⑸<E98588><E291B8><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>廜聊僑廜嗤兢廜筵誘廙艮豪廙花賑廙桑趕 V⑻廜澄嗾 W霽廕<E99CBD>廕<EFBFBD><E5BB95>廕<EFBFBD><E5BB95> X廕𢈈<E5BB95> Y<>韃顫⑼<E9A1AB><E291BC>廕墰輔廙氮辣廙<E8BEA3> Z饕驍鬚ⅰ廕靟<E5BB95>廕婙惚 a<>獺璽瓊瓣疇<E793A3><E79687><EFBFBD><EFBFBD><EFBFBD>ゥタ<E382A5><E382BF>廑𥕥<E5BB91>廕𠹳滿廕€漸廕扭漫廕後滬廕脊滷廕喔熊廕猾悼 b<><62>廘矜<E5BB98>廎<EFBFBD><E5BB8E>廎<EFBFBD> c癟<63><E7999F><EFBFBD><EFBFBD><EFBFBD><EFBFBD>廎㕓<E5BB8E><E39593><EFBFBD> d<><64><EFBFBD>廘凍<E5BB98>廑𤒹<E5BB91>廎溆<E5BB8E>廎𤒹<E5BB8E> e癡矇礙禱<E7A499><E7A6B1><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>廑𠯆<E5BB91>廎䤾<E5BB8E>廎𧘲<E5BB8E>廕嫗獄廕賦瑪廙<E791AA><E5BB99>廙<EFBFBD><E5BB99> f<>廘桑<E5BB98>廎<EFBFBD><E5BB8E> g<><67>纂耀ォカス<E382AB>廑<EFBFBD>腹<EFBFBD><E885B9> h艦藹<E889A6>廎€艇廎扭萱廎後<E5BB8E>漹刷<E6BCB9> i穫穩簾簿藺蘋蘊蠕<E8988A><E8A095><EFBFBD>禸廑𥕝葉廎脊<E5BB8E>廙<EFBFBD> j警ゴ<E8ADA6> k譟<6B>キ廑<E382AD>萵廎喔葭漹虎<E6BCB9> l贍躁躂<E8BA81><E8BA82><EFBFBD>廎猿號廎頗蜇漹<E89C87> m廘脊蛾廜<E89BBE><E5BB9C> n簽<6E><E7B0BD><EFBFBD><EFBFBD>ソ廘唸<E5BB98>廜<EFBFBD><E5BB9C>廜刅<E5BB9C><E58885><EFBFBD> o簷籀繫繭繹繪<E7B9B9><E7B9AA><EFBFBD>①<EFBFBD>クケッ<E382B1><E38383><EFBFBD><EFBFBD><EFBFBD><EFBFBD>伂廜溆<E5BB9C>廜𤒹<E5BB9C>廙溆<E5BB99>廙𤒹<E5BB99>廙鐧<E5BB99>廙䟭<E5BB99>廙鍅<E5BB99>廙﹥誨 p⑤廘晨善廑<E59684><E5BB91>廜<EFBFBD> q<><71> r<><72><EFBFBD><EFBFBD><EFBFBD><EFBFBD>刓廘聊絨廑刅<E5BB91>廜鍅<E5BB9C><E98D85><EFBFBD> s<><73><EFBFBD>禳<EFBFBD><E7A6B3>廘氮<E5BB98>廜﹥馳廜丟鳩廜抱恢 t籟聽襲⑴⑶<E291B4><E291B6>廘菲鼠廜凍僖廜晨<E5BB9C>漹<EFBFBD> u羅繳羶羹觼贖躑轡鑄鑒<E99184><E99192>⑹<EFBFBD><E291B9><EFBFBD><EFBFBD><EFBFBD><EFBFBD>廘擔<E5BB98>廜喔僱廜猿凳廜頗誑廙扭貍廙後賒廙脊跼 v<>廑𣉖厭廜<E58EAD> w霾廕<E99CBE><E5BB95>廕<EFBFBD><E5BB95>廕刅<E5BB95> x廕𦘒<E5BB95> y羸藩韁⑽<E99F81><E291BD>廕𥕥<E5BB95>廙喔輓廙猿遜 z驕髒鱉ⅱ廘嗤<E5BB98>廕𤒹<E5BB95>廕𨰝惇"
|
||
let groups = split(str)
|
||
for group1 in groups
|
||
for c in split(group1, '\zs')
|
||
" next statement confirms that equivalence class matches every
|
||
" character in group
|
||
call assert_match('^[[=' .. c .. '=]]*$', group1)
|
||
for group2 in groups
|
||
if group2 != group1
|
||
" next statement converts that equivalence class doesn't match
|
||
" character in any other group
|
||
call assert_equal(-1, match(group2, '[[=' .. c .. '=]]'), c)
|
||
endif
|
||
endfor
|
||
endfor
|
||
endfor
|
||
endfunc
|
||
|
||
func Test_equivalence_re1()
|
||
set re=1
|
||
call s:equivalence_test()
|
||
set re=0
|
||
endfunc
|
||
|
||
func Test_equivalence_re2()
|
||
set re=2
|
||
call s:equivalence_test()
|
||
set re=0
|
||
endfunc
|
||
|
||
func s:classes_test()
|
||
if has('win32')
|
||
set iskeyword=@,48-57,_,192-255
|
||
endif
|
||
set isprint=@,161-255
|
||
call assert_equal('Mot繹rhead', matchstr('Mot繹rhead', '[[:print:]]\+'))
|
||
|
||
let alnumchars = ''
|
||
let alphachars = ''
|
||
let backspacechar = ''
|
||
let blankchars = ''
|
||
let cntrlchars = ''
|
||
let digitchars = ''
|
||
let escapechar = ''
|
||
let graphchars = ''
|
||
let lowerchars = ''
|
||
let printchars = ''
|
||
let punctchars = ''
|
||
let returnchar = ''
|
||
let spacechars = ''
|
||
let tabchar = ''
|
||
let upperchars = ''
|
||
let xdigitchars = ''
|
||
let identchars = ''
|
||
let identchars1 = ''
|
||
let kwordchars = ''
|
||
let kwordchars1 = ''
|
||
let fnamechars = ''
|
||
let fnamechars1 = ''
|
||
let i = 1
|
||
while i <= 255
|
||
let c = nr2char(i)
|
||
if c =~ '[[:alpha:]]'
|
||
let alphachars .= c
|
||
endif
|
||
if c =~ '[[:alnum:]]'
|
||
let alnumchars .= c
|
||
endif
|
||
if c =~ '[[:backspace:]]'
|
||
let backspacechar .= c
|
||
endif
|
||
if c =~ '[[:blank:]]'
|
||
let blankchars .= c
|
||
endif
|
||
if c =~ '[[:cntrl:]]'
|
||
let cntrlchars .= c
|
||
endif
|
||
if c =~ '[[:digit:]]'
|
||
let digitchars .= c
|
||
endif
|
||
if c =~ '[[:escape:]]'
|
||
let escapechar .= c
|
||
endif
|
||
if c =~ '[[:graph:]]'
|
||
let graphchars .= c
|
||
endif
|
||
if c =~ '[[:lower:]]'
|
||
let lowerchars .= c
|
||
endif
|
||
if c =~ '[[:print:]]'
|
||
let printchars .= c
|
||
endif
|
||
if c =~ '[[:punct:]]'
|
||
let punctchars .= c
|
||
endif
|
||
if c =~ '[[:return:]]'
|
||
let returnchar .= c
|
||
endif
|
||
if c =~ '[[:space:]]'
|
||
let spacechars .= c
|
||
endif
|
||
if c =~ '[[:tab:]]'
|
||
let tabchar .= c
|
||
endif
|
||
if c =~ '[[:upper:]]'
|
||
let upperchars .= c
|
||
endif
|
||
if c =~ '[[:xdigit:]]'
|
||
let xdigitchars .= c
|
||
endif
|
||
if c =~ '[[:ident:]]'
|
||
let identchars .= c
|
||
endif
|
||
if c =~ '\i'
|
||
let identchars1 .= c
|
||
endif
|
||
if c =~ '[[:keyword:]]'
|
||
let kwordchars .= c
|
||
endif
|
||
if c =~ '\k'
|
||
let kwordchars1 .= c
|
||
endif
|
||
if c =~ '[[:fname:]]'
|
||
let fnamechars .= c
|
||
endif
|
||
if c =~ '\f'
|
||
let fnamechars1 .= c
|
||
endif
|
||
let i += 1
|
||
endwhile
|
||
|
||
call assert_equal('ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz', alphachars)
|
||
call assert_equal('0123456789ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz', alnumchars)
|
||
call assert_equal("\b", backspacechar)
|
||
call assert_equal("\t ", blankchars)
|
||
call assert_equal("\x01\x02\x03\x04\x05\x06\x07\b\t\n\x0b\f\r\x0e\x0f\x10\x11\x12\x13\x14\x15\x16\x17\x18\x19\x1a\e\x1c\x1d\x1e\x1f\x7f", cntrlchars)
|
||
call assert_equal("0123456789", digitchars)
|
||
call assert_equal("\<Esc>", escapechar)
|
||
call assert_equal('!"#$%&''()*+,-./0123456789:;<=>?@ABCDEFGHIJKLMNOPQRSTUVWXYZ[\]^_`abcdefghijklmnopqrstuvwxyz{|}~', graphchars)
|
||
call assert_equal('abcdefghijklmnopqrstuvwxyz繕<7A><E7B995>獺璽瓊瓣疇疆癟癡矇礙禱穫穩簾簿簸簽簷籀繫繭繹繪羅繳羶羹羸臘藩', lowerchars)
|
||
call assert_equal(' !"#$%&''()*+,-./0123456789:;<=>?@ABCDEFGHIJKLMNOPQRSTUVWXYZ[\]^_`abcdefghijklmnopqrstuvwxyz{|}~<7E>癒瞽瞿瞻瞼礎禮穡穢穠竄竅簫簧簪簞簣簡糧織繕繞繚繡繒繙罈翹翻職聶<E881B7><E881B6><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>獺璽瓊瓣疇疆癟癡矇礙禱穫穩簾簿簸簽簷籀繫繭繹繩繪羅繳羶羹羸臘藩', printchars)
|
||
call assert_equal('!"#$%&''()*+,-./:;<=>?@[\]^_`{|}~', punctchars)
|
||
call assert_equal('ABCDEFGHIJKLMNOPQRSTUVWXYZ<59><5A><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>', upperchars)
|
||
call assert_equal("\r", returnchar)
|
||
call assert_equal("\t\n\x0b\f\r ", spacechars)
|
||
call assert_equal("\t", tabchar)
|
||
call assert_equal('0123456789ABCDEFabcdef', xdigitchars)
|
||
|
||
if has('win32')
|
||
let identchars_ok = '0123456789ABCDEFGHIJKLMNOPQRSTUVWXYZ_abcdefghijklmnopqrstuvwxyz<79><7A><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>癒瞽瞿瞻瞼礎禮繕<E7A6AE><E7B995><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>獺璽瓊瓣疇疆癟癡矇礙禱穫穩簾簿簸簽簷籀繫繭繹繪羅繳羶羹羸臘藩'
|
||
let kwordchars_ok = '0123456789ABCDEFGHIJKLMNOPQRSTUVWXYZ_abcdefghijklmnopqrstuvwxyz繕<7A><E7B995><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>獺璽瓊瓣疇疆癟癡矇礙禱穫穩簾簿簸簽簷籀繫繭繹繩繪羅繳羶羹羸臘藩'
|
||
else
|
||
let identchars_ok = '0123456789ABCDEFGHIJKLMNOPQRSTUVWXYZ_abcdefghijklmnopqrstuvwxyz繕<7A><E7B995><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>獺璽瓊瓣疇疆癟癡矇礙禱穫穩簾簿簸簽簷籀繫繭繹繩繪羅繳羶羹羸臘藩'
|
||
let kwordchars_ok = '0123456789ABCDEFGHIJKLMNOPQRSTUVWXYZ_abcdefghijklmnopqrstuvwxyz繕<7A><E7B995><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>獺璽瓊瓣疇疆癟癡矇礙禱穫穩簾簿簸簽簷籀繫繭繹繩繪羅繳羶羹羸臘藩'
|
||
endif
|
||
|
||
if has('win32')
|
||
let fnamechars_ok = '!#$%+,-./0123456789:=@ABCDEFGHIJKLMNOPQRSTUVWXYZ[\]_abcdefghijklmnopqrstuvwxyz{}~<7E>癒瞽瞿瞻瞼礎禮穡穢穠竄竅簫簧簪簞簣簡糧織繕繞繚繡繒繙罈翹翻職聶<E881B7><E881B6><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>獺璽瓊瓣疇疆癟癡矇礙禱穫穩簾簿簸簽簷籀繫繭繹繩繪羅繳羶羹羸臘藩'
|
||
elseif has('amiga')
|
||
let fnamechars_ok = '$+,-./0123456789:ABCDEFGHIJKLMNOPQRSTUVWXYZ_abcdefghijklmnopqrstuvwxyz~<7E>癒瞽瞿瞻瞼礎禮穡穢穠竄竅簫簧簪簞簣簡糧織繕繞繚繡繒繙罈翹翻職聶<E881B7><E881B6><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>獺璽瓊瓣疇疆癟癡矇礙禱穫穩簾簿簸簽簷籀繫繭繹繩繪羅繳羶羹羸臘藩'
|
||
elseif has('vms')
|
||
let fnamechars_ok = '#$%+,-./0123456789:;<>ABCDEFGHIJKLMNOPQRSTUVWXYZ[]_abcdefghijklmnopqrstuvwxyz~<7E>癒瞽瞿瞻瞼礎禮穡穢穠竄竅簫簧簪簞簣簡糧織繕繞繚繡繒繙罈翹翻職聶<E881B7><E881B6><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>獺璽瓊瓣疇疆癟癡矇礙禱穫穩簾簿簸簽簷籀繫繭繹繩繪羅繳羶羹羸臘藩'
|
||
else
|
||
let fnamechars_ok = '#$%+,-./0123456789=ABCDEFGHIJKLMNOPQRSTUVWXYZ_abcdefghijklmnopqrstuvwxyz~<7E>癒瞽瞿瞻瞼礎禮穡穢穠竄竅簫簧簪簞簣簡糧織繕繞繚繡繒繙罈翹翻職聶<E881B7><E881B6><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>獺璽瓊瓣疇疆癟癡矇礙禱穫穩簾簿簸簽簷籀繫繭繹繩繪羅繳羶羹羸臘藩'
|
||
endif
|
||
|
||
call assert_equal(identchars_ok, identchars)
|
||
call assert_equal(kwordchars_ok, kwordchars)
|
||
call assert_equal(fnamechars_ok, fnamechars)
|
||
|
||
call assert_equal(identchars1, identchars)
|
||
call assert_equal(kwordchars1, kwordchars)
|
||
call assert_equal(fnamechars1, fnamechars)
|
||
endfunc
|
||
|
||
func Test_classes_re1()
|
||
set re=1
|
||
call s:classes_test()
|
||
set re=0
|
||
endfunc
|
||
|
||
func Test_classes_re2()
|
||
set re=2
|
||
call s:classes_test()
|
||
set re=0
|
||
endfunc
|
||
|
||
func Test_reversed_range()
|
||
for re in range(0, 2)
|
||
exe 'set re=' . re
|
||
call assert_fails('call match("abc def", "[c-a]")', 'E944:', re)
|
||
endfor
|
||
set re=0
|
||
endfunc
|
||
|
||
func Test_large_class()
|
||
set re=1
|
||
call assert_fails('call match("abc def", "[\u3000-\u4000]")', 'E945:')
|
||
set re=2
|
||
call assert_equal(0, 'abc def' =~# '[\u3000-\u4000]')
|
||
call assert_equal(1, "\u3042" =~# '[\u3000-\u4000]')
|
||
set re=0
|
||
endfunc
|
||
|
||
func Test_optmatch_toolong()
|
||
set re=1
|
||
" Can only handle about 8000 characters.
|
||
let pat = '\\%[' .. repeat('x', 9000) .. ']'
|
||
call assert_fails('call match("abc def", "' .. pat .. '")', 'E339:')
|
||
set re=0
|
||
endfunc
|
||
|
||
" Test for regexp patterns with multi-byte support, using utf-8.
|
||
func Test_multibyte_chars()
|
||
" tl is a List of Lists with:
|
||
" 2: test auto/old/new 0: test auto/old 1: test auto/new
|
||
" regexp pattern
|
||
" text to test the pattern on
|
||
" expected match (optional)
|
||
" expected submatch 1 (optional)
|
||
" expected submatch 2 (optional)
|
||
" etc.
|
||
" When there is no match use only the first two items.
|
||
let tl = []
|
||
|
||
" Multi-byte character tests.
|
||
call add(tl, [2, '[[:alpha:][=a=]]\+', '879 aia瓊璽aiuvna ', 'aia瓊璽aiuvna'])
|
||
call add(tl, [2, '[[=a=]]\+', 'dda瓊璽bcd', 'a瓊璽']) " equivalence classes
|
||
call add(tl, [2, '[^鉊<> ]\+', '鉊﹤腹 oijasoifjos ifjoisj f osij j 鉊﹤腹鉊﹤腹鉊<E885B9> abcd', 'oijasoifjos'])
|
||
call add(tl, [2, ' [^ ]\+', 'start 鉊{bcd鉊<64> ', ' 鉊{bcd鉊<64>'])
|
||
call add(tl, [2, '[鉊︴:alpha:][=a=]]\+', '879 aia瓊鉊 ̄R腹aiuvna ', 'aia瓊鉊 ̄R腹aiuvna'])
|
||
|
||
" this is not a normal "i" but 0xec
|
||
call add(tl, [2, '\p\+', '穫a', '穫a'])
|
||
call add(tl, [2, '\p*', 'a<><61>', 'a<><61>'])
|
||
|
||
" Test recognition of some character classes
|
||
call add(tl, [2, '\i\+', '&*穡xx ', 'xx'])
|
||
call add(tl, [2, '\f\+', '&*<2A>fname ', 'fname'])
|
||
|
||
" Test composing character matching
|
||
call add(tl, [2, '.鉊<>', 'x鉊﹤<E9898A>x y鉊『', 'y鉊<79>'])
|
||
call add(tl, [2, '.鉊﹤<E9898A>', 'x鉊﹤<E9898A>x y鉊『', 'x鉊﹤<E9898A>'])
|
||
call add(tl, [2, "\u05b9", " x\u05b9 ", "x\u05b9"])
|
||
call add(tl, [2, ".\u05b9", " x\u05b9 ", "x\u05b9"])
|
||
call add(tl, [2, "\u05b9\u05bb", " x\u05b9\u05bb ", "x\u05b9\u05bb"])
|
||
call add(tl, [2, ".\u05b9\u05bb", " x\u05b9\u05bb ", "x\u05b9\u05bb"])
|
||
call add(tl, [2, "\u05bb\u05b9", " x\u05b9\u05bb ", "x\u05b9\u05bb"])
|
||
call add(tl, [2, ".\u05bb\u05b9", " x\u05b9\u05bb ", "x\u05b9\u05bb"])
|
||
call add(tl, [2, "\u05b9", " y\u05bb x\u05b9 ", "x\u05b9"])
|
||
call add(tl, [2, ".\u05b9", " y\u05bb x\u05b9 ", "x\u05b9"])
|
||
call add(tl, [2, "\u05b9", " y\u05bb\u05b9 x\u05b9 ", "y\u05bb\u05b9"])
|
||
call add(tl, [2, ".\u05b9", " y\u05bb\u05b9 x\u05b9 ", "y\u05bb\u05b9"])
|
||
call add(tl, [1, "\u05b9\u05bb", " y\u05b9 x\u05b9\u05bb ", "x\u05b9\u05bb"])
|
||
call add(tl, [2, ".\u05b9\u05bb", " y\u05bb x\u05b9\u05bb ", "x\u05b9\u05bb"])
|
||
call add(tl, [2, "a", "ca\u0300t"])
|
||
call add(tl, [2, "ca", "ca\u0300t"])
|
||
call add(tl, [2, "a\u0300", "ca\u0300t", "a\u0300"])
|
||
call add(tl, [2, 'a\%C', "ca\u0300t", "a\u0300"])
|
||
call add(tl, [2, 'ca\%C', "ca\u0300t", "ca\u0300"])
|
||
call add(tl, [2, 'ca\%Ct', "ca\u0300t", "ca\u0300t"])
|
||
|
||
" Test \Z
|
||
call add(tl, [2, '繳\Z', 'x'])
|
||
call add(tl, [2, '<27><><EFBFBD><EFBFBD>\Z', '<27><><EFBFBD><EFBFBD>', '<27><><EFBFBD><EFBFBD>'])
|
||
call add(tl, [2, '<27>眥<EFBFBD><E79CA5>硌<EFBFBD>\Z', '<27><><EFBFBD><EFBFBD>', '<27><><EFBFBD><EFBFBD>'])
|
||
call add(tl, [2, '<27><><EFBFBD><EFBFBD>\Z', '<27>眥<EFBFBD><E79CA5>硌<EFBFBD>', '<27>眥<EFBFBD><E79CA5>硌<EFBFBD>'])
|
||
call add(tl, [2, '<27>眥<EFBFBD><E79CA5>硌<EFBFBD>\Z', '<27>眥<EFBFBD><E79CA5>硌<EFBFBD>', '<27>眥<EFBFBD><E79CA5>硌<EFBFBD>'])
|
||
call add(tl, [2, '<27>眥\Z', '<27>眥<EFBFBD>硊', '<27>硊'])
|
||
call add(tl, [2, "蚹\u200d\u05b9x\\Z", "x蚹\u200d\u05b9xy", "蚹\u200d\u05b9x"])
|
||
call add(tl, [2, "蚹\u200d\u05b9x\\Z", "x蚹\u200dxy", "蚹\u200dx"])
|
||
call add(tl, [2, "蚹\u200dx\\Z", "x蚹\u200d\u05b9xy", "蚹\u200d\u05b9x"])
|
||
call add(tl, [2, "蚹\u200dx\\Z", "x蚹\u200dxy", "蚹\u200dx"])
|
||
call add(tl, [2, "\u05b9\\Z", "xyz"])
|
||
call add(tl, [2, "\\Z\u05b9", "xyz"])
|
||
call add(tl, [2, "\u05b9\\Z", "xy\u05b9z", "y\u05b9"])
|
||
call add(tl, [2, "\\Z\u05b9", "xy\u05b9z", "y\u05b9"])
|
||
call add(tl, [1, "\u05b9\\+\\Z", "xy\u05b9z\u05b9 ", "y\u05b9z\u05b9"])
|
||
call add(tl, [1, "\\Z\u05b9\\+", "xy\u05b9z\u05b9 ", "y\u05b9z\u05b9"])
|
||
|
||
" Combining different tests and features
|
||
call add(tl, [2, '[^[=a=]]\+', 'dda瓊璽bcd', 'dd'])
|
||
|
||
" Run the tests
|
||
for t in tl
|
||
let re = t[0]
|
||
let pat = t[1]
|
||
let text = t[2]
|
||
let matchidx = 3
|
||
for engine in [0, 1, 2]
|
||
if engine == 2 && re == 0 || engine == 1 && re == 1
|
||
continue
|
||
endif
|
||
let ®expengine = engine
|
||
try
|
||
let l = matchlist(text, pat)
|
||
catch
|
||
call assert_report('Error ' . engine . ': pat: \"' . pat .
|
||
\ '\", text: \"' . text .
|
||
\ '\", caused an exception: \"' . v:exception . '\"')
|
||
endtry
|
||
" check the match itself
|
||
if len(l) == 0 && len(t) > matchidx
|
||
call assert_report('Error ' . engine . ': pat: \"' . pat .
|
||
\ '\", text: \"' . text .
|
||
\ '\", did not match, expected: \"' . t[matchidx] . '\"')
|
||
elseif len(l) > 0 && len(t) == matchidx
|
||
call assert_report('Error ' . engine . ': pat: \"' . pat .
|
||
\ '\", text: \"' . text . '\", match: \"' . l[0] .
|
||
\ '\", expected no match')
|
||
elseif len(t) > matchidx && l[0] != t[matchidx]
|
||
call assert_report('Error ' . engine . ': pat: \"' . pat .
|
||
\ '\", text: \"' . text . '\", match: \"' . l[0] .
|
||
\ '\", expected: \"' . t[matchidx] . '\"')
|
||
else
|
||
" Test passed
|
||
endif
|
||
if len(l) > 0
|
||
" check all the nine submatches
|
||
for i in range(1, 9)
|
||
if len(t) <= matchidx + i
|
||
let e = ''
|
||
else
|
||
let e = t[matchidx + i]
|
||
endif
|
||
if l[i] != e
|
||
call assert_report('Error ' . engine . ': pat: \"' . pat .
|
||
\ '\", text: \"' . text . '\", submatch ' . i .
|
||
\ ': \"' . l[i] . '\", expected: \"' . e . '\"')
|
||
endif
|
||
endfor
|
||
unlet i
|
||
endif
|
||
endfor
|
||
endfor
|
||
set regexpengine&
|
||
endfunc
|
||
|
||
" check that 'ambiwidth' does not change the meaning of \p
|
||
func Test_regexp_ambiwidth()
|
||
set regexpengine=1 ambiwidth=single
|
||
call assert_equal(0, match("\u00EC", '\p'))
|
||
set regexpengine=1 ambiwidth=double
|
||
call assert_equal(0, match("\u00EC", '\p'))
|
||
set regexpengine=2 ambiwidth=single
|
||
call assert_equal(0, match("\u00EC", '\p'))
|
||
set regexpengine=2 ambiwidth=double
|
||
call assert_equal(0, match("\u00EC", '\p'))
|
||
set regexpengine& ambiwidth&
|
||
endfunc
|
||
|
||
func Run_regexp_ignore_case()
|
||
call assert_equal('iI襤', substitute('iI襤', '\([iI襤]\)', '\1', 'g'))
|
||
|
||
call assert_equal('iIx', substitute('iI襤', '\c\([襤]\)', 'x', 'g'))
|
||
call assert_equal('xx襤', substitute('iI襤', '\(i\c\)', 'x', 'g'))
|
||
call assert_equal('iIx', substitute('iI襤', '\(襤\c\)', 'x', 'g'))
|
||
call assert_equal('iIx', substitute('iI襤', '\c\(\%u0130\)', 'x', 'g'))
|
||
call assert_equal('iIx', substitute('iI襤', '\c\([\u0130]\)', 'x', 'g'))
|
||
call assert_equal('iIx', substitute('iI襤', '\c\([\u012f-\u0131]\)', 'x', 'g'))
|
||
endfunc
|
||
|
||
func Test_regexp_ignore_case()
|
||
set regexpengine=1
|
||
call Run_regexp_ignore_case()
|
||
set regexpengine=2
|
||
call Run_regexp_ignore_case()
|
||
set regexpengine&
|
||
endfunc
|
||
|
||
" Tests for regexp with multi-byte encoding and various magic settings
|
||
func Run_regexp_multibyte_magic()
|
||
let text =<< trim END
|
||
1 a aa abb abbccc
|
||
2 d dd dee deefff
|
||
3 g gg ghh ghhiii
|
||
4 j jj jkk jkklll
|
||
5 m mm mnn mnnooo
|
||
6 x ^aa$ x
|
||
7 (a)(b) abbaa
|
||
8 axx [ab]xx
|
||
9 鉊徇腹鉆ū 鉊冢腹x
|
||
a 鉊冢腹x 鉊徇腹鉆ū
|
||
b <20>~<EFBFBD><EFBD9E>具<EFBFBD>
|
||
c x 竅<EFBFBD>洪
|
||
d 憭拐蝙x
|
||
e <20><>烵y
|
||
f <20><><EFBFBD>z
|
||
g a<EFBFBD>搓b
|
||
j 0123<EFBFBD>巳
|
||
k combinations
|
||
l 瓣繹 羹帢<EFBFBD><EFBFBD><EFBFBD>
|
||
END
|
||
|
||
new
|
||
call setline(1, text)
|
||
exe 'normal /a*b\{2}c\+/e' .. "\<CR>x"
|
||
call assert_equal('1 a aa abb abbcc', getline('.'))
|
||
exe 'normal /\Md\*e\{2}f\+/e' .. "\<CR>x"
|
||
call assert_equal('2 d dd dee deeff', getline('.'))
|
||
set nomagic
|
||
exe 'normal /g\*h\{2}i\+/e' .. "\<CR>x"
|
||
call assert_equal('3 g gg ghh ghhii', getline('.'))
|
||
exe 'normal /\mj*k\{2}l\+/e' .. "\<CR>x"
|
||
call assert_equal('4 j jj jkk jkkll', getline('.'))
|
||
exe 'normal /\vm*n{2}o+/e' .. "\<CR>x"
|
||
call assert_equal('5 m mm mnn mnnoo', getline('.'))
|
||
exe 'normal /\V^aa$/' .. "\<CR>x"
|
||
call assert_equal('6 x aa$ x', getline('.'))
|
||
set magic
|
||
exe 'normal /\v(a)(b)\2\1\1/e' .. "\<CR>x"
|
||
call assert_equal('7 (a)(b) abba', getline('.'))
|
||
exe 'normal /\V[ab]\(\[xy]\)\1' .. "\<CR>x"
|
||
call assert_equal('8 axx ab]xx', getline('.'))
|
||
|
||
" search for multi-byte without composing char
|
||
exe 'normal /鉊<>' .. "\<CR>x"
|
||
call assert_equal('9 鉊徇腹鉆ū 鉊軍', getline('.'))
|
||
|
||
" search for multi-byte with composing char
|
||
exe 'normal /鉊﹤<E9898A>' .. "\<CR>x"
|
||
call assert_equal('a 鉊冢腹x 鉊咦', getline('.'))
|
||
|
||
" find word by change of word class
|
||
exe 'normal /<2F>﹏<<3C>怒<EFBFBD>\><3E><>' .. "\<CR>x"
|
||
call assert_equal('b <20>怒<EFBFBD><E68092><EFBFBD>', getline('.'))
|
||
|
||
" Test \%u, [\u] and friends
|
||
" c
|
||
exe 'normal /\%u20ac' .. "\<CR>x"
|
||
call assert_equal('c x 竅x', getline('.'))
|
||
" d
|
||
exe 'normal /[\u4f7f\u5929]\+' .. "\<CR>x"
|
||
call assert_equal('d 雿篛', getline('.'))
|
||
" e
|
||
exe 'normal /\%U12345678' .. "\<CR>x"
|
||
call assert_equal('e y', getline('.'))
|
||
" f
|
||
exe 'normal /[\U1234abcd\u1234\uabcd]' .. "\<CR>x"
|
||
call assert_equal('f z', getline('.'))
|
||
" g
|
||
exe 'normal /\%d21879b' .. "\<CR>x"
|
||
call assert_equal('g abb', getline('.'))
|
||
|
||
" j Test backwards search from a multi-byte char
|
||
exe "normal /x\<CR>x?.\<CR>x"
|
||
call assert_equal('j 012<31><32>', getline('.'))
|
||
" k
|
||
let @w=':%s#comb[i]nations#<23><>廜␌<E5BB9C>怚<EFBFBD>帢<EFBFBD><E5B8A2><EFBFBD>#g'
|
||
@w
|
||
call assert_equal('k <20><>廜␌<E5BB9C>怚<EFBFBD>帢<EFBFBD><E5B8A2><EFBFBD>', getline(18))
|
||
|
||
close!
|
||
endfunc
|
||
|
||
func Test_regexp_multibyte_magic()
|
||
set regexpengine=1
|
||
call Run_regexp_multibyte_magic()
|
||
set regexpengine=2
|
||
call Run_regexp_multibyte_magic()
|
||
set regexpengine&
|
||
endfunc
|
||
|
||
" Test for 7.3.192
|
||
" command ":s/ \?/ /g" splits multi-byte characters into bytes
|
||
func Test_split_multibyte_to_bytes()
|
||
new
|
||
call setline(1, 'l 瓣繹 羹帢<E7BEB9><E5B8A2><EFBFBD>')
|
||
s/ \?/ /g
|
||
call assert_equal(' l 瓣 繹 羹 帢<><E5B8A2><EFBFBD>', getline(1))
|
||
close!
|
||
endfunc
|
||
|
||
" Test for matchstr() with multibyte characters
|
||
func Test_matchstr_multibyte()
|
||
new
|
||
call assert_equal('<27>', matchstr("<22><><EFBFBD><EFBFBD>", ".", 0, 2))
|
||
call assert_equal('<27><>', matchstr("<22><><EFBFBD><EFBFBD>", "..", 0, 2))
|
||
call assert_equal('<27>', matchstr("<22><><EFBFBD><EFBFBD>", ".", 0, 0))
|
||
call assert_equal('<27>', matchstr("<22><><EFBFBD><EFBFBD>", ".", 4, -1))
|
||
close!
|
||
endfunc
|
||
|
||
" Test for 7.4.636
|
||
" A search with end offset gets stuck at end of file.
|
||
func Test_search_with_end_offset()
|
||
new
|
||
call setline(1, ['', 'dog(a', 'cat('])
|
||
exe "normal /(/e+\<CR>"
|
||
normal n"ayn
|
||
call assert_equal("a\ncat(", @a)
|
||
close!
|
||
endfunc
|
||
|
||
" Check that "^" matches even when the line starts with a combining char
|
||
func Test_match_start_of_line_combining()
|
||
new
|
||
call setline(1, ['', "\u05ae", ''])
|
||
exe "normal gg/^\<CR>"
|
||
call assert_equal(2, getcurpos()[1])
|
||
bwipe!
|
||
endfunc
|
||
|
||
" Check that [[:upper:]] matches for automatic engine
|
||
func Test_match_char_class_upper()
|
||
new
|
||
|
||
" Test 1: [[:upper:]]\{2,\}
|
||
set regexpengine=0
|
||
call setline(1, ['05. <20><>苤<EFBFBD>觓 <20> <20><><EFBFBD><EFBFBD>觓苭 邾<>郱. <20>. <20>訄赲邽迡迮郇郕郋, <20>. <20>郋赲訄郅<E8A884> 邽 <20>. 虼迮<E899BC><E8BFAE>迮<EFBFBD>訄 ...', '05. PJESNJA O GJEROJAKH mus. A. Davidjenko, M. Kovalja i B. Shjekhtjera ...'])
|
||
call cursor(1,1)
|
||
let search_cmd='norm /\<[[:upper:]]\{2,\}\>' .. "\<CR>"
|
||
exe search_cmd
|
||
call assert_equal(4, searchcount().total, 'TEST 1')
|
||
set regexpengine=1
|
||
exe search_cmd
|
||
call assert_equal(2, searchcount().total, 'TEST 1')
|
||
set regexpengine=2
|
||
exe search_cmd
|
||
call assert_equal(4, searchcount().total, 'TEST 1')
|
||
|
||
" Test 2: [[:upper:]].\+
|
||
let search_cmd='norm /\<[[:upper:]].\+\>' .. "\<CR>"
|
||
set regexpengine=0
|
||
exe search_cmd
|
||
call assert_equal(2, searchcount().total, 'TEST 2')
|
||
set regexpengine=1
|
||
exe search_cmd
|
||
call assert_equal(1, searchcount().total, 'TEST 2')
|
||
set regexpengine=2
|
||
exe search_cmd
|
||
call assert_equal(2, searchcount().total, 'TEST 2')
|
||
|
||
" Test 3: [[:lower:]]\+
|
||
let search_cmd='norm /\<[[:lower:]]\+\>' .. "\<CR>"
|
||
set regexpengine=0
|
||
exe search_cmd
|
||
call assert_equal(4, searchcount().total, 'TEST 3 lower')
|
||
set regexpengine=1
|
||
exe search_cmd
|
||
call assert_equal(2, searchcount().total, 'TEST 3 lower')
|
||
set regexpengine=2
|
||
exe search_cmd
|
||
call assert_equal(4, searchcount().total, 'TEST 3 lower')
|
||
|
||
" clean up
|
||
set regexpengine=0
|
||
bwipe!
|
||
endfunc
|
||
|
||
func Test_match_invalid_byte()
|
||
call writefile(0z630a.765d30aa0a.2e0a.790a.4030, 'Xinvalid', 'D')
|
||
new
|
||
source Xinvalid
|
||
bwipe!
|
||
endfunc
|
||
|
||
func Test_match_illegal_byte()
|
||
" Text has illegal bytes which need to be set explicitly
|
||
let lines = ["norm :set no\x01\<CR>", "silent n\xff", "silent norm :b\xff\<CR>"]
|
||
call writefile(lines, 'Xregexp', 'D')
|
||
call system(GetVimCommand() .. ' -X -Z -e -s -S Xregexp -c qa!')
|
||
endfunc
|
||
|
||
func Test_match_too_complicated()
|
||
set regexpengine=1
|
||
exe "noswapfile vsplit \xeb\xdb\x99"
|
||
silent! buf \&\zs*\zs*0
|
||
bwipe!
|
||
set regexpengine=0
|
||
endfunc
|
||
|
||
func Test_combining_chars_in_collection()
|
||
new
|
||
for i in range(0,2)
|
||
exe "set re=".i
|
||
put =['<27><>', '<27>', '<27> a<>', 'abcd']
|
||
:%s/[<5B><>]//
|
||
call assert_equal(['', '', '<27>', '<27> a<>', 'abcd'], getline(1,'$'))
|
||
%d
|
||
endfor
|
||
bw!
|
||
endfunc
|
||
|
||
func Test_search_multibyte_match_ascii()
|
||
new
|
||
" Match single '鰱' and 's'
|
||
call setline(1, 'das abc heraus abc 鰱ich abc 鰱ind')
|
||
for i in range(0, 2)
|
||
exe "set re="..i
|
||
let ic_match = matchbufline('%', '\c\%u17f', 1, '$')->mapnew({idx, val -> val.text})
|
||
let noic_match = matchbufline('%', '\C\%u17f', 1, '$')->mapnew({idx, val -> val.text})
|
||
call assert_equal(['s', 's', '鰱','鰱'], ic_match, "Ignorecase Regex-engine: " .. &re)
|
||
call assert_equal(['鰱','鰱'], noic_match, "No-Ignorecase Regex-engine: " .. &re)
|
||
endfor
|
||
" Match several '鰱鰱' and 'ss'
|
||
call setline(1, 'das abc herauss abc 鰱鰱ich abc 鰱ind')
|
||
for i in range(0, 2)
|
||
exe "set re="..i
|
||
let ic_match = matchbufline('%', '\c\%u17f\%u17f', 1, '$')->mapnew({idx, val -> val.text})
|
||
let noic_match = matchbufline('%', '\C\%u17f\%u17f', 1, '$')->mapnew({idx, val -> val.text})
|
||
let ic_match2 = matchbufline('%', '\c\%u17f\+', 1, '$')->mapnew({idx, val -> val.text})
|
||
let noic_match2 = matchbufline('%', '\C\%u17f\+', 1, '$')->mapnew({idx, val -> val.text})
|
||
let ic_match3 = matchbufline('%', '\c[\u17f]\+', 1, '$')->mapnew({idx, val -> val.text})
|
||
let noic_match3 = matchbufline('%', '\C[\u17f]\+', 1, '$')->mapnew({idx, val -> val.text})
|
||
|
||
call assert_equal(['ss', '鰱鰱'], ic_match, "Ignorecase Regex-engine: " .. &re)
|
||
call assert_equal(['鰱鰱'], noic_match, "No-Ignorecase Regex-engine: " .. &re)
|
||
call assert_equal(['s', 'ss', '鰱鰱', '鰱'], ic_match2, "Ignorecase Regex-engine: " .. &re)
|
||
call assert_equal(['鰱鰱','鰱'], noic_match2, "No-Ignorecase Regex-engine: " .. &re)
|
||
call assert_equal(['s', 'ss', '鰱鰱', '鰱'], ic_match3, "Ignorecase Collection Regex-engine: " .. &re)
|
||
call assert_equal(['鰱鰱','鰱'], noic_match3, "No-Ignorecase Collection Regex-engine: " .. &re)
|
||
endfor
|
||
bw!
|
||
endfunc
|
||
|
||
" vim: shiftwidth=2 sts=2 expandtab
|