2018-02-11 11:30:26 -07:00
" Tests for regexp in latin1 encoding
2021-05-24 11:43:47 -07:00
2021-03-26 22:39:45 -07:00
" set encoding=latin1
2018-02-11 11:30:26 -07:00
scriptencoding latin1
2021-05-24 11:43:47 -07:00
source check .vim
2018-02-11 11:30:26 -07:00
func s:equivalence_test()
  " Verify equivalence classes ([[=x=]]) with the currently selected regexp
  " engine.  "str" is a list of whitespace-separated groups; every character
  " of a group must match all characters of its own group and no character of
  " any other group.
  "
  " The accented letters are written with "\u" escapes so that the test data
  " does not depend on the encoding the script file is stored in.
  " NOTE(review): the accented members were unreadable in the reviewed copy
  " and were reconstructed as the Latin-1 letters that share a base letter
  " (group sizes match the original) - confirm against the upstream test.
  let str = "A\u00c0\u00c1\u00c2\u00c3\u00c4\u00c5 B C D E\u00c8\u00c9\u00ca\u00cb F G H I\u00cc\u00cd\u00ce\u00cf J K L M N\u00d1 O\u00d2\u00d3\u00d4\u00d5\u00d6\u00d8 P Q R S T U\u00d9\u00da\u00db\u00dc V W X Y\u00dd Z "
  \      .. "a\u00e0\u00e1\u00e2\u00e3\u00e4\u00e5 b c d e\u00e8\u00e9\u00ea\u00eb f g h i\u00ec\u00ed\u00ee\u00ef j k l m n\u00f1 o\u00f2\u00f3\u00f4\u00f5\u00f6\u00f8 p q r s t u\u00f9\u00fa\u00fb\u00fc v w x y\u00fd\u00ff z "
  \      .. "0 1 2 3 4 5 6 7 8 9 "
  \      .. "` ~ ! ? ; : . , / \\ ' \" | < > [ ] { } ( ) @ # $ % ^ & * _ - + \b \e \f \n \r \t"

  let groups = split(str)
  for group1 in groups
    for c in split(group1, '\zs')
      " next statement confirms that equivalence class matches every
      " character in group
      call assert_match('^[[=' . c . '=]]*$', group1)
      for group2 in groups
        if group2 != group1
          " next statement confirms that equivalence class doesn't match
          " a character in any other group
          call assert_equal(-1, match(group2, '[[=' . c . '=]]'))
        endif
      endfor
    endfor
  endfor
endfunc
func Test_equivalence_re1()
  " Equivalence class test with 'regexpengine' set to 1.
  " Currently always skipped: the throw below ends the test before the
  " remaining statements run.
  throw 'skipped: Nvim does not support enc=latin1'

  set re=1
  call s:equivalence_test()
  " Reset the engine selection so it does not leak into later tests.
  set re=0
endfunc
func Test_equivalence_re2()
  " Equivalence class test with 'regexpengine' set to 2.
  " Currently always skipped: the throw below ends the test before the
  " remaining statements run.
  throw 'skipped: Nvim does not support enc=latin1'

  set re=2
  call s:equivalence_test()
  " Reset the engine selection so it does not leak into later tests.
  set re=0
endfunc
2019-02-17 17:03:25 -07:00
func Test_range_with_newline()
  " Collections whose ranges involve "\n" must not match the single line "a":
  " search() is expected to return 0 for each pattern.
  new
  call setline(1, "a")
  for pat in ["[ -*\\n- ]", "[ -*\\t-\\n]"]
    call assert_equal(0, search(pat))
  endfor
  bwipe!
endfunc
2019-02-17 17:34:19 -07:00
2021-03-28 08:15:19 -07:00
func Test_pattern_compile_speed()
  " Setting 'spellcapcheck' to a deeply nested pattern must finish within the
  " time window asserted below (0.01 to 10 seconds).
  CheckOption spellcapcheck
  CheckFunction reltimefloat

  let start = reltime()
  " this used to be very slow, now it should be about a second
  set spc=\\v(((((Nxxxxxxx&&xxxx){179})+)+)+){179}
  call assert_inrange(0.01, 10.0, reltimefloat(reltime(start)))
  " Go back to the default value instead of leaving the option empty, so
  " later tests are not run with a modified 'spellcapcheck'.
  set spc&
endfunc
2019-02-17 17:34:19 -07:00
func Test_get_equi_class()
  " Searching for an unterminated "[[=" or "[[." item must work: the line
  " that contains the text is used as the pattern and must be found on
  " line 1.
  new
  " Incomplete equivalence class caused invalid memory access
  s/^/[[=
  call assert_equal(1, search(getline(1)))

  " Same check for an incomplete collation element
  s/.*/[[.
  call assert_equal(1, search(getline(1)))

  " Discard the scratch buffer, like the other tests in this file do.
  bwipe!
endfunc
2019-03-07 04:05:22 -07:00
func Test_rex_init()
  " With regexp engine 1, [[:keyword:]] must follow the 'iskeyword' value of
  " the buffer being searched: with "a-z" the first hit is on line 1 ('abc'),
  " in a second buffer with "A-Z" it is on line 2 ('ABC').
  let save_incsearch = &incsearch
  set noincsearch
  set re=1

  new
  setlocal iskeyword=a-z
  call setline(1, ['abc', 'ABC'])
  call assert_equal(1, search('[[:keyword:]]'))

  new
  setlocal iskeyword=A-Z
  call setline(1, ['abc', 'ABC'])
  call assert_equal(2, search('[[:keyword:]]'))

  bwipe!
  bwipe!
  set re=0
  " Undo the 'incsearch' change made above so it does not leak into later
  " tests.
  let &incsearch = save_incsearch
endfunc
2019-03-01 21:38:36 -07:00
func Test_backref()
  " A back reference to a closed group works with both engines (selected
  " with the \%#= prefix); a back reference inside the group it refers to
  " must fail with E65.
  new
  call setline(1, ['one', 'two', 'three', 'four', 'five'])

  " 'ee' only occurs in 'three' on line 3
  for engine in [1, 2]
    call assert_equal(3, search('\%#=' . engine . '\(e\)\1'))
  endfor

  for engine in [1, 2]
    call assert_fails('call search("\\%#=' . engine . '\\(e\\1\\)")', 'E65:')
  endfor

  bwipe!
endfunc
2019-05-25 13:31:17 -07:00
func Test_multi_failure()
  " Invalid multi items must be rejected; each regexp engine reports its own
  " error number.  Every entry is: engine, search command, expected error.
  for [engine, cmd, errcode] in [
        \ [1, '/a**', 'E61:'],
        \ [1, '/a*\+', 'E62:'],
        \ [1, '/a\{a}', 'E554:'],
        \ [2, '/a**', 'E871:'],
        \ [2, '/a*\+', 'E871:'],
        \ [2, '/a\{a}', 'E870:'],
        \ ]
    let &re = engine
    call assert_fails(cmd, errcode)
  endfor
  set re=0
endfunc
2019-07-24 22:41:42 -07:00
func Test_recursive_addstate()
  " Currently always skipped: the throw below ends the test before the
  " search is attempted.
  throw 'skipped: TODO: '

  " This will call addstate() recursively until it runs into the limit.
  " The search is expected to find nothing.
  call assert_equal(0, search('\v((){328}){389}'))
endfunc
2019-07-24 23:22:02 -07:00
func Test_out_of_memory()
  " A pattern that needs too much memory must fail with E363 instead of
  " completing the search.
  new
  s/^/,n
  " This will be slow...
  call assert_fails('call search("\\v((n||<)+);")', 'E363:')
  " Discard the scratch buffer, like the other tests in this file do.
  bwipe!
endfunc
2019-12-15 08:57:43 -07:00
" Tests for regexp patterns without multi-byte support.
func Test_regexp_single_line_pat()
  " Table-driven test: every entry of "tl" is matched with matchlist() using
  " the selected 'regexpengine' values, then the whole match and the nine
  " submatches are compared with the expected values.
  "
  " tl is a List of Lists with:
  "    regexp engines to test
  "       0 - test with 'regexpengine' values 0 and 1
  "       1 - test with 'regexpengine' values 0 and 2
  "       2 - test with 'regexpengine' values 0, 1 and 2
  "    regexp pattern
  "    text to test the pattern on
  "    expected match (optional)
  "    expected submatch 1 (optional)
  "    expected submatch 2 (optional)
  "    etc.
  "  When there is no match use only the first three items (engines, pattern
  "  and text).
  let tl = []

  call add(tl, [2, 'ab', 'aab', 'ab'])
  call add(tl, [2, 'b', 'abcdef', 'b'])
  call add(tl, [2, 'bc*', 'abccccdef', 'bcccc'])
  call add(tl, [2, 'bc\{-}', 'abccccdef', 'b'])
  call add(tl, [2, 'bc\{-}\(d\)', 'abccccdef', 'bccccd', 'd'])
  call add(tl, [2, 'bc*', 'abbdef', 'b'])
  call add(tl, [2, 'c*', 'ccc', 'ccc'])
  call add(tl, [2, 'bc*', 'abdef', 'b'])
  call add(tl, [2, 'c*', 'abdef', ''])
  call add(tl, [2, 'bc\+', 'abccccdef', 'bcccc'])
  call add(tl, [2, 'bc\+', 'abdef']) " no match

  " match newline character in a string
  call add(tl, [2, 'o\nb', "foo\nbar", "o\nb"])

  " operator \|
  call add(tl, [2, 'a\|ab', 'cabd', 'a']) " alternation is ordered

  call add(tl, [2, 'c\?', 'ccb', 'c'])
  call add(tl, [2, 'bc\?', 'abd', 'b'])
  call add(tl, [2, 'bc\?', 'abccd', 'bc'])

  call add(tl, [2, '\va{1}', 'ab', 'a'])

  call add(tl, [2, '\va{2}', 'aa', 'aa'])
  call add(tl, [2, '\va{2}', 'caad', 'aa'])
  call add(tl, [2, '\va{2}', 'aba'])
  call add(tl, [2, '\va{2}', 'ab'])
  call add(tl, [2, '\va{2}', 'abaa', 'aa'])
  call add(tl, [2, '\va{2}', 'aaa', 'aa'])

  call add(tl, [2, '\vb{1}', 'abca', 'b'])
  call add(tl, [2, '\vba{2}', 'abaa', 'baa'])
  call add(tl, [2, '\vba{3}', 'aabaac'])

  call add(tl, [2, '\v(ab){1}', 'ab', 'ab', 'ab'])
  call add(tl, [2, '\v(ab){1}', 'dabc', 'ab', 'ab'])
  call add(tl, [2, '\v(ab){1}', 'acb'])

  call add(tl, [2, '\v(ab){0,2}', 'acb', "", ""])
  call add(tl, [2, '\v(ab){0,2}', 'ab', 'ab', 'ab'])
  call add(tl, [2, '\v(ab){1,2}', 'ab', 'ab', 'ab'])
  call add(tl, [2, '\v(ab){1,2}', 'ababc', 'abab', 'ab'])
  call add(tl, [2, '\v(ab){2,4}', 'ababcab', 'abab', 'ab'])
  call add(tl, [2, '\v(ab){2,4}', 'abcababa', 'abab', 'ab'])

  call add(tl, [2, '\v(ab){2}', 'abab', 'abab', 'ab'])
  call add(tl, [2, '\v(ab){2}', 'cdababe', 'abab', 'ab'])
  call add(tl, [2, '\v(ab){2}', 'abac'])
  call add(tl, [2, '\v(ab){2}', 'abacabab', 'abab', 'ab'])
  call add(tl, [2, '\v((ab){2}){2}', 'abababab', 'abababab', 'abab', 'ab'])
  call add(tl, [2, '\v((ab){2}){2}', 'abacabababab', 'abababab', 'abab', 'ab'])

  call add(tl, [2, '\v(a{1}){1}', 'a', 'a', 'a'])
  call add(tl, [2, '\v(a{2}){1}', 'aa', 'aa', 'aa'])
  call add(tl, [2, '\v(a{2}){1}', 'aaac', 'aa', 'aa'])
  call add(tl, [2, '\v(a{2}){1}', 'daaac', 'aa', 'aa'])
  call add(tl, [2, '\v(a{1}){2}', 'daaac', 'aa', 'a'])
  call add(tl, [2, '\v(a{1}){2}', 'aaa', 'aa', 'a'])
  call add(tl, [2, '\v(a{2})+', 'adaac', 'aa', 'aa'])
  call add(tl, [2, '\v(a{2})+', 'aa', 'aa', 'aa'])
  call add(tl, [2, '\v(a{2}){1}', 'aa', 'aa', 'aa'])
  call add(tl, [2, '\v(a{1}){2}', 'aa', 'aa', 'a'])
  call add(tl, [2, '\v(a{1}){1}', 'a', 'a', 'a'])
  call add(tl, [2, '\v(a{2}){2}', 'aaaa', 'aaaa', 'aa'])
  call add(tl, [2, '\v(a{2}){2}', 'aaabaaaa', 'aaaa', 'aa'])

  call add(tl, [2, '\v(a+){2}', 'dadaac', 'aa', 'a'])
  call add(tl, [2, '\v(a{3}){2}', 'aaaaaaa', 'aaaaaa', 'aaa'])

  call add(tl, [2, '\v(a{1,2}){2}', 'daaac', 'aaa', 'a'])
  call add(tl, [2, '\v(a{1,3}){2}', 'daaaac', 'aaaa', 'a'])
  call add(tl, [2, '\v(a{1,3}){2}', 'daaaaac', 'aaaaa', 'aa'])
  call add(tl, [2, '\v(a{1,3}){3}', 'daac'])
  call add(tl, [2, '\v(a{1,2}){2}', 'dac'])
  call add(tl, [2, '\v(a+)+', 'daac', 'aa', 'aa'])
  call add(tl, [2, '\v(a+)+', 'aaa', 'aaa', 'aaa'])
  call add(tl, [2, '\v(a+){1,2}', 'aaa', 'aaa', 'aaa'])
  call add(tl, [2, '\v(a+)(a+)', 'aaa', 'aaa', 'aa', 'a'])
  call add(tl, [2, '\v(a{3})+', 'daaaac', 'aaa', 'aaa'])
  call add(tl, [2, '\v(a|b|c)+', 'aacb', 'aacb', 'b'])
  call add(tl, [2, '\v(a|b|c){2}', 'abcb', 'ab', 'b'])
  call add(tl, [2, '\v(abc){2}', 'abcabd',])
  call add(tl, [2, '\v(abc){2}', 'abdabcabc', 'abcabc', 'abc'])

  call add(tl, [2, 'a*', 'cc', ''])
  call add(tl, [2, '\v(a*)+', 'cc', ''])
  call add(tl, [2, '\v((ab)+)+', 'ab', 'ab', 'ab', 'ab'])
  call add(tl, [2, '\v(((ab)+)+)+', 'ab', 'ab', 'ab', 'ab', 'ab'])
  call add(tl, [2, '\v(((ab)+)+)+', 'dababc', 'abab', 'abab', 'abab', 'ab'])
  call add(tl, [2, '\v(a{0,2})+', 'cc', ''])
  call add(tl, [2, '\v(a*)+', '', ''])
  call add(tl, [2, '\v((a*)+)+', '', ''])
  call add(tl, [2, '\v((ab)*)+', '', ''])
  call add(tl, [2, '\va{1,3}', 'aab', 'aa'])
  call add(tl, [2, '\va{2,3}', 'abaa', 'aa'])

  call add(tl, [2, '\v((ab)+|c*)+', 'abcccaba', 'abcccab', '', 'ab'])
  call add(tl, [2, '\v(a{2})|(b{3})', 'bbabbbb', 'bbb', '', 'bbb'])
  call add(tl, [2, '\va{2}|b{2}', 'abab'])
  call add(tl, [2, '\v(a)+|(c)+', 'bbacbaacbbb', 'a', 'a'])
  call add(tl, [2, '\vab{2,3}c', 'aabbccccccccccccc', 'abbc'])
  call add(tl, [2, '\vab{2,3}c', 'aabbbccccccccccccc', 'abbbc'])
  call add(tl, [2, '\vab{2,3}cd{2,3}e', 'aabbbcddee', 'abbbcdde'])
  call add(tl, [2, '\va(bc){2}d', 'aabcbfbc'])
  call add(tl, [2, '\va*a{2}', 'a',])
  call add(tl, [2, '\va*a{2}', 'aa', 'aa'])
  call add(tl, [2, '\va*a{2}', 'aaa', 'aaa'])
  call add(tl, [2, '\va*a{2}', 'bbbabcc',])
  call add(tl, [2, '\va*b*|a*c*', 'a', 'a'])
  call add(tl, [2, '\va{1}b{1}|a{1}b{1}', ''])

  " submatches
  call add(tl, [2, '\v(a)', 'ab', 'a', 'a'])
  call add(tl, [2, '\v(a)(b)', 'ab', 'ab', 'a', 'b'])
  call add(tl, [2, '\v(ab)(b)(c)', 'abbc', 'abbc', 'ab', 'b', 'c'])
  call add(tl, [2, '\v((a)(b))', 'ab', 'ab', 'ab', 'a', 'b'])
  call add(tl, [2, '\v(a)|(b)', 'ab', 'a', 'a'])

  call add(tl, [2, '\v(a*)+', 'aaaa', 'aaaa', ''])
  call add(tl, [2, 'x', 'abcdef'])

  "
  " Simple tests
  "

  " Search single groups
  call add(tl, [2, 'ab', 'aab', 'ab'])
  call add(tl, [2, 'ab', 'baced'])
  call add(tl, [2, 'ab', ' ab ', 'ab'])

  " Search multi-modifiers
  call add(tl, [2, 'x*', 'xcd', 'x'])
  call add(tl, [2, 'x*', 'xxxxxxxxxxxxxxxxsofijiojgf', 'xxxxxxxxxxxxxxxx'])
  " empty match is good
  call add(tl, [2, 'x*', 'abcdoij', ''])
  " no match here
  call add(tl, [2, 'x\+', 'abcdoin'])
  call add(tl, [2, 'x\+', 'abcdeoijdfxxiuhfij', 'xx'])
  call add(tl, [2, 'x\+', 'xxxxx', 'xxxxx'])
  call add(tl, [2, 'x\+', 'abc x siufhiush xxxxxxxxx', 'x'])
  call add(tl, [2, 'x\=', 'x sdfoij', 'x'])
  call add(tl, [2, 'x\=', 'abc sfoij', '']) " empty match is good
  call add(tl, [2, 'x\=', 'xxxxxxxxx c', 'x'])
  call add(tl, [2, 'x\?', 'x sdfoij', 'x'])
  " empty match is good
  call add(tl, [2, 'x\?', 'abc sfoij', ''])
  call add(tl, [2, 'x\?', 'xxxxxxxxxx c', 'x'])

  call add(tl, [2, 'a\{0,0}', 'abcdfdoij', ''])
  " same thing as 'a?'
  call add(tl, [2, 'a\{0,1}', 'asiubid axxxaaa', 'a'])
  " same thing as 'a\{0,1}'
  call add(tl, [2, 'a\{1,0}', 'asiubid axxxaaa', 'a'])
  call add(tl, [2, 'a\{3,6}', 'aa siofuh'])
  call add(tl, [2, 'a\{3,6}', 'aaaaa asfoij afaa', 'aaaaa'])
  call add(tl, [2, 'a\{3,6}', 'aaaaaaaa', 'aaaaaa'])
  call add(tl, [2, 'a\{0}', 'asoiuj', ''])
  call add(tl, [2, 'a\{2}', 'aaaa', 'aa'])
  call add(tl, [2, 'a\{2}', 'iuash fiusahfliusah fiushfilushfi uhsaifuh askfj nasfvius afg aaaa sfiuhuhiushf', 'aa'])
  call add(tl, [2, 'a\{2}', 'abcdefghijklmnopqrestuvwxyz1234567890'])
  " same thing as 'a*'
  call add(tl, [2, 'a\{0,}', 'oij sdigfusnf', ''])
  call add(tl, [2, 'a\{0,}', 'aaaaa aa', 'aaaaa'])
  call add(tl, [2, 'a\{2,}', 'sdfiougjdsafg'])
  call add(tl, [2, 'a\{2,}', 'aaaaasfoij ', 'aaaaa'])
  call add(tl, [2, 'a\{5,}', 'xxaaaaxxx '])
  call add(tl, [2, 'a\{5,}', 'xxaaaaaxxx ', 'aaaaa'])
  call add(tl, [2, 'a\{,0}', 'oidfguih iuhi hiu aaaa', ''])
  call add(tl, [2, 'a\{,5}', 'abcd', 'a'])
  call add(tl, [2, 'a\{,5}', 'aaaaaaaaaa', 'aaaaa'])
  " leading star as normal char when \{} follows
  call add(tl, [2, '^*\{4,}$', '***'])
  call add(tl, [2, '^*\{4,}$', '****', '****'])
  call add(tl, [2, '^*\{4,}$', '*****', '*****'])
  " same thing as 'a*'
  call add(tl, [2, 'a\{}', 'bbbcddiuhfcd', ''])
  call add(tl, [2, 'a\{}', 'aaaaioudfh coisf jda', 'aaaa'])

  call add(tl, [2, 'a\{-0,0}', 'abcdfdoij', ''])
  " anti-greedy version of 'a?'
  call add(tl, [2, 'a\{-0,1}', 'asiubid axxxaaa', ''])
  call add(tl, [2, 'a\{-3,6}', 'aa siofuh'])
  call add(tl, [2, 'a\{-3,6}', 'aaaaa asfoij afaa', 'aaa'])
  call add(tl, [2, 'a\{-3,6}', 'aaaaaaaa', 'aaa'])
  call add(tl, [2, 'a\{-0}', 'asoiuj', ''])
  call add(tl, [2, 'a\{-2}', 'aaaa', 'aa'])
  call add(tl, [2, 'a\{-2}', 'abcdefghijklmnopqrestuvwxyz1234567890'])
  call add(tl, [2, 'a\{-0,}', 'oij sdigfusnf', ''])
  call add(tl, [2, 'a\{-0,}', 'aaaaa aa', ''])
  call add(tl, [2, 'a\{-2,}', 'sdfiougjdsafg'])
  call add(tl, [2, 'a\{-2,}', 'aaaaasfoij ', 'aa'])
  call add(tl, [2, 'a\{-,0}', 'oidfguih iuhi hiu aaaa', ''])
  call add(tl, [2, 'a\{-,5}', 'abcd', ''])
  call add(tl, [2, 'a\{-,5}', 'aaaaaaaaaa', ''])
  " anti-greedy version of 'a*'
  call add(tl, [2, 'a\{-}', 'bbbcddiuhfcd', ''])
  call add(tl, [2, 'a\{-}', 'aaaaioudfh coisf jda', ''])

  " Test groups of characters and submatches
  call add(tl, [2, '\(abc\)*', 'abcabcabc', 'abcabcabc', 'abc'])
  call add(tl, [2, '\(ab\)\+', 'abababaaaaa', 'ababab', 'ab'])
  call add(tl, [2, '\(abaaaaa\)*cd', 'cd', 'cd', ''])
  call add(tl, [2, '\(test1\)\? \(test2\)\?', 'test1 test3', 'test1 ', 'test1', ''])
  call add(tl, [2, '\(test1\)\= \(test2\) \(test4443\)\=', ' test2 test4443 yupiiiiiiiiiii', ' test2 test4443', '', 'test2', 'test4443'])
  call add(tl, [2, '\(\(sub1\) hello \(sub 2\)\)', 'asterix sub1 hello sub 2 obelix', 'sub1 hello sub 2', 'sub1 hello sub 2', 'sub1', 'sub 2'])
  call add(tl, [2, '\(\(\(yyxxzz\)\)\)', 'abcdddsfiusfyyzzxxyyxxzz', 'yyxxzz', 'yyxxzz', 'yyxxzz', 'yyxxzz'])
  call add(tl, [2, '\v((ab)+|c+)+', 'abcccaba', 'abcccab', 'ab', 'ab'])
  call add(tl, [2, '\v((ab)|c*)+', 'abcccaba', 'abcccab', '', 'ab'])
  call add(tl, [2, '\v(a(c*)+b)+', 'acbababaaa', 'acbabab', 'ab', ''])
  call add(tl, [2, '\v(a|b*)+', 'aaaa', 'aaaa', ''])
  " NOTE(review): the non-ASCII character of this entry was unreadable in
  " the reviewed copy; U+00E1 (a with acute) is assumed and written as an
  " escape so it does not depend on the file encoding - confirm.
  call add(tl, [2, '\p*', "a\u00e1 ", "a\u00e1 "])

  " Test greedy-ness and lazy-ness
  call add(tl, [2, 'a\{-2,7}', 'aaaaaaaaaaaaa', 'aa'])
  call add(tl, [2, 'a\{-2,7}x', 'aaaaaaaaax', 'aaaaaaax'])
  call add(tl, [2, 'a\{2,7}', 'aaaaaaaaaaaaaaaaaaaa', 'aaaaaaa'])
  call add(tl, [2, 'a\{2,7}x', 'aaaaaaaaax', 'aaaaaaax'])
  call add(tl, [2, '\vx(.{-,8})yz(.*)', 'xayxayzxayzxayz', 'xayxayzxayzxayz', 'ayxa', 'xayzxayz'])
  call add(tl, [2, '\vx(.*)yz(.*)', 'xayxayzxayzxayz', 'xayxayzxayzxayz', 'ayxayzxayzxa', ''])
  call add(tl, [2, '\v(a{1,2}){-2,3}', 'aaaaaaa', 'aaaa', 'aa'])
  call add(tl, [2, '\v(a{-1,3})+', 'aa', 'aa', 'a'])
  call add(tl, [2, '^\s\{-}\zs\( x\|x$\)', ' x', ' x', ' x'])
  call add(tl, [2, '^\s\{-}\zs\(x\| x$\)', ' x', ' x', ' x'])
  call add(tl, [2, '^\s\{-}\ze\(x\| x$\)', ' x', '', ' x'])
  call add(tl, [2, '^\(\s\{-}\)\(x\| x$\)', ' x', ' x', '', ' x'])

  " Test Character classes
  call add(tl, [2, '\d\+e\d\d', 'test 10e23 fd', '10e23'])

  " Test collections and character range []
  call add(tl, [2, '\v[a]', 'abcd', 'a'])
  call add(tl, [2, 'a[bcd]', 'abcd', 'ab'])
  call add(tl, [2, 'a[b-d]', 'acbd', 'ac'])
  call add(tl, [2, '[a-d][e-f][x-x]d', 'cexdxx', 'cexd'])
  call add(tl, [2, '\v[[:alpha:]]+', 'abcdefghijklmnopqrstuvwxyz6', 'abcdefghijklmnopqrstuvwxyz'])
  call add(tl, [2, '[[:alpha:]\+]', '6x8', 'x'])
  call add(tl, [2, '[^abc]\+', 'abcabcabc'])
  call add(tl, [2, '[^abc]', 'defghiasijvoinasoiunbvb', 'd'])
  call add(tl, [2, '[^abc]\+', 'ddddddda', 'ddddddd'])
  call add(tl, [2, '[^a-d]\+', 'aaaAAAZIHFNCddd', 'AAAZIHFNC'])
  call add(tl, [2, '[a-f]*', 'iiiiiiii', ''])
  call add(tl, [2, '[a-f]*', 'abcdefgh', 'abcdef'])
  call add(tl, [2, '[^a-f]\+', 'abcdefgh', 'gh'])
  call add(tl, [2, '[a-c]\{-3,6}', 'abcabc', 'abc'])
  call add(tl, [2, '[^[:alpha:]]\+', 'abcccadfoij7787ysf287yrnccdu', '7787'])
  call add(tl, [2, '[-a]', '-', '-'])
  call add(tl, [2, '[a-]', '-', '-'])
  call add(tl, [2, '[a-f]*\c', 'ABCDEFGH', 'ABCDEF'])
  call add(tl, [2, '[abc][xyz]\c', '-af-AF-BY--', 'BY'])
  " filename regexp
  call add(tl, [2, '[-./[:alnum:]_~]\+', 'log13.file', 'log13.file'])
  " special chars
  call add(tl, [2, '[\]\^\-\\]\+', '\^\\\-\---^', '\^\\\-\---^'])
  " collation elem
  call add(tl, [2, '[[.a.]]\+', 'aa', 'aa'])
  " middle of regexp
  call add(tl, [2, 'abc[0-9]*ddd', 'siuhabc ii'])
  call add(tl, [2, 'abc[0-9]*ddd', 'adf abc44482ddd oijs', 'abc44482ddd'])
  call add(tl, [2, '\_[0-9]\+', 'asfi9888u', '9888'])
  call add(tl, [2, '[0-9\n]\+', 'asfi9888u', '9888'])
  call add(tl, [2, '\_[0-9]\+', "asfi\n9888u", "\n9888"])
  call add(tl, [2, '\_f', " \na ", "\n"])
  call add(tl, [2, '\_f\+', " \na ", "\na"])
  call add(tl, [2, '[0-9A-Za-z-_.]\+', " @0_a.A-{ ", "0_a.A-"])

  " Test start/end of line, start/end of file
  call add(tl, [2, '^a.', "a_\nb ", "a_"])
  call add(tl, [2, '^a.', "b a \na_"])
  call add(tl, [2, '.a$', " a\n "])
  call add(tl, [2, '.a$', " a b\n_a", "_a"])
  call add(tl, [2, '\%^a.', "a a\na", "a "])
  call add(tl, [2, '\%^a', " a \na "])
  call add(tl, [2, '.a\%$', " a\n "])
  call add(tl, [2, '.a\%$', " a\n_a", "_a"])

  " Test recognition of character classes
  call add(tl, [2, '[0-7]\+', 'x0123456789x', '01234567'])
  call add(tl, [2, '[^0-7]\+', '0a;X+% 897', 'a;X+% 89'])
  call add(tl, [2, '[0-9]\+', 'x0123456789x', '0123456789'])
  call add(tl, [2, '[^0-9]\+', '0a;X+% 9', 'a;X+% '])
  call add(tl, [2, '[0-9a-fA-F]\+', 'x0189abcdefg', '0189abcdef'])
  call add(tl, [2, '[^0-9A-Fa-f]\+', '0189g;X+% ab', 'g;X+% '])
  call add(tl, [2, '[a-z_A-Z0-9]\+', ';+aso_SfOij ', 'aso_SfOij'])
  call add(tl, [2, '[^a-z_A-Z0-9]\+', 'aSo_;+% sfOij', ';+% '])
  call add(tl, [2, '[a-z_A-Z]\+', '0abyz_ABYZ;', 'abyz_ABYZ'])
  call add(tl, [2, '[^a-z_A-Z]\+', 'abAB_09;+% yzYZ', '09;+% '])
  call add(tl, [2, '[a-z]\+', '0abcxyz1', 'abcxyz'])
  call add(tl, [2, '[a-z]\+', 'AabxyzZ', 'abxyz'])
  call add(tl, [2, '[^a-z]\+', 'a;X09+% x', ';X09+% '])
  call add(tl, [2, '[^a-z]\+', 'abX0;%yz', 'X0;%'])
  call add(tl, [2, '[a-zA-Z]\+', '0abABxzXZ9', 'abABxzXZ'])
  call add(tl, [2, '[^a-zA-Z]\+', 'ab09_;+ XZ', '09_;+ '])
  call add(tl, [2, '[A-Z]\+', 'aABXYZz', 'ABXYZ'])
  call add(tl, [2, '[^A-Z]\+', 'ABx0;%YZ', 'x0;%'])
  call add(tl, [2, '[a-z]\+\c', '0abxyzABXYZ;', 'abxyzABXYZ'])
  call add(tl, [2, '[A-Z]\+\c', '0abABxzXZ9', 'abABxzXZ'])
  call add(tl, [2, '\c[^a-z]\+', 'ab09_;+ XZ', '09_;+ '])
  call add(tl, [2, '\c[^A-Z]\+', 'ab09_;+ XZ', '09_;+ '])
  call add(tl, [2, '\C[^A-Z]\+', 'ABCOIJDEOIFNSD jsfoij sa', ' jsfoij sa'])

  " Tests for \z features
  " match ends at \ze
  call add(tl, [2, 'xx \ze test', 'xx '])
  call add(tl, [2, 'abc\zeend', 'oij abcend', 'abc'])
  call add(tl, [2, 'aa\zebb\|aaxx', ' aabb ', 'aa'])
  call add(tl, [2, 'aa\zebb\|aaxx', ' aaxx ', 'aaxx'])
  call add(tl, [2, 'aabb\|aa\zebb', ' aabb ', 'aabb'])
  call add(tl, [2, 'aa\zebb\|aaebb', ' aabb ', 'aa'])
  " match starts at \zs
  call add(tl, [2, 'abc\zsdd', 'ddabcddxyzt', 'dd'])
  call add(tl, [2, 'aa \zsax', ' ax'])
  call add(tl, [2, 'abc \zsmatch\ze abc', 'abc abc abc match abc abc', 'match'])
  call add(tl, [2, '\v(a \zsif .*){2}', 'a if then a if last', 'if last', 'a if last'])
  call add(tl, [2, '\>\zs.', 'aword. ', '.'])
  " NOTE(review): the '\s\zs\s\+' branch needs two adjacent whitespace
  " characters, which the text below does not contain as written - confirm
  " that the whitespace in the text and in the expected match is intact.
  call add(tl, [2, '\s\+\ze\[/\|\s\zs\s\+', 'is [a t', ' '])

  " Tests for \@= and \& features
  call add(tl, [2, 'abc\@=', 'abc', 'ab'])
  call add(tl, [2, 'abc\@=cd', 'abcd', 'abcd'])
  call add(tl, [2, 'abc\@=', 'ababc', 'ab'])
  " will never match, no matter the input text
  call add(tl, [2, 'abcd\@=e', 'abcd'])
  " will never match
  call add(tl, [2, 'abcd\@=e', 'any text in here ... '])
  call add(tl, [2, '\v(abc)@=..', 'xabcd', 'ab', 'abc'])
  call add(tl, [2, '\(.*John\)\@=.*Bob', 'here is John, and here is B'])
  call add(tl, [2, '\(John.*\)\@=.*Bob', 'John is Bobs friend', 'John is Bob', 'John is Bobs friend'])
  call add(tl, [2, '\<\S\+\())\)\@=', '$((i=i+1))', 'i=i+1', '))'])
  call add(tl, [2, '.*John\&.*Bob', 'here is John, and here is B'])
  call add(tl, [2, '.*John\&.*Bob', 'John is Bobs friend', 'John is Bob'])
  call add(tl, [2, '\v(test1)@=.*yep', 'this is a test1, yep it is', 'test1, yep', 'test1'])
  call add(tl, [2, 'foo\(bar\)\@!', 'foobar'])
  call add(tl, [2, 'foo\(bar\)\@!', 'foo bar', 'foo'])
  call add(tl, [2, 'if \(\(then\)\@!.\)*$', ' if then else'])
  call add(tl, [2, 'if \(\(then\)\@!.\)*$', ' if else ', 'if else ', ' '])
  call add(tl, [2, '\(foo\)\@!bar', 'foobar', 'bar'])
  call add(tl, [2, '\(foo\)\@!...bar', 'foobar'])
  call add(tl, [2, '^\%(.*bar\)\@!.*\zsfoo', ' bar foo '])
  call add(tl, [2, '^\%(.*bar\)\@!.*\zsfoo', ' foo bar '])
  call add(tl, [2, '^\%(.*bar\)\@!.*\zsfoo', ' foo xxx ', 'foo'])
  call add(tl, [2, '[ ]\@!\p\%([ ]\@!\p\)*:', 'implicit mappings:', 'mappings:'])
  call add(tl, [2, '[ ]\@!\p\([ ]\@!\p\)*:', 'implicit mappings:', 'mappings:', 's'])
  call add(tl, [2, 'm\k\+_\@=\%(_\@!\k\)\@<=\k\+e', 'mx__xe', 'mx__xe'])
  call add(tl, [2, '\%(\U\@<=S\k*\|S\l\)R', 'SuR', 'SuR'])

  " Combining different tests and features
  call add(tl, [2, '[[:alpha:]]\{-2,6}', '787abcdiuhsasiuhb4', 'ab'])
  call add(tl, [2, '', 'abcd', ''])
  call add(tl, [2, '\v(())', 'any possible text', ''])
  call add(tl, [2, '\v%(ab(xyz)c)', ' abxyzc ', 'abxyzc', 'xyz'])
  call add(tl, [2, '\v(test|)empty', 'tesempty', 'empty', ''])
  call add(tl, [2, '\v(a|aa)(a|aa)', 'aaa', 'aa', 'a', 'a'])

  " \%u and friends
  call add(tl, [2, '\%d32', 'yes no', ' '])
  call add(tl, [2, '\%o40', 'yes no', ' '])
  call add(tl, [2, '\%x20', 'yes no', ' '])
  call add(tl, [2, '\%u0020', 'yes no', ' '])
  call add(tl, [2, '\%U00000020', 'yes no', ' '])
  call add(tl, [2, '\%d0', "yes\x0ano", "\x0a"])

  "" \%[abc]
  call add(tl, [2, 'foo\%[bar]', 'fobar'])
  call add(tl, [2, 'foo\%[bar]', 'foobar', 'foobar'])
  call add(tl, [2, 'foo\%[bar]', 'fooxx', 'foo'])
  call add(tl, [2, 'foo\%[bar]', 'foobxx', 'foob'])
  call add(tl, [2, 'foo\%[bar]', 'foobaxx', 'fooba'])
  call add(tl, [2, 'foo\%[bar]', 'foobarxx', 'foobar'])
  call add(tl, [2, 'foo\%[bar]x', 'foobxx', 'foobx'])
  call add(tl, [2, 'foo\%[bar]x', 'foobarxx', 'foobarx'])
  call add(tl, [2, '\%[bar]x', 'barxx', 'barx'])
  call add(tl, [2, '\%[bar]x', 'bxx', 'bx'])
  call add(tl, [2, '\%[bar]x', 'xxx', 'x'])
  call add(tl, [2, 'b\%[[ao]r]', 'bar bor', 'bar'])
  call add(tl, [2, 'b\%[[]]r]', 'b]r bor', 'b]r'])
  call add(tl, [2, '@\%[\w\-]*', '<http://john.net/pandoc/>[@pandoc]', '@pandoc'])

  " Alternatives, must use first longest match
  call add(tl, [2, 'goo\|go', 'google', 'goo'])
  call add(tl, [2, '\<goo\|\<go', 'google', 'goo'])
  call add(tl, [2, '\<goo\|go', 'google', 'goo'])

  " Back references
  call add(tl, [2, '\(\i\+\) \1', ' abc abc', 'abc abc', 'abc'])
  call add(tl, [2, '\(\i\+\) \1', 'xgoo goox', 'goo goo', 'goo'])
  call add(tl, [2, '\(a\)\(b\)\(c\)\(dd\)\(e\)\(f\)\(g\)\(h\)\(i\)\1\2\3\4\5\6\7\8\9', 'xabcddefghiabcddefghix', 'abcddefghiabcddefghi', 'a', 'b', 'c', 'dd', 'e', 'f', 'g', 'h', 'i'])
  call add(tl, [2, '\(\d*\)a \1b', ' a b ', 'a b', ''])
  call add(tl, [2, '^.\(.\).\_..\1.', "aaa\naaa\nb", "aaa\naaa", 'a'])
  call add(tl, [2, '^.*\.\(.*\)/.\+\(\1\)\@<!$', 'foo.bat/foo.com', 'foo.bat/foo.com', 'bat'])
  call add(tl, [2, '^.*\.\(.*\)/.\+\(\1\)\@<!$', 'foo.bat/foo.bat'])
  call add(tl, [2, '^.*\.\(.*\)/.\+\(\1\)\@<=$', 'foo.bat/foo.bat', 'foo.bat/foo.bat', 'bat', 'bat'])
  call add(tl, [2, '\\\@<!\${\(\d\+\%(:.\{-}\)\?\\\@<!\)}', '2013-06-27${0}', '${0}', '0'])
  call add(tl, [2, '^\(a*\)\1$', 'aaaaaaaa', 'aaaaaaaa', 'aaaa'])
  call add(tl, [2, '^\(a\{-2,}\)\1\+$', 'aaaaaaaaa', 'aaaaaaaaa', 'aaa'])

  " Look-behind with limit
  call add(tl, [2, '<\@<=span.', 'xxspanxx<spanyyy', 'spany'])
  call add(tl, [2, '<\@1<=span.', 'xxspanxx<spanyyy', 'spany'])
  call add(tl, [2, '<\@2<=span.', 'xxspanxx<spanyyy', 'spany'])
  call add(tl, [2, '\(<<\)\@<=span.', 'xxspanxxxx<spanxx<<spanyyy', 'spany', '<<'])
  call add(tl, [2, '\(<<\)\@1<=span.', 'xxspanxxxx<spanxx<<spanyyy'])
  call add(tl, [2, '\(<<\)\@2<=span.', 'xxspanxxxx<spanxx<<spanyyy', 'spany', '<<'])
  call add(tl, [2, '\(foo\)\@<!bar.', 'xx foobar1 xbar2 xx', 'bar2'])

  " look-behind match in front of a zero-width item
  call add(tl, [2, '\v\C%(<Last Changed:\s+)@<=.*$', '" test header'])
  call add(tl, [2, '\v\C%(<Last Changed:\s+)@<=.*$', '" Last Changed: 1970', '1970'])
  call add(tl, [2, '\(foo\)\@<=\>', 'foobar'])
  call add(tl, [2, '\(foo\)\@<=\>', 'barfoo', '', 'foo'])
  call add(tl, [2, '\(foo\)\@<=.*', 'foobar', 'bar', 'foo'])

  " complicated look-behind match
  call add(tl, [2, '\(r\@<=\|\w\@<!\)\/', 'x = /word/;', '/'])
  call add(tl, [2, '^[a-z]\+\ze \&\(asdf\)\@<!', 'foo bar', 'foo'])

  "" \@>
  call add(tl, [2, '\(a*\)\@>a', 'aaaa'])
  call add(tl, [2, '\(a*\)\@>b', 'aaab', 'aaab', 'aaa'])
  call add(tl, [2, '^\(.\{-}b\)\@>.', ' abcbd', ' abc', ' ab'])
  call add(tl, [2, '\(.\{-}\)\(\)\@>$', 'abc', 'abc', 'abc', ''])
  " TODO: BT engine does not restore submatch after failure
  call add(tl, [1, '\(a*\)\@>a\|a\+', 'aaaa', 'aaaa'])

  " "\_" prepended negated collection matches EOL
  call add(tl, [2, '\_[^8-9]\+', "asfi\n9888", "asfi\n"])
  call add(tl, [2, '\_[^a]\+', "asfi\n9888", "sfi\n9888"])

  " Requiring lots of states.
  call add(tl, [2, '[0-9a-zA-Z]\{8}-\([0-9a-zA-Z]\{4}-\)\{3}[0-9a-zA-Z]\{12}', " 12345678-1234-1234-1234-123456789012 ", "12345678-1234-1234-1234-123456789012", "1234-"])

  " Skip adding state twice
  call add(tl, [2, '^\%(\%(^\s*#\s*if\>\|#\s*if\)\)\(\%>1c.*$\)\@=', "#if FOO", "#if", ' FOO'])

  " Test \%V atom
  call add(tl, [2, '\%>70vGesamt', 'Jean-Michel Charlier & Victor Hubinon\Gesamtausgabe [Salleck] Buck Danny {Jean-Michel Charlier & Victor Hubinon}\Gesamtausgabe', 'Gesamt'])

  " Test for ignoring case and matching repeated characters
  call add(tl, [2, '\cb\+', 'aAbBbBcC', 'bBbB'])

  " Run the tests
  " Remember the engine selection so it can be put back when done.
  let save_regexpengine = &regexpengine
  for t in tl
    let re = t[0]
    let pat = t[1]
    let text = t[2]
    let matchidx = 3
    for engine in [0, 1, 2]
      " Skip the engine that this entry excludes (see the table description).
      if engine == 2 && re == 0 || engine == 1 && re == 1
        continue
      endif
      let &regexpengine = engine
      try
        let l = matchlist(text, pat)
      catch
        call assert_report('Error ' . engine . ': pat: \"' . pat
              \ . '\", text: \"' . text . '\", caused an exception: \"'
              \ . v:exception . '\"')
        " There is no result for this engine; do not check a stale or
        " undefined "l".
        continue
      endtry
      " check the match itself
      if len(l) == 0 && len(t) > matchidx
        call assert_report('Error ' . engine . ': pat: \"' . pat
              \ . '\", text: \"' . text . '\", did not match, expected: \"'
              \ . t[matchidx] . '\"')
      elseif len(l) > 0 && len(t) == matchidx
        call assert_report('Error ' . engine . ': pat: \"' . pat
              \ . '\", text: \"' . text . '\", match: \"' . l[0]
              \ . '\", expected no match')
      elseif len(t) > matchidx && l[0] != t[matchidx]
        call assert_report('Error ' . engine . ': pat: \"' . pat
              \ . '\", text: \"' . text . '\", match: \"' . l[0]
              \ . '\", expected: \"' . t[matchidx] . '\"')
      else
        " Test passed
      endif

      " check all the nine submatches
      if len(l) > 0
        for i in range(1, 9)
          " Submatches not listed in the entry are expected to be empty.
          if len(t) <= matchidx + i
            let e = ''
          else
            let e = t[matchidx + i]
          endif
          if l[i] != e
            call assert_report('Error ' . engine . ': pat: \"' . pat
                  \ . '\", text: \"' . text . '\", submatch ' . i . ': \"'
                  \ . l[i] . '\", expected: \"' . e . '\"')
          endif
        endfor
        unlet i
      endif
    endfor
  endfor
  let &regexpengine = save_regexpengine
  unlet! t tl e l
endfunc
" Tests for multi-line regexp patterns without multi-byte support.
func Test_regexp_multiline_pat()
  " Runs ":%s/{pat}/XX/" for every table entry in a scratch buffer and
  " compares the resulting buffer lines with the expected lines.  The value
  " of 'regexpengine' is restored before returning, also when a step throws.
  "
  " tl is a List of Lists with:
  "    regexp engines to test
  "       0 - test with 'regexpengine' values 0 and 1
  "       1 - test with 'regexpengine' values 0 and 2
  "       2 - test with 'regexpengine' values 0, 1 and 2
  "    regexp pattern
  "    List with text to test the pattern on
  "    List with the expected match
  let tl = []

  " back references
  call add(tl, [2, '^.\(.\).\_..\1.', ['aaa', 'aaa', 'b'], ['XX', 'b']])
  call add(tl, [2, '\v.*\/(.*)\n.*\/\1$', ['./Dir1/Dir2/zyxwvuts.txt', './Dir1/Dir2/abcdefgh.bat', '', './Dir1/Dir2/file1.txt', './OtherDir1/OtherDir2/file1.txt'], ['./Dir1/Dir2/zyxwvuts.txt', './Dir1/Dir2/abcdefgh.bat', '', 'XX']])

  " line breaks
  call add(tl, [2, '\S.*\nx', ['abc', 'def', 'ghi', 'xjk', 'lmn'], ['abc', 'def', 'XXjk', 'lmn']])

  " Any single character or end-of-line
  call add(tl, [2, '\_.\+', ['a', 'b', 'c'], ['XX']])
  " Any identifier or end-of-line
  call add(tl, [2, '\_i\+', ['a', 'b', ';', '2'], ['XX;XX']])
  " Any identifier but excluding digits or end-of-line
  call add(tl, [2, '\_I\+', ['a', 'b', ';', '2'], ['XX;XX2XX']])
  " Any keyword or end-of-line
  call add(tl, [2, '\_k\+', ['a', 'b', '=', '2'], ['XX=XX']])
  " Any keyword but excluding digits or end-of-line
  call add(tl, [2, '\_K\+', ['a', 'b', '=', '2'], ['XX=XX2XX']])
  " Any filename character or end-of-line
  call add(tl, [2, '\_f\+', ['a', 'b', '.', '5'], ['XX']])
  " Any filename character but excluding digits or end-of-line
  call add(tl, [2, '\_F\+', ['a', 'b', '.', '5'], ['XX5XX']])
  " Any printable character or end-of-line
  call add(tl, [2, '\_p\+', ['a', 'b', '=', '4'], ['XX']])
  " Any printable character excluding digits or end-of-line
  call add(tl, [2, '\_P\+', ['a', 'b', '=', '4'], ['XX4XX']])
  " Any whitespace character or end-of-line
  call add(tl, [2, '\_s\+', [' ', ' ', 'a', 'b'], ['XXaXXbXX']])
  " Any non-whitespace character or end-of-line
  call add(tl, [2, '\_S\+', [' ', ' ', 'a', 'b'], [' XX XX']])
  " Any decimal digit or end-of-line
  call add(tl, [2, '\_d\+', ['1', 'a', '2', 'b', '3'], ['XXaXXbXX']])
  " Any non-decimal digit or end-of-line
  call add(tl, [2, '\_D\+', ['1', 'a', '2', 'b', '3'], ['1XX2XX3XX']])
  " Any hexadecimal digit or end-of-line
  call add(tl, [2, '\_x\+', ['1', 'a', 'g', '9', '8'], ['XXgXX']])
  " Any non-hexadecimal digit or end-of-line
  call add(tl, [2, '\_X\+', ['1', 'a', 'g', '9', '8'], ['1XXaXX9XX8XX']])
  " Any octal digit or end-of-line
  call add(tl, [2, '\_o\+', ['0', '7', '8', '9', '0'], ['XX8XX9XX']])
  " Any non-octal digit or end-of-line
  call add(tl, [2, '\_O\+', ['0', '7', '8', '9', '0'], ['0XX7XX0XX']])
  " Any word character or end-of-line
  call add(tl, [2, '\_w\+', ['A', 'B', '=', 'C', 'D'], ['XX=XX']])
  " Any non-word character or end-of-line
  call add(tl, [2, '\_W\+', ['A', 'B', '=', 'C', 'D'], ['AXXBXXCXXDXX']])
  " Any head-of-word character or end-of-line
  call add(tl, [2, '\_h\+', ['a', '1', 'b', '2', 'c'], ['XX1XX2XX']])
  " Any non-head-of-word character or end-of-line
  call add(tl, [2, '\_H\+', ['a', '1', 'b', '2', 'c'], ['aXXbXXcXX']])
  " Any alphabetic character or end-of-line
  call add(tl, [2, '\_a\+', ['a', '1', 'b', '2', 'c'], ['XX1XX2XX']])
  " Any non-alphabetic character or end-of-line
  call add(tl, [2, '\_A\+', ['a', '1', 'b', '2', 'c'], ['aXXbXXcXX']])
  " Any lowercase character or end-of-line
  call add(tl, [2, '\_l\+', ['a', 'A', 'b', 'B'], ['XXAXXBXX']])
  " Any non-lowercase character or end-of-line
  call add(tl, [2, '\_L\+', ['a', 'A', 'b', 'B'], ['aXXbXX']])
  " Any uppercase character or end-of-line
  call add(tl, [2, '\_u\+', ['a', 'A', 'b', 'B'], ['aXXbXX']])
  " Any non-uppercase character or end-of-line
  call add(tl, [2, '\_U\+', ['a', 'A', 'b', 'B'], ['XXAXXBXX']])
  " Collection or end-of-line
  call add(tl, [2, '\_[a-z]\+', ['a', 'A', 'b', 'B'], ['XXAXXBXX']])
  " start of line anywhere in the text
  call add(tl, [2, 'one\zs\_s*\_^\zetwo',
        \ ['', 'one', ' two', 'one', '', 'two'],
        \ ['', 'one', ' two', 'oneXXtwo']])
  " end of line anywhere in the text
  call add(tl, [2, 'one\zs\_$\_s*two',
        \ ['', 'one', ' two', 'one', '', 'two'], ['', 'oneXX', 'oneXX']])

  " Check that \_[0-9] matching EOL does not break a following \>
  call add(tl, [2, '\<\(\(25\_[0-5]\|2\_[0-4]\_[0-9]\|\_[01]\?\_[0-9]\_[0-9]\?\)\.\)\{3\}\(25\_[0-5]\|2\_[0-4]\_[0-9]\|\_[01]\?\_[0-9]\_[0-9]\?\)\>', ['', 'localnet/192.168.0.1', ''], ['', 'localnet/XX', '']])

  " Check a pattern with a line break and ^ and $
  call add(tl, [2, 'a\n^b$\n^c', ['a', 'b', 'c'], ['XX']])

  call add(tl, [2, '\(^.\+\n\)\1', [' dog', ' dog', 'asdf'], ['XXasdf']])

  " Run the multi-line tests
  let save_regexpengine = &regexpengine
  try
    for [re, pat, before, after] in tl
      for engine in [0, 1, 2]
        " Skip the engine that this entry excludes (see the table layout).
        if engine == 2 && re == 0 || engine == 1 && re == 1
          continue
        endif
        let &regexpengine = engine
        new
        try
          call setline(1, before)
          exe '%s/' . pat . '/XX/'
          let result = getline(1, '$')
        finally
          " Never leave the scratch buffer behind, even when :s fails.
          bwipe!
        endtry
        " Use !=# so that the comparison does not depend on 'ignorecase'.
        if result !=# after
          call assert_report('Error: pat: \"' . pat . '\", text: \"'
                \ . string(before) . '\", expected: \"' . string(after)
                \ . '\", got: \"' . string(result) . '\"')
        endif
      endfor
    endfor
  finally
    " Do not leak the last tested engine into the following tests.
    let &regexpengine = save_regexpengine
  endtry
endfunc
" Check that using a pattern on two lines doesn't get messed up by using
" matchstr() with \ze in between.
func Test_matchstr_with_ze()
  " A :substitute over two lines evaluates matchstr() with \ze in its
  " replacement expression; the outer pattern must keep working.
  let input = ['Substitute here:', '<T="">Ta 5</Title>', '<T="">Ac 7</Title>']
  " append(0, ...) keeps the initial empty line as the last buffer line.
  let expected = ['Substitute here:', '<T="5">Ta 5</Title>',
        \ '<T="7">Ac 7</Title>', '']

  new
  call append(0, input)
  call cursor(1, 1)
  set re=0
  .+1,.+2s/""/\='"' . matchstr(getline("."), '\d\+\ze<') . '"'
  call assert_equal(expected, getline(1, '$'))
  bwipe!
endfunc
" Check a pattern with a look behind crossing a line boundary
func Test_lookbehind_across_line()
  " The look-behind part of the pattern contains \_[xy], so it can span a
  " line break; the search is expected to stop on "start" in line 7.
  let text = ['Behind:', 'asdfasd<yyy', 'xxstart1', 'asdfasd<yy',
        \ 'xxxstart2', 'asdfasd<yy', 'xxstart3']
  let pattern = '\(<\_[xy]\+\)\@3<=start'

  new
  call append(0, text)
  call cursor(1, 1)
  call search(pattern)
  call assert_equal([0, 7, 3, 0], getpos('.'))
  bwipe!
endfunc
2022-07-15 01:26:35 -07:00
" Test for the \%V atom (match inside the visual area)
func Regex_Match_Visual_Area()
  " Works on the current buffer: inserts sample lines, substitutes inside
  " three different Visual selections using \%V, checks the result and
  " finally empties the buffer again.
  let input = ['Visual:', 'thexe the thexethe', 'andaxand andaxand',
        \ 'oooxofor foroxooo', 'oooxofor foroxooo']
  let expected = ['Visual:', 'thexE thE thExethe', 'AndAxAnd AndAxAnd',
        \ 'oooxOfOr fOrOxooo', 'oooxOfOr fOrOxooo', '']
  " One key sequence per selection mode: v, V and CTRL-V.
  let key_sequences = [
        \ "jfxvfx:s/\\%Ve/E/g\<CR>",
        \ "jV:s/\\%Va/A/g\<CR>",
        \ "jfx\<C-V>fxj:s/\\%Vo/O/g\<CR>",
        \ ]

  call append(0, input)
  call cursor(1, 1)
  for keys in key_sequences
    exe 'normal ' . keys
  endfor
  call assert_equal(expected, getline(1, '$'))
  %d
endfunc
" Check matching Visual area
func Test_matching_visual_area()
  " Run the \%V checks with 'regexpengine' set to 1 and then to 2, in one
  " scratch window; the option is reset to its default afterwards.
  new
  for engine in [1, 2]
    let &regexpengine = engine
    call Regex_Match_Visual_Area()
  endfor
  set regexpengine&
  bwipe!
endfunc
" Check matching marks
2022-07-15 01:26:35 -07:00
func Regex_Mark()
  " Works on the current buffer: inserts sample lines, sets the marks 's and
  " 'e with Normal mode commands and substitutes the text selected by the
  " \%>'s and \%<'e atoms, first within one line and then across two lines.
  " The buffer is emptied again before returning.
  let input = ['', '', '', 'Marks:', 'asdfSasdfsadfEasdf', 'asdfSas',
        \ 'dfsadfEasdf', '', '', '', '', '']
  let expected = ['', '', '', 'Marks:', 'asdfhereasdf', 'asdfagainasdf',
        \ '', '', '', '', '', '']
  let key_sequences = [
        \ "jfSmsfEme:.-4,.+6s/.\\%>'s.*\\%<'e../here/\<CR>",
        \ "jfSmsj0fEme:.-4,.+6s/.\\%>'s\\_.*\\%<'e../again/\<CR>",
        \ ]

  call append(0, input)
  call cursor(4, 1)
  for keys in key_sequences
    exe 'normal ' . keys
  endfor
  call assert_equal(expected, getline(1, '$'))
  %d
endfunc
func Test_matching_marks()
  " Run the mark-position checks with 'regexpengine' set to 1 and to 2.
  " The option is reset to its default afterwards so that the engine choice
  " does not leak into the tests that run after this one.
  new
  set regexpengine=1
  call Regex_Mark()
  set regexpengine=2
  call Regex_Mark()
  set regexpengine&
  bwipe!
endfunc
" Check patterns matching cursor position.
func s :curpos_test ( )
" Fill a scratch window with sample lines, run :substitute commands whose
" patterns are restricted by cursor, column, virtual column and line atoms,
" then compare the whole buffer with the expected text and wipe the buffer.
new
call setline ( 1 , ['ffooooo' , 'boboooo' , 'zoooooo' , 'koooooo' , 'moooooo' ,
\ "\t\t\tfoo" , 'abababababababfoo' , 'bababababababafoo' , '********_' ,
\ ' xxxxxxxxxxxx xxxx xxxxxx xxxxxxx x xxxxxxxxx xx xxxxxx xxxxxx xxxxx xxxxxxx xx xxxx xxxxxxxx xxxx xxxxxxxxxxx xxx xxxxxxx xxxxxxxxx xx xxxxxx xx xxxxxxx xxxxxxxxxxxxxxxx xxxxxxxxx xxx xxxxxxxx xxxxxxxxx xxxx xxx xxxx xxx xxx xxxxx xxxxxxxxxxxx xxxx xxxxxxxxx xxxxxxxxxxx xx xxxxx xxx xxxxxxxx xxxxxx xxx xxx xxxxxxxxx xxxxxxx x xxxxxxxxx xx xxxxxx xxxxxxx xxxxxxxxxxxxxxxxxx xxxxxxx xxxxxxx xxx xxx xxxxxxxx xxxxxxx xxxx xxx xxxxxx xxxxx xxxxx xx xxxxxx xxxxxxx xxx xxxxxxxxxxxx xxxx xxxxxxxxx xxxxxx xxxxxx xxxxx xxx xxxxxxx xxxxxxxxxxxxxxxx xxxxxxxxx xxxxxxxxxx xxxx xx xxxxxxxx xxx xxxxxxxxxxx xxxxx' ])
" Line 1: \%>3c only matches characters after column 3.
call setpos ( '.' , [0 , 1 , 0 , 0 ])
s /\%>3c./ /g
" Line 2, cursor in column 4: \%# anchors the match at the cursor position.
call setpos ( '.' , [0 , 2 , 4 , 0 ])
s /\%#.*$/ /g
" Line 3: \%<3c only matches characters before column 3.
call setpos ( '.' , [0 , 3 , 0 , 0 ])
s /\%<3c./ _ /g
" The following commands run on the whole buffer and select their target
" with line (\%l), column (\%c) and virtual column (\%v) atoms.
%s /\%4l\%>5c./ _ /g
%s /\%6l\%>25v./ _ /g
%s /\%>6l\%3c./ ! /g
%s /\%>7l\%12c./ ?/g
%s /\%>7l\%<9l\%>5v\%<8v./ #/g
" Last line only; the "e" flag suppresses the error when nothing matches.
$s /\%(|\u.*\)\@<=[^|\t]\+$/ /ge
call assert_equal ( ['ffo' , 'bob' , '__ooooo' , 'koooo__' , 'moooooo' ,
\ ' f__' , 'ab!babababababfoo' ,
\ 'ba!ab##abab?bafoo' , '**!*****_' ,
\ ' ! xxx?xxxxxxxx xxxx xxxxxx xxxxxxx x xxxxxxxxx xx xxxxxx xxxxxx xxxxx xxxxxxx xx xxxx xxxxxxxx xxxx xxxxxxxxxxx xxx xxxxxxx xxxxxxxxx xx xxxxxx xx xxxxxxx xxxxxxxxxxxxxxxx xxxxxxxxx xxx xxxxxxxx xxxxxxxxx xxxx xxx xxxx xxx xxx xxxxx xxxxxxxxxxxx xxxx xxxxxxxxx xxxxxxxxxxx xx xxxxx xxx xxxxxxxx xxxxxx xxx xxx xxxxxxxxx xxxxxxx x xxxxxxxxx xx xxxxxx xxxxxxx xxxxxxxxxxxxxxxxxx xxxxxxx xxxxxxx xxx xxx xxxxxxxx xxxxxxx xxxx xxx xxxxxx xxxxx xxxxx xx xxxxxx xxxxxxx xxx xxxxxxxxxxxx xxxx xxxxxxxxx xxxxxx xxxxxx xxxxx xxx xxxxxxx xxxxxxxxxxxxxxxx xxxxxxxxx xxxxxxxxxx xxxx xx xxxxxxxx xxx xxxxxxxxxxx xxxxx' ],
\ getline ( 1 , '$' ) )
bwipe !
endfunc
func Test_matching_curpos()
  " Repeat the cursor-position checks for 'regexpengine' 0, 1 and 2 and
  " reset the option to its default afterwards.
  for engine in range(3)
    exe 'set re=' . engine
    call s:curpos_test()
  endfor
  set re&
endfunc
" Test for matching the start and end of a buffer
2022-07-15 01:26:35 -07:00
func Regex_start_end_buffer()
  " Works on the current buffer: fills it with 20 identical lines, searches
  " with the \%^ (start of buffer) and \%$ (end of buffer) atoms and checks
  " where the cursor ends up.  The buffer is emptied before returning.
  call setline(1, repeat(['vim edit'], 20))

  /\%^
  call assert_equal([0, 1, 1, 0], getpos('.'))

  " Each entry: Normal mode keys to execute, expected cursor position.
  let cases = [
        \ ["50%/\\%^..\<CR>", [0, 1, 1, 0]],
        \ ["50%/\\%$\<CR>", [0, 20, 8, 0]],
        \ ["6gg/..\\%$\<CR>", [0, 20, 7, 0]],
        \ ]
  for [keys, expected_pos] in cases
    exe 'normal ' . keys
    call assert_equal(expected_pos, getpos('.'))
  endfor

  %d
endfunc
func Test_start_end_of_buffer_match()
  " Run the start/end-of-buffer checks with 'regexpengine' set to 1 and to
  " 2.  The option is reset to its default afterwards so that the engine
  " choice does not leak into the tests that run after this one.
  new
  set regexpengine=1
  call Regex_start_end_buffer()
  set regexpengine=2
  call Regex_start_end_buffer()
  set regexpengine&
  bwipe!
endfunc
2020-12-09 11:53:55 -07:00
func Test_ze_before_zs()
  " With \ze placed before \zs the match and all submatches are expected to
  " be empty, for both regexp engines (selected with \%#=1 and \%#=2).
  let engines = [1, 2]
  for engine in engines
    let pat = '\%#=' . engine . '\ze \zs'
    call assert_equal('', matchstr(' ', pat))
  endfor
  for engine in engines
    let pat = '\%#=' . engine . '\ze \zs'
    call assert_equal(repeat([''], 10), matchlist(' ', pat))
  endfor
endfunc
2019-12-15 08:57:43 -07:00
" Check for detecting error
func Test_regexp_error()
  " A multi (*) directly after \zs or \ze must fail with E888 in both
  " engines; nesting \%[ inside \%[ must fail with E369 in engine 1.
  for engine in [1, 2]
    for atom in ['zs', 'ze']
      let cmd = "call matchlist('x x', '\\%#=" . engine . " \\" . atom . "*')"
      call assert_fails(cmd, 'E888:')
    endfor
  endfor
  call assert_fails('exe "normal /\\%#=1\\%[x\\%[x]]\<CR>"', 'E369:')
endfunc
" Test for using the last substitute string pattern (~)
func Test_regexp_last_subst_string()
  " The ~ atom matches the last substitute string.  A :substitute with the
  " "e" flag (no error when "bar" is not found) sets that string to "baz";
  " both regexp engines must then find "baz" in the text.
  new
  s/bar/baz/e
  " assert_equal() takes the expected value first, so that a failure is
  " reported as "Expected 'baz' but got ...".
  call assert_equal("baz", matchstr("foo\nbaz\nbar", "\\%#=1\~"))
  call assert_equal("baz", matchstr("foo\nbaz\nbar", "\\%#=2\~"))
  close!
endfunc
2022-03-19 01:42:24 -07:00
" Check patterns matching cursor position.
func s :curpos_test2 ( )
" Checks the atoms that match AT the cursor position: \%.c (cursor column),
" \%.l (cursor line) and \%.v (cursor virtual column).  A scratch buffer with
" seven lines is filled, the cursor is placed with setpos() before each
" :substitute, and the resulting buffer is compared with the expected text.
new
2022-04-03 18:12:20 -07:00
call setline ( 1 , ['1' , '2 foobar eins zwei drei vier f<> nf sechse' ,
\ '3 foobar eins zwei drei vier f<> nf sechse' ,
\ '4 foobar eins zwei drei vier f<> nf sechse' ,
\ '5 foobar eins zwei drei vier f<> nf sechse' ,
\ '6 foobar eins zwei drei vier f<> nf sechse' ,
\ '7 foobar eins zwei drei vier f<> nf sechse' ])
2022-03-19 01:42:24 -07:00
" Line 2, column 10: substitute from the cursor column to the end of line.
call setpos ( '.' , [0 , 2 , 10 , 0 ])
s /\%.c.*/ /g
" Line 3: substitute everything in the cursor line.
call setpos ( '.' , [0 , 3 , 15 , 0 ])
s /\%.l.*/ /g
" Line 5, column 3: substitute from the cursor virtual column onwards.
call setpos ( '.' , [0 , 5 , 3 , 0 ])
s /\%.v.*/ _ /g
call assert_equal ( ['1' ,
\ '2 foobar ' ,
\ '' ,
2022-04-03 18:12:20 -07:00
\ '4 foobar eins zwei drei vier f<> nf sechse' ,
2022-03-19 01:42:24 -07:00
\ '5 _' ,
2022-04-03 18:12:20 -07:00
\ '6 foobar eins zwei drei vier f<> nf sechse' ,
\ '7 foobar eins zwei drei vier f<> nf sechse' ],
2022-03-19 01:42:24 -07:00
\ getline ( 1 , '$' ) )
" A number between the "." and the l/c/v letter is rejected with E1204.
call assert_fails ( 'call search("\\%.1l")' , 'E1204:' )
call assert_fails ( 'call search("\\%.1c")' , 'E1204:' )
call assert_fails ( 'call search("\\%.1v")' , 'E1204:' )
bwipe !
endfunc
" Check patterns matching before or after cursor position.
func s :curpos_test3 ( )
" Checks the atoms that match BEFORE or AFTER the cursor position:
" \%<.c / \%>.c (column), \%<.v / \%>.v (virtual column) and
" \%<.l / \%>.l (line).  The buffer is filled twice: the first round tests
" the column variants, the second round the line variants.
new
2022-04-03 18:12:20 -07:00
call setline ( 1 , ['1' , '2 foobar eins zwei drei vier f<> nf sechse' ,
\ '3 foobar eins zwei drei vier f<> nf sechse' ,
\ '4 foobar eins zwei drei vier f<> nf sechse' ,
\ '5 foobar eins zwei drei vier f<> nf sechse' ,
\ '6 foobar eins zwei drei vier f<> nf sechse' ,
\ '7 foobar eins zwei drei vier f<> nf sechse' ])
2022-03-19 01:42:24 -07:00
call setpos ( '.' , [0 , 2 , 10 , 0 ])
" Note: This removes all columns, except for the column directly in front of
" the cursor. Bug????
:s /^.*\%<.c/ /
" Line 3, column 10: substitute what comes after the cursor column.
call setpos ( '.' , [0 , 3 , 10 , 0 ])
:s /\%>.c.*$/ /
call setpos ( '.' , [0 , 5 , 4 , 0 ])
" Note: This removes all columns, except for the column directly in front of
" the cursor. Bug????
:s /^.*\%<.v/ _ /
" Line 6, column 4: substitute what comes after the cursor virtual column.
call setpos ( '.' , [0 , 6 , 4 , 0 ])
:s /\%>.v.*$/ _ /
call assert_equal ( ['1' ,
2022-04-03 18:12:20 -07:00
\ ' eins zwei drei vier f<> nf sechse' ,
2022-03-19 01:42:24 -07:00
\ '3 foobar e' ,
2022-04-03 18:12:20 -07:00
\ '4 foobar eins zwei drei vier f<> nf sechse' ,
\ '_foobar eins zwei drei vier f<> nf sechse' ,
2022-03-19 01:42:24 -07:00
\ '6 fo_' ,
2022-04-03 18:12:20 -07:00
\ '7 foobar eins zwei drei vier f<> nf sechse' ],
2022-03-19 01:42:24 -07:00
\ getline ( 1 , '$' ) )
" Second round: start again from an empty buffer with the same seven lines.
sil %d
2022-04-03 18:12:20 -07:00
call setline ( 1 , ['1' , '2 foobar eins zwei drei vier f<> nf sechse' ,
\ '3 foobar eins zwei drei vier f<> nf sechse' ,
\ '4 foobar eins zwei drei vier f<> nf sechse' ,
\ '5 foobar eins zwei drei vier f<> nf sechse' ,
\ '6 foobar eins zwei drei vier f<> nf sechse' ,
\ '7 foobar eins zwei drei vier f<> nf sechse' ])
2022-03-19 01:42:24 -07:00
" Cursor in line 4: substitute in the lines before the cursor line.
call setpos ( '.' , [0 , 4 , 4 , 0 ])
%s /\%<.l.*/ /
" Cursor in line 5: substitute in the lines after the cursor line.
call setpos ( '.' , [0 , 5 , 4 , 0 ])
%s /\%>.l.*/ /
call assert_equal ( ['' , '' , '' ,
2022-04-03 18:12:20 -07:00
\ '4 foobar eins zwei drei vier f<> nf sechse' ,
\ '5 foobar eins zwei drei vier f<> nf sechse' ,
2022-03-19 01:42:24 -07:00
\ '' , '' ],
\ getline ( 1 , '$' ) )
bwipe !
endfunc
" Test that matching below, at or after the
" cursor position work
func Test_matching_pos()
  " Run the "at cursor" and the "before/after cursor" checks once for each
  " 'regexpengine' value, then reset the option to its default.
  for engine in [0, 1, 2]
    let &regexpengine = engine
    " Match at cursor position
    call s:curpos_test2()
    " Match before or after cursor position
    call s:curpos_test3()
  endfor
  set regexpengine&
endfunc
2022-01-27 06:59:30 -07:00
func Test_using_mark_position()
  " this was using freed memory
  " The same scenario is run twice: first with the default (new) engine,
  " then with the old engine forced through \%#=1.  Both substitutes are
  " expected to fail with E486.
  let commands = ["s/\\%')", "s/\\%#=1\\%')"]
  for cmd in commands
    new
    norm O0
    call assert_fails(cmd, 'E486:')
    bwipe!
  endfor
endfunc
2022-03-10 01:40:45 -07:00
func Test_using_visual_position ( )
" this was using freed memory
" Crash reproducer: there are no assertions, the function only has to run
" to the end.  The Normal mode keys below prepare the buffer and a blockwise
" Visual selection before the \%V search is executed.
new
exe "norm 0o\<Esc>\<C-V>k\<C-X>o0"
" Search with the "inside the Visual area" atom.
/\%V
bwipe !
endfunc
2022-03-10 01:43:32 -07:00
func Test_using_invalid_visual_position ( )
" this was going beyond the end of the line
" Crash reproducer: there are no assertions, the function only has to run
" to the end.  The Normal mode keys below change the text after a blockwise
" Visual selection was made, then the \%V search is executed.
new
exe "norm 0o000\<Esc>0\<C-V>$s0"
" Search with the "inside the Visual area" atom.
/\%V
bwipe !
endfunc
2022-07-21 01:00:45 -07:00
func Test_recursive_substitute_expr ( )
" Reproducer without assertions: a :substitute whose replacement expression
" calls Repl(), which itself executes :s again.  The function only has to
" run to the end; errors of the outer command are suppressed with silent!.
new
" Helper used in the replacement expression; it runs a bare :s command.
func Repl ( )
s
endfunc
silent ! s /\%')/ ~ \= Repl ( )
bwipe !
" Remove the helper again so that it does not stay defined after the test.
delfunc Repl
endfunc
2019-12-15 08:57:43 -07:00
" vim: shiftwidth=2 sts=2 expandtab