summaryrefslogtreecommitdiffstats
path: root/src/testdir/test_regexp_latin.vim
diff options
context:
space:
mode:
authorDaniel Baumann <daniel.baumann@progress-linux.org>2024-04-10 20:09:20 +0000
committerDaniel Baumann <daniel.baumann@progress-linux.org>2024-04-10 20:09:20 +0000
commit029f72b1a93430b24b88eb3a72c6114d9f149737 (patch)
tree765d5c2041967f9c6fef195fe343d9234a030e90 /src/testdir/test_regexp_latin.vim
parentInitial commit. (diff)
downloadvim-029f72b1a93430b24b88eb3a72c6114d9f149737.tar.xz
vim-029f72b1a93430b24b88eb3a72c6114d9f149737.zip
Adding upstream version 2:9.1.0016.upstream/2%9.1.0016
Signed-off-by: Daniel Baumann <daniel.baumann@progress-linux.org>
Diffstat (limited to 'src/testdir/test_regexp_latin.vim')
-rw-r--r--src/testdir/test_regexp_latin.vim1163
1 files changed, 1163 insertions, 0 deletions
diff --git a/src/testdir/test_regexp_latin.vim b/src/testdir/test_regexp_latin.vim
new file mode 100644
index 0000000..9acb12b
--- /dev/null
+++ b/src/testdir/test_regexp_latin.vim
@@ -0,0 +1,1163 @@
+" Tests for regexp in latin1 encoding
+
+set encoding=latin1
+scriptencoding latin1
+
+source check.vim
+
+func s:equivalence_test()
+  " Each whitespace-separated word below is one group of characters that are
+  " expected to be equivalent to each other and to nothing outside the group.
+  let classes = split('AÀÁÂÃÄÅ B C D EÈÉÊË F G H IÌÍÎÏ J K L M NÑ OÒÓÔÕÖØ P Q R S T UÙÚÛÜ V W X YÝ Z '
+        \ .. 'aàáâãäå b c d eèéêë f g h iìíîï j k l m nñ oòóôõöø p q r s t uùúûü v w x yýÿ z '
+        \ .. "0 1 2 3 4 5 6 7 8 9 "
+        \ .. "` ~ ! ? ; : . , / \\ ' \" | < > [ ] { } ( ) @ # $ % ^ & * _ - + \b \e \f \n \r \t")
+  for members in classes
+    for ch in split(members, '\zs')
+      let eqclass = '[[=' .. ch .. '=]]'
+      " the equivalence class of this character must cover its whole group
+      call assert_match('^' .. eqclass .. '*$', members)
+      for other in classes
+        if other == members
+          continue
+        endif
+        " ... and must not match a single character of any other group
+        call assert_equal(-1, match(other, eqclass))
+      endfor
+    endfor
+  endfor
+endfunc
+
+func Test_equivalence_re1()
+  " Run the equivalence class checks with 'regexpengine' set to 1, then put
+  " the option back to 0.
+  let &regexpengine = 1
+  call s:equivalence_test()
+  let &regexpengine = 0
+endfunc
+
+func Test_equivalence_re2()
+  " Run the equivalence class checks with 'regexpengine' set to 2, then put
+  " the option back to 0.
+  let &regexpengine = 2
+  call s:equivalence_test()
+  let &regexpengine = 0
+endfunc
+
+func Test_recursive_substitute()
+ " Run a :substitute in a new window whose replacement expression itself
+ " executes another :substitute (with the "n" flag) through execute().
+ new
+ s/^/\=execute("s#^##gn")
+ " check we are now not in the sandbox
+ " NOTE(review): presumably setwinvar() would fail if the nested call had
+ " left the sandbox active - confirm.
+ call setwinvar(1, 'myvar', 1)
+ bwipe!
+endfunc
+
+func Test_nested_backrefs()
+  " The nested back-reference example from change.txt, run with every
+  " 'regexpengine' value through both :substitute and substitute().
+  let want = '-aa ab - -ab - -x-'
+  new
+  for engine in [0, 1, 2]
+    let &regexpengine = engine
+    call setline(1, 'aa ab x')
+    1s/\(\(a[a-d] \)*\)\(x\)/-\1- -\2- -\3-/
+    call assert_equal(want, getline(1))
+
+    let got = substitute('aa ab x', '\(\(a[a-d] \)*\)\(x\)', '-\1- -\2- -\3-', '')
+    call assert_equal(want, got)
+  endfor
+  bwipe!
+  let &regexpengine = 0
+endfunc
+
+func Test_eow_with_optional()
+  " An optional group ending in \> must produce the same ten-item
+  " matchlist() result with every 'regexpengine' value.
+  let want = ['abc def', 'abc', 'def'] + repeat([''], 7)
+  for engine in [0, 1, 2]
+    let &regexpengine = engine
+    call assert_equal(want, matchlist('abc def', '\(abc\>\)\?\s*\(def\)'))
+  endfor
+  let &regexpengine = 0
+endfunc
+
+func Test_backref()
+  " A back-reference placed after its group finds "ee" on line 3 with both
+  " engines; one placed inside the group it refers to fails with E65.
+  new
+  call setline(1, ['one', 'two', 'three', 'four', 'five'])
+  for engine in [1, 2]
+    call assert_equal(3, search('\%#=' .. engine .. '\(e\)\1'))
+  endfor
+  for engine in [1, 2]
+    let cmd = 'call search("\\%#=' .. engine .. '\\(e\\1\\)")'
+    call assert_fails(cmd, 'E65:')
+  endfor
+  bwipe!
+endfunc
+
+func Test_multi_failure()
+  " Invalid multi items must be rejected; the expected error for the first
+  " two patterns depends on the engine, the third is E554 for both.
+  let cases = [
+        \ [1, 'E61:', 'E62:'],
+        \ [2, 'E871:', 'E871:'],
+        \ ]
+  for [engine, star_err, plus_err] in cases
+    let &regexpengine = engine
+    call assert_fails('/a**', star_err)
+    call assert_fails('/a*\+', plus_err)
+    call assert_fails('/a\{a}', 'E554:')
+  endfor
+  let &regexpengine = 0
+endfunc
+
+func Test_column_success_failure()
+  " \%>0v. must match the first character with both engines, while column
+  " and line atoms written without a number must fail with the error that
+  " belongs to the engine in use.
+  new
+  call setline(1, 'xbar')
+
+  for [engine, repl, errnr] in [[1, 'A', 'E71:'], [2, 'B', 'E1273:']]
+    let &regexpengine = engine
+    exe '%s/\%>0v./' .. repl .. '/'
+    call assert_equal(repl .. 'bar', getline(1))
+    for atom in ['\%v', '\%>v', '\%c', '\%<c', '\%l']
+      call assert_fails('/' .. atom, errnr)
+    endfor
+  endfor
+
+  let &regexpengine = 0
+  bwipe!
+endfunc
+
+func Test_recursive_addstate()
+  " The nested counted empty groups make addstate() call itself until it
+  " runs into the limit; the search is expected to find nothing.
+  call assert_equal(0, search('\v((){328}){389}'))
+endfunc
+
+func Test_out_of_memory()
+  " Search in a scratch window for a pattern that is expected to be given up
+  " with E363.
+  new
+  s/^/,n
+  " This will be slow...
+  call assert_fails('call search("\\v((n||<)+);")', 'E363:')
+  " wipe the modified scratch buffer so it does not leak into later tests
+  bwipe!
+endfunc
+
+func Test_get_equi_class()
+  " Use the buffer line itself as the search pattern: an unterminated
+  " equivalence class ("[[=") and an unterminated collating element ("[[.")
+  " must both be found as literal text on line 1.
+  new
+  " Incomplete equivalence class caused invalid memory access
+  s/^/[[=
+  call assert_equal(1, search(getline(1)))
+  s/.*/[[.
+  call assert_equal(1, search(getline(1)))
+  " wipe the modified scratch buffer so it does not leak into later tests
+  bwipe!
+endfunc
+
+func Test_rex_init()
+  " With 'regexpengine' 1, [[:keyword:]] must follow the 'iskeyword' value of
+  " the buffer being searched, also when the same pattern was just used in a
+  " buffer with a different value.
+  let save_incsearch = &incsearch
+  set noincsearch
+  set re=1
+  new
+  setlocal iskeyword=a-z
+  call setline(1, ['abc', 'ABC'])
+  call assert_equal(1, search('[[:keyword:]]'))
+  new
+  setlocal iskeyword=A-Z
+  call setline(1, ['abc', 'ABC'])
+  call assert_equal(2, search('[[:keyword:]]'))
+  bwipe!
+  bwipe!
+  set re=0
+  " put 'incsearch' back the way the caller had it
+  let &incsearch = save_incsearch
+endfunc
+
+func Test_range_with_newline()
+  " Collections with a range that starts or ends at \n must not match the
+  " single "a" in the buffer.
+  new
+  call setline(1, "a")
+  for pat in ["[ -*\\n- ]", "[ -*\\t-\\n]"]
+    call assert_equal(0, search(pat))
+  endfor
+  bwipe!
+endfunc
+
+func Test_pattern_compile_speed()
+  " Setting 'spellcapcheck' to a deeply nested pattern must finish within
+  " the asserted time window.
+  CheckOption spellcapcheck
+  CheckFunction reltimefloat
+
+  let began = reltime()
+  " this used to be very slow, now it should be about a second
+  set spc=\\v(((((Nxxxxxxx&&xxxx){179})+)+)+){179}
+  let elapsed = reltimefloat(reltime(began))
+  call assert_inrange(0.01, 10.0, elapsed)
+  set spc=
+endfunc
+
+" Tests for regexp patterns without multi-byte support.
+func Test_regexp_single_line_pat()
+ " Table-driven test: every entry of tl is run through matchlist() with the
+ " selected 'regexpengine' values and the result is compared with the
+ " expected match and submatches.
+ "
+ " tl is a List of Lists with:
+ " regexp engines to test
+ " 0 - test with 'regexpengine' values 0 and 1
+ " 1 - test with 'regexpengine' values 0 and 2
+ " 2 - test with 'regexpengine' values 0, 1 and 2
+ " regexp pattern
+ " text to test the pattern on
+ " expected match (optional)
+ " expected submatch 1 (optional)
+ " expected submatch 2 (optional)
+ " etc.
+ " When there is no match use only the first three items (engines, pattern
+ " and text).
+ let tl = []
+
+ call add(tl, [2, 'ab', 'aab', 'ab'])
+ call add(tl, [2, 'b', 'abcdef', 'b'])
+ call add(tl, [2, 'bc*', 'abccccdef', 'bcccc'])
+ call add(tl, [2, 'bc\{-}', 'abccccdef', 'b'])
+ call add(tl, [2, 'bc\{-}\(d\)', 'abccccdef', 'bccccd', 'd'])
+ call add(tl, [2, 'bc*', 'abbdef', 'b'])
+ call add(tl, [2, 'c*', 'ccc', 'ccc'])
+ call add(tl, [2, 'bc*', 'abdef', 'b'])
+ call add(tl, [2, 'c*', 'abdef', ''])
+ call add(tl, [2, 'bc\+', 'abccccdef', 'bcccc'])
+ call add(tl, [2, 'bc\+', 'abdef']) " no match
+ " match escape character in a string
+ call add(tl, [2, '.\e.', "one\<Esc>two", "e\<Esc>t"])
+ " match backspace character in a string
+ call add(tl, [2, '.\b.', "one\<C-H>two", "e\<C-H>t"])
+ " match newline character in a string
+ call add(tl, [2, 'o\nb', "foo\nbar", "o\nb"])
+
+ " operator \|
+ call add(tl, [2, 'a\|ab', 'cabd', 'a']) " alternation is ordered
+
+ call add(tl, [2, 'c\?', 'ccb', 'c'])
+ call add(tl, [2, 'bc\?', 'abd', 'b'])
+ call add(tl, [2, 'bc\?', 'abccd', 'bc'])
+
+ call add(tl, [2, '\va{1}', 'ab', 'a'])
+
+ call add(tl, [2, '\va{2}', 'aa', 'aa'])
+ call add(tl, [2, '\va{2}', 'caad', 'aa'])
+ call add(tl, [2, '\va{2}', 'aba'])
+ call add(tl, [2, '\va{2}', 'ab'])
+ call add(tl, [2, '\va{2}', 'abaa', 'aa'])
+ call add(tl, [2, '\va{2}', 'aaa', 'aa'])
+
+ call add(tl, [2, '\vb{1}', 'abca', 'b'])
+ call add(tl, [2, '\vba{2}', 'abaa', 'baa'])
+ call add(tl, [2, '\vba{3}', 'aabaac'])
+
+ call add(tl, [2, '\v(ab){1}', 'ab', 'ab', 'ab'])
+ call add(tl, [2, '\v(ab){1}', 'dabc', 'ab', 'ab'])
+ call add(tl, [2, '\v(ab){1}', 'acb'])
+
+ call add(tl, [2, '\v(ab){0,2}', 'acb', "", ""])
+ call add(tl, [2, '\v(ab){0,2}', 'ab', 'ab', 'ab'])
+ call add(tl, [2, '\v(ab){1,2}', 'ab', 'ab', 'ab'])
+ call add(tl, [2, '\v(ab){1,2}', 'ababc', 'abab', 'ab'])
+ call add(tl, [2, '\v(ab){2,4}', 'ababcab', 'abab', 'ab'])
+ call add(tl, [2, '\v(ab){2,4}', 'abcababa', 'abab', 'ab'])
+
+ call add(tl, [2, '\v(ab){2}', 'abab', 'abab', 'ab'])
+ call add(tl, [2, '\v(ab){2}', 'cdababe', 'abab', 'ab'])
+ call add(tl, [2, '\v(ab){2}', 'abac'])
+ call add(tl, [2, '\v(ab){2}', 'abacabab', 'abab', 'ab'])
+ call add(tl, [2, '\v((ab){2}){2}', 'abababab', 'abababab', 'abab', 'ab'])
+ call add(tl, [2, '\v((ab){2}){2}', 'abacabababab', 'abababab', 'abab', 'ab'])
+
+ call add(tl, [2, '\v(a{1}){1}', 'a', 'a', 'a'])
+ call add(tl, [2, '\v(a{2}){1}', 'aa', 'aa', 'aa'])
+ call add(tl, [2, '\v(a{2}){1}', 'aaac', 'aa', 'aa'])
+ call add(tl, [2, '\v(a{2}){1}', 'daaac', 'aa', 'aa'])
+ call add(tl, [2, '\v(a{1}){2}', 'daaac', 'aa', 'a'])
+ call add(tl, [2, '\v(a{1}){2}', 'aaa', 'aa', 'a'])
+ call add(tl, [2, '\v(a{2})+', 'adaac', 'aa', 'aa'])
+ call add(tl, [2, '\v(a{2})+', 'aa', 'aa', 'aa'])
+ call add(tl, [2, '\v(a{2}){1}', 'aa', 'aa', 'aa'])
+ call add(tl, [2, '\v(a{1}){2}', 'aa', 'aa', 'a'])
+ call add(tl, [2, '\v(a{1}){1}', 'a', 'a', 'a'])
+ call add(tl, [2, '\v(a{2}){2}', 'aaaa', 'aaaa', 'aa'])
+ call add(tl, [2, '\v(a{2}){2}', 'aaabaaaa', 'aaaa', 'aa'])
+
+ call add(tl, [2, '\v(a+){2}', 'dadaac', 'aa', 'a'])
+ call add(tl, [2, '\v(a{3}){2}', 'aaaaaaa', 'aaaaaa', 'aaa'])
+
+ call add(tl, [2, '\v(a{1,2}){2}', 'daaac', 'aaa', 'a'])
+ call add(tl, [2, '\v(a{1,3}){2}', 'daaaac', 'aaaa', 'a'])
+ call add(tl, [2, '\v(a{1,3}){2}', 'daaaaac', 'aaaaa', 'aa'])
+ call add(tl, [2, '\v(a{1,3}){3}', 'daac'])
+ call add(tl, [2, '\v(a{1,2}){2}', 'dac'])
+ call add(tl, [2, '\v(a+)+', 'daac', 'aa', 'aa'])
+ call add(tl, [2, '\v(a+)+', 'aaa', 'aaa', 'aaa'])
+ call add(tl, [2, '\v(a+){1,2}', 'aaa', 'aaa', 'aaa'])
+ call add(tl, [2, '\v(a+)(a+)', 'aaa', 'aaa', 'aa', 'a'])
+ call add(tl, [2, '\v(a{3})+', 'daaaac', 'aaa', 'aaa'])
+ call add(tl, [2, '\v(a|b|c)+', 'aacb', 'aacb', 'b'])
+ call add(tl, [2, '\v(a|b|c){2}', 'abcb', 'ab', 'b'])
+ call add(tl, [2, '\v(abc){2}', 'abcabd', ])
+ call add(tl, [2, '\v(abc){2}', 'abdabcabc','abcabc', 'abc'])
+
+ call add(tl, [2, 'a*', 'cc', ''])
+ call add(tl, [2, '\v(a*)+', 'cc', ''])
+ call add(tl, [2, '\v((ab)+)+', 'ab', 'ab', 'ab', 'ab'])
+ call add(tl, [2, '\v(((ab)+)+)+', 'ab', 'ab', 'ab', 'ab', 'ab'])
+ call add(tl, [2, '\v(((ab)+)+)+', 'dababc', 'abab', 'abab', 'abab', 'ab'])
+ call add(tl, [2, '\v(a{0,2})+', 'cc', ''])
+ call add(tl, [2, '\v(a*)+', '', ''])
+ call add(tl, [2, '\v((a*)+)+', '', ''])
+ call add(tl, [2, '\v((ab)*)+', '', ''])
+ call add(tl, [2, '\va{1,3}', 'aab', 'aa'])
+ call add(tl, [2, '\va{2,3}', 'abaa', 'aa'])
+
+ call add(tl, [2, '\v((ab)+|c*)+', 'abcccaba', 'abcccab', '', 'ab'])
+ call add(tl, [2, '\v(a{2})|(b{3})', 'bbabbbb', 'bbb', '', 'bbb'])
+ call add(tl, [2, '\va{2}|b{2}', 'abab'])
+ call add(tl, [2, '\v(a)+|(c)+', 'bbacbaacbbb', 'a', 'a'])
+ call add(tl, [2, '\vab{2,3}c', 'aabbccccccccccccc', 'abbc'])
+ call add(tl, [2, '\vab{2,3}c', 'aabbbccccccccccccc', 'abbbc'])
+ call add(tl, [2, '\vab{2,3}cd{2,3}e', 'aabbbcddee', 'abbbcdde'])
+ call add(tl, [2, '\va(bc){2}d', 'aabcbfbc' ])
+ call add(tl, [2, '\va*a{2}', 'a', ])
+ call add(tl, [2, '\va*a{2}', 'aa', 'aa' ])
+ call add(tl, [2, '\va*a{2}', 'aaa', 'aaa' ])
+ call add(tl, [2, '\va*a{2}', 'bbbabcc', ])
+ call add(tl, [2, '\va*b*|a*c*', 'a', 'a'])
+ call add(tl, [2, '\va{1}b{1}|a{1}b{1}', ''])
+
+ " submatches
+ call add(tl, [2, '\v(a)', 'ab', 'a', 'a'])
+ call add(tl, [2, '\v(a)(b)', 'ab', 'ab', 'a', 'b'])
+ call add(tl, [2, '\v(ab)(b)(c)', 'abbc', 'abbc', 'ab', 'b', 'c'])
+ call add(tl, [2, '\v((a)(b))', 'ab', 'ab', 'ab', 'a', 'b'])
+ call add(tl, [2, '\v(a)|(b)', 'ab', 'a', 'a'])
+
+ call add(tl, [2, '\v(a*)+', 'aaaa', 'aaaa', ''])
+ call add(tl, [2, 'x', 'abcdef'])
+
+ "
+ " Simple tests
+ "
+
+ " Search single groups
+ call add(tl, [2, 'ab', 'aab', 'ab'])
+ call add(tl, [2, 'ab', 'baced'])
+ call add(tl, [2, 'ab', ' ab ', 'ab'])
+
+ " Search multi-modifiers
+ call add(tl, [2, 'x*', 'xcd', 'x'])
+ call add(tl, [2, 'x*', 'xxxxxxxxxxxxxxxxsofijiojgf', 'xxxxxxxxxxxxxxxx'])
+ " empty match is good
+ call add(tl, [2, 'x*', 'abcdoij', ''])
+ " no match here
+ call add(tl, [2, 'x\+', 'abcdoin'])
+ call add(tl, [2, 'x\+', 'abcdeoijdfxxiuhfij', 'xx'])
+ call add(tl, [2, 'x\+', 'xxxxx', 'xxxxx'])
+ call add(tl, [2, 'x\+', 'abc x siufhiush xxxxxxxxx', 'x'])
+ call add(tl, [2, 'x\=', 'x sdfoij', 'x'])
+ call add(tl, [2, 'x\=', 'abc sfoij', '']) " empty match is good
+ call add(tl, [2, 'x\=', 'xxxxxxxxx c', 'x'])
+ call add(tl, [2, 'x\?', 'x sdfoij', 'x'])
+ " empty match is good
+ call add(tl, [2, 'x\?', 'abc sfoij', ''])
+ call add(tl, [2, 'x\?', 'xxxxxxxxxx c', 'x'])
+
+ call add(tl, [2, 'a\{0,0}', 'abcdfdoij', ''])
+ " same thing as 'a?'
+ call add(tl, [2, 'a\{0,1}', 'asiubid axxxaaa', 'a'])
+ " same thing as 'a\{0,1}'
+ call add(tl, [2, 'a\{1,0}', 'asiubid axxxaaa', 'a'])
+ call add(tl, [2, 'a\{3,6}', 'aa siofuh'])
+ call add(tl, [2, 'a\{3,6}', 'aaaaa asfoij afaa', 'aaaaa'])
+ call add(tl, [2, 'a\{3,6}', 'aaaaaaaa', 'aaaaaa'])
+ call add(tl, [2, 'a\{0}', 'asoiuj', ''])
+ call add(tl, [2, 'a\{2}', 'aaaa', 'aa'])
+ call add(tl, [2, 'a\{2}', 'iuash fiusahfliusah fiushfilushfi uhsaifuh askfj nasfvius afg aaaa sfiuhuhiushf', 'aa'])
+ call add(tl, [2, 'a\{2}', 'abcdefghijklmnopqrestuvwxyz1234567890'])
+ " same thing as 'a*'
+ call add(tl, [2, 'a\{0,}', 'oij sdigfusnf', ''])
+ call add(tl, [2, 'a\{0,}', 'aaaaa aa', 'aaaaa'])
+ call add(tl, [2, 'a\{2,}', 'sdfiougjdsafg'])
+ call add(tl, [2, 'a\{2,}', 'aaaaasfoij ', 'aaaaa'])
+ call add(tl, [2, 'a\{5,}', 'xxaaaaxxx '])
+ call add(tl, [2, 'a\{5,}', 'xxaaaaaxxx ', 'aaaaa'])
+ call add(tl, [2, 'a\{,0}', 'oidfguih iuhi hiu aaaa', ''])
+ call add(tl, [2, 'a\{,5}', 'abcd', 'a'])
+ call add(tl, [2, 'a\{,5}', 'aaaaaaaaaa', 'aaaaa'])
+ " leading star as normal char when \{} follows
+ call add(tl, [2, '^*\{4,}$', '***'])
+ call add(tl, [2, '^*\{4,}$', '****', '****'])
+ call add(tl, [2, '^*\{4,}$', '*****', '*****'])
+ " same thing as 'a*'
+ call add(tl, [2, 'a\{}', 'bbbcddiuhfcd', ''])
+ call add(tl, [2, 'a\{}', 'aaaaioudfh coisf jda', 'aaaa'])
+
+ call add(tl, [2, 'a\{-0,0}', 'abcdfdoij', ''])
+ " anti-greedy version of 'a?'
+ call add(tl, [2, 'a\{-0,1}', 'asiubid axxxaaa', ''])
+ call add(tl, [2, 'a\{-3,6}', 'aa siofuh'])
+ call add(tl, [2, 'a\{-3,6}', 'aaaaa asfoij afaa', 'aaa'])
+ call add(tl, [2, 'a\{-3,6}', 'aaaaaaaa', 'aaa'])
+ call add(tl, [2, 'a\{-0}', 'asoiuj', ''])
+ call add(tl, [2, 'a\{-2}', 'aaaa', 'aa'])
+ call add(tl, [2, 'a\{-2}', 'abcdefghijklmnopqrestuvwxyz1234567890'])
+ call add(tl, [2, 'a\{-0,}', 'oij sdigfusnf', ''])
+ call add(tl, [2, 'a\{-0,}', 'aaaaa aa', ''])
+ call add(tl, [2, 'a\{-2,}', 'sdfiougjdsafg'])
+ call add(tl, [2, 'a\{-2,}', 'aaaaasfoij ', 'aa'])
+ call add(tl, [2, 'a\{-,0}', 'oidfguih iuhi hiu aaaa', ''])
+ call add(tl, [2, 'a\{-,5}', 'abcd', ''])
+ call add(tl, [2, 'a\{-,5}', 'aaaaaaaaaa', ''])
+ " anti-greedy version of 'a*'
+ call add(tl, [2, 'a\{-}', 'bbbcddiuhfcd', ''])
+ call add(tl, [2, 'a\{-}', 'aaaaioudfh coisf jda', ''])
+
+ " Test groups of characters and submatches
+ call add(tl, [2, '\(abc\)*', 'abcabcabc', 'abcabcabc', 'abc'])
+ call add(tl, [2, '\(ab\)\+', 'abababaaaaa', 'ababab', 'ab'])
+ call add(tl, [2, '\(abaaaaa\)*cd', 'cd', 'cd', ''])
+ call add(tl, [2, '\(test1\)\? \(test2\)\?', 'test1 test3', 'test1 ', 'test1', ''])
+ call add(tl, [2, '\(test1\)\= \(test2\) \(test4443\)\=', ' test2 test4443 yupiiiiiiiiiii', ' test2 test4443', '', 'test2', 'test4443'])
+ call add(tl, [2, '\(\(sub1\) hello \(sub 2\)\)', 'asterix sub1 hello sub 2 obelix', 'sub1 hello sub 2', 'sub1 hello sub 2', 'sub1', 'sub 2'])
+ call add(tl, [2, '\(\(\(yyxxzz\)\)\)', 'abcdddsfiusfyyzzxxyyxxzz', 'yyxxzz', 'yyxxzz', 'yyxxzz', 'yyxxzz'])
+ call add(tl, [2, '\v((ab)+|c+)+', 'abcccaba', 'abcccab', 'ab', 'ab'])
+ call add(tl, [2, '\v((ab)|c*)+', 'abcccaba', 'abcccab', '', 'ab'])
+ call add(tl, [2, '\v(a(c*)+b)+', 'acbababaaa', 'acbabab', 'ab', ''])
+ call add(tl, [2, '\v(a|b*)+', 'aaaa', 'aaaa', ''])
+ call add(tl, [2, '\p*', 'aá ', 'aá '])
+
+ " Test greedy-ness and lazy-ness
+ call add(tl, [2, 'a\{-2,7}','aaaaaaaaaaaaa', 'aa'])
+ call add(tl, [2, 'a\{-2,7}x','aaaaaaaaax', 'aaaaaaax'])
+ call add(tl, [2, 'a\{2,7}','aaaaaaaaaaaaaaaaaaaa', 'aaaaaaa'])
+ call add(tl, [2, 'a\{2,7}x','aaaaaaaaax', 'aaaaaaax'])
+ call add(tl, [2, '\vx(.{-,8})yz(.*)','xayxayzxayzxayz','xayxayzxayzxayz','ayxa','xayzxayz'])
+ call add(tl, [2, '\vx(.*)yz(.*)','xayxayzxayzxayz','xayxayzxayzxayz', 'ayxayzxayzxa',''])
+ call add(tl, [2, '\v(a{1,2}){-2,3}','aaaaaaa','aaaa','aa'])
+ call add(tl, [2, '\v(a{-1,3})+', 'aa', 'aa', 'a'])
+ call add(tl, [2, '^\s\{-}\zs\( x\|x$\)', ' x', ' x', ' x'])
+ call add(tl, [2, '^\s\{-}\zs\(x\| x$\)', ' x', ' x', ' x'])
+ call add(tl, [2, '^\s\{-}\ze\(x\| x$\)', ' x', '', ' x'])
+ call add(tl, [2, '^\(\s\{-}\)\(x\| x$\)', ' x', ' x', '', ' x'])
+
+ " Test Character classes
+ call add(tl, [2, '\d\+e\d\d','test 10e23 fd','10e23'])
+
+ " Test collections and character range []
+ call add(tl, [2, '\v[a]', 'abcd', 'a'])
+ call add(tl, [2, 'a[bcd]', 'abcd', 'ab'])
+ call add(tl, [2, 'a[b-d]', 'acbd', 'ac'])
+ call add(tl, [2, '[a-d][e-f][x-x]d', 'cexdxx', 'cexd'])
+ call add(tl, [2, '\v[[:alpha:]]+', 'abcdefghijklmnopqrstuvwxyz6','abcdefghijklmnopqrstuvwxyz'])
+ call add(tl, [2, '[[:alpha:]\+]', '6x8','x'])
+ call add(tl, [2, '[^abc]\+','abcabcabc'])
+ call add(tl, [2, '[^abc]','defghiasijvoinasoiunbvb','d'])
+ call add(tl, [2, '[^abc]\+','ddddddda','ddddddd'])
+ call add(tl, [2, '[^a-d]\+','aaaAAAZIHFNCddd','AAAZIHFNC'])
+ call add(tl, [2, '[a-f]*','iiiiiiii',''])
+ call add(tl, [2, '[a-f]*','abcdefgh','abcdef'])
+ call add(tl, [2, '[^a-f]\+','abcdefgh','gh'])
+ call add(tl, [2, '[a-c]\{-3,6}','abcabc','abc'])
+ call add(tl, [2, '[^[:alpha:]]\+','abcccadfoij7787ysf287yrnccdu','7787'])
+ call add(tl, [2, '[-a]', '-', '-'])
+ call add(tl, [2, '[a-]', '-', '-'])
+ call add(tl, [2, '[a-f]*\c','ABCDEFGH','ABCDEF'])
+ call add(tl, [2, '[abc][xyz]\c','-af-AF-BY--','BY'])
+ " filename regexp
+ call add(tl, [2, '[-./[:alnum:]_~]\+', 'log13.file', 'log13.file'])
+ " special chars
+ call add(tl, [2, '[\]\^\-\\]\+', '\^\\\-\---^', '\^\\\-\---^'])
+ " collation elem
+ call add(tl, [2, '[[.a.]]\+', 'aa', 'aa'])
+ " middle of regexp
+ call add(tl, [2, 'abc[0-9]*ddd', 'siuhabc ii'])
+ call add(tl, [2, 'abc[0-9]*ddd', 'adf abc44482ddd oijs', 'abc44482ddd'])
+ call add(tl, [2, '\_[0-9]\+', 'asfi9888u', '9888'])
+ call add(tl, [2, '[0-9\n]\+', 'asfi9888u', '9888'])
+ call add(tl, [2, '\_[0-9]\+', "asfi\n9888u", "\n9888"])
+ call add(tl, [2, '\_f', " \na ", "\n"])
+ call add(tl, [2, '\_f\+', " \na ", "\na"])
+ call add(tl, [2, '[0-9A-Za-z-_.]\+', " @0_a.A-{ ", "0_a.A-"])
+
+ " Test start/end of line, start/end of file
+ call add(tl, [2, '^a.', "a_\nb ", "a_"])
+ call add(tl, [2, '^a.', "b a \na_"])
+ call add(tl, [2, '.a$', " a\n "])
+ call add(tl, [2, '.a$', " a b\n_a", "_a"])
+ call add(tl, [2, '\%^a.', "a a\na", "a "])
+ call add(tl, [2, '\%^a', " a \na "])
+ call add(tl, [2, '.a\%$', " a\n "])
+ call add(tl, [2, '.a\%$', " a\n_a", "_a"])
+
+ " Test recognition of character classes
+ call add(tl, [2, '[0-7]\+', 'x0123456789x', '01234567'])
+ call add(tl, [2, '[^0-7]\+', '0a;X+% 897', 'a;X+% 89'])
+ call add(tl, [2, '[0-9]\+', 'x0123456789x', '0123456789'])
+ call add(tl, [2, '[^0-9]\+', '0a;X+% 9', 'a;X+% '])
+ call add(tl, [2, '[0-9a-fA-F]\+', 'x0189abcdefg', '0189abcdef'])
+ call add(tl, [2, '[^0-9A-Fa-f]\+', '0189g;X+% ab', 'g;X+% '])
+ call add(tl, [2, '[a-z_A-Z0-9]\+', ';+aso_SfOij ', 'aso_SfOij'])
+ call add(tl, [2, '[^a-z_A-Z0-9]\+', 'aSo_;+% sfOij', ';+% '])
+ call add(tl, [2, '[a-z_A-Z]\+', '0abyz_ABYZ;', 'abyz_ABYZ'])
+ call add(tl, [2, '[^a-z_A-Z]\+', 'abAB_09;+% yzYZ', '09;+% '])
+ call add(tl, [2, '[a-z]\+', '0abcxyz1', 'abcxyz'])
+ call add(tl, [2, '[a-z]\+', 'AabxyzZ', 'abxyz'])
+ call add(tl, [2, '[^a-z]\+', 'a;X09+% x', ';X09+% '])
+ call add(tl, [2, '[^a-z]\+', 'abX0;%yz', 'X0;%'])
+ call add(tl, [2, '[a-zA-Z]\+', '0abABxzXZ9', 'abABxzXZ'])
+ call add(tl, [2, '[^a-zA-Z]\+', 'ab09_;+ XZ', '09_;+ '])
+ call add(tl, [2, '[A-Z]\+', 'aABXYZz', 'ABXYZ'])
+ call add(tl, [2, '[^A-Z]\+', 'ABx0;%YZ', 'x0;%'])
+ call add(tl, [2, '[a-z]\+\c', '0abxyzABXYZ;', 'abxyzABXYZ'])
+ call add(tl, [2, '[A-Z]\+\c', '0abABxzXZ9', 'abABxzXZ'])
+ call add(tl, [2, '\c[^a-z]\+', 'ab09_;+ XZ', '09_;+ '])
+ call add(tl, [2, '\c[^A-Z]\+', 'ab09_;+ XZ', '09_;+ '])
+ call add(tl, [2, '\C[^A-Z]\+', 'ABCOIJDEOIFNSD jsfoij sa', ' jsfoij sa'])
+
+ " Tests for \z features
+ " match ends at \ze
+ call add(tl, [2, 'xx \ze test', 'xx '])
+ call add(tl, [2, 'abc\zeend', 'oij abcend', 'abc'])
+ call add(tl, [2, 'aa\zebb\|aaxx', ' aabb ', 'aa'])
+ call add(tl, [2, 'aa\zebb\|aaxx', ' aaxx ', 'aaxx'])
+ call add(tl, [2, 'aabb\|aa\zebb', ' aabb ', 'aabb'])
+ call add(tl, [2, 'aa\zebb\|aaebb', ' aabb ', 'aa'])
+ " match starts at \zs
+ call add(tl, [2, 'abc\zsdd', 'ddabcddxyzt', 'dd'])
+ call add(tl, [2, 'aa \zsax', ' ax'])
+ call add(tl, [2, 'abc \zsmatch\ze abc', 'abc abc abc match abc abc', 'match'])
+ call add(tl, [2, '\v(a \zsif .*){2}', 'a if then a if last', 'if last', 'a if last'])
+ call add(tl, [2, '\>\zs.', 'aword. ', '.'])
+ " the text needs two consecutive blanks, otherwise neither branch can match
+ call add(tl, [2, '\s\+\ze\[/\|\s\zs\s\+', 'is  [a t', ' '])
+
+ " Tests for \@= and \& features
+ call add(tl, [2, 'abc\@=', 'abc', 'ab'])
+ call add(tl, [2, 'abc\@=cd', 'abcd', 'abcd'])
+ call add(tl, [2, 'abc\@=', 'ababc', 'ab'])
+ " will never match, no matter the input text
+ call add(tl, [2, 'abcd\@=e', 'abcd'])
+ " will never match
+ call add(tl, [2, 'abcd\@=e', 'any text in here ... '])
+ call add(tl, [2, '\v(abc)@=..', 'xabcd', 'ab', 'abc'])
+ call add(tl, [2, '\(.*John\)\@=.*Bob', 'here is John, and here is B'])
+ call add(tl, [2, '\(John.*\)\@=.*Bob', 'John is Bobs friend', 'John is Bob', 'John is Bobs friend'])
+ call add(tl, [2, '\<\S\+\())\)\@=', '$((i=i+1))', 'i=i+1', '))'])
+ call add(tl, [2, '.*John\&.*Bob', 'here is John, and here is B'])
+ call add(tl, [2, '.*John\&.*Bob', 'John is Bobs friend', 'John is Bob'])
+ call add(tl, [2, '\v(test1)@=.*yep', 'this is a test1, yep it is', 'test1, yep', 'test1'])
+ call add(tl, [2, 'foo\(bar\)\@!', 'foobar'])
+ call add(tl, [2, 'foo\(bar\)\@!', 'foo bar', 'foo'])
+ call add(tl, [2, 'if \(\(then\)\@!.\)*$', ' if then else'])
+ call add(tl, [2, 'if \(\(then\)\@!.\)*$', ' if else ', 'if else ', ' '])
+ call add(tl, [2, '\(foo\)\@!bar', 'foobar', 'bar'])
+ call add(tl, [2, '\(foo\)\@!...bar', 'foobar'])
+ call add(tl, [2, '^\%(.*bar\)\@!.*\zsfoo', ' bar foo '])
+ call add(tl, [2, '^\%(.*bar\)\@!.*\zsfoo', ' foo bar '])
+ call add(tl, [2, '^\%(.*bar\)\@!.*\zsfoo', ' foo xxx ', 'foo'])
+ call add(tl, [2, '[ ]\@!\p\%([ ]\@!\p\)*:', 'implicit mappings:', 'mappings:'])
+ call add(tl, [2, '[ ]\@!\p\([ ]\@!\p\)*:', 'implicit mappings:', 'mappings:', 's'])
+ call add(tl, [2, 'm\k\+_\@=\%(_\@!\k\)\@<=\k\+e', 'mx__xe', 'mx__xe'])
+ call add(tl, [2, '\%(\U\@<=S\k*\|S\l\)R', 'SuR', 'SuR'])
+
+ " Combining different tests and features
+ call add(tl, [2, '[[:alpha:]]\{-2,6}', '787abcdiuhsasiuhb4', 'ab'])
+ call add(tl, [2, '', 'abcd', ''])
+ call add(tl, [2, '\v(())', 'any possible text', ''])
+ call add(tl, [2, '\v%(ab(xyz)c)', ' abxyzc ', 'abxyzc', 'xyz'])
+ call add(tl, [2, '\v(test|)empty', 'tesempty', 'empty', ''])
+ call add(tl, [2, '\v(a|aa)(a|aa)', 'aaa', 'aa', 'a', 'a'])
+
+ " \%u and friends
+ call add(tl, [2, '\%d32', 'yes no', ' '])
+ call add(tl, [2, '\%o40', 'yes no', ' '])
+ call add(tl, [2, '\%x20', 'yes no', ' '])
+ call add(tl, [2, '\%u0020', 'yes no', ' '])
+ call add(tl, [2, '\%U00000020', 'yes no', ' '])
+ call add(tl, [2, '\%d0', "yes\x0ano", "\x0a"])
+
+ "" \%[abc]
+ call add(tl, [2, 'foo\%[bar]', 'fobar'])
+ call add(tl, [2, 'foo\%[bar]', 'foobar', 'foobar'])
+ call add(tl, [2, 'foo\%[bar]', 'fooxx', 'foo'])
+ call add(tl, [2, 'foo\%[bar]', 'foobxx', 'foob'])
+ call add(tl, [2, 'foo\%[bar]', 'foobaxx', 'fooba'])
+ call add(tl, [2, 'foo\%[bar]', 'foobarxx', 'foobar'])
+ call add(tl, [2, 'foo\%[bar]x', 'foobxx', 'foobx'])
+ call add(tl, [2, 'foo\%[bar]x', 'foobarxx', 'foobarx'])
+ call add(tl, [2, '\%[bar]x', 'barxx', 'barx'])
+ call add(tl, [2, '\%[bar]x', 'bxx', 'bx'])
+ call add(tl, [2, '\%[bar]x', 'xxx', 'x'])
+ call add(tl, [2, 'b\%[[ao]r]', 'bar bor', 'bar'])
+ call add(tl, [2, 'b\%[[]]r]', 'b]r bor', 'b]r'])
+ call add(tl, [2, '@\%[\w\-]*', '<http://john.net/pandoc/>[@pandoc]', '@pandoc'])
+
+ " Alternatives, must use first longest match
+ call add(tl, [2, 'goo\|go', 'google', 'goo'])
+ call add(tl, [2, '\<goo\|\<go', 'google', 'goo'])
+ call add(tl, [2, '\<goo\|go', 'google', 'goo'])
+
+ " Back references
+ call add(tl, [2, '\(\i\+\) \1', ' abc abc', 'abc abc', 'abc'])
+ call add(tl, [2, '\(\i\+\) \1', 'xgoo goox', 'goo goo', 'goo'])
+ call add(tl, [2, '\(a\)\(b\)\(c\)\(dd\)\(e\)\(f\)\(g\)\(h\)\(i\)\1\2\3\4\5\6\7\8\9', 'xabcddefghiabcddefghix', 'abcddefghiabcddefghi', 'a', 'b', 'c', 'dd', 'e', 'f', 'g', 'h', 'i'])
+ call add(tl, [2, '\(\d*\)a \1b', ' a b ', 'a b', ''])
+ call add(tl, [2, '^.\(.\).\_..\1.', "aaa\naaa\nb", "aaa\naaa", 'a'])
+ call add(tl, [2, '^.*\.\(.*\)/.\+\(\1\)\@<!$', 'foo.bat/foo.com', 'foo.bat/foo.com', 'bat'])
+ call add(tl, [2, '^.*\.\(.*\)/.\+\(\1\)\@<!$', 'foo.bat/foo.bat'])
+ call add(tl, [2, '^.*\.\(.*\)/.\+\(\1\)\@<=$', 'foo.bat/foo.bat', 'foo.bat/foo.bat', 'bat', 'bat'])
+ call add(tl, [2, '\\\@<!\${\(\d\+\%(:.\{-}\)\?\\\@<!\)}', '2013-06-27${0}', '${0}', '0'])
+ call add(tl, [2, '^\(a*\)\1$', 'aaaaaaaa', 'aaaaaaaa', 'aaaa'])
+ call add(tl, [2, '^\(a\{-2,}\)\1\+$', 'aaaaaaaaa', 'aaaaaaaaa', 'aaa'])
+
+ " Look-behind with limit
+ call add(tl, [2, '<\@<=span.', 'xxspanxx<spanyyy', 'spany'])
+ call add(tl, [2, '<\@1<=span.', 'xxspanxx<spanyyy', 'spany'])
+ call add(tl, [2, '<\@2<=span.', 'xxspanxx<spanyyy', 'spany'])
+ call add(tl, [2, '\(<<\)\@<=span.', 'xxspanxxxx<spanxx<<spanyyy', 'spany', '<<'])
+ call add(tl, [2, '\(<<\)\@1<=span.', 'xxspanxxxx<spanxx<<spanyyy'])
+ call add(tl, [2, '\(<<\)\@2<=span.', 'xxspanxxxx<spanxx<<spanyyy', 'spany', '<<'])
+ call add(tl, [2, '\(foo\)\@<!bar.', 'xx foobar1 xbar2 xx', 'bar2'])
+
+ " look-behind match in front of a zero-width item
+ call add(tl, [2, '\v\C%(<Last Changed:\s+)@<=.*$', '" test header'])
+ call add(tl, [2, '\v\C%(<Last Changed:\s+)@<=.*$', '" Last Changed: 1970', '1970'])
+ call add(tl, [2, '\(foo\)\@<=\>', 'foobar'])
+ call add(tl, [2, '\(foo\)\@<=\>', 'barfoo', '', 'foo'])
+ call add(tl, [2, '\(foo\)\@<=.*', 'foobar', 'bar', 'foo'])
+
+ " complicated look-behind match
+ call add(tl, [2, '\(r\@<=\|\w\@<!\)\/', 'x = /word/;', '/'])
+ call add(tl, [2, '^[a-z]\+\ze \&\(asdf\)\@<!', 'foo bar', 'foo'])
+
+ "" \@>
+ call add(tl, [2, '\(a*\)\@>a', 'aaaa'])
+ call add(tl, [2, '\(a*\)\@>b', 'aaab', 'aaab', 'aaa'])
+ call add(tl, [2, '^\(.\{-}b\)\@>.', ' abcbd', ' abc', ' ab'])
+ call add(tl, [2, '\(.\{-}\)\(\)\@>$', 'abc', 'abc', 'abc', ''])
+ " TODO: BT engine does not restore submatch after failure
+ call add(tl, [1, '\(a*\)\@>a\|a\+', 'aaaa', 'aaaa'])
+
+ " "\_" prepended negated collection matches EOL
+ call add(tl, [2, '\_[^8-9]\+', "asfi\n9888", "asfi\n"])
+ call add(tl, [2, '\_[^a]\+', "asfi\n9888", "sfi\n9888"])
+
+ " Requiring lots of states.
+ call add(tl, [2, '[0-9a-zA-Z]\{8}-\([0-9a-zA-Z]\{4}-\)\{3}[0-9a-zA-Z]\{12}', " 12345678-1234-1234-1234-123456789012 ", "12345678-1234-1234-1234-123456789012", "1234-"])
+
+ " Skip adding state twice
+ call add(tl, [2, '^\%(\%(^\s*#\s*if\>\|#\s*if\)\)\(\%>1c.*$\)\@=', "#if FOO", "#if", ' FOO'])
+
+ " Test \%v atom (virtual column)
+ call add(tl, [2, '\%>70vGesamt', 'Jean-Michel Charlier & Victor Hubinon\Gesamtausgabe [Salleck] Buck Danny {Jean-Michel Charlier & Victor Hubinon}\Gesamtausgabe', 'Gesamt'])
+
+ " Test for ignoring case and matching repeated characters
+ call add(tl, [2, '\cb\+', 'aAbBbBcC', 'bBbB'])
+
+ " Run the tests
+ for t in tl
+ let re = t[0]
+ let pat = t[1]
+ let text = t[2]
+ " index in t of the expected whole match; submatch i is at matchidx + i
+ let matchidx = 3
+ for engine in [0, 1, 2]
+ " skip the engine that the first item of the entry excludes
+ if engine == 2 && re == 0 || engine == 1 && re == 1
+ continue
+ endif
+ let &regexpengine = engine
+ try
+ let l = matchlist(text, pat)
+ catch
+ call assert_report('Error ' . engine . ': pat: \"' . pat
+ \ . '\", text: \"' . text . '\", caused an exception: \"'
+ \ . v:exception . '\"')
+ " "l" was not assigned for this pattern (it is unset or still holds the
+ " previous result), so the checks below would be meaningless
+ continue
+ endtry
+ " check the match itself
+ if len(l) == 0 && len(t) > matchidx
+ call assert_report('Error ' . engine . ': pat: \"' . pat
+ \ . '\", text: \"' . text . '\", did not match, expected: \"'
+ \ . t[matchidx] . '\"')
+ elseif len(l) > 0 && len(t) == matchidx
+ call assert_report('Error ' . engine . ': pat: \"' . pat
+ \ . '\", text: \"' . text . '\", match: \"' . l[0]
+ \ . '\", expected no match')
+ elseif len(t) > matchidx && l[0] != t[matchidx]
+ call assert_report('Error ' . engine . ': pat: \"' . pat
+ \ . '\", text: \"' . text . '\", match: \"' . l[0]
+ \ . '\", expected: \"' . t[matchidx] . '\"')
+ else
+ " Test passed
+ endif
+
+ " check all the nine submatches
+ if len(l) > 0
+ for i in range(1, 9)
+ " a submatch not listed in the entry is expected to be empty
+ if len(t) <= matchidx + i
+ let e = ''
+ else
+ let e = t[matchidx + i]
+ endif
+ if l[i] != e
+ call assert_report('Error ' . engine . ': pat: \"' . pat
+ \ . '\", text: \"' . text . '\", submatch ' . i . ': \"'
+ \ . l[i] . '\", expected: \"' . e . '\"')
+ endif
+ endfor
+ unlet i
+ endif
+ endfor
+ endfor
+
+ unlet t tl e l
+endfunc
+
+" Tests for multi-line regexp patterns without multi-byte support.
+func Test_regexp_multiline_pat()
+ " tl is a List of Lists with:
+ " regexp engines to test
+ " 0 - test with 'regexpengine' values 0 and 1
+ " 1 - test with 'regexpengine' values 0 and 2
+ " 2 - test with 'regexpengine' values 0, 1 and 2
+ " regexp pattern
+ " List with text to test the pattern on
+ " List with the expected match
+ let tl = []
+
+ " back references
+ call add(tl, [2, '^.\(.\).\_..\1.', ['aaa', 'aaa', 'b'], ['XX', 'b']])
+ call add(tl, [2, '\v.*\/(.*)\n.*\/\1$', ['./Dir1/Dir2/zyxwvuts.txt', './Dir1/Dir2/abcdefgh.bat', '', './Dir1/Dir2/file1.txt', './OtherDir1/OtherDir2/file1.txt'], ['./Dir1/Dir2/zyxwvuts.txt', './Dir1/Dir2/abcdefgh.bat', '', 'XX']])
+
+ " line breaks
+ call add(tl, [2, '\S.*\nx', ['abc', 'def', 'ghi', 'xjk', 'lmn'], ['abc', 'def', 'XXjk', 'lmn']])
+
+ " Any single character or end-of-line
+ call add(tl, [2, '\_.\+', ['a', 'b', 'c'], ['XX']])
+ " Any identifier or end-of-line
+ call add(tl, [2, '\_i\+', ['a', 'b', ';', '2'], ['XX;XX']])
+ " Any identifier but excluding digits or end-of-line
+ call add(tl, [2, '\_I\+', ['a', 'b', ';', '2'], ['XX;XX2XX']])
+ " Any keyword or end-of-line
+ call add(tl, [2, '\_k\+', ['a', 'b', '=', '2'], ['XX=XX']])
+ " Any keyword but excluding digits or end-of-line
+ call add(tl, [2, '\_K\+', ['a', 'b', '=', '2'], ['XX=XX2XX']])
+ " Any filename character or end-of-line
+ call add(tl, [2, '\_f\+', ['a', 'b', '.', '5'], ['XX']])
+ " Any filename character but excluding digits or end-of-line
+ call add(tl, [2, '\_F\+', ['a', 'b', '.', '5'], ['XX5XX']])
+ " Any printable character or end-of-line
+ call add(tl, [2, '\_p\+', ['a', 'b', '=', '4'], ['XX']])
+ " Any printable character excluding digits or end-of-line
+ call add(tl, [2, '\_P\+', ['a', 'b', '=', '4'], ['XX4XX']])
+ " Any whitespace character or end-of-line
+ call add(tl, [2, '\_s\+', [' ', ' ', 'a', 'b'], ['XXaXXbXX']])
+ " Any non-whitespace character or end-of-line
+ call add(tl, [2, '\_S\+', [' ', ' ', 'a', 'b'], [' XX XX']])
+ " Any decimal digit or end-of-line
+ call add(tl, [2, '\_d\+', ['1', 'a', '2', 'b', '3'], ['XXaXXbXX']])
+ " Any non-decimal digit or end-of-line
+ call add(tl, [2, '\_D\+', ['1', 'a', '2', 'b', '3'], ['1XX2XX3XX']])
+ " Any hexadecimal digit or end-of-line
+ call add(tl, [2, '\_x\+', ['1', 'a', 'g', '9', '8'], ['XXgXX']])
+ " Any non-hexadecimal digit or end-of-line
+ call add(tl, [2, '\_X\+', ['1', 'a', 'g', '9', '8'], ['1XXaXX9XX8XX']])
+ " Any octal digit or end-of-line
+ call add(tl, [2, '\_o\+', ['0', '7', '8', '9', '0'], ['XX8XX9XX']])
+ " Any non-octal digit or end-of-line
+ call add(tl, [2, '\_O\+', ['0', '7', '8', '9', '0'], ['0XX7XX0XX']])
+ " Any word character or end-of-line
+ call add(tl, [2, '\_w\+', ['A', 'B', '=', 'C', 'D'], ['XX=XX']])
+ " Any non-word character or end-of-line
+ call add(tl, [2, '\_W\+', ['A', 'B', '=', 'C', 'D'], ['AXXBXXCXXDXX']])
+ " Any head-of-word character or end-of-line
+ call add(tl, [2, '\_h\+', ['a', '1', 'b', '2', 'c'], ['XX1XX2XX']])
+ " Any non-head-of-word character or end-of-line
+ call add(tl, [2, '\_H\+', ['a', '1', 'b', '2', 'c'], ['aXXbXXcXX']])
+ " Any alphabetic character or end-of-line
+ call add(tl, [2, '\_a\+', ['a', '1', 'b', '2', 'c'], ['XX1XX2XX']])
+ " Any non-alphabetic character or end-of-line
+ call add(tl, [2, '\_A\+', ['a', '1', 'b', '2', 'c'], ['aXXbXXcXX']])
+ " Any lowercase character or end-of-line
+ call add(tl, [2, '\_l\+', ['a', 'A', 'b', 'B'], ['XXAXXBXX']])
+ " Any non-lowercase character or end-of-line
+ call add(tl, [2, '\_L\+', ['a', 'A', 'b', 'B'], ['aXXbXX']])
+ " Any uppercase character or end-of-line
+ call add(tl, [2, '\_u\+', ['a', 'A', 'b', 'B'], ['aXXbXX']])
+ " Any non-uppercase character or end-of-line
+ call add(tl, [2, '\_U\+', ['a', 'A', 'b', 'B'], ['XXAXXBXX']])
+ " Collection or end-of-line
+ call add(tl, [2, '\_[a-z]\+', ['a', 'A', 'b', 'B'], ['XXAXXBXX']])
+ " start of line anywhere in the text
+ call add(tl, [2, 'one\zs\_s*\_^\zetwo',
+ \ ['', 'one', ' two', 'one', '', 'two'],
+ \ ['', 'one', ' two', 'oneXXtwo']])
+ " end of line anywhere in the text
+ call add(tl, [2, 'one\zs\_$\_s*two',
+ \ ['', 'one', ' two', 'one', '', 'two'], ['', 'oneXX', 'oneXX']])
+
+ " Check that \_[0-9] matching EOL does not break a following \>
+ call add(tl, [2, '\<\(\(25\_[0-5]\|2\_[0-4]\_[0-9]\|\_[01]\?\_[0-9]\_[0-9]\?\)\.\)\{3\}\(25\_[0-5]\|2\_[0-4]\_[0-9]\|\_[01]\?\_[0-9]\_[0-9]\?\)\>', ['', 'localnet/192.168.0.1', ''], ['', 'localnet/XX', '']])
+
+ " Check a pattern with a line break and ^ and $
+ call add(tl, [2, 'a\n^b$\n^c', ['a', 'b', 'c'], ['XX']])
+
+ call add(tl, [2, '\(^.\+\n\)\1', [' dog', ' dog', 'asdf'], ['XXasdf']])
+
+ " Run the multi-line tests
+ for t in tl
+ let re = t[0]
+ let pat = t[1]
+ let before = t[2]
+ let after = t[3]
+ for engine in [0, 1, 2]
+ if engine == 2 && re == 0 || engine == 1 && re == 1
+ continue
+ endif
+ let &regexpengine = engine
+ new
+ call setline(1, before)
+ exe '%s/' . pat . '/XX/'
+ let result = getline(1, '$')
+ q!
+ if result != after
+ call assert_report('Error: pat: \"' . pat . '\", text: \"'
+ \ . string(before) . '\", expected: \"' . string(after)
+ \ . '\", got: \"' . string(result) . '\"')
+ else
+ " Test passed
+ endif
+ endfor
+ endfor
+ unlet t tl
+endfunc
+
+" Check that using a pattern on two lines doesn't get messed up by using
+" matchstr() with \ze in between.
+func Test_matchstr_with_ze()
+ " Runs a two-line :substitute whose replacement expression calls
+ " matchstr() with \ze, and verifies both lines are replaced correctly.
+ new
+ " Insert the three fixture lines above the new buffer's initial empty line.
+ call append(0, ['Substitute here:', '<T="">Ta 5</Title>',
+ \ '<T="">Ac 7</Title>'])
+ call cursor(1, 1)
+ set re=0
+
+ " On the two lines below the cursor, replace the empty "" with the digits
+ " that directly precede a '<' on that same line, wrapped in double quotes.
+ .+1,.+2s/""/\='"' . matchstr(getline("."), '\d\+\ze<') . '"'
+ " The trailing '' is the empty line the buffer had before append().
+ call assert_equal(['Substitute here:', '<T="5">Ta 5</Title>',
+ \ '<T="7">Ac 7</Title>', ''], getline(1, '$'))
+
+ bwipe!
+endfunc
+
+" Check a pattern with a look behind crossing a line boundary
+func Test_lookbehind_across_line()
+ " Searches for 'start' preceded by '<' plus a run of x/y characters and/or
+ " line breaks (\_[xy]\+), using a look-behind with a count of 3 (\@3<=),
+ " and checks where the cursor lands.
+ new
+ call append(0, ['Behind:', 'asdfasd<yyy', 'xxstart1', 'asdfasd<yy',
+ \ 'xxxstart2', 'asdfasd<yy', 'xxstart3'])
+ call cursor(1, 1)
+ call search('\(<\_[xy]\+\)\@3<=start')
+ " Expected hit: line 7 ('xxstart3'), column 3.
+ call assert_equal([0, 7, 3, 0], getpos('.'))
+ bwipe!
+endfunc
+
+" Test for the \%V atom (match inside the visual area)
+func Regex_Match_Visual_Area()
+ " Helper: runs :s with \%V under three kinds of Visual selection and checks
+ " the buffer contents. Works on the current buffer with whatever
+ " 'regexpengine' the caller has set, and empties the buffer at the end.
+ call append(0, ['Visual:', 'thexe the thexethe', 'andaxand andaxand',
+ \ 'oooxofor foroxooo', 'oooxofor foroxooo'])
+ call cursor(1, 1)
+ " Line 2: characterwise selection from the first 'x' to the next 'x';
+ " uppercase every 'e' inside the selection.
+ exe "normal jfxvfx:s/\\%Ve/E/g\<CR>"
+ " Line 3: linewise selection; uppercase every 'a' on the line.
+ exe "normal jV:s/\\%Va/A/g\<CR>"
+ " Lines 4-5: blockwise selection between the two 'x' columns, extended one
+ " line down; uppercase every 'o' inside the block.
+ exe "normal jfx\<C-V>fxj:s/\\%Vo/O/g\<CR>"
+ call assert_equal(['Visual:', 'thexE thE thExethe', 'AndAxAnd AndAxAnd',
+ \ 'oooxOfOr fOrOxooo', 'oooxOfOr fOrOxooo', ''], getline(1, '$'))
+ " Empty the buffer.
+ %d
+endfunc
+
+" Check matching Visual area
+func Test_matching_visual_area()
+  " Run the \%V helper once for each explicitly selected regexp engine
+  " (1, then 2) in a scratch window, then put 'regexpengine' back to its
+  " default value.
+  new
+  for engine in [1, 2]
+    let &regexpengine = engine
+    call Regex_Match_Visual_Area()
+  endfor
+  set regexpengine&
+  bwipe!
+endfunc
+
+" Check matching marks
+func Regex_Mark()
+ " Helper: checks the mark-position atoms \%>'s and \%<'e in :substitute.
+ " Works on the current buffer with whatever 'regexpengine' the caller has
+ " set, and empties the buffer at the end.
+ call append(0, ['', '', '', 'Marks:', 'asdfSasdfsadfEasdf', 'asdfSas',
+ \ 'dfsadfEasdf', '', '', '', '', ''])
+ call cursor(4, 1)
+ " Line 5: set mark s on 'S' and mark e on 'E' (same line), then substitute
+ " the text delimited by the two marks with 'here'.
+ exe "normal jfSmsfEme:.-4,.+6s/.\\%>'s.*\\%<'e../here/\<CR>"
+ " Lines 6-7: mark s on 'S' in line 6 and mark e on 'E' in line 7; \_.* lets
+ " the match cross the line break, so the two lines become one.
+ exe "normal jfSmsj0fEme:.-4,.+6s/.\\%>'s\\_.*\\%<'e../again/\<CR>"
+ call assert_equal(['', '', '', 'Marks:', 'asdfhereasdf', 'asdfagainasdf',
+ \ '', '', '', '', '', ''], getline(1, '$'))
+ " Empty the buffer.
+ %d
+endfunc
+
+func Test_matching_marks()
+  " Run the mark-position helper with the backtracking engine (1) and the
+  " NFA engine (2) in a scratch window.
+  new
+  set regexpengine=1
+  call Regex_Mark()
+  set regexpengine=2
+  call Regex_Mark()
+  " Restore the default so that later tests do not silently inherit
+  " engine 2 (same cleanup as Test_matching_visual_area()).
+  set regexpengine&
+  bwipe!
+endfunc
+
+" Check patterns matching cursor position.
+func s:curpos_test()
+ " Helper: applies a series of :substitute commands that use cursor, column,
+ " virtual-column and line position atoms, then compares the whole buffer
+ " with the expected result. Uses whatever 'regexpengine' the caller set.
+ new
+ call setline(1, ['ffooooo', 'boboooo', 'zoooooo', 'koooooo', 'moooooo',
+ \ "\t\t\tfoo", 'abababababababfoo', 'bababababababafoo', '********_',
+ \ ' xxxxxxxxxxxx xxxx xxxxxx xxxxxxx x xxxxxxxxx xx xxxxxx xxxxxx xxxxx xxxxxxx xx xxxx xxxxxxxx xxxx xxxxxxxxxxx xxx xxxxxxx xxxxxxxxx xx xxxxxx xx xxxxxxx xxxxxxxxxxxxxxxx xxxxxxxxx xxx xxxxxxxx xxxxxxxxx xxxx xxx xxxx xxx xxx xxxxx xxxxxxxxxxxx xxxx xxxxxxxxx xxxxxxxxxxx xx xxxxx xxx xxxxxxxx xxxxxx xxx xxx xxxxxxxxx xxxxxxx x xxxxxxxxx xx xxxxxx xxxxxxx xxxxxxxxxxxxxxxxxx xxxxxxx xxxxxxx xxx xxx xxxxxxxx xxxxxxx xxxx xxx xxxxxx xxxxx xxxxx xx xxxxxx xxxxxxx xxx xxxxxxxxxxxx xxxx xxxxxxxxx xxxxxx xxxxxx xxxxx xxx xxxxxxx xxxxxxxxxxxxxxxx xxxxxxxxx xxxxxxxxxx xxxx xx xxxxxxxx xxx xxxxxxxxxxx xxxxx'])
+ " Line 1: delete every character after column 3.
+ call setpos('.', [0, 1, 0, 0])
+ s/\%>3c.//g
+ " Line 2: delete from the cursor position (column 4) to end of line.
+ call setpos('.', [0, 2, 4, 0])
+ s/\%#.*$//g
+ " Line 3: replace every character before column 3 with '_'.
+ call setpos('.', [0, 3, 0, 0])
+ s/\%<3c./_/g
+ " Line 4 only: replace characters after column 5 with '_'.
+ %s/\%4l\%>5c./_/g
+ " Line 6 only: replace characters after virtual column 25 with '_'.
+ %s/\%6l\%>25v./_/g
+ " Below line 6: replace the character in column 3 with '!'.
+ %s/\%>6l\%3c./!/g
+ " Below line 7: replace the character in column 12 with '?'.
+ %s/\%>7l\%12c./?/g
+ " Line 8 only (after 7, before 9): replace virtual columns 6-7 with '#'.
+ %s/\%>7l\%<9l\%>5v\%<8v./#/g
+ " Last line: look-behind pattern; the 'e' flag suppresses the error when it
+ " does not match. The expected last line below shows no change from this
+ " command beyond the '!' and '?' edits above.
+ $s/\%(|\u.*\)\@<=[^|\t]\+$//ge
+ call assert_equal(['ffo', 'bob', '__ooooo', 'koooo__', 'moooooo',
+ \ ' f__', 'ab!babababababfoo',
+ \ 'ba!ab##abab?bafoo', '**!*****_',
+ \ ' ! xxx?xxxxxxxx xxxx xxxxxx xxxxxxx x xxxxxxxxx xx xxxxxx xxxxxx xxxxx xxxxxxx xx xxxx xxxxxxxx xxxx xxxxxxxxxxx xxx xxxxxxx xxxxxxxxx xx xxxxxx xx xxxxxxx xxxxxxxxxxxxxxxx xxxxxxxxx xxx xxxxxxxx xxxxxxxxx xxxx xxx xxxx xxx xxx xxxxx xxxxxxxxxxxx xxxx xxxxxxxxx xxxxxxxxxxx xx xxxxx xxx xxxxxxxx xxxxxx xxx xxx xxxxxxxxx xxxxxxx x xxxxxxxxx xx xxxxxx xxxxxxx xxxxxxxxxxxxxxxxxx xxxxxxx xxxxxxx xxx xxx xxxxxxxx xxxxxxx xxxx xxx xxxxxx xxxxx xxxxx xx xxxxxx xxxxxxx xxx xxxxxxxxxxxx xxxx xxxxxxxxx xxxxxx xxxxxx xxxxx xxx xxxxxxx xxxxxxxxxxxxxxxx xxxxxxxxx xxxxxxxxxx xxxx xx xxxxxxxx xxx xxxxxxxxxxx xxxxx'],
+ \ getline(1, '$'))
+ bwipe!
+endfunc
+
+func Test_matching_curpos()
+  " Run the cursor/column/line position checks with 'regexpengine' set to
+  " 0, 1 and 2 in turn, then restore the option's default.
+  for engine in range(3)
+    let &regexpengine = engine
+    call s:curpos_test()
+  endfor
+  set re&
+endfunc
+
+" Test for matching the start and end of a buffer
+func Regex_start_end_buffer()
+ " Helper: checks the start-of-buffer (\%^) and end-of-buffer (\%$) atoms in
+ " searches. Works on the current buffer with whatever 'regexpengine' the
+ " caller has set, and empties the buffer at the end.
+ " Fill the buffer with 20 identical 8-character lines.
+ call setline(1, repeat(['vim edit'], 20))
+ " \%^ alone lands on line 1, column 1.
+ /\%^
+ call assert_equal([0, 1, 1, 0], getpos('.'))
+ " From the middle of the buffer, \%^ followed by two characters still
+ " lands on line 1, column 1.
+ exe "normal 50%/\\%^..\<CR>"
+ call assert_equal([0, 1, 1, 0], getpos('.'))
+ " \%$ alone lands on the last character of the last line.
+ exe "normal 50%/\\%$\<CR>"
+ call assert_equal([0, 20, 8, 0], getpos('.'))
+ " Two characters followed by \%$ land on the second-to-last character.
+ exe "normal 6gg/..\\%$\<CR>"
+ call assert_equal([0, 20, 7, 0], getpos('.'))
+ " Empty the buffer.
+ %d
+endfunc
+
+func Test_start_end_of_buffer_match()
+  " Run the start/end-of-buffer helper with the backtracking engine (1) and
+  " the NFA engine (2) in a scratch window.
+  new
+  set regexpengine=1
+  call Regex_start_end_buffer()
+  set regexpengine=2
+  call Regex_start_end_buffer()
+  " Restore the default so that later tests do not silently inherit
+  " engine 2 (same cleanup as Test_matching_visual_area()).
+  set regexpengine&
+  bwipe!
+endfunc
+
+func Test_ze_before_zs()
+  " A pattern with \ze placed before \zs must give an empty match, and
+  " matchlist() must return ten empty strings, with either regexp engine.
+  let patterns = map([1, 2], {_, engine -> '\%#=' .. engine .. '\ze \zs'})
+  for pat in patterns
+    call assert_equal('', matchstr(' ', pat))
+  endfor
+  for pat in patterns
+    call assert_equal(repeat([''], 10), matchlist(' ', pat))
+  endfor
+endfunc
+
+" Check for detecting error
+func Test_regexp_error()
+ " Verifies that malformed or out-of-range patterns are rejected with the
+ " expected error number, and that values just inside the limit are accepted.
+ " A multi (*) applied to \zs or \ze is rejected by both engines.
+ call assert_fails("call matchlist('x x', '\\%#=1 \\zs*')", 'E888:')
+ call assert_fails("call matchlist('x x', '\\%#=1 \\ze*')", 'E888:')
+ call assert_fails("call matchlist('x x', '\\%#=2 \\zs*')", 'E888:')
+ call assert_fails("call matchlist('x x', '\\%#=2 \\ze*')", 'E888:')
+ " \%o followed by '8', which is not an octal digit.
+ call assert_fails("call matchstr('abcd', '\\%o841\\%o142')", 'E678:')
+ " Column / line / virtual column number 2147483647 is too large (engine 2).
+ call assert_fails("call matchstr('abcd', '\\%#=2\\%2147483647c')", 'E951:')
+ call assert_fails("call matchstr('abcd', '\\%#=2\\%2147483647l')", 'E951:')
+ call assert_fails("call matchstr('abcd', '\\%#=2\\%2147483647v')", 'E951:')
+ " A \%[] item nested inside another \%[] (engine 1).
+ call assert_fails('exe "normal /\\%#=1\\%[x\\%[x]]\<CR>"', 'E369:')
+ " Same too-large checks through an interactive search; note that the limit
+ " used for \%v here (102261126) is lower than the one for \%l and \%c.
+ call assert_fails('exe "normal /\\%#=2\\%2147483647l\<CR>"', 'E951:')
+ call assert_fails('exe "normal /\\%#=2\\%2147483647c\<CR>"', 'E951:')
+ call assert_fails('exe "normal /\\%#=2\\%102261126v\<CR>"', 'E951:')
+ " One below each limit is accepted as a pattern; the search then fails
+ " with E486 instead of E951.
+ call assert_fails('exe "normal /\\%#=2\\%2147483646l\<CR>"', 'E486:')
+ call assert_fails('exe "normal /\\%#=2\\%2147483646c\<CR>"', 'E486:')
+ call assert_fails('exe "normal /\\%#=2\\%102261125v\<CR>"', 'E486:')
+ " This \%o sequence raises no error; it just does not match 'abcd'.
+ call assert_equal('', matchstr('abcd', '\%o181\%o142'))
+endfunc
+
+" Test for using the last substitute string pattern (~)
+func Test_regexp_last_subst_string()
+  " Run a :substitute whose replacement is 'baz' (the 'e' flag keeps it
+  " quiet when nothing matches), then check with each regexp engine that '~'
+  " in a pattern matches the text "baz".
+  new
+  s/bar/baz/e
+  let subject = "foo\nbaz\nbar"
+  for engine in [1, 2]
+    let pat = "\\%#=" .. engine .. "\~"
+    call assert_equal(matchstr(subject, pat), "baz")
+  endfor
+  close!
+endfunc
+
+" Check patterns matching cursor position.
+func s:curpos_test2()
+ " Helper: checks the "at cursor" atoms \%.c (column), \%.l (line) and \%.v
+ " (virtual column) in :substitute, using whatever 'regexpengine' the caller
+ " has set.
+ new
+ call setline(1, ['1', '2 foobar eins zwei drei vier fünf sechse',
+ \ '3 foobar eins zwei drei vier fünf sechse',
+ \ '4 foobar eins zwei drei vier fünf sechse',
+ \ '5 foobar eins zwei drei vier fünf sechse',
+ \ '6 foobar eins zwei drei vier fünf sechse',
+ \ '7 foobar eins zwei drei vier fünf sechse'])
+ " Line 2, cursor in column 10: delete from the cursor column to the end.
+ call setpos('.', [0, 2, 10, 0])
+ s/\%.c.*//g
+ " Line 3: matching on the cursor line deletes the whole line's text.
+ call setpos('.', [0, 3, 15, 0])
+ s/\%.l.*//g
+ " Line 5, cursor in column 3: replace from the cursor's virtual column to
+ " the end with '_'.
+ call setpos('.', [0, 5, 3, 0])
+ s/\%.v.*/_/g
+ call assert_equal(['1',
+ \ '2 foobar ',
+ \ '',
+ \ '4 foobar eins zwei drei vier fünf sechse',
+ \ '5 _',
+ \ '6 foobar eins zwei drei vier fünf sechse',
+ \ '7 foobar eins zwei drei vier fünf sechse'],
+ \ getline(1, '$'))
+ " A number between the '.' and the l/c/v letter is an error.
+ call assert_fails('call search("\\%.1l")', 'E1204:')
+ call assert_fails('call search("\\%.1c")', 'E1204:')
+ call assert_fails('call search("\\%.1v")', 'E1204:')
+ bwipe!
+endfunc
+
+" Check patterns matching before or after cursor position.
+func s:curpos_test3()
+ " Helper: checks the "before cursor" (\%<.c, \%<.v, \%<.l) and "after
+ " cursor" (\%>.c, \%>.v, \%>.l) atoms in :substitute, using whatever
+ " 'regexpengine' the caller has set.
+ new
+ call setline(1, ['1', '2 foobar eins zwei drei vier fünf sechse',
+ \ '3 foobar eins zwei drei vier fünf sechse',
+ \ '4 foobar eins zwei drei vier fünf sechse',
+ \ '5 foobar eins zwei drei vier fünf sechse',
+ \ '6 foobar eins zwei drei vier fünf sechse',
+ \ '7 foobar eins zwei drei vier fünf sechse'])
+ call setpos('.', [0, 2, 10, 0])
+ " Note: This removes all columns, except for the column directly in front of
+ " the cursor. Bug????
+ :s/^.*\%<.c//
+ " Line 3, cursor in column 10: delete everything after the cursor column.
+ call setpos('.', [0, 3, 10, 0])
+ :s/\%>.c.*$//
+ call setpos('.', [0, 5, 4, 0])
+ " Note: This removes all columns, except for the column directly in front of
+ " the cursor. Bug????
+ :s/^.*\%<.v/_/
+ " Line 6, cursor in column 4: replace everything after the cursor's virtual
+ " column with '_'.
+ call setpos('.', [0, 6, 4, 0])
+ :s/\%>.v.*$/_/
+ call assert_equal(['1',
+ \ ' eins zwei drei vier fünf sechse',
+ \ '3 foobar e',
+ \ '4 foobar eins zwei drei vier fünf sechse',
+ \ '_foobar eins zwei drei vier fünf sechse',
+ \ '6 fo_',
+ \ '7 foobar eins zwei drei vier fünf sechse'],
+ \ getline(1, '$'))
+ " Start over with fresh text for the line-number variants.
+ sil %d
+ call setline(1, ['1', '2 foobar eins zwei drei vier fünf sechse',
+ \ '3 foobar eins zwei drei vier fünf sechse',
+ \ '4 foobar eins zwei drei vier fünf sechse',
+ \ '5 foobar eins zwei drei vier fünf sechse',
+ \ '6 foobar eins zwei drei vier fünf sechse',
+ \ '7 foobar eins zwei drei vier fünf sechse'])
+ " Cursor on line 4: clear the text of every line above it.
+ call setpos('.', [0, 4, 4, 0])
+ %s/\%<.l.*//
+ " Cursor on line 5: clear the text of every line below it.
+ call setpos('.', [0, 5, 4, 0])
+ %s/\%>.l.*//
+ call assert_equal(['', '', '',
+ \ '4 foobar eins zwei drei vier fünf sechse',
+ \ '5 foobar eins zwei drei vier fünf sechse',
+ \ '', ''],
+ \ getline(1, '$'))
+ bwipe!
+endfunc
+
+" Test that matching before, at or after the
+" cursor position works
+func Test_matching_pos()
+  " For each 'regexpengine' value (0, 1, 2) run the "at cursor" checks
+  " followed by the "before/after cursor" checks, then restore the default.
+  for engine in [0, 1, 2]
+    let &regexpengine = engine
+    call s:curpos_test2()
+    call s:curpos_test3()
+  endfor
+  set re&
+endfunc
+
+func Test_using_mark_position()
+  " Regression test: this used to access freed memory.
+  " The first command leaves the engine choice alone (the "new engine"
+  " case); the second forces the old engine with \%#=1.  Each runs in its
+  " own scratch window and must fail with E486.
+  let commands = ["s/\\%')", "s/\\%#=1\\%')"]
+  for cmd in commands
+    new
+    norm O0
+    call assert_fails(cmd, 'E486:')
+    bwipe!
+  endfor
+endfunc
+
+func Test_using_visual_position()
+ " this was using freed memory
+ " There are no assertions: the test passes when the \%V search below
+ " completes.
+ new
+ " Set up a blockwise Visual area and change the text with normal-mode keys.
+ exe "norm 0o\<Esc>\<C-V>k\<C-X>o0"
+ /\%V
+ bwipe!
+endfunc
+
+func Test_using_invalid_visual_position()
+ " this was going beyond the end of the line
+ " There are no assertions: the test passes when the \%V search below
+ " completes.
+ new
+ " Select a block to end of line ('$') and replace it with shorter text.
+ exe "norm 0o000\<Esc>0\<C-V>$s0"
+ /\%V
+ bwipe!
+endfunc
+
+func Test_using_two_engines_pattern()
+ " Checks where the engine selector \%#= may appear in a pattern: it is an
+ " error at the end of the pattern and is accepted at the start.
+ new
+ call setline(1, ['foobar=0', 'foobar=1', 'foobar=2'])
+ " \%#= at the end of the pattern
+ " Try every combination of 'regexpengine' value (i) and selector digit (j);
+ " all of them must fail with E1281.
+ for i in range(0, 2)
+ for j in range(0, 2)
+ exe "set re=" .. i
+ call cursor(j + 1, 7)
+ call assert_fails("%s/foobar\\%#=" .. j, 'E1281:')
+ endfor
+ endfor
+ set re=0
+
+ " \%#= at the start of the pattern
+ " Each selector digit i replaces the line 'foobar=<i>' with 'xx'.
+ for i in range(0, 2)
+ call cursor(i + 1, 7)
+ exe ":%s/\\%#=" .. i .. "foobar=" .. i .. "/xx"
+ endfor
+ call assert_equal(['xx', 'xx', 'xx'], getline(1, '$'))
+ bwipe!
+endfunc
+
+func Test_recursive_substitute_expr()
+ " Runs a :substitute whose replacement part references Repl(), which itself
+ " executes a bare :s. There are no assertions: errors are silenced and the
+ " test passes when the command completes.
+ new
+ " Temporary global function, removed again at the end of the test.
+ func Repl()
+ s
+ endfunc
+ silent! s/\%')/~\=Repl()
+
+ bwipe!
+ delfunc Repl
+endfunc
+
+def Test_compare_columns()
+ # this was using a line below the last line
+ # There are no assertions: the test passes when both searches complete.
+ enew
+ setline(1, ['', ''])
+ # Attach a text property to the first line before searching.
+ prop_type_add('name', {highlight: 'ErrorMsg'})
+ prop_add(1, 1, {length: 1, type: 'name'})
+ # Same pattern with engine 1 and engine 2; the 'n' flag keeps the cursor in
+ # place and 'W' disables wrapping around the end of the buffer.
+ search('\%#=1\%>.l\n.*\%<2v', 'nW')
+ search('\%#=2\%>.l\n.*\%<2v', 'nW')
+ bwipe!
+ # Remove the property type added above.
+ prop_type_delete('name')
+enddef
+
+def Test_compare_column_matchstr()
+  # Search in a buffer first so that a line number is left behind; that line
+  # number must not influence matchstr(), which works on a plain string.
+  enew
+  setline(1, ['one', 'two', 'three'])
+  :3
+  :/ee
+  bwipe!
+  # With each engine, '.*\%<5v' must match the first three characters.
+  for engine in [1, 2]
+    &regexpengine = engine
+    assert_equal('aaa', matchstr('aaaaaaaaaaaaaaaaaaaa', '.*\%<5v'))
+  endfor
+  set re=0
+enddef
+
+
+" vim: shiftwidth=2 sts=2 expandtab