Mercurial > vim
view src/testdir/test_regexp_utf8.vim @ 34379:37b4c89ba420 v9.1.0116
patch 9.1.0116: win_split_ins may not check available room
Commit: https://github.com/vim/vim/commit/0fd44a5ad81ade342cb54d8984965bdedd2272c8
Author: Sean Dewar <6256228+seandewar@users.noreply.github.com>
Date: Tue Feb 20 20:28:15 2024 +0100
patch 9.1.0116: win_split_ins may not check available room
Problem: win_split_ins has no check for E36 when moving an existing
window
Solution: check for room and fix the issues in f_win_splitmove()
(Sean Dewar)
win_split_ins has no check for E36 when moving an existing window,
allowing for layouts with many overlapping zero-sized windows to be
created (which may also cause drawing issues with tablines and such).
f_win_splitmove also has some bugs.
So check for room and fix the issues in f_win_splitmove. Handle failure
in the two relevant win_split_ins callers by restoring the original
layout, and factor the common logic into win_splitmove.
Don't check for room when opening an autocommand window, as it's a
temporary window that's rarely interacted with or drawn anyhow, and is
rather important for some autocommands.
Issues fixed in f_win_splitmove:
- Error if splitting is disallowed.
- Fix heap-use-after-frees if autocommands fired from switching to "targetwin"
close "wp" or "oldwin".
- Fix splitting the wrong window if autocommands fired from switching to
"targetwin" switch to a different window.
- Ensure -1 is returned for all errors.
Also handle allocation failure a bit earlier in make_snapshot (callers,
except win_splitmove, don't really care if a snapshot can't be made, so
just ignore the return value).
Note: Test_smoothscroll_in_zero_width_window failed after these changes with
E36, as it was using the previous behaviour to create a zero-width window.
I've fixed the test such that it fails with UBSAN as expected when v9.0.1367 is
reverted (and simplified it too).
related: #14042
Signed-off-by: Sean Dewar <6256228+seandewar@users.noreply.github.com>
Signed-off-by: Christian Brabandt <cb@256bit.org>
author | Christian Brabandt <cb@256bit.org> |
---|---|
date | Tue, 20 Feb 2024 22:30:04 +0100 |
parents | 90063f44c99a |
children | 97b5457962ed |
line wrap: on
line source
" Tests for regexp in utf8 encoding source shared.vim func s:equivalence_test() let str = "AÀÁÂÃÄÅĀĂĄǍǞǠǺȂȦȺḀẠẢẤẦẨẪẬẮẰẲẴẶ BƁɃḂḄḆ CÇĆĈĊČƇȻḈꞒ DĎĐƊḊḌḎḐḒ EÈÉÊËĒĔĖĘĚȄȆȨɆḔḖḘḚḜẸẺẼẾỀỂỄỆ FƑḞꞘ GĜĞĠĢƓǤǦǴḠꞠ HĤĦȞḢḤḦḨḪⱧ IÌÍÎÏĨĪĬĮİƗǏȈȊḬḮỈỊ JĴɈ KĶƘǨḰḲḴⱩꝀ LĹĻĽĿŁȽḶḸḺḼⱠ MḾṀṂ NÑŃŅŇǸṄṆṈṊꞤ OÒÓÔÕÖØŌŎŐƟƠǑǪǬǾȌȎȪȬȮȰṌṎṐṒỌỎỐỒỔỖỘỚỜỞỠỢ PƤṔṖⱣ QɊ RŔŖŘȐȒɌṘṚṜṞⱤꞦ SŚŜŞŠȘṠṢṤṦṨⱾꞨ TŢŤŦƬƮȚȾṪṬṮṰ UÙÚÛÜŨŪŬŮŰƯǕǙǛǓǗȔȖɄṲṴṶṸṺỤỦỨỪỬỮỰ VƲṼṾ WŴẀẂẄẆẈ XẊẌ YÝŶŸƳȲɎẎỲỴỶỸ ZŹŻŽƵẐẒẔⱫ aàáâãäåāăąǎǟǡǻȃȧᶏḁẚạảấầẩẫậắằẳẵặⱥ bƀɓᵬᶀḃḅḇ cçćĉċčƈȼḉꞓꞔ dďđɗᵭᶁᶑḋḍḏḑḓ eèéêëēĕėęěȅȇȩɇᶒḕḗḙḛḝẹẻẽếềểễệ fƒᵮᶂḟꞙ gĝğġģǥǧǵɠᶃḡꞡ hĥħȟḣḥḧḩḫẖⱨꞕ iìíîïĩīĭįǐȉȋɨᶖḭḯỉị jĵǰɉ kķƙǩᶄḱḳḵⱪꝁ lĺļľŀłƚḷḹḻḽⱡ mᵯḿṁṃ nñńņňʼnǹᵰᶇṅṇṉṋꞥ oòóôõöøōŏőơǒǫǭǿȍȏȫȭȯȱɵṍṏṑṓọỏốồổỗộớờởỡợ pƥᵱᵽᶈṕṗ qɋʠ rŕŗřȑȓɍɽᵲᵳᶉṛṝṟꞧ sśŝşšșȿᵴᶊṡṣṥṧṩꞩ tţťŧƫƭțʈᵵṫṭṯṱẗⱦ uùúûüũūŭůűųǚǖưǔǘǜȕȗʉᵾᶙṳṵṷṹṻụủứừửữự vʋᶌṽṿ wŵẁẃẅẇẉẘ xẋẍ yýÿŷƴȳɏẏẙỳỵỷỹ zźżžƶᵶᶎẑẓẕⱬ" let groups = split(str) for group1 in groups for c in split(group1, '\zs') " next statement confirms that equivalence class matches every " character in group call assert_match('^[[=' .. c .. '=]]*$', group1) for group2 in groups if group2 != group1 " next statement converts that equivalence class doesn't match " character in any other group call assert_equal(-1, match(group2, '[[=' .. c .. '=]]'), c) endif endfor endfor endfor endfunc func Test_equivalence_re1() set re=1 call s:equivalence_test() set re=0 endfunc func Test_equivalence_re2() set re=2 call s:equivalence_test() set re=0 endfunc func s:classes_test() if has('win32') set iskeyword=@,48-57,_,192-255 endif set isprint=@,161-255 call assert_equal('Motörhead', matchstr('Motörhead', '[[:print:]]\+')) let alnumchars = '' let alphachars = '' let backspacechar = '' let blankchars = '' let cntrlchars = '' let digitchars = '' let escapechar = '' let graphchars = '' let lowerchars = '' let printchars = '' let punctchars = '' let returnchar = '' let spacechars = '' let tabchar = '' let upperchars = '' let xdigitchars = '' let identchars = '' let identchars1 = '' let kwordchars = '' let kwordchars1 = '' let fnamechars = '' let fnamechars1 = '' let i = 1 while i <= 255 let c = nr2char(i) if c =~ '[[:alpha:]]' let alphachars .= c endif if c =~ '[[:alnum:]]' let alnumchars .= c endif if c =~ '[[:backspace:]]' let backspacechar .= c endif if c =~ '[[:blank:]]' let blankchars .= c endif if c =~ '[[:cntrl:]]' let cntrlchars .= c endif if c =~ '[[:digit:]]' let digitchars .= c endif if c =~ '[[:escape:]]' let escapechar .= c endif if c =~ '[[:graph:]]' let graphchars .= c endif if c =~ '[[:lower:]]' let lowerchars .= c endif if c =~ '[[:print:]]' let printchars .= c endif if c =~ '[[:punct:]]' let punctchars .= c endif if c =~ '[[:return:]]' let returnchar .= c endif if c =~ '[[:space:]]' let spacechars .= c endif if c =~ '[[:tab:]]' let tabchar .= c endif if c =~ '[[:upper:]]' let upperchars .= c endif if c =~ '[[:xdigit:]]' let xdigitchars .= c endif if c =~ '[[:ident:]]' let identchars .= c endif if c =~ '\i' let identchars1 .= c endif if c =~ '[[:keyword:]]' let kwordchars .= c endif if c =~ '\k' let kwordchars1 .= c endif if c =~ '[[:fname:]]' let fnamechars .= c endif if c =~ '\f' let fnamechars1 .= c endif let i += 1 endwhile call assert_equal('ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz', alphachars) call assert_equal('0123456789ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz', alnumchars) call assert_equal("\b", backspacechar) call assert_equal("\t ", blankchars) call assert_equal("\x01\x02\x03\x04\x05\x06\x07\b\t\n\x0b\f\r\x0e\x0f\x10\x11\x12\x13\x14\x15\x16\x17\x18\x19\x1a\e\x1c\x1d\x1e\x1f\x7f", cntrlchars) call assert_equal("0123456789", digitchars) call assert_equal("\<Esc>", escapechar) call assert_equal('!"#$%&''()*+,-./0123456789:;<=>?@ABCDEFGHIJKLMNOPQRSTUVWXYZ[\]^_`abcdefghijklmnopqrstuvwxyz{|}~', graphchars) call assert_equal('abcdefghijklmnopqrstuvwxyzµßàáâãäåæçèéêëìíîïðñòóôõöøùúûüýþÿ', lowerchars) call assert_equal(' !"#$%&''()*+,-./0123456789:;<=>?@ABCDEFGHIJKLMNOPQRSTUVWXYZ[\]^_`abcdefghijklmnopqrstuvwxyz{|}~ ¡¢£¤¥¦§¨©ª«¬®¯°±²³´µ¶·¸¹º»¼½¾¿ÀÁÂÃÄÅÆÇÈÉÊËÌÍÎÏÐÑÒÓÔÕÖ×ØÙÚÛÜÝÞßàáâãäåæçèéêëìíîïðñòóôõö÷øùúûüýþÿ', printchars) call assert_equal('!"#$%&''()*+,-./:;<=>?@[\]^_`{|}~', punctchars) call assert_equal('ABCDEFGHIJKLMNOPQRSTUVWXYZÀÁÂÃÄÅÆÇÈÉÊËÌÍÎÏÐÑÒÓÔÕÖØÙÚÛÜÝÞ', upperchars) call assert_equal("\r", returnchar) call assert_equal("\t\n\x0b\f\r ", spacechars) call assert_equal("\t", tabchar) call assert_equal('0123456789ABCDEFabcdef', xdigitchars) if has('win32') let identchars_ok = '0123456789ABCDEFGHIJKLMNOPQRSTUVWXYZ_abcdefghijklmnopqrstuvwxyz ¡¢£¤¥¦§µÀÁÂÃÄÅÆÇÈÉÊËÌÍÎÏÐÑÒÓÔÕÖØÙÚÛÜÝÞßàáâãäåæçèéêëìíîïðñòóôõöøùúûüýþÿ' let kwordchars_ok = '0123456789ABCDEFGHIJKLMNOPQRSTUVWXYZ_abcdefghijklmnopqrstuvwxyzµÀÁÂÃÄÅÆÇÈÉÊËÌÍÎÏÐÑÒÓÔÕÖ×ØÙÚÛÜÝÞßàáâãäåæçèéêëìíîïðñòóôõö÷øùúûüýþÿ' else let identchars_ok = '0123456789ABCDEFGHIJKLMNOPQRSTUVWXYZ_abcdefghijklmnopqrstuvwxyzµÀÁÂÃÄÅÆÇÈÉÊËÌÍÎÏÐÑÒÓÔÕÖ×ØÙÚÛÜÝÞßàáâãäåæçèéêëìíîïðñòóôõö÷øùúûüýþÿ' let kwordchars_ok = '0123456789ABCDEFGHIJKLMNOPQRSTUVWXYZ_abcdefghijklmnopqrstuvwxyzµÀÁÂÃÄÅÆÇÈÉÊËÌÍÎÏÐÑÒÓÔÕÖ×ØÙÚÛÜÝÞßàáâãäåæçèéêëìíîïðñòóôõö÷øùúûüýþÿ' endif if has('win32') let fnamechars_ok = '!#$%+,-./0123456789:=@ABCDEFGHIJKLMNOPQRSTUVWXYZ[\]_abcdefghijklmnopqrstuvwxyz{}~ ¡¢£¤¥¦§¨©ª«¬®¯°±²³´µ¶·¸¹º»¼½¾¿ÀÁÂÃÄÅÆÇÈÉÊËÌÍÎÏÐÑÒÓÔÕÖ×ØÙÚÛÜÝÞßàáâãäåæçèéêëìíîïðñòóôõö÷øùúûüýþÿ' elseif has('amiga') let fnamechars_ok = '$+,-./0123456789:ABCDEFGHIJKLMNOPQRSTUVWXYZ_abcdefghijklmnopqrstuvwxyz~ ¡¢£¤¥¦§¨©ª«¬®¯°±²³´µ¶·¸¹º»¼½¾¿ÀÁÂÃÄÅÆÇÈÉÊËÌÍÎÏÐÑÒÓÔÕÖ×ØÙÚÛÜÝÞßàáâãäåæçèéêëìíîïðñòóôõö÷øùúûüýþÿ' elseif has('vms') let fnamechars_ok = '#$%+,-./0123456789:;<>ABCDEFGHIJKLMNOPQRSTUVWXYZ[]_abcdefghijklmnopqrstuvwxyz~ ¡¢£¤¥¦§¨©ª«¬®¯°±²³´µ¶·¸¹º»¼½¾¿ÀÁÂÃÄÅÆÇÈÉÊËÌÍÎÏÐÑÒÓÔÕÖ×ØÙÚÛÜÝÞßàáâãäåæçèéêëìíîïðñòóôõö÷øùúûüýþÿ' else let fnamechars_ok = '#$%+,-./0123456789=ABCDEFGHIJKLMNOPQRSTUVWXYZ_abcdefghijklmnopqrstuvwxyz~ ¡¢£¤¥¦§¨©ª«¬®¯°±²³´µ¶·¸¹º»¼½¾¿ÀÁÂÃÄÅÆÇÈÉÊËÌÍÎÏÐÑÒÓÔÕÖ×ØÙÚÛÜÝÞßàáâãäåæçèéêëìíîïðñòóôõö÷øùúûüýþÿ' endif call assert_equal(identchars_ok, identchars) call assert_equal(kwordchars_ok, kwordchars) call assert_equal(fnamechars_ok, fnamechars) call assert_equal(identchars1, identchars) call assert_equal(kwordchars1, kwordchars) call assert_equal(fnamechars1, fnamechars) endfunc func Test_classes_re1() set re=1 call s:classes_test() set re=0 endfunc func Test_classes_re2() set re=2 call s:classes_test() set re=0 endfunc func Test_reversed_range() for re in range(0, 2) exe 'set re=' . re call assert_fails('call match("abc def", "[c-a]")', 'E944:', re) endfor set re=0 endfunc func Test_large_class() set re=1 call assert_fails('call match("abc def", "[\u3000-\u4000]")', 'E945:') set re=2 call assert_equal(0, 'abc def' =~# '[\u3000-\u4000]') call assert_equal(1, "\u3042" =~# '[\u3000-\u4000]') set re=0 endfunc func Test_optmatch_toolong() set re=1 " Can only handle about 8000 characters. let pat = '\\%[' .. repeat('x', 9000) .. ']' call assert_fails('call match("abc def", "' .. pat .. '")', 'E339:') set re=0 endfunc " Test for regexp patterns with multi-byte support, using utf-8. func Test_multibyte_chars() " tl is a List of Lists with: " 2: test auto/old/new 0: test auto/old 1: test auto/new " regexp pattern " text to test the pattern on " expected match (optional) " expected submatch 1 (optional) " expected submatch 2 (optional) " etc. " When there is no match use only the first two items. let tl = [] " Multi-byte character tests. call add(tl, [2, '[[:alpha:][=a=]]\+', '879 aiaãâaiuvna ', 'aiaãâaiuvna']) call add(tl, [2, '[[=a=]]\+', 'ddaãâbcd', 'aãâ']) " equivalence classes call add(tl, [2, '[^ม ]\+', 'มม oijasoifjos ifjoisj f osij j มมมมม abcd', 'oijasoifjos']) call add(tl, [2, ' [^ ]\+', 'start มabcdม ', ' มabcdม']) call add(tl, [2, '[ม[:alpha:][=a=]]\+', '879 aiaãมâมaiuvna ', 'aiaãมâมaiuvna']) " this is not a normal "i" but 0xec call add(tl, [2, '\p\+', 'ìa', 'ìa']) call add(tl, [2, '\p*', 'aあ', 'aあ']) " Test recognition of some character classes call add(tl, [2, '\i\+', '&*¨xx ', 'xx']) call add(tl, [2, '\f\+', '&*fname ', 'fname']) " Test composing character matching call add(tl, [2, '.ม', 'xม่x yมy', 'yม']) call add(tl, [2, '.ม่', 'xม่x yมy', 'xม่']) call add(tl, [2, "\u05b9", " x\u05b9 ", "x\u05b9"]) call add(tl, [2, ".\u05b9", " x\u05b9 ", "x\u05b9"]) call add(tl, [2, "\u05b9\u05bb", " x\u05b9\u05bb ", "x\u05b9\u05bb"]) call add(tl, [2, ".\u05b9\u05bb", " x\u05b9\u05bb ", "x\u05b9\u05bb"]) call add(tl, [2, "\u05bb\u05b9", " x\u05b9\u05bb ", "x\u05b9\u05bb"]) call add(tl, [2, ".\u05bb\u05b9", " x\u05b9\u05bb ", "x\u05b9\u05bb"]) call add(tl, [2, "\u05b9", " y\u05bb x\u05b9 ", "x\u05b9"]) call add(tl, [2, ".\u05b9", " y\u05bb x\u05b9 ", "x\u05b9"]) call add(tl, [2, "\u05b9", " y\u05bb\u05b9 x\u05b9 ", "y\u05bb\u05b9"]) call add(tl, [2, ".\u05b9", " y\u05bb\u05b9 x\u05b9 ", "y\u05bb\u05b9"]) call add(tl, [1, "\u05b9\u05bb", " y\u05b9 x\u05b9\u05bb ", "x\u05b9\u05bb"]) call add(tl, [2, ".\u05b9\u05bb", " y\u05bb x\u05b9\u05bb ", "x\u05b9\u05bb"]) call add(tl, [2, "a", "ca\u0300t"]) call add(tl, [2, "ca", "ca\u0300t"]) call add(tl, [2, "a\u0300", "ca\u0300t", "a\u0300"]) call add(tl, [2, 'a\%C', "ca\u0300t", "a\u0300"]) call add(tl, [2, 'ca\%C', "ca\u0300t", "ca\u0300"]) call add(tl, [2, 'ca\%Ct', "ca\u0300t", "ca\u0300t"]) " Test \Z call add(tl, [2, 'ú\Z', 'x']) call add(tl, [2, 'יהוה\Z', 'יהוה', 'יהוה']) call add(tl, [2, 'יְהוָה\Z', 'יהוה', 'יהוה']) call add(tl, [2, 'יהוה\Z', 'יְהוָה', 'יְהוָה']) call add(tl, [2, 'יְהוָה\Z', 'יְהוָה', 'יְהוָה']) call add(tl, [2, 'יְ\Z', 'וְיַ', 'יַ']) call add(tl, [2, "ק\u200d\u05b9x\\Z", "xק\u200d\u05b9xy", "ק\u200d\u05b9x"]) call add(tl, [2, "ק\u200d\u05b9x\\Z", "xק\u200dxy", "ק\u200dx"]) call add(tl, [2, "ק\u200dx\\Z", "xק\u200d\u05b9xy", "ק\u200d\u05b9x"]) call add(tl, [2, "ק\u200dx\\Z", "xק\u200dxy", "ק\u200dx"]) call add(tl, [2, "\u05b9\\Z", "xyz"]) call add(tl, [2, "\\Z\u05b9", "xyz"]) call add(tl, [2, "\u05b9\\Z", "xy\u05b9z", "y\u05b9"]) call add(tl, [2, "\\Z\u05b9", "xy\u05b9z", "y\u05b9"]) call add(tl, [1, "\u05b9\\+\\Z", "xy\u05b9z\u05b9 ", "y\u05b9z\u05b9"]) call add(tl, [1, "\\Z\u05b9\\+", "xy\u05b9z\u05b9 ", "y\u05b9z\u05b9"]) " Combining different tests and features call add(tl, [2, '[^[=a=]]\+', 'ddaãâbcd', 'dd']) " Run the tests for t in tl let re = t[0] let pat = t[1] let text = t[2] let matchidx = 3 for engine in [0, 1, 2] if engine == 2 && re == 0 || engine == 1 && re == 1 continue endif let ®expengine = engine try let l = matchlist(text, pat) catch call assert_report('Error ' . engine . ': pat: \"' . pat . \ '\", text: \"' . text . \ '\", caused an exception: \"' . v:exception . '\"') endtry " check the match itself if len(l) == 0 && len(t) > matchidx call assert_report('Error ' . engine . ': pat: \"' . pat . \ '\", text: \"' . text . \ '\", did not match, expected: \"' . t[matchidx] . '\"') elseif len(l) > 0 && len(t) == matchidx call assert_report('Error ' . engine . ': pat: \"' . pat . \ '\", text: \"' . text . '\", match: \"' . l[0] . \ '\", expected no match') elseif len(t) > matchidx && l[0] != t[matchidx] call assert_report('Error ' . engine . ': pat: \"' . pat . \ '\", text: \"' . text . '\", match: \"' . l[0] . \ '\", expected: \"' . t[matchidx] . '\"') else " Test passed endif if len(l) > 0 " check all the nine submatches for i in range(1, 9) if len(t) <= matchidx + i let e = '' else let e = t[matchidx + i] endif if l[i] != e call assert_report('Error ' . engine . ': pat: \"' . pat . \ '\", text: \"' . text . '\", submatch ' . i . \ ': \"' . l[i] . '\", expected: \"' . e . '\"') endif endfor unlet i endif endfor endfor set regexpengine& endfunc " check that 'ambiwidth' does not change the meaning of \p func Test_ambiwidth() set regexpengine=1 ambiwidth=single call assert_equal(0, match("\u00EC", '\p')) set regexpengine=1 ambiwidth=double call assert_equal(0, match("\u00EC", '\p')) set regexpengine=2 ambiwidth=single call assert_equal(0, match("\u00EC", '\p')) set regexpengine=2 ambiwidth=double call assert_equal(0, match("\u00EC", '\p')) set regexpengine& ambiwidth& endfunc func Run_regexp_ignore_case() call assert_equal('iIİ', substitute('iIİ', '\([iIİ]\)', '\1', 'g')) call assert_equal('iIx', substitute('iIİ', '\c\([İ]\)', 'x', 'g')) call assert_equal('xxİ', substitute('iIİ', '\(i\c\)', 'x', 'g')) call assert_equal('iIx', substitute('iIİ', '\(İ\c\)', 'x', 'g')) call assert_equal('iIx', substitute('iIİ', '\c\(\%u0130\)', 'x', 'g')) call assert_equal('iIx', substitute('iIİ', '\c\([\u0130]\)', 'x', 'g')) call assert_equal('iIx', substitute('iIİ', '\c\([\u012f-\u0131]\)', 'x', 'g')) endfunc func Test_regexp_ignore_case() set regexpengine=1 call Run_regexp_ignore_case() set regexpengine=2 call Run_regexp_ignore_case() set regexpengine& endfunc " Tests for regexp with multi-byte encoding and various magic settings func Run_regexp_multibyte_magic() let text =<< trim END 1 a aa abb abbccc 2 d dd dee deefff 3 g gg ghh ghhiii 4 j jj jkk jkklll 5 m mm mnn mnnooo 6 x ^aa$ x 7 (a)(b) abbaa 8 axx [ab]xx 9 หม่x อมx a อมx หม่x b ちカヨは c x ¬€x d 天使x e y f z g a啷bb j 0123❤x k combinations l äö üᾱ̆́ END new call setline(1, text) exe 'normal /a*b\{2}c\+/e' .. "\<CR>x" call assert_equal('1 a aa abb abbcc', getline('.')) exe 'normal /\Md\*e\{2}f\+/e' .. "\<CR>x" call assert_equal('2 d dd dee deeff', getline('.')) set nomagic exe 'normal /g\*h\{2}i\+/e' .. "\<CR>x" call assert_equal('3 g gg ghh ghhii', getline('.')) exe 'normal /\mj*k\{2}l\+/e' .. "\<CR>x" call assert_equal('4 j jj jkk jkkll', getline('.')) exe 'normal /\vm*n{2}o+/e' .. "\<CR>x" call assert_equal('5 m mm mnn mnnoo', getline('.')) exe 'normal /\V^aa$/' .. "\<CR>x" call assert_equal('6 x aa$ x', getline('.')) set magic exe 'normal /\v(a)(b)\2\1\1/e' .. "\<CR>x" call assert_equal('7 (a)(b) abba', getline('.')) exe 'normal /\V[ab]\(\[xy]\)\1' .. "\<CR>x" call assert_equal('8 axx ab]xx', getline('.')) " search for multi-byte without composing char exe 'normal /ม' .. "\<CR>x" call assert_equal('9 หม่x อx', getline('.')) " search for multi-byte with composing char exe 'normal /ม่' .. "\<CR>x" call assert_equal('a อมx หx', getline('.')) " find word by change of word class exe 'normal /ち\<カヨ\>は' .. "\<CR>x" call assert_equal('b カヨは', getline('.')) " Test \%u, [\u] and friends " c exe 'normal /\%u20ac' .. "\<CR>x" call assert_equal('c x ¬x', getline('.')) " d exe 'normal /[\u4f7f\u5929]\+' .. "\<CR>x" call assert_equal('d 使x', getline('.')) " e exe 'normal /\%U12345678' .. "\<CR>x" call assert_equal('e y', getline('.')) " f exe 'normal /[\U1234abcd\u1234\uabcd]' .. "\<CR>x" call assert_equal('f z', getline('.')) " g exe 'normal /\%d21879b' .. "\<CR>x" call assert_equal('g abb', getline('.')) " j Test backwards search from a multi-byte char exe "normal /x\<CR>x?.\<CR>x" call assert_equal('j 012❤', getline('.')) " k let @w=':%s#comb[i]nations#œ̄ṣ́m̥̄ᾱ̆́#g' @w call assert_equal('k œ̄ṣ́m̥̄ᾱ̆́', getline(18)) close! endfunc func Test_regexp_multibyte_magic() set regexpengine=1 call Run_regexp_multibyte_magic() set regexpengine=2 call Run_regexp_multibyte_magic() set regexpengine& endfunc " Test for 7.3.192 " command ":s/ \?/ /g" splits multi-byte characters into bytes func Test_split_multibyte_to_bytes() new call setline(1, 'l äö üᾱ̆́') s/ \?/ /g call assert_equal(' l ä ö ü ᾱ̆́', getline(1)) close! endfunc " Test for matchstr() with multibyte characters func Test_matchstr_multibyte() new call assert_equal('ב', matchstr("אבגד", ".", 0, 2)) call assert_equal('בג', matchstr("אבגד", "..", 0, 2)) call assert_equal('א', matchstr("אבגד", ".", 0, 0)) call assert_equal('ג', matchstr("אבגד", ".", 4, -1)) close! endfunc " Test for 7.4.636 " A search with end offset gets stuck at end of file. func Test_search_with_end_offset() new call setline(1, ['', 'dog(a', 'cat(']) exe "normal /(/e+\<CR>" normal n"ayn call assert_equal("a\ncat(", @a) close! endfunc " Check that "^" matches even when the line starts with a combining char func Test_match_start_of_line_combining() new call setline(1, ['', "\u05ae", '']) exe "normal gg/^\<CR>" call assert_equal(2, getcurpos()[1]) bwipe! endfunc " Check that [[:upper:]] matches for automatic engine func Test_match_char_class_upper() new " Test 1: [[:upper:]]\{2,\} set regexpengine=0 call setline(1, ['05. ПЕСНЯ О ГЕРОЯХ муз. А. Давиденко, М. Коваля и Б. Шехтера ...', '05. PJESNJA O GJEROJAKH mus. A. Davidjenko, M. Kovalja i B. Shjekhtjera ...']) call cursor(1,1) let search_cmd='norm /\<[[:upper:]]\{2,\}\>' .. "\<CR>" exe search_cmd call assert_equal(4, searchcount().total, 'TEST 1') set regexpengine=1 exe search_cmd call assert_equal(2, searchcount().total, 'TEST 1') set regexpengine=2 exe search_cmd call assert_equal(4, searchcount().total, 'TEST 1') " Test 2: [[:upper:]].\+ let search_cmd='norm /\<[[:upper:]].\+\>' .. "\<CR>" set regexpengine=0 exe search_cmd call assert_equal(2, searchcount().total, 'TEST 2') set regexpengine=1 exe search_cmd call assert_equal(1, searchcount().total, 'TEST 2') set regexpengine=2 exe search_cmd call assert_equal(2, searchcount().total, 'TEST 2') " Test 3: [[:lower:]]\+ let search_cmd='norm /\<[[:lower:]]\+\>' .. "\<CR>" set regexpengine=0 exe search_cmd call assert_equal(4, searchcount().total, 'TEST 3 lower') set regexpengine=1 exe search_cmd call assert_equal(2, searchcount().total, 'TEST 3 lower') set regexpengine=2 exe search_cmd call assert_equal(4, searchcount().total, 'TEST 3 lower') " clean up set regexpengine=0 bwipe! endfunc func Test_match_invalid_byte() call writefile(0z630a.765d30aa0a.2e0a.790a.4030, 'Xinvalid', 'D') new source Xinvalid bwipe! endfunc func Test_match_illegal_byte() " Text has illegal bytes which need to be set explicitly let lines = ["norm :set no\x01\<CR>", "silent n\xff", "silent norm :b\xff\<CR>"] call writefile(lines, 'Xregexp', 'D') call system(GetVimCommand() .. ' -X -Z -e -s -S Xregexp -c qa!') endfunc func Test_match_too_complicated() set regexpengine=1 exe "noswapfile vsplit \xeb\xdb\x99" silent! buf \&\zs*\zs*0 bwipe! set regexpengine=0 endfunc func Test_combining_chars_in_collection() new for i in range(0,2) exe "set re=".i put =['ɔ̃', 'ɔ', '̃ ã', 'abcd'] :%s/[ɔ̃]// call assert_equal(['', '', 'ɔ', '̃ ã', 'abcd'], getline(1,'$')) %d endfor bw! endfunc " vim: shiftwidth=2 sts=2 expandtab