Mercurial > vim
view src/testdir/test_utf8.vim @ 33811:06219b3bdaf3 v9.0.2121
patch 9.0.2121: [security]: use-after-free in ex_substitute
Commit: https://github.com/vim/vim/commit/26c11c56888d01e298cd8044caf860f3c26f57bb
Author: Christian Brabandt <cb@256bit.org>
Date: Wed Nov 22 21:26:41 2023 +0100
patch 9.0.2121: [security]: use-after-free in ex_substitute
Problem: [security]: use-after-free in ex_substitute
Solution: always allocate memory
closes: #13552
A recursive :substitute command could cause a heap-use-after-free in Vim
(CVE-2023-48706).
The whole reproducible test is a bit tricky, I can only reproduce this
reliably when no previous substitution command has been used yet
(which is the reason the test needs to run as the first one in the
test_substitute.vim file) and as a combination of the `:~` command
together with a :s command that contains the special substitution atom `~\=`
which will make use of a sub-replace special atom and calls a vim script
function.
There was a comment in the existing :s code, that already makes the
`sub` variable allocate memory so that a recursive :s call won't be able
to cause any issues here, so this was known as a potential problem
already. But for the current test-case that one does not work, because
the substitution does not start with `\=` but with `~\=`, and since
there does not yet exist a previous substitution atom, Vim will simply
increment the `sub` pointer (which then was not allocated dynamically)
and later on happily use a sub-replace special expression (which could
then free the `sub` var).
The following commit fixes this by making the sub var always use
allocated memory, which also means we need to free the pointer whenever
we leave the function. Since sub is now always an allocated variable,
we no longer need the sub_copy variable, since this one
was used to indicate when sub pointed to allocated memory (and had
therefore to be freed on exit) and when not.
Github Security Advisory:
https://github.com/vim/vim/security/advisories/GHSA-c8qm-x72m-q53q
Signed-off-by: Christian Brabandt <cb@256bit.org>
author | Christian Brabandt <cb@256bit.org> |
---|---|
date | Wed, 22 Nov 2023 22:15:05 +0100 |
parents | 695b50472e85 |
children | f8f45612de4e |
line wrap: on
line source
" Tests for Unicode manipulations

source check.vim
source view_util.vim
source screendump.vim

" Visual block Insert adjusts for multi-byte char
func Test_visual_block_insert()
  new
  call setline(1, ["aaa", "あああ", "bbb"])
  " Select a blockwise column over all three lines starting at the second
  " byte column, then insert "x" in front of the block.
  exe ":norm! gg0l\<C-V>jjIx\<Esc>"
  call assert_equal(['axaa', ' xあああ', 'bxbb'], getline(1, '$'))
  bwipeout!
endfunc

" Test for built-in functions strchars() and strcharlen()
func Test_strchars()
  let inp = ["a", "あいa", "A\u20dd", "A\u20dd\u20dd", "\u20dd"]
  " Per input: expected strchars() result without the second argument, with
  " the second argument 0 and with the second argument 1.
  let exp = [[1, 1, 1], [3, 3, 3], [2, 2, 1], [3, 3, 1], [1, 1, 1]]
  for i in range(len(inp))
    call assert_equal(exp[i][0], strchars(inp[i]))
    call assert_equal(exp[i][1], inp[i]->strchars(0))
    call assert_equal(exp[i][2], strchars(inp[i], 1))
  endfor

  " Expected strcharlen() result per input, checked with both the method
  " call syntax and the plain function call syntax.
  let exp = [1, 3, 1, 1, 1]
  for i in range(len(inp))
    call assert_equal(exp[i], inp[i]->strcharlen())
    call assert_equal(exp[i], strcharlen(inp[i]))
  endfor

  " Invalid values for the second argument must be rejected.
  call assert_fails("call strchars('abc', 2)", ['E1023:', 'E1023:'])
  call assert_fails("call strchars('abc', -1)", ['E1023:', 'E1023:'])
  call assert_fails("call strchars('abc', {})", ['E728:', 'E728:'])
  call assert_fails("call strchars('abc', [])", ['E745:', 'E745:'])
endfunc

" Test for customlist completion
func CustomComplete1(lead, line, pos)
  return ['あ', 'い']
endfunc

func CustomComplete2(lead, line, pos)
  return ['あたし', 'あたま', 'あたりめ']
endfunc

func CustomComplete3(lead, line, pos)
  return ['Nこ', 'Nん', 'Nぶ']
endfunc

" For each completion function: define a user command using it, press CTRL-L
" on the command line, turn the line into a comment (CTRL-B followed by a
" double quote) and check what ended up in the ":" register.
func Test_customlist_completion()
  command -nargs=1 -complete=customlist,CustomComplete1 Test1 echo
  call feedkeys(":Test1 \<C-L>\<C-B>\"\<CR>", 'itx')
  call assert_equal('"Test1 ', getreg(':'))

  command -nargs=1 -complete=customlist,CustomComplete2 Test2 echo
  call feedkeys(":Test2 \<C-L>\<C-B>\"\<CR>", 'itx')
  call assert_equal('"Test2 あた', getreg(':'))

  command -nargs=1 -complete=customlist,CustomComplete3 Test3 echo
  call feedkeys(":Test3 \<C-L>\<C-B>\"\<CR>", 'itx')
  call assert_equal('"Test3 N', getreg(':'))

  call garbagecollect(1)

  " Remove the user commands again: they are defined without "!", so leaving
  " them behind would make a second call of this function fail with E174 and
  " would leak them into the tests that follow.
  delcommand Test1
  delcommand Test2
  delcommand Test3
endfunc

" Yank one 3 byte character and check the mark columns.
func Test_getvcol()
  new
  call setline(1, "x\u2500x")
  normal 0lvy
  " The yanked character starts at byte column 2 and ends at byte column 4,
  " but occupies a single virtual column.
  call assert_equal(2, col("'["))
  call assert_equal(4, col("']"))
  call assert_equal(2, virtcol("'["))
  call assert_equal(2, virtcol("']"))
  " Wipe the scratch buffer so the window opened by :new does not leak into
  " the tests that follow.
  bwipe!
endfunc

" Test str2list() and list2str() with the utf8 argument set.
func Test_list2str_str2list_utf8()
  " One Unicode codepoint
  let s = "\u3042\u3044"
  let l = [0x3042, 0x3044]
  call assert_equal(l, str2list(s, 1))
  call assert_equal(s, list2str(l, 1))
  if &enc ==# 'utf-8'
    call assert_equal(str2list(s), str2list(s, 1))
    call assert_equal(list2str(l), list2str(l, 1))
  endif

  " With composing characters
  let s = "\u304b\u3099\u3044"
  let l = [0x304b, 0x3099, 0x3044]
  call assert_equal(l, str2list(s, 1))
  call assert_equal(s, l->list2str(1))
  if &enc ==# 'utf-8'
    call assert_equal(str2list(s), str2list(s, 1))
    call assert_equal(list2str(l), list2str(l, 1))
  endif

  " Null list is the same as an empty list
  call assert_equal('', list2str([]))
  call assert_equal('', list2str(test_null_list()))
endfunc

func Test_list2str_str2list_latin1()
  " When 'encoding' is not multi-byte can still get utf-8 string.
  " But we need to create the utf-8 string while 'encoding' is utf-8.
  let s = "\u3042\u3044"
  let l = [0x3042, 0x3044]

  let save_encoding = &encoding
  set encoding=latin1

  let lres = str2list(s, 1)
  let sres = list2str(l, 1)
  call assert_equal([65, 66, 67], str2list("ABC"))

  " Try converting a list to a string in latin-1 encoding
  call assert_equal([1, 2, 3], str2list(list2str([1, 2, 3])))

  " Restore 'encoding' before comparing the results obtained under latin1
  " with the values created above.
  let &encoding = save_encoding
  call assert_equal(l, lres)
  call assert_equal(s, sres)
endfunc

" Test screenchars() and screenstring() with composing and double-width
" characters.
func Test_screenchar_utf8()
  new

  " 1-cell, with composing characters
  call setline(1, ["ABC\u0308"])
  redraw
  call assert_equal([0x0041], screenchars(1, 1))
  call assert_equal([0x0042], 1->screenchars(2))
  call assert_equal([0x0043, 0x0308], screenchars(1, 3))
  call assert_equal("A", screenstring(1, 1))
  call assert_equal("B", screenstring(1, 2))
  call assert_equal("C\u0308", screenstring(1, 3))

  " 1-cell, with 6 composing characters
  set maxcombine=6
  call setline(1, ["ABC" .. repeat("\u0308", 6)])
  redraw
  call assert_equal([0x0041], screenchars(1, 1))
  call assert_equal([0x0042], 1->screenchars(2))
  " This should not use uninitialized memory
  call assert_equal([0x0043] + repeat([0x0308], 6), screenchars(1, 3))
  call assert_equal("A", screenstring(1, 1))
  call assert_equal("B", screenstring(1, 2))
  call assert_equal("C" .. repeat("\u0308", 6), screenstring(1, 3))
  set maxcombine&

  " 2-cells, with composing characters
  let text = "\u3042\u3044\u3046\u3099"
  call setline(1, text)
  redraw
  call assert_equal([0x3042], screenchars(1, 1))
  call assert_equal([0], screenchars(1, 2))
  call assert_equal([0x3044], screenchars(1, 3))
  call assert_equal([0], screenchars(1, 4))
  call assert_equal([0x3046, 0x3099], screenchars(1, 5))

  call assert_equal("\u3042", screenstring(1, 1))
  call assert_equal("", screenstring(1, 2))
  call assert_equal("\u3044", screenstring(1, 3))
  call assert_equal("", screenstring(1, 4))
  call assert_equal("\u3046\u3099", screenstring(1, 5))

  " The three double-width characters fill screen cells 1-6, so the 8 cells
  " requested here end in two blank cells.
  call assert_equal([text . '  '], ScreenLines(1, 8))

  bwipe!
endfunc

" Test setcellwidths(): overriding character widths, interaction with
" 'ambiwidth' and 'isprint', and the errors for invalid arguments.
func Test_setcellwidths()
  call setcellwidths([
        \ [0x1330, 0x1330, 2],
        \ [9999, 10000, 1],
        \ [0x1337, 0x1339, 2],
        \])

  call assert_equal(2, strwidth("\u1330"))
  call assert_equal(1, strwidth("\u1336"))
  call assert_equal(2, strwidth("\u1337"))
  call assert_equal(2, strwidth("\u1339"))
  call assert_equal(1, strwidth("\u133a"))

  for aw in ['single', 'double']
    exe 'set ambiwidth=' . aw
    " Handle \u0080 to \u009F as control chars even on MS-Windows.
    set isprint=@,161-255

    call setcellwidths([])
    " Control chars
    call assert_equal(4, strwidth("\u0081"))
    call assert_equal(6, strwidth("\uFEFF"))
    " Ambiguous width chars
    call assert_equal((aw == 'single') ? 1 : 2, strwidth("\u00A1"))
    call assert_equal((aw == 'single') ? 1 : 2, strwidth("\u2010"))

    call setcellwidths([[0x81, 0x81, 1], [0xA1, 0xA1, 1],
          \ [0x2010, 0x2010, 1], [0xFEFF, 0xFEFF, 1]])
    " Control chars
    call assert_equal(4, strwidth("\u0081"))
    call assert_equal(6, strwidth("\uFEFF"))
    " Ambiguous width chars
    call assert_equal(1, strwidth("\u00A1"))
    call assert_equal(1, strwidth("\u2010"))

    call setcellwidths([[0x81, 0x81, 2], [0xA1, 0xA1, 2],
          \ [0x2010, 0x2010, 2], [0xFEFF, 0xFEFF, 2]])
    " Control chars
    call assert_equal(4, strwidth("\u0081"))
    call assert_equal(6, strwidth("\uFEFF"))
    " Ambiguous width chars
    call assert_equal(2, strwidth("\u00A1"))
    call assert_equal(2, strwidth("\u2010"))
  endfor
  set ambiwidth& isprint&

  call setcellwidths([])

  " Invalid arguments
  call assert_fails('call setcellwidths(1)', 'E1211:')

  call assert_fails('call setcellwidths([1, 2, 0])', 'E1109:')

  call assert_fails('call setcellwidths([[0x101]])', 'E1110:')
  call assert_fails('call setcellwidths([[0x101, 0x102]])', 'E1110:')
  call assert_fails('call setcellwidths([[0x101, 0x102, 1, 4]])', 'E1110:')
  call assert_fails('call setcellwidths([["a"]])', 'E1110:')

  call assert_fails('call setcellwidths([[0x102, 0x101, 1]])', 'E1111:')

  call assert_fails('call setcellwidths([[0x101, 0x102, 0]])', 'E1112:')
  call assert_fails('call setcellwidths([[0x101, 0x102, 3]])', 'E1112:')

  call assert_fails('call setcellwidths([[0x111, 0x122, 1], [0x115, 0x116, 2]])', 'E1113:')
  call assert_fails('call setcellwidths([[0x111, 0x122, 1], [0x122, 0x123, 2]])', 'E1113:')

  call assert_fails('call setcellwidths([[0x33, 0x44, 2]])', 'E1114:')

  " A character used in 'listchars' or 'fillchars' cannot be made double-width.
  set listchars=tab:--\\u2192
  call assert_fails('call setcellwidths([[0x2192, 0x2192, 2]])', 'E834:')

  set fillchars=stl:\\u2501
  call assert_fails('call setcellwidths([[0x2501, 0x2501, 2]])', 'E835:')

  set listchars&
  set fillchars&
  call setcellwidths([])
endfunc

" Test that getcellwidths() returns the list passed to setcellwidths(), in
" sorted order.
func Test_getcellwidths()
  call setcellwidths([])
  call assert_equal([], getcellwidths())

  let widthlist = [
        \ [0x1330, 0x1330, 2],
        \ [9999, 10000, 1],
        \ [0x1337, 0x1339, 2],
        \]
  let widthlistsorted = [
        \ [0x1330, 0x1330, 2],
        \ [0x1337, 0x1339, 2],
        \ [9999, 10000, 1],
        \]
  call setcellwidths(widthlist)
  call assert_equal(widthlistsorted, getcellwidths())

  call setcellwidths([])
endfunc

" Compare screen dumps taken before and after calling setcellwidths() in a
" Vim running in a terminal window.
func Test_setcellwidths_dump()
  CheckRunVimInTerminal

  let lines =<< trim END
      call setline(1, "\ue5ffDesktop")
  END
  call writefile(lines, 'XCellwidths', 'D')
  let buf = RunVimInTerminal('-S XCellwidths', {'rows': 6})
  call VerifyScreenDump(buf, 'Test_setcellwidths_dump_1', {})

  call term_sendkeys(buf, ":call setcellwidths([[0xe5ff, 0xe5ff, 2]])\<CR>")
  call VerifyScreenDump(buf, 'Test_setcellwidths_dump_2', {})

  call StopVimInTerminal(buf)
endfunc

func Test_print_overlong()
  " Text with more composing characters than MB_MAXBYTES.
  new
  call setline(1, 'axxxxxxxxxxxxxxxxxxxxxxxxxxxxxx')
  s/x/\=nr2char(1629)/g
  print
  bwipe!
endfunc

func Test_recording_with_select_mode_utf8()
  call Run_test_recording_with_select_mode_utf8()
endfunc

" Record a macro that replaces the line in Select mode with a multi-byte
" character, then check the line, the recorded register and the result of
" replaying the register.
func Run_test_recording_with_select_mode_utf8()
  new

  " No escaping
  call feedkeys("qacc12345\<Esc>gH哦\<Esc>q", "tx")
  call assert_equal("哦", getline(1))
  call assert_equal("cc12345\<Esc>gH哦\<Esc>", @a)
  call setline(1, 'asdf')
  normal! @a
  call assert_equal("哦", getline(1))

  " 固 is 0xE5 0x9B 0xBA where 0x9B is CSI
  call feedkeys("qacc12345\<Esc>gH固\<Esc>q", "tx")
  call assert_equal("固", getline(1))
  call assert_equal("cc12345\<Esc>gH固\<Esc>", @a)
  call setline(1, 'asdf')
  normal! @a
  call assert_equal("固", getline(1))

  " 四 is 0xE5 0x9B 0x9B where 0x9B is CSI
  call feedkeys("qacc12345\<Esc>gH四\<Esc>q", "tx")
  call assert_equal("四", getline(1))
  call assert_equal("cc12345\<Esc>gH四\<Esc>", @a)
  call setline(1, 'asdf')
  normal! @a
  call assert_equal("四", getline(1))

  " 倒 is 0xE5 0x80 0x92 where 0x80 is K_SPECIAL
  call feedkeys("qacc12345\<Esc>gH倒\<Esc>q", "tx")
  call assert_equal("倒", getline(1))
  call assert_equal("cc12345\<Esc>gH倒\<Esc>", @a)
  call setline(1, 'asdf')
  normal! @a
  call assert_equal("倒", getline(1))

  bwipe!
endfunc

" This must be done as one of the last tests, because it starts the GUI, which
" cannot be undone.
func Test_zz_recording_with_select_mode_utf8_gui()
  CheckCanRunGui

  gui -f
  call Run_test_recording_with_select_mode_utf8()
endfunc

" vim: shiftwidth=2 sts=2 expandtab