patch 9.1.1645: fuzzy.c can be further improved
Problem: fuzzy.c can be further improved Solution: Fix memory leak and refactor it (glepnir). Optimize performance and memory allocation: - Fix memory leak in fuzzy_match_in_list. - using single memory allocation in match_positions - Improve has_match performance and add null pointer checks closes: #18012 Signed-off-by: glepnir <glephunter@gmail.com> Signed-off-by: Christian Brabandt <cb@256bit.org>
This commit is contained in:
committed by
Christian Brabandt
parent
ce288c7fb0
commit
59799f3afa
144
src/fuzzy.c
144
src/fuzzy.c
@ -216,7 +216,7 @@ fuzzy_match_in_list(
|
||||
long max_matches)
|
||||
{
|
||||
long len;
|
||||
fuzzyItem_T *items;
|
||||
fuzzyItem_T *items = NULL;
|
||||
listitem_T *li;
|
||||
long match_count = 0;
|
||||
int_u matches[FUZZY_MATCH_MAX_LEN];
|
||||
@ -235,14 +235,15 @@ fuzzy_match_in_list(
|
||||
FOR_ALL_LIST_ITEMS(l, li)
|
||||
{
|
||||
int score;
|
||||
char_u *itemstr;
|
||||
char_u *itemstr = NULL;
|
||||
char_u *itemstr_copy = NULL;
|
||||
typval_T rettv;
|
||||
int itemstr_allocate = FALSE;
|
||||
list_T *match_positions = NULL;
|
||||
|
||||
if (max_matches > 0 && match_count >= max_matches)
|
||||
break;
|
||||
|
||||
itemstr = NULL;
|
||||
rettv.v_type = VAR_UNKNOWN;
|
||||
if (li->li_tv.v_type == VAR_STRING) // list of strings
|
||||
itemstr = li->li_tv.vval.v_string;
|
||||
@ -279,34 +280,45 @@ fuzzy_match_in_list(
|
||||
&& fuzzy_match(itemstr, str, matchseq, &score, matches,
|
||||
FUZZY_MATCH_MAX_LEN))
|
||||
{
|
||||
items[match_count].idx = match_count;
|
||||
items[match_count].item = li;
|
||||
items[match_count].score = score;
|
||||
items[match_count].pat = str;
|
||||
items[match_count].startpos = matches[0];
|
||||
items[match_count].itemstr = itemstr_allocate
|
||||
? vim_strsave(itemstr) : itemstr;
|
||||
items[match_count].itemstr_allocated = itemstr_allocate;
|
||||
if (itemstr_allocate)
|
||||
{
|
||||
itemstr_copy = vim_strsave(itemstr);
|
||||
if (itemstr_copy == NULL)
|
||||
{
|
||||
clear_tv(&rettv);
|
||||
continue;
|
||||
}
|
||||
}
|
||||
else
|
||||
itemstr_copy = itemstr;
|
||||
|
||||
// Copy the list of matching positions in itemstr to a list, if
|
||||
// "retmatchpos" is set.
|
||||
if (retmatchpos)
|
||||
{
|
||||
match_positions = list_alloc();
|
||||
if (match_positions == NULL)
|
||||
{
|
||||
if (itemstr_allocate && itemstr_copy)
|
||||
vim_free(itemstr_copy);
|
||||
clear_tv(&rettv);
|
||||
continue;
|
||||
}
|
||||
|
||||
// Fill position information
|
||||
int j = 0;
|
||||
char_u *p;
|
||||
char_u *p = str;
|
||||
int success = TRUE;
|
||||
|
||||
items[match_count].lmatchpos = list_alloc();
|
||||
if (items[match_count].lmatchpos == NULL)
|
||||
goto done;
|
||||
|
||||
p = str;
|
||||
while (*p != NUL && j < FUZZY_MATCH_MAX_LEN)
|
||||
while (*p != NUL && j < FUZZY_MATCH_MAX_LEN && success)
|
||||
{
|
||||
if (!VIM_ISWHITE(PTR2CHAR(p)) || matchseq)
|
||||
{
|
||||
if (list_append_number(items[match_count].lmatchpos,
|
||||
matches[j]) == FAIL)
|
||||
goto done;
|
||||
if (list_append_number(match_positions, matches[j]) == FAIL)
|
||||
{
|
||||
success = FALSE;
|
||||
break;
|
||||
}
|
||||
j++;
|
||||
}
|
||||
if (has_mbyte)
|
||||
@ -314,7 +326,25 @@ fuzzy_match_in_list(
|
||||
else
|
||||
++p;
|
||||
}
|
||||
|
||||
if (!success)
|
||||
{
|
||||
list_free(match_positions);
|
||||
if (itemstr_allocate && itemstr_copy)
|
||||
vim_free(itemstr_copy);
|
||||
clear_tv(&rettv);
|
||||
continue;
|
||||
}
|
||||
}
|
||||
items[match_count].idx = match_count;
|
||||
items[match_count].item = li;
|
||||
items[match_count].score = score;
|
||||
items[match_count].pat = str;
|
||||
items[match_count].startpos = matches[0];
|
||||
items[match_count].itemstr = itemstr_copy;
|
||||
items[match_count].itemstr_allocated = itemstr_allocate;
|
||||
items[match_count].lmatchpos = match_positions;
|
||||
|
||||
++match_count;
|
||||
}
|
||||
clear_tv(&rettv);
|
||||
@ -888,8 +918,6 @@ fuzzymatches_to_strmatches(
|
||||
int count,
|
||||
int funcsort)
|
||||
{
|
||||
int i;
|
||||
|
||||
if (count <= 0)
|
||||
goto theend;
|
||||
|
||||
@ -906,7 +934,7 @@ fuzzymatches_to_strmatches(
|
||||
else
|
||||
fuzzy_match_str_sort((void *)fuzmatch, (size_t)count);
|
||||
|
||||
for (i = 0; i < count; i++)
|
||||
for (int i = 0; i < count; i++)
|
||||
(*matches)[i] = fuzmatch[i].str;
|
||||
|
||||
theend:
|
||||
@ -933,33 +961,36 @@ theend:
|
||||
static int
|
||||
has_match(char_u *needle, char_u *haystack)
|
||||
{
|
||||
while (*needle != NUL)
|
||||
if (!needle || !haystack || !*needle)
|
||||
return FAIL;
|
||||
|
||||
char_u *n_ptr = needle;
|
||||
char_u *h_ptr = haystack;
|
||||
|
||||
while (*n_ptr)
|
||||
{
|
||||
int n_char = mb_ptr2char(needle);
|
||||
char_u *p = haystack;
|
||||
int h_char;
|
||||
int matched = FALSE;
|
||||
int n_char = mb_ptr2char(n_ptr);
|
||||
int found = FALSE;
|
||||
|
||||
while (*p != NUL)
|
||||
while (*h_ptr)
|
||||
{
|
||||
h_char = mb_ptr2char(p);
|
||||
|
||||
if (n_char == h_char
|
||||
|| MB_TOUPPER(n_char) == h_char)
|
||||
int h_char = mb_ptr2char(h_ptr);
|
||||
if (h_char == n_char || h_char == MB_TOUPPER(n_char))
|
||||
{
|
||||
matched = TRUE;
|
||||
found = TRUE;
|
||||
h_ptr += mb_ptr2len(h_ptr);
|
||||
break;
|
||||
}
|
||||
p += mb_ptr2len(p);
|
||||
h_ptr += mb_ptr2len(h_ptr);
|
||||
}
|
||||
|
||||
if (!matched)
|
||||
return 0;
|
||||
if (!found)
|
||||
return FAIL;
|
||||
|
||||
needle += mb_ptr2len(needle);
|
||||
haystack = p + mb_ptr2len(p);
|
||||
n_ptr += mb_ptr2len(n_ptr);
|
||||
}
|
||||
return 1;
|
||||
|
||||
return OK;
|
||||
}
|
||||
|
||||
typedef struct match_struct
|
||||
@ -993,8 +1024,7 @@ compute_bonus_codepoint(int last_c, int c)
|
||||
}
|
||||
|
||||
static void
|
||||
setup_match_struct(match_struct *match, char_u *needle,
|
||||
char_u *haystack)
|
||||
setup_match_struct(match_struct *match, char_u *needle, char_u *haystack)
|
||||
{
|
||||
int i = 0;
|
||||
char_u *p = needle;
|
||||
@ -1073,7 +1103,7 @@ match_row(const match_struct *match, int row, score_t *curr_D,
|
||||
static score_t
|
||||
match_positions(char_u *needle, char_u *haystack, int_u *positions)
|
||||
{
|
||||
if (!*needle)
|
||||
if (!needle || !haystack || !*needle)
|
||||
return SCORE_MIN;
|
||||
|
||||
match_struct match;
|
||||
@ -1095,20 +1125,27 @@ match_positions(char_u *needle, char_u *haystack, int_u *positions)
|
||||
// matches needle. If the lengths of the strings are equal the
|
||||
// strings themselves must also be equal (ignoring case).
|
||||
if (positions)
|
||||
{
|
||||
for (int i = 0; i < n; i++)
|
||||
positions[i] = i;
|
||||
}
|
||||
return SCORE_MAX;
|
||||
}
|
||||
|
||||
// ensure n * MATCH_MAX_LEN * 2 won't overflow
|
||||
if ((size_t)n > (SIZE_MAX / sizeof(score_t)) / MATCH_MAX_LEN / 2)
|
||||
return SCORE_MIN;
|
||||
|
||||
// Allocate for both D and M matrices in one contiguous block
|
||||
score_t *block = (score_t*)alloc(sizeof(score_t) * MATCH_MAX_LEN * n * 2);
|
||||
if (!block)
|
||||
return SCORE_MIN;
|
||||
|
||||
// D[][] Stores the best score for this position ending with a match.
|
||||
// M[][] Stores the best possible score at this position.
|
||||
score_t (*D)[MATCH_MAX_LEN], (*M)[MATCH_MAX_LEN];
|
||||
M = alloc(sizeof(score_t) * MATCH_MAX_LEN * n);
|
||||
if (!M)
|
||||
return SCORE_MIN;
|
||||
D = alloc(sizeof(score_t) * MATCH_MAX_LEN * n);
|
||||
if (!D)
|
||||
return SCORE_MIN;
|
||||
score_t (*D)[MATCH_MAX_LEN] = (score_t(*)[MATCH_MAX_LEN])block;
|
||||
score_t (*M)[MATCH_MAX_LEN] = (score_t(*)[MATCH_MAX_LEN])(block
|
||||
+ MATCH_MAX_LEN * n);
|
||||
|
||||
match_row(&match, 0, D[0], M[0], D[0], M[0]);
|
||||
for (int i = 1; i < n; i++)
|
||||
@ -1144,9 +1181,6 @@ match_positions(char_u *needle, char_u *haystack, int_u *positions)
|
||||
}
|
||||
|
||||
score_t result = M[n - 1][m - 1];
|
||||
|
||||
vim_free(M);
|
||||
vim_free(D);
|
||||
|
||||
vim_free(block);
|
||||
return result;
|
||||
}
|
||||
|
||||
@ -719,6 +719,8 @@ static char *(features[]) =
|
||||
|
||||
static int included_patches[] =
|
||||
{ /* Add new patch number below this line */
|
||||
/**/
|
||||
1645,
|
||||
/**/
|
||||
1644,
|
||||
/**/
|
||||
|
||||
Reference in New Issue
Block a user