patch 9.1.1645: fuzzy.c can be further improved
Problem: fuzzy.c can be further improved Solution: Fix memory leak and refactor it (glepnir). Optimize performance and memory allocation: - Fix memory leak in fuzzy_match_in_list. - using single memory allocation in match_positions - Improve has_match performance and add null pointer checks closes: #18012 Signed-off-by: glepnir <glephunter@gmail.com> Signed-off-by: Christian Brabandt <cb@256bit.org>
This commit is contained in:
		
				
					committed by
					
						 Christian Brabandt
						Christian Brabandt
					
				
			
			
				
	
			
			
			
						parent
						
							ce288c7fb0
						
					
				
				
					commit
					59799f3afa
				
			
							
								
								
									
										144
									
								
								src/fuzzy.c
									
									
									
									
									
								
							
							
						
						
									
										144
									
								
								src/fuzzy.c
									
									
									
									
									
								
							| @ -216,7 +216,7 @@ fuzzy_match_in_list( | |||||||
|     long	max_matches) |     long	max_matches) | ||||||
| { | { | ||||||
|     long	    len; |     long	    len; | ||||||
|     fuzzyItem_T	    *items; |     fuzzyItem_T	    *items = NULL; | ||||||
|     listitem_T	    *li; |     listitem_T	    *li; | ||||||
|     long	    match_count = 0; |     long	    match_count = 0; | ||||||
|     int_u	    matches[FUZZY_MATCH_MAX_LEN]; |     int_u	    matches[FUZZY_MATCH_MAX_LEN]; | ||||||
| @ -235,14 +235,15 @@ fuzzy_match_in_list( | |||||||
|     FOR_ALL_LIST_ITEMS(l, li) |     FOR_ALL_LIST_ITEMS(l, li) | ||||||
|     { |     { | ||||||
| 	int		score; | 	int		score; | ||||||
| 	char_u		*itemstr; | 	char_u		*itemstr = NULL; | ||||||
|  | 	char_u		*itemstr_copy = NULL; | ||||||
| 	typval_T	rettv; | 	typval_T	rettv; | ||||||
| 	int		itemstr_allocate = FALSE; | 	int		itemstr_allocate = FALSE; | ||||||
|  | 	list_T		*match_positions = NULL; | ||||||
|  |  | ||||||
| 	if (max_matches > 0 && match_count >= max_matches) | 	if (max_matches > 0 && match_count >= max_matches) | ||||||
| 	    break; | 	    break; | ||||||
|  |  | ||||||
| 	itemstr = NULL; |  | ||||||
| 	rettv.v_type = VAR_UNKNOWN; | 	rettv.v_type = VAR_UNKNOWN; | ||||||
| 	if (li->li_tv.v_type == VAR_STRING)	// list of strings | 	if (li->li_tv.v_type == VAR_STRING)	// list of strings | ||||||
| 	    itemstr = li->li_tv.vval.v_string; | 	    itemstr = li->li_tv.vval.v_string; | ||||||
| @ -279,34 +280,45 @@ fuzzy_match_in_list( | |||||||
| 		&& fuzzy_match(itemstr, str, matchseq, &score, matches, | 		&& fuzzy_match(itemstr, str, matchseq, &score, matches, | ||||||
| 						FUZZY_MATCH_MAX_LEN)) | 						FUZZY_MATCH_MAX_LEN)) | ||||||
| 	{ | 	{ | ||||||
| 	    items[match_count].idx = match_count; | 	    if (itemstr_allocate) | ||||||
| 	    items[match_count].item = li; | 	    { | ||||||
| 	    items[match_count].score = score; | 		itemstr_copy = vim_strsave(itemstr); | ||||||
| 	    items[match_count].pat = str; | 		if (itemstr_copy == NULL) | ||||||
| 	    items[match_count].startpos = matches[0]; | 		{ | ||||||
| 	    items[match_count].itemstr = itemstr_allocate | 		    clear_tv(&rettv); | ||||||
| 					    ? vim_strsave(itemstr) : itemstr; | 		    continue; | ||||||
| 	    items[match_count].itemstr_allocated = itemstr_allocate; | 		} | ||||||
|  | 	    } | ||||||
|  | 	    else | ||||||
|  | 		itemstr_copy = itemstr; | ||||||
|  |  | ||||||
| 	    // Copy the list of matching positions in itemstr to a list, if | 	    // Copy the list of matching positions in itemstr to a list, if | ||||||
| 	    // "retmatchpos" is set. | 	    // "retmatchpos" is set. | ||||||
| 	    if (retmatchpos) | 	    if (retmatchpos) | ||||||
| 	    { | 	    { | ||||||
|  | 		match_positions = list_alloc(); | ||||||
|  | 		if (match_positions == NULL) | ||||||
|  | 		{ | ||||||
|  | 		    if (itemstr_allocate && itemstr_copy) | ||||||
|  | 			vim_free(itemstr_copy); | ||||||
|  | 		    clear_tv(&rettv); | ||||||
|  | 		    continue; | ||||||
|  | 		} | ||||||
|  |  | ||||||
|  | 		// Fill position information | ||||||
| 		int	j = 0; | 		int	j = 0; | ||||||
| 		char_u	*p; | 		char_u	*p = str; | ||||||
|  | 		int	success = TRUE; | ||||||
|  |  | ||||||
| 		items[match_count].lmatchpos = list_alloc(); | 		while (*p != NUL && j < FUZZY_MATCH_MAX_LEN && success) | ||||||
| 		if (items[match_count].lmatchpos == NULL) |  | ||||||
| 		    goto done; |  | ||||||
|  |  | ||||||
| 		p = str; |  | ||||||
| 		while (*p != NUL && j < FUZZY_MATCH_MAX_LEN) |  | ||||||
| 		{ | 		{ | ||||||
| 		    if (!VIM_ISWHITE(PTR2CHAR(p)) || matchseq) | 		    if (!VIM_ISWHITE(PTR2CHAR(p)) || matchseq) | ||||||
| 		    { | 		    { | ||||||
| 			if (list_append_number(items[match_count].lmatchpos, | 			if (list_append_number(match_positions, matches[j]) == FAIL) | ||||||
| 				    matches[j]) == FAIL) | 			{ | ||||||
| 			    goto done; | 			    success = FALSE; | ||||||
|  | 			    break; | ||||||
|  | 			} | ||||||
| 			j++; | 			j++; | ||||||
| 		    } | 		    } | ||||||
| 		    if (has_mbyte) | 		    if (has_mbyte) | ||||||
| @ -314,7 +326,25 @@ fuzzy_match_in_list( | |||||||
| 		    else | 		    else | ||||||
| 			++p; | 			++p; | ||||||
| 		} | 		} | ||||||
|  |  | ||||||
|  | 		if (!success) | ||||||
|  | 		{ | ||||||
|  | 		    list_free(match_positions); | ||||||
|  | 		    if (itemstr_allocate && itemstr_copy) | ||||||
|  | 			vim_free(itemstr_copy); | ||||||
|  | 		    clear_tv(&rettv); | ||||||
|  | 		    continue; | ||||||
|  | 		} | ||||||
| 	    } | 	    } | ||||||
|  | 	    items[match_count].idx = match_count; | ||||||
|  | 	    items[match_count].item = li; | ||||||
|  | 	    items[match_count].score = score; | ||||||
|  | 	    items[match_count].pat = str; | ||||||
|  | 	    items[match_count].startpos = matches[0]; | ||||||
|  | 	    items[match_count].itemstr = itemstr_copy; | ||||||
|  | 	    items[match_count].itemstr_allocated = itemstr_allocate; | ||||||
|  | 	    items[match_count].lmatchpos = match_positions; | ||||||
|  |  | ||||||
| 	    ++match_count; | 	    ++match_count; | ||||||
| 	} | 	} | ||||||
| 	clear_tv(&rettv); | 	clear_tv(&rettv); | ||||||
| @ -888,8 +918,6 @@ fuzzymatches_to_strmatches( | |||||||
| 	int		count, | 	int		count, | ||||||
| 	int		funcsort) | 	int		funcsort) | ||||||
| { | { | ||||||
|     int		i; |  | ||||||
|  |  | ||||||
|     if (count <= 0) |     if (count <= 0) | ||||||
| 	goto theend; | 	goto theend; | ||||||
|  |  | ||||||
| @ -906,7 +934,7 @@ fuzzymatches_to_strmatches( | |||||||
|     else |     else | ||||||
| 	fuzzy_match_str_sort((void *)fuzmatch, (size_t)count); | 	fuzzy_match_str_sort((void *)fuzmatch, (size_t)count); | ||||||
|  |  | ||||||
|     for (i = 0; i < count; i++) |     for (int i = 0; i < count; i++) | ||||||
| 	(*matches)[i] = fuzmatch[i].str; | 	(*matches)[i] = fuzmatch[i].str; | ||||||
|  |  | ||||||
| theend: | theend: | ||||||
| @ -933,33 +961,36 @@ theend: | |||||||
|     static int |     static int | ||||||
| has_match(char_u *needle, char_u *haystack) | has_match(char_u *needle, char_u *haystack) | ||||||
| { | { | ||||||
|     while (*needle != NUL) |     if (!needle || !haystack || !*needle) | ||||||
|  | 	return FAIL; | ||||||
|  |  | ||||||
|  |     char_u *n_ptr = needle; | ||||||
|  |     char_u *h_ptr = haystack; | ||||||
|  |  | ||||||
|  |     while (*n_ptr) | ||||||
|     { |     { | ||||||
| 	int n_char = mb_ptr2char(needle); | 	int n_char = mb_ptr2char(n_ptr); | ||||||
| 	char_u *p = haystack; | 	int found = FALSE; | ||||||
| 	int h_char; |  | ||||||
| 	int matched = FALSE; |  | ||||||
|  |  | ||||||
| 	while (*p != NUL) | 	while (*h_ptr) | ||||||
| 	{ | 	{ | ||||||
| 	    h_char = mb_ptr2char(p); | 	    int h_char = mb_ptr2char(h_ptr); | ||||||
|  | 	    if (h_char == n_char || h_char == MB_TOUPPER(n_char)) | ||||||
| 	    if (n_char == h_char |  | ||||||
| 		    || MB_TOUPPER(n_char) == h_char) |  | ||||||
| 	    { | 	    { | ||||||
| 		matched = TRUE; | 		found = TRUE; | ||||||
|  | 		h_ptr += mb_ptr2len(h_ptr); | ||||||
| 		break; | 		break; | ||||||
| 	    } | 	    } | ||||||
| 	    p += mb_ptr2len(p); | 	    h_ptr += mb_ptr2len(h_ptr); | ||||||
| 	} | 	} | ||||||
|  |  | ||||||
| 	if (!matched) | 	if (!found) | ||||||
| 	    return 0; | 	    return FAIL; | ||||||
|  |  | ||||||
| 	needle += mb_ptr2len(needle); | 	n_ptr += mb_ptr2len(n_ptr); | ||||||
| 	haystack = p + mb_ptr2len(p); |  | ||||||
|     } |     } | ||||||
|     return 1; |  | ||||||
|  |     return OK; | ||||||
| } | } | ||||||
|  |  | ||||||
| typedef struct match_struct | typedef struct match_struct | ||||||
| @ -993,8 +1024,7 @@ compute_bonus_codepoint(int last_c, int c) | |||||||
| } | } | ||||||
|  |  | ||||||
|     static void |     static void | ||||||
| setup_match_struct(match_struct *match, char_u *needle, | setup_match_struct(match_struct *match, char_u *needle, char_u *haystack) | ||||||
| 	char_u *haystack) |  | ||||||
| { | { | ||||||
|     int i = 0; |     int i = 0; | ||||||
|     char_u *p = needle; |     char_u *p = needle; | ||||||
| @ -1073,7 +1103,7 @@ match_row(const match_struct *match, int row, score_t *curr_D, | |||||||
|     static score_t |     static score_t | ||||||
| match_positions(char_u *needle, char_u *haystack, int_u *positions) | match_positions(char_u *needle, char_u *haystack, int_u *positions) | ||||||
| { | { | ||||||
|     if (!*needle) |     if (!needle || !haystack || !*needle) | ||||||
| 	return SCORE_MIN; | 	return SCORE_MIN; | ||||||
|  |  | ||||||
|     match_struct match; |     match_struct match; | ||||||
| @ -1095,20 +1125,27 @@ match_positions(char_u *needle, char_u *haystack, int_u *positions) | |||||||
| 	// matches needle. If the lengths of the strings are equal the | 	// matches needle. If the lengths of the strings are equal the | ||||||
| 	// strings themselves must also be equal (ignoring case). | 	// strings themselves must also be equal (ignoring case). | ||||||
| 	if (positions) | 	if (positions) | ||||||
|  | 	{ | ||||||
| 	    for (int i = 0; i < n; i++) | 	    for (int i = 0; i < n; i++) | ||||||
| 		positions[i] = i; | 		positions[i] = i; | ||||||
|  | 	} | ||||||
| 	return SCORE_MAX; | 	return SCORE_MAX; | ||||||
|     } |     } | ||||||
|  |  | ||||||
|  |     // ensure n * MATCH_MAX_LEN * 2 won't overflow | ||||||
|  |     if ((size_t)n > (SIZE_MAX / sizeof(score_t)) / MATCH_MAX_LEN / 2) | ||||||
|  | 	return SCORE_MIN; | ||||||
|  |  | ||||||
|  |     // Allocate for both D and M matrices in one contiguous block | ||||||
|  |     score_t *block = (score_t*)alloc(sizeof(score_t) * MATCH_MAX_LEN * n * 2); | ||||||
|  |     if (!block) | ||||||
|  | 	return SCORE_MIN; | ||||||
|  |  | ||||||
|     // D[][] Stores the best score for this position ending with a match. |     // D[][] Stores the best score for this position ending with a match. | ||||||
|     // M[][] Stores the best possible score at this position. |     // M[][] Stores the best possible score at this position. | ||||||
|     score_t (*D)[MATCH_MAX_LEN], (*M)[MATCH_MAX_LEN]; |     score_t (*D)[MATCH_MAX_LEN] = (score_t(*)[MATCH_MAX_LEN])block; | ||||||
|     M = alloc(sizeof(score_t) * MATCH_MAX_LEN * n); |     score_t (*M)[MATCH_MAX_LEN] = (score_t(*)[MATCH_MAX_LEN])(block | ||||||
|     if (!M) | 							+ MATCH_MAX_LEN * n); | ||||||
| 	return SCORE_MIN; |  | ||||||
|     D = alloc(sizeof(score_t) * MATCH_MAX_LEN * n); |  | ||||||
|     if (!D) |  | ||||||
| 	return SCORE_MIN; |  | ||||||
|  |  | ||||||
|     match_row(&match, 0, D[0], M[0], D[0], M[0]); |     match_row(&match, 0, D[0], M[0], D[0], M[0]); | ||||||
|     for (int i = 1; i < n; i++) |     for (int i = 1; i < n; i++) | ||||||
| @ -1144,9 +1181,6 @@ match_positions(char_u *needle, char_u *haystack, int_u *positions) | |||||||
|     } |     } | ||||||
|  |  | ||||||
|     score_t result = M[n - 1][m - 1]; |     score_t result = M[n - 1][m - 1]; | ||||||
|  |     vim_free(block); | ||||||
|     vim_free(M); |  | ||||||
|     vim_free(D); |  | ||||||
|  |  | ||||||
|     return result; |     return result; | ||||||
| } | } | ||||||
|  | |||||||
| @ -719,6 +719,8 @@ static char *(features[]) = | |||||||
|  |  | ||||||
| static int included_patches[] = | static int included_patches[] = | ||||||
| {   /* Add new patch number below this line */ | {   /* Add new patch number below this line */ | ||||||
|  | /**/ | ||||||
|  |     1645, | ||||||
| /**/ | /**/ | ||||||
|     1644, |     1644, | ||||||
| /**/ | /**/ | ||||||
|  | |||||||
		Reference in New Issue
	
	Block a user