mirror of
				https://github.com/vim/vim.git
				synced 2025-10-26 09:14:23 -04:00 
			
		
		
		
	patch 9.0.1629: having utf16idx() rounding up is inconvenient
Problem: Having utf16idx() rounding up is inconvenient. Solution: Make utf16idx() round down. (Yegappan Lakshmanan, closes #12523)
This commit is contained in:
		
				
					committed by
					
						 Bram Moolenaar
						Bram Moolenaar
					
				
			
			
				
	
			
			
			
						parent
						
							d5b952a871
						
					
				
				
					commit
					95707037af
				
			| @@ -10127,8 +10127,8 @@ utf16idx({string}, {idx} [, {countcc} [, {charidx}]]) | |||||||
| 		When {charidx} is present and TRUE, {idx} is used as the | 		When {charidx} is present and TRUE, {idx} is used as the | ||||||
| 		character index in the String {string} instead of as the byte | 		character index in the String {string} instead of as the byte | ||||||
| 		index. | 		index. | ||||||
| 		An {idx} in the middle of a UTF-8 sequence is rounded upwards | 		An {idx} in the middle of a UTF-8 sequence is rounded | ||||||
| 		to the end of that sequence. | 		downwards to the beginning of that sequence. | ||||||
|  |  | ||||||
| 		Returns -1 if the arguments are invalid or if there are less | 		Returns -1 if the arguments are invalid or if there are less | ||||||
| 		than {idx} bytes in {string}. If there are exactly {idx} bytes | 		than {idx} bytes in {string}. If there are exactly {idx} bytes | ||||||
|   | |||||||
| @@ -1743,8 +1743,10 @@ f_strtrans(typval_T *argvars, typval_T *rettv) | |||||||
|  |  | ||||||
|  |  | ||||||
| /* | /* | ||||||
|  * |  | ||||||
|  * "utf16idx()" function |  * "utf16idx()" function | ||||||
|  |  * | ||||||
|  |  * Converts a byte or character offset in a string to the corresponding UTF-16 | ||||||
|  |  * code unit offset. | ||||||
|  */ |  */ | ||||||
|     void |     void | ||||||
| f_utf16idx(typval_T *argvars, typval_T *rettv) | f_utf16idx(typval_T *argvars, typval_T *rettv) | ||||||
| @@ -1780,6 +1782,7 @@ f_utf16idx(typval_T *argvars, typval_T *rettv) | |||||||
|  |  | ||||||
|     char_u	*p; |     char_u	*p; | ||||||
|     int		len; |     int		len; | ||||||
|  |     int		utf16idx = 0; | ||||||
|     for (p = str, len = 0; charidx ? idx >= 0 : p <= str + idx; len++) |     for (p = str, len = 0; charidx ? idx >= 0 : p <= str + idx; len++) | ||||||
|     { |     { | ||||||
| 	if (*p == NUL) | 	if (*p == NUL) | ||||||
| @@ -1791,6 +1794,7 @@ f_utf16idx(typval_T *argvars, typval_T *rettv) | |||||||
| 		rettv->vval.v_number = len; | 		rettv->vval.v_number = len; | ||||||
| 	    return; | 	    return; | ||||||
| 	} | 	} | ||||||
|  | 	utf16idx = len; | ||||||
| 	int clen = ptr2len(p); | 	int clen = ptr2len(p); | ||||||
| 	int c = (clen > 1) ? utf_ptr2char(p) : *p; | 	int c = (clen > 1) ? utf_ptr2char(p) : *p; | ||||||
| 	if (c > 0xFFFF) | 	if (c > 0xFFFF) | ||||||
| @@ -1800,7 +1804,7 @@ f_utf16idx(typval_T *argvars, typval_T *rettv) | |||||||
| 	    idx--; | 	    idx--; | ||||||
|     } |     } | ||||||
|  |  | ||||||
|     rettv->vval.v_number = len > 0 ? len - 1 : 0; |     rettv->vval.v_number = utf16idx; | ||||||
| } | } | ||||||
|  |  | ||||||
| /* | /* | ||||||
|   | |||||||
| @@ -1518,14 +1518,14 @@ func Test_utf16idx_from_byteidx() | |||||||
|   " UTF-16 index of a string with four byte characters |   " UTF-16 index of a string with four byte characters | ||||||
|   let str = 'a😊😊b' |   let str = 'a😊😊b' | ||||||
|   call assert_equal(0, utf16idx(str, 0)) |   call assert_equal(0, utf16idx(str, 0)) | ||||||
|   call assert_equal(2, utf16idx(str, 1)) |   call assert_equal(1, utf16idx(str, 1)) | ||||||
|   call assert_equal(2, utf16idx(str, 2)) |   call assert_equal(1, utf16idx(str, 2)) | ||||||
|   call assert_equal(2, utf16idx(str, 3)) |   call assert_equal(1, utf16idx(str, 3)) | ||||||
|   call assert_equal(2, utf16idx(str, 4)) |   call assert_equal(1, utf16idx(str, 4)) | ||||||
|   call assert_equal(4, utf16idx(str, 5)) |   call assert_equal(3, utf16idx(str, 5)) | ||||||
|   call assert_equal(4, utf16idx(str, 6)) |   call assert_equal(3, utf16idx(str, 6)) | ||||||
|   call assert_equal(4, utf16idx(str, 7)) |   call assert_equal(3, utf16idx(str, 7)) | ||||||
|   call assert_equal(4, utf16idx(str, 8)) |   call assert_equal(3, utf16idx(str, 8)) | ||||||
|   call assert_equal(5, utf16idx(str, 9)) |   call assert_equal(5, utf16idx(str, 9)) | ||||||
|   call assert_equal(6, utf16idx(str, 10)) |   call assert_equal(6, utf16idx(str, 10)) | ||||||
|   call assert_equal(-1, utf16idx(str, 11)) |   call assert_equal(-1, utf16idx(str, 11)) | ||||||
| @@ -1621,8 +1621,8 @@ func Test_utf16idx_from_charidx() | |||||||
|   " UTF-16 index of a string with four byte characters |   " UTF-16 index of a string with four byte characters | ||||||
|   let str = "a😊😊b" |   let str = "a😊😊b" | ||||||
|   call assert_equal(0, utf16idx(str, 0, v:false, v:true)) |   call assert_equal(0, utf16idx(str, 0, v:false, v:true)) | ||||||
|   call assert_equal(2, utf16idx(str, 1, v:false, v:true)) |   call assert_equal(1, utf16idx(str, 1, v:false, v:true)) | ||||||
|   call assert_equal(4, utf16idx(str, 2, v:false, v:true)) |   call assert_equal(3, utf16idx(str, 2, v:false, v:true)) | ||||||
|   call assert_equal(5, utf16idx(str, 3, v:false, v:true)) |   call assert_equal(5, utf16idx(str, 3, v:false, v:true)) | ||||||
|   call assert_equal(6, utf16idx(str, 4, v:false, v:true)) |   call assert_equal(6, utf16idx(str, 4, v:false, v:true)) | ||||||
|   call assert_equal(-1, utf16idx(str, 5, v:false, v:true)) |   call assert_equal(-1, utf16idx(str, 5, v:false, v:true)) | ||||||
|   | |||||||
| @@ -695,6 +695,8 @@ static char *(features[]) = | |||||||
|  |  | ||||||
| static int included_patches[] = | static int included_patches[] = | ||||||
| {   /* Add new patch number below this line */ | {   /* Add new patch number below this line */ | ||||||
|  | /**/ | ||||||
|  |     1629, | ||||||
| /**/ | /**/ | ||||||
|     1628, |     1628, | ||||||
| /**/ | /**/ | ||||||
|   | |||||||
		Reference in New Issue
	
	Block a user