chars: speed up the parsing of a character for the plain ASCII case
Again, if the most significant bit of a UTF-8 byte is zero, it means the character is a single byte and we can skip the call of mblen(), *and* if the character is one byte it also occupies just one column, because all ASCII characters are single-column characters -- apart from control codes. This partially addresses https://savannah.gnu.org/bugs/?51491.master
parent
cc2b19c8fd
commit
9a7ba5db79
19
src/chars.c
19
src/chars.c
|
@ -294,14 +294,17 @@ int parse_mbchar(const char *buf, char *chr, size_t *col)
|
||||||
{
|
{
|
||||||
#ifdef ENABLE_UTF8
|
#ifdef ENABLE_UTF8
|
||||||
if (use_utf8) {
|
if (use_utf8) {
|
||||||
/* Get the number of bytes in the multibyte character. */
|
int length;
|
||||||
int length = mblen(buf, MAXCHARLEN);
|
|
||||||
|
|
||||||
/* When the multibyte sequence is invalid, only take the first byte. */
|
/* If this is a UTF-8 starter byte, get the number of bytes of the character. */
|
||||||
if (length <= 0) {
|
if ((signed char)*buf < 0) {
|
||||||
IGNORE_CALL_RESULT(mblen(NULL, 0));
|
length = mblen(buf, MAXCHARLEN);
|
||||||
|
|
||||||
|
/* When the multibyte sequence is invalid, only take the first byte. */
|
||||||
|
if (length <= 0)
|
||||||
|
length = 1;
|
||||||
|
} else
|
||||||
length = 1;
|
length = 1;
|
||||||
}
|
|
||||||
|
|
||||||
/* When requested, store the multibyte character in chr. */
|
/* When requested, store the multibyte character in chr. */
|
||||||
if (chr != NULL) {
|
if (chr != NULL) {
|
||||||
|
@ -322,7 +325,9 @@ int parse_mbchar(const char *buf, char *chr, size_t *col)
|
||||||
else if (is_cntrl_mbchar(buf)) {
|
else if (is_cntrl_mbchar(buf)) {
|
||||||
*col += 2;
|
*col += 2;
|
||||||
/* If we have a normal character, get its width normally. */
|
/* If we have a normal character, get its width normally. */
|
||||||
} else
|
} else if (length == 1)
|
||||||
|
*col += 1;
|
||||||
|
else
|
||||||
*col += mbwidth(buf);
|
*col += mbwidth(buf);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
Loading…
Reference in New Issue