summaryrefslogtreecommitdiffstats
path: root/utf8.c
diff options
context:
space:
mode:
author: nicm <nicm>, 2023-01-08 22:15:30 +0000
committer: nicm <nicm>, 2023-01-08 22:15:30 +0000
commit: 7ced0a03d2ff51274d5fa5fb6eeaa6f4aac9f2f4 (patch)
tree: 44cb365fc5e93a05f1a2df4f7d201eeca1d650b1 /utf8.c
parent: cb51942669cef089b46cd2b6cdbd62405000c0e7 (diff)
Restore code to handle wcwidth failure so that unknown codepoints still
do the most likely right thing. GitHub issue 3427, patch based on a diff from Jesse Luehrs in GitHub issue 3003.
Diffstat (limited to 'utf8.c')
-rw-r--r--utf8.c11
1 files changed, 9 insertions, 2 deletions
diff --git a/utf8.c b/utf8.c
index 03918cd2..3c6f88ff 100644
--- a/utf8.c
+++ b/utf8.c
@@ -226,9 +226,16 @@ utf8_width(struct utf8_data *ud, int *width)
case 0:
return (UTF8_ERROR);
}
+ log_debug("UTF-8 %.*s is %08X", (int)ud->size, ud->data, (u_int)wc);
*width = wcwidth(wc);
- log_debug("UTF-8 %.*s %#x, wcwidth() %d", (int)ud->size, ud->data,
- (u_int)wc, *width);
+ log_debug("wcwidth(%08X) returned %d", (u_int)wc, *width);
+ if (*width < 0) {
+ /*
+ * C1 control characters are nonprintable, so they are always
+ * zero width.
+ */
+ *width = (wc >= 0x80 && wc <= 0x9f) ? 0 : 1;
+ }
if (*width >= 0 && *width <= 0xff)
return (UTF8_DONE);
return (UTF8_ERROR);