From 7e501f1993cc1e4b8344643bcee449cc8c958d7e Mon Sep 17 00:00:00 2001 From: nicm Date: Tue, 2 Jun 2020 17:17:44 +0000 Subject: [PATCH] UTF-8 keys need to be big endian so the size bits are at the top. --- utf8.c | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/utf8.c b/utf8.c index 893cb5ee..5c11b7ca 100644 --- a/utf8.c +++ b/utf8.c @@ -162,14 +162,14 @@ utf8_from_data(const struct utf8_data *ud, utf8_char *uc) m.data[1] = (offset >> 8) & 0xff; m.data[2] = (offset >> 16); } - *uc = m.uc; + *uc = htonl(m.uc); return (UTF8_DONE); fail: if (ud->width == 1) - *uc = utf8_space1.uc; + *uc = htonl(utf8_space1.uc); else - *uc = utf8_space2.uc; + *uc = htonl(utf8_space2.uc); return (UTF8_ERROR); } @@ -177,7 +177,7 @@ fail: void utf8_to_data(utf8_char uc, struct utf8_data *ud) { - union utf8_map m = { .uc = uc }; + union utf8_map m = { .uc = ntohl(uc) }; struct utf8_item *ui; u_int offset; @@ -210,7 +210,7 @@ utf8_build_one(char c, u_int width) if (width == 2) m.flags |= UTF8_FLAG_WIDTH2; - return (m.uc); + return (htonl(m.uc)); } /* Set a single character. */