Fix decompression of unicode values above 2047
Two problems: the lead byte for 3-byte sequences was wrong, and one continuation byte was never written due to a missing "++"! Apparently this had been broken ever since the first "Compress as unicode, not bytes" commit, but I believed I'd "tested" it by running on the Pinyin translation. This rendered at least the Korean and Japanese translations completely illegible, affecting 5.0 and all later releases.
parent 365d69e831
commit e82940697c
@@ -51,8 +51,8 @@ STATIC int put_utf8(char *buf, int u) {
 		*buf = 0b10000000 | (u & 0b00111111);
 		return 2;
 	} else { // u <= 0xffff)
-		*buf++ = 0b11000000 | (u >> 12);
-		*buf = 0b10000000 | ((u >> 6) & 0b00111111);
+		*buf++ = 0b11100000 | (u >> 12);
+		*buf++ = 0b10000000 | ((u >> 6) & 0b00111111);
 		*buf = 0b10000000 | (u & 0b00111111);
 		return 3;
 	}
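For context, here is a minimal sketch of what the corrected encoder looks like as a whole. The diff above only shows the 2- and 3-byte branches; the ASCII branch, the function name used here, and the assumption that callers never pass code points above U+FFFF are mine for illustration, not taken from the original file.

	/* Sketch only: encode one code point (assumed <= U+FFFF) as UTF-8.
	 * Returns the number of bytes written. */
	static int put_utf8_sketch(char *buf, int u) {
	    if (u <= 0x7f) {                       /* 1 byte: 0xxxxxxx (assumed branch) */
	        *buf = u;
	        return 1;
	    } else if (u <= 0x7ff) {               /* 2 bytes: 110xxxxx 10xxxxxx */
	        *buf++ = 0b11000000 | (u >> 6);
	        *buf   = 0b10000000 | (u & 0b00111111);
	        return 2;
	    } else {                               /* 3 bytes: 1110xxxx 10xxxxxx 10xxxxxx */
	        *buf++ = 0b11100000 | (u >> 12);             /* lead byte must be 1110xxxx, not 110xxxxx */
	        *buf++ = 0b10000000 | ((u >> 6) & 0b00111111); /* the missing "++" used to drop this byte */
	        *buf   = 0b10000000 | (u & 0b00111111);
	        return 3;
	    }
	}

In the old code only two of the three bytes were actually written (the middle continuation byte was immediately overwritten by the last one), yet the function still reported a length of 3, which is why code points above 2047, i.e. most Korean and Japanese text, decoded to garbage.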