From: Rich Felker Date: Fri, 1 Sep 2017 21:05:40 +0000 (-0400) Subject: fix erroneous acceptance of f4 9x xx xx code sequences by utf-8 decoder X-Git-Tag: v1.1.17~18 X-Git-Url: https://git.librecmc.org/?a=commitdiff_plain;h=39db00afadc9d8d0456c46eab42b8cb8ff9f375c;p=oweals%2Fmusl.git fix erroneous acceptance of f4 9x xx xx code sequences by utf-8 decoder the DFA table controlling accepted ranges for the f4 prefix used an incorrect upper bound of 0xa0 where it should have been 0x90, allowing such sequences to be accepted and decoded as non-Unicode-scalar values 0x110000 through 0x11ffff. --- diff --git a/src/multibyte/internal.c b/src/multibyte/internal.c index 7e1b1c03..2f5aaa91 100644 --- a/src/multibyte/internal.c +++ b/src/multibyte/internal.c @@ -9,7 +9,7 @@ | x ) #define F(x) ( ( x>=5 ? 0 : \ x==0 ? R(0x90,0xc0) : \ - x==4 ? R(0x80,0xa0) : \ + x==4 ? R(0x80,0x90) : \ R(0x80,0xc0) ) \ | ( R(0x80,0xc0) >> 6 ) \ | ( R(0x80,0xc0) >> 12 ) \