From 8bb93485fb51aac423ec000aa292815cf50bb02c Mon Sep 17 00:00:00 2001 From: Baptiste Daroussin Date: Sun, 9 Aug 2015 00:06:56 +0000 Subject: [PATCH] Remove 5 and 6 bytes sequences which are illegal in UTF-8 space. (part2) Per rfc3629 value greater than 0x10ffff should be rejected Suggested by: jilles --- lib/libc/locale/utf8.c | 8 +------- 1 file changed, 1 insertion(+), 7 deletions(-) diff --git a/lib/libc/locale/utf8.c b/lib/libc/locale/utf8.c index 843d59f77c5..55e29319c62 100644 --- a/lib/libc/locale/utf8.c +++ b/lib/libc/locale/utf8.c @@ -320,15 +320,9 @@ _UTF8_wcrtomb(char * __restrict s, wchar_t wc, mbstate_t * __restrict ps) } else if ((wc & ~0xffff) == 0) { lead = 0xe0; len = 3; - } else if ((wc & ~0x1fffff) == 0) { + } else if (wc >= 0 && wc <= 0x10ffff) { lead = 0xf0; len = 4; - } else if ((wc & ~0x3ffffff) == 0) { - lead = 0xf8; - len = 5; - } else if ((wc & ~0x7fffffff) == 0) { - lead = 0xfc; - len = 6; } else { errno = EILSEQ; return ((size_t)-1);