mirror of
https://github.com/samba-team/samba.git
synced 2025-01-10 01:18:15 +03:00
libutil/iconv: avoid overflow in surrogate pairs
Consider the non-conforment utf-8 sequence "\xf5\x80\x80\x80", which would encode 0x140000. We would set the high byte of the first surrogate to 0xd8 | (0x130000 >> 18), or 0xdc, which is an invalid start for a high surrogate, making the sequence as a whole invalid (as you would expect -- the Unicode range was set precisely to that covered by utf-16 surrogates). Signed-off-by: Douglas Bagnall <douglas.bagnall@catalyst.net.nz> Reviewed-by: Andrew Bartlett <abartlet@samba.org>
This commit is contained in:
parent
949fe57077
commit
3960eabca7
@ -923,6 +923,16 @@ static size_t utf8_pull(void *cd, const char **inbuf, size_t *inbytesleft,
|
|||||||
errno = EILSEQ;
|
errno = EILSEQ;
|
||||||
goto error;
|
goto error;
|
||||||
}
|
}
|
||||||
|
if (codepoint > 0x10ffff) {
|
||||||
|
/*
|
||||||
|
* Unicode stops at 0x10ffff, and if
|
||||||
|
* we ignore that, we'll end up
|
||||||
|
* encoding the wrong characters in
|
||||||
|
* the surrogate pair.
|
||||||
|
*/
|
||||||
|
errno = EILSEQ;
|
||||||
|
goto error;
|
||||||
|
}
|
||||||
|
|
||||||
codepoint -= 0x10000;
|
codepoint -= 0x10000;
|
||||||
|
|
||||||
|
Loading…
Reference in New Issue
Block a user