|
|
- From b7466e31e4bee160d82a68fca11b1f61d46debae Mon Sep 17 00:00:00 2001
- From: Ben Noordhuis <info@bnoordhuis.nl>
- Date: Fri, 21 May 2021 11:23:36 +0200
- Subject: [PATCH] idna: fix OOB read in punycode decoder
-
- libuv was vulnerable to out-of-bounds reads in the uv__idna_toascii()
- function which is used to convert strings to ASCII. This is called by
- the DNS resolution function and can lead to information disclosures or
- crashes.
-
- Reported by Eric Sesterhenn in collaboration with Cure53 and ExpressVPN.
-
- Reported-By: Eric Sesterhenn <eric.sesterhenn@x41-dsec.de>
- Fixes: https://github.com/libuv/libuv/issues/3147
- PR-URL: https://github.com/libuv/libuv-private/pull/1
- Refs: https://cve.mitre.org/cgi-bin/cvename.cgi?name=CVE-2021-22918
- Reviewed-By: Colin Ihrig <cjihrig@gmail.com>
- Reviewed-By: Richard Lau <riclau@uk.ibm.com>
- ---
- src/idna.c | 49 +++++++++++++++++++++++++++++++++++-------------
- test/test-idna.c | 19 +++++++++++++++++++
- test/test-list.h | 2 ++
- 3 files changed, 57 insertions(+), 13 deletions(-)
-
- --- a/src/idna.c
- +++ b/src/idna.c
- @@ -19,6 +19,7 @@
-
- #include "uv.h"
- #include "idna.h"
- +#include <assert.h>
- #include <string.h>
-
- static unsigned uv__utf8_decode1_slow(const char** p,
- @@ -32,7 +33,7 @@ static unsigned uv__utf8_decode1_slow(co
- if (a > 0xF7)
- return -1;
-
- - switch (*p - pe) {
- + switch (pe - *p) {
- default:
- if (a > 0xEF) {
- min = 0x10000;
- @@ -62,6 +63,8 @@ static unsigned uv__utf8_decode1_slow(co
- a = 0;
- break;
- }
- + /* Fall through. */
- + case 0:
- return -1; /* Invalid continuation byte. */
- }
-
- @@ -88,6 +91,8 @@ static unsigned uv__utf8_decode1_slow(co
- unsigned uv__utf8_decode1(const char** p, const char* pe) {
- unsigned a;
-
- + assert(*p < pe);
- +
- a = (unsigned char) *(*p)++;
-
- if (a < 128)
- @@ -96,9 +101,6 @@ unsigned uv__utf8_decode1(const char** p
- return uv__utf8_decode1_slow(p, pe, a);
- }
-
- -#define foreach_codepoint(c, p, pe) \
- - for (; (void) (*p <= pe && (c = uv__utf8_decode1(p, pe))), *p <= pe;)
- -
- static int uv__idna_toascii_label(const char* s, const char* se,
- char** d, char* de) {
- static const char alphabet[] = "abcdefghijklmnopqrstuvwxyz0123456789";
- @@ -121,15 +123,22 @@ static int uv__idna_toascii_label(const
- ss = s;
- todo = 0;
-
- - foreach_codepoint(c, &s, se) {
- + /* Note: after this loop we've visited all UTF-8 characters and know
- + * they're legal so we no longer need to check for decode errors.
- + */
- + while (s < se) {
- + c = uv__utf8_decode1(&s, se);
- +
- + if (c == -1u)
- + return UV_EINVAL;
- +
- if (c < 128)
- h++;
- - else if (c == (unsigned) -1)
- - return UV_EINVAL;
- else
- todo++;
- }
-
- + /* Only write "xn--" when there are non-ASCII characters. */
- if (todo > 0) {
- if (*d < de) *(*d)++ = 'x';
- if (*d < de) *(*d)++ = 'n';
- @@ -137,9 +146,13 @@ static int uv__idna_toascii_label(const
- if (*d < de) *(*d)++ = '-';
- }
-
- + /* Write ASCII characters. */
- x = 0;
- s = ss;
- - foreach_codepoint(c, &s, se) {
- + while (s < se) {
- + c = uv__utf8_decode1(&s, se);
- + assert(c != -1u);
- +
- if (c > 127)
- continue;
-
- @@ -166,10 +179,15 @@ static int uv__idna_toascii_label(const
- while (todo > 0) {
- m = -1;
- s = ss;
- - foreach_codepoint(c, &s, se)
- +
- + while (s < se) {
- + c = uv__utf8_decode1(&s, se);
- + assert(c != -1u);
- +
- if (c >= n)
- if (c < m)
- m = c;
- + }
-
- x = m - n;
- y = h + 1;
- @@ -181,7 +199,10 @@ static int uv__idna_toascii_label(const
- n = m;
-
- s = ss;
- - foreach_codepoint(c, &s, se) {
- + while (s < se) {
- + c = uv__utf8_decode1(&s, se);
- + assert(c != -1u);
- +
- if (c < n)
- if (++delta == 0)
- return UV_E2BIG; /* Overflow. */
- @@ -245,8 +266,6 @@ static int uv__idna_toascii_label(const
- return 0;
- }
-
- -#undef foreach_codepoint
- -
- long uv__idna_toascii(const char* s, const char* se, char* d, char* de) {
- const char* si;
- const char* st;
- @@ -256,10 +275,14 @@ long uv__idna_toascii(const char* s, con
-
- ds = d;
-
- - for (si = s; si < se; /* empty */) {
- + si = s;
- + while (si < se) {
- st = si;
- c = uv__utf8_decode1(&si, se);
-
- + if (c == -1u)
- + return UV_EINVAL;
- +
- if (c != '.')
- if (c != 0x3002) /* 。 */
- if (c != 0xFF0E) /* ． */
|