Fix CVE-2021-22918

author Dominique Dumont <dod@debian.org>
Sun, 4 Jul 2021 07:43:38 +0000 (08:43 +0100)
committer Dominique Dumont <dod@debian.org>
Sun, 4 Jul 2021 07:43:38 +0000 (08:43 +0100)
diff --git a/src/idna.c b/src/idna.c

index 13ffac6be8142d905bc7045a1454790fbb0ac44b..b44cb16a1ee60bae84c3ed6ebb65eaeefa32bbd8 100644 (file)
--- a/src/idna.c
+++ b/src/idna.c
@@ -19,6 +19,7 @@
  
  #include "uv.h"
  #include "idna.h"
+#include <assert.h>
  #include <string.h>
  
  static unsigned uv__utf8_decode1_slow(const char** p,
@@ -32,7 +33,7 @@ static unsigned uv__utf8_decode1_slow(const char** p,
    if (a > 0xF7)
      return -1;
  
-  switch (*p - pe) {
+  switch (pe - *p) {
    default:
      if (a > 0xEF) {
        min = 0x10000;
@@ -62,6 +63,8 @@ static unsigned uv__utf8_decode1_slow(const char** p,
        a = 0;
        break;
      }
+    /* Fall through. */
+  case 0:
      return -1;  /* Invalid continuation byte. */
    }
  
@@ -88,6 +91,8 @@ static unsigned uv__utf8_decode1_slow(const char** p,
  unsigned uv__utf8_decode1(const char** p, const char* pe) {
    unsigned a;
  
+  assert(*p < pe);
+
    a = (unsigned char) *(*p)++;
  
    if (a < 128)
@@ -96,9 +101,6 @@ unsigned uv__utf8_decode1(const char** p, const char* pe) {
    return uv__utf8_decode1_slow(p, pe, a);
  }
  
-#define foreach_codepoint(c, p, pe) \
-  for (; (void) (*p <= pe && (c = uv__utf8_decode1(p, pe))), *p <= pe;)
-
  static int uv__idna_toascii_label(const char* s, const char* se,
                                    char** d, char* de) {
    static const char alphabet[] = "abcdefghijklmnopqrstuvwxyz0123456789";
@@ -121,15 +123,22 @@ static int uv__idna_toascii_label(const char* s, const char* se,
    ss = s;
    todo = 0;
  
-  foreach_codepoint(c, &s, se) {
+  /* Note: after this loop we've visited all UTF-8 characters and know
+   * they're legal so we no longer need to check for decode errors.
+   */
+  while (s < se) {
+    c = uv__utf8_decode1(&s, se);
+
+    if (c == -1u)
+      return UV_EINVAL;
+
      if (c < 128)
        h++;
-    else if (c == (unsigned) -1)
-      return UV_EINVAL;
      else
        todo++;
    }
  
+  /* Only write "xn--" when there are non-ASCII characters. */
    if (todo > 0) {
      if (*d < de) *(*d)++ = 'x';
      if (*d < de) *(*d)++ = 'n';
@@ -137,9 +146,13 @@ static int uv__idna_toascii_label(const char* s, const char* se,
      if (*d < de) *(*d)++ = '-';
    }
  
+  /* Write ASCII characters. */
    x = 0;
    s = ss;
-  foreach_codepoint(c, &s, se) {
+  while (s < se) {
+    c = uv__utf8_decode1(&s, se);
+    assert(c != -1u);
+
      if (c > 127)
        continue;
  
@@ -166,10 +179,15 @@ static int uv__idna_toascii_label(const char* s, const char* se,
    while (todo > 0) {
      m = -1;
      s = ss;
-    foreach_codepoint(c, &s, se)
+
+    while (s < se) {
+      c = uv__utf8_decode1(&s, se);
+      assert(c != -1u);
+
        if (c >= n)
          if (c < m)
            m = c;
+    }
  
      x = m - n;
      y = h + 1;
@@ -181,7 +199,10 @@ static int uv__idna_toascii_label(const char* s, const char* se,
      n = m;
  
      s = ss;
-    foreach_codepoint(c, &s, se) {
+    while (s < se) {
+      c = uv__utf8_decode1(&s, se);
+      assert(c != -1u);
+
        if (c < n)
          if (++delta == 0)
            return UV_E2BIG;  /* Overflow. */
@@ -245,8 +266,6 @@ static int uv__idna_toascii_label(const char* s, const char* se,
    return 0;
  }
  
-#undef foreach_codepoint
-
  long uv__idna_toascii(const char* s, const char* se, char* d, char* de) {
    const char* si;
    const char* st;
@@ -256,10 +275,14 @@ long uv__idna_toascii(const char* s, const char* se, char* d, char* de) {
  
    ds = d;
  
-  for (si = s; si < se; /* empty */) {
+  si = s;
+  while (si < se) {
      st = si;
      c = uv__utf8_decode1(&si, se);
  
+    if (c == -1u)
+      return UV_EINVAL;
+
      if (c != '.')
        if (c != 0x3002)  /* 。 */
          if (c != 0xFF0E)  /* ． */
diff --git a/test/test-idna.c b/test/test-idna.c

index b76853cb996ecc099440d186e70e8dd0b4398fa5..f4fad9653df2cfcaad504f737e8d38b45a3d1c4d 100644 (file)
--- a/test/test-idna.c
+++ b/test/test-idna.c
@@ -96,6 +96,25 @@ TEST_IMPL(utf8_decode1) {
    return 0;
  }
  
+TEST_IMPL(utf8_decode1_overrun) {
+  const char* p;
+  char b[1];
+
+  /* Single byte. */
+  p = b;
+  b[0] = 0x7F;
+  ASSERT_EQ(0x7F, uv__utf8_decode1(&p, b + 1));
+  ASSERT_EQ(p, b + 1);
+
+  /* Multi-byte. */
+  p = b;
+  b[0] = 0xC0;
+  ASSERT_EQ((unsigned) -1, uv__utf8_decode1(&p, b + 1));
+  ASSERT_EQ(p, b + 1);
+
+  return 0;
+}
+
  /* Doesn't work on z/OS because that platform uses EBCDIC, not ASCII. */
  #ifndef __MVS__
  
diff --git a/test/test-list.h b/test/test-list.h

index 52b17a69147aa0afbe8387dcbd53e6c237ab28cb..66e88a9f74c2160ff73730b11d412fab5b515c05 100644 (file)
--- a/test/test-list.h
+++ b/test/test-list.h
@@ -521,6 +521,7 @@ TEST_DECLARE  (fork_threadpool_queue_work_simple)
  
  TEST_DECLARE  (idna_toascii)
  TEST_DECLARE  (utf8_decode1)
+TEST_DECLARE  (utf8_decode1_overrun)
  TEST_DECLARE  (uname)
  
  TEST_DECLARE  (metrics_idle_time)
@@ -1108,6 +1109,7 @@ TASK_LIST_START
  #endif
  
    TEST_ENTRY  (utf8_decode1)
+  TEST_ENTRY  (utf8_decode1_overrun)
    TEST_ENTRY  (uname)
  
  /* Doesn't work on z/OS because that platform uses EBCDIC, not ASCII. */
author	Dominique Dumont <dod@debian.org>
	Sun, 4 Jul 2021 07:43:38 +0000 (08:43 +0100)
committer	Dominique Dumont <dod@debian.org>
	Sun, 4 Jul 2021 07:43:38 +0000 (08:43 +0100)
src/idna.c		patch | blob | history
test/test-idna.c		patch | blob | history
test/test-list.h		patch | blob | history