udf: Fix leak of UTF-16 surrogates into encoded strings

author Jan Kara <jack@suse.cz>

Thu, 12 Apr 2018 15:22:23 +0000 (17:22 +0200)

committer Greg Kroah-Hartman <gregkh@linuxfoundation.org>

Tue, 24 Apr 2018 07:36:38 +0000 (09:36 +0200)
author Jan Kara <jack@suse.cz>
Thu, 12 Apr 2018 15:22:23 +0000 (17:22 +0200)
committer Greg Kroah-Hartman <gregkh@linuxfoundation.org>
Tue, 24 Apr 2018 07:36:38 +0000 (09:36 +0200)
diff --git a/fs/udf/unicode.c b/fs/udf/unicode.c
index 695389a4fc239f245cfacfa5a1e2fde9eae5b4a7..3a3be23689b352be9d19c7f34172c00645f5a83b 100644
--- a/fs/udf/unicode.c
+++ b/fs/udf/unicode.c
@@ -28,6 +28,9 @@
  
  #include "udf_sb.h"
  
+#define SURROGATE_MASK 0xfffff800
+#define SURROGATE_PAIR 0x0000d800
+
  static int udf_uni2char_utf8(wchar_t uni,
                              unsigned char *out,
                              int boundlen)
@@ -37,6 +40,9 @@ static int udf_uni2char_utf8(wchar_t uni,
         if (boundlen <= 0)
                 return -ENAMETOOLONG;
  
+       if ((uni & SURROGATE_MASK) == SURROGATE_PAIR)
+               return -EINVAL;
+
         if (uni < 0x80) {
                 out[u_len++] = (unsigned char)uni;
         } else if (uni < 0x800) {
author	Jan Kara <jack@suse.cz>
	Thu, 12 Apr 2018 15:22:23 +0000 (17:22 +0200)
committer	Greg Kroah-Hartman <gregkh@linuxfoundation.org>
	Tue, 24 Apr 2018 07:36:38 +0000 (09:36 +0200)