Merge topic 'utf8-fixes'

fb5de060bc cm_utf8: reject codepoints above 0x10FFFF a11e5e021b cm_utf8: reject UTF-16 surrogate half codepoints 7111873efd testUTF8: add more test cases bba2b1c89b testUTF8: comment why sequences are invalid Acked-by: Kitware Robot <kwrobot@kitware.com> Merge-request: !3097
author: Brad King <brad.king@kitware.com> 2019-03-18 15:28:43 (GMT)
committer: Kitware Robot <kwrobot@kitware.com> 2019-03-18 15:28:52 (GMT)
commit: 875f49cc588b898f5da24bff34638d16de5c6413 (patch)
tree: 67d6b95887ac9cd125af2273e34718d6ef05230d /Tests
parent: f6cbb02b59d179c572c347461e81201bdd2337ed (diff)
parent: fb5de060bc99635a5b18b3389cc15e9937b19a0e (diff)
download: CMake-875f49cc588b898f5da24bff34638d16de5c6413.zip
CMake-875f49cc588b898f5da24bff34638d16de5c6413.tar.gz
CMake-875f49cc588b898f5da24bff34638d16de5c6413.tar.bz2
1 files changed, 19 insertions, 7 deletions
diff --git a/Tests/CMakeLib/testUTF8.cxx b/Tests/CMakeLib/testUTF8.cxx
index c99c46d..7f52c82 100644
--- a/Tests/CMakeLib/testUTF8.cxx
+++ b/Tests/CMakeLib/testUTF8.cxx
@@ -21,17 +21,29 @@ struct test_utf8_entry
 };
 
 static test_utf8_entry const good_entry[] = {
-  { 1, "\x20\x00\x00\x00", 0x0020 },  /* Space.  */
-  { 2, "\xC2\xA9\x00\x00", 0x00A9 },  /* Copyright.  */
-  { 3, "\xE2\x80\x98\x00", 0x2018 },  /* Open-single-quote.  */
-  { 3, "\xE2\x80\x99\x00", 0x2019 },  /* Close-single-quote.  */
-  { 4, "\xF0\xA3\x8E\xB4", 0x233B4 }, /* Example from RFC 3629.  */
+  { 1, "\x20\x00\x00\x00", 0x0020 },   /* Space.  */
+  { 2, "\xC2\xA9\x00\x00", 0x00A9 },   /* Copyright.  */
+  { 3, "\xE2\x80\x98\x00", 0x2018 },   /* Open-single-quote.  */
+  { 3, "\xE2\x80\x99\x00", 0x2019 },   /* Close-single-quote.  */
+  { 4, "\xF0\xA3\x8E\xB4", 0x233B4 },  /* Example from RFC 3629.  */
+  { 3, "\xED\x80\x80\x00", 0xD000 },   /* Valid 0xED prefixed codepoint.  */
+  { 4, "\xF4\x8F\xBF\xBF", 0x10FFFF }, /* Highest valid RFC codepoint. */
   { 0, { 0, 0, 0, 0, 0 }, 0 }
 };
 
 static test_utf8_char const bad_chars[] = {
-  "\x80\x00\x00\x00", "\xC0\x00\x00\x00", "\xE0\x00\x00\x00",
-  "\xE0\x80\x80\x00", "\xF0\x80\x80\x80", { 0, 0, 0, 0, 0 }
+  "\x80\x00\x00\x00", /* Leading continuation byte. */
+  "\xC0\x80\x00\x00", /* Overlong encoding. */
+  "\xC1\x80\x00\x00", /* Overlong encoding. */
+  "\xC2\x00\x00\x00", /* Missing continuation byte. */
+  "\xE0\x00\x00\x00", /* Missing continuation bytes. */
+  "\xE0\x80\x80\x00", /* Overlong encoding. */
+  "\xF0\x80\x80\x80", /* Overlong encoding. */
+  "\xED\xA0\x80\x00", /* UTF-16 surrogate half. */
+  "\xED\xBF\xBF\x00", /* UTF-16 surrogate half. */
+  "\xF4\x90\x80\x80", /* Lowest out-of-range codepoint. */
+  "\xF5\x80\x80\x80", /* Prefix forces out-of-range codepoints. */
+  { 0, 0, 0, 0, 0 }
 };
 
 static void report_good(bool passed, test_utf8_char const c)
author	Brad King <brad.king@kitware.com>	2019-03-18 15:28:43 (GMT)
committer	Kitware Robot <kwrobot@kitware.com>	2019-03-18 15:28:52 (GMT)
commit	875f49cc588b898f5da24bff34638d16de5c6413 (patch)
tree	67d6b95887ac9cd125af2273e34718d6ef05230d /Tests
parent	f6cbb02b59d179c572c347461e81201bdd2337ed (diff)
parent	fb5de060bc99635a5b18b3389cc15e9937b19a0e (diff)
download	CMake-875f49cc588b898f5da24bff34638d16de5c6413.zip CMake-875f49cc588b898f5da24bff34638d16de5c6413.tar.gz CMake-875f49cc588b898f5da24bff34638d16de5c6413.tar.bz2