summary | refs | log | tree | commit | diff | stats
path: root/tests/encoding.test
diff options
context:
space:
mode:
author: jan.nijtmans <nijtmans@users.sourceforge.net> 2023-02-01 08:10:12 (GMT)
committer: jan.nijtmans <nijtmans@users.sourceforge.net> 2023-02-01 08:10:12 (GMT)
commit: 3eaad4bbc95c9cb3eaaf79872646d4fa7f6d8c6e (patch)
tree: 4952179bcfbada1be4941093c77d7a531dc7f135 /tests/encoding.test
parent: 537c8e77ba967fbb6f2ef1d7b2134420a3117bad (diff)
download: tcl-3eaad4bbc95c9cb3eaaf79872646d4fa7f6d8c6e.zip
tcl-3eaad4bbc95c9cb3eaaf79872646d4fa7f6d8c6e.tar.gz
tcl-3eaad4bbc95c9cb3eaaf79872646d4fa7f6d8c6e.tar.bz2
(cherry-pick) Make Tcl_UniCharToUtf more readable and add test to exercise surrogate handling. (test-case was still missing, which cannot be used in Tcl 8.6)
Diffstat (limited to 'tests/encoding.test')
-rw-r--r-- tests/encoding.test 24
1 files changed, 24 insertions, 0 deletions
diff --git a/tests/encoding.test b/tests/encoding.test
index 10a37f8..ae6c78a 100644
--- a/tests/encoding.test
+++ b/tests/encoding.test
@@ -482,6 +482,30 @@ test encoding-16.7 {Utf32ToUtfProc} -body {
list $val [format %x [scan $val %c]]
} -result "乎 4e4e"
+# Round-trips every UTF-16 surrogate pair through utf-16be decoding and
+# re-encoding. Both loop bounds are inclusive so that the last high surrogate
+# (0xDBFF) and the last low surrogate (0xDFFF) are exercised as well.
+test encoding-16.8 {
+    Utf16ToUtfProc, Tcl_UniCharToUtf, surrogate pairs in utf-16
+} -body {
+    apply [list {} {
+        for {set i 0xD800} {$i <= 0xDBFF} {incr i} {
+            for {set j 0xDC00} {$j <= 0xDFFF} {incr j} {
+                set string [binary format S2 [list $i $j]]
+                # A conversion error or a changed byte sequence both count as failure.
+                set status [catch {
+                    set decoded [encoding convertfrom utf-16be $string]
+                    set encoded [encoding convertto utf-16be $decoded]
+                }]
+                if {$status || ( $encoded ne $string )} {
+                    return [list [format %x $i] [format %x $j]]
+                }
+            }
+        }
+        return done
+    } [namespace current]]
+} -result done
+
# U+460DC corresponds to the surrogate pair D8D8 DCDC; each 16-bit unit is made
# of two identical bytes, so the expected bytes are the same in either byte order.
test encoding-17.1 {UtfToUtf16Proc} -body {
encoding convertto utf-16 "\U460DC"
} -result "\xD8\xD8\xDC\xDC"