Follow-up to [67aa9a2070]: Use uppercase consistantly, slight optimization in character tests, comment fixes. No change in functionality.

author: jan.nijtmans <nijtmans@users.sourceforge.net> 2017-06-06 09:23:23 (GMT)
committer: jan.nijtmans <nijtmans@users.sourceforge.net> 2017-06-06 09:23:23 (GMT)
commit: fab7d970afbfa2aff68ecb1d99ab72e967d6cffe (patch)
tree: 21da69859e3e07548bd569cc3a67cbc368c84433
parent: 3cdd3064b55f4ac8bc05e222696f0e36e52366ab (diff)
parent: 617e92d7b4b71479c4854f19bae7473a7af8b7c7 (diff)
download: tcl-fab7d970afbfa2aff68ecb1d99ab72e967d6cffe.zip
tcl-fab7d970afbfa2aff68ecb1d99ab72e967d6cffe.tar.gz
tcl-fab7d970afbfa2aff68ecb1d99ab72e967d6cffe.tar.bz2
2 files changed, 19 insertions, 19 deletions
diff --git a/generic/tclUtf.c b/generic/tclUtf.c
index fe47f0b..52b4291 100644
--- a/generic/tclUtf.c
+++ b/generic/tclUtf.c
@@ -109,7 +109,7 @@ UtfCount(
 	return 2;
     }
 #if TCL_UTF_MAX > 3
-    if (((unsigned)(ch - 0x10000) <= 0xfffff)) {
+    if (((unsigned)(ch - 0x10000) <= 0xFFFFF)) {
 	return 4;
     }
 #endif
@@ -298,7 +298,7 @@ Tcl_UtfToUniChar(
 	     */
 
 	    *chPtr = (Tcl_UniChar) (((byte & 0x1F) << 6) | (src[1] & 0x3F));
-	    if ((*chPtr == 0) || (*chPtr > 0x7f)) {
+	    if ((unsigned)(*chPtr - 1) >= (UNICODE_SELF - 1)) {
 		return 2;
 	    }
 	}
@@ -315,7 +315,7 @@ Tcl_UtfToUniChar(
 
 	    *chPtr = (Tcl_UniChar) (((byte & 0x0F) << 12)
 		    | ((src[1] & 0x3F) << 6) | (src[2] & 0x3F));
-	    if (*chPtr > 0x7ff) {
+	    if (*chPtr > 0x7FF) {
 		return 3;
 	    }
 	}
@@ -332,15 +332,15 @@ Tcl_UtfToUniChar(
 	     * Four-byte-character lead byte followed by three trail bytes.
 	     */
 
-	    *chPtr = (Tcl_UniChar) (((byte & 0x0E) << 18) | ((src[1] & 0x3F) << 12)
+	    *chPtr = (Tcl_UniChar) (((byte & 0x07) << 18) | ((src[1] & 0x3F) << 12)
 		    | ((src[2] & 0x3F) << 6) | (src[3] & 0x3F));
-	    if ((*chPtr <= 0x10ffff) && (*chPtr > 0xffff)) {
+	    if ((unsigned)(*chPtr - 0x10000) <= 0xFFFFF) {
 		return 4;
 	    }
 	}
 
 	/*
-	 * A three-byte-character lead-byte not followed by two trail-bytes
+	 * A four-byte-character lead-byte not followed by two trail-bytes
 	 * represents itself.
 	 */
     }
@@ -1016,7 +1016,7 @@ Tcl_UtfNcmp(
 
     /*
      * Cannot use 'memcmp(cs, ct, n);' as byte representation of \u0000 (the
-     * pair of bytes 0xc0,0x80) is larger than byte representation of \u0001
+     * pair of bytes 0xC0,0x80) is larger than byte representation of \u0001
      * (the byte 0x01.)
      */
 
@@ -1400,11 +1400,11 @@ Tcl_UniCharIsControl(
 {
 #if TCL_UTF_MAX > 3
     if (UNICODE_OUT_OF_RANGE(ch)) {
-	ch &= 0x1fffff;
-	if ((ch == 0xe0001) || ((ch >= 0xe0020) && (ch <= 0xe007f))) {
+	ch &= 0x1FFFFF;
+	if ((ch == 0xE0001) || ((ch >= 0xE0020) && (ch <= 0xE007f))) {
 	    return 1;
 	}
-	if ((ch >= 0xf0000) && ((ch & 0xffff) <= 0xfffd)) {
+	if ((ch >= 0xF0000) && ((ch & 0xFFFF) <= 0xFFFD)) {
 	    return 1;
 	}
 	return 0;
@@ -1463,8 +1463,8 @@ Tcl_UniCharIsGraph(
 {
 #if TCL_UTF_MAX > 3
     if (UNICODE_OUT_OF_RANGE(ch)) {
-	ch &= 0x1fffff;
-	return (ch >= 0xe0100) && (ch <= 0xe01ef);
+	ch &= 0x1FFFFF;
+	return (ch >= 0xE0100) && (ch <= 0xE01EF);
     }
 #endif
     return ((GRAPH_BITS >> GetCategory(ch)) & 1);
@@ -1520,8 +1520,8 @@ Tcl_UniCharIsPrint(
 {
 #if TCL_UTF_MAX > 3
     if (UNICODE_OUT_OF_RANGE(ch)) {
-	ch &= 0x1fffff;
-	return (ch >= 0xe0100) && (ch <= 0xe01ef);
+	ch &= 0x1FFFFF;
+	return (ch >= 0xE0100) && (ch <= 0xE01EF);
     }
 #endif
     return (((GRAPH_BITS|SPACE_BITS) >> GetCategory(ch)) & 1);
@@ -1577,10 +1577,10 @@ Tcl_UniCharIsSpace(
 {
 #if TCL_UTF_MAX > 3
     /* Ignore upper 11 bits. */
-    ch &= 0x1fffff;
+    ch &= 0x1FFFFF;
 #else
     /* Ignore upper 16 bits. */
-    ch &= 0xffff;
+    ch &= 0xFFFF;
 #endif
 
     /*
@@ -1594,8 +1594,8 @@ Tcl_UniCharIsSpace(
     } else if (UNICODE_OUT_OF_RANGE(ch)) {
 	return 0;
 #endif
-    } else if (ch == 0x0085 || ch == 0x180e || ch == 0x200b
-	    || ch == 0x202f || ch == 0x2060 || ch == 0xfeff) {
+    } else if (ch == 0x0085 || ch == 0x180E || ch == 0x200B
+	    || ch == 0x202F || ch == 0x2060 || ch == 0xFEFF) {
 	return 1;
     } else {
 	return ((SPACE_BITS >> GetCategory(ch)) & 1);
diff --git a/tests/encoding.test b/tests/encoding.test
index 1d8bae5..a359f76 100644
--- a/tests/encoding.test
+++ b/tests/encoding.test
@@ -469,7 +469,7 @@ test encoding-24.9 {Parse valid or invalid utf-8} {
 test encoding-24.10 {Parse valid or invalid utf-8} {
     string length [encoding convertfrom utf-8 "\xe0\xa0\x80"]
 } 1
-test encoding-24.10 {Parse valid or invalid utf-8} {
+test encoding-24.11 {Parse valid or invalid utf-8} {
     string length [encoding convertfrom utf-8 "\xef\xbf\xbf"]
 } 1
author	jan.nijtmans <nijtmans@users.sourceforge.net>	2017-06-06 09:23:23 (GMT)
committer	jan.nijtmans <nijtmans@users.sourceforge.net>	2017-06-06 09:23:23 (GMT)
commit	fab7d970afbfa2aff68ecb1d99ab72e967d6cffe (patch)
tree	21da69859e3e07548bd569cc3a67cbc368c84433
parent	3cdd3064b55f4ac8bc05e222696f0e36e52366ab (diff)
parent	617e92d7b4b71479c4854f19bae7473a7af8b7c7 (diff)
download	tcl-fab7d970afbfa2aff68ecb1d99ab72e967d6cffe.zip tcl-fab7d970afbfa2aff68ecb1d99ab72e967d6cffe.tar.gz tcl-fab7d970afbfa2aff68ecb1d99ab72e967d6cffe.tar.bz2