diff options
author | Marc-André Lemburg <mal@egenix.com> | 2000-06-30 09:45:20 (GMT) |
---|---|---|
committer | Marc-André Lemburg <mal@egenix.com> | 2000-06-30 09:45:20 (GMT) |
commit | 6cdec2efbb0139600aa582ffc4530172194364be (patch) | |
tree | f82c38de54b39abb169081f3944f76ea2947c875 /Lib/test/test_ucn.py | |
parent | 5f2e75e87ce7ca3fd2b2de7a4af4c3fede289b77 (diff) | |
download | cpython-6cdec2efbb0139600aa582ffc4530172194364be.zip cpython-6cdec2efbb0139600aa582ffc4530172194364be.tar.gz cpython-6cdec2efbb0139600aa582ffc4530172194364be.tar.bz2 |
New test for the ucnhash module.
Diffstat (limited to 'Lib/test/test_ucn.py')
-rw-r--r-- | Lib/test/test_ucn.py | 82 |
1 files changed, 82 insertions, 0 deletions
diff --git a/Lib/test/test_ucn.py b/Lib/test/test_ucn.py
new file mode 100644
index 0000000..d631406
--- /dev/null
+++ b/Lib/test/test_ucn.py
@@ -0,0 +1,82 @@
+""" Test script for the Unicode implementation.
+
+Written by Bill Tutt.
+
+(c) Copyright CNRI, All Rights Reserved. NO WARRANTY.
+
+"""#"
+print 'Testing General Unicode Character Name, and case insensitivity...',
+
+# General and case insensitivity test:
+s = u"\N{LATIN CAPITAL LETTER T}" \
+    u"\N{LATIN SMALL LETTER H}" \
+    u"\N{LATIN SMALL LETTER E}" \
+    u"\N{SPACE}" \
+    u"\N{LATIN SMALL LETTER R}" \
+    u"\N{LATIN CAPITAL LETTER E}" \
+    u"\N{LATIN SMALL LETTER D}" \
+    u"\N{SPACE}" \
+    u"\N{LATIN SMALL LETTER f}" \
+    u"\N{LATIN CAPITAL LeTtEr o}" \
+    u"\N{LATIN SMaLl LETTER x}" \
+    u"\N{SPACE}" \
+    u"\N{LATIN SMALL LETTER A}" \
+    u"\N{LATIN SMALL LETTER T}" \
+    u"\N{LATIN SMALL LETTER E}" \
+    u"\N{SPACE}" \
+    u"\N{LATIN SMALL LETTER T}" \
+    u"\N{LATIN SMALL LETTER H}" \
+    u"\N{LATIN SMALL LETTER E}" \
+    u"\N{SpAcE}" \
+    u"\N{LATIN SMALL LETTER S}" \
+    u"\N{LATIN SMALL LETTER H}" \
+    u"\N{LATIN SMALL LETTER E}" \
+    u"\N{LATIN SMALL LETTER E}" \
+    u"\N{LATIN SMALL LETTER P}" \
+    u"\N{FULL STOP}"
+assert s == u"The rEd fOx ate the sheep.", s
+print "done."
+
+# misc. symbol testing
+print "Testing misc. symbols for unicode character name expansion....",
+assert u"\N{PILCROW SIGN}" == u"\u00b6"
+assert u"\N{REPLACEMENT CHARACTER}" == u"\uFFFD"
+assert u"\N{HALFWIDTH KATAKANA SEMI-VOICED SOUND MARK}" == u"\uFF9F"
+assert u"\N{FULLWIDTH LATIN SMALL LETTER A}" == u"\uFF41"
+print "done."
+
+
+# strict error testing:
+print "Testing unicode character name expansion strict error handling....",
+k_cchMaxUnicodeName = 83
+
+s = "\N{" + "1" * (k_cchMaxUnicodeName + 2) + "}"
+try:
+    unicode(s, 'unicode-escape', 'strict')
+except UnicodeError:
+    pass
+else:
+    raise AssertionError, "failed to raise an exception when presented " \
+                          "with a UCN > k_cchMaxUnicodeName"
+try:
+    unicode("\N{blah}", 'unicode-escape', 'strict')
+except UnicodeError:
+    pass
+else:
+    raise AssertionError, "failed to raise an exception when given a bogus character name"
+
+try:
+    unicode("\N{SPACE", 'unicode-escape', 'strict')
+except UnicodeError:
+    pass
+else:
+    raise AssertionError, "failed to raise an exception for a missing closing brace."
+
+try:
+    unicode("\NSPACE", 'unicode-escape', 'strict')
+except UnicodeError:
+    pass
+else:
+    raise AssertionError, "failed to raise an exception for a missing opening brace."
+print "done."
+