From 6cdec2efbb0139600aa582ffc4530172194364be Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Marc-Andr=C3=A9=20Lemburg?= Date: Fri, 30 Jun 2000 09:45:20 +0000 Subject: New test for the ucnhash module. --- Lib/test/test_ucn.py | 82 ++++++++++++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 82 insertions(+) create mode 100644 Lib/test/test_ucn.py diff --git a/Lib/test/test_ucn.py b/Lib/test/test_ucn.py new file mode 100644 index 0000000..d631406 --- /dev/null +++ b/Lib/test/test_ucn.py @@ -0,0 +1,82 @@ +""" Test script for the Unicode implementation. + +Written by Bill Tutt. + +(c) Copyright CNRI, All Rights Reserved. NO WARRANTY. + +"""#" +print 'Testing General Unicode Character Name, and case insensitivity...', + +# General and case insensitivity test: +s = u"\N{LATIN CAPITAL LETTER T}" \ + u"\N{LATIN SMALL LETTER H}" \ + u"\N{LATIN SMALL LETTER E}" \ + u"\N{SPACE}" \ + u"\N{LATIN SMALL LETTER R}" \ + u"\N{LATIN CAPITAL LETTER E}" \ + u"\N{LATIN SMALL LETTER D}" \ + u"\N{SPACE}" \ + u"\N{LATIN SMALL LETTER f}" \ + u"\N{LATIN CAPITAL LeTtEr o}" \ + u"\N{LATIN SMaLl LETTER x}" \ + u"\N{SPACE}" \ + u"\N{LATIN SMALL LETTER A}" \ + u"\N{LATIN SMALL LETTER T}" \ + u"\N{LATIN SMALL LETTER E}" \ + u"\N{SPACE}" \ + u"\N{LATIN SMALL LETTER T}" \ + u"\N{LATIN SMALL LETTER H}" \ + u"\N{LATIN SMALL LETTER E}" \ + u"\N{SpAcE}" \ + u"\N{LATIN SMALL LETTER S}" \ + u"\N{LATIN SMALL LETTER H}" \ + u"\N{LATIN SMALL LETTER E}" \ + u"\N{LATIN SMALL LETTER E}" \ + u"\N{LATIN SMALL LETTER P}" \ + u"\N{FULL STOP}" +assert s == u"The rEd fOx ate the sheep.", s +print "done." + +# misc. symbol testing +print "Testing misc. symbols for unicode character name expansion....", +assert u"\N{PILCROW SIGN}" == u"\u00b6" +assert u"\N{REPLACEMENT CHARACTER}" == u"\uFFFD" +assert u"\N{HALFWIDTH KATAKANA SEMI-VOICED SOUND MARK}" == u"\uFF9F" +assert u"\N{FULLWIDTH LATIN SMALL LETTER A}" == u"\uFF41" +print "done." + + +# strict error testing: +print "Testing unicode character name expansion strict error handling....", +k_cchMaxUnicodeName = 83 + +s = "\N{" + "1" * (k_cchMaxUnicodeName + 2) + "}" +try: + unicode(s, 'unicode-escape', 'strict') +except UnicodeError: + pass +else: + raise AssertionError, "failed to raise an exception when presented " \ + "with a UCN > k_cchMaxUnicodeName" +try: + unicode("\N{blah}", 'unicode-escape', 'strict') +except UnicodeError: + pass +else: + raise AssertionError, "failed to raise an exception when given a bogus character name" + +try: + unicode("\N{SPACE", 'unicode-escape', 'strict') +except UnicodeError: + pass +else: + raise AssertionError, "failed to raise an exception for a missing closing brace." + +try: + unicode("\NSPACE", 'unicode-escape', 'strict') +except UnicodeError: + pass +else: + raise AssertionError, "failed to raise an exception for a missing opening brace." +print "done." + -- cgit v0.12