summaryrefslogtreecommitdiffstats
path: root/Lib/test/test_ucn.py
blob: d631406a005ecaad35c0c26e902c214c18c2fa32 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
""" Test script for the Unicode implementation.

Written by Bill Tutt.

(c) Copyright CNRI, All Rights Reserved. NO WARRANTY.

"""#"
print 'Testing General Unicode Character Name, and case insensitivity...',

# General and case insensitivity test:
s = u"\N{LATIN CAPITAL LETTER T}" \
    u"\N{LATIN SMALL LETTER H}" \
    u"\N{LATIN SMALL LETTER E}" \
    u"\N{SPACE}" \
    u"\N{LATIN SMALL LETTER R}" \
    u"\N{LATIN CAPITAL LETTER E}" \
    u"\N{LATIN SMALL LETTER D}" \
    u"\N{SPACE}" \
    u"\N{LATIN SMALL LETTER f}" \
    u"\N{LATIN CAPITAL LeTtEr o}" \
    u"\N{LATIN SMaLl LETTER x}" \
    u"\N{SPACE}" \
    u"\N{LATIN SMALL LETTER A}" \
    u"\N{LATIN SMALL LETTER T}" \
    u"\N{LATIN SMALL LETTER E}" \
    u"\N{SPACE}" \
    u"\N{LATIN SMALL LETTER T}" \
    u"\N{LATIN SMALL LETTER H}" \
    u"\N{LATIN SMALL LETTER E}" \
    u"\N{SpAcE}" \
    u"\N{LATIN SMALL LETTER S}" \
    u"\N{LATIN SMALL LETTER H}" \
    u"\N{LATIN SMALL LETTER E}" \
    u"\N{LATIN SMALL LETTER E}" \
    u"\N{LATIN SMALL LETTER P}" \
    u"\N{FULL STOP}"
assert s == u"The rEd fOx ate the sheep.", s
print "done."

# misc. symbol testing
print "Testing misc. symbols for unicode character name expansion....",
assert u"\N{PILCROW SIGN}" == u"\u00b6"
assert u"\N{REPLACEMENT CHARACTER}" == u"\uFFFD"
assert u"\N{HALFWIDTH KATAKANA SEMI-VOICED SOUND MARK}" == u"\uFF9F"
assert u"\N{FULLWIDTH LATIN SMALL LETTER A}" == u"\uFF41"
print "done."


# strict error testing:
print "Testing unicode character name expansion strict error handling....",
k_cchMaxUnicodeName = 83

# An escape whose character name is longer than k_cchMaxUnicodeName.
s = "\N{" + "1" * (k_cchMaxUnicodeName + 2) + "}"

# Each entry pairs a malformed escape (as a plain byte string) with the
# complaint to raise if decoding it in strict mode does NOT fail with
# UnicodeError.
malformed = [
    (s,
     "failed to raise an exception when presented "
     "with a UCN > k_cchMaxUnicodeName"),
    ("\N{blah}",
     "failed to raise an exception when given a bogus character name"),
    ("\N{SPACE",
     "failed to raise an exception for a missing closing brace."),
    ("\NSPACE",
     "failed to raise an exception for a missing opening brace."),
]
for escaped, complaint in malformed:
    try:
        unicode(escaped, 'unicode-escape', 'strict')
    except UnicodeError:
        # Expected outcome: the decoder rejected the bad escape.
        pass
    else:
        raise AssertionError(complaint)
print "done."