blob: d4b4a13d0de26451a2be746a7c18540a6e93b368 (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
|
# To fully test this module, we would need a copy of the stringprep tables.
# Since we don't have them, this test checks only a few code points.
import unittest
from stringprep import *
class StringprepTests(unittest.TestCase):
    """Spot checks for the RFC 3454 table helpers exposed by ``stringprep``.

    The full stringprep tables are not available to the test suite, so each
    table is probed with only a couple of code points: typically one that
    must be a member and a neighbouring one that must not be.
    """

    def test(self):
        """Check one positive and one negative sample for each table."""
        # A.1: unassigned code points.
        self.assertTrue(in_table_a1("\u0221"))
        self.assertFalse(in_table_a1("\u0222"))

        # B.1: code points commonly mapped to nothing.
        self.assertTrue(in_table_b1("\u00ad"))
        self.assertFalse(in_table_b1("\u00ae"))

        # B.2 / B.3: case-folding maps. These must be compared with
        # assertEqual; assertTrue(value, expected) would treat ``expected``
        # as the failure message and only test the truthiness of ``value``.
        self.assertEqual(map_table_b2("\u0041"), "\u0061")
        self.assertEqual(map_table_b2("\u0061"), "\u0061")

        self.assertEqual(map_table_b3("\u0041"), "\u0061")
        self.assertEqual(map_table_b3("\u0061"), "\u0061")

        # C.1.x: space characters.
        self.assertTrue(in_table_c11("\u0020"))
        self.assertFalse(in_table_c11("\u0021"))

        self.assertTrue(in_table_c12("\u00a0"))
        self.assertFalse(in_table_c12("\u00a1"))

        self.assertTrue(in_table_c11_c12("\u00a0"))
        self.assertFalse(in_table_c11_c12("\u00a1"))

        # C.2.x: control characters.
        self.assertTrue(in_table_c21("\u001f"))
        self.assertFalse(in_table_c21("\u0020"))

        self.assertTrue(in_table_c22("\u009f"))
        self.assertFalse(in_table_c22("\u00a0"))

        self.assertTrue(in_table_c21_c22("\u009f"))
        self.assertFalse(in_table_c21_c22("\u00a0"))

        # C.3 - C.8: remaining prohibited-output tables.
        self.assertTrue(in_table_c3("\ue000"))
        self.assertFalse(in_table_c3("\uf900"))

        self.assertTrue(in_table_c4("\uffff"))
        self.assertFalse(in_table_c4("\u0000"))

        self.assertTrue(in_table_c5("\ud800"))
        self.assertFalse(in_table_c5("\ud7ff"))

        self.assertTrue(in_table_c6("\ufff9"))
        self.assertFalse(in_table_c6("\ufffe"))

        self.assertTrue(in_table_c7("\u2ff0"))
        self.assertFalse(in_table_c7("\u2ffc"))

        self.assertTrue(in_table_c8("\u0340"))
        self.assertFalse(in_table_c8("\u0342"))

        # C.9 lies entirely outside the BMP. This check used to be disabled
        # (and its negative case mistakenly called in_table_c8); a single
        # non-BMP character is one code point on Python 3.3+, so it can run.
        self.assertTrue(in_table_c9("\U000E0001"))
        self.assertFalse(in_table_c9("\U000E0002"))

        # D.1 / D.2: bidirectional categories.
        self.assertTrue(in_table_d1("\u05be"))
        self.assertFalse(in_table_d1("\u05bf"))

        self.assertTrue(in_table_d2("\u0041"))
        self.assertFalse(in_table_d2("\u0040"))

        # This would generate a hash of all predicates. However, running
        # it is quite expensive, and only serves to detect changes in the
        # unicode database. Instead, stringprep.py asserts the version of
        # the database.
        #
        # Sketch (requires ``import stringprep`` in addition to the
        # star import used by this file):
        #
        # import hashlib
        # predicates = sorted(k for k in dir(stringprep)
        #                     if k.startswith("in_table"))
        # for p in predicates:
        #     f = getattr(stringprep, p)
        #     # Collect all BMP code points
        #     data = "".join("1" if f(chr(i)) else "0"
        #                    for i in range(0x10000))
        #     h = hashlib.sha1()
        #     h.update(data.encode("ascii"))
        #     print(p, h.hexdigest())
# Run the test case through unittest's command-line runner when this file
# is executed directly rather than imported.
if __name__ == "__main__":
    unittest.main()
|