blob: d4b4a13d0de26451a2be746a7c18540a6e93b368 [file] [log] [blame]
Martin v. Löwisb4cb6642003-04-19 12:57:57 +00001# To fully test this module, we would need a copy of the stringprep tables.
Serhiy Storchakad3faf432015-01-18 11:28:37 +02002# Since we don't have them, this test checks only a few code points.
Martin v. Löwisb4cb6642003-04-19 12:57:57 +00003
Guido van Rossumd8faa362007-04-27 19:54:29 +00004import unittest
Martin v. Löwisb4cb6642003-04-19 12:57:57 +00005
Martin v. Löwisb4cb6642003-04-19 12:57:57 +00006from stringprep import *
7
class StringprepTests(unittest.TestCase):
    """Spot checks for the table predicates and mappings of ``stringprep``.

    Each membership table is probed with one code point that must be
    reported as a member and one that must not; each mapping table is
    probed with inputs whose mapped value is known.
    """

    def test(self):
        """Check a few code points against every stringprep table."""
        # Table A.1
        self.assertTrue(in_table_a1("\u0221"))
        self.assertFalse(in_table_a1("\u0222"))

        # Table B.1
        self.assertTrue(in_table_b1("\u00ad"))
        self.assertFalse(in_table_b1("\u00ae"))

        # Tables B.2 and B.3 are mappings, so compare the mapped value.
        # assertEqual is required here: with assertTrue the second argument
        # is only the failure message, so the expected value would never
        # actually be compared with the result.
        self.assertEqual(map_table_b2("\u0041"), "\u0061")
        self.assertEqual(map_table_b2("\u0061"), "\u0061")

        self.assertEqual(map_table_b3("\u0041"), "\u0061")
        self.assertEqual(map_table_b3("\u0061"), "\u0061")

        # Table C.1.1
        self.assertTrue(in_table_c11("\u0020"))
        self.assertFalse(in_table_c11("\u0021"))

        # Table C.1.2
        self.assertTrue(in_table_c12("\u00a0"))
        self.assertFalse(in_table_c12("\u00a1"))

        # Tables C.1.1 and C.1.2 combined
        self.assertTrue(in_table_c11_c12("\u00a0"))
        self.assertFalse(in_table_c11_c12("\u00a1"))

        # Table C.2.1
        self.assertTrue(in_table_c21("\u001f"))
        self.assertFalse(in_table_c21("\u0020"))

        # Table C.2.2
        self.assertTrue(in_table_c22("\u009f"))
        self.assertFalse(in_table_c22("\u00a0"))

        # Tables C.2.1 and C.2.2 combined
        self.assertTrue(in_table_c21_c22("\u009f"))
        self.assertFalse(in_table_c21_c22("\u00a0"))

        # Table C.3
        self.assertTrue(in_table_c3("\ue000"))
        self.assertFalse(in_table_c3("\uf900"))

        # Table C.4
        self.assertTrue(in_table_c4("\uffff"))
        self.assertFalse(in_table_c4("\u0000"))

        # Table C.5
        self.assertTrue(in_table_c5("\ud800"))
        self.assertFalse(in_table_c5("\ud7ff"))

        # Table C.6
        self.assertTrue(in_table_c6("\ufff9"))
        self.assertFalse(in_table_c6("\ufffe"))

        # Table C.7
        self.assertTrue(in_table_c7("\u2ff0"))
        self.assertFalse(in_table_c7("\u2ffc"))

        # Table C.8
        self.assertTrue(in_table_c8("\u0340"))
        self.assertFalse(in_table_c8("\u0342"))

        # Table C.9 is not in the BMP; the code points are written with
        # \U escapes, which a str literal can express directly.
        self.assertTrue(in_table_c9("\U000E0001"))
        self.assertFalse(in_table_c9("\U000E0002"))

        # Table D.1
        self.assertTrue(in_table_d1("\u05be"))
        self.assertFalse(in_table_d1("\u05bf"))

        # Table D.2
        self.assertTrue(in_table_d2("\u0041"))
        self.assertFalse(in_table_d2("\u0040"))

        # This would generate a hash of all predicates. However, running
        # it is quite expensive, and only serves to detect changes in the
        # unicode database. Instead, stringprep.py asserts the version of
        # the database.

        # import hashlib
        # import stringprep
        # predicates = sorted(k for k in dir(stringprep)
        #                     if k.startswith("in_table"))
        # for p in predicates:
        #     f = getattr(stringprep, p)
        #     # Collect all BMP code points
        #     data = ["0"] * 0x10000
        #     for i in range(0x10000):
        #         if f(chr(i)):
        #             data[i] = "1"
        #     data = "".join(data)
        #     h = hashlib.sha1()
        #     h.update(data.encode("ascii"))
        #     print(p, h.hexdigest())
90
# Run the test suite when this file is executed directly as a script.
if __name__ == "__main__":
    unittest.main()