You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
93 lines
3.0 KiB
93 lines
3.0 KiB
3 years ago
|
# To fully test this module, we would need a copy of the stringprep tables.
|
||
|
# Since we don't have them, this test checks only a few code points.
|
||
|
|
||
|
import unittest
|
||
|
|
||
|
from stringprep import *
|
||
|
|
||
|
class StringprepTests(unittest.TestCase):
    """Spot checks for the RFC 3454 table helpers exported by ``stringprep``.

    Only a handful of code points per table are probed (typically one that
    is inside the table and a neighbour that is outside it); the complete
    tables are not available to compare against.
    """

    def test(self):
        """Check one member and one non-member for each stringprep table."""
        # A.1: unassigned code points
        self.assertTrue(in_table_a1("\u0221"))
        self.assertFalse(in_table_a1("\u0222"))

        # B.1: commonly mapped to nothing
        self.assertTrue(in_table_b1("\u00ad"))
        self.assertFalse(in_table_b1("\u00ae"))

        # B.2 / B.3: case-folding maps.  These must be assertEqual:
        # assertTrue(x, y) treats y as the failure message and therefore
        # never compares the mapped value against the expected one.
        self.assertEqual(map_table_b2("\u0041"), "\u0061")
        self.assertEqual(map_table_b2("\u0061"), "\u0061")

        self.assertEqual(map_table_b3("\u0041"), "\u0061")
        self.assertEqual(map_table_b3("\u0061"), "\u0061")

        # C.1.1 / C.1.2: space characters
        self.assertTrue(in_table_c11("\u0020"))
        self.assertFalse(in_table_c11("\u0021"))

        self.assertTrue(in_table_c12("\u00a0"))
        self.assertFalse(in_table_c12("\u00a1"))

        self.assertTrue(in_table_c11_c12("\u00a0"))
        self.assertFalse(in_table_c11_c12("\u00a1"))

        # C.2.1 / C.2.2: control characters
        self.assertTrue(in_table_c21("\u001f"))
        self.assertFalse(in_table_c21("\u0020"))

        self.assertTrue(in_table_c22("\u009f"))
        self.assertFalse(in_table_c22("\u00a0"))

        self.assertTrue(in_table_c21_c22("\u009f"))
        self.assertFalse(in_table_c21_c22("\u00a0"))

        # C.3 - C.8
        self.assertTrue(in_table_c3("\ue000"))
        self.assertFalse(in_table_c3("\uf900"))

        self.assertTrue(in_table_c4("\uffff"))
        self.assertFalse(in_table_c4("\u0000"))

        self.assertTrue(in_table_c5("\ud800"))
        self.assertFalse(in_table_c5("\ud7ff"))

        self.assertTrue(in_table_c6("\ufff9"))
        self.assertFalse(in_table_c6("\ufffe"))

        self.assertTrue(in_table_c7("\u2ff0"))
        self.assertFalse(in_table_c7("\u2ffc"))

        self.assertTrue(in_table_c8("\u0340"))
        self.assertFalse(in_table_c8("\u0342"))

        # C.9 is not in the BMP; Python 3 strings can hold these code
        # points directly, so the check no longer has to stay disabled.
        self.assertTrue(in_table_c9("\U000E0001"))
        self.assertFalse(in_table_c9("\U000E0002"))

        # D.1 / D.2: bidirectional properties
        self.assertTrue(in_table_d1("\u05be"))
        self.assertFalse(in_table_d1("\u05bf"))

        self.assertTrue(in_table_d2("\u0041"))
        self.assertFalse(in_table_d2("\u0040"))

        # This would generate a hash of all predicates. However, running
        # it is quite expensive, and only serves to detect changes in the
        # unicode database. Instead, stringprep.py asserts the version of
        # the database.

        # import hashlib
        # import stringprep
        # predicates = [k for k in dir(stringprep) if k.startswith("in_table")]
        # predicates.sort()
        # for p in predicates:
        #     f = getattr(stringprep, p)
        #     # Collect all BMP code points
        #     data = ["0"] * 0x10000
        #     for i in range(0x10000):
        #         if f(chr(i)):
        #             data[i] = "1"
        #     data = "".join(data)
        #     h = hashlib.sha1()
        #     h.update(data.encode("ascii"))
        #     print(p, h.hexdigest())
|
||
|
|
||
|
# Run the test case through unittest's command-line runner when this file
# is executed directly rather than imported.
if __name__ == "__main__":
    unittest.main()
|