test_stringprep.py 3.0 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192
  1. # To fully test this module, we would need a copy of the stringprep tables.
  2. # Since we don't have them, this test checks only a few code points.
  3. import unittest
  4. from stringprep import *
  5. class StringprepTests(unittest.TestCase):
  6. def test(self):
  7. self.assertTrue(in_table_a1("\u0221"))
  8. self.assertFalse(in_table_a1("\u0222"))
  9. self.assertTrue(in_table_b1("\u00ad"))
  10. self.assertFalse(in_table_b1("\u00ae"))
  11. self.assertTrue(map_table_b2("\u0041"), "\u0061")
  12. self.assertTrue(map_table_b2("\u0061"), "\u0061")
  13. self.assertTrue(map_table_b3("\u0041"), "\u0061")
  14. self.assertTrue(map_table_b3("\u0061"), "\u0061")
  15. self.assertTrue(in_table_c11("\u0020"))
  16. self.assertFalse(in_table_c11("\u0021"))
  17. self.assertTrue(in_table_c12("\u00a0"))
  18. self.assertFalse(in_table_c12("\u00a1"))
  19. self.assertTrue(in_table_c12("\u00a0"))
  20. self.assertFalse(in_table_c12("\u00a1"))
  21. self.assertTrue(in_table_c11_c12("\u00a0"))
  22. self.assertFalse(in_table_c11_c12("\u00a1"))
  23. self.assertTrue(in_table_c21("\u001f"))
  24. self.assertFalse(in_table_c21("\u0020"))
  25. self.assertTrue(in_table_c22("\u009f"))
  26. self.assertFalse(in_table_c22("\u00a0"))
  27. self.assertTrue(in_table_c21_c22("\u009f"))
  28. self.assertFalse(in_table_c21_c22("\u00a0"))
  29. self.assertTrue(in_table_c3("\ue000"))
  30. self.assertFalse(in_table_c3("\uf900"))
  31. self.assertTrue(in_table_c4("\uffff"))
  32. self.assertFalse(in_table_c4("\u0000"))
  33. self.assertTrue(in_table_c5("\ud800"))
  34. self.assertFalse(in_table_c5("\ud7ff"))
  35. self.assertTrue(in_table_c6("\ufff9"))
  36. self.assertFalse(in_table_c6("\ufffe"))
  37. self.assertTrue(in_table_c7("\u2ff0"))
  38. self.assertFalse(in_table_c7("\u2ffc"))
  39. self.assertTrue(in_table_c8("\u0340"))
  40. self.assertFalse(in_table_c8("\u0342"))
  41. # C.9 is not in the bmp
  42. # self.assertTrue(in_table_c9(u"\U000E0001"))
  43. # self.assertFalse(in_table_c8(u"\U000E0002"))
  44. self.assertTrue(in_table_d1("\u05be"))
  45. self.assertFalse(in_table_d1("\u05bf"))
  46. self.assertTrue(in_table_d2("\u0041"))
  47. self.assertFalse(in_table_d2("\u0040"))
  48. # This would generate a hash of all predicates. However, running
  49. # it is quite expensive, and only serves to detect changes in the
  50. # unicode database. Instead, stringprep.py asserts the version of
  51. # the database.
  52. # import hashlib
  53. # predicates = [k for k in dir(stringprep) if k.startswith("in_table")]
  54. # predicates.sort()
  55. # for p in predicates:
  56. # f = getattr(stringprep, p)
  57. # # Collect all BMP code points
  58. # data = ["0"] * 0x10000
  59. # for i in range(0x10000):
  60. # if f(unichr(i)):
  61. # data[i] = "1"
  62. # data = "".join(data)
  63. # h = hashlib.sha1()
  64. # h.update(data)
  65. # print p, h.hexdigest()
  66. if __name__ == '__main__':
  67. unittest.main()