test_stringprep.py 3.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596
  1. # To fully test this module, we would need a copy of the stringprep tables.
  2. # Since we don't have them, this test checks only a few code points.
  3. import unittest
  4. from test import test_support
  5. from stringprep import *
  6. class StringprepTests(unittest.TestCase):
  7. def test(self):
  8. self.assertTrue(in_table_a1(u"\u0221"))
  9. self.assertFalse(in_table_a1(u"\u0222"))
  10. self.assertTrue(in_table_b1(u"\u00ad"))
  11. self.assertFalse(in_table_b1(u"\u00ae"))
  12. self.assertTrue(map_table_b2(u"\u0041"), u"\u0061")
  13. self.assertTrue(map_table_b2(u"\u0061"), u"\u0061")
  14. self.assertTrue(map_table_b3(u"\u0041"), u"\u0061")
  15. self.assertTrue(map_table_b3(u"\u0061"), u"\u0061")
  16. self.assertTrue(in_table_c11(u"\u0020"))
  17. self.assertFalse(in_table_c11(u"\u0021"))
  18. self.assertTrue(in_table_c12(u"\u00a0"))
  19. self.assertFalse(in_table_c12(u"\u00a1"))
  20. self.assertTrue(in_table_c12(u"\u00a0"))
  21. self.assertFalse(in_table_c12(u"\u00a1"))
  22. self.assertTrue(in_table_c11_c12(u"\u00a0"))
  23. self.assertFalse(in_table_c11_c12(u"\u00a1"))
  24. self.assertTrue(in_table_c21(u"\u001f"))
  25. self.assertFalse(in_table_c21(u"\u0020"))
  26. self.assertTrue(in_table_c22(u"\u009f"))
  27. self.assertFalse(in_table_c22(u"\u00a0"))
  28. self.assertTrue(in_table_c21_c22(u"\u009f"))
  29. self.assertFalse(in_table_c21_c22(u"\u00a0"))
  30. self.assertTrue(in_table_c3(u"\ue000"))
  31. self.assertFalse(in_table_c3(u"\uf900"))
  32. self.assertTrue(in_table_c4(u"\uffff"))
  33. self.assertFalse(in_table_c4(u"\u0000"))
  34. self.assertTrue(in_table_c5(u"\ud800"))
  35. self.assertFalse(in_table_c5(u"\ud7ff"))
  36. self.assertTrue(in_table_c6(u"\ufff9"))
  37. self.assertFalse(in_table_c6(u"\ufffe"))
  38. self.assertTrue(in_table_c7(u"\u2ff0"))
  39. self.assertFalse(in_table_c7(u"\u2ffc"))
  40. self.assertTrue(in_table_c8(u"\u0340"))
  41. self.assertFalse(in_table_c8(u"\u0342"))
  42. # C.9 is not in the bmp
  43. # self.assertTrue(in_table_c9(u"\U000E0001"))
  44. # self.assertFalse(in_table_c8(u"\U000E0002"))
  45. self.assertTrue(in_table_d1(u"\u05be"))
  46. self.assertFalse(in_table_d1(u"\u05bf"))
  47. self.assertTrue(in_table_d2(u"\u0041"))
  48. self.assertFalse(in_table_d2(u"\u0040"))
  49. # This would generate a hash of all predicates. However, running
  50. # it is quite expensive, and only serves to detect changes in the
  51. # unicode database. Instead, stringprep.py asserts the version of
  52. # the database.
  53. # import hashlib
  54. # predicates = [k for k in dir(stringprep) if k.startswith("in_table")]
  55. # predicates.sort()
  56. # for p in predicates:
  57. # f = getattr(stringprep, p)
  58. # # Collect all BMP code points
  59. # data = ["0"] * 0x10000
  60. # for i in range(0x10000):
  61. # if f(unichr(i)):
  62. # data[i] = "1"
  63. # data = "".join(data)
  64. # h = hashlib.sha1()
  65. # h.update(data)
  66. # print p, h.hexdigest()
  67. def test_main():
  68. test_support.run_unittest(StringprepTests)
  69. if __name__ == '__main__':
  70. test_main()