# Spot checks for the stringprep module.
#
# To fully test this module, we would need a copy of the stringprep tables.
# Since we don't have them, this test checks only a few codepoints: for most
# tables, one code point that must be reported as a member and one that must
# not.

from test.test_support import verify, vereq

import stringprep
from stringprep import *

# Membership predicates: verify() fails when its first argument is false.
verify(in_table_a1(u"\u0221"))
verify(not in_table_a1(u"\u0222"))

verify(in_table_b1(u"\u00ad"))
verify(not in_table_b1(u"\u00ae"))

# Mapping tables return a string, so compare the result with vereq().
# verify()'s second argument is only the failure reason; passing the
# expected value there would compare nothing and accept any non-empty
# result.
vereq(map_table_b2(u"\u0041"), u"\u0061")
vereq(map_table_b2(u"\u0061"), u"\u0061")

vereq(map_table_b3(u"\u0041"), u"\u0061")
vereq(map_table_b3(u"\u0061"), u"\u0061")

verify(in_table_c11(u"\u0020"))
verify(not in_table_c11(u"\u0021"))

verify(in_table_c12(u"\u00a0"))
verify(not in_table_c12(u"\u00a1"))

verify(in_table_c11_c12(u"\u00a0"))
verify(not in_table_c11_c12(u"\u00a1"))

verify(in_table_c21(u"\u001f"))
verify(not in_table_c21(u"\u0020"))

verify(in_table_c22(u"\u009f"))
verify(not in_table_c22(u"\u00a0"))

verify(in_table_c21_c22(u"\u009f"))
verify(not in_table_c21_c22(u"\u00a0"))

verify(in_table_c3(u"\ue000"))
verify(not in_table_c3(u"\uf900"))

verify(in_table_c4(u"\uffff"))
verify(not in_table_c4(u"\u0000"))

verify(in_table_c5(u"\ud800"))
verify(not in_table_c5(u"\ud7ff"))

verify(in_table_c6(u"\ufff9"))
verify(not in_table_c6(u"\ufffe"))

verify(in_table_c7(u"\u2ff0"))
verify(not in_table_c7(u"\u2ffc"))

verify(in_table_c8(u"\u0340"))
verify(not in_table_c8(u"\u0342"))

# C.9 is not in the BMP, so these checks are left disabled.
# verify(in_table_c9(u"\U000E0001"))
# verify(not in_table_c9(u"\U000E0002"))

verify(in_table_d1(u"\u05be"))
verify(not in_table_d1(u"\u05bf"))

verify(in_table_d2(u"\u0041"))
verify(not in_table_d2(u"\u0040"))

# This would generate a hash of all predicates. However, running
# it is quite expensive, and only serves to detect changes in the
# unicode database. Instead, stringprep.py asserts the version of
# the database.

# import hashlib
# predicates = [k for k in dir(stringprep) if k.startswith("in_table")]
# predicates.sort()
# for p in predicates:
#     f = getattr(stringprep, p)
#     # Collect all BMP code points
#     data = ["0"] * 0x10000
#     for i in range(0x10000):
#         if f(unichr(i)):
#             data[i] = "1"
#     data = "".join(data)
#     h = hashlib.sha1()
#     h.update(data)
#     print p, h.hexdigest()