|
| 1 | +import uuid |
| 2 | + |
| 3 | +from data_diff.abcs.database_types import String_UUID |
| 4 | +from data_diff.databases import MySQL |
| 5 | +from data_diff.table_segment import create_mesh_from_points |
| 6 | +from data_diff.utils import ArithUUID, safezip |
| 7 | +from tests.common import DiffTestCase, table_segment |
| 8 | + |
| 9 | + |
| 10 | +# We do not need real tables, just any reference to them for proper object creation. |
class TestDiffMesh(DiffTestCase):
    """Check that UUID key meta-parameters survive key bounding and meshing.

    The two sides use ``String_UUID`` key types with opposite
    ``lowercase``/``uppercase`` flags. The tests verify that the flags set on a
    column type reach the ``ArithUUID`` values it creates, and that segments
    produced by ``new_key_bounds`` carry the flags of their own side.

    Real tables are not required; a table reference is only needed so that the
    segment objects can be created.
    """

    db_cls = MySQL

    # Side B's range is wider than side A's to ensure there are "outer" regions.
    _MIN_UUID1 = uuid.UUID("11111111-1111-1111-1111-111111111111")
    _MAX_UUID1 = uuid.UUID("EEEEEEEE-EEEE-EEEE-EEEE-EEEEEEEEEEEE")
    _MIN_UUID2 = uuid.UUID("00000000-0000-0000-0000-000000000000")
    _MAX_UUID2 = uuid.UUID("FFFFFFFF-FFFF-FFFF-FFFF-FFFFFFFFFFFF")

    # Letter-case flags of the key column on each side.
    _FLAGS1 = {"lowercase": True, "uppercase": False}
    _FLAGS2 = {"lowercase": False, "uppercase": True}

    def _key_types(self):
        """Return fresh ``(key_types1, key_types2)`` lists, one ``String_UUID`` per side."""
        return [String_UUID(**self._FLAGS1)], [String_UUID(**self._FLAGS2)]

    @staticmethod
    def _bounds(key_types, min_uuid, max_uuid):
        """Return one-element ``(min_key, max_key)`` tuples made by the first key type."""
        key_type = key_types[0]
        return (key_type.make_value(min_uuid),), (key_type.make_value(max_uuid),)

    def _segment(self):
        """Create a table segment over the source table path of this test case."""
        return table_segment(self.connection, self.table_src_path, "id", "timestamp", case_sensitive=False)

    @staticmethod
    def _assert_key(key, expected_uuid, *, lowercase, uppercase):
        """Assert that ``key`` holds ``expected_uuid`` and exactly the given case flags."""
        assert key.uuid == expected_uuid
        # Identity rather than ``==``: ``1 == True`` holds in Python, so an
        # equality check would also accept non-bool values.
        assert key.lowercase is lowercase
        assert key.uppercase is uppercase

    def _assert_bounds(self, segment, min_uuid, max_uuid, flags):
        """Assert both key bounds of ``segment`` carry the expected UUIDs and ``flags``."""
        self._assert_key(segment.min_key[0], min_uuid, **flags)
        self._assert_key(segment.max_key[0], max_uuid, **flags)

    def test_meta_parameters_passed_from_coltypes_to_values(self):
        """Values made by a ``String_UUID`` type inherit its case flags."""
        key_types1, key_types2 = self._key_types()
        min_key1, max_key1 = self._bounds(key_types1, self._MIN_UUID1, self._MAX_UUID1)
        min_key2, max_key2 = self._bounds(key_types2, self._MIN_UUID2, self._MAX_UUID2)

        # Verify that we pass the meta-parameters from col types to values:
        for key in (*min_key1, *max_key1, *min_key2, *max_key2):
            assert isinstance(key, ArithUUID)

        self._assert_key(min_key1[0], self._MIN_UUID1, **self._FLAGS1)
        self._assert_key(max_key1[0], self._MAX_UUID1, **self._FLAGS1)
        self._assert_key(min_key2[0], self._MIN_UUID2, **self._FLAGS2)
        self._assert_key(max_key2[0], self._MAX_UUID2, **self._FLAGS2)

    def test_meta_parameters_left_as_is_if_not_casted(self):
        """Without ``key_types``, ``new_key_bounds`` keeps the very same key objects."""
        table1 = self._segment()
        key_types1, _ = self._key_types()
        min_key1, max_key1 = self._bounds(key_types1, self._MIN_UUID1, self._MAX_UUID1)

        btable1 = table1.new_key_bounds(min_key=min_key1, max_key=max_key1)
        assert btable1.min_key[0] is min_key1[0]  # by identity, not by equality
        assert btable1.max_key[0] is max_key1[0]  # by identity, not by equality

    def test_mesh_keys_meta_parameters_preserved(self):
        """Inner and outer mesh segments carry the case flags of their own side."""
        table1 = self._segment()
        table2 = self._segment()
        key_types1, key_types2 = self._key_types()
        min_key1, max_key1 = self._bounds(key_types1, self._MIN_UUID1, self._MAX_UUID1)
        min_key2, max_key2 = self._bounds(key_types2, self._MIN_UUID2, self._MAX_UUID2)

        # This is what TableDiffer._bisect_and_diff_tables() does, precisely (yes, using key1!):
        btable1 = table1.new_key_bounds(min_key=min_key1, max_key=max_key1, key_types=key_types1)
        btable2 = table2.new_key_bounds(min_key=min_key1, max_key=max_key1, key_types=key_types2)

        # Verify that both sides have proper (the side-specific) pk meta-parameters:
        self._assert_bounds(btable1, self._MIN_UUID1, self._MAX_UUID1, self._FLAGS1)
        self._assert_bounds(btable2, self._MIN_UUID1, self._MAX_UUID1, self._FLAGS2)

        # This is what TableDiffer._bisect_and_diff_tables() does, precisely:
        points = [sorted(p) for p in safezip(min_key1, min_key2, max_key1, max_key2)]
        box_mesh = create_mesh_from_points(*points)
        new_regions = [(p1, p2) for p1, p2 in box_mesh if p1 < p2 and not (p1 >= min_key1 and p2 <= max_key1)]
        extra_tables = [
            (
                table1.new_key_bounds(min_key=p1, max_key=p2, key_types=key_types1),
                table2.new_key_bounds(min_key=p1, max_key=p2, key_types=key_types2),
            )
            for p1, p2 in new_regions
        ]

        # Verify that extra ("outer") segments have the proper pk meta-parameters:
        expected_regions = [
            (self._MIN_UUID2, self._MIN_UUID1),  # region below side A's range
            (self._MAX_UUID1, self._MAX_UUID2),  # region above side A's range
        ]
        # Checked before zipping so that a missing or surplus region cannot be
        # silently truncated away by zip().
        assert len(extra_tables) == 2

        for (segment1, segment2), (low_uuid, high_uuid) in zip(extra_tables, expected_regions):
            self._assert_bounds(segment1, low_uuid, high_uuid, self._FLAGS1)
            self._assert_bounds(segment2, low_uuid, high_uuid, self._FLAGS2)
0 commit comments