-
Notifications
You must be signed in to change notification settings - Fork 208
Expand file tree
/
Copy pathtest_data_contract_checks.py
More file actions
110 lines (73 loc) · 4.14 KB
/
test_data_contract_checks.py
File metadata and controls
110 lines (73 loc) · 4.14 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
import yaml
from open_data_contract_standard.model import DataQuality, Server
from datacontract.engines.data_contract_checks import (
QuotingConfig,
check_property_invalid_values,
check_property_missing_values,
prepare_query,
)
def test_prepare_query_schema_placeholder():
    """Check that {schema} and {model} expand to the server schema and the model name."""
    sql_check = DataQuality(type="sql", query="SELECT * FROM {schema}.{model}")
    server_kwargs = {"type": "postgres", "schema": "my_schema"}
    pg_server = Server(**server_kwargs)

    rendered = prepare_query(sql_check, "my_table", None, QuotingConfig(), pg_server)

    expected = "SELECT * FROM my_schema.my_table"
    assert rendered == expected
def test_prepare_query_schema_placeholder_quoted():
    """Check that schema and model are double-quoted when quote_model_name is enabled."""
    sql_check = DataQuality(type="sql", query="SELECT * FROM {schema}.{model}")
    server_kwargs = {"type": "postgres", "schema": "my_schema"}
    pg_server = Server(**server_kwargs)
    double_quoting = QuotingConfig(quote_model_name=True)

    rendered = prepare_query(sql_check, "my_table", None, double_quoting, pg_server)

    expected = 'SELECT * FROM "my_schema"."my_table"'
    assert rendered == expected
def test_prepare_query_schema_placeholder_backticks():
    """Check that schema and model are wrapped in backticks when backtick quoting is enabled."""
    sql_check = DataQuality(type="sql", query="SELECT * FROM {schema}.{model}")
    server_kwargs = {"type": "bigquery", "schema": "my_dataset"}
    bq_server = Server(**server_kwargs)
    backtick_quoting = QuotingConfig(quote_model_name_with_backticks=True)

    rendered = prepare_query(sql_check, "my_table", None, backtick_quoting, bq_server)

    expected = "SELECT * FROM `my_dataset`.`my_table`"
    assert rendered == expected
def test_prepare_query_schema_placeholder_no_server():
    """Check that {schema} resolves to the model name when no server is passed."""
    sql_check = DataQuality(type="sql", query="SELECT * FROM {schema}")

    # The server argument is deliberately None to exercise the fallback.
    rendered = prepare_query(sql_check, "my_table", None, QuotingConfig(), None)

    expected = "SELECT * FROM my_table"
    assert rendered == expected
def test_prepare_query_schema_placeholder_no_schema():
    """Check that {schema} resolves to the model name when the server defines no schema."""
    sql_check = DataQuality(type="sql", query="SELECT * FROM {schema}")
    # Only the server type is set; no schema is supplied.
    schemaless_server = Server(type="postgres")

    rendered = prepare_query(sql_check, "my_table", None, QuotingConfig(), schemaless_server)

    expected = "SELECT * FROM my_table"
    assert rendered == expected
def test_prepare_query_schema_placeholder_with_dollar():
    """Check that the $-prefixed forms ${schema} and ${model} are substituted as well."""
    sql_check = DataQuality(type="sql", query="SELECT * FROM ${schema}.${model}")
    server_kwargs = {"type": "postgres", "schema": "my_schema"}
    pg_server = Server(**server_kwargs)

    rendered = prepare_query(sql_check, "my_table", None, QuotingConfig(), pg_server)

    expected = "SELECT * FROM my_schema.my_table"
    assert rendered == expected
def test_prepare_query_all_placeholders_with_dollar():
    """Check that ${column}, ${schema} and ${table} are all substituted in one query."""
    sql_check = DataQuality(type="sql", query="SELECT ${column} FROM ${schema}.${table}")
    server_kwargs = {"type": "postgres", "schema": "my_schema"}
    pg_server = Server(**server_kwargs)

    rendered = prepare_query(sql_check, "my_table", "my_field", QuotingConfig(), pg_server)

    expected = "SELECT my_field FROM my_schema.my_table"
    assert rendered == expected
def test_check_property_invalid_values_escapes_single_quotes():
    """Check that each single quote in the valid values is doubled in the generated check."""
    raw_values = ["peter's", "john's"]

    check = check_property_invalid_values(
        model_name="test_model",
        field_name="test_field",
        threshold="= 0",
        valid_values=raw_values,
    )

    # The implementation is YAML text; walk down to the emitted "valid values" list.
    parsed = yaml.safe_load(check.implementation)
    first_check = parsed["checks for test_model"][0]
    emitted_values = first_check["invalid_count(test_field) = 0"]["valid values"]

    expected = ["peter''s", "john''s"]
    assert emitted_values == expected
def test_check_property_missing_values_escapes_single_quotes():
    """Check that each single quote in the missing values is doubled in the generated check."""
    raw_values = ["N/A", "peter's"]

    check = check_property_missing_values(
        model_name="test_model",
        field_name="test_field",
        threshold="= 0",
        missing_values=raw_values,
    )

    # The implementation is YAML text; walk down to the emitted "missing values" list.
    parsed = yaml.safe_load(check.implementation)
    first_check = parsed["checks for test_model"][0]
    emitted_values = first_check["missing_count(test_field) = 0"]["missing values"]

    # A value without a quote ("N/A") is expected to pass through unchanged.
    expected = ["N/A", "peter''s"]
    assert emitted_values == expected