@@ -25,93 +25,8 @@ sql: |
2525 ORDER BY c_customer_id
2626 LIMIT 100
2727
28- # Table statistics derived from snow_plan's TableScan information
29- table_statistics :
30- date_dim :
31- num_rows : 73049 # Estimated based on typical date dimension cardinality
32- data_size : 2138624 # Directly from snow_plan: "bytes: 2,138,624"
33- number_of_segments : 1 # From snow_plan: "partitions: 1/1"
34-
35- store_returns :
36- num_rows : 287000000 # Estimated based on data size and typical row size
37- data_size : 124763446272 # Directly from snow_plan: "bytes: 124,763,446,272"
38- number_of_segments : 7070 # From snow_plan: "partitions: 7070/7070"
39-
40- store :
41- num_rows : 1002 # Estimated based on typical store dimension cardinality
42- data_size : 135680 # Directly from snow_plan: "bytes: 135,680"
43- number_of_segments : 1 # From snow_plan: "partitions: 1/1"
44-
45- customer :
46- num_rows : 12000000 # Estimated based on typical customer dimension size
47- data_size : 2328538624 # Directly from snow_plan: "bytes: 2,328,538,624"
48- number_of_segments : 261 # From snow_plan: "partitions: 261/261"
49-
50- # Column statistics derived from query predicates and typical TPC-DS data distributions
51- column_statistics :
52- # Date dimension columns used in the query
53- date_dim.d_year :
54- min : 1990 # Typical range for TPC-DS
55- max : 2010 # Typical range for TPC-DS
56- ndv : 21 # Based on min/max range (2010-1990+1)
57- null_count : 0 # Primary dimension columns typically don't have nulls
58-
59- date_dim.d_date_sk :
60- min : 1 # Typical starting value for surrogate key
61- max : 73049 # Based on table row count
62- ndv : 73049 # Primary key, so NDV equals row count
63- null_count : 0 # Primary key cannot be null
64-
65- # Store returns columns used in the query
66- store_returns.sr_returned_date_sk :
67- min : 1 # Matches date_dim.d_date_sk min
68- max : 73049 # Matches date_dim.d_date_sk max
69- ndv : 73049 # Foreign key to date_dim
70- null_count : 287998 # Inferred from filter in snow_plan: "STORE_RETURNS.SR_RETURNED_DATE_SK IS NOT NULL"
71-
72- store_returns.sr_customer_sk :
73- min : 1 # Typical starting value for surrogate key
74- max : 12000000 # Matches customer.c_customer_sk max
75- ndv : 11000000 # Estimated as slightly less than customer table cardinality
76- null_count : 143500 # Inferred from filter in snow_plan: "STORE_RETURNS.SR_CUSTOMER_SK IS NOT NULL"
77-
78- store_returns.sr_store_sk :
79- min : 1 # Typical starting value for surrogate key
80- max : 1002 # Matches store.s_store_sk max
81- ndv : 1002 # Foreign key to store table
82- null_count : 143500 # Inferred from filter in snow_plan: "STORE_RETURNS.SR_STORE_SK IS NOT NULL"
83-
84- store_returns.sr_return_amt :
85- min : 0.01 # Minimum reasonable return amount
86- max : 10000.00 # Maximum reasonable return amount
87- ndv : 100000 # Estimated based on typical distribution
88- null_count : 0 # Return amount is typically not null
89-
90- # Store columns used in the query
91- store.s_store_sk :
92- min : 1 # Typical starting value for surrogate key
93- max : 1002 # Based on estimated row count
94- ndv : 1002 # Primary key, so NDV equals row count
95- null_count : 0 # Primary key cannot be null
96-
97- store.s_state :
98- min : " AK" # Alaska (alphabetically first US state)
99- max : " WY" # Wyoming (alphabetically last US state)
100- ndv : 50 # Number of US states
101- null_count : 0 # State is typically not null
102-
103- # Customer columns used in the query
104- customer.c_customer_sk :
105- min : 1 # Typical starting value for surrogate key
106- max : 12000000 # Based on estimated row count
107- ndv : 12000000 # Primary key, so NDV equals row count
108- null_count : 0 # Primary key cannot be null
109-
110- customer.c_customer_id :
111- min : " AAAAAAAAAAAAAA" # Lexicographically smallest possible customer ID
112- max : " ZZZZZZZZZZZZZZ" # Lexicographically largest possible customer ID
113- ndv : 12000000 # Same as c_customer_sk (1:1 relationship)
114- null_count : 0 # Customer ID is typically not null
28+ # Reference to external statistics file
29+ statistics_file : statistics.yaml
11530
11631raw_plan : |
11732 Limit
0 commit comments