cockroachdb
diff --git a/‎pkg/ccl/logictestccl/testdata/logic_test/regional_by_row_cascade‎
Lines changed: 127 additions & 0 deletions b/‎pkg/ccl/logictestccl/testdata/logic_test/regional_by_row_cascade‎
Lines changed: 127 additions & 0 deletions
diff --git a/‎pkg/ccl/logictestccl/testdata/logic_test/regional_by_row_query_behavior‎
Lines changed: 16 additions & 0 deletions b/‎pkg/ccl/logictestccl/testdata/logic_test/regional_by_row_query_behavior‎
Lines changed: 16 additions & 0 deletions
diff --git a/‎pkg/sql/exec_util.go‎
Lines changed: 16 additions & 0 deletions b/‎pkg/sql/exec_util.go‎
Lines changed: 16 additions & 0 deletions
diff --git a/‎pkg/sql/logictest/testdata/logic_test/information_schema‎
Lines changed: 4 additions & 0 deletions b/‎pkg/sql/logictest/testdata/logic_test/information_schema‎
Lines changed: 4 additions & 0 deletions
diff --git a/‎pkg/sql/logictest/testdata/logic_test/pg_catalog‎
Lines changed: 12 additions & 0 deletions b/‎pkg/sql/logictest/testdata/logic_test/pg_catalog‎
Lines changed: 12 additions & 0 deletions
diff --git a/‎pkg/sql/logictest/testdata/logic_test/show_source‎
Lines changed: 4 additions & 0 deletions b/‎pkg/sql/logictest/testdata/logic_test/show_source‎
Lines changed: 4 additions & 0 deletions
@@ -58,15 +58,36 @@ INSERT INTO child (c, p, crdb_region) VALUES (1000, 100, 'us-east-1'), (2000, 20
 statement ok
 ANALYZE great_grandparent;
 
+# Only the scan in the main query is parallelized when we don't have stats on
+# the descendant tables.
+query I
+SELECT count(*) FROM [EXPLAIN (VERBOSE) DELETE FROM great_grandparent WHERE i = 1] WHERE info LIKE '%parallel%';
+----
+1
+
 statement ok
 ANALYZE grandparent;
 
+# Now we should also parallelize the lookup join into the grandparent table.
+query I
+SELECT count(*) FROM [EXPLAIN (VERBOSE) DELETE FROM great_grandparent WHERE i = 1] WHERE info LIKE '%parallel%';
+----
+2
+
 statement ok
 ANALYZE parent;
 
+# Now we should also parallelize the lookup join into the parent table.
+query I
+SELECT count(*) FROM [EXPLAIN (VERBOSE) DELETE FROM great_grandparent WHERE i = 1] WHERE info LIKE '%parallel%';
+----
+3
+
 statement ok
 ANALYZE child;
 
+# Finally, all three lookup joins as well as the scan in the main query should
+# be parallelized.
 query T
 EXPLAIN (VERBOSE) DELETE FROM great_grandparent WHERE i = 1;
 ----
@@ -126,6 +147,7 @@ vectorized: true
         │               │ estimated row count: 3
         │               │ table: grandparent@grandparent_gg_idx
         │               │ lookup condition: (crdb_region IN ('ap-southeast-2', 'ca-central-1', 'us-east-1')) AND (gg = gg)
+        │               │ parallel
         │               │
         │               └── • distinct
         │                   │ columns: (gg)
@@ -163,6 +185,7 @@ vectorized: true
                 │               │ estimated row count: 3
                 │               │ table: parent@parent_g_idx
                 │               │ lookup condition: (crdb_region IN ('ap-southeast-2', 'ca-central-1', 'us-east-1')) AND (g = g)
+                │               │ parallel
                 │               │
                 │               └── • distinct
                 │                   │ columns: (g)
@@ -193,6 +216,7 @@ vectorized: true
                                 │ estimated row count: 3
                                 │ table: child@child_p_idx
                                 │ lookup condition: (crdb_region IN ('ap-southeast-2', 'ca-central-1', 'us-east-1')) AND (p = p)
+                                │ parallel
                                 │
                                 └── • distinct
                                     │ columns: (p)
@@ -206,3 +230,106 @@ vectorized: true
                                               columns: (p, g, crdb_region)
                                               estimated row count: 100
                                               label: buffer 1000000
+
+statement ok
+SET parallelize_multi_key_lookup_joins_avg_lookup_ratio = 0;
+
+# Only the scan in the main query is parallelized when the "average lookup
+# ratio" heuristic is disabled.
+query I
+SELECT count(*) FROM [EXPLAIN (VERBOSE) DELETE FROM great_grandparent WHERE i = 1] WHERE info LIKE '%parallel%';
+----
+1
+
+statement ok
+RESET parallelize_multi_key_lookup_joins_avg_lookup_ratio;
+
+# All three lookup joins as well as the scan in the main query should be
+# parallelized.
+query I
+SELECT count(*) FROM [EXPLAIN (VERBOSE) DELETE FROM great_grandparent WHERE i = 1] WHERE info LIKE '%parallel%';
+----
+4
+
+# Inject table stats for the grandparent table to simulate the case where each
+# of the three regions stores 100k rows. The lookup into the table should still
+# be parallelized (if it's not, then we're using the wrong ColumnIDs when
+# retrieving column stats).
+statement ok
+ALTER TABLE grandparent INJECT STATISTICS '[
+    {
+        "avg_size": 4,
+        "columns": [
+            "crdb_region"
+        ],
+        "created_at": "2025-01-01 00:00:00.000000",
+        "distinct_count": 3,
+        "histo_col_type": "",
+        "name": "__auto__",
+        "null_count": 0,
+        "row_count": 300000
+    },
+    {
+        "avg_size": 2,
+        "columns": [
+            "gg"
+        ],
+        "created_at": "2025-01-01 00:00:00.000000",
+        "distinct_count": 300000,
+        "histo_buckets": [
+            {"distinct_range": 0, "num_eq": 1, "num_range": 0, "upper_bound": "1"},
+            {"distinct_range": 299999, "num_eq": 1, "num_range": 299999, "upper_bound": "300000"}
+        ],
+        "histo_col_type": "INT8",
+        "histo_version": 3,
+        "name": "__auto__",
+        "null_count": 0,
+        "row_count": 300000
+    }
+]'
+
+query I
+SELECT count(*) FROM [EXPLAIN (VERBOSE) DELETE FROM great_grandparent WHERE i = 1] WHERE info LIKE '%parallel%';
+----
+4
+
+# Now simulate a scenario where many rows have NULLs in the lookup column 'gg'.
+# The lookup into the table should still be parallelized (if it's not, then
+# we're incorrectly considering NULLs in the heuristic).
+statement ok
+ALTER TABLE grandparent INJECT STATISTICS '[
+    {
+        "avg_size": 4,
+        "columns": [
+            "crdb_region"
+        ],
+        "created_at": "2025-01-01 00:00:00.000000",
+        "distinct_count": 3,
+        "histo_col_type": "",
+        "name": "__auto__",
+        "null_count": 0,
+        "row_count": 1000000
+    },
+    {
+        "avg_size": 2,
+        "columns": [
+            "gg"
+        ],
+        "created_at": "2025-01-01 00:00:00.000000",
+        "distinct_count": 300000,
+        "histo_buckets": [
+            {"distinct_range": 0, "num_eq": 1, "num_range": 0, "upper_bound": "1"},
+            {"distinct_range": 299999, "num_eq": 1, "num_range": 299999, "upper_bound": "300000"}
+        ],
+        "histo_col_type": "INT8",
+        "histo_version": 3,
+        "name": "__auto__",
+        "null_count": 700000,
+        "row_count": 1000000
+    }
+]'
+
+query I
+SELECT count(*) FROM [EXPLAIN (VERBOSE) DELETE FROM great_grandparent WHERE i = 1] WHERE info LIKE '%parallel%';
+----
+4
@@ -3626,6 +3626,22 @@ vectorized: true
               table: abc@abc_id1_id2_idx
               spans: /"@"/"m\xa4\xf3V\xe5&Kx\xb9\xf9\xbb\xb1\xa7\xfc\x12\xd6"/"h\b\x87\x06\x02\xc6Gѹ\x93\xa4!\xcdv\x1f+"-/"@"/"m\xa4\xf3V\xe5&Kx\xb9\xf9\xbb\xb1\xa7\xfc\x12\xd6"/"h\b\x87\x06\x02\xc6Gѹ\x93\xa4!\xcdv\x1f+"/PrefixEnd
 
+# Same query as above but ensure that the "average lookup ratio" parallelization
+# heuristic applies to the SELECT statement (both the index join and the lookup
+# join should be parallelized).
+statement ok
+SET parallelize_multi_key_lookup_joins_only_on_mr_mutations = false;
+
+query I
+SELECT count(*) FROM [
+  EXPLAIN (VERBOSE) SELECT xyz.str, abc.id, abc.id1, abc.id2, abc.created_at, abc.updated_at FROM abc JOIN xyz ON xyz.abc_id = abc.id AND xyz.id2 = abc.id2 AND xyz.crdb_region = abc.crdb_region WHERE abc.id1 = '6da4f356-e526-4b78-b9f9-bbb1a7fc12d6' AND abc.id2 = '68088706-02c6-47d1-b993-a421cd761f2b' AND abc.crdb_region = 'ap-southeast-2' AND xyz.crdb_region = 'ap-southeast-2'
+] WHERE info LIKE '%parallel%';
+----
+2
+
+statement ok
+RESET parallelize_multi_key_lookup_joins_only_on_mr_mutations;
+
 # The following should use a string of 4 lookup/index joins with a cost under 200.
 query T retry
 EXPLAIN(opt,verbose) SELECT
 
@@ -3871,6 +3871,22 @@ func (m *sessionDataMutator) SetParallelizeMultiKeyLookupJoinsEnabled(val bool)
 	m.data.ParallelizeMultiKeyLookupJoinsEnabled = val
 }
 
+// SetParallelizeMultiKeyLookupJoinsAvgLookupRatio stores val in the
+// ParallelizeMultiKeyLookupJoinsAvgLookupRatio field of the mutator's session
+// data.
+// NOTE(review): presumably backs the
+// parallelize_multi_key_lookup_joins_avg_lookup_ratio session variable -
+// confirm against the variable's definition.
+func (m *sessionDataMutator) SetParallelizeMultiKeyLookupJoinsAvgLookupRatio(val float64) {
+	m.data.ParallelizeMultiKeyLookupJoinsAvgLookupRatio = val
+}
+
+// SetParallelizeMultiKeyLookupJoinsMaxLookupRatio stores val in the
+// ParallelizeMultiKeyLookupJoinsMaxLookupRatio field of the mutator's session
+// data.
+// NOTE(review): presumably backs the
+// parallelize_multi_key_lookup_joins_max_lookup_ratio session variable -
+// confirm against the variable's definition.
+func (m *sessionDataMutator) SetParallelizeMultiKeyLookupJoinsMaxLookupRatio(val float64) {
+	m.data.ParallelizeMultiKeyLookupJoinsMaxLookupRatio = val
+}
+
+// SetParallelizeMultiKeyLookupJoinsAvgLookupRowSize stores val in the
+// ParallelizeMultiKeyLookupJoinsAvgLookupRowSize field of the mutator's
+// session data.
+// NOTE(review): val is presumably a size in bytes backing the
+// parallelize_multi_key_lookup_joins_avg_lookup_row_size session variable -
+// confirm against the variable's definition.
+func (m *sessionDataMutator) SetParallelizeMultiKeyLookupJoinsAvgLookupRowSize(val int64) {
+	m.data.ParallelizeMultiKeyLookupJoinsAvgLookupRowSize = val
+}
+
+// SetParallelizeMultiKeyLookupJoinsOnlyOnMRMutations stores val in the
+// ParallelizeMultiKeyLookupJoinsOnlyOnMRMutations field of the mutator's
+// session data.
+// NOTE(review): presumably backs the
+// parallelize_multi_key_lookup_joins_only_on_mr_mutations session variable -
+// confirm against the variable's definition.
+func (m *sessionDataMutator) SetParallelizeMultiKeyLookupJoinsOnlyOnMRMutations(val bool) {
+	m.data.ParallelizeMultiKeyLookupJoinsOnlyOnMRMutations = val
+}
+
 // TODO(harding): Remove this when costing scans based on average column size
 // is fully supported.
 func (m *sessionDataMutator) SetCostScansWithDefaultColSize(val bool) {
 
@@ -4080,7 +4080,11 @@ optimizer_use_provided_ordering_fix                              on
 optimizer_use_trigram_similarity_optimization                    on
 optimizer_use_virtual_computed_column_stats                      on
 override_multi_region_zone_config                                off
+parallelize_multi_key_lookup_joins_avg_lookup_ratio              10
+parallelize_multi_key_lookup_joins_avg_lookup_row_size           100 KiB
 parallelize_multi_key_lookup_joins_enabled                       off
+parallelize_multi_key_lookup_joins_max_lookup_ratio              10000
+parallelize_multi_key_lookup_joins_only_on_mr_mutations          on
 password_encryption                                              scram-sha-256
 pg_trgm.similarity_threshold                                     0.3
 plan_cache_mode                                                  auto
 
@@ -3083,7 +3083,11 @@ optimizer_use_provided_ordering_fix                              on
 optimizer_use_trigram_similarity_optimization                    on                  NULL      NULL        NULL        string
 optimizer_use_virtual_computed_column_stats                      on                  NULL      NULL        NULL        string
 override_multi_region_zone_config                                off                 NULL      NULL        NULL        string
+parallelize_multi_key_lookup_joins_avg_lookup_ratio              10                  NULL      NULL        NULL        string
+parallelize_multi_key_lookup_joins_avg_lookup_row_size           100 KiB             NULL      NULL        NULL        string
 parallelize_multi_key_lookup_joins_enabled                       off                 NULL      NULL        NULL        string
+parallelize_multi_key_lookup_joins_max_lookup_ratio              10000               NULL      NULL        NULL        string
+parallelize_multi_key_lookup_joins_only_on_mr_mutations          on                  NULL      NULL        NULL        string
 password_encryption                                              scram-sha-256       NULL      NULL        NULL        string
 pg_trgm.similarity_threshold                                     0.3                 NULL      NULL        NULL        string
 plan_cache_mode                                                  auto                NULL      NULL        NULL        string
@@ -3320,7 +3324,11 @@ optimizer_use_provided_ordering_fix                              on
 optimizer_use_trigram_similarity_optimization                    on                  NULL  user     NULL      on                  on
 optimizer_use_virtual_computed_column_stats                      on                  NULL  user     NULL      on                  on
 override_multi_region_zone_config                                off                 NULL  user     NULL      off                 off
+parallelize_multi_key_lookup_joins_avg_lookup_ratio              10                  NULL  user     NULL      10                  10
+parallelize_multi_key_lookup_joins_avg_lookup_row_size           100 KiB             B     user     NULL      100 KiB             100 KiB
 parallelize_multi_key_lookup_joins_enabled                       off                 NULL  user     NULL      off                 off
+parallelize_multi_key_lookup_joins_max_lookup_ratio              10000               NULL  user     NULL      10000               10000
+parallelize_multi_key_lookup_joins_only_on_mr_mutations          on                  NULL  user     NULL      on                  on
 password_encryption                                              scram-sha-256       NULL  user     NULL      scram-sha-256       scram-sha-256
 pg_trgm.similarity_threshold                                     0.3                 NULL  user     NULL      0.3                 0.3
 plan_cache_mode                                                  auto                NULL  user     NULL      auto                auto
@@ -3548,7 +3556,11 @@ optimizer_use_provided_ordering_fix                              NULL    NULL
 optimizer_use_trigram_similarity_optimization                    NULL    NULL     NULL     NULL        NULL
 optimizer_use_virtual_computed_column_stats                      NULL    NULL     NULL     NULL        NULL
 override_multi_region_zone_config                                NULL    NULL     NULL     NULL        NULL
+parallelize_multi_key_lookup_joins_avg_lookup_ratio              NULL    NULL     NULL     NULL        NULL
+parallelize_multi_key_lookup_joins_avg_lookup_row_size           NULL    NULL     NULL     NULL        NULL
 parallelize_multi_key_lookup_joins_enabled                       NULL    NULL     NULL     NULL        NULL
+parallelize_multi_key_lookup_joins_max_lookup_ratio              NULL    NULL     NULL     NULL        NULL
+parallelize_multi_key_lookup_joins_only_on_mr_mutations          NULL    NULL     NULL     NULL        NULL
 password_encryption                                              NULL    NULL     NULL     NULL        NULL
 pg_trgm.similarity_threshold                                     NULL    NULL     NULL     NULL        NULL
 plan_cache_mode                                                  NULL    NULL     NULL     NULL        NULL
 
@@ -187,7 +187,11 @@ optimizer_use_provided_ordering_fix                              on
 optimizer_use_trigram_similarity_optimization                    on
 optimizer_use_virtual_computed_column_stats                      on
 override_multi_region_zone_config                                off
+parallelize_multi_key_lookup_joins_avg_lookup_ratio              10
+parallelize_multi_key_lookup_joins_avg_lookup_row_size           100 KiB
 parallelize_multi_key_lookup_joins_enabled                       off
+parallelize_multi_key_lookup_joins_max_lookup_ratio              10000
+parallelize_multi_key_lookup_joins_only_on_mr_mutations          on
 password_encryption                                              scram-sha-256
 pg_trgm.similarity_threshold                                     0.3
 plan_cache_mode                                                  auto