Skip to content

Commit 4f63ae9

Browse files
add excluded paths to crawler (#2292)
* add excluded paths to crawler
* combine compatible schemas
1 parent 9cefb85 commit 4f63ae9

File tree

1 file changed

+17
-0
lines changed

1 file changed

+17
-0
lines changed

terraform/core/39-housing-interim-finance-db-ingestion.tf

Lines changed: 17 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -70,6 +70,7 @@ module "ingest_housing_interim_finance_database_to_housing_raw_zone" {
7070
configuration = jsonencode({
7171
Version = 1.0
7272
Grouping = {
73+
TableGroupingPolicy = "CombineCompatibleSchemas"
7374
TableLevelConfiguration = 3
7475
}
7576
CrawlerOutput = {
@@ -78,6 +79,22 @@ module "ingest_housing_interim_finance_database_to_housing_raw_zone" {
7879
})
7980
table_prefix = null
8081
}
82+
glue_crawler_excluded_blobs = [
83+
"*/archive*",
84+
"*/data-quality*",
85+
"*/glue-*",
86+
"*/google-sheets*",
87+
"*/govnotify*",
88+
"*/housingfinance*",
89+
"*/ingestion-details*",
90+
"*/mtfh*",
91+
"*/temp_backup*",
92+
"*.json",
93+
"*.txt",
94+
"*.zip",
95+
"*.xlsx",
96+
"*.html",
97+
]
8198
}
8299

83100
resource "aws_ssm_parameter" "ingest_housing_interim_finance_database_to_housing_raw_zone_crawler_name" {

0 commit comments

Comments
 (0)