We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent b5152c2, commit 164157a (Copy full SHA for 164157a)
terraform/account-wide-infrastructure/modules/glue/src/pipeline.py
@@ -104,9 +104,9 @@ def load(self, data):
104
self.logger.info(f"Loading data into {self.target_path} as Parquet")
105
for name, dataframe in data.items():
106
name = name.replace("--", "_")
107
- dataframe.write.mode("append").partitionBy(*self.partition_cols).parquet(
108
- f"{self.target_path}{name}"
109
- )
+ dataframe.coalesce(1).write.mode("append").partitionBy(
+ *self.partition_cols
+ ).parquet(f"{self.target_path}{name}")
110
111
def trigger_crawler(self):
112
self.glue.start_crawler(Name=f"{self.name_prefix}-log-crawler")
0 commit comments