Skip to content

Commit a8a4bac

Browse files
author
Ilyas Gasanov
committed
[DOP-21450] Add compressions for file formats
1 parent 1c8f5bd commit a8a4bac

File tree

3 files changed

+7
-6
lines changed

3 files changed

+7
-6
lines changed

tests/test_integration/test_run_transfer/test_hdfs.py

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -184,7 +184,7 @@ async def test_run_transfer_hdfs_to_postgres(
184184
)
185185
df = reader.run()
186186

187-
# as these file formats do not support datetime values with precision greater than milliseconds
187+
# as Excel does not support datetime values with precision greater than milliseconds
188188
if file_format in ("excel", "parquet", "orc"):
189189
df = df.withColumn("REGISTERED_AT", date_trunc("second", col("REGISTERED_AT")))
190190
init_df = init_df.withColumn("REGISTERED_AT", date_trunc("second", col("REGISTERED_AT")))
@@ -275,8 +275,8 @@ async def test_run_transfer_postgres_to_hdfs(
275275
)
276276
df = reader.run()
277277

278-
# as these file formats do not support datetime values with precision greater than milliseconds
279-
if format_name in ("excel", "parquet", "orc"):
278+
# as Excel does not support datetime values with precision greater than milliseconds
279+
if format_name in ("excel", "parquet"):
280280
init_df = init_df.withColumn(
281281
"REGISTERED_AT",
282282
to_timestamp(date_format(col("REGISTERED_AT"), "yyyy-MM-dd HH:mm:ss.SSS")),

tests/test_integration/test_run_transfer/test_s3.py

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -185,7 +185,7 @@ async def test_run_transfer_s3_to_postgres(
185185
)
186186
df = reader.run()
187187

188-
# as these file formats do not support datetime values with precision greater than milliseconds
188+
# as Excel does not support datetime values with precision greater than milliseconds
189189
if file_format in ("excel", "parquet", "orc"):
190190
df = df.withColumn("REGISTERED_AT", date_trunc("second", col("REGISTERED_AT")))
191191
init_df = init_df.withColumn("REGISTERED_AT", date_trunc("second", col("REGISTERED_AT")))
@@ -276,8 +276,8 @@ async def test_run_transfer_postgres_to_s3(
276276
)
277277
df = reader.run()
278278

279-
# as these file formats do not support datetime values with precision greater than milliseconds
280-
if format_name in ("excel", "parquet", "orc"):
279+
# as Excel does not support datetime values with precision greater than milliseconds
280+
if format_name in ("excel", "parquet"):
281281
init_df = init_df.withColumn(
282282
"REGISTERED_AT",
283283
to_timestamp(date_format(col("REGISTERED_AT"), "yyyy-MM-dd HH:mm:ss.SSS")),

tests/test_unit/test_transfers/transfer_fixtures/transfers_fixture.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -61,6 +61,7 @@ async def group_transfers(
6161
"line_sep": "\n",
6262
"quote": '"',
6363
"type": "csv",
64+
"compression": "none",
6465
}
6566
common_params = {
6667
"file_format": file_format,

0 commit comments

Comments
 (0)