Commit e94cddb

Author: Ilyas Gasanov (committed)

[DOP-21450] Add compressions for file formats

1 parent 7a6b1a1 · commit e94cddb

File tree: 8 files changed, +157 -17 lines

syncmaster/dto/transfers.py

Lines changed: 4 additions & 2 deletions

@@ -4,7 +4,7 @@
 from dataclasses import dataclass
 from typing import ClassVar

-from onetl.file.format import CSV, JSON, Excel, JSONLine
+from onetl.file.format import CSV, JSON, ORC, Excel, JSONLine, Parquet


 @dataclass
@@ -20,7 +20,7 @@ class DBTransferDTO(TransferDTO):
 @dataclass
 class FileTransferDTO(TransferDTO):
     directory_path: str
-    file_format: CSV | JSONLine | JSON | Excel
+    file_format: CSV | JSONLine | JSON | Excel | ORC | Parquet
     options: dict
     df_schema: dict | None = None

@@ -29,6 +29,8 @@ class FileTransferDTO(TransferDTO):
         "jsonline": JSONLine,
         "json": JSON,
         "excel": Excel,
+        "orc": ORC,
+        "parquet": Parquet,
     }

     def __post_init__(self):
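The two new dict entries extend the name-to-class mapping that the DTO uses to materialize a file format from its serialized form. A minimal sketch of that resolution step, assuming a hypothetical `FORMAT_CLASSES` map and `resolve_format` helper (the diff shows only the added entries, not the map's name or the resolution code):

# Hypothetical sketch, not part of the commit: resolving a format name plus
# params through such a mapping. FORMAT_CLASSES and resolve_format are
# assumed names.
from onetl.file.format import CSV, JSON, ORC, Excel, JSONLine, Parquet

FORMAT_CLASSES = {
    "csv": CSV,
    "jsonline": JSONLine,
    "json": JSON,
    "excel": Excel,
    "orc": ORC,
    "parquet": Parquet,
}

def resolve_format(spec: dict):
    # e.g. {"type": "parquet", "compression": "snappy"} -> Parquet(compression="snappy")
    params = dict(spec)
    return FORMAT_CLASSES[params.pop("type")](**params)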

syncmaster/schemas/v1/transfers/file_format.py

Lines changed: 54 additions & 0 deletions

@@ -2,6 +2,8 @@
 # SPDX-License-Identifier: Apache-2.0
 from __future__ import annotations

+from enum import Enum
+
 from pydantic import BaseModel

 from syncmaster.schemas.v1.file_formats import (
@@ -15,6 +17,52 @@
 )


+class ORCCompression(str, Enum):
+    UNCOMPRESSED = "uncompressed"
+    NONE = "none"
+    SNAPPY = "snappy"
+    ZLIB = "zlib"
+    LZO = "lzo"
+    ZSTD = "zstd"
+    LZ4 = "lz4"
+
+
+class ParquetCompression(str, Enum):
+    UNCOMPRESSED = "uncompressed"
+    NONE = "none"
+    SNAPPY = "snappy"
+    GZIP = "gzip"
+    LZO = "lzo"
+    ZSTD = "zstd"
+    LZ4 = "lz4"
+    BROTLI = "brotli"
+
+
+class JSONCompression(str, Enum):
+    NONE = "none"
+    BZIP2 = "bzip2"
+    GZIP = "gzip"
+    LZ4 = "lz4"
+    SNAPPY = "snappy"
+    DEFLATE = "deflate"
+
+
+class CSVCompression(str, Enum):
+    NONE = "none"
+    BZIP2 = "bzip2"
+    GZIP = "gzip"
+    LZ4 = "lz4"
+    SNAPPY = "snappy"
+    DEFLATE = "deflate"
+
+
+class XMLCompression(str, Enum):
+    BZIP2 = "bzip2"
+    GZIP = "gzip"
+    LZ4 = "lz4"
+    SNAPPY = "snappy"
+
+
 class CSV(BaseModel):
     type: CSV_FORMAT
     delimiter: str = ","
@@ -23,18 +71,21 @@ class CSV(BaseModel):
     escape: str = "\\"
     include_header: bool = False
     line_sep: str = "\n"
+    compression: CSVCompression = CSVCompression.NONE


 class JSONLine(BaseModel):
     type: JSONLINE_FORMAT
     encoding: str = "utf-8"
     line_sep: str = "\n"
+    compression: JSONCompression = JSONCompression.NONE


 class JSON(BaseModel):
     type: JSON_FORMAT
     encoding: str = "utf-8"
     line_sep: str = "\n"
+    compression: JSONCompression = JSONCompression.NONE


 class Excel(BaseModel):
@@ -47,11 +98,14 @@ class XML(BaseModel):
     type: XML_FORMAT
     root_tag: str
     row_tag: str
+    compression: XMLCompression | None = None


 class ORC(BaseModel):
     type: ORC_FORMAT
+    compression: ORCCompression = ORCCompression.NONE


 class Parquet(BaseModel):
     type: PARQUET_FORMAT
+    compression: ParquetCompression = ParquetCompression.NONE
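For orientation, a minimal sketch (not part of the diff) of how the new fields behave at validation time, assuming `CSV_FORMAT` and friends are `Literal`-style aliases such as `"csv"`:

# Hypothetical usage of the schemas above; the "csv"/"orc"/"parquet" type
# values are assumptions about the *_FORMAT aliases.
CSV(type="csv", compression="gzip")         # str value coerced to CSVCompression.GZIP
ORC(type="orc")                             # compression defaults to ORCCompression.NONE
Parquet(type="parquet", compression="rar")  # rejected: pydantic raises ValidationError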

tests/test_integration/test_run_transfer/conftest.py

Lines changed: 23 additions & 3 deletions

@@ -11,7 +11,7 @@
 from onetl.connection import MSSQL, Clickhouse, Hive, MySQL, Oracle, Postgres, SparkS3
 from onetl.connection.file_connection.s3 import S3
 from onetl.db import DBWriter
-from onetl.file.format import CSV, JSON, Excel, JSONLine
+from onetl.file.format import CSV, JSON, ORC, Excel, JSONLine, Parquet
 from pyspark.sql import DataFrame, SparkSession
 from pyspark.sql.types import (
     DateType,
@@ -804,7 +804,7 @@ def fill_with_data(df: DataFrame):
     pass


-@pytest.fixture(params=[("csv", {}), ("jsonline", {}), ("json", {}), ("excel", {})])
+@pytest.fixture()
 def source_file_format(request: FixtureRequest):
     name, params = request.param
     if name == "csv":
@@ -835,10 +835,20 @@ def source_file_format(request: FixtureRequest):
             **params,
         )

+    if name == "orc":
+        return "orc", ORC(
+            **params,
+        )
+
+    if name == "parquet":
+        return "parquet", Parquet(
+            **params,
+        )
+
     raise ValueError(f"Unsupported file format: {name}")


-@pytest.fixture(params=[("csv", {}), ("jsonline", {}), ("excel", {})])
+@pytest.fixture()
 def target_file_format(request: FixtureRequest):
     name, params = request.param
     if name == "csv":
@@ -863,6 +873,16 @@ def target_file_format(request: FixtureRequest):
             **params,
         )

+    if name == "orc":
+        return "orc", ORC(
+            **params,
+        )
+
+    if name == "parquet":
+        return "parquet", Parquet(
+            **params,
+        )
+
     raise ValueError(f"Unsupported file format: {name}")
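With the inline `params` lists dropped from the decorators, these fixtures now only receive values through indirect parametrization, which is how the test modules below drive them. A minimal sketch of the pattern (the test body itself is hypothetical):

import pytest

# Hypothetical test: indirect=True routes the tuple into the fixture's
# request.param instead of passing it straight to the test function.
@pytest.mark.parametrize(
    "source_file_format",
    [("parquet", {"compression": "snappy"})],
    indirect=True,
)
def test_format_fixture(source_file_format):
    name, file_format = source_file_format
    assert name == "parquet"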

tests/test_integration/test_run_transfer/test_hdfs.py

Lines changed: 27 additions & 6 deletions

@@ -13,6 +13,7 @@
 from sqlalchemy.ext.asyncio import AsyncSession

 from syncmaster.db.models import Connection, Group, Queue, Status
+from syncmaster.db.models.transfer import Transfer
 from tests.mocks import MockUser
 from tests.test_unit.utils import create_transfer
 from tests.utils import get_run_on_end
@@ -114,8 +115,8 @@ async def postgres_to_hdfs(
             id="csv",
         ),
         pytest.param(
-            ("json", {}),
-            "without_compression",
+            ("json", {"compression": "gzip"}),
+            "with_compression",
             id="json",
         ),
         pytest.param(
@@ -128,6 +129,16 @@ async def postgres_to_hdfs(
             "with_header",
             id="excel",
         ),
+        pytest.param(
+            ("orc", {"compression": "snappy"}),
+            "with_compression",
+            id="orc",
+        ),
+        pytest.param(
+            ("parquet", {"compression": "snappy"}),
+            "with_compression",
+            id="parquet",
+        ),
     ],
     indirect=["source_file_format", "file_format_flavor"],
 )
@@ -136,7 +147,7 @@ async def test_run_transfer_hdfs_to_postgres(
     group_owner: MockUser,
     init_df: DataFrame,
     client: AsyncClient,
-    hdfs_to_postgres: Connection,
+    hdfs_to_postgres: Transfer,
     source_file_format,
     file_format_flavor,
 ):
@@ -188,8 +199,8 @@ async def test_run_transfer_hdfs_to_postgres(
     "target_file_format, file_format_flavor",
     [
         pytest.param(
-            ("csv", {}),
-            "with_header",
+            ("csv", {"compression": "lz4"}),
+            "with_compression",
             id="csv",
         ),
         pytest.param(
@@ -202,6 +213,16 @@ async def test_run_transfer_hdfs_to_postgres(
             "with_header",
             id="excel",
         ),
+        pytest.param(
+            ("orc", {"compression": "lzo"}),
+            "with_compression",
+            id="orc",
+        ),
+        pytest.param(
+            ("parquet", {"compression": "brotli"}),
+            "with_compression",
+            id="parquet",
+        ),
     ],
     indirect=["target_file_format", "file_format_flavor"],
 )
@@ -211,7 +232,7 @@ async def test_run_transfer_postgres_to_hdfs(
     client: AsyncClient,
     prepare_postgres,
     hdfs_file_df_connection: SparkHDFS,
-    postgres_to_hdfs: Connection,
+    postgres_to_hdfs: Transfer,
     hdfs_connection: SparkHDFS,
     target_file_format,
     file_format_flavor: str,

tests/test_integration/test_run_transfer/test_s3.py

Lines changed: 27 additions & 6 deletions

@@ -13,6 +13,7 @@
 from sqlalchemy.ext.asyncio import AsyncSession

 from syncmaster.db.models import Connection, Group, Queue, Status
+from syncmaster.db.models.transfer import Transfer
 from tests.mocks import MockUser
 from tests.test_unit.utils import create_transfer
 from tests.utils import get_run_on_end
@@ -114,8 +115,8 @@ async def postgres_to_s3(
             id="csv",
         ),
         pytest.param(
-            ("json", {}),
-            "without_compression",
+            ("json", {"compression": "gzip"}),
+            "with_compression",
             id="json",
         ),
         pytest.param(
@@ -128,6 +129,16 @@ async def postgres_to_s3(
             "with_header",
             id="excel",
         ),
+        pytest.param(
+            ("orc", {"compression": "snappy"}),
+            "with_compression",
+            id="orc",
+        ),
+        pytest.param(
+            ("parquet", {"compression": "snappy"}),
+            "with_compression",
+            id="parquet",
+        ),
     ],
     indirect=["source_file_format", "file_format_flavor"],
 )
@@ -136,7 +147,7 @@ async def test_run_transfer_s3_to_postgres(
     group_owner: MockUser,
     init_df: DataFrame,
     client: AsyncClient,
-    s3_to_postgres: Connection,
+    s3_to_postgres: Transfer,
     source_file_format,
     file_format_flavor,
 ):
@@ -189,8 +200,8 @@ async def test_run_transfer_s3_to_postgres(
     "target_file_format, file_format_flavor",
     [
         pytest.param(
-            ("csv", {}),
-            "with_header",
+            ("csv", {"compression": "lz4"}),
+            "with_compression",
             id="csv",
         ),
         pytest.param(
@@ -203,6 +214,16 @@ async def test_run_transfer_s3_to_postgres(
             "with_header",
             id="excel",
         ),
+        pytest.param(
+            ("orc", {"compression": "none"}),
+            "with_compression",
+            id="orc",
+        ),
+        pytest.param(
+            ("parquet", {"compression": "brotli"}),
+            "with_compression",
+            id="parquet",
+        ),
     ],
     indirect=["target_file_format", "file_format_flavor"],
 )
@@ -213,7 +234,7 @@ async def test_run_transfer_postgres_to_s3(
     s3_file_df_connection: SparkS3,
     prepare_postgres,
     prepare_s3,
-    postgres_to_s3: Connection,
+    postgres_to_s3: Transfer,
    target_file_format,
     file_format_flavor: str,
 ):
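The `compression` values exercised in these tests ultimately map onto Spark's writer options when onetl writes the target files. A rough sketch of the equivalent raw PySpark call, for orientation only (`df` and the bucket path are placeholders, not names from this repository):

# Placeholder sketch: what a snappy-compressed Parquet write looks like in
# plain PySpark; df and the s3a path are hypothetical.
df.write.option("compression", "snappy").parquet("s3a://bucket/target/")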
