Skip to content

Commit a7e5f09

Browse files
committed
[DOP-22135] Fix spark.executor.memory value
1 parent 2381c57 commit a7e5f09

File tree

1 file changed

+4
-1
lines changed

1 file changed

+4
-1
lines changed

syncmaster/worker/spark.py

Lines changed: 4 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -3,6 +3,7 @@
33
from __future__ import annotations
44

55
import logging
6+
import math
67
from typing import TYPE_CHECKING
78

89
from syncmaster.db.models import Run
@@ -90,12 +91,14 @@ def get_spark_session_conf(
9091
maven_packages.extend(get_packages(connection_type=db_type.type)) # type: ignore
9192
excluded_packages.extend(get_excluded_packages(db_type=db_type.type)) # type: ignore
9293

94+
memory_mb = math.ceil(resources["ram_bytes_per_task"] / 1024 / 1024)
9395
config = {
9496
"spark.jars.packages": ",".join(maven_packages),
9597
"spark.sql.pyspark.jvmStacktrace.enabled": "true",
9698
"spark.hadoop.mapreduce.fileoutputcommitter.marksuccessfuljobs": "false",
9799
"spark.executor.cores": resources["cpu_cores_per_task"],
98-
"spark.executor.memory": resources["ram_bytes_per_task"],
100+
# Spark expects a size string with a unit suffix; "M" here means mebibytes (bytes / 1024 / 1024)
101+
"spark.executor.memory": f"{memory_mb}M",
99102
"spark.executor.instances": resources["max_parallel_tasks"],
100103
}
101104

0 commit comments

Comments
 (0)