File tree Expand file tree Collapse file tree 1 file changed +4
-1
lines changed
Expand file tree Collapse file tree 1 file changed +4
-1
lines changed Original file line number Diff line number Diff line change 33from __future__ import annotations
44
55import logging
6+ import math
67from typing import TYPE_CHECKING
78
89from syncmaster .db .models import Run
@@ -90,12 +91,14 @@ def get_spark_session_conf(
9091 maven_packages .extend (get_packages (connection_type = db_type .type )) # type: ignore
9192 excluded_packages .extend (get_excluded_packages (db_type = db_type .type )) # type: ignore
9293
94+ memory_mb = math .ceil (resources ["ram_bytes_per_task" ] / 1024 / 1024 )
9395 config = {
9496 "spark.jars.packages" : "," .join (maven_packages ),
9597 "spark.sql.pyspark.jvmStacktrace.enabled" : "true" ,
9698 "spark.hadoop.mapreduce.fileoutputcommitter.marksuccessfuljobs" : "false" ,
9799 "spark.executor.cores" : resources ["cpu_cores_per_task" ],
98- "spark.executor.memory" : resources ["ram_bytes_per_task" ],
100+ # Spark expects memory to be in MB
101+ "spark.executor.memory" : f"{ memory_mb } M" ,
99102 "spark.executor.instances" : resources ["max_parallel_tasks" ],
100103 }
101104
You can’t perform that action at this time.
0 commit comments