2 files changed: +13 -0 lines changed
src/xpk/core/workload_decorators
Original file line number | Diff line number | Diff line change
@@ -131,6 +131,9 @@ def add_volumes(job_manifest: dict):
131131 })
132132 volumes .append ({'name' : 'sys' , 'hostPath' : {'path' : '/sys' }})
133133 volumes .append ({'name' : 'proc-sys' , 'hostPath' : {'path' : '/proc/sys' }})
134+ volumes .append (
135+ {'name' : 'dshm' , 'emptyDir' : {'medium' : 'Memory' , 'sizeLimit' : '128Gi' }}
136+ )
134137
135138
136139def add_tcpx_daemon_container (job_manifest ):
@@ -177,3 +180,6 @@ def update_gpu_containers(job_manifest):
177180 volumeMounts .append (
178181 {'name' : 'libraries' , 'mountPath' : '/usr/local/nvidia/lib64' }
179182 )
183+ container ['volumeMounts' ].append (
184+ {'name' : 'dshm' , 'mountPath' : '/dev/shm' }
185+ )
Original file line number | Diff line number | Diff line change
1515"""
1616
1717import yaml
18+
1819from ...utils .yaml import literal_string
1920
2021# Component version
@@ -141,6 +142,9 @@ def add_volumes(job_manifest):
141142 'name' : 'aperture-devices' ,
142143 'hostPath' : {'path' : '/dev/aperture_devices' },
143144 })
145+ volumes .append (
146+ {'name' : 'dshm' , 'emptyDir' : {'medium' : 'Memory' , 'sizeLimit' : '128Gi' }}
147+ )
144148
145149
146150def add_tcpxo_daemon_container (job_manifest ):
@@ -189,3 +193,6 @@ def update_gpu_containers(job_manifest):
189193 container ['volumeMounts' ].append (
190194 {'name' : 'libraries' , 'mountPath' : '/usr/local/nvidia' }
191195 )
196+ container ['volumeMounts' ].append (
197+ {'name' : 'dshm' , 'mountPath' : '/dev/shm' }
198+ )
You can’t perform that action at this time.
0 commit comments