@@ -1155,7 +1155,7 @@ def runLLMTestlistWithSbatch(pipeline, platform, testList, config=VANILLA_CONFIG
11551155 export pytestCommand="$pytestCommand "
11561156 export coverageConfigFile="$coverageConfigFile "
11571157 export NVIDIA_IMEX_CHANNELS=\$ {NVIDIA_IMEX_CHANNELS:-0}
1158- export NVIDIA_VISIBLE_DEVICES=\$ {NVIDIA_VISIBLE_DEVICES:-\$ (seq -s, 0 \$ ((\$ (nvidia-smi --query-gpu=count -i 0 --format=noheader)-1)))}
1158+ export NVIDIA_VISIBLE_DEVICES=\$ {NVIDIA_VISIBLE_DEVICES:-\$ (seq -s, 0 \$ ((\$ (nvidia-smi --query-gpu=count -i 0 --format=csv, noheader)-1)))}
11591159 ${ envExportStatements}
11601160
11611161 echo "Env NVIDIA_IMEX_CHANNELS: \$ NVIDIA_IMEX_CHANNELS"
@@ -3249,10 +3249,12 @@ def launchTestJobs(pipeline, testFilter)
32493249 fullSet = parallelJobs. keySet()
32503250
32513251 x86SlurmTestConfigs = [
3252- " DGX_H100-2_GPUs-PyTorch-Others-1" : [" dgx-h100-x2-oci" , " l0_dgx_h100" , 1 , 1 , 2 ],
3252+ " DGX_H100-2_GPUs-PyTorch-Others-1" : [" dgx-h100-x2-oci" , " l0_dgx_h100" , 1 , 2 , 2 ],
3253+ " DGX_H100-2_GPUs-PyTorch-Others-2" : [" dgx-h100-x2-oci" , " l0_dgx_h100" , 2 , 2 , 2 ],
32533254 " DGX_H100-2_GPUs-PyTorch-GptOss-1" : [" dgx-h100-x2-oci" , " l0_dgx_h100" , 1 , 1 , 2 ],
32543255 " DGX_H100-2_GPUs-PyTorch-Ray-1" : [" dgx-h100-x2-oci" , " l0_dgx_h100" , 1 , 1 , 2 ],
3255- " DGX_H100-4_GPUs-PyTorch-DeepSeek-1" : [" dgx-h100-x4-oci" , " l0_dgx_h100" , 1 , 1 , 4 ],
3256+ " DGX_H100-4_GPUs-PyTorch-DeepSeek-1" : [" dgx-h100-x4-oci" , " l0_dgx_h100" , 1 , 2 , 4 ],
3257+ " DGX_H100-4_GPUs-PyTorch-DeepSeek-2" : [" dgx-h100-x4-oci" , " l0_dgx_h100" , 2 , 2 , 4 ],
32563258 " DGX_H100-4_GPUs-PyTorch-GptOss-1" : [" dgx-h100-x4-oci" , " l0_dgx_h100" , 1 , 1 , 4 ],
32573259 " DGX_H100-4_GPUs-PyTorch-Others-1" : [" dgx-h100-x4-oci" , " l0_dgx_h100" , 1 , 1 , 4 ],
32583260 " DGX_H100-4_GPUs-PyTorch-Ray-1" : [" dgx-h100-x4-oci" , " l0_dgx_h100" , 1 , 1 , 4 ],
0 commit comments