@@ -1138,9 +1138,9 @@ def runLLMTestlistWithSbatch(pipeline, platform, testList, config=VANILLA_CONFIG
         "export ${varName}=\"${escapedValue}\""
     }.join('\n')

-    def scriptContent = """#!/bin/bash
+    def scriptLaunchPrefix = """#!/bin/bash
 #SBATCH ${exemptionComment}
-#SBATCH --output=${outputPath}
+#SBATCH --output=${sbatchLogPath}
 ${taskArgs.collect { "#SBATCH $it" }.join('\n')}
 #SBATCH ${partition.additionalArgs}
 ${partition?.time ? "#SBATCH --time=${partition.time}" : "#SBATCH --time=${SlurmConfig.DEFAULT_TIMEOUT_SHORT}"}
@@ -1266,14 +1266,22 @@ def runLLMTestlistWithSbatch(pipeline, platform, testList, config=VANILLA_CONFIG
         ),
         numRetries: 3
     )
+    def sbatchJobId = Utils.exec(
+        pipeline,
+        returnStdout: true,
+        script: Utils.sshUserCmd(
+            remote,
+            "cat $jobWorkspace/slurm_job_id.txt"
+        )
+    ).trim()
     def scriptTrack = """#!/bin/bash
 jobId=\$(cat $jobWorkspace/slurm_job_id.txt)
 tail -f ${sbatchLogPath} &
 tailPid=\$!
 # Wait until sbatch job is done.
 while true; do
     state=\$(sacct -j \$jobId --format=JobIDRaw,State --noheader | awk -v jobId=\$jobId '""\$1"" == jobId {print \$2}')
-    if [[ -z \$state || \$state == "RUNNING" || \$state == "PENDING" ]]; then
+    if [[ -z \$state || \$state == "RUNNING" || \$state == "PENDING" || \$state == "CONFIGURING" ]]; then
         echo "job is still running"
         sleep 300
     else
@@ -1337,22 +1345,6 @@ def runLLMTestlistWithSbatch(pipeline, platform, testList, config=VANILLA_CONFIG
         true
     )

-    if (perfSanityMode) {
-        stage("[${stageName}] Check perf result") {
-            def perfCheckResult = Utils.exec(
-                pipeline,
-                script: Utils.sshUserCmd(
-                    remote,
-                    "python3 ${perfCheckScriptNode} ${jobWorkspace}"
-                ),
-                returnStatus: true
-            )
-            if (perfCheckResult != 0) {
-                error "Performance regression detected and failing the build (exit code: ${perfCheckResult})"
-            }
-        }
-    }
-
     sh "cat $scriptStatusPathLocal"
     while (true) {
         // Check if the job is done by running sacct via SSH
@@ -1364,8 +1356,8 @@ def runLLMTestlistWithSbatch(pipeline, platform, testList, config=VANILLA_CONFIG
                 scriptStatusPathNode
             )
         ).trim()
-        if (!result || result == "RUNNING" || result == "PENDING") {
-            echo "Job is still running, pulling the job log."
+        if (!result || result == "RUNNING" || result == "PENDING" || result == "CONFIGURING") {
+            echo "Slurm job $sbatchJobId is still running, pulling the job log."
             // Pulling the sbatch output log
             Utils.exec(
                 pipeline,
@@ -1376,7 +1368,7 @@ def runLLMTestlistWithSbatch(pipeline, platform, testList, config=VANILLA_CONFIG
                 )
             )
         } else {
-            echo "Job is done."
+            echo "Slurm job $sbatchJobId is done."
             break
         }
     }