Skip to content

Commit bb86a94

Browse files
committed
Merge remote-tracking branch 'upstream/main'
2 parents 0e36f38 + ef1c851 commit bb86a94

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

tests/kfto/kfto_mnist_training_test.go

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -155,7 +155,7 @@ func runKFTOPyTorchMnistJob(t *testing.T, accelerator Accelerator, image string,
155 155
defer test.Client().Kubeflow().KubeflowV1().PyTorchJobs(namespace.Name).Delete(test.Ctx(), tuningJob.Name, *metav1.NewDeleteOptions(0))
156 156

157 157
// Make sure the Workload is created and running
158-
test.Eventually(GetKueueWorkloads(test, namespace.Name), TestTimeoutMedium).
158+
test.Eventually(KueueWorkloads(test, namespace.Name), TestTimeoutMedium).
159 159
Should(
160 160
And(
161 161
HaveLen(1),
@@ -238,7 +238,7 @@ func createKFTOPyTorchMnistJob(test Test, namespace string, config corev1.Config
238 238
python3 /mnt/files/download_mnist_datasets.py --dataset_path "/tmp/datasets/mnist" && \
239 239
echo -e "\n\n Dataset downloaded to /tmp/datasets/mnist" && ls -R /tmp/datasets/mnist && \
240 240
echo -e "\n\n Starting training..." && \
241-
torchrun --nproc_per_node=%d /mnt/files/mnist.py --dataset_path "/tmp/datasets/mnist" --epochs 7 --save_every 2 --batch_size 128 --lr 0.001 --snapshot_path "mnist_snapshot.pt" --backend %s`, numProcPerNode, backend),
241+
torchrun --nproc_per_node=%d /mnt/files/mnist.py --dataset_path "/tmp/datasets/mnist" --epochs 3 --save_every 2 --batch_size 128 --lr 0.001 --snapshot_path "mnist_snapshot.pt" --backend %s`, numProcPerNode, backend),
242 242
},
243 243
VolumeMounts: []corev1.VolumeMount{
244 244
{

0 commit comments

Comments
 (0)