Skip to content

Commit 2bb8923

Browse files
committed
Merge remote-tracking branch 'upstream/main' into rhoai-3.2
2 parents 34565ae + 6dd2c37 commit 2bb8923

File tree

4 files changed

+692
-0
lines changed

4 files changed

+692
-0
lines changed

tests/common/support/environment.go

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -58,6 +58,7 @@ const (
5858
storageBucketName = "AWS_STORAGE_BUCKET"
5959
storageBucketMnistDir = "AWS_STORAGE_BUCKET_MNIST_DIR"
6060
storageBucketFashionMnistDir = "AWS_STORAGE_BUCKET_FASHION_MNIST_DIR"
61+
storageBucketOsftDir = "AWS_STORAGE_BUCKET_OSFT_DIR"
6162

6263
// Name of existing namespace to be used for test
6364
testNamespaceNameEnvVar = "TEST_NAMESPACE_NAME"
@@ -185,6 +186,11 @@ func GetStorageBucketFashionMnistDir() (string, bool) {
185186
return storage_bucket_fashion_mnist_dir, exists
186187
}
187188

189+
func GetStorageBucketOsftDir() (string, bool) {
190+
storage_bucket_osft_dir, exists := os.LookupEnv(storageBucketOsftDir)
191+
return storage_bucket_osft_dir, exists
192+
}
193+
188194
func GetPipIndexURL() string {
189195
return lookupEnvOrDefault(pipIndexURL, "https://pypi.python.org/simple")
190196
}

tests/trainer/kubeflow_sdk_test.go

Lines changed: 7 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -20,10 +20,17 @@ import (
2020
"testing"
2121

2222
. "github.com/opendatahub-io/distributed-workloads/tests/common"
23+
support "github.com/opendatahub-io/distributed-workloads/tests/common/support"
2324
sdktests "github.com/opendatahub-io/distributed-workloads/tests/trainer/sdk_tests"
2425
)
2526

2627
// TestKubeflowSdkSanity tags the test with Sanity and then runs
// sdktests.RunFashionMnistCpuDistributedTraining.
func TestKubeflowSdkSanity(t *testing.T) {
2728
Tags(t, Sanity)
2829
sdktests.RunFashionMnistCpuDistributedTraining(t)
2930
}
31+
32+
// TestOsftTrainingHubMultiNodeMultiGPU tests OSFT training using TrainingHubTrainer.
// It tags the test with KftoCuda and MultiNodeMultiGpu(2, support.NVIDIA, 1)
// and then delegates to sdktests.RunOsftTrainingHubMultiGpuDistributedTraining.
// NOTE(review): the arguments presumably mean 2 nodes with 1 NVIDIA GPU each;
// confirm against the MultiNodeMultiGpu definition.
33+
func TestOsftTrainingHubMultiNodeMultiGPU(t *testing.T) {
34+
Tags(t, KftoCuda, MultiNodeMultiGpu(2, support.NVIDIA, 1)) // TODO: may need to be updated once https://issues.redhat.com/browse/RHOAIENG-30719 and https://issues.redhat.com/browse/RHOAIENG-24552 are resolved
35+
sdktests.RunOsftTrainingHubMultiGpuDistributedTraining(t)
36+
}

0 commit comments

Comments
 (0)