Skip to content

Commit 2683932

Browse files
Inference integ test passed on beta account (#140)
* baseline inference integration test for CLI and SDK, minor bug fix for inference cli, clear inference sdk notebook output
* update integ test in progress
* update cli code, notebook, integ and unit test to add list_pods and get_logs
* clean up merge header
* inference integ tests all passing in chait's account
* integ test passing on beta account
1 parent d0c6f14 commit 2683932

File tree

2 files changed

+4
-9
lines changed

2 files changed

+4
-9
lines changed

test/integration_tests/cli/test_cli_jumpstart_inference.py

Lines changed: 1 addition & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -34,10 +34,8 @@ def test_js_create(runner, js_endpoint_name):
3434
"--namespace", NAMESPACE,
3535
"--version", VERSION,
3636
"--model-id", "deepseek-llm-r1-distill-qwen-1-5b",
37-
"--model-version", "2.0.4",
38-
"--instance-type", "ml.g5.8xlarge",
37+
"--instance-type", "ml.g5.4xlarge",
3938
"--endpoint-name", js_endpoint_name,
40-
"--tls-certificate-output-s3-uri", "s3://tls-bucket-inf1-beta2"
4139
])
4240
assert result.exit_code == 0, result.output
4341

test/integration_tests/sdk/test_sdk_jumpstart_inference.py

Lines changed: 3 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -15,10 +15,8 @@
1515
REGION = "us-east-2"
1616
ENDPOINT_NAME = "js-sdk-integration"
1717

18-
INSTANCE_TYPE = "ml.g5.8xlarge"
18+
INSTANCE_TYPE = "ml.g5.4xlarge"
1919
MODEL_ID = "deepseek-llm-r1-distill-qwen-1-5b"
20-
MODEL_VERSION = "2.0.4"
21-
TLS_S3_URI = "s3://tls-bucket-inf1-beta2"
2220

2321
TIMEOUT_MINUTES = 15
2422
POLL_INTERVAL_SECONDS = 30
@@ -29,12 +27,11 @@ def sagemaker_client():
2927

3028
@pytest.fixture(scope="module")
3129
def endpoint_obj():
32-
model = Model(model_id=MODEL_ID, model_version=MODEL_VERSION)
30+
model = Model(model_id=MODEL_ID)
3331
server = Server(instance_type=INSTANCE_TYPE)
3432
sm_endpoint = SageMakerEndpoint(name=ENDPOINT_NAME)
35-
tls = TlsConfig(tls_certificate_output_s3_uri=TLS_S3_URI)
3633

37-
return HPJumpStartEndpoint(model=model, server=server, sage_maker_endpoint=sm_endpoint, tls_config=tls)
34+
return HPJumpStartEndpoint(model=model, server=server, sage_maker_endpoint=sm_endpoint)
3835

3936
def test_create_endpoint(endpoint_obj):
4037
endpoint_obj.create(namespace=NAMESPACE)

0 commit comments

Comments
 (0)