|
46 | 46 | ROLE = "dummy_role" |
47 | 47 | REGION = "us-west-2" |
48 | 48 | BUCKET = "mybucket" |
49 | | -IMAGE_URI = "763104351884.dkr.ecr.us-west-2.amazon.com/djl-inference:0.20.0-deepspeed0.7.5-cu116" |
| 49 | +IMAGE_URI = "763104351884.dkr.ecr.us-west-2.amazon.com/djl-inference:0.22.1-deepspeed0.9.2-cu118" |
50 | 50 | GPU_INSTANCE = "ml.g5.12xlarge" |
51 | 51 |
|
52 | 52 |
|
@@ -111,7 +111,6 @@ def test_create_model_valid_hf_hub_model_id( |
111 | 111 |
|
112 | 112 | serving_properties = model.generate_serving_properties() |
113 | 113 | assert serving_properties["option.model_id"] == HF_MODEL_ID |
114 | | - assert "option.s3url" not in serving_properties |
115 | 114 |
|
116 | 115 |
|
117 | 116 | @patch("json.load") |
@@ -396,7 +395,7 @@ def test_generate_serving_properties_with_valid_configurations( |
396 | 395 | expected_dict = { |
397 | 396 | "engine": "Python", |
398 | 397 | "option.entryPoint": ENTRY_POINT, |
399 | | - "option.s3url": VALID_UNCOMPRESSED_MODEL_DATA, |
| 398 | + "option.model_id": VALID_UNCOMPRESSED_MODEL_DATA, |
400 | 399 | "option.tensor_parallel_degree": 4, |
401 | 400 | "option.task": "text-classification", |
402 | 401 | "option.dtype": "fp16", |
@@ -431,7 +430,7 @@ def test_generate_serving_properties_with_valid_configurations( |
431 | 430 | expected_dict = { |
432 | 431 | "engine": "DeepSpeed", |
433 | 432 | "option.entryPoint": "djl_python.deepspeed", |
434 | | - "option.s3url": VALID_UNCOMPRESSED_MODEL_DATA, |
| 433 | + "option.model_id": VALID_UNCOMPRESSED_MODEL_DATA, |
435 | 434 | "option.tensor_parallel_degree": 1, |
436 | 435 | "option.task": "text-generation", |
437 | 436 | "option.dtype": "bf16", |
@@ -459,7 +458,7 @@ def test_generate_serving_properties_with_valid_configurations( |
459 | 458 | expected_dict = { |
460 | 459 | "engine": "Python", |
461 | 460 | "option.entryPoint": "djl_python.huggingface", |
462 | | - "option.s3url": VALID_UNCOMPRESSED_MODEL_DATA, |
| 461 | + "option.model_id": VALID_UNCOMPRESSED_MODEL_DATA, |
463 | 462 | "option.tensor_parallel_degree": 1, |
464 | 463 | "option.dtype": "fp32", |
465 | 464 | "option.device_id": 4, |
|
0 commit comments