|
46 | 46 | ROLE = "dummy_role"
|
47 | 47 | REGION = "us-west-2"
|
48 | 48 | BUCKET = "mybucket"
|
49 |
| -IMAGE_URI = "763104351884.dkr.ecr.us-west-2.amazon.com/djl-inference:0.20.0-deepspeed0.7.5-cu116" |
| 49 | +IMAGE_URI = "763104351884.dkr.ecr.us-west-2.amazon.com/djl-inference:0.22.1-deepspeed0.9.2-cu118" |
50 | 50 | GPU_INSTANCE = "ml.g5.12xlarge"
|
51 | 51 |
|
52 | 52 |
|
@@ -111,7 +111,6 @@ def test_create_model_valid_hf_hub_model_id(
|
111 | 111 |
|
112 | 112 | serving_properties = model.generate_serving_properties()
|
113 | 113 | assert serving_properties["option.model_id"] == HF_MODEL_ID
|
114 |
| - assert "option.s3url" not in serving_properties |
115 | 114 |
|
116 | 115 |
|
117 | 116 | @patch("json.load")
|
@@ -396,7 +395,7 @@ def test_generate_serving_properties_with_valid_configurations(
|
396 | 395 | expected_dict = {
|
397 | 396 | "engine": "Python",
|
398 | 397 | "option.entryPoint": ENTRY_POINT,
|
399 |
| - "option.s3url": VALID_UNCOMPRESSED_MODEL_DATA, |
| 398 | + "option.model_id": VALID_UNCOMPRESSED_MODEL_DATA, |
400 | 399 | "option.tensor_parallel_degree": 4,
|
401 | 400 | "option.task": "text-classification",
|
402 | 401 | "option.dtype": "fp16",
|
@@ -431,7 +430,7 @@ def test_generate_serving_properties_with_valid_configurations(
|
431 | 430 | expected_dict = {
|
432 | 431 | "engine": "DeepSpeed",
|
433 | 432 | "option.entryPoint": "djl_python.deepspeed",
|
434 |
| - "option.s3url": VALID_UNCOMPRESSED_MODEL_DATA, |
| 433 | + "option.model_id": VALID_UNCOMPRESSED_MODEL_DATA, |
435 | 434 | "option.tensor_parallel_degree": 1,
|
436 | 435 | "option.task": "text-generation",
|
437 | 436 | "option.dtype": "bf16",
|
@@ -459,7 +458,7 @@ def test_generate_serving_properties_with_valid_configurations(
|
459 | 458 | expected_dict = {
|
460 | 459 | "engine": "Python",
|
461 | 460 | "option.entryPoint": "djl_python.huggingface",
|
462 |
| - "option.s3url": VALID_UNCOMPRESSED_MODEL_DATA, |
| 461 | + "option.model_id": VALID_UNCOMPRESSED_MODEL_DATA, |
463 | 462 | "option.tensor_parallel_degree": 1,
|
464 | 463 | "option.dtype": "fp32",
|
465 | 464 | "option.device_id": 4,
|
|
0 commit comments