|
75 | 75 | "-inference:2.1.1-tgi1.4.0-gpu-py310-cu121-ubuntu20.04" |
76 | 76 | ) |
77 | 77 | mock_djl_image_uri = ( |
78 | | - "123456789712.dkr.ecr.us-west-2.amazonaws.com/djl-inference:0.24.0-neuronx-sdk2.14.1" |
| 78 | + "763104351884.dkr.ecr.us-west-2.amazonaws.com/djl-inference:0.31.0-lmi13.0.0-cu124" |
79 | 79 | ) |
80 | 80 |
|
81 | 81 | mock_model_data = { |
@@ -1166,6 +1166,7 @@ def test_optimize_quantize_for_jumpstart( |
1166 | 1166 | mock_pysdk_model.image_uri = mock_tgi_image_uri |
1167 | 1167 | mock_pysdk_model.list_deployment_configs.return_value = DEPLOYMENT_CONFIGS |
1168 | 1168 | mock_pysdk_model.deployment_config = DEPLOYMENT_CONFIGS[0] |
| 1169 | + mock_pysdk_model.init_kwargs = {"image_uri": "763104351884.dkr.ecr.us-west-2.amazonaws.com/djl-inference:0.29.0-lmi11.0.0-cu124"} |
1169 | 1170 |
|
1170 | 1171 | sample_input = { |
1171 | 1172 | "inputs": "The diamondback terrapin or simply terrapin is a species " |
@@ -1201,6 +1202,9 @@ def test_optimize_quantize_for_jumpstart( |
1201 | 1202 | ) |
1202 | 1203 |
|
1203 | 1204 | self.assertIsNotNone(out_put) |
| 1205 | + self.assertEqual( |
| 1206 | + out_put["OptimizationConfigs"][0]["ModelQuantizationConfig"]["Image"], "763104351884.dkr.ecr.us-west-2.amazonaws.com/djl-inference:0.31.0-lmi13.0.0-cu124" |
| 1207 | + ) |
1204 | 1208 |
|
1205 | 1209 | @patch("sagemaker.serve.builder.jumpstart_builder._capture_telemetry", side_effect=None) |
1206 | 1210 | @patch.object(ModelBuilder, "_get_serve_setting", autospec=True) |
@@ -1287,6 +1291,7 @@ def test_optimize_quantize_and_compile_for_jumpstart( |
1287 | 1291 | mock_pysdk_model.deployment_config = DEPLOYMENT_CONFIGS[0] |
1288 | 1292 | mock_pysdk_model.config_name = "config_name" |
1289 | 1293 | mock_pysdk_model._metadata_configs = {"config_name": mock_metadata_config} |
| 1294 | + mock_pysdk_model.init_kwargs = {"image_uri": "763104351884.dkr.ecr.us-west-2.amazonaws.com/djl-inference:0.29.0-lmi11.0.0-cu124"} |
1290 | 1295 |
|
1291 | 1296 | sample_input = { |
1292 | 1297 | "inputs": "The diamondback terrapin or simply terrapin is a species " |
@@ -1319,6 +1324,8 @@ def test_optimize_quantize_and_compile_for_jumpstart( |
1319 | 1324 | ) |
1320 | 1325 |
|
1321 | 1326 | self.assertIsNotNone(out_put) |
| 1327 | + self.assertIsNone(out_put["OptimizationConfigs"][1]["ModelCompilationConfig"].get("Image")) |
| 1328 | + self.assertIsNone(out_put["OptimizationConfigs"][0]["ModelQuantizationConfig"].get("Image")) |
1322 | 1329 |
|
1323 | 1330 | @patch("sagemaker.serve.builder.jumpstart_builder._capture_telemetry", side_effect=None) |
1324 | 1331 | @patch.object(ModelBuilder, "_get_serve_setting", autospec=True) |
@@ -1640,6 +1647,7 @@ def test_optimize_on_js_model_should_ignore_pre_optimized_configurations( |
1640 | 1647 |
|
1641 | 1648 | mock_lmi_js_model = MagicMock() |
1642 | 1649 | mock_lmi_js_model.image_uri = mock_djl_image_uri |
| 1650 | + mock_lmi_js_model.init_kwargs = {"image_uri": "763104351884.dkr.ecr.us-west-2.amazonaws.com/djl-inference:0.29.0-lmi11.0.0-cu124"} |
1643 | 1651 | mock_lmi_js_model.env = { |
1644 | 1652 | "SAGEMAKER_PROGRAM": "inference.py", |
1645 | 1653 | "ENDPOINT_SERVER_TIMEOUT": "3600", |
@@ -1718,6 +1726,7 @@ def test_optimize_on_js_model_should_ignore_pre_optimized_configurations_no_over |
1718 | 1726 |
|
1719 | 1727 | mock_lmi_js_model = MagicMock() |
1720 | 1728 | mock_lmi_js_model.image_uri = mock_djl_image_uri |
| 1729 | + mock_lmi_js_model.init_kwargs = {"image_uri": "763104351884.dkr.ecr.us-west-2.amazonaws.com/djl-inference:0.29.0-lmi11.0.0-cu124"} |
1721 | 1730 | mock_lmi_js_model.env = { |
1722 | 1731 | "SAGEMAKER_PROGRAM": "inference.py", |
1723 | 1732 | "ENDPOINT_SERVER_TIMEOUT": "3600", |
|
0 commit comments