|
53 | 53 | ModelServer.DJL_SERVING,
|
54 | 54 | }
|
55 | 55 |
|
56 |
| -MIB_CONVERSION_FACTOR = 0.00000095367431640625 |
57 |
| -MEMORY_BUFFER_MULTIPLIER = 1.2 # 20% buffer |
58 |
| - |
59 | 56 | mock_session = MagicMock()
|
60 | 57 |
|
61 | 58 |
|
@@ -1205,7 +1202,7 @@ def test_build_for_transformers_happy_case(
|
1205 | 1202 |
|
1206 | 1203 | @patch("sagemaker.serve.builder.model_builder.ModelBuilder._build_for_transformers")
|
1207 | 1204 | @patch("sagemaker.serve.builder.model_builder.ModelBuilder._try_fetch_gpu_info")
|
1208 |
| - @patch("sagemaker.serve.builder.model_builder.ModelBuilder._total_inference_model_size_mib") |
| 1205 | + @patch("sagemaker.serve.builder.model_builder._total_inference_model_size_mib") |
1209 | 1206 | @patch("sagemaker.image_uris.retrieve")
|
1210 | 1207 | @patch("sagemaker.djl_inference.model.urllib")
|
1211 | 1208 | @patch("sagemaker.djl_inference.model.json")
|
@@ -1248,7 +1245,7 @@ def test_build_for_transformers_happy_case_with_values(
|
1248 | 1245 |
|
1249 | 1246 | @patch("sagemaker.serve.builder.model_builder.ModelBuilder._build_for_djl", Mock())
|
1250 | 1247 | @patch("sagemaker.serve.builder.model_builder._get_gpu_info")
|
1251 |
| - @patch("sagemaker.serve.builder.model_builder.ModelBuilder._total_inference_model_size_mib") |
| 1248 | + @patch("sagemaker.serve.builder.model_builder._total_inference_model_size_mib") |
1252 | 1249 | @patch("sagemaker.image_uris.retrieve")
|
1253 | 1250 | @patch("sagemaker.djl_inference.model.urllib")
|
1254 | 1251 | @patch("sagemaker.djl_inference.model.json")
|
@@ -1293,7 +1290,7 @@ def test_build_for_transformers_happy_case_with_valid_gpu_info(
|
1293 | 1290 | @patch("sagemaker.serve.builder.model_builder.ModelBuilder._build_for_transformers", Mock())
|
1294 | 1291 | @patch("sagemaker.serve.builder.model_builder._get_gpu_info")
|
1295 | 1292 | @patch("sagemaker.serve.builder.model_builder._get_gpu_info_fallback")
|
1296 |
| - @patch("sagemaker.serve.builder.model_builder.ModelBuilder._total_inference_model_size_mib") |
| 1293 | + @patch("sagemaker.serve.builder.model_builder._total_inference_model_size_mib") |
1297 | 1294 | @patch("sagemaker.image_uris.retrieve")
|
1298 | 1295 | @patch("sagemaker.djl_inference.model.urllib")
|
1299 | 1296 | @patch("sagemaker.djl_inference.model.json")
|
@@ -1342,61 +1339,6 @@ def test_build_for_transformers_happy_case_with_valid_gpu_fallback(
|
1342 | 1339 | )
|
1343 | 1340 | self.assertEqual(model_builder._can_fit_on_single_gpu(), True)
|
1344 | 1341 |
|
1345 |
| - @patch("sagemaker.serve.builder.model_builder.ModelBuilder._build_for_transformers", Mock()) |
1346 |
| - @patch("sagemaker.serve.builder.model_builder.estimate_command_parser") |
1347 |
| - @patch("sagemaker.serve.builder.model_builder.gather_data") |
1348 |
| - @patch("sagemaker.image_uris.retrieve") |
1349 |
| - @patch("sagemaker.djl_inference.model.urllib") |
1350 |
| - @patch("sagemaker.djl_inference.model.json") |
1351 |
| - @patch("sagemaker.huggingface.llm_utils.urllib") |
1352 |
| - @patch("sagemaker.huggingface.llm_utils.json") |
1353 |
| - @patch("sagemaker.model_uris.retrieve") |
1354 |
| - @patch("sagemaker.serve.builder.model_builder._ServeSettings") |
1355 |
| - def test_build_for_transformers_happy_case_hugging_face_responses( |
1356 |
| - self, |
1357 |
| - mock_serveSettings, |
1358 |
| - mock_model_uris_retrieve, |
1359 |
| - mock_llm_utils_json, |
1360 |
| - mock_llm_utils_urllib, |
1361 |
| - mock_model_json, |
1362 |
| - mock_model_urllib, |
1363 |
| - mock_image_uris_retrieve, |
1364 |
| - mock_gather_data, |
1365 |
| - mock_parser, |
1366 |
| - ): |
1367 |
| - mock_setting_object = mock_serveSettings.return_value |
1368 |
| - mock_setting_object.role_arn = mock_role_arn |
1369 |
| - mock_setting_object.s3_model_data_url = mock_s3_model_data_url |
1370 |
| - |
1371 |
| - mock_model_uris_retrieve.side_effect = KeyError |
1372 |
| - mock_llm_utils_json.load.return_value = {"pipeline_tag": "text-classification"} |
1373 |
| - mock_llm_utils_urllib.request.Request.side_effect = Mock() |
1374 |
| - |
1375 |
| - mock_model_json.load.return_value = {"some": "config"} |
1376 |
| - mock_model_urllib.request.Request.side_effect = Mock() |
1377 |
| - mock_image_uris_retrieve.return_value = "https://some-image-uri" |
1378 |
| - |
1379 |
| - mock_parser.return_value = Mock() |
1380 |
| - mock_gather_data.return_value = [[1, 1, 1, 1]] |
1381 |
| - product = MIB_CONVERSION_FACTOR * 1 * MEMORY_BUFFER_MULTIPLIER |
1382 |
| - |
1383 |
| - model_builder = ModelBuilder( |
1384 |
| - model="stable-diffusion", |
1385 |
| - sagemaker_session=mock_session, |
1386 |
| - instance_type=mock_instance_type, |
1387 |
| - ) |
1388 |
| - self.assertEqual(model_builder._total_inference_model_size_mib(), product) |
1389 |
| - |
1390 |
| - mock_parser.return_value = Mock() |
1391 |
| - mock_gather_data.return_value = None |
1392 |
| - model_builder = ModelBuilder( |
1393 |
| - model="stable-diffusion", |
1394 |
| - sagemaker_session=mock_session, |
1395 |
| - instance_type=mock_instance_type, |
1396 |
| - ) |
1397 |
| - with self.assertRaises(ValueError) as _: |
1398 |
| - model_builder._total_inference_model_size_mib() |
1399 |
| - |
1400 | 1342 | @patch("sagemaker.serve.builder.model_builder.ModelBuilder._build_for_djl")
|
1401 | 1343 | @patch("sagemaker.serve.builder.model_builder.ModelBuilder._can_fit_on_single_gpu")
|
1402 | 1344 | @patch("sagemaker.image_uris.retrieve")
|
@@ -1556,7 +1498,7 @@ def test_try_fetch_gpu_info_throws(
|
1556 | 1498 | self.assertEqual(model_builder._can_fit_on_single_gpu(), False)
|
1557 | 1499 |
|
1558 | 1500 | @patch("sagemaker.serve.builder.model_builder.ModelBuilder._build_for_transformers", Mock())
|
1559 |
| - @patch("sagemaker.serve.builder.model_builder.ModelBuilder._total_inference_model_size_mib") |
| 1501 | + @patch("sagemaker.serve.builder.model_builder._total_inference_model_size_mib") |
1560 | 1502 | @patch("sagemaker.image_uris.retrieve")
|
1561 | 1503 | @patch("sagemaker.djl_inference.model.urllib")
|
1562 | 1504 | @patch("sagemaker.djl_inference.model.json")
|
|
0 commit comments