|
53 | 53 | ModelServer.DJL_SERVING, |
54 | 54 | } |
55 | 55 |
|
56 | | -MIB_CONVERSION_FACTOR = 0.00000095367431640625 |
57 | | -MEMORY_BUFFER_MULTIPLIER = 1.2 # 20% buffer |
58 | | - |
59 | 56 | mock_session = MagicMock() |
60 | 57 |
|
61 | 58 |
|
@@ -1205,7 +1202,7 @@ def test_build_for_transformers_happy_case( |
1205 | 1202 |
|
1206 | 1203 | @patch("sagemaker.serve.builder.model_builder.ModelBuilder._build_for_transformers") |
1207 | 1204 | @patch("sagemaker.serve.builder.model_builder.ModelBuilder._try_fetch_gpu_info") |
1208 | | - @patch("sagemaker.serve.builder.model_builder.ModelBuilder._total_inference_model_size_mib") |
| 1205 | + @patch("sagemaker.serve.builder.model_builder._total_inference_model_size_mib") |
1209 | 1206 | @patch("sagemaker.image_uris.retrieve") |
1210 | 1207 | @patch("sagemaker.djl_inference.model.urllib") |
1211 | 1208 | @patch("sagemaker.djl_inference.model.json") |
@@ -1248,7 +1245,7 @@ def test_build_for_transformers_happy_case_with_values( |
1248 | 1245 |
|
1249 | 1246 | @patch("sagemaker.serve.builder.model_builder.ModelBuilder._build_for_djl", Mock()) |
1250 | 1247 | @patch("sagemaker.serve.builder.model_builder._get_gpu_info") |
1251 | | - @patch("sagemaker.serve.builder.model_builder.ModelBuilder._total_inference_model_size_mib") |
| 1248 | + @patch("sagemaker.serve.builder.model_builder._total_inference_model_size_mib") |
1252 | 1249 | @patch("sagemaker.image_uris.retrieve") |
1253 | 1250 | @patch("sagemaker.djl_inference.model.urllib") |
1254 | 1251 | @patch("sagemaker.djl_inference.model.json") |
@@ -1293,7 +1290,7 @@ def test_build_for_transformers_happy_case_with_valid_gpu_info( |
1293 | 1290 | @patch("sagemaker.serve.builder.model_builder.ModelBuilder._build_for_transformers", Mock()) |
1294 | 1291 | @patch("sagemaker.serve.builder.model_builder._get_gpu_info") |
1295 | 1292 | @patch("sagemaker.serve.builder.model_builder._get_gpu_info_fallback") |
1296 | | - @patch("sagemaker.serve.builder.model_builder.ModelBuilder._total_inference_model_size_mib") |
| 1293 | + @patch("sagemaker.serve.builder.model_builder._total_inference_model_size_mib") |
1297 | 1294 | @patch("sagemaker.image_uris.retrieve") |
1298 | 1295 | @patch("sagemaker.djl_inference.model.urllib") |
1299 | 1296 | @patch("sagemaker.djl_inference.model.json") |
@@ -1342,61 +1339,6 @@ def test_build_for_transformers_happy_case_with_valid_gpu_fallback( |
1342 | 1339 | ) |
1343 | 1340 | self.assertEqual(model_builder._can_fit_on_single_gpu(), True) |
1344 | 1341 |
|
1345 | | - @patch("sagemaker.serve.builder.model_builder.ModelBuilder._build_for_transformers", Mock()) |
1346 | | - @patch("sagemaker.serve.builder.model_builder.estimate_command_parser") |
1347 | | - @patch("sagemaker.serve.builder.model_builder.gather_data") |
1348 | | - @patch("sagemaker.image_uris.retrieve") |
1349 | | - @patch("sagemaker.djl_inference.model.urllib") |
1350 | | - @patch("sagemaker.djl_inference.model.json") |
1351 | | - @patch("sagemaker.huggingface.llm_utils.urllib") |
1352 | | - @patch("sagemaker.huggingface.llm_utils.json") |
1353 | | - @patch("sagemaker.model_uris.retrieve") |
1354 | | - @patch("sagemaker.serve.builder.model_builder._ServeSettings") |
1355 | | - def test_build_for_transformers_happy_case_hugging_face_responses( |
1356 | | - self, |
1357 | | - mock_serveSettings, |
1358 | | - mock_model_uris_retrieve, |
1359 | | - mock_llm_utils_json, |
1360 | | - mock_llm_utils_urllib, |
1361 | | - mock_model_json, |
1362 | | - mock_model_urllib, |
1363 | | - mock_image_uris_retrieve, |
1364 | | - mock_gather_data, |
1365 | | - mock_parser, |
1366 | | - ): |
1367 | | - mock_setting_object = mock_serveSettings.return_value |
1368 | | - mock_setting_object.role_arn = mock_role_arn |
1369 | | - mock_setting_object.s3_model_data_url = mock_s3_model_data_url |
1370 | | - |
1371 | | - mock_model_uris_retrieve.side_effect = KeyError |
1372 | | - mock_llm_utils_json.load.return_value = {"pipeline_tag": "text-classification"} |
1373 | | - mock_llm_utils_urllib.request.Request.side_effect = Mock() |
1374 | | - |
1375 | | - mock_model_json.load.return_value = {"some": "config"} |
1376 | | - mock_model_urllib.request.Request.side_effect = Mock() |
1377 | | - mock_image_uris_retrieve.return_value = "https://some-image-uri" |
1378 | | - |
1379 | | - mock_parser.return_value = Mock() |
1380 | | - mock_gather_data.return_value = [[1, 1, 1, 1]] |
1381 | | - product = MIB_CONVERSION_FACTOR * 1 * MEMORY_BUFFER_MULTIPLIER |
1382 | | - |
1383 | | - model_builder = ModelBuilder( |
1384 | | - model="stable-diffusion", |
1385 | | - sagemaker_session=mock_session, |
1386 | | - instance_type=mock_instance_type, |
1387 | | - ) |
1388 | | - self.assertEqual(model_builder._total_inference_model_size_mib(), product) |
1389 | | - |
1390 | | - mock_parser.return_value = Mock() |
1391 | | - mock_gather_data.return_value = None |
1392 | | - model_builder = ModelBuilder( |
1393 | | - model="stable-diffusion", |
1394 | | - sagemaker_session=mock_session, |
1395 | | - instance_type=mock_instance_type, |
1396 | | - ) |
1397 | | - with self.assertRaises(ValueError) as _: |
1398 | | - model_builder._total_inference_model_size_mib() |
1399 | | - |
1400 | 1342 | @patch("sagemaker.serve.builder.model_builder.ModelBuilder._build_for_djl") |
1401 | 1343 | @patch("sagemaker.serve.builder.model_builder.ModelBuilder._can_fit_on_single_gpu") |
1402 | 1344 | @patch("sagemaker.image_uris.retrieve") |
@@ -1556,7 +1498,7 @@ def test_try_fetch_gpu_info_throws( |
1556 | 1498 | self.assertEqual(model_builder._can_fit_on_single_gpu(), False) |
1557 | 1499 |
|
1558 | 1500 | @patch("sagemaker.serve.builder.model_builder.ModelBuilder._build_for_transformers", Mock()) |
1559 | | - @patch("sagemaker.serve.builder.model_builder.ModelBuilder._total_inference_model_size_mib") |
| 1501 | + @patch("sagemaker.serve.builder.model_builder._total_inference_model_size_mib") |
1560 | 1502 | @patch("sagemaker.image_uris.retrieve") |
1561 | 1503 | @patch("sagemaker.djl_inference.model.urllib") |
1562 | 1504 | @patch("sagemaker.djl_inference.model.json") |
|
0 commit comments