@@ -1205,7 +1205,7 @@ def test_build_for_transformers_happy_case(
1205
1205
1206
1206
@patch ("sagemaker.serve.builder.model_builder.ModelBuilder._build_for_transformers" )
1207
1207
@patch ("sagemaker.serve.builder.model_builder.ModelBuilder._try_fetch_gpu_info" )
1208
- @patch ("sagemaker.serve.builder.model_builder.ModelBuilder._total_inference_model_size_mib" )
1208
+ @patch ("sagemaker.serve.builder.model_builder._total_inference_model_size_mib" )
1209
1209
@patch ("sagemaker.image_uris.retrieve" )
1210
1210
@patch ("sagemaker.djl_inference.model.urllib" )
1211
1211
@patch ("sagemaker.djl_inference.model.json" )
@@ -1248,7 +1248,7 @@ def test_build_for_transformers_happy_case_with_values(
1248
1248
1249
1249
@patch ("sagemaker.serve.builder.model_builder.ModelBuilder._build_for_djl" , Mock ())
1250
1250
@patch ("sagemaker.serve.builder.model_builder._get_gpu_info" )
1251
- @patch ("sagemaker.serve.builder.model_builder.ModelBuilder._total_inference_model_size_mib" )
1251
+ @patch ("sagemaker.serve.builder.model_builder._total_inference_model_size_mib" )
1252
1252
@patch ("sagemaker.image_uris.retrieve" )
1253
1253
@patch ("sagemaker.djl_inference.model.urllib" )
1254
1254
@patch ("sagemaker.djl_inference.model.json" )
@@ -1293,7 +1293,7 @@ def test_build_for_transformers_happy_case_with_valid_gpu_info(
1293
1293
@patch ("sagemaker.serve.builder.model_builder.ModelBuilder._build_for_transformers" , Mock ())
1294
1294
@patch ("sagemaker.serve.builder.model_builder._get_gpu_info" )
1295
1295
@patch ("sagemaker.serve.builder.model_builder._get_gpu_info_fallback" )
1296
- @patch ("sagemaker.serve.builder.model_builder.ModelBuilder._total_inference_model_size_mib" )
1296
+ @patch ("sagemaker.serve.builder.model_builder._total_inference_model_size_mib" )
1297
1297
@patch ("sagemaker.image_uris.retrieve" )
1298
1298
@patch ("sagemaker.djl_inference.model.urllib" )
1299
1299
@patch ("sagemaker.djl_inference.model.json" )
@@ -1342,61 +1342,6 @@ def test_build_for_transformers_happy_case_with_valid_gpu_fallback(
1342
1342
)
1343
1343
self .assertEqual (model_builder ._can_fit_on_single_gpu (), True )
1344
1344
1345
- @patch ("sagemaker.serve.builder.model_builder.ModelBuilder._build_for_transformers" , Mock ())
1346
- @patch ("sagemaker.serve.builder.model_builder.estimate_command_parser" )
1347
- @patch ("sagemaker.serve.builder.model_builder.gather_data" )
1348
- @patch ("sagemaker.image_uris.retrieve" )
1349
- @patch ("sagemaker.djl_inference.model.urllib" )
1350
- @patch ("sagemaker.djl_inference.model.json" )
1351
- @patch ("sagemaker.huggingface.llm_utils.urllib" )
1352
- @patch ("sagemaker.huggingface.llm_utils.json" )
1353
- @patch ("sagemaker.model_uris.retrieve" )
1354
- @patch ("sagemaker.serve.builder.model_builder._ServeSettings" )
1355
- def test_build_for_transformers_happy_case_hugging_face_responses (
1356
- self ,
1357
- mock_serveSettings ,
1358
- mock_model_uris_retrieve ,
1359
- mock_llm_utils_json ,
1360
- mock_llm_utils_urllib ,
1361
- mock_model_json ,
1362
- mock_model_urllib ,
1363
- mock_image_uris_retrieve ,
1364
- mock_gather_data ,
1365
- mock_parser ,
1366
- ):
1367
- mock_setting_object = mock_serveSettings .return_value
1368
- mock_setting_object .role_arn = mock_role_arn
1369
- mock_setting_object .s3_model_data_url = mock_s3_model_data_url
1370
-
1371
- mock_model_uris_retrieve .side_effect = KeyError
1372
- mock_llm_utils_json .load .return_value = {"pipeline_tag" : "text-classification" }
1373
- mock_llm_utils_urllib .request .Request .side_effect = Mock ()
1374
-
1375
- mock_model_json .load .return_value = {"some" : "config" }
1376
- mock_model_urllib .request .Request .side_effect = Mock ()
1377
- mock_image_uris_retrieve .return_value = "https://some-image-uri"
1378
-
1379
- mock_parser .return_value = Mock ()
1380
- mock_gather_data .return_value = [[1 , 1 , 1 , 1 ]]
1381
- product = MIB_CONVERSION_FACTOR * 1 * MEMORY_BUFFER_MULTIPLIER
1382
-
1383
- model_builder = ModelBuilder (
1384
- model = "stable-diffusion" ,
1385
- sagemaker_session = mock_session ,
1386
- instance_type = mock_instance_type ,
1387
- )
1388
- self .assertEqual (model_builder ._total_inference_model_size_mib (), product )
1389
-
1390
- mock_parser .return_value = Mock ()
1391
- mock_gather_data .return_value = None
1392
- model_builder = ModelBuilder (
1393
- model = "stable-diffusion" ,
1394
- sagemaker_session = mock_session ,
1395
- instance_type = mock_instance_type ,
1396
- )
1397
- with self .assertRaises (ValueError ) as _ :
1398
- model_builder ._total_inference_model_size_mib ()
1399
-
1400
1345
@patch ("sagemaker.serve.builder.model_builder.ModelBuilder._build_for_djl" )
1401
1346
@patch ("sagemaker.serve.builder.model_builder.ModelBuilder._can_fit_on_single_gpu" )
1402
1347
@patch ("sagemaker.image_uris.retrieve" )
@@ -1556,7 +1501,7 @@ def test_try_fetch_gpu_info_throws(
1556
1501
self .assertEqual (model_builder ._can_fit_on_single_gpu (), False )
1557
1502
1558
1503
@patch ("sagemaker.serve.builder.model_builder.ModelBuilder._build_for_transformers" , Mock ())
1559
- @patch ("sagemaker.serve.builder.model_builder.ModelBuilder._total_inference_model_size_mib" )
1504
+ @patch ("sagemaker.serve.builder.model_builder._total_inference_model_size_mib" )
1560
1505
@patch ("sagemaker.image_uris.retrieve" )
1561
1506
@patch ("sagemaker.djl_inference.model.urllib" )
1562
1507
@patch ("sagemaker.djl_inference.model.json" )
0 commit comments