34
34
from sagemaker .serve .utils .local_hardware import _get_nb_instance , _get_ram_usage_mb
35
35
from sagemaker .serve .utils .telemetry_logger import _capture_telemetry
36
36
from sagemaker .serve .utils .tuning import _serial_benchmark , _concurrent_benchmark , _more_performant , \
37
- _pretty_print_results_tgi
37
+ _pretty_print_results_tgi , _pretty_print_results_tgi_js
38
38
from sagemaker .serve .utils .types import ModelServer
39
39
from sagemaker .base_predictor import PredictorBase
40
40
from sagemaker .jumpstart .model import JumpStartModel
@@ -392,7 +392,7 @@ def tune_for_djl_jumpstart(self, max_tuning_duration: int = 1800):
392
392
logger .debug (
393
393
"Failed to gather any tuning results. "
394
394
"Please inspect the stack trace emitted from live logging for more details. "
395
- "Falling back to default serving.properties : %s" ,
395
+ "Falling back to default model environment variable configurations : %s" ,
396
396
self .pysdk_model .env ,
397
397
)
398
398
@@ -517,7 +517,8 @@ def tune_for_tgi_jumpstart(self, max_tuning_duration: int = 1800):
517
517
str (e ),
518
518
)
519
519
break
520
- except Exception :
520
+ except Exception as e :
521
+ logger .exception (e )
521
522
logger .exception (
522
523
"Deployment unsuccessful with SM_NUM_GPUS: %s. "
523
524
"with uncovered exception" ,
@@ -530,7 +531,7 @@ def tune_for_tgi_jumpstart(self, max_tuning_duration: int = 1800):
530
531
"SM_NUM_GPUS" : str (best_tuned_combination [1 ])
531
532
})
532
533
533
- _pretty_print_results_tgi (benchmark_results )
534
+ _pretty_print_results_tgi_js (benchmark_results )
534
535
logger .info (
535
536
"Model Configuration: %s was most performant with avg latency: %s, "
536
537
"p90 latency: %s, average tokens per second: %s, throughput/s: %s, "
@@ -547,7 +548,7 @@ def tune_for_tgi_jumpstart(self, max_tuning_duration: int = 1800):
547
548
logger .debug (
548
549
"Failed to gather any tuning results. "
549
550
"Please inspect the stack trace emitted from live logging for more details. "
550
- "Falling back to default serving.properties : %s" ,
551
+ "Falling back to default model environment variable configurations : %s" ,
551
552
self .pysdk_model .env ,
552
553
)
553
554
0 commit comments