Skip to content

Commit 22042c8

Browse files
committed
Integ test updates
1 parent cffe46a commit 22042c8

File tree

2 files changed

+7
-4
lines changed

2 files changed

+7
-4
lines changed

src/sagemaker/serve/builder/tei_builder.py

Lines changed: 6 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -16,10 +16,11 @@
1616
from typing import Type
1717
from abc import ABC, abstractmethod
1818

19+
from sagemaker import image_uris
1920
from sagemaker.model import Model
2021
from sagemaker.djl_inference.model import _get_model_config_properties_from_hf
2122

22-
from sagemaker.huggingface import HuggingFaceModel, get_huggingface_llm_image_uri
23+
from sagemaker.huggingface import HuggingFaceModel
2324
from sagemaker.serve.utils.local_hardware import (
2425
_get_nb_instance,
2526
)
@@ -87,8 +88,10 @@ def _set_to_tgi(self):
8788
def _create_tei_model(self) -> Type[Model]:
8889
"""Placeholder docstring"""
8990
if not self.image_uri:
90-
self.image_uri = get_huggingface_llm_image_uri(
91-
"huggingface-tei", session=self.sagemaker_session
91+
self.image_uri = image_uris.retrieve(
92+
"huggingface-tei",
93+
image_scope="inference",
94+
instance_type=self.nb_instance_type
9295
)
9396

9497
pysdk_model = HuggingFaceModel(

src/sagemaker/serve/model_server/tgi/server.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -74,7 +74,7 @@ def _invoke_tgi_serving(self, request: object, content_type: str, accept: str):
7474
"""Placeholder docstring"""
7575
try:
7676
response = requests.post(
77-
f"http://{get_docker_host()}:8080/generate",
77+
f"http://{get_docker_host()}:8080/invocations",
7878
data=request,
7979
headers={"Content-Type": content_type, "Accept": accept},
8080
timeout=600,

0 commit comments

Comments
 (0)