We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 166e570, commit 4bb5522. Copy full SHA for 4bb5522
src/sagemaker/serve/model_server/tgi/server.py
@@ -74,7 +74,7 @@ def _invoke_tgi_serving(self, request: object, content_type: str, accept: str):
74
"""Placeholder docstring"""
75
try:
76
response = requests.post(
77
- f"http://{get_docker_host()}:8080/invocations",
+ f"http://{get_docker_host()}:8080/generate",
78
data=request,
79
headers={"Content-Type": content_type, "Accept": accept},
80
timeout=600,
0 commit comments