Skip to content

Commit

Permalink
Integ test updates
Browse files (browse the repository at this point in the history)
  • Loading branch information
samruds committed May 17, 2024
1 parent 4bb5522 commit ed9d005
Show file tree
Hide file tree
Showing 2 changed files with 2 additions and 2 deletions.
2 changes: 1 addition & 1 deletion src/sagemaker/serve/model_server/tgi/server.py
Original file line number Diff line number Diff line change
Expand Up @@ -74,7 +74,7 @@ def _invoke_tgi_serving(self, request: object, content_type: str, accept: str):
"""Placeholder docstring"""
try:
response = requests.post(
- f"http://{get_docker_host()}:8080/generate",
+ f"http://{get_docker_host()}:8080/invocations",
data=request,
headers={"Content-Type": content_type, "Accept": accept},
timeout=600,
Expand Down
2 changes: 1 addition & 1 deletion tests/integ/sagemaker/serve/test_serve_tei.py
Original file line number Diff line number Diff line change
Expand Up @@ -107,7 +107,7 @@ def test_tei_sagemaker_endpoint(sagemaker_session, model_builder, model_input):
with timeout(minutes=SERVE_SAGEMAKER_ENDPOINT_TIMEOUT):
try:
logger.info("Deploying and predicting in SAGEMAKER_ENDPOINT mode...")
- predictor = model.deploy(instance_type="ml.g5.12xlarge", initial_instance_count=2)
+ predictor = model.deploy(instance_type="ml.g5.2xlarge", initial_instance_count=1)
logger.info("Endpoint successfully deployed.")
predictor.predict(model_input)
assert predictor is not None
Expand Down

0 comments on commit ed9d005

Please sign in to comment.