diff --git a/tests/unittest/llmapi/apps/openai_server.py b/tests/unittest/llmapi/apps/openai_server.py index ca98f7e1ece..9a9f38193cd 100644 --- a/tests/unittest/llmapi/apps/openai_server.py +++ b/tests/unittest/llmapi/apps/openai_server.py @@ -16,7 +16,7 @@ class RemoteOpenAIServer: DUMMY_API_KEY = "tensorrt_llm" - MAX_SERVER_START_WAIT_S = 600 # wait for server to start for 600 seconds + MAX_SERVER_START_WAIT_S = 7200 # wait up to 7200 seconds (2 hours) for the server to start, to allow for LLM model weight loading def __init__(self, model: str,