From fb72c479a8db0a271af19d259057bee7e61bf250 Mon Sep 17 00:00:00 2001 From: youkaichao Date: Thu, 9 Jan 2025 22:47:29 +0800 Subject: [PATCH] [ci]try to fix flaky multi-step tests (#11894) Signed-off-by: youkaichao --- tests/multi_step/test_correctness_async_llm.py | 3 +-- tests/utils.py | 9 +++++++-- 2 files changed, 8 insertions(+), 4 deletions(-) diff --git a/tests/multi_step/test_correctness_async_llm.py b/tests/multi_step/test_correctness_async_llm.py index 7203d635c2fa8..8456a463adeeb 100644 --- a/tests/multi_step/test_correctness_async_llm.py +++ b/tests/multi_step/test_correctness_async_llm.py @@ -16,7 +16,6 @@ NUM_PROMPTS = [10] DEFAULT_SERVER_ARGS: List[str] = [ - "--disable-log-requests", "--worker-use-ray", "--gpu-memory-utilization", "0.85", @@ -110,7 +109,7 @@ async def test_multi_step( # Spin up client/server & issue completion API requests. # Default `max_wait_seconds` is 240 but was empirically - # was raised 3x to 720 *just for this test* due to + # raised 5x to 1200 *just for this test* due to # observed timeouts in GHA CI ref_completions = await completions_with_server_args( prompts, diff --git a/tests/utils.py b/tests/utils.py index bf3d88194e4ca..f4eecf19e8c64 100644 --- a/tests/utils.py +++ b/tests/utils.py @@ -157,13 +157,19 @@ def url_root(self) -> str: def url_for(self, *parts: str) -> str: return self.url_root + "/" + "/".join(parts) - def get_client(self): + def get_client(self, **kwargs): + if "timeout" not in kwargs: + kwargs["timeout"] = 600 return openai.OpenAI( base_url=self.url_for("v1"), api_key=self.DUMMY_API_KEY, + max_retries=0, + **kwargs, ) def get_async_client(self, **kwargs): + if "timeout" not in kwargs: + kwargs["timeout"] = 600 return openai.AsyncOpenAI(base_url=self.url_for("v1"), api_key=self.DUMMY_API_KEY, max_retries=0, @@ -780,7 +786,6 @@ async def completions_with_server_args( assert len(max_tokens) == len(prompts) outputs = None - max_wait_seconds = 240 * 3 # 240 is default with RemoteOpenAIServer(model_name, 
server_cli_args, max_wait_seconds=max_wait_seconds) as server: