diff --git a/tests/entrypoints/openai/test_async_tokenization.py b/tests/entrypoints/openai/test_async_tokenization.py index c52f7dd658f31..fcce8b46c4344 100644 --- a/tests/entrypoints/openai/test_async_tokenization.py +++ b/tests/entrypoints/openai/test_async_tokenization.py @@ -127,7 +127,7 @@ def get_response_time(url): tasks = [ asyncio.create_task(create_func(**body)) for _ in range(num_requests) ] - await asyncio.sleep(1) + await asyncio.sleep(1) # give the tasks a chance to start running load_response_time = get_response_time(server.url_for("health")) with contextlib.suppress(openai.APIStatusError):