diff --git a/tests/entrypoints/openai/test_async_tokenization.py b/tests/entrypoints/openai/test_async_tokenization.py
index c52f7dd658f31..fcce8b46c4344 100644
--- a/tests/entrypoints/openai/test_async_tokenization.py
+++ b/tests/entrypoints/openai/test_async_tokenization.py
@@ -127,7 +127,7 @@ def get_response_time(url):
     tasks = [
         asyncio.create_task(create_func(**body)) for _ in range(num_requests)
     ]
-    await asyncio.sleep(1)
+    await asyncio.sleep(1)  # give the tasks a chance to start running
     load_response_time = get_response_time(server.url_for("health"))
 
     with contextlib.suppress(openai.APIStatusError):