diff --git a/python/sglang/bench_serving.py b/python/sglang/bench_serving.py index 96e8677bb60..ac247454987 100644 --- a/python/sglang/bench_serving.py +++ b/python/sglang/bench_serving.py @@ -924,6 +924,7 @@ async def limited_request_func(request_func_input, pbar): f"are correctly specified. Error: {test_output.error}" ) else: + requests.post(base_url + "/flush_cache") print("Initial test run completed. Starting main benchmark run...") time.sleep(1.5)