Remove the 5-second sleep and the warm-up request on load

This commit is contained in:
Colter Downing
2025-10-28 15:28:30 -07:00
parent 5d5bc197d7
commit 8d9ffb3a6c
+5 -5
View File
@@ -325,10 +325,10 @@ class Backend:
with open(BENCHMARK_INDICATOR_FILE, "r") as f:
log.debug("already ran benchmark")
# trigger model load
payload = self.benchmark_handler.make_benchmark_payload()
_ = await self.__call_api(
handler=self.benchmark_handler, payload=payload
)
# payload = self.benchmark_handler.make_benchmark_payload()
# _ = await self.__call_api(
# handler=self.benchmark_handler, payload=payload
# )
return float(f.readline())
except FileNotFoundError:
pass
@@ -404,7 +404,7 @@ class Backend:
log.debug(f"ModelLoaded observed after {elapsed:.2f}s: {log_line}")
# some backends need a few seconds after logging successful startup before
# they can begin accepting requests
await sleep(5)
# await sleep(5)
try:
t_bench0 = time.time()
max_throughput = await run_benchmark()