reduce vllm benchmark runs to 2

This commit is contained in:
Lucas Armand
2025-11-25 16:54:17 -08:00
parent 74d7330800
commit 4bcc508473
+2 -1
View File
@@ -57,7 +57,8 @@ worker_config = WorkerConfig(
max_queue_time=60.0,
benchmark_config=BenchmarkConfig(
generator=completions_benchmark_generator,
-concurrency=100
+concurrency=100,
+runs=2
)
),
HandlerConfig(