From 5dbf12c2a447b7ed5e992f9d12998f760141a24c Mon Sep 17 00:00:00 2001
From: DarkLight1337
Date: Wed, 22 Oct 2025 16:17:15 +0000
Subject: [PATCH 1/2] [Bugfix] Fix SLA tuner initialization

Signed-off-by: DarkLight1337
---
 vllm/benchmarks/sweep/serve_sla.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/vllm/benchmarks/sweep/serve_sla.py b/vllm/benchmarks/sweep/serve_sla.py
index 62e2917dc22b..6159aba4bbb5 100644
--- a/vllm/benchmarks/sweep/serve_sla.py
+++ b/vllm/benchmarks/sweep/serve_sla.py
@@ -401,7 +401,8 @@ class SweepServeSLAArgs(SweepServeArgs):
 
     @classmethod
     def from_cli_args(cls, args: argparse.Namespace):
-        base_args = super().from_cli_args(args)
+        # NOTE: Don't use super() as `from_cli_args` calls `cls()`
+        base_args = SweepServeArgs.from_cli_args(args)
 
         if args.sla_params:
             sla_params = SLASweep.read_json(args.sla_params)

From 658f4c34fb9c2313e1061db0b522a83bb9c33333 Mon Sep 17 00:00:00 2001
From: DarkLight1337
Date: Wed, 22 Oct 2025 16:39:57 +0000
Subject: [PATCH 2/2] Fix missing metric

Signed-off-by: DarkLight1337
---
 vllm/benchmarks/sweep/serve.py | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/vllm/benchmarks/sweep/serve.py b/vllm/benchmarks/sweep/serve.py
index 6e408dac0b49..a06d4d6d6098 100644
--- a/vllm/benchmarks/sweep/serve.py
+++ b/vllm/benchmarks/sweep/serve.py
@@ -66,6 +66,8 @@ def run_benchmark(
 ):
     benchmark_cmd = [
         *bench_overrides.apply_to_cmd(bench_cmd),
+        "--percentile-metrics",
+        "ttft,tpot,itl,e2el",
         "--save-result",
         "--result-dir",
         str(output_path.parent),