We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent d4d766b commit e36e8b8 (Copy full SHA for e36e8b8)
benchmarks/benchmark_latency.py
@@ -52,7 +52,7 @@ def run_to_completion(profile_dir: Optional[str] = None):
52
llm.generate(dummy_prompts,
53
sampling_params=sampling_params,
54
use_tqdm=False)
55
- print(p.key_averages())
+ print(p.key_averages().table(sort_by="self_cuda_time_total"))
56
else:
57
start_time = time.perf_counter()
58
0 commit comments