Skip to content

Commit 05fb47d

Browse files
authored
[Benchmark CI] Use fewer num_inputs for flash_attention to avoid timeout (#857)
1 parent 5a772d1 commit 05fb47d

File tree

1 file changed

+1
-1
lines changed

1 file changed

+1
-1
lines changed

benchmarks/run.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -193,7 +193,7 @@ class RunResult:
193 | 193 |   "attention",
194 | 194 |   {
195 | 195 |   "d_head": 128, # Set default head dimension to 128 for TLX attention compatibility
196 |     | - "num_inputs": 10, # flash_attention takes long time on Benchmark CI, so use fewer inputs instead.
    | 196 | + "num_inputs": 6, # flash_attention takes long time on Benchmark CI, so use fewer inputs instead.
197 | 197 |   },
198 | 198 |   ),
199 | 199 |   "cross_entropy": (

0 commit comments

Comments
 (0)