Skip to content

Commit 06127d3

Browse files
author
Varun Sundar Rabindranath
committed
Fix comment print
Test only the benchmark tensors that participated.
Signed-off-by: Varun Sundar Rabindranath <[email protected]>
1 parent c7d6620 commit 06127d3

File tree

1 file changed

+3
-2
lines changed

1 file changed

+3
-2
lines changed

benchmarks/kernels/benchmark_lora.py

Lines changed: 3 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -709,7 +709,8 @@ def bench_optype(ctx: BenchmarkContext,
709709
if test_correctness:
710710
assert all([
711711
bt.test_correctness(op_type, expand_fn_add_inputs)
712-
for bt in bench_tensors
712+
for bt in bench_tensors[:cuda_graph_nops if cuda_graph_nops
713+
is not None else arg_pool_size]
713714
])
714715

715716
return timer
@@ -778,7 +779,7 @@ def print_timers(timers: List[TMeasurement],
778779
if args and args.cuda_graph_nops:
779780
print(f"The timings reported above is for {args.cuda_graph_nops} "
780781
"consecutive invocations of the benchmarking functions. "
781-
"Please divide by {args.cuda_graph_nops} for single invocation "
782+
f"Please divide by {args.cuda_graph_nops} for single invocation "
782783
"timings ")
783784

784785

0 commit comments

Comments
 (0)