File tree Expand file tree Collapse file tree 1 file changed +11
-2
lines changed
tensorrt_llm/bench/benchmark Expand file tree Collapse file tree 1 file changed +11
-2
lines changed Original file line number Diff line number Diff line change 94
94
required = False ,
95
95
help = "Pass in a dataset file for parsing instead of stdin." ,
96
96
)
97
+ @optgroup .option (
98
+ "--eos_id" ,
99
+ type = int ,
100
+ default = - 1 ,
101
+ required = False ,
102
+ help =
103
+ "Set the end-of-sequence token for the benchmark. Set to -1 to disable EOS." ,
104
+ )
97
105
@optgroup .option (
98
106
"--modality" ,
99
107
type = click .Choice (["image" , "video" ]),
@@ -222,6 +230,7 @@ def throughput_command(
222
230
# Parameters from CLI
223
231
# Model, experiment, and engine params
224
232
dataset_path : Path = params .pop ("dataset" )
233
+ eos_id : int = params .pop ("eos_id" )
225
234
warmup : int = params .get ("warmup" )
226
235
num_requests : int = params .pop ("num_requests" )
227
236
max_seq_len : int = params .pop ("max_seq_len" )
@@ -333,8 +342,8 @@ def throughput_command(
333
342
else :
334
343
llm = LLM (** kwargs )
335
344
336
- sampling_params = SamplingParams (end_id = - 1 ,
337
- pad_id = - 1 ,
345
+ sampling_params = SamplingParams (end_id = eos_id ,
346
+ pad_id = eos_id ,
338
347
beam_width = beam_width )
339
348
340
349
# Perform warmup if requested.
You can’t perform that action at this time.
0 commit comments