Skip to content

Commit b409e64

Browse files
Isotr0py authored and rasmith committed
[Bugfix] Fix missing seq_start_loc in xformers prefill metadata (vllm-project#12464)
Signed-off-by: Isotr0py <[email protected]>
1 parent 6753b86 commit b409e64

File tree

1 file changed

+3
-0
lines changed

1 file changed

+3
-0
lines changed

vllm/attention/backends/xformers.py

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -199,6 +199,8 @@ def prefill_metadata(self) -> Optional["XFormersMetadata"]:
199 199
# Compute some attn_metadata fields which default to None
200 200
query_start_loc = (None if self.query_start_loc is None else
201 201
self.query_start_loc[:self.num_prefills + 1])
202 +
seq_start_loc = (None if self.seq_start_loc is None else
203 +
self.seq_start_loc[:self.num_prefills + 1])
202 204
slot_mapping = (None if self.slot_mapping is None else
203 205
self.slot_mapping[:self.num_prefill_tokens])
204 206
seq_lens = (None if self.seq_lens is None else
@@ -225,6 +227,7 @@ def prefill_metadata(self) -> Optional["XFormersMetadata"]:
225 227
max_prefill_seq_len=self.max_prefill_seq_len,
226 228
max_decode_seq_len=0,
227 229
query_start_loc=query_start_loc,
230 +
seq_start_loc=seq_start_loc,
228 231
context_lens_tensor=context_lens_tensor,
229 232
block_tables=block_tables,
230 233
use_cuda_graph=False,

0 commit comments

Comments (0)