Skip to content

Commit b666bd4

Browse files
committed
remove assertions that cause synchronizations
Signed-off-by: Chih-Chieh-Yang <[email protected]>
1 parent 74f9013 commit b666bd4

File tree

2 files changed

+0
-6
lines changed

2 files changed

+0
-6
lines changed

vllm/model_executor/layers/mamba/ops/ssd_chunk_scan.py

Lines changed: 0 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -511,9 +511,6 @@ def _chunk_scan_fwd(
511511
# with initial states, we need to take care of how
512512
# seq_idx crosses the boundaries
513513
assert batch == 1, "chunk scan only supports initial states with batch 1"
514-
# The following assertion causes D2H copy - removing for now
515-
# assert initial_states.shape == (seq_idx[0].max() + 1, nheads,
516-
# headdim, dstate)
517514

518515
if initial_states.shape[0] == 1:
519516
# in this case there is no point in using initial states

vllm/model_executor/layers/mamba/ops/ssd_state_passing.py

Lines changed: 0 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -150,9 +150,6 @@ def _state_passing_fwd(
150150
# are used for continuous batching. In which case we
151151
# require seq_idx to be provided
152152
assert seq_idx is not None, ""
153-
# The following assertion causes D2H copy - removing for now
154-
# assert initial_states.shape == (seq_idx.max().item() + 1, nheads,
155-
# dim)
156153
else:
157154
# - this is the regular batching case, where initial
158155
# states are used for each example of the batch.

0 commit comments

Comments
 (0)