Skip to content

Commit a4e2b26

Browse files
authored
[Bugfix] Significant performance drop on CPUs with --num-scheduler-steps > 1 (#11794)
1 parent 973f5dc commit a4e2b26

File tree

1 file changed

+6
-0
lines changed

1 file changed

+6
-0
lines changed

vllm/engine/arg_utils.py

Lines changed: 6 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1157,6 +1157,12 @@ def create_engine_config(self,
11571157
if self.enable_chunked_prefill and self.pipeline_parallel_size > 1:
11581158
raise ValueError("Multi-Step Chunked-Prefill is not supported "
11591159
"for pipeline-parallel-size > 1")
1160+
from vllm.platforms import current_platform
1161+
if current_platform.is_cpu():
1162+
logger.warning("Multi-Step (--num-scheduler-steps > 1) is "
1163+
"currently not supported for CPUs and has been "
1164+
"disabled.")
1165+
self.num_scheduler_steps = 1
11601166

11611167
# make sure num_lookahead_slots is set the higher value depending on
11621168
# if we are using speculative decoding or multi-step

0 commit comments

Comments
 (0)