Skip to content

Commit 3351973

Browse files
enforce v2 block manager and check logit processor
1 parent 8663c7d commit 3351973

File tree

2 files changed: +6 -2 lines changed

vllm/engine/arg_utils.py

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -871,6 +871,9 @@ def create_engine_config(self, ) -> EngineConfig:
871871
if self.enable_chunked_prefill:
872872
raise ValueError("Chunked prefill is not supported with "
873873
"multi-step (--num-scheduler-steps > 1)")
874+
if not self.use_v2_block_manager:
875+
raise ValueError("BlockSpaceManagerV2 is required for "
876+
"multi-step (--num-scheduler-steps > 1)")
874877

875878
# make sure num_lookahead_slots is set the higher value depending on
876879
# if we are using speculative decoding or multi-step

vllm/worker/multi_step_model_runner.py

Lines changed: 3 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -497,8 +497,9 @@ def _pythonize_sampler_output(
497497
next_token_ids = sample_result
498498
parent_ids = [0]
499499
seq_outputs: List[SequenceOutput] = []
500-
assert len(seq_group.sampling_params.logits_processors) == 0, (
501-
"Logits Processors are not supported in multi-step decoding")
500+
if seq_group.sampling_params.logits_processors:
501+
assert len(seq_group.sampling_params.logits_processors) == 0, (
502+
"Logits Processors are not supported in multi-step decoding")
502503
for parent_id, next_token_id in zip(parent_ids, next_token_ids):
503504
# TODO(will): support logprobs
504505
# Hard coded logprob

0 commit comments

Comments (0)