Skip to content
Merged
Changes from 1 commit
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
3 changes: 2 additions & 1 deletion tests/llm_cache.py
Original file line number Diff line number Diff line change
Expand Up @@ -191,7 +191,7 @@ def get_engine(
model=model_name,
tokenizer=model_name,
max_model_len=max(max_model_len, 256),
max_num_seqs=max_num_seqs,
max_num_seqs=max(max_num_seqs, 4),
Copy link
Collaborator

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

This will leave the test name as-is, which might be confusing, since the test name will still say BS 2.

num_gpu_blocks_override=None,
revision=revision,
)
Expand All @@ -203,6 +203,7 @@ def get_engine(
log_stats=False)

engine_core.scheduler.scheduler_config.max_model_len = max_model_len
engine_core.scheduler.scheduler_config.max_num_seqs = max_num_seqs

if available_blocks is not None:
worker = engine_core.model_executor.driver_worker.worker
Expand Down
Loading