File tree Expand file tree Collapse file tree 2 files changed +6
-6
lines changed
Expand file tree Collapse file tree 2 files changed +6
-6
lines changed Original file line number Diff line number Diff line change @@ -135,11 +135,12 @@ class SchedulerConfig:
135135 like full attention and sliding window attention.
136136 """
137137
138- async_scheduling : bool = False
139- """If set to True, perform async scheduling. This helps to avoid gaps in
140- GPU utilization, leading to better latency and throughput.
141- Async scheduling is currently not supported with some features such as
142- speculative decoding and pipeline parallelism.
138+ async_scheduling : bool = Field (default = None )
139+ """If set to False, disable async scheduling. Async scheduling helps to
140+ avoid gaps in GPU utilization, leading to better latency and throughput.
141+ It is currently not supported with some features such as
142+ speculative decoding and pipeline parallelism, and will be automatically
143+ disabled in those cases.
143144 """
144145
145146 def get_scheduler_cls (self ) -> type ["SchedulerInterface" ]:
Original file line number Diff line number Diff line change @@ -379,7 +379,6 @@ def __post_init__(self):
379379 )
380380 elif self .scheduler_config .async_scheduling is None :
381381 # Enable async scheduling unless there is an incompatible option.
382- # NOTE: we won't reach here until async scheduling is enabled by default.
383382 if (
384383 self .parallel_config .pipeline_parallel_size > 1
385384 or self .speculative_config is not None
You can’t perform that action at this time.
0 commit comments