Skip to content

Commit 7670954

Browse files
[Feature] Non-Blocking EPLB
Signed-off-by: SunChenxiang123 <[email protected]>
1 parent 712d0f8 commit 7670954

File tree

5 files changed

+409
-111
lines changed

5 files changed

+409
-111
lines changed

vllm/config/parallel.py

Lines changed: 15 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -55,6 +55,10 @@ class EPLBConfig:
5555
Log the balancedness each step of expert parallelism.
5656
This is turned off by default since it will cause communication overhead.
5757
"""
58+
use_async: bool = False
59+
"""
60+
Whether to use non-blocking EPLB.
61+
"""
5862

5963

6064
@config
@@ -118,6 +122,10 @@ class ParallelConfig:
118122
"""`eplb_log_balancedness` is deprecated and has been replaced with
119123
`eplb_config.log_balancedness`. This will be removed in v0.12.0.
120124
Please use `eplb_config.log_balancedness` instead."""
125+
eplb_use_async: Optional[bool] = None
126+
"""`eplb_use_async` is deprecated and has been replaced with
127+
`eplb_config.use_async`. This will be removed in v0.12.0.
128+
Please use `eplb_config.use_async` instead."""
121129

122130
max_parallel_loading_workers: Optional[int] = None
123131
"""Maximum number of parallel loading workers when loading model
@@ -304,6 +312,13 @@ def __post_init__(self) -> None:
304312
"with eplb_config.log_balancedness. This will be removed "
305313
"in v0.12.0. Changing this field after initialization will "
306314
"have no effect.")
315+
if self.eplb_use_async is not None:
316+
self.eplb_config.use_async = self.eplb_use_async
317+
logger.warning_once(
318+
"eplb_use_async is deprecated and has been replaced "
319+
"with eplb_config.use_asnyc. This will be removed "
320+
"in v0.12.0. Changing this field after initialization will "
321+
"have no effect.")
307322

308323
# Continue with the rest of the initialization
309324
self.world_size = self.pipeline_parallel_size * \

0 commit comments

Comments
 (0)