@@ -55,6 +55,10 @@ class EPLBConfig:
5555 Log the balancedness each step of expert parallelism.
5656 This is turned off by default since it will cause communication overhead.
5757 """
58+ use_async : bool = False
59+ """
60+ Whether to use non-blocking EPLB.
61+ """
5862
5963
6064@config
@@ -118,6 +122,10 @@ class ParallelConfig:
118122 """`eplb_log_balancedness` is deprecated and has been replaced with
119123 `eplb_config.log_balancedness`. This will be removed in v0.12.0.
120124 Please use `eplb_config.log_balancedness` instead."""
125+ eplb_use_async : Optional [bool ] = None
126+ """`eplb_use_async` is deprecated and has been replaced with
127+ `eplb_config.use_async`. This will be removed in v0.12.0.
128+ Please use `eplb_config.use_async` instead."""
121129
122130 max_parallel_loading_workers : Optional [int ] = None
123131 """Maximum number of parallel loading workers when loading model
@@ -304,6 +312,13 @@ def __post_init__(self) -> None:
304312 "with eplb_config.log_balancedness. This will be removed "
305313 "in v0.12.0. Changing this field after initialization will "
306314 "have no effect." )
315+ if self .eplb_use_async is not None :
316+ self .eplb_config .use_async = self .eplb_use_async
317+ logger .warning_once (
318+ "eplb_use_async is deprecated and has been replaced "
319+ "with eplb_config.use_async. This will be removed "
320+ "in v0.12.0. Changing this field after initialization will "
321+ "have no effect." )
307322
308323 # Continue with the rest of the initialization
309324 self .world_size = self .pipeline_parallel_size * \
0 commit comments