Skip to content

Commit 0d06277

Browse files
fix gptoss ckpt
1 parent 1e9a459 commit 0d06277

File tree

2 files changed

+3
-3
lines changed

2 files changed

+3
-3
lines changed

src/megatron/bridge/models/gpt_oss/gpt_oss_provider.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -63,8 +63,8 @@ class GPTOSSProvider(GPTModelProvider):
6363
yarn_beta_fast: float = 32.0
6464
yarn_beta_slow: float = 1.0
6565
yarn_correction_range_round_to_int: bool = False
66-
yarn_mscale: Optional[float] = None
67-
yarn_mscale_all_dim: Optional[float] = None
66+
yarn_mscale: Optional[float] = 1.0 # NOTE(yiakwy): default was previously None
67+
yarn_mscale_all_dim: Optional[float] = 1.0 # NOTE(yiakwy): default was previously None
6868

6969
moe_router_topk: int = 4
7070
moe_router_pre_softmax: bool = False

src/megatron/bridge/training/config.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -153,7 +153,7 @@ class DistributedInitConfig:
153153
Make sure EP and CP aren't used with this option enabled.
154154
"""
155155

156-
use_gloo_process_groups: bool = True
156+
use_gloo_process_groups: bool = False # NOTE(yiakwy): default was previously True
157157
"""If set, create Gloo process groups for communications."""
158158

159159
use_sharp: bool = False

0 commit comments

Comments
 (0)