File tree Expand file tree Collapse file tree 2 files changed +2 -2 lines changed
Expand file tree Collapse file tree 2 files changed +2 -2 lines changed
Original file line number Diff line number Diff line change
@@ -29,7 +29,7 @@ actor_rollout_ref:
2929 use_torch_compile : True # False to disable torch compile
3030 clip_ratio : 0.2
3131 use_dual_clip : False # add Dual-clip PPO from https://arxiv.org/pdf/1912.09729
32- clip_ratio_c : 3 # lower bound of the value for Dual-clip PPO from https://arxiv.org/pdf/1912.09729
32+ clip_ratio_c : 3.0 # lower bound of the value for Dual-clip PPO from https://arxiv.org/pdf/1912.09729
3333 entropy_coeff : 0.001
3434 use_kl_loss : False # True for GRPO
3535 kl_loss_coef : 0.001 # for GRPO
Original file line number Diff line number Diff line change @@ -32,7 +32,7 @@ actor_rollout_ref:
3232 grad_clip : 1.0
3333 clip_ratio : 0.2
3434 use_dual_clip : False # add Dual-clip PPO from https://arxiv.org/pdf/1912.09729
35- clip_ratio_c : 3i # lower bound of the value for Dual-clip PPO from https://arxiv.org/pdf/1912.09729
35+ clip_ratio_c : 3.0 # lower bound of the value for Dual-clip PPO from https://arxiv.org/pdf/1912.09729
3636 entropy_coeff : 0.001
3737 use_kl_loss : False # True for GRPO
3838 use_torch_compile : True # False to disable torch compile
You can’t perform that action at this time.
0 commit comments