Skip to content
1 change: 1 addition & 0 deletions verl/workers/rollout/vllm_rollout/vllm_rollout_spmd.py
Original file line number Diff line number Diff line change
Expand Up @@ -208,6 +208,7 @@ def __init__(self, model_path: str, config: RolloutConfig, tokenizer, model_hf_c
n=1,
logprobs=0, # can be set to 0, letting the actor recompute
max_tokens=config.response_length,
repetition_penalty=config.get("repetition_penalty", 1.0),
)

kwargs["detokenize"] = False
Expand Down