We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent fb626ee commit 451612c Copy full SHA for 451612c
swift/trainers/rlhf_trainer/grpo_trainer.py
@@ -251,7 +251,7 @@ def __init__(self,
251
self.vllm_use_async_engine = False
252
self.enable_offload = False
253
self.use_gym_env = False
254
- self.enable_server_multi_turn = self.args.multi_turn_scheduler is not None
+ self.enable_server_multi_turn = False
255
# for multi-turn server, maybe the num of rollout outputs is not equal to the num of rollout inputs
256
self.dynamic_num_samples = False
257
if self.use_vllm:
0 commit comments