Add multi-node support

This commit is contained in:
PeterGriffinJin
2025-04-10 12:26:43 +00:00
parent 968c38c38b
commit a2870cb320
2 changed files with 136 additions and 2 deletions

View File

@@ -448,7 +448,7 @@ class RayPPOTrainer(object):
max_prompt_length=self.config.data.max_prompt_length,
max_response_length=self.config.data.max_response_length,
max_obs_length=self.config.data.max_obs_length,
-num_gpus=self.config.trainer.n_gpus_per_node,
+num_gpus=self.config.trainer.n_gpus_per_node * self.config.trainer.nnodes,
no_think_rl=self.config.algorithm.no_think_rl,
search_url = self.config.retriever.url,
topk = self.config.retriever.topk,
@@ -679,7 +679,7 @@ class RayPPOTrainer(object):
max_prompt_length=self.config.data.max_prompt_length,
max_response_length=self.config.data.max_response_length,
max_obs_length=self.config.data.max_obs_length,
-num_gpus=self.config.trainer.n_gpus_per_node,
+num_gpus=self.config.trainer.n_gpus_per_node * self.config.trainer.nnodes,
no_think_rl=self.config.algorithm.no_think_rl,
search_url = self.config.retriever.url,
topk = self.config.retriever.topk,