Merge branch 'grpo-latest-rebase-main' of https://github.com/hpcaitech/ColossalAI into grpo-latest-rebase-main

This commit is contained in:
YeAnbang
2025-08-14 19:03:04 +08:00
4 changed files with 12 additions and 4 deletions

View File

@@ -530,4 +530,4 @@ class GRPOConsumer(BaseConsumer):
model = self.policy_model.unwrap()
state_dict = model.state_dict()
state_dict["consumer_global_step"] = torch.tensor([self.global_step], device=self.device)
return state_dict
return state_dict