mirror of
https://github.com/hpcaitech/ColossalAI.git
synced 2025-08-13 13:45:51 +00:00
fix logging
This commit is contained in:
parent
1f31f4f4fb
commit
275c083bab
@ -474,19 +474,14 @@ class GRPOConsumer(BaseConsumer):
|
|||||||
if (not self.plugin.pp_size > 1 and self.rank == 0) or (
|
if (not self.plugin.pp_size > 1 and self.rank == 0) or (
|
||||||
self.plugin.pp_size > 1 and self.booster.plugin.stage_manager.is_last_stage() and self.tp_rank == 0
|
self.plugin.pp_size > 1 and self.booster.plugin.stage_manager.is_last_stage() and self.tp_rank == 0
|
||||||
):
|
):
|
||||||
to_log_msg = (
|
to_log_msg = [
|
||||||
[
|
f"Loss: {self.accum_loss.item() / self.accum_count:.4f}",
|
||||||
f"Loss: {self.accum_loss.item() / self.accum_count:.4f}",
|
f"Reward: {self.accum_reward.item() / self.accum_count:.4f}",
|
||||||
f"Reward: {self.accum_reward.item() / self.accum_count:.4f}",
|
f"format Reward: {self.accum_format_acc.item() / self.accum_count:.4f}",
|
||||||
f"format Reward: {self.accum_format_acc.item() / self.accum_count:.4f}",
|
f"Acc Reward: {self.accum_ans_acc.item() / self.accum_count:.4f}",
|
||||||
f"Acc Reward: {self.accum_ans_acc.item() / self.accum_count:.4f}",
|
f"Advantages: {self.accum_advantages.item() / self.accum_count:.4f}",
|
||||||
f"Advantages: {self.accum_advantages.item() / self.accum_count:.4f}",
|
f"Response Length: {self.accum_response_length.item() / self.accum_count:.4f}",
|
||||||
f"Response Length: {self.accum_response_length.item() / self.accum_count:.4f}",
|
] + ([f"KL: {self.accum_kl.item() / self.accum_count:.4f}"] if self.policy_loss_fn.beta > 0 else [])
|
||||||
]
|
|
||||||
+ [f"KL: {self.accum_kl.item() / self.accum_count:.4f}"]
|
|
||||||
if self.policy_loss_fn.beta > 0
|
|
||||||
else []
|
|
||||||
)
|
|
||||||
print("\n".join(to_log_msg))
|
print("\n".join(to_log_msg))
|
||||||
metrics = {
|
metrics = {
|
||||||
"metrics/reward": self.accum_reward.item() / self.accum_count,
|
"metrics/reward": self.accum_reward.item() / self.accum_count,
|
||||||
|
Loading…
Reference in New Issue
Block a user