mirror of
https://github.com/hpcaitech/ColossalAI.git
synced 2025-08-03 17:19:51 +00:00
update reward
This commit is contained in:
parent
754b16dfbf
commit
71a0181fce
@ -21,7 +21,7 @@ class VerifiableReward:
|
|||||||
# Get batch size
|
# Get batch size
|
||||||
bs = input_ids.size(0)
|
bs = input_ids.size(0)
|
||||||
# Initialize reward
|
# Initialize reward
|
||||||
rewards = torch.zeros(bs, device=input_ids.device)
|
rewards = torch.zeros((bs, 3), device=input_ids.device)
|
||||||
|
|
||||||
# Loop through reward functions
|
# Loop through reward functions
|
||||||
for reward_fn in self.reward_fns:
|
for reward_fn in self.reward_fns:
|
||||||
|
Loading…
Reference in New Issue
Block a user