mirror of
https://github.com/hpcaitech/ColossalAI.git
synced 2025-08-23 10:11:37 +00:00
update reward
This commit is contained in:
parent
c8db826782
commit
a537aa1c20
@ -21,7 +21,7 @@ class VerifiableReward:
|
|||||||
# Get batch size
|
# Get batch size
|
||||||
bs = input_ids.size(0)
|
bs = input_ids.size(0)
|
||||||
# Initialize reward
|
# Initialize reward
|
||||||
rewards = torch.zeros(bs, device=input_ids.device)
|
rewards = torch.zeros((bs, 3), device=input_ids.device)
|
||||||
|
|
||||||
# Loop through reward functions
|
# Loop through reward functions
|
||||||
for reward_fn in self.reward_fns:
|
for reward_fn in self.reward_fns:
|
||||||
|
Loading…
Reference in New Issue
Block a user