mirror of
https://github.com/hpcaitech/ColossalAI.git
synced 2025-08-02 00:01:52 +00:00
update reward
This commit is contained in:
parent
754b16dfbf
commit
71a0181fce
@ -21,7 +21,7 @@ class VerifiableReward:
|
||||
# Get batch size
|
||||
bs = input_ids.size(0)
|
||||
# Initialize reward
|
||||
rewards = torch.zeros(bs, device=input_ids.device)
|
||||
rewards = torch.zeros((bs, 3), device=input_ids.device)
|
||||
|
||||
# Loop through reward functions
|
||||
for reward_fn in self.reward_fns:
|
||||
|
Loading…
Reference in New Issue
Block a user