mirror of
https://github.com/hpcaitech/ColossalAI.git
synced 2025-09-05 02:51:59 +00:00
add simple grpo
This commit is contained in:
@@ -210,6 +210,8 @@ class VLLMInferenceBackend(BaseInferenceBackend):
            "action_log_probs": log_probs,
            "action_mask": action_mask,
        }
        if "gt_answer" in kwargs:
            data["gt_answer"] = kwargs["gt_answer"]
        data = {k: v.to(get_current_device()) for k, v in data.items()}
        return data
Reference in New Issue
Block a user