[chatgpt]fix train_rm bug with lora (#2741)

This commit is contained in:
BlueRum
2023-02-16 10:25:17 +08:00
committed by GitHub
parent b6e3b955c3
commit 648183a960

View File

@@ -43,7 +43,7 @@ class RewardModelTrainer(ABC):
         # train
         if use_lora > 0:
             print("Using Lora")
-            lora.mark_only_lora_as_trainable(self.model)
+            lora.mark_only_lora_as_trainable(self.model.model)
         else:
             self.model.train()
         for chosen_ids, c_mask, reject_ids, r_mask in self.train_dataloader: