[chatgpt] strategy add prepare method (#2766)

* [chatgpt] strategy add prepare method
* [chatgpt] refactor examples
* [chatgpt] refactor strategy.prepare
* [chatgpt] support save/load checkpoint
* [chatgpt] fix unwrap actor
* [chatgpt] fix unwrap actor
2025-09-11 13:59:08 +00:00 · 2023-02-17 11:27:27 +08:00
parent a2b43e393d
commit 4ee311c026
9 changed files with 164 additions and 15 deletions
--- a/applications/ChatGPT/examples/train_dummy.py
+++ b/applications/ChatGPT/examples/train_dummy.py
@@ -68,6 +68,9 @@ def main(args):
    else:
        raise ValueError(f'Unsupported model "{args.model}"')

+    (actor, actor_optim), (critic, critic_optim), reward_model, initial_model = strategy.prepare(
+        (actor, actor_optim), (critic, critic_optim), reward_model, initial_model)
+
    # configure trainer
    trainer = PPOTrainer(
        strategy,
--- a/applications/ChatGPT/examples/train_prompts.py
+++ b/applications/ChatGPT/examples/train_prompts.py
@@ -68,6 +68,9 @@ def main(args):
        batch = tokenizer(texts, return_tensors='pt', max_length=96, padding=True, truncation=True)
        return {k: v.cuda() for k, v in batch.items()}

+    (actor, actor_optim), (critic, critic_optim), reward_model, initial_model = strategy.prepare(
+        (actor, actor_optim), (critic, critic_optim), reward_model, initial_model)
+
    # configure trainer
    trainer = PPOTrainer(
        strategy,