[chat] polish code note typo (#3612)

2025-09-22 09:59:38 +00:00 · 2023-04-20 17:22:15 +08:00
parent c4709d34cf
commit d7bf284706
10 changed files with 18 additions and 18 deletions
--- a/applications/Chat/coati/ray/src/detached_trainer_ppo.py
+++ b/applications/Chat/coati/ray/src/detached_trainer_ppo.py
@@ -29,7 +29,7 @@ class DetachedPPOTrainer(DetachedTrainer):
        lora_rank (int) : for actor / critic init
        train_batch_size (int, defaults to 8): the batch size to use for training
        train_batch_size (int, defaults to 8): the batch size to use for training
-        buffer_limit (int, defaults to 0): the max_size limitaiton of replay buffer
+        buffer_limit (int, defaults to 0): the max_size limitation of replay buffer
        buffer_cpu_offload (bool, defaults to True): whether to offload replay buffer to cpu
        eps_clip (float, defaults to 0.2): the clip coefficient of policy loss
        value_clip (float, defaults to 0.4): the clip coefficient of value loss
--- a/applications/Chat/coati/ray/src/experience_maker_holder.py
+++ b/applications/Chat/coati/ray/src/experience_maker_holder.py
@@ -83,7 +83,7 @@ class ExperienceMakerHolder:
        chosen_trainer = None
        min_length = None
        if 'debug' in self.generate_kwargs and self.generate_kwargs['debug'] == True:
-            print("[maker] choosing tartget trainer")
+            print("[maker] choosing target trainer")
        while chosen_trainer is None:
            for target_trainer in self.target_trainer_list:
                try: