[chat] polish code note typo (#3612)

This commit is contained in:
digger-yu
2023-04-20 17:22:15 +08:00
committed by GitHub
parent c4709d34cf
commit d7bf284706
10 changed files with 18 additions and 18 deletions

View File

@@ -29,7 +29,7 @@ class DetachedPPOTrainer(DetachedTrainer):
lora_rank (int) : for actor / critic init
train_batch_size (int, defaults to 8): the batch size to use for training
train_batch_size (int, defaults to 8): the batch size to use for training
-buffer_limit (int, defaults to 0): the max_size limitaiton of replay buffer
+buffer_limit (int, defaults to 0): the max_size limitation of replay buffer
buffer_cpu_offload (bool, defaults to True): whether to offload replay buffer to cpu
eps_clip (float, defaults to 0.2): the clip coefficient of policy loss
value_clip (float, defaults to 0.4): the clip coefficient of value loss

View File

@@ -83,7 +83,7 @@ class ExperienceMakerHolder:
chosen_trainer = None
min_length = None
if 'debug' in self.generate_kwargs and self.generate_kwargs['debug'] == True:
-print("[maker] choosing tartget trainer")
+print("[maker] choosing target trainer")
while chosen_trainer is None:
for target_trainer in self.target_trainer_list:
try: