From d0f3517b93a926aec1f720e47654c4f041f721d8 Mon Sep 17 00:00:00 2001 From: Tong Li Date: Tue, 22 Apr 2025 14:13:55 +0800 Subject: [PATCH] default 1 episode --- applications/ColossalChat/rl_example.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/applications/ColossalChat/rl_example.py b/applications/ColossalChat/rl_example.py index 317446695..f42a660b7 100644 --- a/applications/ColossalChat/rl_example.py +++ b/applications/ColossalChat/rl_example.py @@ -107,7 +107,7 @@ if __name__ == "__main__": num_producers=args.num_inferencer, num_proc_per_producer=1, num_consumer_procs=args.num_trainers, - num_episodes=10, + num_episodes=1, inference_batch_size=args.inference_batch_size, inference_microbatch_size=args.inference_microbatch_size, train_batch_size=args.train_batch_size,