[Distributed RLHF] Integration of PP (#6257)

* update help information
* update style
* fix
* minor fix
* support PP training
* add pp support
* remove unused code
* address conversation

---------

Co-authored-by: Tong Li <tong.li35271158@gmail.com>
2025-09-04 02:26:51 +00:00 · 2025-04-09 13:23:24 +08:00
parent 50153005b4
commit ed43a4be04
7 changed files with 263 additions and 116 deletions
--- a/applications/ColossalChat/coati/distributed/consumer.py
+++ b/applications/ColossalChat/coati/distributed/consumer.py
@@ -54,7 +54,6 @@ class BaseConsumer:

        self.model_config = model_config
        self.plugin_config = plugin_config
-        assert self.plugin_config.get("pp_size", 1) == 1, "pp_size > 1 is not supported now"

        self.device = get_current_device()
        self.lr_scheduler = None
@@ -95,7 +94,6 @@ class BaseConsumer:
                    i = 0
                    for _ in range(self.num_recv_per_update):
                        # receive data from producers
-
                        for r in range(self.num_producers):
                            print(f"[T{dist.get_rank()}] Recv data episode {episode} step {step} from {r}")
                            self.buffer.extend(