Mirror of https://github.com/hpcaitech/ColossalAI.git
[pipeline] refactor the pipeline module (#1087)
* [pipeline] refactor the pipeline module
* polish code
@@ -19,7 +19,7 @@ from colossalai.testing import rerun_on_exception, skip_if_not_enough_gpus
 
 
 def build_pipeline(model):
-    from colossalai.builder.pipeline import partition_uniform
+    from colossalai.pipeline.utils import partition_uniform
 
     pipeline_size = gpc.get_world_size(ParallelMode.PIPELINE)
     pipeline_rank = gpc.get_local_rank(ParallelMode.PIPELINE)
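The changed import reflects partition_uniform moving from colossalai.builder.pipeline to colossalai.pipeline.utils. For readers unfamiliar with the helper, here is a minimal sketch of the uniform-partitioning idea; the function name and return shape below are illustrative assumptions, not the actual colossalai.pipeline.utils API.

# Hypothetical sketch of uniform layer partitioning across pipeline
# stages; the real partition_uniform signature and return format in
# colossalai.pipeline.utils may differ.
def uniform_ranges(num_layers, num_stages):
    # Each stage gets floor(num_layers / num_stages) layers; the
    # remainder is spread one extra layer over the earliest stages.
    base, extra = divmod(num_layers, num_stages)
    ranges, start = [], 0
    for stage in range(num_stages):
        end = start + base + (1 if stage < extra else 0)
        ranges.append((start, end))  # half-open [start, end) layer span
        start = end
    return ranges

print(uniform_ranges(10, 4))  # [(0, 3), (3, 6), (6, 8), (8, 10)]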
@@ -1,59 +0,0 @@
-import torch
-import torch.multiprocessing as mp
-
-from colossalai.utils.model.pipelinable import PipelinableContext
-
-from colossalai.testing import rerun_on_exception
-
-NUM_CHUNKS = 1
-PIPELINE_SIZE = 2
-
-
-class MLP(torch.nn.Module):
-
-    def __init__(self, dim: int = 256):
-        super().__init__()
-        intermediate_dim = dim * 4
-        self.dense_1 = torch.nn.Linear(dim, intermediate_dim)
-        self.activation = torch.nn.GELU()
-        self.dense_2 = torch.nn.Linear(intermediate_dim, dim)
-        self.dropout = torch.nn.Dropout(0.1)
-
-    def forward(self, x):
-        x = self.dense_1(x)
-        x = self.activation(x)
-        x = self.dense_2(x)
-        x = self.dropout(x)
-        return x
-
-
-def run_pipelinable(rank):
-    pipelinable = PipelinableContext()
-    with pipelinable:
-        model = MLP()
-
-    assert pipelinable.policy == "balanced"
-    pipelinable.load_policy("uniform")
-    assert pipelinable.policy == "uniform"
-    pipelinable.to_layer_list()
-
-    assert pipelinable.layers_count == len(list(model.children()))
-
-    pipeline_model_part_0 = pipelinable.partition(NUM_CHUNKS, PIPELINE_SIZE, 0)
-    assert isinstance(pipeline_model_part_0, torch.nn.Module)
-    pipeline_model_part_1 = pipelinable.partition(NUM_CHUNKS, PIPELINE_SIZE, 1)
-    assert isinstance(pipeline_model_part_1, torch.nn.Module)
-
-    layers_count_in_part_0 = len(list(pipeline_model_part_0._module_list))
-    layers_count_in_part_1 = len(list(pipeline_model_part_1._module_list))
-
-    assert layers_count_in_part_0 + layers_count_in_part_1 == pipelinable.layers_count
-
-
-@rerun_on_exception(exception_type=mp.ProcessRaisedException, pattern=".*Address already in use.*")
-def test_pipelinable():
-    mp.spawn(run_pipelinable, nprocs=1)
-
-
-if __name__ == '__main__':
-    test_pipelinable()
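The deleted test only verifies bookkeeping: the traced layer count matches the model's child count, and the two partitions together cover every layer. As a rough sketch of what those two partitioned stage modules amount to at runtime, the following assumes each stage simply chains a contiguous slice of the original layers; the real pipeline engine instead places the stages on separate ranks and communicates activations between them. The Stage class here is a hypothetical stand-in, not ColossalAI's partition output type.

import torch

# Hypothetical stand-in for a partitioned pipeline stage: it owns a
# contiguous slice of the original model's layers and runs them in order.
class Stage(torch.nn.Module):
    def __init__(self, layers):
        super().__init__()
        self.layers = torch.nn.ModuleList(layers)

    def forward(self, x):
        for layer in self.layers:
            x = layer(x)
        return x

# The 4-layer MLP from the deleted test, flattened into a Sequential.
full = torch.nn.Sequential(torch.nn.Linear(256, 1024), torch.nn.GELU(),
                           torch.nn.Linear(1024, 256), torch.nn.Dropout(0.1))
# With PIPELINE_SIZE = 2 the uniform policy splits the four layers 2/2;
# running the stages back to back matches the unpartitioned forward pass.
part_0 = Stage(list(full.children())[:2])
part_1 = Stage(list(full.children())[2:])
x = torch.randn(8, 256)
assert part_1(part_0(x)).shape == x.shape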