mirror of
https://github.com/hpcaitech/ColossalAI.git
synced 2025-09-13 21:22:49 +00:00
[misc] refactor launch API and tensor constructor (#5666)
* [misc] remove config arg from initialize
* [misc] remove old tensor constructor
* [plugin] add npu support for ddp
* [pre-commit.ci] auto fixes from pre-commit.com hooks for more information, see https://pre-commit.ci
* [devops] fix doc test ci
* [test] fix test launch
* [doc] update launch doc
---------
Co-authored-by: pre-commit-ci[bot] <66853113+pre-commit-ci[bot]@users.noreply.github.com>
This commit is contained in:
@@ -8,7 +8,7 @@ from colossalai.testing import parameterize, rerun_if_address_is_in_use, spawn
|
||||
|
||||
def check_alpha_beta(rank, world_size, port, physical_devices):
|
||||
disable_existing_loggers()
|
||||
launch(config={}, rank=rank, world_size=world_size, host="localhost", port=port, backend="nccl")
|
||||
launch(rank=rank, world_size=world_size, host="localhost", port=port, backend="nccl")
|
||||
profiler = AlphaBetaProfiler(physical_devices)
|
||||
ab_dict = profiler.profile_ab()
|
||||
for _, (alpha, beta) in ab_dict.items():
|
||||
|
@@ -75,7 +75,7 @@ def check_2d_device_mesh():
|
||||
|
||||
|
||||
def check_init_from_process_group(rank, world_size, port):
|
||||
colossalai.launch(config={}, rank=rank, world_size=world_size, host="localhost", port=port, backend="nccl")
|
||||
colossalai.launch(rank=rank, world_size=world_size, host="localhost", port=port, backend="nccl")
|
||||
|
||||
|
||||
@pytest.mark.dist
|
||||
|
@@ -8,7 +8,7 @@ from colossalai.testing import parameterize, rerun_if_address_is_in_use, spawn
|
||||
|
||||
def check_extract_alpha_beta(rank, world_size, port, physical_devices):
|
||||
disable_existing_loggers()
|
||||
launch(config={}, rank=rank, world_size=world_size, host="localhost", port=port, backend="nccl")
|
||||
launch(rank=rank, world_size=world_size, host="localhost", port=port, backend="nccl")
|
||||
profiler = AlphaBetaProfiler(physical_devices)
|
||||
|
||||
mesh_alpha, mesh_beta = profiler.extract_alpha_beta_for_device_mesh()
|
||||
|
@@ -9,7 +9,7 @@ from colossalai.testing import rerun_if_address_is_in_use, spawn
|
||||
|
||||
|
||||
def check_layer(rank, world_size, port):
|
||||
launch(config={}, rank=rank, world_size=world_size, host="localhost", port=port, backend="nccl")
|
||||
launch(rank=rank, world_size=world_size, host="localhost", port=port, backend="nccl")
|
||||
|
||||
physical_mesh_id = torch.arange(0, 4)
|
||||
assert rank == dist.get_rank()
|
||||
|
@@ -8,7 +8,7 @@ from colossalai.testing import parameterize, rerun_if_address_is_in_use, spawn
|
||||
|
||||
def check_alpha_beta(rank, world_size, port, physical_devices):
|
||||
disable_existing_loggers()
|
||||
launch(config={}, rank=rank, world_size=world_size, host="localhost", port=port, backend="nccl")
|
||||
launch(rank=rank, world_size=world_size, host="localhost", port=port, backend="nccl")
|
||||
profiler = AlphaBetaProfiler(physical_devices)
|
||||
best_logical_mesh = profiler.search_best_logical_mesh()
|
||||
|
||||
|
Reference in New Issue
Block a user