mirror of
https://github.com/hpcaitech/ColossalAI.git
synced 2026-05-18 05:23:00 +00:00
[feat] support meta cache, meta_grad_send, meta_tensor_send; fix runtime too long in Recv Bwd; benchmark for llama + Hybrid(tp+pp);
This commit is contained in:
@@ -758,11 +758,11 @@ def run_with_hybridplugin(test_config):
|
||||
@parameterize(
|
||||
"config",
|
||||
[
|
||||
(0, 1, 4, 1, 1),
|
||||
(1, 2, 2, 1, 1),
|
||||
# (0, 1, 4, 1, 1),
|
||||
# (1, 2, 2, 1, 1),
|
||||
(1, 1, 2, 2, 1),
|
||||
(1, 2, 1, 2, 1),
|
||||
(1, 2, 1, 1, 2),
|
||||
# (1, 2, 1, 2, 1),
|
||||
# (1, 2, 1, 1, 2),
|
||||
],
|
||||
)
|
||||
def run_with_booster_moehybridplugin(config: Tuple[int, ...]):
|
||||
@@ -923,10 +923,10 @@ def run_with_booster_moehybridplugin(config: Tuple[int, ...]):
|
||||
@parameterize(
|
||||
"config",
|
||||
[
|
||||
(0, 4, 1, 1),
|
||||
# (0, 4, 1, 1),
|
||||
(1, 2, 2, 1),
|
||||
(1, 2, 1, 2),
|
||||
(1, 1, 2, 2),
|
||||
# (1, 2, 1, 2),
|
||||
# (1, 1, 2, 2), # TODO: no pp show gather result err
|
||||
],
|
||||
)
|
||||
def run_with_booster_hybridplugin(config: Tuple[int, ...]):
|
||||
@@ -976,7 +976,7 @@ def run_with_booster_hybridplugin(config: Tuple[int, ...]):
|
||||
|
||||
zbv_schedule = graph.get_v_schedule()
|
||||
|
||||
# init MoeHybridPlugin
|
||||
# init HybridParallelPlugin
|
||||
plugin = HybridParallelPlugin(
|
||||
pp_size=pp_size,
|
||||
num_microbatches=pp_size,
|
||||
|
||||
Reference in New Issue
Block a user