mirror of
https://github.com/hpcaitech/ColossalAI.git
synced 2025-04-28 19:55:29 +00:00
[hotfix] fix zero comm buffer init (#6154)
This commit is contained in:
parent
8d826a336e
commit
de3d371f65
@ -371,7 +371,7 @@ class LowLevelZeroOptimizer(OptimizerWrapper):
|
|||||||
for i, sz in enumerate(bucket_store.sizes):
|
for i, sz in enumerate(bucket_store.sizes):
|
||||||
grp = bucket_store.torch_pg if len(bucket_store.sizes) == 1 else bucket_store.torch_pg[i]
|
grp = bucket_store.torch_pg if len(bucket_store.sizes) == 1 else bucket_store.torch_pg[i]
|
||||||
flat_grads_list = list(cur_flat_grads.split(len(cur_flat_grads) // sz))
|
flat_grads_list = list(cur_flat_grads.split(len(cur_flat_grads) // sz))
|
||||||
received_grad = torch.zeros_like(flat_grads_list[0])
|
received_grad = torch.empty_like(flat_grads_list[0])
|
||||||
if self._fp8_communication:
|
if self._fp8_communication:
|
||||||
reduce_scatter_fp8(
|
reduce_scatter_fp8(
|
||||||
received_grad,
|
received_grad,
|
||||||
|
Loading…
Reference in New Issue
Block a user