[gemini] gemini supports lazy init (#3379)

* [gemini] fix nvme optimizer init

* [gemini] gemini supports lazy init

* [gemini] add init example

* [gemini] add fool model

* [zero] update gemini ddp

* [zero] update init example

* add chunk method

* add chunk method

* [lazyinit] fix lazy tensor tolist

* [gemini] fix buffer materialization

* [misc] remove useless file

* [booster] update gemini plugin

* [test] update gemini plugin test

* [test] fix gemini plugin test

* [gemini] fix import

* [gemini] fix import

* [lazyinit] use new metatensor

* [lazyinit] use new metatensor

* [lazyinit] fix __set__ method
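The headline change is lazy initialization support in Gemini. As a rough illustration of the underlying idea (a hypothetical sketch using plain PyTorch meta tensors, not the ColossalAI API), a module can be built on the meta device so its parameters carry shape and dtype but no real storage, and be materialized only later:

```python
import torch
import torch.nn as nn

# Hypothetical sketch of lazy init (not the ColossalAI API): construct the
# module on the meta device so no real parameter memory is allocated.
layer = nn.Linear(1024, 1024, device='meta')
assert layer.weight.is_meta  # parameters have no storage yet

# Materialize later; to_empty() allocates real but uninitialized storage.
layer = layer.to_empty(device='cpu')
assert not layer.weight.is_meta
```

This defers allocation until the runtime (here, Gemini) decides where and how each parameter should live.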
Author: Hongxin Liu
Date: 2023-04-12 16:03:25 +08:00
Committed by: GitHub
Parent: 366a035552
Commit: 152239bbfa
7 changed files with 80 additions and 72 deletions


@@ -2,8 +2,6 @@ import torch
 import torch.distributed as dist
 from packaging import version
 
-aten = torch.ops.aten
-
 __all__ = [
     "_TorchFactoryMethod",
     "_TorchOverrideableFactoryMethod",
@@ -51,6 +49,7 @@ _DistCommMethod = [
 ]
 
 if version.parse(torch.__version__) >= version.parse('1.12.0'):
+    aten = torch.ops.aten
    # TODO: dive deep here
    # refer to https://github.com/pytorch/pytorch/blob/master/aten/src/ATen/native/TensorShape.cpp
    _AliasATen = [
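The diff above moves the `aten = torch.ops.aten` binding behind a PyTorch version guard. A minimal, self-contained sketch of that pattern (the exact op used here is illustrative, not taken from the commit):

```python
import torch
from packaging import version

# Expose the aten op namespace only on PyTorch >= 1.12, where the
# overload packets referenced later in the module are available.
if version.parse(torch.__version__) >= version.parse('1.12.0'):
    aten = torch.ops.aten
    # Example: invoke an aten overload directly through the namespace.
    out = aten.add.Tensor(torch.ones(2), torch.ones(2))
    assert torch.equal(out, torch.full((2,), 2.0))
```

Gating the binding this way keeps the module importable on older PyTorch versions instead of failing at import time.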