mirror of
https://github.com/hpcaitech/ColossalAI.git
synced 2025-09-01 09:07:51 +00:00
[Inference/Refactor] Refactor compilation mechanism and unified multi hw (#5613)
* refactor compilation mechanism and unified multi hw
* fix file path bug
* add `__init__.py` to make pybind a module to avoid relative path error caused by softlink
* delete duplicated macros
* fix macros bug in gcc
This commit is contained in:
@@ -1,10 +1,14 @@
|
||||
from .cpu_adam import CpuAdamArmExtension, CpuAdamX86Extension
|
||||
from .flash_attention import FlashAttentionDaoCudaExtension, FlashAttentionNpuExtension, FlashAttentionSdpaCudaExtension
|
||||
from .inference import InferenceOpsCudaExtension
|
||||
from .layernorm import LayerNormCudaExtension
|
||||
from .moe import MoeCudaExtension
|
||||
from .optimizer import FusedOptimizerCudaExtension
|
||||
from .softmax import ScaledMaskedSoftmaxCudaExtension, ScaledUpperTriangleMaskedSoftmaxCudaExtension
|
||||
from .pybind.cpu_adam import CpuAdamArmExtension, CpuAdamX86Extension
|
||||
from .pybind.flash_attention import (
|
||||
FlashAttentionDaoCudaExtension,
|
||||
FlashAttentionNpuExtension,
|
||||
FlashAttentionSdpaCudaExtension,
|
||||
)
|
||||
from .pybind.inference import InferenceOpsCudaExtension
|
||||
from .pybind.layernorm import LayerNormCudaExtension
|
||||
from .pybind.moe import MoeCudaExtension
|
||||
from .pybind.optimizer import FusedOptimizerCudaExtension
|
||||
from .pybind.softmax import ScaledMaskedSoftmaxCudaExtension, ScaledUpperTriangleMaskedSoftmaxCudaExtension
|
||||
|
||||
ALL_EXTENSIONS = [
|
||||
CpuAdamArmExtension,
|
||||
|
Reference in New Issue
Block a user