[Inference/Refactor] Delete duplicated code and refactor vec_copy utils and reduce utils (#5593)

* delete duplicated code and refactor vec_copy utils and reduce utils

* delete unused header file
This commit is contained in:
傅剑寒
2024-04-15 10:57:51 +08:00
committed by GitHub
parent a21912339a
commit d4cb023b62
16 changed files with 161 additions and 345 deletions

View File

@@ -1,11 +0,0 @@
from .layer_norm import MixedFusedLayerNorm as LayerNorm
from .multihead_attention import MultiHeadAttention
from .scaled_softmax import AttnMaskType, FusedScaleMaskSoftmax, ScaledUpperTriangMaskedSoftmax
# Public API of this package: the names exposed by a star-import
# (``from <package> import *``). Every entry is bound by the relative
# imports at the top of this module.
__all__ = [
    "LayerNorm",
    "MultiHeadAttention",
    "FusedScaleMaskSoftmax",
    "ScaledUpperTriangMaskedSoftmax",
    "AttnMaskType",
]