mirror of
https://github.com/hpcaitech/ColossalAI.git
synced 2025-09-09 04:50:17 +00:00
[inference/model]Adapted to the baichuan2-7B model (#5591)
* Adapted to the baichuan2-7B model * modified according to the review comments. * Modified the method of obtaining random weights. * modified according to the review comments. * change mlp layer 'NOTE'
This commit is contained in:
@@ -479,7 +479,7 @@ class NopadLlamaAttention(LlamaAttention):
|
||||
return attn_output
|
||||
|
||||
|
||||
# NOTE This will cause the result to be different from the transformer in some cases.
|
||||
# NOTE This will cause difference as out length increases.
|
||||
class NopadLlamaMLP(LlamaMLP):
|
||||
def __init__(
|
||||
self,
|
||||
|
Reference in New Issue
Block a user