[inference/model] Adapted to the baichuan2-7B model (#5591)

* Adapted to the baichuan2-7B model

* modified according to the review comments.

* Modified the method of obtaining random weights.

* modified according to the review comments.

* change mlp layer 'NOTE'
This commit is contained in:
yuehuayingxueluo
2024-04-15 16:53:02 +08:00
committed by GitHub
parent d4cb023b62
commit 56b222eff8
8 changed files with 354 additions and 2 deletions

View File

@@ -27,6 +27,7 @@ PP_AXIS, TP_AXIS = 0, 1
_supported_models = [
"LlamaForCausalLM",
"BaichuanForCausalLM",
]
_BATCH_SIZES_TO_CAPTURE = [1, 2, 4] + [8 * i for i in range(1, 33)]