mirror of
https://github.com/hpcaitech/ColossalAI.git
synced 2025-09-02 01:28:31 +00:00
[inference/model]Adapted to the baichuan2-7B model (#5591)
* Adapted to the baichuan2-7B model. * Modified according to the review comments. * Modified the method of obtaining random weights. * Modified according to the review comments. * Changed the MLP layer 'NOTE'.
This commit is contained in:
@@ -117,6 +117,7 @@ def benchmark_inference(args):
|
||||
max_output_len=args.output_len,
|
||||
prefill_ratio=1.2,
|
||||
block_size=32,
|
||||
use_cuda_kernel=True,
|
||||
)
|
||||
engine = InferenceEngine(model, tokenizer, inference_config, verbose=True)
|
||||
elif args.mode == "vllm":
|
||||
|
Reference in New Issue
Block a user