mirror of
https://github.com/hpcaitech/ColossalAI.git
synced 2025-09-06 11:32:10 +00:00
[Feat]Tensor Model Parallel Support For Inference (#5563)
* tensor parallel support naive source
* [fix] precision, model load and refactor the framework
* add tp unit test
* docstring
* fix do_sample
This commit is contained in:
@@ -40,7 +40,7 @@ def check_inference_engine(use_cuda_graph=False, batch_size=32):
|
||||
|
||||
input_len = 1024
|
||||
output_len = 128
|
||||
-do_sample = True
|
||||
+do_sample = False
|
||||
top_p = 0.5
|
||||
top_k = 50
|
||||
|
||||
|
Reference in New Issue
Block a user