Mirror of https://github.com/hpcaitech/ColossalAI.git (synced 2025-09-09 04:50:17 +00:00)
[Inference] Fix API server, test and example (#5712)
* fix api server
* fix generation config
* fix api server
* fix comments
* fix infer hanging bug
* resolve comments, change backend to free port
This commit is contained in:
@@ -23,7 +23,7 @@ class CompletionServing:
|
||||
|
||||
# it is not a intuitive way
|
||||
self.engine.engine.generation_config = generation_config
|
||||
- result_generator = self.engine.generate(request_id, prompt=prompt)
|
||||
+ result_generator = self.engine.generate(request_id, prompt=prompt, generation_config=generation_config)
|
||||
|
||||
if await request.is_disconnected():
|
||||
# Abort the request if the client disconnects.
|
||||
|
Reference in New Issue
Block a user