diff --git a/pilot/server/vicuna_server.py b/pilot/server/vicuna_server.py index 868e8b6d9..95781b69b 100644 --- a/pilot/server/vicuna_server.py +++ b/pilot/server/vicuna_server.py @@ -10,8 +10,6 @@ from fastapi.responses import StreamingResponse from pilot.model.inference import generate_stream from pydantic import BaseModel from pilot.model.inference import generate_output, get_embeddings -from fastchat.serve.inference import load_model - from pilot.model.loader import ModelLoader from pilot.configs.model_config import *