feat(model): Support llama.cpp server deploy (#2263)

This commit is contained in:
Fangyin Cheng
2025-01-02 16:50:53 +08:00
committed by GitHub
parent 576da34e92
commit 0b2af2e9a2
14 changed files with 823 additions and 44 deletions

View File

@@ -42,6 +42,13 @@ def get_llm_model_adapter(
from dbgpt.model.adapter.vllm_adapter import VLLMModelAdapterWrapper
return VLLMModelAdapterWrapper(conv_factory)
if model_type == ModelType.LLAMA_CPP_SERVER:
logger.info(
"Current model type is llama_cpp_server, return LLamaServerModelAdapter"
)
from dbgpt.model.adapter.llama_cpp_adapter import LLamaServerModelAdapter
return LLamaServerModelAdapter()
# Import NewHFChatModelAdapter so that it can be registered
from dbgpt.model.adapter.hf_adapter import NewHFChatModelAdapter