mirror of
https://github.com/csunny/DB-GPT.git
synced 2025-10-24 19:08:58 +00:00
293 lines
9.6 KiB
Python
293 lines
9.6 KiB
Python
"""
|
|
This code file will be deprecated in the future.
|
|
We have integrated fastchat. For details, see: dbgpt/model/model_adapter.py
|
|
"""
|
|
#!/usr/bin/env python3
|
|
# -*- coding: utf-8 -*-
|
|
|
|
from functools import cache
|
|
from typing import Dict, List, Tuple
|
|
|
|
from dbgpt.core.interface.message import ModelMessage, ModelMessageRoleType
|
|
from dbgpt.model.llm.conversation import Conversation, get_conv_template
|
|
|
|
|
|
class BaseChatAdpter:
|
|
"""The Base class for chat with llm models. it will match the model,
|
|
and fetch output from model"""
|
|
|
|
def match(self, model_path: str):
|
|
return False
|
|
|
|
def get_generate_stream_func(self, model_path: str):
|
|
"""Return the generate stream handler func"""
|
|
from dbgpt.model.llm.inference import generate_stream
|
|
|
|
return generate_stream
|
|
|
|
def get_conv_template(self, model_path: str) -> Conversation:
|
|
return None
|
|
|
|
def model_adaptation(
|
|
self, params: Dict, model_path: str, prompt_template: str = None
|
|
) -> Tuple[Dict, Dict]:
|
|
"""Params adaptation"""
|
|
conv = self.get_conv_template(model_path)
|
|
messages = params.get("messages")
|
|
# Some model scontext to dbgpt server
|
|
model_context = {"prompt_echo_len_char": -1}
|
|
|
|
if messages:
|
|
# Dict message to ModelMessage
|
|
messages = [
|
|
m if isinstance(m, ModelMessage) else ModelMessage(**m)
|
|
for m in messages
|
|
]
|
|
params["messages"] = messages
|
|
|
|
if prompt_template:
|
|
print(f"Use prompt template {prompt_template} from config")
|
|
conv = get_conv_template(prompt_template)
|
|
|
|
if not conv or not messages:
|
|
# Nothing to do
|
|
print(
|
|
f"No conv from model_path {model_path} or no messages in params, {self}"
|
|
)
|
|
return params, model_context
|
|
conv = conv.copy()
|
|
system_messages = []
|
|
for message in messages:
|
|
role, content = None, None
|
|
if isinstance(message, ModelMessage):
|
|
role = message.role
|
|
content = message.content
|
|
elif isinstance(message, dict):
|
|
role = message["role"]
|
|
content = message["content"]
|
|
else:
|
|
raise ValueError(f"Invalid message type: {message}")
|
|
|
|
if role == ModelMessageRoleType.SYSTEM:
|
|
# Support for multiple system messages
|
|
system_messages.append(content)
|
|
elif role == ModelMessageRoleType.HUMAN:
|
|
conv.append_message(conv.roles[0], content)
|
|
elif role == ModelMessageRoleType.AI:
|
|
conv.append_message(conv.roles[1], content)
|
|
else:
|
|
raise ValueError(f"Unknown role: {role}")
|
|
if system_messages:
|
|
conv.update_system_message("".join(system_messages))
|
|
# Add a blank message for the assistant.
|
|
conv.append_message(conv.roles[1], None)
|
|
new_prompt = conv.get_prompt()
|
|
# Overwrite the original prompt
|
|
# TODO remote bos token and eos token from tokenizer_config.json of model
|
|
prompt_echo_len_char = len(new_prompt.replace("</s>", "").replace("<s>", ""))
|
|
model_context["prompt_echo_len_char"] = prompt_echo_len_char
|
|
model_context["echo"] = params.get("echo", True)
|
|
params["prompt"] = new_prompt
|
|
|
|
# Overwrite model params:
|
|
params["stop"] = conv.stop_str
|
|
|
|
return params, model_context
|
|
|
|
|
|
llm_model_chat_adapters: List[BaseChatAdpter] = []
|
|
|
|
|
|
def register_llm_model_chat_adapter(cls):
|
|
"""Register a chat adapter"""
|
|
llm_model_chat_adapters.append(cls())
|
|
|
|
|
|
@cache
|
|
def get_llm_chat_adapter(model_name: str, model_path: str) -> BaseChatAdpter:
|
|
"""Get a chat generate func for a model"""
|
|
for adapter in llm_model_chat_adapters:
|
|
if adapter.match(model_name):
|
|
print(f"Get model chat adapter with model name {model_name}, {adapter}")
|
|
return adapter
|
|
for adapter in llm_model_chat_adapters:
|
|
if adapter.match(model_path):
|
|
print(f"Get model chat adapter with model path {model_path}, {adapter}")
|
|
return adapter
|
|
raise ValueError(
|
|
f"Invalid model for chat adapter with model name {model_name} and model path {model_path}"
|
|
)
|
|
|
|
|
|
class VicunaChatAdapter(BaseChatAdpter):
|
|
"""Model chat Adapter for vicuna"""
|
|
|
|
def _is_llama2_based(self, model_path: str):
|
|
# see https://huggingface.co/lmsys/vicuna-13b-v1.5
|
|
return "v1.5" in model_path.lower()
|
|
|
|
def match(self, model_path: str):
|
|
return "vicuna" in model_path.lower()
|
|
|
|
def get_conv_template(self, model_path: str) -> Conversation:
|
|
if self._is_llama2_based(model_path):
|
|
return get_conv_template("vicuna_v1.1")
|
|
return None
|
|
|
|
def get_generate_stream_func(self, model_path: str):
|
|
from dbgpt.model.llm_out.vicuna_base_llm import generate_stream
|
|
|
|
if self._is_llama2_based(model_path):
|
|
return super().get_generate_stream_func(model_path)
|
|
return generate_stream
|
|
|
|
|
|
class ChatGLMChatAdapter(BaseChatAdpter):
|
|
"""Model chat Adapter for ChatGLM"""
|
|
|
|
def match(self, model_path: str):
|
|
return "chatglm" in model_path
|
|
|
|
def get_generate_stream_func(self, model_path: str):
|
|
from dbgpt.model.llm_out.chatglm_llm import chatglm_generate_stream
|
|
|
|
return chatglm_generate_stream
|
|
|
|
|
|
class GuanacoChatAdapter(BaseChatAdpter):
|
|
"""Model chat adapter for Guanaco"""
|
|
|
|
def match(self, model_path: str):
|
|
return "guanaco" in model_path
|
|
|
|
def get_generate_stream_func(self, model_path: str):
|
|
from dbgpt.model.llm_out.guanaco_llm import guanaco_generate_stream
|
|
|
|
return guanaco_generate_stream
|
|
|
|
|
|
class FalconChatAdapter(BaseChatAdpter):
|
|
"""Model chat adapter for Guanaco"""
|
|
|
|
def match(self, model_path: str):
|
|
return "falcon" in model_path
|
|
|
|
def get_generate_stream_func(self, model_path: str):
|
|
from dbgpt.model.llm_out.falcon_llm import falcon_generate_output
|
|
|
|
return falcon_generate_output
|
|
|
|
|
|
#
|
|
# class ProxyllmChatAdapter(BaseChatAdpter):
|
|
# def match(self, model_path: str):
|
|
# return "proxyllm" in model_path
|
|
#
|
|
# def get_generate_stream_func(self, model_path: str):
|
|
# from dbgpt.model.llm_out.proxy_llm import proxyllm_generate_stream
|
|
#
|
|
# return proxyllm_generate_stream
|
|
|
|
|
|
class GorillaChatAdapter(BaseChatAdpter):
|
|
def match(self, model_path: str):
|
|
return "gorilla" in model_path
|
|
|
|
def get_generate_stream_func(self, model_path: str):
|
|
from dbgpt.model.llm_out.gorilla_llm import generate_stream
|
|
|
|
return generate_stream
|
|
|
|
|
|
class GPT4AllChatAdapter(BaseChatAdpter):
|
|
def match(self, model_path: str):
|
|
return "gptj-6b" in model_path
|
|
|
|
def get_generate_stream_func(self, model_path: str):
|
|
from dbgpt.model.llm_out.gpt4all_llm import gpt4all_generate_stream
|
|
|
|
return gpt4all_generate_stream
|
|
|
|
|
|
class Llama2ChatAdapter(BaseChatAdpter):
|
|
def match(self, model_path: str):
|
|
return "llama-2" in model_path.lower()
|
|
|
|
def get_conv_template(self, model_path: str) -> Conversation:
|
|
return get_conv_template("llama-2")
|
|
|
|
|
|
class CodeLlamaChatAdapter(BaseChatAdpter):
|
|
"""The model ChatAdapter for codellama ."""
|
|
|
|
def match(self, model_path: str):
|
|
return "codellama" in model_path.lower()
|
|
|
|
def get_conv_template(self, model_path: str) -> Conversation:
|
|
return get_conv_template("codellama")
|
|
|
|
|
|
class BaichuanChatAdapter(BaseChatAdpter):
|
|
def match(self, model_path: str):
|
|
return "baichuan" in model_path.lower()
|
|
|
|
def get_conv_template(self, model_path: str) -> Conversation:
|
|
if "chat" in model_path.lower():
|
|
return get_conv_template("baichuan-chat")
|
|
return get_conv_template("zero_shot")
|
|
|
|
|
|
class WizardLMChatAdapter(BaseChatAdpter):
|
|
def match(self, model_path: str):
|
|
return "wizardlm" in model_path.lower()
|
|
|
|
def get_conv_template(self, model_path: str) -> Conversation:
|
|
return get_conv_template("vicuna_v1.1")
|
|
|
|
|
|
class LlamaCppChatAdapter(BaseChatAdpter):
|
|
def match(self, model_path: str):
|
|
from dbgpt.model.adapter.old_adapter import LlamaCppAdapater
|
|
|
|
if "llama-cpp" == model_path:
|
|
return True
|
|
is_match, _ = LlamaCppAdapater._parse_model_path(model_path)
|
|
return is_match
|
|
|
|
def get_conv_template(self, model_path: str) -> Conversation:
|
|
return get_conv_template("llama-2")
|
|
|
|
def get_generate_stream_func(self, model_path: str):
|
|
from dbgpt.model.llm_out.llama_cpp_llm import generate_stream
|
|
|
|
return generate_stream
|
|
|
|
|
|
class InternLMChatAdapter(BaseChatAdpter):
|
|
"""The model adapter for internlm/internlm-chat-7b"""
|
|
|
|
def match(self, model_path: str):
|
|
return "internlm" in model_path.lower()
|
|
|
|
def get_conv_template(self, model_path: str) -> Conversation:
|
|
return get_conv_template("internlm-chat")
|
|
|
|
|
|
register_llm_model_chat_adapter(VicunaChatAdapter)
|
|
register_llm_model_chat_adapter(ChatGLMChatAdapter)
|
|
register_llm_model_chat_adapter(GuanacoChatAdapter)
|
|
register_llm_model_chat_adapter(FalconChatAdapter)
|
|
register_llm_model_chat_adapter(GorillaChatAdapter)
|
|
register_llm_model_chat_adapter(GPT4AllChatAdapter)
|
|
register_llm_model_chat_adapter(Llama2ChatAdapter)
|
|
register_llm_model_chat_adapter(CodeLlamaChatAdapter)
|
|
register_llm_model_chat_adapter(BaichuanChatAdapter)
|
|
register_llm_model_chat_adapter(WizardLMChatAdapter)
|
|
register_llm_model_chat_adapter(LlamaCppChatAdapter)
|
|
register_llm_model_chat_adapter(InternLMChatAdapter)
|
|
|
|
# Proxy model for test and develop, it's cheap for us now.
|
|
# register_llm_model_chat_adapter(ProxyllmChatAdapter)
|
|
|
|
register_llm_model_chat_adapter(BaseChatAdpter)
|