feat(model): Support llama.cpp server deploy (#2263)

2025-09-12 20:53:48 +00:00 · 2025-01-02 16:50:53 +08:00
parent 576da34e92
commit 0b2af2e9a2
14 changed files with 823 additions and 44 deletions
--- a/dbgpt/model/llm/llama_cpp/llama_cpp.py
+++ b/dbgpt/model/llm/llama_cpp/llama_cpp.py
@@ -1,6 +1,7 @@
 """
 Fork from text-generation-webui https://github.com/oobabooga/text-generation-webui/blob/main/modules/llamacpp_model.py
 """
+
 import logging
 import re
 from typing import Dict
@@ -62,11 +63,11 @@ class LlamaCppModel:
            self.model.__del__()

    @classmethod
-    def from_pretrained(self, model_path, model_params: LlamaCppModelParameters):
+    def from_pretrained(cls, model_path, model_params: LlamaCppModelParameters):
        Llama = llama_cpp_lib(prefer_cpu=model_params.prefer_cpu).Llama
        LlamaCache = llama_cpp_lib(prefer_cpu=model_params.prefer_cpu).LlamaCache

-        result = self()
+        result = cls()
        cache_capacity = 0
        cache_capacity_str = model_params.cache_capacity
        if cache_capacity_str is not None: