fix: lint

2025-08-26 03:49:10 +00:00 · 2023-05-30 19:11:34 +08:00 · 2023-05-30 19:11:34 +08:00 · 16c6986666
commit 16c6986666
parent 1bbed02a3c
6 changed files with 34 additions and 26 deletions
--- a/pilot/model/adapter.py
+++ b/pilot/model/adapter.py
@@ -85,8 +85,10 @@ class ChatGLMAdapater(BaseLLMAdaper):
 class GuanacoAdapter(BaseLLMAdaper):
    """TODO Support guanaco"""
    pass
 class CodeGenAdapter(BaseLLMAdaper):
    pass
@@ -127,9 +129,11 @@ class GPT4AllAdapter(BaseLLMAdaper):
        # TODO
        pass
 class ProxyllmAdapter(BaseLLMAdaper):
    """The model adapter for local proxy"""
    def match(self, model_path: str):
        return "proxyllm" in model_path
--- a/pilot/model/loader.py
+++ b/pilot/model/loader.py
@@ -109,8 +109,10 @@ class ModelLoader(metaclass=Singleton):
                compress_module(model, self.device)
        if (
-            self.device == "cuda" and num_gpus == 1 and not cpu_offloading
+            (self.device == "cuda" and num_gpus == 1 and not cpu_offloading)
-        ) or self.device == "mps" and tokenizer:
+            or self.device == "mps"
+            and tokenizer
+        ):
            model.to(self.device)
        if debug:
--- a/pilot/model/proxy_llm.py
+++ b/pilot/model/proxy_llm.py
@@ -8,10 +8,8 @@ from pilot.conversation import ROLE_ASSISTANT, ROLE_USER
 CFG = Config()
-def proxyllm_generate_stream(
-    model, tokenizer, params, device, context_len=2048
-):
+def proxyllm_generate_stream(model, tokenizer, params, device, context_len=2048):
    history = []
    prompt = params["prompt"]
@@ -19,7 +17,7 @@ def proxyllm_generate_stream(
    headers = {
        "Authorization": "Bearer " + CFG.proxy_api_key,
-        "Token": CFG.proxy_api_key 
+        "Token": CFG.proxy_api_key,
    }
    messages = prompt.split(stop)
@@ -30,14 +28,15 @@ def proxyllm_generate_stream(
            {"role": "user", "content": messages[i].split(ROLE_USER + ":")[1]},
        )
        history.append(
-            {"role": "system", "content": messages[i + 1].split(ROLE_ASSISTANT + ":")[1]}
+            {
+                "role": "system",
+                "content": messages[i + 1].split(ROLE_ASSISTANT + ":")[1],
+            }
        )
    # Add user query
    query = messages[-2].split(ROLE_USER + ":")[1]
-    history.append(
+    history.append({"role": "user", "content": query})
-        {"role": "user", "content": query}
-    )
    payloads = {
        "model": "gpt-3.5-turbo",  # just for test, remove this later
        "messages": history,
@@ -47,14 +46,16 @@ def proxyllm_generate_stream(
    print(payloads)
    print(headers)
-    res = requests.post(CFG.proxy_server_url, headers=headers, json=payloads, stream=True)
+    res = requests.post(
+        CFG.proxy_server_url, headers=headers, json=payloads, stream=True
+    )
    text = ""
    print("====================================res================")
    print(res)
    for line in res.iter_lines():
        if line:
-            decoded_line = line.decode('utf-8')
+            decoded_line = line.decode("utf-8")
            json_line = json.loads(decoded_line)
            print(json_line)
            text += json_line["choices"][0]["message"]["content"]
--- a/pilot/server/chat_adapter.py
+++ b/pilot/server/chat_adapter.py
@@ -101,6 +101,7 @@ class ProxyllmChatAdapter(BaseChatAdpter):
    def get_generate_stream_func(self):
        from pilot.model.proxy_llm import proxyllm_generate_stream
        return proxyllm_generate_stream