Fix model_config import path; disable explicit CUDA move in loader; drop compress_module import from sqlgpt

2025-07-26 13:27:46 +00:00 · 2023-04-29 21:50:47 +08:00 · 2023-04-29 21:50:47 +08:00 · acf9dbbd82
commit acf9dbbd82
parent 0767537606
3 changed files with 4 additions and 5 deletions
--- a/pilot/model/loader.py
+++ b/pilot/model/loader.py
@@ -29,8 +29,8 @@ class ModerLoader:
        if debug:
            print(model)
-        if self.device == "cuda":
+        # if self.device == "cuda":
-            model.to(self.device)
+        #     model.to(self.device)
        return model, tokenizer
--- a/pilot/server/chatbot.py
+++ b/pilot/server/chatbot.py
@@ -6,7 +6,7 @@ import json
 import time
 from urllib.parse import urljoin
 import gradio as gr
-from configs.model_config import *
+from pilot.configs.model_config import *
 vicuna_base_uri = "http://192.168.31.114:21002/"
 vicuna_stream_path = "worker_generate_stream"
 vicuna_status_path = "worker_get_status"
--- a/pilot/server/sqlgpt.py
+++ b/pilot/server/sqlgpt.py
@@ -5,7 +5,7 @@
 import json
 import torch
 import gradio as gr
-from fastchat.serve.inference import generate_stream, compress_module
+from fastchat.serve.inference import generate_stream 
 from transformers import AutoTokenizer, AutoModelForCausalLM
 device = "cuda" if torch.cuda.is_available() else "cpu"
@@ -20,7 +20,6 @@ model = AutoModelForCausalLM.from_pretrained(
 )
 def generate(prompt):    
-    compress_module(model, device) 
    model.to(device)
    print(model, tokenizer)
    params = {