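Fix problem: stop importing and calling fastchat's compress_module in pilot/server/sqlgpt.py (among other changes)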

2025-10-27 21:00:36 +00:00 · 2023-04-29 21:50:47 +08:00
parent 0767537606
commit acf9dbbd82
3 changed files with 4 additions and 5 deletions
--- a/pilot/server/sqlgpt.py
+++ b/pilot/server/sqlgpt.py
@@ -5,7 +5,7 @@
 import json
 import torch
 import gradio as gr
-from fastchat.serve.inference import generate_stream, compress_module
+from fastchat.serve.inference import generate_stream 

 from transformers import AutoTokenizer, AutoModelForCausalLM
 device = "cuda" if torch.cuda.is_available() else "cpu"
@@ -20,7 +20,6 @@ model = AutoModelForCausalLM.from_pretrained(
 )

 def generate(prompt):    
-    compress_module(model, device) 
    model.to(device)
    print(model, tokenizer)
    params = {