init model and tokenizer

This commit is contained in:
csunny 2023-04-28 22:18:08 +08:00
parent c72ae1a87f
commit 0861a09a00
6 changed files with 15 additions and 4 deletions

3
pilot/__init__.py Normal file
View File

@@ -0,0 +1,3 @@
#!/usr/bin/env python3
# -*- coding: utf-8 -*-
# Package-level version string for `pilot` (initial release).
__version__ = "0.0.1"

2
pilot/model/__init__.py Normal file
View File

@@ -0,0 +1,2 @@
# Wildcard re-export of the loader API at the `pilot.model` package level.
# NOTE(review): this uses the bare top-level `model` package path, while the
# other hunks in this commit rewrite such imports to the `pilot.`-prefixed
# absolute form — this line was likely missed and should probably be
# `from pilot.model.loader import *`; verify against the package layout.
from model.loader import *

View File

@@ -2,7 +2,7 @@
# -*- coding: utf-8 -*-
import torch
from utils import get_gpu_memory
from pilot.utils import get_gpu_memory
from fastchat.serve.inference import compress_module
from transformers import (
AutoTokenizer,

0
pilot/server/__init__.py Normal file
View File

View File

@@ -1,9 +1,15 @@
#!/usr/bin/env python3
#-*- coding: utf-8 -*-
# NOTE(review): this span is a rendered diff hunk whose +/- markers and
# indentation were stripped, so removed (old) and added (new) lines appear
# interleaved below; it is a record of the commit, not runnable code.
# Removed line (old bare `model.` import):
from model.loader import ModerLoader
# Added replacement using the `pilot.`-prefixed absolute path.
# `ModerLoader` looks like a typo for `ModelLoader` — confirm against
# pilot/model/loader.py before relying on the name.
from pilot.model.loader import ModerLoader
from fastchat.serve.inference import generate_stream
# Removed line (old bare `configs.` import):
from configs.model_config import *
# Added replacement with the `pilot.` prefix.
from pilot.configs.model_config import *
if __name__ == "__main__":
# Removed line: the old placeholder body of the main guard.
pass
# Added lines: load the configured LLM in 8-bit and print model/tokenizer.
# `llm_model_config` and `LLM_MODEL` presumably come from the wildcard
# model_config import above — verify.
model_path = llm_model_config[LLM_MODEL]
ml = ModerLoader(model_path)
model, tokenizer = ml.loader(load_8bit=True)
print(model)
print(tokenizer)