mirror of https://github.com/csunny/DB-GPT.git
synced 2025-08-05 02:20:08 +00:00
commit 562d5a98cc
@@ -9,6 +9,7 @@ from typing import Optional
 from pilot.model.compression import compress_module
 from pilot.model.adapter import get_llm_model_adapter
 from pilot.utils import get_gpu_memory
+from pilot.configs.model_config import DEVICE
 from pilot.model.llm.monkey_patch import replace_llama_attn_with_non_inplace_operations

 def raise_warning_for_incompatible_cpu_offloading_configuration(
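The added import pulls the device string from a central config module rather than having each component probe the hardware itself. The diff does not show the contents of pilot/configs/model_config.py, so the following is a minimal sketch of what that module presumably provides, under the assumption that it mirrors the device check being removed below:

# pilot/configs/model_config.py -- sketch only; not part of this diff
import torch

# Assumed definition: one project-wide device string so every component
# resolves "cuda" vs. "cpu" the same way.
DEVICE = "cuda" if torch.cuda.is_available() else "cpu"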
@@ -50,7 +51,7 @@ class ModelLoader(metaclass=Singleton):
     def __init__(self,
                  model_path) -> None:

-        self.device = "cuda" if torch.cuda.is_available() else "cpu"
+        self.device = DEVICE
         self.model_path = model_path
         self.kwargs = {
             "torch_dtype": torch.float16,
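Taken together, the two hunks make the config module the single source of truth for device selection: ModelLoader no longer re-derives "cuda" vs. "cpu" in its constructor. A hedged sketch of the resulting constructor (surrounding class body abridged; the real class uses the repo's Singleton metaclass, which this diff does not show):

# Sketch of ModelLoader.__init__ after this change; context abridged.
import torch
from pilot.configs.model_config import DEVICE

class ModelLoader:  # real class: ModelLoader(metaclass=Singleton)
    def __init__(self, model_path) -> None:
        # Device selection is delegated to the shared config constant.
        self.device = DEVICE
        self.model_path = model_path
        self.kwargs = {
            "torch_dtype": torch.float16,
        }

Assuming DEVICE is defined as in the earlier sketch, behavior on CUDA and CPU machines is unchanged; the benefit is that any future device override (or new backend) only needs to be made in one place.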