diff --git a/pilot/configs/model_config.py b/pilot/configs/model_config.py index 16deee50a..803d0fae9 100644 --- a/pilot/configs/model_config.py +++ b/pilot/configs/model_config.py @@ -78,8 +78,15 @@ LLM_MODEL_CONFIG = { "internlm-7b": os.path.join(MODEL_PATH, "internlm-chat-7b"), "internlm-7b-8k": os.path.join(MODEL_PATH, "internlm-chat-7b-8k"), "internlm-20b": os.path.join(MODEL_PATH, "internlm-chat-20b"), + "codellama-7b": os.path.join(MODEL_PATH, "CodeLlama-7b-Instruct-hf"), + "codellama-7b-sql-sft": os.path.join(MODEL_PATH, "codellama-7b-sql-sft"), + "codellama-13b": os.path.join(MODEL_PATH, "CodeLlama-13b-Instruct-hf"), "codellama-13b-sql-sft": os.path.join(MODEL_PATH, "codellama-13b-sql-sft"), + + + + # For test now "opt-125m": os.path.join(MODEL_PATH, "opt-125m"), } diff --git a/pilot/model/adapter.py b/pilot/model/adapter.py index 02fbe8aa9..cb9885d2a 100644 --- a/pilot/model/adapter.py +++ b/pilot/model/adapter.py @@ -323,7 +323,7 @@ class CodeLlamaAdapter(BaseLLMAdaper): """The model adapter for codellama """ def match(self, model_path: str): - return "codelama" in model_path.lower() + return "codellama" in model_path.lower() def loader(self, model_path: str, from_pretrained_kwargs: dict): model, tokenizer = super().loader(model_path, from_pretrained_kwargs) diff --git a/pilot/model/model_adapter.py b/pilot/model/model_adapter.py index 112fb468a..cadb1cebd 100644 --- a/pilot/model/model_adapter.py +++ b/pilot/model/model_adapter.py @@ -45,7 +45,10 @@ _OLD_MODELS = [ "llama-cpp", "proxyllm", "gptj-6b", - "codellama-13b-sql-sft" + "codellama-13b-sql-sft", + "codellama-7b", + "codellama-7b-sql-sft", + "codellama-13b" ]