feat(model): Support gemma-2 model (#1675)

This commit is contained in:
Fangyin Cheng
2024-06-28 13:33:57 +08:00
committed by GitHub
parent cd2163e444
commit 374b6ad151
8 changed files with 108 additions and 8 deletions

View File

@@ -116,7 +116,9 @@ class DefaultModelWorker(ModelWorker):
self.model, self.tokenizer = self.ml.loader_with_params(
model_params, self.llm_adapter
)
-model_max_length = _parse_model_max_length(self.model, self.tokenizer)
+model_max_length = self.llm_adapter.parse_max_length(
+self.model, self.tokenizer
+)
if model_max_length:
logger.info(
f"Parse model max length {model_max_length} from model {self.model_name}."