backend: dedupe tokenizing code in mpt/gptj

2025-09-06 11:00:48 +00:00 · 2023-05-15 17:42:20 -07:00
parent 6182026c70
commit d14936bfd6
4 changed files with 6 additions and 102 deletions
--- a/gpt4all-backend/gptj.cpp
+++ b/gpt4all-backend/gptj.cpp
@@ -983,7 +983,7 @@ void GPTJ::prompt(const std::string &prompt,
        gpt_vocab::id id = 0;
        {
            const int64_t t_start_sample_us = ggml_time_us();
-            id = gpt_sample_top_k_top_p(d_ptr->vocab,
+            id = gpt_sample_top_k_top_p(d_ptr->vocab, n_vocab,
                promptCtx.tokens.data() + promptCtx.n_ctx - promptCtx.n_ctx,
                promptCtx.n_ctx,
                promptCtx.logits,