Erase the correct number of logits when regenerating, which is not the same

as the number of tokens.
2025-09-29 00:36:01 +00:00 · 2023-04-15 09:19:06 -04:00
parent b1bb9866ab
commit 078b755ab8
2 changed files with 6 additions and 1 deletions
--- a/llm.h
+++ b/llm.h
@@ -42,6 +42,7 @@ private:
    LLModel *m_llmodel;
    std::string m_response;
    quint32 m_responseTokens;
+    quint32 m_responseLogits;
    QString m_modelName;
    QThread m_llmThread;
    std::atomic<bool> m_stopGenerating;