Erase the correct number of logits when regenerating, which is not the same as the number of tokens.
This commit is contained in:
Adam Treat
2023-04-15 09:19:06 -04:00
parent b1bb9866ab
commit 078b755ab8
2 changed files with 6 additions and 1 deletions

1
llm.h
View File

@@ -42,6 +42,7 @@ private:
LLModel *m_llmodel;
std::string m_response;
quint32 m_responseTokens;
quint32 m_responseLogits;
QString m_modelName;
QThread m_llmThread;
std::atomic<bool> m_stopGenerating;