Backend prompt dedup (#822)

* Deduplicated prompt() function code
2025-09-13 14:29:19 +00:00 · 2023-06-04 08:59:24 -04:00
parent 945297d837
commit bbe195ee02
10 changed files with 286 additions and 457 deletions
--- a/gpt4all-chat/chatgpt.h
+++ b/gpt4all-chat/chatgpt.h
@@ -24,7 +24,7 @@ public:
        std::function<bool(int32_t, const std::string&)> responseCallback,
        std::function<bool(bool)> recalculateCallback,
        PromptContext &ctx) override;
-    bool evalTokens(PromptContext &ctx, const std::vector<int32_t> &tokens) override { return true; }
+
    void setThreadCount(int32_t n_threads) override;
    int32_t threadCount() const override;

@@ -34,6 +34,17 @@ public:
    QList<QString> context() const { return m_context; }
    void setContext(const QList<QString> &context) { m_context = context; }

+protected:
+    // We have to implement these as they are pure virtual in base class, but we don't actually use
+    // them as they are only called from the default implementation of 'prompt' which we override and
+    // completely replace
+    std::vector<Token> tokenize(const std::string&) const override { return std::vector<Token>(); }
+    std::string_view tokenToString(Token) const override { return std::string_view(); }
+    Token sampleToken(PromptContext &ctx) const override { return -1; }
+    bool evalTokens(PromptContext &/*ctx*/, const std::vector<int32_t>& /*tokens*/) const override { return false; }
+    int32_t contextLength() const override { return -1; }
+    const std::vector<Token>& endTokens() const override { static const std::vector<Token> fres; return fres; }
+
 private Q_SLOTS:
    void handleFinished();
    void handleReadyRead();