community[patch]: callback before yield for _stream/_astream (#17907)

- Description: Invoke the `on_llm_new_token` callback before yielding each chunk in `_stream`/`_astream` for some chat models, so that all chat models behave consistently. - Issue: N/A - Dependencies: N/A
2025-09-24 03:52:10 +00:00 · 2024-02-23 08:15:21 +08:00
parent 15e42f1799
commit 9678797625
22 changed files with 66 additions and 55 deletions
--- a/libs/community/langchain_community/chat_models/ollama.py
+++ b/libs/community/langchain_community/chat_models/ollama.py
@@ -318,6 +318,7 @@ class ChatOllama(BaseChatModel, _OllamaCommon):
                    if run_manager:
                        run_manager.on_llm_new_token(
                            chunk.text,
+                            chunk=chunk,
                            verbose=self.verbose,
                        )
                    yield chunk
@@ -337,6 +338,7 @@ class ChatOllama(BaseChatModel, _OllamaCommon):
                if run_manager:
                    await run_manager.on_llm_new_token(
                        chunk.text,
+                        chunk=chunk,
                        verbose=self.verbose,
                    )
                yield chunk
@@ -356,6 +358,7 @@ class ChatOllama(BaseChatModel, _OllamaCommon):
                if run_manager:
                    run_manager.on_llm_new_token(
                        chunk.text,
+                        chunk=chunk,
                        verbose=self.verbose,
                    )
                yield chunk