community[patch]: callback before yield for _stream/_astream (#17907)

- Description: callback on_llm_new_token before yield chunk for _stream/_astream for some chat models, make all chat models in a consistent behaviour. - Issue: N/A - Dependencies: N/A
2025-09-24 12:01:54 +00:00 · 2024-02-23 08:15:21 +08:00
parent 15e42f1799
commit 9678797625
22 changed files with 66 additions and 55 deletions
--- a/libs/community/langchain_community/chat_models/anthropic.py
+++ b/libs/community/langchain_community/chat_models/anthropic.py
@@ -143,9 +143,9 @@ class ChatAnthropic(BaseChatModel, _AnthropicCommon):
        for data in stream_resp:
            delta = data.completion
            chunk = ChatGenerationChunk(message=AIMessageChunk(content=delta))
-            yield chunk
            if run_manager:
                run_manager.on_llm_new_token(delta, chunk=chunk)
+            yield chunk

    async def _astream(
        self,
@@ -163,9 +163,9 @@ class ChatAnthropic(BaseChatModel, _AnthropicCommon):
        async for data in stream_resp:
            delta = data.completion
            chunk = ChatGenerationChunk(message=AIMessageChunk(content=delta))
-            yield chunk
            if run_manager:
                await run_manager.on_llm_new_token(delta, chunk=chunk)
+            yield chunk

    def _generate(
        self,