feat(core): zero-out token costs for cache hits (#32437)

2025-09-24 12:01:54 +00:00 · 2025-08-07 09:49:34 -03:00
parent bc4251b9e0
commit 6e108c1cb4
2 changed files with 30 additions and 0 deletions
--- a/libs/core/langchain_core/language_models/chat_models.py
+++ b/libs/core/langchain_core/language_models/chat_models.py
@@ -666,6 +666,16 @@ class BaseChatModel(BaseLanguageModel[BaseMessage], ABC):
                converted_generations.append(chat_gen)
            else:
                # Already a ChatGeneration or other expected type
+                if hasattr(gen, "message") and isinstance(gen.message, AIMessage):
+                    # We zero out cost on cache hits
+                    gen.message = gen.message.model_copy(
+                        update={
+                            "usage_metadata": {
+                                **(gen.message.usage_metadata or {}),
+                                "total_cost": 0,
+                            }
+                        }
+                    )
                converted_generations.append(gen)
        return converted_generations