diff --git a/docs/docs/versions/migrating_chains/conversation_chain.ipynb b/docs/docs/versions/migrating_chains/conversation_chain.ipynb
index e984fc139ce..ba56524614a 100644
--- a/docs/docs/versions/migrating_chains/conversation_chain.ipynb
+++ b/docs/docs/versions/migrating_chains/conversation_chain.ipynb
@@ -54,12 +54,9 @@
"id": "00df631d-5121-4918-94aa-b88acce9b769",
"metadata": {},
"source": [
- "import { ColumnContainer, Column } from \"@theme/Columns\";\n",
+ "## Legacy\n",
"\n",
- "\n",
- "\n",
- "\n",
- "#### Legacy\n"
+ ""
]
},
{
@@ -111,12 +108,11 @@
"id": "f8e36b0e-c7dc-4130-a51b-189d4b756c7f",
"metadata": {},
"source": [
- " \n",
+ "\n",
"\n",
- "\n",
+ "## LCEL\n",
"\n",
- "#### LCEL\n",
- "\n"
+ ""
]
},
{
@@ -174,10 +170,6 @@
"id": "6b386ce6-895e-442c-88f3-7bec0ab9f401",
"metadata": {},
"source": [
- "\n",
- " \n",
- "\n",
- "\n",
"The above example uses the same `history` for all sessions. The example below shows how to use a different chat history for each session."
]
},
@@ -230,6 +222,8 @@
"id": "b2717810",
"metadata": {},
"source": [
+ "\n",
+ "\n",
"## Next steps\n",
"\n",
"See [this tutorial](/docs/tutorials/chatbot) for a more end-to-end guide on building with [`RunnableWithMessageHistory`](https://api.python.langchain.com/en/latest/runnables/langchain_core.runnables.history.RunnableWithMessageHistory.html).\n",
diff --git a/docs/docs/versions/migrating_chains/conversation_retrieval_chain.ipynb b/docs/docs/versions/migrating_chains/conversation_retrieval_chain.ipynb
index 91a331232ee..70de0606e78 100644
--- a/docs/docs/versions/migrating_chains/conversation_retrieval_chain.ipynb
+++ b/docs/docs/versions/migrating_chains/conversation_retrieval_chain.ipynb
@@ -83,13 +83,9 @@
"id": "8bc06416",
"metadata": {},
"source": [
- "import { ColumnContainer, Column } from \"@theme/Columns\";\n",
+ "## Legacy\n",
"\n",
- "\n",
- "\n",
- "\n",
- "\n",
- "#### Legacy"
+ ""
]
},
{
@@ -165,12 +161,11 @@
"id": "43a8a23c",
"metadata": {},
"source": [
- " \n",
+ "\n",
"\n",
- "\n",
+ "## LCEL\n",
"\n",
- "#### LCEL\n",
- "\n"
+ ""
]
},
{
@@ -253,9 +248,7 @@
"id": "b2717810",
"metadata": {},
"source": [
- " \n",
- "\n",
- "\n",
+ "\n",
"\n",
"## Next steps\n",
"\n",
@@ -263,6 +256,14 @@
"\n",
"Next, check out the [LCEL conceptual docs](/docs/concepts/#langchain-expression-language-lcel) for more background information."
]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": null,
+ "id": "7bfc38bd-0ff8-40ee-83a3-9d7553364fd7",
+ "metadata": {},
+ "outputs": [],
+ "source": []
}
],
"metadata": {
diff --git a/docs/docs/versions/migrating_chains/index.mdx b/docs/docs/versions/migrating_chains/index.mdx
index 6d3aabe178b..4f809972e0a 100644
--- a/docs/docs/versions/migrating_chains/index.mdx
+++ b/docs/docs/versions/migrating_chains/index.mdx
@@ -2,33 +2,48 @@
sidebar_position: 1
---
-# How to migrate chains to LCEL
+# How to migrate from v0.0 chains
:::info Prerequisites
This guide assumes familiarity with the following concepts:
- [LangChain Expression Language](/docs/concepts#langchain-expression-language-lcel)
-
+- [LangGraph](https://langchain-ai.github.io/langgraph/)
:::
-LCEL is designed to streamline the process of building useful apps with LLMs and combining related components. It does this by providing:
+LangChain maintains a number of legacy abstractions. Many of these can be reimplemented via short combinations of LCEL and LangGraph primitives.
+
+### LCEL
+[LCEL](/docs/concepts/#langchain-expression-language-lcel) is designed to streamline the process of building useful apps with LLMs and combining related components. It does this by providing:
1. **A unified interface**: Every LCEL object implements the `Runnable` interface, which defines a common set of invocation methods (`invoke`, `batch`, `stream`, `ainvoke`, ...). This makes it possible to also automatically and consistently support useful operations like streaming of intermediate steps and batching, since every chain composed of LCEL objects is itself an LCEL object.
2. **Composition primitives**: LCEL provides a number of primitives that make it easy to compose chains, parallelize components, add fallbacks, dynamically configure chain internals, and more.
-LangChain maintains a number of legacy abstractions. Many of these can be reimplemented via short combinations of LCEL primitives. Doing so confers some general advantages:
+### LangGraph
+[LangGraph](https://langchain-ai.github.io/langgraph/), built on top of LCEL, allows for performant orchestrations of application components while maintaining concise and readable code. It includes built-in persistence, support for cycles, and prioritizes controllability.
+If LCEL grows unwieldy for larger or more complex chains, they may benefit from a LangGraph implementation.
+
+### Advantages
+Using these frameworks for existing v0.0 chains confers some advantages:
- The resulting chains typically implement the full `Runnable` interface, including streaming and asynchronous support where appropriate;
- The chains may be more easily extended or modified;
- The parameters of the chain are typically surfaced for easier customization (e.g., prompts) over previous versions, which tended to be subclasses and had opaque parameters and internals.
+- If using LangGraph, the chain supports built-in persistence, allowing for conversational experiences via a "memory" of the chat history.
+- If using LangGraph, the steps of the chain can be streamed, allowing for greater control and customizability.
-The LCEL implementations can be slightly more verbose, but there are significant benefits in transparency and customizability.
-The below pages assist with migration from various specific chains to LCEL:
+The below pages assist with migration from various specific chains to LCEL and LangGraph:
- [LLMChain](/docs/versions/migrating_chains/llm_chain)
- [ConversationChain](/docs/versions/migrating_chains/conversation_chain)
- [RetrievalQA](/docs/versions/migrating_chains/retrieval_qa)
- [ConversationalRetrievalChain](/docs/versions/migrating_chains/conversation_retrieval_chain)
+- [StuffDocumentsChain](/docs/versions/migrating_chains/stuff_docs_chain)
+- [MapReduceDocumentsChain](/docs/versions/migrating_chains/map_reduce_chain)
+- [MapRerankDocumentsChain](/docs/versions/migrating_chains/map_rerank_docs_chain)
+- [RefineDocumentsChain](/docs/versions/migrating_chains/refine_docs_chain)
+- [LLMRouterChain](/docs/versions/migrating_chains/llm_router_chain)
+- [MultiPromptChain](/docs/versions/migrating_chains/multi_prompt_chain)
-Check out the [LCEL conceptual docs](/docs/concepts/#langchain-expression-language-lcel) for more background information.
\ No newline at end of file
+Check out the [LCEL conceptual docs](/docs/concepts/#langchain-expression-language-lcel) and [LangGraph docs](https://langchain-ai.github.io/langgraph/) for more background information.
\ No newline at end of file
diff --git a/docs/docs/versions/migrating_chains/llm_chain.ipynb b/docs/docs/versions/migrating_chains/llm_chain.ipynb
index 48de1ac9b73..c288cadf0d1 100644
--- a/docs/docs/versions/migrating_chains/llm_chain.ipynb
+++ b/docs/docs/versions/migrating_chains/llm_chain.ipynb
@@ -52,13 +52,9 @@
"id": "e3621b62-a037-42b8-8faa-59575608bb8b",
"metadata": {},
"source": [
- "import { ColumnContainer, Column } from \"@theme/Columns\";\n",
+ "## Legacy\n",
"\n",
- "\n",
- "\n",
- "\n",
- "\n",
- "#### Legacy\n"
+ ""
]
},
{
@@ -98,13 +94,11 @@
"id": "cdc3b527-c09e-4c77-9711-c3cc4506cd95",
"metadata": {},
"source": [
+ " \n",
"\n",
- "\n",
+ "## LCEL\n",
"\n",
- "\n",
- "\n",
- "#### LCEL\n",
- "\n"
+ ""
]
},
{
@@ -143,10 +137,6 @@
"id": "3c0b0513-77b8-4371-a20e-3e487cec7e7f",
"metadata": {},
"source": [
- "\n",
- " \n",
- "\n",
- "\n",
"Note that `LLMChain` by default returns a `dict` containing both the input and the output. If this behavior is desired, we can replicate it using another LCEL primitive, [`RunnablePassthrough`](https://api.python.langchain.com/en/latest/runnables/langchain_core.runnables.passthrough.RunnablePassthrough.html):"
]
},
@@ -181,6 +171,8 @@
"id": "b2717810",
"metadata": {},
"source": [
+ "\n",
+ "\n",
"## Next steps\n",
"\n",
"See [this tutorial](/docs/tutorials/llm_chain) for more detail on building with prompt templates, LLMs, and output parsers.\n",
diff --git a/docs/docs/versions/migrating_chains/llm_router_chain.ipynb b/docs/docs/versions/migrating_chains/llm_router_chain.ipynb
new file mode 100644
index 00000000000..64561caa965
--- /dev/null
+++ b/docs/docs/versions/migrating_chains/llm_router_chain.ipynb
@@ -0,0 +1,283 @@
+{
+ "cells": [
+ {
+ "cell_type": "markdown",
+ "id": "575befea-4d98-4941-8e55-1581b169a674",
+ "metadata": {},
+ "source": [
+ "---\n",
+ "title: Migrating from LLMRouterChain\n",
+ "---"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "14625d35-efca-41cf-b203-be9f4c375700",
+ "metadata": {},
+ "source": [
+ "The [`LLMRouterChain`](https://api.python.langchain.com/en/latest/chains/langchain.chains.router.llm_router.LLMRouterChain.html) routed an input query to one of multiple destinations; that is, given an input query, it used an LLM to select from a list of destination chains, and passed its inputs to the selected chain.\n",
+ "\n",
+ "`LLMRouterChain` does not support common [chat model](/docs/concepts/#chat-models) features, such as message roles and [tool calling](/docs/concepts/#functiontool-calling). Under the hood, `LLMRouterChain` routes a query by instructing the LLM to generate JSON-formatted text, and parsing out the intended destination.\n",
+ "\n",
+ "Consider an example from a [MultiPromptChain](/docs/versions/migrating_chains/multi_prompt_chain), which uses `LLMRouterChain`. Below is an (example) default prompt:"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 1,
+ "id": "364814a5-d15c-41bb-bf3f-581df51a4721",
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "Given a raw text input to a language model select the model prompt best suited for the input. You will be given the names of the available prompts and a description of what the prompt is best suited for. You may also revise the original input if you think that revising it will ultimately lead to a better response from the language model.\n",
+ "\n",
+ "<< FORMATTING >>\n",
+ "Return a markdown code snippet with a JSON object formatted to look like:\n",
+ "'''json\n",
+ "{{\n",
+ " \"destination\": string \\ name of the prompt to use or \"DEFAULT\"\n",
+ " \"next_inputs\": string \\ a potentially modified version of the original input\n",
+ "}}\n",
+ "'''\n",
+ "\n",
+ "REMEMBER: \"destination\" MUST be one of the candidate prompt names specified below OR it can be \"DEFAULT\" if the input is not well suited for any of the candidate prompts.\n",
+ "REMEMBER: \"next_inputs\" can just be the original input if you don't think any modifications are needed.\n",
+ "\n",
+ "<< CANDIDATE PROMPTS >>\n",
+ "\n",
+ "animals: prompt for animal expert\n",
+ "vegetables: prompt for a vegetable expert\n",
+ "\n",
+ "\n",
+ "<< INPUT >>\n",
+ "{input}\n",
+ "\n",
+ "<< OUTPUT (must include '''json at the start of the response) >>\n",
+ "<< OUTPUT (must end with ''') >>\n",
+ "\n"
+ ]
+ }
+ ],
+ "source": [
+ "from langchain.chains.router.multi_prompt import MULTI_PROMPT_ROUTER_TEMPLATE\n",
+ "\n",
+ "destinations = \"\"\"\n",
+ "animals: prompt for animal expert\n",
+ "vegetables: prompt for a vegetable expert\n",
+ "\"\"\"\n",
+ "\n",
+ "router_template = MULTI_PROMPT_ROUTER_TEMPLATE.format(destinations=destinations)\n",
+ "\n",
+ "print(router_template.replace(\"`\", \"'\")) # for rendering purposes"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "934937d1-fc0a-4d3f-b297-29f96e6a8f5e",
+ "metadata": {},
+ "source": [
+ "Most of the behavior is determined via a single natural language prompt. Chat models that support [tool calling](/docs/how_to/tool_calling/) features confer a number of advantages for this task:\n",
+ "\n",
+ "- Supports chat prompt templates, including messages with `system` and other roles;\n",
+ "- Tool-calling models are fine-tuned to generate structured output;\n",
+ "- Support for runnable methods like streaming and async operations.\n",
+ "\n",
+ "Now let's look at `LLMRouterChain` side-by-side with an LCEL implementation that uses tool-calling. Note that for this guide we will need `langchain-openai >= 0.1.20`:"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": null,
+ "id": "ed12b22b-5452-4776-aee3-b67d9f965082",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "%pip install -qU langchain-core langchain-openai"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": null,
+ "id": "b0edbba1-a497-49ef-ade7-4fe7967360eb",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "import os\n",
+ "from getpass import getpass\n",
+ "\n",
+ "os.environ[\"OPENAI_API_KEY\"] = getpass()"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "5d4dc41c-3fdc-4093-ba5e-31a9ebb54e13",
+ "metadata": {},
+ "source": [
+ "## Legacy\n",
+ "\n",
+ ""
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 2,
+ "id": "c58c9269-5a1d-4234-88b5-7168944618bf",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "from langchain.chains.router.llm_router import LLMRouterChain, RouterOutputParser\n",
+ "from langchain_core.prompts import PromptTemplate\n",
+ "from langchain_openai import ChatOpenAI\n",
+ "\n",
+ "llm = ChatOpenAI(model=\"gpt-4o-mini\")\n",
+ "\n",
+ "router_prompt = PromptTemplate(\n",
+ " # Note: here we use the prompt template from above. Generally this would need\n",
+ " # to be customized.\n",
+ " template=router_template,\n",
+ " input_variables=[\"input\"],\n",
+ " output_parser=RouterOutputParser(),\n",
+ ")\n",
+ "\n",
+ "chain = LLMRouterChain.from_llm(llm, router_prompt)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 3,
+ "id": "a22ebdca-5f53-459e-9cff-a97b2354ffe0",
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "vegetables\n"
+ ]
+ }
+ ],
+ "source": [
+ "result = chain.invoke({\"input\": \"What color are carrots?\"})\n",
+ "\n",
+ "print(result[\"destination\"])"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "6fd48120-056f-4c58-a04f-da5198c23068",
+ "metadata": {},
+ "source": [
+ " \n",
+ "\n",
+ "## LCEL\n",
+ "\n",
+ ""
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 4,
+ "id": "5bbebac2-df19-4f59-8a69-f61cd7286e59",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "from operator import itemgetter\n",
+ "from typing import Literal\n",
+ "\n",
+ "from langchain_core.prompts import ChatPromptTemplate\n",
+ "from langchain_core.runnables import RunnablePassthrough\n",
+ "from langchain_openai import ChatOpenAI\n",
+ "from typing_extensions import TypedDict\n",
+ "\n",
+ "llm = ChatOpenAI(model=\"gpt-4o-mini\")\n",
+ "\n",
+ "route_system = \"Route the user's query to either the animal or vegetable expert.\"\n",
+ "route_prompt = ChatPromptTemplate.from_messages(\n",
+ " [\n",
+ " (\"system\", route_system),\n",
+ " (\"human\", \"{input}\"),\n",
+ " ]\n",
+ ")\n",
+ "\n",
+ "\n",
+ "# Define schema for output:\n",
+ "class RouteQuery(TypedDict):\n",
+ " \"\"\"Route query to destination expert.\"\"\"\n",
+ "\n",
+ " destination: Literal[\"animal\", \"vegetable\"]\n",
+ "\n",
+ "\n",
+ "# Instead of writing formatting instructions into the prompt, we\n",
+ "# leverage .with_structured_output to coerce the output into a simple\n",
+ "# schema.\n",
+ "chain = route_prompt | llm.with_structured_output(RouteQuery)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 5,
+ "id": "88012e10-8def-44fa-833f-989935824182",
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "vegetable\n"
+ ]
+ }
+ ],
+ "source": [
+ "result = chain.invoke({\"input\": \"What color are carrots?\"})\n",
+ "\n",
+ "print(result[\"destination\"])"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "baf7ba9e-65b4-48af-8a39-453c01a7b7cb",
+ "metadata": {},
+ "source": [
+ " \n",
+ "\n",
+ "## Next steps\n",
+ "\n",
+ "See [this tutorial](/docs/tutorials/llm_chain) for more detail on building with prompt templates, LLMs, and output parsers.\n",
+ "\n",
+ "Check out the [LCEL conceptual docs](/docs/concepts/#langchain-expression-language-lcel) for more background information."
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": null,
+ "id": "353e4bab-3b8a-4e89-89e2-200a8d8eb8dd",
+ "metadata": {},
+ "outputs": [],
+ "source": []
+ }
+ ],
+ "metadata": {
+ "kernelspec": {
+ "display_name": "Python 3 (ipykernel)",
+ "language": "python",
+ "name": "python3"
+ },
+ "language_info": {
+ "codemirror_mode": {
+ "name": "ipython",
+ "version": 3
+ },
+ "file_extension": ".py",
+ "mimetype": "text/x-python",
+ "name": "python",
+ "nbconvert_exporter": "python",
+ "pygments_lexer": "ipython3",
+ "version": "3.10.4"
+ }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}
diff --git a/docs/docs/versions/migrating_chains/map_reduce_chain.ipynb b/docs/docs/versions/migrating_chains/map_reduce_chain.ipynb
new file mode 100644
index 00000000000..0520e67f8d7
--- /dev/null
+++ b/docs/docs/versions/migrating_chains/map_reduce_chain.ipynb
@@ -0,0 +1,706 @@
+{
+ "cells": [
+ {
+ "cell_type": "markdown",
+ "id": "3270b34b-8958-425c-886a-ea4b9e26b475",
+ "metadata": {},
+ "source": [
+ "---\n",
+ "title: Migrating from MapReduceDocumentsChain\n",
+ "---"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "2c7bdc91-9b89-4e59-bc27-89508b024635",
+ "metadata": {},
+ "source": [
+ "[MapReduceDocumentsChain](https://api.python.langchain.com/en/latest/chains/langchain.chains.combine_documents.map_reduce.MapReduceDocumentsChain.html) implements a map-reduce strategy over (potentially long) texts. The strategy is as follows:\n",
+ "\n",
+ "- Split a text into smaller documents;\n",
+ "- Map a process onto the smaller documents;\n",
+ "- Reduce or consolidate the results of the process into a final result.\n",
+ "\n",
+ "Note that the map step is typically parallelized over the input documents.\n",
+ "\n",
+ "A common process applied in this context is summarization, in which the map step summarizes individual documents, and the reduce step generates a summary of the summaries.\n",
+ "\n",
+ "In the reduce step, `MapReduceDocumentsChain` supports a recursive \"collapsing\" of the summaries: the inputs would be partitioned based on a token limit, and summaries would be generated of the partitions. This step would be repeated until the total length of the summaries was within a desired limit, allowing for the summarization of arbitrary-length text. This is particularly useful for models with smaller context windows.\n",
+ "\n",
+ "LangGraph supports [map-reduce](https://langchain-ai.github.io/langgraph/how-tos/map-reduce/) workflows, and confers a number of advantages for this problem:\n",
+ "\n",
+ "- LangGraph allows for individual steps (such as successive summarizations) to be streamed, allowing for greater control of execution;\n",
+ "- LangGraph's [checkpointing](https://langchain-ai.github.io/langgraph/how-tos/persistence/) supports error recovery, extending with human-in-the-loop workflows, and easier incorporation into conversational applications.\n",
+ "- The LangGraph implementation is easier to extend, as we will see below.\n",
+ "\n",
+ "Below we will go through both `MapReduceDocumentsChain` and a corresponding LangGraph implementation, first on a simple example for illustrative purposes, and second on a longer example text to demonstrate the recursive reduce step.\n",
+ "\n",
+ "Let's first load a chat model:\n",
+ "\n",
+ "```{=mdx}\n",
+ "import ChatModelTabs from \"@theme/ChatModelTabs\";\n",
+ "\n",
+ "\n",
+ "```"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 1,
+ "id": "0bdf886b-aeeb-407e-81b8-28bad59ad57a",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "# | output: false\n",
+ "# | echo: false\n",
+ "\n",
+ "from langchain_openai import ChatOpenAI\n",
+ "\n",
+ "llm = ChatOpenAI(model=\"gpt-3.5-turbo-0125\", temperature=0)"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "41cfb569-f7e6-48cb-a90e-45a482009971",
+ "metadata": {},
+ "source": [
+ "## Basic example (short documents)\n",
+ "\n",
+ "Let's generate some simple documents for illustrative purposes."
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 2,
+ "id": "b221a71f-982b-4c08-8597-96c890e00965",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "from langchain_core.documents import Document\n",
+ "\n",
+ "documents = [\n",
+ " Document(page_content=\"Apples are red\", metadata={\"title\": \"apple_book\"}),\n",
+ " Document(page_content=\"Blueberries are blue\", metadata={\"title\": \"blueberry_book\"}),\n",
+ " Document(page_content=\"Bananas are yelow\", metadata={\"title\": \"banana_book\"}),\n",
+ "]"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "c717514a-1b6d-4a0f-9093-ef594b9a0b17",
+ "metadata": {},
+ "source": [
+ "### Legacy\n",
+ "\n",
+ "\n",
+ " \n",
+ "Below we show an implementation with `MapReduceDocumentsChain`. We define the prompt templates for the map and reduce steps, instantiate separate chains for these steps, and finally instantiate the `MapReduceDocumentsChain`:"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 4,
+ "id": "84ee3851-b4a9-4fbe-a78f-d05168715b91",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "from langchain.chains import MapReduceDocumentsChain, ReduceDocumentsChain\n",
+ "from langchain.chains.combine_documents.stuff import StuffDocumentsChain\n",
+ "from langchain.chains.llm import LLMChain\n",
+ "from langchain_core.prompts import ChatPromptTemplate\n",
+ "from langchain_text_splitters import CharacterTextSplitter\n",
+ "\n",
+ "# Map\n",
+ "map_template = \"Write a concise summary of the following: {docs}.\"\n",
+ "map_prompt = ChatPromptTemplate([(\"human\", map_template)])\n",
+ "map_chain = LLMChain(llm=llm, prompt=map_prompt)\n",
+ "\n",
+ "\n",
+ "# Reduce\n",
+ "reduce_template = \"\"\"\n",
+ "The following is a set of summaries:\n",
+ "{docs}\n",
+ "Take these and distill it into a final, consolidated summary\n",
+ "of the main themes.\n",
+ "\"\"\"\n",
+ "reduce_prompt = ChatPromptTemplate([(\"human\", reduce_template)])\n",
+ "reduce_chain = LLMChain(llm=llm, prompt=reduce_prompt)\n",
+ "\n",
+ "\n",
+ "# Takes a list of documents, combines them into a single string, and passes this to an LLMChain\n",
+ "combine_documents_chain = StuffDocumentsChain(\n",
+ " llm_chain=reduce_chain, document_variable_name=\"docs\"\n",
+ ")\n",
+ "\n",
+ "# Combines and iteratively reduces the mapped documents\n",
+ "reduce_documents_chain = ReduceDocumentsChain(\n",
+ " # This is the final chain that is called.\n",
+ " combine_documents_chain=combine_documents_chain,\n",
+ " # If documents exceed context for `StuffDocumentsChain`\n",
+ " collapse_documents_chain=combine_documents_chain,\n",
+ " # The maximum number of tokens to group documents into.\n",
+ " token_max=1000,\n",
+ ")\n",
+ "\n",
+ "# Combining documents by mapping a chain over them, then combining results\n",
+ "map_reduce_chain = MapReduceDocumentsChain(\n",
+ " # Map chain\n",
+ " llm_chain=map_chain,\n",
+ " # Reduce chain\n",
+ " reduce_documents_chain=reduce_documents_chain,\n",
+ " # The variable name in the llm_chain to put the documents in\n",
+ " document_variable_name=\"docs\",\n",
+ " # Return the results of the map steps in the output\n",
+ " return_intermediate_steps=False,\n",
+ ")"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 5,
+ "id": "4f57ed52-08a5-49f6-ab19-1be51a853a2f",
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "Fruits come in a variety of colors, with apples being red, blueberries being blue, and bananas being yellow.\n"
+ ]
+ }
+ ],
+ "source": [
+ "result = map_reduce_chain.invoke(documents)\n",
+ "\n",
+ "print(result[\"output_text\"])"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "46d29559-5948-4ce9-b7c5-fa6729cf2485",
+ "metadata": {},
+ "source": [
+ "In the [LangSmith trace](https://smith.langchain.com/public/8d88a2c0-5d26-41f6-9176-d06549b17aa6/r) we observe four LLM calls: one summarizing each of the three input documents, and one summarizing the summaries."
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "b5399533-8662-4fad-b885-e3df3d809c44",
+ "metadata": {},
+ "source": [
+ " \n",
+ "\n",
+ "### LangGraph\n",
+ "\n",
+ "Below we show a LangGraph implementation, using the same prompt templates as above. The graph includes a node for generating summaries which is mapped across a list of input documents. This node then flows to a second node that generates the final summary.\n",
+ "\n",
+ "\n",
+ "\n",
+ "We will need to install `langgraph`:"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": null,
+ "id": "815f889b-7f19-4702-8e61-8dadcee7c729",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "pip install -qU langgraph"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 6,
+ "id": "2c710a66-2d3d-44be-b9e7-9dfee8c22a50",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "import operator\n",
+ "from typing import Annotated, List, TypedDict\n",
+ "\n",
+ "from langchain_core.output_parsers import StrOutputParser\n",
+ "from langchain_core.prompts import ChatPromptTemplate\n",
+ "from langgraph.constants import Send\n",
+ "from langgraph.graph import END, START, StateGraph\n",
+ "\n",
+ "map_template = \"Write a concise summary of the following: {context}.\"\n",
+ "\n",
+ "reduce_template = \"\"\"\n",
+ "The following is a set of summaries:\n",
+ "{docs}\n",
+ "Take these and distill it into a final, consolidated summary\n",
+ "of the main themes.\n",
+ "\"\"\"\n",
+ "\n",
+ "map_prompt = ChatPromptTemplate([(\"human\", map_template)])\n",
+ "reduce_prompt = ChatPromptTemplate([(\"human\", reduce_template)])\n",
+ "\n",
+ "map_chain = map_prompt | llm | StrOutputParser()\n",
+ "reduce_chain = reduce_prompt | llm | StrOutputParser()\n",
+ "\n",
+ "# Graph components: define the components that will make up the graph\n",
+ "\n",
+ "\n",
+ "# This will be the overall state of the main graph.\n",
+ "# It will contain the input document contents, corresponding\n",
+ "# summaries, and a final summary.\n",
+ "class OverallState(TypedDict):\n",
+ " # Notice here we use the operator.add\n",
+ " # This is because we want to combine all the summaries we generate\n",
+ " # from individual nodes back into one list - this is essentially\n",
+ " # the \"reduce\" part\n",
+ " contents: List[str]\n",
+ " summaries: Annotated[list, operator.add]\n",
+ " final_summary: str\n",
+ "\n",
+ "\n",
+ "# This will be the state of the node that we will \"map\" all\n",
+ "# documents to in order to generate summaries\n",
+ "class SummaryState(TypedDict):\n",
+ " content: str\n",
+ "\n",
+ "\n",
+ "# Here we generate a summary, given a document\n",
+ "async def generate_summary(state: SummaryState):\n",
+ " response = await map_chain.ainvoke(state[\"content\"])\n",
+ " return {\"summaries\": [response]}\n",
+ "\n",
+ "\n",
+ "# Here we define the logic to map out over the documents\n",
+ "# We will use this as an edge in the graph\n",
+ "def map_summaries(state: OverallState):\n",
+ " # We will return a list of `Send` objects\n",
+ " # Each `Send` object consists of the name of a node in the graph\n",
+ " # as well as the state to send to that node\n",
+ " return [\n",
+ " Send(\"generate_summary\", {\"content\": content}) for content in state[\"contents\"]\n",
+ " ]\n",
+ "\n",
+ "\n",
+ "# Here we will generate the final summary\n",
+ "async def generate_final_summary(state: OverallState):\n",
+ " response = await reduce_chain.ainvoke(state[\"summaries\"])\n",
+ " return {\"final_summary\": response}\n",
+ "\n",
+ "\n",
+ "# Construct the graph: here we put everything together to construct our graph\n",
+ "graph = StateGraph(OverallState)\n",
+ "graph.add_node(\"generate_summary\", generate_summary)\n",
+ "graph.add_node(\"generate_final_summary\", generate_final_summary)\n",
+ "graph.add_conditional_edges(START, map_summaries, [\"generate_summary\"])\n",
+ "graph.add_edge(\"generate_summary\", \"generate_final_summary\")\n",
+ "graph.add_edge(\"generate_final_summary\", END)\n",
+ "app = graph.compile()"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 7,
+ "id": "934cf1a5-ce6d-48ac-8151-942d14586052",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "image/jpeg": "",
+ "text/plain": [
+ ""
+ ]
+ },
+ "execution_count": 7,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "from IPython.display import Image\n",
+ "\n",
+ "Image(app.get_graph().draw_mermaid_png())"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "cc38735a-004e-41cc-944d-288334e04850",
+ "metadata": {},
+ "source": [
+ "Note that calling the graph in streaming mode allows us to monitor steps and potentially take action on them during execution."
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 8,
+ "id": "7b1994f4-5a7a-4dda-bc0c-b9548cc8242f",
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "{'generate_summary': {'summaries': ['Apples are typically red in color.']}}\n",
+ "{'generate_summary': {'summaries': ['Bananas are yellow in color.']}}\n",
+ "{'generate_summary': {'summaries': ['Blueberries are a type of fruit that are blue in color.']}}\n",
+ "{'generate_final_summary': {'final_summary': 'The main themes are the colors of different fruits: apples are red, blueberries are blue, and bananas are yellow.'}}\n"
+ ]
+ }
+ ],
+ "source": [
+ "# Call the graph:\n",
+ "async for step in app.astream({\"contents\": [doc.page_content for doc in documents]}):\n",
+ " print(step)"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "c4d4e16c-4279-4a55-b3a8-5adbe63febe5",
+ "metadata": {},
+ "source": [
+ "In the [LangSmith trace](https://smith.langchain.com/public/8ecbe9fd-eb02-4c6e-90ae-659952c9360a/r) we recover the same four LLM calls as before."
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "b8027c94-c151-4fa4-8180-088fa52bb042",
+ "metadata": {},
+ "source": [
+ " \n",
+ "\n",
+ "## Summarizing long documents"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "2b50a081-7dec-4680-88f2-2d43f0079e1c",
+ "metadata": {},
+ "source": [
+ "Map-reduce flows are particularly useful when texts are long compared to the context window of an LLM. `MapReduceDocumentsChain` supports a recursive \"collapsing\" of the summaries: the inputs are partitioned based on a token limit, and summaries are generated of the partitions. This step is repeated until the total length of the summaries is within a desired limit, allowing for the summarization of arbitrary-length text.\n",
+ "\n",
+ "This \"collapse\" step is implemented as a `while` loop within `MapReduceDocumentsChain`. We can demonstrate this step on a longer text, a [LLM Powered Autonomous Agents](https://lilianweng.github.io/posts/2023-06-23-agent/) blog post by Lilian Weng (as featured in the [RAG tutorial](/docs/tutorials/rag) and other documentation).\n",
+ "\n",
+ "First we load the post and chunk it into smaller \"sub documents\":"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 9,
+ "id": "dfbb6ce8-9183-41d4-b022-924ee01669e0",
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stderr",
+ "output_type": "stream",
+ "text": [
+ "USER_AGENT environment variable not set, consider setting it to identify your requests.\n",
+ "Created a chunk of size 1003, which is longer than the specified 1000\n"
+ ]
+ },
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "Generated 14 documents.\n"
+ ]
+ }
+ ],
+ "source": [
+ "from langchain_community.document_loaders import WebBaseLoader\n",
+ "from langchain_text_splitters import CharacterTextSplitter\n",
+ "\n",
+ "loader = WebBaseLoader(\"https://lilianweng.github.io/posts/2023-06-23-agent/\")\n",
+ "documents = loader.load()\n",
+ "\n",
+ "text_splitter = CharacterTextSplitter.from_tiktoken_encoder(\n",
+ " chunk_size=1000, chunk_overlap=0\n",
+ ")\n",
+ "split_docs = text_splitter.split_documents(documents)\n",
+ "print(f\"Generated {len(split_docs)} documents.\")"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "06b84ce2-4405-4f0c-aae3-6eff92de6bd9",
+ "metadata": {},
+ "source": [
+ "### Legacy\n",
+ "\n",
+ "\n",
+ "We can invoke `MapReduceDocumentsChain` as before:"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 12,
+ "id": "ec58fdce-c6f1-4964-bea6-0fcba0e0ae8a",
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "The article discusses the use of Large Language Models (LLMs) to power autonomous agents in various tasks, showcasing their capabilities in problem-solving beyond generating written content. Key components such as planning, memory optimization, and tool use are explored, with proof-of-concept demos like AutoGPT and GPT-Engineer demonstrating the potential of LLM-powered agents. Challenges include limitations in historical information retention and natural language interface reliability, while the potential of LLMs in enhancing reasoning, problem-solving, and planning proficiency for autonomous agents is highlighted. Overall, the article emphasizes the versatility and power of LLMs in creating intelligent agents for tasks like scientific discovery and experiment design.\n"
+ ]
+ }
+ ],
+ "source": [
+ "result = map_reduce_chain.invoke(split_docs)\n",
+ "\n",
+ "print(result[\"output_text\"])"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "705b9c3b-6674-4c7e-8843-1d08dde078f8",
+ "metadata": {},
+ "source": [
+ "Consider the [LangSmith trace](https://smith.langchain.com/public/d8b3311d-2220-487a-8eaf-104ef90678dd/r) for the above invocation. When instantiating our `ReduceDocumentsChain`, we set a `token_max` of 1,000 tokens. This results in a total of 17 LLM calls:\n",
+ "\n",
+ "- 14 calls are for summarizing the 14 sub-documents generated by our text splitter.\n",
+ "- This generated summaries that totaled about 1,000 - 2,000 tokens. Because we set a `token_max` of 1,000, there are two more calls to summarize (or \"collapse\") these summaries.\n",
+ "- One final call is for generating a final summary of the two \"collapsed\" summaries."
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "4100aedb-0170-45a1-97d5-aa7e9bdb0419",
+ "metadata": {},
+ "source": [
+ " \n",
+ "\n",
+ "### LangGraph\n",
+ "\n",
+ "\n",
+ "We can extend our original map-reduce implementation in LangGraph to implement the same recursive collapsing step. We make the following changes:\n",
+ "\n",
+ "- Add a `collapsed_summaries` key to the state to store the collapsed summaries;\n",
+ "- Update the final summarization node to summarize the collapsed summaries;\n",
+ "- Add a `collapse_summaries` node that partitions a list of documents based on a token length (1,000 tokens here, as before) and generates summaries of each partition and stores the result in `collapsed_summaries`.\n",
+ "\n",
+ "We add a conditional edge from `collapse_summaries` to itself to form a loop: if the collapsed summaries total more than the `token_max`, we re-run the node."
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 11,
+ "id": "a1cb9fcf-3a27-45e0-84bc-83c66aa65421",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "from typing import Literal\n",
+ "\n",
+ "from langchain.chains.combine_documents.reduce import (\n",
+ " acollapse_docs,\n",
+ " split_list_of_docs,\n",
+ ")\n",
+ "\n",
+ "\n",
+ "def length_function(documents: List[Document]) -> int:\n",
+ " \"\"\"Get number of tokens for input contents.\"\"\"\n",
+ " return sum(llm.get_num_tokens(doc.page_content) for doc in documents)\n",
+ "\n",
+ "\n",
+ "token_max = 1000\n",
+ "\n",
+ "\n",
+ "class OverallState(TypedDict):\n",
+ " contents: List[str]\n",
+ " summaries: Annotated[list, operator.add]\n",
+ " collapsed_summaries: List[Document] # add key for collapsed summaries\n",
+ " final_summary: str\n",
+ "\n",
+ "\n",
+ "# Add node to store summaries for collapsing\n",
+ "def collect_summaries(state: OverallState):\n",
+ " return {\n",
+ " \"collapsed_summaries\": [Document(summary) for summary in state[\"summaries\"]]\n",
+ " }\n",
+ "\n",
+ "\n",
+ "# Modify final summary to read off collapsed summaries\n",
+ "async def generate_final_summary(state: OverallState):\n",
+ " response = await reduce_chain.ainvoke(state[\"collapsed_summaries\"])\n",
+ " return {\"final_summary\": response}\n",
+ "\n",
+ "\n",
+ "graph = StateGraph(OverallState)\n",
+ "graph.add_node(\"generate_summary\", generate_summary) # same as before\n",
+ "graph.add_node(\"collect_summaries\", collect_summaries)\n",
+ "graph.add_node(\"generate_final_summary\", generate_final_summary)\n",
+ "\n",
+ "\n",
+ "# Add node to collapse summaries\n",
+ "async def collapse_summaries(state: OverallState):\n",
+ " doc_lists = split_list_of_docs(\n",
+ " state[\"collapsed_summaries\"], length_function, token_max\n",
+ " )\n",
+ " results = []\n",
+ " for doc_list in doc_lists:\n",
+ " results.append(await acollapse_docs(doc_list, reduce_chain.ainvoke))\n",
+ "\n",
+ " return {\"collapsed_summaries\": results}\n",
+ "\n",
+ "\n",
+ "graph.add_node(\"collapse_summaries\", collapse_summaries)\n",
+ "\n",
+ "\n",
+ "def should_collapse(\n",
+ " state: OverallState,\n",
+ ") -> Literal[\"collapse_summaries\", \"generate_final_summary\"]:\n",
+ " num_tokens = length_function(state[\"collapsed_summaries\"])\n",
+ " if num_tokens > token_max:\n",
+ " return \"collapse_summaries\"\n",
+ " else:\n",
+ " return \"generate_final_summary\"\n",
+ "\n",
+ "\n",
+ "graph.add_conditional_edges(START, map_summaries, [\"generate_summary\"])\n",
+ "graph.add_edge(\"generate_summary\", \"collect_summaries\")\n",
+ "graph.add_conditional_edges(\"collect_summaries\", should_collapse)\n",
+ "graph.add_conditional_edges(\"collapse_summaries\", should_collapse)\n",
+ "graph.add_edge(\"generate_final_summary\", END)\n",
+ "app = graph.compile()"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "c93f1c59-0e76-4528-9971-5aeb837b97aa",
+ "metadata": {},
+ "source": [
+ "LangGraph allows the graph structure to be plotted to help visualize its function:"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 12,
+ "id": "4c1704a1-d7e3-43a4-8ea8-7af765253194",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "image/jpeg": "",
+ "text/plain": [
+ ""
+ ]
+ },
+ "execution_count": 12,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "from IPython.display import Image\n",
+ "\n",
+ "Image(app.get_graph().draw_mermaid_png())"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "9fcc664b-9d8e-4b16-90bd-5074c778d4ec",
+ "metadata": {},
+ "source": [
+ "As before, we can stream the graph to observe its sequence of steps. Below, we will simply print out the name of the step.\n",
+ "\n",
+ "Note that because we have a loop in the graph, it can be helpful to specify a [recursion_limit](https://langchain-ai.github.io/langgraph/reference/errors/#langgraph.errors.GraphRecursionError) on its execution. This is analogous to [ReduceDocumentsChain.token_max](https://api.python.langchain.com/en/latest/chains/langchain.chains.combine_documents.reduce.ReduceDocumentsChain.html#langchain.chains.combine_documents.reduce.ReduceDocumentsChain.token_max) and will raise a specific error when the specified limit is exceeded."
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 13,
+ "id": "bf2b5408-580b-4fc6-857d-55ceae94ba23",
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "['generate_summary']\n",
+ "['generate_summary']\n",
+ "['generate_summary']\n",
+ "['generate_summary']\n",
+ "['generate_summary']\n",
+ "['generate_summary']\n",
+ "['generate_summary']\n",
+ "['generate_summary']\n",
+ "['generate_summary']\n",
+ "['generate_summary']\n",
+ "['generate_summary']\n",
+ "['generate_summary']\n",
+ "['generate_summary']\n",
+ "['generate_summary']\n",
+ "['collect_summaries']\n",
+ "['collapse_summaries']\n",
+ "['generate_final_summary']\n"
+ ]
+ }
+ ],
+ "source": [
+ "async for step in app.astream(\n",
+ " {\"contents\": [doc.page_content for doc in split_docs]},\n",
+ " {\"recursion_limit\": 10},\n",
+ "):\n",
+ " print(list(step.keys()))"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 19,
+ "id": "e86c67ff-eaf8-410e-99e5-150602022283",
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "{'generate_final_summary': {'final_summary': 'The summaries discuss the use of Large Language Models (LLMs) to power autonomous agents in various tasks such as problem-solving, planning, and tool use. Key components like planning, memory, and task decomposition are highlighted, along with challenges such as inefficient planning and hallucination. Techniques like Algorithm Distillation and Maximum Inner Product Search are explored for optimization, while frameworks like ReAct and Reflexion show improvements in knowledge-intensive tasks. The importance of accurate interpretation of user input and well-structured code for functional autonomy is emphasized, along with the potential of LLMs in prompting, reasoning, and emergent social behavior in simulation environments. Challenges in real-world scenarios and the use of LLMs with expert-designed tools for tasks like organic synthesis and drug discovery are also discussed.'}}\n"
+ ]
+ }
+ ],
+ "source": [
+ "print(step)"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "47df3079-bd67-4384-8609-1de3d966420b",
+ "metadata": {},
+ "source": [
+ "In the corresponding [LangSmith trace](https://smith.langchain.com/public/9d7b1d50-e1d6-44c9-9ab2-eabef621c883/r) we can see the same 17 LLM calls as before, this time grouped under their respective nodes.\n",
+ "\n",
+ " \n",
+ "\n",
+ "## Next steps\n",
+ "\n",
+ "Check out the [LangGraph documentation](https://langchain-ai.github.io/langgraph/) for detail on building with LangGraph, including [this guide](https://langchain-ai.github.io/langgraph/how-tos/map-reduce/) on the details of map-reduce in LangGraph.\n",
+ "\n",
+ "See [this tutorial](/docs/tutorials/summarization/) for more LLM-based summarization strategies."
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": null,
+ "id": "1d9ed018-f9a8-4cc9-9f42-405da6f05206",
+ "metadata": {},
+ "outputs": [],
+ "source": []
+ }
+ ],
+ "metadata": {
+ "kernelspec": {
+ "display_name": "Python 3 (ipykernel)",
+ "language": "python",
+ "name": "python3"
+ },
+ "language_info": {
+ "codemirror_mode": {
+ "name": "ipython",
+ "version": 3
+ },
+ "file_extension": ".py",
+ "mimetype": "text/x-python",
+ "name": "python",
+ "nbconvert_exporter": "python",
+ "pygments_lexer": "ipython3",
+ "version": "3.10.4"
+ }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}
diff --git a/docs/docs/versions/migrating_chains/map_rerank_docs_chain.ipynb b/docs/docs/versions/migrating_chains/map_rerank_docs_chain.ipynb
new file mode 100644
index 00000000000..43b3408b2ba
--- /dev/null
+++ b/docs/docs/versions/migrating_chains/map_rerank_docs_chain.ipynb
@@ -0,0 +1,341 @@
+{
+ "cells": [
+ {
+ "cell_type": "markdown",
+ "id": "9db5ad7a-857e-46ea-9d0c-ba3fbe62fc81",
+ "metadata": {},
+ "source": [
+ "---\n",
+ "title: Migrating from MapRerankDocumentsChain\n",
+ "---\n",
+ "\n",
+ "[MapRerankDocumentsChain](https://api.python.langchain.com/en/latest/chains/langchain.chains.combine_documents.map_rerank.MapRerankDocumentsChain.html) implements a strategy for analyzing long texts. The strategy is as follows:\n",
+ "\n",
+ "- Split a text into smaller documents;\n",
+ "- Map a process to the set of documents, where the process includes generating a score;\n",
+ "- Rank the results by score and return the maximum.\n",
+ "\n",
+ "A common process in this scenario is question-answering using pieces of context from a document. Forcing the model to generate a score along with its answer helps to select for answers generated only by relevant context.\n",
+ "\n",
+ "A [LangGraph](https://langchain-ai.github.io/langgraph/) implementation allows for the incorporation of [tool calling](/docs/concepts/#functiontool-calling) and other features for this problem. Below we will go through both `MapRerankDocumentsChain` and a corresponding LangGraph implementation on a simple example for illustrative purposes."
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "39f11f9f-ac24-485e-bc15-285bebb9c12e",
+ "metadata": {},
+ "source": [
+ "## Example\n",
+ "\n",
+ "Let's go through an example where we analyze a set of documents. We first generate some simple documents for illustrative purposes:"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 2,
+ "id": "ef975d40-6ea3-4280-84cb-fae4c285c72b",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "from langchain_core.documents import Document\n",
+ "\n",
+ "documents = [\n",
+ " Document(page_content=\"Alice has blue eyes\", metadata={\"title\": \"book_chapter_2\"}),\n",
+ " Document(page_content=\"Bob has brown eyes\", metadata={\"title\": \"book_chapter_1\"}),\n",
+ " Document(\n",
+ " page_content=\"Charlie has green eyes\", metadata={\"title\": \"book_chapter_3\"}\n",
+ " ),\n",
+ "]"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "e3b99cfc-b99c-4da8-9c87-903e0249d227",
+ "metadata": {},
+ "source": [
+ "### Legacy\n",
+ "\n",
+ "\n",
+ "\n",
+ "Below we show an implementation with `MapRerankDocumentsChain`. We define the prompt template for a question-answering task and instantiate a [LLMChain](https://api.python.langchain.com/en/latest/chains/langchain.chains.llm.LLMChain.html) object for this purpose. We define how documents are formatted into the prompt and ensure consistency among the keys in the various prompts."
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 4,
+ "id": "3b65e056-d739-4985-8bfc-0edf783f2b16",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "from langchain.chains import LLMChain, MapRerankDocumentsChain\n",
+ "from langchain.output_parsers.regex import RegexParser\n",
+ "from langchain_core.prompts import PromptTemplate\n",
+ "from langchain_openai import OpenAI\n",
+ "\n",
+ "document_variable_name = \"context\"\n",
+ "llm = OpenAI()\n",
+ "# The prompt here should take as an input variable the\n",
+ "# `document_variable_name`\n",
+ "# The actual prompt will need to be a lot more complex, this is just\n",
+ "# an example.\n",
+ "prompt_template = (\n",
+ " \"What color are Bob's eyes? \"\n",
+ " \"Output both your answer and a score (1-10) of how confident \"\n",
+ " \"you are in the format: \\nScore: .\\n\\n\"\n",
+ " \"Provide no other commentary.\\n\\n\"\n",
+ " \"Context: {context}\"\n",
+ ")\n",
+ "output_parser = RegexParser(\n",
+ " regex=r\"(.*?)\\nScore: (.*)\",\n",
+ " output_keys=[\"answer\", \"score\"],\n",
+ ")\n",
+ "prompt = PromptTemplate(\n",
+ " template=prompt_template,\n",
+ " input_variables=[\"context\"],\n",
+ " output_parser=output_parser,\n",
+ ")\n",
+ "llm_chain = LLMChain(llm=llm, prompt=prompt)\n",
+ "chain = MapRerankDocumentsChain(\n",
+ " llm_chain=llm_chain,\n",
+ " document_variable_name=document_variable_name,\n",
+ " rank_key=\"score\",\n",
+ " answer_key=\"answer\",\n",
+ ")"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 9,
+ "id": "fe94c2e5-4c56-4604-a16c-055c196f4a57",
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stderr",
+ "output_type": "stream",
+ "text": [
+ "/langchain/libs/langchain/langchain/chains/llm.py:369: UserWarning: The apply_and_parse method is deprecated, instead pass an output parser directly to LLMChain.\n",
+ " warnings.warn(\n"
+ ]
+ },
+ {
+ "data": {
+ "text/plain": [
+ "'Brown'"
+ ]
+ },
+ "execution_count": 9,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "response = chain.invoke(documents)\n",
+ "response[\"output_text\"]"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "317e51c2-810f-463b-9da2-604fe95a8b48",
+ "metadata": {},
+ "source": [
+ "Inspecting the [LangSmith trace](https://smith.langchain.com/public/7a071bd1-0283-4b90-898c-6e4a2b5a0593/r) for the above run, we can see three LLM calls-- one for each document-- and that the scoring mechanism mitigated against hallucinations.\n",
+ "\n",
+ " \n",
+ "\n",
+ "### LangGraph\n",
+ "\n",
+ "\n",
+ "\n",
+ "Below we show a LangGraph implementation of this process. Note that our template is simplified, as we delegate the formatting instructions to the chat model's tool-calling features via the [.with_structured_output](/docs/how_to/structured_output/) method.\n",
+ "\n",
+ "Here we follow a basic [map-reduce](https://langchain-ai.github.io/langgraph/how-tos/map-reduce/) workflow to execute the LLM calls in parallel.\n",
+ "\n",
+ "We will need to install `langgraph`:"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": null,
+ "id": "b8fab4f6-eed1-4662-8d3f-82846a2edfb3",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "pip install -qU langgraph"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 6,
+ "id": "b8493533-7ab3-4f75-aab1-390340bff2ea",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "import operator\n",
+ "from typing import Annotated, List, TypedDict\n",
+ "\n",
+ "from langchain_core.prompts import ChatPromptTemplate\n",
+ "from langchain_openai import ChatOpenAI\n",
+ "from langgraph.constants import Send\n",
+ "from langgraph.graph import END, START, StateGraph\n",
+ "\n",
+ "\n",
+ "class AnswerWithScore(TypedDict):\n",
+ " answer: str\n",
+ " score: Annotated[int, ..., \"Score from 1-10.\"]\n",
+ "\n",
+ "\n",
+ "llm = ChatOpenAI(model=\"gpt-4o-mini\", temperature=0)\n",
+ "\n",
+ "prompt_template = \"What color are Bob's eyes?\\n\\n\" \"Context: {context}\"\n",
+ "prompt = ChatPromptTemplate.from_template(prompt_template)\n",
+ "\n",
+ "# The below chain formats context from a document into a prompt, then\n",
+ "# generates a response structured according to the AnswerWithScore schema.\n",
+ "map_chain = prompt | llm.with_structured_output(AnswerWithScore)\n",
+ "\n",
+ "# Below we define the components that will make up the graph\n",
+ "\n",
+ "\n",
+ "# This will be the overall state of the graph.\n",
+ "# It will contain the input document contents, corresponding\n",
+ "# answers with scores, and a final answer.\n",
+ "class State(TypedDict):\n",
+ " contents: List[str]\n",
+ " answers_with_scores: Annotated[list, operator.add]\n",
+ " answer: str\n",
+ "\n",
+ "\n",
+ "# This will be the state of the node that we will \"map\" all\n",
+ "# documents to in order to generate answers with scores\n",
+ "class MapState(TypedDict):\n",
+ " content: str\n",
+ "\n",
+ "\n",
+ "# Here we define the logic to map out over the documents\n",
+ "# We will use this as an edge in the graph\n",
+ "def map_analyses(state: State):\n",
+ " # We will return a list of `Send` objects\n",
+ " # Each `Send` object consists of the name of a node in the graph\n",
+ " # as well as the state to send to that node\n",
+ " return [\n",
+ " Send(\"generate_analysis\", {\"content\": content}) for content in state[\"contents\"]\n",
+ " ]\n",
+ "\n",
+ "\n",
+ "# Here we generate an answer with score, given a document\n",
+ "async def generate_analysis(state: MapState):\n",
+ " response = await map_chain.ainvoke(state[\"content\"])\n",
+ " return {\"answers_with_scores\": [response]}\n",
+ "\n",
+ "\n",
+ "# Here we will select the top answer\n",
+ "def pick_top_ranked(state: State):\n",
+ " ranked_answers = sorted(\n",
+ " state[\"answers_with_scores\"], key=lambda x: -int(x[\"score\"])\n",
+ " )\n",
+ " return {\"answer\": ranked_answers[0]}\n",
+ "\n",
+ "\n",
+ "# Construct the graph: here we put everything together to construct our graph\n",
+ "graph = StateGraph(State)\n",
+ "graph.add_node(\"generate_analysis\", generate_analysis)\n",
+ "graph.add_node(\"pick_top_ranked\", pick_top_ranked)\n",
+ "graph.add_conditional_edges(START, map_analyses, [\"generate_analysis\"])\n",
+ "graph.add_edge(\"generate_analysis\", \"pick_top_ranked\")\n",
+ "graph.add_edge(\"pick_top_ranked\", END)\n",
+ "app = graph.compile()"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 7,
+ "id": "ccf10061-f0dc-4333-9053-ebebe3f2e196",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "image/jpeg": "",
+ "text/plain": [
+ ""
+ ]
+ },
+ "execution_count": 7,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "from IPython.display import Image\n",
+ "\n",
+ "Image(app.get_graph().draw_mermaid_png())"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 8,
+ "id": "5d7bf45e-d615-45f7-a3d6-54700993f69e",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "{'answer': 'Bob has brown eyes.', 'score': 10}"
+ ]
+ },
+ "execution_count": 8,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "result = await app.ainvoke({\"contents\": [doc.page_content for doc in documents]})\n",
+ "result[\"answer\"]"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "337f8f18-f048-495a-ade2-870790c01f70",
+ "metadata": {},
+ "source": [
+ "Inspecting the [LangSmith trace](https://smith.langchain.com/public/b64bf9aa-7558-4c1b-be5c-ba8924069039/r) for the above run, we can see three LLM calls as before. Using the model's tool-calling features has also enabled us to remove the parsing step.\n",
+ "\n",
+ " \n",
+ "\n",
+ "## Next steps\n",
+ "\n",
+ "See these [how-to guides](/docs/how_to/#qa-with-rag) for more on question-answering tasks with RAG.\n",
+ "\n",
+ "Check out the [LangGraph documentation](https://langchain-ai.github.io/langgraph/) for detail on building with LangGraph, including [this guide](https://langchain-ai.github.io/langgraph/how-tos/map-reduce/) on the details of map-reduce in LangGraph."
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": null,
+ "id": "54e88df8-7d12-4ee1-9e0a-bf8a7baacba7",
+ "metadata": {},
+ "outputs": [],
+ "source": []
+ }
+ ],
+ "metadata": {
+ "kernelspec": {
+ "display_name": "Python 3 (ipykernel)",
+ "language": "python",
+ "name": "python3"
+ },
+ "language_info": {
+ "codemirror_mode": {
+ "name": "ipython",
+ "version": 3
+ },
+ "file_extension": ".py",
+ "mimetype": "text/x-python",
+ "name": "python",
+ "nbconvert_exporter": "python",
+ "pygments_lexer": "ipython3",
+ "version": "3.10.4"
+ }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}
diff --git a/docs/docs/versions/migrating_chains/multi_prompt_chain.ipynb b/docs/docs/versions/migrating_chains/multi_prompt_chain.ipynb
new file mode 100644
index 00000000000..c1613464382
--- /dev/null
+++ b/docs/docs/versions/migrating_chains/multi_prompt_chain.ipynb
@@ -0,0 +1,362 @@
+{
+ "cells": [
+ {
+ "cell_type": "markdown",
+ "id": "575befea-4d98-4941-8e55-1581b169a674",
+ "metadata": {},
+ "source": [
+ "---\n",
+ "title: Migrating from MultiPromptChain\n",
+ "---"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "14625d35-efca-41cf-b203-be9f4c375700",
+ "metadata": {},
+ "source": [
+ "The [`MultiPromptChain`](https://api.python.langchain.com/en/latest/chains/langchain.chains.router.multi_prompt.MultiPromptChain.html) routed an input query to one of multiple LLMChains-- that is, given an input query, it used a LLM to select from a list of prompts, formatted the query into the prompt, and generated a response.\n",
+ "\n",
+ "`MultiPromptChain` does not support common [chat model](/docs/concepts/#chat-models) features, such as message roles and [tool calling](/docs/concepts/#functiontool-calling).\n",
+ "\n",
+ "A [LangGraph](https://langchain-ai.github.io/langgraph/) implementation confers a number of advantages for this problem:\n",
+ "\n",
+ "- Supports chat prompt templates, including messages with `system` and other roles;\n",
+ "- Supports the use of tool calling for the routing step;\n",
+ "- Supports streaming of both individual steps and output tokens.\n",
+ "\n",
+ "Now let's look at them side-by-side. Note that for this guide we will need `langchain-openai >= 0.1.20`."
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": null,
+ "id": "cba0c648-63e9-4f4a-b4ba-cd36fcb21466",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "%pip install -qU langchain-core langchain-openai"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": null,
+ "id": "d05ae3aa-96cc-49f2-8dd0-601c2503b7ca",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "import os\n",
+ "from getpass import getpass\n",
+ "\n",
+ "os.environ[\"OPENAI_API_KEY\"] = getpass()"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "707283ee-fbd8-43e0-9796-343fc2534658",
+ "metadata": {},
+ "source": [
+ "## Legacy\n",
+ "\n",
+ ""
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 4,
+ "id": "4cca7a1a-3ce5-4c60-9664-cbbff14fc7d5",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "from langchain.chains.router.multi_prompt import MultiPromptChain\n",
+ "from langchain_openai import ChatOpenAI\n",
+ "\n",
+ "llm = ChatOpenAI(model=\"gpt-4o-mini\")\n",
+ "\n",
+ "prompt_1_template = \"\"\"\n",
+ "You are an expert on animals. Please answer the below query:\n",
+ "\n",
+ "{input}\n",
+ "\"\"\"\n",
+ "\n",
+ "prompt_2_template = \"\"\"\n",
+ "You are an expert on vegetables. Please answer the below query:\n",
+ "\n",
+ "{input}\n",
+ "\"\"\"\n",
+ "\n",
+ "prompt_infos = [\n",
+ " {\n",
+ " \"name\": \"animals\",\n",
+ " \"description\": \"prompt for an animal expert\",\n",
+ " \"prompt_template\": prompt_1_template,\n",
+ " },\n",
+ " {\n",
+ " \"name\": \"vegetables\",\n",
+ " \"description\": \"prompt for a vegetable expert\",\n",
+ " \"prompt_template\": prompt_2_template,\n",
+ " },\n",
+ "]\n",
+ "\n",
+ "chain = MultiPromptChain.from_prompts(llm, prompt_infos)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 5,
+ "id": "fcb635d2-0402-4afb-ab64-044811d5348c",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "{'input': 'What color are carrots?',\n",
+ " 'text': 'Carrots are most commonly orange, but they can also be found in a variety of other colors including purple, yellow, white, and red. The orange variety is the most popular and widely recognized.'}"
+ ]
+ },
+ "execution_count": 5,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "chain.invoke({\"input\": \"What color are carrots?\"})"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "10ff8cd1-7e47-4133-a793-1ccd61a57f04",
+ "metadata": {},
+ "source": [
+ "In the [LangSmith trace](https://smith.langchain.com/public/e935238b-0b63-4984-abc8-873b2170a32d/r) we can see the two steps of this process, including the prompts for routing the query and the final selected prompt.\n",
+ "\n",
+ " \n",
+ "\n",
+ "## LangGraph\n",
+ "\n",
+ ""
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": null,
+ "id": "4a864796-ec89-4962-87b3-633f90687e1d",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "pip install -qU langgraph"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 1,
+ "id": "cf1edd2b-7592-47f4-ba8d-94a56742a585",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "from operator import itemgetter\n",
+ "from typing import Literal\n",
+ "\n",
+ "from langchain_core.output_parsers import StrOutputParser\n",
+ "from langchain_core.prompts import ChatPromptTemplate\n",
+ "from langchain_core.runnables import RunnableConfig\n",
+ "from langchain_openai import ChatOpenAI\n",
+ "from langgraph.graph import END, START, StateGraph\n",
+ "from typing_extensions import TypedDict\n",
+ "\n",
+ "llm = ChatOpenAI(model=\"gpt-4o-mini\")\n",
+ "\n",
+ "# Define the prompts we will route to\n",
+ "prompt_1 = ChatPromptTemplate.from_messages(\n",
+ " [\n",
+ " (\"system\", \"You are an expert on animals.\"),\n",
+ " (\"human\", \"{input}\"),\n",
+ " ]\n",
+ ")\n",
+ "prompt_2 = ChatPromptTemplate.from_messages(\n",
+ " [\n",
+ " (\"system\", \"You are an expert on vegetables.\"),\n",
+ " (\"human\", \"{input}\"),\n",
+ " ]\n",
+ ")\n",
+ "\n",
+ "# Construct the chains we will route to. These format the input query\n",
+ "# into the respective prompt, run it through a chat model, and cast\n",
+ "# the result to a string.\n",
+ "chain_1 = prompt_1 | llm | StrOutputParser()\n",
+ "chain_2 = prompt_2 | llm | StrOutputParser()\n",
+ "\n",
+ "\n",
+ "# Next: define the chain that selects which branch to route to.\n",
+ "# Here we will take advantage of tool-calling features to force\n",
+ "# the output to select one of two desired branches.\n",
+ "route_system = \"Route the user's query to either the animal or vegetable expert.\"\n",
+ "route_prompt = ChatPromptTemplate.from_messages(\n",
+ " [\n",
+ " (\"system\", route_system),\n",
+ " (\"human\", \"{input}\"),\n",
+ " ]\n",
+ ")\n",
+ "\n",
+ "\n",
+ "# Define schema for output:\n",
+ "class RouteQuery(TypedDict):\n",
+ " \"\"\"Route query to destination expert.\"\"\"\n",
+ "\n",
+ " destination: Literal[\"animal\", \"vegetable\"]\n",
+ "\n",
+ "\n",
+ "route_chain = route_prompt | llm.with_structured_output(RouteQuery)\n",
+ "\n",
+ "\n",
+ "# For LangGraph, we will define the state of the graph to hold the query,\n",
+ "# destination, and final answer.\n",
+ "class State(TypedDict):\n",
+ " query: str\n",
+ " destination: RouteQuery\n",
+ " answer: str\n",
+ "\n",
+ "\n",
+ "# We define functions for each node, including routing the query:\n",
+ "async def route_query(state: State, config: RunnableConfig):\n",
+ " destination = await route_chain.ainvoke(state[\"query\"], config)\n",
+ " return {\"destination\": destination}\n",
+ "\n",
+ "\n",
+ "# And one node for each prompt\n",
+ "async def prompt_1(state: State, config: RunnableConfig):\n",
+ " return {\"answer\": await chain_1.ainvoke(state[\"query\"], config)}\n",
+ "\n",
+ "\n",
+ "async def prompt_2(state: State, config: RunnableConfig):\n",
+ " return {\"answer\": await chain_2.ainvoke(state[\"query\"], config)}\n",
+ "\n",
+ "\n",
+ "# We then define logic that selects the prompt based on the classification\n",
+ "def select_node(state: State) -> Literal[\"prompt_1\", \"prompt_2\"]:\n",
+ " if state[\"destination\"] == \"animal\":\n",
+ " return \"prompt_1\"\n",
+ " else:\n",
+ " return \"prompt_2\"\n",
+ "\n",
+ "\n",
+ "# Finally, assemble the multi-prompt chain. This is a sequence of two steps:\n",
+ "# 1) Select \"animal\" or \"vegetable\" via the route_chain, and collect the answer\n",
+ "# alongside the input query.\n",
+ "# 2) Route the input query to chain_1 or chain_2, based on the\n",
+ "# selection.\n",
+ "graph = StateGraph(State)\n",
+ "graph.add_node(\"route_query\", route_query)\n",
+ "graph.add_node(\"prompt_1\", prompt_1)\n",
+ "graph.add_node(\"prompt_2\", prompt_2)\n",
+ "\n",
+ "graph.add_edge(START, \"route_query\")\n",
+ "graph.add_conditional_edges(\"route_query\", select_node)\n",
+ "graph.add_edge(\"prompt_1\", END)\n",
+ "graph.add_edge(\"prompt_2\", END)\n",
+ "app = graph.compile()"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 2,
+ "id": "92ef8d86-daa6-4ff3-b722-468e7cf8bcb2",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "image/jpeg": "",
+ "text/plain": [
+ ""
+ ]
+ },
+ "execution_count": 2,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "from IPython.display import Image\n",
+ "\n",
+ "Image(app.get_graph().draw_mermaid_png())"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "8a665dd1-7459-4511-8556-418f15cfec57",
+ "metadata": {},
+ "source": [
+ "We can invoke the chain as follows:"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 3,
+ "id": "61838f81-4e60-445f-9c05-563e3520ab33",
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "{'destination': 'vegetable'}\n",
+ "Carrots are most commonly orange, but they can also come in a variety of other colors, including purple, red, yellow, and white. The different colors often indicate varying flavors and nutritional profiles. For example, purple carrots contain anthocyanins, while orange carrots are rich in beta-carotene, which is converted to vitamin A in the body.\n"
+ ]
+ }
+ ],
+ "source": [
+ "state = await app.ainvoke({\"query\": \"what color are carrots\"})\n",
+ "print(state[\"destination\"])\n",
+ "print(state[\"answer\"])"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "e7e46205-9d80-45b8-a3d5-cfbc8ebbe19a",
+ "metadata": {},
+ "source": [
+ "In the [LangSmith trace](https://smith.langchain.com/public/1017a9d2-2d2a-4954-a5fd-5689632b4c5f/r) we can see the tool call that routed the query and the prompt that was selected to generate the answer.\n",
+ "\n",
+ " \n",
+ "\n",
+ "## Overview:\n",
+ "\n",
+ "- Under the hood, `MultiPromptChain` routes the query by instructing the LLM to generate JSON-formatted text, and parses out the intended destination. It takes a registry of string prompt templates as input.\n",
+ "- The LangGraph implementation, implemented above via lower-level primitives, uses tool-calling to route to arbitrary chains. In this example, the chains include chat model templates and chat models."
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "cf89de23-377b-4933-839c-d2f2483d09d2",
+ "metadata": {},
+ "source": [
+ "## Next steps\n",
+ "\n",
+ "See [this tutorial](/docs/tutorials/llm_chain) for more detail on building with prompt templates, LLMs, and output parsers.\n",
+ "\n",
+ "Check out the [LangGraph documentation](https://langchain-ai.github.io/langgraph/) for detail on building with LangGraph."
+ ]
+ }
+ ],
+ "metadata": {
+ "kernelspec": {
+ "display_name": "Python 3 (ipykernel)",
+ "language": "python",
+ "name": "python3"
+ },
+ "language_info": {
+ "codemirror_mode": {
+ "name": "ipython",
+ "version": 3
+ },
+ "file_extension": ".py",
+ "mimetype": "text/x-python",
+ "name": "python",
+ "nbconvert_exporter": "python",
+ "pygments_lexer": "ipython3",
+ "version": "3.10.4"
+ }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}
diff --git a/docs/docs/versions/migrating_chains/refine_docs_chain.ipynb b/docs/docs/versions/migrating_chains/refine_docs_chain.ipynb
new file mode 100644
index 00000000000..51fd1bbcc43
--- /dev/null
+++ b/docs/docs/versions/migrating_chains/refine_docs_chain.ipynb
@@ -0,0 +1,452 @@
+{
+ "cells": [
+ {
+ "cell_type": "markdown",
+ "id": "32eee276-7847-45d8-b303-dccc330c8a1a",
+ "metadata": {},
+ "source": [
+ "---\n",
+ "title: Migrating from RefineDocumentsChain\n",
+ "---\n",
+ "\n",
+ "[RefineDocumentsChain](https://api.python.langchain.com/en/latest/chains/langchain.chains.combine_documents.refine.RefineDocumentsChain.html) implements a strategy for analyzing long texts. The strategy is as follows:\n",
+ "\n",
+ "- Split a text into smaller documents;\n",
+ "- Apply a process to the first document;\n",
+ "- Refine or update the result based on the next document;\n",
+ "- Repeat through the sequence of documents until finished.\n",
+ "\n",
+ "A common process applied in this context is summarization, in which a running summary is modified as we proceed through chunks of a long text. This is particularly useful for texts that are large compared to the context window of a given LLM.\n",
+ "\n",
+ "A [LangGraph](https://langchain-ai.github.io/langgraph/) implementation confers a number of advantages for this problem:\n",
+ "\n",
+ "- Where `RefineDocumentsChain` refines the summary via a `for` loop inside the class, a LangGraph implementation lets you step through the execution to monitor or otherwise steer it if needed.\n",
+ "- The LangGraph implementation supports streaming of both execution steps and individual tokens.\n",
+ "- Because it is assembled from modular components, it is also simple to extend or modify (e.g., to incorporate [tool calling](/docs/concepts/#functiontool-calling) or other behavior).\n",
+ "\n",
+ "Below we will go through both `RefineDocumentsChain` and a corresponding LangGraph implementation on a simple example for illustrative purposes.\n",
+ "\n",
+ "Let's first load a chat model:\n",
+ "\n",
+ "```{=mdx}\n",
+ "import ChatModelTabs from \"@theme/ChatModelTabs\";\n",
+ "\n",
+ "\n",
+ "```"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 1,
+ "id": "34fc8315-4354-4d4e-952a-c0465d93b23c",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "# | output: false\n",
+ "# | echo: false\n",
+ "\n",
+ "from langchain_openai import ChatOpenAI\n",
+ "\n",
+ "llm = ChatOpenAI(model=\"gpt-4o-mini\", temperature=0)"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "9950d6e1-7ca0-4b46-8622-813b3c30b85d",
+ "metadata": {},
+ "source": [
+ "## Example\n",
+ "\n",
+ "Let's go through an example where we summarize a sequence of documents. We first generate some simple documents for illustrative purposes:"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 2,
+ "id": "abb1abb0-0c5e-4179-8431-c2b2d52bd57b",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "from langchain_core.documents import Document\n",
+ "\n",
+ "documents = [\n",
+ " Document(page_content=\"Apples are red\", metadata={\"title\": \"apple_book\"}),\n",
+ " Document(page_content=\"Blueberries are blue\", metadata={\"title\": \"blueberry_book\"}),\n",
+ " Document(page_content=\"Bananas are yelow\", metadata={\"title\": \"banana_book\"}),\n",
+ "]"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "ffd939c9-1717-4afd-a615-4a1d560ca814",
+ "metadata": {},
+ "source": [
+ "### Legacy\n",
+ "\n",
+ "\n",
+ "\n",
+ "Below we show an implementation with `RefineDocumentsChain`. We define the prompt templates for the initial summarization and successive refinements, instantiate separate [LLMChain](https://api.python.langchain.com/en/latest/chains/langchain.chains.llm.LLMChain.html) objects for these two purposes, and instantiate `RefineDocumentsChain` with these components."
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 4,
+ "id": "4b2dd248-8bf3-40a5-9569-df32558b5d21",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "from langchain.chains import LLMChain, RefineDocumentsChain\n",
+ "from langchain_core.prompts import ChatPromptTemplate, PromptTemplate\n",
+ "from langchain_openai import ChatOpenAI\n",
+ "\n",
+ "# This controls how each document will be formatted. Specifically,\n",
+ "# it will be passed to `format_document` - see that function for more\n",
+ "# details.\n",
+ "document_prompt = PromptTemplate(\n",
+ " input_variables=[\"page_content\"], template=\"{page_content}\"\n",
+ ")\n",
+ "document_variable_name = \"context\"\n",
+ "# The prompt here should take as an input variable the\n",
+ "# `document_variable_name`\n",
+ "summarize_prompt = ChatPromptTemplate(\n",
+ " [\n",
+ " (\"human\", \"Write a concise summary of the following: {context}\"),\n",
+ " ]\n",
+ ")\n",
+ "initial_llm_chain = LLMChain(llm=llm, prompt=summarize_prompt)\n",
+ "initial_response_name = \"existing_answer\"\n",
+ "# The prompt here should take as an input variable the\n",
+ "# `document_variable_name` as well as `initial_response_name`\n",
+ "refine_template = \"\"\"\n",
+ "Produce a final summary.\n",
+ "\n",
+ "Existing summary up to this point:\n",
+ "{existing_answer}\n",
+ "\n",
+ "New context:\n",
+ "------------\n",
+ "{context}\n",
+ "------------\n",
+ "\n",
+ "Given the new context, refine the original summary.\n",
+ "\"\"\"\n",
+ "refine_prompt = ChatPromptTemplate([(\"human\", refine_template)])\n",
+ "refine_llm_chain = LLMChain(llm=llm, prompt=refine_prompt)\n",
+ "chain = RefineDocumentsChain(\n",
+ " initial_llm_chain=initial_llm_chain,\n",
+ " refine_llm_chain=refine_llm_chain,\n",
+ " document_prompt=document_prompt,\n",
+ " document_variable_name=document_variable_name,\n",
+ " initial_response_name=initial_response_name,\n",
+ ")"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "06ee50d8-5f37-4bcd-9181-5280b54b1b44",
+ "metadata": {},
+ "source": [
+ "We can now invoke our chain:"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 5,
+ "id": "8686f56f-992f-4556-a74c-8d3903d0db38",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "'Apples are typically red in color, blueberries are blue, and bananas are yellow.'"
+ ]
+ },
+ "execution_count": 5,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "result = chain.invoke(documents)\n",
+ "result[\"output_text\"]"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "22d5f5d2-b7f3-431c-bb25-fa1b4d353663",
+ "metadata": {},
+ "source": [
+ "The [LangSmith trace](https://smith.langchain.com/public/8ec51479-9420-412f-bb21-cb8c9f59dfde/r) is composed of three LLM calls: one for the initial summary, and two more updates of that summary. The process completes when we update the summary with content from the final document."
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "8f5caba4-f363-4bcf-8dd4-1d015e27a18d",
+ "metadata": {},
+ "source": [
+ " \n",
+ "\n",
+ "### LangGraph\n",
+ "\n",
+ "\n",
+ "\n",
+ "Below we show a LangGraph implementation of this process:\n",
+ "\n",
+ "- We use the same two templates as before.\n",
+ "- We generate a simple chain for the initial summary that plucks out the first document, formats it into a prompt and runs inference with our LLM.\n",
+ "- We generate a second `refine_summary_chain` that operates on each successive document, refining the initial summary.\n",
+ "\n",
+ "We will need to install `langgraph`:"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": null,
+ "id": "bda06266-f4fe-43cf-9044-0ce5ee76c793",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "pip install -qU langgraph"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 4,
+ "id": "3477bef6-97cc-492f-87fe-cf5336edd581",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "import operator\n",
+ "from typing import List, Literal, TypedDict\n",
+ "\n",
+ "from langchain_core.output_parsers import StrOutputParser\n",
+ "from langchain_core.prompts import ChatPromptTemplate\n",
+ "from langchain_core.runnables import RunnableConfig\n",
+ "from langchain_openai import ChatOpenAI\n",
+ "from langgraph.constants import Send\n",
+ "from langgraph.graph import END, START, StateGraph\n",
+ "\n",
+ "llm = ChatOpenAI(model=\"gpt-4o-mini\", temperature=0)\n",
+ "\n",
+ "# Initial summary\n",
+ "summarize_prompt = ChatPromptTemplate(\n",
+ " [\n",
+ " (\"human\", \"Write a concise summary of the following: {context}\"),\n",
+ " ]\n",
+ ")\n",
+ "initial_summary_chain = summarize_prompt | llm | StrOutputParser()\n",
+ "\n",
+ "# Refining the summary with new docs\n",
+ "refine_template = \"\"\"\n",
+ "Produce a final summary.\n",
+ "\n",
+ "Existing summary up to this point:\n",
+ "{existing_answer}\n",
+ "\n",
+ "New context:\n",
+ "------------\n",
+ "{context}\n",
+ "------------\n",
+ "\n",
+ "Given the new context, refine the original summary.\n",
+ "\"\"\"\n",
+ "refine_prompt = ChatPromptTemplate([(\"human\", refine_template)])\n",
+ "\n",
+ "refine_summary_chain = refine_prompt | llm | StrOutputParser()\n",
+ "\n",
+ "\n",
+ "# For LangGraph, we will define the state of the graph to hold the document\n",
+ "# contents, the index of the next document to process, and the running summary.\n",
+ "class State(TypedDict):\n",
+ " contents: List[str]\n",
+ " index: int\n",
+ " summary: str\n",
+ "\n",
+ "\n",
+ "# We define functions for each node, including a node that generates\n",
+ "# the initial summary:\n",
+ "async def generate_initial_summary(state: State, config: RunnableConfig):\n",
+ " summary = await initial_summary_chain.ainvoke(\n",
+ " state[\"contents\"][0],\n",
+ " config,\n",
+ " )\n",
+ " return {\"summary\": summary, \"index\": 1}\n",
+ "\n",
+ "\n",
+ "# And a node that refines the summary based on the next document\n",
+ "async def refine_summary(state: State, config: RunnableConfig):\n",
+ " content = state[\"contents\"][state[\"index\"]]\n",
+ " summary = await refine_summary_chain.ainvoke(\n",
+ " {\"existing_answer\": state[\"summary\"], \"context\": content},\n",
+ " config,\n",
+ " )\n",
+ "\n",
+ " return {\"summary\": summary, \"index\": state[\"index\"] + 1}\n",
+ "\n",
+ "\n",
+ "# Here we implement logic to either exit the application or refine\n",
+ "# the summary.\n",
+ "def should_refine(state: State) -> Literal[\"refine_summary\", END]:\n",
+ " if state[\"index\"] >= len(state[\"contents\"]):\n",
+ " return END\n",
+ " else:\n",
+ " return \"refine_summary\"\n",
+ "\n",
+ "\n",
+ "graph = StateGraph(State)\n",
+ "graph.add_node(\"generate_initial_summary\", generate_initial_summary)\n",
+ "graph.add_node(\"refine_summary\", refine_summary)\n",
+ "\n",
+ "graph.add_edge(START, \"generate_initial_summary\")\n",
+ "graph.add_conditional_edges(\"generate_initial_summary\", should_refine)\n",
+ "graph.add_conditional_edges(\"refine_summary\", should_refine)\n",
+ "app = graph.compile()"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 5,
+ "id": "0f1f0f00-5378-4687-987f-5feec0805d7a",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "image/jpeg": "",
+ "text/plain": [
+ ""
+ ]
+ },
+ "execution_count": 5,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "from IPython.display import Image\n",
+ "\n",
+ "Image(app.get_graph().draw_mermaid_png())"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "9487118a-25ea-4ecf-982b-10c72bec3325",
+ "metadata": {},
+ "source": [
+ "We can step through the execution as follows, printing out the summary as it is refined:"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 6,
+ "id": "9572e4bd-5e7d-4884-8283-d516396d7c29",
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "Apples are typically red in color.\n",
+ "Apples are typically red in color, while blueberries are blue.\n",
+ "Apples are typically red in color, blueberries are blue, and bananas are yellow.\n"
+ ]
+ }
+ ],
+ "source": [
+ "async for step in app.astream(\n",
+ " {\"contents\": [doc.page_content for doc in documents]},\n",
+ " stream_mode=\"values\",\n",
+ "):\n",
+ " if summary := step.get(\"summary\"):\n",
+ " print(summary)"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "cb390e43-58db-43af-9118-aed6f08ce351",
+ "metadata": {},
+ "source": [
+ "In the [LangSmith trace](https://smith.langchain.com/public/d6656f49-4fa1-44b9-b6d3-10af921037fa/r) we again recover three LLM calls, performing the same functions as before.\n",
+ "\n",
+ "Note that we can stream tokens from the application, including from intermediate steps:"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 8,
+ "id": "105d71ee-0eb8-40bf-aa82-c94121dba2f2",
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "Ap|ples| are| characterized| by| their| red| color|.|\n",
+ "\n",
+ "\n",
+ "Ap|ples| are| characterized| by| their| red| color|,| while| blueberries| are| known| for| their| blue| hue|.|\n",
+ "\n",
+ "\n",
+ "Ap|ples| are| characterized| by| their| red| color|,| blueberries| are| known| for| their| blue| hue|,| and| bananas| are| recognized| for| their| yellow| color|.|\n",
+ "\n",
+ "\n"
+ ]
+ }
+ ],
+ "source": [
+ "async for event in app.astream_events(\n",
+ " {\"contents\": [doc.page_content for doc in documents]}, version=\"v2\"\n",
+ "):\n",
+ " kind = event[\"event\"]\n",
+ " if kind == \"on_chat_model_stream\":\n",
+ " content = event[\"data\"][\"chunk\"].content\n",
+ " if content:\n",
+ " print(content, end=\"|\")\n",
+ " elif kind == \"on_chat_model_end\":\n",
+ " print(\"\\n\\n\")"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "5ad2a8f1-e453-4f0b-8911-8c8ddf607f64",
+ "metadata": {},
+ "source": [
+ " \n",
+ "\n",
+ "## Next steps\n",
+ "\n",
+ "See [this tutorial](/docs/tutorials/summarization/) for more LLM-based summarization strategies.\n",
+ "\n",
+ "Check out the [LangGraph documentation](https://langchain-ai.github.io/langgraph/) for detail on building with LangGraph."
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": null,
+ "id": "f52a8a4b-4dbe-4a82-9267-e9a7c7fa188d",
+ "metadata": {},
+ "outputs": [],
+ "source": []
+ }
+ ],
+ "metadata": {
+ "kernelspec": {
+ "display_name": "Python 3 (ipykernel)",
+ "language": "python",
+ "name": "python3"
+ },
+ "language_info": {
+ "codemirror_mode": {
+ "name": "ipython",
+ "version": 3
+ },
+ "file_extension": ".py",
+ "mimetype": "text/x-python",
+ "name": "python",
+ "nbconvert_exporter": "python",
+ "pygments_lexer": "ipython3",
+ "version": "3.10.4"
+ }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}
diff --git a/docs/docs/versions/migrating_chains/retrieval_qa.ipynb b/docs/docs/versions/migrating_chains/retrieval_qa.ipynb
index 477e3cf6247..7cab33d02b4 100644
--- a/docs/docs/versions/migrating_chains/retrieval_qa.ipynb
+++ b/docs/docs/versions/migrating_chains/retrieval_qa.ipynb
@@ -82,13 +82,9 @@
"id": "c7e16438",
"metadata": {},
"source": [
- "import { ColumnContainer, Column } from \"@theme/Columns\";\n",
+ "## Legacy\n",
"\n",
- "\n",
- "\n",
- "\n",
- "\n",
- "#### Legacy"
+ ""
]
},
{
@@ -128,12 +124,11 @@
"id": "081948e5",
"metadata": {},
"source": [
- " \n",
+ "\n",
"\n",
- "\n",
+ "## LCEL\n",
"\n",
- "#### LCEL\n",
- "\n"
+ ""
]
},
{
@@ -184,9 +179,6 @@
"id": "d6f44fe8",
"metadata": {},
"source": [
- " \n",
- "\n",
- "\n",
"The LCEL implementation exposes the internals of what's happening around retrieving, formatting documents, and passing them through a prompt to the LLM, but it is more verbose. You can customize and wrap this composition logic in a helper function, or use the higher-level [`create_retrieval_chain`](https://api.python.langchain.com/en/latest/chains/langchain.chains.retrieval.create_retrieval_chain.html) and [`create_stuff_documents_chain`](https://api.python.langchain.com/en/latest/chains/langchain.chains.combine_documents.stuff.create_stuff_documents_chain.html) helper method:"
]
},
@@ -231,6 +223,8 @@
"id": "b2717810",
"metadata": {},
"source": [
+ "\n",
+ "\n",
"## Next steps\n",
"\n",
"Check out the [LCEL conceptual docs](/docs/concepts/#langchain-expression-language-lcel) for more background information."
diff --git a/docs/docs/versions/migrating_chains/stuff_docs_chain.ipynb b/docs/docs/versions/migrating_chains/stuff_docs_chain.ipynb
new file mode 100644
index 00000000000..c7e255b8845
--- /dev/null
+++ b/docs/docs/versions/migrating_chains/stuff_docs_chain.ipynb
@@ -0,0 +1,281 @@
+{
+ "cells": [
+ {
+ "cell_type": "markdown",
+ "id": "ed78c53c-55ad-4ea2-9cc2-a39a1963c098",
+ "metadata": {},
+ "source": [
+ "---\n",
+ "title: Migrating from StuffDocumentsChain\n",
+ "---\n",
+ "\n",
+ "[StuffDocumentsChain](https://api.python.langchain.com/en/latest/chains/langchain.chains.combine_documents.stuff.StuffDocumentsChain.html) combines documents by concatenating them into a single context window. It is a straightforward and effective strategy for combining documents for question-answering, summarization, and other purposes.\n",
+ "\n",
+ "[create_stuff_documents_chain](https://api.python.langchain.com/en/latest/chains/langchain.chains.combine_documents.stuff.create_stuff_documents_chain.html) is the recommended alternative. It functions the same as `StuffDocumentsChain`, with better support for streaming and batch functionality. Because it is a simple combination of [LCEL primitives](/docs/concepts/#langchain-expression-language-lcel), it is also easier to extend and incorporate into other LangChain applications.\n",
+ "\n",
+ "Below we will go through both `StuffDocumentsChain` and `create_stuff_documents_chain` on a simple example for illustrative purposes.\n",
+ "\n",
+ "Let's first load a chat model:\n",
+ "\n",
+ "```{=mdx}\n",
+ "import ChatModelTabs from \"@theme/ChatModelTabs\";\n",
+ "\n",
+ "\n",
+ "```"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 1,
+ "id": "dac0bef2-9453-46f2-a893-f7569b6a0170",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "# | output: false\n",
+ "# | echo: false\n",
+ "\n",
+ "from langchain_openai import ChatOpenAI\n",
+ "\n",
+ "llm = ChatOpenAI(model=\"gpt-3.5-turbo-0125\", temperature=0)"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "d4022d03-7b5e-4c81-98ff-5b82a2a4eaae",
+ "metadata": {},
+ "source": [
+ "## Example\n",
+ "\n",
+ "Let's go through an example where we analyze a set of documents. We first generate some simple documents for illustrative purposes:"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 2,
+ "id": "24fa0ba9-e245-47d1-bc2e-6286dd884117",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "from langchain_core.documents import Document\n",
+ "\n",
+ "documents = [\n",
+ " Document(page_content=\"Apples are red\", metadata={\"title\": \"apple_book\"}),\n",
+ " Document(page_content=\"Blueberries are blue\", metadata={\"title\": \"blueberry_book\"}),\n",
+ " Document(page_content=\"Bananas are yelow\", metadata={\"title\": \"banana_book\"}),\n",
+ "]"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "3a769128-205f-417d-a25d-519e7cb03be7",
+ "metadata": {},
+ "source": [
+ "### Legacy\n",
+ "\n",
+ "\n",
+ "\n",
+ "Below we show an implementation with `StuffDocumentsChain`. We define the prompt template for a summarization task and instantiate an [LLMChain](https://api.python.langchain.com/en/latest/chains/langchain.chains.llm.LLMChain.html) object for this purpose. We define how documents are formatted into the prompt and ensure consistency among the keys in the various prompts."
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 15,
+ "id": "9734c0f3-64e7-4ae6-8578-df03b3dabb26",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "from langchain.chains import LLMChain, StuffDocumentsChain\n",
+ "from langchain_core.prompts import ChatPromptTemplate, PromptTemplate\n",
+ "\n",
+ "# This controls how each document will be formatted. Specifically,\n",
+ "# it will be passed to `format_document` - see that function for more\n",
+ "# details.\n",
+ "document_prompt = PromptTemplate(\n",
+ " input_variables=[\"page_content\"], template=\"{page_content}\"\n",
+ ")\n",
+ "document_variable_name = \"context\"\n",
+ "# The prompt here should take as an input variable the\n",
+ "# `document_variable_name`\n",
+ "prompt = ChatPromptTemplate.from_template(\"Summarize this content: {context}\")\n",
+ "\n",
+ "llm_chain = LLMChain(llm=llm, prompt=prompt)\n",
+ "chain = StuffDocumentsChain(\n",
+ " llm_chain=llm_chain,\n",
+ " document_prompt=document_prompt,\n",
+ " document_variable_name=document_variable_name,\n",
+ ")"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "0cb733bf-eb71-4fae-a8f4-d522924020cb",
+ "metadata": {},
+ "source": [
+ "We can now invoke our chain:"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 19,
+ "id": "d7d1ce10-bbee-4cb0-879d-7de4f69191c4",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "'This content describes the colors of different fruits: apples are red, blueberries are blue, and bananas are yellow.'"
+ ]
+ },
+ "execution_count": 19,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "result = chain.invoke(documents)\n",
+ "result[\"output_text\"]"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 20,
+ "id": "79b10d40-1521-433b-9026-6ec836ffeeb3",
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "{'input_documents': [Document(metadata={'title': 'apple_book'}, page_content='Apples are red'), Document(metadata={'title': 'blueberry_book'}, page_content='Blueberries are blue'), Document(metadata={'title': 'banana_book'}, page_content='Bananas are yelow')], 'output_text': 'This content describes the colors of different fruits: apples are red, blueberries are blue, and bananas are yellow.'}\n"
+ ]
+ }
+ ],
+ "source": [
+ "for chunk in chain.stream(documents):\n",
+ " print(chunk)"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "b4cb6a5b-37ea-48cc-a096-b948d3ff7e9f",
+ "metadata": {},
+ "source": [
+ " \n",
+ "\n",
+ "### LCEL\n",
+ "\n",
+ "\n",
+ "\n",
+ "Below we show an implementation using `create_stuff_documents_chain`:"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 21,
+ "id": "de38f27a-c648-44be-8c37-0a458c2920a9",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "from langchain.chains.combine_documents import create_stuff_documents_chain\n",
+ "from langchain_core.prompts import ChatPromptTemplate\n",
+ "\n",
+ "prompt = ChatPromptTemplate.from_template(\"Summarize this content: {context}\")\n",
+ "chain = create_stuff_documents_chain(llm, prompt)"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "9d0e6996-9bf8-4097-9c1a-1c539eac3ed1",
+ "metadata": {},
+ "source": [
+ "Invoking the chain, we obtain a result similar to the one before:"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 24,
+ "id": "f2d2bdfb-3a6a-464b-b4c2-e4252b2e53a0",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "'This content describes the colors of different fruits: apples are red, blueberries are blue, and bananas are yellow.'"
+ ]
+ },
+ "execution_count": 24,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "result = chain.invoke({\"context\": documents})\n",
+ "result"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "493e6270-c61d-46c5-91b3-0cf7740a88f9",
+ "metadata": {},
+ "source": [
+ "Note that this implementation supports streaming of output tokens:"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 26,
+ "id": "b5adcabd-9bc1-4c91-a12b-7be82d64e457",
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ " | This | content | describes | the | colors | of | different | fruits | : | apples | are | red | , | blue | berries | are | blue | , | and | bananas | are | yellow | . | | "
+ ]
+ }
+ ],
+ "source": [
+ "for chunk in chain.stream({\"context\": documents}):\n",
+ " print(chunk, end=\" | \")"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "181c5633-38ea-4692-a869-32f4f78398e4",
+ "metadata": {},
+ "source": [
+ " \n",
+ "\n",
+ "## Next steps\n",
+ "\n",
+ "Check out the [LCEL conceptual docs](/docs/concepts/#langchain-expression-language-lcel) for more background information.\n",
+ "\n",
+ "See these [how-to guides](/docs/how_to/#qa-with-rag) for more on question-answering tasks with RAG.\n",
+ "\n",
+ "See [this tutorial](/docs/tutorials/summarization/) for more LLM-based summarization strategies."
+ ]
+ }
+ ],
+ "metadata": {
+ "kernelspec": {
+ "display_name": "Python 3 (ipykernel)",
+ "language": "python",
+ "name": "python3"
+ },
+ "language_info": {
+ "codemirror_mode": {
+ "name": "ipython",
+ "version": 3
+ },
+ "file_extension": ".py",
+ "mimetype": "text/x-python",
+ "name": "python",
+ "nbconvert_exporter": "python",
+ "pygments_lexer": "ipython3",
+ "version": "3.10.4"
+ }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}
diff --git a/docs/sidebars.js b/docs/sidebars.js
index a9a9d11cd3b..670768d07cd 100644
--- a/docs/sidebars.js
+++ b/docs/sidebars.js
@@ -93,7 +93,7 @@ module.exports = {
},
{
type: "category",
- label: "Migrating to LCEL",
+ label: "Migrating from v0.0 chains",
link: {type: 'doc', id: 'versions/migrating_chains/index'},
collapsible: false,
collapsed: false,
diff --git a/libs/langchain/langchain/agents/agent_toolkits/vectorstore/base.py b/libs/langchain/langchain/agents/agent_toolkits/vectorstore/base.py
index 79c2a477b59..a9b7fdc4528 100644
--- a/libs/langchain/langchain/agents/agent_toolkits/vectorstore/base.py
+++ b/libs/langchain/langchain/agents/agent_toolkits/vectorstore/base.py
@@ -2,6 +2,7 @@
from typing import Any, Dict, Optional
+from langchain_core._api import deprecated
from langchain_core.callbacks.base import BaseCallbackManager
from langchain_core.language_models import BaseLanguageModel
@@ -15,6 +16,16 @@ from langchain.agents.mrkl.base import ZeroShotAgent
from langchain.chains.llm import LLMChain
+@deprecated(
+ since="0.2.13",
+ removal="1.0",
+ message=(
+ "See API reference for this function for a replacement implementation: "
+ "https://api.python.langchain.com/en/latest/agents/langchain.agents.agent_toolkits.vectorstore.base.create_vectorstore_agent.html " # noqa: E501
+ "Read more here on how to create agents that query vector stores: "
+ "https://python.langchain.com/v0.2/docs/how_to/qa_chat_history_how_to/#agents"
+ ),
+)
def create_vectorstore_agent(
llm: BaseLanguageModel,
toolkit: VectorStoreToolkit,
@@ -26,6 +37,44 @@ def create_vectorstore_agent(
) -> AgentExecutor:
"""Construct a VectorStore agent from an LLM and tools.
+ Note: this function is deprecated. See below for a replacement that uses tool
+ calling methods and LangGraph. Install LangGraph with:
+
+ .. code-block:: bash
+
+ pip install -U langgraph
+
+ .. code-block:: python
+
+ from langchain_core.tools import create_retriever_tool
+ from langchain_core.vectorstores import InMemoryVectorStore
+ from langchain_openai import ChatOpenAI, OpenAIEmbeddings
+ from langgraph.prebuilt import create_react_agent
+
+ llm = ChatOpenAI(model="gpt-4o-mini", temperature=0)
+
+ vector_store = InMemoryVectorStore.from_texts(
+ [
+ "Dogs are great companions, known for their loyalty and friendliness.",
+ "Cats are independent pets that often enjoy their own space.",
+ ],
+ OpenAIEmbeddings(),
+ )
+
+ tool = create_retriever_tool(
+ vector_store.as_retriever(),
+ "pet_information_retriever",
+ "Fetches information about pets.",
+ )
+
+ agent = create_react_agent(llm, [tool])
+
+ for step in agent.stream(
+ {"messages": [("human", "What are dogs known for?")]},
+ stream_mode="values",
+ ):
+ step["messages"][-1].pretty_print()
+
Args:
llm (BaseLanguageModel): LLM that will be used by the agent
toolkit (VectorStoreToolkit): Set of tools for the agent
@@ -56,6 +105,16 @@ def create_vectorstore_agent(
)
+@deprecated(
+ since="0.2.13",
+ removal="1.0",
+ message=(
+ "See API reference for this function for a replacement implementation: "
+ "https://api.python.langchain.com/en/latest/agents/langchain.agents.agent_toolkits.vectorstore.base.create_vectorstore_router_agent.html " # noqa: E501
+ "Read more here on how to create agents that query vector stores: "
+ "https://python.langchain.com/v0.2/docs/how_to/qa_chat_history_how_to/#agents"
+ ),
+)
def create_vectorstore_router_agent(
llm: BaseLanguageModel,
toolkit: VectorStoreRouterToolkit,
@@ -67,6 +126,59 @@ def create_vectorstore_router_agent(
) -> AgentExecutor:
"""Construct a VectorStore router agent from an LLM and tools.
+ Note: this function is deprecated. See below for a replacement that uses tool
+ calling methods and LangGraph. Install LangGraph with:
+
+ .. code-block:: bash
+
+ pip install -U langgraph
+
+ .. code-block:: python
+
+ from langchain_core.tools import create_retriever_tool
+ from langchain_core.vectorstores import InMemoryVectorStore
+ from langchain_openai import ChatOpenAI, OpenAIEmbeddings
+ from langgraph.prebuilt import create_react_agent
+
+ llm = ChatOpenAI(model="gpt-4o-mini", temperature=0)
+
+ pet_vector_store = InMemoryVectorStore.from_texts(
+ [
+ "Dogs are great companions, known for their loyalty and friendliness.",
+ "Cats are independent pets that often enjoy their own space.",
+ ],
+ OpenAIEmbeddings(),
+ )
+
+ food_vector_store = InMemoryVectorStore.from_texts(
+ [
+ "Carrots are orange and delicious.",
+ "Apples are red and delicious.",
+ ],
+ OpenAIEmbeddings(),
+ )
+
+ tools = [
+ create_retriever_tool(
+ pet_vector_store.as_retriever(),
+ "pet_information_retriever",
+ "Fetches information about pets.",
+ ),
+ create_retriever_tool(
+ food_vector_store.as_retriever(),
+ "food_information_retriever",
+ "Fetches information about food.",
+ )
+ ]
+
+ agent = create_react_agent(llm, tools)
+
+ for step in agent.stream(
+ {"messages": [("human", "Tell me about carrots.")]},
+ stream_mode="values",
+ ):
+ step["messages"][-1].pretty_print()
+
Args:
llm (BaseLanguageModel): LLM that will be used by the agent
toolkit (VectorStoreRouterToolkit): Set of tools for the agent which have routing capability with multiple vector stores
diff --git a/libs/langchain/langchain/chains/__init__.py b/libs/langchain/langchain/chains/__init__.py
index f1c8061d594..39b9156bc65 100644
--- a/libs/langchain/langchain/chains/__init__.py
+++ b/libs/langchain/langchain/chains/__init__.py
@@ -59,6 +59,7 @@ _module_lookup = {
"OpenAIModerationChain": "langchain.chains.moderation",
"NatBotChain": "langchain.chains.natbot.base",
"create_citation_fuzzy_match_chain": "langchain.chains.openai_functions",
+ "create_citation_fuzzy_match_runnable": "langchain.chains.openai_functions",
"create_extraction_chain": "langchain.chains.openai_functions",
"create_extraction_chain_pydantic": "langchain.chains.openai_functions",
"create_qa_with_sources_chain": "langchain.chains.openai_functions",
diff --git a/libs/langchain/langchain/chains/api/base.py b/libs/langchain/langchain/chains/api/base.py
index 697d68f1ada..94896102dc6 100644
--- a/libs/langchain/langchain/chains/api/base.py
+++ b/libs/langchain/langchain/chains/api/base.py
@@ -5,6 +5,7 @@ from __future__ import annotations
from typing import Any, Dict, List, Optional, Sequence, Tuple
from urllib.parse import urlparse
+from langchain_core._api import deprecated
from langchain_core.callbacks import (
AsyncCallbackManagerForChainRun,
CallbackManagerForChainRun,
@@ -53,6 +54,15 @@ def _check_in_allowed_domain(url: str, limit_to_domains: Sequence[str]) -> bool:
try:
from langchain_community.utilities.requests import TextRequestsWrapper
+ @deprecated(
+ since="0.2.13",
+ message=(
+ "This class is deprecated and will be removed in langchain 1.0. "
+ "See API reference for replacement: "
+ "https://api.python.langchain.com/en/latest/chains/langchain.chains.api.base.APIChain.html" # noqa: E501
+ ),
+ removal="1.0",
+ )
class APIChain(Chain):
"""Chain that makes API calls and summarizes the responses to answer a question.
@@ -69,7 +79,117 @@ try:
what network access it has.
See https://python.langchain.com/docs/security for more information.
- """
+
+ Note: this class is deprecated. See below for a replacement implementation
+ using LangGraph. The benefits of this implementation are:
+
+ - Uses LLM tool calling features to encourage properly-formatted API requests;
+ - Support for both token-by-token and step-by-step streaming;
+ - Support for checkpointing and memory of chat history;
+ - Easier to modify or extend (e.g., with additional tools, structured responses, etc.)
+
+ Install LangGraph with:
+
+ .. code-block:: bash
+
+ pip install -U langgraph
+
+ .. code-block:: python
+
+ from typing import Annotated, Sequence
+ from typing_extensions import TypedDict
+
+ from langchain.chains.api.prompt import API_URL_PROMPT
+ from langchain_community.agent_toolkits.openapi.toolkit import RequestsToolkit
+ from langchain_community.utilities.requests import TextRequestsWrapper
+ from langchain_core.messages import BaseMessage
+ from langchain_core.prompts import ChatPromptTemplate
+ from langchain_openai import ChatOpenAI
+ from langchain_core.runnables import RunnableConfig
+ from langgraph.graph import END, StateGraph
+ from langgraph.graph.message import add_messages
+ from langgraph.prebuilt.tool_node import ToolNode
+
+ # NOTE: There are inherent risks in giving models discretion
+ # to execute real-world actions. We must "opt-in" to these
+ # risks by setting allow_dangerous_request=True to use these tools.
+ # This can be dangerous for calling unwanted requests. Please make
+ # sure your custom OpenAPI spec (yaml) is safe and that permissions
+ # associated with the tools are narrowly-scoped.
+ ALLOW_DANGEROUS_REQUESTS = True
+
+ # Subset of spec for https://jsonplaceholder.typicode.com
+ api_spec = \"\"\"
+ openapi: 3.0.0
+ info:
+ title: JSONPlaceholder API
+ version: 1.0.0
+ servers:
+ - url: https://jsonplaceholder.typicode.com
+ paths:
+ /posts:
+ get:
+ summary: Get posts
+ parameters: &id001
+ - name: _limit
+ in: query
+ required: false
+ schema:
+ type: integer
+ example: 2
+ description: Limit the number of results
+ \"\"\"
+
+ llm = ChatOpenAI(model="gpt-4o-mini", temperature=0)
+ toolkit = RequestsToolkit(
+ requests_wrapper=TextRequestsWrapper(headers={}), # no auth required
+ allow_dangerous_requests=ALLOW_DANGEROUS_REQUESTS,
+ )
+ tools = toolkit.get_tools()
+
+ api_request_chain = (
+ API_URL_PROMPT.partial(api_docs=api_spec)
+ | llm.bind_tools(tools, tool_choice="any")
+ )
+
+ class ChainState(TypedDict):
+ \"\"\"LangGraph state.\"\"\"
+
+ messages: Annotated[Sequence[BaseMessage], add_messages]
+
+
+ async def acall_request_chain(state: ChainState, config: RunnableConfig):
+ last_message = state["messages"][-1]
+ response = await api_request_chain.ainvoke(
+ {"question": last_message.content}, config
+ )
+ return {"messages": [response]}
+
+ async def acall_model(state: ChainState, config: RunnableConfig):
+ response = await llm.ainvoke(state["messages"], config)
+ return {"messages": [response]}
+
+ graph_builder = StateGraph(ChainState)
+ graph_builder.add_node("call_tool", acall_request_chain)
+ graph_builder.add_node("execute_tool", ToolNode(tools))
+ graph_builder.add_node("call_model", acall_model)
+ graph_builder.set_entry_point("call_tool")
+ graph_builder.add_edge("call_tool", "execute_tool")
+ graph_builder.add_edge("execute_tool", "call_model")
+ graph_builder.add_edge("call_model", END)
+ chain = graph_builder.compile()
+
+ .. code-block:: python
+
+ example_query = "Fetch the top two posts. What are their titles?"
+
+ events = chain.astream(
+ {"messages": [("user", example_query)]},
+ stream_mode="values",
+ )
+ async for event in events:
+ event["messages"][-1].pretty_print()
+ """ # noqa: E501
api_request_chain: LLMChain
api_answer_chain: LLMChain
diff --git a/libs/langchain/langchain/chains/combine_documents/map_rerank.py b/libs/langchain/langchain/chains/combine_documents/map_rerank.py
index e05592caf11..0fa346dee8b 100644
--- a/libs/langchain/langchain/chains/combine_documents/map_rerank.py
+++ b/libs/langchain/langchain/chains/combine_documents/map_rerank.py
@@ -25,7 +25,7 @@ class MapRerankDocumentsChain(BaseCombineDocumentsChain):
Example:
.. code-block:: python
- from langchain.chains import StuffDocumentsChain, LLMChain
+ from langchain.chains import MapRerankDocumentsChain, LLMChain
from langchain_core.prompts import PromptTemplate
from langchain_community.llms import OpenAI
from langchain.output_parsers.regex import RegexParser
@@ -39,7 +39,7 @@ class MapRerankDocumentsChain(BaseCombineDocumentsChain):
prompt_template = (
"Use the following context to tell me the chemical formula "
"for water. Output both your answer and a score of how confident "
- "you are. Context: {content}"
+ "you are. Context: {context}"
)
output_parser = RegexParser(
regex=r"(.*?)\nScore: (.*)",
diff --git a/libs/langchain/langchain/chains/combine_documents/stuff.py b/libs/langchain/langchain/chains/combine_documents/stuff.py
index 544adc50b7a..5ffd86c9718 100644
--- a/libs/langchain/langchain/chains/combine_documents/stuff.py
+++ b/libs/langchain/langchain/chains/combine_documents/stuff.py
@@ -2,6 +2,7 @@
from typing import Any, Dict, List, Optional, Tuple
+from langchain_core._api import deprecated
from langchain_core.callbacks import Callbacks
from langchain_core.documents import Document
from langchain_core.language_models import LanguageModelLike
@@ -95,6 +96,15 @@ def create_stuff_documents_chain(
).with_config(run_name="stuff_documents_chain")
+@deprecated(
+ since="0.2.13",
+ removal="1.0",
+ message=(
+ "This class is deprecated. Use the `create_stuff_documents_chain` constructor "
+ "instead. See migration guide here: "
+ "https://python.langchain.com/v0.2/docs/versions/migrating_chains/stuff_docs_chain/" # noqa: E501
+ ),
+)
class StuffDocumentsChain(BaseCombineDocumentsChain):
"""Chain that combines documents by stuffing into context.
diff --git a/libs/langchain/langchain/chains/elasticsearch_database/base.py b/libs/langchain/langchain/chains/elasticsearch_database/base.py
index 2e4b97c8dee..89875f2d8a4 100644
--- a/libs/langchain/langchain/chains/elasticsearch_database/base.py
+++ b/libs/langchain/langchain/chains/elasticsearch_database/base.py
@@ -6,14 +6,14 @@ from typing import TYPE_CHECKING, Any, Dict, List, Optional
from langchain_core.callbacks import CallbackManagerForChainRun
from langchain_core.language_models import BaseLanguageModel
-from langchain_core.output_parsers import BaseLLMOutputParser
+from langchain_core.output_parsers import BaseOutputParser, StrOutputParser
from langchain_core.output_parsers.json import SimpleJsonOutputParser
from langchain_core.prompts import BasePromptTemplate
from langchain_core.pydantic_v1 import root_validator
+from langchain_core.runnables import Runnable
from langchain.chains.base import Chain
from langchain.chains.elasticsearch_database.prompts import ANSWER_PROMPT, DSL_PROMPT
-from langchain.chains.llm import LLMChain
if TYPE_CHECKING:
from elasticsearch import Elasticsearch
@@ -35,9 +35,9 @@ class ElasticsearchDatabaseChain(Chain):
db_chain = ElasticsearchDatabaseChain.from_llm(OpenAI(), database)
"""
- query_chain: LLMChain
+ query_chain: Runnable
"""Chain for creating the ES query."""
- answer_chain: LLMChain
+ answer_chain: Runnable
"""Chain for answering the user question."""
database: Any
"""Elasticsearch database to connect to of type elasticsearch.Elasticsearch."""
@@ -135,9 +135,9 @@ class ElasticsearchDatabaseChain(Chain):
intermediate_steps: List = []
try:
intermediate_steps.append(query_inputs) # input: es generation
- es_cmd = self.query_chain.run(
- callbacks=_run_manager.get_child(),
- **query_inputs,
+ es_cmd = self.query_chain.invoke(
+ query_inputs,
+ config={"callbacks": _run_manager.get_child()},
)
_run_manager.on_text(es_cmd, color="green", verbose=self.verbose)
@@ -154,9 +154,9 @@ class ElasticsearchDatabaseChain(Chain):
_run_manager.on_text("\nAnswer:", verbose=self.verbose)
answer_inputs: dict = {"data": result, "input": input_text}
intermediate_steps.append(answer_inputs) # input: final answer
- final_result = self.answer_chain.run(
- callbacks=_run_manager.get_child(),
- **answer_inputs,
+ final_result = self.answer_chain.invoke(
+ answer_inputs,
+ config={"callbacks": _run_manager.get_child()},
)
intermediate_steps.append(final_result) # output: final answer
@@ -183,7 +183,7 @@ class ElasticsearchDatabaseChain(Chain):
*,
query_prompt: Optional[BasePromptTemplate] = None,
answer_prompt: Optional[BasePromptTemplate] = None,
- query_output_parser: Optional[BaseLLMOutputParser] = None,
+ query_output_parser: Optional[BaseOutputParser] = None,
**kwargs: Any,
) -> ElasticsearchDatabaseChain:
"""Convenience method to construct ElasticsearchDatabaseChain from an LLM.
@@ -199,11 +199,9 @@ class ElasticsearchDatabaseChain(Chain):
"""
query_prompt = query_prompt or DSL_PROMPT
query_output_parser = query_output_parser or SimpleJsonOutputParser()
- query_chain = LLMChain(
- llm=llm, prompt=query_prompt, output_parser=query_output_parser
- )
+ query_chain = query_prompt | llm | query_output_parser
answer_prompt = answer_prompt or ANSWER_PROMPT
- answer_chain = LLMChain(llm=llm, prompt=answer_prompt)
+ answer_chain = answer_prompt | llm | StrOutputParser()
return cls(
query_chain=query_chain,
answer_chain=answer_chain,
diff --git a/libs/langchain/langchain/chains/example_generator.py b/libs/langchain/langchain/chains/example_generator.py
index 8aae0565bfa..9cd4e6f01ee 100644
--- a/libs/langchain/langchain/chains/example_generator.py
+++ b/libs/langchain/langchain/chains/example_generator.py
@@ -1,11 +1,10 @@
from typing import List
from langchain_core.language_models import BaseLanguageModel
+from langchain_core.output_parsers import StrOutputParser
from langchain_core.prompts.few_shot import FewShotPromptTemplate
from langchain_core.prompts.prompt import PromptTemplate
-from langchain.chains.llm import LLMChain
-
TEST_GEN_TEMPLATE_SUFFIX = "Add another example."
@@ -19,5 +18,5 @@ def generate_example(
input_variables=[],
example_prompt=prompt_template,
)
- chain = LLMChain(llm=llm, prompt=prompt)
- return chain.predict()
+ chain = prompt | llm | StrOutputParser()
+ return chain.invoke({})
diff --git a/libs/langchain/langchain/chains/llm_checker/base.py b/libs/langchain/langchain/chains/llm_checker/base.py
index 2e2fa61d725..ea2bc546a57 100644
--- a/libs/langchain/langchain/chains/llm_checker/base.py
+++ b/libs/langchain/langchain/chains/llm_checker/base.py
@@ -5,6 +5,7 @@ from __future__ import annotations
import warnings
from typing import Any, Dict, List, Optional
+from langchain_core._api import deprecated
from langchain_core.callbacks import CallbackManagerForChainRun
from langchain_core.language_models import BaseLanguageModel
from langchain_core.prompts import PromptTemplate
@@ -63,6 +64,15 @@ def _load_question_to_checked_assertions_chain(
return question_to_checked_assertions_chain
+@deprecated(
+ since="0.2.13",
+ message=(
+ "See LangGraph guides for a variety of self-reflection and corrective "
+ "strategies for question-answering and other tasks: "
+ "https://langchain-ai.github.io/langgraph/tutorials/rag/langgraph_self_rag/"
+ ),
+ removal="1.0",
+)
class LLMCheckerChain(Chain):
"""Chain for question-answering with self-verification.
diff --git a/libs/langchain/langchain/chains/llm_summarization_checker/base.py b/libs/langchain/langchain/chains/llm_summarization_checker/base.py
index da310232cf7..f177f401529 100644
--- a/libs/langchain/langchain/chains/llm_summarization_checker/base.py
+++ b/libs/langchain/langchain/chains/llm_summarization_checker/base.py
@@ -6,6 +6,7 @@ import warnings
from pathlib import Path
from typing import Any, Dict, List, Optional
+from langchain_core._api import deprecated
from langchain_core.callbacks import CallbackManagerForChainRun
from langchain_core.language_models import BaseLanguageModel
from langchain_core.prompts.prompt import PromptTemplate
@@ -65,6 +66,15 @@ def _load_sequential_chain(
return chain
+@deprecated(
+ since="0.2.13",
+ message=(
+ "See LangGraph guides for a variety of self-reflection and corrective "
+ "strategies for question-answering and other tasks: "
+ "https://langchain-ai.github.io/langgraph/tutorials/rag/langgraph_self_rag/"
+ ),
+ removal="1.0",
+)
class LLMSummarizationCheckerChain(Chain):
"""Chain for question-answering with self-verification.
diff --git a/libs/langchain/langchain/chains/loading.py b/libs/langchain/langchain/chains/loading.py
index da6bd0cc228..2371edf24ab 100644
--- a/libs/langchain/langchain/chains/loading.py
+++ b/libs/langchain/langchain/chains/loading.py
@@ -7,6 +7,7 @@ from pathlib import Path
from typing import TYPE_CHECKING, Any, Union
import yaml
+from langchain_core._api import deprecated
from langchain_core.prompts.loading import (
_load_output_parser,
load_prompt,
@@ -649,6 +650,14 @@ type_to_loader_dict = {
}
+@deprecated(
+ since="0.2.13",
+ message=(
+ "This function is deprecated and will be removed in langchain 1.0. "
+ "At that point chains must be imported from their respective modules."
+ ),
+ removal="1.0",
+)
def load_chain_from_config(config: dict, **kwargs: Any) -> Chain:
"""Load chain from Config Dict."""
if "_type" not in config:
@@ -662,6 +671,14 @@ def load_chain_from_config(config: dict, **kwargs: Any) -> Chain:
return chain_loader(config, **kwargs)
+@deprecated(
+ since="0.2.13",
+ message=(
+ "This function is deprecated and will be removed in langchain 1.0. "
+ "At that point chains must be imported from their respective modules."
+ ),
+ removal="1.0",
+)
def load_chain(path: Union[str, Path], **kwargs: Any) -> Chain:
"""Unified method for loading a chain from LangChainHub or local fs."""
if isinstance(path, str) and path.startswith("lc://"):
diff --git a/libs/langchain/langchain/chains/mapreduce.py b/libs/langchain/langchain/chains/mapreduce.py
index 359133f0de2..1eaccf67a85 100644
--- a/libs/langchain/langchain/chains/mapreduce.py
+++ b/libs/langchain/langchain/chains/mapreduce.py
@@ -8,6 +8,7 @@ from __future__ import annotations
from typing import Any, Dict, List, Mapping, Optional
+from langchain_core._api import deprecated
from langchain_core.callbacks import CallbackManagerForChainRun, Callbacks
from langchain_core.documents import Document
from langchain_core.language_models import BaseLanguageModel
@@ -22,6 +23,16 @@ from langchain.chains.combine_documents.stuff import StuffDocumentsChain
from langchain.chains.llm import LLMChain
+@deprecated(
+ since="0.2.13",
+ removal="1.0",
+ message=(
+ "Refer here for a recommended map-reduce implementation using langgraph: "
+ "https://langchain-ai.github.io/langgraph/how-tos/map-reduce/. See also "
+ "migration guide: "
+ "https://python.langchain.com/v0.2/docs/versions/migrating_chains/map_reduce_chain/" # noqa: E501
+ ),
+)
class MapReduceChain(Chain):
"""Map-reduce chain."""
diff --git a/libs/langchain/langchain/chains/openai_functions/__init__.py b/libs/langchain/langchain/chains/openai_functions/__init__.py
index 0bed9159a75..6312b619890 100644
--- a/libs/langchain/langchain/chains/openai_functions/__init__.py
+++ b/libs/langchain/langchain/chains/openai_functions/__init__.py
@@ -6,6 +6,7 @@ from langchain.chains.openai_functions.base import (
)
from langchain.chains.openai_functions.citation_fuzzy_match import (
create_citation_fuzzy_match_chain,
+ create_citation_fuzzy_match_runnable,
)
from langchain.chains.openai_functions.extraction import (
create_extraction_chain,
@@ -32,6 +33,7 @@ __all__ = [
"create_extraction_chain_pydantic",
"create_extraction_chain",
"create_citation_fuzzy_match_chain",
+ "create_citation_fuzzy_match_runnable",
"create_qa_with_structure_chain",
"create_qa_with_sources_chain",
"create_structured_output_chain",
diff --git a/libs/langchain/langchain/chains/openai_functions/citation_fuzzy_match.py b/libs/langchain/langchain/chains/openai_functions/citation_fuzzy_match.py
index 05bb27d7a9a..038489d13a6 100644
--- a/libs/langchain/langchain/chains/openai_functions/citation_fuzzy_match.py
+++ b/libs/langchain/langchain/chains/openai_functions/citation_fuzzy_match.py
@@ -1,10 +1,12 @@
from typing import Iterator, List
-from langchain_core.language_models import BaseLanguageModel
+from langchain_core._api import deprecated
+from langchain_core.language_models import BaseChatModel, BaseLanguageModel
from langchain_core.messages import HumanMessage, SystemMessage
from langchain_core.output_parsers.openai_functions import PydanticOutputFunctionsParser
from langchain_core.prompts.chat import ChatPromptTemplate, HumanMessagePromptTemplate
from langchain_core.pydantic_v1 import BaseModel, Field
+from langchain_core.runnables import Runnable
from langchain.chains.llm import LLMChain
from langchain.chains.openai_functions.utils import get_llm_kwargs
@@ -61,6 +63,57 @@ class QuestionAnswer(BaseModel):
)
+def create_citation_fuzzy_match_runnable(llm: BaseChatModel) -> Runnable:
+ """Create a citation fuzzy match Runnable.
+
+ Example usage:
+
+ .. code-block:: python
+
+ from langchain.chains import create_citation_fuzzy_match_runnable
+ from langchain_openai import ChatOpenAI
+
+ llm = ChatOpenAI(model="gpt-4o-mini")
+
+ context = "Alice has blue eyes. Bob has brown eyes. Charlie has green eyes."
+ question = "What color are Bob's eyes?"
+
+ chain = create_citation_fuzzy_match_runnable(llm)
+ chain.invoke({"question": question, "context": context})
+
+ Args:
+ llm: Language model to use for the chain. Must implement bind_tools.
+
+ Returns:
+ Runnable that can be used to answer questions with citations.
+ """
+ if llm.bind_tools is BaseChatModel.bind_tools:
+ raise ValueError(
+ "Language model must implement bind_tools to use this function."
+ )
+ prompt = ChatPromptTemplate(
+ [
+ SystemMessage(
+ "You are a world class algorithm to answer "
+ "questions with correct and exact citations."
+ ),
+ HumanMessagePromptTemplate.from_template(
+ "Answer question using the following context."
+ "\n\n{context}"
+ "\n\nQuestion: {question}"
+ "\n\nTips: Make sure to cite your sources, "
+ "and use the exact words from the context."
+ ),
+ ]
+ )
+ return prompt | llm.with_structured_output(QuestionAnswer)
+
+
+@deprecated(
+ since="0.2.13",
+ removal="1.0",
+ alternative="create_citation_fuzzy_match_runnable",
+)
def create_citation_fuzzy_match_chain(llm: BaseLanguageModel) -> LLMChain:
"""Create a citation fuzzy match chain.
diff --git a/libs/langchain/langchain/chains/openai_functions/openapi.py b/libs/langchain/langchain/chains/openai_functions/openapi.py
index 79c78fdc2ef..de4ba38dcd7 100644
--- a/libs/langchain/langchain/chains/openai_functions/openapi.py
+++ b/libs/langchain/langchain/chains/openai_functions/openapi.py
@@ -6,6 +6,7 @@ from collections import defaultdict
from typing import TYPE_CHECKING, Any, Callable, Dict, List, Optional, Tuple, Union
import requests
+from langchain_core._api import deprecated
from langchain_core.callbacks import CallbackManagerForChainRun
from langchain_core.language_models import BaseLanguageModel
from langchain_core.output_parsers.openai_functions import JsonOutputFunctionsParser
@@ -242,6 +243,15 @@ class SimpleRequestChain(Chain):
return {self.output_key: response}
+@deprecated(
+ since="0.2.13",
+ message=(
+ "This function is deprecated and will be removed in langchain 1.0. "
+ "See API reference for replacement: "
+ "https://api.python.langchain.com/en/latest/chains/langchain.chains.openai_functions.openapi.get_openapi_chain.html" # noqa: E501
+ ),
+ removal="1.0",
+)
def get_openapi_chain(
spec: Union[OpenAPISpec, str],
llm: Optional[BaseLanguageModel] = None,
@@ -255,13 +265,90 @@ def get_openapi_chain(
) -> SequentialChain:
"""Create a chain for querying an API from a OpenAPI spec.
+ Note: this function is deprecated. See below for a replacement implementation.
+ The benefits of this implementation are:
+
+ - Uses LLM tool calling features to encourage properly-formatted API requests;
+ - Includes async support.
+
+ .. code-block:: python
+
+ from typing import Any
+
+ from langchain.chains.openai_functions.openapi import openapi_spec_to_openai_fn
+ from langchain_community.utilities.openapi import OpenAPISpec
+ from langchain_core.prompts import ChatPromptTemplate
+ from langchain_openai import ChatOpenAI
+
+ # Define API spec. Can be JSON or YAML
+ api_spec = \"\"\"
+ {
+ "openapi": "3.1.0",
+ "info": {
+ "title": "JSONPlaceholder API",
+ "version": "1.0.0"
+ },
+ "servers": [
+ {
+ "url": "https://jsonplaceholder.typicode.com"
+ }
+ ],
+ "paths": {
+ "/posts": {
+ "get": {
+ "summary": "Get posts",
+ "parameters": [
+ {
+ "name": "_limit",
+ "in": "query",
+ "required": false,
+ "schema": {
+ "type": "integer",
+ "example": 2
+ },
+ "description": "Limit the number of results"
+ }
+ ]
+ }
+ }
+ }
+ }
+ \"\"\"
+
+ parsed_spec = OpenAPISpec.from_text(api_spec)
+ openai_fns, call_api_fn = openapi_spec_to_openai_fn(parsed_spec)
+ tools = [
+ {"type": "function", "function": fn}
+ for fn in openai_fns
+ ]
+
+ prompt = ChatPromptTemplate.from_template(
+ "Use the provided APIs to respond to this user query:\\n\\n{query}"
+ )
+ llm = ChatOpenAI(model="gpt-4o-mini", temperature=0).bind_tools(tools)
+
+ def _execute_tool(message) -> Any:
+ if tool_calls := message.tool_calls:
+ tool_call = message.tool_calls[0]
+ response = call_api_fn(name=tool_call["name"], fn_args=tool_call["args"])
+ response.raise_for_status()
+ return response.json()
+ else:
+ return message.content
+
+ chain = prompt | llm | _execute_tool
+
+ .. code-block:: python
+
+ response = chain.invoke({"query": "Get me top two posts."})
+
Args:
spec: OpenAPISpec or url/file/text string corresponding to one.
llm: language model, should be an OpenAI function-calling model, e.g.
`ChatOpenAI(model="gpt-3.5-turbo-0613")`.
prompt: Main prompt template to use.
request_chain: Chain for taking the functions output and executing the request.
- """
+ """ # noqa: E501
try:
from langchain_community.utilities.openapi import OpenAPISpec
except ImportError as e:
diff --git a/libs/langchain/langchain/chains/openai_functions/qa_with_structure.py b/libs/langchain/langchain/chains/openai_functions/qa_with_structure.py
index 9ef856d8b96..f13e2f9e522 100644
--- a/libs/langchain/langchain/chains/openai_functions/qa_with_structure.py
+++ b/libs/langchain/langchain/chains/openai_functions/qa_with_structure.py
@@ -1,5 +1,6 @@
from typing import Any, List, Optional, Type, Union, cast
+from langchain_core._api import deprecated
from langchain_core.language_models import BaseLanguageModel
from langchain_core.messages import HumanMessage, SystemMessage
from langchain_core.output_parsers import BaseLLMOutputParser
@@ -25,6 +26,15 @@ class AnswerWithSources(BaseModel):
)
+@deprecated(
+ since="0.2.13",
+ removal="1.0",
+ message=(
+ "This function is deprecated. Refer to this guide on retrieval and question "
+ "answering with structured responses: "
+ "https://python.langchain.com/v0.2/docs/how_to/qa_sources/#structure-sources-in-model-response" # noqa: E501
+ ),
+)
def create_qa_with_structure_chain(
llm: BaseLanguageModel,
schema: Union[dict, Type[BaseModel]],
@@ -95,6 +105,15 @@ def create_qa_with_structure_chain(
return chain
+@deprecated(
+ since="0.2.13",
+ removal="1.0",
+ message=(
+ "This function is deprecated. Refer to this guide on retrieval and question "
+ "answering with sources: "
+ "https://python.langchain.com/v0.2/docs/how_to/qa_sources/#structure-sources-in-model-response" # noqa: E501
+ ),
+)
def create_qa_with_sources_chain(
llm: BaseLanguageModel, verbose: bool = False, **kwargs: Any
) -> LLMChain:
diff --git a/libs/langchain/langchain/chains/openai_functions/tagging.py b/libs/langchain/langchain/chains/openai_functions/tagging.py
index e96a138dfd1..aab5421156a 100644
--- a/libs/langchain/langchain/chains/openai_functions/tagging.py
+++ b/libs/langchain/langchain/chains/openai_functions/tagging.py
@@ -1,5 +1,6 @@
from typing import Any, Optional
+from langchain_core._api import deprecated
from langchain_core.language_models import BaseLanguageModel
from langchain_core.output_parsers.openai_functions import (
JsonOutputFunctionsParser,
@@ -29,6 +30,21 @@ Passage:
"""
+@deprecated(
+ since="0.2.13",
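+ message=(
+ "LangChain has introduced a method called `with_structured_output` that "
+ "is available on ChatModels capable of tool calling. "
+ "See API reference for this function for replacement: "
+ "<https://api.python.langchain.com/en/latest/chains/langchain.chains.openai_functions.tagging.create_tagging_chain.html> " # noqa: E501
+ "You can read more about `with_structured_output` here: "
+ "<https://python.langchain.com/v0.2/docs/how_to/structured_output/>. "
+ "If you notice other issues, please provide "
+ "feedback here: "
+ "<https://github.com/langchain-ai/langchain/discussions/18154>"
+ ),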
+ removal="1.0",
+)
def create_tagging_chain(
schema: dict,
llm: BaseLanguageModel,
@@ -38,6 +54,32 @@ def create_tagging_chain(
"""Create a chain that extracts information from a passage
based on a schema.
+ This function is deprecated. Please use `with_structured_output` instead.
+ See example usage below:
+
+ .. code-block:: python
+
+ from typing_extensions import Annotated, TypedDict
+ from langchain_anthropic import ChatAnthropic
+
+ class Joke(TypedDict):
+ \"\"\"Tagged joke.\"\"\"
+
+ setup: Annotated[str, ..., "The setup of the joke"]
+ punchline: Annotated[str, ..., "The punchline of the joke"]
+
+ # Or any other chat model that supports tools.
+ # Please refer to the documentation of structured_output
+ # to see an up to date list of which models support
+ # with_structured_output.
+ model = ChatAnthropic(model="claude-3-haiku-20240307", temperature=0)
+ structured_llm = model.with_structured_output(Joke)
+ structured_llm.invoke(
+ "Why did the cat cross the road? To get to the other "
+ "side... and then lay down in the middle of it!"
+ )
+ Read more here: https://python.langchain.com/v0.2/docs/how_to/structured_output/
+
Args:
schema: The schema of the entities to extract.
llm: The language model to use.
@@ -59,6 +101,21 @@ def create_tagging_chain(
return chain
+@deprecated(
+ since="0.2.13",
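+ message=(
+ "LangChain has introduced a method called `with_structured_output` that "
+ "is available on ChatModels capable of tool calling. "
+ "See API reference for this function for replacement: "
+ "<https://api.python.langchain.com/en/latest/chains/langchain.chains.openai_functions.tagging.create_tagging_chain_pydantic.html> " # noqa: E501
+ "You can read more about `with_structured_output` here: "
+ "<https://python.langchain.com/v0.2/docs/how_to/structured_output/>. "
+ "If you notice other issues, please provide "
+ "feedback here: "
+ "<https://github.com/langchain-ai/langchain/discussions/18154>"
+ ),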
+ removal="1.0",
+)
def create_tagging_chain_pydantic(
pydantic_schema: Any,
llm: BaseLanguageModel,
@@ -68,6 +125,30 @@ def create_tagging_chain_pydantic(
"""Create a chain that extracts information from a passage
based on a pydantic schema.
+ This function is deprecated. Please use `with_structured_output` instead.
+ See example usage below:
+
+ .. code-block:: python
+
+ from langchain_core.pydantic_v1 import BaseModel, Field
+ from langchain_anthropic import ChatAnthropic
+
+ class Joke(BaseModel):
+ setup: str = Field(description="The setup of the joke")
+ punchline: str = Field(description="The punchline to the joke")
+
+ # Or any other chat model that supports tools.
+ # Please refer to the documentation of structured_output
+ # to see an up to date list of which models support
+ # with_structured_output.
+ model = ChatAnthropic(model="claude-3-opus-20240229", temperature=0)
+ structured_llm = model.with_structured_output(Joke)
+ structured_llm.invoke(
+ "Why did the cat cross the road? To get to the other "
+ "side... and then lay down in the middle of it!"
+ )
+ Read more here: https://python.langchain.com/v0.2/docs/how_to/structured_output/
+
Args:
pydantic_schema: The pydantic schema of the entities to extract.
llm: The language model to use.
diff --git a/libs/langchain/langchain/chains/qa_with_sources/base.py b/libs/langchain/langchain/chains/qa_with_sources/base.py
index c7324a7e32f..aed2d57cf91 100644
--- a/libs/langchain/langchain/chains/qa_with_sources/base.py
+++ b/libs/langchain/langchain/chains/qa_with_sources/base.py
@@ -7,6 +7,7 @@ import re
from abc import ABC, abstractmethod
from typing import Any, Dict, List, Optional, Tuple
+from langchain_core._api import deprecated
from langchain_core.callbacks import (
AsyncCallbackManagerForChainRun,
CallbackManagerForChainRun,
@@ -30,6 +31,15 @@ from langchain.chains.qa_with_sources.map_reduce_prompt import (
)
+@deprecated(
+ since="0.2.13",
+ removal="1.0",
+ message=(
+ "This class is deprecated. Refer to this guide on retrieval and question "
+ "answering with sources: "
+ "https://python.langchain.com/v0.2/docs/how_to/qa_sources/"
+ ),
+)
class BaseQAWithSourcesChain(Chain, ABC):
"""Question answering chain with sources over documents."""
@@ -198,6 +208,15 @@ class BaseQAWithSourcesChain(Chain, ABC):
return result
+@deprecated(
+ since="0.2.13",
+ removal="1.0",
+ message=(
+ "This class is deprecated. Refer to this guide on retrieval and question "
+ "answering with sources: "
+ "https://python.langchain.com/v0.2/docs/how_to/qa_sources/"
+ ),
+)
class QAWithSourcesChain(BaseQAWithSourcesChain):
"""Question answering with sources over documents."""
diff --git a/libs/langchain/langchain/chains/qa_with_sources/loading.py b/libs/langchain/langchain/chains/qa_with_sources/loading.py
index c24a20bb556..24578216849 100644
--- a/libs/langchain/langchain/chains/qa_with_sources/loading.py
+++ b/libs/langchain/langchain/chains/qa_with_sources/loading.py
@@ -4,6 +4,7 @@ from __future__ import annotations
from typing import Any, Mapping, Optional, Protocol
+from langchain_core._api import deprecated
from langchain_core.language_models import BaseLanguageModel
from langchain_core.prompts import BasePromptTemplate
@@ -151,6 +152,21 @@ def _load_refine_chain(
)
+@deprecated(
+ since="0.2.13",
+ removal="1.0",
+ message=(
+ "This function is deprecated. Refer to this guide on retrieval and question "
+ "answering with sources: "
+ "https://python.langchain.com/v0.2/docs/how_to/qa_sources/"
+ "\nSee also the following migration guides for replacements "
+ "based on `chain_type`:\n"
+ "stuff: https://python.langchain.com/v0.2/docs/versions/migrating_chains/stuff_docs_chain\n" # noqa: E501
+ "map_reduce: https://python.langchain.com/v0.2/docs/versions/migrating_chains/map_reduce_chain\n" # noqa: E501
+ "refine: https://python.langchain.com/v0.2/docs/versions/migrating_chains/refine_chain\n" # noqa: E501
+ "map_rerank: https://python.langchain.com/v0.2/docs/versions/migrating_chains/map_rerank_docs_chain\n" # noqa: E501
+ ),
+)
def load_qa_with_sources_chain(
llm: BaseLanguageModel,
chain_type: str = "stuff",
diff --git a/libs/langchain/langchain/chains/query_constructor/base.py b/libs/langchain/langchain/chains/query_constructor/base.py
index 0d303f6a616..419cd6002ad 100644
--- a/libs/langchain/langchain/chains/query_constructor/base.py
+++ b/libs/langchain/langchain/chains/query_constructor/base.py
@@ -5,6 +5,7 @@ from __future__ import annotations
import json
from typing import Any, Callable, List, Optional, Sequence, Tuple, Union, cast
+from langchain_core._api import deprecated
from langchain_core.exceptions import OutputParserException
from langchain_core.language_models import BaseLanguageModel
from langchain_core.output_parsers import BaseOutputParser
@@ -257,6 +258,11 @@ def get_query_constructor_prompt(
)
+@deprecated(
+ since="0.2.13",
+ alternative="load_query_constructor_runnable",
+ removal="1.0",
+)
def load_query_constructor_chain(
llm: BaseLanguageModel,
document_contents: str,
diff --git a/libs/langchain/langchain/chains/question_answering/chain.py b/libs/langchain/langchain/chains/question_answering/chain.py
index f83ae8fa8dd..c83895dc2a8 100644
--- a/libs/langchain/langchain/chains/question_answering/chain.py
+++ b/libs/langchain/langchain/chains/question_answering/chain.py
@@ -2,6 +2,7 @@
from typing import Any, Mapping, Optional, Protocol
+from langchain_core._api import deprecated
from langchain_core.callbacks import BaseCallbackManager, Callbacks
from langchain_core.language_models import BaseLanguageModel
from langchain_core.prompts import BasePromptTemplate
@@ -216,6 +217,20 @@ def _load_refine_chain(
)
+@deprecated(
+ since="0.2.13",
+ removal="1.0",
+ message=(
+ "This function is deprecated. See the following migration guides for "
+ "replacements based on `chain_type`:\n"
+ "stuff: https://python.langchain.com/v0.2/docs/versions/migrating_chains/stuff_docs_chain\n" # noqa: E501
+ "map_reduce: https://python.langchain.com/v0.2/docs/versions/migrating_chains/map_reduce_chain\n" # noqa: E501
+ "refine: https://python.langchain.com/v0.2/docs/versions/migrating_chains/refine_chain\n" # noqa: E501
+ "map_rerank: https://python.langchain.com/v0.2/docs/versions/migrating_chains/map_rerank_docs_chain\n" # noqa: E501
+ "\nSee also guides on retrieval and question-answering here: "
+ "https://python.langchain.com/v0.2/docs/how_to/#qa-with-rag"
+ ),
+)
def load_qa_chain(
llm: BaseLanguageModel,
chain_type: str = "stuff",
diff --git a/libs/langchain/langchain/chains/retrieval_qa/base.py b/libs/langchain/langchain/chains/retrieval_qa/base.py
index 0b25dc00b0b..689dd8b0c21 100644
--- a/libs/langchain/langchain/chains/retrieval_qa/base.py
+++ b/libs/langchain/langchain/chains/retrieval_qa/base.py
@@ -28,6 +28,15 @@ from langchain.chains.question_answering import load_qa_chain
from langchain.chains.question_answering.stuff_prompt import PROMPT_SELECTOR
+@deprecated(
+ since="0.2.13",
+ removal="1.0",
+ message=(
+ "This class is deprecated. Use the `create_retrieval_chain` constructor "
+ "instead. See migration guide here: "
+ "https://python.langchain.com/v0.2/docs/versions/migrating_chains/retrieval_qa/"
+ ),
+)
class BaseRetrievalQA(Chain):
"""Base class for question-answering chains."""
@@ -194,7 +203,15 @@ class BaseRetrievalQA(Chain):
return {self.output_key: answer}
-@deprecated(since="0.1.17", alternative="create_retrieval_chain", removal="0.3.0")
+@deprecated(
+ since="0.1.17",
+ removal="1.0",
+ message=(
+ "This class is deprecated. Use the `create_retrieval_chain` constructor "
+ "instead. See migration guide here: "
+ "https://python.langchain.com/v0.2/docs/versions/migrating_chains/retrieval_qa/"
+ ),
+)
class RetrievalQA(BaseRetrievalQA):
"""Chain for question-answering against an index.
@@ -271,6 +288,15 @@ class RetrievalQA(BaseRetrievalQA):
return "retrieval_qa"
+@deprecated(
+ since="0.2.13",
+ removal="1.0",
+ message=(
+ "This class is deprecated. Use the `create_retrieval_chain` constructor "
+ "instead. See migration guide here: "
+ "https://python.langchain.com/v0.2/docs/versions/migrating_chains/retrieval_qa/"
+ ),
+)
class VectorDBQA(BaseRetrievalQA):
"""Chain for question-answering against a vector database."""
diff --git a/libs/langchain/langchain/chains/router/llm_router.py b/libs/langchain/langchain/chains/router/llm_router.py
index f08d34ab553..132f350e819 100644
--- a/libs/langchain/langchain/chains/router/llm_router.py
+++ b/libs/langchain/langchain/chains/router/llm_router.py
@@ -4,6 +4,7 @@ from __future__ import annotations
from typing import Any, Dict, List, Optional, Type, cast
+from langchain_core._api import deprecated
from langchain_core.callbacks import (
AsyncCallbackManagerForChainRun,
CallbackManagerForChainRun,
@@ -19,8 +20,82 @@ from langchain.chains import LLMChain
from langchain.chains.router.base import RouterChain
+@deprecated(
+ since="0.2.12",
+ removal="1.0",
+ message=(
+ "Use RunnableLambda to select from multiple prompt templates. See example "
+ "in API reference: "
+ "https://api.python.langchain.com/en/latest/chains/langchain.chains.router.llm_router.LLMRouterChain.html" # noqa: E501
+ ),
+)
class LLMRouterChain(RouterChain):
- """A router chain that uses an LLM chain to perform routing."""
+ """A router chain that uses an LLM chain to perform routing.
+
+ This class is deprecated. See below for a replacement, which offers several
+ benefits, including streaming and batch support.
+
+ Below is an example implementation:
+
+ .. code-block:: python
+
+ from operator import itemgetter
+ from typing import Literal
+ from typing_extensions import TypedDict
+
+ from langchain_core.output_parsers import StrOutputParser
+ from langchain_core.prompts import ChatPromptTemplate
+ from langchain_core.runnables import RunnableLambda
+ from langchain_openai import ChatOpenAI
+
+ llm = ChatOpenAI(model="gpt-4o-mini")
+
+ prompt_1 = ChatPromptTemplate.from_messages(
+ [
+ ("system", "You are an expert on animals."),
+ ("human", "{query}"),
+ ]
+ )
+ prompt_2 = ChatPromptTemplate.from_messages(
+ [
+ ("system", "You are an expert on vegetables."),
+ ("human", "{query}"),
+ ]
+ )
+
+ chain_1 = prompt_1 | llm | StrOutputParser()
+ chain_2 = prompt_2 | llm | StrOutputParser()
+
+ route_system = "Route the user's query to either the animal or vegetable expert."
+ route_prompt = ChatPromptTemplate.from_messages(
+ [
+ ("system", route_system),
+ ("human", "{query}"),
+ ]
+ )
+
+
+ class RouteQuery(TypedDict):
+ \"\"\"Route query to destination.\"\"\"
+ destination: Literal["animal", "vegetable"]
+
+
+ route_chain = (
+ route_prompt
+ | llm.with_structured_output(RouteQuery)
+ | itemgetter("destination")
+ )
+
+ chain = {
+ "destination": route_chain, # "animal" or "vegetable"
+ "query": lambda x: x["query"], # pass through input query
+ } | RunnableLambda(
+ # if animal, chain_1. otherwise, chain_2.
+ lambda x: chain_1 if x["destination"] == "animal" else chain_2,
+ )
+
+ chain.invoke({"query": "what color are carrots"})
+ """ # noqa: E501
llm_chain: LLMChain
"""LLM chain used to perform routing"""
diff --git a/libs/langchain/langchain/chains/router/multi_prompt.py b/libs/langchain/langchain/chains/router/multi_prompt.py
index fe10e1db7d6..214b9a2b372 100644
--- a/libs/langchain/langchain/chains/router/multi_prompt.py
+++ b/libs/langchain/langchain/chains/router/multi_prompt.py
@@ -4,6 +4,7 @@ from __future__ import annotations
from typing import Any, Dict, List, Optional
+from langchain_core._api import deprecated
from langchain_core.language_models import BaseLanguageModel
from langchain_core.prompts import PromptTemplate
@@ -15,8 +16,82 @@ from langchain.chains.router.llm_router import LLMRouterChain, RouterOutputParse
from langchain.chains.router.multi_prompt_prompt import MULTI_PROMPT_ROUTER_TEMPLATE
+@deprecated(
+ since="0.2.12",
+ removal="1.0",
+ message=(
+ "Use RunnableLambda to select from multiple prompt templates. See example "
+ "in API reference: "
+ "https://api.python.langchain.com/en/latest/chains/langchain.chains.router.multi_prompt.MultiPromptChain.html" # noqa: E501
+ ),
+)
class MultiPromptChain(MultiRouteChain):
- """A multi-route chain that uses an LLM router chain to choose amongst prompts."""
+ """A multi-route chain that uses an LLM router chain to choose amongst prompts.
+
+ This class is deprecated. See below for a replacement, which offers several
+ benefits, including streaming and batch support.
+
+ Below is an example implementation:
+
+ .. code-block:: python
+
+ from operator import itemgetter
+ from typing import Literal
+ from typing_extensions import TypedDict
+
+ from langchain_core.output_parsers import StrOutputParser
+ from langchain_core.prompts import ChatPromptTemplate
+ from langchain_core.runnables import RunnableLambda
+ from langchain_openai import ChatOpenAI
+
+ llm = ChatOpenAI(model="gpt-4o-mini")
+
+ prompt_1 = ChatPromptTemplate.from_messages(
+ [
+ ("system", "You are an expert on animals."),
+ ("human", "{query}"),
+ ]
+ )
+ prompt_2 = ChatPromptTemplate.from_messages(
+ [
+ ("system", "You are an expert on vegetables."),
+ ("human", "{query}"),
+ ]
+ )
+
+ chain_1 = prompt_1 | llm | StrOutputParser()
+ chain_2 = prompt_2 | llm | StrOutputParser()
+
+ route_system = "Route the user's query to either the animal or vegetable expert."
+ route_prompt = ChatPromptTemplate.from_messages(
+ [
+ ("system", route_system),
+ ("human", "{query}"),
+ ]
+ )
+
+
+ class RouteQuery(TypedDict):
+ \"\"\"Route query to destination.\"\"\"
+ destination: Literal["animal", "vegetable"]
+
+
+ route_chain = (
+ route_prompt
+ | llm.with_structured_output(RouteQuery)
+ | itemgetter("destination")
+ )
+
+ chain = {
+ "destination": route_chain, # "animal" or "vegetable"
+ "query": lambda x: x["query"], # pass through input query
+ } | RunnableLambda(
+ # if animal, chain_1. otherwise, chain_2.
+ lambda x: chain_1 if x["destination"] == "animal" else chain_2,
+ )
+
+ chain.invoke({"query": "what color are carrots"})
+ """ # noqa: E501
@property
def output_keys(self) -> List[str]:
diff --git a/libs/langchain/langchain/memory/summary.py b/libs/langchain/langchain/memory/summary.py
index 166c1b3d4dd..23c3f2bca1f 100644
--- a/libs/langchain/langchain/memory/summary.py
+++ b/libs/langchain/langchain/memory/summary.py
@@ -2,6 +2,7 @@ from __future__ import annotations
from typing import Any, Dict, List, Type
+from langchain_core._api import deprecated
from langchain_core.chat_history import BaseChatMessageHistory
from langchain_core.language_models import BaseLanguageModel
from langchain_core.messages import BaseMessage, SystemMessage, get_buffer_string
@@ -14,6 +15,14 @@ from langchain.memory.chat_memory import BaseChatMemory
from langchain.memory.prompt import SUMMARY_PROMPT
+@deprecated(
+ since="0.2.12",
+ removal="1.0",
+ message=(
+ "Refer here for how to incorporate summaries of conversation history: "
+ "https://langchain-ai.github.io/langgraph/how-tos/memory/add-summary-conversation-history/" # noqa: E501
+ ),
+)
class SummarizerMixin(BaseModel):
"""Mixin for summarizer."""
diff --git a/libs/langchain/tests/integration_tests/chains/openai_functions/test_openapi.py b/libs/langchain/tests/integration_tests/chains/openai_functions/test_openapi.py
index 5d7ea309f3d..d3c294cbd56 100644
--- a/libs/langchain/tests/integration_tests/chains/openai_functions/test_openapi.py
+++ b/libs/langchain/tests/integration_tests/chains/openai_functions/test_openapi.py
@@ -1,25 +1,38 @@
-import os
-from pathlib import Path
+import json
+
+import pytest
from langchain.chains.openai_functions.openapi import get_openapi_chain
-
-def test_openai_opeanapi() -> None:
- chain = get_openapi_chain(
- "https://www.klarna.com/us/shopping/public/openai/v0/api-docs/"
- )
- output = chain.run("What are some options for a men's large blue button down shirt")
-
- assert isinstance(output, dict)
+api_spec = {
+ "openapi": "3.0.0",
+ "info": {"title": "JSONPlaceholder API", "version": "1.0.0"},
+ "servers": [{"url": "https://jsonplaceholder.typicode.com"}],
+ "paths": {
+ "/posts": {
+ "get": {
+ "summary": "Get posts",
+ "parameters": [
+ {
+ "name": "_limit",
+ "in": "query",
+ "required": False,
+ "schema": {"type": "integer", "example": 2},
+ "description": "Limit the number of results",
+ },
+ ],
+ }
+ }
+ },
+}
-def test_openai_opeanapi_headers() -> None:
- BRANDFETCH_API_KEY = os.environ.get("BRANDFETCH_API_KEY")
- headers = {"Authorization": f"Bearer {BRANDFETCH_API_KEY}"}
- file_path = str(
- Path(__file__).parents[2] / "examples/brandfetch-brandfetch-2.0.0-resolved.json"
- )
- chain = get_openapi_chain(file_path, headers=headers)
- output = chain.run("I want to know about nike.comgg")
+@pytest.mark.requires("openapi_pydantic")
+@pytest.mark.requires("langchain_openai")
+def test_openai_openapi_chain() -> None:
+ from langchain_openai import ChatOpenAI
- assert isinstance(output, str)
+ llm = ChatOpenAI(model="gpt-4o-mini", temperature=0)
+ chain = get_openapi_chain(json.dumps(api_spec), llm)
+ output = chain.invoke({"query": "Fetch the top two posts."})
+ assert len(output["response"]) == 2
diff --git a/libs/langchain/tests/unit_tests/chains/test_imports.py b/libs/langchain/tests/unit_tests/chains/test_imports.py
index 797b81b440f..501c706fdf0 100644
--- a/libs/langchain/tests/unit_tests/chains/test_imports.py
+++ b/libs/langchain/tests/unit_tests/chains/test_imports.py
@@ -49,6 +49,7 @@ EXPECTED_ALL = [
"VectorDBQA",
"VectorDBQAWithSourcesChain",
"create_citation_fuzzy_match_chain",
+ "create_citation_fuzzy_match_runnable",
"create_extraction_chain",
"create_extraction_chain_pydantic",
"create_qa_with_sources_chain",