Compare commits

..

22 Commits

Author SHA1 Message Date
Eugene Yurtsev
71450f2a7e x 2023-07-31 22:48:54 -04:00
Harrison Chase
15de57b848 fix web loader (#8538) 2023-07-31 12:47:33 -07:00
Nuno Campos
4780156955 Rely less on positional arg order in subclasses of vector store when calling async methods (#8534) 2023-07-31 20:13:11 +01:00
Harrison Chase
5e3b968078 router runnable (#8496)
Co-authored-by: Nuno Campos <nuno@boringbits.io>
2023-07-31 11:07:10 -07:00
Anubhav Bindlish
913a156cff Minor improvements to rockset vectorstore (#8416)
This PR makes minor improvements to our python notebook, and adds
support for `Rockset` workspaces in our vectorstore client.
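
For illustration, a rough sketch of pointing the vector store at a non-default workspace. The client setup mirrors the notebook later in this diff; the `workspace` keyword (and the `embeddings` parameter name) are assumptions made for a concrete example, not copied from this PR:

```py
import os

import rockset
from langchain.embeddings import OpenAIEmbeddings
from langchain.vectorstores import Rockset

# Client setup as in the notebook below; ROCKSET_API_KEY must be set.
rockset_client = rockset.RocksetClient(
    rockset.Regions.usw2a1, os.environ["ROCKSET_API_KEY"]
)

docsearch = Rockset(
    client=rockset_client,
    embeddings=OpenAIEmbeddings(),
    collection_name="langchain_demo",
    text_key="description",
    embedding_key="description_embedding",
    workspace="my_workspace",  # assumed keyword added by this PR; default is the shared workspace
)
```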

@rlancemartin, @eyurtsev

---------

Co-authored-by: Bagatur <baskaryan@gmail.com>
2023-07-31 09:54:59 -07:00
Harrison Chase
893f3014af add xml agent notebook 2023-07-31 07:33:22 -07:00
Bagatur
a8be207ea3 bump 248 (#8518) 2023-07-31 07:14:45 -07:00
Harrison Chase
6556a8fcfd add initial anthropic agent (#8468)
Co-authored-by: Nuno Campos <nuno@boringbits.io>
2023-07-30 21:30:49 -07:00
os1ma
a795c3d860 Fix GitLoader to handle repeated load calls (#8412)
**Description: a description of the change**

In this pull request, GitLoader has been updated to handle multiple load
calls, provided the same repository is being cloned. Previously, calling
`load` multiple times would raise an error if a clone URL was provided.

Additionally, a check has been added to raise a ValueError when
attempting to clone a different repository into an existing path.
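
As an illustration (the paths and URLs below are made up, not taken from this PR), the new behavior looks roughly like this:

```py
from langchain.document_loaders import GitLoader

loader = GitLoader(
    repo_path="./example_data/test_repo",  # local clone target (illustrative)
    clone_url="https://github.com/langchain-ai/langchain",  # illustrative URL
    branch="master",
)

docs = loader.load()  # first call clones the repository
docs = loader.load()  # previously raised; now reuses the existing clone

# Cloning a different repository into the same path raises a ValueError.
other_loader = GitLoader(
    repo_path="./example_data/test_repo",
    clone_url="https://github.com/example/another-repo",
)
# other_loader.load()  # -> ValueError: A different repository is already cloned at this path.
```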

New tests have also been introduced to verify the correct behavior of
the GitLoader class when `load` is called multiple times.

Lastly, the GitPython package, a dependency for the GitLoader class, has
been added to the project dependencies (pyproject.toml and poetry.lock).

**Issue: the issue # it fixes (if applicable)**

None

**Dependencies: any dependencies required for this change**

GitPython

**Tag maintainer: for a quicker response, tag the relevant maintainer
(see below)**

- DataLoaders / VectorStores / Retrievers: @rlancemartin, @eyurtsev
2023-07-30 21:27:20 -07:00
Muhammed Al-Dulaimi
9975ba4124 Fix ChromaDB integration -> docker container instructions (#8447)
## Description
This PR updates the Chroma DB integration's documentation, fixing the
instructions in the **Docker container** example.
In the current documentation, the below `client.reset()` line causes a
runtime error:

```py
...
client = chromadb.HttpClient(settings=Settings(allow_reset=True))
client.reset()  # resets the database
collection = client.create_collection("my_collection")
...
```

`Exception: {"error":"ValueError('Resetting is not allowed by this
configuration')"}`

This happens because the Chroma DB server also needs the `allow_reset`
flag set to `true`.
This is fixed by adding `ALLOW_RESET=TRUE` to the `environment` section
of the `docker-compose` file before spinning up the container.
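
For completeness, a self-contained version of the client snippet that should work once the server is started with `ALLOW_RESET=TRUE` (the `Settings` import is filled in here; it is implied but not shown in the snippet above):

```py
import chromadb
from chromadb.config import Settings

# allow_reset must be enabled in the client settings *and* on the server
# (ALLOW_RESET=TRUE in docker-compose) for reset() to succeed.
client = chromadb.HttpClient(settings=Settings(allow_reset=True))
client.reset()  # resets the database
collection = client.create_collection("my_collection")
```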

## Issue
This fixes the runtime error that occurs when running the Docker
container example code.

## Tag Maintainer
@rlancemartin, @eyurtsev
2023-07-30 21:11:56 -07:00
Nicolas Raoul
7f9c6c3baa Fixed typo: papaer -> paper (#8500) 2023-07-30 21:08:11 -07:00
Piyush Jain
b2f8a5bae9 Fixed exports for NeptuneOpenCypherQAChain (#8439)
## Description
The imports for `NeptuneOpenCypherQAChain` are failing. This PR adds the
chain class to the `__init__.py` file to fix this issue.
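
With the export in place, the documented top-level import works; a short sketch (the `from_llm` construction and the `NeptuneGraph` arguments are assumptions for illustration, not copied from this PR):

```py
from langchain.chains import NeptuneOpenCypherQAChain  # now exported at the top level
from langchain.chat_models import ChatOpenAI
from langchain.graphs import NeptuneGraph

graph = NeptuneGraph(host="<neptune-host>", port=8182)  # assumed constructor arguments
llm = ChatOpenAI(temperature=0, model="gpt-4")
chain = NeptuneOpenCypherQAChain.from_llm(llm=llm, graph=graph)  # from_llm usage assumed
```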

## Maintainers
@dev2049 
@krlawrence
2023-07-30 20:36:22 -07:00
Eugene Yurtsev
e98e2b2b81 ChatPromptTemplate: clean up doc-string (#8473)
Minor doc-string clean up

---------

Co-authored-by: Harrison Chase <hw.chase.17@gmail.com>
2023-07-30 20:11:04 -07:00
Eugene Yurtsev
529cb2e30c Update doc-string in few shot template (#8474)
Partial update of the doc-string; other instances in the documentation
still need to be updated.
2023-07-30 19:39:14 -07:00
Bharat Raghunathan
04ebdbe98f doc(prompts): Add redirects in Prompt subcategories pages (#8478)
- Description: Fixes broken links in some Prompts subcategories in
documentation (Example Selectors, Prompt Templates)
  - Issue: #8477 (Fixes #8477)
  - Dependencies: None
  - Tag maintainer: @baskaryan
  - Twitter handle: [@BharatR123](https://twitter.com/BharatR123)
2023-07-30 19:38:52 -07:00
Ludwig Hubert
08f5e6b801 Fix documentation for from_documents signature (#8482)
Docs for from_documents() were outdated as seen in
https://github.com/langchain-ai/langchain/issues/8457 .

fixes #8457 
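
For reference, a minimal sketch of the documented call; FAISS and OpenAIEmbeddings are chosen here only for illustration:

```py
from langchain.document_loaders import TextLoader
from langchain.embeddings import OpenAIEmbeddings
from langchain.text_splitter import CharacterTextSplitter
from langchain.vectorstores import FAISS

documents = TextLoader("state_of_the_union.txt").load()
docs = CharacterTextSplitter(chunk_size=1000, chunk_overlap=0).split_documents(documents)

# from_documents() takes the list of documents first and the embedding function second.
db = FAISS.from_documents(docs, OpenAIEmbeddings())
```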

2023-07-30 13:24:44 -07:00
Muneeb Ahmad
4923cf029a Added Proper Documentation for faiss-gpu Installation (#8492)
### Description
In the LangChain documentation and comments, `pip install faiss` is
mentioned instead of `pip install faiss-gpu`, and running `pip install
faiss` results in an error. I've gone ahead and updated the documentation
and `faiss.ipynb`. This change makes installation easier for end users
who want `faiss-gpu`.

### Issue: 
Documentation / Comments Related.

### Dependencies:
No dependencies were changed; only the files with the incorrect
reference were updated.

### Tag maintainer:
 @rlancemartin, @eyurtsev (Thank You for your contributions 😄 )
2023-07-30 13:24:30 -07:00
shibuiwilliam
549720ae51 add test to ensure values in time weighted retriever are updated (#8479)
# What
- add test to ensure values in time weighted retriever are updated
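
A rough sketch of what such a check looks like (illustrative only, not the PR's actual test; FAISS and `FakeEmbeddings` are assumptions made to keep the example self-contained):

```py
from datetime import datetime, timedelta

import faiss
from langchain.docstore import InMemoryDocstore
from langchain.embeddings import FakeEmbeddings
from langchain.retrievers import TimeWeightedVectorStoreRetriever
from langchain.schema import Document
from langchain.vectorstores import FAISS

size = 16
vectorstore = FAISS(
    FakeEmbeddings(size=size).embed_query,
    faiss.IndexFlatL2(size),
    InMemoryDocstore({}),
    {},
)
retriever = TimeWeightedVectorStoreRetriever(vectorstore=vectorstore, decay_rate=0.5, k=1)

yesterday = datetime.now() - timedelta(days=1)
retriever.add_documents(
    [Document(page_content="hello", metadata={"last_accessed_at": yesterday})]
)

retriever.get_relevant_documents("hello")
# Retrieval should refresh last_accessed_at on the stored copy.
assert retriever.memory_stream[0].metadata["last_accessed_at"] > yesterday
```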

<!--
  - Description: add test to ensure values in time weighted retriever are updated
  - Issue: None
  - Dependencies: None
  - Tag maintainer: @rlancemartin, @eyurtsev
  - Twitter handle: @MlopsJ
 -->
2023-07-30 11:42:25 -07:00
Harrison Chase
18a2452121 prompt cleanup (#8470) 2023-07-30 10:47:31 -07:00
Harrison Chase
4d526c49ed bump experimental to 008 (#8490) 2023-07-30 07:28:18 -07:00
Harrison Chase
8f14ddefdf add anthropic functions wrapper (#8475)
a cheeky wrapper around Claude that adds in function calling support
(kind of, hence it's going in experimental)
2023-07-30 07:23:46 -07:00
Harrison Chase
490ad93b3c fix links generation (#8471) 2023-07-29 18:31:33 -07:00
35 changed files with 1612 additions and 556 deletions

View File

@@ -3,28 +3,44 @@
.. currentmodule:: {{ module }}
{% if '_value2member_map_' in all_attributes %}
{% set classType = "enum" %}
{% else %}
{% set classType = "default" %}
{% endif %}
.. autoclass:: {{ objname }}
{% block methods %}
{% if methods %}
.. rubric:: {{ _('Methods') }}
{% if classType == "enum" %}
{% if attributes %}
.. rubric:: {{ _('Attributes') }}
{% endif %}
{% else %}
{% if attributes %}
.. rubric:: {{ _('Attributes') }}
{% endif %}
.. autosummary::
{% for item in methods %}
~{{ name }}.{{ item }}
{%- endfor %}
{% endif %}
{% endblock %}
{% block methods %}
{% if methods %}
.. rubric:: {{ _('Methods') }}
{% block attributes %}
{% if attributes %}
.. rubric:: {{ _('Attributes') }}
.. autosummary::
{% for item in methods %}
~{{ name }}.{{ item }}
{%- endfor %}
{% endif %}
{% endblock %}
.. autosummary::
{% for item in attributes %}
~{{ name }}.{{ item }}
{%- endfor %}
{% endif %}
{% endblock %}
{% block attributes %}
{% if attributes %}
.. rubric:: {{ _('Attributes') }}
.. example_links:: {{ objname }}
.. autosummary::
{% for item in attributes %}
~{{ name }}.{{ item }}
{%- endfor %}
{% endif %}
{% endblock %}
{% endif %}
.. example_links:: {{ objname }}

View File

@@ -10,7 +10,7 @@ import argparse
logging.basicConfig(level=logging.INFO)
logger = logging.getLogger(__name__)
# Base URL for all class documentation
_BASE_URL = "https://api.python.langchain.com/en/latest"
_BASE_URL = "https://api.python.langchain.com/en/latest/"
# Regular expression to match Python code blocks
code_block_re = re.compile(r"^(```python\n)(.*?)(```\n)", re.DOTALL | re.MULTILINE)

View File

@@ -3476,6 +3476,10 @@
"source": "/en/latest/modules/prompts/output_parsers/examples/retry.html",
"destination": "/docs/modules/model_io/output_parsers/retry"
},
{
"source": "/en/latest/modules/prompts/example_selectors.html",
"destination": "/docs/modules/model_io/example_selectors"
},
{
"source": "/en/latest/modules/prompts/example_selectors/examples/custom_example_selector.html",
"destination": "/docs/modules/model_io/prompts/example_selectors/custom_example_selector"
@@ -3488,6 +3492,10 @@
"source": "/en/latest/modules/prompts/example_selectors/examples/ngram_overlap.html",
"destination": "/docs/modules/model_io/prompts/example_selectors/ngram_overlap"
},
{
"source": "/en/latest/modules/prompts/prompt_templates.html",
"destination": "/docs/modules/model_io/prompt_templates"
},
{
"source": "/en/latest/modules/prompts/prompt_templates/examples/connecting_to_a_feature_store.html",
"destination": "/docs/modules/model_io/prompts/prompt_templates/connecting_to_a_feature_store"
@@ -3740,6 +3748,10 @@
"source": "/docs/modules/evaluation/:path*(/?)",
"destination": "/docs/guides/evaluation/:path*"
},
{
"source": "/en/latest/modules/indexes.html",
"destination": "/docs/modules/data_connection"
},
{
"source": "/en/latest/modules/indexes/:path*",
"destination": "/docs/modules/data_connection/:path*"

View File

@@ -22,10 +22,19 @@
},
{
"cell_type": "code",
"execution_count": 4,
"execution_count": 1,
"id": "466b65b3",
"metadata": {},
"outputs": [],
"outputs": [
{
"name": "stderr",
"output_type": "stream",
"text": [
"/Users/harrisonchase/.pyenv/versions/3.9.1/envs/langchain/lib/python3.9/site-packages/deeplake/util/check_latest_version.py:32: UserWarning: A newer version of deeplake (3.6.14) is available. It's recommended that you update to the latest version using `pip install -U deeplake`.\n",
" warnings.warn(\n"
]
}
],
"source": [
"from langchain.prompts import ChatPromptTemplate\n",
"from langchain.chat_models import ChatOpenAI"
@@ -33,7 +42,7 @@
},
{
"cell_type": "code",
"execution_count": 5,
"execution_count": 2,
"id": "3c634ef0",
"metadata": {},
"outputs": [],
@@ -583,6 +592,98 @@
"chain2.invoke({})"
]
},
{
"cell_type": "markdown",
"id": "d094d637",
"metadata": {},
"source": [
"## Router\n",
"\n",
"You can also use the router runnable to conditionally route inputs to different runnables."
]
},
{
"cell_type": "code",
"execution_count": 4,
"id": "252625fd",
"metadata": {},
"outputs": [],
"source": [
"from langchain.chains import create_tagging_chain_pydantic\n",
"from pydantic import BaseModel, Field\n",
"\n",
"class PromptToUse(BaseModel):\n",
" \"\"\"Used to determine which prompt to use to answer the user's input.\"\"\"\n",
" \n",
" name: str = Field(description=\"Should be one of `math` or `english`\")"
]
},
{
"cell_type": "code",
"execution_count": 5,
"id": "57886e84",
"metadata": {},
"outputs": [],
"source": [
"tagger = create_tagging_chain_pydantic(PromptToUse, ChatOpenAI(temperature=0))"
]
},
{
"cell_type": "code",
"execution_count": 6,
"id": "a303b089",
"metadata": {},
"outputs": [],
"source": [
"chain1 = ChatPromptTemplate.from_template(\"You are a math genius. Answer the question: {question}\") | ChatOpenAI()\n",
"chain2 = ChatPromptTemplate.from_template(\"You are an english major. Answer the question: {question}\") | ChatOpenAI()"
]
},
{
"cell_type": "code",
"execution_count": 7,
"id": "7aa9ea06",
"metadata": {},
"outputs": [],
"source": [
"from langchain.schema.runnable import RouterRunnable\n",
"router = RouterRunnable({\"math\": chain1, \"english\": chain2})"
]
},
{
"cell_type": "code",
"execution_count": 8,
"id": "6a3d3f5d",
"metadata": {},
"outputs": [],
"source": [
"chain = {\n",
" \"key\": {\"input\": lambda x: x[\"question\"]} | tagger | (lambda x: x['text'].name),\n",
" \"input\": {\"question\": lambda x: x[\"question\"]}\n",
"} | router"
]
},
{
"cell_type": "code",
"execution_count": 9,
"id": "8aeda930",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"AIMessage(content='Thank you for the compliment! The sum of 2 + 2 is equal to 4.', additional_kwargs={}, example=False)"
]
},
"execution_count": 9,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"chain.invoke({\"question\": \"whats 2 + 2\"})"
]
},
{
"cell_type": "markdown",
"id": "29781123",

View File

@@ -0,0 +1,287 @@
{
"cells": [
{
"cell_type": "markdown",
"id": "5125a1e3",
"metadata": {},
"source": [
"# Anthropic Functions\n",
"\n",
"This notebook shows how to use an experimental wrapper around Anthropic that gives it the same API as OpenAI Functions."
]
},
{
"cell_type": "code",
"execution_count": 1,
"id": "378be79b",
"metadata": {},
"outputs": [
{
"name": "stderr",
"output_type": "stream",
"text": [
"/Users/harrisonchase/.pyenv/versions/3.9.1/envs/langchain/lib/python3.9/site-packages/deeplake/util/check_latest_version.py:32: UserWarning: A newer version of deeplake (3.6.14) is available. It's recommended that you update to the latest version using `pip install -U deeplake`.\n",
" warnings.warn(\n"
]
}
],
"source": [
"from langchain_experimental.llms.anthropic_functions import AnthropicFunctions"
]
},
{
"cell_type": "markdown",
"id": "65499965",
"metadata": {},
"source": [
"## Initialize Model\n",
"\n",
"You can initialize this wrapper the same way you'd initialize ChatAnthropic"
]
},
{
"cell_type": "code",
"execution_count": 2,
"id": "e1d535f6",
"metadata": {},
"outputs": [],
"source": [
"model = AnthropicFunctions(model='claude-2')"
]
},
{
"cell_type": "markdown",
"id": "fcc9eaf4",
"metadata": {},
"source": [
"## Passing in functions\n",
"\n",
"You can now pass in functions in a similar way"
]
},
{
"cell_type": "code",
"execution_count": 3,
"id": "0779c320",
"metadata": {},
"outputs": [],
"source": [
"functions=[\n",
" {\n",
" \"name\": \"get_current_weather\",\n",
" \"description\": \"Get the current weather in a given location\",\n",
" \"parameters\": {\n",
" \"type\": \"object\",\n",
" \"properties\": {\n",
" \"location\": {\n",
" \"type\": \"string\",\n",
" \"description\": \"The city and state, e.g. San Francisco, CA\"\n",
" },\n",
" \"unit\": {\n",
" \"type\": \"string\",\n",
" \"enum\": [\"celsius\", \"fahrenheit\"]\n",
" }\n",
" },\n",
" \"required\": [\"location\"]\n",
" }\n",
" }\n",
" ]"
]
},
{
"cell_type": "code",
"execution_count": 5,
"id": "ad75a933",
"metadata": {},
"outputs": [],
"source": [
"from langchain.schema import HumanMessage"
]
},
{
"cell_type": "code",
"execution_count": 6,
"id": "fc703085",
"metadata": {},
"outputs": [],
"source": [
"response = model.predict_messages(\n",
" [HumanMessage(content=\"whats the weater in boston?\")], \n",
" functions=functions\n",
")"
]
},
{
"cell_type": "code",
"execution_count": 7,
"id": "04d7936a",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"AIMessage(content=' ', additional_kwargs={'function_call': {'name': 'get_current_weather', 'arguments': '{\"location\": \"Boston, MA\", \"unit\": \"fahrenheit\"}'}}, example=False)"
]
},
"execution_count": 7,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"response"
]
},
{
"cell_type": "markdown",
"id": "0072fdba",
"metadata": {},
"source": [
"## Using for extraction\n",
"\n",
"You can now use this for extraction."
]
},
{
"cell_type": "code",
"execution_count": 8,
"id": "7af5c567",
"metadata": {},
"outputs": [],
"source": [
"from langchain.chains import create_extraction_chain\n",
"schema = {\n",
" \"properties\": {\n",
" \"name\": {\"type\": \"string\"},\n",
" \"height\": {\"type\": \"integer\"},\n",
" \"hair_color\": {\"type\": \"string\"},\n",
" },\n",
" \"required\": [\"name\", \"height\"],\n",
"}\n",
"inp = \"\"\"\n",
"Alex is 5 feet tall. Claudia is 1 feet taller Alex and jumps higher than him. Claudia is a brunette and Alex is blonde.\n",
" \"\"\""
]
},
{
"cell_type": "code",
"execution_count": 9,
"id": "bd01082a",
"metadata": {},
"outputs": [],
"source": [
"chain = create_extraction_chain(schema, model)"
]
},
{
"cell_type": "code",
"execution_count": 10,
"id": "b5a23e9f",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"[{'name': 'Alex', 'height': '5', 'hair_color': 'blonde'},\n",
" {'name': 'Claudia', 'height': '6', 'hair_color': 'brunette'}]"
]
},
"execution_count": 10,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"chain.run(inp)"
]
},
{
"cell_type": "markdown",
"id": "90ec959e",
"metadata": {},
"source": [
"## Using for tagging\n",
"\n",
"You can now use this for tagging"
]
},
{
"cell_type": "code",
"execution_count": 11,
"id": "03c1eb0d",
"metadata": {},
"outputs": [],
"source": [
"from langchain.chains import create_tagging_chain"
]
},
{
"cell_type": "code",
"execution_count": 12,
"id": "581c0ece",
"metadata": {},
"outputs": [],
"source": [
"schema = {\n",
" \"properties\": {\n",
" \"sentiment\": {\"type\": \"string\"},\n",
" \"aggressiveness\": {\"type\": \"integer\"},\n",
" \"language\": {\"type\": \"string\"},\n",
" }\n",
"}"
]
},
{
"cell_type": "code",
"execution_count": 14,
"id": "d9a8570e",
"metadata": {},
"outputs": [],
"source": [
"chain = create_tagging_chain(schema, model)"
]
},
{
"cell_type": "code",
"execution_count": 15,
"id": "cf37d679",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"{'sentiment': 'positive', 'aggressiveness': '0', 'language': 'english'}"
]
},
"execution_count": 15,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"chain.run(\"this is really cool\")"
]
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 3 (ipykernel)",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.9.1"
}
},
"nbformat": 4,
"nbformat_minor": 5
}

View File

@@ -215,10 +215,23 @@
"Chroma has the ability to handle multiple `Collections` of documents, but the LangChain interface expects one, so we need to specify the collection name. The default collection name used by LangChain is \"langchain\".\n",
"\n",
"Here is how to clone, build, and run the Docker Image:\n",
"```\n",
"```sh\n",
"git clone git@github.com:chroma-core/chroma.git\n",
"docker-compose up -d --build\n",
"```"
"```\n",
"\n",
"Edit the `docker-compose.yml` file and add `ALLOW_RESET=TRUE` under `environment`\n",
"```yaml\n",
" ...\n",
" command: uvicorn chromadb.app:app --reload --workers 1 --host 0.0.0.0 --port 8000 --log-config log_config.yml\n",
" environment:\n",
" - IS_PERSISTENT=TRUE\n",
" - ALLOW_RESET=TRUE\n",
" ports:\n",
" - 8000:8000\n",
" ...\n",
"```\n",
"\n",
"Then run `docker-compose up -d --build`"
]
},
{

View File

@@ -23,9 +23,9 @@
},
"outputs": [],
"source": [
"#!pip install faiss\n",
"!pip install faiss-gpu # For CUDA 7.5+ Supported GPU's.\n",
"# OR\n",
"!pip install faiss-cpu"
"!pip install faiss-cpu # For CPU Installation"
]
},
{

View File

@@ -202,7 +202,7 @@
"qdrant = Qdrant.from_documents(\n",
" docs,\n",
" embeddings,\n",
" url,\n",
" url=url,\n",
" prefer_grpc=True,\n",
" collection_name=\"my_documents\",\n",
")"
@@ -236,7 +236,7 @@
"qdrant = Qdrant.from_documents(\n",
" docs,\n",
" embeddings,\n",
" url,\n",
" url=url,\n",
" prefer_grpc=True,\n",
" api_key=api_key,\n",
" collection_name=\"my_documents\",\n",
@@ -270,7 +270,7 @@
"qdrant = Qdrant.from_documents(\n",
" docs,\n",
" embeddings,\n",
" url,\n",
" url=url,\n",
" prefer_grpc=True,\n",
" collection_name=\"my_documents\",\n",
" force_recreate=True,\n",

View File

@@ -2,131 +2,141 @@
"cells": [
{
"cell_type": "markdown",
"id": "20b588b4",
"id": "9787b308",
"metadata": {},
"source": [
"# Rockset\n",
"\n",
">[Rockset](https://rockset.com/product/) is a real-time analytics database service for serving low latency, high concurrency analytical queries at scale. It builds a Converged Index™ on structured and semi-structured data with an efficient store for vector embeddings. Its support for running SQL on schemaless data makes it a perfect choice for running vector search with metadata filters. \n",
">[Rockset](https://rockset.com/) is a real-time search and analytics database built for the cloud. Rockset uses a [Converged Index™](https://rockset.com/blog/converged-indexing-the-secret-sauce-behind-rocksets-fast-queries/) with an efficient store for vector embeddings to serve low latency, high concurrency search queries at scale. Rockset has full support for metadata filtering and handles real-time ingestion for constantly updating, streaming data.\n",
"\n",
"This notebook demonstrates how to use `Rockset` as a vectorstore in langchain. To get started, make sure you have a `Rockset` account and an API key available."
"This notebook demonstrates how to use `Rockset` as a vector store in LangChain. Before getting started, make sure you have access to a `Rockset` account and an API key available. [Start your free trial today.](https://rockset.com/create/)\n"
]
},
{
"cell_type": "markdown",
"id": "e290ddc0",
"id": "b823d64a",
"metadata": {},
"source": [
"## Setting up environment\n",
"## Setting Up Your Environment[](https://python.langchain.com/docs/modules/data_connection/vectorstores/integrations/rockset#setting-up-environment)\n",
"\n",
"1. Make sure you have Rockset account and go to the web console to get the API key. Details can be found on [the website](https://rockset.com/docs/rest-api/). For the purpose of this notebook, we will assume you're using Rockset from `Oregon(us-west-2)`."
]
},
{
"cell_type": "markdown",
"id": "7d77bbbe",
"metadata": {},
"source": [
"2. Now you will need to create a Rockset collection to write to, use the Rockset web console to do this. For the purpose of this exercise, we will create a collection called `langchain_demo`. Since Rockset supports schemaless ingest, you don't need to inform us of the shape of metadata for your texts. However, you do need to decide on two columns upfront:\n",
"- Where to store the text. We will use the column `description` for this.\n",
"- Where to store the vector-embedding for the text. We will use the column `description_embedding` for this.\n",
"\n",
"Also you will need to inform Rockset that `description_embedding` is a vector-embedding, so that we can optimize its format. You can do this using a **Rockset ingest transformation** while creating your collection:"
]
},
{
"cell_type": "raw",
"id": "3daa76ba",
"metadata": {},
"source": [
"SELECT\n",
" _input.* EXCEPT(_meta),\n",
" VECTOR_ENFORCE(_input.description_embedding, #length_of_vector_embedding, 'float') as description_embedding\n",
"FROM\n",
" _input\n",
"1. Leverage the `Rockset` console to create a [collection](https://rockset.com/docs/collections/) with the Write API as your source. In this walkthrough, we create a collection named `langchain_demo`. \n",
" \n",
"// We used OpenAI `text-embedding-ada-002` for this examples, where #length_of_vector_embedding = 1536"
]
},
{
"cell_type": "markdown",
"id": "7951c9cd",
"metadata": {},
"source": [
"3. Now let's install the [rockset-python-client](https://github.com/rockset/rockset-python-client). This is used by langchain to talk to the Rockset database."
" Configure the following [ingest transformation](https://rockset.com/docs/ingest-transformation/) to mark your embeddings field and take advantage of performance and storage optimizations:"
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "2aac7ae6",
"metadata": {},
"id": "aac58387",
"metadata": {
"vscode": {
"languageId": "sql"
}
},
"outputs": [],
"source": [
"!pip install rockset"
"SELECT _input.* EXCEPT(_meta), \n",
"VECTOR_ENFORCE(_input.description_embedding, #length_of_vector_embedding, 'float') as description_embedding \n",
"FROM _input"
]
},
{
"cell_type": "markdown",
"id": "8600900d",
"id": "df380e1c",
"metadata": {},
"source": [
"This is it! Now you're ready to start writing some python code to store vector embeddings in Rockset, and querying the database to find texts similar to your query! We support 3 distance functions: `COSINE_SIM`, `EUCLIDEAN_DIST` and `DOT_PRODUCT`."
]
},
{
"cell_type": "markdown",
"id": "3bf2f818",
"metadata": {},
"source": [
"## Example"
"2. After creating your collection, use the console to retrieve an [API key](https://rockset.com/docs/iam/#users-api-keys-and-roles). For the purpose of this notebook, we assume you are using the `Oregon(us-west-2)` region.\n",
"\n",
"3. Install the [rockset-python-client](https://github.com/rockset/rockset-python-client) to enable LangChain to communicate directly with `Rockset`."
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "a7b39626",
"id": "00d16b83",
"metadata": {},
"outputs": [],
"source": [
"pip install rockset"
]
},
{
"cell_type": "markdown",
"id": "e79550eb",
"metadata": {},
"source": [
"## LangChain Tutorial\n",
"\n",
"Follow along in your own Python notebook to generate and store vector embeddings in Rockset.\n",
"Start using Rockset to search for documents similar to your search queries.\n",
"\n",
"### 1. Define Key Variables"
]
},
{
"cell_type": "code",
"execution_count": 5,
"id": "29505c1e",
"metadata": {},
"outputs": [
{
"ename": "InitializationException",
"evalue": "The rockset client was initialized incorrectly: An api key must be provided as a parameter to the RocksetClient or the Configuration object.",
"output_type": "error",
"traceback": [
"\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
"\u001b[0;31mInitializationException\u001b[0m Traceback (most recent call last)",
"Cell \u001b[0;32mIn[5], line 6\u001b[0m\n\u001b[1;32m 4\u001b[0m ROCKSET_API_KEY \u001b[39m=\u001b[39m os\u001b[39m.\u001b[39menviron\u001b[39m.\u001b[39mget(\u001b[39m\"\u001b[39m\u001b[39mROCKSET_API_KEY\u001b[39m\u001b[39m\"\u001b[39m) \u001b[39m# Verify ROCKSET_API_KEY environment variable\u001b[39;00m\n\u001b[1;32m 5\u001b[0m ROCKSET_API_SERVER \u001b[39m=\u001b[39m rockset\u001b[39m.\u001b[39mRegions\u001b[39m.\u001b[39musw2a1 \u001b[39m# Verify Rockset region\u001b[39;00m\n\u001b[0;32m----> 6\u001b[0m rockset_client \u001b[39m=\u001b[39m rockset\u001b[39m.\u001b[39;49mRocksetClient(ROCKSET_API_SERVER, ROCKSET_API_KEY)\n\u001b[1;32m 8\u001b[0m COLLECTION_NAME\u001b[39m=\u001b[39m\u001b[39m'\u001b[39m\u001b[39mlangchain_demo\u001b[39m\u001b[39m'\u001b[39m\n\u001b[1;32m 9\u001b[0m TEXT_KEY\u001b[39m=\u001b[39m\u001b[39m'\u001b[39m\u001b[39mdescription\u001b[39m\u001b[39m'\u001b[39m\n",
"File \u001b[0;32m~/Library/Python/3.9/lib/python/site-packages/rockset/rockset_client.py:242\u001b[0m, in \u001b[0;36mRocksetClient.__init__\u001b[0;34m(self, host, api_key, max_workers, config)\u001b[0m\n\u001b[1;32m 239\u001b[0m config\u001b[39m.\u001b[39mhost \u001b[39m=\u001b[39m host\n\u001b[1;32m 241\u001b[0m \u001b[39mif\u001b[39;00m \u001b[39mnot\u001b[39;00m config\u001b[39m.\u001b[39mapi_key:\n\u001b[0;32m--> 242\u001b[0m \u001b[39mraise\u001b[39;00m InitializationException(\n\u001b[1;32m 243\u001b[0m \u001b[39m\"\u001b[39m\u001b[39mAn api key must be provided as a parameter to the RocksetClient or the Configuration object.\u001b[39m\u001b[39m\"\u001b[39m\n\u001b[1;32m 244\u001b[0m )\n\u001b[1;32m 246\u001b[0m \u001b[39mself\u001b[39m\u001b[39m.\u001b[39mapi_client \u001b[39m=\u001b[39m ApiClient(config, max_workers\u001b[39m=\u001b[39mmax_workers)\n\u001b[1;32m 248\u001b[0m \u001b[39mself\u001b[39m\u001b[39m.\u001b[39mAliases \u001b[39m=\u001b[39m AliasesApiWrapper(\u001b[39mself\u001b[39m\u001b[39m.\u001b[39mapi_client)\n",
"\u001b[0;31mInitializationException\u001b[0m: The rockset client was initialized incorrectly: An api key must be provided as a parameter to the RocksetClient or the Configuration object."
]
}
],
"source": [
"import os\n",
"import rockset\n",
"\n",
"# Make sure env variable ROCKSET_API_KEY is set\n",
"ROCKSET_API_KEY = os.environ.get(\"ROCKSET_API_KEY\")\n",
"ROCKSET_API_SERVER = (\n",
" rockset.Regions.usw2a1\n",
") # Make sure this points to the correct Rockset region\n",
"ROCKSET_API_KEY = os.environ.get(\"ROCKSET_API_KEY\") # Verify ROCKSET_API_KEY environment variable\n",
"ROCKSET_API_SERVER = rockset.Regions.usw2a1 # Verify Rockset region\n",
"rockset_client = rockset.RocksetClient(ROCKSET_API_SERVER, ROCKSET_API_KEY)\n",
"\n",
"COLLECTION_NAME = \"langchain_demo\"\n",
"TEXT_KEY = \"description\"\n",
"EMBEDDING_KEY = \"description_embedding\""
"COLLECTION_NAME='langchain_demo'\n",
"TEXT_KEY='description'\n",
"EMBEDDING_KEY='description_embedding'"
]
},
{
"cell_type": "markdown",
"id": "474636a2",
"id": "07625be2",
"metadata": {},
"source": [
"Now let's use this client to create a Rockset Langchain Vectorstore!\n",
"\n",
"### 1. Inserting texts"
"### 2. Prepare Documents"
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "0d73c5bb",
"id": "9740d8c4",
"metadata": {},
"outputs": [],
"outputs": [
{
"ename": "",
"evalue": "",
"output_type": "error",
"traceback": [
"\u001b[1;31mRunning cells with '/opt/local/bin/python3.11' requires the ipykernel package.\n",
"\u001b[1;31mRun the following command to install 'ipykernel' into the Python environment. \n",
"\u001b[1;31mCommand: '/opt/local/bin/python3.11 -m pip install ipykernel -U --user --force-reinstall'"
]
}
],
"source": [
"from langchain.embeddings.openai import OpenAIEmbeddings\n",
"from langchain.text_splitter import CharacterTextSplitter\n",
"from langchain.document_loaders import TextLoader\n",
"from langchain.vectorstores import Rockset\n",
"\n",
"loader = TextLoader(\"../../../state_of_the_union.txt\")\n",
"loader = TextLoader('../../../state_of_the_union.txt')\n",
"documents = loader.load()\n",
"text_splitter = CharacterTextSplitter(chunk_size=1000, chunk_overlap=0)\n",
"docs = text_splitter.split_documents(documents)"
@@ -134,21 +144,31 @@
},
{
"cell_type": "markdown",
"id": "1404cada",
"id": "a068be18",
"metadata": {},
"source": [
"Now we have the documents we want to insert. Let's create a Rockset vectorstore and insert these docs into the Rockset collection. We will use `OpenAIEmbeddings` to create embeddings for the texts, but you're free to use whatever you want."
"### 3. Insert Documents"
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "63c98bac",
"id": "85b6a6c5",
"metadata": {},
"outputs": [],
"outputs": [
{
"ename": "",
"evalue": "",
"output_type": "error",
"traceback": [
"\u001b[1;31mRunning cells with '/opt/local/bin/python3.11' requires the ipykernel package.\n",
"\u001b[1;31mRun the following command to install 'ipykernel' into the Python environment. \n",
"\u001b[1;31mCommand: '/opt/local/bin/python3.11 -m pip install ipykernel -U --user --force-reinstall'"
]
}
],
"source": [
"# Make sure the environment variable OPENAI_API_KEY is set up\n",
"embeddings = OpenAIEmbeddings()\n",
"embeddings = OpenAIEmbeddings() # Verify OPENAI_KEY environment variable\n",
"\n",
"docsearch = Rockset(\n",
" client=rockset_client,\n",
@@ -158,30 +178,38 @@
" embedding_key=EMBEDDING_KEY,\n",
")\n",
"\n",
"ids = docsearch.add_texts(\n",
"ids=docsearch.add_texts(\n",
" texts=[d.page_content for d in docs],\n",
" metadatas=[d.metadata for d in docs],\n",
")\n",
"\n",
"## If you go to the Rockset console now, you should be able to see this docs along with the metadata `source`"
")"
]
},
{
"cell_type": "markdown",
"id": "f1290844",
"id": "56eef48d",
"metadata": {},
"source": [
"### 2. Searching similar texts\n",
"\n",
"Now let's try to search Rockset to find strings similar to our query string!"
"### 4. Search for Similar Documents"
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "96e73ac1",
"execution_count": 1,
"id": "0bbf3df0",
"metadata": {},
"outputs": [],
"outputs": [
{
"ename": "NameError",
"evalue": "name 'docsearch' is not defined",
"output_type": "error",
"traceback": [
"\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
"\u001b[0;31mNameError\u001b[0m Traceback (most recent call last)",
"Cell \u001b[0;32mIn[1], line 2\u001b[0m\n\u001b[1;32m 1\u001b[0m query \u001b[39m=\u001b[39m \u001b[39m\"\u001b[39m\u001b[39mWhat did the president say about Ketanji Brown Jackson?\u001b[39m\u001b[39m\"\u001b[39m\n\u001b[0;32m----> 2\u001b[0m output \u001b[39m=\u001b[39m docsearch\u001b[39m.\u001b[39msimilarity_search_with_relevance_scores(query, \u001b[39m4\u001b[39m, Rockset\u001b[39m.\u001b[39mDistanceFunction\u001b[39m.\u001b[39mCOSINE_SIM)\n\u001b[1;32m 4\u001b[0m \u001b[39mprint\u001b[39m(\u001b[39m\"\u001b[39m\u001b[39moutput length:\u001b[39m\u001b[39m\"\u001b[39m, \u001b[39mlen\u001b[39m(output))\n\u001b[1;32m 5\u001b[0m \u001b[39mfor\u001b[39;00m d, dist \u001b[39min\u001b[39;00m output:\n",
"\u001b[0;31mNameError\u001b[0m: name 'docsearch' is not defined"
]
}
],
"source": [
"query = \"What did the president say about Ketanji Brown Jackson\"\n",
"output = docsearch.similarity_search_with_relevance_scores(\n",
@@ -189,7 +217,7 @@
")\n",
"print(\"output length:\", len(output))\n",
"for d, dist in output:\n",
" print(dist, d.metadata, d.page_content[:20] + \"...\")\n",
" print(dist, d.metadata, d.page_content[:20] + '...')\n",
"\n",
"##\n",
"# output length: 4\n",
@@ -201,20 +229,16 @@
},
{
"cell_type": "markdown",
"id": "5e15d630",
"id": "7037a22f",
"metadata": {},
"source": [
"You can also use a where filter to prune your search space. You can add filters on text key, or any of the metadata fields. \n",
"\n",
"> **Note**: Since Rockset stores each metadata field as a separate column internally, these filters are much faster than other vector databases which store all metadata as a single JSON.\n",
"\n",
"For eg, to find all texts NOT containing the substring \"and\", you can use the following code:"
"### 5. Search for Similar Documents with Filtering"
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "c1c44d41",
"id": "b64a290f",
"metadata": {},
"outputs": [],
"source": [
@@ -226,7 +250,7 @@
")\n",
"print(\"output length:\", len(output))\n",
"for d, dist in output:\n",
" print(dist, d.metadata, d.page_content[:20] + \"...\")\n",
" print(dist, d.metadata, d.page_content[:20] + '...')\n",
"\n",
"##\n",
"# output length: 4\n",
@@ -239,12 +263,13 @@
{
"attachments": {},
"cell_type": "markdown",
"id": "0765b822",
"id": "13a52b38",
"metadata": {},
"source": [
"### 3. [Optional] Drop all inserted documents\n",
"### 6. [Optional] Delete Inserted Documents\n",
"\n",
"In order to delete texts from the Rockset collection, you need to know the unique ID associated with each document inside Rockset. These ids can either be supplied directly by the user while inserting the texts (in the `Rockset.add_texts()` function), else Rockset will generate a unique ID or each document. Either way, `Rockset.add_texts()` returns the ids for the inserted documents.\n",
"You must have the unique ID associated with each document to delete them from your collection.\n",
"Define IDs when inserting documents with `Rockset.add_texts()`. Rockset will otherwise generate a unique ID for each document. Regardless, `Rockset.add_texts()` returns the IDs of inserted documents.\n",
"\n",
"To delete these docs, simply use the `Rockset.delete_texts()` function."
]
@@ -252,7 +277,7 @@
{
"cell_type": "code",
"execution_count": null,
"id": "31738966",
"id": "1f755924",
"metadata": {},
"outputs": [],
"source": [
@@ -261,23 +286,15 @@
},
{
"cell_type": "markdown",
"id": "03fa12a9",
"id": "d468f431",
"metadata": {},
"source": [
"## Congratulations!\n",
"## Summary\n",
"\n",
"Voila! In this example you successfuly created a Rockset collection, inserted documents along with their OpenAI vector embeddings, and searched for similar docs both with and without any metadata filters.\n",
"In this tutorial, we successfully created a `Rockset` collection, `inserted` documents with OpenAI embeddings, and searched for similar documents with and without metadata filters.\n",
"\n",
"Keep an eye on https://rockset.com/blog/introducing-vector-search-on-rockset/ for future updates in this space!"
"Keep an eye on https://rockset.com/ for future updates in this space."
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "2763dddb-e87d-4d3b-b0bf-c246b0573d87",
"metadata": {},
"outputs": [],
"source": []
}
],
"metadata": {
@@ -296,7 +313,7 @@
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.10.6"
"version": "3.9.6"
}
},
"nbformat": 4,

View File

@@ -1,274 +0,0 @@
{
"cells": [
{
"cell_type": "code",
"execution_count": 1,
"id": "9926203f",
"metadata": {},
"outputs": [],
"source": [
"import os\n",
"\n",
"os.environ[\"LANGCHAIN_TRACING_V2\"] = \"true\"\n",
"os.environ[\"LANGCHAIN_ENDPOINT\"] = \"https://api.smith.langchain.com\"\n",
"os.environ[\"LANGCHAIN_API_KEY\"] = \"\""
]
},
{
"cell_type": "code",
"execution_count": 2,
"id": "45bc4149",
"metadata": {},
"outputs": [],
"source": [
"agent_instructions = \"\"\"You are a helpful assistant. Help the user answer any questions.\n",
"\n",
"You have access to the following tools:\n",
"\n",
"{tools}\n",
"\n",
"In order to use a tool, you can use <tool></tool> and <tool_input></tool_input> tags. \\\n",
"You will then get back a response in the form <observation></observation>\n",
"For example, if you have a tool called 'search' that could run a google search, in order to search for the weather in SF you would respond:\n",
"\n",
"<tool>search</tool><tool_input>weather in SF</tool_input>\n",
"<observation>64 degrees</observation>\n",
"\n",
"When you are done, respond with a final answer between <final_answer></final_answer>. For example:\n",
"\n",
"<final_answer>The weather in SF is 64 degrees</final_answer>\n",
"\n",
"Begin!\n",
"\n",
"Question: {question}\"\"\""
]
},
{
"cell_type": "code",
"execution_count": 3,
"id": "4da4c0d2",
"metadata": {},
"outputs": [
{
"name": "stderr",
"output_type": "stream",
"text": [
"/Users/harrisonchase/.pyenv/versions/3.9.1/envs/langchain/lib/python3.9/site-packages/deeplake/util/check_latest_version.py:32: UserWarning: A newer version of deeplake (3.6.14) is available. It's recommended that you update to the latest version using `pip install -U deeplake`.\n",
" warnings.warn(\n"
]
}
],
"source": [
"from langchain.chat_models import ChatAnthropic\n",
"from langchain.prompts import ChatPromptTemplate, AIMessagePromptTemplate\n",
"from langchain.agents import tool"
]
},
{
"cell_type": "code",
"execution_count": 4,
"id": "b81e9120",
"metadata": {},
"outputs": [],
"source": [
"model = ChatAnthropic(model=\"claude-2\")"
]
},
{
"cell_type": "code",
"execution_count": 5,
"id": "5271f612",
"metadata": {},
"outputs": [],
"source": [
"prompt_template = ChatPromptTemplate.from_template(agent_instructions) + AIMessagePromptTemplate.from_template(\"{intermediate_steps}\")"
]
},
{
"cell_type": "code",
"execution_count": 6,
"id": "83780d81",
"metadata": {},
"outputs": [],
"source": [
"chain = prompt_template | model.bind(stop=[\"</tool_input>\", \"</final_answer>\"])"
]
},
{
"cell_type": "code",
"execution_count": 7,
"id": "c091d0e1",
"metadata": {},
"outputs": [],
"source": [
"@tool\n",
"def search(query: str) -> str:\n",
" \"\"\"Search things about current events.\"\"\"\n",
" return \"32 degrees\""
]
},
{
"cell_type": "code",
"execution_count": 8,
"id": "1e81b05d",
"metadata": {},
"outputs": [],
"source": [
"tool_list = [search]"
]
},
{
"cell_type": "code",
"execution_count": 9,
"id": "5f0d986f",
"metadata": {},
"outputs": [],
"source": [
"from langchain.agents import Tool, AgentExecutor, BaseSingleActionAgent\n",
"from typing import List, Tuple, Any, Union\n",
"from langchain.schema import AgentAction, AgentFinish\n",
"\n",
"\n",
"class AnthropicAgent(BaseSingleActionAgent):\n",
" \n",
" tools: List[Tool]\n",
" chain: Any\n",
"\n",
" @property\n",
" def input_keys(self):\n",
" return [\"input\"]\n",
"\n",
" def plan(\n",
" self, intermediate_steps: List[Tuple[AgentAction, str]], **kwargs: Any\n",
" ) -> Union[AgentAction, AgentFinish]:\n",
" \"\"\"Given input, decided what to do.\n",
"\n",
" Args:\n",
" intermediate_steps: Steps the LLM has taken to date,\n",
" along with observations\n",
" **kwargs: User inputs.\n",
"\n",
" Returns:\n",
" Action specifying what tool to use.\n",
" \"\"\"\n",
" log = \"\"\n",
" for action, observation in intermediate_steps:\n",
" log += f\"<tool>{action.tool}</tool><tool_input>{action.tool_input}</tool_input><observation>{observation}</observation>\"\n",
" tools = \"\"\n",
" for tool in self.tools:\n",
" tools += f\"{tool.name}: {tool.description}\\n\"\n",
" response = self.chain.invoke({\"intermediate_steps\": log, \"tools\": tools, \"question\": kwargs[\"input\"]})\n",
" if \"</tool>\" in response.content:\n",
" t, ti = response.content.split(\"</tool>\")\n",
" _t = t.split(\"<tool>\")[1]\n",
" _ti = ti.split(\"<tool_input>\")[1]\n",
" return AgentAction(tool=_t, tool_input=_ti, log=response.content)\n",
" elif \"<final_answer>\" in response.content:\n",
" t, ti = response.content.split(\"<final_answer>\")\n",
" return AgentFinish(return_values={\"output\": ti}, log=response.content)\n",
" else:\n",
" raise ValueError\n",
"\n",
" async def aplan(\n",
" self, intermediate_steps: List[Tuple[AgentAction, str]], **kwargs: Any\n",
" ) -> Union[AgentAction, AgentFinish]:\n",
" \"\"\"Given input, decided what to do.\n",
"\n",
" Args:\n",
" intermediate_steps: Steps the LLM has taken to date,\n",
" along with observations\n",
" **kwargs: User inputs.\n",
"\n",
" Returns:\n",
" Action specifying what tool to use.\n",
" \"\"\"\n",
" raise ValueError"
]
},
{
"cell_type": "code",
"execution_count": 10,
"id": "315361c5",
"metadata": {},
"outputs": [],
"source": [
"agent = AnthropicAgent(tools=tool_list, chain=chain)"
]
},
{
"cell_type": "code",
"execution_count": 11,
"id": "bca6096f",
"metadata": {},
"outputs": [],
"source": [
"agent_executor = AgentExecutor(agent=agent, tools=tool_list, verbose=True)"
]
},
{
"cell_type": "code",
"execution_count": 12,
"id": "71b872b1",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"\n",
"\n",
"\u001b[1m> Entering new AgentExecutor chain...\u001b[0m\n",
"\u001b[32;1m\u001b[1;3m <tool>search</tool>\n",
"<tool_input>weather in new york\u001b[0m\u001b[36;1m\u001b[1;3m32 degrees\u001b[0m\u001b[32;1m\u001b[1;3m\n",
"\n",
"<final_answer>The weather in New York is 32 degrees\u001b[0m\n",
"\n",
"\u001b[1m> Finished chain.\u001b[0m\n"
]
},
{
"data": {
"text/plain": [
"'The weather in New York is 32 degrees'"
]
},
"execution_count": 12,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"agent_executor.run(\"whats the weather in New york?\")"
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "cca87246",
"metadata": {},
"outputs": [],
"source": []
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 3 (ipykernel)",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.9.1"
}
},
"nbformat": 4,
"nbformat_minor": 5
}

View File

@@ -0,0 +1,149 @@
{
"cells": [
{
"cell_type": "markdown",
"id": "3c284df8",
"metadata": {},
"source": [
"# XML Agent\n",
"\n",
"Some language models (like Anthropic's Claude) are particularly good at reasoning/writing XML. This goes over how to use an agent that uses XML when prompting. "
]
},
{
"cell_type": "code",
"execution_count": 3,
"id": "f9d2ead2",
"metadata": {},
"outputs": [],
"source": [
"from langchain.agents import XMLAgent, tool, AgentExecutor\n",
"from langchain.chat_models import ChatAnthropic\n",
"from langchain.chains import LLMChain"
]
},
{
"cell_type": "code",
"execution_count": 4,
"id": "ebadf04f",
"metadata": {},
"outputs": [],
"source": [
"model = ChatAnthropic(model=\"claude-2\")"
]
},
{
"cell_type": "code",
"execution_count": 5,
"id": "6ce9f9a5",
"metadata": {},
"outputs": [],
"source": [
"@tool\n",
"def search(query: str) -> str:\n",
" \"\"\"Search things about current events.\"\"\"\n",
" return \"32 degrees\""
]
},
{
"cell_type": "code",
"execution_count": 10,
"id": "c589944e",
"metadata": {},
"outputs": [],
"source": [
"tool_list = [search]"
]
},
{
"cell_type": "code",
"execution_count": 11,
"id": "2d8454be",
"metadata": {},
"outputs": [],
"source": [
"chain = LLMChain(\n",
" llm=model,\n",
" prompt=XMLAgent.get_default_prompt(),\n",
" output_parser=XMLAgent.get_default_output_parser()\n",
")\n",
"agent = XMLAgent(tools=tool_list, llm_chain=chain)"
]
},
{
"cell_type": "code",
"execution_count": 12,
"id": "bca6096f",
"metadata": {},
"outputs": [],
"source": [
"agent_executor = AgentExecutor(agent=agent, tools=tool_list, verbose=True)"
]
},
{
"cell_type": "code",
"execution_count": 13,
"id": "71b872b1",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"\n",
"\n",
"\u001b[1m> Entering new AgentExecutor chain...\u001b[0m\n",
"\u001b[32;1m\u001b[1;3m <tool>search</tool>\n",
"<tool_input>weather in New York\u001b[0m\u001b[36;1m\u001b[1;3m32 degrees\u001b[0m\u001b[32;1m\u001b[1;3m\n",
"\n",
"<final_answer>The weather in New York is 32 degrees\u001b[0m\n",
"\n",
"\u001b[1m> Finished chain.\u001b[0m\n"
]
},
{
"data": {
"text/plain": [
"'The weather in New York is 32 degrees'"
]
},
"execution_count": 13,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"agent_executor.run(\"whats the weather in New york?\")"
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "cca87246",
"metadata": {},
"outputs": [],
"source": []
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 3 (ipykernel)",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.9.1"
}
},
"nbformat": 4,
"nbformat_minor": 5
}

View File

@@ -10,11 +10,11 @@
},
{
"cell_type": "code",
"execution_count": null,
"execution_count": 1,
"metadata": {},
"outputs": [],
"source": [
"from langchain.graphs.neptune_graph import NeptuneGraph\n",
"from langchain.graphs import NeptuneGraph\n",
"\n",
"\n",
"host = \"<neptune-host>\"\n",
@@ -26,12 +26,23 @@
},
{
"cell_type": "code",
"execution_count": null,
"execution_count": 3,
"metadata": {},
"outputs": [],
"outputs": [
{
"data": {
"text/plain": [
"'The Austin airport has 98 outgoing routes.'"
]
},
"execution_count": 3,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"from langchain.chat_models import ChatOpenAI\n",
"from langchain.chains.graph_qa.neptune_cypher import NeptuneOpenCypherQAChain\n",
"from langchain.chains import NeptuneOpenCypherQAChain\n",
"\n",
"llm = ChatOpenAI(temperature=0, model=\"gpt-4\")\n",
"\n",
@@ -42,8 +53,22 @@
}
],
"metadata": {
"kernelspec": {
"display_name": ".venv",
"language": "python",
"name": "python3"
},
"language_info": {
"name": "python"
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.9.13"
},
"orig_nbformat": 4
},

View File

@@ -6,7 +6,7 @@
"source": [
"# Tree of Thought (ToT) example\n",
"\n",
"The Tree of Thought (ToT) is a chain that allows you to query a Large Language Model (LLM) using the Tree of Thought technique. This is based on the papaer [\"Large Language Model Guided Tree-of-Thought\"](https://arxiv.org/pdf/2305.08291.pdf)"
"The Tree of Thought (ToT) is a chain that allows you to query a Large Language Model (LLM) using the Tree of Thought technique. This is based on the paper [\"Large Language Model Guided Tree-of-Thought\"](https://arxiv.org/pdf/2305.08291.pdf)"
]
},
{

View File

@@ -0,0 +1,206 @@
import json
from collections import defaultdict
from html.parser import HTMLParser
from typing import Any, DefaultDict, Dict, List, Optional
from langchain.callbacks.manager import (
CallbackManagerForLLMRun,
Callbacks,
)
from langchain.chat_models.anthropic import ChatAnthropic
from langchain.chat_models.base import BaseChatModel
from langchain.schema import (
ChatGeneration,
ChatResult,
LLMResult,
)
from langchain.schema.messages import (
AIMessage,
BaseMessage,
SystemMessage,
)
from pydantic import root_validator
prompt = """In addition to responding, you can use tools. \
You have access to the following tools.
{tools}
In order to use a tool, you can use <tool></tool> to specify the name, \
and the <tool_input></tool_input> tags to specify the parameters. \
Each parameter should be passed in as <$param_name>$value</$param_name>, \
Where $param_name is the name of the specific parameter, and $value \
is the value for that parameter.
You will then get back a response in the form <observation></observation>
For example, if you have a tool called 'search' that accepts a single \
parameter 'query' that could run a google search, in order to search \
for the weather in SF you would respond:
<tool>search</tool><tool_input><query>weather in SF</query></tool_input>
<observation>64 degrees</observation>"""
class TagParser(HTMLParser):
def __init__(self) -> None:
"""A heavy-handed solution, but it's fast for prototyping.
Might be re-implemented later to restrict scope to the limited grammar, and
more efficiency.
Uses an HTML parser to parse a limited grammar that allows
for syntax of the form:
INPUT -> JUNK? VALUE*
JUNK -> JUNK_CHARACTER+
JUNK_CHARACTER -> whitespace | ,
VALUE -> <IDENTIFIER>DATA</IDENTIFIER> | OBJECT
OBJECT -> <IDENTIFIER>VALUE+</IDENTIFIER>
IDENTIFIER -> [a-Z][a-Z0-9_]*
DATA -> .*
Interprets the data to allow repetition of tags and recursion
to support representation of complex types.
^ Just another approximately wrong grammar specification.
"""
super().__init__()
self.parse_data: DefaultDict[str, List[Any]] = defaultdict(list)
self.stack: List[DefaultDict[str, List[str]]] = [self.parse_data]
self.success = True
self.depth = 0
self.data: Optional[str] = None
def handle_starttag(self, tag: str, attrs: Any) -> None:
"""Hook when a new tag is encountered."""
self.depth += 1
self.stack.append(defaultdict(list))
self.data = None
def handle_endtag(self, tag: str) -> None:
"""Hook when a tag is closed."""
self.depth -= 1
top_of_stack = dict(self.stack.pop(-1)) # Pop the dictionary we don't need it
# If a lead node
is_leaf = self.data is not None
# Annoying to type here, code is tested, hopefully OK
value = self.data if is_leaf else top_of_stack
# Difficult to type this correctly with mypy (maybe impossible?)
# Can be nested indefinitely, so requires self referencing type
self.stack[-1][tag].append(value) # type: ignore
# Reset the data so we if we encounter a sequence of end tags, we
# don't confuse an outer end tag for belonging to a leaf node.
self.data = None
def handle_data(self, data: str) -> None:
"""Hook when handling data."""
stripped_data = data.strip()
# The only data that's allowed is whitespace or a comma surrounded by whitespace
if self.depth == 0 and stripped_data not in (",", ""):
# If this is triggered the parse should be considered invalid.
self.success = False
if stripped_data: # ignore whitespace-only strings
self.data = stripped_data
def _destrip(tool_input: Any) -> Any:
if isinstance(tool_input, dict):
return {k: _destrip(v) for k, v in tool_input.items()}
elif isinstance(tool_input, list):
if isinstance(tool_input[0], str):
if len(tool_input) == 1:
return tool_input[0]
else:
raise ValueError
elif isinstance(tool_input[0], dict):
return [_destrip(v) for v in tool_input]
else:
raise ValueError
else:
raise ValueError
class AnthropicFunctions(BaseChatModel):
model: ChatAnthropic
@root_validator(pre=True)
def validate_environment(cls, values: Dict) -> Dict:
return {"model": ChatAnthropic(**values)}
def _generate(
self,
messages: List[BaseMessage],
stop: Optional[List[str]] = None,
run_manager: Optional[CallbackManagerForLLMRun] = None,
**kwargs: Any,
) -> ChatResult:
forced = False
function_call = ""
if "functions" in kwargs:
content = prompt.format(tools=json.dumps(kwargs["functions"], indent=2))
system = SystemMessage(content=content)
messages = [system] + messages
del kwargs["functions"]
if stop is None:
stop = ["</tool_input>"]
else:
stop.append("</tool_input>")
if "function_call" in kwargs:
forced = True
function_call = kwargs["function_call"]["name"]
AIMessage(content=f"<tool>{function_call}</tool>")
del kwargs["function_call"]
else:
if "function_call" in kwargs:
raise ValueError(
"if `function_call` provided, `functions` must also be"
)
response = self.model.predict_messages(
messages, stop=stop, callbacks=run_manager, **kwargs
)
completion = response.content
if forced:
tag_parser = TagParser()
tag_parser.feed(completion.strip() + "</tool_input>")
v1 = tag_parser.parse_data["tool_input"][0]
kwargs = {
"function_call": {
"name": function_call,
"arguments": json.dumps(_destrip(v1)),
}
}
message = AIMessage(content="", additional_kwargs=kwargs)
return ChatResult(generations=[ChatGeneration(message=message)])
elif "<tool>" in completion:
tag_parser = TagParser()
tag_parser.feed(completion.strip() + "</tool_input>")
msg = completion.split("<tool>")[0]
v1 = tag_parser.parse_data["tool_input"][0]
kwargs = {
"function_call": {
"name": tag_parser.parse_data["tool"][0],
"arguments": json.dumps(_destrip(v1)),
}
}
message = AIMessage(content=msg, additional_kwargs=kwargs)
return ChatResult(generations=[ChatGeneration(message=message)])
else:
return ChatResult(generations=[ChatGeneration(message=response)])
async def agenerate(
self,
messages: List[List[BaseMessage]],
stop: Optional[List[str]] = None,
callbacks: Callbacks = None,
*,
tags: Optional[List[str]] = None,
metadata: Optional[Dict[str, Any]] = None,
**kwargs: Any,
) -> LLMResult:
raise NotImplementedError
@property
def _llm_type(self) -> str:
return "anthropic_functions"

View File

@@ -1,6 +1,6 @@
[tool.poetry]
name = "langchain-experimental"
version = "0.0.7"
version = "0.0.8"
description = "Building applications with LLMs through composability"
authors = []
license = "MIT"

View File

@@ -34,6 +34,7 @@ from langchain.chains.graph_qa.cypher import GraphCypherQAChain
from langchain.chains.graph_qa.hugegraph import HugeGraphQAChain
from langchain.chains.graph_qa.kuzu import KuzuQAChain
from langchain.chains.graph_qa.nebulagraph import NebulaGraphQAChain
from langchain.chains.graph_qa.neptune_cypher import NeptuneOpenCypherQAChain
from langchain.chains.graph_qa.sparql import GraphSparqlQAChain
from langchain.chains.hyde.base import HypotheticalDocumentEmbedder
from langchain.chains.llm import LLMChain
@@ -101,6 +102,7 @@ __all__ = [
"MultiRouteChain",
"NatBotChain",
"NebulaGraphQAChain",
"NeptuneOpenCypherQAChain",
"OpenAIModerationChain",
"OpenAPIEndpointChain",
"QAGenerationChain",

View File

@@ -26,23 +26,15 @@ default_header_template = {
class AsyncHtmlLoader(BaseLoader):
"""Loads HTML asynchronously."""
web_paths: List[str]
requests_per_second: int = 2
"""Max number of concurrent requests to make."""
requests_kwargs: Dict[str, Any] = {}
"""kwargs for requests"""
raise_for_status: bool = False
"""Raise an exception if http status code denotes an error."""
def __init__(
self,
web_path: Union[str, List[str]],
header_template: Optional[dict] = None,
verify_ssl: Optional[bool] = True,
proxies: Optional[dict] = None,
requests_per_second: int = 2,
requests_kwargs: Dict[str, Any] = {},
raise_for_status: bool = False,
):
"""Initialize with webpage path."""
@@ -74,6 +66,10 @@ class AsyncHtmlLoader(BaseLoader):
if proxies:
self.session.proxies.update(proxies)
self.requests_per_second = requests_per_second
self.requests_kwargs = requests_kwargs
self.raise_for_status = raise_for_status
async def _fetch(
self, url: str, retries: int = 3, cooldown: int = 2, backoff: float = 1.5
) -> str:
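A minimal construction sketch for the new `requests_kwargs` and `raise_for_status` parameters, assuming the loader is exported from `langchain.document_loaders`; the URLs and kwargs are placeholders:

```python
from langchain.document_loaders import AsyncHtmlLoader

# requests_kwargs is forwarded to the underlying HTTP requests; raise_for_status=True
# turns error status codes into exceptions instead of returning the error page body.
loader = AsyncHtmlLoader(
    ["https://example.com", "https://example.org"],
    requests_kwargs={"timeout": 10},  # placeholder kwargs
    raise_for_status=True,
)
docs = loader.load()
```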

View File

@@ -49,7 +49,18 @@ class GitLoader(BaseLoader):
if not os.path.exists(self.repo_path) and self.clone_url is None:
raise ValueError(f"Path {self.repo_path} does not exist")
elif self.clone_url:
repo = Repo.clone_from(self.clone_url, self.repo_path)
# If the repo_path already contains a git repository, verify that it's the
# same repository as the one we're trying to clone.
if os.path.isdir(os.path.join(self.repo_path, ".git")):
repo = Repo(self.repo_path)
# If the existing repository is not the same as the one we're trying to
# clone, raise an error.
if repo.remotes.origin.url != self.clone_url:
raise ValueError(
"A different repository is already cloned at this path."
)
else:
repo = Repo.clone_from(self.clone_url, self.repo_path)
repo.git.checkout(self.branch)
else:
repo = Repo(self.repo_path)
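A sketch of the behaviour this change enables: repeated `load()` calls against the same clone URL reuse the existing checkout, while pointing a different URL at an already-cloned path fails fast. The paths and URLs below are placeholders:

```python
from langchain.document_loaders import GitLoader

loader = GitLoader(
    repo_path="./example_data/test_repo",          # placeholder path
    clone_url="https://github.com/example/repo",   # placeholder URL
    branch="main",
)
docs = loader.load()  # clones on the first call
docs = loader.load()  # previously raised; now reuses the existing clone

other = GitLoader(
    repo_path="./example_data/test_repo",
    clone_url="https://github.com/example/other-repo",
)
# other.load()  # raises ValueError: a different repository is already cloned at this path
```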

View File

@@ -469,7 +469,7 @@ class ChatPromptTemplate(BaseChatPromptTemplate, ABC):
Examples:
Instantiation from a list of role strings and templates:
Instantiation from a list of message templates:
.. code-block:: python
@@ -488,18 +488,6 @@ class ChatPromptTemplate(BaseChatPromptTemplate, ABC):
("human", "Hello, how are you?"),
])
Instantiation from a list message templates:
.. code-block:: python
template = ChatPromptTemplate.from_messages([
("human", "Hello, how are you?"),
("ai", "I'm doing well, thanks!"),
("human", "That's good to hear."),
])
Args:
messages: sequence of message representations.
A message can be represented using the following formats:

View File

@@ -190,12 +190,9 @@ class FewShotChatMessagePromptTemplate(
.. code-block:: python
from langchain.schema import SystemMessage
from langchain.prompts import (
FewShotChatMessagePromptTemplate,
HumanMessagePromptTemplate,
SystemMessagePromptTemplate,
AIMessagePromptTemplate
ChatPromptTemplate
)
examples = [
@@ -203,24 +200,23 @@ class FewShotChatMessagePromptTemplate(
{"input": "2+3", "output": "5"},
]
example_prompt = ChatPromptTemplate.from_messages(
[('human', '{input}'), ('ai', '{output}')]
)
few_shot_prompt = FewShotChatMessagePromptTemplate(
examples=examples,
# This is a prompt template used to format each individual example.
example_prompt=(
HumanMessagePromptTemplate.from_template("{input}")
+ AIMessagePromptTemplate.from_template("{output}")
),
example_prompt=example_prompt,
)
final_prompt = (
SystemMessagePromptTemplate.from_template(
"You are a helpful AI Assistant"
)
+ few_shot_prompt
+ HumanMessagePromptTemplate.from_template("{input}")
final_prompt = ChatPromptTemplate.from_messages(
[
('system', 'You are a helpful AI Assistant'),
few_shot_prompt,
('human', '{input}'),
]
)
final_prompt.format(input="What is 4+4?")
Prompt template with dynamically selected examples:

View File

@@ -34,18 +34,18 @@ class SearchQueries(BaseModel):
DEFAULT_LLAMA_SEARCH_PROMPT = PromptTemplate(
input_variables=["question"],
template="""<<SYS>> \n You are an assistant tasked with improving Google search
results. \n <</SYS>> \n\n [INST] Generate THREE Google search queries that
are similar to this question. The output should be a numbered list of questions
and each should have a question mark at the end: \n\n {question} [/INST]""",
template="""<<SYS>> \n You are an assistant tasked with improving Google search \
results. \n <</SYS>> \n\n [INST] Generate THREE Google search queries that \
are similar to this question. The output should be a numbered list of questions \
and each should have a question mark at the end: \n\n {question} [/INST]""",
)
DEFAULT_SEARCH_PROMPT = PromptTemplate(
input_variables=["question"],
template="""You are an assistant tasked with improving Google search
results. Generate THREE Google search queries that are similar to
this question. The output should be a numbered list of questions and each
should have a question mark at the end: {question}""",
template="""You are an assistant tasked with improving Google search \
results. Generate THREE Google search queries that are similar to \
this question. The output should be a numbered list of questions and each \
should have a question mark at the end: {question}""",
)
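The trailing backslashes added above are ordinary escape-the-newline continuations inside the triple-quoted strings, so wrapping the source lines no longer leaves stray newlines in the rendered prompt text. A tiny illustration:

```python
without_continuation = """You are an assistant tasked with improving Google search
results."""
with_continuation = """You are an assistant tasked with improving Google search \
results."""

print(repr(without_continuation))  # '...Google search\nresults.'
print(repr(with_continuation))     # '...Google search results.'
```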

View File

@@ -108,6 +108,10 @@ class Runnable(Generic[Input, Output], ABC):
) -> List[Output]:
configs = self._get_config_list(config, len(inputs))
# If there's only one input, don't bother with the executor
if len(inputs) == 1:
return [self.invoke(inputs[0], configs[0])]
with ThreadPoolExecutor(max_workers=max_concurrency) as executor:
return list(executor.map(self.invoke, inputs, configs))
@@ -759,6 +763,140 @@ class RunnableBinding(Serializable, Runnable[Input, Output]):
yield item
class RouterInput(TypedDict):
key: str
input: Any
class RouterRunnable(
Serializable, Generic[Input, Output], Runnable[RouterInput, Output]
):
runnables: Mapping[str, Runnable[Input, Output]]
def __init__(self, runnables: Mapping[str, Runnable[Input, Output]]) -> None:
super().__init__(runnables=runnables)
class Config:
arbitrary_types_allowed = True
@property
def lc_serializable(self) -> bool:
return True
def __or__(
self,
other: Union[
Runnable[Any, Other],
Callable[[Any], Other],
Mapping[str, Union[Runnable[Any, Other], Callable[[Any], Other]]],
Mapping[str, Any],
],
) -> RunnableSequence[RouterInput, Other]:
return RunnableSequence(first=self, last=_coerce_to_runnable(other))
def __ror__(
self,
other: Union[
Runnable[Other, Any],
Callable[[Any], Other],
Mapping[str, Union[Runnable[Other, Any], Callable[[Other], Any]]],
Mapping[str, Any],
],
) -> RunnableSequence[Other, Output]:
return RunnableSequence(first=_coerce_to_runnable(other), last=self)
def invoke(
self, input: RouterInput, config: Optional[RunnableConfig] = None
) -> Output:
key = input["key"]
actual_input = input["input"]
if key not in self.runnables:
raise ValueError(f"No runnable associated with key '{key}'")
runnable = self.runnables[key]
return runnable.invoke(actual_input, config)
async def ainvoke(
self, input: RouterInput, config: Optional[RunnableConfig] = None
) -> Output:
key = input["key"]
actual_input = input["input"]
if key not in self.runnables:
raise ValueError(f"No runnable associated with key '{key}'")
runnable = self.runnables[key]
return await runnable.ainvoke(actual_input, config)
def batch(
self,
inputs: List[RouterInput],
config: Optional[Union[RunnableConfig, List[RunnableConfig]]] = None,
*,
max_concurrency: Optional[int] = None,
) -> List[Output]:
keys = [input["key"] for input in inputs]
actual_inputs = [input["input"] for input in inputs]
if any(key not in self.runnables for key in keys):
raise ValueError("One or more keys do not have a corresponding runnable")
runnables = [self.runnables[key] for key in keys]
configs = self._get_config_list(config, len(inputs))
with ThreadPoolExecutor(max_workers=max_concurrency) as executor:
return list(
executor.map(
lambda runnable, input, config: runnable.invoke(input, config),
runnables,
actual_inputs,
configs,
)
)
async def abatch(
self,
inputs: List[RouterInput],
config: Optional[Union[RunnableConfig, List[RunnableConfig]]] = None,
*,
max_concurrency: Optional[int] = None,
) -> List[Output]:
keys = [input["key"] for input in inputs]
actual_inputs = [input["input"] for input in inputs]
if any(key not in self.runnables for key in keys):
raise ValueError("One or more keys do not have a corresponding runnable")
runnables = [self.runnables[key] for key in keys]
configs = self._get_config_list(config, len(inputs))
return await _gather_with_concurrency(
max_concurrency,
*(
runnable.ainvoke(input, config)
for runnable, input, config in zip(runnables, actual_inputs, configs)
),
)
def stream(
self, input: RouterInput, config: Optional[RunnableConfig] = None
) -> Iterator[Output]:
key = input["key"]
actual_input = input["input"]
if key not in self.runnables:
raise ValueError(f"No runnable associated with key '{key}'")
runnable = self.runnables[key]
yield from runnable.stream(actual_input, config)
async def astream(
self, input: RouterInput, config: Optional[RunnableConfig] = None
) -> AsyncIterator[Output]:
key = input["key"]
actual_input = input["input"]
if key not in self.runnables:
raise ValueError(f"No runnable associated with key '{key}'")
runnable = self.runnables[key]
async for output in runnable.astream(actual_input, config):
yield output
def _patch_config(
config: RunnableConfig, callback_manager: BaseCallbackManager
) -> RunnableConfig:
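The new `RouterRunnable` dispatches a `{"key": ..., "input": ...}` payload to one of several named runnables. A minimal sketch mirroring the unit test further below; `FakeListLLM` is a fake model used purely as a stand-in, and its import path is an assumption:

```python
from langchain.llms.fake import FakeListLLM  # assumed import path for the fake model
from langchain.prompts import ChatPromptTemplate
from langchain.schema.runnable import RouterRunnable

math_chain = ChatPromptTemplate.from_template(
    "You are a math genius. Answer the question: {question}"
) | FakeListLLM(responses=["4"])
english_chain = ChatPromptTemplate.from_template(
    "You are an english major. Answer the question: {question}"
) | FakeListLLM(responses=["2"])

router = RouterRunnable({"math": math_chain, "english": english_chain})

# The routing key selects the runnable; the nested "input" is passed to it.
print(router.invoke({"key": "math", "input": {"question": "2 + 2"}}))  # "4"
print(router.batch([
    {"key": "math", "input": {"question": "2 + 2"}},
    {"key": "english", "input": {"question": "2 + 2"}},
]))  # ["4", "2"]
```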

View File

@@ -280,7 +280,9 @@ class VectorStore(ABC):
# This is a temporary workaround to make the similarity search
# asynchronous. The proper solution is to make the similarity search
# asynchronous in the vector store implementations.
func = partial(self.similarity_search_with_relevance_scores, query, k, **kwargs)
func = partial(
self.similarity_search_with_relevance_scores, query, k=k, **kwargs
)
return await asyncio.get_event_loop().run_in_executor(None, func)
async def asimilarity_search(
@@ -291,7 +293,7 @@ class VectorStore(ABC):
# This is a temporary workaround to make the similarity search
# asynchronous. The proper solution is to make the similarity search
# asynchronous in the vector store implementations.
func = partial(self.similarity_search, query, k, **kwargs)
func = partial(self.similarity_search, query, k=k, **kwargs)
return await asyncio.get_event_loop().run_in_executor(None, func)
def similarity_search_by_vector(
@@ -316,7 +318,7 @@ class VectorStore(ABC):
# This is a temporary workaround to make the similarity search
# asynchronous. The proper solution is to make the similarity search
# asynchronous in the vector store implementations.
func = partial(self.similarity_search_by_vector, embedding, k, **kwargs)
func = partial(self.similarity_search_by_vector, embedding, k=k, **kwargs)
return await asyncio.get_event_loop().run_in_executor(None, func)
def max_marginal_relevance_search(
@@ -359,7 +361,12 @@ class VectorStore(ABC):
# asynchronous. The proper solution is to make the similarity search
# asynchronous in the vector store implementations.
func = partial(
self.max_marginal_relevance_search, query, k, fetch_k, lambda_mult, **kwargs
self.max_marginal_relevance_search,
query,
k=k,
fetch_k=fetch_k,
lambda_mult=lambda_mult,
**kwargs,
)
return await asyncio.get_event_loop().run_in_executor(None, func)
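Binding `k`, `fetch_k`, and `lambda_mult` by keyword in `functools.partial` means the wrapped sync call no longer depends on subclasses keeping the exact positional parameter order. A small, self-contained illustration; the class names are illustrative only:

```python
from functools import partial


class Base:
    def search(self, query, k=4, **kwargs):
        return f"base: query={query!r}, k={k}"


class Subclass(Base):
    # A subclass that inserts an extra parameter after `query`.
    def search(self, query, filter=None, k=4, **kwargs):
        return f"sub: query={query!r}, filter={filter!r}, k={k}"


store = Subclass()
print(partial(store.search, "cats", 4)())    # positional: 4 lands in `filter`
print(partial(store.search, "cats", k=4)())  # keyword: 4 lands in `k` as intended
```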

View File

@@ -40,7 +40,7 @@ def dependable_faiss_import(no_avx2: Optional[bool] = None) -> Any:
except ImportError:
raise ImportError(
"Could not import faiss python package. "
"Please install it with `pip install faiss` "
"Please install it with `pip install faiss-gpu` (for CUDA supported GPU) "
"or `pip install faiss-cpu` (depending on Python version)."
)
return faiss
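The reworded message points at the two published wheels. A short sketch of how the guard is typically exercised, with the install commands shown as comments per the message above:

```python
# pip install faiss-cpu   # CPU-only build
# pip install faiss-gpu   # CUDA-enabled build
from langchain.vectorstores.faiss import dependable_faiss_import

faiss = dependable_faiss_import()  # raises the ImportError above if neither wheel is installed
```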

View File

@@ -23,7 +23,6 @@ class Rockset(VectorStore):
See: https://rockset.com/blog/introducing-vector-search-on-rockset/ for more details
Everything below assumes `commons` Rockset workspace.
TODO: Add support for workspace args.
Example:
.. code-block:: python
@@ -50,6 +49,7 @@ class Rockset(VectorStore):
collection_name: str,
text_key: str,
embedding_key: str,
workspace: str = "commons",
):
"""Initialize with Rockset client.
Args:
@@ -82,6 +82,7 @@ class Rockset(VectorStore):
self._embeddings = embeddings
self._text_key = text_key
self._embedding_key = embedding_key
self._workspace = workspace
@property
def embeddings(self) -> Embeddings:
@@ -303,7 +304,7 @@ class Rockset(VectorStore):
where_str = f"WHERE {where_str}\n" if where_str else ""
return f"""\
SELECT * EXCEPT({self._embedding_key}), {distance_str}
FROM {self._collection_name}
FROM {self._workspace}.{self._collection_name}
{where_str}\
ORDER BY dist {distance_func.order_by()}
LIMIT {str(k)}
@@ -311,7 +312,7 @@ LIMIT {str(k)}
def _write_documents_to_rockset(self, batch: List[dict]) -> List[str]:
add_doc_res = self._client.Documents.add_documents(
collection=self._collection_name, data=batch
collection=self._collection_name, data=batch, workspace=self._workspace
)
return [doc_status._id for doc_status in add_doc_res.data]
@@ -328,4 +329,5 @@ LIMIT {str(k)}
self._client.Documents.delete_documents(
collection=self._collection_name,
data=[DeleteDocumentsRequestData(id=i) for i in ids],
workspace=self._workspace,
)
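With the new `workspace` argument, collections outside the default `commons` workspace can be used; generated SQL and document writes are qualified as `workspace.collection`. A minimal construction sketch; the credentials, embeddings, and names below are placeholders:

```python
import rockset

from langchain.embeddings import OpenAIEmbeddings
from langchain.vectorstores import Rockset

client = rockset.RocksetClient("<api-server-host>", "<api-key>")  # placeholder credentials
vectorstore = Rockset(
    client=client,
    embeddings=OpenAIEmbeddings(),          # any Embeddings implementation works
    collection_name="langchain_demo",
    text_key="description",
    embedding_key="description_embedding",
    workspace="langchain_tests",            # defaults to "commons" when omitted
)
```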

View File

@@ -3269,14 +3269,14 @@ smmap = ">=3.0.1,<6"
[[package]]
name = "gitpython"
version = "3.1.31"
version = "3.1.32"
description = "GitPython is a Python library used to interact with Git repositories"
category = "main"
optional = true
python-versions = ">=3.7"
files = [
{file = "GitPython-3.1.31-py3-none-any.whl", hash = "sha256:f04893614f6aa713a60cbbe1e6a97403ef633103cdd0ef5eb6efe0deb98dbe8d"},
{file = "GitPython-3.1.31.tar.gz", hash = "sha256:8ce3bcf69adfdf7c7d503e78fd3b1c492af782d58893b650adb2ac8912ddd573"},
{file = "GitPython-3.1.32-py3-none-any.whl", hash = "sha256:e3d59b1c2c6ebb9dfa7a184daf3b6dd4914237e7488a1730a6d8f6f5d0b4187f"},
{file = "GitPython-3.1.32.tar.gz", hash = "sha256:8d9b8cb1e80b9735e8717c9362079d3ce4c6e5ddeebedd0361b228c3a67a62f6"},
]
[package.dependencies]
@@ -4652,6 +4652,7 @@ optional = false
python-versions = ">=2.7, !=3.0.*, !=3.1.*, !=3.2.*, !=3.3.*, !=3.4.*, !=3.5.*, !=3.6.*"
files = [
{file = "jsonpointer-2.4-py2.py3-none-any.whl", hash = "sha256:15d51bba20eea3165644553647711d150376234112651b4f1811022aecad7d7a"},
{file = "jsonpointer-2.4.tar.gz", hash = "sha256:585cee82b70211fa9e6043b7bb89db6e1aa49524340dde8ad6b63206ea689d88"},
]
[[package]]
@@ -13229,7 +13230,7 @@ clarifai = ["clarifai"]
cohere = ["cohere"]
docarray = ["docarray"]
embeddings = ["sentence-transformers"]
extended-testing = ["atlassian-python-api", "beautifulsoup4", "bibtexparser", "cassio", "chardet", "esprima", "geopandas", "gql", "html2text", "jinja2", "jq", "lxml", "mwparserfromhell", "mwxml", "openai", "openai", "pandas", "pdfminer-six", "pgvector", "psychicapi", "py-trello", "pymupdf", "pypdf", "pypdfium2", "pyspark", "rank-bm25", "rapidfuzz", "requests-toolbelt", "scikit-learn", "streamlit", "sympy", "telethon", "tqdm", "xinference", "zep-python"]
extended-testing = ["atlassian-python-api", "beautifulsoup4", "bibtexparser", "cassio", "chardet", "esprima", "geopandas", "gitpython", "gql", "html2text", "jinja2", "jq", "lxml", "mwparserfromhell", "mwxml", "openai", "openai", "pandas", "pdfminer-six", "pgvector", "psychicapi", "py-trello", "pymupdf", "pypdf", "pypdfium2", "pyspark", "rank-bm25", "rapidfuzz", "requests-toolbelt", "scikit-learn", "streamlit", "sympy", "telethon", "tqdm", "xinference", "zep-python"]
javascript = ["esprima"]
llms = ["anthropic", "clarifai", "cohere", "huggingface_hub", "manifest-ml", "nlpcloud", "openai", "openllm", "openlm", "torch", "transformers", "xinference"]
openai = ["openai", "tiktoken"]
@@ -13239,4 +13240,4 @@ text-helpers = ["chardet"]
[metadata]
lock-version = "2.0"
python-versions = ">=3.8.1,<4.0"
content-hash = "5b1c718874d76c0e3b4023b2bceebe11a5e26e5e05d6797acf91b01b0438b2f7"
content-hash = "ef2b1d30e0fa872ce764c8a4cbc6e0a460bc9391a6465ee29d657e83b5459391"

View File

@@ -1,6 +1,6 @@
[tool.poetry]
name = "langchain"
version = "0.0.247"
version = "0.0.248"
description = "Building applications with LLMs through composability"
authors = []
license = "MIT"
@@ -126,6 +126,7 @@ amadeus = {version = ">=8.1.0", optional = true}
geopandas = {version = "^0.13.1", optional = true}
xinference = {version = "^0.0.6", optional = true}
python-arango = {version = "^7.5.9", optional = true}
gitpython = {version = "^3.1.32", optional = true}
[tool.poetry.group.test.dependencies]
# The only dependencies that should be added are
@@ -359,6 +360,7 @@ extended_testing = [
"geopandas",
"jinja2",
"xinference",
"gitpython",
]
[tool.ruff]

View File

@@ -34,12 +34,12 @@ def test_sql_query() -> None:
client = rockset.RocksetClient(host, api_key)
col_1 = "Rockset is a real-time analytics database which enables queries on massive, semi-structured data without operational burden. Rockset is serverless and fully managed. It offloads the work of managing configuration, cluster provisioning, denormalization, and shard / index management. Rockset is also SOC 2 Type II compliant and offers encryption at rest and in flight, securing and protecting any sensitive data. Most teams can ingest data into Rockset and start executing queries in less than 15 minutes." # noqa: E501
col_1 = "Rockset is a real-time analytics database"
col_2 = 2
col_3 = "e903e069-b0b5-4b80-95e2-86471b41f55f"
id = 7320132
"""Run a simple SQL query query"""
"""Run a simple SQL query"""
loader = RocksetLoader(
client,
rockset.models.QueryRequestSql(

View File

@@ -33,6 +33,7 @@ logger = logging.getLogger(__name__)
#
# See https://rockset.com/blog/introducing-vector-search-on-rockset/ for more details.
workspace = "langchain_tests"
collection_name = "langchain_demo"
text_key = "description"
embedding_key = "description_embedding"
@@ -71,10 +72,9 @@ class TestRockset:
"Deleting all existing documents from the Rockset collection %s",
collection_name,
)
query = f"select _id from {workspace}.{collection_name}"
query_response = client.Queries.query(
sql={"query": "select _id from {}".format(collection_name)}
)
query_response = client.Queries.query(sql={"query": query})
ids = [
str(r["_id"])
for r in getattr(
@@ -85,12 +85,13 @@ class TestRockset:
client.Documents.delete_documents(
collection=collection_name,
data=[rockset.models.DeleteDocumentsRequestData(id=i) for i in ids],
workspace=workspace,
)
embeddings = ConsistentFakeEmbeddings()
embeddings.embed_documents(fake_texts)
cls.rockset_vectorstore = Rockset(
client, embeddings, collection_name, text_key, embedding_key
client, embeddings, collection_name, text_key, embedding_key, workspace
)
def test_rockset_insert_and_search(self) -> None:
@@ -127,9 +128,9 @@ class TestRockset:
)
vector_str = ",".join(map(str, vector))
expected = f"""\
SELECT * EXCEPT(description_embedding), \
COSINE_SIM(description_embedding, [{vector_str}]) as dist
FROM langchain_demo
SELECT * EXCEPT({embedding_key}), \
COSINE_SIM({embedding_key}, [{vector_str}]) as dist
FROM {workspace}.{collection_name}
ORDER BY dist DESC
LIMIT 4
"""
@@ -145,9 +146,9 @@ LIMIT 4
)
vector_str = ",".join(map(str, vector))
expected = f"""\
SELECT * EXCEPT(description_embedding), \
COSINE_SIM(description_embedding, [{vector_str}]) as dist
FROM langchain_demo
SELECT * EXCEPT({embedding_key}), \
COSINE_SIM({embedding_key}, [{vector_str}]) as dist
FROM {workspace}.{collection_name}
WHERE age >= 10
ORDER BY dist DESC
LIMIT 4

View File

@@ -0,0 +1,2 @@
def test_import() -> None:
from langchain.chains import NeptuneOpenCypherQAChain # noqa: F401

View File

@@ -0,0 +1,65 @@
import os
import py
import pytest
from langchain.document_loaders import GitLoader
def init_repo(tmpdir: py.path.local, dir_name: str) -> str:
from git import Repo
repo_dir = tmpdir.mkdir(dir_name)
repo = Repo.init(repo_dir)
git = repo.git
git.checkout(b="main")
git.config("user.name", "Test User")
git.config("user.email", "test@example.com")
sample_file = "file.txt"
with open(os.path.join(repo_dir, sample_file), "w") as f:
f.write("content")
git.add([sample_file])
git.commit(m="Initial commit")
return repo_dir
@pytest.mark.requires("git")
def test_load_twice(tmpdir: py.path.local) -> None:
"""
Test that loading documents twice from the same repository does not raise an error.
"""
clone_url = init_repo(tmpdir, "remote_repo")
repo_path = tmpdir.mkdir("local_repo").strpath
loader = GitLoader(repo_path=repo_path, clone_url=clone_url)
documents = loader.load()
assert len(documents) == 1
documents = loader.load()
assert len(documents) == 1
@pytest.mark.requires("git")
def test_clone_different_repo(tmpdir: py.path.local) -> None:
"""
Test that trying to clone a different repository into a directory already
containing a clone raises a ValueError.
"""
clone_url = init_repo(tmpdir, "remote_repo")
repo_path = tmpdir.mkdir("local_repo").strpath
loader = GitLoader(repo_path=repo_path, clone_url=clone_url)
documents = loader.load()
assert len(documents) == 1
other_clone_url = init_repo(tmpdir, "other_remote_repo")
other_loader = GitLoader(repo_path=repo_path, clone_url=other_clone_url)
with pytest.raises(ValueError):
other_loader.load()

View File

@@ -0,0 +1,2 @@
def test_import() -> None:
from langchain.graphs import NeptuneGraph # noqa: F401

View File

@@ -1,6 +1,6 @@
"""Tests for the time-weighted retriever class."""
from datetime import datetime
from datetime import datetime, timedelta
from typing import Any, Iterable, List, Optional, Tuple, Type
import pytest
@@ -139,7 +139,11 @@ def test_get_salient_docs(
) -> None:
query = "Test query"
docs_and_scores = time_weighted_retriever.get_salient_docs(query)
want = [(doc, 0.5) for doc in _get_example_memories()]
assert isinstance(docs_and_scores, dict)
assert len(docs_and_scores) == len(want)
for k, doc in docs_and_scores.items():
assert doc in want
def test_get_relevant_documents(
@@ -147,7 +151,17 @@ def test_get_relevant_documents(
) -> None:
query = "Test query"
relevant_documents = time_weighted_retriever.get_relevant_documents(query)
want = [(doc, 0.5) for doc in _get_example_memories()]
assert isinstance(relevant_documents, list)
assert len(relevant_documents) == len(want)
now = datetime.now()
for doc in relevant_documents:
# assert that the last_accessed_at is close to now.
assert now - timedelta(hours=1) < doc.metadata["last_accessed_at"] <= now
# assert that the last_accessed_at in the memory stream is updated.
for d in time_weighted_retriever.memory_stream:
assert now - timedelta(hours=1) < d.metadata["last_accessed_at"] <= now
def test_add_documents(

File diff suppressed because one or more lines are too long

View File

@@ -23,6 +23,7 @@ from langchain.schema.document import Document
from langchain.schema.messages import AIMessage, HumanMessage, SystemMessage
from langchain.schema.retriever import BaseRetriever
from langchain.schema.runnable import (
RouterRunnable,
Runnable,
RunnableConfig,
RunnableLambda,
@@ -33,16 +34,38 @@ from langchain.schema.runnable import (
class FakeTracer(BaseTracer):
"""Fake tracer that records LangChain execution."""
"""Fake tracer that records LangChain execution.
It replaces run ids with deterministic UUIDs for snapshotting."""
def __init__(self) -> None:
"""Initialize the tracer."""
super().__init__()
self.runs: List[Run] = []
self.uuids_map: Dict[UUID, UUID] = {}
self.uuids_generator = (
UUID(f"00000000-0000-4000-8000-{i:012}", version=4) for i in range(10000)
)
def _replace_uuid(self, uuid: UUID) -> UUID:
if uuid not in self.uuids_map:
self.uuids_map[uuid] = next(self.uuids_generator)
return self.uuids_map[uuid]
def _copy_run(self, run: Run) -> Run:
return run.copy(
update={
"id": self._replace_uuid(run.id),
"parent_run_id": self.uuids_map[run.parent_run_id]
if run.parent_run_id
else None,
"child_runs": [self._copy_run(child) for child in run.child_runs],
}
)
def _persist_run(self, run: Run) -> None:
"""Persist a run."""
self.runs.append(run)
self.runs.append(self._copy_run(run))
class FakeRunnable(Runnable[str, int]):
@@ -78,20 +101,6 @@ class FakeRetriever(BaseRetriever):
return [Document(page_content="foo"), Document(page_content="bar")]
@pytest.fixture()
def fixed_uuids(mocker: MockerFixture) -> MockerFixture._Patcher:
"""Note this mock only works with `import uuid; uuid.uuid4()`,
it does not work with `from uuid import uuid4; uuid4()`."""
# Disable tracing to avoid fixed UUIDs causing tracing errors.
mocker.patch.dict("os.environ", {"LANGCHAIN_TRACING_V2": "false"})
side_effect = (
UUID(f"00000000-0000-4000-8000-{i:012}", version=4) for i in range(10000)
)
return mocker.patch("uuid.uuid4", side_effect=side_effect)
@pytest.mark.asyncio
async def test_default_method_implementations(mocker: MockerFixture) -> None:
fake = FakeRunnable()
@@ -206,13 +215,13 @@ async def test_prompt() -> None:
@pytest.mark.asyncio
@freeze_time("2023-01-01")
async def test_prompt_with_chat_model(
mocker: MockerFixture, snapshot: SnapshotAssertion, fixed_uuids: None
mocker: MockerFixture, snapshot: SnapshotAssertion
) -> None:
prompt = (
SystemMessagePromptTemplate.from_template("You are a nice assistant.")
+ "{question}"
)
chat = FakeListChatModel(responses=["foo", "bar"])
chat = FakeListChatModel(responses=["foo"])
chain = prompt | chat
@@ -251,7 +260,7 @@ async def test_prompt_with_chat_model(
],
dict(callbacks=[tracer]),
) == [
AIMessage(content="bar"),
AIMessage(content="foo"),
AIMessage(content="foo"),
]
assert prompt_spy.call_args.args[1] == [
@@ -272,7 +281,16 @@ async def test_prompt_with_chat_model(
]
),
]
assert tracer.runs == snapshot
assert (
len(
[
r
for r in tracer.runs
if r.parent_run_id is None and len(r.child_runs) == 2
]
)
== 2
), "Each of 2 outer runs contains exactly two inner runs (1 prompt, 1 chat)"
mocker.stop(prompt_spy)
mocker.stop(chat_spy)
@@ -282,7 +300,7 @@ async def test_prompt_with_chat_model(
tracer = FakeTracer()
assert [
*chain.stream({"question": "What is your name?"}, dict(callbacks=[tracer]))
] == [AIMessage(content="bar")]
] == [AIMessage(content="foo")]
assert prompt_spy.call_args.args[1] == {"question": "What is your name?"}
assert chat_spy.call_args.args[1] == ChatPromptValue(
messages=[
@@ -295,7 +313,7 @@ async def test_prompt_with_chat_model(
@pytest.mark.asyncio
@freeze_time("2023-01-01")
async def test_prompt_with_llm(
mocker: MockerFixture, snapshot: SnapshotAssertion, fixed_uuids: None
mocker: MockerFixture, snapshot: SnapshotAssertion
) -> None:
prompt = (
SystemMessagePromptTemplate.from_template("You are a nice assistant.")
@@ -386,7 +404,7 @@ async def test_prompt_with_llm(
@freeze_time("2023-01-01")
def test_prompt_with_chat_model_and_parser(
mocker: MockerFixture, snapshot: SnapshotAssertion, fixed_uuids: None
mocker: MockerFixture, snapshot: SnapshotAssertion
) -> None:
prompt = (
SystemMessagePromptTemplate.from_template("You are a nice assistant.")
@@ -424,7 +442,7 @@ def test_prompt_with_chat_model_and_parser(
@freeze_time("2023-01-01")
def test_seq_dict_prompt_llm(
mocker: MockerFixture, snapshot: SnapshotAssertion, fixed_uuids: None
mocker: MockerFixture, snapshot: SnapshotAssertion
) -> None:
passthrough = mocker.Mock(side_effect=lambda x: x)
@@ -487,13 +505,16 @@ What is your name?"""
]
)
assert parser_spy.call_args.args[1] == AIMessage(content="foo, bar")
assert tracer.runs == snapshot
assert len([r for r in tracer.runs if r.parent_run_id is None]) == 1
parent_run = next(r for r in tracer.runs if r.parent_run_id is None)
assert len(parent_run.child_runs) == 4
map_run = parent_run.child_runs[0]
assert map_run.name == "RunnableMap"
assert len(map_run.child_runs) == 3
@freeze_time("2023-01-01")
def test_seq_prompt_dict(
mocker: MockerFixture, snapshot: SnapshotAssertion, fixed_uuids: None
) -> None:
def test_seq_prompt_dict(mocker: MockerFixture, snapshot: SnapshotAssertion) -> None:
passthrough = mocker.Mock(side_effect=lambda x: x)
prompt = (
@@ -544,13 +565,64 @@ def test_seq_prompt_dict(
HumanMessage(content="What is your name?"),
]
)
assert len([r for r in tracer.runs if r.parent_run_id is None]) == 1
parent_run = next(r for r in tracer.runs if r.parent_run_id is None)
assert len(parent_run.child_runs) == 3
map_run = parent_run.child_runs[2]
assert map_run.name == "RunnableMap"
assert len(map_run.child_runs) == 2
@pytest.mark.asyncio
@freeze_time("2023-01-01")
async def test_router_runnable(
mocker: MockerFixture, snapshot: SnapshotAssertion
) -> None:
chain1 = ChatPromptTemplate.from_template(
"You are a math genius. Answer the question: {question}"
) | FakeListLLM(responses=["4"])
chain2 = ChatPromptTemplate.from_template(
"You are an english major. Answer the question: {question}"
) | FakeListLLM(responses=["2"])
router = RouterRunnable({"math": chain1, "english": chain2})
chain: Runnable = {
"key": lambda x: x["key"],
"input": {"question": lambda x: x["question"]},
} | router
assert dumps(chain, pretty=True) == snapshot
result = chain.invoke({"key": "math", "question": "2 + 2"})
assert result == "4"
result2 = chain.batch(
[{"key": "math", "question": "2 + 2"}, {"key": "english", "question": "2 + 2"}]
)
assert result2 == ["4", "2"]
result = await chain.ainvoke({"key": "math", "question": "2 + 2"})
assert result == "4"
result2 = await chain.abatch(
[{"key": "math", "question": "2 + 2"}, {"key": "english", "question": "2 + 2"}]
)
assert result2 == ["4", "2"]
# Test invoke
router_spy = mocker.spy(router.__class__, "invoke")
tracer = FakeTracer()
assert (
chain.invoke({"key": "math", "question": "2 + 2"}, dict(callbacks=[tracer]))
== "4"
)
assert router_spy.call_args.args[1] == {
"key": "math",
"input": {"question": "2 + 2"},
}
assert tracer.runs == snapshot
@freeze_time("2023-01-01")
def test_seq_prompt_map(
mocker: MockerFixture, snapshot: SnapshotAssertion, fixed_uuids: None
) -> None:
def test_seq_prompt_map(mocker: MockerFixture, snapshot: SnapshotAssertion) -> None:
passthrough = mocker.Mock(side_effect=lambda x: x)
prompt = (
@@ -608,7 +680,12 @@ def test_seq_prompt_map(
HumanMessage(content="What is your name?"),
]
)
assert tracer.runs == snapshot
assert len([r for r in tracer.runs if r.parent_run_id is None]) == 1
parent_run = next(r for r in tracer.runs if r.parent_run_id is None)
assert len(parent_run.child_runs) == 3
map_run = parent_run.child_runs[2]
assert map_run.name == "RunnableMap"
assert len(map_run.child_runs) == 3
def test_bind_bind() -> None: