couchbase: Add ttl support to caches & chat_message_history (#26214)

**Description:** Add support to delete documents automatically from the
caches & chat message history by adding a new optional parameter, `ttl`.


- [x] **Add tests and docs**: If you're adding a new integration, please
include
1. a test for the integration, preferably unit tests that do not rely on
network access,
2. an example notebook showing its use. It lives in
`docs/docs/integrations` directory.


- [x] **Lint and test**: Run `make format`, `make lint` and `make test`
from the root of the package(s) you've modified. See contribution
guidelines for more: https://python.langchain.com/docs/contributing/

---------

Co-authored-by: Nithish Raghunandanan <nithishr@users.noreply.github.com>
Co-authored-by: Erick Friis <erick@langchain.dev>
This commit is contained in:
Nithish Raghunandanan
2024-09-21 01:44:29 +02:00
committed by GitHub
parent c6c508ee96
commit 2d21274bf6
10 changed files with 901 additions and 417 deletions

View File

@@ -9,6 +9,7 @@ are duplicated in this utility from modules:
import hashlib
import json
import logging
from datetime import timedelta
from typing import Any, Dict, Optional, Union
from couchbase.cluster import Cluster
@@ -87,6 +88,16 @@ def _loads_generations(generations_str: str) -> Union[RETURN_VAL_TYPE, None]:
return None
def _validate_ttl(ttl: Optional[timedelta]) -> None:
"""Validate the time to live"""
if not isinstance(ttl, timedelta):
raise ValueError(f"ttl should be of type timedelta but was {type(ttl)}.")
if ttl <= timedelta(seconds=0):
raise ValueError(
f"ttl must be greater than 0 but was {ttl.total_seconds()} seconds."
)
class CouchbaseCache(BaseCache):
"""Couchbase LLM Cache
LLM Cache that uses Couchbase as the backend
@@ -140,6 +151,7 @@ class CouchbaseCache(BaseCache):
bucket_name: str,
scope_name: str,
collection_name: str,
ttl: Optional[timedelta] = None,
**kwargs: Dict[str, Any],
) -> None:
"""Initialize the Couchbase LLM Cache
@@ -149,6 +161,8 @@ class CouchbaseCache(BaseCache):
scope_name (str): name of the scope in bucket to store documents in.
collection_name (str): name of the collection in the scope to store
documents in.
ttl (Optional[timedelta]): TTL or time for the document to live in the cache.
After this time, the document will get deleted from the cache.
"""
if not isinstance(cluster, Cluster):
raise ValueError(
@@ -162,6 +176,8 @@ class CouchbaseCache(BaseCache):
self._scope_name = scope_name
self._collection_name = collection_name
self._ttl = None
# Check if the bucket exists
if not self._check_bucket_exists():
raise ValueError(
@@ -185,6 +201,11 @@ class CouchbaseCache(BaseCache):
except Exception as e:
raise e
# Check if the time to live is provided and valid
if ttl is not None:
_validate_ttl(ttl)
self._ttl = ttl
def lookup(self, prompt: str, llm_string: str) -> Optional[RETURN_VAL_TYPE]:
"""Look up from cache based on prompt and llm_string."""
try:
@@ -206,10 +227,16 @@ class CouchbaseCache(BaseCache):
self.LLM: llm_string,
self.RETURN_VAL: _dumps_generations(return_val),
}
document_key = self._generate_key(prompt, llm_string)
try:
self._collection.upsert(
key=self._generate_key(prompt, llm_string), value=doc
)
if self._ttl:
self._collection.upsert(
key=document_key,
value=doc,
expiry=self._ttl,
)
else:
self._collection.upsert(key=document_key, value=doc)
except Exception:
logger.error("Error updating cache")
@@ -242,6 +269,7 @@ class CouchbaseSemanticCache(BaseCache, CouchbaseVectorStore):
collection_name: str,
index_name: str,
score_threshold: Optional[float] = None,
ttl: Optional[timedelta] = None,
) -> None:
"""Initialize the Couchbase LLM Cache
Args:
@@ -253,6 +281,8 @@ class CouchbaseSemanticCache(BaseCache, CouchbaseVectorStore):
documents in.
index_name (str): name of the Search index to use.
score_threshold (float): score threshold to use for filtering results.
ttl (Optional[timedelta]): TTL or time for the document to live in the cache.
After this time, the document will get deleted from the cache.
"""
if not isinstance(cluster, Cluster):
raise ValueError(
@@ -265,6 +295,7 @@ class CouchbaseSemanticCache(BaseCache, CouchbaseVectorStore):
self._bucket_name = bucket_name
self._scope_name = scope_name
self._collection_name = collection_name
self._ttl = None
# Check if the bucket exists
if not self._check_bucket_exists():
@@ -291,6 +322,10 @@ class CouchbaseSemanticCache(BaseCache, CouchbaseVectorStore):
self.score_threshold = score_threshold
if ttl is not None:
_validate_ttl(ttl)
self._ttl = ttl
# Initialize the vector store
super().__init__(
cluster=cluster,
@@ -334,6 +369,7 @@ class CouchbaseSemanticCache(BaseCache, CouchbaseVectorStore):
self.RETURN_VAL: _dumps_generations(return_val),
}
],
ttl=self._ttl,
)
except Exception:
logger.error("Error updating cache")