mirror of
https://github.com/hwchase17/langchain.git
synced 2025-08-10 13:27:36 +00:00
databricks: mv to partner repo (#25788)
This commit is contained in:
parent
2e5c379632
commit
1023fbc98a
1
libs/partners/databricks/.gitignore
vendored
1
libs/partners/databricks/.gitignore
vendored
@ -1 +0,0 @@
|
|||||||
__pycache__
|
|
@ -1,21 +0,0 @@
|
|||||||
MIT License
|
|
||||||
|
|
||||||
Copyright (c) 2024 LangChain, Inc.
|
|
||||||
|
|
||||||
Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
||||||
of this software and associated documentation files (the "Software"), to deal
|
|
||||||
in the Software without restriction, including without limitation the rights
|
|
||||||
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
||||||
copies of the Software, and to permit persons to whom the Software is
|
|
||||||
furnished to do so, subject to the following conditions:
|
|
||||||
|
|
||||||
The above copyright notice and this permission notice shall be included in all
|
|
||||||
copies or substantial portions of the Software.
|
|
||||||
|
|
||||||
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
||||||
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
||||||
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
||||||
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
||||||
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
||||||
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
|
||||||
SOFTWARE.
|
|
@ -1,62 +0,0 @@
|
|||||||
.PHONY: all format lint test tests integration_tests docker_tests help extended_tests
|
|
||||||
|
|
||||||
# Default target executed when no arguments are given to make.
|
|
||||||
all: help
|
|
||||||
|
|
||||||
# Define a variable for the test file path.
|
|
||||||
TEST_FILE ?= tests/unit_tests/
|
|
||||||
integration_test integration_tests: TEST_FILE = tests/integration_tests/
|
|
||||||
|
|
||||||
|
|
||||||
# unit tests are run with the --disable-socket flag to prevent network calls
|
|
||||||
test tests:
|
|
||||||
poetry run pytest --disable-socket --allow-unix-socket $(TEST_FILE)
|
|
||||||
|
|
||||||
# integration tests are run without the --disable-socket flag to allow network calls
|
|
||||||
integration_test integration_tests:
|
|
||||||
poetry run pytest $(TEST_FILE)
|
|
||||||
|
|
||||||
######################
|
|
||||||
# LINTING AND FORMATTING
|
|
||||||
######################
|
|
||||||
|
|
||||||
# Define a variable for Python and notebook files.
|
|
||||||
PYTHON_FILES=.
|
|
||||||
MYPY_CACHE=.mypy_cache
|
|
||||||
lint format: PYTHON_FILES=.
|
|
||||||
lint_diff format_diff: PYTHON_FILES=$(shell git diff --relative=libs/partners/databricks --name-only --diff-filter=d master | grep -E '\.py$$|\.ipynb$$')
|
|
||||||
lint_package: PYTHON_FILES=langchain_databricks
|
|
||||||
lint_tests: PYTHON_FILES=tests
|
|
||||||
lint_tests: MYPY_CACHE=.mypy_cache_test
|
|
||||||
|
|
||||||
lint lint_diff lint_package lint_tests:
|
|
||||||
poetry run ruff check .
|
|
||||||
poetry run ruff format $(PYTHON_FILES) --diff
|
|
||||||
poetry run ruff check --select I $(PYTHON_FILES)
|
|
||||||
mkdir -p $(MYPY_CACHE); poetry run mypy $(PYTHON_FILES) --cache-dir $(MYPY_CACHE)
|
|
||||||
|
|
||||||
format format_diff:
|
|
||||||
poetry run ruff format $(PYTHON_FILES)
|
|
||||||
poetry run ruff check --select I --fix $(PYTHON_FILES)
|
|
||||||
|
|
||||||
spell_check:
|
|
||||||
poetry run codespell --toml pyproject.toml
|
|
||||||
|
|
||||||
spell_fix:
|
|
||||||
poetry run codespell --toml pyproject.toml -w
|
|
||||||
|
|
||||||
check_imports: $(shell find langchain_databricks -name '*.py')
|
|
||||||
poetry run python ./scripts/check_imports.py $^
|
|
||||||
|
|
||||||
######################
|
|
||||||
# HELP
|
|
||||||
######################
|
|
||||||
|
|
||||||
help:
|
|
||||||
@echo '----'
|
|
||||||
@echo 'check_imports - check imports'
|
|
||||||
@echo 'format - run code formatters'
|
|
||||||
@echo 'lint - run linters'
|
|
||||||
@echo 'test - run unit tests'
|
|
||||||
@echo 'tests - run unit tests'
|
|
||||||
@echo 'test TEST_FILE=<test_file> - run all tests in file'
|
|
@ -1,24 +0,0 @@
|
|||||||
# langchain-databricks
|
|
||||||
|
|
||||||
This package contains the LangChain integration with Databricks
|
|
||||||
|
|
||||||
## Installation
|
|
||||||
|
|
||||||
```bash
|
|
||||||
pip install -U langchain-databricks
|
|
||||||
```
|
|
||||||
|
|
||||||
And you should configure credentials by setting the following environment variables:
|
|
||||||
|
|
||||||
* TODO: fill this out
|
|
||||||
|
|
||||||
## Chat Models
|
|
||||||
|
|
||||||
`ChatDatabricks` class exposes chat models from Databricks.
|
|
||||||
|
|
||||||
```python
|
|
||||||
from langchain_databricks import ChatDatabricks
|
|
||||||
|
|
||||||
llm = ChatDatabricks()
|
|
||||||
llm.invoke("Sing a ballad of LangChain.")
|
|
||||||
```
|
|
@ -1,19 +0,0 @@
|
|||||||
from importlib import metadata
|
|
||||||
|
|
||||||
from langchain_databricks.chat_models import ChatDatabricks
|
|
||||||
from langchain_databricks.embeddings import DatabricksEmbeddings
|
|
||||||
from langchain_databricks.vectorstores import DatabricksVectorSearch
|
|
||||||
|
|
||||||
try:
|
|
||||||
__version__ = metadata.version(__package__)
|
|
||||||
except metadata.PackageNotFoundError:
|
|
||||||
# Case where package metadata is not available.
|
|
||||||
__version__ = ""
|
|
||||||
del metadata # optional, avoids polluting the results of dir(__package__)
|
|
||||||
|
|
||||||
__all__ = [
|
|
||||||
"ChatDatabricks",
|
|
||||||
"DatabricksEmbeddings",
|
|
||||||
"DatabricksVectorSearch",
|
|
||||||
"__version__",
|
|
||||||
]
|
|
@ -1,556 +0,0 @@
|
|||||||
"""Databricks chat models."""
|
|
||||||
|
|
||||||
import json
|
|
||||||
import logging
|
|
||||||
from typing import (
|
|
||||||
Any,
|
|
||||||
Callable,
|
|
||||||
Dict,
|
|
||||||
Iterator,
|
|
||||||
List,
|
|
||||||
Literal,
|
|
||||||
Mapping,
|
|
||||||
Optional,
|
|
||||||
Sequence,
|
|
||||||
Type,
|
|
||||||
Union,
|
|
||||||
)
|
|
||||||
|
|
||||||
from langchain_core.callbacks import CallbackManagerForLLMRun
|
|
||||||
from langchain_core.language_models import BaseChatModel
|
|
||||||
from langchain_core.language_models.base import LanguageModelInput
|
|
||||||
from langchain_core.messages import (
|
|
||||||
AIMessage,
|
|
||||||
AIMessageChunk,
|
|
||||||
BaseMessage,
|
|
||||||
BaseMessageChunk,
|
|
||||||
ChatMessage,
|
|
||||||
ChatMessageChunk,
|
|
||||||
FunctionMessage,
|
|
||||||
HumanMessage,
|
|
||||||
HumanMessageChunk,
|
|
||||||
SystemMessage,
|
|
||||||
SystemMessageChunk,
|
|
||||||
ToolMessage,
|
|
||||||
ToolMessageChunk,
|
|
||||||
)
|
|
||||||
from langchain_core.messages.tool import tool_call_chunk
|
|
||||||
from langchain_core.output_parsers.openai_tools import (
|
|
||||||
make_invalid_tool_call,
|
|
||||||
parse_tool_call,
|
|
||||||
)
|
|
||||||
from langchain_core.outputs import ChatGeneration, ChatGenerationChunk, ChatResult
|
|
||||||
from langchain_core.pydantic_v1 import (
|
|
||||||
BaseModel,
|
|
||||||
Field,
|
|
||||||
PrivateAttr,
|
|
||||||
)
|
|
||||||
from langchain_core.runnables import Runnable
|
|
||||||
from langchain_core.tools import BaseTool
|
|
||||||
from langchain_core.utils.function_calling import convert_to_openai_tool
|
|
||||||
|
|
||||||
from langchain_databricks.utils import get_deployment_client
|
|
||||||
|
|
||||||
logger = logging.getLogger(__name__)
|
|
||||||
|
|
||||||
|
|
||||||
class ChatDatabricks(BaseChatModel):
|
|
||||||
"""Databricks chat model integration.
|
|
||||||
|
|
||||||
Setup:
|
|
||||||
Install ``langchain-databricks``.
|
|
||||||
|
|
||||||
.. code-block:: bash
|
|
||||||
|
|
||||||
pip install -U langchain-databricks
|
|
||||||
|
|
||||||
If you are outside Databricks, set the Databricks workspace hostname and personal access token to environment variables:
|
|
||||||
|
|
||||||
.. code-block:: bash
|
|
||||||
|
|
||||||
export DATABRICKS_HOSTNAME="https://your-databricks-workspace"
|
|
||||||
export DATABRICKS_TOKEN="your-personal-access-token"
|
|
||||||
|
|
||||||
Key init args — completion params:
|
|
||||||
endpoint: str
|
|
||||||
Name of Databricks Model Serving endpoint to query.
|
|
||||||
target_uri: str
|
|
||||||
The target URI to use. Defaults to ``databricks``.
|
|
||||||
temperature: float
|
|
||||||
Sampling temperature. Higher values make the model more creative.
|
|
||||||
n: Optional[int]
|
|
||||||
The number of completion choices to generate.
|
|
||||||
stop: Optional[List[str]]
|
|
||||||
List of strings to stop generation at.
|
|
||||||
max_tokens: Optional[int]
|
|
||||||
Max number of tokens to generate.
|
|
||||||
extra_params: Optional[Dict[str, Any]]
|
|
||||||
Any extra parameters to pass to the endpoint.
|
|
||||||
|
|
||||||
Instantiate:
|
|
||||||
.. code-block:: python
|
|
||||||
|
|
||||||
from langchain_databricks import ChatDatabricks
|
|
||||||
llm = ChatDatabricks(
|
|
||||||
endpoint="databricks-meta-llama-3-1-405b-instruct",
|
|
||||||
temperature=0,
|
|
||||||
max_tokens=500,
|
|
||||||
)
|
|
||||||
|
|
||||||
Invoke:
|
|
||||||
.. code-block:: python
|
|
||||||
|
|
||||||
messages = [
|
|
||||||
("system", "You are a helpful translator. Translate the user sentence to French."),
|
|
||||||
("human", "I love programming."),
|
|
||||||
]
|
|
||||||
llm.invoke(messages)
|
|
||||||
|
|
||||||
.. code-block:: python
|
|
||||||
|
|
||||||
AIMessage(
|
|
||||||
content="J'adore la programmation.",
|
|
||||||
response_metadata={
|
|
||||||
'prompt_tokens': 32,
|
|
||||||
'completion_tokens': 9,
|
|
||||||
'total_tokens': 41
|
|
||||||
},
|
|
||||||
id='run-64eebbdd-88a8-4a25-b508-21e9a5f146c5-0'
|
|
||||||
)
|
|
||||||
|
|
||||||
Stream:
|
|
||||||
.. code-block:: python
|
|
||||||
|
|
||||||
for chunk in llm.stream(messages):
|
|
||||||
print(chunk)
|
|
||||||
|
|
||||||
.. code-block:: python
|
|
||||||
|
|
||||||
content='J' id='run-609b8f47-e580-4691-9ee4-e2109f53155e'
|
|
||||||
content="'" id='run-609b8f47-e580-4691-9ee4-e2109f53155e'
|
|
||||||
content='ad' id='run-609b8f47-e580-4691-9ee4-e2109f53155e'
|
|
||||||
content='ore' id='run-609b8f47-e580-4691-9ee4-e2109f53155e'
|
|
||||||
content=' la' id='run-609b8f47-e580-4691-9ee4-e2109f53155e'
|
|
||||||
content=' programm' id='run-609b8f47-e580-4691-9ee4-e2109f53155e'
|
|
||||||
content='ation' id='run-609b8f47-e580-4691-9ee4-e2109f53155e'
|
|
||||||
content='.' id='run-609b8f47-e580-4691-9ee4-e2109f53155e'
|
|
||||||
content='' response_metadata={'finish_reason': 'stop'} id='run-609b8f47-e580-4691-9ee4-e2109f53155e'
|
|
||||||
|
|
||||||
.. code-block:: python
|
|
||||||
|
|
||||||
stream = llm.stream(messages)
|
|
||||||
full = next(stream)
|
|
||||||
for chunk in stream:
|
|
||||||
full += chunk
|
|
||||||
full
|
|
||||||
|
|
||||||
.. code-block:: python
|
|
||||||
|
|
||||||
AIMessageChunk(
|
|
||||||
content="J'adore la programmation.",
|
|
||||||
response_metadata={
|
|
||||||
'finish_reason': 'stop'
|
|
||||||
},
|
|
||||||
id='run-4cef851f-6223-424f-ad26-4a54e5852aa5'
|
|
||||||
)
|
|
||||||
|
|
||||||
Async:
|
|
||||||
.. code-block:: python
|
|
||||||
|
|
||||||
await llm.ainvoke(messages)
|
|
||||||
|
|
||||||
# stream:
|
|
||||||
# async for chunk in llm.astream(messages)
|
|
||||||
|
|
||||||
# batch:
|
|
||||||
# await llm.abatch([messages])
|
|
||||||
|
|
||||||
.. code-block:: python
|
|
||||||
|
|
||||||
AIMessage(
|
|
||||||
content="J'adore la programmation.",
|
|
||||||
response_metadata={
|
|
||||||
'prompt_tokens': 32,
|
|
||||||
'completion_tokens': 9,
|
|
||||||
'total_tokens': 41
|
|
||||||
},
|
|
||||||
id='run-e4bb043e-772b-4e1d-9f98-77ccc00c0271-0'
|
|
||||||
)
|
|
||||||
|
|
||||||
Tool calling:
|
|
||||||
.. code-block:: python
|
|
||||||
|
|
||||||
from langchain_core.pydantic_v1 import BaseModel, Field
|
|
||||||
|
|
||||||
class GetWeather(BaseModel):
|
|
||||||
'''Get the current weather in a given location'''
|
|
||||||
|
|
||||||
location: str = Field(..., description="The city and state, e.g. San Francisco, CA")
|
|
||||||
|
|
||||||
class GetPopulation(BaseModel):
|
|
||||||
'''Get the current population in a given location'''
|
|
||||||
|
|
||||||
location: str = Field(..., description="The city and state, e.g. San Francisco, CA")
|
|
||||||
|
|
||||||
llm_with_tools = llm.bind_tools([GetWeather, GetPopulation])
|
|
||||||
ai_msg = llm_with_tools.invoke("Which city is hotter today and which is bigger: LA or NY?")
|
|
||||||
ai_msg.tool_calls
|
|
||||||
|
|
||||||
.. code-block:: python
|
|
||||||
|
|
||||||
[
|
|
||||||
{
|
|
||||||
'name': 'GetWeather',
|
|
||||||
'args': {
|
|
||||||
'location': 'Los Angeles, CA'
|
|
||||||
},
|
|
||||||
'id': 'call_ea0a6004-8e64-4ae8-a192-a40e295bfa24',
|
|
||||||
'type': 'tool_call'
|
|
||||||
}
|
|
||||||
]
|
|
||||||
|
|
||||||
To use tool calls, your model endpoint must support ``tools`` parameter. See [Function calling on Databricks](https://python.langchain.com/v0.2/docs/integrations/chat/databricks/#function-calling-on-databricks) for more information.
|
|
||||||
|
|
||||||
""" # noqa: E501
|
|
||||||
|
|
||||||
endpoint: str
|
|
||||||
"""Name of Databricks Model Serving endpoint to query."""
|
|
||||||
target_uri: str = "databricks"
|
|
||||||
"""The target URI to use. Defaults to ``databricks``."""
|
|
||||||
temperature: float = 0.0
|
|
||||||
"""Sampling temperature. Higher values make the model more creative."""
|
|
||||||
n: int = 1
|
|
||||||
"""The number of completion choices to generate."""
|
|
||||||
stop: Optional[List[str]] = None
|
|
||||||
"""List of strings to stop generation at."""
|
|
||||||
max_tokens: Optional[int] = None
|
|
||||||
"""The maximum number of tokens to generate."""
|
|
||||||
extra_params: dict = Field(default_factory=dict)
|
|
||||||
"""Any extra parameters to pass to the endpoint."""
|
|
||||||
_client: Any = PrivateAttr()
|
|
||||||
|
|
||||||
def __init__(self, **kwargs: Any):
|
|
||||||
super().__init__(**kwargs)
|
|
||||||
self._client = get_deployment_client(self.target_uri)
|
|
||||||
|
|
||||||
@property
|
|
||||||
def _default_params(self) -> Dict[str, Any]:
|
|
||||||
params: Dict[str, Any] = {
|
|
||||||
"target_uri": self.target_uri,
|
|
||||||
"endpoint": self.endpoint,
|
|
||||||
"temperature": self.temperature,
|
|
||||||
"n": self.n,
|
|
||||||
"stop": self.stop,
|
|
||||||
"max_tokens": self.max_tokens,
|
|
||||||
"extra_params": self.extra_params,
|
|
||||||
}
|
|
||||||
return params
|
|
||||||
|
|
||||||
def _generate(
|
|
||||||
self,
|
|
||||||
messages: List[BaseMessage],
|
|
||||||
stop: Optional[List[str]] = None,
|
|
||||||
run_manager: Optional[CallbackManagerForLLMRun] = None,
|
|
||||||
**kwargs: Any,
|
|
||||||
) -> ChatResult:
|
|
||||||
data = self._prepare_inputs(messages, stop, **kwargs)
|
|
||||||
resp = self._client.predict(endpoint=self.endpoint, inputs=data)
|
|
||||||
return self._convert_response_to_chat_result(resp)
|
|
||||||
|
|
||||||
def _prepare_inputs(
|
|
||||||
self,
|
|
||||||
messages: List[BaseMessage],
|
|
||||||
stop: Optional[List[str]] = None,
|
|
||||||
**kwargs: Any,
|
|
||||||
) -> Dict[str, Any]:
|
|
||||||
data: Dict[str, Any] = {
|
|
||||||
"messages": [_convert_message_to_dict(msg) for msg in messages],
|
|
||||||
"temperature": self.temperature,
|
|
||||||
"n": self.n,
|
|
||||||
**self.extra_params,
|
|
||||||
**kwargs,
|
|
||||||
}
|
|
||||||
if stop := self.stop or stop:
|
|
||||||
data["stop"] = stop
|
|
||||||
if self.max_tokens is not None:
|
|
||||||
data["max_tokens"] = self.max_tokens
|
|
||||||
|
|
||||||
return data
|
|
||||||
|
|
||||||
def _convert_response_to_chat_result(
|
|
||||||
self, response: Mapping[str, Any]
|
|
||||||
) -> ChatResult:
|
|
||||||
generations = [
|
|
||||||
ChatGeneration(
|
|
||||||
message=_convert_dict_to_message(choice["message"]),
|
|
||||||
generation_info=choice.get("usage", {}),
|
|
||||||
)
|
|
||||||
for choice in response["choices"]
|
|
||||||
]
|
|
||||||
usage = response.get("usage", {})
|
|
||||||
return ChatResult(generations=generations, llm_output=usage)
|
|
||||||
|
|
||||||
def _stream(
|
|
||||||
self,
|
|
||||||
messages: List[BaseMessage],
|
|
||||||
stop: Optional[List[str]] = None,
|
|
||||||
run_manager: Optional[CallbackManagerForLLMRun] = None,
|
|
||||||
**kwargs: Any,
|
|
||||||
) -> Iterator[ChatGenerationChunk]:
|
|
||||||
data = self._prepare_inputs(messages, stop, **kwargs)
|
|
||||||
first_chunk_role = None
|
|
||||||
for chunk in self._client.predict_stream(endpoint=self.endpoint, inputs=data):
|
|
||||||
if chunk["choices"]:
|
|
||||||
choice = chunk["choices"][0]
|
|
||||||
|
|
||||||
chunk_delta = choice["delta"]
|
|
||||||
if first_chunk_role is None:
|
|
||||||
first_chunk_role = chunk_delta.get("role")
|
|
||||||
|
|
||||||
chunk_message = _convert_dict_to_message_chunk(
|
|
||||||
chunk_delta, first_chunk_role
|
|
||||||
)
|
|
||||||
|
|
||||||
generation_info = {}
|
|
||||||
if finish_reason := choice.get("finish_reason"):
|
|
||||||
generation_info["finish_reason"] = finish_reason
|
|
||||||
if logprobs := choice.get("logprobs"):
|
|
||||||
generation_info["logprobs"] = logprobs
|
|
||||||
|
|
||||||
chunk = ChatGenerationChunk(
|
|
||||||
message=chunk_message, generation_info=generation_info or None
|
|
||||||
)
|
|
||||||
|
|
||||||
if run_manager:
|
|
||||||
run_manager.on_llm_new_token(
|
|
||||||
chunk.text, chunk=chunk, logprobs=logprobs
|
|
||||||
)
|
|
||||||
|
|
||||||
yield chunk
|
|
||||||
else:
|
|
||||||
# Handle the case where choices are empty if needed
|
|
||||||
continue
|
|
||||||
|
|
||||||
def bind_tools(
|
|
||||||
self,
|
|
||||||
tools: Sequence[Union[Dict[str, Any], Type[BaseModel], Callable, BaseTool]],
|
|
||||||
*,
|
|
||||||
tool_choice: Optional[
|
|
||||||
Union[dict, str, Literal["auto", "none", "required", "any"], bool]
|
|
||||||
] = None,
|
|
||||||
**kwargs: Any,
|
|
||||||
) -> Runnable[LanguageModelInput, BaseMessage]:
|
|
||||||
"""Bind tool-like objects to this chat model.
|
|
||||||
|
|
||||||
Assumes model is compatible with OpenAI tool-calling API.
|
|
||||||
|
|
||||||
Args:
|
|
||||||
tools: A list of tool definitions to bind to this chat model.
|
|
||||||
Can be a dictionary, pydantic model, callable, or BaseTool. Pydantic
|
|
||||||
models, callables, and BaseTools will be automatically converted to
|
|
||||||
their schema dictionary representation.
|
|
||||||
tool_choice: Which tool to require the model to call.
|
|
||||||
Options are:
|
|
||||||
name of the tool (str): calls corresponding tool;
|
|
||||||
"auto": automatically selects a tool (including no tool);
|
|
||||||
"none": model does not generate any tool calls and instead must
|
|
||||||
generate a standard assistant message;
|
|
||||||
"required": the model picks the most relevant tool in tools and
|
|
||||||
must generate a tool call;
|
|
||||||
|
|
||||||
or a dict of the form:
|
|
||||||
{"type": "function", "function": {"name": <<tool_name>>}}.
|
|
||||||
**kwargs: Any additional parameters to pass to the
|
|
||||||
:class:`~langchain.runnable.Runnable` constructor.
|
|
||||||
"""
|
|
||||||
formatted_tools = [convert_to_openai_tool(tool) for tool in tools]
|
|
||||||
if tool_choice:
|
|
||||||
if isinstance(tool_choice, str):
|
|
||||||
# tool_choice is a tool/function name
|
|
||||||
if tool_choice not in ("auto", "none", "required"):
|
|
||||||
tool_choice = {
|
|
||||||
"type": "function",
|
|
||||||
"function": {"name": tool_choice},
|
|
||||||
}
|
|
||||||
elif isinstance(tool_choice, dict):
|
|
||||||
tool_names = [
|
|
||||||
formatted_tool["function"]["name"]
|
|
||||||
for formatted_tool in formatted_tools
|
|
||||||
]
|
|
||||||
if not any(
|
|
||||||
tool_name == tool_choice["function"]["name"]
|
|
||||||
for tool_name in tool_names
|
|
||||||
):
|
|
||||||
raise ValueError(
|
|
||||||
f"Tool choice {tool_choice} was specified, but the only "
|
|
||||||
f"provided tools were {tool_names}."
|
|
||||||
)
|
|
||||||
else:
|
|
||||||
raise ValueError(
|
|
||||||
f"Unrecognized tool_choice type. Expected str, bool or dict. "
|
|
||||||
f"Received: {tool_choice}"
|
|
||||||
)
|
|
||||||
kwargs["tool_choice"] = tool_choice
|
|
||||||
return super().bind(tools=formatted_tools, **kwargs)
|
|
||||||
|
|
||||||
@property
|
|
||||||
def _llm_type(self) -> str:
|
|
||||||
"""Return type of chat model."""
|
|
||||||
return "chat-databricks"
|
|
||||||
|
|
||||||
|
|
||||||
### Conversion function to convert Pydantic models to dictionaries and vice versa. ###
|
|
||||||
|
|
||||||
|
|
||||||
def _convert_message_to_dict(message: BaseMessage) -> dict:
|
|
||||||
message_dict = {"content": message.content}
|
|
||||||
|
|
||||||
# OpenAI supports "name" field in messages.
|
|
||||||
if (name := message.name or message.additional_kwargs.get("name")) is not None:
|
|
||||||
message_dict["name"] = name
|
|
||||||
|
|
||||||
if id := message.id:
|
|
||||||
message_dict["id"] = id
|
|
||||||
|
|
||||||
if isinstance(message, ChatMessage):
|
|
||||||
return {"role": message.role, **message_dict}
|
|
||||||
elif isinstance(message, HumanMessage):
|
|
||||||
return {"role": "user", **message_dict}
|
|
||||||
elif isinstance(message, AIMessage):
|
|
||||||
if tool_calls := _get_tool_calls_from_ai_message(message):
|
|
||||||
message_dict["tool_calls"] = tool_calls # type: ignore[assignment]
|
|
||||||
# If tool calls present, content null value should be None not empty string.
|
|
||||||
message_dict["content"] = message_dict["content"] or None # type: ignore[assignment]
|
|
||||||
return {"role": "assistant", **message_dict}
|
|
||||||
elif isinstance(message, SystemMessage):
|
|
||||||
return {"role": "system", **message_dict}
|
|
||||||
elif isinstance(message, ToolMessage):
|
|
||||||
return {
|
|
||||||
"role": "tool",
|
|
||||||
"tool_call_id": message.tool_call_id,
|
|
||||||
**message_dict,
|
|
||||||
}
|
|
||||||
elif (
|
|
||||||
isinstance(message, FunctionMessage)
|
|
||||||
or "function_call" in message.additional_kwargs
|
|
||||||
):
|
|
||||||
raise ValueError(
|
|
||||||
"Function messages are not supported by Databricks. Please"
|
|
||||||
" create a feature request at https://github.com/mlflow/mlflow/issues."
|
|
||||||
)
|
|
||||||
else:
|
|
||||||
raise ValueError(f"Got unknown message type: {type(message)}")
|
|
||||||
|
|
||||||
|
|
||||||
def _get_tool_calls_from_ai_message(message: AIMessage) -> List[Dict]:
|
|
||||||
tool_calls = [
|
|
||||||
{
|
|
||||||
"type": "function",
|
|
||||||
"id": tc["id"],
|
|
||||||
"function": {
|
|
||||||
"name": tc["name"],
|
|
||||||
"arguments": json.dumps(tc["args"]),
|
|
||||||
},
|
|
||||||
}
|
|
||||||
for tc in message.tool_calls
|
|
||||||
]
|
|
||||||
|
|
||||||
invalid_tool_calls = [
|
|
||||||
{
|
|
||||||
"type": "function",
|
|
||||||
"id": tc["id"],
|
|
||||||
"function": {
|
|
||||||
"name": tc["name"],
|
|
||||||
"arguments": tc["args"],
|
|
||||||
},
|
|
||||||
}
|
|
||||||
for tc in message.invalid_tool_calls
|
|
||||||
]
|
|
||||||
|
|
||||||
if tool_calls or invalid_tool_calls:
|
|
||||||
return tool_calls + invalid_tool_calls
|
|
||||||
|
|
||||||
# Get tool calls from additional kwargs if present.
|
|
||||||
return [
|
|
||||||
{
|
|
||||||
k: v
|
|
||||||
for k, v in tool_call.items() # type: ignore[union-attr]
|
|
||||||
if k in {"id", "type", "function"}
|
|
||||||
}
|
|
||||||
for tool_call in message.additional_kwargs.get("tool_calls", [])
|
|
||||||
]
|
|
||||||
|
|
||||||
|
|
||||||
def _convert_dict_to_message(_dict: Dict) -> BaseMessage:
|
|
||||||
role = _dict["role"]
|
|
||||||
content = _dict.get("content")
|
|
||||||
content = content if content is not None else ""
|
|
||||||
|
|
||||||
if role == "user":
|
|
||||||
return HumanMessage(content=content)
|
|
||||||
elif role == "system":
|
|
||||||
return SystemMessage(content=content)
|
|
||||||
elif role == "assistant":
|
|
||||||
additional_kwargs: Dict = {}
|
|
||||||
tool_calls = []
|
|
||||||
invalid_tool_calls = []
|
|
||||||
if raw_tool_calls := _dict.get("tool_calls"):
|
|
||||||
additional_kwargs["tool_calls"] = raw_tool_calls
|
|
||||||
for raw_tool_call in raw_tool_calls:
|
|
||||||
try:
|
|
||||||
tool_calls.append(parse_tool_call(raw_tool_call, return_id=True))
|
|
||||||
except Exception as e:
|
|
||||||
invalid_tool_calls.append(
|
|
||||||
make_invalid_tool_call(raw_tool_call, str(e))
|
|
||||||
)
|
|
||||||
return AIMessage(
|
|
||||||
content=content,
|
|
||||||
additional_kwargs=additional_kwargs,
|
|
||||||
id=_dict.get("id"),
|
|
||||||
tool_calls=tool_calls,
|
|
||||||
invalid_tool_calls=invalid_tool_calls,
|
|
||||||
)
|
|
||||||
else:
|
|
||||||
return ChatMessage(content=content, role=role)
|
|
||||||
|
|
||||||
|
|
||||||
def _convert_dict_to_message_chunk(
|
|
||||||
_dict: Mapping[str, Any], default_role: str
|
|
||||||
) -> BaseMessageChunk:
|
|
||||||
role = _dict.get("role", default_role)
|
|
||||||
content = _dict.get("content")
|
|
||||||
content = content if content is not None else ""
|
|
||||||
|
|
||||||
if role == "user":
|
|
||||||
return HumanMessageChunk(content=content)
|
|
||||||
elif role == "system":
|
|
||||||
return SystemMessageChunk(content=content)
|
|
||||||
elif role == "tool":
|
|
||||||
return ToolMessageChunk(
|
|
||||||
content=content, tool_call_id=_dict["tool_call_id"], id=_dict.get("id")
|
|
||||||
)
|
|
||||||
elif role == "assistant":
|
|
||||||
additional_kwargs: Dict = {}
|
|
||||||
tool_call_chunks = []
|
|
||||||
if raw_tool_calls := _dict.get("tool_calls"):
|
|
||||||
additional_kwargs["tool_calls"] = raw_tool_calls
|
|
||||||
try:
|
|
||||||
tool_call_chunks = [
|
|
||||||
tool_call_chunk(
|
|
||||||
name=tc["function"].get("name"),
|
|
||||||
args=tc["function"].get("arguments"),
|
|
||||||
id=tc.get("id"),
|
|
||||||
index=tc["index"],
|
|
||||||
)
|
|
||||||
for tc in raw_tool_calls
|
|
||||||
]
|
|
||||||
except KeyError:
|
|
||||||
pass
|
|
||||||
return AIMessageChunk(
|
|
||||||
content=content,
|
|
||||||
additional_kwargs=additional_kwargs,
|
|
||||||
id=_dict.get("id"),
|
|
||||||
tool_call_chunks=tool_call_chunks,
|
|
||||||
)
|
|
||||||
else:
|
|
||||||
return ChatMessageChunk(content=content, role=role)
|
|
@ -1,91 +0,0 @@
|
|||||||
from typing import Any, Dict, Iterator, List
|
|
||||||
|
|
||||||
from langchain_core.embeddings import Embeddings
|
|
||||||
from langchain_core.pydantic_v1 import BaseModel, PrivateAttr
|
|
||||||
|
|
||||||
from langchain_databricks.utils import get_deployment_client
|
|
||||||
|
|
||||||
|
|
||||||
class DatabricksEmbeddings(Embeddings, BaseModel):
|
|
||||||
"""Databricks embedding model integration.
|
|
||||||
|
|
||||||
Setup:
|
|
||||||
Install ``langchain-databricks``.
|
|
||||||
|
|
||||||
.. code-block:: bash
|
|
||||||
|
|
||||||
pip install -U langchain-databricks
|
|
||||||
|
|
||||||
If you are outside Databricks, set the Databricks workspace
|
|
||||||
hostname and personal access token to environment variables:
|
|
||||||
|
|
||||||
.. code-block:: bash
|
|
||||||
|
|
||||||
export DATABRICKS_HOSTNAME="https://your-databricks-workspace"
|
|
||||||
export DATABRICKS_TOKEN="your-personal-access-token"
|
|
||||||
|
|
||||||
Key init args — completion params:
|
|
||||||
endpoint: str
|
|
||||||
Name of Databricks Model Serving endpoint to query.
|
|
||||||
target_uri: str
|
|
||||||
The target URI to use. Defaults to ``databricks``.
|
|
||||||
query_params: Dict[str, str]
|
|
||||||
The parameters to use for queries.
|
|
||||||
documents_params: Dict[str, str]
|
|
||||||
The parameters to use for documents.
|
|
||||||
|
|
||||||
Instantiate:
|
|
||||||
.. code-block:: python
|
|
||||||
from langchain_databricks import DatabricksEmbeddings
|
|
||||||
embed = DatabricksEmbeddings(
|
|
||||||
endpoint="databricks-bge-large-en",
|
|
||||||
)
|
|
||||||
|
|
||||||
Embed single text:
|
|
||||||
.. code-block:: python
|
|
||||||
input_text = "The meaning of life is 42"
|
|
||||||
embed.embed_query(input_text)
|
|
||||||
|
|
||||||
.. code-block:: python
|
|
||||||
[
|
|
||||||
0.01605224609375,
|
|
||||||
-0.0298309326171875,
|
|
||||||
...
|
|
||||||
]
|
|
||||||
|
|
||||||
"""
|
|
||||||
|
|
||||||
endpoint: str
|
|
||||||
"""The endpoint to use."""
|
|
||||||
target_uri: str = "databricks"
|
|
||||||
"""The parameters to use for queries."""
|
|
||||||
query_params: Dict[str, Any] = {}
|
|
||||||
"""The parameters to use for documents."""
|
|
||||||
documents_params: Dict[str, Any] = {}
|
|
||||||
"""The target URI to use."""
|
|
||||||
_client: Any = PrivateAttr()
|
|
||||||
|
|
||||||
def __init__(self, **kwargs: Any):
|
|
||||||
super().__init__(**kwargs)
|
|
||||||
self._client = get_deployment_client(self.target_uri)
|
|
||||||
|
|
||||||
def embed_documents(self, texts: List[str]) -> List[List[float]]:
|
|
||||||
return self._embed(texts, params=self.documents_params)
|
|
||||||
|
|
||||||
def embed_query(self, text: str) -> List[float]:
|
|
||||||
return self._embed([text], params=self.query_params)[0]
|
|
||||||
|
|
||||||
def _embed(self, texts: List[str], params: Dict[str, str]) -> List[List[float]]:
|
|
||||||
embeddings: List[List[float]] = []
|
|
||||||
for txt in _chunk(texts, 20):
|
|
||||||
resp = self._client.predict(
|
|
||||||
endpoint=self.endpoint,
|
|
||||||
inputs={"input": txt, **params}, # type: ignore[arg-type]
|
|
||||||
)
|
|
||||||
embeddings.extend(r["embedding"] for r in resp["data"])
|
|
||||||
return embeddings
|
|
||||||
|
|
||||||
|
|
||||||
def _chunk(texts: List[str], size: int) -> Iterator[List[str]]:
|
|
||||||
for i in range(0, len(texts), size):
|
|
||||||
yield texts[i : i + size]
|
|
@ -1,101 +0,0 @@
|
|||||||
from typing import Any, List, Union
|
|
||||||
from urllib.parse import urlparse
|
|
||||||
|
|
||||||
import numpy as np
|
|
||||||
|
|
||||||
|
|
||||||
def get_deployment_client(target_uri: str) -> Any:
|
|
||||||
if (target_uri != "databricks") and (urlparse(target_uri).scheme != "databricks"):
|
|
||||||
raise ValueError(
|
|
||||||
"Invalid target URI. The target URI must be a valid databricks URI."
|
|
||||||
)
|
|
||||||
|
|
||||||
try:
|
|
||||||
from mlflow.deployments import get_deploy_client # type: ignore[import-untyped]
|
|
||||||
|
|
||||||
return get_deploy_client(target_uri)
|
|
||||||
except ImportError as e:
|
|
||||||
raise ImportError(
|
|
||||||
"Failed to create the client. "
|
|
||||||
"Please run `pip install mlflow` to install "
|
|
||||||
"required dependencies."
|
|
||||||
) from e
|
|
||||||
|
|
||||||
|
|
||||||
# Utility function for Maximal Marginal Relevance (MMR) reranking.
|
|
||||||
# Copied from langchain_community/vectorstores/utils.py to avoid cross-dependency
|
|
||||||
Matrix = Union[List[List[float]], List[np.ndarray], np.ndarray]
|
|
||||||
|
|
||||||
|
|
||||||
def maximal_marginal_relevance(
|
|
||||||
query_embedding: np.ndarray,
|
|
||||||
embedding_list: list,
|
|
||||||
lambda_mult: float = 0.5,
|
|
||||||
k: int = 4,
|
|
||||||
) -> List[int]:
|
|
||||||
"""Calculate maximal marginal relevance.
|
|
||||||
|
|
||||||
Args:
|
|
||||||
query_embedding: Query embedding.
|
|
||||||
embedding_list: List of embeddings to select from.
|
|
||||||
lambda_mult: Number between 0 and 1 that determines the degree
|
|
||||||
of diversity among the results with 0 corresponding
|
|
||||||
to maximum diversity and 1 to minimum diversity.
|
|
||||||
Defaults to 0.5.
|
|
||||||
k: Number of Documents to return. Defaults to 4.
|
|
||||||
|
|
||||||
Returns:
|
|
||||||
List of indices of embeddings selected by maximal marginal relevance.
|
|
||||||
"""
|
|
||||||
if min(k, len(embedding_list)) <= 0:
|
|
||||||
return []
|
|
||||||
if query_embedding.ndim == 1:
|
|
||||||
query_embedding = np.expand_dims(query_embedding, axis=0)
|
|
||||||
similarity_to_query = cosine_similarity(query_embedding, embedding_list)[0]
|
|
||||||
most_similar = int(np.argmax(similarity_to_query))
|
|
||||||
idxs = [most_similar]
|
|
||||||
selected = np.array([embedding_list[most_similar]])
|
|
||||||
while len(idxs) < min(k, len(embedding_list)):
|
|
||||||
best_score = -np.inf
|
|
||||||
idx_to_add = -1
|
|
||||||
similarity_to_selected = cosine_similarity(embedding_list, selected)
|
|
||||||
for i, query_score in enumerate(similarity_to_query):
|
|
||||||
if i in idxs:
|
|
||||||
continue
|
|
||||||
redundant_score = max(similarity_to_selected[i])
|
|
||||||
equation_score = (
|
|
||||||
lambda_mult * query_score - (1 - lambda_mult) * redundant_score
|
|
||||||
)
|
|
||||||
if equation_score > best_score:
|
|
||||||
best_score = equation_score
|
|
||||||
idx_to_add = i
|
|
||||||
idxs.append(idx_to_add)
|
|
||||||
selected = np.append(selected, [embedding_list[idx_to_add]], axis=0)
|
|
||||||
return idxs
|
|
||||||
|
|
||||||
|
|
||||||
def cosine_similarity(X: Matrix, Y: Matrix) -> np.ndarray:
|
|
||||||
"""Row-wise cosine similarity between two equal-width matrices.
|
|
||||||
|
|
||||||
Raises:
|
|
||||||
ValueError: If the number of columns in X and Y are not the same.
|
|
||||||
"""
|
|
||||||
if len(X) == 0 or len(Y) == 0:
|
|
||||||
return np.array([])
|
|
||||||
|
|
||||||
X = np.array(X)
|
|
||||||
Y = np.array(Y)
|
|
||||||
if X.shape[1] != Y.shape[1]:
|
|
||||||
raise ValueError(
|
|
||||||
"Number of columns in X and Y must be the same. X has shape"
|
|
||||||
f"{X.shape} "
|
|
||||||
f"and Y has shape {Y.shape}."
|
|
||||||
)
|
|
||||||
|
|
||||||
X_norm = np.linalg.norm(X, axis=1)
|
|
||||||
Y_norm = np.linalg.norm(Y, axis=1)
|
|
||||||
# Ignore divide by zero errors run time warnings as those are handled below.
|
|
||||||
with np.errstate(divide="ignore", invalid="ignore"):
|
|
||||||
similarity = np.dot(X, Y.T) / np.outer(X_norm, Y_norm)
|
|
||||||
similarity[np.isnan(similarity) | np.isinf(similarity)] = 0.0
|
|
||||||
return similarity
|
|
@ -1,837 +0,0 @@
|
|||||||
from __future__ import annotations
|
|
||||||
|
|
||||||
import asyncio
|
|
||||||
import json
|
|
||||||
import logging
|
|
||||||
import uuid
|
|
||||||
from enum import Enum
|
|
||||||
from functools import partial
|
|
||||||
from typing import (
|
|
||||||
Any,
|
|
||||||
Callable,
|
|
||||||
Dict,
|
|
||||||
Iterable,
|
|
||||||
List,
|
|
||||||
Optional,
|
|
||||||
Tuple,
|
|
||||||
Type,
|
|
||||||
)
|
|
||||||
|
|
||||||
import numpy as np
|
|
||||||
from langchain_core.documents import Document
|
|
||||||
from langchain_core.embeddings import Embeddings
|
|
||||||
from langchain_core.vectorstores import VST, VectorStore
|
|
||||||
|
|
||||||
from langchain_databricks.utils import maximal_marginal_relevance
|
|
||||||
|
|
||||||
logger = logging.getLogger(__name__)
|
|
||||||
|
|
||||||
|
|
||||||
class IndexType(str, Enum):
|
|
||||||
DIRECT_ACCESS = "DIRECT_ACCESS"
|
|
||||||
DELTA_SYNC = "DELTA_SYNC"
|
|
||||||
|
|
||||||
|
|
||||||
_DIRECT_ACCESS_ONLY_MSG = "`%s` is only supported for direct-access index."
|
|
||||||
_NON_MANAGED_EMB_ONLY_MSG = (
|
|
||||||
"`%s` is not supported for index with Databricks-managed embeddings."
|
|
||||||
)
|
|
||||||
|
|
||||||
|
|
||||||
class DatabricksVectorSearch(VectorStore):
|
|
||||||
"""Databricks vector store integration.
|
|
||||||
|
|
||||||
Setup:
|
|
||||||
Install ``langchain-databricks`` and ``databricks-vectorsearch`` python packages.
|
|
||||||
|
|
||||||
.. code-block:: bash
|
|
||||||
|
|
||||||
pip install -U langchain-databricks databricks-vectorsearch
|
|
||||||
|
|
||||||
If you don't have a Databricks Vector Search endpoint already, you can create one by following the instructions here: https://docs.databricks.com/en/generative-ai/create-query-vector-search.html
|
|
||||||
|
|
||||||
If you are outside Databricks, set the Databricks workspace
|
|
||||||
hostname and personal access token to environment variables:
|
|
||||||
|
|
||||||
.. code-block:: bash
|
|
||||||
|
|
||||||
export DATABRICKS_HOSTNAME="https://your-databricks-workspace"
|
|
||||||
export DATABRICKS_TOKEN="your-personal-access-token"
|
|
||||||
|
|
||||||
Key init args — indexing params:
|
|
||||||
|
|
||||||
endpoint: The name of the Databricks Vector Search endpoint.
|
|
||||||
index_name: The name of the index to use. Format: "catalog.schema.index".
|
|
||||||
embedding: The embedding model.
|
|
||||||
Required for direct-access index or delta-sync index
|
|
||||||
with self-managed embeddings.
|
|
||||||
text_column: The name of the text column to use for the embeddings.
|
|
||||||
Required for direct-access index or delta-sync index
|
|
||||||
with self-managed embeddings.
|
|
||||||
Make sure the text column specified is in the index.
|
|
||||||
columns: The list of column names to get when doing the search.
|
|
||||||
Defaults to ``[primary_key, text_column]``.
|
|
||||||
|
|
||||||
Instantiate:
|
|
||||||
|
|
||||||
`DatabricksVectorSearch` supports two types of indexes:
|
|
||||||
|
|
||||||
* **Delta Sync Index** automatically syncs with a source Delta Table, automatically and incrementally updating the index as the underlying data in the Delta Table changes.
|
|
||||||
|
|
||||||
* **Direct Vector Access Index** supports direct read and write of vectors and metadata. The user is responsible for updating this table using the REST API or the Python SDK.
|
|
||||||
|
|
||||||
Also for delta-sync index, you can choose to use Databricks-managed embeddings or self-managed embeddings (via LangChain embeddings classes).
|
|
||||||
|
|
||||||
If you are using a delta-sync index with Databricks-managed embeddings:
|
|
||||||
|
|
||||||
.. code-block:: python
|
|
||||||
|
|
||||||
from langchain_databricks.vectorstores import DatabricksVectorSearch
|
|
||||||
|
|
||||||
vector_store = DatabricksVectorSearch(
|
|
||||||
endpoint="<your-endpoint-name>",
|
|
||||||
index_name="<your-index-name>"
|
|
||||||
)
|
|
||||||
|
|
||||||
If you are using a direct-access index or a delta-sync index with self-managed embeddings,
|
|
||||||
you also need to provide the embedding model and text column in your source table to
|
|
||||||
use for the embeddings:
|
|
||||||
|
|
||||||
.. code-block:: python
|
|
||||||
|
|
||||||
from langchain_openai import OpenAIEmbeddings
|
|
||||||
|
|
||||||
vector_store = DatabricksVectorSearch(
|
|
||||||
endpoint="<your-endpoint-name>",
|
|
||||||
index_name="<your-index-name>",
|
|
||||||
embedding=OpenAIEmbeddings(),
|
|
||||||
text_column="document_content"
|
|
||||||
)
|
|
||||||
|
|
||||||
Add Documents:
|
|
||||||
.. code-block:: python
|
|
||||||
from langchain_core.documents import Document
|
|
||||||
|
|
||||||
document_1 = Document(page_content="foo", metadata={"baz": "bar"})
|
|
||||||
document_2 = Document(page_content="thud", metadata={"bar": "baz"})
|
|
||||||
document_3 = Document(page_content="i will be deleted :(")
|
|
||||||
documents = [document_1, document_2, document_3]
|
|
||||||
ids = ["1", "2", "3"]
|
|
||||||
vector_store.add_documents(documents=documents, ids=ids)
|
|
||||||
|
|
||||||
Delete Documents:
|
|
||||||
.. code-block:: python
|
|
||||||
vector_store.delete(ids=["3"])
|
|
||||||
|
|
||||||
.. note::
|
|
||||||
|
|
||||||
The `delete` method is only supported for direct-access index.
|
|
||||||
|
|
||||||
Search:
|
|
||||||
.. code-block:: python
|
|
||||||
results = vector_store.similarity_search(query="thud",k=1)
|
|
||||||
for doc in results:
|
|
||||||
print(f"* {doc.page_content} [{doc.metadata}]")
|
|
||||||
.. code-block:: python
|
|
||||||
* thud [{'id': '2'}]
|
|
||||||
|
|
||||||
.. note:
|
|
||||||
|
|
||||||
By default, similarity search only returns the primary key and text column.
|
|
||||||
If you want to retrieve the custom metadata associated with the document,
|
|
||||||
pass the additional columns in the `columns` parameter when initializing the vector store.
|
|
||||||
|
|
||||||
.. code-block:: python
|
|
||||||
|
|
||||||
vector_store = DatabricksVectorSearch(
|
|
||||||
endpoint="<your-endpoint-name>",
|
|
||||||
index_name="<your-index-name>",
|
|
||||||
columns=["baz", "bar"],
|
|
||||||
)
|
|
||||||
|
|
||||||
vector_store.similarity_search(query="thud",k=1)
|
|
||||||
# Output: * thud [{'bar': 'baz', 'baz': None, 'id': '2'}]
|
|
||||||
|
|
||||||
Search with filter:
|
|
||||||
.. code-block:: python
|
|
||||||
results = vector_store.similarity_search(query="thud",k=1,filter={"bar": "baz"})
|
|
||||||
for doc in results:
|
|
||||||
print(f"* {doc.page_content} [{doc.metadata}]")
|
|
||||||
.. code-block:: python
|
|
||||||
* thud [{'id': '2'}]
|
|
||||||
|
|
||||||
Search with score:
|
|
||||||
.. code-block:: python
|
|
||||||
results = vector_store.similarity_search_with_score(query="qux",k=1)
|
|
||||||
for doc, score in results:
|
|
||||||
print(f"* [SIM={score:3f}] {doc.page_content} [{doc.metadata}]")
|
|
||||||
.. code-block:: python
|
|
||||||
* [SIM=0.748804] foo [{'id': '1'}]
|
|
||||||
|
|
||||||
Async:
|
|
||||||
.. code-block:: python
|
|
||||||
# add documents
|
|
||||||
await vector_store.aadd_documents(documents=documents, ids=ids)
|
|
||||||
# delete documents
|
|
||||||
await vector_store.adelete(ids=["3"])
|
|
||||||
# search
|
|
||||||
results = vector_store.asimilarity_search(query="thud",k=1)
|
|
||||||
# search with score
|
|
||||||
results = await vector_store.asimilarity_search_with_score(query="qux",k=1)
|
|
||||||
for doc,score in results:
|
|
||||||
print(f"* [SIM={score:3f}] {doc.page_content} [{doc.metadata}]")
|
|
||||||
.. code-block:: python
|
|
||||||
* [SIM=0.748807] foo [{'id': '1'}]
|
|
||||||
|
|
||||||
Use as Retriever:
|
|
||||||
.. code-block:: python
|
|
||||||
retriever = vector_store.as_retriever(
|
|
||||||
search_type="mmr",
|
|
||||||
search_kwargs={"k": 1, "fetch_k": 2, "lambda_mult": 0.5},
|
|
||||||
)
|
|
||||||
retriever.invoke("thud")
|
|
||||||
.. code-block:: python
|
|
||||||
[Document(metadata={'id': '2'}, page_content='thud')]
|
|
||||||
""" # noqa: E501
|
|
||||||
|
|
||||||
def __init__(
|
|
||||||
self,
|
|
||||||
endpoint: str,
|
|
||||||
index_name: str,
|
|
||||||
embedding: Optional[Embeddings] = None,
|
|
||||||
text_column: Optional[str] = None,
|
|
||||||
columns: Optional[List[str]] = None,
|
|
||||||
):
|
|
||||||
try:
|
|
||||||
from databricks.vector_search.client import ( # type: ignore[import]
|
|
||||||
VectorSearchClient,
|
|
||||||
)
|
|
||||||
except ImportError as e:
|
|
||||||
raise ImportError(
|
|
||||||
"Could not import databricks-vectorsearch python package. "
|
|
||||||
"Please install it with `pip install databricks-vectorsearch`."
|
|
||||||
) from e
|
|
||||||
|
|
||||||
self.index = VectorSearchClient().get_index(endpoint, index_name)
|
|
||||||
self._index_details = IndexDetails(self.index)
|
|
||||||
|
|
||||||
_validate_embedding(embedding, self._index_details)
|
|
||||||
self._embeddings = embedding
|
|
||||||
self._text_column = _validate_and_get_text_column(
|
|
||||||
text_column, self._index_details
|
|
||||||
)
|
|
||||||
self._columns = _validate_and_get_return_columns(
|
|
||||||
columns or [], self._text_column, self._index_details
|
|
||||||
)
|
|
||||||
self._primary_key = self._index_details.primary_key
|
|
||||||
|
|
||||||
@property
|
|
||||||
def embeddings(self) -> Optional[Embeddings]:
|
|
||||||
"""Access the query embedding object if available."""
|
|
||||||
return self._embeddings
|
|
||||||
|
|
||||||
@classmethod
|
|
||||||
def from_texts(
|
|
||||||
cls: Type[VST],
|
|
||||||
texts: List[str],
|
|
||||||
embedding: Embeddings,
|
|
||||||
metadatas: Optional[List[Dict]] = None,
|
|
||||||
**kwargs: Any,
|
|
||||||
) -> VST:
|
|
||||||
raise NotImplementedError(
|
|
||||||
"`from_texts` is not supported. "
|
|
||||||
"Use `add_texts` to add to existing direct-access index."
|
|
||||||
)
|
|
||||||
|
|
||||||
def add_texts(
|
|
||||||
self,
|
|
||||||
texts: Iterable[str],
|
|
||||||
metadatas: Optional[List[Dict]] = None,
|
|
||||||
ids: Optional[List[Any]] = None,
|
|
||||||
**kwargs: Any,
|
|
||||||
) -> List[str]:
|
|
||||||
"""Add texts to the index.
|
|
||||||
|
|
||||||
.. note::
|
|
||||||
|
|
||||||
This method is only supported for a direct-access index.
|
|
||||||
|
|
||||||
Args:
|
|
||||||
texts: List of texts to add.
|
|
||||||
metadatas: List of metadata for each text. Defaults to None.
|
|
||||||
ids: List of ids for each text. Defaults to None.
|
|
||||||
If not provided, a random uuid will be generated for each text.
|
|
||||||
|
|
||||||
Returns:
|
|
||||||
List of ids from adding the texts into the index.
|
|
||||||
"""
|
|
||||||
if self._index_details.is_delta_sync_index():
|
|
||||||
raise NotImplementedError(_DIRECT_ACCESS_ONLY_MSG % "add_texts")
|
|
||||||
|
|
||||||
# Wrap to list if input texts is a single string
|
|
||||||
if isinstance(texts, str):
|
|
||||||
texts = [texts]
|
|
||||||
texts = list(texts)
|
|
||||||
vectors = self._embeddings.embed_documents(texts) # type: ignore[union-attr]
|
|
||||||
ids = ids or [str(uuid.uuid4()) for _ in texts]
|
|
||||||
metadatas = metadatas or [{} for _ in texts]
|
|
||||||
|
|
||||||
updates = [
|
|
||||||
{
|
|
||||||
self._primary_key: id_,
|
|
||||||
self._text_column: text,
|
|
||||||
self._index_details.embedding_vector_column["name"]: vector,
|
|
||||||
**metadata,
|
|
||||||
}
|
|
||||||
for text, vector, id_, metadata in zip(texts, vectors, ids, metadatas)
|
|
||||||
]
|
|
||||||
|
|
||||||
upsert_resp = self.index.upsert(updates)
|
|
||||||
if upsert_resp.get("status") in ("PARTIAL_SUCCESS", "FAILURE"):
|
|
||||||
failed_ids = upsert_resp.get("result", dict()).get(
|
|
||||||
"failed_primary_keys", []
|
|
||||||
)
|
|
||||||
if upsert_resp.get("status") == "FAILURE":
|
|
||||||
logger.error("Failed to add texts to the index.")
|
|
||||||
else:
|
|
||||||
logger.warning("Some texts failed to be added to the index.")
|
|
||||||
return [id_ for id_ in ids if id_ not in failed_ids]
|
|
||||||
|
|
||||||
return ids
|
|
||||||
|
|
||||||
async def aadd_texts(
|
|
||||||
self,
|
|
||||||
texts: Iterable[str],
|
|
||||||
metadatas: Optional[List[dict]] = None,
|
|
||||||
**kwargs: Any,
|
|
||||||
) -> List[str]:
|
|
||||||
return await asyncio.get_running_loop().run_in_executor(
|
|
||||||
None, partial(self.add_texts, **kwargs), texts, metadatas
|
|
||||||
)
|
|
||||||
|
|
||||||
def delete(self, ids: Optional[List[Any]] = None, **kwargs: Any) -> Optional[bool]:
|
|
||||||
"""Delete documents from the index.
|
|
||||||
|
|
||||||
.. note::
|
|
||||||
|
|
||||||
This method is only supported for a direct-access index.
|
|
||||||
|
|
||||||
Args:
|
|
||||||
ids: List of ids of documents to delete.
|
|
||||||
|
|
||||||
Returns:
|
|
||||||
True if successful.
|
|
||||||
"""
|
|
||||||
if self._index_details.is_delta_sync_index():
|
|
||||||
raise NotImplementedError(_DIRECT_ACCESS_ONLY_MSG % "delete")
|
|
||||||
|
|
||||||
if ids is None:
|
|
||||||
raise ValueError("ids must be provided.")
|
|
||||||
self.index.delete(ids)
|
|
||||||
return True
|
|
||||||
|
|
||||||
def similarity_search(
|
|
||||||
self,
|
|
||||||
query: str,
|
|
||||||
k: int = 4,
|
|
||||||
filter: Optional[Dict[str, Any]] = None,
|
|
||||||
*,
|
|
||||||
query_type: Optional[str] = None,
|
|
||||||
**kwargs: Any,
|
|
||||||
) -> List[Document]:
|
|
||||||
"""Return docs most similar to query.
|
|
||||||
|
|
||||||
Args:
|
|
||||||
query: Text to look up documents similar to.
|
|
||||||
k: Number of Documents to return. Defaults to 4.
|
|
||||||
filter: Filters to apply to the query. Defaults to None.
|
|
||||||
query_type: The type of this query. Supported values are "ANN" and "HYBRID".
|
|
||||||
|
|
||||||
Returns:
|
|
||||||
List of Documents most similar to the embedding.
|
|
||||||
"""
|
|
||||||
docs_with_score = self.similarity_search_with_score(
|
|
||||||
query=query,
|
|
||||||
k=k,
|
|
||||||
filter=filter,
|
|
||||||
query_type=query_type,
|
|
||||||
**kwargs,
|
|
||||||
)
|
|
||||||
return [doc for doc, _ in docs_with_score]
|
|
||||||
|
|
||||||
async def asimilarity_search(
|
|
||||||
self, query: str, k: int = 4, **kwargs: Any
|
|
||||||
) -> List[Document]:
|
|
||||||
# This is a temporary workaround to make the similarity search
|
|
||||||
# asynchronous. The proper solution is to make the similarity search
|
|
||||||
# asynchronous in the vector store implementations.
|
|
||||||
func = partial(self.similarity_search, query, k=k, **kwargs)
|
|
||||||
return await asyncio.get_event_loop().run_in_executor(None, func)
|
|
||||||
|
|
||||||
def similarity_search_with_score(
|
|
||||||
self,
|
|
||||||
query: str,
|
|
||||||
k: int = 4,
|
|
||||||
filter: Optional[Dict[str, Any]] = None,
|
|
||||||
*,
|
|
||||||
query_type: Optional[str] = None,
|
|
||||||
**kwargs: Any,
|
|
||||||
) -> List[Tuple[Document, float]]:
|
|
||||||
"""Return docs most similar to query, along with scores.
|
|
||||||
|
|
||||||
Args:
|
|
||||||
query: Text to look up documents similar to.
|
|
||||||
k: Number of Documents to return. Defaults to 4.
|
|
||||||
filter: Filters to apply to the query. Defaults to None.
|
|
||||||
query_type: The type of this query. Supported values are "ANN" and "HYBRID".
|
|
||||||
|
|
||||||
Returns:
|
|
||||||
List of Documents most similar to the embedding and score for each.
|
|
||||||
"""
|
|
||||||
if self._index_details.is_databricks_managed_embeddings():
|
|
||||||
query_text = query
|
|
||||||
query_vector = None
|
|
||||||
else:
|
|
||||||
# The value for `query_text` needs to be specified only for hybrid search.
|
|
||||||
if query_type is not None and query_type.upper() == "HYBRID":
|
|
||||||
query_text = query
|
|
||||||
else:
|
|
||||||
query_text = None
|
|
||||||
query_vector = self._embeddings.embed_query(query) # type: ignore[union-attr]
|
|
||||||
|
|
||||||
search_resp = self.index.similarity_search(
|
|
||||||
columns=self._columns,
|
|
||||||
query_text=query_text,
|
|
||||||
query_vector=query_vector,
|
|
||||||
filters=filter,
|
|
||||||
num_results=k,
|
|
||||||
query_type=query_type,
|
|
||||||
)
|
|
||||||
return self._parse_search_response(search_resp)
|
|
||||||
|
|
||||||
def _select_relevance_score_fn(self) -> Callable[[float], float]:
|
|
||||||
"""
|
|
||||||
Databricks Vector search uses a normalized score 1/(1+d) where d
|
|
||||||
is the L2 distance. Hence, we simply return the identity function.
|
|
||||||
"""
|
|
||||||
return lambda score: score
|
|
||||||
|
|
||||||
async def asimilarity_search_with_score(
|
|
||||||
self, *args: Any, **kwargs: Any
|
|
||||||
) -> List[Tuple[Document, float]]:
|
|
||||||
# This is a temporary workaround to make the similarity search
|
|
||||||
# asynchronous. The proper solution is to make the similarity search
|
|
||||||
# asynchronous in the vector store implementations.
|
|
||||||
func = partial(self.similarity_search_with_score, *args, **kwargs)
|
|
||||||
return await asyncio.get_event_loop().run_in_executor(None, func)
|
|
||||||
|
|
||||||
def similarity_search_by_vector(
|
|
||||||
self,
|
|
||||||
embedding: List[float],
|
|
||||||
k: int = 4,
|
|
||||||
filter: Optional[Any] = None,
|
|
||||||
*,
|
|
||||||
query_type: Optional[str] = None,
|
|
||||||
query: Optional[str] = None,
|
|
||||||
**kwargs: Any,
|
|
||||||
) -> List[Document]:
|
|
||||||
"""Return docs most similar to embedding vector.
|
|
||||||
|
|
||||||
Args:
|
|
||||||
embedding: Embedding to look up documents similar to.
|
|
||||||
k: Number of Documents to return. Defaults to 4.
|
|
||||||
filter: Filters to apply to the query. Defaults to None.
|
|
||||||
query_type: The type of this query. Supported values are "ANN" and "HYBRID".
|
|
||||||
|
|
||||||
Returns:
|
|
||||||
List of Documents most similar to the embedding.
|
|
||||||
"""
|
|
||||||
if self._index_details.is_databricks_managed_embeddings():
|
|
||||||
raise NotImplementedError(
|
|
||||||
_NON_MANAGED_EMB_ONLY_MSG % "similarity_search_by_vector"
|
|
||||||
)
|
|
||||||
|
|
||||||
docs_with_score = self.similarity_search_by_vector_with_score(
|
|
||||||
embedding=embedding,
|
|
||||||
k=k,
|
|
||||||
filter=filter,
|
|
||||||
query_type=query_type,
|
|
||||||
query=query,
|
|
||||||
**kwargs,
|
|
||||||
)
|
|
||||||
return [doc for doc, _ in docs_with_score]
|
|
||||||
|
|
||||||
async def asimilarity_search_by_vector(
|
|
||||||
self, embedding: List[float], k: int = 4, **kwargs: Any
|
|
||||||
) -> List[Document]:
|
|
||||||
# This is a temporary workaround to make the similarity search
|
|
||||||
# asynchronous. The proper solution is to make the similarity search
|
|
||||||
# asynchronous in the vector store implementations.
|
|
||||||
func = partial(self.similarity_search_by_vector, embedding, k=k, **kwargs)
|
|
||||||
return await asyncio.get_event_loop().run_in_executor(None, func)
|
|
||||||
|
|
||||||
def similarity_search_by_vector_with_score(
|
|
||||||
self,
|
|
||||||
embedding: List[float],
|
|
||||||
k: int = 4,
|
|
||||||
filter: Optional[Any] = None,
|
|
||||||
*,
|
|
||||||
query_type: Optional[str] = None,
|
|
||||||
query: Optional[str] = None,
|
|
||||||
**kwargs: Any,
|
|
||||||
) -> List[Tuple[Document, float]]:
|
|
||||||
"""Return docs most similar to embedding vector, along with scores.
|
|
||||||
|
|
||||||
.. note::
|
|
||||||
|
|
||||||
This method is not supported for index with Databricks-managed embeddings.
|
|
||||||
|
|
||||||
Args:
|
|
||||||
embedding: Embedding to look up documents similar to.
|
|
||||||
k: Number of Documents to return. Defaults to 4.
|
|
||||||
filter: Filters to apply to the query. Defaults to None.
|
|
||||||
query_type: The type of this query. Supported values are "ANN" and "HYBRID".
|
|
||||||
|
|
||||||
Returns:
|
|
||||||
List of Documents most similar to the embedding and score for each.
|
|
||||||
"""
|
|
||||||
if self._index_details.is_databricks_managed_embeddings():
|
|
||||||
raise NotImplementedError(
|
|
||||||
_NON_MANAGED_EMB_ONLY_MSG % "similarity_search_by_vector_with_score"
|
|
||||||
)
|
|
||||||
|
|
||||||
if query_type is not None and query_type.upper() == "HYBRID":
|
|
||||||
if query is None:
|
|
||||||
raise ValueError(
|
|
||||||
"A value for `query` must be specified for hybrid search."
|
|
||||||
)
|
|
||||||
query_text = query
|
|
||||||
else:
|
|
||||||
if query is not None:
|
|
||||||
raise ValueError(
|
|
||||||
(
|
|
||||||
"Cannot specify both `embedding` and "
|
|
||||||
'`query` unless `query_type="HYBRID"'
|
|
||||||
)
|
|
||||||
)
|
|
||||||
query_text = None
|
|
||||||
|
|
||||||
search_resp = self.index.similarity_search(
|
|
||||||
columns=self._columns,
|
|
||||||
query_vector=embedding,
|
|
||||||
query_text=query_text,
|
|
||||||
filters=filter,
|
|
||||||
num_results=k,
|
|
||||||
query_type=query_type,
|
|
||||||
)
|
|
||||||
return self._parse_search_response(search_resp)
|
|
||||||
|
|
||||||
def max_marginal_relevance_search(
|
|
||||||
self,
|
|
||||||
query: str,
|
|
||||||
k: int = 4,
|
|
||||||
fetch_k: int = 20,
|
|
||||||
lambda_mult: float = 0.5,
|
|
||||||
filter: Optional[Dict[str, Any]] = None,
|
|
||||||
*,
|
|
||||||
query_type: Optional[str] = None,
|
|
||||||
**kwargs: Any,
|
|
||||||
) -> List[Document]:
|
|
||||||
"""Return docs selected using the maximal marginal relevance.
|
|
||||||
|
|
||||||
Maximal marginal relevance optimizes for similarity to query AND diversity
|
|
||||||
among selected documents.
|
|
||||||
|
|
||||||
.. note::
|
|
||||||
|
|
||||||
This method is not supported for index with Databricks-managed embeddings.
|
|
||||||
|
|
||||||
Args:
|
|
||||||
query: Text to look up documents similar to.
|
|
||||||
k: Number of Documents to return. Defaults to 4.
|
|
||||||
fetch_k: Number of Documents to fetch to pass to MMR algorithm.
|
|
||||||
lambda_mult: Number between 0 and 1 that determines the degree
|
|
||||||
of diversity among the results with 0 corresponding
|
|
||||||
to maximum diversity and 1 to minimum diversity.
|
|
||||||
Defaults to 0.5.
|
|
||||||
filter: Filters to apply to the query. Defaults to None.
|
|
||||||
query_type: The type of this query. Supported values are "ANN" and "HYBRID".
|
|
||||||
Returns:
|
|
||||||
List of Documents selected by maximal marginal relevance.
|
|
||||||
"""
|
|
||||||
if self._index_details.is_databricks_managed_embeddings():
|
|
||||||
raise NotImplementedError(
|
|
||||||
_NON_MANAGED_EMB_ONLY_MSG % "max_marginal_relevance_search"
|
|
||||||
)
|
|
||||||
|
|
||||||
query_vector = self._embeddings.embed_query(query) # type: ignore[union-attr]
|
|
||||||
docs = self.max_marginal_relevance_search_by_vector(
|
|
||||||
query_vector,
|
|
||||||
k,
|
|
||||||
fetch_k,
|
|
||||||
lambda_mult=lambda_mult,
|
|
||||||
filter=filter,
|
|
||||||
query_type=query_type,
|
|
||||||
)
|
|
||||||
return docs
|
|
||||||
|
|
||||||
    async def amax_marginal_relevance_search(
        self,
        query: str,
        k: int = 4,
        fetch_k: int = 20,
        lambda_mult: float = 0.5,
        **kwargs: Any,
    ) -> List[Document]:
        # This is a temporary workaround to make the similarity search
        # asynchronous. The proper solution is to make the similarity search
        # asynchronous in the vector store implementations.
        func = partial(
            self.max_marginal_relevance_search,
            query,
            k=k,
            fetch_k=fetch_k,
            lambda_mult=lambda_mult,
            **kwargs,
        )
        return await asyncio.get_event_loop().run_in_executor(None, func)

    def max_marginal_relevance_search_by_vector(
        self,
        embedding: List[float],
        k: int = 4,
        fetch_k: int = 20,
        lambda_mult: float = 0.5,
        filter: Optional[Any] = None,
        *,
        query_type: Optional[str] = None,
        **kwargs: Any,
    ) -> List[Document]:
        """Return docs selected using the maximal marginal relevance.

        Maximal marginal relevance optimizes for similarity to query AND diversity
        among selected documents.

        .. note::

            This method is not supported for index with Databricks-managed embeddings.

        Args:
            embedding: Embedding to look up documents similar to.
            k: Number of Documents to return. Defaults to 4.
            fetch_k: Number of Documents to fetch to pass to MMR algorithm.
            lambda_mult: Number between 0 and 1 that determines the degree
                of diversity among the results with 0 corresponding
                to maximum diversity and 1 to minimum diversity.
                Defaults to 0.5.
            filter: Filters to apply to the query. Defaults to None.
            query_type: The type of this query. Supported values are "ANN" and "HYBRID".
        Returns:
            List of Documents selected by maximal marginal relevance.
        """
        if self._index_details.is_databricks_managed_embeddings():
            raise NotImplementedError(
                _NON_MANAGED_EMB_ONLY_MSG % "max_marginal_relevance_search_by_vector"
            )

        embedding_column = self._index_details.embedding_vector_column["name"]
        search_resp = self.index.similarity_search(
            columns=list(set(self._columns + [embedding_column])),
            query_text=None,
            query_vector=embedding,
            filters=filter,
            num_results=fetch_k,
            query_type=query_type,
        )

        embeddings_result_index = (
            search_resp.get("manifest").get("columns").index({"name": embedding_column})
        )
        embeddings = [
            doc[embeddings_result_index]
            for doc in search_resp.get("result").get("data_array")
        ]

        mmr_selected = maximal_marginal_relevance(
            np.array(embedding, dtype=np.float32),
            embeddings,
            k=k,
            lambda_mult=lambda_mult,
        )

        ignore_cols: List = (
            [embedding_column] if embedding_column not in self._columns else []
        )
        candidates = self._parse_search_response(search_resp, ignore_cols=ignore_cols)
        selected_results = [r[0] for i, r in enumerate(candidates) if i in mmr_selected]
        return selected_results

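Editor's note: the `maximal_marginal_relevance` helper used above selects documents greedily; at each step it picks the candidate that maximizes roughly lambda_mult * sim(query, d) - (1 - lambda_mult) * max over already-selected s of sim(d, s), using cosine similarity. The following is a simplified sketch of that selection rule, not the library implementation:

    import numpy as np

    def mmr_sketch(query_vec, candidate_vecs, k=4, lambda_mult=0.5):
        # Greedy MMR selection over candidate embeddings (sketch only).
        def cos(a, b):
            return float(np.dot(a, b) / (np.linalg.norm(a) * np.linalg.norm(b) + 1e-12))

        selected = []
        while len(selected) < min(k, len(candidate_vecs)):
            best_i, best_score = None, float("-inf")
            for i, c in enumerate(candidate_vecs):
                if i in selected:
                    continue
                relevance = cos(query_vec, c)
                redundancy = max(
                    (cos(c, candidate_vecs[j]) for j in selected), default=0.0
                )
                score = lambda_mult * relevance - (1 - lambda_mult) * redundancy
                if score > best_score:
                    best_i, best_score = i, score
            selected.append(best_i)
        # Indices into candidate_vecs, analogous to `mmr_selected` above.
        return selected
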
    async def amax_marginal_relevance_search_by_vector(
        self,
        embedding: List[float],
        k: int = 4,
        fetch_k: int = 20,
        lambda_mult: float = 0.5,
        **kwargs: Any,
    ) -> List[Document]:
        raise NotImplementedError

    def _parse_search_response(
        self, search_resp: Dict, ignore_cols: Optional[List[str]] = None
    ) -> List[Tuple[Document, float]]:
        """Parse the search response into a list of Documents with score."""
        if ignore_cols is None:
            ignore_cols = []

        columns = [
            col["name"]
            for col in search_resp.get("manifest", dict()).get("columns", [])
        ]
        docs_with_score = []
        for result in search_resp.get("result", dict()).get("data_array", []):
            doc_id = result[columns.index(self._primary_key)]
            text_content = result[columns.index(self._text_column)]
            ignore_cols = [self._primary_key, self._text_column] + ignore_cols
            metadata = {
                col: value
                for col, value in zip(columns[:-1], result[:-1])
                if col not in ignore_cols
            }
            metadata[self._primary_key] = doc_id
            score = result[-1]
            doc = Document(page_content=text_content, metadata=metadata)
            docs_with_score.append((doc, score))
        return docs_with_score


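Editor's note: a concrete illustration of the parsing above; the values are invented, and the shape mirrors the mocked response used in the unit tests later in this diff.

    # Hypothetical response shape (values invented for illustration):
    search_resp = {
        "manifest": {"columns": [{"name": "id"}, {"name": "text"}, {"name": "score"}]},
        "result": {"data_array": [["1", "foo", 0.87]]},
    }
    # _parse_search_response(search_resp) would yield roughly:
    # [(Document(page_content="foo", metadata={"id": "1"}), 0.87)]
    # The primary key and text column are dropped from the metadata dict,
    # and the trailing column is taken as the score.
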
def _validate_and_get_text_column(
    text_column: Optional[str], index_details: IndexDetails
) -> str:
    if index_details.is_databricks_managed_embeddings():
        index_source_column: str = index_details.embedding_source_column["name"]
        # check if input text column matches the source column of the index
        if text_column is not None:
            raise ValueError(
                f"The index '{index_details.name}' has the source column configured as "
                f"'{index_source_column}'. Do not pass the `text_column` parameter."
            )
        return index_source_column
    else:
        if text_column is None:
            raise ValueError("The `text_column` parameter is required for this index.")
        return text_column


def _validate_and_get_return_columns(
    columns: List[str], text_column: str, index_details: IndexDetails
) -> List[str]:
    """
    Get a list of columns to retrieve from the index.

    If the index is direct-access index, validate the given columns against the schema.
    """
    # add primary key column and source column if not in columns
    if index_details.primary_key not in columns:
        columns.append(index_details.primary_key)
    if text_column and text_column not in columns:
        columns.append(text_column)

    # Validate specified columns are in the index
    if index_details.is_direct_access_index() and (
        index_schema := index_details.schema
    ):
        if missing_columns := [c for c in columns if c not in index_schema]:
            raise ValueError(
                "Some columns specified in `columns` are not "
                f"in the index schema: {missing_columns}"
            )
    return columns


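Editor's note: a small worked example of the column expansion above, with illustrative values; `index_details` is assumed to describe a direct-access index whose primary key is "id" and whose schema contains "id", "text", and "feat1".

    # Hypothetical: the requested columns are expanded with the primary key and
    # text column, then checked against the index schema.
    cols = _validate_and_get_return_columns(["feat1"], "text", index_details)
    # cols == ["feat1", "id", "text"]; a column missing from schema_json would
    # raise the ValueError shown above.
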
def _validate_embedding(
    embedding: Optional[Embeddings], index_details: IndexDetails
) -> None:
    if index_details.is_databricks_managed_embeddings():
        if embedding is not None:
            raise ValueError(
                f"The index '{index_details.name}' uses Databricks-managed embeddings. "
                "Do not pass the `embedding` parameter when initializing vector store."
            )
    else:
        if not embedding:
            raise ValueError(
                "The `embedding` parameter is required for a direct-access index "
                "or delta-sync index with self-managed embedding."
            )
        _validate_embedding_dimension(embedding, index_details)


def _validate_embedding_dimension(
    embeddings: Embeddings, index_details: IndexDetails
) -> None:
    """validate if the embedding dimension matches with the index's configuration."""
    if index_embedding_dimension := index_details.embedding_vector_column.get(
        "embedding_dimension"
    ):
        # Infer the embedding dimension from the embedding function.
        actual_dimension = len(embeddings.embed_query("test"))
        if actual_dimension != index_embedding_dimension:
            raise ValueError(
                f"The specified embedding model's dimension '{actual_dimension}' does "
                f"not match with the index configuration '{index_embedding_dimension}'."
            )


class IndexDetails:
    """An utility class to store the configuration details of an index."""

    def __init__(self, index: Any):
        self._index_details = index.describe()

    @property
    def name(self) -> str:
        return self._index_details["name"]

    @property
    def schema(self) -> Optional[Dict]:
        if self.is_direct_access_index():
            schema_json = self.index_spec.get("schema_json")
            if schema_json is not None:
                return json.loads(schema_json)
        return None

    @property
    def primary_key(self) -> str:
        return self._index_details["primary_key"]

    @property
    def index_spec(self) -> Dict:
        return (
            self._index_details.get("delta_sync_index_spec", {})
            if self.is_delta_sync_index()
            else self._index_details.get("direct_access_index_spec", {})
        )

    @property
    def embedding_vector_column(self) -> Dict:
        if vector_columns := self.index_spec.get("embedding_vector_columns"):
            return vector_columns[0]
        return {}

    @property
    def embedding_source_column(self) -> Dict:
        if source_columns := self.index_spec.get("embedding_source_columns"):
            return source_columns[0]
        return {}

    def is_delta_sync_index(self) -> bool:
        return self._index_details["index_type"] == IndexType.DELTA_SYNC.value

    def is_direct_access_index(self) -> bool:
        return self._index_details["index_type"] == IndexType.DIRECT_ACCESS.value

    def is_databricks_managed_embeddings(self) -> bool:
        return (
            self.is_delta_sync_index()
            and self.embedding_source_column.get("name") is not None
        )
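Editor's note: a sketch of how `IndexDetails` classifies indexes from a `describe()` payload. The payload shapes mirror the fixtures in the unit tests below; the `_FakeIndex` wrapper and other values are illustrative assumptions.

    class _FakeIndex:
        """Hypothetical stand-in whose describe() returns a fixed payload."""

        def __init__(self, payload):
            self._payload = payload

        def describe(self):
            return self._payload

    managed = IndexDetails(
        _FakeIndex(
            {
                "name": "demo",
                "primary_key": "id",
                "index_type": "DELTA_SYNC",
                "delta_sync_index_spec": {
                    "embedding_source_columns": [{"name": "text"}]
                },
            }
        )
    )
    # managed.is_databricks_managed_embeddings() -> True: delta-sync plus a source column.

    direct = IndexDetails(
        _FakeIndex(
            {
                "name": "demo2",
                "primary_key": "id",
                "index_type": "DIRECT_ACCESS",
                "direct_access_index_spec": {
                    "embedding_vector_columns": [
                        {"name": "text_vector", "embedding_dimension": 4}
                    ]
                },
            }
        )
    )
    # direct.is_databricks_managed_embeddings() -> False; embedding_vector_column
    # exposes {"name": "text_vector", "embedding_dimension": 4}.
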
2525 libs/partners/databricks/poetry.lock generated
File diff suppressed because it is too large
@@ -1,100 +0,0 @@
[tool.poetry]
name = "langchain-databricks"
version = "0.1.0"
description = "An integration package connecting Databricks and LangChain"
authors = []
readme = "README.md"
repository = "https://github.com/langchain-ai/langchain"
license = "MIT"

[tool.poetry.urls]
"Source Code" = "https://github.com/langchain-ai/langchain/tree/master/libs/partners/databricks"
"Release Notes" = "https://github.com/langchain-ai/langchain/releases?q=tag%3A%22databricks%3D%3D0%22&expanded=true"

[tool.poetry.dependencies]
# TODO: Replace <3.12 to <4.0 once https://github.com/mlflow/mlflow/commit/04370119fcc1b2ccdbcd9a50198ab00566d58cd2 is released
python = ">=3.8.1,<3.12"
langchain-core = "^0.2.0"
mlflow = ">=2.9"

# MLflow depends on following libraries, which require different version for Python 3.8 vs 3.12
numpy = [
    {version = ">=1.26.0", python = ">=3.12"},
    {version = ">=1.24.0", python = "<3.12"},
]
scipy = [
    {version = ">=1.11", python = ">=3.12"},
    {version = "<2", python = "<3.12"}
]
databricks-vectorsearch = "^0.40"

[tool.poetry.group.test]
optional = true

[tool.poetry.group.test.dependencies]
pytest = "^7.4.3"
pytest-asyncio = "^0.23.2"
pytest-socket = "^0.7.0"
langchain-core = { path = "../../core", develop = true }

[tool.poetry.group.codespell]
optional = true

[tool.poetry.group.codespell.dependencies]
codespell = "^2.2.6"

[tool.poetry.group.test_integration]
optional = true

[tool.poetry.group.test_integration.dependencies]

[tool.poetry.group.lint]
optional = true

[tool.poetry.group.lint.dependencies]
ruff = "^0.5"

[tool.poetry.group.typing.dependencies]
mypy = "^1.10"
langchain-core = { path = "../../core", develop = true }

[tool.poetry.group.dev]
optional = true

[tool.poetry.group.dev.dependencies]
langchain-core = { path = "../../core", develop = true }

[tool.ruff.lint]
select = [
    "E",  # pycodestyle
    "F",  # pyflakes
    "I",  # isort
    "T201",  # print
]

[tool.mypy]
disallow_untyped_defs = "True"

[tool.coverage.run]
omit = ["tests/*"]

[build-system]
requires = ["poetry-core>=1.0.0"]
build-backend = "poetry.core.masonry.api"

[tool.pytest.ini_options]
# --strict-markers will raise errors on unknown marks.
# https://docs.pytest.org/en/7.1.x/how-to/mark.html#raising-errors-on-unknown-marks
#
# https://docs.pytest.org/en/7.1.x/reference/reference.html
# --strict-config       any warnings encountered while parsing the `pytest`
#                       section of the configuration file raise errors.
#
# https://github.com/tophat/syrupy
addopts = "--strict-markers --strict-config --durations=5"
# Registering custom markers.
# https://docs.pytest.org/en/7.1.x/example/markers.html#registering-markers
markers = [
    "compile: mark placeholder test used to compile integration tests without running them",
]
asyncio_mode = "auto"
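Editor's note: for local development, the optional dependency groups declared above (test, codespell, test_integration, lint, dev) would typically be pulled in with Poetry's standard group syntax; the exact invocation below is an assumption about the usual workflow, not something stated in this diff.

    poetry install --with test,lint,dev
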
@@ -1,17 +0,0 @@
import sys
import traceback
from importlib.machinery import SourceFileLoader

if __name__ == "__main__":
    files = sys.argv[1:]
    has_failure = False
    for file in files:
        try:
            SourceFileLoader("x", file).load_module()
        except Exception:
            has_failure = True
            print(file)  # noqa: T201
            traceback.print_exc()
            print()  # noqa: T201

    sys.exit(1 if has_failure else 0)
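Editor's note: this import-check script takes a list of Python files as arguments and exits non-zero if any of them fail to import. Assuming it lives at scripts/check_imports.py as in other partner packages (the path and file list below are illustrative), it might be run as:

    poetry run python scripts/check_imports.py langchain_databricks/*.py
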
@@ -1,27 +0,0 @@
#!/bin/bash
#
# This script searches for lines starting with "import pydantic" or "from pydantic"
# in tracked files within a Git repository.
#
# Usage: ./scripts/check_pydantic.sh /path/to/repository

# Check if a path argument is provided
if [ $# -ne 1 ]; then
  echo "Usage: $0 /path/to/repository"
  exit 1
fi

repository_path="$1"

# Search for lines matching the pattern within the specified repository
result=$(git -C "$repository_path" grep -E '^import pydantic|^from pydantic')

# Check if any matching lines were found
if [ -n "$result" ]; then
  echo "ERROR: The following lines need to be updated:"
  echo "$result"
  echo "Please replace the code with an import from langchain_core.pydantic_v1."
  echo "For example, replace 'from pydantic import BaseModel'"
  echo "with 'from langchain_core.pydantic_v1 import BaseModel'"
  exit 1
fi
@@ -1,18 +0,0 @@
#!/bin/bash

set -eu

# Initialize a variable to keep track of errors
errors=0

# make sure not importing from langchain, langchain_experimental, or langchain_community
git --no-pager grep '^from langchain\.' . && errors=$((errors+1))
git --no-pager grep '^from langchain_experimental\.' . && errors=$((errors+1))
git --no-pager grep '^from langchain_community\.' . && errors=$((errors+1))

# Decide on an exit status based on the errors
if [ "$errors" -gt 0 ]; then
  exit 1
else
  exit 0
fi
@@ -1,7 +0,0 @@
import pytest


@pytest.mark.compile
def test_placeholder() -> None:
    """Used for compiling integration tests without running any real tests."""
    pass
@@ -1,321 +0,0 @@
"""Test chat model integration."""

import json
from typing import Generator
from unittest import mock

import mlflow  # type: ignore # noqa: F401
import pytest
from langchain_core.messages import (
    AIMessage,
    AIMessageChunk,
    BaseMessage,
    ChatMessage,
    ChatMessageChunk,
    FunctionMessage,
    HumanMessage,
    HumanMessageChunk,
    SystemMessage,
    SystemMessageChunk,
    ToolMessageChunk,
)
from langchain_core.messages.tool import ToolCallChunk
from langchain_core.pydantic_v1 import BaseModel, Field

from langchain_databricks.chat_models import (
    ChatDatabricks,
    _convert_dict_to_message,
    _convert_dict_to_message_chunk,
    _convert_message_to_dict,
)

_MOCK_CHAT_RESPONSE = {
    "id": "chatcmpl_id",
    "object": "chat.completion",
    "created": 1721875529,
    "model": "meta-llama-3.1-70b-instruct-072424",
    "choices": [
        {
            "index": 0,
            "message": {
                "role": "assistant",
                "content": "To calculate the result of 36939 multiplied by 8922.4, "
                "I get:\n\n36939 x 8922.4 = 329,511,111.6",
            },
            "finish_reason": "stop",
            "logprobs": None,
        }
    ],
    "usage": {"prompt_tokens": 30, "completion_tokens": 36, "total_tokens": 66},
}

_MOCK_STREAM_RESPONSE = [
    {
        "id": "chatcmpl_bb1fce87-f14e-4ae1-ac22-89facc74898a",
        "object": "chat.completion.chunk",
        "created": 1721877054,
        "model": "meta-llama-3.1-70b-instruct-072424",
        "choices": [
            {
                "index": 0,
                "delta": {"role": "assistant", "content": "36939"},
                "finish_reason": None,
                "logprobs": None,
            }
        ],
        "usage": {"prompt_tokens": 30, "completion_tokens": 20, "total_tokens": 50},
    },
    {
        "id": "chatcmpl_bb1fce87-f14e-4ae1-ac22-89facc74898a",
        "object": "chat.completion.chunk",
        "created": 1721877054,
        "model": "meta-llama-3.1-70b-instruct-072424",
        "choices": [
            {
                "index": 0,
                "delta": {"role": "assistant", "content": "x"},
                "finish_reason": None,
                "logprobs": None,
            }
        ],
        "usage": {"prompt_tokens": 30, "completion_tokens": 22, "total_tokens": 52},
    },
    {
        "id": "chatcmpl_bb1fce87-f14e-4ae1-ac22-89facc74898a",
        "object": "chat.completion.chunk",
        "created": 1721877054,
        "model": "meta-llama-3.1-70b-instruct-072424",
        "choices": [
            {
                "index": 0,
                "delta": {"role": "assistant", "content": "8922.4"},
                "finish_reason": None,
                "logprobs": None,
            }
        ],
        "usage": {"prompt_tokens": 30, "completion_tokens": 24, "total_tokens": 54},
    },
    {
        "id": "chatcmpl_bb1fce87-f14e-4ae1-ac22-89facc74898a",
        "object": "chat.completion.chunk",
        "created": 1721877054,
        "model": "meta-llama-3.1-70b-instruct-072424",
        "choices": [
            {
                "index": 0,
                "delta": {"role": "assistant", "content": " = "},
                "finish_reason": None,
                "logprobs": None,
            }
        ],
        "usage": {"prompt_tokens": 30, "completion_tokens": 28, "total_tokens": 58},
    },
    {
        "id": "chatcmpl_bb1fce87-f14e-4ae1-ac22-89facc74898a",
        "object": "chat.completion.chunk",
        "created": 1721877054,
        "model": "meta-llama-3.1-70b-instruct-072424",
        "choices": [
            {
                "index": 0,
                "delta": {"role": "assistant", "content": "329,511,111.6"},
                "finish_reason": None,
                "logprobs": None,
            }
        ],
        "usage": {"prompt_tokens": 30, "completion_tokens": 30, "total_tokens": 60},
    },
    {
        "id": "chatcmpl_bb1fce87-f14e-4ae1-ac22-89facc74898a",
        "object": "chat.completion.chunk",
        "created": 1721877054,
        "model": "meta-llama-3.1-70b-instruct-072424",
        "choices": [
            {
                "index": 0,
                "delta": {"role": "assistant", "content": ""},
                "finish_reason": "stop",
                "logprobs": None,
            }
        ],
        "usage": {"prompt_tokens": 30, "completion_tokens": 36, "total_tokens": 66},
    },
]

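Editor's note: joining the delta contents of the mocked stream chunks above yields "36939x8922.4 = 329,511,111.6", one piece at a time; the streaming test below compares each chunk's content individually rather than the joined string. A quick sketch of the accumulation:

    streamed = "".join(
        chunk["choices"][0]["delta"]["content"] for chunk in _MOCK_STREAM_RESPONSE
    )
    # streamed == "36939x8922.4 = 329,511,111.6"
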
@pytest.fixture(autouse=True)
def mock_client() -> Generator:
    client = mock.MagicMock()
    client.predict.return_value = _MOCK_CHAT_RESPONSE
    client.predict_stream.return_value = _MOCK_STREAM_RESPONSE
    with mock.patch("mlflow.deployments.get_deploy_client", return_value=client):
        yield


@pytest.fixture
def llm() -> ChatDatabricks:
    return ChatDatabricks(
        endpoint="databricks-meta-llama-3-70b-instruct", target_uri="databricks"
    )


def test_chat_mlflow_predict(llm: ChatDatabricks) -> None:
    res = llm.invoke(
        [
            {"role": "system", "content": "You are a helpful assistant."},
            {"role": "user", "content": "36939 * 8922.4"},
        ]
    )
    assert res.content == _MOCK_CHAT_RESPONSE["choices"][0]["message"]["content"]  # type: ignore[index]


def test_chat_mlflow_stream(llm: ChatDatabricks) -> None:
    res = llm.stream(
        [
            {"role": "system", "content": "You are a helpful assistant."},
            {"role": "user", "content": "36939 * 8922.4"},
        ]
    )
    for chunk, expected in zip(res, _MOCK_STREAM_RESPONSE):
        assert chunk.content == expected["choices"][0]["delta"]["content"]  # type: ignore[index]


def test_chat_mlflow_bind_tools(llm: ChatDatabricks) -> None:
    class GetWeather(BaseModel):
        """Get the current weather in a given location"""

        location: str = Field(
            ..., description="The city and state, e.g. San Francisco, CA"
        )

    class GetPopulation(BaseModel):
        """Get the current population in a given location"""

        location: str = Field(
            ..., description="The city and state, e.g. San Francisco, CA"
        )

    llm_with_tools = llm.bind_tools([GetWeather, GetPopulation])
    response = llm_with_tools.invoke(
        "Which city is hotter today and which is bigger: LA or NY?"
    )
    assert isinstance(response, AIMessage)


### Test data conversion functions ###


@pytest.mark.parametrize(
    ("role", "expected_output"),
    [
        ("user", HumanMessage("foo")),
        ("system", SystemMessage("foo")),
        ("assistant", AIMessage("foo")),
        ("any_role", ChatMessage(content="foo", role="any_role")),
    ],
)
def test_convert_message(role: str, expected_output: BaseMessage) -> None:
    message = {"role": role, "content": "foo"}
    result = _convert_dict_to_message(message)
    assert result == expected_output

    # convert back
    dict_result = _convert_message_to_dict(result)
    assert dict_result == message


def test_convert_message_with_tool_calls() -> None:
    ID = "call_fb5f5e1a-bac0-4422-95e9-d06e6022ad12"
    tool_calls = [
        {
            "id": ID,
            "type": "function",
            "function": {
                "name": "main__test__python_exec",
                "arguments": '{"code": "result = 36939 * 8922.4"}',
            },
        }
    ]
    message_with_tools = {
        "role": "assistant",
        "content": None,
        "tool_calls": tool_calls,
        "id": ID,
    }
    result = _convert_dict_to_message(message_with_tools)
    expected_output = AIMessage(
        content="",
        additional_kwargs={"tool_calls": tool_calls},
        id=ID,
        tool_calls=[
            {
                "name": tool_calls[0]["function"]["name"],  # type: ignore[index]
                "args": json.loads(tool_calls[0]["function"]["arguments"]),  # type: ignore[index]
                "id": ID,
                "type": "tool_call",
            }
        ],
    )
    assert result == expected_output

    # convert back
    dict_result = _convert_message_to_dict(result)
    assert dict_result == message_with_tools


@pytest.mark.parametrize(
    ("role", "expected_output"),
    [
        ("user", HumanMessageChunk(content="foo")),
        ("system", SystemMessageChunk(content="foo")),
        ("assistant", AIMessageChunk(content="foo")),
        ("any_role", ChatMessageChunk(content="foo", role="any_role")),
    ],
)
def test_convert_message_chunk(role: str, expected_output: BaseMessage) -> None:
    delta = {"role": role, "content": "foo"}
    result = _convert_dict_to_message_chunk(delta, "default_role")
    assert result == expected_output

    # convert back
    dict_result = _convert_message_to_dict(result)
    assert dict_result == delta


def test_convert_message_chunk_with_tool_calls() -> None:
    delta_with_tools = {
        "role": "assistant",
        "content": None,
        "tool_calls": [{"index": 0, "function": {"arguments": " }"}}],
    }
    result = _convert_dict_to_message_chunk(delta_with_tools, "role")
    expected_output = AIMessageChunk(
        content="",
        additional_kwargs={"tool_calls": delta_with_tools["tool_calls"]},
        id=None,
        tool_call_chunks=[ToolCallChunk(name=None, args=" }", id=None, index=0)],
    )
    assert result == expected_output


def test_convert_tool_message_chunk() -> None:
    delta = {
        "role": "tool",
        "content": "foo",
        "tool_call_id": "tool_call_id",
        "id": "some_id",
    }
    result = _convert_dict_to_message_chunk(delta, "default_role")
    expected_output = ToolMessageChunk(
        content="foo", id="some_id", tool_call_id="tool_call_id"
    )
    assert result == expected_output

    # convert back
    dict_result = _convert_message_to_dict(result)
    assert dict_result == delta


def test_convert_message_to_dict_function() -> None:
    with pytest.raises(ValueError, match="Function messages are not supported"):
        _convert_message_to_dict(FunctionMessage(content="", name="name"))
@@ -1,69 +0,0 @@
"""Test Databricks embeddings."""

from typing import Any, Dict, Generator
from unittest import mock

import pytest
from mlflow.deployments import BaseDeploymentClient  # type: ignore[import-untyped]

from langchain_databricks import DatabricksEmbeddings


def _mock_embeddings(endpoint: str, inputs: Dict[str, Any]) -> Dict[str, Any]:
    return {
        "object": "list",
        "data": [
            {
                "object": "embedding",
                "embedding": list(range(1536)),
                "index": 0,
            }
            for _ in inputs["input"]
        ],
        "model": "text-embedding-3-small",
        "usage": {"prompt_tokens": 8, "total_tokens": 8},
    }


@pytest.fixture
def mock_client() -> Generator:
    client = mock.MagicMock()
    client.predict.side_effect = _mock_embeddings
    with mock.patch("mlflow.deployments.get_deploy_client", return_value=client):
        yield client


@pytest.fixture
def embeddings() -> DatabricksEmbeddings:
    return DatabricksEmbeddings(
        endpoint="text-embedding-3-small",
        documents_params={"fruit": "apple"},
        query_params={"fruit": "banana"},
    )


def test_embed_documents(
    mock_client: BaseDeploymentClient, embeddings: DatabricksEmbeddings
) -> None:
    documents = ["foo"] * 30
    output = embeddings.embed_documents(documents)
    assert len(output) == 30
    assert len(output[0]) == 1536
    assert mock_client.predict.call_count == 2
    assert all(
        call_arg[1]["inputs"]["fruit"] == "apple"
        for call_arg in mock_client().predict.call_args_list
    )


def test_embed_query(
    mock_client: BaseDeploymentClient, embeddings: DatabricksEmbeddings
) -> None:
    query = "foo bar"
    output = embeddings.embed_query(query)
    assert len(output) == 1536
    mock_client.predict.assert_called_once()
    assert mock_client.predict.call_args[1] == {
        "endpoint": "text-embedding-3-small",
        "inputs": {"input": [query], "fruit": "banana"},
    }
@@ -1,12 +0,0 @@
from langchain_databricks import __all__

EXPECTED_ALL = [
    "ChatDatabricks",
    "DatabricksEmbeddings",
    "DatabricksVectorSearch",
    "__version__",
]


def test_all_imports() -> None:
    assert sorted(EXPECTED_ALL) == sorted(__all__)
@@ -1,629 +0,0 @@
import uuid
from typing import Any, Dict, Generator, List, Optional, Set
from unittest import mock
from unittest.mock import MagicMock, patch

import pytest
from langchain_core.embeddings import Embeddings

from langchain_databricks.vectorstores import DatabricksVectorSearch

INPUT_TEXTS = ["foo", "bar", "baz"]
DEFAULT_VECTOR_DIMENSION = 4


class FakeEmbeddings(Embeddings):
    """Fake embeddings functionality for testing."""

    def __init__(self, dimension: int = DEFAULT_VECTOR_DIMENSION):
        super().__init__()
        self.dimension = dimension

    def embed_documents(self, embedding_texts: List[str]) -> List[List[float]]:
        """Return simple embeddings."""
        return [
            [float(1.0)] * (self.dimension - 1) + [float(i)]
            for i in range(len(embedding_texts))
        ]

    def embed_query(self, text: str) -> List[float]:
        """Return simple embeddings."""
        return [float(1.0)] * (self.dimension - 1) + [float(0.0)]


EMBEDDING_MODEL = FakeEmbeddings()

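Editor's note: the fake embeddings are deterministic and tiny, which keeps the expected search responses and upsert payloads in the tests below easy to predict. For example, with the default dimension of 4:

    # EMBEDDING_MODEL.embed_documents(["foo", "bar", "baz"])
    #   -> [[1.0, 1.0, 1.0, 0.0], [1.0, 1.0, 1.0, 1.0], [1.0, 1.0, 1.0, 2.0]]
    # EMBEDDING_MODEL.embed_query("anything") -> [1.0, 1.0, 1.0, 0.0]
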
### Dummy similarity_search() Response ###
EXAMPLE_SEARCH_RESPONSE = {
    "manifest": {
        "column_count": 3,
        "columns": [
            {"name": "id"},
            {"name": "text"},
            {"name": "text_vector"},
            {"name": "score"},
        ],
    },
    "result": {
        "row_count": len(INPUT_TEXTS),
        "data_array": sorted(
            [
                [str(uuid.uuid4()), s, e, 0.5]
                for s, e in zip(
                    INPUT_TEXTS, EMBEDDING_MODEL.embed_documents(INPUT_TEXTS)
                )
            ],
            key=lambda x: x[2],  # type: ignore
            reverse=True,
        ),
    },
    "next_page_token": "",
}


### Dummy Indices ####

ENDPOINT_NAME = "test-endpoint"
DIRECT_ACCESS_INDEX = "test-direct-access-index"
DELTA_SYNC_INDEX = "test-delta-sync-index"
DELTA_SYNC_SELF_MANAGED_EMBEDDINGS_INDEX = "test-delta-sync-self-managed-index"
ALL_INDEX_NAMES = {
    DIRECT_ACCESS_INDEX,
    DELTA_SYNC_INDEX,
    DELTA_SYNC_SELF_MANAGED_EMBEDDINGS_INDEX,
}

INDEX_DETAILS = {
    DELTA_SYNC_INDEX: {
        "name": DELTA_SYNC_INDEX,
        "endpoint_name": ENDPOINT_NAME,
        "index_type": "DELTA_SYNC",
        "primary_key": "id",
        "delta_sync_index_spec": {
            "source_table": "ml.llm.source_table",
            "pipeline_type": "CONTINUOUS",
            "embedding_source_columns": [
                {
                    "name": "text",
                    "embedding_model_endpoint_name": "openai-text-embedding",
                }
            ],
        },
    },
    DELTA_SYNC_SELF_MANAGED_EMBEDDINGS_INDEX: {
        "name": DELTA_SYNC_SELF_MANAGED_EMBEDDINGS_INDEX,
        "endpoint_name": ENDPOINT_NAME,
        "index_type": "DELTA_SYNC",
        "primary_key": "id",
        "delta_sync_index_spec": {
            "source_table": "ml.llm.source_table",
            "pipeline_type": "CONTINUOUS",
            "embedding_vector_columns": [
                {
                    "name": "text_vector",
                    "embedding_dimension": DEFAULT_VECTOR_DIMENSION,
                }
            ],
        },
    },
    DIRECT_ACCESS_INDEX: {
        "name": DIRECT_ACCESS_INDEX,
        "endpoint_name": ENDPOINT_NAME,
        "index_type": "DIRECT_ACCESS",
        "primary_key": "id",
        "direct_access_index_spec": {
            "embedding_vector_columns": [
                {
                    "name": "text_vector",
                    "embedding_dimension": DEFAULT_VECTOR_DIMENSION,
                }
            ],
            "schema_json": f"{{"
            f'"{"id"}": "int", '
            f'"feat1": "str", '
            f'"feat2": "float", '
            f'"text": "string", '
            f'"{"text_vector"}": "array<float>"'
            f"}}",
        },
    },
}


@pytest.fixture(autouse=True)
def mock_vs_client() -> Generator:
    def _get_index(endpoint: str, index_name: str) -> MagicMock:
        from databricks.vector_search.client import VectorSearchIndex  # type: ignore

        if endpoint != ENDPOINT_NAME:
            raise ValueError(f"Unknown endpoint: {endpoint}")

        index = MagicMock(spec=VectorSearchIndex)
        index.describe.return_value = INDEX_DETAILS[index_name]
        index.similarity_search.return_value = EXAMPLE_SEARCH_RESPONSE
        return index

    mock_client = MagicMock()
    mock_client.get_index.side_effect = _get_index
    with mock.patch(
        "databricks.vector_search.client.VectorSearchClient",
        return_value=mock_client,
    ):
        yield


def init_vector_search(
    index_name: str, columns: Optional[List[str]] = None
) -> DatabricksVectorSearch:
    kwargs: Dict[str, Any] = {
        "endpoint": ENDPOINT_NAME,
        "index_name": index_name,
        "columns": columns,
    }
    if index_name != DELTA_SYNC_INDEX:
        kwargs.update(
            {
                "embedding": EMBEDDING_MODEL,
                "text_column": "text",
            }
        )
    return DatabricksVectorSearch(**kwargs)  # type: ignore[arg-type]


@pytest.mark.parametrize("index_name", ALL_INDEX_NAMES)
def test_init(index_name: str) -> None:
    vectorsearch = init_vector_search(index_name)
    assert vectorsearch.index.describe() == INDEX_DETAILS[index_name]


def test_init_fail_text_column_mismatch() -> None:
    with pytest.raises(ValueError, match=f"The index '{DELTA_SYNC_INDEX}' has"):
        DatabricksVectorSearch(
            endpoint=ENDPOINT_NAME,
            index_name=DELTA_SYNC_INDEX,
            text_column="some_other_column",
        )


@pytest.mark.parametrize("index_name", ALL_INDEX_NAMES - {DELTA_SYNC_INDEX})
def test_init_fail_no_text_column(index_name: str) -> None:
    with pytest.raises(ValueError, match="The `text_column` parameter is required"):
        DatabricksVectorSearch(
            endpoint=ENDPOINT_NAME,
            index_name=index_name,
            embedding=EMBEDDING_MODEL,
        )


def test_init_fail_columns_not_in_schema() -> None:
    columns = ["some_random_column"]
    with pytest.raises(ValueError, match="Some columns specified in `columns`"):
        init_vector_search(DIRECT_ACCESS_INDEX, columns=columns)


@pytest.mark.parametrize("index_name", ALL_INDEX_NAMES - {DELTA_SYNC_INDEX})
def test_init_fail_no_embedding(index_name: str) -> None:
    with pytest.raises(ValueError, match="The `embedding` parameter is required"):
        DatabricksVectorSearch(
            endpoint=ENDPOINT_NAME,
            index_name=index_name,
            text_column="text",
        )


def test_init_fail_embedding_already_specified_in_source() -> None:
    with pytest.raises(ValueError, match=f"The index '{DELTA_SYNC_INDEX}' uses"):
        DatabricksVectorSearch(
            endpoint=ENDPOINT_NAME,
            index_name=DELTA_SYNC_INDEX,
            embedding=EMBEDDING_MODEL,
        )


@pytest.mark.parametrize("index_name", ALL_INDEX_NAMES - {DELTA_SYNC_INDEX})
def test_init_fail_embedding_dim_mismatch(index_name: str) -> None:
    with pytest.raises(
        ValueError, match="embedding model's dimension '1000' does not match"
    ):
        DatabricksVectorSearch(
            endpoint=ENDPOINT_NAME,
            index_name=index_name,
            text_column="text",
            embedding=FakeEmbeddings(1000),
        )


def test_from_texts_not_supported() -> None:
    with pytest.raises(NotImplementedError, match="`from_texts` is not supported"):
        DatabricksVectorSearch.from_texts(INPUT_TEXTS, EMBEDDING_MODEL)


@pytest.mark.parametrize("index_name", ALL_INDEX_NAMES - {DIRECT_ACCESS_INDEX})
def test_add_texts_not_supported_for_delta_sync_index(index_name: str) -> None:
    vectorsearch = init_vector_search(index_name)
    with pytest.raises(
        NotImplementedError,
        match="`add_texts` is only supported for direct-access index.",
    ):
        vectorsearch.add_texts(INPUT_TEXTS)


def is_valid_uuid(val: str) -> bool:
    try:
        uuid.UUID(str(val))
        return True
    except ValueError:
        return False


def test_add_texts() -> None:
    vectorsearch = init_vector_search(DIRECT_ACCESS_INDEX)
    ids = [idx for idx, i in enumerate(INPUT_TEXTS)]
    vectors = EMBEDDING_MODEL.embed_documents(INPUT_TEXTS)

    added_ids = vectorsearch.add_texts(INPUT_TEXTS, ids=ids)
    vectorsearch.index.upsert.assert_called_once_with(
        [
            {
                "id": id_,
                "text": text,
                "text_vector": vector,
            }
            for text, vector, id_ in zip(INPUT_TEXTS, vectors, ids)
        ]
    )
    assert len(added_ids) == len(INPUT_TEXTS)
    assert added_ids == ids


def test_add_texts_handle_single_text() -> None:
    vectorsearch = init_vector_search(DIRECT_ACCESS_INDEX)
    vectors = EMBEDDING_MODEL.embed_documents(INPUT_TEXTS)

    added_ids = vectorsearch.add_texts(INPUT_TEXTS[0])
    vectorsearch.index.upsert.assert_called_once_with(
        [
            {
                "id": id_,
                "text": text,
                "text_vector": vector,
            }
            for text, vector, id_ in zip(INPUT_TEXTS, vectors, added_ids)
        ]
    )
    assert len(added_ids) == 1
    assert is_valid_uuid(added_ids[0])


def test_add_texts_with_default_id() -> None:
    vectorsearch = init_vector_search(DIRECT_ACCESS_INDEX)
    vectors = EMBEDDING_MODEL.embed_documents(INPUT_TEXTS)

    added_ids = vectorsearch.add_texts(INPUT_TEXTS)
    vectorsearch.index.upsert.assert_called_once_with(
        [
            {
                "id": id_,
                "text": text,
                "text_vector": vector,
            }
            for text, vector, id_ in zip(INPUT_TEXTS, vectors, added_ids)
        ]
    )
    assert len(added_ids) == len(INPUT_TEXTS)
    assert all([is_valid_uuid(id_) for id_ in added_ids])


def test_add_texts_with_metadata() -> None:
    vectorsearch = init_vector_search(DIRECT_ACCESS_INDEX)
    vectors = EMBEDDING_MODEL.embed_documents(INPUT_TEXTS)
    metadatas = [{"feat1": str(i), "feat2": i + 1000} for i in range(len(INPUT_TEXTS))]

    added_ids = vectorsearch.add_texts(INPUT_TEXTS, metadatas=metadatas)
    vectorsearch.index.upsert.assert_called_once_with(
        [
            {
                "id": id_,
                "text": text,
                "text_vector": vector,
                **metadata,  # type: ignore[arg-type]
            }
            for text, vector, id_, metadata in zip(
                INPUT_TEXTS, vectors, added_ids, metadatas
            )
        ]
    )
    assert len(added_ids) == len(INPUT_TEXTS)
    assert all([is_valid_uuid(id_) for id_ in added_ids])


@pytest.mark.parametrize("index_name", ALL_INDEX_NAMES - {DELTA_SYNC_INDEX})
def test_embeddings_property(index_name: str) -> None:
    vectorsearch = init_vector_search(index_name)
    assert vectorsearch.embeddings == EMBEDDING_MODEL


def test_delete() -> None:
    vectorsearch = init_vector_search(DIRECT_ACCESS_INDEX)
    vectorsearch.delete(["some id"])
    vectorsearch.index.delete.assert_called_once_with(["some id"])


def test_delete_fail_no_ids() -> None:
    vectorsearch = init_vector_search(DIRECT_ACCESS_INDEX)
    with pytest.raises(ValueError, match="ids must be provided."):
        vectorsearch.delete()


@pytest.mark.parametrize("index_name", ALL_INDEX_NAMES - {DIRECT_ACCESS_INDEX})
def test_delete_not_supported_for_delta_sync_index(index_name: str) -> None:
    vectorsearch = init_vector_search(index_name)
    with pytest.raises(
        NotImplementedError, match="`delete` is only supported for direct-access"
    ):
        vectorsearch.delete(["some id"])


@pytest.mark.parametrize("index_name", ALL_INDEX_NAMES)
@pytest.mark.parametrize("query_type", [None, "ANN"])
def test_similarity_search(index_name: str, query_type: Optional[str]) -> None:
    vectorsearch = init_vector_search(index_name)
    query = "foo"
    filters = {"some filter": True}
    limit = 7

    search_result = vectorsearch.similarity_search(
        query, k=limit, filter=filters, query_type=query_type
    )
    if index_name == DELTA_SYNC_INDEX:
        vectorsearch.index.similarity_search.assert_called_once_with(
            columns=["id", "text"],
            query_text=query,
            query_vector=None,
            filters=filters,
            num_results=limit,
            query_type=query_type,
        )
    else:
        vectorsearch.index.similarity_search.assert_called_once_with(
            columns=["id", "text"],
            query_text=None,
            query_vector=EMBEDDING_MODEL.embed_query(query),
            filters=filters,
            num_results=limit,
            query_type=query_type,
        )
    assert len(search_result) == len(INPUT_TEXTS)
    assert sorted([d.page_content for d in search_result]) == sorted(INPUT_TEXTS)
    assert all(["id" in d.metadata for d in search_result])


@pytest.mark.parametrize("index_name", ALL_INDEX_NAMES)
def test_similarity_search_hybrid(index_name: str) -> None:
    vectorsearch = init_vector_search(index_name)
    query = "foo"
    filters = {"some filter": True}
    limit = 7

    search_result = vectorsearch.similarity_search(
        query, k=limit, filter=filters, query_type="HYBRID"
    )
    if index_name == DELTA_SYNC_INDEX:
        vectorsearch.index.similarity_search.assert_called_once_with(
            columns=["id", "text"],
            query_text=query,
            query_vector=None,
            filters=filters,
            num_results=limit,
            query_type="HYBRID",
        )
    else:
        vectorsearch.index.similarity_search.assert_called_once_with(
            columns=["id", "text"],
            query_text=query,
            query_vector=EMBEDDING_MODEL.embed_query(query),
            filters=filters,
            num_results=limit,
            query_type="HYBRID",
        )
    assert len(search_result) == len(INPUT_TEXTS)
    assert sorted([d.page_content for d in search_result]) == sorted(INPUT_TEXTS)
    assert all(["id" in d.metadata for d in search_result])


def test_similarity_search_both_filter_and_filters_passed() -> None:
    vectorsearch = init_vector_search(DIRECT_ACCESS_INDEX)
    query = "foo"
    filter = {"some filter": True}
    filters = {"some other filter": False}

    vectorsearch.similarity_search(query, filter=filter, filters=filters)
    vectorsearch.index.similarity_search.assert_called_once_with(
        columns=["id", "text"],
        query_vector=EMBEDDING_MODEL.embed_query(query),
        # `filter` should prevail over `filters`
        filters=filter,
        num_results=4,
        query_text=None,
        query_type=None,
    )


@pytest.mark.parametrize("index_name", ALL_INDEX_NAMES - {DELTA_SYNC_INDEX})
@pytest.mark.parametrize(
    "columns, expected_columns",
    [
        (None, {"id"}),
        (["id", "text", "text_vector"], {"text_vector", "id"}),
    ],
)
def test_mmr_search(
    index_name: str, columns: Optional[List[str]], expected_columns: Set[str]
) -> None:
    vectorsearch = init_vector_search(index_name, columns=columns)

    query = INPUT_TEXTS[0]
    filters = {"some filter": True}
    limit = 1

    search_result = vectorsearch.max_marginal_relevance_search(
        query, k=limit, filters=filters
    )
    assert [doc.page_content for doc in search_result] == [INPUT_TEXTS[0]]
    assert [set(doc.metadata.keys()) for doc in search_result] == [expected_columns]


@pytest.mark.parametrize("index_name", ALL_INDEX_NAMES - {DELTA_SYNC_INDEX})
def test_mmr_parameters(index_name: str) -> None:
    vectorsearch = init_vector_search(index_name)

    query = INPUT_TEXTS[0]
    limit = 1
    fetch_k = 3
    lambda_mult = 0.25
    filters = {"some filter": True}

    with patch(
        "langchain_databricks.vectorstores.maximal_marginal_relevance"
    ) as mock_mmr:
        mock_mmr.return_value = [2]
        retriever = vectorsearch.as_retriever(
            search_type="mmr",
            search_kwargs={
                "k": limit,
                "fetch_k": fetch_k,
                "lambda_mult": lambda_mult,
                "filter": filters,
            },
        )
        search_result = retriever.invoke(query)

    mock_mmr.assert_called_once()
    assert mock_mmr.call_args[1]["lambda_mult"] == lambda_mult
    assert vectorsearch.index.similarity_search.call_args[1]["num_results"] == fetch_k
    assert vectorsearch.index.similarity_search.call_args[1]["filters"] == filters
    assert len(search_result) == limit


@pytest.mark.parametrize("index_name", ALL_INDEX_NAMES)
@pytest.mark.parametrize("threshold", [0.4, 0.5, 0.8])
def test_similarity_score_threshold(index_name: str, threshold: float) -> None:
    query = INPUT_TEXTS[0]
    limit = len(INPUT_TEXTS)

    vectorsearch = init_vector_search(index_name)
    retriever = vectorsearch.as_retriever(
        search_type="similarity_score_threshold",
        search_kwargs={"k": limit, "score_threshold": threshold},
    )
    search_result = retriever.invoke(query)
    if threshold <= 0.5:
        assert len(search_result) == len(INPUT_TEXTS)
    else:
        assert len(search_result) == 0


def test_standard_params() -> None:
    vectorstore = init_vector_search(DIRECT_ACCESS_INDEX)
    retriever = vectorstore.as_retriever()
    ls_params = retriever._get_ls_params()
    assert ls_params == {
        "ls_retriever_name": "vectorstore",
        "ls_vector_store_provider": "DatabricksVectorSearch",
        "ls_embedding_provider": "FakeEmbeddings",
    }

    vectorstore = init_vector_search(DELTA_SYNC_INDEX)
    retriever = vectorstore.as_retriever()
    ls_params = retriever._get_ls_params()
    assert ls_params == {
        "ls_retriever_name": "vectorstore",
        "ls_vector_store_provider": "DatabricksVectorSearch",
    }


@pytest.mark.parametrize("index_name", ALL_INDEX_NAMES - {DELTA_SYNC_INDEX})
@pytest.mark.parametrize("query_type", [None, "ANN"])
def test_similarity_search_by_vector(
    index_name: str, query_type: Optional[str]
) -> None:
    vectorsearch = init_vector_search(index_name)
    query_embedding = EMBEDDING_MODEL.embed_query("foo")
    filters = {"some filter": True}
    limit = 7

    search_result = vectorsearch.similarity_search_by_vector(
        query_embedding, k=limit, filter=filters, query_type=query_type
    )
    vectorsearch.index.similarity_search.assert_called_once_with(
        columns=["id", "text"],
        query_vector=query_embedding,
        filters=filters,
        num_results=limit,
        query_type=query_type,
        query_text=None,
    )
    assert len(search_result) == len(INPUT_TEXTS)
    assert sorted([d.page_content for d in search_result]) == sorted(INPUT_TEXTS)
    assert all(["id" in d.metadata for d in search_result])


@pytest.mark.parametrize("index_name", ALL_INDEX_NAMES - {DELTA_SYNC_INDEX})
def test_similarity_search_by_vector_hybrid(index_name: str) -> None:
    vectorsearch = init_vector_search(index_name)
    query_embedding = EMBEDDING_MODEL.embed_query("foo")
    filters = {"some filter": True}
    limit = 7

    search_result = vectorsearch.similarity_search_by_vector(
        query_embedding, k=limit, filter=filters, query_type="HYBRID", query="foo"
    )
    vectorsearch.index.similarity_search.assert_called_once_with(
        columns=["id", "text"],
        query_vector=query_embedding,
        filters=filters,
        num_results=limit,
        query_type="HYBRID",
        query_text="foo",
    )
    assert len(search_result) == len(INPUT_TEXTS)
    assert sorted([d.page_content for d in search_result]) == sorted(INPUT_TEXTS)
    assert all(["id" in d.metadata for d in search_result])


@pytest.mark.parametrize("index_name", ALL_INDEX_NAMES)
def test_similarity_search_empty_result(index_name: str) -> None:
    vectorsearch = init_vector_search(index_name)
    vectorsearch.index.similarity_search.return_value = {
        "manifest": {
            "column_count": 3,
            "columns": [
                {"name": "id"},
                {"name": "text"},
                {"name": "score"},
            ],
        },
        "result": {
            "row_count": 0,
            "data_array": [],
        },
        "next_page_token": "",
    }

    search_result = vectorsearch.similarity_search("foo")
    assert len(search_result) == 0


def test_similarity_search_by_vector_not_supported_for_managed_embedding() -> None:
    vectorsearch = init_vector_search(DELTA_SYNC_INDEX)
    query_embedding = EMBEDDING_MODEL.embed_query("foo")
    filters = {"some filter": True}
    limit = 7

    with pytest.raises(
        NotImplementedError, match="`similarity_search_by_vector` is not supported"
    ):
        vectorsearch.similarity_search_by_vector(
            query_embedding, k=limit, filters=filters
        )