"""LangChain v1 message conversion utilities for Ollama."""

from __future__ import annotations

from typing import Any, cast
from uuid import uuid4

from langchain_core.messages import content_blocks as types
from langchain_core.messages.ai import UsageMetadata
from langchain_core.messages.content_blocks import (
    ImageContentBlock,
    ReasoningContentBlock,
    TextContentBlock,
    ToolCall,
    ToolCallChunk,
)
from langchain_core.v1.messages import (
    AIMessage,
    AIMessageChunk,
    HumanMessage,
    MessageV1,
    ResponseMetadata,
    SystemMessage,
    ToolMessage,
)
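
# Context note (not in the original module): Ollama's chat API exchanges plain
# dicts of the rough form {"role": ..., "content": ..., "images": [...],
# "tool_calls": [...]}; the helpers below translate between that wire format
# and LangChain v1 message objects in both directions.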


def _get_usage_metadata_from_response(
    response: dict[str, Any],
) -> UsageMetadata | None:
    """Extract usage metadata from Ollama response."""
    input_tokens = response.get("prompt_eval_count")
    output_tokens = response.get("eval_count")
    if input_tokens is not None and output_tokens is not None:
        return UsageMetadata(
            input_tokens=input_tokens,
            output_tokens=output_tokens,
            total_tokens=input_tokens + output_tokens,
        )
    return None
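
# For illustration (hedged, not part of the original module): a completed
# response carrying {"prompt_eval_count": 26, "eval_count": 290} maps to
# UsageMetadata(input_tokens=26, output_tokens=290, total_tokens=316);
# a response missing either count yields None.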


def _convert_from_v1_to_ollama_format(message: MessageV1) -> dict[str, Any]:
    """Convert v1 message to Ollama API format."""
    if isinstance(message, HumanMessage):
        return _convert_human_message_v1(message)
    if isinstance(message, AIMessage):
        return _convert_ai_message_v1(message)
    if isinstance(message, SystemMessage):
        return _convert_system_message_v1(message)
    if isinstance(message, ToolMessage):
        return _convert_tool_message_v1(message)
    msg = f"Unsupported message type: {type(message)}"
    raise ValueError(msg)
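
# Sketch of expected dispatch behavior (hedged): a v1 HumanMessage whose
# content is a single text block, e.g.
#   HumanMessage(content=[{"type": "text", "text": "hi"}])
# should come back as {"role": "user", "content": "hi", "images": []}.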


def _convert_content_blocks_to_ollama_format(
    content: list[types.ContentBlock],
) -> tuple[str, list[str], list[dict[str, Any]]]:
    """Convert v1 content blocks to Ollama API format.

    Returns:
        Tuple of `(text_content, images, tool_calls)`
    """
    text_content = ""
    images: list[str] = []  # Base64 encoded image data
    tool_calls: list[dict[str, Any]] = []

    for block in content:
        block_type = block.get("type")
        if block_type == "text":
            text_block = cast(TextContentBlock, block)
            text_content += text_block["text"]
        elif block_type == "image":
            # Ollama doesn't need MIME type or other metadata
            image_block = cast(ImageContentBlock, block)
            base64_data = image_block.get("base64")
            if not base64_data:
                msg = "Only base64 image data is supported by Ollama"
                raise ValueError(msg)
            if not isinstance(base64_data, str):
                # (This shouldn't happen in practice, but just in case)
                msg = "Image content must be base64 encoded string"
                raise ValueError(msg)
            if not base64_data.strip():
                msg = "Image content cannot be empty"
                raise ValueError(msg)
            # Ensure we have plain/raw base64 data
            if base64_data.startswith("data:"):
                # Strip the data URI scheme (e.g., 'data:image/png;base64,')
                base64_data = base64_data.split(",")[1]
            images.append(base64_data)
        elif block_type == "tool_call":
            tool_call_block = cast(ToolCall, block)
            tool_calls.append(
                {
                    "type": "function",
                    "id": tool_call_block["id"],
                    "function": {
                        "name": tool_call_block["name"],
                        "arguments": tool_call_block["args"],
                    },
                }
            )
        elif block_type == "invalid_tool_call":
            # InvalidToolCall blocks are handled by converting to text
            # May revisit this in the future
            name = block.get("name", "unknown")
            error = block.get("error", "unknown error")
            text_content += f"[Invalid tool call: {name} - {error}]"
        else:
            # Reject content block types that Ollama has no representation for
            msg = f"Unsupported content block type: {block_type}"
            raise ValueError(msg)

    return text_content, images, tool_calls
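
# For illustration (hedged): content blocks such as
#   [{"type": "text", "text": "Describe this image"},
#    {"type": "image", "base64": "iVBORw0KG..."}]
# convert to ("Describe this image", ["iVBORw0KG..."], []).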


def _convert_human_message_v1(message: HumanMessage) -> dict[str, Any]:
    """Convert HumanMessage to Ollama format."""
    text_content, images, _ = _convert_content_blocks_to_ollama_format(message.content)

    msg: dict[str, Any] = {
        "role": "user",
        "content": text_content,
        "images": images,
    }
    if message.name:
        # Ollama doesn't have direct name support, include in content
        msg["content"] = f"[{message.name}]: {text_content}"

    return msg


def _convert_ai_message_v1(message: AIMessage) -> dict[str, Any]:
    """Convert AIMessage to Ollama format."""
    text_content, _, tool_calls = _convert_content_blocks_to_ollama_format(
        message.content
    )

    msg: dict[str, Any] = {
        "role": "assistant",
        "content": text_content,
    }

    if tool_calls:
        msg["tool_calls"] = tool_calls

    if message.name:
        # Ollama doesn't have direct name support, include in content
        msg["content"] = f"[{message.name}]: {text_content}"

    return msg


def _convert_system_message_v1(message: SystemMessage) -> dict[str, Any]:
    """Convert SystemMessage to Ollama format."""
    text_content, _, _ = _convert_content_blocks_to_ollama_format(message.content)

    return {
        "role": "system",
        "content": text_content,
    }


def _convert_tool_message_v1(message: ToolMessage) -> dict[str, Any]:
    """Convert ToolMessage to Ollama format."""
    text_content, _, _ = _convert_content_blocks_to_ollama_format(message.content)

    return {
        "role": "tool",
        "content": text_content,
        "tool_call_id": message.tool_call_id,
    }


def _convert_to_v1_from_ollama_format(response: dict[str, Any]) -> AIMessage:
    """Convert Ollama API response to AIMessage."""
    content: list[types.ContentBlock] = []
    message = response.get("message", {})

    # Handle reasoning content first (should come before main response)
    thinking_content = message.get("thinking")
    if thinking_content:
        content.append(
            ReasoningContentBlock(
                type="reasoning",
                reasoning=thinking_content,
            )
        )

    # Handle text content
    text_content = message.get("content")
    if text_content:
        content.append(TextContentBlock(type="text", text=text_content))

    # Handle tool calls
    if "tool_calls" in message:
        content.extend(
            ToolCall(
                type="tool_call",
                id=tool_call.get("id", str(uuid4())),
                name=tool_call["function"]["name"],
                args=tool_call["function"]["arguments"],
            )
            for tool_call in message["tool_calls"]
        )

    # Build response metadata
    response_metadata = ResponseMetadata()
    if "model" in response:
        response_metadata["model_name"] = response["model"]

    # Cast to dict[str, Any] to allow provider-specific fields: the
    # ResponseMetadata TypedDict only defines standard fields, but mypy doesn't
    # understand that total=False allows arbitrary additional keys at runtime
    metadata_as_dict = cast(dict[str, Any], response_metadata)
    for key in (
        "created_at",
        "done",
        "done_reason",
        "total_duration",
        "load_duration",
        "prompt_eval_count",
        "prompt_eval_duration",
        "eval_count",
        "eval_duration",
        "context",
    ):
        if key in response:
            metadata_as_dict[key] = response[key]

    return AIMessage(
        content=content,
        response_metadata=response_metadata,
        usage_metadata=_get_usage_metadata_from_response(response),
    )
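
# Sketch of the response shape this expects (hedged, based on the fields read
# above): {"model": "llama3", "created_at": ..., "done": True,
#          "message": {"role": "assistant", "content": "...",
#                      "thinking": "...", "tool_calls": [...]},
#          "prompt_eval_count": ..., "eval_count": ..., ...}.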


def _convert_chunk_to_v1(chunk: dict[str, Any]) -> AIMessageChunk:
    """Convert Ollama streaming chunk to AIMessageChunk."""
    content: list[types.ContentBlock] = []
    tool_call_chunks: list[ToolCallChunk] = []
    message = chunk.get("message", {})

    # Handle reasoning content first in chunks
    thinking_content = message.get("thinking")
    if thinking_content:
        content.append(
            ReasoningContentBlock(
                type="reasoning",
                reasoning=thinking_content,
            )
        )

    # Handle streaming text content
    text_content = message.get("content")
    if text_content:
        content.append(TextContentBlock(type="text", text=text_content))

    # Handle streaming tool calls
    if "tool_calls" in message:
        for i, tool_call in enumerate(message["tool_calls"]):
            tool_call_id = tool_call.get("id", f"lc_{uuid4()}")
            tool_name = tool_call.get("function", {}).get("name", "")
            tool_args = tool_call.get("function", {}).get("arguments", {})

            # Add to content blocks for final representation
            content.append(
                ToolCall(
                    type="tool_call",
                    id=tool_call_id,
                    name=tool_name,
                    args=tool_args,
                )
            )

            # Add to tool call chunks for streaming
            tool_call_chunks.append(
                ToolCallChunk(
                    type="tool_call_chunk",
                    id=tool_call_id,
                    name=tool_name,
                    args=tool_args,
                    index=i,
                )
            )

    # Build response metadata and usage metadata for the final chunk only
    response_metadata = None
    usage_metadata = None
    if chunk.get("done") is True:
        response_metadata = ResponseMetadata()
        if "model" in chunk:
            response_metadata["model_name"] = chunk["model"]
        # Cast to dict[str, Any] to allow provider-specific fields; see
        # _convert_to_v1_from_ollama_format for the rationale
        metadata_as_dict = cast(dict[str, Any], response_metadata)
        for key in (
            "created_at",
            "done_reason",
            "total_duration",
            "load_duration",
            "prompt_eval_count",
            "prompt_eval_duration",
            "eval_count",
            "eval_duration",
            "context",
        ):
            if key in chunk:
                metadata_as_dict[key] = chunk[key]
        usage_metadata = _get_usage_metadata_from_response(chunk)

    return AIMessageChunk(
        content=content,
        response_metadata=response_metadata or ResponseMetadata(),
        usage_metadata=usage_metadata,
        tool_call_chunks=tool_call_chunks,
    )
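
# Usage note (hedged): downstream callers typically accumulate successive
# AIMessageChunk values as they stream; only the final chunk, where Ollama
# sets done=True, carries response and usage metadata.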