more tests refactors
This commit is contained in:
parent 21e64987d0
commit 4d261089c6
@@ -32,6 +32,14 @@ llm = ChatOllama(model="llama3.1")
llm.invoke("Sing a ballad of LangChain.")
```

### v1 Chat Models

For v1 chat models, you can use the `ChatOllama` class with the `v1` namespace.

```python
from langchain_ollama.v1.chat_models import ChatOllama
```

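The v1 class keeps the familiar constructor and invocation surface; a minimal usage sketch (the `llama3.1` model name is illustrative and assumes the model has been pulled locally):

```python
from langchain_ollama.v1.chat_models import ChatOllama

# Assumes `ollama pull llama3.1` has been run locally.
llm = ChatOllama(model="llama3.1")
llm.invoke("Sing a ballad of LangChain.")
```
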
## [Embeddings](https://python.langchain.com/api_reference/ollama/embeddings/langchain_ollama.embeddings.OllamaEmbeddings.html#ollamaembeddings)

The `OllamaEmbeddings` class exposes embeddings from Ollama.
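For example, a minimal sketch of generating an embedding (the model name is illustrative; any locally pulled embedding-capable model works):

```python
from langchain_ollama import OllamaEmbeddings

# Assumes an embedding-capable model has been pulled, e.g. `ollama pull llama3.1`.
embeddings = OllamaEmbeddings(model="llama3.1")
vector = embeddings.embed_query("Sing a ballad of LangChain.")
```
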
@@ -1,21 +1,13 @@
"""Ollama specific chat model integration tests for reasoning models."""
"""Ollama integration tests for reasoning chat models."""

import pytest
from langchain_core.messages import AIMessageChunk, BaseMessageChunk, HumanMessage
from pydantic import BaseModel, Field

from langchain_ollama import ChatOllama

SAMPLE = "What is 3^3?"


class MathAnswer(BaseModel):
    """A mathematical expression and its numerical answer."""

    expression: str = Field(description="The mathematical expression to evaluate.")
    answer: int = Field(description="The numerical answer to the expression.")


@pytest.mark.parametrize(("model"), [("deepseek-r1:1.5b")])
def test_stream_no_reasoning(model: str) -> None:
    """Test streaming with `reasoning=False`"""
@@ -36,8 +28,6 @@ def test_stream_no_reasoning(model: str) -> None:
    assert isinstance(result, AIMessageChunk)
    assert result.content
    assert "<think>" not in result.content and "</think>" not in result.content
    if hasattr(result, "additional_kwargs"):
        # v0 format
        assert "reasoning_content" not in result.additional_kwargs


@@ -61,8 +51,6 @@ async def test_astream_no_reasoning(model: str) -> None:
    assert isinstance(result, AIMessageChunk)
    assert result.content
    assert "<think>" not in result.content and "</think>" not in result.content
    if hasattr(result, "additional_kwargs"):
        # v0 format
        assert "reasoning_content" not in result.additional_kwargs


@@ -85,10 +73,8 @@ def test_stream_reasoning_none(model: str) -> None:
        result += chunk
    assert isinstance(result, AIMessageChunk)
    assert result.content
    assert "reasoning_content" not in result.additional_kwargs
    assert "<think>" in result.content and "</think>" in result.content
    if not isinstance(result.content, list):
        # v0 format (content as string)
        assert "reasoning_content" not in result.additional_kwargs
        assert "<think>" not in result.additional_kwargs.get("reasoning_content", "")
        assert "</think>" not in result.additional_kwargs.get("reasoning_content", "")

@@ -112,10 +98,8 @@ async def test_astream_reasoning_none(model: str) -> None:
        result += chunk
    assert isinstance(result, AIMessageChunk)
    assert result.content
    assert "reasoning_content" not in result.additional_kwargs
    assert "<think>" in result.content and "</think>" in result.content
    if not isinstance(result.content, list):
        # v0 format (content as string)
        assert "reasoning_content" not in result.additional_kwargs
        assert "<think>" not in result.additional_kwargs.get("reasoning_content", "")
        assert "</think>" not in result.additional_kwargs.get("reasoning_content", "")

@@ -142,8 +126,6 @@ def test_reasoning_stream(model: str) -> None:
    assert "reasoning_content" in result.additional_kwargs
    assert len(result.additional_kwargs["reasoning_content"]) > 0
    assert "<think>" not in result.content and "</think>" not in result.content
    if not isinstance(result.content, list):
        # v0 format (content as string)
        assert "<think>" not in result.additional_kwargs["reasoning_content"]
        assert "</think>" not in result.additional_kwargs["reasoning_content"]

@@ -170,8 +152,6 @@ async def test_reasoning_astream(model: str) -> None:
    assert "reasoning_content" in result.additional_kwargs
    assert len(result.additional_kwargs["reasoning_content"]) > 0
    assert "<think>" not in result.content and "</think>" not in result.content
    if not isinstance(result.content, list):
        # v0 format (content as string)
        assert "<think>" not in result.additional_kwargs["reasoning_content"]
        assert "</think>" not in result.additional_kwargs["reasoning_content"]

@@ -183,10 +163,8 @@ def test_invoke_no_reasoning(model: str) -> None:
    message = HumanMessage(content=SAMPLE)
    result = llm.invoke([message])
    assert result.content
    assert "<think>" not in result.content and "</think>" not in result.content
    if hasattr(result, "additional_kwargs"):
        # v0 format
        assert "reasoning_content" not in result.additional_kwargs
    assert "<think>" not in result.content and "</think>" not in result.content


@pytest.mark.parametrize(("model"), [("deepseek-r1:1.5b")])
@@ -196,10 +174,8 @@ async def test_ainvoke_no_reasoning(model: str) -> None:
    message = HumanMessage(content=SAMPLE)
    result = await llm.ainvoke([message])
    assert result.content
    assert "<think>" not in result.content and "</think>" not in result.content
    if hasattr(result, "additional_kwargs"):
        # v0 format
        assert "reasoning_content" not in result.additional_kwargs
    assert "<think>" not in result.content and "</think>" not in result.content


@pytest.mark.parametrize(("model"), [("deepseek-r1:1.5b")])
@@ -211,8 +187,6 @@ def test_invoke_reasoning_none(model: str) -> None:
    assert result.content
    assert "reasoning_content" not in result.additional_kwargs
    assert "<think>" in result.content and "</think>" in result.content
    if not isinstance(result.content, list):
        # v0 format (content as string)
        assert "<think>" not in result.additional_kwargs.get("reasoning_content", "")
        assert "</think>" not in result.additional_kwargs.get("reasoning_content", "")

@@ -226,8 +200,6 @@ async def test_ainvoke_reasoning_none(model: str) -> None:
    assert result.content
    assert "reasoning_content" not in result.additional_kwargs
    assert "<think>" in result.content and "</think>" in result.content
    if not isinstance(result.content, list):
        # v0 format (content as string)
        assert "<think>" not in result.additional_kwargs.get("reasoning_content", "")
        assert "</think>" not in result.additional_kwargs.get("reasoning_content", "")

@@ -242,8 +214,6 @@ def test_reasoning_invoke(model: str) -> None:
    assert "reasoning_content" in result.additional_kwargs
    assert len(result.additional_kwargs["reasoning_content"]) > 0
    assert "<think>" not in result.content and "</think>" not in result.content
    if not isinstance(result.content, list):
        # v0 format (content as string)
        assert "<think>" not in result.additional_kwargs["reasoning_content"]
        assert "</think>" not in result.additional_kwargs["reasoning_content"]

@@ -258,8 +228,6 @@ async def test_reasoning_ainvoke(model: str) -> None:
    assert "reasoning_content" in result.additional_kwargs
    assert len(result.additional_kwargs["reasoning_content"]) > 0
    assert "<think>" not in result.content and "</think>" not in result.content
    # Only check additional_kwargs for v0 format (content as string)
    if not isinstance(result.content, list):
        assert "<think>" not in result.additional_kwargs["reasoning_content"]
        assert "</think>" not in result.additional_kwargs["reasoning_content"]

@@ -7,6 +7,7 @@ from langchain_core.runnables import RunnableConfig
from langchain_ollama.llms import OllamaLLM

MODEL_NAME = "llama3.1"
REASONING_MODEL_NAME = "deepseek-r1:1.5b"
SAMPLE = "What is 3^3?"


@@ -18,7 +19,7 @@ def test_stream_text_tokens() -> None:
        assert isinstance(token, str)


@pytest.mark.parametrize(("model"), [("deepseek-r1:1.5b")])
@pytest.mark.parametrize(("model"), [(REASONING_MODEL_NAME)])
def test__stream_no_reasoning(model: str) -> None:
    """Test low-level chunk streaming of a simple prompt with `reasoning=False`."""
    llm = OllamaLLM(model=model, num_ctx=2**12)
@@ -39,7 +40,7 @@ def test__stream_no_reasoning(model: str) -> None:
    assert "reasoning_content" not in result_chunk.generation_info  # type: ignore[operator]


@pytest.mark.parametrize(("model"), [("deepseek-r1:1.5b")])
@pytest.mark.parametrize(("model"), [(REASONING_MODEL_NAME)])
def test__stream_with_reasoning(model: str) -> None:
    """Test low-level chunk streaming with `reasoning=True`."""
    llm = OllamaLLM(model=model, num_ctx=2**12, reasoning=True)
@@ -71,7 +72,7 @@ async def test_astream_text_tokens() -> None:
        assert isinstance(token, str)


@pytest.mark.parametrize(("model"), [("deepseek-r1:1.5b")])
@pytest.mark.parametrize(("model"), [(REASONING_MODEL_NAME)])
async def test__astream_no_reasoning(model: str) -> None:
    """Test low-level async chunk streaming with `reasoning=False`."""
    llm = OllamaLLM(model=model, num_ctx=2**12)
@@ -89,7 +90,7 @@ async def test__astream_no_reasoning(model: str) -> None:
    assert "reasoning_content" not in result_chunk.generation_info  # type: ignore[operator]


@pytest.mark.parametrize(("model"), [("deepseek-r1:1.5b")])
@pytest.mark.parametrize(("model"), [(REASONING_MODEL_NAME)])
async def test__astream_with_reasoning(model: str) -> None:
    """Test low-level async chunk streaming with `reasoning=True`."""
    llm = OllamaLLM(model=model, num_ctx=2**12, reasoning=True)
@@ -15,6 +15,7 @@ from pydantic import ValidationError
from langchain_ollama.v1.chat_models import ChatOllama

DEFAULT_MODEL_NAME = "llama3.1"
REASONING_MODEL_NAME = "deepseek-r1:1.5b"


@tool
@@ -219,8 +220,8 @@ class TestChatOllamaV1(ChatModelV1IntegrationTests):

    @pytest.mark.xfail(
        reason=(
            "Default llama3.1 model does not support reasoning. Override uses "
            "reasoning-capable model with reasoning=True enabled."
            f"{DEFAULT_MODEL_NAME} does not support reasoning. Override uses "
            "reasoning-capable model with `reasoning=True` enabled."
        ),
        strict=False,
    )
@@ -234,7 +235,7 @@ class TestChatOllamaV1(ChatModelV1IntegrationTests):
            pytest.skip("Model does not support ReasoningContentBlock.")

        reasoning_enabled_model = ChatOllama(
            model="deepseek-r1:1.5b", reasoning=True, validate_model_on_init=True
            model=REASONING_MODEL_NAME, reasoning=True, validate_model_on_init=True
        )

        message = HumanMessage("Think step by step: What is 2 + 2?")
@@ -251,6 +252,8 @@ class TestChatOllamaV1(ChatModelV1IntegrationTests):
            f"Content blocks: {[block.get('type') for block in result.content]}"
        )

        # Additional Ollama reasoning tests in v1/chat_models/test_chat_models_v1.py

    @patch("langchain_ollama.v1.chat_models.Client.list")
    def test_init_model_not_found(self, mock_list: MagicMock) -> None:
        """Test that a ValueError is raised when the model is not found."""
@@ -9,12 +9,17 @@ from __future__ import annotations
from typing import Annotated, Optional

import pytest
from langchain_core.messages.content_blocks import is_reasoning_block
from langchain_core.v1.messages import AIMessageChunk, HumanMessage
from pydantic import BaseModel, Field
from typing_extensions import TypedDict

from langchain_ollama.v1.chat_models import ChatOllama

DEFAULT_MODEL_NAME = "llama3.1"
REASONING_MODEL_NAME = "deepseek-r1:1.5b"

SAMPLE = "What is 3^3?"


@pytest.mark.parametrize(("method"), [("function_calling"), ("json_schema")])
@@ -104,50 +109,335 @@ def test_structured_output_deeply_nested(model: str) -> None:
        assert isinstance(chunk, Data)


# def test_reasoning_content_blocks() -> None:
#     """Test that the model supports reasoning content blocks."""
#     llm = ChatOllama(model=DEFAULT_MODEL_NAME, temperature=0)
@pytest.mark.parametrize(("model"), [(REASONING_MODEL_NAME)])
def test_stream_no_reasoning(model: str) -> None:
    """Test streaming with `reasoning=False`"""
    llm = ChatOllama(model=model, num_ctx=2**12, reasoning=False)
    result = None
    for chunk in llm.stream(SAMPLE):
        assert isinstance(chunk, AIMessageChunk)
        if result is None:
            result = chunk
            continue
        result += chunk
    assert isinstance(result, AIMessageChunk)
    assert result.content

#     # Test with a reasoning prompt
#     messages = [HumanMessage("Think step by step and solve: What is 2 + 2?")]
    content_types = set()
    for content_block in result.content:
        type_ = content_block.get("type")
        if type_:
            content_types.add(type_)

#     result = llm.invoke(messages)

#     # Check that we get an AIMessage with content blocks
#     assert isinstance(result, AIMessage)
#     assert len(result.content) > 0

#     # For streaming, check that reasoning blocks are properly handled
#     chunks = []
#     for chunk in llm.stream(messages):
#         chunks.append(chunk)
#         assert isinstance(chunk, AIMessageChunk)

#     assert len(chunks) > 0
    assert "reasoning" not in content_types, (
        f"Expected no reasoning content, got types: {content_types}"
    )
    assert "non_standard" not in content_types, (
        f"Expected no non-standard content, got types: {content_types}"
    )
    assert "<think>" not in result.text and "</think>" not in result.text


# def test_multimodal_support() -> None:
#     """Test that the model supports image content blocks."""
#     llm = ChatOllama(model=DEFAULT_MODEL_NAME, temperature=0)
@pytest.mark.parametrize(("model"), [(REASONING_MODEL_NAME)])
async def test_astream_no_reasoning(model: str) -> None:
    """Test async streaming with `reasoning=False`"""
    llm = ChatOllama(model=model, num_ctx=2**12, reasoning=False)
    result = None
    async for chunk in llm.astream(SAMPLE):
        assert isinstance(chunk, AIMessageChunk)
        if result is None:
            result = chunk
            continue
        result += chunk
    assert isinstance(result, AIMessageChunk)
    assert result.content

#     # Create a message with image content block
#     from langchain_core.messages.content_blocks import (
#         create_image_block,
#         create_text_block,
#     )
    content_types = set()
    for content_block in result.content:
        type_ = content_block.get("type")
        if type_:
            content_types.add(type_)

#     # Test with a simple base64 placeholder (real integration would use actual image)
#     message = HumanMessage(
#         content=[
#             create_text_block("Describe this image:"),
#             create_image_block(
#                 base64="iVBORw0KGgoAAAANSUhEUgAAAAEAAAABCAYAAAAfFcSJAAAADUlEQVR42mNkYPhfDwAChwGA60e6kgAAAABJRU5ErkJggg=="  # noqa: E501
#             ),
#         ]
#     )
    assert "reasoning" not in content_types, (
        f"Expected no reasoning content, got types: {content_types}"
    )
    assert "non_standard" not in content_types, (
        f"Expected no non-standard content, got types: {content_types}"
    )
    assert "<think>" not in result.text and "</think>" not in result.text

#     result = llm.invoke([message])

#     # Check that we get a response (even if it's just acknowledging the image)
#     assert isinstance(result, AIMessage)
#     assert len(result.content) > 0
@pytest.mark.parametrize(("model"), [(REASONING_MODEL_NAME)])
def test_stream_reasoning_none(model: str) -> None:
    """Test streaming with `reasoning=None`"""
    llm = ChatOllama(model=model, num_ctx=2**12, reasoning=None)
    result = None
    for chunk in llm.stream(SAMPLE):
        assert isinstance(chunk, AIMessageChunk)
        if result is None:
            result = chunk
            continue
        result += chunk
    assert isinstance(result, AIMessageChunk)
    assert result.content

    assert "<think>" in result.text and "</think>" in result.text


@pytest.mark.parametrize(("model"), [(REASONING_MODEL_NAME)])
async def test_astream_reasoning_none(model: str) -> None:
    """Test async streaming with `reasoning=None`"""
    llm = ChatOllama(model=model, num_ctx=2**12, reasoning=None)
    result = None
    async for chunk in llm.astream(SAMPLE):
        assert isinstance(chunk, AIMessageChunk)
        if result is None:
            result = chunk
            continue
        result += chunk
    assert isinstance(result, AIMessageChunk)
    assert result.content

    assert "<think>" in result.text and "</think>" in result.text


@pytest.mark.parametrize(("model"), [(REASONING_MODEL_NAME)])
def test_reasoning_stream(model: str) -> None:
    """Test streaming with `reasoning=True`"""
    llm = ChatOllama(model=model, num_ctx=2**12, reasoning=True)
    result = None
    for chunk in llm.stream(SAMPLE):
        assert isinstance(chunk, AIMessageChunk)
        if result is None:
            result = chunk
            continue
        result += chunk
    assert isinstance(result, AIMessageChunk)
    assert result.content

    content_types = set()
    for content_block in result.content:
        type_ = content_block.get("type")
        if type_:
            content_types.add(type_)

    assert "reasoning" in content_types, (
        f"Expected reasoning content, got types: {content_types}"
    )
    assert "non_standard" not in content_types, (
        f"Expected no non-standard content, got types: {content_types}"
    )
    assert "<think>" not in result.text and "</think>" not in result.text

    # Assert non-empty reasoning content in ReasoningContentBlock
    reasoning_blocks = [block for block in result.content if is_reasoning_block(block)]
    for block in reasoning_blocks:
        assert block.get("reasoning"), "Expected non-empty reasoning content"
        assert len(block.get("reasoning", "")) > 0, (
            "Expected reasoning content to be non-empty"
        )


@pytest.mark.parametrize(("model"), [(REASONING_MODEL_NAME)])
async def test_reasoning_astream(model: str) -> None:
    """Test async streaming with `reasoning=True`"""
    llm = ChatOllama(model=model, num_ctx=2**12, reasoning=True)
    result = None
    async for chunk in llm.astream(SAMPLE):
        assert isinstance(chunk, AIMessageChunk)
        if result is None:
            result = chunk
            continue
        result += chunk
    assert isinstance(result, AIMessageChunk)
    assert result.content

    content_types = set()
    for content_block in result.content:
        type_ = content_block.get("type")
        if type_:
            content_types.add(type_)

    assert "reasoning" in content_types, (
        f"Expected reasoning content, got types: {content_types}"
    )
    assert "non_standard" not in content_types, (
        f"Expected no non-standard content, got types: {content_types}"
    )
    assert "<think>" not in result.text and "</think>" not in result.text

    # Assert non-empty reasoning content in ReasoningContentBlock
    reasoning_blocks = [block for block in result.content if is_reasoning_block(block)]
    for block in reasoning_blocks:
        assert block.get("reasoning"), "Expected non-empty reasoning content"
        assert len(block.get("reasoning", "")) > 0, (
            "Expected reasoning content to be non-empty"
        )


@pytest.mark.parametrize(("model"), [(REASONING_MODEL_NAME)])
def test_invoke_no_reasoning(model: str) -> None:
    """Test using invoke with `reasoning=False`"""
    llm = ChatOllama(model=model, num_ctx=2**12, reasoning=False)
    message = HumanMessage(SAMPLE)
    result = llm.invoke([message])
    assert result.content

    content_types = set()
    for content_block in result.content:
        type_ = content_block.get("type")
        if type_:
            content_types.add(type_)

    assert "reasoning" not in content_types, (
        f"Expected no reasoning content, got types: {content_types}"
    )
    assert "non_standard" not in content_types, (
        f"Expected no non-standard content, got types: {content_types}"
    )
    assert "<think>" not in result.text and "</think>" not in result.text


@pytest.mark.parametrize(("model"), [(REASONING_MODEL_NAME)])
async def test_ainvoke_no_reasoning(model: str) -> None:
    """Test using async invoke with `reasoning=False`"""
    llm = ChatOllama(model=model, num_ctx=2**12, reasoning=False)
    message = HumanMessage(content=SAMPLE)
    result = await llm.ainvoke([message])
    assert result.content

    content_types = set()
    for content_block in result.content:
        type_ = content_block.get("type")
        if type_:
            content_types.add(type_)

    assert "reasoning" not in content_types, (
        f"Expected no reasoning content, got types: {content_types}"
    )
    assert "non_standard" not in content_types, (
        f"Expected no non-standard content, got types: {content_types}"
    )
    assert "<think>" not in result.text and "</think>" not in result.text


@pytest.mark.parametrize(("model"), [(REASONING_MODEL_NAME)])
def test_invoke_reasoning_none(model: str) -> None:
    """Test using invoke with `reasoning=None`"""
    llm = ChatOllama(model=model, num_ctx=2**12, reasoning=None)
    message = HumanMessage(content=SAMPLE)
    result = llm.invoke([message])
    assert result.content

    assert "<think>" in result.text and "</think>" in result.text


@pytest.mark.parametrize(("model"), [(REASONING_MODEL_NAME)])
async def test_ainvoke_reasoning_none(model: str) -> None:
    """Test using async invoke with `reasoning=None`"""
    llm = ChatOllama(model=model, num_ctx=2**12, reasoning=None)
    message = HumanMessage(content=SAMPLE)
    result = await llm.ainvoke([message])
    assert result.content

    assert "<think>" in result.text and "</think>" in result.text


@pytest.mark.parametrize(("model"), [(REASONING_MODEL_NAME)])
def test_reasoning_invoke(model: str) -> None:
    """Test invoke with `reasoning=True`"""
    llm = ChatOllama(model=model, num_ctx=2**12, reasoning=True)
    message = HumanMessage(content=SAMPLE)
    result = llm.invoke([message])
    assert result.content

    content_types = set()
    for content_block in result.content:
        type_ = content_block.get("type")
        if type_:
            content_types.add(type_)

    assert "reasoning" in content_types, (
        f"Expected reasoning content, got types: {content_types}"
    )
    assert "non_standard" not in content_types, (
        f"Expected no non-standard content, got types: {content_types}"
    )
    assert "<think>" not in result.text and "</think>" not in result.text

    # Assert non-empty reasoning content in ReasoningContentBlock
    reasoning_blocks = [block for block in result.content if is_reasoning_block(block)]
    for block in reasoning_blocks:
        assert block.get("reasoning"), "Expected non-empty reasoning content"
        assert len(block.get("reasoning", "")) > 0, (
            "Expected reasoning content to be non-empty"
        )


@pytest.mark.parametrize(("model"), [(REASONING_MODEL_NAME)])
async def test_reasoning_ainvoke(model: str) -> None:
    """Test invoke with `reasoning=True`"""
    llm = ChatOllama(model=model, num_ctx=2**12, reasoning=True)
    message = HumanMessage(content=SAMPLE)
    result = await llm.ainvoke([message])
    assert result.content

    content_types = set()
    for content_block in result.content:
        type_ = content_block.get("type")
        if type_:
            content_types.add(type_)

    assert "reasoning" in content_types, (
        f"Expected reasoning content, got types: {content_types}"
    )
    assert "non_standard" not in content_types, (
        f"Expected no non-standard content, got types: {content_types}"
    )
    assert "<think>" not in result.text and "</think>" not in result.text

    # Assert non-empty reasoning content in ReasoningContentBlock
    reasoning_blocks = [block for block in result.content if is_reasoning_block(block)]
    for block in reasoning_blocks:
        assert block.get("reasoning"), "Expected non-empty reasoning content"
        assert len(block.get("reasoning", "")) > 0, (
            "Expected reasoning content to be non-empty"
        )


@pytest.mark.parametrize(("model"), [(REASONING_MODEL_NAME)])
def test_think_tag_stripping_necessity(model: str) -> None:
    """Test that demonstrates why ``_strip_think_tags`` is necessary.

    DeepSeek R1 models include reasoning/thinking as their default behavior.
    When ``reasoning=False`` is set, the user explicitly wants no reasoning content,
    but Ollama cannot disable thinking at the API level for these models.
    Therefore, post-processing is required to strip the ``<think>`` tags.

    This test documents the specific behavior that necessitates the
    ``_strip_think_tags`` function in the chat_models.py implementation.
    """
    # Test with reasoning=None (default behavior - should include think tags)
    llm_default = ChatOllama(model=model, reasoning=None, num_ctx=2**12)
    message = HumanMessage(content=SAMPLE)

    result_default = llm_default.invoke([message])

    # With reasoning=None, the model's default behavior includes <think> tags
    # This demonstrates why we need the stripping logic
    assert "<think>" in result_default.text
    assert "</think>" in result_default.text

    # Test with reasoning=False (explicit disable - should NOT include think tags)
    llm_disabled = ChatOllama(model=model, reasoning=False, num_ctx=2**12)

    result_disabled = llm_disabled.invoke([message])

    # With reasoning=False, think tags should be stripped from content
    # This verifies that _strip_think_tags is working correctly
    assert "<think>" not in result_disabled.text
    assert "</think>" not in result_disabled.text

    # Verify the difference: same model, different reasoning settings
    # Default includes tags, disabled strips them
    assert result_default.content != result_disabled.content
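The post-processing the docstring above motivates amounts to deleting `<think>...</think>` spans from the returned text when reasoning output is explicitly disabled. A minimal, hypothetical sketch of that idea follows; it is not the actual `_strip_think_tags` from `chat_models.py`, whose signature and edge-case handling may differ:

```python
import re

# Hypothetical illustration only: drop <think>...</think> spans from a model
# response, then strip whatever leading whitespace the removal leaves behind.
_THINK_TAG_RE = re.compile(r"<think>.*?</think>", flags=re.DOTALL)


def strip_think_tags(text: str) -> str:
    """Remove <think>...</think> blocks from ``text``."""
    return _THINK_TAG_RE.sub("", text).lstrip()
```
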
@@ -3188,7 +3188,12 @@ class ChatModelV1IntegrationTests(ChatModelV1Tests):
        assert result.content is not None

    def test_reasoning_content_blocks_basic(self, model: BaseChatModel) -> None:
        """Test that the model can generate ``ReasoningContentBlock``."""
        """Test that the model can generate ``ReasoningContentBlock``.

        If your integration requires a reasoning parameter to be explicitly set, you
        will need to override this test to set it appropriately.

        """
        if not self.supports_reasoning_content_blocks:
            pytest.skip("Model does not support ReasoningContentBlock.")

@@ -3202,7 +3207,10 @@ class ChatModelV1IntegrationTests(ChatModelV1Tests):
            for block in result.content
            if isinstance(block, dict) and is_reasoning_block(block)
        ]
        assert len(reasoning_blocks) > 0
        assert len(reasoning_blocks) > 0, (
            "Expected reasoning content blocks but found none. "
            f"Content blocks: {[block.get('type') for block in result.content]}"
        )

    def test_non_standard_content_blocks_basic(self, model: BaseChatModel) -> None:
        """Test that the model can handle ``NonStandardContentBlock``."""