test(mistralai): stabilize integration tests with rate limiting and retries (#37588)

Mistral integration tests have been flaky against the live API. This
adds a shared, xdist-aware rate limiter and a global retry policy so
transient 429s no longer fail the suite.
This commit is contained in:
Mason Daugherty
2026-05-20 19:49:25 -05:00
committed by GitHub
parent 5197dd5985
commit 4d2efcd756
6 changed files with 51 additions and 7 deletions

View File

@@ -21,7 +21,7 @@ test_watch:
integration_test integration_tests: integration_test integration_tests:
uv run --group test --group test_integration pytest -v --tb=short -n auto $(TEST_FILE) uv run --group test --group test_integration pytest -v --tb=short -n auto --retries 3 --retry-delay 2 $(TEST_FILE)
###################### ######################

View File

@@ -44,6 +44,7 @@ Reddit = "https://www.reddit.com/r/LangChain/"
test = [ test = [
"pytest>=9.0.3,<10.0.0", "pytest>=9.0.3,<10.0.0",
"pytest-asyncio>=1.3.0,<2.0.0", "pytest-asyncio>=1.3.0,<2.0.0",
"pytest-retry>=1.7.0,<1.8.0",
"pytest-watcher>=0.3.4,<1.0.0", "pytest-watcher>=0.3.4,<1.0.0",
"pytest-xdist>=3.6.1,<4.0.0", "pytest-xdist>=3.6.1,<4.0.0",
"langchain-core>=1.4.0,<2.0.0", "langchain-core>=1.4.0,<2.0.0",

View File

@@ -0,0 +1,18 @@
"""Shared rate limiter for Mistral integration tests.
Scaled by ``PYTEST_XDIST_WORKER_COUNT`` so aggregate QPS across all xdist
workers stays bounded near the target rate.
"""
from __future__ import annotations
import os
from langchain_core.rate_limiters import InMemoryRateLimiter
# Request budget for the whole test run, i.e. summed over every worker.
_TARGET_REQUESTS_PER_SECOND = 0.5

# Worker count is read from ``PYTEST_XDIST_WORKER_COUNT``; when the variable
# is absent a single worker is assumed, and any value below 1 is clamped to 1
# so the division below is always well defined.
_raw_worker_count = os.getenv("PYTEST_XDIST_WORKER_COUNT", "1")
_WORKER_COUNT = max(1, int(_raw_worker_count))

# Every worker process imports this module and therefore builds its own
# limiter, so each one receives an equal slice of the overall budget.
_per_worker_requests_per_second = _TARGET_REQUESTS_PER_SECOND / _WORKER_COUNT

rate_limiter = InMemoryRateLimiter(
    requests_per_second=_per_worker_requests_per_second,
)

View File

@@ -13,11 +13,12 @@ from pydantic import BaseModel
from typing_extensions import TypedDict from typing_extensions import TypedDict
from langchain_mistralai.chat_models import ChatMistralAI from langchain_mistralai.chat_models import ChatMistralAI
from tests.integration_tests._rate_limiter import rate_limiter
async def test_astream() -> None: async def test_astream() -> None:
"""Test streaming tokens from ChatMistralAI.""" """Test streaming tokens from ChatMistralAI."""
llm = ChatMistralAI() llm = ChatMistralAI(rate_limiter=rate_limiter)
full: BaseMessageChunk | None = None full: BaseMessageChunk | None = None
chunks_with_token_counts = 0 chunks_with_token_counts = 0
@@ -70,7 +71,7 @@ def _check_parsed_result(result: Any, schema: Any) -> None:
@pytest.mark.parametrize("schema", [Book, BookDict, Book.model_json_schema()]) @pytest.mark.parametrize("schema", [Book, BookDict, Book.model_json_schema()])
def test_structured_output_json_schema(schema: Any) -> None: def test_structured_output_json_schema(schema: Any) -> None:
llm = ChatMistralAI(model="ministral-8b-latest") # type: ignore[call-arg] llm = ChatMistralAI(model="ministral-8b-latest", rate_limiter=rate_limiter) # type: ignore[call-arg]
structured_llm = llm.with_structured_output(schema, method="json_schema") structured_llm = llm.with_structured_output(schema, method="json_schema")
messages = [ messages = [
@@ -91,7 +92,7 @@ def test_structured_output_json_schema(schema: Any) -> None:
@pytest.mark.parametrize("schema", [Book, BookDict, Book.model_json_schema()]) @pytest.mark.parametrize("schema", [Book, BookDict, Book.model_json_schema()])
async def test_structured_output_json_schema_async(schema: Any) -> None: async def test_structured_output_json_schema_async(schema: Any) -> None:
llm = ChatMistralAI(model="ministral-8b-latest") # type: ignore[call-arg] llm = ChatMistralAI(model="ministral-8b-latest", rate_limiter=rate_limiter) # type: ignore[call-arg]
structured_llm = llm.with_structured_output(schema, method="json_schema") structured_llm = llm.with_structured_output(schema, method="json_schema")
messages = [ messages = [
@@ -116,6 +117,7 @@ def test_retry_parameters(caplog: pytest.LogCaptureFixture) -> None:
mistral = ChatMistralAI( mistral = ChatMistralAI(
timeout=1, # Very short timeout to trigger timeouts timeout=1, # Very short timeout to trigger timeouts
max_retries=3, # Should retry 3 times max_retries=3, # Should retry 3 times
rate_limiter=rate_limiter,
) )
# Simple test input that should take longer than 1 second to process # Simple test input that should take longer than 1 second to process
@@ -148,7 +150,7 @@ def test_retry_parameters(caplog: pytest.LogCaptureFixture) -> None:
def test_reasoning() -> None: def test_reasoning() -> None:
model = ChatMistralAI(model="magistral-medium-latest") # type: ignore[call-arg] model = ChatMistralAI(model="magistral-medium-latest", rate_limiter=rate_limiter) # type: ignore[call-arg]
input_message = { input_message = {
"role": "user", "role": "user",
"content": "Hello, my name is Bob.", "content": "Hello, my name is Bob.",
@@ -172,7 +174,11 @@ def test_reasoning() -> None:
def test_reasoning_v1() -> None: def test_reasoning_v1() -> None:
model = ChatMistralAI(model="magistral-medium-latest", output_version="v1") # type: ignore[call-arg] model = ChatMistralAI( # type: ignore[call-arg]
model="magistral-medium-latest",
output_version="v1",
rate_limiter=rate_limiter,
)
input_message = { input_message = {
"role": "user", "role": "user",
"content": "Hello, my name is Bob.", "content": "Hello, my name is Bob.",

View File

@@ -7,6 +7,7 @@ from langchain_tests.integration_tests import ( # type: ignore[import-not-found
) )
from langchain_mistralai import ChatMistralAI from langchain_mistralai import ChatMistralAI
from tests.integration_tests._rate_limiter import rate_limiter
class TestMistralStandard(ChatModelIntegrationTests): class TestMistralStandard(ChatModelIntegrationTests):
@@ -16,7 +17,11 @@ class TestMistralStandard(ChatModelIntegrationTests):
@property @property
def chat_model_params(self) -> dict: def chat_model_params(self) -> dict:
return {"model": "mistral-large-latest", "temperature": 0} return {
"model": "mistral-large-latest",
"temperature": 0,
"rate_limiter": rate_limiter,
}
@property @property
def supports_json_mode(self) -> bool: def supports_json_mode(self) -> bool:

View File

@@ -454,6 +454,7 @@ test = [
{ name = "langchain-tests" }, { name = "langchain-tests" },
{ name = "pytest" }, { name = "pytest" },
{ name = "pytest-asyncio" }, { name = "pytest-asyncio" },
{ name = "pytest-retry" },
{ name = "pytest-watcher" }, { name = "pytest-watcher" },
{ name = "pytest-xdist" }, { name = "pytest-xdist" },
] ]
@@ -479,6 +480,7 @@ test = [
{ name = "langchain-tests", editable = "../../standard-tests" }, { name = "langchain-tests", editable = "../../standard-tests" },
{ name = "pytest", specifier = ">=9.0.3,<10.0.0" }, { name = "pytest", specifier = ">=9.0.3,<10.0.0" },
{ name = "pytest-asyncio", specifier = ">=1.3.0,<2.0.0" }, { name = "pytest-asyncio", specifier = ">=1.3.0,<2.0.0" },
{ name = "pytest-retry", specifier = ">=1.7.0,<1.8.0" },
{ name = "pytest-watcher", specifier = ">=0.3.4,<1.0.0" }, { name = "pytest-watcher", specifier = ">=0.3.4,<1.0.0" },
{ name = "pytest-xdist", specifier = ">=3.6.1,<4.0.0" }, { name = "pytest-xdist", specifier = ">=3.6.1,<4.0.0" },
] ]
@@ -1137,6 +1139,18 @@ wheels = [
{ url = "https://files.pythonhosted.org/packages/42/c2/ce34735972cc42d912173e79f200fe66530225190c06655c5632a9d88f1e/pytest_recording-0.13.4-py3-none-any.whl", hash = "sha256:ad49a434b51b1c4f78e85b1e6b74fdcc2a0a581ca16e52c798c6ace971f7f439", size = 13723, upload-time = "2025-05-08T10:41:09.684Z" }, { url = "https://files.pythonhosted.org/packages/42/c2/ce34735972cc42d912173e79f200fe66530225190c06655c5632a9d88f1e/pytest_recording-0.13.4-py3-none-any.whl", hash = "sha256:ad49a434b51b1c4f78e85b1e6b74fdcc2a0a581ca16e52c798c6ace971f7f439", size = 13723, upload-time = "2025-05-08T10:41:09.684Z" },
] ]
[[package]]
name = "pytest-retry"
version = "1.7.0"
source = { registry = "https://pypi.org/simple" }
dependencies = [
{ name = "pytest" },
]
sdist = { url = "https://files.pythonhosted.org/packages/c5/5b/607b017994cca28de3a1ad22a3eee8418e5d428dcd8ec25b26b18e995a73/pytest_retry-1.7.0.tar.gz", hash = "sha256:f8d52339f01e949df47c11ba9ee8d5b362f5824dff580d3870ec9ae0057df80f", size = 19977, upload-time = "2025-01-19T01:56:13.115Z" }
wheels = [
{ url = "https://files.pythonhosted.org/packages/7c/ff/3266c8a73b9b93c4b14160a7e2b31d1e1088e28ed29f4c2d93ae34093bfd/pytest_retry-1.7.0-py3-none-any.whl", hash = "sha256:a2dac85b79a4e2375943f1429479c65beb6c69553e7dae6b8332be47a60954f4", size = 13775, upload-time = "2025-01-19T01:56:11.199Z" },
]
[[package]] [[package]]
name = "pytest-socket" name = "pytest-socket"
version = "0.7.0" version = "0.7.0"