chore(partners): standardize integration test invocation (#36958)

Standardize the `integration_tests` Makefile target across all 15
partner packages in `libs/partners/`, mirroring the deepagents
`libs/evals` pattern (`-v --tb=short`). Previously each partner had its
own ad-hoc flag stack (some missing `-n auto`, some with `-vvv`, others
with nothing), and every partner that used `-n auto` was emitting a
`PytestBenchmarkWarning` because `pytest-benchmark` is pulled in
transitively via `langchain-tests` even though no partner has benchmark
tests.
This commit is contained in:
Mason Daugherty
2026-04-22 17:28:04 -04:00
committed by GitHub
parent 4176a8cfbe
commit ec337534c5
15 changed files with 23 additions and 17 deletions

View File

@@ -27,7 +27,7 @@ test_watch:
# integration tests are run without the --disable-socket flag to allow network calls
integration_test:
-	OLLAMA_TEST_MODEL=$(OLLAMA_TEST_MODEL) OLLAMA_REASONING_TEST_MODEL=$(OLLAMA_REASONING_TEST_MODEL) uv run --group test --group test_integration pytest $(TEST_FILE)
+	OLLAMA_TEST_MODEL=$(OLLAMA_TEST_MODEL) OLLAMA_REASONING_TEST_MODEL=$(OLLAMA_REASONING_TEST_MODEL) uv run --group test --group test_integration pytest -v --tb=short -p no:benchmark -n auto $(TEST_FILE)
# CI integration tests - disabled until ollama service is configured in CI