feat(model-profiles): add text_inputs and text_outputs (#35084)

- Add `text_inputs` and `text_outputs` fields to `ModelProfile`
- Regenerate `_profiles.py` for all providers

## Why

models.dev data includes `'text'` as both an input and output modality,
but we didn't capture it.

models.dev broadly contains models without text input (Whisper/ASR) and
without text output (image generators, TTS).

Without this, downstream consumers can't filter on model text support
(e.g. preventing users from passing text input to an audio-only model).

---

We'd need to also run for Google, AWS and cut releases for all to
propagate
This commit is contained in:
Mason Daugherty
2026-02-09 14:50:09 -05:00
committed by GitHub
parent e8e47b083e
commit 4ca586b322
13 changed files with 624 additions and 60 deletions

View File

@@ -19,9 +19,25 @@ _PROFILES: dict[str, dict[str, Any]] = {
"devstral-medium-2507": {
"max_input_tokens": 128000,
"max_output_tokens": 128000,
"text_inputs": True,
"image_inputs": False,
"audio_inputs": False,
"video_inputs": False,
"text_outputs": True,
"image_outputs": False,
"audio_outputs": False,
"video_outputs": False,
"reasoning_output": False,
"tool_calling": True,
},
"mistral-large-2512": {
"max_input_tokens": 262144,
"max_output_tokens": 262144,
"text_inputs": True,
"image_inputs": True,
"audio_inputs": False,
"video_inputs": False,
"text_outputs": True,
"image_outputs": False,
"audio_outputs": False,
"video_outputs": False,
@@ -31,9 +47,11 @@ _PROFILES: dict[str, dict[str, Any]] = {
"open-mixtral-8x22b": {
"max_input_tokens": 64000,
"max_output_tokens": 64000,
"text_inputs": True,
"image_inputs": False,
"audio_inputs": False,
"video_inputs": False,
"text_outputs": True,
"image_outputs": False,
"audio_outputs": False,
"video_outputs": False,
@@ -43,9 +61,11 @@ _PROFILES: dict[str, dict[str, Any]] = {
"ministral-8b-latest": {
"max_input_tokens": 128000,
"max_output_tokens": 128000,
"text_inputs": True,
"image_inputs": False,
"audio_inputs": False,
"video_inputs": False,
"text_outputs": True,
"image_outputs": False,
"audio_outputs": False,
"video_outputs": False,
@@ -55,9 +75,39 @@ _PROFILES: dict[str, dict[str, Any]] = {
"pixtral-large-latest": {
"max_input_tokens": 128000,
"max_output_tokens": 128000,
"text_inputs": True,
"image_inputs": True,
"audio_inputs": False,
"video_inputs": False,
"text_outputs": True,
"image_outputs": False,
"audio_outputs": False,
"video_outputs": False,
"reasoning_output": False,
"tool_calling": True,
},
"mistral-small-2506": {
"max_input_tokens": 128000,
"max_output_tokens": 16384,
"text_inputs": True,
"image_inputs": True,
"audio_inputs": False,
"video_inputs": False,
"text_outputs": True,
"image_outputs": False,
"audio_outputs": False,
"video_outputs": False,
"reasoning_output": False,
"tool_calling": True,
},
"devstral-2512": {
"max_input_tokens": 262144,
"max_output_tokens": 262144,
"text_inputs": True,
"image_inputs": False,
"audio_inputs": False,
"video_inputs": False,
"text_outputs": True,
"image_outputs": False,
"audio_outputs": False,
"video_outputs": False,
@@ -67,9 +117,11 @@ _PROFILES: dict[str, dict[str, Any]] = {
"ministral-3b-latest": {
"max_input_tokens": 128000,
"max_output_tokens": 128000,
"text_inputs": True,
"image_inputs": False,
"audio_inputs": False,
"video_inputs": False,
"text_outputs": True,
"image_outputs": False,
"audio_outputs": False,
"video_outputs": False,
@@ -79,9 +131,11 @@ _PROFILES: dict[str, dict[str, Any]] = {
"pixtral-12b": {
"max_input_tokens": 128000,
"max_output_tokens": 128000,
"text_inputs": True,
"image_inputs": True,
"audio_inputs": False,
"video_inputs": False,
"text_outputs": True,
"image_outputs": False,
"audio_outputs": False,
"video_outputs": False,
@@ -91,9 +145,39 @@ _PROFILES: dict[str, dict[str, Any]] = {
"mistral-medium-2505": {
"max_input_tokens": 131072,
"max_output_tokens": 131072,
"text_inputs": True,
"image_inputs": True,
"audio_inputs": False,
"video_inputs": False,
"text_outputs": True,
"image_outputs": False,
"audio_outputs": False,
"video_outputs": False,
"reasoning_output": False,
"tool_calling": True,
},
"labs-devstral-small-2512": {
"max_input_tokens": 256000,
"max_output_tokens": 256000,
"text_inputs": True,
"image_inputs": True,
"audio_inputs": False,
"video_inputs": False,
"text_outputs": True,
"image_outputs": False,
"audio_outputs": False,
"video_outputs": False,
"reasoning_output": False,
"tool_calling": True,
},
"devstral-medium-latest": {
"max_input_tokens": 262144,
"max_output_tokens": 262144,
"text_inputs": True,
"image_inputs": False,
"audio_inputs": False,
"video_inputs": False,
"text_outputs": True,
"image_outputs": False,
"audio_outputs": False,
"video_outputs": False,
@@ -103,9 +187,11 @@ _PROFILES: dict[str, dict[str, Any]] = {
"devstral-small-2505": {
"max_input_tokens": 128000,
"max_output_tokens": 128000,
"text_inputs": True,
"image_inputs": False,
"audio_inputs": False,
"video_inputs": False,
"text_outputs": True,
"image_outputs": False,
"audio_outputs": False,
"video_outputs": False,
@@ -115,21 +201,39 @@ _PROFILES: dict[str, dict[str, Any]] = {
"mistral-medium-2508": {
"max_input_tokens": 262144,
"max_output_tokens": 262144,
"text_inputs": True,
"image_inputs": True,
"audio_inputs": False,
"video_inputs": False,
"text_outputs": True,
"image_outputs": False,
"audio_outputs": False,
"video_outputs": False,
"reasoning_output": False,
"tool_calling": True,
},
"mistral-embed": {
"max_input_tokens": 8000,
"max_output_tokens": 3072,
"text_inputs": True,
"image_inputs": False,
"audio_inputs": False,
"video_inputs": False,
"text_outputs": True,
"image_outputs": False,
"audio_outputs": False,
"video_outputs": False,
"reasoning_output": False,
"tool_calling": False,
},
"mistral-small-latest": {
"max_input_tokens": 128000,
"max_output_tokens": 16384,
"text_inputs": True,
"image_inputs": True,
"audio_inputs": False,
"video_inputs": False,
"text_outputs": True,
"image_outputs": False,
"audio_outputs": False,
"video_outputs": False,
@@ -139,9 +243,11 @@ _PROFILES: dict[str, dict[str, Any]] = {
"magistral-small": {
"max_input_tokens": 128000,
"max_output_tokens": 128000,
"text_inputs": True,
"image_inputs": False,
"audio_inputs": False,
"video_inputs": False,
"text_outputs": True,
"image_outputs": False,
"audio_outputs": False,
"video_outputs": False,
@@ -151,9 +257,11 @@ _PROFILES: dict[str, dict[str, Any]] = {
"devstral-small-2507": {
"max_input_tokens": 128000,
"max_output_tokens": 128000,
"text_inputs": True,
"image_inputs": False,
"audio_inputs": False,
"video_inputs": False,
"text_outputs": True,
"image_outputs": False,
"audio_outputs": False,
"video_outputs": False,
@@ -163,9 +271,11 @@ _PROFILES: dict[str, dict[str, Any]] = {
"codestral-latest": {
"max_input_tokens": 256000,
"max_output_tokens": 4096,
"text_inputs": True,
"image_inputs": False,
"audio_inputs": False,
"video_inputs": False,
"text_outputs": True,
"image_outputs": False,
"audio_outputs": False,
"video_outputs": False,
@@ -175,9 +285,11 @@ _PROFILES: dict[str, dict[str, Any]] = {
"open-mixtral-8x7b": {
"max_input_tokens": 32000,
"max_output_tokens": 32000,
"text_inputs": True,
"image_inputs": False,
"audio_inputs": False,
"video_inputs": False,
"text_outputs": True,
"image_outputs": False,
"audio_outputs": False,
"video_outputs": False,
@@ -187,9 +299,11 @@ _PROFILES: dict[str, dict[str, Any]] = {
"mistral-nemo": {
"max_input_tokens": 128000,
"max_output_tokens": 128000,
"text_inputs": True,
"image_inputs": False,
"audio_inputs": False,
"video_inputs": False,
"text_outputs": True,
"image_outputs": False,
"audio_outputs": False,
"video_outputs": False,
@@ -199,9 +313,11 @@ _PROFILES: dict[str, dict[str, Any]] = {
"open-mistral-7b": {
"max_input_tokens": 8000,
"max_output_tokens": 8000,
"text_inputs": True,
"image_inputs": False,
"audio_inputs": False,
"video_inputs": False,
"text_outputs": True,
"image_outputs": False,
"audio_outputs": False,
"video_outputs": False,
@@ -209,11 +325,13 @@ _PROFILES: dict[str, dict[str, Any]] = {
"tool_calling": True,
},
"mistral-large-latest": {
"max_input_tokens": 131072,
"max_output_tokens": 16384,
"image_inputs": False,
"max_input_tokens": 262144,
"max_output_tokens": 262144,
"text_inputs": True,
"image_inputs": True,
"audio_inputs": False,
"video_inputs": False,
"text_outputs": True,
"image_outputs": False,
"audio_outputs": False,
"video_outputs": False,
@@ -223,9 +341,25 @@ _PROFILES: dict[str, dict[str, Any]] = {
"mistral-medium-latest": {
"max_input_tokens": 128000,
"max_output_tokens": 16384,
"text_inputs": True,
"image_inputs": True,
"audio_inputs": False,
"video_inputs": False,
"text_outputs": True,
"image_outputs": False,
"audio_outputs": False,
"video_outputs": False,
"reasoning_output": False,
"tool_calling": True,
},
"mistral-large-2411": {
"max_input_tokens": 131072,
"max_output_tokens": 16384,
"text_inputs": True,
"image_inputs": False,
"audio_inputs": False,
"video_inputs": False,
"text_outputs": True,
"image_outputs": False,
"audio_outputs": False,
"video_outputs": False,
@@ -235,9 +369,11 @@ _PROFILES: dict[str, dict[str, Any]] = {
"magistral-medium-latest": {
"max_input_tokens": 128000,
"max_output_tokens": 16384,
"text_inputs": True,
"image_inputs": False,
"audio_inputs": False,
"video_inputs": False,
"text_outputs": True,
"image_outputs": False,
"audio_outputs": False,
"video_outputs": False,