mirror of
https://github.com/hwchase17/langchain.git
synced 2026-02-03 15:55:44 +00:00
Compare commits
3 Commits
langchain-
...
bagatur/us
| Author | SHA1 | Date | |
|---|---|---|---|
|
|
87d8012ef6 | ||
|
|
47b386d28f | ||
|
|
22863b8ac3 |
@@ -2,7 +2,7 @@ import json
|
||||
import operator
|
||||
from typing import Any, Literal, Optional, Union, cast
|
||||
|
||||
from pydantic import model_validator
|
||||
from pydantic import BaseModel, model_validator
|
||||
from typing_extensions import NotRequired, Self, TypedDict
|
||||
|
||||
from langchain_core.messages.base import (
|
||||
@@ -163,6 +163,8 @@ class AIMessage(BaseMessage):
|
||||
|
||||
This is a standard representation of token usage that is consistent across models.
|
||||
"""
|
||||
parsed: Optional[Union[dict, BaseModel]] = None
|
||||
"""The auto-parsed message contents."""
|
||||
|
||||
type: Literal["ai"] = "ai"
|
||||
"""The type of the message (used for deserialization). Defaults to "ai"."""
|
||||
@@ -440,11 +442,20 @@ def add_ai_message_chunks(
|
||||
else:
|
||||
usage_metadata = None
|
||||
|
||||
# 'parsed' always represents an aggregation not an incremental value, so the last
|
||||
# non-null value is kept.
|
||||
parsed = None
|
||||
for m in reversed([left, *others]):
|
||||
if m.parsed is not None:
|
||||
parsed = m.parsed
|
||||
break
|
||||
|
||||
return left.__class__(
|
||||
example=left.example,
|
||||
content=content,
|
||||
additional_kwargs=additional_kwargs,
|
||||
tool_call_chunks=tool_call_chunks,
|
||||
parsed=parsed,
|
||||
response_metadata=response_metadata,
|
||||
usage_metadata=usage_metadata,
|
||||
id=left.id,
|
||||
|
||||
@@ -9,6 +9,7 @@ from typing import (
|
||||
Optional,
|
||||
TypeVar,
|
||||
Union,
|
||||
cast,
|
||||
)
|
||||
|
||||
from typing_extensions import override
|
||||
@@ -65,6 +66,8 @@ class BaseGenerationOutputParser(
|
||||
):
|
||||
"""Base class to parse the output of an LLM call."""
|
||||
|
||||
return_message: bool = False
|
||||
|
||||
@property
|
||||
@override
|
||||
def InputType(self) -> Any:
|
||||
@@ -75,9 +78,12 @@ class BaseGenerationOutputParser(
|
||||
@override
|
||||
def OutputType(self) -> type[T]:
|
||||
"""Return the output type for the parser."""
|
||||
# even though mypy complains this isn't valid,
|
||||
# it is good enough for pydantic to build the schema from
|
||||
return T # type: ignore[misc]
|
||||
if self.return_message:
|
||||
return cast(type[T], AnyMessage)
|
||||
else:
|
||||
# even though mypy complains this isn't valid,
|
||||
# it is good enough for pydantic to build the schema from
|
||||
return T # type: ignore[misc]
|
||||
|
||||
def invoke(
|
||||
self,
|
||||
@@ -86,7 +92,7 @@ class BaseGenerationOutputParser(
|
||||
**kwargs: Any,
|
||||
) -> T:
|
||||
if isinstance(input, BaseMessage):
|
||||
return self._call_with_config(
|
||||
parsed = self._call_with_config(
|
||||
lambda inner_input: self.parse_result(
|
||||
[ChatGeneration(message=inner_input)]
|
||||
),
|
||||
@@ -94,6 +100,10 @@ class BaseGenerationOutputParser(
|
||||
config,
|
||||
run_type="parser",
|
||||
)
|
||||
if self.return_message:
|
||||
return cast(T, input.model_copy(update={"parsed": parsed}))
|
||||
else:
|
||||
return parsed
|
||||
else:
|
||||
return self._call_with_config(
|
||||
lambda inner_input: self.parse_result([Generation(text=inner_input)]),
|
||||
@@ -109,7 +119,7 @@ class BaseGenerationOutputParser(
|
||||
**kwargs: Optional[Any],
|
||||
) -> T:
|
||||
if isinstance(input, BaseMessage):
|
||||
return await self._acall_with_config(
|
||||
parsed = await self._acall_with_config(
|
||||
lambda inner_input: self.aparse_result(
|
||||
[ChatGeneration(message=inner_input)]
|
||||
),
|
||||
@@ -117,6 +127,10 @@ class BaseGenerationOutputParser(
|
||||
config,
|
||||
run_type="parser",
|
||||
)
|
||||
if self.return_message:
|
||||
return cast(T, input.model_copy(update={"parsed": parsed}))
|
||||
else:
|
||||
return parsed
|
||||
else:
|
||||
return await self._acall_with_config(
|
||||
lambda inner_input: self.aparse_result([Generation(text=inner_input)]),
|
||||
@@ -155,6 +169,8 @@ class BaseOutputParser(
|
||||
return "boolean_output_parser"
|
||||
""" # noqa: E501
|
||||
|
||||
return_message: bool = False
|
||||
|
||||
@property
|
||||
@override
|
||||
def InputType(self) -> Any:
|
||||
@@ -171,6 +187,9 @@ class BaseOutputParser(
|
||||
Raises:
|
||||
TypeError: If the class doesn't have an inferable OutputType.
|
||||
"""
|
||||
if self.return_message:
|
||||
return cast(type[T], AnyMessage)
|
||||
|
||||
for base in self.__class__.mro():
|
||||
if hasattr(base, "__pydantic_generic_metadata__"):
|
||||
metadata = base.__pydantic_generic_metadata__
|
||||
@@ -190,7 +209,7 @@ class BaseOutputParser(
|
||||
**kwargs: Any,
|
||||
) -> T:
|
||||
if isinstance(input, BaseMessage):
|
||||
return self._call_with_config(
|
||||
parsed = self._call_with_config(
|
||||
lambda inner_input: self.parse_result(
|
||||
[ChatGeneration(message=inner_input)]
|
||||
),
|
||||
@@ -198,6 +217,10 @@ class BaseOutputParser(
|
||||
config,
|
||||
run_type="parser",
|
||||
)
|
||||
if self.return_message:
|
||||
return cast(T, input.model_copy(update={"parsed": parsed}))
|
||||
else:
|
||||
return parsed
|
||||
else:
|
||||
return self._call_with_config(
|
||||
lambda inner_input: self.parse_result([Generation(text=inner_input)]),
|
||||
@@ -213,7 +236,7 @@ class BaseOutputParser(
|
||||
**kwargs: Optional[Any],
|
||||
) -> T:
|
||||
if isinstance(input, BaseMessage):
|
||||
return await self._acall_with_config(
|
||||
parsed = await self._acall_with_config(
|
||||
lambda inner_input: self.aparse_result(
|
||||
[ChatGeneration(message=inner_input)]
|
||||
),
|
||||
@@ -221,6 +244,10 @@ class BaseOutputParser(
|
||||
config,
|
||||
run_type="parser",
|
||||
)
|
||||
if self.return_message:
|
||||
return cast(T, input.model_copy(update={"parsed": parsed}))
|
||||
else:
|
||||
return parsed
|
||||
else:
|
||||
return await self._acall_with_config(
|
||||
lambda inner_input: self.aparse_result([Generation(text=inner_input)]),
|
||||
|
||||
@@ -77,6 +77,21 @@
|
||||
'default': None,
|
||||
'title': 'Name',
|
||||
}),
|
||||
'parsed': dict({
|
||||
'anyOf': list([
|
||||
dict({
|
||||
'type': 'object',
|
||||
}),
|
||||
dict({
|
||||
'$ref': '#/$defs/BaseModel',
|
||||
}),
|
||||
dict({
|
||||
'type': 'null',
|
||||
}),
|
||||
]),
|
||||
'default': None,
|
||||
'title': 'Parsed',
|
||||
}),
|
||||
'response_metadata': dict({
|
||||
'title': 'Response Metadata',
|
||||
'type': 'object',
|
||||
@@ -181,6 +196,21 @@
|
||||
'default': None,
|
||||
'title': 'Name',
|
||||
}),
|
||||
'parsed': dict({
|
||||
'anyOf': list([
|
||||
dict({
|
||||
'type': 'object',
|
||||
}),
|
||||
dict({
|
||||
'$ref': '#/$defs/BaseModel',
|
||||
}),
|
||||
dict({
|
||||
'type': 'null',
|
||||
}),
|
||||
]),
|
||||
'default': None,
|
||||
'title': 'Parsed',
|
||||
}),
|
||||
'response_metadata': dict({
|
||||
'title': 'Response Metadata',
|
||||
'type': 'object',
|
||||
@@ -227,6 +257,12 @@
|
||||
'title': 'AIMessageChunk',
|
||||
'type': 'object',
|
||||
}),
|
||||
'BaseModel': dict({
|
||||
'properties': dict({
|
||||
}),
|
||||
'title': 'BaseModel',
|
||||
'type': 'object',
|
||||
}),
|
||||
'ChatMessage': dict({
|
||||
'additionalProperties': True,
|
||||
'description': 'Message that can be assigned an arbitrary speaker (i.e. role).',
|
||||
@@ -1507,6 +1543,21 @@
|
||||
'default': None,
|
||||
'title': 'Name',
|
||||
}),
|
||||
'parsed': dict({
|
||||
'anyOf': list([
|
||||
dict({
|
||||
'type': 'object',
|
||||
}),
|
||||
dict({
|
||||
'$ref': '#/$defs/BaseModel',
|
||||
}),
|
||||
dict({
|
||||
'type': 'null',
|
||||
}),
|
||||
]),
|
||||
'default': None,
|
||||
'title': 'Parsed',
|
||||
}),
|
||||
'response_metadata': dict({
|
||||
'title': 'Response Metadata',
|
||||
'type': 'object',
|
||||
@@ -1611,6 +1662,21 @@
|
||||
'default': None,
|
||||
'title': 'Name',
|
||||
}),
|
||||
'parsed': dict({
|
||||
'anyOf': list([
|
||||
dict({
|
||||
'type': 'object',
|
||||
}),
|
||||
dict({
|
||||
'$ref': '#/$defs/BaseModel',
|
||||
}),
|
||||
dict({
|
||||
'type': 'null',
|
||||
}),
|
||||
]),
|
||||
'default': None,
|
||||
'title': 'Parsed',
|
||||
}),
|
||||
'response_metadata': dict({
|
||||
'title': 'Response Metadata',
|
||||
'type': 'object',
|
||||
@@ -1657,6 +1723,12 @@
|
||||
'title': 'AIMessageChunk',
|
||||
'type': 'object',
|
||||
}),
|
||||
'BaseModel': dict({
|
||||
'properties': dict({
|
||||
}),
|
||||
'title': 'BaseModel',
|
||||
'type': 'object',
|
||||
}),
|
||||
'ChatMessage': dict({
|
||||
'additionalProperties': True,
|
||||
'description': 'Message that can be assigned an arbitrary speaker (i.e. role).',
|
||||
|
||||
@@ -451,6 +451,21 @@
|
||||
'default': None,
|
||||
'title': 'Name',
|
||||
}),
|
||||
'parsed': dict({
|
||||
'anyOf': list([
|
||||
dict({
|
||||
'type': 'object',
|
||||
}),
|
||||
dict({
|
||||
'$ref': '#/$defs/BaseModel',
|
||||
}),
|
||||
dict({
|
||||
'type': 'null',
|
||||
}),
|
||||
]),
|
||||
'default': None,
|
||||
'title': 'Parsed',
|
||||
}),
|
||||
'response_metadata': dict({
|
||||
'title': 'Response Metadata',
|
||||
'type': 'object',
|
||||
@@ -555,6 +570,21 @@
|
||||
'default': None,
|
||||
'title': 'Name',
|
||||
}),
|
||||
'parsed': dict({
|
||||
'anyOf': list([
|
||||
dict({
|
||||
'type': 'object',
|
||||
}),
|
||||
dict({
|
||||
'$ref': '#/$defs/BaseModel',
|
||||
}),
|
||||
dict({
|
||||
'type': 'null',
|
||||
}),
|
||||
]),
|
||||
'default': None,
|
||||
'title': 'Parsed',
|
||||
}),
|
||||
'response_metadata': dict({
|
||||
'title': 'Response Metadata',
|
||||
'type': 'object',
|
||||
@@ -601,6 +631,12 @@
|
||||
'title': 'AIMessageChunk',
|
||||
'type': 'object',
|
||||
}),
|
||||
'BaseModel': dict({
|
||||
'properties': dict({
|
||||
}),
|
||||
'title': 'BaseModel',
|
||||
'type': 'object',
|
||||
}),
|
||||
'ChatMessage': dict({
|
||||
'additionalProperties': True,
|
||||
'description': 'Message that can be assigned an arbitrary speaker (i.e. role).',
|
||||
|
||||
@@ -10,7 +10,6 @@ import sys
|
||||
import warnings
|
||||
from io import BytesIO
|
||||
from math import ceil
|
||||
from operator import itemgetter
|
||||
from typing import (
|
||||
Any,
|
||||
AsyncIterator,
|
||||
@@ -85,11 +84,7 @@ from langchain_core.utils.function_calling import (
|
||||
convert_to_openai_function,
|
||||
convert_to_openai_tool,
|
||||
)
|
||||
from langchain_core.utils.pydantic import (
|
||||
PydanticBaseModel,
|
||||
TypeBaseModel,
|
||||
is_basemodel_subclass,
|
||||
)
|
||||
from langchain_core.utils.pydantic import TypeBaseModel, is_basemodel_subclass
|
||||
from langchain_core.utils.utils import _build_model_kwargs, from_env, secret_from_env
|
||||
from pydantic import BaseModel, ConfigDict, Field, SecretStr, model_validator
|
||||
from typing_extensions import Self
|
||||
@@ -777,6 +772,8 @@ class BaseChatOpenAI(BaseChatModel):
|
||||
):
|
||||
message = response.choices[0].message # type: ignore[attr-defined]
|
||||
if hasattr(message, "parsed"):
|
||||
cast(AIMessage, generations[0].message).parsed = message.parsed
|
||||
# For backwards compatibility.
|
||||
generations[0].message.additional_kwargs["parsed"] = message.parsed
|
||||
if hasattr(message, "refusal"):
|
||||
generations[0].message.additional_kwargs["refusal"] = message.refusal
|
||||
@@ -1472,17 +1469,18 @@ class BaseChatOpenAI(BaseChatModel):
|
||||
output_parser: Runnable = PydanticToolsParser(
|
||||
tools=[schema], # type: ignore[list-item]
|
||||
first_tool_only=True, # type: ignore[list-item]
|
||||
return_message=True,
|
||||
)
|
||||
else:
|
||||
output_parser = JsonOutputKeyToolsParser(
|
||||
key_name=tool_name, first_tool_only=True
|
||||
key_name=tool_name, first_tool_only=True, return_message=True
|
||||
)
|
||||
elif method == "json_mode":
|
||||
llm = self.bind(response_format={"type": "json_object"})
|
||||
output_parser = (
|
||||
PydanticOutputParser(pydantic_object=schema) # type: ignore[arg-type]
|
||||
PydanticOutputParser(pydantic_object=schema, return_message=True) # type: ignore[arg-type]
|
||||
if is_pydantic_schema
|
||||
else JsonOutputParser()
|
||||
else JsonOutputParser(return_message=True)
|
||||
)
|
||||
elif method == "json_schema":
|
||||
if schema is None:
|
||||
@@ -1494,10 +1492,10 @@ class BaseChatOpenAI(BaseChatModel):
|
||||
llm = self.bind(response_format=response_format)
|
||||
if is_pydantic_schema:
|
||||
output_parser = _oai_structured_outputs_parser.with_types(
|
||||
output_type=cast(type, schema)
|
||||
output_type=AIMessage
|
||||
)
|
||||
else:
|
||||
output_parser = JsonOutputParser()
|
||||
output_parser = JsonOutputParser(return_message=True)
|
||||
else:
|
||||
raise ValueError(
|
||||
f"Unrecognized method argument. Expected one of 'function_calling' or "
|
||||
@@ -1505,8 +1503,8 @@ class BaseChatOpenAI(BaseChatModel):
|
||||
)
|
||||
|
||||
if include_raw:
|
||||
parser_assign = RunnablePassthrough.assign(
|
||||
parsed=itemgetter("raw") | output_parser, parsing_error=lambda _: None
|
||||
parser_assign = RunnablePassthrough.assign(raw=output_parser).assign(
|
||||
parsed=lambda x: x["raw"].parsed, parsing_error=lambda _: None
|
||||
)
|
||||
parser_none = RunnablePassthrough.assign(parsed=lambda _: None)
|
||||
parser_with_fallback = parser_assign.with_fallbacks(
|
||||
@@ -2229,15 +2227,15 @@ def _convert_to_openai_response_format(
|
||||
|
||||
|
||||
@chain
|
||||
def _oai_structured_outputs_parser(ai_msg: AIMessage) -> PydanticBaseModel:
|
||||
if ai_msg.additional_kwargs.get("parsed"):
|
||||
return ai_msg.additional_kwargs["parsed"]
|
||||
def _oai_structured_outputs_parser(ai_msg: AIMessage) -> AIMessage:
|
||||
if ai_msg.parsed is not None:
|
||||
return ai_msg
|
||||
elif ai_msg.additional_kwargs.get("refusal"):
|
||||
raise OpenAIRefusalError(ai_msg.additional_kwargs["refusal"])
|
||||
else:
|
||||
raise ValueError(
|
||||
"Structured Output response does not have a 'parsed' field nor a 'refusal' "
|
||||
"field. Received message:\n\n{ai_msg}"
|
||||
f"field. Received message:\n\n{ai_msg}"
|
||||
)
|
||||
|
||||
|
||||
|
||||
Reference in New Issue
Block a user