mirror of
https://github.com/hwchase17/langchain.git
synced 2025-05-14 11:33:00 +00:00
Fixes for Eden AI Custom tools and ChatEdenAI: - add missing import in __init__ of chat_models - add `args_schema` to custom tools. otherwise '__arg1' would sometimes be passed to the `run` method - fix IndexError when no human msg is added in ChatEdenAI
79 lines
2.4 KiB
Python
79 lines
2.4 KiB
Python
from __future__ import annotations
|
|
|
|
import logging
|
|
from typing import Optional, Type
|
|
|
|
from langchain_core.callbacks import CallbackManagerForToolRun
|
|
from langchain_core.pydantic_v1 import BaseModel, Field, HttpUrl
|
|
|
|
from langchain_community.tools.edenai.edenai_base_tool import EdenaiTool
|
|
|
|
logger = logging.getLogger(__name__)
|
|
|
|
|
|
class InvoiceParsingInput(BaseModel):
|
|
query: HttpUrl = Field(description="url of the document to parse")
|
|
|
|
|
|
class EdenAiParsingInvoiceTool(EdenaiTool):
|
|
"""Tool that queries the Eden AI Invoice parsing API.
|
|
|
|
for api reference check edenai documentation:
|
|
https://docs.edenai.co/reference/ocr_invoice_parser_create.
|
|
|
|
To use, you should have
|
|
the environment variable ``EDENAI_API_KEY`` set with your API token.
|
|
You can find your token here: https://app.edenai.run/admin/account/settings
|
|
|
|
"""
|
|
|
|
name: str = "edenai_invoice_parsing"
|
|
description: str = (
|
|
"A wrapper around edenai Services invoice parsing. "
|
|
"""Useful for when you have to extract information from
|
|
an image it enables to take invoices
|
|
in a variety of formats and returns the data in contains
|
|
(items, prices, addresses, vendor name, etc.)
|
|
in a structured format to automate the invoice processing """
|
|
"Input should be the string url of the document to parse."
|
|
)
|
|
args_schema: Type[BaseModel] = InvoiceParsingInput
|
|
|
|
language: Optional[str] = None
|
|
"""
|
|
language of the image passed to the model.
|
|
"""
|
|
|
|
feature: str = "ocr"
|
|
subfeature: str = "invoice_parser"
|
|
|
|
def _parse_response(self, response: list) -> str:
|
|
formatted_list: list = []
|
|
|
|
if len(response) == 1:
|
|
self._parse_json_multilevel(
|
|
response[0]["extracted_data"][0], formatted_list
|
|
)
|
|
else:
|
|
for entry in response:
|
|
if entry.get("provider") == "eden-ai":
|
|
self._parse_json_multilevel(
|
|
entry["extracted_data"][0], formatted_list
|
|
)
|
|
|
|
return "\n".join(formatted_list)
|
|
|
|
def _run(
|
|
self,
|
|
query: str,
|
|
run_manager: Optional[CallbackManagerForToolRun] = None,
|
|
) -> str:
|
|
"""Use the tool."""
|
|
query_params = {
|
|
"file_url": query,
|
|
"language": self.language,
|
|
"attributes_as_list": False,
|
|
}
|
|
|
|
return self._call_eden_ai(query_params)
|