diff --git a/libs/community/langchain_community/document_loaders/parsers/audio.py b/libs/community/langchain_community/document_loaders/parsers/audio.py index c8fa4c3ed39..9741a32f3de 100644 --- a/libs/community/langchain_community/document_loaders/parsers/audio.py +++ b/libs/community/langchain_community/document_loaders/parsers/audio.py @@ -129,7 +129,9 @@ class OpenAIWhisperParser(BaseBlobParser): continue yield Document( - page_content=transcript.text, + page_content=transcript.text + if not isinstance(transcript, str) + else transcript, metadata={"source": blob.source, "chunk": split_number}, )