diff --git a/docs/extras/integrations/document_loaders/docugami.ipynb b/docs/extras/integrations/document_loaders/docugami.ipynb index d3f94a8d1ce..607cf2b145f 100644 --- a/docs/extras/integrations/document_loaders/docugami.ipynb +++ b/docs/extras/integrations/document_loaders/docugami.ipynb @@ -19,18 +19,10 @@ "metadata": { "tags": [] }, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Requirement already satisfied: lxml in /root/Source/github/docugami.langchain/libs/langchain/.venv/lib/python3.9/site-packages (4.9.3)\n" - ] - } - ], + "outputs": [], "source": [ "# You need the lxml package to use the DocugamiLoader\n", - "!poetry run pip install lxml" + "!poetry run pip install lxml --quiet" ] }, { diff --git a/libs/langchain/langchain/document_loaders/docugami.py b/libs/langchain/langchain/document_loaders/docugami.py index af2c95f57f9..cd05a9612d9 100644 --- a/libs/langchain/langchain/document_loaders/docugami.py +++ b/libs/langchain/langchain/document_loaders/docugami.py @@ -147,6 +147,7 @@ class DocugamiLoader(BaseLoader, BaseModel): metadata = { XPATH_KEY: _xpath_for_chunk(node), DOCUMENT_ID_KEY: document[DOCUMENT_ID_KEY], + DOCUMENT_NAME_KEY: document[DOCUMENT_NAME_KEY], DOCUMENT_SOURCE_KEY: document[DOCUMENT_NAME_KEY], STRUCTURE_KEY: node.attrib.get("structure", ""), TAG_KEY: re.sub(r"\{.*\}", "", node.tag),