From efa67ed0efbbdaadf954e2181cc99f4537f32e21 Mon Sep 17 00:00:00 2001 From: Wilson Leao Neto Date: Wed, 19 Jul 2023 03:46:23 +0200 Subject: [PATCH] fix #7782: check title and excerpt separately for page_content (#7783) - Description: check title and excerpt separately for page_content so that if title is empty but excerpt is present, the page_content will only contain the excerpt - Issue: #7782 - Tag maintainer: @3coins @baskaryan - Twitter handle: wilsonleao --- langchain/retrievers/kendra.py | 9 ++++++--- 1 file changed, 6 insertions(+), 3 deletions(-) diff --git a/langchain/retrievers/kendra.py b/langchain/retrievers/kendra.py index 2ceeb1d0fcd..64fab753295 100644 --- a/langchain/retrievers/kendra.py +++ b/langchain/retrievers/kendra.py @@ -38,9 +38,12 @@ def combined_text(title: str, excerpt: str) -> str: The combined text. """ - if not title or not excerpt: - return "" - return f"Document Title: {title} \nDocument Excerpt: \n{excerpt}\n" + text = "" + if title: + text += f"Document Title: {title}\n" + if excerpt: + text += f"Document Excerpt: \n{excerpt}\n" + return text class Highlight(BaseModel, extra=Extra.allow):