fix: ensure UTF-8 encoding when reading text files in ingestion helper

This commit is contained in:
Akshay Jalluri 2025-01-23 14:42:21 +05:30
parent b7ee43788d
commit b77f90e177

View File

@@ -89,7 +89,7 @@ class IngestionHelper:
)
# Read as a plain text
string_reader = StringIterableReader()
-return string_reader.load_data([file_data.read_text()])
+return string_reader.load_data([file_data.read_text(encoding="utf8")])
logger.debug("Specific reader found for extension=%s", extension)
documents = reader_cls().load_data(file_data)