fix: ensure UTF-8 encoding when reading text files in ingestion helper

This commit is contained in:
Akshay Jalluri 2025-01-23 14:42:21 +05:30
parent b7ee43788d
commit b77f90e177

View File

@@ -89,7 +89,7 @@ class IngestionHelper:
) )
# Read as a plain text # Read as a plain text
string_reader = StringIterableReader() string_reader = StringIterableReader()
return string_reader.load_data([file_data.read_text()]) return string_reader.load_data([file_data.read_text(encoding="utf8")])
logger.debug("Specific reader found for extension=%s", extension) logger.debug("Specific reader found for extension=%s", extension)
documents = reader_cls().load_data(file_data) documents = reader_cls().load_data(file_data)