infra: add print rule to ruff (#16221)

Added `# noqa: T201` to existing print statements. These can be removed
gradually; the rule will prevent new prints from being introduced.
This commit is contained in:
Erick Friis
2024-02-09 16:13:30 -08:00
committed by GitHub
parent c07c0da01a
commit 3a2eb6e12b
246 changed files with 563 additions and 470 deletions

View File

@@ -17,7 +17,7 @@ def ingest_documents():
data_path = "data/"
doc = [os.path.join(data_path, file) for file in os.listdir(data_path)][0]
print("Parsing 10k filing doc for NIKE", doc)
print("Parsing 10k filing doc for NIKE", doc) # noqa: T201
text_splitter = RecursiveCharacterTextSplitter(
chunk_size=1500, chunk_overlap=100, add_start_index=True
@@ -25,7 +25,7 @@ def ingest_documents():
loader = UnstructuredFileLoader(doc, mode="single", strategy="fast")
chunks = loader.load_and_split(text_splitter)
print("Done preprocessing. Created", len(chunks), "chunks of the original pdf")
print("Done preprocessing. Created", len(chunks), "chunks of the original pdf") # noqa: T201
# Create vectorstore
embedder = HuggingFaceEmbeddings(model_name=EMBED_MODEL)