DOCS: format notebooks (#13371)

This commit is contained in:
Bagatur
2023-11-14 14:17:44 -08:00
committed by GitHub
parent d63d4994c0
commit 3596be5210
455 changed files with 3168 additions and 3136 deletions

View File

@@ -92,8 +92,9 @@
"metadata": {},
"outputs": [],
"source": [
"from pydantic import BaseModel\n",
"from typing import Any\n",
"\n",
"from pydantic import BaseModel\n",
"from unstructured.partition.pdf import partition_pdf\n",
"\n",
"# Get elements\n",
@@ -336,8 +337,8 @@
"metadata": {},
"outputs": [],
"source": [
"import os\n",
"import glob\n",
"import os\n",
"\n",
"# Get all .txt file summaries\n",
"file_paths = glob.glob(os.path.expanduser(os.path.join(path, \"*.txt\")))\n",
@@ -371,11 +372,12 @@
"outputs": [],
"source": [
"import uuid\n",
"from langchain.vectorstores import Chroma\n",
"from langchain.storage import InMemoryStore\n",
"from langchain.schema.document import Document\n",
"\n",
"from langchain.embeddings import OpenAIEmbeddings\n",
"from langchain.retrievers.multi_vector import MultiVectorRetriever\n",
"from langchain.schema.document import Document\n",
"from langchain.storage import InMemoryStore\n",
"from langchain.vectorstores import Chroma\n",
"\n",
"# The vectorstore to use to index the child chunks\n",
"vectorstore = Chroma(collection_name=\"summaries\", embedding_function=OpenAIEmbeddings())\n",