mirror of
https://github.com/csunny/DB-GPT.git
synced 2025-09-11 05:49:22 +00:00
feature:url,csv embedding
This commit is contained in:
13
examples/knowledge_embedding/csv_embedding_test.py
Normal file
13
examples/knowledge_embedding/csv_embedding_test.py
Normal file
@@ -0,0 +1,13 @@
|
||||
|
||||
|
||||
from pilot.source_embedding.csv_embedding import CSVEmbedding
|
||||
|
||||
# path = "/Users/chenketing/Downloads/share_ireserve双写数据异常2.xlsx"
|
||||
# Example script: embed a local CSV file and store the result in a vector store.
# The paths below are machine-specific; adjust them before running.

# CSV file whose contents will be embedded.
path = "/Users/chenketing/Downloads/vectors.csv"
# Value handed to CSVEmbedding as the embedding model (a local model directory).
model_name = "/Users/chenketing/Desktop/project/all-MiniLM-L6-v2"
# Location handed to the vector store configuration.
vector_store_path = "/pilot/source_embedding/"

csv_embedding = CSVEmbedding(
    file_path=path,
    model_name=model_name,
    vector_store_config={
        # NOTE(review): the store name "url" looks copied from the URL example;
        # confirm whether the CSV example should use its own store name.
        "vector_store_name": "url",
        # Pass the variable defined above, not the literal text
        # "vector_store_path", so the configured location is actually used.
        "vector_store_path": vector_store_path,
    },
)
csv_embedding.source_embedding()
print("success")
|
10
examples/knowledge_embedding/url_embedding_test.py
Normal file
10
examples/knowledge_embedding/url_embedding_test.py
Normal file
@@ -0,0 +1,10 @@
|
||||
from pilot.source_embedding.url_embedding import URLEmbedding

# Example script: embed the content behind a URL and store the result in a
# vector store. The local paths below are machine-specific; adjust them before
# running.

# Web page whose content will be embedded (passed through the file_path argument).
path = "https://www.understandingwar.org/backgrounder/russian-offensive-campaign-assessment-february-8-2023"
# Value handed to URLEmbedding as the embedding model (a local model directory).
model_name = "/Users/chenketing/Desktop/project/all-MiniLM-L6-v2"
# Location handed to the vector store configuration.
vector_store_path = "/pilot/source_embedding/"

url_embedding = URLEmbedding(
    file_path=path,
    model_name=model_name,
    vector_store_config={
        "vector_store_name": "url",
        # Pass the variable defined above, not the literal text
        # "vector_store_path", so the configured location is actually used.
        "vector_store_path": vector_store_path,
    },
)
url_embedding.source_embedding()
print("success")
|
Reference in New Issue
Block a user