diff --git a/dbgpt/_version.py b/dbgpt/_version.py index c484a1d8b..f22beb48e 100644 --- a/dbgpt/_version.py +++ b/dbgpt/_version.py @@ -1 +1 @@ -version = "0.5.6" +version = "0.5.7" diff --git a/dbgpt/app/scene/chat_dashboard/data_loader.py b/dbgpt/app/scene/chat_dashboard/data_loader.py index 7d1724780..57c9e5bf2 100644 --- a/dbgpt/app/scene/chat_dashboard/data_loader.py +++ b/dbgpt/app/scene/chat_dashboard/data_loader.py @@ -1,7 +1,7 @@ +import datetime import logging from decimal import Decimal from typing import List -import datetime from dbgpt._private.config import Config from dbgpt.app.scene.chat_dashboard.data_preparation.report_schma import ValueItem diff --git a/dbgpt/rag/assembler/bm25.py b/dbgpt/rag/assembler/bm25.py index b20da1375..6cb710b0e 100644 --- a/dbgpt/rag/assembler/bm25.py +++ b/dbgpt/rag/assembler/bm25.py @@ -15,6 +15,7 @@ from ..retriever.bm25 import BM25Retriever class BM25Assembler(BaseAssembler): """BM25 Assembler. + refer https://www.elastic.co/guide/en/elasticsearch/reference/8.9/index- modules-similarity.html TF/IDF based similarity that has built-in tf normalization and is supposed to @@ -43,7 +44,7 @@ class BM25Assembler(BaseAssembler): def __init__( self, knowledge: Knowledge, - es_config: ElasticsearchVectorConfig = None, + es_config: ElasticsearchVectorConfig, k1: Optional[float] = 2.0, b: Optional[float] = 0.75, chunk_parameters: Optional[ChunkParameters] = None, @@ -122,7 +123,7 @@ class BM25Assembler(BaseAssembler): def load_from_knowledge( cls, knowledge: Knowledge, - es_config: ElasticsearchVectorConfig = None, + es_config: ElasticsearchVectorConfig, k1: Optional[float] = 2.0, b: Optional[float] = 0.75, chunk_parameters: Optional[ChunkParameters] = None, @@ -152,7 +153,7 @@ class BM25Assembler(BaseAssembler): async def aload_from_knowledge( cls, knowledge: Knowledge, - es_config: ElasticsearchVectorConfig = None, + es_config: ElasticsearchVectorConfig, k1: Optional[float] = 2.0, b: Optional[float] = 0.75, chunk_parameters: Optional[ChunkParameters] = None, diff --git a/dbgpt/rag/retriever/bm25.py b/dbgpt/rag/retriever/bm25.py index 244feb8f6..0ef717b9b 100644 --- a/dbgpt/rag/retriever/bm25.py +++ b/dbgpt/rag/retriever/bm25.py @@ -14,16 +14,17 @@ from dbgpt.util.executor_utils import blocking_func_to_async class BM25Retriever(BaseRetriever): """BM25 retriever. - refer https://www.elastic.co/guide/en/elasticsearch/reference/8.9/index- - modules-similarity.html + + refer https://www.elastic.co/guide/en/elasticsearch/reference/8.9/ + index-modules-similarity.html; TF/IDF based similarity that has built-in tf normalization and is supposed to work better for short fields (like names). See Okapi_BM25 for more details. - This similarity has the following options:""" + """ def __init__( self, top_k: int = 4, - es_index: str = None, + es_index: str = "dbgpt", es_client: Any = None, query_rewrite: Optional[QueryRewrite] = None, rerank: Optional[Ranker] = None, diff --git a/setup.py b/setup.py index 0ee8c9fa9..6e3666a78 100644 --- a/setup.py +++ b/setup.py @@ -19,7 +19,7 @@ with open("README.md", mode="r", encoding="utf-8") as fh: IS_DEV_MODE = os.getenv("IS_DEV_MODE", "true").lower() == "true" # If you modify the version, please modify the version in the following files: # dbgpt/_version.py -DB_GPT_VERSION = os.getenv("DB_GPT_VERSION", "0.5.6") +DB_GPT_VERSION = os.getenv("DB_GPT_VERSION", "0.5.7") BUILD_NO_CACHE = os.getenv("BUILD_NO_CACHE", "true").lower() == "true" LLAMA_CPP_GPU_ACCELERATION = (