mirror of
https://github.com/csunny/DB-GPT.git
synced 2025-09-06 03:20:41 +00:00
feat: Support llama.cpp
This commit is contained in:
121
setup.py
121
setup.py
@@ -1,6 +1,11 @@
|
||||
from typing import List
|
||||
from typing import List, Tuple
|
||||
|
||||
import setuptools
|
||||
import platform
|
||||
import subprocess
|
||||
import os
|
||||
from enum import Enum
|
||||
|
||||
from setuptools import find_packages
|
||||
|
||||
with open("README.md", "r") as fh:
|
||||
@@ -16,6 +21,117 @@ def parse_requirements(file_name: str) -> List[str]:
|
||||
]
|
||||
|
||||
|
||||
class SetupSpec:
    """Mutable holder for values gathered before ``setuptools.setup`` is called."""

    def __init__(self) -> None:
        # Extra name -> list of requirement strings; passed to setup() as
        # ``extras_require``.
        self.extras: dict = dict()
|
||||
|
||||
|
||||
setup_spec = SetupSpec()
|
||||
|
||||
|
||||
class AVXType(Enum):
    """CPU vector-instruction levels; the member value is used as a wheel tag."""

    BASIC = "basic"
    AVX = "AVX"
    AVX2 = "AVX2"
    AVX512 = "AVX512"

    @staticmethod
    def of_type(avx: str):
        """Return the member whose value matches ``avx``, or ``None``.

        Matching ignores case and surrounding whitespace, because the member
        values themselves mix cases ("basic" vs "AVX2") and the argument
        typically comes from an environment variable typed by a user.

        Args:
            avx: Candidate value such as ``"AVX2"`` or ``"avx2"``. ``None``
                (an unset environment variable) is accepted.

        Returns:
            The matching ``AVXType`` member, or ``None`` when nothing matches.
        """
        if not isinstance(avx, str):
            return None
        wanted = avx.strip().lower()
        for item in AVXType:
            if item.value.lower() == wanted:
                return item
        return None
|
||||
|
||||
|
||||
class OSType(Enum):
    """Operating-system families distinguished by this setup script."""

    WINDOWS = "win"
    LINUX = "linux"
    DARWIN = "darwin"
    # Anything that is not one of the three families above.
    OTHER = "other"
|
||||
|
||||
|
||||
def get_cpu_avx_support() -> Tuple[OSType, AVXType]:
    """Detect the host OS family and the AVX level to use.

    The ``DBGPT_LLAMA_CPP_AVX`` environment variable, when it names a valid
    ``AVXType``, always overrides detection. Otherwise a platform-specific
    tool is run (``coreinfo`` on Windows, ``lscpu`` on Linux, ``sysctl -a``
    on macOS) and its output is searched for "avx512" / "avx2".

    Returns:
        A ``(os_type, avx_type)`` tuple. ``avx_type`` falls back to
        ``AVXType.BASIC`` when the OS is unsupported, the probe tool cannot
        be run, or no AVX2/AVX512 marker is found.
    """
    env_cpu_avx = AVXType.of_type(os.getenv("DBGPT_LLAMA_CPP_AVX"))

    system = platform.system()
    if system == "Windows":
        os_type, cmds = OSType.WINDOWS, ["coreinfo"]
    elif system == "Linux":
        os_type, cmds = OSType.LINUX, ["lscpu"]
    elif system == "Darwin":
        os_type, cmds = OSType.DARWIN, ["sysctl", "-a"]
    else:
        print("Unsupported OS to get cpu avx, use default")
        return OSType.OTHER, env_cpu_avx if env_cpu_avx else AVXType.BASIC

    # The override wins regardless of what the probe would report, so do not
    # spawn (and possibly fail on) the probe tool at all.
    if env_cpu_avx:
        return os_type, env_cpu_avx

    try:
        result = subprocess.run(cmds, stdout=subprocess.PIPE, stderr=subprocess.PIPE)
    except OSError as e:
        # The probe tool is missing or not executable; installation should
        # still proceed with the most conservative choice.
        print(f"Failed to run {cmds[0]!r} to get cpu avx ({e}), use default")
        return os_type, AVXType.BASIC

    # Tool output is only scanned for ASCII markers, so undecodable bytes are
    # replaced instead of aborting the whole setup.
    output = result.stdout.decode(errors="replace").lower()
    if "avx512" in output:
        return os_type, AVXType.AVX512
    if "avx2" in output:
        return os_type, AVXType.AVX2
    # Plain AVX (without AVX2/AVX512) is deliberately treated as BASIC; the
    # original code had the AVXType.AVX assignment commented out.
    return os_type, AVXType.BASIC
|
||||
|
||||
|
||||
def get_cuda_version() -> "str | None":
    """Return the CUDA version reported by the installed torch, if any.

    Returns:
        The value of ``torch.version.cuda``, or ``None`` when torch cannot be
        imported or the attribute lookup fails.
    """
    try:
        import torch

        return torch.version.cuda
    except Exception:
        # Best effort by design: any failure to import or query torch simply
        # means "no CUDA information available", never a setup failure.
        return None
|
||||
|
||||
|
||||
def llama_cpp_python_cuda_requires():
    """Add a prebuilt CUDA llama-cpp-python wheel to the ``llama_cpp`` extra.

    Does nothing (beyond printing a notice) when no CUDA version is detected
    or when the OS is not Windows or Linux. Otherwise a direct-URL
    requirement for ``llama_cpp_python_cuda`` is appended to
    ``setup_spec.extras["llama_cpp"]``, creating that list if it does not
    exist yet.
    """
    cuda_version = get_cuda_version()
    if not cuda_version:
        print("CUDA not support, use cpu version")
        return

    # e.g. "11.7" -> "cu117", the device tag used in the wheel file name.
    device = "cu" + cuda_version.replace(".", "")

    os_type, cpu_avx = get_cpu_avx_support()
    supported_os = [OSType.WINDOWS, OSType.LINUX]
    if os_type not in supported_os:
        print(
            f"llama_cpp_python_cuda just support in os: {[r.value for r in supported_os]}"
        )
        return

    avx_tag = cpu_avx.value
    base_url = "https://github.com/jllllll/llama-cpp-python-cuBLAS-wheels/releases/download/textgen-webui"
    llama_cpp_version = "0.1.77"
    # NOTE(review): the interpreter tag is fixed to CPython 3.10 while
    # python_requires allows newer versions — confirm wheel availability
    # before deriving it from the running interpreter.
    py_version = "cp310"
    os_pkg_name = "linux_x86_64" if os_type == OSType.LINUX else "win_amd64"
    extra_index_url = f"{base_url}/llama_cpp_python_cuda-{llama_cpp_version}+{device}{avx_tag}-{py_version}-{py_version}-{os_pkg_name}.whl"
    print(f"Install llama_cpp_python_cuda from {extra_index_url}")

    # setdefault keeps this function usable even if the "llama_cpp" extra has
    # not been initialised by the caller yet.
    setup_spec.extras.setdefault("llama_cpp", []).append(
        f"llama_cpp_python_cuda @ {extra_index_url}"
    )
|
||||
|
||||
|
||||
def llama_cpp_requires():
    """Define the ``llama_cpp`` extra, then let the CUDA helper extend it."""
    base_packages = ["llama-cpp-python"]
    setup_spec.extras["llama_cpp"] = base_packages
    llama_cpp_python_cuda_requires()
|
||||
|
||||
|
||||
def all_requires():
    """Create the ``all`` extra as the de-duplicated union of every extra.

    Packages keep the order in which they are first seen across
    ``setup_spec.extras``, so the resulting list is the same on every run
    (a plain ``set`` would yield an order that varies with string hashing).
    """
    # dict.fromkeys de-duplicates while preserving insertion order; the
    # generator is fully consumed before "all" is written back.
    unique_pkgs = dict.fromkeys(
        pkg for pkgs in setup_spec.extras.values() for pkg in pkgs
    )
    setup_spec.extras["all"] = list(unique_pkgs)
|
||||
|
||||
|
||||
# Fill in the optional dependency groups; "all" must be computed last so it
# includes every extra registered before it.
llama_cpp_requires()
all_requires()
|
||||
|
||||
setuptools.setup(
|
||||
name="db-gpt",
|
||||
packages=find_packages(),
|
||||
@@ -27,9 +143,10 @@ setuptools.setup(
|
||||
long_description=long_description,
|
||||
long_description_content_type="text/markdown",
|
||||
install_requires=parse_requirements("requirements.txt"),
|
||||
url="https://github.com/csunny/DB-GPT",
|
||||
url="https://github.com/eosphoros-ai/DB-GPT",
|
||||
license="https://opensource.org/license/mit/",
|
||||
python_requires=">=3.10",
|
||||
extras_require=setup_spec.extras,
|
||||
entry_points={
|
||||
"console_scripts": [
|
||||
"dbgpt_server=pilot.server:webserver",
|
||||
|
Reference in New Issue
Block a user