mirror of https://github.com/imartinez/privateGPT.git (synced 2025-09-04 00:35:22 +00:00)
Build & release image
.github/workflows/apolo-release.yml (new file, +32, vendored)
@@ -0,0 +1,32 @@
+name: CI
+
+on:
+  push:
+    branches: [master]
+    tags: ["v*"]
+  pull_request:
+    branches: [master]
+
+jobs:
+  release:
+    name: Release image
+    runs-on: ubuntu-latest
+    if: github.event_name == 'push' && startsWith(github.ref, 'refs/tags/v')
+    steps:
+      - name: Checkout commit
+        uses: actions/checkout@v4
+      - name: Login to ghcr.io
+        uses: docker/login-action@v3.1.0
+        with:
+          registry: ghcr.io
+          username: ${{ github.actor }}
+          password: ${{ github.token }}
+      - name: Build Docker image
+        run: make build-image
+      - name: Push image
+        run: |
+          export IMAGE_TAG=${GITHUB_REF#refs/tags/v}
+          make push-image
+
+          export IMAGE_TAG=latest
+          make push-image
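
The if: guard restricts the release job to tag pushes, and the shell expansion ${GITHUB_REF#refs/tags/v} strips the refs/tags/v prefix, so tagging v1.2.3 publishes image tag 1.2.3 and then re-publishes as latest. A minimal sketch of cutting a release under this workflow (the version number is illustrative):

    # a v-prefixed tag triggers the release job above
    git tag v0.1.0
    git push origin v0.1.0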
@@ -66,6 +66,7 @@ jobs:
     OLLAMA_API_BASE: http://${{ inspect_job('ollama').internal_hostname_named }}:11434
     POSTGRES_HOST: ${{ inspect_job('pgvector').internal_hostname_named }}
     VLLM_MODEL: stabilityai/StableBeluga-13B
+    VLLM_TOKENIZER: stabilityai/StableBeluga-13B
 
   vllm:
     image: vllm/vllm-openai:v0.4.0
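
Since vllm/vllm-openai serves an OpenAI-compatible API, one hedged way to confirm the job is serving the configured model is to query its models endpoint (this assumes vLLM's default port 8000 and local reachability; inside the flow the host would be the job's internal hostname):

    # should list stabilityai/StableBeluga-13B among the served models
    curl http://localhost:8000/v1/models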
Dockerfile
@@ -19,6 +19,8 @@ RUN poetry install --extras "$POETRY_EXTRAS"
 
 FROM base as app
 
+LABEL org.opencontainers.image.source = "https://github.com/neuro-inc/private-gpt"
+
 ENV PYTHONUNBUFFERED=1
 ENV PORT=8080
 EXPOSE 8080
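
The org.opencontainers.image.source label is what lets ghcr.io link the pushed image back to the neuro-inc/private-gpt repository. As a sanity-check sketch, the label can be read back from a locally built image (image name taken from the Makefile defaults below):

    # expected output: https://github.com/neuro-inc/private-gpt
    docker image inspect private-gpt:latest \
      --format '{{ index .Config.Labels "org.opencontainers.image.source" }}'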
Makefile (+14)
@@ -1,6 +1,11 @@
 # Any args passed to the make script, use with $(call args, default_value)
 args = `arg="$(filter-out $@,$(MAKECMDGOALS))" && echo $${arg:-${1}}`
 
+IMAGE_REPO ?= ghcr.io/neuro-inc
+IMAGE_NAME ?= private-gpt
+IMAGE_TAG ?= latest
+IMAGE_REF = $(IMAGE_REPO)/$(IMAGE_NAME):$(IMAGE_TAG)
+
 ########################################################################################################################
 # Quality checks
 ########################################################################################################################
@@ -76,3 +81,12 @@ list:
 	@echo " ingest : Ingest data using specified script"
 	@echo " wipe : Wipe data using specified script"
 	@echo " setup : Setup the application"
+
+.PHONY: build-image
+build-image:
+	docker build -t $(IMAGE_NAME):latest .
+
+.PHONY: push-image
+push-image:
+	docker tag $(IMAGE_NAME):latest $(IMAGE_REF)
+	docker push $(IMAGE_REF)
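
build-image always tags the local image private-gpt:latest, while push-image re-tags it with the overridable $(IMAGE_REPO)/$(IMAGE_NAME):$(IMAGE_TAG) reference before pushing; this split is how the CI job above publishes both a version tag and latest. Typical invocations (the version is illustrative):

    make build-image                  # docker build -t private-gpt:latest .
    IMAGE_TAG=0.1.0 make push-image   # pushes ghcr.io/neuro-inc/private-gpt:0.1.0
    make push-image                   # IMAGE_TAG defaults to latest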
@@ -4,14 +4,14 @@ server:
 
 llm:
   mode: openailike
-  tokenizer: ${VLLM_MODEL:lmsys/vicuna-7b-v1.5}
-  max_new_tokens: 5000
-  context_window: 2048
-  temperature: 0.1
+  tokenizer: ${VLLM_TOKENIZER:lmsys/vicuna-7b-v1.5}
+  max_new_tokens: ${VLLM_MAX_NEW_TOKENS:5000}
+  context_window: ${VLLM_CONTEXT_WINDOW:2048}
+  temperature: ${VLLM_TEMPERATURE:0.1}
 
 openai:
   api_base: ${VLLM_API_BASE:http://localhost:8000/v1}
-  api_key: EMPTY
+  api_key: ${VLLM_API_KEY:EMPTY}
   model: ${VLLM_MODEL:lmsys/vicuna-7b-v1.5}
 
 embedding:
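
PrivateGPT settings files expand ${ENV_VAR:default} at load time, so each of these values can now be overridden from the environment without editing the file. An illustrative override of the vLLM connection (hostnames and values are examples, not part of this commit):

    export VLLM_API_BASE=http://vllm.internal:8000/v1
    export VLLM_MODEL=stabilityai/StableBeluga-13B
    export VLLM_TOKENIZER=stabilityai/StableBeluga-13B
    export VLLM_CONTEXT_WINDOW=4096   # unset variables fall back to the defaults above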
@@ -21,8 +21,7 @@ embedding:
 
 ollama:
   # Note: if you change the embedding model, you'll need to use a dedicated DB for ingest storage
-  embedding_model: nomic-embed-text
-  # api_base: ${OLLAMA_API_BASE:http://localhost:11434}
+  embedding_model: ${OLLAMA_EMBEDDING_MODEL:nomic-embed-text}
   embedding_api_base: ${OLLAMA_API_BASE:http://localhost:11434}
   request_timeout: 300.0
 
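
With embedding_model parameterized, each deployment can pick its own Ollama embedding model; per the note above, switching models calls for a dedicated vector DB for the newly ingested data. A sketch of selecting a model per deployment (hostname illustrative):

    ollama pull nomic-embed-text            # ensure the model is present on the Ollama server
    export OLLAMA_EMBEDDING_MODEL=nomic-embed-text
    export OLLAMA_API_BASE=http://ollama.internal:11434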