diff --git a/.github/workflows/build_on_pr.yml b/.github/workflows/build_on_pr.yml index 1a7817ee0..926ac383b 100644 --- a/.github/workflows/build_on_pr.yml +++ b/.github/workflows/build_on_pr.yml @@ -34,7 +34,7 @@ jobs: anyExtensionFileChanged: ${{ steps.find-extension-change.outputs.any_changed }} changedLibraryFiles: ${{ steps.find-lib-change.outputs.all_changed_files }} anyLibraryFileChanged: ${{ steps.find-lib-change.outputs.any_changed }} - runs-on: [self-hosted,ubuntu-latest] + runs-on: [self-hosted, ubuntu-latest] concurrency: group: ${{ github.workflow }}-${{ github.event.pull_request.number || github.ref }}-detect-change cancel-in-progress: true @@ -87,7 +87,7 @@ jobs: name: Build and Test Colossal-AI needs: detect if: needs.detect.outputs.anyLibraryFileChanged == 'true' - runs-on: [self-hosted,ubuntu-latest] + runs-on: [self-hosted, ubuntu-latest] container: image: image-cloud.luchentech.com/hpcaitech/pytorch-cuda:2.2.2-12.1.0 options: --gpus all --shm-size=2g --rm -v /dev/shm -v /data/scratch:/data/scratch diff --git a/.github/workflows/build_on_schedule.yml b/.github/workflows/build_on_schedule.yml index 607013851..e71c8a84e 100644 --- a/.github/workflows/build_on_schedule.yml +++ b/.github/workflows/build_on_schedule.yml @@ -10,7 +10,7 @@ jobs: build: name: Build and Test Colossal-AI if: github.repository == 'hpcaitech/ColossalAI' - runs-on: [self-hosted, gpu] + runs-on: [self-hosted, ubuntu-latest] container: image: image-cloud.luchentech.com/hpcaitech/pytorch-cuda:2.2.2-12.1.0 options: --gpus all --rm -v /dev/shm -v /data/scratch/:/data/scratch/ diff --git a/.github/workflows/cuda_ext_check_before_merge.yml b/.github/workflows/cuda_ext_check_before_merge.yml index a12fbfd82..e21cd83f7 100644 --- a/.github/workflows/cuda_ext_check_before_merge.yml +++ b/.github/workflows/cuda_ext_check_before_merge.yml @@ -10,7 +10,7 @@ jobs: matrix_preparation: name: Prepare Container List if: github.repository == 'hpcaitech/ColossalAI' - runs-on: [self-hosted,ubuntu-latest] + runs-on: [self-hosted, ubuntu-latest] outputs: matrix: ${{ steps.set-matrix.outputs.matrix }} steps: diff --git a/.github/workflows/doc_check_on_pr.yml b/.github/workflows/doc_check_on_pr.yml index aabdd2942..3e988d1a7 100644 --- a/.github/workflows/doc_check_on_pr.yml +++ b/.github/workflows/doc_check_on_pr.yml @@ -15,7 +15,7 @@ jobs: if: | github.event.pull_request.draft == false && github.event.pull_request.base.repo.full_name == 'hpcaitech/ColossalAI' - runs-on: ubuntu-[self-hosted, ubuntu-latest] + runs-on: [self-hosted, ubuntu-latest] concurrency: group: ${{ github.workflow }}-${{ github.event.pull_request.number || github.ref }}-check-i18n cancel-in-progress: true diff --git a/.github/workflows/doc_test_on_pr.yml b/.github/workflows/doc_test_on_pr.yml index 03cac58e1..f030a1971 100644 --- a/.github/workflows/doc_test_on_pr.yml +++ b/.github/workflows/doc_test_on_pr.yml @@ -54,7 +54,7 @@ jobs: needs.detect-changed-doc.outputs.any_changed == 'true' name: Test the changed Doc needs: detect-changed-doc - runs-on: [self-hosted, gpu] + runs-on: [self-hosted, ubuntu-latest] container: image: image-cloud.luchentech.com/hpcaitech/pytorch-cuda:2.2.2-12.1.0 options: --gpus all --rm diff --git a/.github/workflows/doc_test_on_schedule.yml b/.github/workflows/doc_test_on_schedule.yml index 42ec8a9de..f6b9948b7 100644 --- a/.github/workflows/doc_test_on_schedule.yml +++ b/.github/workflows/doc_test_on_schedule.yml @@ -10,7 +10,7 @@ jobs: # Add this condition to avoid executing this job if the trigger event is workflow_dispatch. if: github.repository == 'hpcaitech/ColossalAI' name: Test the changed Doc - runs-on: [self-hosted, gpu] + runs-on: [self-hosted, ubuntu-latest] container: image: image-cloud.luchentech.com/hpcaitech/pytorch-cuda:2.2.2-12.1.0 options: --gpus all --rm diff --git a/.github/workflows/example_check_on_dispatch.yml b/.github/workflows/example_check_on_dispatch.yml index 43cd1469b..da80933bb 100644 --- a/.github/workflows/example_check_on_dispatch.yml +++ b/.github/workflows/example_check_on_dispatch.yml @@ -40,7 +40,7 @@ jobs: github.event.pull_request.base.repo.full_name == 'hpcaitech/ColossalAI' name: Manually check example files needs: manual_check_matrix_preparation - runs-on: [self-hosted, gpu] + runs-on: [self-hosted, ubuntu-latest] strategy: fail-fast: false matrix: ${{fromJson(needs.manual_check_matrix_preparation.outputs.matrix)}} diff --git a/.github/workflows/example_check_on_pr.yml b/.github/workflows/example_check_on_pr.yml index a840e1d98..2b66acf00 100644 --- a/.github/workflows/example_check_on_pr.yml +++ b/.github/workflows/example_check_on_pr.yml @@ -85,7 +85,7 @@ jobs: needs.detect-changed-example.outputs.anyChanged == 'true' name: Test the changed example needs: detect-changed-example - runs-on: [self-hosted, gpu] + runs-on: [self-hosted, ubuntu-latest] strategy: fail-fast: false matrix: ${{fromJson(needs.detect-changed-example.outputs.matrix)}} diff --git a/.github/workflows/example_check_on_schedule.yml b/.github/workflows/example_check_on_schedule.yml index cc17e9a30..c23f915af 100644 --- a/.github/workflows/example_check_on_schedule.yml +++ b/.github/workflows/example_check_on_schedule.yml @@ -10,7 +10,7 @@ jobs: matrix_preparation: if: github.repository == 'hpcaitech/ColossalAI' name: Prepare matrix for weekly check - runs-on: ubunt[self-hosted, ubuntu-latest]u-latest + runs-on: [self-hosted, ubuntu-latest] outputs: matrix: ${{ steps.setup-matrix.outputs.matrix }} steps: @@ -29,7 +29,7 @@ jobs: if: github.repository == 'hpcaitech/ColossalAI' name: Weekly check all examples needs: matrix_preparation - runs-on: [self-hosted, gpu] + runs-on: [self-hosted, ubuntu-latest] strategy: fail-fast: false matrix: ${{fromJson(needs.matrix_preparation.outputs.matrix)}} diff --git a/.github/workflows/release_docker_after_publish.yml b/.github/workflows/release_docker_after_publish.yml index d5d3a74ea..163cd825c 100644 --- a/.github/workflows/release_docker_after_publish.yml +++ b/.github/workflows/release_docker_after_publish.yml @@ -9,7 +9,7 @@ jobs: release: name: Publish Docker Image to DockerHub if: github.repository == 'hpcaitech/ColossalAI' - runs-on: [self-hosted, gpu] + runs-on: [self-hosted, ubuntu-latest] container: image: "hpcaitech/docker-in-docker:latest" options: --gpus all --rm -v /var/run/docker.sock:/var/run/docker.sock diff --git a/.github/workflows/release_nightly_on_schedule.yml b/.github/workflows/release_nightly_on_schedule.yml index 7b8f52c9e..30ffa22f6 100644 --- a/.github/workflows/release_nightly_on_schedule.yml +++ b/.github/workflows/release_nightly_on_schedule.yml @@ -9,7 +9,7 @@ jobs: publish: if: github.repository == 'hpcaitech/ColossalAI' name: Build and publish Python 🐍 distributions 📦 to PyPI - runs-on: ubuntu-[self-hosted, ubuntu-latest] + runs-on: [self-hosted, ubuntu-latest] timeout-minutes: 20 outputs: status: ${{ steps.publish.outcome }} diff --git a/.github/workflows/release_test_pypi_before_merge.yml b/.github/workflows/release_test_pypi_before_merge.yml index 3da222ce7..d950c1d83 100644 --- a/.github/workflows/release_test_pypi_before_merge.yml +++ b/.github/workflows/release_test_pypi_before_merge.yml @@ -6,6 +6,10 @@ on: - 'version.txt' +permissions: + id-token: write + contents: read + jobs: build-n-publish: if: github.event_name == 'workflow_dispatch' || github.repository == 'hpcaitech/ColossalAI' diff --git a/.github/workflows/report_leaderboard_to_lark.yml b/.github/workflows/report_leaderboard_to_lark.yml index 70a13270d..fbd077bd0 100644 --- a/.github/workflows/report_leaderboard_to_lark.yml +++ b/.github/workflows/report_leaderboard_to_lark.yml @@ -10,7 +10,7 @@ jobs: generate-and-publish: if: github.repository == 'hpcaitech/ColossalAI' name: Generate leaderboard report and publish to Lark - runs-on: ubuntu-[self-hosted, ubuntu-latest] + runs-on: [self-hosted, ubuntu-latest] timeout-minutes: 20 steps: - uses: actions/checkout@v2 diff --git a/.github/workflows/report_test_coverage.yml b/.github/workflows/report_test_coverage.yml index 1c17b63a9..2f4c58bf9 100644 --- a/.github/workflows/report_test_coverage.yml +++ b/.github/workflows/report_test_coverage.yml @@ -8,7 +8,7 @@ on: jobs: report-test-coverage: - runs-on: ubuntu-[self-hosted, ubuntu-latest] + runs-on: [self-hosted, ubuntu-latest] if: ${{ github.event.workflow_run.conclusion == 'success' }} steps: - name: "Download artifact" diff --git a/.github/workflows/run_chatgpt_examples.yml b/.github/workflows/run_chatgpt_examples.yml index 5f580e4c1..f25a6189f 100644 --- a/.github/workflows/run_chatgpt_examples.yml +++ b/.github/workflows/run_chatgpt_examples.yml @@ -17,7 +17,7 @@ jobs: github.event.pull_request.draft == false && github.base_ref == 'main' && github.event.pull_request.base.repo.full_name == 'hpcaitech/ColossalAI' - runs-on: [self-hosted, gpu] + runs-on: [self-hosted, ubuntu-latest] container: image: image-cloud.luchentech.com/hpcaitech/pytorch-cuda:2.2.2-12.1.0 options: --gpus all --rm -v /data/scratch/examples-data:/data/scratch/examples-data --shm-size=10.24gb diff --git a/.github/workflows/run_chatgpt_unit_tests.yml b/.github/workflows/run_chatgpt_unit_tests.yml index a67335690..9180ede37 100644 --- a/.github/workflows/run_chatgpt_unit_tests.yml +++ b/.github/workflows/run_chatgpt_unit_tests.yml @@ -17,7 +17,7 @@ jobs: github.event.pull_request.draft == false && github.base_ref == 'main' && github.event.pull_request.base.repo.full_name == 'hpcaitech/ColossalAI' - runs-on: [self-hosted, gpu] + runs-on: [self-hosted, ubuntu-latest] container: image: image-cloud.luchentech.com/hpcaitech/pytorch-cuda:2.2.2-12.1.0 options: --gpus all --rm -v /data/scratch/examples-data:/data/scratch/examples-data diff --git a/.github/workflows/run_colossalqa_unit_tests.yml b/.github/workflows/run_colossalqa_unit_tests.yml index f08831e5f..da2bfb006 100644 --- a/.github/workflows/run_colossalqa_unit_tests.yml +++ b/.github/workflows/run_colossalqa_unit_tests.yml @@ -17,7 +17,7 @@ jobs: github.event.pull_request.draft == false && github.base_ref == 'main' && github.event.pull_request.base.repo.full_name == 'hpcaitech/ColossalAI' - runs-on: [self-hosted, gpu] + runs-on: [self-hosted, ubuntu-latest] container: image: image-cloud.luchentech.com/hpcaitech/pytorch-cuda:2.2.2-12.1.0 volumes: diff --git a/.github/workflows/submodule.yml b/.github/workflows/submodule.yml index 14d85d1d9..5b882dd40 100644 --- a/.github/workflows/submodule.yml +++ b/.github/workflows/submodule.yml @@ -7,7 +7,7 @@ on: jobs: sync-submodule: - runs-on: ubuntu-[self-hosted, ubuntu-latest] + runs-on: [self-hosted, ubuntu-latest] if: github.repository == 'hpcaitech/ColossalAI' steps: - name: Checkout diff --git a/.github/workflows/translate_comment.yml b/.github/workflows/translate_comment.yml index 36113aaad..605396a5b 100644 --- a/.github/workflows/translate_comment.yml +++ b/.github/workflows/translate_comment.yml @@ -7,7 +7,7 @@ on: jobs: build: - runs-on: ubuntu-[self-hosted, ubuntu-latest] + runs-on: [self-hosted, ubuntu-latest] steps: - uses: usthe/issues-translate-action@v2.7 with: