Skip to content

Commit

Permalink
Troubleshoot hanging matrix jobs
Browse files Browse the repository at this point in the history
  • Loading branch information
hcho3 committed Nov 20, 2024
1 parent f30a0c3 commit 916c81a
Show file tree
Hide file tree
Showing 2 changed files with 27 additions and 13 deletions.
12 changes: 9 additions & 3 deletions .github/workflows/jvm_tests.yml
Original file line number Diff line number Diff line change
Expand Up @@ -18,8 +18,10 @@ jobs:
build-containers:
name: Build CI containers (${{ matrix.container_id }})
runs-on:
- - runs-on=${{ github.run_id }}
+ - runs-on
  - runner=${{ matrix.runner }}
+ - run-id=${{ github.run_id }}
+ - tag=${{ matrix.container_id }}
strategy:
max-parallel: 2
matrix:
Expand Down Expand Up @@ -48,8 +50,10 @@ jobs:
(arch ${{ matrix.arch }}, runner ${{ matrix.runner }})
needs: build-containers
runs-on:
- - runs-on=${{ github.run_id }}
+ - runs-on
  - runner=${{ matrix.runner }}
+ - run-id=${{ github.run_id }}
+ - tag=${{ matrix.arch }}
strategy:
fail-fast: false
matrix:
Expand Down Expand Up @@ -266,8 +270,10 @@ jobs:
name: Deploy JVM packages to S3 (${{ matrix.variant }})
needs: [build-jvm-gpu, build-test-jvm-packages, test-jvm-packages-gpu]
runs-on:
- - runs-on=${{ github.run_id }}
+ - runs-on
  - runner=linux-amd64-cpu
+ - run-id=${{ github.run_id }}
+ - tag=${{ matrix.variant }}
strategy:
fail-fast: false
matrix:
Expand Down
28 changes: 18 additions & 10 deletions .github/workflows/main.yml
Original file line number Diff line number Diff line change
Expand Up @@ -18,8 +18,10 @@ jobs:
build-containers:
name: Build CI containers (${{ matrix.container_id }})
runs-on:
- - runs-on=${{ github.run_id }}
+ - runs-on
  - runner=${{ matrix.runner }}
+ - run-id=${{ github.run_id }}
+ - tag=${{ matrix.container_id }}
strategy:
max-parallel: 2
matrix:
Expand Down Expand Up @@ -169,8 +171,10 @@ jobs:
name: Build manylinux2014_${{ matrix.arch }} wheel
needs: build-containers
runs-on:
- - runs-on=${{ github.run_id }}
+ - runs-on
  - runner=${{ matrix.runner }}
+ - run-id=${{ github.run_id }}
+ - tag=${{ matrix.arch }}
strategy:
fail-fast: false
matrix:
Expand Down Expand Up @@ -227,8 +231,10 @@ jobs:
(Suite ${{ matrix.suite }}, Runner ${{ matrix.runner }})
needs: [build-cuda, build-cuda-with-rmm]
runs-on:
- - runs-on=${{ github.run_id }}
+ - runs-on
  - runner=${{ matrix.runner }}
+ - run-id=${{ github.run_id }}
+ - tag=${{ matrix.suite }}
strategy:
fail-fast: false
max-parallel: 2
Expand Down Expand Up @@ -266,39 +272,41 @@ jobs:
name: Run Python tests (${{ matrix.description }})
needs: [build-cuda, build-cpu-arm64]
runs-on:
- - runs-on=${{ github.run_id }}
+ - runs-on
  - runner=${{ matrix.runner }}
+ - run-id=${{ github.run_id }}
+ - tag=${{ matrix.description }}
strategy:
fail-fast: false
max-parallel: 2
matrix:
include:
- - description: "single GPU"
+ - description: single-gpu
container: xgb-ci.gpu
suite: gpu
runner: linux-amd64-gpu
artifact_from: build-cuda
- - description: "single GPU, nightly deps"
+ - description: single-gpu-nightly-deps
container: xgb-ci.gpu_dev_ver
suite: gpu
runner: linux-amd64-gpu
artifact_from: build-cuda
- - description: "multiple GPUs"
+ - description: multiple-gpu
container: xgb-ci.gpu
suite: mgpu
runner: linux-amd64-mgpu
artifact_from: build-cuda
- - description: "multiple GPUs, nightly deps"
+ - description: multiple-gpu-nightly-deps
container: xgb-ci.gpu_dev_ver
suite: mgpu
runner: linux-amd64-mgpu
artifact_from: build-cuda
- - description: "CPU"
+ - description: cpu-amd64
container: xgb-ci.cpu
suite: cpu
runner: linux-amd64-cpu
artifact_from: build-cuda
- - description: "CPU ARM64"
+ - description: cpu-arm64
container: xgb-ci.aarch64
suite: cpu-arm64
runner: linux-arm64-cpu
Expand Down

0 comments on commit 916c81a

Please sign in to comment.