diff --git a/.github/workflows/update-gpuci.yaml b/.github/workflows/update-gpuci.yaml deleted file mode 100644 index 91a27ec53f..0000000000 --- a/.github/workflows/update-gpuci.yaml +++ /dev/null @@ -1,71 +0,0 @@ -name: Check for gpuCI updates - -on: - # Disabling scheduled runs until gpuCI is back online. - # See https://github.com/dask/community/issues/404 - # schedule: - # - cron: "0 0 * * *" # Daily “At 00:00” UTC - workflow_dispatch: - -jobs: - update-gpuci: - runs-on: ubuntu-latest - if: github.repository == 'dask/distributed' - - steps: - - uses: actions/checkout@v4.1.3 - - - name: Parse current axis YAML - id: rapids_current - uses: the-coding-turtle/ga-yaml-parser@v0.1.2 - with: - file: continuous_integration/gpuci/axis.yaml - - - name: Get latest cuDF nightly version - id: cudf_latest - uses: jacobtomlinson/gha-anaconda-package-version@0.1.4 - with: - org: "rapidsai-nightly" - package: "cudf" - version_system: "CalVer" - - - name: Get latest UCX-Py nightly version - id: ucx_py_latest - uses: jacobtomlinson/gha-anaconda-package-version@0.1.4 - with: - org: "rapidsai-nightly" - package: "ucx-py" - version_system: "CalVer" - - - name: Get old RAPIDS / UCX-Py versions - env: - FULL_RAPIDS_VER: ${{ steps.cudf_latest.outputs.version }} - FULL_UCX_PY_VER: ${{ steps.ucx_py_latest.outputs.version }} - run: | - echo RAPIDS_VER=${{ steps.rapids_current.outputs.RAPIDS_VER_0 }} >> $GITHUB_ENV - echo UCX_PY_VER=$(curl -sL https://version.gpuci.io/rapids/${{ steps.rapids_current.outputs.RAPIDS_VER_0 }}) >> $GITHUB_ENV - echo NEW_RAPIDS_VER=$(echo $FULL_RAPIDS_VER | cut -d'.' -f1,2) >> $GITHUB_ENV - echo NEW_UCX_PY_VER=$(echo $FULL_UCX_PY_VER | cut -d'.' -f1,2) >> $GITHUB_ENV - - - name: Update RAPIDS version - uses: jacobtomlinson/gha-find-replace@v3 - with: - include: 'continuous_integration\/gpuci\/axis\.yaml' - find: "${{ env.RAPIDS_VER }}" - replace: "${{ env.NEW_RAPIDS_VER }}" - regex: false - - - name: Create Pull Request - uses: peter-evans/create-pull-request@v6 - if: ${{ env.UCX_PY_VER != env.NEW_UCX_PY_VER }} # make sure new ucx-py nightlies are available - with: - token: ${{ secrets.GITHUB_TOKEN }} - draft: false - commit-message: "Update gpuCI `RAPIDS_VER` to `${{ env.NEW_RAPIDS_VER }}`" - title: "Update gpuCI `RAPIDS_VER` to `${{ env.NEW_RAPIDS_VER }}`" - author: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com> - branch: "upgrade-gpuci-rapids" - body: | - New cuDF and ucx-py nightly versions have been detected. - - Updated `axis.yaml` to use `${{ env.NEW_RAPIDS_VER }}`. diff --git a/CODEOWNERS b/CODEOWNERS index 08ebf86238..38c8a480a8 100644 --- a/CODEOWNERS +++ b/CODEOWNERS @@ -12,4 +12,3 @@ distributed/widgets/* @jacobtomlinson # GPU Support distributed/diagnostics/nvml.py @jacobtomlinson @quasiben -continuous_integration/gpuci/* @jacobtomlinson @quasiben diff --git a/continuous_integration/gpuci/axis.yaml b/continuous_integration/gpuci/axis.yaml deleted file mode 100644 index 41fca92d9f..0000000000 --- a/continuous_integration/gpuci/axis.yaml +++ /dev/null @@ -1,14 +0,0 @@ -PYTHON_VER: -- "3.10" -- "3.11" - -CUDA_VER: -- "11.8.0" - -LINUX_VER: -- ubuntu20.04 - -RAPIDS_VER: -- "24.12" - -excludes: diff --git a/continuous_integration/gpuci/build.sh b/continuous_integration/gpuci/build.sh deleted file mode 100644 index ab3bc95c48..0000000000 --- a/continuous_integration/gpuci/build.sh +++ /dev/null @@ -1,62 +0,0 @@ -############################################## -# Dask GPU build and test script for CI # -############################################## -set -e -NUMARGS=$# -ARGS=$* - -# Arg parsing function -function hasArg { - (( ${NUMARGS} != 0 )) && (echo " ${ARGS} " | grep -q " $1 ") -} - -# Set path and build parallel level -export PATH=/opt/conda/bin:/usr/local/cuda/bin:$PATH -export PARALLEL_LEVEL=${PARALLEL_LEVEL:-4} - -# Set home to the job's workspace -export HOME="$WORKSPACE" - -# Switch to project root; also root of repo checkout -cd "$WORKSPACE" - -# Determine CUDA release version -export CUDA_REL=${CUDA_VERSION%.*} - -# FIXME - monitoring GIL contention causes UCX teardown issues -export DASK_DISTRIBUTED__ADMIN__SYSTEM_MONITOR__GIL__ENABLED=False - -################################################################################ -# SETUP - Check environment -################################################################################ - -rapids-logger "Check environment variables" -env - -rapids-logger "Check GPU usage" -nvidia-smi - -rapids-logger "Activate conda env" -. /opt/conda/etc/profile.d/conda.sh -conda activate dask - -rapids-logger "Install distributed" -python -m pip install -e . - -rapids-logger "Install dask" -python -m pip install git+https://github.com/dask/dask - -rapids-logger "Check Python versions" -python --version - -rapids-logger "Check conda environment" -conda info -conda config --show-sources -conda list --show-channel-urls - -rapids-logger "Python py.test for distributed" -py.test distributed -v -m gpu --runslow --junitxml="$WORKSPACE/junit-distributed.xml" - -# cuDF spill stats monitoring must be enabled for this test -CUDF_SPILL=on CUDF_SPILL_STATS=1 DASK_DISTRIBUTED__DIAGNOSTICS__CUDF=1 \ - py.test distributed/diagnostics/tests/test_cudf_diagnostics.py -v -m gpu --runslow --junitxml="$WORKSPACE/junit-distributed.xml"