From c5df4aebfc22bcb6e5fc2c07f304fd25cbc8a4dd Mon Sep 17 00:00:00 2001
From: ramilbakhshyiev <7597197+ramilbakhshyiev@users.noreply.github.com>
Date: Fri, 9 Aug 2024 15:21:34 -0700
Subject: [PATCH] Containerize ROCm build and move it to AMD GPU runners

Summary:
This change converts the ROCm build to run inside containers and updates it
to run on AMD GPU based runners. Still working with the AMD team to resolve
test failures before enabling those.

Differential Revision: D61049115
---
 .github/workflows/build.yml | 13 ++++++++++++-
 1 file changed, 12 insertions(+), 1 deletion(-)

diff --git a/.github/workflows/build.yml b/.github/workflows/build.yml
index 971d8941d5..a17f0838b1 100644
--- a/.github/workflows/build.yml
+++ b/.github/workflows/build.yml
@@ -93,8 +93,19 @@ jobs:
   linux-x86_64-GPU-w-ROCm-cmake:
     name: Linux x86_64 GPU w/ ROCm (cmake)
     needs: linux-x86_64-cmake
-    runs-on: 4-core-ubuntu
+    runs-on: faiss-amd-MI200
+    container:
+      image: ubuntu:22.04
+      options: --device=/dev/kfd --device=/dev/dri --ipc=host --shm-size 16G --group-add video --cap-add=SYS_PTRACE --cap-add=SYS_ADMIN
     steps:
+      - name: Container setup
+        run: |
+          if [ -f /.dockerenv ]; then
+            apt-get update && apt-get install -y sudo && apt-get install -y git
+            git config --global --add safe.directory '*'
+          else
+            echo 'Skipping. Current job is not running inside a container.'
+          fi
       - name: Checkout
         uses: actions/checkout@v4
       - name: Build and Test (cmake)