diff --git a/.github/workflows/ci_cuda.yaml b/.github/workflows/ci_cuda.yaml index fc07f112c7..06f1c68af6 100644 --- a/.github/workflows/ci_cuda.yaml +++ b/.github/workflows/ci_cuda.yaml @@ -10,10 +10,10 @@ jobs: group: ${{ github.workflow }}-${{ github.job }}-${{ github.head_ref || github.run_id }} cancel-in-progress: true runs-on: - group: aws-g4dn-2xlarge + group: aws-g5-4xlarge-cache-k8s container: - image: nvidia/cuda:12.3.1-devel-ubuntu22.04 - options: --gpus 0 + image: nvidia/cuda:13.0.1-cudnn-devel-ubuntu24.04 + options: --gpus 0 if: ${{ github.event.pull_request.head.repo.full_name == github.event.pull_request.base.repo.full_name }} permissions: contents: write @@ -22,11 +22,13 @@ jobs: # with sigstore/fulcio when running outside of PRs. id-token: write security-events: write + env: + CUDA_COMPUTE_CAP: 86 steps: - name: Checkout repository - uses: actions/checkout@v3 + uses: actions/checkout@v5 - name: Install dependencies - run: apt-get update && apt install curl build-essential libssl-dev protobuf-compiler pkg-config -y + run: apt update && apt install curl build-essential libssl-dev protobuf-compiler pkg-config -y - name: Install Rust Stable uses: actions-rust-lang/setup-rust-toolchain@v1 - uses: Swatinem/rust-cache@v2 diff --git a/candle-examples/Cargo.toml b/candle-examples/Cargo.toml index 8fd31ad5aa..0b0760f947 100644 --- a/candle-examples/Cargo.toml +++ b/candle-examples/Cargo.toml @@ -58,7 +58,7 @@ tokio = "1.48.0" [build-dependencies] anyhow = { workspace = true } -bindgen_cuda = { version = "0.1.1", optional = true } +bindgen_cuda = { version = "0.1.5", optional = true } hf-hub = { workspace = true, features = ["tokio"] } [features] diff --git a/candle-flash-attn/Cargo.toml b/candle-flash-attn/Cargo.toml index a681468a1a..6c7281d552 100644 --- a/candle-flash-attn/Cargo.toml +++ b/candle-flash-attn/Cargo.toml @@ -15,7 +15,7 @@ candle = { path = "../candle-core", features = ["cuda"], package = "candle-core" half = { version = "2.3.1", features = ["num-traits"] } [build-dependencies] -bindgen_cuda = "0.1.1" +bindgen_cuda = "0.1.5" anyhow = { version = "1", features = ["backtrace"] } [dev-dependencies] diff --git a/candle-kernels/Cargo.toml b/candle-kernels/Cargo.toml index 8350ed9fc3..5ea1e07928 100644 --- a/candle-kernels/Cargo.toml +++ b/candle-kernels/Cargo.toml @@ -12,4 +12,4 @@ license = "MIT OR Apache-2.0" [dependencies] [build-dependencies] -bindgen_cuda = "0.1.1" +bindgen_cuda = "0.1.5"