Skip to content

Commit

Permalink
feat: cuda support
Browse files Browse the repository at this point in the history
jonafeucht committed Jun 11, 2024
1 parent 0ccd80d commit 4cad922
Showing 3 changed files with 56 additions and 4 deletions.
21 changes: 19 additions & 2 deletions .github/workflows/publish.yml
Original file line number Diff line number Diff line change
@@ -18,6 +18,13 @@ permissions:
jobs:
build_and_publish:
runs-on: ubuntu-latest
# Build the CPU and CUDA images as two independent matrix jobs.
strategy:
  # The variants do not depend on each other, so a failure in one build
  # must not cancel the other.
  fail-fast: false
  matrix:
    include:
      # docker_file: Dockerfile passed to the build step.
      # label: moving tag published for this variant.
      - docker_file: Dockerfile
        label: "latest"
      - docker_file: Dockerfile.cuda
        label: "latest-cuda"
steps:
- uses: actions/checkout@v4

@@ -29,6 +36,13 @@ jobs:
uses: docker/metadata-action@v5
with:
  images: ${{ env.REGISTRY }}/${{ env.IMAGE_NAME }}
  # Both matrix jobs target the same image name with the same tag rules, so
  # without a per-variant suffix the CPU and CUDA builds push identical tags
  # and overwrite each other. The automatic `latest` tag is disabled because
  # the build step adds the moving `latest` / `latest-cuda` tag explicitly.
  flavor: |
    latest=false
    suffix=${{ matrix.label == 'latest-cuda' && '-cuda' || '' }}
  tags: |
    type=ref,event=branch
    type=ref,event=pr
    type=ref,event=tag
    type=sha,prefix=sha-
  # Custom labels are plain key=value pairs; the `type=raw,value=` form is
  # only understood by the `tags` input.
  labels: |
    image-type=${{ matrix.label }}
- uses: docker/login-action@v3
with:
@@ -40,7 +54,10 @@ jobs:
uses: docker/build-push-action@v5
with:
  context: .
  # Dockerfile of the current matrix variant (CPU or CUDA).
  file: ${{ matrix.docker_file }}
  # Pull requests only build; nothing is pushed to the registry.
  push: ${{ github.event_name != 'pull_request' }}
  # A mapping may define `tags` only once. Publish the tags generated by the
  # metadata step plus the moving tag for this variant; matrix.label already
  # holds that tag ("latest" or "latest-cuda").
  tags: |
    ${{ steps.meta.outputs.tags }}
    ${{ env.REGISTRY }}/${{ env.IMAGE_NAME }}:${{ matrix.label }}
  labels: ${{ steps.meta.outputs.labels }}
  platforms: linux/amd64,linux/arm64
8 changes: 8 additions & 0 deletions Dockerfile.cuda
Original file line number Diff line number Diff line change
@@ -0,0 +1,8 @@
# GPU image variant, based on the NVIDIA CUDA 12.5 runtime for Ubuntu 22.04.
FROM nvidia/cuda:12.5.0-runtime-ubuntu22.04
WORKDIR /app

# Install pip and remove the apt package lists in the same layer so they do
# not end up in the final image.
RUN apt-get update && \
    apt-get install -y python3-pip && \
    pip install --no-cache-dir --upgrade pip && \
    rm -rf /var/lib/apt/lists/*

# Copy only the dependency manifest first: the dependency layer below is then
# reused from cache until requirements.txt itself changes.
COPY requirements.txt /app/requirements.txt
RUN pip install --no-cache-dir -r requirements.txt --extra-index-url https://download.pytorch.org/whl/cu121

# Application sources change most often, so they are copied last.
COPY . /app
CMD ["fastapi", "run", "main.py", "--proxy-headers", "--host", "0.0.0.0", "--port", "8000"]
31 changes: 29 additions & 2 deletions README.md
Original file line number Diff line number Diff line change
@@ -8,9 +8,9 @@
## Installation

- For ease of use, it's recommended to use the provided [docker-compose.yml](https://github.com/doppeltilde/image_video_classification/blob/main/docker-compose.yml).
```yml
version: '3.9'

**CPU Support:** Use the `latest` tag.
```yml
services:
image_video_classification:
image: ghcr.io/doppeltilde/image_video_classification:latest
@@ -30,6 +30,33 @@ volumes:
models:
```
**NVIDIA GPU Support:** Use the `latest-cuda` tag.
```yml
services:
  image_video_classification_cuda:
    image: ghcr.io/doppeltilde/image_video_classification:latest-cuda
    ports:
      - "8000:8000"
    volumes:
      - models:/root/.cache/huggingface/hub:rw
    # Variables are passed through by name, so they must match the names
    # set in the .env file.
    environment:
      - DEFAULT_MODEL_NAME
      - COMPUTE_TYPE
      - USE_API_KEYS
      - API_KEYS
    restart: unless-stopped
    # Reserve all NVIDIA GPUs of the host for this container.
    deploy:
      resources:
        reservations:
          devices:
            - driver: nvidia
              count: all
              capabilities: [gpu]

volumes:
  models:
```

- Create a `.env` file and set the preferred values.
```sh
DEFAULT_MODEL_NAME=Falconsai/nsfw_image_detection

0 comments on commit 4cad922

Please sign in to comment.