odysseus/docker/gpu.nvidia.yml

# NVIDIA GPU overlay. Enable by setting COMPOSE_FILE in .env:
#   COMPOSE_FILE=docker-compose.yml:docker/gpu.nvidia.yml
#
# Use scripts/check-docker-gpu.sh to diagnose GPU passthrough, optionally
# install the NVIDIA Container Toolkit (Ubuntu/Debian), and write COMPOSE_FILE
# to .env. The script is read-only by default — it installs nothing and never
# edits .env unless explicitly asked.
#
# Requires the NVIDIA Container Toolkit on the host.
#   Arch:    sudo pacman -S nvidia-container-toolkit
#   Debian:  sudo apt install nvidia-container-toolkit
#   Fedora:  sudo dnf install nvidia-container-toolkit
# Then:
#   sudo nvidia-ctk runtime configure --runtime=docker
#   sudo systemctl restart docker
# Verify with:
#   docker info | grep -i nvidia
#
# This overlay only passes the host GPU through to the container.
# The slim Odysseus image does not bundle CUDA userspace or inference
# engines — install vLLM / llama-cpp-python / SGLang via
# Cookbook -> Dependencies (or pip) before serving GPU models.
services:
  odysseus:
    environment:
      - NVIDIA_VISIBLE_DEVICES=all
      - NVIDIA_DRIVER_CAPABILITIES=compute,utility
    deploy:
      resources:
        reservations:
          devices:
            - driver: nvidia
              count: all
              capabilities: [gpu]