services:
  # Voice-chat application, built from the build context in this directory.
  voice-chat:
    build: .
    ports:
      # host:container — publish container port 8000 on host port 8000.
      - "8000:8000"
    volumes:
      # Keep the model cache in a named volume so it survives container
      # rebuilds.
      - type: volume
        source: huggingface-cache
        target: /cache/huggingface
      # Mount config so you can edit backend settings without rebuilding the
      # image. Long syntax is used on purpose: the short "src:dst:ro" form
      # implies create_host_path, which silently creates a *directory* named
      # config.yml on the host when the file is missing. With it disabled,
      # Compose fails fast with a clear error instead.
      - type: bind
        source: ./config.yml
        target: /app/config.yml
        read_only: true
        bind:
          create_host_path: false
    deploy:
      resources:
        reservations:
          devices:
            # Reserve one NVIDIA GPU for this service.
            - driver: nvidia
              count: 1
              capabilities: [gpu]

# Named volumes managed by Docker; they outlive container rebuilds.
volumes:
  # Model cache mounted into the voice-chat service at /cache/huggingface.
  # Explicit empty mapping = default driver and options.
  huggingface-cache: {}