---
# Docker Compose definition for a single GPU-enabled web service ("app")
# that is started with gunicorn and published on port 5000.
version: '3.8'

services:
  app:
    # NOTE(review): no `image` or `build` key is active for this service.
    # Compose needs one of them -- uncomment and fill in the line below, or
    # confirm that it is supplied elsewhere (e.g. an override file).
    # image: USERNAME/IMAGE:latest

    # gunicorn is bound to 0.0.0.0:5000, which matches the container side
    # of the port mapping below.
    command: gunicorn -w 2 -b 0.0.0.0:5000 web:app

    # HOST:CONTAINER mapping; quoted so it is always read as a string.
    ports:
      - '5000:5000'

    # Passed to the container as plain environment variables.
    # Presumably consumed by the NVIDIA container runtime -- confirm that
    # it is installed on the host.
    environment:
      - NVIDIA_VISIBLE_DEVICES=all
      - NVIDIA_DRIVER_CAPABILITIES=compute,utility

    # Reserve host devices that advertise the `gpu` capability.
    deploy:
      resources:
        reservations:
          devices:
            - capabilities: [gpu]

    # Bind-mount the host directory /root/model-cache at /root/.cache
    # inside the container.
    volumes:
      - /root/model-cache:/root/.cache