---
# Docker Compose definition for the `mms-api` service: builds the image from
# this directory, publishes port 7860, and reserves one NVIDIA GPU.

# NOTE(review): the top-level `version` key is treated as obsolete by the
# current Compose Specification; it is kept here unchanged for older tooling.
version: '3.8'

services:
  mms-api:
    # Build the image from the Dockerfile in the current directory.
    build: .
    ports:
      # host:container — quoted so the mapping is always read as a string.
      - "7860:7860"
    volumes:
      # Bind-mount the project directory into the container at /app.
      - .:/app
      # Named volume (declared at the bottom of this file) mounted at the
      # Hugging Face cache path so its contents persist across containers.
      - model_cache:/root/.cache/huggingface
    environment:
      # Expose only CUDA device index 0 to processes in the container.
      - CUDA_VISIBLE_DEVICES=0
    # Size of /dev/shm inside the container.
    shm_size: 4gb
    deploy:
      resources:
        reservations:
          devices:
            # Reserve a single GPU through the NVIDIA driver.
            - driver: nvidia
              count: 1
              capabilities: [gpu]

volumes:
  # Named volume with default settings, referenced by `mms-api` above.
  model_cache: {}