---
# Docker Compose definition for the GPU-backed inference service.
# Relative paths below (../../) point two directories above this file.
services:
  fyp-inference-prod:
    container_name: fyp-inference-prod

    # Image is built from the directory two levels up, using the inference
    # Dockerfile stored under compose/dev/.
    # NOTE(review): a "prod" service building from the dev Dockerfile looks
    # unusual - confirm this is intentional.
    build:
      context: ../../
      dockerfile: compose/dev/inference/Dockerfile

    # Restart the container automatically unless it was explicitly stopped.
    restart: unless-stopped

    deploy:
      mode: replicated
      replicas: 1
      resources:
        reservations:
          # Reserve every available NVIDIA GPU for this container.
          devices:
            - driver: nvidia
              count: all
              capabilities: [gpu]

    # Variables loaded from the shared .env file two directories up.
    env_file:
      - ../../.env

    # Explicit settings for the HTTP listener and GPU visibility.
    environment:
      - INFERENCE_HTTP_HOST=0.0.0.0
      - INFERENCE_HTTP_PORT=8001
      - NVIDIA_VISIBLE_DEVICES=all

    # Publish container port 8001 as port 58001 on all host interfaces.
    ports:
      - '0.0.0.0:58001:8001'

    # Bind-mount the directory two levels up into the container at /app.
    # NOTE(review): this mounts the whole tree over /app at runtime - confirm
    # that is wanted for a prod-named service.
    volumes:
      - ../../:/app