---
# Compose definition for the GPU-enabled inference service.
services:
  fyp-inference-prod:
    container_name: fyp-inference-prod
    restart: unless-stopped

    # Image is built with the directory two levels above this file as context.
    # NOTE(review): the service is named "prod" but the Dockerfile path sits
    # under compose/dev/ -- confirm this is intentional.
    build:
      context: ../../
      dockerfile: compose/dev/inference/Dockerfile

    # Variables are read from the .env file first; keys listed under
    # `environment` override any same-named entries from that file.
    env_file:
      - ../../.env
    environment:
      INFERENCE_HTTP_HOST: '0.0.0.0'
      INFERENCE_HTTP_PORT: '8001'
      NVIDIA_VISIBLE_DEVICES: 'all'

    # Publish container port 8001 on host port 58001, on all host interfaces.
    ports:
      - '0.0.0.0:58001:8001'

    # Bind-mount the directory two levels up over /app inside the container.
    # NOTE(review): this shadows whatever the image placed at /app -- confirm
    # that is wanted for a service labelled "prod".
    volumes:
      - ../../:/app

    # Single replica with a reservation for every NVIDIA GPU on the host.
    deploy:
      mode: replicated
      replicas: 1
      resources:
        reservations:
          devices:
            - driver: nvidia
              count: all
              capabilities:
                - gpu