Dynavera/compose/prod/docker-compose.inference.yml

27 lines
609 B
YAML
Raw Normal View History

# Production Compose definition for the GPU-backed inference service.
# NOTE(review): the relative paths below (../../) presumably point at the
# repository root, two levels above compose/prod/ - confirm.
services:
  fyp-inference-prod:
    container_name: fyp-inference-prod
    build:
      context: ../../
      # NOTE(review): the prod service is built from the *dev* Dockerfile -
      # confirm this is intentional.
      dockerfile: compose/dev/inference/Dockerfile
    restart: unless-stopped
    deploy:
      mode: replicated
      replicas: 1
      resources:
        reservations:
          devices:
            # Reserve all NVIDIA GPUs on the host for this container.
            - driver: nvidia
              count: all
              capabilities: [gpu]
    env_file:
      - ../../.env
    # Entries listed here take precedence over same-named keys in env_file.
    environment:
      - INFERENCE_HTTP_HOST=0.0.0.0
      - INFERENCE_HTTP_PORT=8001
      - NVIDIA_VISIBLE_DEVICES=all
    ports:
      # Host port 58001 (bound on all host interfaces) -> container port 8001,
      # the same port number set in INFERENCE_HTTP_PORT above.
      # NOTE(review): 0.0.0.0 publishes the port on every host interface -
      # confirm that exposure is intended for production.
      - '0.0.0.0:58001:8001'
    volumes:
      # NOTE(review): bind-mounts the same directory used as the build context
      # over /app, so host files shadow whatever the image has at that path -
      # confirm this is wanted in production.
      - ../../:/app