# Dynavera/compose/prod/docker-compose.inference.yml
#
# Repository viewer metadata at time of capture: 32 lines, 835 B, YAML.

# Production inference service, exposed through Traefik on the external
# `proxy-net` network.
#
# `${LLM_DOMAIN_NAME}` and `${LLM_PORT}` in the labels below are interpolated
# by Compose when the file is parsed (shell environment, project `.env`, or
# `--env-file`). The service-level `env_file` only injects variables into the
# running container, so it does not feed that interpolation.
services:
  fyp-inference-prod:
    container_name: fyp-inference-prod
    build:
      # Build context is the repository root (two levels above this file).
      context: ../../
      # NOTE(review): this prod stack builds from the Dockerfile under
      # compose/dev/ -- confirm that is intentional.
      dockerfile: compose/dev/inference/Dockerfile
    deploy:
      resources:
        reservations:
          devices:
            # Reserve every NVIDIA GPU on the host for this container.
            - driver: nvidia
              count: all
              capabilities: [gpu]
    restart: unless-stopped
    env_file: ../../prod.env
    volumes:
      # NOTE(review): bind-mounts the whole repository root over /app, which
      # hides whatever the image build placed there -- confirm this is wanted
      # in production.
      - ../../:/app
      - ../../models:/app/models
      # Host-side Hugging Face cache directory mounted at root's default
      # cache path inside the container.
      - ../../hf_cache:/root/.cache/huggingface
    labels:
      - "traefik.enable=true"
      - "traefik.http.routers.llm.rule=Host(`${LLM_DOMAIN_NAME}`)"
      - "traefik.http.routers.llm.entrypoints=web"
      - "traefik.http.services.llm.loadbalancer.server.port=${LLM_PORT}"
      # Tell Traefik which attached network to use to reach the container.
      - "traefik.docker.network=proxy-net"
    networks:
      - proxy-net
# `proxy-net` is declared external: Compose does not create or remove it, so
# it must already exist before this stack is brought up (presumably it is
# owned by the Traefik stack -- confirm).
networks:
  proxy-net:
    external: true