version: '3.8' services: compact-ai-model: build: . ports: - "8000:8000" environment: - MODEL_SIZE=small - API_HOST=0.0.0.0 - API_PORT=8000 volumes: - ./checkpoints:/app/checkpoints - ./data:/app/data deploy: resources: limits: memory: 4G cpus: '2.0' reservations: memory: 2G cpus: '1.0' healthcheck: test: ["CMD", "curl", "-f", "http://localhost:8000/health"] interval: 30s timeout: 10s retries: 3 restart: unless-stopped # Optional: Add a reverse proxy nginx: image: nginx:alpine ports: - "80:80" volumes: - ./nginx.conf:/etc/nginx/nginx.conf:ro depends_on: - compact-ai-model profiles: - prod