version: '3.8' | |
services: | |
gema-model-api: | |
build: . | |
ports: | |
- "8000:8000" | |
environment: | |
- PYTHONUNBUFFERED=1 | |
volumes: | |
- ./cache:/root/.cache/huggingface # Cache model downloads | |
restart: unless-stopped | |
healthcheck: | |
test: ["CMD", "curl", "-f", "http://localhost:8000/health"] | |
interval: 30s | |
timeout: 10s | |
retries: 3 | |
deploy: | |
resources: | |
limits: | |
memory: 8G # Adjust based on your system | |
reservations: | |
memory: 4G |