llm-apiku / docker-compose.yml
DENNY
Add application file
6d2ea02
raw
history blame contribute delete
517 Bytes
# Compose definition for a single service, `gema-model-api`, built from the
# local directory and published on port 8000.
version: '3.8'

services:
  gema-model-api:
    # Build context is the directory containing this file.
    build: .
    ports:
      # host:container; kept quoted so it is always parsed as a string.
      - "8000:8000"
    environment:
      # Standard CPython switch: unbuffered stdout/stderr, so log lines
      # show up in `docker compose logs` immediately.
      - PYTHONUNBUFFERED=1
    volumes:
      # Cache model downloads
      - ./cache:/root/.cache/huggingface
    restart: unless-stopped
    healthcheck:
      # NOTE(review): this needs `curl` inside the image and a /health route
      # served on port 8000 -- confirm both against the Dockerfile and app.
      test: ["CMD", "curl", "-f", "http://localhost:8000/health"]
      interval: 30s
      timeout: 10s
      retries: 3
    # NOTE(review): whether `deploy.resources` is enforced outside Swarm
    # depends on the Compose version in use -- confirm for your setup.
    deploy:
      resources:
        limits:
          memory: 8G  # Adjust based on your system
        reservations:
          memory: 4G