Ollama Stack Docker
Posted: Wed May 06, 2026 8:16 pm
For Docker Compose (Ollama with NVIDIA GPU access):
Code: Select all
# Docker Compose stack that runs a single Ollama server container with
# NVIDIA GPU access and publishes its API port on the host.
services:
  ollama:
    # No tag is given, so the registry's default tag is pulled.
    image: ollama/ollama
    container_name: ollama
    # NOTE(review): privileged mode gives the container broad access to the
    # host. GPU access is already requested through the device reservation
    # under `deploy` below, so this is likely unnecessary -- confirm the
    # stack works without it and remove it if so.
    privileged: true
    environment:
      # Enable flash attention in the Ollama server.
      - OLLAMA_FLASH_ATTENTION=1
      # Keep at most one model loaded at a time.
      - OLLAMA_MAX_LOADED_MODELS=1
      # Keep a model loaded for 180 minutes after its last use.
      - OLLAMA_KEEP_ALIVE=180m
      # NOTE(review): presumably meant to cap CPU threads at 8; verify that
      # the Ollama server actually reads this variable -- TODO confirm.
      - OLLAMA_NUM_THREADS=8
    ports:
      # host:container. Quoted so the mapping is always read as a string.
      - "11434:11434"
    volumes:
      # Bind mount: host directory /home/ollama is mounted at /root/.ollama
      # inside the container (presumably Ollama's model/data directory --
      # confirm against the image documentation).
      - /home/ollama:/root/.ollama
    deploy:
      resources:
        reservations:
          devices:
            # Reserve every NVIDIA GPU on the host for this container.
            - driver: nvidia
              count: all
              capabilities: [gpu]
    # Restart automatically unless the container was explicitly stopped.
    restart: unless-stopped

volumes:
  # NOTE(review): this named volume is declared but no service references
  # it; the service above uses a bind mount instead. Either mount it
  # (`ollama:/root/.ollama`) or drop this section.
  ollama: