[mod] ollama

This commit is contained in:
Andy Bunce 2025-04-27 16:53:14 +01:00
parent bb3ae24a94
commit 25d831f091

View file

@@ -12,10 +12,11 @@ services:
environment:
- OLLAMA_MAX_LOADED_MODELS=1
- OLLAMA_NO_CUDA=1
- OLLAMA_FLASH_ATTENTION=1
deploy:
resources:
limits:
-cpus: '4' # Limit CPU cores
+cpus: 8 # Limit CPU cores
memory: 16G # Limit RAM (adjust based on your system)
# devices:
# - /dev/dri:/dev/dri