[mod] ollama

This commit is contained in:
Andy Bunce 2025-04-27 16:53:14 +01:00
parent bb3ae24a94
commit 25d831f091

View file

@@ -12,10 +12,11 @@ services:
environment: environment:
- OLLAMA_MAX_LOADED_MODELS=1 - OLLAMA_MAX_LOADED_MODELS=1
- OLLAMA_NO_CUDA=1 - OLLAMA_NO_CUDA=1
- OLLAMA_FLASH_ATTENTION=1
deploy: deploy:
resources: resources:
limits: limits:
cpus: '4' # Limit CPU cores cpus: 8 # Limit CPU cores
memory: 16G # Limit RAM (adjust based on your system) memory: 16G # Limit RAM (adjust based on your system)
# devices: # devices:
# - /dev/dri:/dev/dri # - /dev/dri:/dev/dri