# Ollama
# Large Language Model API
# Get up and running with Llama 3.2, Mistral, Gemma 2, and other large language models.
# Links:
# Compose project name.
name: ollama

services:
  # Ollama server, published through Traefik and listed on the homepage
  # dashboard via the labels below.
  ollama:
    # GPU acceleration: set GPU_COMPOSE_SUFFIX=amdgpu in host .env to load
    # ollama-amdgpu.yaml (ROCm/AMD)
    image: ollama/ollama:0.31.1
    container_name: ollama
    restart: unless-stopped
    # Relative CPU scheduling weight; see the links below for how shares are
    # applied when containers compete for CPU.
    # https://docs.docker.com/config/containers/resource_constraints/#configure-the-default-cfs-scheduler
    # https://batey.info/cgroup-cpu-shares-for-docker.html
    cpu_shares: 512
    volumes:
      # Host directory under ${DOCKER_VOLUMES} mounted at /root/.ollama.
      - ${DOCKER_VOLUMES}/ollama:/root/.ollama
    networks:
      - proxy
    labels:
      # Label values are strings; the boolean and the port are quoted so YAML
      # does not retype them (older docker-compose releases reject bare
      # booleans in label maps).
      traefik.enable: "true"
      traefik.http.routers.ollama.middlewares: localaccess@file
      traefik.http.services.ollama.loadbalancer.server.port: "11434"
      homepage.group: AI
      homepage.name: "Ollama"
      homepage.icon: ollama.png
      homepage.href: https://ollama.${MYDOMAIN}/
      homepage.description: "Large Language Model API"

networks:
  # Declared external: Compose expects this network to exist already and does
  # not create it.
  proxy:
    external: true