feat: add ollama_research service and update profiles for dual-gpu sub-profiles

This commit is contained in:
pyr0ball 2026-02-27 06:16:17 -08:00
parent 8e88a99a8e
commit d626b20470

View file

@ -1,5 +1,5 @@
# compose.yml — Peregrine by Circuit Forge LLC # compose.yml — Peregrine by Circuit Forge LLC
# Profiles: remote | cpu | single-gpu | dual-gpu # Profiles: remote | cpu | single-gpu | dual-gpu-ollama | dual-gpu-vllm | dual-gpu-mixed
services: services:
app: app:
@ -52,7 +52,21 @@ services:
- OLLAMA_MODELS=/root/.ollama - OLLAMA_MODELS=/root/.ollama
- DEFAULT_OLLAMA_MODEL=${OLLAMA_DEFAULT_MODEL:-llama3.2:3b} - DEFAULT_OLLAMA_MODEL=${OLLAMA_DEFAULT_MODEL:-llama3.2:3b}
entrypoint: ["/bin/bash", "/entrypoint.sh"] entrypoint: ["/bin/bash", "/entrypoint.sh"]
profiles: [cpu, single-gpu, dual-gpu] profiles: [cpu, single-gpu, dual-gpu-ollama, dual-gpu-vllm, dual-gpu-mixed]
restart: unless-stopped
# ollama_research: an additional service built from the ollama/ollama image,
# started only under the dual-gpu-ollama and dual-gpu-mixed profiles.
ollama_research:
image: ollama/ollama:latest
ports:
# Host port is taken from OLLAMA_RESEARCH_PORT (default 11435) and mapped to
# container port 11434.
- "${OLLAMA_RESEARCH_PORT:-11435}:11434"
volumes:
# Host directory from OLLAMA_MODELS_DIR (default ~/models/ollama) is mounted
# at /root/.ollama, the same path OLLAMA_MODELS points to below.
# NOTE(review): if another service mounts the same host directory, the two
# would share it — confirm that is intended.
- ${OLLAMA_MODELS_DIR:-~/models/ollama}:/root/.ollama
# Entrypoint script is bind-mounted from the repository into the container.
- ./docker/ollama/entrypoint.sh:/entrypoint.sh
environment:
- OLLAMA_MODELS=/root/.ollama
# Set from OLLAMA_RESEARCH_MODEL, falling back to llama3.2:3b.
# Presumably read by /entrypoint.sh — TODO confirm against the script.
- DEFAULT_OLLAMA_MODEL=${OLLAMA_RESEARCH_MODEL:-llama3.2:3b}
# Runs the mounted script with bash instead of the image's default entrypoint.
entrypoint: ["/bin/bash", "/entrypoint.sh"]
# Not listed under cpu, single-gpu, or dual-gpu-vllm.
profiles: [dual-gpu-ollama, dual-gpu-mixed]
restart: unless-stopped restart: unless-stopped
vision: vision:
@ -64,7 +78,7 @@ services:
environment: environment:
- VISION_MODEL=${VISION_MODEL:-vikhyatk/moondream2} - VISION_MODEL=${VISION_MODEL:-vikhyatk/moondream2}
- VISION_REVISION=${VISION_REVISION:-2025-01-09} - VISION_REVISION=${VISION_REVISION:-2025-01-09}
profiles: [single-gpu, dual-gpu] profiles: [single-gpu, dual-gpu-ollama, dual-gpu-vllm, dual-gpu-mixed]
restart: unless-stopped restart: unless-stopped
vllm: vllm:
@ -81,7 +95,7 @@ services:
--enforce-eager --enforce-eager
--max-num-seqs 8 --max-num-seqs 8
--cpu-offload-gb ${CPU_OFFLOAD_GB:-0} --cpu-offload-gb ${CPU_OFFLOAD_GB:-0}
profiles: [dual-gpu] profiles: [dual-gpu-vllm, dual-gpu-mixed]
restart: unless-stopped restart: unless-stopped
finetune: finetune: