feat: add ollama_research service and update profiles for dual-gpu sub-profiles
This commit is contained in:
parent
8e88a99a8e
commit
d626b20470
1 changed file with 18 additions and 4 deletions
22
compose.yml
22
compose.yml
|
|
@ -1,5 +1,5 @@
|
||||||
# compose.yml — Peregrine by Circuit Forge LLC
|
# compose.yml — Peregrine by Circuit Forge LLC
|
||||||
# Profiles: remote | cpu | single-gpu | dual-gpu
|
# Profiles: remote | cpu | single-gpu | dual-gpu-ollama | dual-gpu-vllm | dual-gpu-mixed
|
||||||
services:
|
services:
|
||||||
|
|
||||||
app:
|
app:
|
||||||
|
|
@ -52,7 +52,21 @@ services:
|
||||||
- OLLAMA_MODELS=/root/.ollama
|
- OLLAMA_MODELS=/root/.ollama
|
||||||
- DEFAULT_OLLAMA_MODEL=${OLLAMA_DEFAULT_MODEL:-llama3.2:3b}
|
- DEFAULT_OLLAMA_MODEL=${OLLAMA_DEFAULT_MODEL:-llama3.2:3b}
|
||||||
entrypoint: ["/bin/bash", "/entrypoint.sh"]
|
entrypoint: ["/bin/bash", "/entrypoint.sh"]
|
||||||
profiles: [cpu, single-gpu, dual-gpu]
|
profiles: [cpu, single-gpu, dual-gpu-ollama, dual-gpu-vllm, dual-gpu-mixed]
|
||||||
|
restart: unless-stopped
|
||||||
|
|
||||||
|
ollama_research:
|
||||||
|
image: ollama/ollama:latest
|
||||||
|
ports:
|
||||||
|
- "${OLLAMA_RESEARCH_PORT:-11435}:11434"
|
||||||
|
volumes:
|
||||||
|
- ${OLLAMA_MODELS_DIR:-~/models/ollama}:/root/.ollama
|
||||||
|
- ./docker/ollama/entrypoint.sh:/entrypoint.sh
|
||||||
|
environment:
|
||||||
|
- OLLAMA_MODELS=/root/.ollama
|
||||||
|
- DEFAULT_OLLAMA_MODEL=${OLLAMA_RESEARCH_MODEL:-llama3.2:3b}
|
||||||
|
entrypoint: ["/bin/bash", "/entrypoint.sh"]
|
||||||
|
profiles: [dual-gpu-ollama, dual-gpu-mixed]
|
||||||
restart: unless-stopped
|
restart: unless-stopped
|
||||||
|
|
||||||
vision:
|
vision:
|
||||||
|
|
@ -64,7 +78,7 @@ services:
|
||||||
environment:
|
environment:
|
||||||
- VISION_MODEL=${VISION_MODEL:-vikhyatk/moondream2}
|
- VISION_MODEL=${VISION_MODEL:-vikhyatk/moondream2}
|
||||||
- VISION_REVISION=${VISION_REVISION:-2025-01-09}
|
- VISION_REVISION=${VISION_REVISION:-2025-01-09}
|
||||||
profiles: [single-gpu, dual-gpu]
|
profiles: [single-gpu, dual-gpu-ollama, dual-gpu-vllm, dual-gpu-mixed]
|
||||||
restart: unless-stopped
|
restart: unless-stopped
|
||||||
|
|
||||||
vllm:
|
vllm:
|
||||||
|
|
@ -81,7 +95,7 @@ services:
|
||||||
--enforce-eager
|
--enforce-eager
|
||||||
--max-num-seqs 8
|
--max-num-seqs 8
|
||||||
--cpu-offload-gb ${CPU_OFFLOAD_GB:-0}
|
--cpu-offload-gb ${CPU_OFFLOAD_GB:-0}
|
||||||
profiles: [dual-gpu]
|
profiles: [dual-gpu-vllm, dual-gpu-mixed]
|
||||||
restart: unless-stopped
|
restart: unless-stopped
|
||||||
|
|
||||||
finetune:
|
finetune:
|
||||||
|
|
|
||||||
Loading…
Reference in a new issue