feat(resources): add 24GB, 16GB, 4GB, CPU+32GB, CPU+16GB public profiles
This commit is contained in:
parent
bfc1f7b7b9
commit
5429e3f595
5 changed files with 186 additions and 0 deletions
33
circuitforge_core/resources/profiles/public/cpu-16gb.yaml
Normal file
33
circuitforge_core/resources/profiles/public/cpu-16gb.yaml
Normal file
|
|
@@ -0,0 +1,33 @@
|
|||
schema_version: 1
|
||||
name: cpu-16gb
|
||||
eviction_timeout_s: 30.0
|
||||
services:
|
||||
ollama:
|
||||
max_mb: 0
|
||||
priority: 1
|
||||
cf-stt:
|
||||
max_mb: 0
|
||||
priority: 2
|
||||
shared: true
|
||||
max_concurrent: 1
|
||||
backend: moonshine
|
||||
cf-tts:
|
||||
max_mb: 0
|
||||
priority: 2
|
||||
shared: true
|
||||
max_concurrent: 1
|
||||
cf-embed:
|
||||
max_mb: 0
|
||||
priority: 2
|
||||
shared: true
|
||||
max_concurrent: 2
|
||||
always_on: true
|
||||
cf-classify:
|
||||
max_mb: 0
|
||||
priority: 2
|
||||
shared: true
|
||||
max_concurrent: 2
|
||||
always_on: true
|
||||
model_size_hints:
|
||||
llm_max_params: 3b-q4
|
||||
image_gen_max: none
|
||||
33
circuitforge_core/resources/profiles/public/cpu-32gb.yaml
Normal file
33
circuitforge_core/resources/profiles/public/cpu-32gb.yaml
Normal file
|
|
@@ -0,0 +1,33 @@
|
|||
schema_version: 1
|
||||
name: cpu-32gb
|
||||
eviction_timeout_s: 30.0
|
||||
services:
|
||||
ollama:
|
||||
max_mb: 0
|
||||
priority: 1
|
||||
cf-stt:
|
||||
max_mb: 0
|
||||
priority: 2
|
||||
shared: true
|
||||
max_concurrent: 2
|
||||
backend: faster-whisper
|
||||
cf-tts:
|
||||
max_mb: 0
|
||||
priority: 2
|
||||
shared: true
|
||||
max_concurrent: 2
|
||||
cf-embed:
|
||||
max_mb: 0
|
||||
priority: 2
|
||||
shared: true
|
||||
max_concurrent: 4
|
||||
always_on: true
|
||||
cf-classify:
|
||||
max_mb: 0
|
||||
priority: 2
|
||||
shared: true
|
||||
max_concurrent: 4
|
||||
always_on: true
|
||||
model_size_hints:
|
||||
llm_max_params: 7b-q4
|
||||
image_gen_max: none
|
||||
|
|
@@ -0,0 +1,45 @@
|
|||
schema_version: 1
|
||||
name: single-gpu-16gb
|
||||
vram_total_mb: 16384
|
||||
eviction_timeout_s: 10.0
|
||||
services:
|
||||
vllm:
|
||||
max_mb: 12288
|
||||
priority: 1
|
||||
ollama:
|
||||
max_mb: 12288
|
||||
priority: 1
|
||||
cf-vision:
|
||||
max_mb: 3072
|
||||
priority: 2
|
||||
shared: true
|
||||
max_concurrent: 4
|
||||
cf-stt:
|
||||
max_mb: 1200
|
||||
priority: 2
|
||||
shared: true
|
||||
max_concurrent: 3
|
||||
backend: parakeet-tdt
|
||||
cf-tts:
|
||||
max_mb: 1024
|
||||
priority: 2
|
||||
shared: true
|
||||
max_concurrent: 3
|
||||
cf-embed:
|
||||
max_mb: 512
|
||||
priority: 2
|
||||
shared: true
|
||||
max_concurrent: 6
|
||||
always_on: true
|
||||
cf-classify:
|
||||
max_mb: 512
|
||||
priority: 2
|
||||
shared: true
|
||||
max_concurrent: 6
|
||||
always_on: true
|
||||
comfyui:
|
||||
max_mb: 14336
|
||||
priority: 4
|
||||
model_size_hints:
|
||||
llm_max_params: 34b
|
||||
image_gen_max: flux-dev-fp8
|
||||
|
|
@@ -0,0 +1,45 @@
|
|||
schema_version: 1
|
||||
name: single-gpu-24gb
|
||||
vram_total_mb: 24576
|
||||
eviction_timeout_s: 10.0
|
||||
services:
|
||||
vllm:
|
||||
max_mb: 20480
|
||||
priority: 1
|
||||
ollama:
|
||||
max_mb: 18432
|
||||
priority: 1
|
||||
cf-vision:
|
||||
max_mb: 4096
|
||||
priority: 2
|
||||
shared: true
|
||||
max_concurrent: 6
|
||||
cf-stt:
|
||||
max_mb: 1200
|
||||
priority: 2
|
||||
shared: true
|
||||
max_concurrent: 4
|
||||
backend: parakeet-tdt
|
||||
cf-tts:
|
||||
max_mb: 1024
|
||||
priority: 2
|
||||
shared: true
|
||||
max_concurrent: 4
|
||||
cf-embed:
|
||||
max_mb: 512
|
||||
priority: 2
|
||||
shared: true
|
||||
max_concurrent: 8
|
||||
always_on: true
|
||||
cf-classify:
|
||||
max_mb: 512
|
||||
priority: 2
|
||||
shared: true
|
||||
max_concurrent: 8
|
||||
always_on: true
|
||||
comfyui:
|
||||
max_mb: 20480
|
||||
priority: 4
|
||||
model_size_hints:
|
||||
llm_max_params: 70b
|
||||
image_gen_max: flux-dev-fp16
|
||||
|
|
@@ -0,0 +1,30 @@
|
|||
schema_version: 1
|
||||
name: single-gpu-4gb
|
||||
vram_total_mb: 4096
|
||||
eviction_timeout_s: 15.0
|
||||
services:
|
||||
ollama:
|
||||
max_mb: 3072
|
||||
priority: 1
|
||||
cf-vision:
|
||||
max_mb: 1024
|
||||
priority: 2
|
||||
shared: true
|
||||
max_concurrent: 1
|
||||
cf-stt:
|
||||
max_mb: 600
|
||||
priority: 2
|
||||
shared: true
|
||||
max_concurrent: 1
|
||||
backend: faster-whisper
|
||||
cf-tts:
|
||||
max_mb: 512
|
||||
priority: 2
|
||||
shared: true
|
||||
max_concurrent: 1
|
||||
comfyui:
|
||||
max_mb: 3584
|
||||
priority: 4
|
||||
model_size_hints:
|
||||
llm_max_params: 3b
|
||||
image_gen_max: sd15-fp8
|
||||
Loading…
Reference in a new issue