diff --git a/app/services/meal_plan/llm_planner.py b/app/services/meal_plan/llm_planner.py
index bc017e5..11859b4 100644
--- a/app/services/meal_plan/llm_planner.py
+++ b/app/services/meal_plan/llm_planner.py
@@ -5,6 +5,10 @@
 Returns suggestions for human review — never writes to the DB directly.
 The API endpoint presents the suggestions and waits for user approval
 before calling store.upsert_slot().
+
+Routing: pass a router from get_meal_plan_router() in llm_router.py.
+Cloud: cf-text via cf-orch (3B-7B GGUF, ~2GB VRAM).
+Local: LLMRouter (ollama / vllm / openai-compat per llm.yaml).
 """
 
 from __future__ import annotations
diff --git a/app/services/meal_plan/llm_timing.py b/app/services/meal_plan/llm_timing.py
index 7847c69..8918b8b 100644
--- a/app/services/meal_plan/llm_timing.py
+++ b/app/services/meal_plan/llm_timing.py
@@ -3,7 +3,11 @@
 """Estimate cook times for recipes missing corpus prep/cook time fields.
 
 Used only when tier allows `meal_plan_llm_timing`. Falls back gracefully
-when LLMRouter is unavailable.
+when no LLM backend is available.
+
+Routing: pass a router from get_meal_plan_router() in llm_router.py.
+Cloud: cf-text via cf-orch (3B GGUF, ~2GB VRAM).
+Local: LLMRouter (ollama / vllm / openai-compat per llm.yaml).
 """
 
 from __future__ import annotations