fix: increase LLM summarize timeout to 120s for remote cf-orch routing

The 20s default was too tight for first-request model swaps in Ollama (a cold
model load can take 30–60s). 120s matches the coordinator's inference timeout.
This commit is contained in:
pyr0ball 2026-05-12 18:27:52 -07:00
parent 8339797b77
commit dda0b453c2

View file

@@ -38,7 +38,7 @@ def summarize(
llm_url: str, llm_url: str,
llm_model: str, llm_model: str,
api_key: str | None = None, api_key: str | None = None,
timeout: float = 20.0, timeout: float = 120.0,
) -> str | None: ) -> str | None:
if not entries: if not entries:
return None return None