fix: increase LLM summarize timeout to 120s for remote cf-orch routing
The previous 20s timeout was too tight for first-request model swaps in Ollama (a cold model load can take 30-60s). 120s matches the coordinator's inference timeout.
This commit is contained in:
parent
8339797b77
commit
dda0b453c2
1 changed file with 1 addition and 1 deletion
|
|
@@ -38,7 +38,7 @@ def summarize(
|
||||||
llm_url: str,
|
llm_url: str,
|
||||||
llm_model: str,
|
llm_model: str,
|
||||||
api_key: str | None = None,
|
api_key: str | None = None,
|
||||||
timeout: float = 20.0,
|
timeout: float = 120.0,
|
||||||
) -> str | None:
|
) -> str | None:
|
||||||
if not entries:
|
if not entries:
|
||||||
return None
|
return None
|
||||||
|
|
|
||||||
Loading…
Reference in a new issue