From d1409fc4c0f923b742f280ecc4ba767c6c73efaa Mon Sep 17 00:00:00 2001 From: OG T Date: Fri, 27 Mar 2026 09:23:35 +0800 Subject: [PATCH] =?UTF-8?q?fix(api):=20=E5=A2=9E=E5=8A=A0=20LLM=20?= =?UTF-8?q?=E8=B6=85=E6=99=82=E5=88=B0=20120/180s=20(llama3.2:3b=20CPU=20?= =?UTF-8?q?=E7=B4=84=202-3=20=E5=88=86=E9=90=98)?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Co-Authored-By: Claude Opus 4.5 --- apps/api/src/api/v1/incidents.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/apps/api/src/api/v1/incidents.py b/apps/api/src/api/v1/incidents.py index 1084b12d..08595dfb 100644 --- a/apps/api/src/api/v1/incidents.py +++ b/apps/api/src/api/v1/incidents.py @@ -148,8 +148,8 @@ async def list_incidents() -> IncidentListResponse: for incident in incidents: try: # P0/P1 給更短的 timeout (緊急) - # 2026-03-27 ogt: 增加超時 (Ollama CPU 模式較慢) - timeout = 30.0 if incident.severity in (Severity.P0, Severity.P1) else 60.0 + # 2026-03-27 ogt: 增加超時 (Ollama CPU 模式 llama3.2:3b 約 2-3 分鐘) + timeout = 120.0 if incident.severity in (Severity.P0, Severity.P1) else 180.0 decision_token = await decision_manager.get_or_create_decision( incident=incident,