fix(ollama): 清除所有硬寫 188:11434 fallback — 全部改指向 111 GPU
All checks were successful
CD Pipeline / build-and-deploy (push) Successful in 15m59s

- decision_manager.py: 兩處 getattr fallback 188 → 111
- routes/agent.py: OLLAMA_BASE_URL 188 → 111
- knowledge_extractor_service.py: _OLLAMA_BASE 188 → 111

config.py 預設早已是 111,此次清掉 code 層殘留的 188 硬寫值。

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>
This commit is contained in:
OG T
2026-04-16 03:01:31 +08:00
parent 5f9c9d84a2
commit 27ba97e586
3 changed files with 4 additions and 4 deletions

View File: routes/agent.py

@@ -19,7 +19,7 @@ router = APIRouter()
logger = logging.getLogger(__name__)
# ==================== Ollama Config ====================
-OLLAMA_BASE_URL = "http://192.168.0.188:11434"
+OLLAMA_BASE_URL = "http://192.168.0.111:11434"
OLLAMA_MODEL = "llama3.2:latest" # 可根據實際部署調整
OLLAMA_TIMEOUT = 120.0 # 串流超時

View File: decision_manager.py

@@ -402,7 +402,7 @@ async def _nemoclaw_second_opinion(incident: "Incident", primary_result: dict) -
import httpx as _httpx
from src.services.model_registry import get_model as _get_model
-ollama_url = getattr(settings, "OLLAMA_URL", "http://192.168.0.188:11434")
+ollama_url = getattr(settings, "OLLAMA_URL", "http://192.168.0.111:11434")
# D1 集中化 2026-04-11: 從 models.json providers.ollama.models.nemoclaw 讀取
model = _get_model("ollama", "nemoclaw")
@@ -495,7 +495,7 @@ async def _generate_playbook_draft_if_new(incident: "Incident") -> None:
)
from src.services.model_registry import get_model as _get_model
-ollama_url = getattr(settings, "OLLAMA_URL", "http://192.168.0.188:11434")
+ollama_url = getattr(settings, "OLLAMA_URL", "http://192.168.0.111:11434")
# D1 集中化 2026-04-11: 從 models.json providers.ollama.models.playbook_draft 讀取
_pb_model = _get_model("ollama", "playbook_draft")
async with _httpx.AsyncClient(timeout=45.0) as client:

View File: knowledge_extractor_service.py

@@ -15,7 +15,7 @@ import structlog
logger = structlog.get_logger(__name__)
-_OLLAMA_BASE = "http://192.168.0.188:11434"
+_OLLAMA_BASE = "http://192.168.0.111:11434"
_EXTRACT_MODEL = "llama3.2:3b"
_EXTRACT_TIMEOUT = 30.0 # 秒,容忍慢速