diff --git a/apps/api/src/api/v1/monitoring.py b/apps/api/src/api/v1/monitoring.py index f7a47cca..1cad552f 100644 --- a/apps/api/src/api/v1/monitoring.py +++ b/apps/api/src/api/v1/monitoring.py @@ -18,6 +18,7 @@ from datetime import UTC, datetime import httpx from fastapi import APIRouter +from src.core.config import settings from src.core.logging import get_logger logger = get_logger(__name__) @@ -64,7 +65,9 @@ async def _probe_grafana(client: httpx.AsyncClient) -> dict: async def _probe_prometheus(client: httpx.AsyncClient) -> dict: - base = "http://192.168.0.110:9090" + # 2026-04-29 ogt + Claude Opus 4.7: 改用 settings 對齊單一事實源 + # 原本寫死 110:9090 雖巧合正確,但繞過 ConfigMap 注入機制 + base = settings.PROMETHEUS_URL try: health_r = await client.get(f"{base}/-/healthy", timeout=TIMEOUT) if health_r.status_code == 200: diff --git a/k8s/kured/kured.yaml b/k8s/kured/kured.yaml index 18033464..14cf3f78 100644 --- a/k8s/kured/kured.yaml +++ b/k8s/kured/kured.yaml @@ -129,7 +129,10 @@ spec: # PodDisruptionBudget 檢查 - --blocking-pod-selector=app.kubernetes.io/name=awoooi # Prometheus metrics - - --prometheus-url=http://192.168.0.188:9090 + # 2026-04-29 ogt + Claude Opus 4.7: drift fix — 188 是 Ollama Hub + # Prometheus 實際在 110。kured 連錯主機 = 跳過 alert 守門員直接 reboot + # 對齊 ConfigMap 04-configmap.yaml + config.py PROMETHEUS_URL + - --prometheus-url=http://192.168.0.110:9090 resources: limits: cpu: 100m