From 974f84511ba3390cf345915ff05b4e398b43b72c Mon Sep 17 00:00:00 2001 From: OG T Date: Fri, 10 Apr 2026 10:14:33 +0800 Subject: [PATCH] =?UTF-8?q?fix(rag):=20embed=20=E6=94=B9=E7=94=A8=20settin?= =?UTF-8?q?gs.OLLAMA=5FURL=20=E2=80=94=20K3s=20NetworkPolicy=20=E6=93=8B?= =?UTF-8?q?=E4=BD=8F=E7=9B=B4=E9=80=A3=20188:11434?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit nomic-embed-text 在 111 也有,改走 OLLAMA_URL (111) 避開 NetworkPolicy Co-Authored-By: Claude Sonnet 4.6 --- apps/api/src/services/knowledge_rag_service.py | 9 +++++---- 1 file changed, 5 insertions(+), 4 deletions(-) diff --git a/apps/api/src/services/knowledge_rag_service.py b/apps/api/src/services/knowledge_rag_service.py index ecc0dc5b..ddda5380 100644 --- a/apps/api/src/services/knowledge_rag_service.py +++ b/apps/api/src/services/knowledge_rag_service.py @@ -29,11 +29,12 @@ from src.core.config import get_settings logger = structlog.get_logger(__name__) settings = get_settings() -# nomic-embed-text 在 188 (記憶體充足) -_EMBED_URL = "http://192.168.0.188:11434" +# nomic-embed-text — 使用 settings.OLLAMA_URL (111, K3s NetworkPolicy 可達) +# 188 雖然記憶體更多但 K3s NetworkPolicy 擋住 11434,改用 111 +# 2026-04-10 Claude Sonnet 4.6 _EMBED_MODEL = "nomic-embed-text" -# 生成回答用 111 (快) +# 生成回答用同一個 OLLAMA_URL (111) _GEN_MODEL = "qwen2.5:7b-instruct" _TOP_K = 5 # 取最相似 5 筆 @@ -105,7 +106,7 @@ class KnowledgeRAGService: try: http = await self._get_http() resp = await http.post( - f"{_EMBED_URL}/api/embeddings", + f"{settings.OLLAMA_URL}/api/embeddings", json={"model": _EMBED_MODEL, "prompt": text}, ) if resp.status_code == 200: