From 7b6df17deec77fc1579f67c92981ccaa309e1bbb Mon Sep 17 00:00:00 2001 From: Your Name Date: Sat, 25 Apr 2026 03:24:08 +0800 Subject: [PATCH] =?UTF-8?q?feat(hermes):=20=E5=8D=87=E7=B4=9A=20Ollama=20?= =?UTF-8?q?=E6=A8=A1=E5=9E=8B=E8=B7=AF=E7=94=B1=20=E2=80=94=20qwen3:8b=20?= =?UTF-8?q?=E5=8F=96=E4=BB=A3=E9=9B=99=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit - qwen2.5-coder:7b + qwen2.5:7b-instruct → qwen3:8b (Hybrid Thinking) - qwen3:8b 同時勝任程式碼與通用指令,單一模型涵蓋 10 個 agent - deepseek-r1:14b 保留 debugger / vuln-verifier 推理任務 - gemma4 尚未在 Ollama registry 釋出,暫保留 gemma3:4b - 已在 111 主機 pull qwen3:8b (4.9GB) Co-Authored-By: Claude Sonnet 4.6 --- apps/api/src/hermes/nl_gateway.py | 27 ++++++++++++++------------- 1 file changed, 14 insertions(+), 13 deletions(-) diff --git a/apps/api/src/hermes/nl_gateway.py b/apps/api/src/hermes/nl_gateway.py index e68d9b53..b665a75a 100644 --- a/apps/api/src/hermes/nl_gateway.py +++ b/apps/api/src/hermes/nl_gateway.py @@ -54,21 +54,22 @@ _RATE_LIMIT_WINDOW_SEC = 60 # Ollama 模型路由(按 agent 專業選最適模型,111 主機) # ───────────────────────────────────────────────────────────────────────────── _MODEL_BY_AGENT: dict[str, str] = { - # 推理型(找根因 / 安全分析)→ deepseek-r1:14b + # 推理型(找根因 / 安全分析)→ deepseek-r1:14b(CoT 推理) "debugger": "deepseek-r1:14b", "vuln-verifier": "deepseek-r1:14b", - # 程式碼專用(review / 實作 / 重構 / DB / 前端 / 工具)→ qwen2.5-coder:7b - "critic": "qwen2.5-coder:7b", - "db-expert": "qwen2.5-coder:7b", - "fullstack-engineer": "qwen2.5-coder:7b", - "refactor-specialist":"qwen2.5-coder:7b", - "migration-engineer": "qwen2.5-coder:7b", - "frontend-designer": "qwen2.5-coder:7b", - "tool-expert": "qwen2.5-coder:7b", - # 通用指令(規劃 / 導覽 / 文件)→ qwen2.5:7b-instruct - "planner": "qwen2.5:7b-instruct", - "onboarder": "qwen2.5:7b-instruct", - "web-researcher": "qwen2.5:7b-instruct", + # 程式碼 + 通用(review / 實作 / 重構 / DB / 前端 / 工具 / 規劃 / 文件)→ qwen3:8b + # 2026-04-25 ogt + Claude Sonnet 4.6: qwen2.5-coder:7b + 
qwen2.5:7b-instruct → qwen3:8b + # qwen3:8b Hybrid Thinking 同時勝任程式碼與指令;gemma4 尚未在 Ollama 釋出 + "critic": "qwen3:8b", + "db-expert": "qwen3:8b", + "fullstack-engineer": "qwen3:8b", + "refactor-specialist":"qwen3:8b", + "migration-engineer": "qwen3:8b", + "frontend-designer": "qwen3:8b", + "tool-expert": "qwen3:8b", + "planner": "qwen3:8b", + "onboarder": "qwen3:8b", + "web-researcher": "qwen3:8b", } _DEFAULT_MODEL = "deepseek-r1:14b" _OLLAMA_TIMEOUT = 90.0 # deepseek-r1:14b 推理較慢,給 90s