feat(hermes): 升級 Ollama 模型路由 — qwen3:8b 取代雙模型
Some checks are pending
CD Pipeline / build-and-deploy (push) Has started running

- qwen2.5-coder:7b + qwen2.5:7b-instruct → qwen3:8b (Hybrid Thinking)
- qwen3:8b 同時勝任程式碼與通用指令,單一模型涵蓋 10 個 agent
- deepseek-r1:14b 保留 debugger / vuln-verifier 推理任務
- gemma4 尚未在 Ollama registry 釋出,暫保留 gemma3:4b
- 已在 111 主機 pull qwen3:8b (4.9GB)

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>
This commit is contained in:
Your Name
2026-04-25 03:24:08 +08:00
parent 411a285735
commit 7b6df17dee

View File

@@ -54,21 +54,22 @@ _RATE_LIMIT_WINDOW_SEC = 60
# Ollama model routing (pick the best-suited model for each agent's specialty; host 111)
# ─────────────────────────────────────────────────────────────────────────────
_MODEL_BY_AGENT: dict[str, str] = {
# 推理型(找根因 / 安全分析)→ deepseek-r1:14b
# 推理型(找根因 / 安全分析)→ deepseek-r1:14bCoT 推理)
"debugger": "deepseek-r1:14b",
"vuln-verifier": "deepseek-r1:14b",
# 程式碼review / 實作 / 重構 / DB / 前端 / 工具)→ qwen2.5-coder:7b
"critic": "qwen2.5-coder:7b",
"db-expert": "qwen2.5-coder:7b",
"fullstack-engineer": "qwen2.5-coder:7b",
"refactor-specialist":"qwen2.5-coder:7b",
"migration-engineer": "qwen2.5-coder:7b",
"frontend-designer": "qwen2.5-coder:7b",
"tool-expert": "qwen2.5-coder:7b",
# 通用指令(規劃 / 導覽 / 文件)→ qwen2.5:7b-instruct
"planner": "qwen2.5:7b-instruct",
"onboarder": "qwen2.5:7b-instruct",
"web-researcher": "qwen2.5:7b-instruct",
# 程式碼 + 通review / 實作 / 重構 / DB / 前端 / 工具 / 規劃 / 文件)→ qwen3:8b
# 2026-04-25 ogt + Claude Sonnet 4.6: qwen2.5-coder:7b + qwen2.5:7b-instruct → qwen3:8b
# qwen3:8b Hybrid Thinking 同時勝任程式碼與指令gemma4 尚未在 Ollama 釋出
"critic": "qwen3:8b",
"db-expert": "qwen3:8b",
"fullstack-engineer": "qwen3:8b",
"refactor-specialist":"qwen3:8b",
"migration-engineer": "qwen3:8b",
"frontend-designer": "qwen3:8b",
"tool-expert": "qwen3:8b",
"planner": "qwen3:8b",
"onboarder": "qwen3:8b",
"web-researcher": "qwen3:8b",
}
# Default model tag; presumably the fallback for agents that are not listed in
# _MODEL_BY_AGENT — TODO confirm at the lookup site.
_DEFAULT_MODEL = "deepseek-r1:14b"
_OLLAMA_TIMEOUT = 90.0 # deepseek-r1:14b reasoning is slow, so allow 90s