perf(nvidia): bump max_tokens to 2048 for full RCA responses
All checks were successful
E2E Health Check / e2e-health (push) Successful in 16s

This commit is contained in:
OG T
2026-03-31 15:07:51 +08:00
parent 3562a67a58
commit dffb535220

View File

@@ -659,7 +659,7 @@ class NvidiaProvider:
prompt: str,
model: str | None = None,
temperature: float = 0.1,
- max_tokens: int = 1024,
+ max_tokens: int = 2048,
) -> tuple[str, bool, int, float]:
"""
一般對話 (非 Tool Calling) - 用於 RCA 分析