From dffb5352200a2bc2cf4ccedfe829f7db7e7dba41 Mon Sep 17 00:00:00 2001
From: OG T
Date: Tue, 31 Mar 2026 15:07:51 +0800
Subject: [PATCH] perf(nvidia): bump max_tokens to 2048 for full RCA responses

---
 apps/api/src/services/nvidia_provider.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/apps/api/src/services/nvidia_provider.py b/apps/api/src/services/nvidia_provider.py
index 014395dc..b6d1e20c 100644
--- a/apps/api/src/services/nvidia_provider.py
+++ b/apps/api/src/services/nvidia_provider.py
@@ -659,7 +659,7 @@ class NvidiaProvider:
         prompt: str,
         model: str | None = None,
         temperature: float = 0.1,
-        max_tokens: int = 1024,
+        max_tokens: int = 2048,
     ) -> tuple[str, bool, int, float]:
         """
         一般對話 (非 Tool Calling) - 用於 RCA 分析