fix(nvidia): lower default max_tokens to 1024 to fit nemotron-mini 4096 context length
All checks were successful
E2E Health Check / e2e-health (push) Successful in 16s

This commit is contained in:
OG T
2026-03-31 13:44:17 +08:00
parent f458d078df
commit 11627f25f0

View File

@@ -655,7 +655,7 @@ class NvidiaProvider:
prompt: str,
model: str | None = None,
temperature: float = 0.1,
-max_tokens: int = 2048,
+max_tokens: int = 1024,
) -> tuple[str, bool, int, float]:
"""
一般對話 (非 Tool Calling) - 用於 RCA 分析