feat: loosen the max_tokens limit for the vision fallback, as some models spend output tokens on internal thinking

This commit is contained in:
Richard Tang
2026-04-30 13:24:49 -07:00
parent 73511a3c59
commit 76a7dd4bd5
@@ -210,7 +210,7 @@ async def caption_tool_image(
kwargs: dict[str, Any] = {
"model": rewritten_model,
"messages": messages,
"max_tokens": 1024,
"max_tokens": 8192,
"timeout": timeout_s,
}
# Pass api_key directly only when there are no proxy-rewritten