From 4a21b7f53f7ee44425c50e70a97d9375cc813586 Mon Sep 17 00:00:00 2001 From: yangdx Date: Wed, 10 Sep 2025 16:23:10 +0800 Subject: [PATCH] Update OpenAI API config docs for max_tokens and max_completion_tokens MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit • Clarify max_tokens vs max_completion_tokens • Add Gemini exception note • Update parameter descriptions • Add new completion tokens option --- env.example | 7 +++++-- 1 file changed, 5 insertions(+), 2 deletions(-) diff --git a/env.example b/env.example index b322baa7..e18ee2fb 100644 --- a/env.example +++ b/env.example @@ -174,9 +174,12 @@ LLM_BINDING_API_KEY=your_api_key # LLM_BINDING_API_KEY=your_api_key # LLM_BINDING=openai -### OpenAI Specific Parameters -### Set the max_output_tokens to mitigate endless output of some LLM (less than LLM_TIMEOUT * llm_output_tokens/second, i.e. 9000 = 180s * 50 tokens/s) +### OpenAI Compatible API Specific Parameters +### Set the max_tokens to mitigate endless output of some LLMs (less than LLM_TIMEOUT * llm_output_tokens/second, i.e. 9000 = 180s * 50 tokens/s) +### Typically, max_tokens does not include prompt content, though some models, such as Gemini-2.5-Flash, are exceptions +### OpenAI's new API utilizes max_completion_tokens instead of max_tokens # OPENAI_LLM_MAX_TOKENS=9000 +# OPENAI_LLM_MAX_COMPLETION_TOKENS=9000 ### OpenRouter Specific Parameters # OPENAI_LLM_EXTRA_BODY='{"reasoning": {"enabled": false}}'