diff --git a/.env.example b/.env.example index f8fe128..324a8f4 100644 --- a/.env.example +++ b/.env.example @@ -14,6 +14,10 @@ # Model requests allowed per minute per user. # MODEL_RATE_LIMIT=4 +# Max number of context tokens a user can request at once. +# Increase this if your proxy allows GPT 32k or 128k context. +# MAX_CONTEXT_TOKENS_OPENAI=16384 + # Max number of output tokens a user can request at once. # MAX_OUTPUT_TOKENS_OPENAI=400 # MAX_OUTPUT_TOKENS_ANTHROPIC=400