fix(providers): make max_tokens and max_completion_tokens mutually exclusive (#2491)

* fix(providers): make max_tokens and max_completion_tokens mutually exclusive * docs: document supports_max_completion_tokens ProviderSpec option
2026-05-01 23:35:52 +00:00 · 2026-03-27 13:10:04 +03:00 · 2026-03-27 13:10:04 +03:00 · d96b0b7833
commit d96b0b7833
parent 9aa2116e24
3 changed files with 9 additions and 2 deletions
--- a/README.md
+++ b/README.md
@ -110,6 +110,8 @@
 - [🌐 Agent Social Network](#-agent-social-network)
 - [⚙️ Configuration](#️-configuration)
  - [Providers](#providers)
  - [Channel Settings](#channel-settings)
    - [Retry Behavior](#retry-behavior)
  - [Web Search](#web-search)
  - [MCP (Model Context Protocol)](#mcp-model-context-protocol)
  - [Security](#security)
@ -1248,6 +1250,7 @@ That's it! Environment variables, model routing, config matching, and `nanobot s
 | `detect_by_key_prefix` | Detect gateway by API key prefix | `"sk-or-"` |
 | `detect_by_base_keyword` | Detect gateway by API base URL | `"openrouter"` |
 | `strip_model_prefix` | Strip provider prefix before sending to gateway | `True` (for AiHubMix) |
 | `supports_max_completion_tokens` | Use `max_completion_tokens` instead of `max_tokens`; required for providers that reject both being set simultaneously (e.g. VolcEngine) | `True` |
 </details>
--- a/nanobot/providers/openai_compat_provider.py
+++ b/nanobot/providers/openai_compat_provider.py
@ -229,11 +229,14 @@ class OpenAICompatProvider(LLMProvider):
        kwargs: dict[str, Any] = {
            "model": model_name,
            "messages": self._sanitize_messages(self._sanitize_empty_content(messages)),
            "max_tokens": max(1, max_tokens),
            "max_completion_tokens": max(1, max_tokens),
            "temperature": temperature,
        }
        if spec and getattr(spec, "supports_max_completion_tokens", False):
            kwargs["max_completion_tokens"] = max(1, max_tokens)
        else:
            kwargs["max_tokens"] = max(1, max_tokens)
        if spec:
            model_lower = model_name.lower()
            for pattern, overrides in spec.model_overrides:
--- a/nanobot/providers/registry.py
+++ b/nanobot/providers/registry.py
@ -49,6 +49,7 @@ class ProviderSpec:
    # gateway behavior
    strip_model_prefix: bool = False  # strip "provider/" before sending to gateway
    supports_max_completion_tokens: bool = False
    # per-model param overrides, e.g. (("kimi-k2.5", {"temperature": 1.0}),)
    model_overrides: tuple[tuple[str, dict[str, Any]], ...] = ()