mirror of
https://github.com/HKUDS/nanobot.git
synced 2026-05-20 00:22:31 +00:00
fix(config): reduce max_tokens and context_window_tokens in schema
This commit is contained in:
parent
1c2ea1aad2
commit
858b6610c3
@ -93,8 +93,8 @@ class ModelPresetConfig(Base):
|
|||||||
|
|
||||||
model: str
|
model: str
|
||||||
provider: str = "auto"
|
provider: str = "auto"
|
||||||
max_tokens: int = 32_000
|
max_tokens: int = 8192
|
||||||
context_window_tokens: int = 262_144
|
context_window_tokens: int = 65_536
|
||||||
temperature: float = 0.1
|
temperature: float = 0.1
|
||||||
reasoning_effort: str | None = None
|
reasoning_effort: str | None = None
|
||||||
|
|
||||||
@ -116,8 +116,8 @@ class AgentDefaults(Base):
|
|||||||
provider: str = (
|
provider: str = (
|
||||||
"auto" # Provider name (e.g. "anthropic", "openrouter") or "auto" for auto-detection
|
"auto" # Provider name (e.g. "anthropic", "openrouter") or "auto" for auto-detection
|
||||||
)
|
)
|
||||||
max_tokens: int = 32_000
|
max_tokens: int = 8192
|
||||||
context_window_tokens: int = 262_144
|
context_window_tokens: int = 65_536
|
||||||
context_block_limit: int | None = None
|
context_block_limit: int | None = None
|
||||||
temperature: float = 0.1
|
temperature: float = 0.1
|
||||||
fallback_models: list[FallbackCandidate] = Field(default_factory=list)
|
fallback_models: list[FallbackCandidate] = Field(default_factory=list)
|
||||||
|
|||||||
@ -176,7 +176,7 @@ class TestRestartCommand:
|
|||||||
assert response is not None
|
assert response is not None
|
||||||
assert "Model: test-model" in response.content
|
assert "Model: test-model" in response.content
|
||||||
assert "Tokens: 0 in / 0 out" in response.content
|
assert "Tokens: 0 in / 0 out" in response.content
|
||||||
assert "Context: 20k/262k (7% of input budget)" in response.content
|
assert "Context: 20k/65k (31% of input budget)" in response.content
|
||||||
assert "Session: 3 messages" in response.content
|
assert "Session: 3 messages" in response.content
|
||||||
assert "Uptime: 2m 5s" in response.content
|
assert "Uptime: 2m 5s" in response.content
|
||||||
assert "Tasks: 0 active" in response.content
|
assert "Tasks: 0 active" in response.content
|
||||||
@ -240,7 +240,7 @@ class TestRestartCommand:
|
|||||||
|
|
||||||
assert response is not None
|
assert response is not None
|
||||||
assert "Tokens: 1200 in / 34 out" in response.content
|
assert "Tokens: 1200 in / 34 out" in response.content
|
||||||
assert "Context: 1k/262k (0% of input budget)" in response.content
|
assert "Context: 1k/65k (1% of input budget)" in response.content
|
||||||
assert "Tasks: 0 active" in response.content
|
assert "Tasks: 0 active" in response.content
|
||||||
|
|
||||||
@pytest.mark.asyncio
|
@pytest.mark.asyncio
|
||||||
|
|||||||
@ -34,7 +34,7 @@ def test_load_config_keeps_max_tokens_and_ignores_legacy_memory_window(tmp_path)
|
|||||||
config = load_config(config_path)
|
config = load_config(config_path)
|
||||||
|
|
||||||
assert config.agents.defaults.max_tokens == 1234
|
assert config.agents.defaults.max_tokens == 1234
|
||||||
assert config.agents.defaults.context_window_tokens == 262_144
|
assert config.agents.defaults.context_window_tokens == 65_536
|
||||||
assert not hasattr(config.agents.defaults, "memory_window")
|
assert not hasattr(config.agents.defaults, "memory_window")
|
||||||
|
|
||||||
|
|
||||||
@ -60,7 +60,7 @@ def test_save_config_writes_context_window_tokens_but_not_memory_window(tmp_path
|
|||||||
defaults = saved["agents"]["defaults"]
|
defaults = saved["agents"]["defaults"]
|
||||||
|
|
||||||
assert defaults["maxTokens"] == 2222
|
assert defaults["maxTokens"] == 2222
|
||||||
assert defaults["contextWindowTokens"] == 262_144
|
assert defaults["contextWindowTokens"] == 65_536
|
||||||
assert "memoryWindow" not in defaults
|
assert "memoryWindow" not in defaults
|
||||||
|
|
||||||
|
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user