chore(llm): add latest models and default to GPT-5.5

Add Claude Opus 4.8, Gemini 3.5 Flash, Grok 4.3, and Qwen 3.7 Max to the model
options; the default deep-think model is now GPT-5.5 (previously GPT-5.4).
This commit is contained in:
Yijia-Xiao
2026-05-31 08:01:03 +00:00
parent c93b92c7a4
commit 2f85be624e
4 changed files with 15 additions and 15 deletions

View File

@@ -226,7 +226,7 @@ from tradingagents.default_config import DEFAULT_CONFIG
config = DEFAULT_CONFIG.copy()
config["llm_provider"] = "openai" # openai, google, anthropic, xai, deepseek, qwen, qwen-cn, glm, glm-cn, minimax, minimax-cn, openrouter, ollama, azure
config["deep_think_llm"] = "gpt-5.4" # Model for complex reasoning
config["deep_think_llm"] = "gpt-5.5" # Model for complex reasoning
config["quick_think_llm"] = "gpt-5.4-mini" # Model for quick tasks
config["max_debate_rounds"] = 2

View File

@@ -21,7 +21,7 @@ def _reload_with_env(monkeypatch, **overrides):
def test_no_env_uses_built_in_defaults(monkeypatch):
dc = _reload_with_env(monkeypatch)
assert dc.DEFAULT_CONFIG["llm_provider"] == "openai"
assert dc.DEFAULT_CONFIG["deep_think_llm"] == "gpt-5.4"
assert dc.DEFAULT_CONFIG["deep_think_llm"] == "gpt-5.5"
assert dc.DEFAULT_CONFIG["quick_think_llm"] == "gpt-5.4-mini"
assert dc.DEFAULT_CONFIG["backend_url"] is None
assert dc.DEFAULT_CONFIG["max_debate_rounds"] == 1

View File

@@ -53,7 +53,7 @@ DEFAULT_CONFIG = _apply_env_overrides({
"memory_log_max_entries": None,
# LLM settings
"llm_provider": "openai",
"deep_think_llm": "gpt-5.4",
"deep_think_llm": "gpt-5.5",
"quick_think_llm": "gpt-5.4-mini",
# When None, each provider's client falls back to its own default endpoint
# (api.openai.com for OpenAI, generativelanguage.googleapis.com for Gemini, ...).

View File

@@ -44,9 +44,9 @@ _QWEN_MODELS: Dict[str, List[ModelOption]] = {
("Custom model ID", "custom"),
],
"deep": [
("Qwen 3.6 Plus - Flagship vision-language, agentic coding SOTA", "qwen3.6-plus"),
("Qwen 3.7 Max - Latest flagship reasoning agent, 1M ctx", "qwen3.7-max"),
("Qwen 3.6 Plus - Vision-language, agentic coding", "qwen3.6-plus"),
("Qwen 3.5 Plus - Previous-gen flagship", "qwen3.5-plus"),
("Qwen 3 Max - Specialized for agent programming + tool use", "qwen3-max"),
("Custom model ID", "custom"),
],
}
@@ -95,37 +95,37 @@ MODEL_OPTIONS: ProviderModeOptions = {
("Claude Sonnet 4.5 - High-performance for agents and coding", "claude-sonnet-4-5"),
],
"deep": [
("Claude Opus 4.7 - Latest frontier, long-running agents and coding", "claude-opus-4-7"),
("Claude Opus 4.8 - Latest frontier, agentic coding and reasoning", "claude-opus-4-8"),
("Claude Opus 4.7 - Previous frontier, long-running agents", "claude-opus-4-7"),
("Claude Opus 4.6 - Frontier intelligence, agents and coding", "claude-opus-4-6"),
("Claude Opus 4.5 - Premium, max intelligence", "claude-opus-4-5"),
("Claude Sonnet 4.6 - Best speed and intelligence balance", "claude-sonnet-4-6"),
],
},
"google": {
"quick": [
("Gemini 3 Flash - Next-gen fast (preview)", "gemini-3-flash-preview"),
("Gemini 2.5 Flash - Balanced, stable", "gemini-2.5-flash"),
("Gemini 3.5 Flash - Latest, frontier agentic + coding (GA)", "gemini-3.5-flash"),
("Gemini 3.1 Flash Lite - Most cost-efficient (GA)", "gemini-3.1-flash-lite"),
("Gemini 2.5 Flash - Balanced, stable", "gemini-2.5-flash"),
("Gemini 2.5 Flash Lite - Fast, low-cost", "gemini-2.5-flash-lite"),
],
"deep": [
("Gemini 3.1 Pro - Reasoning-first, complex workflows (preview)", "gemini-3.1-pro-preview"),
("Gemini 3 Flash - Next-gen fast (preview)", "gemini-3-flash-preview"),
("Gemini 3.5 Flash - Latest GA, strong agentic + coding", "gemini-3.5-flash"),
("Gemini 2.5 Pro - Stable pro model", "gemini-2.5-pro"),
("Gemini 2.5 Flash - Balanced, stable", "gemini-2.5-flash"),
],
},
"xai": {
"quick": [
("Grok 4.20 (Non-Reasoning) - Latest, speed-optimized", "grok-4.20-non-reasoning"),
("Grok 4.3 - Latest flagship, fast with built-in reasoning", "grok-4.3"),
("Grok Build 0.1 - Coding-specialized, 256K ctx", "grok-build-0.1"),
("Grok 4 Fast (Non-Reasoning) - Speed optimized", "grok-4-fast-non-reasoning"),
("Grok 4 Fast (Reasoning) - High-performance", "grok-4-fast-reasoning"),
],
"deep": [
("Grok 4.20 (Reasoning) - Latest frontier reasoning model", "grok-4.20-reasoning"),
("Grok 4 - Flagship (dated build)", "grok-4-0709"),
("Grok 4.3 - Latest flagship, built-in reasoning, 1M ctx", "grok-4.3"),
("Grok 4.20 (Reasoning) - Previous-gen reasoning", "grok-4.20-0309-reasoning"),
("Grok 4 Fast (Reasoning) - High-performance", "grok-4-fast-reasoning"),
("Grok 4.20 - Auto-select reasoning behavior", "grok-4.20"),
("Grok 4 - Flagship (dated build)", "grok-4-0709"),
],
},
"deepseek": {