diff --git a/README.md b/README.md index 8c59fbf83..26ee0f1e9 100644 --- a/README.md +++ b/README.md @@ -226,7 +226,7 @@ from tradingagents.default_config import DEFAULT_CONFIG config = DEFAULT_CONFIG.copy() config["llm_provider"] = "openai" # openai, google, anthropic, xai, deepseek, qwen, qwen-cn, glm, glm-cn, minimax, minimax-cn, openrouter, ollama, azure -config["deep_think_llm"] = "gpt-5.4" # Model for complex reasoning +config["deep_think_llm"] = "gpt-5.5" # Model for complex reasoning config["quick_think_llm"] = "gpt-5.4-mini" # Model for quick tasks config["max_debate_rounds"] = 2 diff --git a/tests/test_env_overrides.py b/tests/test_env_overrides.py index c12ce5f18..f02661ebd 100644 --- a/tests/test_env_overrides.py +++ b/tests/test_env_overrides.py @@ -21,7 +21,7 @@ def _reload_with_env(monkeypatch, **overrides): def test_no_env_uses_built_in_defaults(monkeypatch): dc = _reload_with_env(monkeypatch) assert dc.DEFAULT_CONFIG["llm_provider"] == "openai" - assert dc.DEFAULT_CONFIG["deep_think_llm"] == "gpt-5.4" + assert dc.DEFAULT_CONFIG["deep_think_llm"] == "gpt-5.5" assert dc.DEFAULT_CONFIG["quick_think_llm"] == "gpt-5.4-mini" assert dc.DEFAULT_CONFIG["backend_url"] is None assert dc.DEFAULT_CONFIG["max_debate_rounds"] == 1 diff --git a/tradingagents/default_config.py b/tradingagents/default_config.py index 9162e2ea7..d9fd83f65 100644 --- a/tradingagents/default_config.py +++ b/tradingagents/default_config.py @@ -53,7 +53,7 @@ DEFAULT_CONFIG = _apply_env_overrides({ "memory_log_max_entries": None, # LLM settings "llm_provider": "openai", - "deep_think_llm": "gpt-5.4", + "deep_think_llm": "gpt-5.5", "quick_think_llm": "gpt-5.4-mini", # When None, each provider's client falls back to its own default endpoint # (api.openai.com for OpenAI, generativelanguage.googleapis.com for Gemini, ...). diff --git a/tradingagents/llm_clients/model_catalog.py b/tradingagents/llm_clients/model_catalog.py index d88c0f137..00f2df96e 100644 --- a/tradingagents/llm_clients/model_catalog.py +++ b/tradingagents/llm_clients/model_catalog.py @@ -44,9 +44,9 @@ _QWEN_MODELS: Dict[str, List[ModelOption]] = { ("Custom model ID", "custom"), ], "deep": [ - ("Qwen 3.6 Plus - Flagship vision-language, agentic coding SOTA", "qwen3.6-plus"), + ("Qwen 3.7 Max - Latest flagship reasoning agent, 1M ctx", "qwen3.7-max"), + ("Qwen 3.6 Plus - Vision-language, agentic coding", "qwen3.6-plus"), ("Qwen 3.5 Plus - Previous-gen flagship", "qwen3.5-plus"), - ("Qwen 3 Max - Specialized for agent programming + tool use", "qwen3-max"), ("Custom model ID", "custom"), ], } @@ -95,37 +95,37 @@ MODEL_OPTIONS: ProviderModeOptions = { ("Claude Sonnet 4.5 - High-performance for agents and coding", "claude-sonnet-4-5"), ], "deep": [ - ("Claude Opus 4.7 - Latest frontier, long-running agents and coding", "claude-opus-4-7"), + ("Claude Opus 4.8 - Latest frontier, agentic coding and reasoning", "claude-opus-4-8"), + ("Claude Opus 4.7 - Previous frontier, long-running agents", "claude-opus-4-7"), ("Claude Opus 4.6 - Frontier intelligence, agents and coding", "claude-opus-4-6"), - ("Claude Opus 4.5 - Premium, max intelligence", "claude-opus-4-5"), ("Claude Sonnet 4.6 - Best speed and intelligence balance", "claude-sonnet-4-6"), ], }, "google": { "quick": [ - ("Gemini 3 Flash - Next-gen fast (preview)", "gemini-3-flash-preview"), - ("Gemini 2.5 Flash - Balanced, stable", "gemini-2.5-flash"), + ("Gemini 3.5 Flash - Latest, frontier agentic + coding (GA)", "gemini-3.5-flash"), ("Gemini 3.1 Flash Lite - Most cost-efficient (GA)", "gemini-3.1-flash-lite"), + ("Gemini 2.5 Flash - Balanced, stable", "gemini-2.5-flash"), ("Gemini 2.5 Flash Lite - Fast, low-cost", "gemini-2.5-flash-lite"), ], "deep": [ ("Gemini 3.1 Pro - Reasoning-first, complex workflows (preview)", "gemini-3.1-pro-preview"), - ("Gemini 3 Flash - Next-gen fast (preview)", "gemini-3-flash-preview"), + ("Gemini 3.5 Flash - Latest GA, strong agentic + coding", "gemini-3.5-flash"), ("Gemini 2.5 Pro - Stable pro model", "gemini-2.5-pro"), ("Gemini 2.5 Flash - Balanced, stable", "gemini-2.5-flash"), ], }, "xai": { "quick": [ - ("Grok 4.20 (Non-Reasoning) - Latest, speed-optimized", "grok-4.20-non-reasoning"), + ("Grok 4.3 - Latest flagship, fast with built-in reasoning", "grok-4.3"), + ("Grok Build 0.1 - Coding-specialized, 256K ctx", "grok-build-0.1"), ("Grok 4 Fast (Non-Reasoning) - Speed optimized", "grok-4-fast-non-reasoning"), - ("Grok 4 Fast (Reasoning) - High-performance", "grok-4-fast-reasoning"), ], "deep": [ - ("Grok 4.20 (Reasoning) - Latest frontier reasoning model", "grok-4.20-reasoning"), - ("Grok 4 - Flagship (dated build)", "grok-4-0709"), + ("Grok 4.3 - Latest flagship, built-in reasoning, 1M ctx", "grok-4.3"), + ("Grok 4.20 (Reasoning) - Previous-gen reasoning", "grok-4.20-0309-reasoning"), ("Grok 4 Fast (Reasoning) - High-performance", "grok-4-fast-reasoning"), - ("Grok 4.20 - Auto-select reasoning behavior", "grok-4.20"), + ("Grok 4 - Flagship (dated build)", "grok-4-0709"), ], }, "deepseek": {