Mirror of https://github.com/TauricResearch/TradingAgents.git (synced 2026-05-01 14:33:10 +03:00)
feat: update Ollama and OpenRouter model options
- Ollama: Add Qwen3 (8B), GPT-OSS (20B), GLM-4.7-Flash (30B)
- OpenRouter: Add NVIDIA Nemotron 3 Nano, Z.AI GLM 4.5 Air
- Add explicit Ollama provider handling in the OpenAI client for consistency
cli/utils.py (25 changed lines)
@@ -152,14 +152,14 @@ def select_shallow_thinking_agent(provider) -> str:
             ("Grok 4 Fast (Reasoning) - High-performance", "grok-4-fast-reasoning"),
         ],
         "openrouter": [
-            ("Meta: Llama 4 Scout", "meta-llama/llama-4-scout:free"),
-            ("Meta: Llama 3.3 8B Instruct - A lightweight and ultra-fast variant of Llama 3.3 70B", "meta-llama/llama-3.3-8b-instruct:free"),
-            ("google/gemini-2.0-flash-exp:free - Gemini Flash 2.0 offers a significantly faster time to first token", "google/gemini-2.0-flash-exp:free"),
+            ("NVIDIA Nemotron 3 Nano 30B (free)", "nvidia/nemotron-3-nano-30b-a3b:free"),
+            ("Z.AI GLM 4.5 Air (free)", "z-ai/glm-4.5-air:free"),
         ],
         "ollama": [
-            ("llama3.1 local", "llama3.1"),
-            ("llama3.2 local", "llama3.2"),
-        ]
+            ("Qwen3:latest (8B, local)", "qwen3:latest"),
+            ("GPT-OSS:latest (20B, local)", "gpt-oss:latest"),
+            ("GLM-4.7-Flash:latest (30B, local)", "glm-4.7-flash:latest"),
+        ],
     }
 
     choice = questionary.select(
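The Ollama entries above are plain (label, value) pairs: the label is what the picker shows, the value is the local tag handed to Ollama, which must already be pulled. As a minimal sketch (not part of this commit), one way to check that the new tags exist locally, assuming the official openai package and a default Ollama install exposing the OpenAI-compatible /v1/models route:

# Sketch only: confirm the newly listed local tags are actually pulled.
# Assumes `pip install openai` and Ollama on its default port 11434.
from openai import OpenAI

# The key is a placeholder; Ollama ignores it, but the client requires one.
client = OpenAI(base_url="http://localhost:11434/v1", api_key="ollama")

wanted = {"qwen3:latest", "gpt-oss:latest", "glm-4.7-flash:latest"}
pulled = {m.id for m in client.models.list()}  # Ollama lists pulled tags here

for tag in sorted(wanted):
    print(tag, "ok" if tag in pulled else "missing (run `ollama pull`)")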
@@ -220,15 +220,16 @@ def select_deep_thinking_agent(provider) -> str:
             ("Grok 4 Fast (Non-Reasoning) - Speed optimized", "grok-4-fast-non-reasoning"),
         ],
         "openrouter": [
-            ("DeepSeek V3 - a 685B-parameter, mixture-of-experts model", "deepseek/deepseek-chat-v3-0324:free"),
-            ("Deepseek - latest iteration of the flagship chat model family from the DeepSeek team.", "deepseek/deepseek-chat-v3-0324:free"),
+            ("Z.AI GLM 4.5 Air (free)", "z-ai/glm-4.5-air:free"),
+            ("NVIDIA Nemotron 3 Nano 30B (free)", "nvidia/nemotron-3-nano-30b-a3b:free"),
         ],
         "ollama": [
-            ("llama3.1 local", "llama3.1"),
-            ("qwen3", "qwen3"),
-        ]
+            ("GLM-4.7-Flash:latest (30B, local)", "glm-4.7-flash:latest"),
+            ("GPT-OSS:latest (20B, local)", "gpt-oss:latest"),
+            ("Qwen3:latest (8B, local)", "qwen3:latest"),
+        ],
     }
 
     choice = questionary.select(
         "Select Your [Deep-Thinking LLM Engine]:",
         choices=[
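Both option tables feed the same questionary prompt: the first tuple element is the display label, the second is the model id the CLI hands to the rest of the pipeline. A minimal sketch of that pattern, assuming the questionary package (the OPTIONS name and wrapper function are illustrative, not the repo's exact code):

import questionary

# Illustrative subset of the table above; same (label, value) shape.
OPTIONS = {
    "ollama": [
        ("Qwen3:latest (8B, local)", "qwen3:latest"),
        ("GPT-OSS:latest (20B, local)", "gpt-oss:latest"),
        ("GLM-4.7-Flash:latest (30B, local)", "glm-4.7-flash:latest"),
    ],
}

def pick_model(provider: str) -> str:
    # Each tuple becomes a Choice: the label is shown, the value is
    # what .ask() returns.
    return questionary.select(
        "Select Your [Deep-Thinking LLM Engine]:",
        choices=[
            questionary.Choice(label, value=value)
            for label, value in OPTIONS[provider.lower()]
        ],
    ).ask()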
@@ -50,6 +50,13 @@ class OpenAIClient(BaseLLMClient):
             api_key = os.environ.get("XAI_API_KEY")
             if api_key:
                 llm_kwargs["api_key"] = api_key
+        elif self.provider == "openrouter":
+            llm_kwargs["base_url"] = "https://openrouter.ai/api/v1"
+            api_key = os.environ.get("OPENROUTER_API_KEY")
+            if api_key:
+                llm_kwargs["api_key"] = api_key
+        elif self.provider == "ollama":
+            llm_kwargs["base_url"] = "http://localhost:11434/v1"
         elif self.base_url:
             llm_kwargs["base_url"] = self.base_url
 
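The new branches only pin a base_url and read the provider's key from the environment; both OpenRouter and Ollama speak the OpenAI wire protocol, so nothing else in the client has to change. A minimal sketch of the same routing with the official openai package (the make_client helper is illustrative; Ollama ignores the API key, but the client constructor requires a non-empty one):

import os
from openai import OpenAI

def make_client(provider: str, base_url: str | None = None) -> OpenAI:
    # Sketch of the routing added above; not the repo's OpenAIClient.
    if provider == "openrouter":
        return OpenAI(
            base_url="https://openrouter.ai/api/v1",
            api_key=os.environ.get("OPENROUTER_API_KEY"),
        )
    if provider == "ollama":
        # Local endpoint; any placeholder key satisfies the constructor.
        return OpenAI(base_url="http://localhost:11434/v1", api_key="ollama")
    # Default: honor an explicit base_url; key comes from OPENAI_API_KEY.
    return OpenAI(base_url=base_url)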