Categorize tools into 'model capability categories' to help determine which type of model to pick in auto mode (see the sketch below)

Encourage Claude to pick the best model for the job automatically in auto mode
Add new tests to ensure automatic model picking works reliably, whether driven by user preference or when a matching model is missing or ambiguous
Improve error reporting when a requested model is not configured or available
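
For reference, a minimal sketch of what such a category enum might look like. Only FAST_RESPONSE is confirmed by the chat.py diff below; the other members and their string values are assumptions:

# Sketch only: FAST_RESPONSE appears in the chat.py diff below; the other members
# and the string values are assumptions.
from enum import Enum

class ToolModelCategory(Enum):
    FAST_RESPONSE = "fast_response"            # latency/cost-sensitive tools such as chat
    BALANCED = "balanced"                      # general-purpose tools
    EXTENDED_REASONING = "extended_reasoning"  # tools that benefit from a stronger reasoning model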
Fahad
2025-06-14 02:17:06 +04:00
parent 7fc1186a7c
commit eb388ab2f2
13 changed files with 838 additions and 68 deletions


@@ -2,11 +2,14 @@
 Chat tool - General development chat and collaborative thinking
 """
 
-from typing import Any, Optional
+from typing import TYPE_CHECKING, Any, Optional
 
 from mcp.types import TextContent
 from pydantic import Field
 
+if TYPE_CHECKING:
+    from tools.models import ToolModelCategory
+
 from config import TEMPERATURE_BALANCED
 from prompts import CHAT_PROMPT
@@ -44,8 +47,6 @@ class ChatTool(BaseTool):
         )
 
     def get_input_schema(self) -> dict[str, Any]:
-        from config import IS_AUTO_MODE
-
         schema = {
             "type": "object",
             "properties": {
@@ -80,7 +81,7 @@ class ChatTool(BaseTool):
"description": "Thread continuation ID for multi-turn conversations. Can be used to continue conversations across different tools. Only provide this if continuing a previous conversation thread.",
},
},
"required": ["prompt"] + (["model"] if IS_AUTO_MODE else []),
"required": ["prompt"] + (["model"] if self.is_effective_auto_mode() else []),
}
return schema
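
The required-field change above keys off is_effective_auto_mode() instead of the module-level IS_AUTO_MODE flag. The helper's body is not shown in this diff; a plausible sketch, assuming it also treats a missing default model as auto mode:

# Assumed sketch of the BaseTool helper referenced above; the real body may differ.
# DEFAULT_MODEL is an assumption about config.py; IS_AUTO_MODE is shown in this diff.
def is_effective_auto_mode(self) -> bool:
    from config import DEFAULT_MODEL, IS_AUTO_MODE
    # Treat an unset/placeholder default model the same as explicit auto mode.
    return IS_AUTO_MODE or not DEFAULT_MODEL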
@@ -91,6 +92,12 @@ class ChatTool(BaseTool):
     def get_default_temperature(self) -> float:
         return TEMPERATURE_BALANCED
 
+    def get_model_category(self) -> "ToolModelCategory":
+        """Chat prioritizes fast responses and cost efficiency"""
+        from tools.models import ToolModelCategory
+
+        return ToolModelCategory.FAST_RESPONSE
+
     def get_request_model(self):
         return ChatRequest
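
To tie the pieces together, a hedged sketch of how auto mode could resolve a model from a tool's category. The mapping, helper name, and model names below are illustrative assumptions, not the repository's actual API:

# Illustrative sketch only: the mapping, helper name, and model names are assumptions,
# not the repository's actual auto-mode implementation.
from typing import Optional

CATEGORY_PREFERENCES = {
    "fast_response": ["gemini-2.0-flash", "o4-mini"],
    "extended_reasoning": ["gemini-2.5-pro", "o3"],
}

def resolve_model(requested: Optional[str], category: str, available: set[str]) -> str:
    """Honour an explicit model request; otherwise fall back by tool category."""
    if not available:
        raise ValueError("No models are configured")
    if requested:
        if requested in available:
            return requested
        # Clearer error when a requested model is not configured or available.
        raise ValueError(
            f"Model '{requested}' is not configured or available. "
            f"Available models: {', '.join(sorted(available))}"
        )
    for candidate in CATEGORY_PREFERENCES.get(category, []):
        if candidate in available:
            return candidate
    # No preferred model matched (or the category is unknown): fall back to any configured model.
    return sorted(available)[0]

For instance, resolve_model(None, "fast_response", {"o4-mini"}) returns "o4-mini", while requesting a model that is not in the configured set raises the descriptive error mentioned in the commit message.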