Vision support via images / pdfs etc that can be passed on to other models as part of analysis, additional context etc.

Image processing pipeline added OpenAI GPT-4.1 support Chat tool prompt enhancement Lint and code quality improvements
2025-06-16 13:14:53 +04:00
parent d498e9854b
commit 97fa6781cf
26 changed files with 1328 additions and 52 deletions
--- a/tools/chat.py
+++ b/tools/chat.py
@@ -20,12 +20,25 @@ class ChatRequest(ToolRequest):

    prompt: str = Field(
        ...,
-        description="Your question, topic, or current thinking to discuss",
+        description=(
+            "Your thorough, expressive question with as much context as possible. Remember: you're talking to "
+            "another Claude assistant who has deep expertise and can provide nuanced insights. Include your "
+            "current thinking, specific challenges, background context, what you've already tried, and what "
+            "kind of response would be most helpful. The more context and detail you provide, the more "
+            "valuable and targeted the response will be."
+        ),
    )
    files: Optional[list[str]] = Field(
        default_factory=list,
        description="Optional files for context (must be absolute paths)",
    )
+    images: Optional[list[str]] = Field(
+        default_factory=list,
+        description=(
+            "Optional images for visual context. Useful for UI discussions, diagrams, visual problems, "
+            "error screens, or architectural mockups."
+        ),
+    )


 class ChatTool(BaseTool):
@@ -42,7 +55,8 @@ class ChatTool(BaseTool):
            "Also great for: explanations, comparisons, general development questions. "
            "Use this when you want to ask questions, brainstorm ideas, get opinions, discuss topics, "
            "share your thinking, or need explanations about concepts and approaches. "
-            "Note: If you're not currently using a top-tier model such as Opus 4 or above, these tools can provide enhanced capabilities."
+            "Note: If you're not currently using a top-tier model such as Opus 4 or above, these tools can "
+            "provide enhanced capabilities."
        )

    def get_input_schema(self) -> dict[str, Any]:
@@ -51,13 +65,27 @@ class ChatTool(BaseTool):
            "properties": {
                "prompt": {
                    "type": "string",
-                    "description": "Your question, topic, or current thinking to discuss",
+                    "description": (
+                        "Your thorough, expressive question with as much context as possible. Remember: you're "
+                        "talking to another Claude assistant who has deep expertise and can provide nuanced "
+                        "insights. Include your current thinking, specific challenges, background context, what "
+                        "you've already tried, and what kind of response would be most helpful. The more context "
+                        "and detail you provide, the more valuable and targeted the response will be."
+                    ),
                },
                "files": {
                    "type": "array",
                    "items": {"type": "string"},
                    "description": "Optional files for context (must be absolute paths)",
                },
+                "images": {
+                    "type": "array",
+                    "items": {"type": "string"},
+                    "description": (
+                        "Optional images for visual context. Useful for UI discussions, diagrams, visual "
+                        "problems, error screens, or architectural mockups."
+                    ),
+                },
                "model": self.get_model_field_schema(),
                "temperature": {
                    "type": "number",
@@ -68,16 +96,29 @@ class ChatTool(BaseTool):
                "thinking_mode": {
                    "type": "string",
                    "enum": ["minimal", "low", "medium", "high", "max"],
-                    "description": "Thinking depth: minimal (0.5% of model max), low (8%), medium (33%), high (67%), max (100% of model max)",
+                    "description": (
+                        "Thinking depth: minimal (0.5% of model max), low (8%), medium (33%), high (67%), "
+                        "max (100% of model max)"
+                    ),
                },
                "use_websearch": {
                    "type": "boolean",
-                    "description": "Enable web search for documentation, best practices, and current information. Particularly useful for: brainstorming sessions, architectural design discussions, exploring industry best practices, working with specific frameworks/technologies, researching solutions to complex problems, or when current documentation and community insights would enhance the analysis.",
+                    "description": (
+                        "Enable web search for documentation, best practices, and current information. "
+                        "Particularly useful for: brainstorming sessions, architectural design discussions, "
+                        "exploring industry best practices, working with specific frameworks/technologies, "
+                        "researching solutions to complex problems, or when current documentation and "
+                        "community insights would enhance the analysis."
+                    ),
                    "default": True,
                },
                "continuation_id": {
                    "type": "string",
-                    "description": "Thread continuation ID for multi-turn conversations. Can be used to continue conversations across different tools. Only provide this if continuing a previous conversation thread.",
+                    "description": (
+                        "Thread continuation ID for multi-turn conversations. Can be used to continue "
+                        "conversations across different tools. Only provide this if continuing a previous "
+                        "conversation thread."
+                    ),
                },
            },
            "required": ["prompt"] + (["model"] if self.is_effective_auto_mode() else []),
@@ -157,4 +198,7 @@ Please provide a thoughtful, comprehensive response:"""

    def format_response(self, response: str, request: ChatRequest, model_info: Optional[dict] = None) -> str:
        """Format the chat response"""
-        return f"{response}\n\n---\n\n**Claude's Turn:** Evaluate this perspective alongside your analysis to form a comprehensive solution and continue with the user's request and task at hand."
+        return (
+            f"{response}\n\n---\n\n**Claude's Turn:** Evaluate this perspective alongside your analysis to "
+            "form a comprehensive solution and continue with the user's request and task at hand."
+        )