Perform prompt size checks only at the MCP boundary

New test to confirm that history build-up and the system prompt do not affect prompt size checks. Also check for large prompts in focus_on. Fixed .env.example, which incorrectly did not comment out CUSTOM_API, causing the run-server script to think at least one key exists.
2025-06-15 10:37:08 +04:00
parent 3b03783ea7
commit 4becd70a82
14 changed files with 404 additions and 198 deletions
--- a/tools/testgen.py
+++ b/tools/testgen.py
@@ -17,7 +17,6 @@ import logging
 import os
 from typing import Any, Optional

-from mcp.types import TextContent
 from pydantic import Field

 from config import TEMPERATURE_ANALYTICAL
@@ -25,7 +24,6 @@ from systemprompts import TESTGEN_PROMPT
 from utils.file_utils import translate_file_paths

 from .base import BaseTool, ToolRequest
-from .models import ToolOutput

 logger = logging.getLogger(__name__)

@@ -145,21 +143,6 @@ class TestGenTool(BaseTool):
    def get_request_model(self):
        return TestGenRequest

-    async def execute(self, arguments: dict[str, Any]) -> list[TextContent]:
-        """Override execute to check prompt size before processing"""
-        # First validate request
-        request_model = self.get_request_model()
-        request = request_model(**arguments)
-
-        # Check prompt size if provided
-        if request.prompt:
-            size_check = self.check_prompt_size(request.prompt)
-            if size_check:
-                return [TextContent(type="text", text=ToolOutput(**size_check).model_dump_json())]
-
-        # Continue with normal execution
-        return await super().execute(arguments)
-
    def _process_test_examples(
        self, test_examples: list[str], continuation_id: Optional[str], available_tokens: int = None
    ) -> tuple[str, str]:
@@ -294,6 +277,14 @@ class TestGenTool(BaseTool):
            logger.debug(f"[TESTGEN] Updated files list after prompt.txt processing: {len(updated_files)} files")
            request.files = updated_files

+        # Check user input size at MCP transport boundary (before adding internal content)
+        user_content = request.prompt
+        size_check = self.check_prompt_size(user_content)
+        if size_check:
+            from tools.models import ToolOutput
+
+            raise ValueError(f"MCP_SIZE_CHECK:{ToolOutput(**size_check).model_dump_json()}")
+
        # Calculate available token budget for dynamic allocation
        continuation_id = getattr(request, "continuation_id", None)