feat: Enhanced Gemini MCP server for large-scale code analysis

Major improvements:
- Default model set to Gemini 1.5 Pro (more reliable than 2.5 Preview)
- Added analyze_code tool for processing large files and codebases
- Support for 1M token context window
- File reading capabilities for automatic code ingestion
- Enhanced documentation with usage examples
- Added USAGE.md guide for Claude Code users

Changes:
- Updated default model configuration with fallback note
- Increased default max_tokens to 8192 for better responses
- Added CodeAnalysisRequest model for structured code analysis
- Implemented file reading with proper error handling
- Added token estimation (~4 chars per token; see the sketch after this list)
- Created comprehensive test suite for new features
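
As a rough, hypothetical sketch (not code from this commit), the 4-characters-per-token estimate and the 1M-token guard amount to:

```python
# Illustrative only: mirrors the estimate used by the new analyze_code tool.
MAX_CONTEXT_TOKENS = 1_000_000  # 1M-token context window

def estimate_tokens(text: str) -> int:
    """Very rough approximation: 1 token is about 4 characters."""
    return len(text) // 4

context = "def add(a, b):\n    return a + b\n" * 10_000  # ~320,000 characters of sample code
tokens = estimate_tokens(context)                         # ~80,000 tokens
assert tokens <= MAX_CONTEXT_TOKENS                       # well under the 1M limit
```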

This update makes the server well suited to large files and codebases that
exceed Claude's context limit, enabling a clean handoff to Gemini for extended
analysis and reasoning.
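
For illustration only (the file paths and question below are invented, and the exact call format depends on the MCP client), a Claude Code session might invoke the new tool with arguments such as:

```python
# Hypothetical analyze_code tool call; these arguments map onto CodeAnalysisRequest.
arguments = {
    "files": ["src/server.py", "src/utils.py"],  # invented paths
    "question": "Trace the request flow and flag any missing error handling.",
    "temperature": 0.3,   # new, lower default for code analysis
    "max_tokens": 8192,   # new default response budget
}
# Alternatively, pass a "code" string instead of "files" to analyze a snippet directly.
```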

🤖 Generated with [Claude Code](https://claude.ai/code)

Co-Authored-By: Claude <noreply@anthropic.com>
Fahad
2025-06-08 19:46:10 +04:00
parent 18c5ec913d
commit 54d9bb1ee7
4 changed files with 423 additions and 21 deletions


@@ -1,12 +1,14 @@
#!/usr/bin/env python3
"""
Gemini MCP Server - Model Context Protocol server for Google Gemini
Enhanced for large-scale code analysis with 1M token context window
"""
import os
import json
import asyncio
from typing import Optional, Dict, Any, List
from typing import Optional, Dict, Any, List, Union
from pathlib import Path
from mcp.server.models import InitializationOptions
from mcp.server import Server, NotificationOptions
from mcp.server.stdio import stdio_server
@@ -15,13 +17,30 @@ from pydantic import BaseModel, Field
import google.generativeai as genai
# Default to Gemini 2.5 Pro Preview with maximum context
# Note: 2.5 Pro Preview has restrictions, falling back to 1.5 Pro for better reliability
DEFAULT_MODEL = "gemini-1.5-pro-latest" # More reliable, still has large context
MAX_CONTEXT_TOKENS = 1000000 # 1M tokens
class GeminiChatRequest(BaseModel):
"""Request model for Gemini chat"""
prompt: str = Field(..., description="The prompt to send to Gemini")
system_prompt: Optional[str] = Field(None, description="Optional system prompt for context")
max_tokens: Optional[int] = Field(4096, description="Maximum number of tokens in response")
max_tokens: Optional[int] = Field(8192, description="Maximum number of tokens in response")
temperature: Optional[float] = Field(0.7, description="Temperature for response randomness (0-1)")
model: Optional[str] = Field("gemini-1.5-pro-latest", description="Model to use (defaults to gemini-1.5-pro-latest)")
model: Optional[str] = Field(DEFAULT_MODEL, description=f"Model to use (defaults to {DEFAULT_MODEL})")
class CodeAnalysisRequest(BaseModel):
"""Request model for code analysis"""
files: Optional[List[str]] = Field(None, description="List of file paths to analyze")
code: Optional[str] = Field(None, description="Direct code content to analyze")
question: str = Field(..., description="Question or analysis request about the code")
system_prompt: Optional[str] = Field(None, description="Optional system prompt for context")
max_tokens: Optional[int] = Field(8192, description="Maximum number of tokens in response")
temperature: Optional[float] = Field(0.3, description="Temperature for response randomness (0-1)")
model: Optional[str] = Field(DEFAULT_MODEL, description=f"Model to use (defaults to {DEFAULT_MODEL})")
# Create the MCP server instance
@@ -37,13 +56,47 @@ def configure_gemini():
genai.configure(api_key=api_key)
def read_file_content(file_path: str) -> str:
"""Read content from a file with error handling"""
try:
path = Path(file_path)
if not path.exists():
return f"Error: File not found: {file_path}"
if not path.is_file():
return f"Error: Not a file: {file_path}"
# Read the file
with open(path, 'r', encoding='utf-8') as f:
content = f.read()
return f"=== File: {file_path} ===\n{content}\n"
except Exception as e:
return f"Error reading {file_path}: {str(e)}"
def prepare_code_context(files: Optional[List[str]], code: Optional[str]) -> str:
"""Prepare code context from files and/or direct code"""
context_parts = []
# Add file contents
if files:
for file_path in files:
context_parts.append(read_file_content(file_path))
# Add direct code
if code:
context_parts.append("=== Direct Code ===\n" + code + "\n")
return "\n".join(context_parts)
@server.list_tools()
async def handle_list_tools() -> List[Tool]:
"""List all available tools"""
return [
Tool(
name="chat",
description="Chat with Gemini Pro 2.5 model",
description="Chat with Gemini (optimized for 2.5 Pro with 1M context)",
inputSchema={
"type": "object",
"properties": {
@@ -58,7 +111,7 @@ async def handle_list_tools() -> List[Tool]:
"max_tokens": {
"type": "integer",
"description": "Maximum number of tokens in response",
"default": 4096
"default": 8192
},
"temperature": {
"type": "number",
@@ -69,13 +122,57 @@ async def handle_list_tools() -> List[Tool]:
},
"model": {
"type": "string",
"description": "Model to use (e.g., gemini-1.5-pro-latest, gemini-2.5-pro-preview-06-05)",
"default": "gemini-1.5-pro-latest"
"description": f"Model to use (defaults to {DEFAULT_MODEL})",
"default": DEFAULT_MODEL
}
},
"required": ["prompt"]
}
),
Tool(
name="analyze_code",
description="Analyze code files or snippets with Gemini's 1M context window",
inputSchema={
"type": "object",
"properties": {
"files": {
"type": "array",
"items": {"type": "string"},
"description": "List of file paths to analyze"
},
"code": {
"type": "string",
"description": "Direct code content to analyze (alternative to files)"
},
"question": {
"type": "string",
"description": "Question or analysis request about the code"
},
"system_prompt": {
"type": "string",
"description": "Optional system prompt for context"
},
"max_tokens": {
"type": "integer",
"description": "Maximum number of tokens in response",
"default": 8192
},
"temperature": {
"type": "number",
"description": "Temperature for response randomness (0-1)",
"default": 0.3,
"minimum": 0,
"maximum": 1
},
"model": {
"type": "string",
"description": f"Model to use (defaults to {DEFAULT_MODEL})",
"default": DEFAULT_MODEL
}
},
"required": ["question"]
}
),
Tool(
name="list_models",
description="List available Gemini models",
@@ -96,12 +193,13 @@ async def handle_call_tool(name: str, arguments: Dict[str, Any]) -> List[TextCon
request = GeminiChatRequest(**arguments)
try:
# Use the specified model or default to 1.5 Pro
# Use the specified model with optimized settings
model = genai.GenerativeModel(
model_name=request.model,
generation_config={
"temperature": request.temperature,
"max_output_tokens": request.max_tokens,
"candidate_count": 1,
}
)
@@ -132,6 +230,64 @@ async def handle_call_tool(name: str, arguments: Dict[str, Any]) -> List[TextCon
text=f"Error calling Gemini API: {str(e)}"
)]
elif name == "analyze_code":
# Validate request
request = CodeAnalysisRequest(**arguments)
# Check that we have either files or code
if not request.files and not request.code:
return [TextContent(
type="text",
text="Error: Must provide either 'files' or 'code' parameter"
)]
try:
# Prepare code context
code_context = prepare_code_context(request.files, request.code)
# Count approximate tokens (rough estimate: 1 token ≈ 4 characters)
estimated_tokens = len(code_context) // 4
if estimated_tokens > MAX_CONTEXT_TOKENS:
return [TextContent(
type="text",
text=f"Error: Code context too large (~{estimated_tokens:,} tokens). Maximum is {MAX_CONTEXT_TOKENS:,} tokens."
)]
# Use the specified model with optimized settings for code analysis
model = genai.GenerativeModel(
model_name=request.model,
generation_config={
"temperature": request.temperature,
"max_output_tokens": request.max_tokens,
"candidate_count": 1,
}
)
# Prepare the full prompt
system_prompt = request.system_prompt or "You are an expert code analyst. Provide detailed, accurate analysis of the provided code."
full_prompt = f"{system_prompt}\n\nCode to analyze:\n\n{code_context}\n\nQuestion/Request: {request.question}"
# Generate response
response = model.generate_content(full_prompt)
# Handle response
if response.candidates and response.candidates[0].content.parts:
text = response.candidates[0].content.parts[0].text
else:
finish_reason = response.candidates[0].finish_reason if response.candidates else "Unknown"
text = f"Response blocked or incomplete. Finish reason: {finish_reason}"
return [TextContent(
type="text",
text=text
)]
except Exception as e:
return [TextContent(
type="text",
text=f"Error analyzing code: {str(e)}"
)]
elif name == "list_models":
try:
# List available models
@@ -141,7 +297,8 @@ async def handle_call_tool(name: str, arguments: Dict[str, Any]) -> List[TextCon
models.append({
"name": model.name,
"display_name": model.display_name,
"description": model.description
"description": model.description,
"is_default": model.name == DEFAULT_MODEL
})
return [TextContent(
@@ -174,7 +331,7 @@ async def main():
write_stream,
InitializationOptions(
server_name="gemini",
server_version="1.0.0",
server_version="2.0.0",
capabilities={
"tools": {}
}
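
The commit message mentions a new test suite, which is not shown in this diff. A minimal sketch of what tests for the new helper functions could look like, assuming the server file above is importable as `server` and pytest is used (both assumptions):

```python
# test_code_analysis.py -- illustrative tests only, not the commit's actual suite.
import server  # assumed import name for the module shown in the diff above

def test_prepare_code_context_combines_files_and_direct_code(tmp_path):
    sample = tmp_path / "sample.py"
    sample.write_text("def add(a, b):\n    return a + b\n", encoding="utf-8")

    context = server.prepare_code_context([str(sample)], "print('inline')")

    assert f"=== File: {sample} ===" in context  # header added by read_file_content
    assert "=== Direct Code ===" in context      # header added by prepare_code_context
    assert "print('inline')" in context

def test_read_file_content_reports_missing_files():
    result = server.read_file_content("does/not/exist.py")
    assert result.startswith("Error: File not found")
```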