474 lines
16 KiB
JSON
474 lines
16 KiB
JSON
{
|
|
"_README": {
|
|
"description": "Model metadata for OpenRouter-backed providers.",
|
|
"documentation": "https://github.com/BeehiveInnovations/zen-mcp-server/blob/main/docs/custom_models.md",
|
|
"usage": "Models listed here are exposed through OpenRouter. Aliases are case-insensitive.",
|
|
"field_notes": "Matches providers/shared/model_capabilities.py.",
|
|
"field_descriptions": {
|
|
"model_name": "The model identifier - OpenRouter format (e.g., 'anthropic/claude-opus-4') or custom model name (e.g., 'llama3.2')",
|
|
"aliases": "Array of short names users can type instead of the full model name",
|
|
"context_window": "Total number of tokens the model can process (input + output combined)",
|
|
"max_output_tokens": "Maximum number of tokens the model can generate in a single response",
|
|
"supports_extended_thinking": "Whether the model supports extended reasoning tokens (currently none do via OpenRouter or custom APIs)",
|
|
"supports_json_mode": "Whether the model can guarantee valid JSON output",
|
|
"supports_function_calling": "Whether the model supports function/tool calling",
|
|
"supports_images": "Whether the model can process images/visual input",
|
|
"max_image_size_mb": "Maximum total size in MB for all images combined (capped at 40MB max for custom models)",
|
|
"supports_temperature": "Whether the model accepts temperature parameter in API calls (set to false for O3/O4 reasoning models)",
|
|
"temperature_constraint": "Type of temperature constraint: 'fixed' (fixed value), 'range' (continuous range), 'discrete' (specific values), or omit for default range",
|
|
"use_openai_response_api": "Set to true when the model must use the /responses endpoint (reasoning models like GPT-5 Pro). Leave false/omit for standard chat completions.",
|
|
"default_reasoning_effort": "Default reasoning effort level for models that support it (e.g., 'low', 'medium', 'high'). Omit if not applicable.",
|
|
"description": "Human-readable description of the model",
|
|
"intelligence_score": "1-20 human rating used as the primary signal for auto-mode model ordering",
|
|
"allow_code_generation": "Whether this model can generate and suggest fully working code - complete with functions, files, and detailed implementation instructions - for your AI tool to use right away. Only set this to 'true' for a model more capable than the AI model / CLI you're currently using."
|
|
}
|
|
},
|
|
"models": [
|
|
{
|
|
"model_name": "anthropic/claude-sonnet-4.5",
|
|
"aliases": [
|
|
"sonnet",
|
|
"sonnet4.5"
|
|
],
|
|
"context_window": 200000,
|
|
"max_output_tokens": 64000,
|
|
"supports_extended_thinking": false,
|
|
"supports_json_mode": false,
|
|
"supports_function_calling": false,
|
|
"supports_images": true,
|
|
"max_image_size_mb": 5.0,
|
|
"description": "Claude Sonnet 4.5 - High-performance model with exceptional reasoning and efficiency",
|
|
"intelligence_score": 12
|
|
},
|
|
{
|
|
"model_name": "anthropic/claude-opus-4.1",
|
|
"aliases": [
|
|
"opus",
|
|
"claude-opus"
|
|
],
|
|
"context_window": 200000,
|
|
"max_output_tokens": 64000,
|
|
"supports_extended_thinking": false,
|
|
"supports_json_mode": false,
|
|
"supports_function_calling": false,
|
|
"supports_images": true,
|
|
"max_image_size_mb": 5.0,
|
|
"description": "Claude Opus 4.1 - Our most capable and intelligent model yet",
|
|
"intelligence_score": 14
|
|
},
|
|
{
|
|
"model_name": "anthropic/claude-sonnet-4.1",
|
|
"aliases": [
|
|
"sonnet4.1"
|
|
],
|
|
"context_window": 200000,
|
|
"max_output_tokens": 64000,
|
|
"supports_extended_thinking": false,
|
|
"supports_json_mode": false,
|
|
"supports_function_calling": false,
|
|
"supports_images": true,
|
|
"max_image_size_mb": 5.0,
|
|
"description": "Claude Sonnet 4.1 - Last generation high-performance model with exceptional reasoning and efficiency",
|
|
"intelligence_score": 10
|
|
},
|
|
{
|
|
"model_name": "anthropic/claude-3.5-haiku",
|
|
"aliases": [
|
|
"haiku"
|
|
],
|
|
"context_window": 200000,
|
|
"max_output_tokens": 64000,
|
|
"supports_extended_thinking": false,
|
|
"supports_json_mode": false,
|
|
"supports_function_calling": false,
|
|
"supports_images": true,
|
|
"max_image_size_mb": 5.0,
|
|
"description": "Claude 3 Haiku - Fast and efficient with vision",
|
|
"intelligence_score": 8
|
|
},
|
|
{
|
|
"model_name": "google/gemini-3-pro-preview",
|
|
"aliases": [
|
|
"pro",
|
|
"gemini-pro",
|
|
"gemini",
|
|
"gemini3",
|
|
"pro-openrouter"
|
|
],
|
|
"context_window": 1048576,
|
|
"max_output_tokens": 65536,
|
|
"supports_extended_thinking": true,
|
|
"supports_json_mode": true,
|
|
"supports_function_calling": true,
|
|
"supports_images": true,
|
|
"max_image_size_mb": 20.0,
|
|
"allow_code_generation": true,
|
|
"description": "Google's Gemini 3.0 Pro via OpenRouter with vision",
|
|
"intelligence_score": 18
|
|
},
|
|
{
|
|
"model_name": "google/gemini-2.5-pro",
|
|
"aliases": [
|
|
"gemini-2.5",
|
|
"pro-2.5-openrouter"
|
|
],
|
|
"context_window": 1048576,
|
|
"max_output_tokens": 65536,
|
|
"supports_extended_thinking": true,
|
|
"supports_json_mode": true,
|
|
"supports_function_calling": true,
|
|
"supports_images": true,
|
|
"max_image_size_mb": 20.0,
|
|
"allow_code_generation": true,
|
|
"description": "Google's Gemini 2.5 Pro via OpenRouter with vision",
|
|
"intelligence_score": 18
|
|
},
|
|
{
|
|
"model_name": "google/gemini-2.5-flash",
|
|
"aliases": [
|
|
"flash",
|
|
"gemini-flash"
|
|
],
|
|
"context_window": 1048576,
|
|
"max_output_tokens": 65536,
|
|
"supports_extended_thinking": true,
|
|
"supports_json_mode": true,
|
|
"supports_function_calling": true,
|
|
"supports_images": true,
|
|
"max_image_size_mb": 15.0,
|
|
"description": "Google's Gemini 2.5 Flash via OpenRouter with vision",
|
|
"intelligence_score": 10
|
|
},
|
|
{
|
|
"model_name": "mistralai/mistral-large-2411",
|
|
"aliases": [
|
|
"mistral-large",
|
|
"mistral"
|
|
],
|
|
"context_window": 128000,
|
|
"max_output_tokens": 32000,
|
|
"supports_extended_thinking": false,
|
|
"supports_json_mode": true,
|
|
"supports_function_calling": true,
|
|
"supports_images": false,
|
|
"max_image_size_mb": 0.0,
|
|
"description": "Mistral's largest model (text-only)",
|
|
"intelligence_score": 11
|
|
},
|
|
{
|
|
"model_name": "meta-llama/llama-3-70b",
|
|
"aliases": [
|
|
"llama",
|
|
"llama3",
|
|
"llama3-70b",
|
|
"llama-70b",
|
|
"llama3-openrouter"
|
|
],
|
|
"context_window": 8192,
|
|
"max_output_tokens": 8192,
|
|
"supports_extended_thinking": false,
|
|
"supports_json_mode": false,
|
|
"supports_function_calling": false,
|
|
"supports_images": false,
|
|
"max_image_size_mb": 0.0,
|
|
"description": "Meta's Llama 3 70B model (text-only)",
|
|
"intelligence_score": 9
|
|
},
|
|
{
|
|
"model_name": "deepseek/deepseek-r1-0528",
|
|
"aliases": [
|
|
"deepseek-r1",
|
|
"deepseek",
|
|
"r1",
|
|
"deepseek-thinking"
|
|
],
|
|
"context_window": 65536,
|
|
"max_output_tokens": 32768,
|
|
"supports_extended_thinking": true,
|
|
"supports_json_mode": true,
|
|
"supports_function_calling": false,
|
|
"supports_images": false,
|
|
"max_image_size_mb": 0.0,
|
|
"description": "DeepSeek R1 with thinking mode - advanced reasoning capabilities (text-only)",
|
|
"intelligence_score": 15
|
|
},
|
|
{
|
|
"model_name": "perplexity/llama-3-sonar-large-32k-online",
|
|
"aliases": [
|
|
"perplexity",
|
|
"sonar",
|
|
"perplexity-online"
|
|
],
|
|
"context_window": 32768,
|
|
"max_output_tokens": 32768,
|
|
"supports_extended_thinking": false,
|
|
"supports_json_mode": false,
|
|
"supports_function_calling": false,
|
|
"supports_images": false,
|
|
"max_image_size_mb": 0.0,
|
|
"description": "Perplexity's online model with web search (text-only)",
|
|
"intelligence_score": 9
|
|
},
|
|
{
|
|
"model_name": "openai/o3",
|
|
"aliases": [
|
|
"o3"
|
|
],
|
|
"context_window": 200000,
|
|
"max_output_tokens": 100000,
|
|
"supports_extended_thinking": false,
|
|
"supports_json_mode": true,
|
|
"supports_function_calling": true,
|
|
"supports_images": true,
|
|
"max_image_size_mb": 20.0,
|
|
"supports_temperature": false,
|
|
"temperature_constraint": "fixed",
|
|
"description": "OpenAI's o3 model - well-rounded and powerful across domains with vision",
|
|
"intelligence_score": 14
|
|
},
|
|
{
|
|
"model_name": "openai/o3-mini",
|
|
"aliases": [
|
|
"o3-mini",
|
|
"o3mini"
|
|
],
|
|
"context_window": 200000,
|
|
"max_output_tokens": 100000,
|
|
"supports_extended_thinking": false,
|
|
"supports_json_mode": true,
|
|
"supports_function_calling": true,
|
|
"supports_images": true,
|
|
"max_image_size_mb": 20.0,
|
|
"supports_temperature": false,
|
|
"temperature_constraint": "fixed",
|
|
"description": "OpenAI's o3-mini model - balanced performance and speed with vision",
|
|
"intelligence_score": 12
|
|
},
|
|
{
|
|
"model_name": "openai/o3-mini-high",
|
|
"aliases": [
|
|
"o3-mini-high",
|
|
"o3mini-high"
|
|
],
|
|
"context_window": 200000,
|
|
"max_output_tokens": 100000,
|
|
"supports_extended_thinking": false,
|
|
"supports_json_mode": true,
|
|
"supports_function_calling": true,
|
|
"supports_images": true,
|
|
"max_image_size_mb": 20.0,
|
|
"supports_temperature": false,
|
|
"temperature_constraint": "fixed",
|
|
"description": "OpenAI's o3-mini with high reasoning effort - optimized for complex problems with vision",
|
|
"intelligence_score": 13
|
|
},
|
|
{
|
|
"model_name": "openai/o3-pro",
|
|
"aliases": [
|
|
"o3pro"
|
|
],
|
|
"context_window": 200000,
|
|
"max_output_tokens": 100000,
|
|
"supports_extended_thinking": false,
|
|
"supports_json_mode": true,
|
|
"supports_function_calling": true,
|
|
"supports_images": true,
|
|
"max_image_size_mb": 20.0,
|
|
"supports_temperature": false,
|
|
"temperature_constraint": "fixed",
|
|
"description": "OpenAI's o3-pro model - professional-grade reasoning and analysis with vision",
|
|
"intelligence_score": 15
|
|
},
|
|
{
|
|
"model_name": "openai/o4-mini",
|
|
"aliases": [
|
|
"o4-mini",
|
|
"o4mini"
|
|
],
|
|
"context_window": 200000,
|
|
"max_output_tokens": 100000,
|
|
"supports_extended_thinking": false,
|
|
"supports_json_mode": true,
|
|
"supports_function_calling": true,
|
|
"supports_images": true,
|
|
"max_image_size_mb": 20.0,
|
|
"supports_temperature": false,
|
|
"temperature_constraint": "fixed",
|
|
"description": "OpenAI's o4-mini model - optimized for shorter contexts with rapid reasoning and vision",
|
|
"intelligence_score": 11
|
|
},
|
|
{
|
|
"model_name": "openai/gpt-5",
|
|
"aliases": [
|
|
"gpt5"
|
|
],
|
|
"context_window": 400000,
|
|
"max_output_tokens": 128000,
|
|
"supports_extended_thinking": true,
|
|
"supports_json_mode": true,
|
|
"supports_function_calling": true,
|
|
"supports_images": true,
|
|
"max_image_size_mb": 20.0,
|
|
"supports_temperature": true,
|
|
"temperature_constraint": "range",
|
|
"description": "GPT-5 (400K context, 128K output) - Advanced model with reasoning support",
|
|
"intelligence_score": 16
|
|
},
|
|
{
|
|
"model_name": "openai/gpt-5-pro",
|
|
"aliases": [
|
|
"gpt5pro"
|
|
],
|
|
"context_window": 400000,
|
|
"max_output_tokens": 272000,
|
|
"supports_extended_thinking": true,
|
|
"supports_json_mode": true,
|
|
"supports_function_calling": true,
|
|
"supports_images": true,
|
|
"max_image_size_mb": 20.0,
|
|
"supports_temperature": false,
|
|
"temperature_constraint": "fixed",
|
|
"use_openai_response_api": true,
|
|
"default_reasoning_effort": "high",
|
|
"allow_code_generation": true,
|
|
"description": "GPT-5 Pro - Advanced reasoning model with highest quality responses (text+image input, text output only)",
|
|
"intelligence_score": 18
|
|
},
|
|
{
|
|
"model_name": "openai/gpt-5-codex",
|
|
"aliases": [
|
|
"codex",
|
|
"gpt5codex"
|
|
],
|
|
"context_window": 400000,
|
|
"max_output_tokens": 128000,
|
|
"supports_extended_thinking": false,
|
|
"supports_json_mode": true,
|
|
"supports_function_calling": false,
|
|
"supports_images": false,
|
|
"max_image_size_mb": 0.0,
|
|
"description": "GPT-5-Codex is a specialized version of GPT-5 optimized for software engineering and coding workflows",
|
|
"intelligence_score": 17
|
|
},
|
|
{
|
|
"model_name": "openai/gpt-5-mini",
|
|
"aliases": [
|
|
"gpt5mini"
|
|
],
|
|
"context_window": 400000,
|
|
"max_output_tokens": 128000,
|
|
"supports_extended_thinking": false,
|
|
"supports_json_mode": true,
|
|
"supports_function_calling": false,
|
|
"supports_images": false,
|
|
"max_image_size_mb": 0.0,
|
|
"supports_temperature": true,
|
|
"temperature_constraint": "fixed",
|
|
"description": "GPT-5-mini (400K context, 128K output) - Efficient variant with reasoning support",
|
|
"intelligence_score": 10
|
|
},
|
|
{
|
|
"model_name": "openai/gpt-5-nano",
|
|
"aliases": [
|
|
"gpt5nano"
|
|
],
|
|
"context_window": 400000,
|
|
"max_output_tokens": 128000,
|
|
"supports_extended_thinking": false,
|
|
"supports_json_mode": true,
|
|
"supports_function_calling": false,
|
|
"supports_images": false,
|
|
"max_image_size_mb": 0.0,
|
|
"supports_temperature": true,
|
|
"temperature_constraint": "fixed",
|
|
"description": "GPT-5 nano (400K context, 128K output) - Fastest, cheapest version of GPT-5 for summarization and classification tasks",
|
|
"intelligence_score": 8
|
|
},
|
|
{
|
|
"model_name": "openai/gpt-5.1",
|
|
"aliases": [
|
|
"gpt5.1",
|
|
"gpt-5.1",
|
|
"5.1"
|
|
],
|
|
"context_window": 400000,
|
|
"max_output_tokens": 128000,
|
|
"supports_extended_thinking": true,
|
|
"supports_json_mode": true,
|
|
"supports_function_calling": true,
|
|
"supports_images": true,
|
|
"max_image_size_mb": 20.0,
|
|
"supports_temperature": true,
|
|
"temperature_constraint": "fixed",
|
|
"default_reasoning_effort": "medium",
|
|
"allow_code_generation": true,
|
|
"description": "GPT-5.1 (400K context, 128K output) - Flagship reasoning model with configurable thinking effort and vision support",
|
|
"intelligence_score": 18
|
|
},
|
|
{
|
|
"model_name": "openai/gpt-5.1-codex",
|
|
"aliases": [
|
|
"gpt5.1-codex",
|
|
"gpt-5.1-codex",
|
|
"gpt5.1code",
|
|
"gpt-5.1-code",
|
|
"codex-5.1"
|
|
],
|
|
"context_window": 400000,
|
|
"max_output_tokens": 128000,
|
|
"supports_extended_thinking": true,
|
|
"supports_json_mode": true,
|
|
"supports_function_calling": true,
|
|
"supports_images": true,
|
|
"max_image_size_mb": 20.0,
|
|
"supports_temperature": true,
|
|
"temperature_constraint": "fixed",
|
|
"use_openai_response_api": true,
|
|
"default_reasoning_effort": "high",
|
|
"allow_code_generation": true,
|
|
"description": "GPT-5.1 Codex (400K context, 128K output) - Agentic coding specialization available through the Responses API",
|
|
"intelligence_score": 19
|
|
},
|
|
{
|
|
"model_name": "openai/gpt-5.1-codex-mini",
|
|
"aliases": [
|
|
"gpt5.1-codex-mini",
|
|
"gpt-5.1-codex-mini",
|
|
"codex-mini",
|
|
"5.1-codex-mini"
|
|
],
|
|
"context_window": 400000,
|
|
"max_output_tokens": 128000,
|
|
"supports_extended_thinking": true,
|
|
"supports_json_mode": true,
|
|
"supports_function_calling": true,
|
|
"supports_images": true,
|
|
"max_image_size_mb": 20.0,
|
|
"supports_temperature": true,
|
|
"temperature_constraint": "fixed",
|
|
"allow_code_generation": true,
|
|
"description": "GPT-5.1 Codex mini (400K context, 128K output) - Cost-efficient Codex variant with streaming support",
|
|
"intelligence_score": 16
|
|
},
|
|
{
|
|
"model_name": "x-ai/grok-4",
|
|
"aliases": [
|
|
"grok-4",
|
|
"grok4",
|
|
"grok"
|
|
],
|
|
"context_window": 256000,
|
|
"max_output_tokens": 256000,
|
|
"supports_extended_thinking": true,
|
|
"supports_json_mode": true,
|
|
"supports_function_calling": true,
|
|
"supports_images": true,
|
|
"max_image_size_mb": 20.0,
|
|
"supports_temperature": true,
|
|
"temperature_constraint": "range",
|
|
"description": "xAI's Grok 4 via OpenRouter with vision and advanced reasoning",
|
|
"intelligence_score": 15
|
|
}
|
|
]
|
|
}
|