Use the new Gemini 2.5 Flash

Updated to support Thinking Tokens as a ratio of the max allowed. Updated tests. Updated README.
2025-06-12 20:46:54 +04:00
parent b34c63d710
commit 3aedb16101
27 changed files with 135 additions and 98 deletions
--- a/tools/base.py
+++ b/tools/base.py
@@ -57,7 +57,7 @@ class ToolRequest(BaseModel):
    # Higher values allow for more complex reasoning but increase latency and cost
    thinking_mode: Optional[Literal["minimal", "low", "medium", "high", "max"]] = Field(
        None,
-        description="Thinking depth: minimal (128), low (2048), medium (8192), high (16384), max (32768)",
+        description="Thinking depth: minimal (0.5% of model max), low (8%), medium (33%), high (67%), max (100% of model max)",
    )
    use_websearch: Optional[bool] = Field(
        True,