fix: external model name now recorded properly in responses

test: http cassettes added for improved integration tests refactor: generic name for the CLI agent
2025-10-03 11:29:06 +04:00
parent e9b69476cd
commit d55130a430
10 changed files with 477 additions and 105 deletions
--- a/tests/test_conversation_memory.py
+++ b/tests/test_conversation_memory.py
@@ -174,6 +174,8 @@ class TestConversationMemory:
                timestamp="2023-01-01T00:01:00Z",
                files=[str(examples_dir)],  # Directory will be expanded to files
                tool_name="chat",
+                model_name="gpt-5",
+                model_provider="openai",
            ),
        ]

@@ -195,8 +197,8 @@ class TestConversationMemory:
        assert f"Turn 2/{MAX_CONVERSATION_TURNS}" in history

        # Test speaker identification
-        assert "--- Turn 1 (Claude) ---" in history
-        assert "--- Turn 2 (Gemini using chat) ---" in history
+        assert "--- Turn 1 (Agent) ---" in history
+        assert "--- Turn 2 (gpt-5 using chat via openai) ---" in history

        # Test content
        assert "What is Python?" in history
@@ -527,6 +529,8 @@ class TestConversationFlow:
            "I've analyzed your codebase structure.",
            files=["/project/src/main.py", "/project/src/utils.py"],
            tool_name="analyze",
+            model_name="gemini-2.5-flash",
+            model_provider="google",
        )
        assert success is True

@@ -543,6 +547,8 @@ class TestConversationFlow:
                    timestamp="2023-01-01T00:00:30Z",
                    files=["/project/src/main.py", "/project/src/utils.py"],
                    tool_name="analyze",
+                    model_name="gemini-2.5-flash",
+                    model_provider="google",
                )
            ],
            initial_context={"prompt": "Analyze this codebase", "relevant_files": ["/project/src/"]},
@@ -586,6 +592,8 @@ class TestConversationFlow:
            "Test coverage analysis complete. Coverage is 85%.",
            files=["/project/tests/test_utils.py", "/project/coverage.html"],
            tool_name="analyze",
+            model_name="gemini-2.5-flash",
+            model_provider="google",
        )
        assert success is True

@@ -602,6 +610,8 @@ class TestConversationFlow:
                    timestamp="2023-01-01T00:00:30Z",
                    files=["/project/src/main.py", "/project/src/utils.py"],
                    tool_name="analyze",
+                    model_name="gemini-2.5-flash",
+                    model_provider="google",
                ),
                ConversationTurn(
                    role="user",
@@ -615,6 +625,8 @@ class TestConversationFlow:
                    timestamp="2023-01-01T00:02:30Z",
                    files=["/project/tests/test_utils.py", "/project/coverage.html"],
                    tool_name="analyze",
+                    model_name="gemini-2.5-flash",
+                    model_provider="google",
                ),
            ],
            initial_context={"prompt": "Analyze this codebase", "relevant_files": ["/project/src/"]},
@@ -623,9 +635,9 @@ class TestConversationFlow:
        history, tokens = build_conversation_history(final_context)

        # Verify chronological order and speaker identification
-        assert "--- Turn 1 (Gemini using analyze) ---" in history
-        assert "--- Turn 2 (Claude) ---" in history
-        assert "--- Turn 3 (Gemini using analyze) ---" in history
+        assert "--- Turn 1 (gemini-2.5-flash using analyze via google) ---" in history
+        assert "--- Turn 2 (Agent) ---" in history
+        assert "--- Turn 3 (gemini-2.5-flash using analyze via google) ---" in history

        # Verify all files are preserved in chronological order
        turn_1_files = "Files used in this turn: /project/src/main.py, /project/src/utils.py"
@@ -642,9 +654,9 @@ class TestConversationFlow:
        assert "Test coverage analysis complete. Coverage is 85%." in history

        # Verify chronological ordering (turn 1 appears before turn 2, etc.)
-        turn_1_pos = history.find("--- Turn 1 (Gemini using analyze) ---")
-        turn_2_pos = history.find("--- Turn 2 (Claude) ---")
-        turn_3_pos = history.find("--- Turn 3 (Gemini using analyze) ---")
+        turn_1_pos = history.find("--- Turn 1 (gemini-2.5-flash using analyze via google) ---")
+        turn_2_pos = history.find("--- Turn 2 (Agent) ---")
+        turn_3_pos = history.find("--- Turn 3 (gemini-2.5-flash using analyze via google) ---")

        assert turn_1_pos < turn_2_pos < turn_3_pos