test: add tests for reasoning attribute handling in streaming and non-streaming cases

2025-05-29 08:44:59 +00:00 · 2025-03-09 08:43:18 -07:00 · 2025-03-09 08:43:18 -07:00 · 41ae947885
commit 41ae947885
parent 84f610c0e9
1 changed files with 174 additions and 0 deletions
--- a/tests/basic/test_reasoning.py
+++ b/tests/basic/test_reasoning.py
@ -399,6 +399,180 @@ End"""
        text = "Just regular text"
        self.assertEqual(remove_reasoning_content(text, "think"), text)

+    def test_send_with_reasoning(self):
+        """Test that reasoning content from the 'reasoning' attribute is properly formatted and output."""
+        # Setup IO with no pretty
+        io = InputOutput(pretty=False)
+        io.assistant_output = MagicMock()
+
+        # Setup model and coder
+        model = Model("gpt-3.5-turbo")
+        coder = Coder.create(model, None, io=io, stream=False)
+
+        # Test data
+        reasoning_content = "My step-by-step reasoning process"
+        main_content = "Final answer after reasoning"
+
+        # Mock completion response with reasoning content
+        class MockCompletion:
+            def __init__(self, content, reasoning):
+                self.content = content
+                # Add required attributes expected by show_send_output
+                self.choices = [MagicMock()]
+                self.choices[0].message.content = content
+                self.choices[0].message.reasoning = reasoning  # Using reasoning instead of reasoning_content
+                self.finish_reason = "stop"
+
+        mock_completion = MockCompletion(main_content, reasoning_content)
+
+        # Create a mock hash object
+        mock_hash = MagicMock()
+        mock_hash.hexdigest.return_value = "mock_hash_digest"
+
+        # Mock the model's send_completion method to return the expected tuple format
+        with patch.object(model, "send_completion", return_value=(mock_hash, mock_completion)):
+            # Call send with a simple message
+            messages = [{"role": "user", "content": "test prompt"}]
+            list(coder.send(messages))
+
+            # Now verify ai_output was called with the right content
+            io.assistant_output.assert_called_once()
+            output = io.assistant_output.call_args[0][0]
+
+            dump(output)
+
+            # Output should contain formatted reasoning tags
+            self.assertIn(REASONING_START, output)
+            self.assertIn(REASONING_END, output)
+
+            # Output should include both reasoning and main content
+            self.assertIn(reasoning_content, output)
+            self.assertIn(main_content, output)
+
+            # Verify that partial_response_content only contains the main content
+            coder.remove_reasoning_content()
+            self.assertEqual(coder.partial_response_content.strip(), main_content.strip())
+
+            # Ensure proper order: reasoning first, then main content
+            reasoning_pos = output.find(reasoning_content)
+            main_pos = output.find(main_content)
+            self.assertLess(
+                reasoning_pos, main_pos, "Reasoning content should appear before main content"
+            )
+
+    def test_send_with_reasoning_stream(self):
+        """Test that streaming reasoning content from the 'reasoning' attribute is properly formatted and output."""
+        # Setup IO with pretty output for streaming
+        io = InputOutput(pretty=True)
+        mock_mdstream = MagicMock()
+        io.get_assistant_mdstream = MagicMock(return_value=mock_mdstream)
+
+        # Setup model and coder
+        model = Model("gpt-3.5-turbo")
+        coder = Coder.create(model, None, io=io, stream=True)
+
+        # Ensure the coder shows pretty output
+        coder.show_pretty = MagicMock(return_value=True)
+
+        # Mock streaming response chunks
+        class MockStreamingChunk:
+            def __init__(
+                self, content=None, reasoning_content=None, reasoning=None, finish_reason=None
+            ):
+                self.choices = [MagicMock()]
+                self.choices[0].delta = MagicMock()
+                self.choices[0].finish_reason = finish_reason
+
+                # Set content if provided
+                if content is not None:
+                    self.choices[0].delta.content = content
+                else:
+                    # Need to handle attribute access that would raise AttributeError
+                    delattr(self.choices[0].delta, "content")
+
+                # Set reasoning_content if provided
+                if reasoning_content is not None:
+                    self.choices[0].delta.reasoning_content = reasoning_content
+                else:
+                    # Need to handle attribute access that would raise AttributeError
+                    delattr(self.choices[0].delta, "reasoning_content")
+
+                # Set reasoning if provided
+                if reasoning is not None:
+                    self.choices[0].delta.reasoning = reasoning
+                else:
+                    # Need to handle attribute access that would raise AttributeError
+                    delattr(self.choices[0].delta, "reasoning")
+
+        # Create chunks to simulate streaming - using reasoning attribute instead of reasoning_content
+        chunks = [
+            # First chunk with reasoning content starts the tag
+            MockStreamingChunk(reasoning="My step-by-step "),
+            # Additional reasoning content
+            MockStreamingChunk(reasoning="reasoning process"),
+            # Switch to main content - this will automatically end the reasoning tag
+            MockStreamingChunk(content="Final "),
+            # More main content
+            MockStreamingChunk(content="answer "),
+            MockStreamingChunk(content="after reasoning"),
+            # End the response
+            MockStreamingChunk(finish_reason="stop"),
+        ]
+
+        # Create a mock hash object
+        mock_hash = MagicMock()
+        mock_hash.hexdigest.return_value = "mock_hash_digest"
+
+        # Mock the model's send_completion to return the hash and completion
+        with (
+            patch.object(model, "send_completion", return_value=(mock_hash, chunks)),
+            patch.object(model, "token_count", return_value=10),
+        ):  # Mock token count to avoid serialization issues
+            # Set mdstream directly on the coder object
+            coder.mdstream = mock_mdstream
+
+            # Call send with a simple message
+            messages = [{"role": "user", "content": "test prompt"}]
+            list(coder.send(messages))
+
+            # Verify mdstream.update was called multiple times
+            mock_mdstream.update.assert_called()
+
+            coder.live_incremental_response(True)
+
+            # Explicitly get all calls to update
+            update_calls = mock_mdstream.update.call_args_list
+
+            # There should be at least two calls - one for streaming and one final
+            self.assertGreaterEqual(
+                len(update_calls), 2, "Should have at least two calls to update (streaming + final)"
+            )
+
+            # Check that at least one call has final=True (should be the last one)
+            has_final_true = any(call[1].get("final", False) for call in update_calls)
+            self.assertTrue(has_final_true, "At least one update call should have final=True")
+
+            # Get the text from the last update call
+            final_text = update_calls[-1][0][0]
+
+            # The final text should include both reasoning and main content with proper formatting
+            self.assertIn(REASONING_START, final_text)
+            self.assertIn("My step-by-step reasoning process", final_text)
+            self.assertIn(REASONING_END, final_text)
+            self.assertIn("Final answer after reasoning", final_text)
+
+            # Ensure proper order: reasoning first, then main content
+            reasoning_pos = final_text.find("My step-by-step reasoning process")
+            main_pos = final_text.find("Final answer after reasoning")
+            self.assertLess(
+                reasoning_pos, main_pos, "Reasoning content should appear before main content"
+            )
+
+            # Verify that partial_response_content only contains the main content
+            coder.remove_reasoning_content()
+            expected_content = "Final answer after reasoning"
+            self.assertEqual(coder.partial_response_content.strip(), expected_content)
+
    @patch("aider.models.litellm.completion")
    def test_simple_send_with_retries_removes_reasoning(self, mock_completion):
        """Test that simple_send_with_retries correctly removes reasoning content."""