9 changes: 9 additions & 0 deletions .github/workflows/checks.yml
@@ -61,6 +61,15 @@ jobs:
        run: make deps
      - name: Run tests
        run: make test-unit
      - name: Run tests with coverage
        run: make test-coverage
Comment on lines +64 to +65
💡 Verification agent

🧩 Analysis chain

Verify test-coverage Makefile target and output
Ensure the Makefile defines a test-coverage target and that it produces a valid coverage report (e.g., coverage.xml) at the repo root. Without it, the Codecov upload will have no data.


🏁 Script executed:

#!/bin/bash
# Check Makefile for test-coverage target
rg -n "^test-coverage:" Makefile

# Confirm coverage.xml generation command exists
rg -n "coverage xml" -g "Makefile" || echo "No 'coverage xml' command found"

Length of output: 166


🏁 Script executed:

#!/bin/bash
# Display the test-coverage target and the commands it runs
rg -n '^test-coverage:' -A 10 Makefile

Length of output: 346


Add XML coverage output for Codecov
The test-coverage target only generates HTML and terminal reports, so no coverage.xml is produced for Codecov to upload. Please update the Makefile to include XML output:

• File: Makefile (around line 48)

test-coverage:
-  	uv run pytest tests/unit_tests --cov=src --cov-report=html --cov-report=term
+  	uv run pytest tests/unit_tests \
+  		--cov=src \
+  		--cov-report=html \
+  		--cov-report=term \
+  		--cov-report=xml

This will emit coverage.xml at the repo root for the Codecov action.

🤖 Prompt for AI Agents
In .github/workflows/checks.yml at lines 64-65, the workflow runs the Makefile
target test-coverage, but the Makefile does not generate a coverage.xml file
needed for Codecov. Update the Makefile around line 48 to modify the
test-coverage target to include generating an XML coverage report (coverage.xml)
at the repo root, typically by adding a command like coverage xml or equivalent,
so Codecov can upload the coverage data correctly.
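For context on what the Codecov action consumes: `--cov-report=xml` (or `coverage xml`) emits a Cobertura-style XML file. A minimal sketch of that shape, with illustrative attribute values not taken from this repo, shows what lands at the repo root and how it can be inspected:

```python
# Sketch of a Cobertura-style coverage.xml of the kind `--cov-report=xml`
# emits; the numbers here are illustrative, not from this repository.
import xml.etree.ElementTree as ET

sample = """<?xml version="1.0" ?>
<coverage line-rate="0.87" branch-rate="0.0" version="7.3.0">
  <packages>
    <package name="src" line-rate="0.87"/>
  </packages>
</coverage>"""

root = ET.fromstring(sample)
print(root.tag, root.attrib["line-rate"])  # prints "coverage 0.87"
```

The Codecov uploader parses this file to get per-package line rates, which is why a missing coverage.xml results in an empty upload rather than a hard failure when `fail_ci_if_error` is false.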

      - name: Upload coverage to Codecov
        uses: codecov/codecov-action@v4
        with:
          token: ${{ secrets.CODECOV_TOKEN }}
          fail_ci_if_error: false
          flags: unittests
          name: codecov-umbrella

  smoke-test:
    name: Smoke test
    runs-on: ubuntu-latest
9 changes: 9 additions & 0 deletions Makefile
@@ -45,6 +45,13 @@ test: test-unit
test-unit:
	uv run pytest tests/unit_tests

test-coverage:
	uv run pytest tests/unit_tests --cov=src --cov-report=html --cov-report=term

coverage-report:
	uv run coverage html
	@echo "Coverage report generated in htmlcov/index.html"

test-graphs:
	uv run --env-file .env pytest -rs tests/graph_tests

@@ -121,6 +128,8 @@ help:
	@echo 'tests - run unit tests'
	@echo 'test TEST_FILE=<test_file> - run all tests in file'
	@echo 'test_watch - run unit tests in watch mode'
	@echo 'test-coverage - run unit tests with coverage report'
	@echo 'coverage-report - generate HTML coverage report'
	@echo 'ci-build-check - run build check for CI'
	@echo 'demo - run demo orchestration script'

31 changes: 31 additions & 0 deletions pyproject.toml
@@ -29,6 +29,9 @@ optional-dependencies.dev = [
  "pytest~=8.3.5",
  "pytest-asyncio~=0.26.0",
  "pytest-dotenv~=0.5.2",
  "pytest-cov>=4.1.0",
  "coverage[toml]>=7.3.0",
  "pytest-html>=4.0.0",
  "langgraph-cli[inmem]~=0.3.1",
  "openevals~=0.0.19",
  "debugpy~=1.8.14",
@@ -100,3 +103,31 @@ ignore_errors = false

[tool.codespell]
skip = "node_modules"

[tool.coverage.run]
source = ["src"]
omit = [
  "*/tests/*",
  "*/test_*.py",
  "*/__pycache__/*",
  "src/demo/*",
]

[tool.coverage.report]
precision = 2
show_missing = true
skip_covered = false
exclude_lines = [
  "pragma: no cover",
  "def __repr__",
  "if self.debug:",
  "if settings.DEBUG",
  "raise AssertionError",
  "raise NotImplementedError",
  "if 0:",
  "if __name__ == .__main__.:",
  "if TYPE_CHECKING:",
]
Comment on lines +120 to +130
⚠️ Potential issue

Exclude-line pattern is incorrect – coverage filter will never match

exclude_lines contains

"if __name__ == .__main__.:",

which is missing the quoting around __main__.

-    "if __name__ == .__main__.:",
+    "if __name__ == '__main__':",

Without the fix, the typical “run as script” guard stays in the coverage report and can artificially drop overall percentages.

📝 Committable suggestion

‼️ IMPORTANT
Carefully review the code before committing. Ensure that it accurately replaces the highlighted code, contains no missing lines, and has no issues with indentation. Thoroughly test & benchmark the code to ensure it meets the requirements.

Suggested change
exclude_lines = [
  "pragma: no cover",
  "def __repr__",
  "if self.debug:",
  "if settings.DEBUG",
  "raise AssertionError",
  "raise NotImplementedError",
  "if 0:",
  "if __name__ == .__main__.:",
  "if TYPE_CHECKING:",
]
exclude_lines = [
  "pragma: no cover",
  "def __repr__",
  "if self.debug:",
  "if settings.DEBUG",
  "raise AssertionError",
  "raise NotImplementedError",
  "if 0:",
  "if __name__ == '__main__':",
  "if TYPE_CHECKING:",
]
🤖 Prompt for AI Agents
In pyproject.toml around lines 120 to 130, the exclude_lines pattern for the
run-as-script guard is incorrect because it lacks proper quoting around
__main__. Fix this by changing the pattern from "if __name__ == .__main__." to
"if __name__ == '__main__':" so the coverage filter correctly excludes this line
from coverage reports.
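As a quick sanity check on the suggested fix: coverage.py treats each `exclude_lines` entry as a regular expression matched against source lines. A small sketch, using only the stdlib `re` module, confirms the corrected pattern matches the standard run-as-script guard:

```python
import re

# coverage.py matches exclude_lines entries as regexes against source lines.
# The corrected pattern should match the standard run-as-script guard.
corrected = r"if __name__ == '__main__':"
guard = "if __name__ == '__main__':"
print(bool(re.search(corrected, guard)))  # prints "True"
```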


[tool.coverage.html]
directory = "htmlcov"
92 changes: 92 additions & 0 deletions tests/unit_tests/common/test_tools.py
@@ -2,11 +2,14 @@
import shutil

import pytest
from langchain_core.messages import ToolMessage
from langgraph.types import Command

from common.tools.create_directory import create_directory
from common.tools.create_file import create_file
from common.tools.list_files import list_files
from common.tools.read_file import read_file
from common.tools.summarize import create_summarize_tool

# Test directory for file operations
TEST_DIR = "test_tools_dir"
@@ -220,3 +223,92 @@ def test_create_file_overwrite(self, setup_test_directory):
        with open(test_file, "r") as f:
            content = f.read()
        assert content == new_content


class TestSummarize:
    """Tests for the summarize tool."""

    @pytest.mark.asyncio
    async def test_create_summarize_tool(self, capsys):
        """Test creating and using a summarize tool."""
        agent_name = "TestAgent"
        summarize_tool = create_summarize_tool(agent_name)

        # Verify tool properties
        assert summarize_tool.name == "summarize"
        assert "summary" in summarize_tool.description.lower()

        # Test invoking the tool
        test_summary = "This is a test summary of the agent's work"
        result = await summarize_tool.ainvoke({
            "summary": test_summary,
            "tool_call_id": "test_call_123"
        })

        # Verify the result is a Command
        assert isinstance(result, Command)
        assert "messages" in result.update
        assert "summary" in result.update

        # Verify the summary was stored correctly
        assert result.update["summary"] == test_summary

        # Verify the tool message
        messages = result.update["messages"]
        assert len(messages) == 1
        assert isinstance(messages[0], ToolMessage)
        assert messages[0].content == test_summary
        assert messages[0].tool_call_id == "test_call_123"

        # Verify console output
        captured = capsys.readouterr()
        assert f"======= Summary for {agent_name} =======" in captured.out
        assert test_summary in captured.out
        assert "==========================================" in captured.out

    @pytest.mark.asyncio
    async def test_summarize_tool_with_different_agents(self, capsys):
        """Test that different agents have different summarize tools."""
        agent1_name = "Agent1"
        agent2_name = "Agent2"

        summarize1 = create_summarize_tool(agent1_name)
        summarize2 = create_summarize_tool(agent2_name)

        # Both should have the same tool name
        assert summarize1.name == summarize2.name == "summarize"

        # Test agent 1
        await summarize1.ainvoke({
            "summary": "Agent 1 summary",
            "tool_call_id": "call_1"
        })

        captured1 = capsys.readouterr()
        assert f"======= Summary for {agent1_name} =======" in captured1.out
        assert "Agent 1 summary" in captured1.out

        # Test agent 2
        await summarize2.ainvoke({
            "summary": "Agent 2 summary",
            "tool_call_id": "call_2"
        })

        captured2 = capsys.readouterr()
        assert f"======= Summary for {agent2_name} =======" in captured2.out
        assert "Agent 2 summary" in captured2.out

    @pytest.mark.asyncio
    async def test_summarize_empty_summary(self):
        """Test summarize tool with empty summary."""
        summarize_tool = create_summarize_tool("TestAgent")

        result = await summarize_tool.ainvoke({
            "summary": "",
            "tool_call_id": "empty_call"
        })

        # Should still return a valid Command even with empty summary
        assert isinstance(result, Command)
        assert result.update["summary"] == ""
        assert result.update["messages"][0].content == ""