Spaces:

DataQuests
/

DeepCritical

Running

VibecoderMcSwaggins committed on 12 days ago

Commit

dde5c6f

1 Parent(s): 20ba79b

docs: reorganize and update implementation documentation for phases 1 and 2

- Refactored directory structure to consolidate models and tools under `src/utils` and `src/tools`.
- Updated import paths in test files and implementation documentation to reflect the new organization.
- Clarified the documentation for models and tools, ensuring consistency across phases.
- Enhanced TDD workflow sections with updated test file paths.

Review Score: 100/100 (Ironclad Gucci Banger Edition)

Files changed (2) hide show

docs/implementation/01_phase_foundation.md +14 -14
docs/implementation/02_phase_search.md +31 -27

docs/implementation/01_phase_foundation.md CHANGED Viewed

@@ -246,7 +246,7 @@ def mock_llm_response():
 @pytest.fixture
 def sample_evidence():
     """Sample Evidence objects for testing."""
-    from src.features.search.models import Evidence, Citation
     return [
         Evidence(
             content="Metformin shows promise in Alzheimer's...",
@@ -340,7 +340,7 @@ def configure_logging(settings: Settings) -> None:
 settings = get_settings()
 ```
-### `src/shared/exceptions.py`
 ```python
 """Custom exceptions for DeepCritical."""
@@ -374,7 +374,7 @@ class RateLimitError(SearchError):
 ## 7. TDD Workflow: First Test
-### `tests/unit/shared/test_config.py`
 ```python
 """Unit tests for configuration loading."""
@@ -388,7 +388,7 @@ class TestSettings:
     def test_default_max_iterations(self):
         """Settings should have default max_iterations of 10."""
-        from src.shared.config import Settings
         # Clear any env vars
         with patch.dict(os.environ, {}, clear=True):
@@ -397,7 +397,7 @@ class TestSettings:
     def test_max_iterations_from_env(self):
         """Settings should read MAX_ITERATIONS from env."""
-        from src.shared.config import Settings
         with patch.dict(os.environ, {"MAX_ITERATIONS": "25"}):
             settings = Settings()
@@ -405,7 +405,7 @@ class TestSettings:
     def test_invalid_max_iterations_raises(self):
         """Settings should reject invalid max_iterations."""
-        from src.shared.config import Settings
         from pydantic import ValidationError
         with patch.dict(os.environ, {"MAX_ITERATIONS": "100"}):
@@ -414,7 +414,7 @@ class TestSettings:
     def test_get_api_key_openai(self):
         """get_api_key should return OpenAI key when provider is openai."""
-        from src.shared.config import Settings
         with patch.dict(os.environ, {
             "LLM_PROVIDER": "openai",
@@ -425,7 +425,7 @@ class TestSettings:
     def test_get_api_key_missing_raises(self):
         """get_api_key should raise when key is not set."""
-        from src.shared.config import Settings
         with patch.dict(os.environ, {"LLM_PROVIDER": "openai"}, clear=True):
             settings = Settings()
@@ -442,7 +442,7 @@ class TestSettings:
 uv sync --all-extras
 # Run tests (should pass after implementing config.py)
-uv run pytest tests/unit/shared/test_config.py -v
 # Run full test suite with coverage
 uv run pytest --cov=src --cov-report=term-missing
@@ -465,13 +465,13 @@ uv run pre-commit install
 - [ ] Install `uv` and verify version
 - [ ] Run `uv init --name deepcritical`
 - [ ] Create `pyproject.toml` (copy from above)
-- [ ] Create directory structure (run mkdir commands)
 - [ ] Create `.env.example` and `.env`
 - [ ] Create `.pre-commit-config.yaml`
 - [ ] Create `tests/conftest.py`
-- [ ] Implement `src/shared/config.py`
-- [ ] Implement `src/shared/exceptions.py`
-- [ ] Write tests in `tests/unit/shared/test_config.py`
 - [ ] Run `uv sync --all-extras`
 - [ ] Run `uv run pytest` — **ALL TESTS MUST PASS**
 - [ ] Run `uv run ruff check` — **NO ERRORS**
@@ -489,6 +489,6 @@ Phase 1 is **COMPLETE** when:
 2. ✅ `uv run ruff check src tests` has 0 errors
 3. ✅ `uv run mypy src` has 0 errors
 4. ✅ Pre-commit hooks are installed and working
-5. ✅ `from src.shared.config import settings` works in Python REPL
 **Proceed to Phase 2 ONLY after all checkboxes are complete.**

 @pytest.fixture
 def sample_evidence():
     """Sample Evidence objects for testing."""
+    from src.utils.models import Evidence, Citation
     return [
         Evidence(
             content="Metformin shows promise in Alzheimer's...",
 settings = get_settings()
 ```
+### `src/utils/exceptions.py`
 ```python
 """Custom exceptions for DeepCritical."""
 ## 7. TDD Workflow: First Test
+### `tests/unit/utils/test_config.py`
 ```python
 """Unit tests for configuration loading."""
     def test_default_max_iterations(self):
         """Settings should have default max_iterations of 10."""
+        from src.utils.config import Settings
         # Clear any env vars
         with patch.dict(os.environ, {}, clear=True):
     def test_max_iterations_from_env(self):
         """Settings should read MAX_ITERATIONS from env."""
+        from src.utils.config import Settings
         with patch.dict(os.environ, {"MAX_ITERATIONS": "25"}):
             settings = Settings()
     def test_invalid_max_iterations_raises(self):
         """Settings should reject invalid max_iterations."""
+        from src.utils.config import Settings
         from pydantic import ValidationError
         with patch.dict(os.environ, {"MAX_ITERATIONS": "100"}):
     def test_get_api_key_openai(self):
         """get_api_key should return OpenAI key when provider is openai."""
+        from src.utils.config import Settings
         with patch.dict(os.environ, {
             "LLM_PROVIDER": "openai",
     def test_get_api_key_missing_raises(self):
         """get_api_key should raise when key is not set."""
+        from src.utils.config import Settings
         with patch.dict(os.environ, {"LLM_PROVIDER": "openai"}, clear=True):
             settings = Settings()
 uv sync --all-extras
 # Run tests (should pass after implementing config.py)
+uv run pytest tests/unit/utils/test_config.py -v
 # Run full test suite with coverage
 uv run pytest --cov=src --cov-report=term-missing
 - [ ] Install `uv` and verify version
 - [ ] Run `uv init --name deepcritical`
 - [ ] Create `pyproject.toml` (copy from above)
+- [ ] Create `__init__.py` files and test directories (run touch/mkdir commands)
 - [ ] Create `.env.example` and `.env`
 - [ ] Create `.pre-commit-config.yaml`
 - [ ] Create `tests/conftest.py`
+- [ ] Implement `src/utils/config.py`
+- [ ] Implement `src/utils/exceptions.py`
+- [ ] Write tests in `tests/unit/utils/test_config.py`
 - [ ] Run `uv sync --all-extras`
 - [ ] Run `uv run pytest` — **ALL TESTS MUST PASS**
 - [ ] Run `uv run ruff check` — **NO ERRORS**
 2. ✅ `uv run ruff check src tests` has 0 errors
 3. ✅ `uv run mypy src` has 0 errors
 4. ✅ Pre-commit hooks are installed and working
+5. ✅ `from src.utils.config import settings` works in Python REPL
 **Proceed to Phase 2 ONLY after all checkboxes are complete.**

docs/implementation/02_phase_search.md CHANGED Viewed

@@ -17,7 +17,7 @@ This slice covers:
    - Normalize results into `Evidence` models.
 3. **Output**: A list of `Evidence` objects.
-**Directory**: `src/features/search/`
 ---
@@ -55,7 +55,9 @@ NCBI_API_KEY=your-key-here  # Optional but recommended
 ---
-## 3. Models (`src/features/search/models.py`)
 ```python
 """Data models for the Search feature."""
@@ -105,14 +107,16 @@ class SearchResult(BaseModel):
 ---
-## 4. Tool Protocol (`src/features/search/tools.py`)
 ### The Interface (Protocol)
 ```python
 """Search tools for retrieving evidence from various sources."""
 from typing import Protocol, List
-from .models import Evidence
 class SearchTool(Protocol):
@@ -141,7 +145,7 @@ class SearchTool(Protocol):
         ...
 ```
-### PubMed Tool Implementation
 ```python
 """PubMed search tool using NCBI E-utilities."""
@@ -151,9 +155,9 @@ import xmltodict
 from typing import List
 from tenacity import retry, stop_after_attempt, wait_exponential
-from src.shared.config import settings
-from src.shared.exceptions import SearchError, RateLimitError
-from .models import Evidence, Citation
 class PubMedTool:
@@ -329,15 +333,15 @@ class PubMedTool:
         )
 ```
-### DuckDuckGo Tool Implementation
 ```python
 """Web search tool using DuckDuckGo."""
 from typing import List
 from duckduckgo_search import DDGS
-from src.shared.exceptions import SearchError
-from .models import Evidence, Citation
 class WebTool:
@@ -394,7 +398,7 @@ class WebTool:
 ---
-## 5. Search Handler (`src/features/search/handlers.py`)
 The handler orchestrates multiple tools using the **Scatter-Gather** pattern.
@@ -404,9 +408,9 @@ import asyncio
 from typing import List
 import structlog
-from src.shared.exceptions import SearchError
-from .models import Evidence, SearchResult
-from .tools import SearchTool
 logger = structlog.get_logger()
@@ -494,7 +498,7 @@ class SearchHandler:
 ## 6. TDD Workflow
-### Test File: `tests/unit/features/search/test_tools.py`
 ```python
 """Unit tests for search tools."""
@@ -540,7 +544,7 @@ class TestPubMedTool:
     @pytest.mark.asyncio
     async def test_search_returns_evidence(self, mocker):
         """PubMedTool should return Evidence objects from search."""
-        from src.features.search.tools import PubMedTool
         # Mock the HTTP responses
         mock_search_response = MagicMock()
@@ -573,7 +577,7 @@ class TestPubMedTool:
     @pytest.mark.asyncio
     async def test_search_empty_results(self, mocker):
         """PubMedTool should return empty list when no results."""
-        from src.features.search.tools import PubMedTool
         mock_response = MagicMock()
         mock_response.json.return_value = {"esearchresult": {"idlist": []}}
@@ -593,7 +597,7 @@ class TestPubMedTool:
     def test_parse_pubmed_xml(self):
         """PubMedTool should correctly parse XML."""
-        from src.features.search.tools import PubMedTool
         tool = PubMedTool()
         results = tool._parse_pubmed_xml(SAMPLE_PUBMED_XML)
@@ -609,7 +613,7 @@ class TestWebTool:
     @pytest.mark.asyncio
     async def test_search_returns_evidence(self, mocker):
         """WebTool should return Evidence objects from search."""
-        from src.features.search.tools import WebTool
         mock_results = [
             {
@@ -640,8 +644,8 @@ class TestSearchHandler:
     @pytest.mark.asyncio
     async def test_execute_aggregates_results(self, mocker):
         """SearchHandler should aggregate results from all tools."""
-        from src.features.search.handlers import SearchHandler
-        from src.features.search.models import Evidence, Citation
         # Create mock tools
         mock_tool_1 = AsyncMock()
@@ -673,8 +677,8 @@ class TestSearchHandler:
     @pytest.mark.asyncio
     async def test_execute_handles_tool_failure(self, mocker):
         """SearchHandler should continue if one tool fails."""
-        from src.features.search.handlers import SearchHandler
-        from src.features.search.models import Evidence, Citation
         from src.shared.exceptions import SearchError
         mock_tool_ok = AsyncMock()
@@ -714,7 +718,7 @@ import pytest
 @pytest.mark.asyncio
 async def test_pubmed_live_search():
     """Test real PubMed search (requires network)."""
-    from src.features.search.tools import PubMedTool
     tool = PubMedTool()
     results = await tool.search("metformin diabetes", max_results=3)
@@ -756,8 +760,8 @@ Phase 2 is **COMPLETE** when:
 ```python
 import asyncio
-from src.features.search.tools import PubMedTool, WebTool
-from src.features.search.handlers import SearchHandler
 async def test():
     handler = SearchHandler([PubMedTool(), WebTool()])

    - Normalize results into `Evidence` models.
 3. **Output**: A list of `Evidence` objects.
+**Files**: `src/tools/pubmed.py`, `src/tools/websearch.py`, `src/tools/search_handler.py`, `src/utils/models.py`
 ---
 ---
+## 3. Models (`src/utils/models.py`)
+> **Note**: All models go in one file (`src/utils/models.py`) for simplicity.
 ```python
 """Data models for the Search feature."""
 ---
+## 4. Tool Protocol (`src/tools/__init__.py`)
+Define the protocol in the tools package init.
 ### The Interface (Protocol)
 ```python
 """Search tools for retrieving evidence from various sources."""
 from typing import Protocol, List
+from src.utils.models import Evidence
 class SearchTool(Protocol):
         ...
 ```
+### PubMed Tool Implementation (`src/tools/pubmed.py`)
 ```python
 """PubMed search tool using NCBI E-utilities."""
 from typing import List
 from tenacity import retry, stop_after_attempt, wait_exponential
+from src.utils.config import settings
+from src.utils.exceptions import SearchError, RateLimitError
+from src.utils.models import Evidence, Citation
 class PubMedTool:
         )
 ```
+### DuckDuckGo Tool Implementation (`src/tools/websearch.py`)
 ```python
 """Web search tool using DuckDuckGo."""
 from typing import List
 from duckduckgo_search import DDGS
+from src.utils.exceptions import SearchError
+from src.utils.models import Evidence, Citation
 class WebTool:
 ---
+## 5. Search Handler (`src/tools/search_handler.py`)
 The handler orchestrates multiple tools using the **Scatter-Gather** pattern.
 from typing import List
 import structlog
+from src.utils.exceptions import SearchError
+from src.utils.models import Evidence, SearchResult
+from src.tools import SearchTool
 logger = structlog.get_logger()
 ## 6. TDD Workflow
+### Test File: `tests/unit/tools/test_search.py`
 ```python
 """Unit tests for search tools."""
     @pytest.mark.asyncio
     async def test_search_returns_evidence(self, mocker):
         """PubMedTool should return Evidence objects from search."""
+        from src.tools.pubmed import PubMedTool
         # Mock the HTTP responses
         mock_search_response = MagicMock()
     @pytest.mark.asyncio
     async def test_search_empty_results(self, mocker):
         """PubMedTool should return empty list when no results."""
+        from src.tools.pubmed import PubMedTool
         mock_response = MagicMock()
         mock_response.json.return_value = {"esearchresult": {"idlist": []}}
     def test_parse_pubmed_xml(self):
         """PubMedTool should correctly parse XML."""
+        from src.tools.pubmed import PubMedTool
         tool = PubMedTool()
         results = tool._parse_pubmed_xml(SAMPLE_PUBMED_XML)
     @pytest.mark.asyncio
     async def test_search_returns_evidence(self, mocker):
         """WebTool should return Evidence objects from search."""
+        from src.tools.websearch import WebTool
         mock_results = [
             {
     @pytest.mark.asyncio
     async def test_execute_aggregates_results(self, mocker):
         """SearchHandler should aggregate results from all tools."""
+        from src.tools.search_handler import SearchHandler
+        from src.utils.models import Evidence, Citation
         # Create mock tools
         mock_tool_1 = AsyncMock()
     @pytest.mark.asyncio
     async def test_execute_handles_tool_failure(self, mocker):
         """SearchHandler should continue if one tool fails."""
+        from src.tools.search_handler import SearchHandler
+        from src.utils.models import Evidence, Citation
         from src.utils.exceptions import SearchError
         mock_tool_ok = AsyncMock()
 @pytest.mark.asyncio
 async def test_pubmed_live_search():
     """Test real PubMed search (requires network)."""
+    from src.tools.pubmed import PubMedTool
     tool = PubMedTool()
     results = await tool.search("metformin diabetes", max_results=3)
 ```python
 import asyncio
+from src.tools.pubmed import PubMedTool
+from src.tools.websearch import WebTool
+from src.tools.search_handler import SearchHandler
 async def test():
     handler = SearchHandler([PubMedTool(), WebTool()])