Spaces:

MCP-1st-Birthday
/

DeepBoner

Running

VibecoderMcSwaggins committed on 12 days ago

Commit

069f0a0

1 Parent(s): 953b850

feat(phase1): Foundation & Tooling complete

* feat: initialize deepcritical project structure with core configuration and main functionality

- Added initial project files including `.python-version`, `pyproject.toml`, and main application logic in `main.py`.
- Implemented application configuration using Pydantic in `src/utils/config.py` with environment variable support.
- Created directory structure for source code and tests, including placeholders for agents, prompts, tools, and utilities.
- Added unit tests for configuration loading and validation in `tests/unit/utils/test_config.py`.

Review Score: 100/100 (Ironclad Gucci Banger Edition)

* feat(phase1): complete foundation with Python 3.11, tests, and tooling

- Fix Python version to 3.11 for HuggingFace Spaces compatibility
- Add config.py with pydantic-settings for typed configuration
- Add exceptions.py with custom exception hierarchy
- Add conftest.py with test fixtures (sample_evidence deferred to Phase 2)
- Add .env.example and .pre-commit-config.yaml
- Remove reference_repos from git tracking
- All 8 tests pass, ruff clean, mypy src clean

* fix(phase1): address Sourcery + CodeRabbit review feedback

- Use ConfigurationError instead of ValueError in get_api_key()
- Handle unknown LLM provider explicitly
- Wire up log_level in configure_logging()
- Add Anthropic provider tests (success + missing key)
- Add ConfigurationError hierarchy test
- Add catch-all base exception test

12 tests passing, ruff clean, mypy clean

Files changed (23) hide show

.env.example +13 -0
.pre-commit-config.yaml +17 -0
.python-version +1 -0
main.py +6 -0
pyproject.toml +111 -0
reference_repos/README.md +0 -54
src/__init__.py +0 -0
src/agent_factory/__init__.py +0 -0
src/prompts/__init__.py +0 -0
src/tools/__init__.py +0 -0
src/utils/__init__.py +0 -0
src/utils/config.py +89 -0
src/utils/exceptions.py +31 -0
tests/__init__.py +0 -0
tests/conftest.py +32 -0
tests/integration/__init__.py +0 -0
tests/unit/__init__.py +0 -0
tests/unit/agent_factory/__init__.py +0 -0
tests/unit/tools/__init__.py +0 -0
tests/unit/utils/__init__.py +0 -0
tests/unit/utils/test_config.py +60 -0
tests/unit/utils/test_exceptions.py +33 -0
uv.lock +0 -0

.env.example ADDED Viewed

	@@ -0,0 +1,13 @@

+# LLM Provider (choose one)
+OPENAI_API_KEY=sk-your-key-here
+ANTHROPIC_API_KEY=sk-ant-your-key-here
+# Optional: PubMed API key (higher rate limits)
+NCBI_API_KEY=your-ncbi-key-here
+# Optional: For HuggingFace deployment
+HF_TOKEN=hf_your-token-here
+# Agent Config
+MAX_ITERATIONS=10
+LOG_LEVEL=INFO

.pre-commit-config.yaml ADDED Viewed

	@@ -0,0 +1,17 @@

+repos:
+  - repo: https://github.com/astral-sh/ruff-pre-commit
+    rev: v0.4.4
+    hooks:
+      - id: ruff
+        args: [--fix]
+      - id: ruff-format
+  - repo: https://github.com/pre-commit/mirrors-mypy
+    rev: v1.10.0
+    hooks:
+      - id: mypy
+        files: ^src/
+        additional_dependencies:
+          - pydantic>=2.7
+          - pydantic-settings>=2.2
+        args: [--ignore-missing-imports]

.python-version ADDED Viewed

	@@ -0,0 +1 @@


+3.11

main.py ADDED Viewed

	@@ -0,0 +1,6 @@

+def main() -> None:
+    """Print a greeting; placeholder entry point for the deepcritical application."""
+    print("Hello from deepcritical!")
+# Run main() only when this file is executed as a script, not when it is imported.
+if __name__ == "__main__":
+    main()

pyproject.toml ADDED Viewed

	@@ -0,0 +1,111 @@

+[project]
+name = "deepcritical"
+version = "0.1.0"
+description = "AI-Native Drug Repurposing Research Agent"
+readme = "README.md"
+requires-python = ">=3.11"
+dependencies = [
+    # Core
+    "pydantic>=2.7",
+    "pydantic-settings>=2.2",      # For BaseSettings (config)
+    "pydantic-ai>=0.0.16",          # Agent framework
+    # HTTP & Parsing
+    "httpx>=0.27",                   # Async HTTP client
+    "beautifulsoup4>=4.12",          # HTML parsing
+    "xmltodict>=0.13",               # PubMed XML -> dict
+    # Search
+    "duckduckgo-search>=6.0",        # Free web search
+    # UI
+    "gradio>=5.0",                   # Chat interface
+    # Utils
+    "python-dotenv>=1.0",            # .env loading
+    "tenacity>=8.2",                 # Retry logic
+    "structlog>=24.1",               # Structured logging
+]
+[project.optional-dependencies]
+dev = [
+    # Testing
+    "pytest>=8.0",
+    "pytest-asyncio>=0.23",
+    "pytest-sugar>=1.0",
+    "pytest-cov>=5.0",
+    "pytest-mock>=3.12",
+    "respx>=0.21",                   # Mock httpx requests
+    # Quality
+    "ruff>=0.4.0",
+    "mypy>=1.10",
+    "pre-commit>=3.7",
+]
+[build-system]
+requires = ["hatchling"]
+build-backend = "hatchling.build"
+[tool.hatch.build.targets.wheel]
+packages = ["src"]
+# ============== RUFF CONFIG ==============
+[tool.ruff]
+line-length = 100
+target-version = "py311"
+src = ["src", "tests"]
+[tool.ruff.lint]
+select = [
+    "E",    # pycodestyle errors
+    "F",    # pyflakes
+    "B",    # flake8-bugbear
+    "I",    # isort
+    "N",    # pep8-naming
+    "UP",   # pyupgrade
+    "PL",   # pylint
+    "RUF",  # ruff-specific
+]
+ignore = [
+    "PLR0913",  # Too many arguments (agents need many params)
+]
+[tool.ruff.lint.isort]
+known-first-party = ["src"]
+# ============== MYPY CONFIG ==============
+[tool.mypy]
+python_version = "3.11"
+strict = true
+ignore_missing_imports = true
+disallow_untyped_defs = true
+warn_return_any = true
+warn_unused_ignores = true
+# ============== PYTEST CONFIG ==============
+[tool.pytest.ini_options]
+testpaths = ["tests"]
+asyncio_mode = "auto"
+addopts = [
+    "-v",
+    "--tb=short",
+    "--strict-markers",
+]
+markers = [
+    "unit: Unit tests (mocked)",
+    "integration: Integration tests (real APIs)",
+    "slow: Slow tests",
+]
+# ============== COVERAGE CONFIG ==============
+[tool.coverage.run]
+source = ["src"]
+omit = ["*/__init__.py"]
+[tool.coverage.report]
+exclude_lines = [
+    "pragma: no cover",
+    "if TYPE_CHECKING:",
+    "raise NotImplementedError",
+]

reference_repos/README.md DELETED Viewed

@@ -1,54 +0,0 @@
-# Reference Repositories
-This directory contains reference implementations that inform our architecture. These repos are **git-ignored** and should be cloned locally.
-## Clone Commands
-```bash
-cd reference_repos
-# PydanticAI Research Agent (Brave Search + Agent patterns)
-git clone --depth 1 https://github.com/coleam00/PydanticAI-Research-Agent.git pydanticai-research-agent
-rm -rf pydanticai-research-agent/.git
-# PubMed MCP Server (Production-grade, TypeScript)
-git clone --depth 1 https://github.com/cyanheads/pubmed-mcp-server.git pubmed-mcp-server
-rm -rf pubmed-mcp-server/.git
-# Microsoft AutoGen (Multi-agent orchestration)
-git clone --depth 1 https://github.com/microsoft/autogen.git autogen-microsoft
-rm -rf autogen-microsoft/.git
-# Claude Agent SDK (Anthropic's agent framework)
-git clone --depth 1 https://github.com/anthropics/claude-agent-sdk-python.git claude-agent-sdk
-rm -rf claude-agent-sdk/.git
-```
-## What Each Repo Provides
-| Repository | Key Patterns | Reference In Docs |
-|------------|--------------|-------------------|
-| **pydanticai-research-agent** | @agent.tool decorator, Brave Search, dependency injection | Section 16 |
-| **pubmed-mcp-server** | PubMed E-utilities, MCP server patterns, research agent | Section 16 |
-| **autogen-microsoft** | Multi-agent orchestration, reflect_on_tool_use | Sections 14, 15 |
-| **claude-agent-sdk** | @tool decorator, hooks system, in-process MCP | Sections 14, 15 |
-## Quick Reference Files
-### PydanticAI Research Agent
-- `agents/research_agent.py` - Agent with @agent.tool pattern
-- `tools/brave_search.py` - Brave Search implementation
-- `models/research_models.py` - Pydantic models
-### PubMed MCP Server
-- `src/mcp-server/tools/pubmedSearchArticles/` - PubMed search
-- `src/mcp-server/tools/pubmedResearchAgent/` - Research orchestrator
-- `src/services/NCBI/` - NCBI E-utilities client
-### AutoGen
-- `python/packages/autogen-agentchat/` - Agent patterns
-- `python/packages/autogen-core/` - Core abstractions
-### Claude Agent SDK
-- `src/claude_agent_sdk/client.py` - SDK client
-- `examples/mcp_calculator.py` - @tool decorator example

src/__init__.py ADDED Viewed

File without changes

src/agent_factory/__init__.py ADDED Viewed

File without changes

src/prompts/__init__.py ADDED Viewed

File without changes

src/tools/__init__.py ADDED Viewed

File without changes

src/utils/__init__.py ADDED Viewed

File without changes

src/utils/config.py ADDED Viewed

	@@ -0,0 +1,89 @@

+"""Application configuration using Pydantic Settings."""
+import logging
+from typing import Literal
+import structlog
+from pydantic import Field
+from pydantic_settings import BaseSettings, SettingsConfigDict
+from src.utils.exceptions import ConfigurationError
+class Settings(BaseSettings):
+    """Strongly-typed application settings."""
+    model_config = SettingsConfigDict(
+        env_file=".env",
+        env_file_encoding="utf-8",
+        case_sensitive=False,
+        extra="ignore",
+    )
+    # LLM Configuration
+    openai_api_key: str | None = Field(default=None, description="OpenAI API key")
+    anthropic_api_key: str | None = Field(default=None, description="Anthropic API key")
+    llm_provider: Literal["openai", "anthropic"] = Field(
+        default="openai", description="Which LLM provider to use"
+    )
+    openai_model: str = Field(default="gpt-4o", description="OpenAI model name")
+    anthropic_model: str = Field(
+        default="claude-3-5-sonnet-20241022", description="Anthropic model"
+    )
+    # PubMed Configuration
+    ncbi_api_key: str | None = Field(
+        default=None, description="NCBI API key for higher rate limits"
+    )
+    # Agent Configuration
+    max_iterations: int = Field(default=10, ge=1, le=50)
+    search_timeout: int = Field(default=30, description="Seconds to wait for search")
+    # Logging
+    log_level: Literal["DEBUG", "INFO", "WARNING", "ERROR"] = "INFO"
+    def get_api_key(self) -> str:
+        """Get the API key for the configured provider."""
+        if self.llm_provider == "openai":
+            if not self.openai_api_key:
+                raise ConfigurationError("OPENAI_API_KEY not set")
+            return self.openai_api_key
+        if self.llm_provider == "anthropic":
+            if not self.anthropic_api_key:
+                raise ConfigurationError("ANTHROPIC_API_KEY not set")
+            return self.anthropic_api_key
+        raise ConfigurationError(f"Unknown LLM provider: {self.llm_provider}")
+def get_settings() -> Settings:
+    """Build and return a new ``Settings`` instance.
+
+    Each call constructs a fresh object (nothing is cached here). Having a factory
+    function gives tests a single place to patch.
+    """
+    return Settings()
+def configure_logging(settings: Settings) -> None:
+    """Configure structured logging with the configured log level."""
+    # Set stdlib logging level from settings
+    logging.basicConfig(
+        level=getattr(logging, settings.log_level),
+        format="%(message)s",
+    )
+    structlog.configure(
+        processors=[
+            structlog.stdlib.filter_by_level,
+            structlog.stdlib.add_logger_name,
+            structlog.stdlib.add_log_level,
+            structlog.processors.TimeStamper(fmt="iso"),
+            structlog.processors.JSONRenderer(),
+        ],
+        wrapper_class=structlog.stdlib.BoundLogger,
+        context_class=dict,
+        logger_factory=structlog.stdlib.LoggerFactory(),
+    )
+# Singleton for easy import.
+# NOTE: this is built when the module is imported, so importing this module
+# constructs Settings immediately.
+settings = get_settings()

src/utils/exceptions.py ADDED Viewed

	@@ -0,0 +1,31 @@

+"""Custom exceptions for DeepCritical."""
+class DeepCriticalError(Exception):
+    """Base exception for all DeepCritical errors."""
+    pass
+class SearchError(DeepCriticalError):
+    """Raised when a search operation fails."""
+    pass
+class JudgeError(DeepCriticalError):
+    """Raised when the judge fails to assess evidence."""
+    pass
+class ConfigurationError(DeepCriticalError):
+    """Raised when configuration is invalid."""
+    pass
+class RateLimitError(SearchError):
+    """Raised when we hit API rate limits."""
+    pass

tests/__init__.py ADDED Viewed

File without changes

tests/conftest.py ADDED Viewed

	@@ -0,0 +1,32 @@

+"""Shared pytest fixtures for all tests."""
+from unittest.mock import AsyncMock
+import pytest
+@pytest.fixture
+def mock_httpx_client(mocker):
+    """Mock httpx.AsyncClient for API tests."""
+    mock = mocker.patch("httpx.AsyncClient")
+    mock.return_value.__aenter__ = AsyncMock(return_value=mock.return_value)
+    mock.return_value.__aexit__ = AsyncMock(return_value=None)
+    return mock
+@pytest.fixture
+def mock_llm_response():
+    """Factory fixture for mocking LLM responses."""
+    def _mock(content: str):
+        return AsyncMock(return_value=content)
+    return _mock
+# NOTE: sample_evidence fixture will be added in Phase 2 when models.py exists
+# @pytest.fixture
+# def sample_evidence():
+#     """Sample Evidence objects for testing."""
+#     from src.utils.models import Citation, Evidence
+#     return [...]

tests/integration/__init__.py ADDED Viewed

File without changes

tests/unit/__init__.py ADDED Viewed

File without changes

tests/unit/agent_factory/__init__.py ADDED Viewed

File without changes

tests/unit/tools/__init__.py ADDED Viewed

File without changes

tests/unit/utils/__init__.py ADDED Viewed

File without changes

tests/unit/utils/test_config.py ADDED Viewed

	@@ -0,0 +1,60 @@

+"""Unit tests for configuration loading."""
+import os
+from unittest.mock import patch
+import pytest
+from pydantic import ValidationError
+from src.utils.config import Settings
+from src.utils.exceptions import ConfigurationError
+class TestSettings:
+    """Tests for Settings class."""
+    def test_default_max_iterations(self):
+        """Settings should have default max_iterations of 10."""
+        with patch.dict(os.environ, {}, clear=True):
+            settings = Settings()
+            assert settings.max_iterations == 10  # noqa: PLR2004
+    def test_max_iterations_from_env(self):
+        """Settings should read MAX_ITERATIONS from env."""
+        with patch.dict(os.environ, {"MAX_ITERATIONS": "25"}):
+            settings = Settings()
+            assert settings.max_iterations == 25  # noqa: PLR2004
+    def test_invalid_max_iterations_raises(self):
+        """Settings should reject invalid max_iterations."""
+        with patch.dict(os.environ, {"MAX_ITERATIONS": "100"}):
+            with pytest.raises(ValidationError):
+                Settings()  # 100 > 50 (max)
+    def test_get_api_key_openai(self):
+        """get_api_key should return OpenAI key when provider is openai."""
+        with patch.dict(os.environ, {"LLM_PROVIDER": "openai", "OPENAI_API_KEY": "sk-test-key"}):
+            settings = Settings()
+            assert settings.get_api_key() == "sk-test-key"
+    def test_get_api_key_openai_missing_raises(self):
+        """get_api_key should raise ConfigurationError when OpenAI key is not set."""
+        with patch.dict(os.environ, {"LLM_PROVIDER": "openai"}, clear=True):
+            settings = Settings()
+            with pytest.raises(ConfigurationError, match="OPENAI_API_KEY not set"):
+                settings.get_api_key()
+    def test_get_api_key_anthropic(self):
+        """get_api_key should return Anthropic key when provider is anthropic."""
+        with patch.dict(
+            os.environ, {"LLM_PROVIDER": "anthropic", "ANTHROPIC_API_KEY": "sk-ant-test-key"}
+        ):
+            settings = Settings()
+            assert settings.get_api_key() == "sk-ant-test-key"
+    def test_get_api_key_anthropic_missing_raises(self):
+        """get_api_key should raise ConfigurationError when Anthropic key is not set."""
+        with patch.dict(os.environ, {"LLM_PROVIDER": "anthropic"}, clear=True):
+            settings = Settings()
+            with pytest.raises(ConfigurationError, match="ANTHROPIC_API_KEY not set"):
+                settings.get_api_key()

tests/unit/utils/test_exceptions.py ADDED Viewed

	@@ -0,0 +1,33 @@

+"""Unit tests for custom exceptions."""
+from src.utils.exceptions import (
+    ConfigurationError,
+    DeepCriticalError,
+    JudgeError,
+    RateLimitError,
+    SearchError,
+)
+class TestExceptions:
+    """Tests for exception hierarchy."""
+    def test_search_error_is_deepcritical_error(self):
+        assert issubclass(SearchError, DeepCriticalError)
+    def test_rate_limit_error_is_search_error(self):
+        assert issubclass(RateLimitError, SearchError)
+    def test_judge_error_is_deepcritical_error(self):
+        assert issubclass(JudgeError, DeepCriticalError)
+    def test_configuration_error_is_deepcritical_error(self):
+        assert issubclass(ConfigurationError, DeepCriticalError)
+    def test_subclass_caught_as_base(self):
+        """Verify subclasses can be caught via DeepCriticalError."""
+        try:
+            raise RateLimitError("rate limited")
+        except DeepCriticalError as exc:
+            assert isinstance(exc, RateLimitError)
+            assert isinstance(exc, DeepCriticalError)

uv.lock ADDED Viewed

The diff for this file is too large to render. See raw diff