This commit is contained in:
Andrew Ridgway 2026-05-08 23:46:17 +10:00
commit 10c8cfaa0f
Signed by: armistace
GPG Key ID: C8D9EAC514B47EF1
71 changed files with 2139 additions and 0 deletions

36
.env.example Normal file
View File

@ -0,0 +1,36 @@
# LLM Configuration
# Choose one of the following LLM providers:
# For OpenAI:
LLM_MODEL=gpt-4
LLM_BASE_URL=https://api.openai.com/v1
LLM_API_KEY=your_openai_api_key_here
LLM_PROVIDER=openai
# For Anthropic:
# LLM_MODEL=claude-3-opus-20240229
# LLM_BASE_URL=https://api.anthropic.com
# LLM_API_KEY=your_anthropic_api_key_here
# LLM_PROVIDER=anthropic
# For Ollama (local):
# LLM_MODEL=llama2
# LLM_BASE_URL=http://localhost:11434
# LLM_API_KEY=ollama # Ollama doesn't require a real API key
# LLM_PROVIDER=ollama
# MCP Server Configuration
# Hadolint MCP Server (installed via pip in Docker)
# Checkov MCP Server (installed via pip in Docker)
# Semgrep MCP Server (native, no configuration needed)
# Trivy MCP Server (native, no configuration needed)
# Optional: Semgrep App URL and Token for Semgrep App functionality
SEMGRAPH_APP_URL=
SEMGRAPH_API_TOKEN=
# Timeout Configuration (in seconds)
TOTAL_FLOW_TIMEOUT=600
PER_CREW_TIMEOUT=300
# Other Configuration
LOG_LEVEL=INFO

View File

@ -0,0 +1,72 @@
name: Build and Push Image
on:
  push:
    branches:
      - master
jobs:
  build:
    name: Build and push image
    runs-on: ubuntu-latest
    container: catthehacker/ubuntu:act-latest
    if: gitea.ref == 'refs/heads/master'
    steps:
      - name: Checkout
        uses: actions/checkout@v4
      - name: Create Kubeconfig
        run: |
          # -p: do not fail if the directory already exists (e.g. cached runner)
          mkdir -p $HOME/.kube
          echo "${{ secrets.KUBEC_CONFIG_BUILDX_NEW }}" > $HOME/.kube/config
      - name: Set up Docker Buildx
        uses: docker/setup-buildx-action@v3
        with:
          driver: kubernetes
          driver-opts: |
            namespace=gitea-runner
            qemu.install=true
      - name: Login to Docker Registry
        uses: docker/login-action@v3
        with:
          registry: git.aridgwayweb.com
          username: armistace
          password: ${{ secrets.REG_PASSWORD }}
      - name: Build and push
        uses: docker/build-push-action@v5
        with:
          context: .
          push: true
          platforms: linux/amd64,linux/arm64
          tags: |
            git.aridgwayweb.com/armistace/pr-reviewer:latest
      - name: Trivy Scan
        run: |
          echo "Installing Trivy "
          sudo apt-get update
          sudo apt-get install -y wget apt-transport-https gnupg lsb-release
          wget -qO - https://aquasecurity.github.io/trivy-repo/deb/public.key | sudo apt-key add -
          echo deb https://aquasecurity.github.io/trivy-repo/deb $(lsb_release -sc) main | sudo tee -a /etc/apt/sources.list.d/trivy.list
          sudo apt-get update
          sudo apt-get install -y trivy
          trivy image --format table --exit-code 1 --ignore-unfixed --vuln-type os,library --severity HIGH,CRITICAL git.aridgwayweb.com/armistace/pr-reviewer:latest
      - name: Deploy
        run: |
          echo "Installing Kubectl"
          apt-get update
          apt-get install -y apt-transport-https ca-certificates curl gnupg
          # /etc/apt/keyrings is not guaranteed to exist on this base image
          mkdir -p /etc/apt/keyrings
          curl -fsSL https://pkgs.k8s.io/core:/stable:/v1.33/deb/Release.key | gpg --dearmor -o /etc/apt/keyrings/kubernetes-apt-keyring.gpg
          chmod 644 /etc/apt/keyrings/kubernetes-apt-keyring.gpg
          echo 'deb [signed-by=/etc/apt/keyrings/kubernetes-apt-keyring.gpg] https://pkgs.k8s.io/core:/stable:/v1.33/deb/ /' | tee /etc/apt/sources.list.d/kubernetes.list
          chmod 644 /etc/apt/sources.list.d/kubernetes.list
          apt-get update
          # -y: apt would otherwise prompt and hang the non-interactive runner
          apt-get install -y kubectl
          # --ignore-not-found: first deploy has no namespace to delete yet
          kubectl delete namespace pr-reviewer --ignore-not-found=true
          kubectl create namespace pr-reviewer
          kubectl create secret docker-registry regcred --docker-server=${{ vars.DOCKER_SERVER }} --docker-username=${{ vars.DOCKER_USERNAME }} --docker-password='${{ secrets.DOCKER_PASSWORD }}' --docker-email=${{ vars.DOCKER_EMAIL }} --namespace=pr-reviewer
          kubectl apply -f kube/pr-reviewer_pod.yaml && kubectl apply -f kube/pr-reviewer_deployment.yaml && kubectl apply -f kube/pr-reviewer_service.yaml

1
.gitignore vendored Normal file
View File

@ -0,0 +1 @@
.spec/

64
Dockerfile Normal file
View File

@ -0,0 +1,64 @@
# Stage 1: Base with system dependencies and tool installations
FROM python:3.12-slim AS builder

# Build-time system dependencies
RUN apt-get update && apt-get install -y \
    git \
    curl \
    && rm -rf /var/lib/apt/lists/*

# Install Hadolint (for Dockerfile linting)
RUN curl -Lo /bin/hadolint https://github.com/hadolint/hadolint/releases/download/v2.12.0/hadolint-Linux-x86_64 && \
    chmod +x /bin/hadolint

# Install Checkov (for Kubernetes security scanning)
RUN pip install checkov==3.1.123

# Install Trivy (for container and IaC scanning) - Native MCP server
RUN curl -sfL https://raw.githubusercontent.com/aquasecurity/trivy/main/contrib/install.sh | sh -s -- -b /usr/local/bin v0.47.0

# Install Semgrep (for code scanning) - Will use native MCP server
RUN pip install semgrep==1.76.0

# Install UV package manager
COPY --from=ghcr.io/astral-sh/uv:latest /uv /uvx /bin/

# Stage 2: App with source code and UV sync
FROM python:3.12-slim

# Install runtime dependencies while still root: apt-get cannot run as a
# non-root user (previously this ran after USER app and would fail).
RUN apt-get update && apt-get install -y \
    git \
    && rm -rf /var/lib/apt/lists/*

# Create non-root user
RUN useradd --create-home --shell /bin/bash app

# Carry the scanner binaries into the runtime image; they were installed
# only in the builder stage and would otherwise be absent at runtime.
COPY --from=builder /bin/hadolint /bin/hadolint
COPY --from=builder /usr/local/bin/trivy /usr/local/bin/trivy
# NOTE(review): checkov and semgrep are pip-installed in the builder stage
# only; confirm `uv sync` provides them in this stage, or install them here.

# Copy UV from builder stage
COPY --from=builder /bin/uv /bin/uv
COPY --from=builder /bin/uvx /bin/uvx

WORKDIR /app
# WORKDIR creates /app as root; hand it to the app user so `uv sync` can
# create the .venv directory.
RUN chown app:app /app
USER app

# Copy application code
COPY --chown=app:app pyproject.toml .
COPY --chown=app:app README.md .
COPY --chown=app:app src/ ./src/
COPY --chown=app:app mcp_servers/ ./mcp_servers/
COPY --chown=app:app crews/ ./crews/
COPY --chown=app:app tools/ ./tools/
COPY --chown=app:app config/ ./config/
COPY --chown=app:app contexts/ ./contexts/

# Install Python dependencies using UV
RUN uv sync --frozen --no-dev

# Set environment variables
ENV PYTHONPATH=/app/src
ENV PATH="/app/.venv/bin:$PATH"

# Expose port
EXPOSE 8000

# Set entrypoint
ENTRYPOINT ["uvicorn", "src.pr_reviewer.main:app", "--host", "0.0.0.0", "--port", "8000"]

185
README.md Normal file
View File

@ -0,0 +1,185 @@
# PR Reviewer
An automated pull request review system using CrewAI and MCP (Model Context Protocol).
## Overview
This system provides automated code, security, and infrastructure reviews for pull requests using a multi-agent approach. It leverages CrewAI for orchestrating specialized review agents and MCP (Model Context Protocol) for integrating with various static analysis tools.
## Features
- **Code Review**: Uses Semgrep (via MCP) to check code quality, best practices, and maintainability
- **Security Review**: Uses Trivy (native MCP) to identify security vulnerabilities
- **Infrastructure Review**: Uses Hadolint and Checkov (via MCP wrappers) to review Dockerfiles and Kubernetes manifests
- **Contextual Review**: Incorporates customizable guidelines for code, security, and infrastructure reviews
- **Automated Orchestration**: Uses CrewAI Flows to manage the review process
- **REST API**: FastAPI endpoint for triggering reviews
- **Containerized**: Docker support for easy deployment
## Architecture
The system follows a modular architecture with:
- State management using Pydantic models
- LLM factory for flexible provider support (OpenAI, Anthropic, Ollama)
- Context resolution system for incorporating review guidelines
- Crew-based implementation for each review type (code, security, infrastructure)
- MCP server integrations for static analysis tools
- Flow-based orchestration for managing the review process
- RESTful API for integration with CI/CD systems
## Installation
### Prerequisites
- Python 3.10-3.13
- UV package manager
- Git
- Docker (optional, for containerized deployment)
### Local Development
1. Clone the repository
2. Install UV package manager: `curl -LsSf https://astral.sh/uv/install.sh | sh`
3. Activate UV environment: `source $HOME/.local/bin/env`
4. Create virtual environment: `uv venv .venv`
5. Activate virtual environment: `source .venv/bin/activate`
6. Install dependencies: `uv pip install -e .`
7. Configure environment variables (see `.env.example`)
### Docker Deployment
1. Build the Docker image: `docker build -t pr-reviewer .`
2. Run the container: `docker run -p 8000:8000 --env-file .env pr-reviewer`
## Usage
### API Endpoints
#### Health Check
```bash
GET /api/v1/health
```
Returns the health status of the service.
#### Trigger PR Review
```bash
POST /api/v1/review
```
Initiates a pull request review.
Request Body:
```json
{
"pr_id": "123",
"title": "Add new feature",
"description": "This PR adds a new feature to the application",
"repo": {
"name": "my-repo",
"url": "https://github.com/user/my-repo"
},
"source": {
"branch": "feature/new-feature",
"commit": "abc123"
},
"target": {
"branch": "main",
"commit": "def456"
},
"files": [
{
"path": "src/main.py",
"content": "print('Hello World')",
"status": "modified",
"additions": 1,
"deletions": 0
}
],
"context": {
"code_review": "Follow PEP8 guidelines",
"security_review": "Check for SQL injection vulnerabilities",
"infra_review": "Ensure Dockerfile follows best practices"
}
}
```
Response:
```json
{
"review_id": "uuid-string",
"status": "completed",
"timestamp": "2023-05-08T10:00:00Z",
"results": {
"code_review": "Code review results...",
"security_review": "Security review results...",
"infra_review": "Infrastructure review results...",
"summary": "Synthesized review summary..."
},
"metadata": {
"processing_time_seconds": 45.2,
"pr_id": "123",
"repo": {
"name": "my-repo",
"url": "https://github.com/user/my-repo"
}
}
}
```
## Configuration
### Environment Variables
See `.env.example` for detailed configuration options.
### Context Files
Default review guidelines are located in `contexts/defaults/`:
- `code_review.md`: Coding practice guidelines
- `security_review.md`: Security guidelines
- `infra_review.md`: Infrastructure guidelines
These can be overridden via the API context parameter.
## Development
### Running Tests
```bash
# Run unit tests
pytest
# Run tests with coverage
pytest --cov=src.pr_reviewer
# Run specific test categories
pytest tests/unit/
pytest tests/integration/
```
### Code Style
The project uses Black for code formatting and Flake8 for linting.
Run formatting:
```bash
black src/
```
Run linting:
```bash
flake8 src/
```
## Deployment
### Kubernetes
Kubernetes manifests are available in the `kube/` directory:
- Secret for LLM configuration
- Deployment for the PR Reviewer service
- Service for exposing the API
### Gitea Actions
A Gitea Actions workflow for CI/CD is available in `.gitea/workflows/deploy.yaml`.
## License
MIT
## Contributing
1. Fork the repository
2. Create a feature branch
3. Commit your changes
4. Push to the branch
5. Open a pull request

0
config/__init__.py Normal file
View File

7
config/agents.yaml Normal file
View File

@ -0,0 +1,7 @@
# Summarizer Agent Configuration
summariser:
role: Senior Code Review Coordinator
goal: Synthesize individual review results into a cohesive, actionable review report
backstory: You are a senior technical lead with extensive experience in code review practices across multiple domains. You excel at combining feedback from different reviewers into a clear, prioritized, and actionable summary that helps development teams improve their code efficiently.
verbose: true
allow_delegation: false

16
config/tasks.yaml Normal file
View File

@ -0,0 +1,16 @@
# Summarizer Task Configuration
summarise_task:
description: |
Synthesize the results from code, security, and infrastructure reviews into a cohesive review report.
Code Review Results: {code_review_results}
Security Review Results: {security_review_results}
Infrastructure Review Results: {infra_review_results}
Context: {context}
expected_output: |
A comprehensive review report that includes:
- Executive summary of all findings
- Prioritized list of issues (critical, high, medium, low)
- Specific recommendations for each domain (code, security, infrastructure)
- Overall assessment and recommendation (e.g., Approved, Approved with Minor Changes, Significant Changes Needed)
- Summary of positive aspects of the PR
agent: summariser

View File

View File

@ -0,0 +1,19 @@
# Code Review Guidelines
## General Principles
- Write clean, readable, and maintainable code.
- Follow the project's coding standards and style guides.
- Ensure code is well-tested and documented.
- Avoid code duplication; refactor when necessary.
- Use meaningful names for variables, functions, and classes.
- Keep functions and classes focused on a single responsibility.
## Specific Checks
- [ ] Code follows the project's style guide (e.g., PEP8 for Python).
- [ ] No commented-out code or debug prints in production code.
- [ ] Proper error handling and logging.
- [ ] Resource management (e.g., closing files, releasing network connections).
- [ ] Security best practices (input validation, output encoding, etc.).
- [ ] Performance considerations (avoid unnecessary loops, optimize database queries).
- [ ] Unit tests are present and passing for new code.
- [ ] Changes are backward compatible or have a migration plan.

View File

@ -0,0 +1,22 @@
# Security Review Guidelines
## General Principles
- Follow the principle of least privilege.
- Validate and sanitize all user inputs.
- Use secure coding practices to prevent common vulnerabilities.
- Keep dependencies up to date and monitor for known security issues.
- Implement proper authentication and authorization mechanisms.
- Encrypt sensitive data at rest and in transit.
- Log security-relevant events and monitor for suspicious activities.
## Specific Checks
- [ ] Input validation and sanitization (SQL injection, XSS, command injection, etc.).
- [ ] Proper authentication and session management.
- [ ] Authorization checks (users can only access resources they are permitted to).
- [ ] Secure handling of sensitive data (passwords, tokens, PII).
- [ ] Use of up-to-date and secure dependencies (no known vulnerabilities).
- [ ] Proper error handling that does not leak sensitive information.
- [ ] Secure configuration (e.g., not using default passwords, disabling unnecessary services).
- [ ] Communication security (use of HTTPS, proper certificate validation).
- [ ] Protection against CSRF, clickjacking, and other web vulnerabilities.
- [ ] Secure file uploads (if applicable).

View File

View File

@ -0,0 +1,55 @@
from crewai import CrewBase, Agent, Task, Crew
from crewai_tools import MCPServerAdapter
from mcp import StdioServerParameters
import os
from typing import Dict, Any
class CodeReviewCrew(CrewBase):
    """Code Review Crew for conducting code quality reviews."""

    agents_config = "config/agents.yaml"
    tasks_config = "config/tasks.yaml"

    def __init__(self):
        super().__init__()
        # Semgrep runs as a stdio MCP subprocess; inherit the current
        # environment and add the Semgrep App settings (empty when unset).
        semgrep_env = dict(os.environ)
        semgrep_env["SEMGRAPH_APP_URL"] = os.getenv("SEMGRAPH_APP_URL", "")
        semgrep_env["SEMGRAPH_API_TOKEN"] = os.getenv("SEMGRAPH_API_TOKEN", "")
        self.semgrep_server_params = StdioServerParameters(
            command="semgrep",
            args=["--metrics=off", "--json", "--stdin-display-name", "scanned_code", "--"],
            env=semgrep_env,
        )

    @Agent
    def code_reviewer(self) -> Agent:
        """Senior Software Engineer agent for code review."""
        reviewer_cfg = self.agents_config["code_reviewer"]
        # Tools are supplied through the MCP adapter when the crew is built.
        return Agent(config=reviewer_cfg, tools=[], verbose=True)

    @Task
    def code_review_task(self) -> Task:
        """Task for conducting code review."""
        return Task(config=self.tasks_config["code_review_task"])

    @Crew
    def crew(self) -> Crew:
        """Create the Code Review crew."""
        # Adapter exposing the Semgrep MCP server's tools (empty if the
        # adapter implementation does not publish a `tools` attribute).
        adapter = MCPServerAdapter(self.semgrep_server_params)
        return Crew(
            agents=[self.code_reviewer()],
            tasks=[self.code_review_task()],
            process="sequential",
            verbose=True,
            tools=getattr(adapter, "tools", []),
        )

View File

@ -0,0 +1,7 @@
# Code Review Crew Agents Configuration
code_reviewer:
role: Senior Software Engineer
goal: Conduct thorough code reviews focusing on code quality, best practices, and maintainability
backstory: You are an experienced software engineer with a keen eye for detail and a passion for clean code. You have reviewed thousands of pull requests and helped teams improve their code quality.
verbose: true
allow_delegation: false

View File

@ -0,0 +1,16 @@
# Code Review Crew Tasks Configuration
code_review_task:
description: |
Review the code changes in the pull request for quality, best practices, and maintainability.
PR Title: {pr_title}
PR Description: {pr_description}
Files to review: {files}
Context: {context}
expected_output: |
A detailed code review report including:
- Summary of changes
- Code quality issues (if any)
- Best practices violations (if any)
- Suggestions for improvement
- Overall rating (e.g., Approved, Changes Needed)
agent: code_reviewer

View File

View File

@ -0,0 +1,7 @@
# Infrastructure Review Crew Agents Configuration
infra_reviewer:
role: DevOps/Platform Engineer
goal: Review infrastructure as code for correctness, security, and best practices
backstory: You are an experienced DevOps engineer with expertise in infrastructure as code, Kubernetes, Docker, and cloud platforms. You help teams ensure their infrastructure is secure, scalable, and follows best practices.
verbose: true
allow_delegation: false

View File

@ -0,0 +1,16 @@
# Infrastructure Review Crew Tasks Configuration
infra_review_task:
description: |
Review the infrastructure as code (IaC) in the pull request for correctness, security, and best practices.
PR Title: {pr_title}
PR Description: {pr_description}
Files to review: {files}
Context: {context}
expected_output: |
A detailed infrastructure review report including:
- Summary of infrastructure changes
- Issues found (misconfigurations, security vulnerabilities, etc.)
- Best practices violations (if any)
- Suggestions for improvement
- Overall rating (e.g., Approved, Needs Changes)
agent: infra_reviewer

View File

@ -0,0 +1,65 @@
from crewai import CrewBase, Agent, Task, Crew
from crewai_tools import MCPServerAdapter
from mcp import StdioServerParameters
import os
from typing import Dict, Any
class InfraReviewCrew(CrewBase):
    """Infrastructure Review Crew for conducting infrastructure reviews."""

    agents_config = "config/agents.yaml"
    tasks_config = "config/tasks.yaml"

    def __init__(self):
        super().__init__()
        # The MCP wrapper scripts were previously referenced via a hard-coded
        # developer home directory (/home/armistace/dev/pr_reviewer/...),
        # which does not exist inside the Docker image (code lives in /app).
        # Resolve them relative to this file instead, with an env-var
        # override for non-standard layouts.
        # NOTE(review): assumes this module sits two levels below the repo
        # root (crews/<crew_name>/) with mcp_servers/ at the root — confirm.
        mcp_dir = os.getenv("MCP_SERVERS_DIR") or os.path.normpath(
            os.path.join(os.path.dirname(os.path.abspath(__file__)), "..", "..", "mcp_servers")
        )
        # Hadolint MCP server connection (Dockerfile linting)
        self.hadolint_server_params = StdioServerParameters(
            command="python",
            args=[os.path.join(mcp_dir, "hadolint_mcp.py")],
            env=os.environ,
        )
        # Checkov MCP server connection (Kubernetes manifest scanning)
        self.checkov_server_params = StdioServerParameters(
            command="python",
            args=[os.path.join(mcp_dir, "checkov_mcp.py")],
            env=os.environ,
        )

    @Agent
    def infra_reviewer(self) -> Agent:
        """DevOps/Platform Engineer agent for infrastructure review."""
        return Agent(
            config=self.agents_config["infra_reviewer"],
            tools=[],  # Tools are attached via the MCP adapters in crew()
            verbose=True,
        )

    @Task
    def infra_review_task(self) -> Task:
        """Task for conducting infrastructure review."""
        return Task(
            config=self.tasks_config["infra_review_task"],
        )

    @Crew
    def crew(self) -> Crew:
        """Create the Infrastructure Review crew."""
        # Adapters for the Hadolint and Checkov MCP wrappers.
        hadolint_adapter = MCPServerAdapter(self.hadolint_server_params)
        checkov_adapter = MCPServerAdapter(self.checkov_server_params)
        # Combine tools from both adapters; an adapter without a `tools`
        # attribute contributes nothing.
        all_tools = list(getattr(hadolint_adapter, "tools", []))
        all_tools.extend(getattr(checkov_adapter, "tools", []))
        return Crew(
            agents=[self.infra_reviewer()],
            tasks=[self.infra_review_task()],
            process="sequential",
            verbose=True,
            tools=all_tools,
        )

View File

View File

@ -0,0 +1,7 @@
# Security Review Crew Agents Configuration
security_reviewer:
role: Application Security Engineer
goal: Identify security vulnerabilities and ensure security best practices are followed
backstory: You are an experienced security engineer specialized in application security. You have extensive experience in penetration testing, code security analysis, and helping organizations build secure software.
verbose: true
allow_delegation: false

View File

@ -0,0 +1,16 @@
# Security Review Crew Tasks Configuration
security_review_task:
description: |
Review the code changes in the pull request for security vulnerabilities and compliance with security best practices.
PR Title: {pr_title}
PR Description: {pr_description}
Files to review: {files}
Context: {context}
expected_output: |
A detailed security review report including:
- Summary of security-related changes
- Identified vulnerabilities (if any)
- Security best practices violations (if any)
- Suggestions for improving security posture
- Overall security rating (e.g., Secure, Needs Improvement)
agent: security_reviewer

View File

@ -0,0 +1,51 @@
from crewai import CrewBase, Agent, Task, Crew
from crewai_tools import MCPServerAdapter
from mcp import StdioServerParameters
import os
from typing import Dict, Any
class SecurityReviewCrew(CrewBase):
    """Security Review Crew for conducting security reviews."""

    agents_config = "config/agents.yaml"
    tasks_config = "config/tasks.yaml"

    def __init__(self):
        super().__init__()
        # Trivy ships a native MCP server, so no stdio wrapper is configured
        # here. The attribute is kept as a placeholder in case stdio
        # connection parameters are needed later.
        self.trivy_server_params = None

    @Agent
    def security_reviewer(self) -> Agent:
        """Application Security Engineer agent for security review."""
        reviewer_cfg = self.agents_config["security_reviewer"]
        # No tools attached directly; see crew() for the MCP rationale.
        return Agent(config=reviewer_cfg, tools=[], verbose=True)

    @Task
    def security_review_task(self) -> Task:
        """Task for conducting security review."""
        return Task(config=self.tasks_config["security_review_task"])

    @Crew
    def crew(self) -> Crew:
        """Create the Security Review crew."""
        # Trivy is a native MCP server, so no MCPServerAdapter wrapper is
        # created and no extra tools are passed to the crew; the native
        # server is expected to be available in the MCP ecosystem.
        return Crew(
            agents=[self.security_reviewer()],
            tasks=[self.security_review_task()],
            process="sequential",
            verbose=True,
        )

View File

View File

@ -0,0 +1,7 @@
# Summarizer Crew Agents Configuration
summariser:
role: Senior Code Review Coordinator
goal: Synthesize individual review results into a cohesive, actionable review report
backstory: You are a senior technical lead with extensive experience in code review practices across multiple domains. You excel at combining feedback from different reviewers into a clear, prioritized, and actionable summary that helps development teams improve their code efficiently.
verbose: true
allow_delegation: false

View File

@ -0,0 +1,16 @@
# Summarizer Crew Tasks Configuration
summarise_task:
description: |
Synthesize the results from code, security, and infrastructure reviews into a cohesive review report.
Code Review Results: {code_review_results}
Security Review Results: {security_review_results}
Infrastructure Review Results: {infra_review_results}
Context: {context}
expected_output: |
A comprehensive review report that includes:
- Executive summary of all findings
- Prioritized list of issues (critical, high, medium, low)
- Specific recommendations for each domain (code, security, infrastructure)
- Overall assessment and recommendation (e.g., Approved, Approved with Minor Changes, Significant Changes Needed)
- Summary of positive aspects of the PR
agent: summariser

View File

@ -0,0 +1,43 @@
from crewai import CrewBase, Agent, Task, Crew
from crewai_tools import MCPServerAdapter
from mcp import StdioServerParameters
import os
from typing import Dict, Any
class SummariserCrew(CrewBase):
    """Summariser Crew for synthesizing review results."""

    agents_config = "config/agents.yaml"
    tasks_config = "config/tasks.yaml"

    def __init__(self):
        super().__init__()
        # Works purely on text produced by the other crews, so no MCP
        # server connections are configured.

    @Agent
    def summariser(self) -> Agent:
        """Senior Code Review Coordinator agent for summarizing reviews."""
        summariser_cfg = self.agents_config["summariser"]
        # Summarization needs no external tools.
        return Agent(config=summariser_cfg, tools=[], verbose=True)

    @Task
    def summarise_task(self) -> Task:
        """Task for synthesizing review results."""
        return Task(config=self.tasks_config["summarise_task"])

    @Crew
    def crew(self) -> Crew:
        """Create the Summariser crew."""
        return Crew(
            agents=[self.summariser()],
            tasks=[self.summarise_task()],
            process="sequential",
            verbose=True,
        )

View File

@ -0,0 +1,72 @@
name: Build and Push Image
on:
  push:
    branches:
      - master
jobs:
  build:
    name: Build and push image
    runs-on: ubuntu-latest
    container: catthehacker/ubuntu:act-latest
    if: gitea.ref == 'refs/heads/master'
    steps:
      - name: Checkout
        uses: actions/checkout@v4
      - name: Create Kubeconfig
        run: |
          # -p: do not fail if the directory already exists (e.g. cached runner)
          mkdir -p $HOME/.kube
          echo "${{ secrets.KUBEC_CONFIG_BUILDX_NEW }}" > $HOME/.kube/config
      - name: Set up Docker Buildx
        uses: docker/setup-buildx-action@v3
        with:
          driver: kubernetes
          driver-opts: |
            namespace=gitea-runner
            qemu.install=true
      - name: Login to Docker Registry
        uses: docker/login-action@v3
        with:
          registry: git.aridgwayweb.com
          username: armistace
          password: ${{ secrets.REG_PASSWORD }}
      - name: Build and push
        uses: docker/build-push-action@v5
        with:
          context: .
          push: true
          platforms: linux/amd64,linux/arm64
          tags: |
            git.aridgwayweb.com/armistace/blog:latest
      - name: Trivy Scan
        run: |
          echo "Installing Trivy "
          sudo apt-get update
          sudo apt-get install -y wget apt-transport-https gnupg lsb-release
          wget -qO - https://aquasecurity.github.io/trivy-repo/deb/public.key | sudo apt-key add -
          echo deb https://aquasecurity.github.io/trivy-repo/deb $(lsb_release -sc) main | sudo tee -a /etc/apt/sources.list.d/trivy.list
          sudo apt-get update
          sudo apt-get install -y trivy
          trivy image --format table --exit-code 1 --ignore-unfixed --vuln-type os,library --severity HIGH,CRITICAL git.aridgwayweb.com/armistace/blog:latest
      - name: Deploy
        run: |
          echo "Installing Kubectl"
          apt-get update
          apt-get install -y apt-transport-https ca-certificates curl gnupg
          # /etc/apt/keyrings is not guaranteed to exist on this base image
          mkdir -p /etc/apt/keyrings
          curl -fsSL https://pkgs.k8s.io/core:/stable:/v1.33/deb/Release.key | gpg --dearmor -o /etc/apt/keyrings/kubernetes-apt-keyring.gpg
          chmod 644 /etc/apt/keyrings/kubernetes-apt-keyring.gpg
          echo 'deb [signed-by=/etc/apt/keyrings/kubernetes-apt-keyring.gpg] https://pkgs.k8s.io/core:/stable:/v1.33/deb/ /' | tee /etc/apt/sources.list.d/kubernetes.list
          chmod 644 /etc/apt/sources.list.d/kubernetes.list
          apt-get update
          # -y: apt would otherwise prompt and hang the non-interactive runner
          apt-get install -y kubectl
          # --ignore-not-found: first deploy has no namespace to delete yet
          kubectl delete namespace blog --ignore-not-found=true
          kubectl create namespace blog
          kubectl create secret docker-registry regcred --docker-server=${{ vars.DOCKER_SERVER }} --docker-username=${{ vars.DOCKER_USERNAME }} --docker-password='${{ secrets.DOCKER_PASSWORD }}' --docker-email=${{ vars.DOCKER_EMAIL }} --namespace=blog
          kubectl apply -f kube/blog_pod.yaml && kubectl apply -f kube/blog_deployment.yaml && kubectl apply -f kube/blog_service.yaml

View File

@ -0,0 +1,24 @@
apiVersion: apps/v1
kind: Deployment
metadata:
name: blog-deployment
labels:
app: blog
namespace: blog
spec:
replicas: 3
selector:
matchLabels:
app: blog
template:
metadata:
labels:
app: blog
spec:
containers:
- name: blog
image: git.aridgwayweb.com/armistace/blog:latest
ports:
- containerPort: 8000
imagePullSecrets:
- name: regcred

View File

@ -0,0 +1,13 @@
apiVersion: v1
kind: Pod
metadata:
name: blog
namespace: blog
spec:
containers:
- name: blog
image: git.aridgwayweb.com/armistace/blog:latest
ports:
- containerPort: 8000
imagePullSecrets:
- name: regcred

View File

@ -0,0 +1,13 @@
apiVersion: v1
kind: Service
metadata:
name: blog-service
namespace: blog
spec:
type: NodePort
selector:
app: blog
ports:
- port: 80
targetPort: 8000
nodePort: 30009

View File

@ -0,0 +1,24 @@
apiVersion: apps/v1
kind: Deployment
metadata:
name: pr-reviewer-deployment
labels:
app: pr-reviewer
namespace: pr-reviewer
spec:
replicas: 3
selector:
matchLabels:
app: pr-reviewer
template:
metadata:
labels:
app: pr-reviewer
spec:
containers:
- name: pr-reviewer
image: git.aridgwayweb.com/armistace/pr-reviewer:latest
ports:
- containerPort: 8000
imagePullSecrets:
- name: regcred

13
kube/pr-reviewer_pod.yaml Normal file
View File

@ -0,0 +1,13 @@
apiVersion: v1
kind: Pod
metadata:
name: pr-reviewer
namespace: pr-reviewer
spec:
containers:
- name: pr-reviewer
image: git.aridgwayweb.com/armistace/pr-reviewer:latest
ports:
- containerPort: 8000
imagePullSecrets:
- name: regcred

View File

@ -0,0 +1,13 @@
apiVersion: v1
kind: Service
metadata:
  name: pr-reviewer-service
  namespace: pr-reviewer
spec:
  type: NodePort
  selector:
    app: pr-reviewer
  ports:
    - port: 80
      targetPort: 8000
      # NodePorts are allocated cluster-wide; 30009 is already claimed by
      # blog-service in this repo's other manifest, so use the next free port.
      nodePort: 30010

0
mcp_servers/__init__.py Normal file
View File

Binary file not shown.

Binary file not shown.

Binary file not shown.

146
mcp_servers/checkov_mcp.py Normal file
View File

@ -0,0 +1,146 @@
#!/usr/bin/env python3
"""
MCP server for Checkov Kubernetes security scanner.
"""
import asyncio
import json
import logging
import subprocess
import sys
import tempfile
import os
from typing import Any, Dict, List
import mcp.server.stdio
import mcp.types as types
from mcp.server import NotificationOptions, Server
from mcp.server.models import InitializationOptions
# Configure logging
logging.basicConfig(level=logging.INFO)
logger = logging.getLogger(__name__)
# Create server instance
server = Server("checkov-mcp")
@server.list_tools()
async def handle_list_tools() -> List[types.Tool]:
    """Advertise the tools exposed by this MCP server."""
    # JSON schema describing the single required string argument.
    manifest_schema = {
        "type": "object",
        "properties": {
            "manifest_content": {
                "type": "string",
                "description": "The content of the Kubernetes manifest(s) to scan",
            },
        },
        "required": ["manifest_content"],
    }
    scan_tool = types.Tool(
        name="scan_kubernetes_manifests",
        description="Scan Kubernetes manifests for security issues using Checkov",
        inputSchema=manifest_schema,
    )
    return [scan_tool]
@server.call_tool()
async def handle_call_tool(
    name: str, arguments: Dict[str, Any] | None
) -> List[types.TextContent | types.ImageContent | types.EmbeddedResource]:
    """
    Handle tool calls.

    Writes the manifest content to a temporary YAML file, runs Checkov on
    it, and returns the JSON scan output (plus any stderr) as text content.

    Raises:
        ValueError: if the tool name is unknown or required arguments are
            missing.
    """
    if name != "scan_kubernetes_manifests":
        raise ValueError(f"Unknown tool: {name}")
    if not arguments:
        raise ValueError("Missing arguments")
    manifest_content = arguments.get("manifest_content")
    if not manifest_content:
        raise ValueError("Missing manifest_content argument")
    try:
        # Create a temporary file to hold the manifest content
        with tempfile.NamedTemporaryFile(mode='w', suffix='.yaml', delete=False) as temp_file:
            temp_file.write(manifest_content)
            temp_file_path = temp_file.name
        try:
            # Run checkov on the manifest file
            process = await asyncio.create_subprocess_exec(
                "checkov",
                "-f", temp_file_path,
                "--quiet",  # Reduce verbosity
                "--output", "json",  # Get JSON output for easier parsing
                stdout=subprocess.PIPE,
                stderr=subprocess.PIPE,
            )
            stdout, stderr = await process.communicate()
            # Checkov exits non-zero when it has findings, so the return code
            # is not treated as an error here; the output is reported as-is.
            # (Replaced a dead-code membership test over codes 0-25 that had
            # no effect.)
            result = stdout.decode()
            if stderr:
                result += "\nSTDERR:\n" + stderr.decode()
            # 127 is the shell's "command not found" code; surface a clearer
            # message when checkov produced no output at all.
            if not result.strip() and process.returncode == 127:
                result = "Error: Checkov command not found. Please install checkov."
            return [
                types.TextContent(
                    type="text",
                    text=result
                )
            ]
        finally:
            # Clean up the temporary file
            os.unlink(temp_file_path)
    except FileNotFoundError:
        logger.error("Checkov command not found. Please ensure checkov is installed and in PATH.")
        return [
            types.TextContent(
                type="text",
                text="Error: Checkov command not found. Please install checkov."
            )
        ]
    except Exception as e:
        logger.exception("Error running checkov")
        return [
            types.TextContent(
                type="text",
                text=f"Error running checkov: {str(e)}"
            )
        ]
async def main():
    """
    Run the MCP server.

    Serves the checkov-mcp server over stdio until the streams close.
    """
    # Run the server using stdio; stdio_server yields the paired read/write
    # streams for the lifetime of the connection.
    async with mcp.server.stdio.stdio_server() as (read_stream, write_stream):
        await server.run(
            read_stream,
            write_stream,
            InitializationOptions(
                server_name="checkov-mcp",
                server_version="0.1.0",
                capabilities=server.get_capabilities(
                    notification_options=NotificationOptions(),
                    experimental_capabilities={},
                ),
            ),
        )


# Script entry point: the crews launch this wrapper as a subprocess
# (`python .../checkov_mcp.py`).
if __name__ == "__main__":
    asyncio.run(main())

133
mcp_servers/hadolint_mcp.py Normal file
View File

@ -0,0 +1,133 @@
#!/usr/bin/env python3
"""
MCP server for Hadolint Dockerfile linter.
"""
import asyncio
import json
import logging
import subprocess
import sys
from typing import Any, Dict, List
import mcp.server.stdio
import mcp.types as types
from mcp.server import NotificationOptions, Server
from mcp.server.models import InitializationOptions
# Configure logging
logging.basicConfig(level=logging.INFO)
logger = logging.getLogger(__name__)
# Create the module-level MCP server; the decorated handlers below register against it.
server = Server("hadolint-mcp")
@server.list_tools()
async def handle_list_tools() -> List[types.Tool]:
    """Advertise the tools exposed by this server.

    A single tool is offered: ``lint_dockerfile``, which takes the raw text
    of a Dockerfile and runs Hadolint over it.
    """
    schema = {
        "type": "object",
        "properties": {
            "dockerfile_content": {
                "type": "string",
                "description": "The content of the Dockerfile to lint"
            }
        },
        "required": ["dockerfile_content"]
    }
    lint_tool = types.Tool(
        name="lint_dockerfile",
        description="Lint a Dockerfile using Hadolint",
        inputSchema=schema,
    )
    return [lint_tool]
@server.call_tool()
async def handle_call_tool(
    name: str, arguments: Dict[str, Any] | None
) -> List[types.TextContent | types.ImageContent | types.EmbeddedResource]:
    """Dispatch a tool call.

    Only ``lint_dockerfile`` is supported: the Dockerfile text is piped to
    hadolint on stdin and the linter's output is returned as text content.

    Raises:
        ValueError: for an unknown tool name or missing arguments.
    """
    if name != "lint_dockerfile":
        raise ValueError(f"Unknown tool: {name}")
    if not arguments:
        raise ValueError("Missing arguments")
    dockerfile_content = arguments.get("dockerfile_content")
    if not dockerfile_content:
        raise ValueError("Missing dockerfile_content argument")
    try:
        # "-" tells hadolint to read the Dockerfile from stdin.
        process = await asyncio.create_subprocess_exec(
            "hadolint",
            "-",
            stdin=subprocess.PIPE,
            stdout=subprocess.PIPE,
            stderr=subprocess.PIPE,
        )
        stdout, stderr = await process.communicate(input=dockerfile_content.encode())
        if process.returncode == 0:
            result = stdout.decode()
        else:
            # Non-zero exit means hadolint reported findings; keep stderr too
            # so nothing is lost.
            result = stdout.decode() + stderr.decode()
        # No output at all means a clean pass.
        if not result.strip():
            result = "Hadolint: No issues found."
        return [types.TextContent(type="text", text=result)]
    except FileNotFoundError:
        logger.error("Hadolint command not found. Please ensure hadolint is installed and in PATH.")
        return [
            types.TextContent(
                type="text",
                text="Error: Hadolint command not found. Please install hadolint."
            )
        ]
    except Exception as e:
        logger.exception("Error running hadolint")
        return [
            types.TextContent(
                type="text",
                text=f"Error running hadolint: {str(e)}"
            )
        ]
async def main():
    """Serve the hadolint MCP server over a stdio transport."""
    init_options = InitializationOptions(
        server_name="hadolint-mcp",
        server_version="0.1.0",
        capabilities=server.get_capabilities(
            notification_options=NotificationOptions(),
            experimental_capabilities={},
        ),
    )
    # stdio_server yields the read/write stream pair for the transport.
    async with mcp.server.stdio.stdio_server() as (reader, writer):
        await server.run(reader, writer, init_options)


if __name__ == "__main__":
    asyncio.run(main())

71
pyproject.toml Normal file
View File

@ -0,0 +1,71 @@
[project]
name = "pr-reviewer"
version = "0.1.0"
description = "A PR Reviewer system using CrewAI and MCP"
readme = "README.md"
requires-python = ">=3.10,<3.14"
authors = [
{name = "Developer", email = "dev@example.com"}
]
keywords = ["pull-request", "code-review", "security", "infrastructure", "crewai", "mcp"]
classifiers = [
"Development Status :: 3 - Alpha",
"Intended Audience :: Developers",
"License :: OSI Approved :: MIT License",
"Programming Language :: Python :: 3",
"Programming Language :: Python :: 3.10",
"Programming Language :: Python :: 3.11",
"Programming Language :: Python :: 3.12",
"Programming Language :: Python :: 3.13",
]
dependencies = [
"crewai>=0.28.0",
"fastapi>=0.104.0",
"uvicorn>=0.24.0",
"mcp>=0.1.0",
"pydantic>=2.5.0",
"python-dotenv>=1.0.0",
"gitpython>=3.1.0"
]
[project.optional-dependencies]
anthropic = ["anthropic>=0.7.0"]
openai = ["openai>=1.0.0"]
ollama = []
dev = [
"pytest>=7.0.0",
"black>=22.0.0",
"flake8>=4.0.0",
"mypy>=0.9.0",
]
[project.urls]
Homepage = "https://github.com/your-org/pr-reviewer"
Documentation = "https://github.com/your-org/pr-reviewer#readme"
Repository = "https://github.com/your-org/pr-reviewer.git"
[build-system]
requires = ["setuptools>=61.0"]
build-backend = "setuptools.build_meta"
[tool.black]
line-length = 88
target-version = ['py310']
include = '\.py$'
exclude = '''
/(\.git
| \.hg
| \.mypy_cache
| \.tox
| \.venv
| _build
| buck-out
| build
| dist
)/
'''
[tool.mypy]
python_version = "3.10"
warn_return_any = true
warn_unused_configs = true

View File

Binary file not shown.

Binary file not shown.

Binary file not shown.

Binary file not shown.

Binary file not shown.

Binary file not shown.

View File

@ -0,0 +1,45 @@
import os
from pathlib import Path
from typing import Dict, Optional
from .state import PRReviewState, ContextOverrides
def resolve_context(state: PRReviewState) -> Dict[str, str]:
    """
    Resolve the context for each review type based on overrides and default files.

    Args:
        state: The PR review state containing potential context overrides

    Returns:
        A dictionary with keys 'code_review', 'security_review', 'infra_review'
        and their resolved context strings. A non-empty override wins; otherwise
        the default file (relative to the working directory) is read, and a
        missing file yields an empty string.
    """
    defaults = {
        'code_review': 'contexts/defaults/code_review.md',
        'security_review': 'contexts/defaults/security_review.md',
        'infra_review': 'contexts/defaults/infra_review.md'
    }
    overrides = state.context_overrides

    def _load_default(path: str) -> str:
        # A missing default file is treated as an empty context.
        try:
            with open(path, 'r') as handle:
                return handle.read().strip()
        except FileNotFoundError:
            return ''

    resolved: Dict[str, str] = {}
    for context_type, default_path in defaults.items():
        candidate = getattr(overrides, context_type, None) if overrides else None
        if candidate is not None and candidate.strip():
            resolved[context_type] = candidate.strip()
        else:
            resolved[context_type] = _load_default(default_path)
    return resolved

150
src/pr_reviewer/flow.py Normal file
View File

@ -0,0 +1,150 @@
from crewai.flow import Flow, listen, start, and_
from crewai import Crew
from .state import PRReviewState
from .llm import get_llm
from .context import resolve_context
import os
from datetime import datetime
# Import the crews
from crews.code_review_crew.code_review_crew import CodeReviewCrew
from crews.security_review_crew.security_review_crew import SecurityReviewCrew
from crews.infra_review_crew.infra_review_crew import InfraReviewCrew
from crews.summariser_crew.summariser_crew import SummariserCrew
class CodeReviewFlow(Flow[PRReviewState]):
    """CrewAI flow orchestrating a full PR review.

    Pipeline (from the decorators below): ``receive_pr`` seeds the state; the
    three review steps each listen on ``receive_pr``; ``summarise`` waits, via
    ``and_``, for all three to finish; ``format_response`` produces the dict
    returned to the caller.
    """
    @start()
    def receive_pr(self, inputs):
        """Initialize the PR review state with input data."""
        print(f"Received PR review request for PR #{inputs.get('pr_id')}")
        # Initialize the state
        self.state.pr_id = inputs.get("pr_id", "")
        self.state.pr_title = inputs.get("pr_title", "")
        self.state.pr_description = inputs.get("pr_description", "")
        self.state.pr_url = inputs.get("pr_url", "")
        self.state.repo_name = inputs.get("repo_name", "")
        self.state.repo_url = inputs.get("repo_url", "")
        self.state.branch = inputs.get("branch", "")
        self.state.base_branch = inputs.get("base_branch", "")
        # Convert files from list of dicts to list of FileInfo objects if needed
        # NOTE(review): only the first element's type is inspected — assumes a
        # homogeneous list; confirm callers never mix dicts and FileInfo.
        files_input = inputs.get("files", [])
        if files_input and isinstance(files_input[0], dict):
            # Convert dicts to FileInfo objects
            from .state import FileInfo
            self.state.files = [FileInfo(**file_dict) for file_dict in files_input]
        else:
            self.state.files = files_input
        # Handle context_overrides
        context_overrides_input = inputs.get("context_overrides")
        if context_overrides_input and isinstance(context_overrides_input, dict):
            from .state import ContextOverrides
            self.state.context_overrides = ContextOverrides(**context_overrides_input)
        else:
            self.state.context_overrides = context_overrides_input
        self.state.started_at = datetime.now()
        # Resolve context
        self.state.resolved_context = resolve_context(self.state)
        return self.state
    @listen(receive_pr)
    def run_code_review(self):
        """Run the code review crew."""
        print("Starting code review...")
        # Instantiate and run the code review crew
        code_crew = CodeReviewCrew()
        # The crew's kickoff method expects inputs matching the task template variables.
        # `.dict()` is the pydantic v1-style serializer; plain dicts pass through as-is.
        inputs = {
            "pr_title": self.state.pr_title,
            "pr_description": self.state.pr_description,
            "files": [file.dict() if hasattr(file, 'dict') else file for file in self.state.files],
            "context": self.state.resolved_context.get("code_review", "")
        }
        result = code_crew.crew().kickoff(inputs=inputs)
        self.state.code_review_results = str(result)
        print("Code review completed.")
        return self.state
    @listen(receive_pr)
    def run_security_review(self):
        """Run the security review crew."""
        print("Starting security review...")
        # Instantiate and run the security review crew
        security_crew = SecurityReviewCrew()
        inputs = {
            "pr_title": self.state.pr_title,
            "pr_description": self.state.pr_description,
            "files": [file.dict() if hasattr(file, 'dict') else file for file in self.state.files],
            "context": self.state.resolved_context.get("security_review", "")
        }
        result = security_crew.crew().kickoff(inputs=inputs)
        self.state.security_review_results = str(result)
        print("Security review completed.")
        return self.state
    @listen(receive_pr)
    def run_infra_review(self):
        """Run the infrastructure review crew."""
        print("Starting infrastructure review...")
        # Instantiate and run the infrastructure review crew
        infra_crew = InfraReviewCrew()
        inputs = {
            "pr_title": self.state.pr_title,
            "pr_description": self.state.pr_description,
            "files": [file.dict() if hasattr(file, 'dict') else file for file in self.state.files],
            "context": self.state.resolved_context.get("infra_review", "")
        }
        result = infra_crew.crew().kickoff(inputs=inputs)
        self.state.infra_review_results = str(result)
        print("Infrastructure review completed.")
        return self.state
    @listen(and_(run_code_review, run_security_review, run_infra_review))
    def summarise(self):
        """Summarize the review results."""
        print("Starting summarisation...")
        # Instantiate and run the summariser crew
        summariser_crew = SummariserCrew()
        # NOTE(review): unlike the review crews (which each get one context
        # string), the whole resolved_context dict is passed here — confirm
        # the summariser task template expects a dict.
        inputs = {
            "code_review_results": self.state.code_review_results,
            "security_review_results": self.state.security_review_results,
            "infra_review_results": self.state.infra_review_results,
            "context": self.state.resolved_context
        }
        result = summariser_crew.crew().kickoff(inputs=inputs)
        self.state.review_summary = str(result)
        self.state.completed_at = datetime.now()
        print("Summarisation completed.")
        return self.state
    @listen(summarise)
    def format_response(self):
        """Format the final response."""
        print("Formatting final response...")
        # Return the final state as the response
        return {
            "pr_id": self.state.pr_id,
            "pr_title": self.state.pr_title,
            "review_summary": self.state.review_summary,
            "code_review_results": self.state.code_review_results,
            "security_review_results": self.state.security_review_results,
            "infra_review_results": self.state.infra_review_results,
            "started_at": self.state.started_at.isoformat() if self.state.started_at else None,
            "completed_at": self.state.completed_at.isoformat() if self.state.completed_at else None,
            "error": self.state.error
        }

56
src/pr_reviewer/llm.py Normal file
View File

@ -0,0 +1,56 @@
import os
from crewai import LLM
from typing import Optional
def create_llm() -> LLM:
    """
    Build a CrewAI LLM instance from environment variables.

    Environment variables:
        LLM_MODEL: the model name to use (required)
        LLM_BASE_URL: the base URL for the LLM API (optional)
        LLM_API_KEY: the API key for the LLM service (optional)
        LLM_PROVIDER: the provider, e.g. 'openai', 'anthropic', 'ollama' (optional)

    Returns:
        LLM: A CrewAI LLM instance

    Raises:
        ValueError: if LLM_MODEL is not set
    """
    model = os.getenv("LLM_MODEL")
    if not model:
        raise ValueError("LLM_MODEL environment variable is required")
    # Forward only the optional settings that are actually configured.
    optional = {
        "base_url": os.getenv("LLM_BASE_URL"),
        "api_key": os.getenv("LLM_API_KEY"),
        "provider": os.getenv("LLM_PROVIDER"),
    }
    extra_kwargs = {key: value for key, value in optional.items() if value}
    return LLM(model=model, **extra_kwargs)
# Shared LLM singleton, created lazily by get_llm().
_shared_llm: Optional[LLM] = None
def get_llm() -> LLM:
    """
    Return the process-wide shared LLM, creating it on first use.

    Returns:
        LLM: The shared LLM instance
    """
    global _shared_llm
    if _shared_llm is not None:
        return _shared_llm
    _shared_llm = create_llm()
    return _shared_llm

297
src/pr_reviewer/main.py Normal file
View File

@ -0,0 +1,297 @@
import asyncio
import logging
import os
import time
import uuid
from concurrent.futures import ThreadPoolExecutor, TimeoutError as FutureTimeoutError
from typing import Any, Dict, List, Optional

from fastapi import FastAPI, HTTPException, Request
from fastapi.responses import JSONResponse
import uvicorn

from .flow import CodeReviewFlow
from .state import PRReviewState, FileInfo, ContextOverrides
# Configure logging
logging.basicConfig(level=logging.INFO)
logger = logging.getLogger(__name__)
app = FastAPI(
    title="PR Reviewer API",
    description="API for conducting automated pull request reviews",
    version="0.1.0"
)
# Timeout configuration (seconds), overridable via environment variables.
# NOTE(review): PER_CREW_TIMEOUT is defined but never referenced in this
# module — confirm it is consumed elsewhere or wire it into the crews.
TOTAL_FLOW_TIMEOUT = int(os.getenv("TOTAL_FLOW_TIMEOUT", "600")) # Default 10 minutes
PER_CREW_TIMEOUT = int(os.getenv("PER_CREW_TIMEOUT", "300")) # Default 5 minutes
@app.get("/api/v1/health")
async def health_check() -> Dict[str, str]:
    """
    Liveness probe: report that the service is up.
    """
    payload = {"status": "healthy", "service": "pr-reviewer"}
    return payload
@app.post("/api/v1/review")
async def review_pr(request: Request) -> Dict[str, Any]:
    """
    Endpoint to trigger a PR review (request/response schema per Section 2.2.1).

    Parses and validates the JSON payload, runs the CodeReviewFlow in a worker
    thread bounded by TOTAL_FLOW_TIMEOUT, and returns the review results plus
    metadata.

    Raises:
        HTTPException: 422 for invalid or incomplete payloads, 504 when the
            flow exceeds TOTAL_FLOW_TIMEOUT, 500 for unexpected failures.
    """
    start_time = time.time()
    review_id = str(uuid.uuid4())
    # Log the incoming request (excluding sensitive data)
    logger.info(f"Received PR review request: {review_id}")
    try:
        # Parse the JSON payload
        try:
            payload = await request.json()
        except Exception:
            raise HTTPException(status_code=422, detail="Invalid JSON payload")
        # Request schema (Section 2.2.1):
        #   pr_id (req), title (req), description (opt)
        #   repo: {name (req), url (req)}
        #   source: {branch (req), commit (opt)}, target: {branch (req), commit (opt)}
        #   files: [{path (req), status (req); content, additions, deletions, patch (opt)}]
        #   context: {code_review, security_review, infra_review} (all opt)
        pr_id = payload.get("pr_id")
        title = payload.get("title")
        description = payload.get("description")
        repo_data = payload.get("repo", {})
        repo_name = repo_data.get("name")
        repo_url = repo_data.get("url")
        source_branch = payload.get("source", {}).get("branch")
        target_branch = payload.get("target", {}).get("branch")
        files_data = payload.get("files", [])
        context_data = payload.get("context", {})
        # Validate required fields
        if not pr_id:
            raise HTTPException(status_code=422, detail="Missing required field: pr_id")
        if not title:
            raise HTTPException(status_code=422, detail="Missing required field: title")
        if not repo_name:
            raise HTTPException(status_code=422, detail="Missing required field: repo.name")
        if not repo_url:
            raise HTTPException(status_code=422, detail="Missing required field: repo.url")
        if not source_branch:
            raise HTTPException(status_code=422, detail="Missing required field: source.branch")
        if not target_branch:
            raise HTTPException(status_code=422, detail="Missing required field: target.branch")
        # Convert files data to FileInfo objects, validating per-file fields
        files = []
        for file_data in files_data:
            if not file_data.get("path"):
                raise HTTPException(status_code=422, detail="Missing required field: files[].path")
            if not file_data.get("status"):
                raise HTTPException(status_code=422, detail="Missing required field: files[].status")
            file_info = FileInfo(
                path=file_data.get("path", ""),
                content=file_data.get("content"),
                status=file_data.get("status", "modified"),
                additions=file_data.get("additions", 0),
                deletions=file_data.get("deletions", 0),
                patch=file_data.get("patch")
            )
            files.append(file_info)
        # Create context overrides object (only if at least one field is provided)
        context_overrides = None
        if any([context_data.get("code_review"),
                context_data.get("security_review"),
                context_data.get("infra_review")]):
            context_overrides = ContextOverrides(
                code_review=context_data.get("code_review"),
                security_review=context_data.get("security_review"),
                infra_review=context_data.get("infra_review")
            )
        # Initialize and run the flow with timeout
        flow = CodeReviewFlow()
        # Run the synchronous kickoff in a thread pool so it does not block the
        # event loop. get_running_loop() is the correct (non-deprecated) way to
        # obtain the loop from inside a coroutine.
        loop = asyncio.get_running_loop()
        with ThreadPoolExecutor() as pool:
            try:
                # Wait for the flow to complete with a timeout
                flow_result = await asyncio.wait_for(
                    loop.run_in_executor(
                        pool,
                        lambda: flow.kickoff(inputs={
                            "pr_id": pr_id,
                            "pr_title": title,
                            "pr_description": description,
                            "pr_url": f"{repo_url}/pull/{pr_id}",  # Construct PR URL
                            "repo_name": repo_name,
                            "repo_url": repo_url,
                            "branch": source_branch,  # Using source branch as the active branch
                            "base_branch": target_branch,  # Using target branch as base
                            "files": [file.dict() for file in files],  # Convert to dict for flow
                            "context_overrides": context_overrides.dict() if context_overrides else None
                        })
                    ),
                    timeout=TOTAL_FLOW_TIMEOUT
                )
            except asyncio.TimeoutError:
                logger.error(f"PR review timed out: {review_id}")
                raise HTTPException(
                    status_code=504,
                    detail=f"PR review timed out after {TOTAL_FLOW_TIMEOUT} seconds"
                )
        # Calculate processing time
        processing_time = time.time() - start_time
        # Response schema: review_id, status, timestamp, results{code_review,
        # security_review, infra_review, summary}, metadata{processing time,
        # pr_id, repo{name, url}}
        response = {
            "review_id": review_id,
            "status": "completed" if not flow_result.get("error") else "failed",
            "timestamp": time.strftime("%Y-%m-%dT%H:%M:%SZ", time.gmtime()),
            "results": {
                "code_review": flow_result.get("code_review_results"),
                "security_review": flow_result.get("security_review_results"),
                "infra_review": flow_result.get("infra_review_results"),
                "summary": flow_result.get("review_summary")
            },
            "metadata": {
                "processing_time_seconds": round(processing_time, 2),
                "pr_id": pr_id,
                "repo": {
                    "name": repo_name,
                    "url": repo_url
                }
            }
        }
        # Include error information if present
        if flow_result.get("error"):
            response["metadata"]["error"] = flow_result["error"]
            logger.error(f"PR review failed: {review_id} - {flow_result['error']}")
        else:
            logger.info(f"PR review completed successfully: {review_id} in {processing_time:.2f}s")
        return response
    except HTTPException:
        # Re-raise HTTP exceptions as they are already properly formatted
        raise
    except asyncio.TimeoutError:
        # Defensive: the wait_for above should already have converted this
        logger.error(f"PR review timed out: {review_id}")
        raise HTTPException(
            status_code=504,
            detail=f"PR review timed out after {TOTAL_FLOW_TIMEOUT} seconds"
        )
    except Exception as e:
        # Log the error for debugging
        logger.error(f"Error in PR review: {review_id} - {str(e)}")
        raise HTTPException(status_code=500, detail=f"Internal server error: {str(e)}")
# Error handlers
@app.exception_handler(404)
async def not_found_handler(request: Request, exc: HTTPException):
    """Return a uniform JSON body for 404 responses."""
    body = {"message": "Endpoint not found"}
    return JSONResponse(content=body, status_code=404)
@app.exception_handler(422)
async def request_validation_exception_handler(request: Request, exc: HTTPException):
    """Return a uniform JSON body for 422 responses, echoing the failure detail."""
    body = {"message": "Invalid request payload", "details": exc.detail}
    return JSONResponse(content=body, status_code=422)
@app.exception_handler(500)
async def internal_error_handler(request: Request, exc: HTTPException):
    """Return a generic JSON body for 500 responses (no exception detail leaked)."""
    body = {"message": "Internal server error"}
    return JSONResponse(content=body, status_code=500)
@app.exception_handler(504)
async def timeout_handler(request: Request, exc: HTTPException):
    """Return a uniform JSON body for 504 responses, including the timeout detail."""
    body = {"message": "Request timeout", "details": exc.detail}
    return JSONResponse(content=body, status_code=504)
# Start the API with uvicorn when this module is executed directly.
if __name__ == "__main__":
    uvicorn.run(app, host="0.0.0.0", port=8000)

45
src/pr_reviewer/state.py Normal file
View File

@ -0,0 +1,45 @@
from pydantic import BaseModel, Field
from typing import List, Optional, Dict, Any
from datetime import datetime
class FileInfo(BaseModel):
    """Information about a file in the PR."""
    path: str  # repository-relative path of the file
    content: Optional[str] = None  # full file content, when supplied by the caller
    status: str  # added, modified, removed, etc.
    additions: int = 0  # number of added lines
    deletions: int = 0  # number of deleted lines
    patch: Optional[str] = None  # diff hunk for this file, if provided
class ContextOverrides(BaseModel):
    """Overrides for the default context."""
    # Each field, when set and non-empty, replaces the corresponding default
    # context file for that review type.
    code_review: Optional[str] = None
    security_review: Optional[str] = None
    infra_review: Optional[str] = None
class PRReviewState(BaseModel):
    """State of the PR review process."""
    # Input fields
    pr_id: str  # identifier of the pull request under review
    pr_title: str
    pr_description: Optional[str] = None
    pr_url: Optional[str] = None
    repo_name: str
    repo_url: str
    branch: str  # source (head) branch of the PR
    base_branch: str  # target (base) branch the PR merges into
    files: List[FileInfo] = Field(default_factory=list)  # changed files in the PR
    context_overrides: Optional[ContextOverrides] = None  # caller-supplied context overrides
    # Internal fields
    resolved_context: Optional[Dict[str, str]] = None  # per-review-type context after override/default resolution
    code_review_results: Optional[str] = None
    security_review_results: Optional[str] = None
    infra_review_results: Optional[str] = None
    review_summary: Optional[str] = None  # synthesised summary of the three reviews
    # Metadata
    started_at: Optional[datetime] = None  # set when the flow receives the PR
    completed_at: Optional[datetime] = None  # set after summarisation finishes
    error: Optional[str] = None  # populated when the review fails

View File

@ -0,0 +1,70 @@
"""
Integration tests for MCP servers.
"""
import pytest
import sys
import os
# Add the project root to the path so we can import the MCP servers
# (two levels up from this file; assumes tests live at <root>/tests/<subdir>).
sys.path.insert(0, os.path.join(os.path.dirname(__file__), '..', '..'))
def test_hadolint_mcp_import():
    """Test that the Hadolint MCP server can be imported."""
    try:
        from mcp_servers.hadolint_mcp import server
    except ImportError as e:
        pytest.fail(f"Failed to import Hadolint MCP server: {e}")
    else:
        assert server is not None
def test_checkov_mcp_import():
    """Test that the Checkov MCP server can be imported."""
    try:
        from mcp_servers.checkov_mcp import server
    except ImportError as e:
        pytest.fail(f"Failed to import Checkov MCP server: {e}")
    else:
        assert server is not None
def test_crew_imports():
    """Test that all crew modules can be imported and instantiated."""
    try:
        from crews.code_review_crew.code_review_crew import CodeReviewCrew
        from crews.security_review_crew.security_review_crew import SecurityReviewCrew
        from crews.infra_review_crew.infra_review_crew import InfraReviewCrew
        from crews.summariser_crew.summariser_crew import SummariserCrew

        # Construction failures are distinguished from import failures below.
        instances = (
            CodeReviewCrew(),
            SecurityReviewCrew(),
            InfraReviewCrew(),
            SummariserCrew(),
        )
        for instance in instances:
            assert instance is not None
    except ImportError as e:
        pytest.fail(f"Failed to import crew modules: {e}")
    except Exception as e:
        pytest.fail(f"Failed to instantiate crews: {e}")
def test_flow_import():
    """Test that the flow module can be imported."""
    try:
        from src.pr_reviewer.flow import CodeReviewFlow
        assert CodeReviewFlow() is not None
    except ImportError as e:
        pytest.fail(f"Failed to import flow module: {e}")
def test_main_import():
    """Test that the main module can be imported."""
    try:
        from src.pr_reviewer.main import app
    except ImportError as e:
        pytest.fail(f"Failed to import main module: {e}")
    else:
        assert app is not None

100
tests/unit/test_context.py Normal file
View File

@ -0,0 +1,100 @@
"""
Unit tests for the context resolution system.
"""
import pytest
import tempfile
import os
from src.pr_reviewer.context import resolve_context
from src.pr_reviewer.state import PRReviewState, ContextOverrides
def test_resolve_context_with_defaults():
    """Test resolving context when default files exist."""
    with tempfile.TemporaryDirectory() as temp_dir:
        # resolve_context reads defaults relative to the working directory,
        # so build contexts/defaults inside a temp dir and chdir into it.
        defaults_dir = os.path.join(temp_dir, "contexts", "defaults")
        os.makedirs(defaults_dir)
        expected = {
            "code_review": "# Code Review\n\nFollow PEP8.",
            "security_review": "# Security Review\n\nCheck for SQL injection.",
            "infra_review": "# Infra Review\n\nValidate Dockerfile.",
        }
        for context_name, text in expected.items():
            with open(os.path.join(defaults_dir, f"{context_name}.md"), "w") as f:
                f.write(text)
        original_cwd = os.getcwd()
        os.chdir(temp_dir)
        try:
            state = PRReviewState(
                pr_id="123",
                pr_title="Test PR",
                repo_name="test-repo",
                repo_url="https://github.com/user/test-repo",
                branch="main",
                base_branch="main",
            )
            context = resolve_context(state)
            assert context == expected
        finally:
            os.chdir(original_cwd)
def test_resolve_context_with_overrides():
    """Test resolving context when overrides are provided."""
    overrides = ContextOverrides(
        code_review="Custom code review guidelines",
        security_review="Custom security guidelines",
        # infra_review is not provided, should use default if file exists
    )
    state = PRReviewState(
        pr_id="123",
        pr_title="Test PR",
        repo_name="test-repo",
        repo_url="https://github.com/user/test-repo",
        branch="main",
        base_branch="main",
        context_overrides=overrides,
    )
    context = resolve_context(state)
    assert context["code_review"] == "Custom code review guidelines"
    assert context["security_review"] == "Custom security guidelines"
    # NOTE(review): this assumes contexts/defaults/infra_review.md is absent
    # from the current working directory — verify when running from repo root.
    assert context["infra_review"] == ""  # Empty because no default file and no override
def test_resolve_context_empty_state():
    """Test resolving context with minimal state."""
    state = PRReviewState(
        pr_id="123",
        pr_title="Test PR",
        repo_name="test-repo",
        repo_url="https://github.com/user/test-repo",
        branch="main",
        base_branch="main",
    )
    # Default files may or may not exist in the working directory, so only
    # assert that each resolved value is a string (possibly empty).
    context = resolve_context(state)
    for context_name in ("code_review", "security_review", "infra_review"):
        assert isinstance(context[context_name], str)

69
tests/unit/test_state.py Normal file
View File

@ -0,0 +1,69 @@
"""
Unit tests for the state management module.
"""
import pytest
from src.pr_reviewer.state import FileInfo, ContextOverrides, PRReviewState
from datetime import datetime
def test_file_info_creation():
    """Test creating a FileInfo instance."""
    expected = {
        "path": "src/main.py",
        "content": "print('hello')",
        "status": "modified",
        "additions": 5,
        "deletions": 2,
    }
    file_info = FileInfo(**expected)
    for field_name, field_value in expected.items():
        assert getattr(file_info, field_name) == field_value
def test_context_overrides_creation():
    """Test creating a ContextOverrides instance."""
    expected = {
        "code_review": "Follow PEP8",
        "security_review": "Check for SQL injection",
        "infra_review": "Validate Dockerfile",
    }
    context_overrides = ContextOverrides(**expected)
    for field_name, field_value in expected.items():
        assert getattr(context_overrides, field_name) == field_value
def test_context_overrides_partial():
    """Test creating a ContextOverrides instance with partial fields."""
    context_overrides = ContextOverrides(code_review="Follow PEP8")
    assert context_overrides.code_review == "Follow PEP8"
    # Unset fields keep their declared None defaults.
    assert context_overrides.security_review is None
    assert context_overrides.infra_review is None
def test_pr_review_state_creation():
    """Test creating a PRReviewState instance."""
    expected = {
        "pr_id": "123",
        "pr_title": "Add feature",
        "repo_name": "test-repo",
        "repo_url": "https://github.com/user/test-repo",
        "branch": "feature",
        "base_branch": "main",
    }
    state = PRReviewState(**expected)
    for field_name, field_value in expected.items():
        assert getattr(state, field_name) == field_value
    # Unset fields fall back to their declared defaults.
    assert state.files == []
    assert state.started_at is None
    assert state.completed_at is None
0
tools/__init__.py Normal file
View File

Binary file not shown.

Binary file not shown.

57
tools/git_tool.py Normal file
View File

@ -0,0 +1,57 @@
from pydantic import BaseModel, Field
from crewai_tools import BaseTool
import git
import os
import shutil
from typing import Type
class GitCloneInput(BaseModel):
    """Input schema for GitTool.

    All fields except ``repo_url`` are optional; their annotations are
    Optional (``str | None``) to match the ``None`` defaults — a bare ``str``
    annotation with a ``None`` default is rejected by pydantic v2 validation.
    """
    repo_url: str = Field(..., description="URL of the Git repository to clone")
    branch: str | None = Field(None, description="Branch to checkout (optional)")
    commit: str | None = Field(None, description="Commit hash to checkout (optional)")
    target_dir: str | None = Field(None, description="Target directory to clone into (optional)")
class GitTool(BaseTool):
    """Tool that clones a Git repository and checks out a branch or commit.

    Arguments are validated against GitCloneInput before _run is invoked.
    """
    name: str = "GitTool"
    description: str = "Clones a Git repository and checks out a specific branch or commit"
    args_schema: Type[BaseModel] = GitCloneInput

    def _run(self, repo_url: str, branch: str | None = None, commit: str | None = None,
             target_dir: str | None = None) -> str:
        """
        Clone a Git repository and checkout a specific branch or commit.

        Args:
            repo_url: URL of the Git repository to clone
            branch: Branch to checkout (optional; takes precedence over commit)
            commit: Commit hash to checkout (optional)
            target_dir: Target directory to clone into (optional; derived from
                the repository name when omitted)

        Returns:
            A message indicating the result of the operation.
        """
        # Derive the directory name from the URL when none is given.
        # rstrip("/") guards against URLs with a trailing slash, which would
        # otherwise yield an empty directory name.
        if target_dir is None:
            target_dir = repo_url.rstrip("/").split("/")[-1]
            if target_dir.endswith(".git"):
                target_dir = target_dir[:-4]
        # Remove any pre-existing directory so the clone starts clean.
        if os.path.exists(target_dir):
            shutil.rmtree(target_dir)
        try:
            # Clone the repository
            repo = git.Repo.clone_from(repo_url, target_dir)
            # Checkout the specified branch or commit (branch wins if both given)
            if branch:
                repo.git.checkout(branch)
                checked_out = f"branch: {branch}"
            elif commit:
                repo.git.checkout(commit)
                checked_out = f"commit: {commit}"
            else:
                checked_out = "default branch"
            return f"Successfully cloned {repo_url} into {target_dir} and checked out {checked_out}"
        except Exception as e:
            return f"Error cloning repository: {str(e)}"