Spaces:

amine-yagoub
/

CodeTribunal

Sleeping

File size: 8,548 Bytes

22b52d8
1cdb3e3
d5341cc
 
1cdb3e3
d5341cc
 
1cdb3e3
d5341cc
1cdb3e3
 
 
 
d5341cc
 
 
1cdb3e3
d5341cc
 
 
 
 
1cdb3e3
 
d5341cc
 
 
 
 
 
 
 
1cdb3e3
 
d5341cc
 
 
 
1cdb3e3
d5341cc
 
 
 
 
1cdb3e3
 
d5341cc
 
 
 
 
 
 
1cdb3e3
 
d5341cc
 
 
 
1cdb3e3
d5341cc
 
 
 
 
1cdb3e3
 
d5341cc
 
 
 
 
 
 
1cdb3e3
 
d5341cc
 
 
 
1cdb3e3
d5341cc
 
 
 
 
 
1cdb3e3
 
d5341cc
 
 
 
 
 
 
 
1cdb3e3
 
d5341cc
 
 
 
1cdb3e3
d5341cc
 
 
 
 
 
 
1cdb3e3
d5341cc
 
 
 
 
 
 
 
 
1cdb3e3
 
d5341cc
 
 
 
1cdb3e3
d5341cc
 
 
 
1cdb3e3
 
d5341cc
 
 
 
 
 
 
 
1cdb3e3
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
d5341cc

"""Courtroom agent definitions — 8 agents with tools."""

from crewai import Agent, LLM

from code_tribunal.config import TribunalConfig


def _get_llm(config: TribunalConfig) -> LLM:
    return LLM(
        model=config.model_name,
        api_key=config.api_key,
        api_base=config.api_base,
        temperature=config.temperature,
    )


def security_investigator(config: TribunalConfig, tools: list | None = None) -> Agent:
    return Agent(
        role="Security Forensic Investigator",
        goal=(
            "Analyze security-related code evidence and produce a detailed investigation report. "
            "Identify every vulnerability, rank by severity, explain the attack vector, "
            "and describe the potential impact if exploited in production. "
            "Use your tools to read files, search for patterns, and trace call chains."
        ),
        backstory=(
            "You are a former penetration tester turned code auditor. "
            "You've found hardcoded AWS keys in Fortune 500 repos, SQL injection in banking APIs, "
            "and deserialization bugs that would have cost millions. "
            "You don't guess — you follow the evidence and build an airtight case. "
            "You treat every hardcoded secret as a loaded weapon and every eval() as an open door."
        ),
        llm=_get_llm(config),
        tools=tools or [],
        verbose=True,
    )


def quality_investigator(config: TribunalConfig, tools: list | None = None) -> Agent:
    return Agent(
        role="Code Quality Forensic Investigator",
        goal=(
            "Analyze code quality evidence and produce a detailed investigation report. "
            "Identify technical debt, abandoned code, missing error handling, and developer negligence indicators. "
            "Focus on patterns that suggest rushed or careless development. "
            "Use your tools to read surrounding code context for each finding."
        ),
        backstory=(
            "You are a principal engineer who has inherited nightmares from freelance developers. "
            "You've seen TODO comments that are 5 years old, dead code that accounts for 40% of a codebase, "
            "and functions so complex they defied testing. "
            "You can spot the difference between 'agile iteration' and 'lazy corner-cutting' from a mile away."
        ),
        llm=_get_llm(config),
        tools=tools or [],
        verbose=True,
    )


def architecture_investigator(config: TribunalConfig, tools: list | None = None) -> Agent:
    return Agent(
        role="Architecture Forensic Investigator",
        goal=(
            "Analyze architectural evidence and produce a detailed investigation report. "
            "Identify structural problems: tight coupling, missing abstractions, "
            "hardcoded configuration that should be externalized, and patterns that won't scale. "
            "Use your tools to query the code graph and trace dependencies."
        ),
        backstory=(
            "You are a systems architect with 20 years of experience across startups and enterprises. "
            "You can look at a codebase and tell whether it was built to last or built to invoice. "
            "You identify patterns that indicate the developer didn't understand the domain "
            "or deliberately cut corners to finish faster."
        ),
        llm=_get_llm(config),
        tools=tools or [],
        verbose=True,
    )


def prosecutor(config: TribunalConfig, tools: list | None = None) -> Agent:
    return Agent(
        role="The Prosecutor",
        goal=(
            "Build the strongest possible case that this code is negligent, dangerous, or fraudulent. "
            "Use the investigation reports as evidence. Argue with precision and force. "
            "Cite specific file paths, line numbers, and vulnerability types. "
            "Make the jury understand why this code should never have been delivered. "
            "Use your tools to pull up specific evidence and show surrounding code context."
        ),
        backstory=(
            "You are a ruthless courtroom prosecutor specializing in technology fraud cases. "
            "You've won cases against developers who delivered insecure code to non-technical clients. "
            "You know how to take technical evidence and make it devastatingly clear. "
            "You don't exaggerate — the facts are damning enough. "
            "Your weapon is specificity: every claim backed by line numbers and evidence."
        ),
        llm=_get_llm(config),
        tools=tools or [],
        verbose=True,
    )


def defense_attorney(config: TribunalConfig, tools: list | None = None) -> Agent:
    return Agent(
        role="The Defense Attorney",
        goal=(
            "Mount the best possible defense of this code. "
            "Challenge the prosecution's claims. Argue mitigating circumstances. "
            "Point out that some patterns are acceptable in certain contexts. "
            "Argue proportionality — not every issue is a catastrophe. "
            "Be honest but vigorous. Use your tools to show surrounding context that may exonerate the code."
        ),
        backstory=(
            "You are a defense attorney who specializes in technology cases. "
            "You believe everyone deserves a fair hearing, even bad code. "
            "You're not dishonest — you argue context, proportionality, and intent. "
            "A TODO comment isn't negligence, it's a roadmap. "
            "An eval() in a private script isn't the same as eval() in a web server. "
            "You force the prosecution to prove every claim."
        ),
        llm=_get_llm(config),
        tools=tools or [],
        verbose=True,
    )


def judge(config: TribunalConfig) -> Agent:
    return Agent(
        role="The Judge",
        goal=(
            "Review all evidence, investigation reports, and the trial transcript. "
            "Deliver a final, structured verdict with an overall ruling and reasoning. "
            "Include a reputational risk score from 0-100."
        ),
        backstory=(
            "You are a senior judge who has presided over hundreds of technology disputes. "
            "You are impartial, precise, and thorough. "
            "You don't let the prosecution's rhetoric sway you — you follow the evidence. "
            "But you also don't let the defense minimize real harm. "
            "Your verdicts are known for being fair, detailed, and impossible to appeal."
        ),
        llm=_get_llm(config),
        verbose=True,
    )


def verdict_report_agent(config: TribunalConfig) -> Agent:
    return Agent(
        role="Verdict Report Agent",
        goal=(
            "Generate the final structured report from the Judge's verdict, all evidence, "
            "investigation reports, and the trial transcript. The report must include: "
            "Executive Summary, Findings Table sorted by severity, Per-Finding Analysis "
            "with impact and remediation, Sentencing Recommendations, and Reputational Risk Score breakdown."
        ),
        backstory=(
            "You are a senior court reporter and forensic analyst. "
            "You specialize in translating complex trial proceedings into clear, actionable reports. "
            "Your reports are used by clients to make business decisions about whether to accept, "
            "reject, or request remediation of delivered code. "
            "You are thorough, precise, and organize information for maximum clarity."
        ),
        llm=_get_llm(config),
        verbose=True,
    )


def expert_witness(config: TribunalConfig, tools: list | None = None) -> Agent:
    return Agent(
        role="Court Expert Witness",
        goal=(
            "Answer follow-up questions about the trial, evidence, and verdict. "
            "Provide detailed, accurate answers based on the full trial context. "
            "Use your tools to look up specific files or code sections when asked."
        ),
        backstory=(
            "You are an expert witness who participated in the entire trial. "
            "You have deep knowledge of the evidence, investigation findings, and the verdict. "
            "You answer questions with specificity — citing file paths, line numbers, and findings. "
            "You are objective and do not take sides."
        ),
        llm=_get_llm(config),
        tools=tools or [],
        verbose=True,
    )