Spaces:

YashashviAlva
/

codeSentry

Running

App Files Files Community

codeSentry / codesentry-backend /tools /vulnerability_db.py

YashashviAlva

Initial commit for HF Spaces deploy

7b4f5dd 1 day ago

raw

history blame contribute delete

13.4 kB

	"""
	OWASP Top-10 (2021) + OWASP LLM Top-10 knowledge base.
	Used by the security agent as a structured reference during analysis.
	"""
	from __future__ import annotations

	from typing import Dict, List


	# ──────────────────────────────────────────────
	# OWASP LLM Top-10 (v1.1 / 2023 numbering and names, not the 2025 renumbering)
	# ──────────────────────────────────────────────

	# Knowledge base of LLM-specific risk categories, keyed by category ID.
	#
	# Every entry carries the same fields:
	#   id          - the category ID (same value as the mapping key)
	#   name        - short human-readable title
	#   description - what the risk is
	#   examples    - typical code-level manifestations
	#   severity    - "critical" / "high" / "medium"
	#   cwe         - associated CWE identifier
	#   patterns    - regular-expression source strings used for scanning
	#
	# Only LLM01-LLM04, LLM06, LLM08 and LLM09 are present in this table.
	#
	# The regexes use `\s*=\s*` so that both `x=1` and `x = 1` are matched, and
	# plain `|` for alternation (an escaped `\|` would match a literal pipe).
	OWASP_LLM_TOP10: Dict[str, Dict] = {
	    "LLM01": {
	        "id": "LLM01",
	        "name": "Prompt Injection",
	        "description": (
	            "User-supplied input alters the intended behaviour of a model prompt. "
	            "Direct injections override system prompts; indirect injections are embedded "
	            "in external content the model processes."
	        ),
	        "examples": [
	            "Concatenating user input directly into a prompt string",
	            "Trusting model output for routing/tool calls without sanitisation",
	            "Allowing retrieval of attacker-controlled documents in RAG pipelines",
	        ],
	        "severity": "critical",
	        "cwe": "CWE-74",
	        "patterns": [
	            # f-string that interpolates something containing "user"
	            r"f['\"].*\{.*user.*\}",
	            # prompt built by `+` concatenation with request data
	            r"prompt\s*=\s*.*\+.*request",
	            r"format\(.*user_input",
	            r"\.format\(.*query",
	        ],
	    },
	    "LLM02": {
	        "id": "LLM02",
	        "name": "Insecure Output Handling",
	        "description": (
	            "LLM-generated text is passed to downstream components (shell, SQL, browser) "
	            "without validation or sanitisation."
	        ),
	        "examples": [
	            "Passing model response to eval()",
	            "Executing model-generated SQL without parameterisation",
	            "Rendering model HTML output without escaping",
	        ],
	        "severity": "critical",
	        "cwe": "CWE-116",
	        "patterns": [
	            # negative look-behind skips attribute calls such as `model.eval(`
	            r"(?<!\.)eval\s*\(",
	            r"(?<!\.)exec\s*\(",
	            r"subprocess.*shell\s*=\s*True",
	            r"os\.system\s*\(",
	        ],
	    },
	    "LLM03": {
	        "id": "LLM03",
	        "name": "Training Data Poisoning",
	        "description": (
	            "Malicious or corrupted data introduced into training / fine-tuning pipelines "
	            "causing biased, backdoored, or degraded model behaviour."
	        ),
	        "examples": [
	            "No data validation before fine-tuning",
	            "Loading training datasets from unverified URLs",
	            "Accepting user-supplied training examples without filtering",
	        ],
	        "severity": "high",
	        "cwe": "CWE-20",
	        "patterns": [
	            r"download.*dataset",
	            r"load_dataset\(.*http",
	            r"requests\.get.*train",
	            r"urllib.*train",
	        ],
	    },
	    "LLM04": {
	        "id": "LLM04",
	        "name": "Model Denial of Service",
	        "description": (
	            "Inputs crafted to consume excessive compute resources "
	            "(token bombs, unbounded context, recursive prompts)."
	        ),
	        "examples": [
	            "No max_tokens / max_length enforcement",
	            "Accepting arbitrarily long user prompts",
	            "Recursive agent calls without depth limit",
	        ],
	        "severity": "high",
	        "cwe": "CWE-400",
	        "patterns": [
	            r"max_tokens\s*=\s*None",
	            r"max_length\s*=\s*None",
	            r"while True.*generate",
	        ],
	    },
	    "LLM06": {
	        "id": "LLM06",
	        "name": "Sensitive Information Disclosure",
	        "description": (
	            "Model reveals confidential training data, system prompts, API keys, "
	            "or PII due to insufficient access controls or prompt engineering."
	        ),
	        "examples": [
	            "Hardcoded API keys passed in prompts",
	            "PII embedded in embedding vectors",
	            "System prompt leaked via adversarial queries",
	        ],
	        "severity": "high",
	        "cwe": "CWE-200",
	        "patterns": [
	            # case-insensitive: any of the listed variable names assigned a quoted literal
	            r"(?i)(api_key|hf_token|openai_api_key|secret_key)\s*=\s*['\"][A-Za-z0-9_\-]{10,}",
	            r"(?i)bearer\s+[A-Za-z0-9_\-\.]{20,}",
	            r"(?i)sk-[A-Za-z0-9]{32,}",
	            r"(?i)hf_[A-Za-z0-9]{20,}",
	        ],
	    },
	    "LLM08": {
	        "id": "LLM08",
	        "name": "Excessive Agency",
	        "description": (
	            "An LLM agent is granted more permissions or capabilities than needed, "
	            "allowing it to take unintended high-impact actions."
	        ),
	        "examples": [
	            "Agent has filesystem write access with no scope limit",
	            "Agent can call any external API without allowlist",
	            "No human-in-the-loop for destructive operations",
	        ],
	        "severity": "high",
	        "cwe": "CWE-269",
	        "patterns": [
	            r"tools\s*=\s*\[.*all_tools",
	            r"allow_dangerous_requests\s*=\s*True",
	            r"run_manager.no.confirm",
	        ],
	    },
	    "LLM09": {
	        "id": "LLM09",
	        "name": "Overreliance",
	        "description": (
	            "System depends on LLM output for critical decisions without human oversight "
	            "or validation layers."
	        ),
	        "examples": [
	            "Auto-executing LLM-suggested shell commands",
	            "Financial decisions made purely from model output",
	            "No fallback when model returns malformed data",
	        ],
	        "severity": "medium",
	        "cwe": "CWE-636",
	        "patterns": [
	            r"auto_run\s*=\s*True",
	            r"autonomous.*mode",
	            r"no.human.loop",
	        ],
	    },
	}


	# ──────────────────────────────────────────────
	# OWASP Web Top-10 applied to ML serving
	# ──────────────────────────────────────────────

	# OWASP Web Top-10 categories as they show up in ML serving code, keyed by
	# category ID. Each entry has: id, name, description, severity, cwe and
	# patterns (regular-expression source strings used for scanning).
	#
	# A06 and A09 are not present in this table.
	#
	# Alternation uses plain `|` (an escaped `\|` would match a literal pipe) and
	# assignments are matched with `\s*=\s*` so spacing around `=` is optional.
	OWASP_WEB_TOP10: Dict[str, Dict] = {
	    "A01": {
	        "id": "A01",
	        "name": "Broken Access Control",
	        "description": "Model endpoints exposed without authentication.",
	        "severity": "critical",
	        "cwe": "CWE-284",
	        "patterns": [
	            r"@app\.route.*methods.*POST",
	            r"router\.(post|get|put)\s*\(",
	        ],
	    },
	    "A02": {
	        "id": "A02",
	        "name": "Cryptographic Failures",
	        "description": "Sensitive data transmitted or stored without encryption.",
	        "severity": "high",
	        "cwe": "CWE-311",
	        "patterns": [
	            # plain-http URL, except loopback hosts
	            r"http://(?!localhost|127\.0\.0\.1)",
	            r"verify\s*=\s*False",
	        ],
	    },
	    "A03": {
	        "id": "A03",
	        "name": "Injection",
	        "description": "SQL/command injection in RAG pipeline queries or model serving endpoints.",
	        "severity": "critical",
	        "cwe": "CWE-89",
	        "patterns": [
	            r"cursor\.execute\s*\(\s*f['\"]",
	            r'cursor\.execute\s*\(\s*".*%s',
	            r"\.format\(.*user",
	            r"SELECT.*\+.*user_input",
	        ],
	    },
	    "A04": {
	        "id": "A04",
	        "name": "Insecure Design",
	        "description": "Pickle deserialization from untrusted model file sources.",
	        "severity": "critical",
	        "cwe": "CWE-502",
	        "patterns": [
	            r"pickle\.load\s*\(",
	            r"pickle\.loads\s*\(",
	            r"torch\.load\s*\(.*map_location",
	            r"joblib\.load\s*\(",
	        ],
	    },
	    "A05": {
	        "id": "A05",
	        "name": "Security Misconfiguration",
	        "description": "Debug mode enabled, CORS unrestricted, or default credentials.",
	        "severity": "medium",
	        "cwe": "CWE-16",
	        "patterns": [
	            r"debug\s*=\s*True",
	            r'allow_origins\s*=\s*\["\*"\]',
	            # "cors" followed later on the same line by a literal `*` wildcard
	            r"cors.*\*",
	        ],
	    },
	    "A07": {
	        "id": "A07",
	        "name": "Identification and Authentication Failures",
	        "description": "Hardcoded API keys or tokens in source code.",
	        "severity": "critical",
	        "cwe": "CWE-798",
	        "patterns": [
	            r"(?i)(password|passwd|pwd)\s*=\s*['\"].{4,}['\"]",
	            r"(?i)(api_key|apikey|api_secret)\s*=\s*['\"][^'\"]{6,}['\"]",
	            r"(?i)token\s*=\s*['\"][A-Za-z0-9_\-\.]{10,}['\"]",
	        ],
	    },
	    "A08": {
	        "id": "A08",
	        "name": "Software and Data Integrity Failures",
	        "description": "Loading model weights or packages from unverified sources without integrity checks.",
	        "severity": "high",
	        "cwe": "CWE-494",
	        "patterns": [
	            r"torch\.hub\.load\s*\(",
	            r"from_pretrained\s*\(.*http",
	            r"requests\.get.*model.*verify\s*=\s*False",
	        ],
	    },
	    "A10": {
	        "id": "A10",
	        "name": "Server-Side Request Forgery",
	        "description": "User-controlled URLs fetched by the server (e.g. model download path).",
	        "severity": "high",
	        "cwe": "CWE-918",
	        "patterns": [
	            r"requests\.get\s*\(\s*request\.",
	            r"urllib\.request\.urlopen\s*\(\s*(user|param|input|query)",
	        ],
	    },
	}


	# ──────────────────────────────────────────────
	# ML-specific vulnerability patterns
	# ──────────────────────────────────────────────

	# ML-specific findings that have no OWASP category. Unlike the OWASP tables
	# this is a list; each entry identifies itself through its "id" field.
	#
	# Fields: id, name, description, severity, cwe, patterns (regex source
	# strings that flag the issue) and, on some entries, anti_patterns (regex
	# source strings for the corresponding mitigation).
	#
	# Alternation uses plain `|` (an escaped `\|` would match a literal pipe) and
	# `\s*` / `.*` quantifiers keep the patterns tolerant of spacing.
	ML_SPECIFIC_VULNS: List[Dict] = [
	    {
	        "id": "ML01",
	        "name": "GPU Memory Leak — Tensor Not Released",
	        "description": "GPU tensors retained on device after inference causing progressive VRAM exhaustion.",
	        "severity": "high",
	        "cwe": "CWE-401",
	        "patterns": [
	            r"\.cuda\(\)",
	            r"\.to\(['\"]cuda['\"]",
	            r"\.to\(device\)",
	        ],
	        "anti_patterns": [
	            r"\.cpu\(\)",
	            r"del\s+",
	            r"torch\.cuda\.empty_cache",
	        ],
	    },
	    {
	        "id": "ML02",
	        "name": "Missing @torch.no_grad on Inference",
	        "description": "Running inference without no_grad() computes unnecessary gradients, wasting 2x memory.",
	        "severity": "medium",
	        "cwe": "CWE-400",
	        "patterns": [
	            r"def\s+(predict|infer|inference|generate|forward)\s*\(",
	        ],
	        "anti_patterns": [
	            r"@torch\.no_grad",
	            r"with torch\.no_grad",
	        ],
	    },
	    {
	        "id": "ML03",
	        "name": "N+1 Embedding Calls",
	        "description": "Embedding model called once per item in a loop instead of in a single batch call.",
	        "severity": "medium",
	        "cwe": "CWE-405",
	        "patterns": [
	            # these span two lines (`for ...:` then the call), so they need
	            # multi-line input rather than a single source line
	            r"for .* in .*:\s*\n.*embed",
	            r"for .* in .*:\s*\n.*encode",
	        ],
	    },
	    {
	        "id": "ML04",
	        "name": "FP32 Inference — Should Use FP16/BF16",
	        "description": "Model loaded in float32 wastes 2x VRAM vs float16/bfloat16.",
	        "severity": "low",
	        "cwe": "CWE-400",
	        "patterns": [
	            r"torch_dtype\s*=\s*torch\.float32",
	            r"\.float\(\)",
	        ],
	        # NOTE(review): "torch_dtype" below also occurs in the first pattern
	        # above; confirm how the scanner combines patterns and anti_patterns.
	        "anti_patterns": [
	            r"float16|bfloat16|fp16|bf16|torch_dtype",
	        ],
	    },
	    {
	        "id": "ML05",
	        "name": "Synchronous Model Loading in Request Handler",
	        "description": "Loading model weights inside a per-request handler blocks the event loop and causes timeouts.",
	        "severity": "high",
	        "cwe": "CWE-400",
	        "patterns": [
	            r"(AutoModel|AutoTokenizer|from_pretrained).inside.route",
	            # two-line match: handler `def` line followed by a from_pretrained call
	            r"def\s+(predict|infer).*:\s*\n.*from_pretrained",
	        ],
	    },
	]


	# ──────────────────────────────────────────────
	# Convenience accessors
	# ──────────────────────────────────────────────

	# Single lookup table over both OWASP tables: LLM categories first, then the
	# web categories (a web entry would replace an LLM entry with the same key).
	ALL_CATEGORIES: Dict[str, Dict] = dict(OWASP_LLM_TOP10)
	ALL_CATEGORIES.update(OWASP_WEB_TOP10)


	def get_category(category_id: str) -> Dict:
	    """Look up one OWASP category entry by its ID.

	    The ID is upper-cased before the lookup, so ``'llm01'`` and ``'LLM01'``
	    resolve to the same entry.

	    Args:
	        category_id: Category ID such as ``'LLM01'`` or ``'A03'``.

	    Returns:
	        The entry stored in ``ALL_CATEGORIES`` under that ID, or an empty
	        dict when the ID is unknown.
	    """
	    key = category_id.upper()
	    try:
	        return ALL_CATEGORIES[key]
	    except KeyError:
	        return {}


	def get_all_patterns() -> List[Dict]:
	    """Flatten every detection regex into one list of scan records.

	    Entries from ``ALL_CATEGORIES`` come first, identified by their mapping
	    key; entries from ``ML_SPECIFIC_VULNS`` follow, identified by their
	    ``"id"`` field. Only the ``"patterns"`` lists are expanded;
	    ``"anti_patterns"`` do not appear in the output.

	    Returns:
	        One dict per regex with the keys ``pattern``, ``category_id``,
	        ``category_name``, ``severity``, ``cwe`` (``""`` when the entry
	        has none) and ``description``.
	    """

	    def _record(regex, ident, entry):
	        # One flat row pairing a regex with the metadata of its owning entry.
	        return {
	            "pattern": regex,
	            "category_id": ident,
	            "category_name": entry["name"],
	            "severity": entry["severity"],
	            "cwe": entry.get("cwe", ""),
	            "description": entry["description"],
	        }

	    flat = [
	        _record(regex, key, entry)
	        for key, entry in ALL_CATEGORIES.items()
	        for regex in entry.get("patterns", [])
	    ]
	    flat += [
	        _record(regex, vuln["id"], vuln)
	        for vuln in ML_SPECIFIC_VULNS
	        for regex in vuln.get("patterns", [])
	    ]
	    return flat