Spaces:

build-small-hackathon
/

multi-agent-lab

Running on Zero

multi-agent-lab / src /core /structured.py

agharsallah

feat: Implement well-known typed fields for verdicts in output models

ce159dc 10 days ago

19.3 kB

	"""Structured output for agent responses — two layers, one schema.

	Small models comply better under constraint. Asking for free prose is
	where they drift. Asking for a specific JSON schema is where they stay
	in character.

	Two paths share the same ``{kind, text, …}`` shape:

	- Live path (validated). ``build_output_model`` turns an agent's
	``may_emit`` grant + ``output_extra_fields`` into a Pydantic model whose
	``kind`` is constrained to the allowed kinds. The live provider asks the
	model for that model and retries on validation failure, so the payload is
	valid by construction — no malformed prose ever reaches the ledger.
	- Offline path (tolerant parse). ``json_instruction`` appends a JSON
	block to the prompt and ``parse_agent_output`` normalises whatever text the
	deterministic stub returns, wrapping non-compliant prose in the fallback
	kind. This keeps demos and tests fully offline with no dependency.

	Both paths are model/provider-agnostic: the live constraint rides on the same
	``{kind, text, …}`` contract the parser produces, so downstream
	(``Event`` construction, conductor, ledger) is identical either way.
	"""

	from __future__ import annotations

	import json
	import re
	from typing import TYPE_CHECKING, Any, Literal

	from src.models.provider import is_model_error

	if TYPE_CHECKING:
	from pydantic import BaseModel


	# ── output schema ─────────────────────────────────────────────────────────────


	class AgentOutputError(ValueError):
	"""Raised when output cannot be normalised to a valid event payload."""


	# ── well-known typed extra fields ──────────────────────────────────────────────


	# A small, curated table of engine-known extra fields (ADR-0029). Most
	# ``output_extra_fields`` are arbitrary scenario fields (``mood``, ``wants``, …) and
	# remain required strings, but ``winner`` and ``scores`` are the verdict contract
	# ADR-0026 already names in ``run.finished`` — so the engine gives them real types:
	# an optional cast name and an optional ``{player: score}`` map. Each entry pairs
	# the Pydantic field spec (built lazily so ``Field`` stays a local import) with the
	# JSON-schema hint ``json_instruction`` renders for that field. Anything not in this
	# table hits the other row and behaves exactly as before — back-compat is total.
	def _well_known_specs() -> dict[str, tuple[Any, str]]:
	"""Return ``{field: (pydantic_spec, json_hint)}`` for engine-known extra fields.

	Built behind a function so ``Field`` is a local import (matching the lazy-import
	idiom of ``build_output_model``) and never touched on the offline path that
	doesn't construct a validated model.
	"""
	from pydantic import Field

	# The hint is the literal JSON value to render after ``"<field>": `` — a quoted
	# string for ``winner``, a bare object for ``scores`` (it is not a string value).
	return {
	"winner": ((str \| None, None), '"<a player\'s name, or null>"'),
	"scores": ((dict[str, float], Field(default_factory=dict)), '{"<player>": 0-10}'),
	}


	# ── validated output model (live path) ─────────────────────────────────────────


	def build_output_model(
	allowed_kinds: list[str],
	extra_fields: list[str] \| None = None,
	) -> type["BaseModel"]:
	"""Build a Pydantic model for an agent's validated output.

	``kind`` is constrained to allowed_kinds via a ``Literal``, so the model
	cannot emit a kind it is not authorised for; ``text`` is a required string.
	extra_fields are required strings too, except the **well-known typed
	fields** of ADR-0029: ``winner`` becomes ``str \| None`` (default ``None``) and
	``scores`` becomes ``dict[str, float]`` (default ``{}``). Used on the live path
	with structured output: the provider retries on validation failure and returns a
	valid instance, which means the malformed-prose ``_raw_fallback`` path is never
	taken.

	Args:
	allowed_kinds: event kinds this agent may emit (the ``may_emit`` grant,
	reflection excluded). Must be non-empty.
	extra_fields: optional additional payload fields (e.g. ``"emotion"``). Each
	is a required string alongside ``text`` unless it is a well-known typed
	field (``winner``, ``scores``), which is optional with a typed default.
	"""
	if not allowed_kinds:
	raise AgentOutputError("build_output_model requires at least one allowed kind")

	from pydantic import create_model

	well_known = _well_known_specs()
	# A single-element Literal is legal and still constrains to that one kind.
	kind_type = Literal[tuple(allowed_kinds)] # type: ignore[valid-type]
	fields: dict[str, Any] = {
	"kind": (kind_type, ...),
	"text": (str, ...),
	}
	for name in extra_fields or []:
	spec, _hint = well_known.get(name, ((str, ...), None))
	fields[name] = spec

	return create_model(
	"AgentOutput",
	__doc__="Validated agent event payload (kind constrained to may_emit).",
	**fields,
	)


	# ── prompt instruction ────────────────────────────────────────────────────────


	def json_instruction(allowed_kinds: list[str], extra_fields: list[str] \| None = None) -> str:
	"""Return the JSON constraint block appended to every agent prompt.

	For ordinary fields the schema hint is the uniform ``"...": "..."`` shape. When
	a well-known typed field of ADR-0029 is present, that field gets a typed hint
	instead (``"winner": "<a player's name, or null>"``,
	``"scores": {"<player>": 0-10}``) so a small model knows it may answer ``null`` or
	a number map rather than a sentence. Manifests with no well-known field render
	byte-identically to the original uniform schema.

	Args:
	allowed_kinds: event kinds this agent may emit.
	extra_fields: optional additional payload fields (e.g. "emotion", "wants").
	"""
	fields = extra_fields or []
	well_known = _well_known_specs()
	kinds_str = " \| ".join(allowed_kinds)

	if any(name in well_known for name in fields):
	# Richer per-field schema: typed hints for known fields, "..." for the rest.
	# Only taken when a well-known field is present, so the common case below
	# stays byte-identical to the original uniform-schema output.
	hints = {"kind": '"..."', "text": '"..."'}
	for name in fields:
	_spec, hint = well_known.get(name, (None, None))
	hints[name] = hint if hint is not None else '"..."'
	schema_body = ", ".join(f'"{name}": {hints[name]}' for name in ["kind", "text", *fields])
	schema_line = f"Schema: {{{schema_body}}}\n"
	else:
	field_list = '", "'.join(["kind", "text"] + list(fields))
	schema_line = f'Schema: {{"{field_list}": "..."}}\n'

	return (
	"\n\nOUTPUT FORMAT\n"
	"Reply with a single JSON object and NOTHING else. No analysis, no reasoning, "
	"no <think> blocks, no markdown fences, no text before or after the JSON.\n"
	f"{schema_line}"
	f"kind must be one of: {kinds_str}\n"
	"text must be one or two sentences, vivid and specific — your line, never your reasoning.\n"
	"If you were given a secret word, never spell or quote it; describe it only.\n"
	"Example: "
	'{"kind": "' + allowed_kinds[0] + '", "text": "A brief, evocative response."}'
	)


	# ── parser ────────────────────────────────────────────────────────────────────

	# Reasoning models (and chat models told to "think") often wrap their scratchpad
	# in tagged blocks or fence the JSON. We strip those before parsing so a stray
	# chain-of-thought never reaches the ledger as the spoken line — the leak we saw
	# live, where "…I think the word is COFFEE…" was emitted as an agent's clue.
	_REASONING_BLOCK = re.compile(
	r"<\s(think\|thinking\|reason\|reasoning\|analysis\|scratchpad\|monologue)\s>(.?)<\s/\s\1\s>",
	re.DOTALL \| re.IGNORECASE,
	)
	# An UNTERMINATED reasoning block — the model was truncated mid-think (no closing tag),
	# so everything from the open tag onward is reasoning, not the answer.
	_REASONING_OPEN = re.compile(
	r"<\s(?:think\|thinking\|reason\|reasoning\|analysis\|scratchpad\|monologue)\s>",
	re.IGNORECASE,
	)
	_CODE_FENCE = re.compile(r"```[a-zA-Z]*\n?\|\n?```")
	# Sentences/lines that are obviously scratchpad or meta-commentary about the task —
	# used only when salvaging a fallback line, so a "thinking out loud" model's notes
	# ("But it must be one or two sentences…") don't become the spoken clue.
	_SCRATCHPAD_LINE = re.compile(
	r"^\s*(we (?:need\|must\|should\|are\|have)\|the (?:schema\|text\|clue\|answer\|response\|user)\|"
	r"thought\s:\|mood\s:\|json\s*:\|output\b\|let'?s\|but\b\|must\b\|i (?:need\|should\|must\|will\|think\|am\|'ll)\|"
	r"(?:one\|two) sentences?\|remember\b\|note\b\|so\b\|okay\b\|ok\b\|first\b\|now\b)",
	re.IGNORECASE,
	)
	# A quoted text value — from a partial JSON (``"text": "…"``) or a prose label (``Text: "…"``).
	_TEXT_VALUE = re.compile(r'(?:"text"\|text)\s:\s"([^"]{3,})"', re.IGNORECASE)
	_SENTENCE_SPLIT = re.compile(r"(?<=[.!?])\s+")


	def _strip_reasoning(raw: str) -> str:
	"""Remove reasoning blocks and code fences from raw.

	Strips closed ``<think>…</think>`` blocks, then — if an UNTERMINATED reasoning
	block remains (truncated mid-think) — drops everything from that open tag to the
	end, since none of it is the answer."""
	raw = _REASONING_BLOCK.sub(" ", raw or "")
	raw = _CODE_FENCE.sub("", raw)
	open_tag = _REASONING_OPEN.search(raw)
	if open_tag:
	raw = raw[: open_tag.start()]
	return raw.strip()


	def extract_reasoning(raw: str, limit: int = 600) -> str:
	"""Return the model's inline reasoning from raw (joined, trimmed).

	Captures both closed ``<think>…</think>`` blocks and an UNTERMINATED one (the
	truncated-mid-think case), so the mind-reader ``thought`` still has the thinking
	even when the answer never arrived. Empty when there are no reasoning tags — e.g.
	when vLLM split it into ``reasoning_content`` (captured separately by the provider).
	Never fed back into any agent's prompt."""
	raw = raw or ""
	parts = [m.group(2).strip() for m in _REASONING_BLOCK.finditer(raw)]
	remainder = _REASONING_BLOCK.sub(" ", raw)
	open_tag = _REASONING_OPEN.search(remainder)
	if open_tag:
	parts.append(remainder[open_tag.end() :].strip())
	return " ".join(p for p in parts if p)[:limit].strip()


	def _balanced_objects(text: str) -> list[str]:
	"""Return every top-level ``{...}`` substring in text, in order.

	A string-aware brace scan, so nested objects and braces inside string values
	don't truncate the match the way a flat ``\\{[^{}]+\\}`` regex would.
	"""
	objects: list[str] = []
	depth = 0
	start = -1
	in_str = False
	escape = False
	for i, ch in enumerate(text):
	if in_str:
	if escape:
	escape = False
	elif ch == "\\":
	escape = True
	elif ch == '"':
	in_str = False
	continue
	if ch == '"':
	in_str = True
	elif ch == "{":
	if depth == 0:
	start = i
	depth += 1
	elif ch == "}" and depth > 0:
	depth -= 1
	if depth == 0 and start >= 0:
	objects.append(text[start : i + 1])
	start = -1
	return objects


	def parse_agent_output(
	raw: str,
	allowed_kinds: list[str],
	fallback_kind: str,
	) -> dict[str, Any]:
	"""Parse raw model output into a validated event payload dict.

	Strategy:
	1. Strip tagged reasoning blocks and code fences.
	2. Parse the LAST balanced ``{...}`` object — a reasoning model that emits
	scratchpad before its answer puts the real payload last.
	3. Fall back to salvaging a safe line (never the raw chain-of-thought).

	Returns a dict with at least ``{"kind": str, "text": str}``. The caller
	constructs the Event from this dict.
	"""
	cleaned = _strip_reasoning(raw)

	for candidate in reversed(_balanced_objects(cleaned)):
	result = _try_parse(candidate, allowed_kinds, fallback_kind)
	if result is not None:
	return result

	# No parseable object — salvage a clean line, never the scratchpad.
	return {"kind": fallback_kind, **_salvage_text(cleaned), "_raw_fallback": True}


	def _salvage_text(cleaned: str) -> dict[str, str]:
	"""Recover a safe spoken line from unparseable output.

	In order: the quoted value the model intended (closed ``"text": "…"`` /
	``Text: "…"``); the tail after a lone opening quote (a clue the model began
	drafting before it was cut off); then the substantive sentences with
	scratchpad/meta dropped. Only a neutral placeholder if nothing survives — so a
	"thinking out loud" monologue never becomes the spoken line.
	"""
	m = _TEXT_VALUE.search(cleaned)
	if m:
	return {"text": m.group(1).strip()}
	# A lone (unterminated) opening quote — the model started drafting the clue.
	if cleaned.count('"') % 2 == 1:
	tail = cleaned.rsplit('"', 1)[-1].strip()
	if len(tail) >= 8 and not _SCRATCHPAD_LINE.match(tail):
	return {"text": tail[:280]}
	kept = [
	s.strip(" \"'")
	for s in _SENTENCE_SPLIT.split(cleaned)
	if len(s.strip()) >= 5 and not s.lstrip().startswith("{") and not _SCRATCHPAD_LINE.match(s.strip())
	]
	if kept:
	return {"text": " ".join(kept)[:280]}
	return {"text": "…"}


	# HARD meta — a secret-word leak or an echo of the JSON/format instruction. These must
	# NEVER become the spoken line; they always go to the (private) residue, even when nothing
	# else survives (better to skip the turn than ship the secret or the schema).
	_HARD_META = re.compile(
	r"secret word\|the word is\|my word\|also include\|must (?:include\|output\|name\|provide)\|"
	r"\bjson\b\|\bschema\b\|\bmood\b\|\bthought\b\|one or two sentence\|vivid and specific\|"
	r"\bagent\.\w+\|brief,? evocative\|output format\|\bfield\b",
	re.IGNORECASE,
	)
	# SOFT meta — a scratchpad/planning preamble or a first-person opener ("Alright, the user
	# wants me to play as CARA…", "Let me… I should…", "I think mine is…"). Dropped to residue
	# when real speech survives alongside it, but PROMOTED to the spoken line when it is all the
	# model gave: on the prose fallback an over-thinker's "I think mine is…" is in-character
	# speech, not reasoning, so shipping it beats raising "no usable line" and skipping the turn.
	_SOFT_META = re.compile(
	r"need to\|have to\|must be\b\|"
	r"\balright\b\|\bokay\b\|the user\b\|looking at\|let me\b\|my clue\b\|play as\b\|"
	r"\bas (?:cara\|bex\|nil\|ovo)\b\|i (?:should\|need\|must\|will\|think\|'ll\|'m\|am)\b\|the (?:scenario\|game\|prompt)\b",
	re.IGNORECASE,
	)
	# A standalone ALL-CAPS token (≥3 letters) — personas write the secret as COFFEE / TEA /
	# TREE, and a model that slips it does so in caps; clues never do. A generic word-leak guard.
	_CAPS_TOKEN = re.compile(r"\b[A-Z]{3,}\b")
	_EXAMPLE_ECHO = "a brief, evocative response"


	def _is_hard_meta(sentence: str) -> bool:
	"""True if sentence leaks the secret (caps token) or echoes the format instruction —
	never a spoken line, no matter what."""
	return bool(_HARD_META.search(sentence)) or bool(_CAPS_TOKEN.search(sentence))


	def _is_meta(sentence: str) -> bool:
	"""True if sentence is hard meta or a soft scratchpad/planning preamble."""
	return _is_hard_meta(sentence) or bool(_SOFT_META.search(sentence))


	def clean_clue(raw: str) -> tuple[str, str]:
	"""Extract a clean spoken line from PROSE output, plus the residue.

	Used on the live fallback when a model ignores the JSON schema and just talks
	(often a small or reasoning model). Returns ``(clue, residue)``: clue is the
	spoken line with reasoning blocks and meta-commentary sentences stripped (``""``
	when nothing usable survives — the caller then skips the turn rather than ship
	junk); residue is the stripped thinking, usable as the private mind-reader
	thought (never shown to other agents)."""
	residue: list[str] = []
	reasoning = extract_reasoning(raw) # closed + unterminated <think>, the truncated case
	if reasoning:
	residue.append(reasoning)
	cleaned = _strip_reasoning(raw)

	m = _TEXT_VALUE.search(cleaned)
	if m:
	return m.group(1).strip(), " ".join(p for p in residue if p)[:600].strip()

	if cleaned.count('"') % 2 == 1:
	tail = cleaned.rsplit('"', 1)[-1].strip()
	if len(tail) >= 8 and not _is_meta(tail):
	cleaned = tail

	kept: list[str] = []
	soft: list[str] = []
	for s in _SENTENCE_SPLIT.split(cleaned):
	sentence = s.strip()
	if len(sentence) < 6 or sentence.startswith("{"):
	continue
	clean_sentence = sentence.strip(" \"'")
	if _is_hard_meta(sentence):
	residue.append(clean_sentence)
	elif _SOFT_META.search(sentence):
	soft.append(clean_sentence)
	else:
	kept.append(clean_sentence)

	# Soft meta rides as private residue when real speech survives — but when it's all the
	# model gave, it IS the line: a "thinking out loud" opener still passed every hard guard
	# (no secret word, no schema echo), so shipping it beats skipping the turn.
	if kept:
	residue.extend(soft)
	else:
	kept = soft

	return " ".join(kept)[:300].strip(), " ".join(p for p in residue if p)[:600].strip()


	def is_usable_line(text: str) -> bool:
	"""True when text is a real spoken line — not empty, a ``…`` placeholder, the
	example, or a provider failure sentinel that slipped through (defense in depth: the
	agent already raises on a model error before this gate, see ADR-0023)."""
	if is_model_error(text):
	return False
	normalized = (text or "").strip().lower().strip(" .…\"'")
	return len(normalized) >= 6 and normalized != _EXAMPLE_ECHO


	def _try_parse(s: str, allowed_kinds: list[str], fallback_kind: str) -> dict[str, Any] \| None:
	try:
	data = json.loads(s)
	except json.JSONDecodeError:
	return None

	if not isinstance(data, dict):
	return None

	# Normalise kind
	kind = data.get("kind", fallback_kind)
	if kind not in allowed_kinds:
	kind = fallback_kind
	data["kind"] = kind

	# Ensure text exists
	if "text" not in data or not isinstance(data.get("text"), str):
	data["text"] = str(data.get("content", data.get("message", s[:200])))

	return data