Spaces:

build-small-hackathon
/

daimon

Running

App Files Files Community

daimon / engine /memory.py

davidquicast

chore: initial commit

f0347b4 1 day ago

raw

history blame contribute delete

8.97 kB

	"""Step 6 of the living loop: curated memory (F2, v4).

	Durable, consolidated knowledge - NOT a transcript. The raw chat transcript
	itself is owned entirely by `gr.Chatbot`'s session history (passed into
	`engine.loop.build_messages()` for multi-turn coherence); this module never
	stores a copy of it. Since Daimon runs 100% on a local model, the extra
	curation call is free, so both files are rewritten by `curate_memory()`
	after every turn:

	- `memory.md` - cross-session long-term memory: `## User profile`,
	`## Stable preferences and behavioral patterns`,
	`## Notable interactions`.
	- `memory/<date>.md` - this session's consolidated summary: YAML
	frontmatter (`date`, `session_id`) + `## episodic`,
	`## user_preferences`, `## procedural`, `## autobiographical`.
	"""

	from __future__ import annotations

	import re
	import sys
	from datetime import datetime, timezone
	from pathlib import Path

	REPO_ROOT = Path(__file__).resolve().parent.parent
	if str(REPO_ROOT) not in sys.path:
	sys.path.insert(0, str(REPO_ROOT))

	from engine.spec_bridge import PERSONAS_DIR # noqa: E402

	# Guards against a small model echoing the prompt/turn back as "content":
	# if any of these show up in the output, treat it as a malformed reply and
	# leave the memory file untouched rather than corrupt it.
	_BAD_MARKERS = ("new turn:", "current sections:", "your reply:", "user:", "daimon:")

	# Both curation prompts ask the model for ONLY the bullet sections (not the
	# header/frontmatter, which are deterministic and applied by Python below) -
	# a 1B model is unreliable at reproducing boilerplate verbatim, so we never
	# ask it to.
	_LONG_TERM_SECTIONS = ("User profile", "Stable preferences and behavioral patterns", "Notable interactions")
	_EPISODIC_SECTIONS = ("episodic", "user_preferences", "procedural", "autobiographical")

	_LONG_TERM_SYSTEM_PROMPT = (
	"You maintain Daimon's long-term memory: durable, cross-session "
	"knowledge about the USER and this relationship - NOT a transcript.\n\n"
	"Output ONLY these 3 sections, each a bullet list of at most 4 bullets, "
	"each under 15 words:\n\n"
	"## User profile\n- ...\n\n"
	"## Stable preferences and behavioral patterns\n- ...\n\n"
	"## Notable interactions\n- ...\n\n"
	"You will see the CURRENT sections and ONE new turn. If the turn reveals "
	"a new durable fact (about the user, their preferences, or a notable "
	"refusal/boundary moment), output the updated sections (same 3, in "
	"order, each trimmed to at most 4 bullets - drop the oldest/least "
	"useful first). If nothing durable changed, reply with exactly: "
	"NO_CHANGE\n\n"
	"Example reply:\n"
	"## User profile\n- User is named Ana, a veterinarian.\n\n"
	"## Stable preferences and behavioral patterns\n- Prefers short, direct answers.\n\n"
	"## Notable interactions\n- (none yet)"
	)

	_EPISODIC_SYSTEM_PROMPT = (
	"You maintain Daimon's consolidated session summary for today - a "
	"narrative summary of THIS conversation so far, NOT a transcript.\n\n"
	"Output ONLY these 4 sections, each a bullet list of at most 5 bullets, "
	"each under 20 words:\n\n"
	"## episodic\n- what happened this session (events, topics, outcomes)\n\n"
	"## user_preferences\n- preferences the user expressed this session\n\n"
	"## procedural\n- how Daimon should act/respond going forward, learned this session\n\n"
	"## autobiographical\n- what Daimon itself did/decided/felt this session\n\n"
	"You will see the CURRENT sections and ONE new turn. Output the updated "
	"sections (same 4, in order, each trimmed to at most 5 bullets - drop "
	"the oldest/least useful first). If the turn adds nothing to any "
	"section, reply with exactly: NO_CHANGE"
	)

	_FENCE_RE = re.compile(r"^```\w\s$", re.MULTILINE)

	# A small model occasionally echoes a section header back as if it were a
	# bullet (e.g. "- User profile" inside "## Notable interactions") - drop
	# bullets that are just one of our own header names.
	_KNOWN_HEADERS = {h.lower() for h in _LONG_TERM_SECTIONS + _EPISODIC_SECTIONS}


	def _extract_section_bullets(text: str, header: str, limit: int) -> list[str]:
	"""Return up to `limit` '- ' bullet lines found under `## {header}` in
	`text` (case-sensitive header match, stops at the next `## ` or EOF)."""
	pattern = re.compile(rf"^## {re.escape(header)}\s\n(.?)(?=\n## \|\Z)", re.DOTALL \| re.MULTILINE)
	m = pattern.search(text)
	if not m:
	return []
	bullets = [ln.strip() for ln in m.group(1).splitlines() if ln.strip().startswith("- ")]
	bullets = [b for b in bullets if b.lower() not in ("- (none yet)", "- ...")]
	bullets = [b for b in bullets if b[2:].strip().lower() not in _KNOWN_HEADERS]
	return bullets[:limit]


	def _memory_dir(slug: str) -> Path:
	path = PERSONAS_DIR / slug / "memory"
	path.mkdir(parents=True, exist_ok=True)
	return path


	def _memory_md_path(slug: str) -> Path:
	return PERSONAS_DIR / slug / "memory.md"


	def _today() -> str:
	return datetime.now(timezone.utc).strftime("%Y-%m-%d")


	def _episodic_path(slug: str) -> Path:
	return _memory_dir(slug) / f"{_today()}.md"


	def _rebuild(sections: tuple[str, ...], preamble: str, current: str, model_out: str, limit: int) -> tuple[str, bool]:
	"""Deterministically reassemble a curated memory file from `preamble`
	(header/frontmatter, never written by the model) plus, for each
	section, whichever bullet list is non-empty between the model's
	proposal and the current file (the model's proposal wins; if it left a
	section out entirely, the old bullets for that section are kept)."""
	changed = False
	lines = [preamble.rstrip(), ""]
	for header in sections:
	old = _extract_section_bullets(current, header, limit)
	new = _extract_section_bullets(model_out, header, limit)
	bullets = new or old
	if bullets != old:
	changed = True
	lines.append(f"## {header}")
	lines.extend(bullets if bullets else ["- (none yet)"])
	lines.append("")
	return "\n".join(lines).rstrip() + "\n", changed


	def _curate_file(
	path: Path,
	*,
	system_prompt: str,
	sections: tuple[str, ...],
	limit: int,
	preamble: str,
	user_message: str,
	reply: str,
	max_tokens: int,
	) -> bool:
	"""Show the model the CURRENT bullet sections of `path` plus one new
	turn, and let it propose updated sections (not the whole file - the
	header/frontmatter is reapplied deterministically by `_rebuild`).
	Returns True if `path` was rewritten. Best-effort: any model/parsing
	failure or no-op proposal leaves `path` untouched."""
	from model.client import chat # local import: keep memory.py importable without a model server

	current = path.read_text(encoding="utf-8") if path.exists() else ""
	current_sections = "\n\n".join(
	f"## {header}\n" + "\n".join(_extract_section_bullets(current, header, limit) or ["- (none yet)"])
	for header in sections
	)

	messages = [
	{"role": "system", "content": system_prompt},
	{
	"role": "user",
	"content": (
	f"Current sections:\n{current_sections}\n\n"
	f"New turn:\nUser: {user_message}\nDaimon: {reply}\n\n"
	"Your reply:"
	),
	},
	]
	try:
	out = chat(messages, modality="text", max_tokens=max_tokens, temperature=0.1, enable_thinking=False)
	except Exception:
	return False

	out = _FENCE_RE.sub("", (out or "")).strip()
	if not out or out.upper().startswith("NO_CHANGE"):
	return False
	if any(marker in out.lower() for marker in _BAD_MARKERS):
	return False # model echoed the prompt back - don't corrupt the file

	new_text, changed = _rebuild(sections, preamble, current, out, limit)
	if not changed:
	return False
	path.write_text(new_text, encoding="utf-8")
	return True


	def curate_memory(slug: str, user_message: str, reply: str) -> dict[str, bool]:
	"""Let the local model update both curated-memory files for the new
	turn: `memory.md` (cross-session) and `memory/<date>.md` (today's
	consolidated summary). Returns which files actually changed."""
	long_term_changed = _curate_file(
	_memory_md_path(slug),
	system_prompt=_LONG_TERM_SYSTEM_PROMPT,
	sections=_LONG_TERM_SECTIONS,
	limit=4,
	preamble="# Daimon - long-term memory",
	user_message=user_message,
	reply=reply,
	max_tokens=200,
	)
	episodic_changed = _curate_file(
	_episodic_path(slug),
	system_prompt=_EPISODIC_SYSTEM_PROMPT,
	sections=_EPISODIC_SECTIONS,
	limit=5,
	preamble=f"---\ndate: {_today()}\nsession_id: {slug}-{_today()}\n---",
	user_message=user_message,
	reply=reply,
	max_tokens=300,
	)
	return {"memory.md": long_term_changed, f"memory/{_today()}.md": episodic_changed}