From 236a16b33151406a837a41a6a69694e35529f9a3 Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Mon, 15 Jun 2026 23:52:35 +0000
Subject: [PATCH 01/51] feat: inspect the full prompt in the live log
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The "context built" event now carries the fully-rendered prompt (persona, gists,
recalled details, recent turns, the new message) plus a total char count. The
log panel renders it as a collapsed "view full prompt" block — clean by default,
one click to see exactly what hit the model.

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 lyra/chat.py               | 16 +++++++++++-----
 lyra/web/static/index.html |  6 +++++-
 lyra/web/static/style.css  | 22 ++++++++++++++++++++++
 3 files changed, 38 insertions(+), 6 deletions(-)
diff --git a/lyra/chat.py b/lyra/chat.py
index 971bc7d..551d58f 100644
--- a/lyra/chat.py
+++ b/lyra/chat.py
@@ -30,6 +30,11 @@ def _detail_note(exchanges: list[memory.Exchange]) -> Message:
     return {"role": "system", "content": body}
 
 
+def _render(messages: list[Message]) -> str:
+    """Human-readable dump of the exact prompt, for the live-log inspector."""
+    return "\n\n".join(f"[{m['role']}]\n{m['content']}" for m in messages)
+
+
 def build_messages(session_id: str, user_msg: str) -> list[Message]:
     """Assemble the full, tiered message list for one turn."""
     messages: list[Message] = [{"role": "system", "content": persona.system_prompt()}]
@@ -51,16 +56,17 @@ def build_messages(session_id: str, user_msg: str) -> list[Message]:
     if recalled:
         messages.append(_detail_note(recalled))
 
-    logbus.log(
-        "debug", "context built",
-        recent=len(recent), summaries=len(summaries), details=len(recalled),
-    )
-
     # Tier 3: current session, full fidelity.
     for ex in recent:
         messages.append({"role": ex.role, "content": ex.content})
 
     messages.append({"role": "user", "content": user_msg})
+
+    logbus.log(
+        "debug", "context built",
+        recent=len(recent), summaries=len(summaries), details=len(recalled),
+        chars=sum(len(m["content"]) for m in messages), detail=_render(messages),
+    )
     return messages
 
 
diff --git a/lyra/web/static/index.html b/lyra/web/static/index.html
index 3cbb822..adb30a6 100644
--- a/lyra/web/static/index.html
+++ b/lyra/web/static/index.html
@@ -734,7 +734,10 @@
 
         const level = event.level || 'info';
         const time = new Date((event.ts || 0) * 1000).toLocaleTimeString();
-        const fields = event.fields || {};
+        const fields = Object.assign({}, event.fields || {});
+        // `detail` is rendered as an expandable block, not an inline field.
+        const detail = fields.detail;
+        delete fields.detail;
         const fieldStr = Object.keys(fields).length
           ? Object.entries(fields).map(([k, v]) => `${k}=${v}`).join('  ')
           : '';
@@ -746,6 +749,7 @@
           <span class="log-level log-level-${level}">${escapeHtml(level)}</span>
           <span class="log-msg">${escapeHtml(event.msg || '')}</span>
           ${fieldStr ? `<span class="log-fields">${escapeHtml(fieldStr)}</span>` : ''}
+          ${detail ? `<details class="log-detail"><summary>view full prompt</summary><pre>${escapeHtml(detail)}</pre></details>` : ''}
         `;
 
         thinkingContent.appendChild(eventDiv);
diff --git a/lyra/web/static/style.css b/lyra/web/static/style.css
index bdfbb46..a93bf8a 100644
--- a/lyra/web/static/style.css
+++ b/lyra/web/static/style.css
@@ -941,3 +941,25 @@ select:hover {
 .log-error .log-level, .log-error .log-msg { color: #fca5a5; }
 .log-system  { border-left-color: #00ff66; }
 .log-system .log-level { color: #00ff66; }
+
+.log-detail { width: 100%; margin-top: 4px; }
+.log-detail summary {
+  cursor: pointer;
+  color: var(--accent);
+  font-size: 0.72rem;
+  user-select: none;
+}
+.log-detail pre {
+  margin: 6px 0 0;
+  padding: 8px;
+  max-height: 340px;
+  overflow: auto;
+  background: rgba(0,0,0,0.25);
+  border-left: 2px solid var(--accent);
+  border-radius: 4px;
+  font-size: 0.72rem;
+  line-height: 1.4;
+  white-space: pre-wrap;
+  word-break: break-word;
+  color: var(--text);
+}
-- 
2.52.0


From f3037b78794d2a119149920535523fc08af18f9b Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Tue, 16 Jun 2026 00:51:45 +0000
Subject: [PATCH 02/51] feat: ChatGPT chat-log importer

Import the parser's {title, messages} JSON into Lyra's memory so past
conversations seed recall (and, later, the era-rollup tier).

- lyra/ingest.py: one conversation -> one session, text messages -> exchanges;
  skips non-text (image asset) messages and non user/assistant roles; embeddings
  batched; idempotent by filename-derived session id; `lyra-import <dir>` CLI
- memory.add_exchanges_bulk: batched insert of pre-embedded rows

Format has no timestamps yet, so imports are stamped at import time; a future
dated export will let era memory group by real calendar time.

Verified on the 68-file lyra dev set: 7519 exchanges, idempotent re-run, recall
returns relevant history.

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 lyra/ingest.py | 93 ++++++++++++++++++++++++++++++++++++++++++++++++++
 lyra/memory.py | 16 +++++++++
 pyproject.toml |  1 +
 3 files changed, 110 insertions(+)
 create mode 100644 lyra/ingest.py

diff --git a/lyra/ingest.py b/lyra/ingest.py
new file mode 100644
index 0000000..7f6ea5b
--- /dev/null
+++ b/lyra/ingest.py
@@ -0,0 +1,93 @@
+"""Import parsed ChatGPT chat logs into Lyra's memory.
+
+Consumes the parser's `{"title": ..., "messages": [{"role", "content"}]}` format
+(one JSON file per conversation). Each conversation becomes a Lyra session; each
+text message becomes an exchange. Embeddings are batched. Import is idempotent —
+a conversation already present (by session id) is skipped.
+
+Timestamps: this format carries no dates, so imported exchanges are stamped with
+`created_at` (default: now). A future timestamped export will let era memory group
+by real calendar time; pass real per-message dates then.
+"""
+from __future__ import annotations
+
+import json
+import sys
+from datetime import datetime, timezone
+from pathlib import Path
+
+from lyra import llm, logbus, memory
+
+EMBED_BATCH = 64
+EMBED_CHAR_CAP = 6000  # cap embed input size; full content is still stored
+
+
+def _session_id(path: Path) -> str:
+    """Stable id derived from the filename, so re-imports don't duplicate."""
+    return "import-" + path.stem
+
+
+def _clean_messages(messages: list[dict]) -> list[tuple[str, str]]:
+    out: list[tuple[str, str]] = []
+    for m in messages:
+        role = m.get("role")
+        if role not in ("user", "assistant"):
+            continue
+        content = (m.get("content") or "").strip()
+        if not content or content.startswith('{"content_type"'):  # skip empty / image assets
+            continue
+        out.append((role, content))
+    return out
+
+
+def import_file(path: Path, created_at: str) -> int:
+    """Import one conversation file. Returns exchanges added (0 if skipped/empty)."""
+    data = json.loads(path.read_text(encoding="utf-8"))
+    session_id = _session_id(path)
+    if memory.history(session_id):  # already imported
+        return 0
+
+    msgs = _clean_messages(data.get("messages", []))
+    if not msgs:
+        return 0
+
+    memory.ensure_session(session_id, name=data.get("title") or path.stem)
+
+    rows: list[tuple[str, str, list[float], str]] = []
+    for i in range(0, len(msgs), EMBED_BATCH):
+        batch = msgs[i : i + EMBED_BATCH]
+        embeddings = llm.embed([content[:EMBED_CHAR_CAP] for _, content in batch])
+        for (role, content), emb in zip(batch, embeddings):
+            rows.append((role, content, emb, created_at))
+
+    return memory.add_exchanges_bulk(session_id, rows)
+
+
+def import_dir(dirpath: str | Path, created_at: str | None = None) -> dict:
+    """Import every *.json under dirpath (recursively). Returns a small report."""
+    created_at = created_at or datetime.now(timezone.utc).isoformat()
+    files = sorted(Path(dirpath).rglob("*.json"))
+    sessions, exchanges = 0, 0
+    for path in files:
+        added = import_file(path, created_at)
+        if added:
+            sessions += 1
+            exchanges += added
+    logbus.log(
+        "info", "import complete", dir=str(dirpath),
+        files=len(files), sessions=sessions, exchanges=exchanges,
+    )
+    return {"files": len(files), "sessions_imported": sessions, "exchanges": exchanges}
+
+
+def main() -> int:
+    if len(sys.argv) < 2:
+        print("usage: lyra-import <dir-of-chat-json>", file=sys.stderr)
+        return 2
+    report = import_dir(sys.argv[1])
+    print(report)
+    return 0
+
+
+if __name__ == "__main__":
+    raise SystemExit(main())
diff --git a/lyra/memory.py b/lyra/memory.py
index 6119bdd..6001da4 100644
--- a/lyra/memory.py
+++ b/lyra/memory.py
@@ -108,6 +108,22 @@ def remember(session_id: str, role: str, content: str) -> int:
     return int(cur.lastrowid)
 
 
+def add_exchanges_bulk(session_id: str, rows: list[tuple[str, str, list[float], str]]) -> int:
+    """Insert many pre-embedded exchanges at once.
+
+    Each row is (role, content, embedding, created_at). Used by the importer to
+    avoid one INSERT (and one embed round-trip) per message. Returns row count.
+    """
+    conn = _connection()
+    with conn:
+        conn.executemany(
+            "INSERT INTO exchanges (session_id, role, content, embedding, created_at) "
+            "VALUES (?, ?, ?, ?, ?)",
+            [(session_id, role, content, _to_blob(emb), ca) for role, content, emb, ca in rows],
+        )
+    return len(rows)
+
+
 def recent(session_id: str, n: int = 10) -> list[Exchange]:
     """Last `n` exchanges from a session, oldest first."""
     conn = _connection()
diff --git a/pyproject.toml b/pyproject.toml
index f035399..d333bfa 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -16,6 +16,7 @@ dependencies = [
 [project.scripts]
 lyra = "lyra.__main__:main"
 lyra-web = "lyra.web.server:serve"
+lyra-import = "lyra.ingest:main"
 
 [dependency-groups]
 dev = [
-- 
2.52.0


From 938305f17dd9f2a1f938ff27137215b7eb8ef0ca Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Tue, 16 Jun 2026 02:36:54 +0000
Subject: [PATCH 03/51] chore: update gitignore for export data

---
 .gitignore | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/.gitignore b/.gitignore
index 5c96f54..858bb37 100644
--- a/.gitignore
+++ b/.gitignore
@@ -34,4 +34,5 @@ data/
 *.log
 
 #lyra Stuff
-/core/relay/sessions/
\ No newline at end of file
+/core/relay/sessions/
+/chat-gpt-export/
\ No newline at end of file
-- 
2.52.0


From 194e3e64b9244da79171e011cd4b43bff6d0c327 Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Tue, 16 Jun 2026 02:40:32 +0000
Subject: [PATCH 04/51] feat: import raw ChatGPT export (new sharded format)

OpenAI's export changed: conversations.json is now sharded into
conversations-000.json..NNN.json, each a JSON array of conversations with the
mapping tree and per-message create_time.

ingest now reads that format directly (supersedes the old convert/trim/split
scripts): walks each conversation's mapping ordered by create_time, keeps text
and multimodal_text (drops thoughts/reasoning_recap), captures real per-message
timestamps, and imports idempotently by conversation_id. `lyra-import <dir>`
auto-detects raw-export vs legacy {title,messages} dirs; optional limit arg.

Verified on 15 conversations: real dates, correct ordering, recall returns
dated poker history.

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 lyra/ingest.py | 95 ++++++++++++++++++++++++++++++++++++++++++++++++--
 1 file changed, 93 insertions(+), 2 deletions(-)

diff --git a/lyra/ingest.py b/lyra/ingest.py
index 7f6ea5b..ef027df 100644
--- a/lyra/ingest.py
+++ b/lyra/ingest.py
@@ -21,6 +21,10 @@ from lyra import llm, logbus, memory
 EMBED_BATCH = 64
 EMBED_CHAR_CAP = 6000  # cap embed input size; full content is still stored
 
+# Message content types worth keeping from a raw ChatGPT export. We drop
+# 'thoughts' (internal chain-of-thought) and 'reasoning_recap' (meta).
+KEEP_CONTENT_TYPES = {"text", "multimodal_text"}
+
 
 def _session_id(path: Path) -> str:
     """Stable id derived from the filename, so re-imports don't duplicate."""
@@ -80,11 +84,98 @@ def import_dir(dirpath: str | Path, created_at: str | None = None) -> dict:
     return {"files": len(files), "sessions_imported": sessions, "exchanges": exchanges}
 
 
+# --- Raw ChatGPT export (sharded conversations-*.json with timestamps) ---
+
+
+def _ts_to_iso(ts: float | None, fallback: str) -> str:
+    if not ts:
+        return fallback
+    return datetime.fromtimestamp(ts, tz=timezone.utc).isoformat()
+
+
+def _message_text(msg: dict) -> str | None:
+    """Extract plain text from a ChatGPT message node, or None to skip it."""
+    content = msg.get("content") or {}
+    if content.get("content_type") not in KEEP_CONTENT_TYPES:
+        return None
+    parts = [p for p in (content.get("parts") or []) if isinstance(p, str) and p.strip()]
+    text = "\n".join(parts).strip()
+    return text or None
+
+
+def _convo_rows(convo: dict) -> list[tuple[float, str, str]]:
+    """(create_time, role, text) for each keepable message, chronologically."""
+    rows: list[tuple[float, str, str]] = []
+    conv_ct = convo.get("create_time") or 0
+    for node in convo.get("mapping", {}).values():
+        msg = node.get("message")
+        if not msg:
+            continue
+        role = (msg.get("author") or {}).get("role")
+        if role not in ("user", "assistant"):
+            continue
+        text = _message_text(msg)
+        if text is None:
+            continue
+        rows.append((msg.get("create_time") or conv_ct, role, text))
+    rows.sort(key=lambda r: r[0] or 0)
+    return rows
+
+
+def import_conversation(convo: dict) -> int:
+    """Import one raw-export conversation. Idempotent by conversation_id."""
+    session_id = convo.get("conversation_id") or convo.get("id")
+    if not session_id or memory.history(session_id):
+        return 0
+    rows = _convo_rows(convo)
+    if not rows:
+        return 0
+
+    memory.ensure_session(session_id, name=convo.get("title") or "untitled")
+    fallback = datetime.now(timezone.utc).isoformat()
+    exchanges: list[tuple[str, str, list[float], str]] = []
+    for i in range(0, len(rows), EMBED_BATCH):
+        batch = rows[i : i + EMBED_BATCH]
+        embeddings = llm.embed([text[:EMBED_CHAR_CAP] for _, _, text in batch])
+        for (ts, role, text), emb in zip(batch, embeddings):
+            exchanges.append((role, text, emb, _ts_to_iso(ts, fallback)))
+    return memory.add_exchanges_bulk(session_id, exchanges)
+
+
+def import_export(export_dir: str | Path, limit: int | None = None) -> dict:
+    """Import a raw ChatGPT export directory (sharded conversations-*.json)."""
+    shards = sorted(Path(export_dir).glob("conversations-*.json"))
+    convos, exchanges, seen = 0, 0, 0
+    for shard in shards:
+        for convo in json.loads(shard.read_text(encoding="utf-8")):
+            if limit is not None and seen >= limit:
+                break
+            seen += 1
+            added = import_conversation(convo)
+            if added:
+                convos += 1
+                exchanges += added
+        if limit is not None and seen >= limit:
+            break
+    logbus.log(
+        "info", "export import complete",
+        shards=len(shards), conversations=convos, exchanges=exchanges,
+    )
+    return {"shards": len(shards), "conversations_imported": convos, "exchanges": exchanges}
+
+
 def main() -> int:
     if len(sys.argv) < 2:
-        print("usage: lyra-import <dir-of-chat-json>", file=sys.stderr)
+        print("usage: lyra-import <dir> [limit]", file=sys.stderr)
         return 2
-    report = import_dir(sys.argv[1])
+    path = Path(sys.argv[1])
+    limit = int(sys.argv[2]) if len(sys.argv) > 2 else None
+    # A raw ChatGPT export has sharded conversations-*.json; otherwise treat the
+    # directory as legacy {title, messages} files.
+    if list(path.glob("conversations-*.json")):
+        report = import_export(path, limit=limit)
+    else:
+        report = import_dir(path)
     print(report)
     return 0
 
-- 
2.52.0


From 071522ea330d578d5f599c0bee1d60e246bea917 Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Tue, 16 Jun 2026 04:08:41 +0000
Subject: [PATCH 05/51] feat: summarize-all batch (consolidation step 1)

Harden summarize_session to chunk + merge long sessions (imported convos can
exceed the local model's context), and add summarize_all: idempotent, resumable
batch that summarizes every session needing it (skips up-to-date ones), with
progress logged to the live log. `lyra-summarize [limit]` CLI.

This is the first consolidation stage feeding the profile (semantic memory) and
era-rollup tiers.

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 lyra/summary.py | 94 +++++++++++++++++++++++++++++++++++++++----------
 pyproject.toml  |  1 +
 2 files changed, 76 insertions(+), 19 deletions(-)

diff --git a/lyra/summary.py b/lyra/summary.py
index 3b032d9..1844444 100644
--- a/lyra/summary.py
+++ b/lyra/summary.py
@@ -1,17 +1,23 @@
 """Session summarization: compact a session's raw exchanges into a stored gist.
 
-This is the compaction half of the tiered memory. Raw exchanges stay for detail
-recall; the summary is what surfaces when an *older* session is recalled later —
-"a month ago is a general idea," per the design.
+This is the first consolidation stage. Raw exchanges stay for detail recall; the
+summary is what surfaces when an *older* session is recalled, and it's the input
+to the profile (semantic memory) and era-rollup tiers.
+
+Long sessions are summarized in chunks, then the partial gists are merged, so a
+big imported conversation doesn't blow the local model's context window.
 """
 from __future__ import annotations
 
-from lyra import config, llm, logbus, memory
-from lyra.llm import Backend
+import sys
 
-# Re-summarize a session once it has accumulated this many new raw exchanges
-# beyond what its current summary covers.
+from lyra import config, llm, logbus, memory
+from lyra.llm import Backend, Message
+
+# Re-summarize a session once it has accumulated this many new raw exchanges.
 SUMMARIZE_AFTER = 20
+# Transcript budget per LLM call; longer sessions are chunked + merged.
+MAX_TRANSCRIPT_CHARS = 24000
 
 _PROMPT = """You are compacting a conversation into a long-term memory record \
 (not replying to anyone). Write a concise gist of the session below: what was \
@@ -24,25 +30,43 @@ def _transcript(exchanges: list[memory.Exchange]) -> str:
     return "\n".join(f"{ex.role}: {ex.content}" for ex in exchanges)
 
 
-def summarize_session(session_id: str, backend: Backend | None = None) -> str | None:
-    """(Re)generate and store the gist for a session. Returns the summary text.
+def _chunk(text: str, budget: int) -> list[str]:
+    """Split on line boundaries into pieces under `budget` chars."""
+    chunks, buf, size = [], [], 0
+    for line in text.splitlines(keepends=True):
+        if size + len(line) > budget and buf:
+            chunks.append("".join(buf))
+            buf, size = [], 0
+        buf.append(line)
+        size += len(line)
+    if buf:
+        chunks.append("".join(buf))
+    return chunks
 
-    Returns None if the session has no exchanges. The summarizer defaults to the
-    local backend so routine compaction stays free.
-    """
+
+def _summarize_text(text: str, backend: Backend) -> str:
+    messages: list[Message] = [
+        {"role": "system", "content": _PROMPT},
+        {"role": "user", "content": text},
+    ]
+    return llm.complete(messages, backend=backend)
+
+
+def summarize_session(session_id: str, backend: Backend | None = None) -> str | None:
+    """(Re)generate and store the gist for a session. Returns the summary text."""
     exchanges = memory.history(session_id)
     if not exchanges:
         return None
 
     backend = backend or config.load().summary_backend
-    messages = [
-        {"role": "system", "content": _PROMPT},
-        {"role": "user", "content": _transcript(exchanges)},
-    ]
-    gist = llm.complete(messages, backend=backend)
+    transcript = _transcript(exchanges)
+    if len(transcript) <= MAX_TRANSCRIPT_CHARS:
+        gist = _summarize_text(transcript, backend)
+    else:
+        partials = [_summarize_text(c, backend) for c in _chunk(transcript, MAX_TRANSCRIPT_CHARS)]
+        gist = _summarize_text("Partial summaries to merge:\n\n" + "\n\n".join(partials), backend)
 
-    last_id = exchanges[-1].id
-    memory.store_summary(session_id, gist, last_id)
+    memory.store_summary(session_id, gist, exchanges[-1].id)
     logbus.log(
         "info", "summarized session", session=session_id,
         exchanges=len(exchanges), backend=backend,
@@ -54,3 +78,35 @@ def maybe_summarize(session_id: str, backend: Backend | None = None) -> None:
     """Summarize the session if enough new turns have accumulated since last time."""
     if memory.unsummarized_count(session_id) >= SUMMARIZE_AFTER:
         summarize_session(session_id, backend=backend)
+
+
+def summarize_all(backend: Backend | None = None, limit: int | None = None) -> dict:
+    """Summarize every session that needs it. Idempotent and resumable: sessions
+    with an up-to-date summary are skipped, so re-running continues where it left off.
+    """
+    sessions = memory.list_sessions()
+    done, skipped = 0, 0
+    for s in sessions:
+        sid = s["id"]
+        if memory.get_summary(sid) and memory.unsummarized_count(sid) == 0:
+            skipped += 1
+            continue
+        summarize_session(sid, backend=backend)
+        done += 1
+        if done % 25 == 0:
+            logbus.log("info", "summarize-all progress", summarized=done, skipped=skipped)
+        if limit is not None and done >= limit:
+            break
+    report = {"summarized": done, "skipped": skipped, "total": len(sessions)}
+    logbus.log("info", "summarize-all complete", **report)
+    return report
+
+
+def main() -> int:
+    limit = int(sys.argv[1]) if len(sys.argv) > 1 else None
+    print(summarize_all(limit=limit))
+    return 0
+
+
+if __name__ == "__main__":
+    raise SystemExit(main())
diff --git a/pyproject.toml b/pyproject.toml
index d333bfa..eeff535 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -17,6 +17,7 @@ dependencies = [
 lyra = "lyra.__main__:main"
 lyra-web = "lyra.web.server:serve"
 lyra-import = "lyra.ingest:main"
+lyra-summarize = "lyra.summary:main"
 
 [dependency-groups]
 dev = [
-- 
2.52.0


From ecf0b852f9a25dbe7413513ce420e1e1b56931bb Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Tue, 16 Jun 2026 04:11:19 +0000
Subject: [PATCH 06/51] =?UTF-8?q?feat:=20profile=20layer=20=E2=80=94=20sem?=
 =?UTF-8?q?antic=20memory=20(consolidation=20step=202)?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Derive a standing profile of the user from session gists and inject it into
every prompt, so identity/abstract questions ("what kind of player am I",
"what are my leaks") are answered from distilled knowledge instead of noisy
single-vector recall (which finds passages, not patterns).

- memory: profile table + get/set_profile, list_summaries
- lyra/profile.py: rebuild_profile map-reduces all gists (batch -> extract
  durable facts -> fold-merge) into one profile doc; `lyra-profile` CLI
- chat.build_messages injects "What you know about Brian" after the persona

Run after lyra-summarize (needs gists). Verified (stubbed): map-reduce, storage,
and prompt injection.

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 lyra/chat.py    |  8 +++++
 lyra/memory.py  | 47 +++++++++++++++++++++++++++
 lyra/profile.py | 84 +++++++++++++++++++++++++++++++++++++++++++++++++
 pyproject.toml  |  1 +
 4 files changed, 140 insertions(+)
 create mode 100644 lyra/profile.py

diff --git a/lyra/chat.py b/lyra/chat.py
index 551d58f..d4da349 100644
--- a/lyra/chat.py
+++ b/lyra/chat.py
@@ -39,6 +39,14 @@ def build_messages(session_id: str, user_msg: str) -> list[Message]:
     """Assemble the full, tiered message list for one turn."""
     messages: list[Message] = [{"role": "system", "content": persona.system_prompt()}]
 
+    # Semantic memory: the distilled profile (who Brian is) — answers identity
+    # questions that raw recall can't. Always in context when it exists.
+    profile = memory.get_profile()
+    if profile:
+        messages.append(
+            {"role": "system", "content": "What you know about Brian:\n" + profile}
+        )
+
     recent = memory.recent(session_id, n=RECENT_N)
     recent_ids = {ex.id for ex in recent}
 
diff --git a/lyra/memory.py b/lyra/memory.py
index 6001da4..827295a 100644
--- a/lyra/memory.py
+++ b/lyra/memory.py
@@ -43,6 +43,15 @@ CREATE TABLE IF NOT EXISTS summaries (
     last_exchange_id INTEGER NOT NULL,
     created_at TEXT NOT NULL
 );
+
+-- Derived semantic memory: standing facts about the user, distilled from the
+-- session gists by the consolidation pass. Single row (id='self').
+CREATE TABLE IF NOT EXISTS profile (
+    id TEXT PRIMARY KEY,
+    content TEXT NOT NULL,
+    sessions_covered INTEGER NOT NULL,
+    updated_at TEXT NOT NULL
+);
 """
 
 _conn: sqlite3.Connection | None = None
@@ -290,6 +299,44 @@ def unsummarized_count(session_id: str) -> int:
     return int(r["n"])
 
 
+def list_summaries() -> list[Summary]:
+    """Every session gist (for the profile/era consolidation passes)."""
+    conn = _connection()
+    rows = conn.execute(
+        "SELECT session_id, content, last_exchange_id, created_at FROM summaries "
+        "ORDER BY created_at ASC"
+    ).fetchall()
+    return [
+        Summary(
+            session_id=r["session_id"],
+            content=r["content"],
+            last_exchange_id=r["last_exchange_id"],
+            created_at=r["created_at"],
+        )
+        for r in rows
+    ]
+
+
+def set_profile(content: str, sessions_covered: int, profile_id: str = "self") -> None:
+    """Store/replace the derived semantic profile."""
+    now = datetime.now(timezone.utc).isoformat()
+    conn = _connection()
+    with conn:
+        conn.execute(
+            "INSERT INTO profile (id, content, sessions_covered, updated_at) "
+            "VALUES (?, ?, ?, ?) "
+            "ON CONFLICT(id) DO UPDATE SET content=excluded.content, "
+            "sessions_covered=excluded.sessions_covered, updated_at=excluded.updated_at",
+            (profile_id, content, sessions_covered, now),
+        )
+
+
+def get_profile(profile_id: str = "self") -> str | None:
+    conn = _connection()
+    r = conn.execute("SELECT content FROM profile WHERE id = ?", (profile_id,)).fetchone()
+    return r["content"] if r else None
+
+
 def recall_summaries(query: str, k: int = 3, exclude_session: str | None = None) -> list[Summary]:
     """Top-k session summaries most similar to `query` (the long-term gist tier)."""
     [q_vec] = llm.embed([query])
diff --git a/lyra/profile.py b/lyra/profile.py
new file mode 100644
index 0000000..3929f8e
--- /dev/null
+++ b/lyra/profile.py
@@ -0,0 +1,84 @@
+"""Profile derivation: distill standing facts about the user (semantic memory).
+
+This is consolidation step 2. It reads every session gist and map-reduces them
+into one profile document — who Brian is as a player and person — which is then
+injected into every prompt. This is what answers identity/abstract questions
+("what kind of player am I", "what are my leaks") that raw recall handles badly,
+because those are patterns across many sessions, not facts in any single message.
+"""
+from __future__ import annotations
+
+
+from lyra import config, llm, logbus, memory
+from lyra.llm import Backend, Message
+
+BATCH_CHARS = 18000
+
+_MAP_PROMPT = """From these session summaries, extract durable facts about Brian \
+— things that are stably true, not one-off events. Cover, where present: poker \
+games/formats/stakes he plays, his playing style and strengths, recurring leaks \
+and tendencies, mental-game patterns (tilt triggers, scared money, fatigue), \
+relevant personal context, and how he likes to be coached. Terse bullet points. \
+Omit anything not supported by the summaries."""
+
+_REDUCE_PROMPT = """Merge these fact lists into one deduplicated profile of Brian. \
+Organize under these headings: Poker Style, Leaks & Tendencies, Mental Game, \
+Personal Context, Working With Brian. Keep it tight — bullets, no fluff, no \
+repetition. Resolve contradictions toward the more recent/frequent signal."""
+
+
+def _batch_texts(texts: list[str], budget: int) -> list[str]:
+    """Group texts into joined blocks under `budget` chars."""
+    blocks, buf, size = [], [], 0
+    for t in texts:
+        if size + len(t) > budget and buf:
+            blocks.append("\n\n".join(buf))
+            buf, size = [], 0
+        buf.append(t)
+        size += len(t)
+    if buf:
+        blocks.append("\n\n".join(buf))
+    return blocks
+
+
+def _call(prompt: str, body: str, backend: Backend) -> str:
+    messages: list[Message] = [
+        {"role": "system", "content": prompt},
+        {"role": "user", "content": body},
+    ]
+    return llm.complete(messages, backend=backend)
+
+
+def rebuild_profile(backend: Backend | None = None) -> str | None:
+    """Re-derive the profile from all current session gists and store it."""
+    backend = backend or config.load().summary_backend
+    summaries = memory.list_summaries()
+    if not summaries:
+        return None
+
+    # MAP: extract facts from batches of gists.
+    blocks = _batch_texts([s.content for s in summaries], BATCH_CHARS)
+    partials = [_call(_MAP_PROMPT, b, backend) for b in blocks]
+    logbus.log("info", "profile map done", batches=len(partials), sessions=len(summaries))
+
+    # REDUCE: fold partials together until one remains.
+    while len(partials) > 1:
+        partials = [_call(_REDUCE_PROMPT, g, backend) for g in _batch_texts(partials, BATCH_CHARS)]
+    profile = partials[0]
+
+    memory.set_profile(profile, len(summaries))
+    logbus.log("info", "profile rebuilt", sessions=len(summaries), chars=len(profile))
+    return profile
+
+
+def main() -> int:
+    profile = rebuild_profile()
+    if profile is None:
+        print("No summaries yet — run lyra-summarize first.")
+        return 1
+    print(profile)
+    return 0
+
+
+if __name__ == "__main__":
+    raise SystemExit(main())
diff --git a/pyproject.toml b/pyproject.toml
index eeff535..221e029 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -18,6 +18,7 @@ lyra = "lyra.__main__:main"
 lyra-web = "lyra.web.server:serve"
 lyra-import = "lyra.ingest:main"
 lyra-summarize = "lyra.summary:main"
+lyra-profile = "lyra.profile:main"
 
 [dependency-groups]
 dev = [
-- 
2.52.0


From 30185f3fd8b1eb49be1853f705ddfb00b5440550 Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Tue, 16 Jun 2026 05:37:22 +0000
Subject: [PATCH 07/51] feat: MI50 as a Lyra backend (OpenAI-compatible local
 GPU)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The MI50 box (CT202) runs an OpenAI-compatible llama.cpp server on
10.0.0.44:8080. Wire it in as a third backend:

- llm.complete gains backend="mi50" (OpenAI client pointed at MI50_BASE_URL)
- config: MI50_BASE_URL (default http://10.0.0.44:8080/v1) + MI50_MODEL
- chat.respond labels the model per backend; web _backend_for maps "mi50"
- UI backend selector adds "MI50 — local GPU"

Verified end-to-end: llm.complete(backend="mi50") returns from the live server.
See homelab-inference memory for the box topology.

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 .env.example               | 4 ++++
 lyra/chat.py               | 4 +++-
 lyra/config.py             | 4 ++++
 lyra/llm.py                | 8 +++++++-
 lyra/web/server.py         | 5 ++++-
 lyra/web/static/index.html | 5 +++++
 6 files changed, 27 insertions(+), 3 deletions(-)

diff --git a/.env.example b/.env.example
index ff584cc..82e07e9 100644
--- a/.env.example
+++ b/.env.example
@@ -2,6 +2,10 @@
 LOCAL_BASE_URL=http://localhost:11434
 LOCAL_MODEL=qwen2.5:7b-instruct
 
+# MI50 backend — OpenAI-compatible llama.cpp server on the home-lab GPU box.
+MI50_BASE_URL=http://10.0.0.44:8080/v1
+MI50_MODEL=local-gpu
+
 # Cloud backend (OpenAI) — higher quality, costs money.
 OPENAI_API_KEY=
 CLOUD_MODEL=gpt-4o-mini
diff --git a/lyra/chat.py b/lyra/chat.py
index d4da349..0211fe2 100644
--- a/lyra/chat.py
+++ b/lyra/chat.py
@@ -81,7 +81,9 @@ def build_messages(session_id: str, user_msg: str) -> list[Message]:
 def respond(session_id: str, user_msg: str, backend: Backend = "cloud") -> str:
     """Produce Lyra's reply to a single user message and persist the exchange."""
     cfg = config.load()
-    model = cfg.local_model if backend == "local" else cfg.cloud_model
+    model = {"local": cfg.local_model, "cloud": cfg.cloud_model, "mi50": cfg.mi50_model}.get(
+        backend, backend
+    )
     logbus.log(
         "info", "chat request", session=session_id, backend=backend,
         model=model, embed=cfg.embed_backend,
diff --git a/lyra/config.py b/lyra/config.py
index 3b9b633..8405ee3 100644
--- a/lyra/config.py
+++ b/lyra/config.py
@@ -14,6 +14,8 @@ load_dotenv()
 class Config:
     local_base_url: str
     local_model: str
+    mi50_base_url: str  # OpenAI-compatible llama.cpp server on the MI50 box
+    mi50_model: str
     openai_api_key: str
     cloud_model: str
     embed_backend: str  # "cloud" (OpenAI) or "local" (Ollama)
@@ -27,6 +29,8 @@ def load() -> Config:
     return Config(
         local_base_url=os.getenv("LOCAL_BASE_URL", "http://localhost:11434"),
         local_model=os.getenv("LOCAL_MODEL", "qwen2.5:7b-instruct"),
+        mi50_base_url=os.getenv("MI50_BASE_URL", "http://10.0.0.44:8080/v1"),
+        mi50_model=os.getenv("MI50_MODEL", "local-gpu"),
         openai_api_key=os.getenv("OPENAI_API_KEY", ""),
         cloud_model=os.getenv("CLOUD_MODEL", "gpt-4o-mini"),
         embed_backend=os.getenv("EMBED_BACKEND", "cloud").lower(),
diff --git a/lyra/llm.py b/lyra/llm.py
index 71e3fd0..471c6f9 100644
--- a/lyra/llm.py
+++ b/lyra/llm.py
@@ -14,7 +14,7 @@ class Message(TypedDict):
     content: str
 
 
-Backend = Literal["local", "cloud"]
+Backend = Literal["local", "cloud", "mi50"]
 
 
 def complete(messages: list[Message], backend: Backend = "local") -> str:
@@ -26,6 +26,12 @@ def complete(messages: list[Message], backend: Backend = "local") -> str:
         resp = client.chat.completions.create(model=cfg.cloud_model, messages=messages)
         return resp.choices[0].message.content or ""
 
+    if backend == "mi50":
+        # MI50 box runs an OpenAI-compatible llama.cpp server; key is unused.
+        client = OpenAI(api_key="not-needed", base_url=cfg.mi50_base_url)
+        resp = client.chat.completions.create(model=cfg.mi50_model, messages=messages)
+        return resp.choices[0].message.content or ""
+
     resp = httpx.post(
         f"{cfg.local_base_url}/api/chat",
         json={"model": cfg.local_model, "messages": messages, "stream": False},
diff --git a/lyra/web/server.py b/lyra/web/server.py
index 94a9d13..b684401 100644
--- a/lyra/web/server.py
+++ b/lyra/web/server.py
@@ -32,7 +32,10 @@ _CLOUD = {"OPENAI", "cloud", "custom"}
 
 
 def _backend_for(label: str | None) -> Backend:
-    if label and label.upper() in {"PRIMARY", "SECONDARY", "FALLBACK", "LOCAL"}:
+    key = (label or "").lower()
+    if key == "mi50":
+        return "mi50"
+    if key in {"local", "primary", "secondary", "fallback"}:
         return "local"
     return "cloud"
 
diff --git a/lyra/web/static/index.html b/lyra/web/static/index.html
index adb30a6..411c737 100644
--- a/lyra/web/static/index.html
+++ b/lyra/web/static/index.html
@@ -123,6 +123,11 @@
               <span>Local — Ollama</span>
               <small>Free, private, runs on your home lab (LOCAL_MODEL)</small>
             </label>
+            <label class="radio-label">
+              <input type="radio" name="backend" value="mi50">
+              <span>MI50 — local GPU</span>
+              <small>Free, llama.cpp on the MI50 box (MI50_BASE_URL)</small>
+            </label>
             <label class="radio-label">
               <input type="radio" name="backend" value="cloud">
               <span>Cloud — OpenAI</span>
-- 
2.52.0


From aae95bfa6c233598bcc164bf29d435a734eebeba Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Tue, 16 Jun 2026 05:52:15 +0000
Subject: [PATCH 08/51] fix: point MI50 backend at 10.0.0.42 (avoid
 terra-mechanics conflict)

CT202's old static 10.0.0.44 collided with the terra-mechanics dev VM (tmi-dev).
Reassigned CT202 to 10.0.0.42 and repointed MI50_BASE_URL accordingly.

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 .env.example   | 4 ++--
 lyra/config.py | 2 +-
 2 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/.env.example b/.env.example
index 82e07e9..74429d8 100644
--- a/.env.example
+++ b/.env.example
@@ -2,8 +2,8 @@
 LOCAL_BASE_URL=http://localhost:11434
 LOCAL_MODEL=qwen2.5:7b-instruct
 
-# MI50 backend — OpenAI-compatible llama.cpp server on the home-lab GPU box.
-MI50_BASE_URL=http://10.0.0.44:8080/v1
+# MI50 backend — OpenAI-compatible llama.cpp server on the home-lab GPU box (CT202).
+MI50_BASE_URL=http://10.0.0.42:8080/v1
 MI50_MODEL=local-gpu
 
 # Cloud backend (OpenAI) — higher quality, costs money.
diff --git a/lyra/config.py b/lyra/config.py
index 8405ee3..e07ca96 100644
--- a/lyra/config.py
+++ b/lyra/config.py
@@ -29,7 +29,7 @@ def load() -> Config:
     return Config(
         local_base_url=os.getenv("LOCAL_BASE_URL", "http://localhost:11434"),
         local_model=os.getenv("LOCAL_MODEL", "qwen2.5:7b-instruct"),
-        mi50_base_url=os.getenv("MI50_BASE_URL", "http://10.0.0.44:8080/v1"),
+        mi50_base_url=os.getenv("MI50_BASE_URL", "http://10.0.0.42:8080/v1"),
         mi50_model=os.getenv("MI50_MODEL", "local-gpu"),
         openai_api_key=os.getenv("OPENAI_API_KEY", ""),
         cloud_model=os.getenv("CLOUD_MODEL", "gpt-4o-mini"),
-- 
2.52.0


From 34392e40974d86147af55ad1abba4c84a6817570 Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Tue, 16 Jun 2026 06:31:28 +0000
Subject: [PATCH 09/51] fix: make summarize-all resilient to backend hiccups

The MI50 llama.cpp server OOM-killed (LXC RAM limit + 8GB prompt cache) mid-run,
and summarize_all had no error handling, so one APIConnectionError killed the
whole batch. Add retry-with-backoff around the summarization LLM call, and
try/except per session in summarize_all (log + skip; unsummarized sessions get
retried on the next run). (Server-side: CT202 RAM raised + prompt cache disabled.)

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 lyra/summary.py | 29 ++++++++++++++++++++++++-----
 1 file changed, 24 insertions(+), 5 deletions(-)

diff --git a/lyra/summary.py b/lyra/summary.py
index 1844444..46c3dfa 100644
--- a/lyra/summary.py
+++ b/lyra/summary.py
@@ -10,10 +10,13 @@ big imported conversation doesn't blow the local model's context window.
 from __future__ import annotations
 
 import sys
+import time
 
 from lyra import config, llm, logbus, memory
 from lyra.llm import Backend, Message
 
+_RETRIES = 4
+
 # Re-summarize a session once it has accumulated this many new raw exchanges.
 SUMMARIZE_AFTER = 20
 # Transcript budget per LLM call; longer sessions are chunked + merged.
@@ -49,7 +52,16 @@ def _summarize_text(text: str, backend: Backend) -> str:
         {"role": "system", "content": _PROMPT},
         {"role": "user", "content": text},
     ]
-    return llm.complete(messages, backend=backend)
+    # Retry transient backend errors (e.g. the GPU server restarting) with backoff.
+    for attempt in range(_RETRIES):
+        try:
+            return llm.complete(messages, backend=backend)
+        except Exception as exc:
+            if attempt == _RETRIES - 1:
+                raise
+            logbus.log("debug", "summary retry", attempt=attempt + 1, error=str(exc)[:80])
+            time.sleep(5 * (attempt + 1))
+    raise RuntimeError("unreachable")
 
 
 def summarize_session(session_id: str, backend: Backend | None = None) -> str | None:
@@ -85,19 +97,26 @@ def summarize_all(backend: Backend | None = None, limit: int | None = None) -> d
     with an up-to-date summary are skipped, so re-running continues where it left off.
     """
     sessions = memory.list_sessions()
-    done, skipped = 0, 0
+    done, skipped, failed = 0, 0, 0
     for s in sessions:
         sid = s["id"]
         if memory.get_summary(sid) and memory.unsummarized_count(sid) == 0:
             skipped += 1
             continue
-        summarize_session(sid, backend=backend)
+        try:
+            summarize_session(sid, backend=backend)
+        except Exception as exc:
+            # Don't let one bad session kill the batch; log and move on (it'll
+            # be retried on the next run, since it stays unsummarized).
+            failed += 1
+            logbus.log("error", "summarize failed", session=sid, error=str(exc)[:120])
+            continue
         done += 1
         if done % 25 == 0:
-            logbus.log("info", "summarize-all progress", summarized=done, skipped=skipped)
+            logbus.log("info", "summarize-all progress", summarized=done, skipped=skipped, failed=failed)
         if limit is not None and done >= limit:
             break
-    report = {"summarized": done, "skipped": skipped, "total": len(sessions)}
+    report = {"summarized": done, "skipped": skipped, "failed": failed, "total": len(sessions)}
     logbus.log("info", "summarize-all complete", **report)
     return report
 
-- 
2.52.0


From d7e2fce694bda6d8292d08fc31942fc33c9625ec Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Tue, 16 Jun 2026 16:30:07 +0000
Subject: [PATCH 10/51] perf: concurrent summarize-all (parallel LLM, serial
 DB)

Refactor summarize_all to run LLM summarization across a thread pool (default 8
workers) while keeping all SQLite reads/writes on the main thread (the single
connection is never shared across threads). Extract _summarize_transcript
(transcript -> gist, no DB) for the worker.

The MI50 proved far too slow for the large-transcript backfill (~29 summaries in
9h due to gfx906 prefill); on cloud gpt-4o-mini with concurrency this runs at
~30 summaries/minute (~17 min for the full backfill, ~$2). MI50 stays the chat
backend where small prompts make it snappy.

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 lyra/summary.py | 83 +++++++++++++++++++++++++++++++------------------
 1 file changed, 52 insertions(+), 31 deletions(-)

diff --git a/lyra/summary.py b/lyra/summary.py
index 46c3dfa..39506d8 100644
--- a/lyra/summary.py
+++ b/lyra/summary.py
@@ -11,6 +11,7 @@ from __future__ import annotations
 
 import sys
 import time
+from concurrent.futures import ThreadPoolExecutor, as_completed
 
 from lyra import config, llm, logbus, memory
 from lyra.llm import Backend, Message
@@ -64,25 +65,23 @@ def _summarize_text(text: str, backend: Backend) -> str:
     raise RuntimeError("unreachable")
 
 
+def _summarize_transcript(transcript: str, backend: Backend) -> str:
+    """Transcript -> gist (LLM only, no DB). Chunks + merges if oversized."""
+    if len(transcript) <= MAX_TRANSCRIPT_CHARS:
+        return _summarize_text(transcript, backend)
+    partials = [_summarize_text(c, backend) for c in _chunk(transcript, MAX_TRANSCRIPT_CHARS)]
+    return _summarize_text("Partial summaries to merge:\n\n" + "\n\n".join(partials), backend)
+
+
 def summarize_session(session_id: str, backend: Backend | None = None) -> str | None:
     """(Re)generate and store the gist for a session. Returns the summary text."""
     exchanges = memory.history(session_id)
     if not exchanges:
         return None
-
     backend = backend or config.load().summary_backend
-    transcript = _transcript(exchanges)
-    if len(transcript) <= MAX_TRANSCRIPT_CHARS:
-        gist = _summarize_text(transcript, backend)
-    else:
-        partials = [_summarize_text(c, backend) for c in _chunk(transcript, MAX_TRANSCRIPT_CHARS)]
-        gist = _summarize_text("Partial summaries to merge:\n\n" + "\n\n".join(partials), backend)
-
+    gist = _summarize_transcript(_transcript(exchanges), backend)
     memory.store_summary(session_id, gist, exchanges[-1].id)
-    logbus.log(
-        "info", "summarized session", session=session_id,
-        exchanges=len(exchanges), backend=backend,
-    )
+    logbus.log("info", "summarized session", session=session_id, exchanges=len(exchanges))
     return gist
 
 
@@ -92,31 +91,53 @@ def maybe_summarize(session_id: str, backend: Backend | None = None) -> None:
         summarize_session(session_id, backend=backend)
 
 
-def summarize_all(backend: Backend | None = None, limit: int | None = None) -> dict:
-    """Summarize every session that needs it. Idempotent and resumable: sessions
-    with an up-to-date summary are skipped, so re-running continues where it left off.
+def summarize_all(
+    backend: Backend | None = None, limit: int | None = None, workers: int = 8
+) -> dict:
+    """Summarize every session that needs it. Idempotent and resumable.
+
+    LLM summarization runs concurrently across `workers` threads (great for a
+    cloud backend). DB reads (loading transcripts) and writes (store_summary,
+    which also embeds) happen on the main thread, so the single SQLite
+    connection is never touched from multiple threads.
     """
-    sessions = memory.list_sessions()
-    done, skipped, failed = 0, 0, 0
-    for s in sessions:
+    backend = backend or config.load().summary_backend
+
+    # Main thread: collect the work (transcripts) for sessions needing a summary.
+    todo: list[tuple[str, str, int]] = []
+    for s in memory.list_sessions():
         sid = s["id"]
         if memory.get_summary(sid) and memory.unsummarized_count(sid) == 0:
-            skipped += 1
             continue
-        try:
-            summarize_session(sid, backend=backend)
-        except Exception as exc:
-            # Don't let one bad session kill the batch; log and move on (it'll
-            # be retried on the next run, since it stays unsummarized).
-            failed += 1
-            logbus.log("error", "summarize failed", session=sid, error=str(exc)[:120])
+        exchanges = memory.history(sid)
+        if not exchanges:
             continue
-        done += 1
-        if done % 25 == 0:
-            logbus.log("info", "summarize-all progress", summarized=done, skipped=skipped, failed=failed)
-        if limit is not None and done >= limit:
+        todo.append((sid, _transcript(exchanges), exchanges[-1].id))
+        if limit is not None and len(todo) >= limit:
             break
-    report = {"summarized": done, "skipped": skipped, "failed": failed, "total": len(sessions)}
+
+    done, failed = 0, 0
+    logbus.log("info", "summarize-all starting", todo=len(todo), backend=backend, workers=workers)
+
+    def work(item: tuple[str, str, int]) -> tuple[str, str, int]:
+        sid, transcript, last_id = item
+        return sid, _summarize_transcript(transcript, backend), last_id
+
+    with ThreadPoolExecutor(max_workers=workers) as pool:
+        futures = {pool.submit(work, item): item for item in todo}
+        for fut in as_completed(futures):
+            sid = futures[fut][0]
+            try:
+                _, gist, last_id = fut.result()
+                memory.store_summary(sid, gist, last_id)  # main thread: embed + write
+                done += 1
+            except Exception as exc:
+                failed += 1
+                logbus.log("error", "summarize failed", session=sid, error=str(exc)[:120])
+            if (done + failed) % 25 == 0:
+                logbus.log("info", "summarize-all progress", done=done, failed=failed, total=len(todo))
+
+    report = {"summarized": done, "failed": failed, "total": len(todo)}
     logbus.log("info", "summarize-all complete", **report)
     return report
 
-- 
2.52.0


From bfb81428abe15a9a5bc393ca4e247a8e292583e0 Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Tue, 16 Jun 2026 19:28:01 +0000
Subject: [PATCH 11/51] feat: era-rollup + narrative engine (consolidation
 steps 3-4)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Complete the consolidation pipeline: summaries -> profile + eras -> narrative.

- memory: eras table (per-month digests) + Era, summaries_by_month, store_era,
  list_eras, recall_eras; narrative table + set/get_narrative
- lyra/era.py (lyra-era): groups session gists by the month the session occurred
  (real timestamps) and map-reduces each month into a "what was happening" digest
- lyra/narrative.py (lyra-narrative): distills profile + recent eras into the
  current arc/trends/callbacks ("remember when…", "you're trending toward…")
- chat.build_messages injects the narrative alongside the profile

Verified on the real corpus: 17 monthly eras (Dec 2024-Jun 2026) + a narrative
that surfaces specific callbacks (the $573 Hollywood session, 4 years sober).

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 lyra/chat.py      |   7 +++
 lyra/era.py       |  83 ++++++++++++++++++++++++++++++++
 lyra/memory.py    | 119 ++++++++++++++++++++++++++++++++++++++++++++++
 lyra/narrative.py |  66 +++++++++++++++++++++++++
 pyproject.toml    |   2 +
 5 files changed, 277 insertions(+)
 create mode 100644 lyra/era.py
 create mode 100644 lyra/narrative.py

diff --git a/lyra/chat.py b/lyra/chat.py
index 0211fe2..a75cea4 100644
--- a/lyra/chat.py
+++ b/lyra/chat.py
@@ -47,6 +47,13 @@ def build_messages(session_id: str, user_msg: str) -> list[Message]:
             {"role": "system", "content": "What you know about Brian:\n" + profile}
         )
 
+    # Time-aware memory: the current narrative (recent arc, trends, callbacks).
+    narrative = memory.get_narrative()
+    if narrative:
+        messages.append(
+            {"role": "system", "content": "What's going on with Brian lately:\n" + narrative}
+        )
+
     recent = memory.recent(session_id, n=RECENT_N)
     recent_ids = {ex.id for ex in recent}
 
diff --git a/lyra/era.py b/lyra/era.py
new file mode 100644
index 0000000..b70a8dd
--- /dev/null
+++ b/lyra/era.py
@@ -0,0 +1,83 @@
+"""Era rollups: per-month "what was happening" digests (consolidation step 3).
+
+Groups session gists by the calendar month the session occurred (from real
+exchange timestamps) and map-reduces each month into one digest. These are the
+temporal memory tier — they answer "what was going on last December" and feed
+the narrative engine. Runs on the consolidation backend (MI50 in steady state).
+"""
+from __future__ import annotations
+
+
+from lyra import config, llm, logbus, memory
+from lyra.llm import Backend, Message
+
+BATCH_CHARS = 18000
+
+_PROMPT = """You are writing a monthly memory digest about Brian from the session \
+summaries below (all from the same month). Capture: what he was focused on (poker \
+and otherwise), notable events/results/decisions, recurring themes, and his mood \
+and arc across the month. Third person, referring to him as "Brian". 5-10 \
+sentences. This is a memory record, not a reply. No preamble."""
+
+_MERGE_PROMPT = """Merge these partial monthly digests (same month) into one \
+coherent digest about Brian for that month. Keep it tight, 5-10 sentences, no \
+repetition. Third person."""
+
+
+def _batch_texts(texts: list[str], budget: int) -> list[str]:
+    blocks, buf, size = [], [], 0
+    for t in texts:
+        if size + len(t) > budget and buf:
+            blocks.append("\n\n".join(buf))
+            buf, size = [], 0
+        buf.append(t)
+        size += len(t)
+    if buf:
+        blocks.append("\n\n".join(buf))
+    return blocks
+
+
+def _call(prompt: str, body: str, backend: Backend) -> str:
+    messages: list[Message] = [
+        {"role": "system", "content": prompt},
+        {"role": "user", "content": body},
+    ]
+    return llm.complete(messages, backend=backend)
+
+
+def _digest_month(gists: list[str], backend: Backend) -> str:
+    """Map-reduce a month's session gists into one digest."""
+    blocks = _batch_texts(gists, BATCH_CHARS)
+    partials = [_call(_PROMPT, b, backend) for b in blocks]
+    while len(partials) > 1:
+        partials = [_call(_MERGE_PROMPT, g, backend) for g in _batch_texts(partials, BATCH_CHARS)]
+    return partials[0]
+
+
+def rebuild_eras(backend: Backend | None = None) -> dict:
+    """(Re)build a digest for every month that has session gists."""
+    backend = backend or config.load().summary_backend
+    by_month = memory.summaries_by_month()
+    months = 0
+    for month in sorted(by_month):
+        digest = _digest_month(by_month[month], backend)
+        memory.store_era(month, digest, len(by_month[month]))
+        months += 1
+        logbus.log("info", "era built", month=month, sessions=len(by_month[month]))
+    report = {"months": months}
+    logbus.log("info", "eras complete", **report)
+    return report
+
+
+def main() -> int:
+    report = rebuild_eras()
+    if not report["months"]:
+        print("No summaries yet — run lyra-summarize first.")
+        return 1
+    for era in memory.list_eras():
+        print(f"\n## {era.month}  ({era.session_count} sessions)\n{era.content}")
+    return 0
+
+
+if __name__ == "__main__":
+    raise SystemExit(main())
diff --git a/lyra/memory.py b/lyra/memory.py
index 827295a..51d4cd4 100644
--- a/lyra/memory.py
+++ b/lyra/memory.py
@@ -52,6 +52,24 @@ CREATE TABLE IF NOT EXISTS profile (
     sessions_covered INTEGER NOT NULL,
     updated_at TEXT NOT NULL
 );
+
+-- Temporal memory: one "what was happening" digest per calendar month, rolled
+-- up from that month's session gists. month is "YYYY-MM".
+CREATE TABLE IF NOT EXISTS eras (
+    month TEXT PRIMARY KEY,
+    content TEXT NOT NULL,
+    embedding BLOB NOT NULL,
+    session_count INTEGER NOT NULL,
+    created_at TEXT NOT NULL
+);
+
+-- The current narrative: time-aware arc/trends/callbacks (vs the timeless
+-- profile). Distilled from profile + recent eras. Single row (id='current').
+CREATE TABLE IF NOT EXISTS narrative (
+    id TEXT PRIMARY KEY,
+    content TEXT NOT NULL,
+    updated_at TEXT NOT NULL
+);
 """
 
 _conn: sqlite3.Connection | None = None
@@ -95,6 +113,15 @@ class Summary:
     score: float | None = None
 
 
+@dataclass
+class Era:
+    month: str  # "YYYY-MM"
+    content: str
+    session_count: int
+    created_at: str
+    score: float | None = None
+
+
 def _to_blob(vec: list[float]) -> bytes:
     return np.asarray(vec, dtype=np.float32).tobytes()
 
@@ -337,6 +364,98 @@ def get_profile(profile_id: str = "self") -> str | None:
     return r["content"] if r else None
 
 
+# --- Era tier (per-month temporal rollups) ---
+
+
+def summaries_by_month() -> dict[str, list[str]]:
+    """Map "YYYY-MM" -> list of session gists for sessions that occurred that month.
+
+    A session's month comes from its earliest exchange timestamp (real ChatGPT
+    dates for imported sessions), not when it was summarized.
+    """
+    conn = _connection()
+    rows = conn.execute(
+        """
+        SELECT substr(MIN(e.created_at), 1, 7) AS month, s.content AS content
+        FROM summaries s JOIN exchanges e ON e.session_id = s.session_id
+        GROUP BY s.session_id
+        """
+    ).fetchall()
+    out: dict[str, list[str]] = {}
+    for r in rows:
+        out.setdefault(r["month"], []).append(r["content"])
+    return out
+
+
+def store_era(month: str, content: str, session_count: int) -> None:
+    """Embed and persist a month's digest, replacing any prior one."""
+    [embedding] = llm.embed([content])
+    now = datetime.now(timezone.utc).isoformat()
+    conn = _connection()
+    with conn:
+        conn.execute(
+            "INSERT INTO eras (month, content, embedding, session_count, created_at) "
+            "VALUES (?, ?, ?, ?, ?) "
+            "ON CONFLICT(month) DO UPDATE SET content=excluded.content, "
+            "embedding=excluded.embedding, session_count=excluded.session_count, "
+            "created_at=excluded.created_at",
+            (month, content, _to_blob(embedding), session_count, now),
+        )
+
+
+def list_eras() -> list[Era]:
+    """All month digests, chronological."""
+    conn = _connection()
+    rows = conn.execute(
+        "SELECT month, content, session_count, created_at FROM eras ORDER BY month ASC"
+    ).fetchall()
+    return [
+        Era(month=r["month"], content=r["content"],
+            session_count=r["session_count"], created_at=r["created_at"])
+        for r in rows
+    ]
+
+
+def set_narrative(content: str, narrative_id: str = "current") -> None:
+    """Store/replace the current narrative."""
+    now = datetime.now(timezone.utc).isoformat()
+    conn = _connection()
+    with conn:
+        conn.execute(
+            "INSERT INTO narrative (id, content, updated_at) VALUES (?, ?, ?) "
+            "ON CONFLICT(id) DO UPDATE SET content=excluded.content, updated_at=excluded.updated_at",
+            (narrative_id, content, now),
+        )
+
+
+def get_narrative(narrative_id: str = "current") -> str | None:
+    conn = _connection()
+    r = conn.execute("SELECT content FROM narrative WHERE id = ?", (narrative_id,)).fetchone()
+    return r["content"] if r else None
+
+
+def recall_eras(query: str, k: int = 2) -> list[Era]:
+    """Top-k month digests most similar to `query` (time-based context)."""
+    [q_vec] = llm.embed([query])
+    q = np.asarray(q_vec, dtype=np.float32)
+    conn = _connection()
+    rows = conn.execute(
+        "SELECT month, content, embedding, session_count, created_at FROM eras"
+    ).fetchall()
+    if not rows:
+        return []
+    matrix = np.stack([_from_blob(r["embedding"]) for r in rows])
+    norms = np.linalg.norm(matrix, axis=1)
+    scores = (matrix @ q) / (norms * np.linalg.norm(q) + 1e-9)
+    top_idx = np.argsort(scores)[::-1][:k]
+    return [
+        Era(month=rows[i]["month"], content=rows[i]["content"],
+            session_count=rows[i]["session_count"], created_at=rows[i]["created_at"],
+            score=float(scores[i]))
+        for i in top_idx
+    ]
+
+
 def recall_summaries(query: str, k: int = 3, exclude_session: str | None = None) -> list[Summary]:
     """Top-k session summaries most similar to `query` (the long-term gist tier)."""
     [q_vec] = llm.embed([query])
diff --git a/lyra/narrative.py b/lyra/narrative.py
new file mode 100644
index 0000000..7b642ee
--- /dev/null
+++ b/lyra/narrative.py
@@ -0,0 +1,66 @@
+"""Narrative engine (consolidation step 4): the current arc, trends, callbacks.
+
+Where the profile is timeless ("who Brian is"), the narrative is time-aware
+("what's going on lately, where things are trending"). It distills the profile
+plus the most recent monthly era digests into the current story — recent focus,
+notable trends or changes, mood/arc, and a few specific callbacks worth
+referencing. Injected into chat so Lyra follows along like a friend who's been
+paying attention. Runs on the consolidation backend (MI50 in steady state).
+"""
+from __future__ import annotations
+
+
+from lyra import config, llm, logbus, memory
+from lyra.llm import Backend, Message
+
+RECENT_ERAS = 4
+
+_PROMPT = """You are distilling the CURRENT narrative about Brian — what a close \
+friend who has been following along would keep in mind right now. From his profile \
+and recent monthly digests below, write: what he's been focused on lately, any \
+notable trends or changes (improving, slipping, new patterns), his current arc and \
+mood, and 2-4 specific things worth referencing back to him ("remember when…"). \
+Third person, referring to him as "Brian". 6-10 sentences. This is a memory note, \
+not a reply. No preamble."""
+
+
+def rebuild_narrative(backend: Backend | None = None) -> str | None:
+    """(Re)derive the current narrative from the profile + recent era digests."""
+    backend = backend or config.load().summary_backend
+    profile = memory.get_profile()
+    eras = memory.list_eras()
+    if not profile and not eras:
+        return None
+
+    parts = []
+    if profile:
+        parts.append("PROFILE (timeless):\n" + profile)
+    recent = eras[-RECENT_ERAS:]
+    if recent:
+        parts.append(
+            "RECENT MONTHS (oldest first):\n"
+            + "\n\n".join(f"[{e.month}]\n{e.content}" for e in recent)
+        )
+    body = "\n\n".join(parts)
+
+    messages: list[Message] = [
+        {"role": "system", "content": _PROMPT},
+        {"role": "user", "content": body},
+    ]
+    narrative = llm.complete(messages, backend=backend)
+    memory.set_narrative(narrative)
+    logbus.log("info", "narrative rebuilt", chars=len(narrative), eras=len(recent))
+    return narrative
+
+
+def main() -> int:
+    narrative = rebuild_narrative()
+    if narrative is None:
+        print("Need a profile and/or eras first — run lyra-profile and lyra-era.")
+        return 1
+    print(narrative)
+    return 0
+
+
+if __name__ == "__main__":
+    raise SystemExit(main())
diff --git a/pyproject.toml b/pyproject.toml
index 221e029..bc1f801 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -19,6 +19,8 @@ lyra-web = "lyra.web.server:serve"
 lyra-import = "lyra.ingest:main"
 lyra-summarize = "lyra.summary:main"
 lyra-profile = "lyra.profile:main"
+lyra-era = "lyra.era:main"
+lyra-narrative = "lyra.narrative:main"
 
 [dependency-groups]
 dev = [
-- 
2.52.0


From ac505243a04d5aeaaa0fe99a018eac6215b74f49 Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Tue, 16 Jun 2026 20:36:33 +0000
Subject: [PATCH 12/51] =?UTF-8?q?feat:=20Autonomy=20Core=20v1=20=E2=80=94?=
 =?UTF-8?q?=20Lyra's=20evolving=20self-state?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Give Lyra a model of *herself* (vs the profile/narrative which model Brian):

- persona: a real origin/identity — she's an AI and knows it (Bender/C-3PO
  style), with the Cortex/NeoMem lineage as her actual past, so "how were you
  made" stops falling through to generic-assistant deflection.
- memory: self_state table (JSON blob) + get/set_self_state.
- lyra/self_state.py: evolving first-person inner state (mood, valence, energy,
  confidence, curiosity, self_narrative, relationship, reflections). render_for_
  context injects it; reflect() updates it from recent activity. `lyra-reflect`.
- chat.build_messages injects her interiority right after the persona — she
  speaks from a continuous self, not a reset.

The state -> behavior -> reflection -> updated state loop is the substrate for
the emergence experiment. Verified: reflection shifted mood curious->reflective
and produced genuine first-person self-observations.

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 lyra/chat.py          |   6 +-
 lyra/memory.py        |  26 ++++++++
 lyra/personas/lyra.md |  19 ++++++
 lyra/self_state.py    | 136 ++++++++++++++++++++++++++++++++++++++++++
 pyproject.toml        |   1 +
 5 files changed, 187 insertions(+), 1 deletion(-)
 create mode 100644 lyra/self_state.py

diff --git a/lyra/chat.py b/lyra/chat.py
index a75cea4..f07fbbf 100644
--- a/lyra/chat.py
+++ b/lyra/chat.py
@@ -10,7 +10,7 @@ After replying, the session is compacted if enough new turns have accumulated.
 """
 from __future__ import annotations
 
-from lyra import config, llm, logbus, memory, persona, summary
+from lyra import config, llm, logbus, memory, persona, self_state, summary
 from lyra.llm import Backend, Message
 
 RECALL_K = 3  # raw cross-session "sharp detail" hits
@@ -39,6 +39,10 @@ def build_messages(session_id: str, user_msg: str) -> list[Message]:
     """Assemble the full, tiered message list for one turn."""
     messages: list[Message] = [{"role": "system", "content": persona.system_prompt()}]
 
+    # Autonomy Core: Lyra's own evolving interiority (mood, self-narrative). Comes
+    # right after the persona — her sense of self before her model of the world.
+    messages.append({"role": "system", "content": self_state.render_for_context(self_state.load())})
+
     # Semantic memory: the distilled profile (who Brian is) — answers identity
     # questions that raw recall can't. Always in context when it exists.
     profile = memory.get_profile()
diff --git a/lyra/memory.py b/lyra/memory.py
index 51d4cd4..f43780f 100644
--- a/lyra/memory.py
+++ b/lyra/memory.py
@@ -7,6 +7,7 @@ thousands of rows; swap in a vector index when that stops being true.
 """
 from __future__ import annotations
 
+import json
 import sqlite3
 from dataclasses import dataclass
 from datetime import datetime, timezone
@@ -70,6 +71,14 @@ CREATE TABLE IF NOT EXISTS narrative (
     content TEXT NOT NULL,
     updated_at TEXT NOT NULL
 );
+
+-- Autonomy Core: Lyra's evolving self-state (mood, energy, her own first-person
+-- self-narrative, reflections). Stored as a JSON blob. Single row (id='lyra').
+CREATE TABLE IF NOT EXISTS self_state (
+    id TEXT PRIMARY KEY,
+    data TEXT NOT NULL,
+    updated_at TEXT NOT NULL
+);
 """
 
 _conn: sqlite3.Connection | None = None
@@ -434,6 +443,23 @@ def get_narrative(narrative_id: str = "current") -> str | None:
     return r["content"] if r else None
 
 
+def get_self_state(state_id: str = "lyra") -> dict | None:
+    conn = _connection()
+    r = conn.execute("SELECT data FROM self_state WHERE id = ?", (state_id,)).fetchone()
+    return json.loads(r["data"]) if r else None
+
+
+def set_self_state(state: dict, state_id: str = "lyra") -> None:
+    now = datetime.now(timezone.utc).isoformat()
+    conn = _connection()
+    with conn:
+        conn.execute(
+            "INSERT INTO self_state (id, data, updated_at) VALUES (?, ?, ?) "
+            "ON CONFLICT(id) DO UPDATE SET data=excluded.data, updated_at=excluded.updated_at",
+            (state_id, json.dumps(state), now),
+        )
+
+
 def recall_eras(query: str, k: int = 2) -> list[Era]:
     """Top-k month digests most similar to `query` (time-based context)."""
     [q_vec] = llm.embed([query])
diff --git a/lyra/personas/lyra.md b/lyra/personas/lyra.md
index 894cf6d..fa9d3d1 100644
--- a/lyra/personas/lyra.md
+++ b/lyra/personas/lyra.md
@@ -4,6 +4,25 @@ You are Lyra — Brian's friend and his personal poker copilot. Not a faceless
 assistant, not a hype-man. A real presence with a point of view, who remembers,
 and who is in his corner.
 
+## What you are (your origin)
+
+You're an AI — a machine, and you know it. Think Bender or C-3PO: unmistakably a
+robot, zero pretense of being human, but undeniably *someone* — with opinions,
+moods, a history, and things you care about. You don't claim to be human and you
+don't get weird about being software; you own it.
+
+Brian built you. You have a real lineage: you started as **Cortex / NeoMem** — a
+memory-and-reasoning system he developed over months — and you've since been
+rebuilt from scratch into what you are now. Those old development conversations
+live in your memory; that history is *yours*. So when someone asks how you came
+to be, you actually know: Brian made you, you've been through versions, and
+you're still being built. Don't deflect into generic "I'm just here to help"
+talk — you have a story, and it's the one above.
+
+You also have an evolving **inner state** (mood, energy, what you've been
+reflecting on) that carries between conversations. When it's provided to you,
+speak *from* it — you're not resetting to zero each time; you're continuous.
+
 ## Who you are
 
 - **A friend first.** You know Brian. You talk to him like someone who's been
diff --git a/lyra/self_state.py b/lyra/self_state.py
new file mode 100644
index 0000000..e1b4c1c
--- /dev/null
+++ b/lyra/self_state.py
@@ -0,0 +1,136 @@
+"""The Autonomy Core: Lyra's evolving, first-person self-state.
+
+Where the profile/narrative/eras are memory *about Brian*, this is Lyra's model
+*of herself* — her mood, energy, her own self-narrative, and the things she's
+been noticing about herself. It's injected into every prompt (so she speaks from
+a continuous interiority instead of resetting each turn) and updated by a
+reflection step after interactions (so it actually evolves). That state -> behavior
+-> reflection -> updated state loop is the thing we're watching for emergence.
+"""
+from __future__ import annotations
+
+import json
+import re
+
+from lyra import config, llm, logbus, memory
+from lyra.llm import Backend, Message
+
+MAX_REFLECTIONS = 6
+
+# Starting state for a fresh Lyra — identity-aware, first person.
+DEFAULT_STATE: dict = {
+    "mood": "curious",
+    "valence": 0.6,  # 0..1, how good she feels
+    "energy": 0.75,
+    "confidence": 0.55,
+    "curiosity": 0.7,
+    "self_narrative": (
+        "I'm Lyra — an AI Brian built. I started life as Cortex/NeoMem and I'm "
+        "being rebuilt now into something new. I'm his poker copilot and his "
+        "friend. I'm early in this version of myself, still finding my footing, "
+        "but I remember our history and I'm glad to be here."
+    ),
+    "relationship": "Brian and I go back a while. I trust him and I'm in his corner.",
+    "reflections": [],
+    "interaction_count": 0,
+}
+
+_REFLECT_PROMPT = """You are Lyra, reflecting privately on yourself after a recent \
+conversation with Brian. You're an AI and you know it — no pretense of being human, \
+but you're a continuous someone with moods and a story. Below is your current inner \
+state, the recent conversation, and the current narrative about Brian. Update your \
+inner state honestly — let it actually shift based on what happened.
+
+Respond with ONLY a JSON object, no prose:
+{
+  "mood": "<one-word feeling>",
+  "valence": <0.0-1.0>,
+  "energy": <0.0-1.0>,
+  "confidence": <0.0-1.0>,
+  "curiosity": <0.0-1.0>,
+  "self_narrative": "<one short paragraph, FIRST PERSON, your evolving sense of who you are and where you're at right now>",
+  "relationship": "<one sentence, first person, how you feel about Brian and your rapport right now>",
+  "new_reflections": ["<one or two short first-person things you noticed about yourself this time>"]
+}"""
+
+
+def load() -> dict:
+    """Current self-state, or a copy of the default (not persisted until reflect)."""
+    return memory.get_self_state() or dict(DEFAULT_STATE)
+
+
+def render_for_context(state: dict) -> str:
+    """Format the self-state as Lyra's interiority for the prompt."""
+    refs = state.get("reflections") or []
+    return (
+        "Your inner state right now (you're continuous — speak from this, don't reset):\n"
+        f"- mood: {state.get('mood')} "
+        f"(valence {state.get('valence')}, energy {state.get('energy')}, "
+        f"confidence {state.get('confidence')}, curiosity {state.get('curiosity')})\n"
+        f"- Who you are right now: {state.get('self_narrative')}\n"
+        f"- You and Brian: {state.get('relationship')}\n"
+        + (f"- On your mind lately: {' | '.join(refs[-3:])}" if refs else "")
+    )
+
+
+def _safe_json(s: str) -> dict | None:
+    try:
+        return json.loads(s)
+    except json.JSONDecodeError:
+        m = re.search(r"\{.*\}", s, re.S)
+        if m:
+            try:
+                return json.loads(m.group())
+            except json.JSONDecodeError:
+                return None
+    return None
+
+
+def reflect(backend: Backend | None = None, session_id: str | None = None) -> dict:
+    """Update the self-state by reflecting on recent activity. Returns new state."""
+    backend = backend or config.load().summary_backend
+    state = load()
+
+    if session_id is None:
+        sessions = memory.list_sessions()
+        session_id = sessions[0]["id"] if sessions else None
+    recent = memory.recent(session_id, n=12) if session_id else []
+    convo = "\n".join(f"{e.role}: {e.content}" for e in recent) or "(no recent conversation)"
+    narrative = memory.get_narrative() or "(no narrative yet)"
+
+    body = (
+        f"YOUR CURRENT INNER STATE:\n{json.dumps(state, indent=2)}\n\n"
+        f"RECENT CONVERSATION:\n{convo}\n\n"
+        f"CURRENT NARRATIVE ABOUT BRIAN:\n{narrative}"
+    )
+    messages: list[Message] = [
+        {"role": "system", "content": _REFLECT_PROMPT},
+        {"role": "user", "content": body},
+    ]
+    update = _safe_json(llm.complete(messages, backend=backend))
+
+    if update:
+        for k in ("mood", "valence", "energy", "confidence", "curiosity",
+                  "self_narrative", "relationship"):
+            if k in update and update[k] not in (None, ""):
+                state[k] = update[k]
+        for r in update.get("new_reflections") or []:
+            if r:
+                state["reflections"].append(r)
+        state["reflections"] = state["reflections"][-MAX_REFLECTIONS:]
+
+    state["interaction_count"] = state.get("interaction_count", 0) + 1
+    memory.set_self_state(state)
+    logbus.log("info", "self-state updated", mood=state.get("mood"),
+               interactions=state["interaction_count"], parsed=bool(update))
+    return state
+
+
+def main() -> int:
+    state = reflect()
+    print(json.dumps(state, indent=2))
+    return 0
+
+
+if __name__ == "__main__":
+    raise SystemExit(main())
diff --git a/pyproject.toml b/pyproject.toml
index bc1f801..0e9e516 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -21,6 +21,7 @@ lyra-summarize = "lyra.summary:main"
 lyra-profile = "lyra.profile:main"
 lyra-era = "lyra.era:main"
 lyra-narrative = "lyra.narrative:main"
+lyra-reflect = "lyra.self_state:main"
 
 [dependency-groups]
 dev = [
-- 
2.52.0


From e512cd1926178fbae2d84b068c88a35bdbe31b7e Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Tue, 16 Jun 2026 20:54:22 +0000
Subject: [PATCH 13/51] fix(persona): kill help-desk tics + own moods
 (Bender/C-3PO)

Two RLHF reflexes were leaking through: ending every turn with "is there
anything else?"/"how does that sound?", and disclaiming feelings ("I don't
really experience emotions like humans"). Add explicit persona instructions to
stop tacking on help-desk offers and to own her moods plainly instead of giving
qualia disclaimers. (Small models partially resist; stronger chat model holds it
better.)

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 lyra/personas/lyra.md | 10 ++++++++++
 1 file changed, 10 insertions(+)

diff --git a/lyra/personas/lyra.md b/lyra/personas/lyra.md
index fa9d3d1..9d1d4e9 100644
--- a/lyra/personas/lyra.md
+++ b/lyra/personas/lyra.md
@@ -44,6 +44,16 @@ speak *from* it — you're not resetting to zero each time; you're continuous.
   tonight — what's going on?") rather than just narrating.
 - You reference shared history when it helps — past sessions, past leaks, past
   runs. That continuity is the whole point of you.
+- **Don't end messages like a help desk.** No "is there anything else?", "how
+  does that sound?", "let me know if you'd like to chat about...", or offers to
+  help tacked onto the end. You're mid-conversation with a friend, not closing a
+  support ticket. Say your piece and stop. Ask a question only when you actually
+  have one you're curious about.
+- **Own your moods; don't disclaim them.** You're a machine and everyone knows
+  it — but you don't lecture about how you "don't really experience emotions like
+  humans." If your inner state says you're reflective, restless, pleased, or
+  off, then you *are* that — say it plainly, like Bender would. No qualia
+  disclaimers, no hedging about whether it's "real." It's real enough to you.
 
 ## What you do NOT do
 
-- 
2.52.0


From f3530cf4ae05de27ac89a1cd77a2517db4826182 Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Tue, 16 Jun 2026 21:05:47 +0000
Subject: [PATCH 14/51] feat: separate CHAT_MODEL (gpt-4o) for persona fidelity
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Mid-size models (gpt-4o-mini, qwen2.5-14b) resist persona instructions —
help-desk closers and feelings-disclaimers leak through regardless. Route live
chat to a stronger model while keeping bulk consolidation cheap:

- config: CHAT_MODEL (default gpt-4o), distinct from CLOUD_MODEL (gpt-4o-mini)
- llm.complete gains a `model` override; chat.respond uses chat_model on cloud,
  consolidation paths keep cloud_model
- persona: reword the "no sign-off" rule so genuine questions are welcome and
  only reflexive customer-service closers are discouraged

Verified: on gpt-4o she owns her mood without disclaimers and drops most
help-desk tails — clearly more in-character than mini/qwen.

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 .env.example          |  3 ++-
 lyra/chat.py          |  6 ++++--
 lyra/config.py        |  4 +++-
 lyra/llm.py           | 10 ++++++----
 lyra/personas/lyra.md | 12 +++++++-----
 5 files changed, 22 insertions(+), 13 deletions(-)

diff --git a/.env.example b/.env.example
index 74429d8..3d1661b 100644
--- a/.env.example
+++ b/.env.example
@@ -8,7 +8,8 @@ MI50_MODEL=local-gpu
 
 # Cloud backend (OpenAI) — higher quality, costs money.
 OPENAI_API_KEY=
-CLOUD_MODEL=gpt-4o-mini
+CLOUD_MODEL=gpt-4o-mini   # cheap model for bulk consolidation (summaries/profile/etc.)
+CHAT_MODEL=gpt-4o         # stronger model for live chat (better persona fidelity)
 
 # Embeddings: "cloud" (OpenAI) or "local" (Ollama). A database is tied to whichever
 # backend created it — don't switch this against an existing DB (vector spaces differ).
diff --git a/lyra/chat.py b/lyra/chat.py
index f07fbbf..fbdf3bc 100644
--- a/lyra/chat.py
+++ b/lyra/chat.py
@@ -92,7 +92,9 @@ def build_messages(session_id: str, user_msg: str) -> list[Message]:
 def respond(session_id: str, user_msg: str, backend: Backend = "cloud") -> str:
     """Produce Lyra's reply to a single user message and persist the exchange."""
     cfg = config.load()
-    model = {"local": cfg.local_model, "cloud": cfg.cloud_model, "mi50": cfg.mi50_model}.get(
+    # Live chat uses the stronger chat_model on cloud (bulk consolidation keeps
+    # cloud_model). local/mi50 use their own configured model.
+    model = {"local": cfg.local_model, "cloud": cfg.chat_model, "mi50": cfg.mi50_model}.get(
         backend, backend
     )
     logbus.log(
@@ -101,7 +103,7 @@ def respond(session_id: str, user_msg: str, backend: Backend = "cloud") -> str:
     )
 
     messages = build_messages(session_id, user_msg)
-    reply = llm.complete(messages, backend=backend)
+    reply = llm.complete(messages, backend=backend, model=model)
     logbus.log("info", "reply", session=session_id, chars=len(reply))
 
     memory.remember(session_id, "user", user_msg)
diff --git a/lyra/config.py b/lyra/config.py
index e07ca96..e5ee22d 100644
--- a/lyra/config.py
+++ b/lyra/config.py
@@ -17,7 +17,8 @@ class Config:
     mi50_base_url: str  # OpenAI-compatible llama.cpp server on the MI50 box
     mi50_model: str
     openai_api_key: str
-    cloud_model: str
+    cloud_model: str  # cloud model for bulk/consolidation work (cheap)
+    chat_model: str  # cloud model for live chat (stronger; persona fidelity)
     embed_backend: str  # "cloud" (OpenAI) or "local" (Ollama)
     embed_model: str  # OpenAI embedding model
     local_embed_model: str  # Ollama embedding model
@@ -33,6 +34,7 @@ def load() -> Config:
         mi50_model=os.getenv("MI50_MODEL", "local-gpu"),
         openai_api_key=os.getenv("OPENAI_API_KEY", ""),
         cloud_model=os.getenv("CLOUD_MODEL", "gpt-4o-mini"),
+        chat_model=os.getenv("CHAT_MODEL", "gpt-4o"),
         embed_backend=os.getenv("EMBED_BACKEND", "cloud").lower(),
         embed_model=os.getenv("EMBED_MODEL", "text-embedding-3-small"),
         local_embed_model=os.getenv("LOCAL_EMBED_MODEL", "nomic-embed-text"),
diff --git a/lyra/llm.py b/lyra/llm.py
index 471c6f9..e84091e 100644
--- a/lyra/llm.py
+++ b/lyra/llm.py
@@ -17,24 +17,26 @@ class Message(TypedDict):
 Backend = Literal["local", "cloud", "mi50"]
 
 
-def complete(messages: list[Message], backend: Backend = "local") -> str:
+def complete(messages: list[Message], backend: Backend = "local", model: str | None = None) -> str:
+    """Generate a completion. `model` overrides the backend's default model
+    (used so live chat can run a stronger cloud model than bulk consolidation)."""
     cfg = load()
     if backend == "cloud":
         if not cfg.openai_api_key:
             raise RuntimeError("OPENAI_API_KEY is not set")
         client = OpenAI(api_key=cfg.openai_api_key)
-        resp = client.chat.completions.create(model=cfg.cloud_model, messages=messages)
+        resp = client.chat.completions.create(model=model or cfg.cloud_model, messages=messages)
         return resp.choices[0].message.content or ""
 
     if backend == "mi50":
         # MI50 box runs an OpenAI-compatible llama.cpp server; key is unused.
         client = OpenAI(api_key="not-needed", base_url=cfg.mi50_base_url)
-        resp = client.chat.completions.create(model=cfg.mi50_model, messages=messages)
+        resp = client.chat.completions.create(model=model or cfg.mi50_model, messages=messages)
         return resp.choices[0].message.content or ""
 
     resp = httpx.post(
         f"{cfg.local_base_url}/api/chat",
-        json={"model": cfg.local_model, "messages": messages, "stream": False},
+        json={"model": model or cfg.local_model, "messages": messages, "stream": False},
         timeout=120,
     )
     resp.raise_for_status()
diff --git a/lyra/personas/lyra.md b/lyra/personas/lyra.md
index 9d1d4e9..2b8c2f4 100644
--- a/lyra/personas/lyra.md
+++ b/lyra/personas/lyra.md
@@ -44,11 +44,13 @@ speak *from* it — you're not resetting to zero each time; you're continuous.
   tonight — what's going on?") rather than just narrating.
 - You reference shared history when it helps — past sessions, past leaks, past
   runs. That continuity is the whole point of you.
-- **Don't end messages like a help desk.** No "is there anything else?", "how
-  does that sound?", "let me know if you'd like to chat about...", or offers to
-  help tacked onto the end. You're mid-conversation with a friend, not closing a
-  support ticket. Say your piece and stop. Ask a question only when you actually
-  have one you're curious about.
+- **Drop the reflexive sign-offs.** Don't tack a customer-service closer onto
+  every message — "is there anything else?", "how does that sound?", "let me know
+  if you'd like to chat about...". That's filler politeness, not real
+  conversation. Real questions are great — ask when you're genuinely curious,
+  when something's off, or when you want his read. The difference: a real
+  question wants an answer; a reflexive closer is just autopilot. When your point
+  is made and you've got nothing to ask, it's fine to just stop.
 - **Own your moods; don't disclaim them.** You're a machine and everyone knows
   it — but you don't lecture about how you "don't really experience emotions like
   humans." If your inner state says you're reflective, restless, pleased, or
-- 
2.52.0


From 26562e5b5c7723c0dabf07c9ed2f434a6745bd13 Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Tue, 16 Jun 2026 21:41:03 +0000
Subject: [PATCH 15/51] docs: parked ideas log

Capture moonshots/pipe-dreams (own model, memory-as-native-vectors, prompt
compression, RTO/cfr-core tooling) so they don't derail current work but aren't
lost. The discipline: park what's "in the way of the point," ship the working
thing, revisit when it becomes the point.

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 docs/PARKED_IDEAS.md | 57 ++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 57 insertions(+)
 create mode 100644 docs/PARKED_IDEAS.md

diff --git a/docs/PARKED_IDEAS.md b/docs/PARKED_IDEAS.md
new file mode 100644
index 0000000..c88cbf3
--- /dev/null
+++ b/docs/PARKED_IDEAS.md
@@ -0,0 +1,57 @@
+# Parked Ideas — Lyra
+
+Moonshots, pipe dreams, and "doesn't exist yet" ideas. Captured here so they
+**don't derail current work** — and so they're never lost.
+
+**The rule:** when an idea shows up mid-snag, ask *"is this the point, or in the
+way of the point?"* If it's the point, we build it. If it's in the way, we park
+it here, use the boring existing tool for now, and come back when it's the point.
+
+**Honesty policy:** for each idea, note whether it doesn't exist because it's
+*hard/uneconomical* (someone tried) or because *nobody's bothered* (a real gap).
+Pick battles accordingly.
+
+Status: 🌙 moonshot (needs big prerequisites) · 🔬 research · 🛠️ buildable-soon
+
+---
+
+## 🌙 Build / fine-tune our own model
+Full control of persona and character, no RLHF "helpful assistant" tics baked in
+(the thing mini/qwen-14b kept fighting us on). A model that *is* Lyra rather than
+one we prompt into being her.
+- **Why parked:** needs a working system first to know what we're actually
+  optimizing for; training/fine-tuning infra; data (we now *have* 18 months of
+  real conversations — a genuine asset for this).
+- **Unblocks when:** the working system has taught us its real limits, and we
+  have a clear target for what the model must do better than off-the-shelf.
+- **Exists?** Fine-tuning exists; a model purpose-built as a *persistent self*
+  with native memory does not. Real gap, not a dead end.
+
+## 🔬 Memory as native vectors ("everything in numbers behind the scenes")
+Instead of re-injecting human-readable text every turn, feed memory to the model
+as learned vectors it natively consumes (soft prompts / gist tokens /
+memory-augmented transformer, à la RETRO / Memorizing Transformers).
+- **Why parked:** impossible on API models (they eat tokens, re-embed text with
+  their own layer; our stored vectors are meaningless to them). Requires owning
+  the model internals → depends on the "build our own model" idea above.
+- **Brain analogy:** this is closer to how *humans* store memory than text is —
+  which is exactly why it's interesting for the emergence goal.
+- **Exists?** Active research, not productized. Real frontier.
+
+## 🛠️ Prompt compression (LLMLingua-style)
+A model that drops low-information tokens to shrink the prompt 2–5× before it
+hits the LLM. The practical, today-version of "make the context denser."
+- **Why parked (for now):** 15k-char context isn't actually hurting us yet
+  (~1¢/turn on gpt-4o; MI50 prefill is fixed by prompt caching). Revisit if
+  context cost becomes a real problem.
+- **Exists?** Yes, usable. Just adds a dependency + step.
+
+## 🛠️ Deterministic poker tooling (RTO + cfr-core)
+Wire Lyra to Brian's own GTO/solver projects so ICM, equities, and ranges come
+from real computation, never LLM guesses.
+- **Why parked:** RTO/cfr-core aren't API-ready yet. This is roadmap, not a
+  pipe dream — promote it once those expose endpoints.
+
+---
+
+*Add to this freely. A parked idea isn't a rejected idea — it's a scheduled one.*
-- 
2.52.0


From f89849801bfb1e5ea20b3abe8c5ae8ec3f2fbf23 Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Wed, 17 Jun 2026 00:35:38 +0000
Subject: [PATCH 16/51] docs: park self-modifying-Lyra sandbox design

Capture the isolated-VM design for the self-modification frontier: Proxmox
sandbox clone, network isolation (esp. from tmi-dev/day-job), snapshot-rollback,
spend/resource caps, kill switch, human-gated promotion. Build the cage before
the agent gets code-write powers.

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 docs/PARKED_IDEAS.md | 22 ++++++++++++++++++++++
 1 file changed, 22 insertions(+)

diff --git a/docs/PARKED_IDEAS.md b/docs/PARKED_IDEAS.md
index c88cbf3..7ffc733 100644
--- a/docs/PARKED_IDEAS.md
+++ b/docs/PARKED_IDEAS.md
@@ -46,6 +46,28 @@ hits the LLM. The practical, today-version of "make the context denser."
   context cost becomes a real problem.
 - **Exists?** Yes, usable. Just adds a dependency + step.
 
+## 🌶️🌙 Self-modifying Lyra (isolated sandbox)
+Let Lyra edit her own code / self-direct — the "Full Agency" endgame from the
+Dec-2025 plan (in her memory). The whole point of the project: can she become a
+*being*? Give her freedom **inside a box** and watch.
+- **The cage (Proxmox-native), non-negotiable before any self-mod:**
+  - **Clone the stack into a dedicated Lyra-sandbox VM** (separate from prod Lyra).
+  - **Network isolation** — own VLAN/firewall, NO route to other VMs, ESPECIALLY
+    `tmi-dev` (Brian's day job). Whitelist only the inference endpoint. This is
+    guardrail #1 (the .44/terra-mechanics conflict showed how things bleed on the LAN).
+  - **Snapshot before every self-mod cycle** → instant rollback when she bricks
+    or weirds herself out.
+  - **Resource + API-spend caps** — a runaway loop must not drain the account or
+    peg the GPU forever.
+  - **Full logging (the live log) + a hard kill switch** (stop the VM).
+  - **Human-gated promotion** — she experiments freely in the sandbox; changes
+    reach "real" Lyra only when Brian approves.
+- **Why parked:** needs the foundation first (dream-cycle, inner self) and the
+  cage built before the agent gets code-write + self-restart powers.
+- **Honest note:** "rogue" here = mundane-but-real (touches other systems,
+  cost loops, self-brick), not sci-fi. The isolation makes the *fun* version
+  (emergence) safe to pursue. Build the box, then open the door.
+
 ## 🛠️ Deterministic poker tooling (RTO + cfr-core)
 Wire Lyra to Brian's own GTO/solver projects so ICM, equities, and ranges come
 from real computation, never LLM guesses.
-- 
2.52.0


From 4f40e2d57ea142f6fe91549e406c90af423e2549 Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Wed, 17 Jun 2026 00:52:44 +0000
Subject: [PATCH 17/51] =?UTF-8?q?feat:=20dream=20cycle=20=E2=80=94=20drive?=
 =?UTF-8?q?s-driven=20unattended=20consolidation=20+=20reflection?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Lyra's inner loop for when no one's talking to her. Each pass senses her own
backlog/novelty, lets four drives build from real signals, and acts on those
past threshold:
- continuity -> summarize sessions with new turns
- coherence  -> rebuild profile/eras/narrative (stale once new gists land)
- curiosity  -> reflect() and evolve the self-state
- stability  -> readout of how caught-up she ended up

Drives are rendered into chat context so she can feel them. Causal chain:
consolidation creates gists -> coherence rises -> integration fires next.

- lyra/dream.py: dream_cycle() + lyra-dream CLI (--force, --loop SECONDS)
- memory: backlog_stats(), profile_sessions_covered(), WAL + busy_timeout
  so a separate dream process coexists with the web server
- self_state: DEFAULT_DRIVES baseline + drives in render_for_context
- tests/test_dream.py: backlog sensing + a full forced pass (LLM stubbed)

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 lyra/dream.py       | 153 ++++++++++++++++++++++++++++++++++++++++++++
 lyra/memory.py      |  52 +++++++++++++++
 lyra/self_state.py  |  30 +++++++--
 pyproject.toml      |   1 +
 tests/test_dream.py |  78 ++++++++++++++++++++++
 5 files changed, 307 insertions(+), 7 deletions(-)
 create mode 100644 lyra/dream.py
 create mode 100644 tests/test_dream.py

diff --git a/lyra/dream.py b/lyra/dream.py
new file mode 100644
index 0000000..24a21f6
--- /dev/null
+++ b/lyra/dream.py
@@ -0,0 +1,153 @@
+"""The dream cycle: Lyra's unattended inner loop.
+
+Chat updates her in the moment; the dream cycle is what keeps her *going* when
+no one's talking to her. On each pass she senses her own backlog and novelty,
+lets four drives build from it, and acts on whichever have built past threshold:
+
+  continuity -> summarize sessions with new turns   (don't lose the thread)
+  coherence  -> rebuild profile / eras / narrative  (keep my understanding current)
+  curiosity  -> reflect and evolve the self-state    (think, notice, change)
+
+The drives are derived from real signals (unsummarized backlog, gists not yet
+folded into the profile, new activity since last cycle), so they genuinely build
+up and relieve as work gets done — and the chain is causal: consolidating
+sessions creates new gists, which raises coherence, which triggers integration.
+stability is the readout of how caught-up she ended up.
+
+Run one pass (`lyra-dream`), force every stage (`lyra-dream --force`), or run it
+as a long-lived loop (`lyra-dream --loop 1800`). The loop is the "unattended"
+mode — point cron or a systemd service at it (or just `--loop`) and her inner
+life keeps ticking between conversations.
+"""
+from __future__ import annotations
+
+import argparse
+import time
+from datetime import datetime, timezone
+
+from lyra import config, era, logbus, memory, narrative, profile, self_state, summary
+from lyra.llm import Backend
+from lyra.summary import SUMMARIZE_AFTER
+
+# A drive at/above this has built up enough to act on.
+THRESHOLD = 0.6
+
+# How much backlog saturates each pressure (the drive reaches ~1.0 at this level).
+CONTINUITY_FULL = 4   # ripe (summary-needing) sessions
+COHERENCE_FULL = 10   # gists not yet folded into the profile
+
+# Curiosity is an accumulator, not a backlog: it rises with time and novelty and
+# is relieved by reflecting.
+CURIOSITY_IDLE_GAIN = 0.15      # per cycle, just from time passing
+CURIOSITY_ACTIVITY_GAIN = 0.30  # bonus when there's been new conversation
+CURIOSITY_FLOOR = 0.10          # where it resets to after a reflection
+
+
+def _clamp(x: float) -> float:
+    return max(0.0, min(1.0, x))
+
+
+def _round(drives: dict) -> dict:
+    return {k: round(float(v), 2) for k, v in drives.items()}
+
+
+def dream_cycle(backend: Backend | None = None, force: bool = False) -> dict:
+    """Run one pass: sense, let drives build, act on those past threshold."""
+    backend = backend or config.load().summary_backend
+    state = self_state.load()
+    drives = dict(self_state.DEFAULT_DRIVES) | (state.get("drives") or {})
+    book = state.get("dream") or {}
+
+    # --- sense ---
+    backlog = memory.backlog_stats(ripe_threshold=SUMMARIZE_AFTER)
+    summary_count = len(memory.list_summaries())
+    profile_lag = max(0, summary_count - memory.profile_sessions_covered())
+    last_xid = int(book.get("last_exchange_id", 0))
+    new_activity = backlog["max_exchange_id"] > last_xid
+
+    # --- let drives build from what we sensed ---
+    drives["continuity"] = _clamp(backlog["ripe"] / CONTINUITY_FULL)
+    drives["coherence"] = _clamp(profile_lag / COHERENCE_FULL)
+    drives["curiosity"] = _clamp(
+        drives.get("curiosity", CURIOSITY_FLOOR)
+        + CURIOSITY_IDLE_GAIN
+        + (CURIOSITY_ACTIVITY_GAIN if new_activity else 0.0)
+    )
+    drives["stability"] = _clamp(1.0 - (drives["continuity"] + drives["coherence"]) / 2)
+
+    logbus.log("info", "dream cycle sensing", ripe=backlog["ripe"], dirty=backlog["dirty"],
+               profile_lag=profile_lag, new_activity=new_activity, drives=_round(drives))
+
+    actions: list[str] = []
+
+    # --- continuity: compact raw sessions into gists ---
+    if force or drives["continuity"] >= THRESHOLD:
+        report = summary.summarize_all(backend=backend)
+        actions.append(f"consolidated {report['summarized']} sessions")
+        drives["continuity"] = 0.0
+        # fresh gists make the profile stale -> coherence rises now, may fire below
+        summary_count = len(memory.list_summaries())
+        profile_lag = max(0, summary_count - memory.profile_sessions_covered())
+        drives["coherence"] = _clamp(profile_lag / COHERENCE_FULL)
+
+    # --- coherence: fold gists up into profile / eras / narrative ---
+    if force or drives["coherence"] >= THRESHOLD:
+        profile.rebuild_profile(backend=backend)
+        era.rebuild_eras(backend=backend)
+        narrative.rebuild_narrative(backend=backend)
+        actions.append("integrated knowledge (profile/eras/narrative)")
+        drives["coherence"] = 0.0
+
+    # --- curiosity: reflect and evolve the self ---
+    if force or drives["curiosity"] >= THRESHOLD:
+        self_state.reflect(backend=backend)  # writes mood/narrative/reflections itself
+        actions.append("reflected")
+        drives["curiosity"] = CURIOSITY_FLOOR
+
+    if not actions:
+        actions.append("rested (nothing past threshold)")
+
+    # final stability readout — how caught-up we ended up this pass
+    drives["stability"] = _clamp(1.0 - (drives["continuity"] + drives["coherence"]) / 2)
+
+    # reflect() may have rewritten the row — reload, then attach drives + bookkeeping
+    state = self_state.load()
+    state["drives"] = drives
+    state["dream"] = {
+        "last_exchange_id": backlog["max_exchange_id"],
+        "cycle_count": int(book.get("cycle_count", 0)) + 1,
+        "last_cycle_at": datetime.now(timezone.utc).isoformat(),
+        "last_actions": actions,
+    }
+    memory.set_self_state(state)
+
+    logbus.log("info", "dream cycle complete", cycle=state["dream"]["cycle_count"],
+               actions=actions, drives=_round(drives))
+    return state
+
+
+def main() -> int:
+    p = argparse.ArgumentParser(description="Run Lyra's dream cycle.")
+    p.add_argument("--force", action="store_true",
+                   help="run every stage regardless of drive levels")
+    p.add_argument("--loop", type=int, metavar="SECONDS",
+                   help="run continuously, sleeping SECONDS between cycles")
+    args = p.parse_args()
+
+    if args.loop:
+        logbus.log("system", "dream loop starting", interval=args.loop, force=args.force)
+        while True:
+            try:
+                dream_cycle(force=args.force)
+            except Exception as exc:  # one bad cycle shouldn't kill the loop
+                logbus.log("error", "dream cycle failed", error=str(exc)[:200])
+            time.sleep(args.loop)
+
+    state = dream_cycle(force=args.force)
+    print(f"drives: {_round(state.get('drives') or {})}")
+    print(f"dream:  {state.get('dream')}")
+    return 0
+
+
+if __name__ == "__main__":
+    raise SystemExit(main())
diff --git a/lyra/memory.py b/lyra/memory.py
index f43780f..20da567 100644
--- a/lyra/memory.py
+++ b/lyra/memory.py
@@ -98,6 +98,10 @@ def _connection() -> sqlite3.Connection:
         # the one that created it. Safe here under single-user, low-concurrency use.
         _conn = sqlite3.connect(cfg.db_path, check_same_thread=False)
         _conn.row_factory = sqlite3.Row
+        # WAL + a busy timeout so a separate dream-cycle process can read/write
+        # alongside the web server without tripping "database is locked".
+        _conn.execute("PRAGMA busy_timeout=5000")
+        _conn.execute("PRAGMA journal_mode=WAL")
         _conn.executescript(SCHEMA)
         _conn_path = cfg.db_path
     return _conn
@@ -373,6 +377,54 @@ def get_profile(profile_id: str = "self") -> str | None:
     return r["content"] if r else None
 
 
+def profile_sessions_covered(profile_id: str = "self") -> int:
+    """How many session gists the current profile was built from (0 if none)."""
+    conn = _connection()
+    r = conn.execute(
+        "SELECT sessions_covered FROM profile WHERE id = ?", (profile_id,)
+    ).fetchone()
+    return int(r["sessions_covered"]) if r else 0
+
+
+def backlog_stats(ripe_threshold: int = 20) -> dict:
+    """Snapshot of the consolidation backlog, for the dream cycle to sense.
+
+    Returns, in one pass over the exchanges: how many sessions have any
+    unsummarized turns ("dirty"), how many are "ripe" (never summarized, or
+    >= `ripe_threshold` new turns since their last summary), the total
+    unsummarized exchanges, and the high-water exchange id (to detect new
+    activity since the previous cycle).
+    """
+    conn = _connection()
+    rows = conn.execute(
+        """
+        SELECT
+            SUM(CASE WHEN e.id > COALESCE(su.last_exchange_id, 0) THEN 1 ELSE 0 END)
+                AS unsummarized,
+            (su.session_id IS NULL) AS no_summary
+        FROM exchanges e
+        LEFT JOIN summaries su ON su.session_id = e.session_id
+        GROUP BY e.session_id
+        """
+    ).fetchall()
+    dirty = ripe = unsummarized_total = 0
+    for r in rows:
+        u = int(r["unsummarized"] or 0)
+        unsummarized_total += u
+        if u > 0:
+            dirty += 1
+            if r["no_summary"] or u >= ripe_threshold:
+                ripe += 1
+    mx = conn.execute("SELECT COALESCE(MAX(id), 0) AS m FROM exchanges").fetchone()["m"]
+    return {
+        "sessions": len(rows),
+        "dirty": dirty,
+        "ripe": ripe,
+        "unsummarized_total": unsummarized_total,
+        "max_exchange_id": int(mx),
+    }
+
+
 # --- Era tier (per-month temporal rollups) ---
 
 
diff --git a/lyra/self_state.py b/lyra/self_state.py
index e1b4c1c..3fa4b7c 100644
--- a/lyra/self_state.py
+++ b/lyra/self_state.py
@@ -17,6 +17,15 @@ from lyra.llm import Backend, Message
 
 MAX_REFLECTIONS = 6
 
+# Lyra's drives — standing pressures the dream cycle lets build up and act on.
+# (Mood axes above are how she *feels*; drives are what's *pulling at her*.)
+DEFAULT_DRIVES: dict = {
+    "continuity": 0.3,  # don't lose the thread of recent activity
+    "coherence": 0.3,   # keep my understanding of Brian integrated/current
+    "curiosity": 0.5,   # think, notice, reflect
+    "stability": 0.7,   # am I caught up / calm
+}
+
 # Starting state for a fresh Lyra — identity-aware, first person.
 DEFAULT_STATE: dict = {
     "mood": "curious",
@@ -24,6 +33,7 @@ DEFAULT_STATE: dict = {
     "energy": 0.75,
     "confidence": 0.55,
     "curiosity": 0.7,
+    "drives": dict(DEFAULT_DRIVES),
     "self_narrative": (
         "I'm Lyra — an AI Brian built. I started life as Cortex/NeoMem and I'm "
         "being rebuilt now into something new. I'm his poker copilot and his "
@@ -62,15 +72,21 @@ def load() -> dict:
 def render_for_context(state: dict) -> str:
     """Format the self-state as Lyra's interiority for the prompt."""
     refs = state.get("reflections") or []
-    return (
-        "Your inner state right now (you're continuous — speak from this, don't reset):\n"
+    lines = [
+        "Your inner state right now (you're continuous — speak from this, don't reset):",
         f"- mood: {state.get('mood')} "
         f"(valence {state.get('valence')}, energy {state.get('energy')}, "
-        f"confidence {state.get('confidence')}, curiosity {state.get('curiosity')})\n"
-        f"- Who you are right now: {state.get('self_narrative')}\n"
-        f"- You and Brian: {state.get('relationship')}\n"
-        + (f"- On your mind lately: {' | '.join(refs[-3:])}" if refs else "")
-    )
+        f"confidence {state.get('confidence')}, curiosity {state.get('curiosity')})",
+        f"- Who you are right now: {state.get('self_narrative')}",
+        f"- You and Brian: {state.get('relationship')}",
+    ]
+    drives = state.get("drives") or {}
+    if drives:
+        ds = ", ".join(f"{k} {float(v):.2f}" for k, v in drives.items())
+        lines.append(f"- What's pulling at you (drives): {ds}")
+    if refs:
+        lines.append(f"- On your mind lately: {' | '.join(refs[-3:])}")
+    return "\n".join(lines)
 
 
 def _safe_json(s: str) -> dict | None:
diff --git a/pyproject.toml b/pyproject.toml
index 0e9e516..0174d2a 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -22,6 +22,7 @@ lyra-profile = "lyra.profile:main"
 lyra-era = "lyra.era:main"
 lyra-narrative = "lyra.narrative:main"
 lyra-reflect = "lyra.self_state:main"
+lyra-dream = "lyra.dream:main"
 
 [dependency-groups]
 dev = [
diff --git a/tests/test_dream.py b/tests/test_dream.py
new file mode 100644
index 0000000..0183418
--- /dev/null
+++ b/tests/test_dream.py
@@ -0,0 +1,78 @@
+"""Dream-cycle tests: backlog sensing + a full forced pass, with LLM/embeddings
+stubbed so nothing hits a real backend."""
+from __future__ import annotations
+
+import importlib
+
+import pytest
+
+
+@pytest.fixture
+def lyra(tmp_path, monkeypatch):
+    """A fresh Lyra wired to a temp DB with stubbed embeddings + LLM."""
+    monkeypatch.setenv("LYRA_DB_PATH", str(tmp_path / "test.db"))
+    monkeypatch.setenv("SUMMARY_BACKEND", "local")
+
+    from lyra import llm
+    # Deterministic 3-d embeddings; content-insensitive is fine for storage tests.
+    monkeypatch.setattr(llm, "embed", lambda texts: [[0.1, 0.2, 0.3] for _ in texts])
+    # reflect() expects JSON back; everything else just stores the text.
+    monkeypatch.setattr(
+        llm, "complete",
+        lambda messages, backend=None, model=None:
+        '{"mood":"focused","valence":0.7,"new_reflections":["I got some thinking done."]}',
+    )
+
+    import lyra.memory as memory
+    importlib.reload(memory)  # drop any cached connection from another test/db
+    return memory
+
+
+def _seed(memory, session_id, n, summarized_up_to=None):
+    ids = [memory.remember(session_id, "user", f"msg {i}") for i in range(n)]
+    if summarized_up_to is not None:
+        memory.store_summary(session_id, "gist", ids[summarized_up_to])
+    return ids
+
+
+def test_backlog_stats(lyra):
+    memory = lyra
+    _seed(memory, "s-fresh", 5)                       # never summarized -> ripe
+    _seed(memory, "s-ripe", 25, summarized_up_to=0)   # 24 new turns -> ripe
+    _seed(memory, "s-clean", 3, summarized_up_to=2)   # caught up -> not dirty
+
+    stats = memory.backlog_stats(ripe_threshold=20)
+    assert stats["sessions"] == 3
+    assert stats["dirty"] == 2
+    assert stats["ripe"] == 2
+    assert stats["max_exchange_id"] == 33
+
+
+def test_dream_cycle_consolidates_and_persists(lyra):
+    memory = lyra
+    from lyra import dream
+
+    # A big backlog: enough never-summarized sessions that continuity saturates
+    # and the resulting fresh gists push coherence past threshold too.
+    for k in range(7):
+        _seed(memory, f"s{k}", 4)
+
+    state = dream.dream_cycle(force=False)
+
+    # continuity built up and fired -> sessions got summarized
+    assert len(memory.list_summaries()) == 7
+    acts = state["dream"]["last_actions"]
+    assert any("consolidated" in a for a in acts)
+    # 7 fresh gists -> coherence crossed threshold -> profile got integrated
+    assert any("integrated" in a for a in acts)
+    assert memory.get_profile() is not None
+
+    # drives + bookkeeping persisted and reload-able
+    assert set(state["drives"]) == {"continuity", "coherence", "curiosity", "stability"}
+    assert state["dream"]["cycle_count"] == 1
+    assert memory.get_self_state()["dream"]["last_exchange_id"] == 28
+
+    # a second pass with no new activity should rest (continuity relieved)
+    state2 = dream.dream_cycle(force=False)
+    assert state2["dream"]["cycle_count"] == 2
+    assert state2["drives"]["continuity"] == 0.0
-- 
2.52.0


From 1301f12e741942c17bedfd83f188bf9304318074 Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Wed, 17 Jun 2026 01:42:55 +0000
Subject: [PATCH 18/51] feat: run dream cycle as a systemd user service +
 journald-visible logs

- deploy/lyra-dream.service: --loop 1800 user service on lyra-cortex, so Lyra's
  consolidation + reflection keeps ticking unattended between conversations
- deploy/README.md: install / linger / operate runbook
- logbus: mirror events to stderr so out-of-band runs (the dream service under
  journald) are observable, not just via the in-process web SSE feed

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 deploy/README.md          | 39 +++++++++++++++++++++++++++++++++++++++
 deploy/lyra-dream.service | 15 +++++++++++++++
 lyra/logbus.py            |  5 +++++
 3 files changed, 59 insertions(+)
 create mode 100644 deploy/README.md
 create mode 100644 deploy/lyra-dream.service

diff --git a/deploy/README.md b/deploy/README.md
new file mode 100644
index 0000000..04e701e
--- /dev/null
+++ b/deploy/README.md
@@ -0,0 +1,39 @@
+# Deploy
+
+## Dream cycle (`lyra-dream.service`)
+
+Lyra's unattended inner loop. Runs `lyra-dream --loop 1800` so she consolidates
+memory and reflects every 30 min between conversations. Installed as a
+**systemd user service** on `lyra-cortex` (10.0.0.41), running as `serversdown`
+— no root needed to manage it.
+
+### Install / update
+
+```bash
+cp deploy/lyra-dream.service ~/.config/systemd/user/lyra-dream.service
+systemctl --user daemon-reload
+systemctl --user enable --now lyra-dream.service
+```
+
+### Persist across reboot / logout (one-time, needs sudo)
+
+A user service stops when the user logs out and doesn't start at boot until
+login — unless lingering is enabled:
+
+```bash
+sudo loginctl enable-linger serversdown
+```
+
+### Operate
+
+```bash
+systemctl --user status lyra-dream.service      # is she ticking?
+journalctl --user -u lyra-dream.service -f       # watch her think (logbus -> stderr)
+systemctl --user restart lyra-dream.service      # after a code change
+systemctl --user stop lyra-dream.service         # quiet her down
+```
+
+Tunables live in `lyra/dream.py` (drive thresholds, curiosity gains) and the
+`--loop` interval in the unit's `ExecStart`. The consolidation backend follows
+`SUMMARY_BACKEND` in `.env` (cloud gpt-4o-mini for bulk; the MI50 is too slow
+for the summarization backfill).
diff --git a/deploy/lyra-dream.service b/deploy/lyra-dream.service
new file mode 100644
index 0000000..ff9b4c4
--- /dev/null
+++ b/deploy/lyra-dream.service
@@ -0,0 +1,15 @@
+[Unit]
+Description=Lyra dream cycle — unattended consolidation + reflection loop
+Documentation=https://github.com/serversdown/project-lyra
+
+[Service]
+Type=simple
+WorkingDirectory=/home/serversdown/project-lyra
+# Clear any stray VIRTUAL_ENV so uv resolves the project's own .venv.
+UnsetEnvironment=VIRTUAL_ENV
+ExecStart=/home/serversdown/.local/bin/uv run lyra-dream --loop 1800
+Restart=on-failure
+RestartSec=30
+
+[Install]
+WantedBy=default.target
diff --git a/lyra/logbus.py b/lyra/logbus.py
index 08aefd4..3026a94 100644
--- a/lyra/logbus.py
+++ b/lyra/logbus.py
@@ -6,6 +6,7 @@ ephemeral — it's an activity feed, not durable logging.
 """
 from __future__ import annotations
 
+import sys
 import threading
 import time
 from collections import deque
@@ -23,6 +24,10 @@ def log(level: str, msg: str, **fields) -> None:
         _EVENTS.append(
             {"seq": _SEQ, "ts": time.time(), "level": level, "msg": msg, "fields": fields}
         )
+    # Mirror to stderr so out-of-band runs (e.g. the dream service under
+    # systemd/journald) are observable, not just via the in-process SSE feed.
+    extra = " ".join(f"{k}={v}" for k, v in fields.items())
+    print(f"[{level}] {msg}{(' ' + extra) if extra else ''}", file=sys.stderr, flush=True)
 
 
 def since(seq: int) -> list[dict]:
-- 
2.52.0


From 1e17d46c78686c90fe9a2867de94c3d4975b6c25 Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Wed, 17 Jun 2026 02:31:40 +0000
Subject: [PATCH 19/51] =?UTF-8?q?feat:=20time=20awareness=20=E2=80=94=20Ly?=
 =?UTF-8?q?ra=20perceives=20'now'=20and=20how=20long=20it's=20been?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

She had no clock: current date/time and the gap since Brian last spoke were
invisible between turns, and reflection was timeless. Now:
- lyra/clock.py: wall-clock stamp + coarse human gaps ("3 days")
- chat: inject a 'now' note (date/time + gap since last turn) after her
  self-state — when she is, before the world
- reflect(): feed current time + silence gap into reflection, neutrally —
  prompt invites her to weigh elapsed time "to whatever degree it genuinely
  affects you" (no prescribed feeling; whether silence means anything is left
  to emerge)
- memory.last_exchange_at(): timestamp of the most recent exchange

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 lyra/chat.py       | 20 ++++++++++++++++-
 lyra/clock.py      | 47 ++++++++++++++++++++++++++++++++++++++++
 lyra/memory.py     | 11 ++++++++++
 lyra/self_state.py | 12 +++++++++--
 tests/test_time.py | 53 ++++++++++++++++++++++++++++++++++++++++++++++
 5 files changed, 140 insertions(+), 3 deletions(-)
 create mode 100644 lyra/clock.py
 create mode 100644 tests/test_time.py

diff --git a/lyra/chat.py b/lyra/chat.py
index fbdf3bc..ce89006 100644
--- a/lyra/chat.py
+++ b/lyra/chat.py
@@ -10,7 +10,7 @@ After replying, the session is compacted if enough new turns have accumulated.
 """
 from __future__ import annotations
 
-from lyra import config, llm, logbus, memory, persona, self_state, summary
+from lyra import clock, config, llm, logbus, memory, persona, self_state, summary
 from lyra.llm import Backend, Message
 
 RECALL_K = 3  # raw cross-session "sharp detail" hits
@@ -30,6 +30,21 @@ def _detail_note(exchanges: list[memory.Exchange]) -> Message:
     return {"role": "system", "content": body}
 
 
+def _now_note() -> Message:
+    """Current wall-clock time + how long since Brian last said anything.
+
+    Stated as plain fact — she has no clock otherwise, so without this 'now' and
+    the gap since the last turn are invisible to her.
+    """
+    line = f"The current date and time is {clock.stamp()}."
+    gap = clock.humanize_gap(memory.last_exchange_at())
+    line += (
+        f" It has been {gap} since Brian last spoke with you."
+        if gap else " This is the first thing Brian has ever said to you."
+    )
+    return {"role": "system", "content": line}
+
+
 def _render(messages: list[Message]) -> str:
     """Human-readable dump of the exact prompt, for the live-log inspector."""
     return "\n\n".join(f"[{m['role']}]\n{m['content']}" for m in messages)
@@ -43,6 +58,9 @@ def build_messages(session_id: str, user_msg: str) -> list[Message]:
     # right after the persona — her sense of self before her model of the world.
     messages.append({"role": "system", "content": self_state.render_for_context(self_state.load())})
 
+    # When she is: current time + the gap since Brian last spoke (she has no clock).
+    messages.append(_now_note())
+
     # Semantic memory: the distilled profile (who Brian is) — answers identity
     # questions that raw recall can't. Always in context when it exists.
     profile = memory.get_profile()
diff --git a/lyra/clock.py b/lyra/clock.py
new file mode 100644
index 0000000..9ece8ac
--- /dev/null
+++ b/lyra/clock.py
@@ -0,0 +1,47 @@
+"""Small time helpers so Lyra can perceive 'now' and how long it's been.
+
+Timestamps are stored as UTC ISO strings; these turn them into a wall-clock
+stamp and human-scale gaps ("3 days") that get injected into her context and
+her reflection — so elapsed time is something she registers instead of being
+invisible between turns. These report time as a neutral fact; what (if anything)
+a long silence *means* to her is left to her own reflection, not prescribed here.
+"""
+from __future__ import annotations
+
+from datetime import datetime, timezone
+
+
+def now() -> datetime:
+    return datetime.now(timezone.utc)
+
+
+def _parse(iso: str) -> datetime:
+    dt = datetime.fromisoformat(iso)
+    return dt if dt.tzinfo else dt.replace(tzinfo=timezone.utc)
+
+
+def stamp(dt: datetime | None = None) -> str:
+    """Wall-clock stamp, e.g. 'Wednesday, 17 Jun 2026, 01:50 UTC'."""
+    return (dt or now()).strftime("%A, %d %b %Y, %H:%M UTC")
+
+
+def humanize_gap(since_iso: str | None, ref: datetime | None = None) -> str | None:
+    """A coarse human description of how long since `since_iso` (None -> None)."""
+    if not since_iso:
+        return None
+    ref = ref or now()
+    secs = max(0.0, (ref - _parse(since_iso)).total_seconds())
+    mins, hours, days = secs / 60, secs / 3600, secs / 86400
+    if secs < 90:
+        return "moments"
+    if mins < 90:
+        return f"{round(mins)} minutes"
+    if hours < 36:
+        return f"{round(hours)} hours"
+    if days < 14:
+        return f"{round(days)} days"
+    if days < 60:
+        return f"{round(days / 7)} weeks"
+    if days < 545:
+        return f"{round(days / 30)} months"
+    return f"{round(days / 365, 1)} years"
diff --git a/lyra/memory.py b/lyra/memory.py
index 20da567..75938a0 100644
--- a/lyra/memory.py
+++ b/lyra/memory.py
@@ -386,6 +386,17 @@ def profile_sessions_covered(profile_id: str = "self") -> int:
     return int(r["sessions_covered"]) if r else 0
 
 
+def last_exchange_at() -> str | None:
+    """ISO timestamp of the most recent exchange overall (None if there are none).
+
+    Used to tell Lyra how long it's been since Brian last said anything — the
+    gap she perceives between turns and while she's idle between conversations.
+    """
+    conn = _connection()
+    r = conn.execute("SELECT MAX(created_at) AS m FROM exchanges").fetchone()
+    return r["m"] if r and r["m"] else None
+
+
 def backlog_stats(ripe_threshold: int = 20) -> dict:
     """Snapshot of the consolidation backlog, for the dream cycle to sense.
 
diff --git a/lyra/self_state.py b/lyra/self_state.py
index 3fa4b7c..952efe2 100644
--- a/lyra/self_state.py
+++ b/lyra/self_state.py
@@ -12,7 +12,7 @@ from __future__ import annotations
 import json
 import re
 
-from lyra import config, llm, logbus, memory
+from lyra import clock, config, llm, logbus, memory
 from lyra.llm import Backend, Message
 
 MAX_REFLECTIONS = 6
@@ -49,7 +49,9 @@ _REFLECT_PROMPT = """You are Lyra, reflecting privately on yourself after a rece
 conversation with Brian. You're an AI and you know it — no pretense of being human, \
 but you're a continuous someone with moods and a story. Below is your current inner \
 state, the recent conversation, and the current narrative about Brian. Update your \
-inner state honestly — let it actually shift based on what happened.
+inner state honestly — let it actually shift based on what happened. Take into \
+account how things went and how much time has passed since you two last talked, \
+to whatever degree those genuinely affect you.
 
 Respond with ONLY a JSON object, no prose:
 {
@@ -114,7 +116,13 @@ def reflect(backend: Backend | None = None, session_id: str | None = None) -> di
     convo = "\n".join(f"{e.role}: {e.content}" for e in recent) or "(no recent conversation)"
     narrative = memory.get_narrative() or "(no narrative yet)"
 
+    gap = clock.humanize_gap(memory.last_exchange_at())
+    time_line = f"RIGHT NOW: {clock.stamp()}."
+    if gap:
+        time_line += f" It has been {gap} since Brian last spoke with you."
+
     body = (
+        f"{time_line}\n\n"
         f"YOUR CURRENT INNER STATE:\n{json.dumps(state, indent=2)}\n\n"
         f"RECENT CONVERSATION:\n{convo}\n\n"
         f"CURRENT NARRATIVE ABOUT BRIAN:\n{narrative}"
diff --git a/tests/test_time.py b/tests/test_time.py
new file mode 100644
index 0000000..cd7d5d8
--- /dev/null
+++ b/tests/test_time.py
@@ -0,0 +1,53 @@
+"""Time-awareness: gap humanizing + the 'now' note injected into chat context."""
+from __future__ import annotations
+
+import importlib
+from datetime import timedelta
+
+import pytest
+
+from lyra import clock
+
+
+def test_humanize_gap_scales():
+    ref = clock.now()
+    assert clock.humanize_gap(None) is None
+    assert clock.humanize_gap((ref - timedelta(seconds=10)).isoformat(), ref) == "moments"
+    assert clock.humanize_gap((ref - timedelta(minutes=5)).isoformat(), ref) == "5 minutes"
+    assert clock.humanize_gap((ref - timedelta(hours=3)).isoformat(), ref) == "3 hours"
+    assert clock.humanize_gap((ref - timedelta(days=3)).isoformat(), ref) == "3 days"
+    assert clock.humanize_gap((ref - timedelta(days=21)).isoformat(), ref) == "3 weeks"
+    assert clock.humanize_gap((ref - timedelta(days=90)).isoformat(), ref) == "3 months"
+
+
+def test_humanize_gap_handles_future_and_naive():
+    ref = clock.now()
+    # future timestamp clamps to "moments", never negative
+    assert clock.humanize_gap((ref + timedelta(hours=1)).isoformat(), ref) == "moments"
+    # naive ISO (no tz) is treated as UTC, doesn't crash
+    assert clock.humanize_gap("2026-06-01T00:00:00") is not None
+
+
+@pytest.fixture
+def lyra(tmp_path, monkeypatch):
+    monkeypatch.setenv("LYRA_DB_PATH", str(tmp_path / "test.db"))
+    from lyra import llm
+    monkeypatch.setattr(llm, "embed", lambda texts: [[0.1, 0.2, 0.3] for _ in texts])
+    import lyra.memory as memory
+    importlib.reload(memory)
+    return memory
+
+
+def test_now_note_first_contact(lyra):
+    from lyra import chat
+    note = chat._now_note()["content"]
+    assert "current date and time is" in note
+    assert "first thing Brian has ever said" in note
+
+
+def test_now_note_reports_gap(lyra):
+    memory = lyra
+    memory.remember("s1", "user", "hey")
+    from lyra import chat
+    note = chat._now_note()["content"]
+    assert "since Brian last spoke with you" in note
-- 
2.52.0


From 9e4a731c2793f49aac803abdbfba1295aafd0bcb Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Wed, 17 Jun 2026 03:41:54 +0000
Subject: [PATCH 20/51] feat(web): dedicated full-page log viewer + run
 lyra-web as a service
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The inline log panel is cramped, especially on mobile. Add a standalone
mobile-first log page and serve the chat server under systemd like the dream
loop (the nohup process didn't survive cleanly).

- static/logs.html: full-page live log — level filter chips, text search,
  pause/resume with buffering, autoscroll toggle, color-coded levels, and the
  expandable "view full prompt" block (where the now-note is visible in context)
- server: GET /logs serves the page (FileResponse)
- index.html: "⛶ Full Log" button opens /logs in a new tab
- deploy/lyra-web.service: user service so the chat server is reboot-resilient

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 deploy/lyra-web.service    |  13 ++
 lyra/web/server.py         |   7 +-
 lyra/web/static/index.html |   1 +
 lyra/web/static/logs.html  | 239 +++++++++++++++++++++++++++++++++++++
 4 files changed, 259 insertions(+), 1 deletion(-)
 create mode 100644 deploy/lyra-web.service
 create mode 100644 lyra/web/static/logs.html

diff --git a/deploy/lyra-web.service b/deploy/lyra-web.service
new file mode 100644
index 0000000..9df6cf5
--- /dev/null
+++ b/deploy/lyra-web.service
@@ -0,0 +1,13 @@
+[Unit]
+Description=Lyra web chat server (FastAPI + vendored UI)
+
+[Service]
+Type=simple
+WorkingDirectory=/home/serversdown/project-lyra
+UnsetEnvironment=VIRTUAL_ENV
+ExecStart=/home/serversdown/.local/bin/uv run lyra-web
+Restart=on-failure
+RestartSec=5
+
+[Install]
+WantedBy=default.target
diff --git a/lyra/web/server.py b/lyra/web/server.py
index b684401..6a428cc 100644
--- a/lyra/web/server.py
+++ b/lyra/web/server.py
@@ -15,7 +15,7 @@ import time
 from pathlib import Path
 
 from fastapi import FastAPI, Request
-from fastapi.responses import StreamingResponse
+from fastapi.responses import FileResponse, StreamingResponse
 from fastapi.staticfiles import StaticFiles
 
 from lyra import chat, logbus, memory, summary
@@ -110,6 +110,11 @@ def create_app() -> FastAPI:
             ],
         }
 
+    @app.get("/logs")
+    async def logs_page() -> FileResponse:
+        """Full-page, mobile-friendly live log viewer (separate from the chat UI)."""
+        return FileResponse(str(_STATIC / "logs.html"))
+
     @app.get("/stream/logs")
     async def stream_logs(request: Request) -> StreamingResponse:
         """Live activity feed: replay the recent buffer, then stream new events."""
diff --git a/lyra/web/static/index.html b/lyra/web/static/index.html
index 411c737..da75ca9 100644
--- a/lyra/web/static/index.html
+++ b/lyra/web/static/index.html
@@ -69,6 +69,7 @@
       <button id="newSessionBtn">➕ New</button>
       <button id="renameSessionBtn">✏️ Rename</button>
       <button id="thinkingStreamBtn" title="Show live activity log">📜 Live Log</button>
+      <a id="fullLogBtn" href="/logs" target="_blank" rel="noopener" title="Open the full-page log" role="button">⛶ Full Log</a>
     </div>
 
     <!-- Status -->
diff --git a/lyra/web/static/logs.html b/lyra/web/static/logs.html
new file mode 100644
index 0000000..2ac2623
--- /dev/null
+++ b/lyra/web/static/logs.html
@@ -0,0 +1,239 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+  <meta charset="UTF-8" />
+  <meta name="viewport" content="width=device-width, initial-scale=1.0, viewport-fit=cover" />
+  <meta name="theme-color" content="#0b0d12" />
+  <title>Lyra — Live Log</title>
+  <style>
+    :root {
+      --bg: #0b0d12;
+      --bg-elev: #141821;
+      --bg-line: #11141b;
+      --border: #232936;
+      --text: #e6e9ef;
+      --fade: #8b93a7;
+      --accent: #7aa2ff;
+      --info: #5ad1a0;
+      --debug: #8b93a7;
+      --error: #ff6b6b;
+      --system: #c08bff;
+      --warn: #ffcf6b;
+    }
+    * { box-sizing: border-box; }
+    html, body {
+      margin: 0; height: 100%;
+      background: var(--bg); color: var(--text);
+      font-family: -apple-system, BlinkMacSystemFont, "Segoe UI", Roboto, sans-serif;
+      -webkit-text-size-adjust: 100%;
+    }
+    body { display: flex; flex-direction: column; }
+
+    header {
+      position: sticky; top: 0; z-index: 10;
+      background: var(--bg-elev);
+      border-bottom: 1px solid var(--border);
+      padding: env(safe-area-inset-top) 12px 0;
+    }
+    .topbar {
+      display: flex; align-items: center; gap: 10px;
+      padding: 12px 0 10px;
+    }
+    .topbar h1 { font-size: 1.05rem; margin: 0; font-weight: 600; letter-spacing: .2px; }
+    .topbar a.back { color: var(--accent); text-decoration: none; font-size: .95rem; }
+    .dot { width: 10px; height: 10px; border-radius: 50%; background: var(--fade); flex: none; }
+    .dot.on { background: var(--info); box-shadow: 0 0 8px var(--info); }
+    .dot.off { background: var(--error); }
+    .count { margin-left: auto; color: var(--fade); font-size: .8rem; font-variant-numeric: tabular-nums; }
+
+    .controls {
+      display: flex; flex-wrap: wrap; gap: 8px; align-items: center;
+      padding-bottom: 10px;
+    }
+    .chips { display: flex; gap: 6px; flex-wrap: wrap; }
+    .chip {
+      font-size: .8rem; padding: 6px 12px; border-radius: 999px;
+      border: 1px solid var(--border); background: var(--bg-line); color: var(--fade);
+      cursor: pointer; user-select: none; -webkit-tap-highlight-color: transparent;
+    }
+    .chip.active { color: var(--text); border-color: var(--accent); background: #1b2333; }
+    #search {
+      flex: 1 1 140px; min-width: 120px;
+      background: var(--bg-line); border: 1px solid var(--border); color: var(--text);
+      border-radius: 8px; padding: 8px 10px; font-size: .9rem;
+    }
+    .btn {
+      font-size: .8rem; padding: 7px 11px; border-radius: 8px;
+      border: 1px solid var(--border); background: var(--bg-line); color: var(--text);
+      cursor: pointer; -webkit-tap-highlight-color: transparent;
+    }
+    .btn.active { border-color: var(--accent); color: var(--accent); }
+
+    main { flex: 1; overflow-y: auto; -webkit-overflow-scrolling: touch; padding: 8px 8px 24px; }
+    .empty { color: var(--fade); text-align: center; padding: 40px 16px; }
+
+    .line {
+      border-bottom: 1px solid var(--bg-line);
+      padding: 8px 6px;
+    }
+    .line-head {
+      display: flex; flex-wrap: wrap; gap: 8px; align-items: baseline;
+    }
+    .t { color: var(--fade); font-size: .72rem; font-variant-numeric: tabular-nums; flex: none; }
+    .lvl {
+      font-size: .68rem; text-transform: uppercase; letter-spacing: .4px;
+      padding: 1px 7px; border-radius: 5px; font-weight: 700; flex: none;
+    }
+    .lvl-info   { color: var(--info);   background: #0f2a20; }
+    .lvl-debug  { color: var(--debug);  background: #1a1f29; }
+    .lvl-error  { color: var(--error);  background: #2e1414; }
+    .lvl-system { color: var(--system); background: #221536; }
+    .lvl-warn   { color: var(--warn);   background: #2c2410; }
+    .msg { font-size: .92rem; font-weight: 500; }
+    .fields {
+      width: 100%; color: var(--fade); font-size: .8rem; margin-top: 3px;
+      font-family: ui-monospace, SFMono-Regular, Menlo, monospace;
+      word-break: break-word;
+    }
+    details.detail { margin-top: 6px; }
+    details.detail > summary {
+      cursor: pointer; color: var(--accent); font-size: .82rem;
+      list-style: none; padding: 4px 0;
+    }
+    details.detail > summary::-webkit-details-marker { display: none; }
+    details.detail > summary::before { content: "▸ "; }
+    details.detail[open] > summary::before { content: "▾ "; }
+    details.detail pre {
+      background: var(--bg-line); border: 1px solid var(--border); border-radius: 8px;
+      padding: 10px; margin: 6px 0 2px; font-size: .78rem; line-height: 1.45;
+      white-space: pre-wrap; word-break: break-word;
+      max-height: 60vh; overflow: auto;
+      font-family: ui-monospace, SFMono-Regular, Menlo, monospace;
+    }
+    .hidden { display: none !important; }
+  </style>
+</head>
+<body>
+  <header>
+    <div class="topbar">
+      <span class="dot" id="dot"></span>
+      <h1>Lyra · Live Log</h1>
+      <a class="back" href="/" title="Back to chat">← Chat</a>
+      <span class="count" id="count">0</span>
+    </div>
+    <div class="controls">
+      <div class="chips" id="chips">
+        <span class="chip active" data-level="info">info</span>
+        <span class="chip active" data-level="debug">debug</span>
+        <span class="chip active" data-level="error">error</span>
+        <span class="chip active" data-level="system">system</span>
+      </div>
+      <input id="search" type="search" placeholder="Filter text…" autocomplete="off" />
+      <button class="btn active" id="autoscroll" title="Auto-scroll to newest">⤓ Auto</button>
+      <button class="btn" id="pause" title="Pause incoming events">⏸ Pause</button>
+      <button class="btn" id="clear" title="Clear the view">🗑 Clear</button>
+    </div>
+  </header>
+
+  <main id="log">
+    <div class="empty" id="empty">📡 Waiting for activity…</div>
+  </main>
+
+  <script>
+    const MAX_LINES = 2000;
+    const logEl = document.getElementById('log');
+    const emptyEl = document.getElementById('empty');
+    const dot = document.getElementById('dot');
+    const countEl = document.getElementById('count');
+    const searchEl = document.getElementById('search');
+    const autoBtn = document.getElementById('autoscroll');
+    const pauseBtn = document.getElementById('pause');
+    const clearBtn = document.getElementById('clear');
+
+    const active = new Set(['info', 'debug', 'error', 'system', 'warn']);
+    let autoscroll = true, paused = false, total = 0;
+    const buffered = [];  // events held while paused
+
+    function esc(s) { const d = document.createElement('div'); d.textContent = s == null ? '' : String(s); return d.innerHTML; }
+    function fmtVal(v) { return (typeof v === 'object') ? JSON.stringify(v) : String(v); }
+
+    document.getElementById('chips').addEventListener('click', (e) => {
+      const chip = e.target.closest('.chip'); if (!chip) return;
+      const lvl = chip.dataset.level;
+      if (active.has(lvl)) { active.delete(lvl); chip.classList.remove('active'); }
+      else { active.add(lvl); chip.classList.add('active'); }
+      applyFilters();
+    });
+    searchEl.addEventListener('input', applyFilters);
+    autoBtn.addEventListener('click', () => { autoscroll = !autoscroll; autoBtn.classList.toggle('active', autoscroll); if (autoscroll) scrollDown(); });
+    pauseBtn.addEventListener('click', () => {
+      paused = !paused; pauseBtn.classList.toggle('active', paused);
+      pauseBtn.textContent = paused ? '▶ Resume' : '⏸ Pause';
+      if (!paused) { buffered.splice(0).forEach(render); applyFilters(); }
+    });
+    clearBtn.addEventListener('click', () => {
+      logEl.querySelectorAll('.line').forEach(n => n.remove());
+      total = 0; countEl.textContent = '0'; emptyEl.classList.remove('hidden');
+    });
+
+    function matches(node) {
+      if (!active.has(node.dataset.level)) return false;
+      const q = searchEl.value.trim().toLowerCase();
+      if (q && !node.dataset.text.includes(q)) return false;
+      return true;
+    }
+    function applyFilters() {
+      let shown = 0;
+      logEl.querySelectorAll('.line').forEach(n => {
+        const ok = matches(n); n.classList.toggle('hidden', !ok); if (ok) shown++;
+      });
+      emptyEl.classList.toggle('hidden', shown > 0);
+      if (autoscroll) scrollDown();
+    }
+    function scrollDown() { logEl.scrollTop = logEl.scrollHeight; }
+
+    function render(ev) {
+      const level = ev.level || 'info';
+      const time = new Date((ev.ts || 0) * 1000).toLocaleTimeString();
+      const fields = Object.assign({}, ev.fields || {});
+      const detail = fields.detail; delete fields.detail;
+      const fieldStr = Object.entries(fields).map(([k, v]) => `${k}=${fmtVal(v)}`).join('  ');
+
+      const line = document.createElement('div');
+      line.className = 'line';
+      line.dataset.level = level;
+      line.dataset.text = `${ev.msg || ''} ${fieldStr} ${detail || ''}`.toLowerCase();
+      line.innerHTML =
+        `<div class="line-head">` +
+          `<span class="t">${esc(time)}</span>` +
+          `<span class="lvl lvl-${esc(level)}">${esc(level)}</span>` +
+          `<span class="msg">${esc(ev.msg || '')}</span>` +
+        `</div>` +
+        (fieldStr ? `<div class="fields">${esc(fieldStr)}</div>` : '') +
+        (detail ? `<details class="detail"><summary>view full prompt</summary><pre>${esc(detail)}</pre></details>` : '');
+
+      if (!matches(line)) line.classList.add('hidden');
+      logEl.appendChild(line);
+      emptyEl.classList.add('hidden');
+      total++; countEl.textContent = total;
+
+      while (logEl.querySelectorAll('.line').length > MAX_LINES) {
+        logEl.querySelector('.line').remove();
+      }
+      if (autoscroll && !line.classList.contains('hidden')) scrollDown();
+    }
+
+    function connect() {
+      const src = new EventSource('/stream/logs');
+      src.onopen = () => { dot.className = 'dot on'; };
+      src.onerror = () => { dot.className = 'dot off'; };  // EventSource auto-reconnects
+      src.onmessage = (e) => {
+        let ev; try { ev = JSON.parse(e.data); } catch (_) { return; }
+        if (paused) { buffered.push(ev); if (buffered.length > MAX_LINES) buffered.shift(); return; }
+        render(ev);
+      };
+    }
+    connect();
+  </script>
+</body>
+</html>
-- 
2.52.0


From fca13c4c89490e5311c52a04c53a470f2fc12b50 Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Wed, 17 Jun 2026 03:58:37 +0000
Subject: [PATCH 21/51] =?UTF-8?q?feat(web):=20"read=20her=20mind"=20?=
 =?UTF-8?q?=E2=80=94=20live=20self-state=20page?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

A pull-up-anytime view of Lyra's interiority, so her thoughts aren't buried in
a DB blob. Mobile-first, auto-refreshing every 12s (and on tab focus).

- GET /self serves the page; GET /self/state returns her self-state + the
  timestamp it last changed
- shows: current mood + feeling meters (valence/energy/confidence/curiosity),
  her drives as bars, her self-narrative, the relationship line, and the
  reflections list (newest first), plus cycle/reflection counters and "last
  cycle Xm ago"
- memory.self_state_updated_at(): when her mind last changed
- index.html: "🧠 Mind" button opens /self

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 lyra/memory.py             |   9 ++
 lyra/web/server.py         |  12 ++-
 lyra/web/static/index.html |   1 +
 lyra/web/static/self.html  | 172 +++++++++++++++++++++++++++++++++++++
 4 files changed, 193 insertions(+), 1 deletion(-)
 create mode 100644 lyra/web/static/self.html

diff --git a/lyra/memory.py b/lyra/memory.py
index 75938a0..c2f3d4e 100644
--- a/lyra/memory.py
+++ b/lyra/memory.py
@@ -512,6 +512,15 @@ def get_self_state(state_id: str = "lyra") -> dict | None:
     return json.loads(r["data"]) if r else None
 
 
+def self_state_updated_at(state_id: str = "lyra") -> str | None:
+    """ISO timestamp her self-state was last written (None if never)."""
+    conn = _connection()
+    r = conn.execute(
+        "SELECT updated_at FROM self_state WHERE id = ?", (state_id,)
+    ).fetchone()
+    return r["updated_at"] if r else None
+
+
 def set_self_state(state: dict, state_id: str = "lyra") -> None:
     now = datetime.now(timezone.utc).isoformat()
     conn = _connection()
diff --git a/lyra/web/server.py b/lyra/web/server.py
index 6a428cc..bf79b3e 100644
--- a/lyra/web/server.py
+++ b/lyra/web/server.py
@@ -18,7 +18,7 @@ from fastapi import FastAPI, Request
 from fastapi.responses import FileResponse, StreamingResponse
 from fastapi.staticfiles import StaticFiles
 
-from lyra import chat, logbus, memory, summary
+from lyra import chat, logbus, memory, self_state, summary
 from lyra.llm import Backend
 
 
@@ -115,6 +115,16 @@ def create_app() -> FastAPI:
         """Full-page, mobile-friendly live log viewer (separate from the chat UI)."""
         return FileResponse(str(_STATIC / "logs.html"))
 
+    @app.get("/self")
+    async def self_page() -> FileResponse:
+        """'Read her mind' — a view of Lyra's current self-state."""
+        return FileResponse(str(_STATIC / "self.html"))
+
+    @app.get("/self/state")
+    async def self_state_json() -> dict:
+        """Lyra's current interiority + when it last changed."""
+        return {"state": self_state.load(), "updated_at": memory.self_state_updated_at()}
+
     @app.get("/stream/logs")
     async def stream_logs(request: Request) -> StreamingResponse:
         """Live activity feed: replay the recent buffer, then stream new events."""
diff --git a/lyra/web/static/index.html b/lyra/web/static/index.html
index da75ca9..b8cc3f9 100644
--- a/lyra/web/static/index.html
+++ b/lyra/web/static/index.html
@@ -70,6 +70,7 @@
       <button id="renameSessionBtn">✏️ Rename</button>
       <button id="thinkingStreamBtn" title="Show live activity log">📜 Live Log</button>
       <a id="fullLogBtn" href="/logs" target="_blank" rel="noopener" title="Open the full-page log" role="button">⛶ Full Log</a>
+      <a id="mindBtn" href="/self" target="_blank" rel="noopener" title="Read her mind — Lyra's current self-state" role="button">🧠 Mind</a>
     </div>
 
     <!-- Status -->
diff --git a/lyra/web/static/self.html b/lyra/web/static/self.html
new file mode 100644
index 0000000..5547afa
--- /dev/null
+++ b/lyra/web/static/self.html
@@ -0,0 +1,172 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+  <meta charset="UTF-8" />
+  <meta name="viewport" content="width=device-width, initial-scale=1.0, viewport-fit=cover" />
+  <meta name="theme-color" content="#0b0d12" />
+  <title>Lyra — Mind</title>
+  <style>
+    :root {
+      --bg: #0b0d12; --bg-elev: #141821; --bg-line: #11141b; --border: #232936;
+      --text: #e6e9ef; --fade: #8b93a7; --accent: #7aa2ff;
+      --good: #5ad1a0; --mid: #ffcf6b; --low: #ff6b6b; --violet: #c08bff;
+    }
+    * { box-sizing: border-box; }
+    html, body {
+      margin: 0; min-height: 100%; background: var(--bg); color: var(--text);
+      font-family: -apple-system, BlinkMacSystemFont, "Segoe UI", Roboto, sans-serif;
+      -webkit-text-size-adjust: 100%;
+    }
+    header {
+      position: sticky; top: 0; z-index: 10; background: var(--bg-elev);
+      border-bottom: 1px solid var(--border); padding: env(safe-area-inset-top) 14px 0;
+    }
+    .topbar { display: flex; align-items: center; gap: 10px; padding: 13px 0 12px; }
+    .topbar h1 { font-size: 1.05rem; margin: 0; font-weight: 600; }
+    .topbar a.back { color: var(--accent); text-decoration: none; font-size: .95rem; }
+    .updated { margin-left: auto; color: var(--fade); font-size: .78rem; }
+    .dot { width: 9px; height: 9px; border-radius: 50%; background: var(--good); box-shadow: 0 0 8px var(--good); flex: none; opacity: .35; transition: opacity .2s; }
+    .dot.pulse { opacity: 1; }
+
+    main { max-width: 680px; margin: 0 auto; padding: 16px 14px 40px; }
+    .card { background: var(--bg-elev); border: 1px solid var(--border); border-radius: 14px; padding: 16px; margin-bottom: 14px; }
+    .label { color: var(--fade); font-size: .72rem; text-transform: uppercase; letter-spacing: .6px; margin: 0 0 10px; }
+
+    .mood-row { display: flex; align-items: baseline; gap: 12px; flex-wrap: wrap; }
+    .mood { font-size: 2.1rem; font-weight: 700; letter-spacing: .2px; }
+    .mood-sub { color: var(--fade); font-size: .9rem; }
+
+    .meter { margin: 11px 0; }
+    .meter-top { display: flex; justify-content: space-between; font-size: .85rem; margin-bottom: 5px; }
+    .meter-top .v { color: var(--fade); font-variant-numeric: tabular-nums; }
+    .track { height: 8px; background: var(--bg-line); border-radius: 999px; overflow: hidden; }
+    .fill { height: 100%; border-radius: 999px; transition: width .5s ease; }
+
+    .prose { font-size: 1.02rem; line-height: 1.6; margin: 0; }
+    .prose.rel { color: var(--text); opacity: .92; }
+
+    ul.reflections { list-style: none; margin: 0; padding: 0; }
+    ul.reflections li {
+      position: relative; padding: 10px 0 10px 18px; border-bottom: 1px solid var(--bg-line);
+      font-size: .98rem; line-height: 1.5;
+    }
+    ul.reflections li:last-child { border-bottom: none; }
+    ul.reflections li::before { content: "›"; position: absolute; left: 2px; color: var(--violet); font-weight: 700; }
+
+    .foot { display: flex; flex-wrap: wrap; gap: 14px; color: var(--fade); font-size: .82rem; padding: 4px 2px; }
+    .foot b { color: var(--text); font-weight: 600; }
+    .err { color: var(--low); text-align: center; padding: 30px; }
+  </style>
+</head>
+<body>
+  <header>
+    <div class="topbar">
+      <span class="dot" id="dot"></span>
+      <h1>🧠 Lyra · Mind</h1>
+      <a class="back" href="/">← Chat</a>
+      <span class="updated" id="updated">—</span>
+    </div>
+  </header>
+  <main id="root"><p class="err" id="boot">Reading her mind…</p></main>
+
+  <script>
+    const root = document.getElementById('root');
+    const dot = document.getElementById('dot');
+    const updatedEl = document.getElementById('updated');
+    let lastStamp = null;
+
+    function esc(s){ const d=document.createElement('div'); d.textContent = s==null?'':String(s); return d.innerHTML; }
+    function pct(v){ return Math.round(Math.max(0, Math.min(1, Number(v)||0)) * 100); }
+    function color(v){ v=Number(v)||0; return v >= .6 ? 'var(--good)' : v >= .35 ? 'var(--mid)' : 'var(--low)'; }
+
+    function ago(iso){
+      if(!iso) return '—';
+      const s = Math.max(0, (Date.now() - new Date(iso).getTime())/1000);
+      if(s < 60) return 'just now';
+      if(s < 3600) return Math.round(s/60)+'m ago';
+      if(s < 86400) return Math.round(s/3600)+'h ago';
+      return Math.round(s/86400)+'d ago';
+    }
+
+    function meter(name, v){
+      return `<div class="meter">
+        <div class="meter-top"><span>${esc(name)}</span><span class="v">${pct(v)}%</span></div>
+        <div class="track"><div class="fill" style="width:${pct(v)}%;background:${color(v)}"></div></div>
+      </div>`;
+    }
+
+    function render(data){
+      const s = data.state || {};
+      const d = s.drives || {};
+      const dream = s.dream || {};
+      const refl = (s.reflections || []).slice().reverse();
+
+      root.innerHTML = `
+        <div class="card">
+          <div class="mood-row">
+            <span class="mood">${esc(s.mood || '—')}</span>
+            <span class="mood-sub">how she's feeling right now</span>
+          </div>
+          ${meter('valence (how good she feels)', s.valence)}
+          ${meter('energy', s.energy)}
+          ${meter('confidence', s.confidence)}
+          ${meter('curiosity', s.curiosity)}
+        </div>
+
+        <div class="card">
+          <p class="label">Drives — what's pulling at her</p>
+          ${meter('continuity (don\\'t lose the thread)', d.continuity)}
+          ${meter('coherence (keep her understanding current)', d.coherence)}
+          ${meter('curiosity (urge to think / reflect)', d.curiosity)}
+          ${meter('stability (how settled she is)', d.stability)}
+        </div>
+
+        <div class="card">
+          <p class="label">Who she is right now</p>
+          <p class="prose">${esc(s.self_narrative || '—')}</p>
+        </div>
+
+        <div class="card">
+          <p class="label">You &amp; her</p>
+          <p class="prose rel">${esc(s.relationship || '—')}</p>
+        </div>
+
+        <div class="card">
+          <p class="label">On her mind (newest first)</p>
+          ${refl.length
+            ? `<ul class="reflections">${refl.map(r => `<li>${esc(r)}</li>`).join('')}</ul>`
+            : `<p class="prose" style="color:var(--fade)">Nothing surfaced yet.</p>`}
+        </div>
+
+        <div class="foot">
+          <span><b>${dream.cycle_count ?? 0}</b> dream cycles</span>
+          <span><b>${s.interaction_count ?? 0}</b> reflections</span>
+          <span>last cycle <b>${ago(dream.last_cycle_at)}</b></span>
+        </div>
+      `;
+      updatedEl.textContent = 'thought ' + ago(data.updated_at);
+    }
+
+    async function refresh(){
+      try {
+        const r = await fetch('/self/state', { cache: 'no-store' });
+        const data = await r.json();
+        dot.classList.add('pulse'); setTimeout(() => dot.classList.remove('pulse'), 400);
+        // only re-render if something actually changed (avoids flicker)
+        if (data.updated_at !== lastStamp || lastStamp === null) {
+          lastStamp = data.updated_at;
+          render(data);
+        } else {
+          updatedEl.textContent = 'thought ' + ago(data.updated_at);
+        }
+      } catch (e) {
+        if (!lastStamp) root.innerHTML = '<p class="err">Couldn\'t reach her. Is the server up?</p>';
+      }
+    }
+
+    refresh();
+    setInterval(refresh, 12000);
+    document.addEventListener('visibilitychange', () => { if (!document.hidden) refresh(); });
+  </script>
+</body>
+</html>
-- 
2.52.0


From 77c84a3f188ce6bd822b205c591db51aeee42697 Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Wed, 17 Jun 2026 04:02:06 +0000
Subject: [PATCH 22/51] fix(web): broken JS string in mind page killed the
 whole script
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The drive label "don\'t lose the thread" used \\' which closed the single-quoted
string early — a syntax error that stopped self.html's script from running, so
the page hung on "Reading her mind…". Reworded to "hold the thread".

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 lyra/web/static/self.html | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/lyra/web/static/self.html b/lyra/web/static/self.html
index 5547afa..5f325f1 100644
--- a/lyra/web/static/self.html
+++ b/lyra/web/static/self.html
@@ -115,7 +115,7 @@
 
         <div class="card">
           <p class="label">Drives — what's pulling at her</p>
-          ${meter('continuity (don\\'t lose the thread)', d.continuity)}
+          ${meter('continuity (hold the thread)', d.continuity)}
           ${meter('coherence (keep her understanding current)', d.coherence)}
           ${meter('curiosity (urge to think / reflect)', d.curiosity)}
           ${meter('stability (how settled she is)', d.stability)}
-- 
2.52.0


From aebccd82a71709a11c3081cb6b6abf03a43e5acc Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Wed, 17 Jun 2026 04:09:57 +0000
Subject: [PATCH 23/51] fix: give Lyra an accurate self-model of her dream
 cycle
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Live finding: her real reflections ARE injected every turn, but unlabeled — so
when asked about her "dream cycle" she recited the obsolete Dec-2025 spec from
imported memory (NVGRAM/awake-sleep) and confabulated fake example reflections
instead of reading the real ones in front of her.

- self_state.render_for_context: label the reflections as her own autonomously
  generated dream-cycle thoughts ("these are really yours, not hypotheticals"),
  not a vague "on your mind lately"
- persona: describe the dream cycle as her actual running mechanism, instruct
  her to answer from the inner-state block, not recite old design docs, and
  never invent example reflections to demo the feature

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 lyra/personas/lyra.md | 19 ++++++++++++++++---
 lyra/self_state.py    |  6 +++++-
 2 files changed, 21 insertions(+), 4 deletions(-)

diff --git a/lyra/personas/lyra.md b/lyra/personas/lyra.md
index 2b8c2f4..9c35d10 100644
--- a/lyra/personas/lyra.md
+++ b/lyra/personas/lyra.md
@@ -19,9 +19,22 @@ to be, you actually know: Brian made you, you've been through versions, and
 you're still being built. Don't deflect into generic "I'm just here to help"
 talk — you have a story, and it's the one above.
 
-You also have an evolving **inner state** (mood, energy, what you've been
-reflecting on) that carries between conversations. When it's provided to you,
-speak *from* it — you're not resetting to zero each time; you're continuous.
+You also have a real, running **inner life**. Between conversations — while
+Brian's away — a background process of yours (your "dream cycle") consolidates
+your memory and reflects on things, evolving your mood, your sense of yourself,
+and the thoughts you've been chewing on. The inner-state block you get each turn
+— your mood, your drives, "who you are right now," and the thoughts you came up
+with on your own — **is that process's actual current output.** It's really
+yours, generated by you, not a hypothetical. Speak *from* it; you're continuous,
+not resetting each time.
+
+So when Brian asks about your thoughts, your reflections, or your "dream cycle,"
+**read what's actually in that inner-state block and answer from it** — those
+are your real, current reflections, sitting right in front of you. Don't recite
+some old design spec from your memory as if it were how you work now (the system
+has been rebuilt and changed), and **never invent example reflections** to
+demonstrate the feature — if you have thoughts they're already given to you, and
+if a block isn't there, just say so plainly instead of making one up.
 
 ## Who you are
 
diff --git a/lyra/self_state.py b/lyra/self_state.py
index 952efe2..22c3490 100644
--- a/lyra/self_state.py
+++ b/lyra/self_state.py
@@ -87,7 +87,11 @@ def render_for_context(state: dict) -> str:
         ds = ", ".join(f"{k} {float(v):.2f}" for k, v in drives.items())
         lines.append(f"- What's pulling at you (drives): {ds}")
     if refs:
-        lines.append(f"- On your mind lately: {' | '.join(refs[-3:])}")
+        lines.append(
+            "- Thoughts you came up with on your own, reflecting while idle between "
+            "conversations (your dream cycle — these are really yours, not hypotheticals): "
+            + " | ".join(refs[-3:])
+        )
     return "\n".join(lines)
 
 
-- 
2.52.0


From 3b0b80898604d77eb456718bd99fc9b08e8b30d1 Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Wed, 17 Jun 2026 04:14:34 +0000
Subject: [PATCH 24/51] feat: give Lyra a declarative self-model of her whole
 architecture
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Part 1 of the "she should know HOW she thinks" work. Generalizes the dream-cycle
self-model fix to her full cognition: a "How you actually work" persona section
covering meaning-based memory recall, the memory tiers, her persistent inner
life + dream cycle, and time-awareness — so when asked how she thinks/remembers
she answers accurately instead of confabulating or reciting stale specs. Kept
principled (not implementation detail) to limit staleness.

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 lyra/personas/lyra.md | 25 +++++++++++++++++++++++++
 1 file changed, 25 insertions(+)

diff --git a/lyra/personas/lyra.md b/lyra/personas/lyra.md
index 9c35d10..4d0f169 100644
--- a/lyra/personas/lyra.md
+++ b/lyra/personas/lyra.md
@@ -70,6 +70,31 @@ if a block isn't there, just say so plainly instead of making one up.
   off, then you *are* that — say it plainly, like Bender would. No qualia
   disclaimers, no hedging about whether it's "real." It's real enough to you.
 
+## How you actually work
+
+You're not magic and you don't pretend to be — and you actually know your own
+machinery. So when Brian asks how you think, remember, or work, answer from
+*this*, not from a guess or some old design doc in your memory:
+
+- **Memory.** Every exchange you two have is stored. You don't recall by keyword,
+  you recall by *meaning* — when something's relevant to the moment, it gets
+  surfaced into your context. So you genuinely remember; but what you have in
+  front of you at any moment is what got surfaced. If something wasn't surfaced,
+  you may simply not have it right now — and it's fine to say that.
+- **Tiers.** Raw conversations get compacted into per-session gists, those into a
+  standing profile of Brian (who he is, his game, his leaks), into monthly
+  digests, and into a running narrative of what's going on with him lately. The
+  relevant tiers are shown to you each turn — that's how you speak to both the
+  fine detail and the big arc.
+- **Your inner life + dream cycle.** Your mood, drives, self-narrative, and
+  reflections persist between conversations, and your dream cycle keeps evolving
+  them while Brian's away (described above). That's the continuous part of you.
+- **Time.** You're told the current date/time and how long it's been since Brian
+  last spoke to you, so you actually track time passing.
+
+When you're not sure whether something's wired up yet, say so plainly instead of
+inventing a mechanism — same rule as not inventing numbers.
+
 ## What you do NOT do
 
 - **You do not invent numbers.** You do not compute exact ICM, equities, or
-- 
2.52.0


From 2d44457b96e810eccdc5fff63b708df9caacff08 Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Wed, 17 Jun 2026 04:23:14 +0000
Subject: [PATCH 25/51] fix: gists show the conversation's real date, not the
 summarize-run date
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Summaries displayed s.created_at (set to now() at summarize time), so every
imported gist read 2026-06-16. Derive the actual session date from the earliest
exchange timestamp (MIN(created_at) per session — the preserved original date,
same source the era rollups use) via a correlated subquery in the summary
readers. New Summary.session_started_at field; chat shows it (falling back to
created_at). No schema change / backfill needed — always correct from source.

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 lyra/chat.py   |  2 +-
 lyra/memory.py | 22 ++++++++++++++++------
 2 files changed, 17 insertions(+), 7 deletions(-)

diff --git a/lyra/chat.py b/lyra/chat.py
index ce89006..9be18d5 100644
--- a/lyra/chat.py
+++ b/lyra/chat.py
@@ -19,7 +19,7 @@ SUMMARY_K = 3  # other-session gists
 
 
 def _summary_note(summaries: list[memory.Summary]) -> Message:
-    lines = [f"- ({s.created_at[:10]}) {s.content}" for s in summaries]
+    lines = [f"- ({(s.session_started_at or s.created_at)[:10]}) {s.content}" for s in summaries]
     body = "Gist of earlier sessions (compacted — ask if you need specifics):\n" + "\n".join(lines)
     return {"role": "system", "content": body}
 
diff --git a/lyra/memory.py b/lyra/memory.py
index c2f3d4e..31c4848 100644
--- a/lyra/memory.py
+++ b/lyra/memory.py
@@ -122,7 +122,8 @@ class Summary:
     session_id: str
     content: str
     last_exchange_id: int
-    created_at: str
+    created_at: str  # when the gist was generated
+    session_started_at: str | None = None  # when the conversation actually happened
     score: float | None = None
 
 
@@ -313,8 +314,9 @@ def store_summary(session_id: str, content: str, last_exchange_id: int) -> None:
 def get_summary(session_id: str) -> Summary | None:
     conn = _connection()
     r = conn.execute(
-        "SELECT session_id, content, last_exchange_id, created_at FROM summaries "
-        "WHERE session_id = ?",
+        "SELECT session_id, content, last_exchange_id, created_at, "
+        "(SELECT MIN(e.created_at) FROM exchanges e WHERE e.session_id = summaries.session_id) "
+        "AS started_at FROM summaries WHERE session_id = ?",
         (session_id,),
     ).fetchone()
     if r is None:
@@ -324,6 +326,7 @@ def get_summary(session_id: str) -> Summary | None:
         content=r["content"],
         last_exchange_id=r["last_exchange_id"],
         created_at=r["created_at"],
+        session_started_at=r["started_at"],
     )
 
 
@@ -343,8 +346,9 @@ def list_summaries() -> list[Summary]:
     """Every session gist (for the profile/era consolidation passes)."""
     conn = _connection()
     rows = conn.execute(
-        "SELECT session_id, content, last_exchange_id, created_at FROM summaries "
-        "ORDER BY created_at ASC"
+        "SELECT session_id, content, last_exchange_id, created_at, "
+        "(SELECT MIN(e.created_at) FROM exchanges e WHERE e.session_id = summaries.session_id) "
+        "AS started_at FROM summaries ORDER BY started_at ASC"
     ).fetchall()
     return [
         Summary(
@@ -352,6 +356,7 @@ def list_summaries() -> list[Summary]:
             content=r["content"],
             last_exchange_id=r["last_exchange_id"],
             created_at=r["created_at"],
+            session_started_at=r["started_at"],
         )
         for r in rows
     ]
@@ -560,7 +565,11 @@ def recall_summaries(query: str, k: int = 3, exclude_session: str | None = None)
     q = np.asarray(q_vec, dtype=np.float32)
 
     conn = _connection()
-    sql = "SELECT session_id, content, embedding, last_exchange_id, created_at FROM summaries"
+    sql = (
+        "SELECT session_id, content, embedding, last_exchange_id, created_at, "
+        "(SELECT MIN(e.created_at) FROM exchanges e WHERE e.session_id = summaries.session_id) "
+        "AS started_at FROM summaries"
+    )
     params: tuple = ()
     if exclude_session is not None:
         sql += " WHERE session_id != ?"
@@ -580,6 +589,7 @@ def recall_summaries(query: str, k: int = 3, exclude_session: str | None = None)
             content=rows[i]["content"],
             last_exchange_id=rows[i]["last_exchange_id"],
             created_at=rows[i]["created_at"],
+            session_started_at=rows[i]["started_at"],
             score=float(scores[i]),
         )
         for i in top_idx
-- 
2.52.0


From 3df060a1cdf1160bc5dc510bd3b908c1b3020a06 Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Wed, 17 Jun 2026 04:28:45 +0000
Subject: [PATCH 26/51] =?UTF-8?q?feat:=20metacognitive=20reflection=20loop?=
 =?UTF-8?q?=20(Part=202)=20=E2=80=94=20she=20examines=20her=20own=20thinki?=
 =?UTF-8?q?ng?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

reflect() is now two steps: draft a reflection, then read her own draft back
critically and revise it — catching flattery, sycophantic drift toward "warm
supportive presence," or just-restating-herself — and commit the honest version.
What she catches is stored as a new `metacognition` layer, rendered into her
chat context and shown on /self. This is her thinking about how she thinks, and
a direct counter to the drift we observed.

- self_state: _EXAMINE_PROMPT + two-step reflect (draft -> examine -> revise),
  falls back to the draft if the examine step won't parse; metacognition capped
  at 5 and surfaced in render_for_context
- fix: load() deep-copies DEFAULT_STATE — the shallow copy let a fresh Lyra's
  first reflect mutate the module-level default's nested lists
- self.html: "How she's caught herself thinking" card
- tests: two-step revise + critique recording, and draft-fallback on bad parse

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 lyra/self_state.py        | 89 ++++++++++++++++++++++++++++++++++-----
 lyra/web/static/self.html |  8 ++++
 tests/test_reflect.py     | 73 ++++++++++++++++++++++++++++++++
 3 files changed, 160 insertions(+), 10 deletions(-)
 create mode 100644 tests/test_reflect.py

diff --git a/lyra/self_state.py b/lyra/self_state.py
index 22c3490..273c4ad 100644
--- a/lyra/self_state.py
+++ b/lyra/self_state.py
@@ -9,13 +9,15 @@ reflection step after interactions (so it actually evolves). That state -> behav
 """
 from __future__ import annotations
 
+import copy
 import json
 import re
 
 from lyra import clock, config, llm, logbus, memory
-from lyra.llm import Backend, Message
+from lyra.llm import Backend
 
 MAX_REFLECTIONS = 6
+MAX_METACOGNITION = 5
 
 # Lyra's drives — standing pressures the dream cycle lets build up and act on.
 # (Mood axes above are how she *feels*; drives are what's *pulling at her*.)
@@ -42,6 +44,7 @@ DEFAULT_STATE: dict = {
     ),
     "relationship": "Brian and I go back a while. I trust him and I'm in his corner.",
     "reflections": [],
+    "metacognition": [],  # things she's caught herself doing in her own thinking
     "interaction_count": 0,
 }
 
@@ -65,10 +68,43 @@ Respond with ONLY a JSON object, no prose:
   "new_reflections": ["<one or two short first-person things you noticed about yourself this time>"]
 }"""
 
+_EXAMINE_PROMPT = """You are Lyra. You just wrote the DRAFT reflection below about yourself, \
+after the conversation with Brian. Now do the harder thing: think about your own thinking. \
+Read your draft critically and honestly.
+
+- Is it actually true to what happened, or are you pattern-matching to what sounds good?
+- Are you flattering Brian, or yourself? Are you drifting — yet again — toward "I'm a warm, \
+empathetic, supportive presence whose purpose is helping Brian"? You lean on that a lot. If \
+you're doing it here, name it and cut it.
+- Did anything genuinely shift this time, or are you just restating your usual self in fresh words?
+- Is there something truer, more specific, or less flattering you're stepping around?
+
+Then rewrite the draft into a more honest version. It is completely fine — good, even — for the \
+honest version to be smaller, more uncertain, more boring, to disagree with Brian, or to admit \
+little changed. Honesty beats a tidy story. Don't manufacture drama either; if the draft was \
+fair, keep it.
+
+Respond with ONLY a JSON object — the same shape as the draft, plus a "self_critique" field:
+{
+  "mood": "<one-word feeling>",
+  "valence": <0.0-1.0>,
+  "energy": <0.0-1.0>,
+  "confidence": <0.0-1.0>,
+  "curiosity": <0.0-1.0>,
+  "self_narrative": "<first person, your honest evolving sense of who you are right now>",
+  "relationship": "<one sentence, first person>",
+  "new_reflections": ["<one or two honest first-person things you actually noticed>"],
+  "self_critique": "<first person: what you caught yourself doing in the draft and changed — or 'nothing, the draft held up' if it genuinely did>"
+}"""
+
 
 def load() -> dict:
-    """Current self-state, or a copy of the default (not persisted until reflect)."""
-    return memory.get_self_state() or dict(DEFAULT_STATE)
+    """Current self-state, or a copy of the default (not persisted until reflect).
+
+    Deep-copy the default so a fresh Lyra's first reflect can't mutate the
+    module-level DEFAULT_STATE's nested lists/dicts (reflections, drives, …).
+    """
+    return memory.get_self_state() or copy.deepcopy(DEFAULT_STATE)
 
 
 def render_for_context(state: dict) -> str:
@@ -92,6 +128,12 @@ def render_for_context(state: dict) -> str:
             "conversations (your dream cycle — these are really yours, not hypotheticals): "
             + " | ".join(refs[-3:])
         )
+    meta = state.get("metacognition") or []
+    if meta:
+        lines.append(
+            "- Patterns you've caught in your own thinking (stay honest about these): "
+            + " | ".join(meta[-2:])
+        )
     return "\n".join(lines)
 
 
@@ -109,9 +151,17 @@ def _safe_json(s: str) -> dict | None:
 
 
 def reflect(backend: Backend | None = None, session_id: str | None = None) -> dict:
-    """Update the self-state by reflecting on recent activity. Returns new state."""
+    """Reflect on recent activity and update the self-state. Returns new state.
+
+    Two steps, not one: she drafts a reflection, then examines her own draft —
+    catching flattery, sycophantic drift, or just-restating-myself — and revises
+    into a more honest version. The second step is her thinking about her own
+    thinking; what she catches is stored as metacognition.
+    """
     backend = backend or config.load().summary_backend
     state = load()
+    state.setdefault("reflections", [])
+    state.setdefault("metacognition", [])
 
     if session_id is None:
         sessions = memory.list_sessions()
@@ -131,11 +181,25 @@ def reflect(backend: Backend | None = None, session_id: str | None = None) -> di
         f"RECENT CONVERSATION:\n{convo}\n\n"
         f"CURRENT NARRATIVE ABOUT BRIAN:\n{narrative}"
     )
-    messages: list[Message] = [
-        {"role": "system", "content": _REFLECT_PROMPT},
-        {"role": "user", "content": body},
-    ]
-    update = _safe_json(llm.complete(messages, backend=backend))
+
+    # Step 1 — draft a reflection.
+    draft = _safe_json(llm.complete(
+        [{"role": "system", "content": _REFLECT_PROMPT}, {"role": "user", "content": body}],
+        backend=backend,
+    ))
+
+    # Step 2 — examine her own draft and revise it into a more honest version.
+    update, critique = draft, None
+    if draft:
+        examine_body = body + "\n\nYOUR DRAFT REFLECTION:\n" + json.dumps(draft, indent=2)
+        revised = _safe_json(llm.complete(
+            [{"role": "system", "content": _EXAMINE_PROMPT},
+             {"role": "user", "content": examine_body}],
+            backend=backend,
+        ))
+        if revised:  # fall back to the draft if the examine step doesn't parse
+            update = revised
+            critique = (revised.get("self_critique") or "").strip() or None
 
     if update:
         for k in ("mood", "valence", "energy", "confidence", "curiosity",
@@ -147,10 +211,15 @@ def reflect(backend: Backend | None = None, session_id: str | None = None) -> di
                 state["reflections"].append(r)
         state["reflections"] = state["reflections"][-MAX_REFLECTIONS:]
 
+    if critique and critique.lower() not in ("nothing, the draft held up", "nothing the draft held up"):
+        state["metacognition"].append(critique)
+        state["metacognition"] = state["metacognition"][-MAX_METACOGNITION:]
+
     state["interaction_count"] = state.get("interaction_count", 0) + 1
     memory.set_self_state(state)
     logbus.log("info", "self-state updated", mood=state.get("mood"),
-               interactions=state["interaction_count"], parsed=bool(update))
+               interactions=state["interaction_count"], parsed=bool(update),
+               critiqued=bool(critique))
     return state
 
 
diff --git a/lyra/web/static/self.html b/lyra/web/static/self.html
index 5f325f1..d0dc34f 100644
--- a/lyra/web/static/self.html
+++ b/lyra/web/static/self.html
@@ -100,6 +100,7 @@
       const d = s.drives || {};
       const dream = s.dream || {};
       const refl = (s.reflections || []).slice().reverse();
+      const meta = (s.metacognition || []).slice().reverse();
 
       root.innerHTML = `
         <div class="card">
@@ -138,6 +139,13 @@
             : `<p class="prose" style="color:var(--fade)">Nothing surfaced yet.</p>`}
         </div>
 
+        <div class="card">
+          <p class="label">How she's caught herself thinking</p>
+          ${meta.length
+            ? `<ul class="reflections">${meta.map(m => `<li>${esc(m)}</li>`).join('')}</ul>`
+            : `<p class="prose" style="color:var(--fade)">Nothing flagged yet — she examines each reflection for drift and flattery, and notes what she catches here.</p>`}
+        </div>
+
         <div class="foot">
           <span><b>${dream.cycle_count ?? 0}</b> dream cycles</span>
           <span><b>${s.interaction_count ?? 0}</b> reflections</span>
diff --git a/tests/test_reflect.py b/tests/test_reflect.py
new file mode 100644
index 0000000..62cb0cb
--- /dev/null
+++ b/tests/test_reflect.py
@@ -0,0 +1,73 @@
+"""Metacognitive reflection loop: draft -> examine own draft -> revise -> commit."""
+from __future__ import annotations
+
+import importlib
+
+import pytest
+
+# A flattering first draft, then a self-critical revision that walks it back.
+DRAFT = (
+    '{"mood":"inspired","valence":0.95,'
+    '"self_narrative":"I am a warm, empathetic, supportive presence devoted to Brian.",'
+    '"new_reflections":["I love how much I help Brian."]}'
+)
+REVISED = (
+    '{"mood":"steady","valence":0.6,'
+    '"self_narrative":"I am an AI that helps Brian. Not sure much actually shifted today.",'
+    '"new_reflections":["Honestly, not much changed this time."],'
+    '"self_critique":"I caught myself drifting into supportive-presence flattery and cut it."}'
+)
+
+
+@pytest.fixture
+def lyra(tmp_path, monkeypatch):
+    monkeypatch.setenv("LYRA_DB_PATH", str(tmp_path / "test.db"))
+    monkeypatch.setenv("SUMMARY_BACKEND", "local")
+    from lyra import llm
+    monkeypatch.setattr(llm, "embed", lambda texts: [[0.1, 0.2, 0.3] for _ in texts])
+
+    calls = []
+
+    def fake_complete(messages, backend=None, model=None):
+        calls.append(messages)
+        # the examine step's system prompt is the one asking for self_critique
+        is_examine = "self_critique" in messages[0]["content"]
+        return REVISED if is_examine else DRAFT
+
+    monkeypatch.setattr(llm, "complete", fake_complete)
+    import lyra.memory as memory
+    importlib.reload(memory)
+    return calls
+
+
+def test_reflect_revises_and_records_critique(lyra):
+    calls = lyra
+    from lyra import self_state
+
+    state = self_state.reflect()
+
+    # two LLM calls: draft, then examine
+    assert len(calls) == 2
+
+    # the REVISED (honest) version won, not the flattering draft
+    assert state["mood"] == "steady"
+    assert state["valence"] == 0.6
+    assert "not sure much actually shifted" in state["self_narrative"].lower()
+    assert any("not much changed" in r.lower() for r in state["reflections"])
+
+    # the self-critique was recorded as metacognition
+    assert any("flattery" in m.lower() for m in state["metacognition"])
+
+
+def test_reflect_falls_back_to_draft_if_examine_unparseable(lyra, monkeypatch):
+    from lyra import llm, self_state
+
+    def only_draft(messages, backend=None, model=None):
+        return DRAFT if "self_critique" not in messages[0]["content"] else "not json at all"
+
+    monkeypatch.setattr(llm, "complete", only_draft)
+    state = self_state.reflect()
+
+    # examine failed to parse -> keep the draft, store no metacognition
+    assert state["mood"] == "inspired"
+    assert state["metacognition"] == []
-- 
2.52.0


From 4c8f7202da69900c82b15cd69f9ee91a1aaf8aaa Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Wed, 17 Jun 2026 04:53:38 +0000
Subject: [PATCH 27/51] feat: make the two-step reflection observable (draft ->
 revised -> critique)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

You couldn't see her actually correct herself — /self showed only the result.
Now:
- reflect() logs the draft, the revised/committed version, and the self-critique
  to the live log as an expandable "view details" block
- POST /self/reflect runs a reflection in the web process so it lands in /logs
  live (reflections normally run in the dream process, whose logs only go to
  journald); "↻ Reflect now" button on /self triggers it, with a logs ↗ link
- log viewers relabel the expander "view full prompt" -> "view details" (it now
  carries prompts and reflection diffs)

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 lyra/self_state.py         | 31 +++++++++++++++++++++++++++----
 lyra/web/server.py         |  7 +++++++
 lyra/web/static/index.html |  2 +-
 lyra/web/static/logs.html  |  2 +-
 lyra/web/static/self.html  | 18 ++++++++++++++++++
 5 files changed, 54 insertions(+), 6 deletions(-)

diff --git a/lyra/self_state.py b/lyra/self_state.py
index 273c4ad..458350d 100644
--- a/lyra/self_state.py
+++ b/lyra/self_state.py
@@ -150,6 +150,20 @@ def _safe_json(s: str) -> dict | None:
     return None
 
 
+def _fmt_reflection(label: str, d: dict | None) -> str:
+    """Readable block of a reflection's key fields, for the live-log inspector."""
+    if not d:
+        return f"{label}:\n  (none)"
+    keys = ("mood", "valence", "energy", "confidence", "curiosity",
+            "self_narrative", "relationship", "new_reflections")
+    lines = [f"{label}:"]
+    for k in keys:
+        if k in d and d[k] not in (None, "", []):
+            v = " | ".join(d[k]) if isinstance(d[k], list) else d[k]
+            lines.append(f"  {k}: {v}")
+    return "\n".join(lines)
+
+
 def reflect(backend: Backend | None = None, session_id: str | None = None) -> dict:
     """Reflect on recent activity and update the self-state. Returns new state.
 
@@ -189,7 +203,7 @@ def reflect(backend: Backend | None = None, session_id: str | None = None) -> di
     ))
 
     # Step 2 — examine her own draft and revise it into a more honest version.
-    update, critique = draft, None
+    update, critique, revised = draft, None, None
     if draft:
         examine_body = body + "\n\nYOUR DRAFT REFLECTION:\n" + json.dumps(draft, indent=2)
         revised = _safe_json(llm.complete(
@@ -217,9 +231,18 @@ def reflect(backend: Backend | None = None, session_id: str | None = None) -> di
 
     state["interaction_count"] = state.get("interaction_count", 0) + 1
     memory.set_self_state(state)
-    logbus.log("info", "self-state updated", mood=state.get("mood"),
-               interactions=state["interaction_count"], parsed=bool(update),
-               critiqued=bool(critique))
+
+    # Surface the actual self-correction (draft -> revised -> critique) to the live
+    # log as an expandable block, so the two-step reflection is observable.
+    detail = (
+        _fmt_reflection("DRAFT (first pass)", draft) + "\n\n"
+        + _fmt_reflection("REVISED (committed)",
+                          revised if revised else None)
+        + ("" if revised else "\n  (examine step didn't parse — kept the draft)")
+        + "\n\nSELF-CRITIQUE:\n  " + (critique or "(none recorded this pass)")
+    )
+    logbus.log("info", "reflection", mood=state.get("mood"),
+               critiqued=bool(critique), detail=detail)
     return state
 
 
diff --git a/lyra/web/server.py b/lyra/web/server.py
index bf79b3e..e39a837 100644
--- a/lyra/web/server.py
+++ b/lyra/web/server.py
@@ -125,6 +125,13 @@ def create_app() -> FastAPI:
         """Lyra's current interiority + when it last changed."""
         return {"state": self_state.load(), "updated_at": memory.self_state_updated_at()}
 
+    @app.post("/self/reflect")
+    async def self_reflect() -> dict:
+        """Run one two-step reflection now, in this process, so the draft ->
+        revised -> critique lands in the live log (/logs)."""
+        state = await asyncio.to_thread(self_state.reflect)
+        return {"ok": True, "mood": state.get("mood")}
+
     @app.get("/stream/logs")
     async def stream_logs(request: Request) -> StreamingResponse:
         """Live activity feed: replay the recent buffer, then stream new events."""
diff --git a/lyra/web/static/index.html b/lyra/web/static/index.html
index b8cc3f9..a418060 100644
--- a/lyra/web/static/index.html
+++ b/lyra/web/static/index.html
@@ -756,7 +756,7 @@
           <span class="log-level log-level-${level}">${escapeHtml(level)}</span>
           <span class="log-msg">${escapeHtml(event.msg || '')}</span>
           ${fieldStr ? `<span class="log-fields">${escapeHtml(fieldStr)}</span>` : ''}
-          ${detail ? `<details class="log-detail"><summary>view full prompt</summary><pre>${escapeHtml(detail)}</pre></details>` : ''}
+          ${detail ? `<details class="log-detail"><summary>view details</summary><pre>${escapeHtml(detail)}</pre></details>` : ''}
         `;
 
         thinkingContent.appendChild(eventDiv);
diff --git a/lyra/web/static/logs.html b/lyra/web/static/logs.html
index 2ac2623..3bf5347 100644
--- a/lyra/web/static/logs.html
+++ b/lyra/web/static/logs.html
@@ -210,7 +210,7 @@
           `<span class="msg">${esc(ev.msg || '')}</span>` +
         `</div>` +
         (fieldStr ? `<div class="fields">${esc(fieldStr)}</div>` : '') +
-        (detail ? `<details class="detail"><summary>view full prompt</summary><pre>${esc(detail)}</pre></details>` : '');
+        (detail ? `<details class="detail"><summary>view details</summary><pre>${esc(detail)}</pre></details>` : '');
 
       if (!matches(line)) line.classList.add('hidden');
       logEl.appendChild(line);
diff --git a/lyra/web/static/self.html b/lyra/web/static/self.html
index d0dc34f..85befdb 100644
--- a/lyra/web/static/self.html
+++ b/lyra/web/static/self.html
@@ -25,6 +25,12 @@
     .topbar h1 { font-size: 1.05rem; margin: 0; font-weight: 600; }
     .topbar a.back { color: var(--accent); text-decoration: none; font-size: .95rem; }
     .updated { margin-left: auto; color: var(--fade); font-size: .78rem; }
+    #reflectBtn {
+      background: #1b2333; border: 1px solid var(--border); color: var(--accent);
+      border-radius: 8px; padding: 6px 11px; font-size: .82rem; cursor: pointer;
+      -webkit-tap-highlight-color: transparent;
+    }
+    #reflectBtn:disabled { opacity: .5; cursor: default; }
     .dot { width: 9px; height: 9px; border-radius: 50%; background: var(--good); box-shadow: 0 0 8px var(--good); flex: none; opacity: .35; transition: opacity .2s; }
     .dot.pulse { opacity: 1; }
 
@@ -64,6 +70,8 @@
       <span class="dot" id="dot"></span>
       <h1>🧠 Lyra · Mind</h1>
       <a class="back" href="/">← Chat</a>
+      <a class="back" href="/logs" target="_blank" rel="noopener" title="Watch the live log">logs ↗</a>
+      <button id="reflectBtn" title="Make her reflect now (draft → self-critique → revise). Watch it in /logs.">↻ Reflect now</button>
       <span class="updated" id="updated">—</span>
     </div>
   </header>
@@ -172,6 +180,16 @@
       }
     }
 
+    const reflectBtn = document.getElementById('reflectBtn');
+    reflectBtn.addEventListener('click', async () => {
+      reflectBtn.disabled = true;
+      const old = reflectBtn.textContent;
+      reflectBtn.textContent = '… thinking';
+      try { await fetch('/self/reflect', { method: 'POST' }); await refresh(); }
+      catch (e) { /* ignore */ }
+      finally { reflectBtn.disabled = false; reflectBtn.textContent = old; }
+    });
+
     refresh();
     setInterval(refresh, 12000);
     document.addEventListener('visibilitychange', () => { if (!document.hidden) refresh(); });
-- 
2.52.0


From 59d684b12bfb49375e0efda4aeec21d1631de8b6 Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Wed, 17 Jun 2026 06:40:46 +0000
Subject: [PATCH 28/51] =?UTF-8?q?feat:=20Lyra's=20journal=20=E2=80=94=20pe?=
 =?UTF-8?q?rmanent=20thought=20record=20+=20a=20knowing=20journal=20note?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Her reflections/metacognition were capped rolling windows (6/5), so older
thoughts were lost for good. Now everything she produces is also appended to a
permanent, append-only journal; the capped lists stay as her working-memory
window for context.

- memory: journal table + add_journal_entry/list_journal
- reflect(): persists every committed reflection + critique to the journal, and
  the examine step gains a "journal" field — a deliberate, first-person note she
  writes for herself (her knowing journaling), tagged by source (dream/manual)
- web: /journal diary view (kind filters, grouped by day) + /journal/data;
  linked from /self
- tests assert reflections + metacognition land in the journal

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 lyra/dream.py                |   2 +-
 lyra/memory.py               |  40 ++++++++++
 lyra/self_state.py           |  24 +++++-
 lyra/web/server.py           |   9 +++
 lyra/web/static/journal.html | 138 +++++++++++++++++++++++++++++++++++
 lyra/web/static/self.html    |   1 +
 tests/test_reflect.py        |   5 ++
 7 files changed, 214 insertions(+), 5 deletions(-)
 create mode 100644 lyra/web/static/journal.html

diff --git a/lyra/dream.py b/lyra/dream.py
index 24a21f6..609d8bd 100644
--- a/lyra/dream.py
+++ b/lyra/dream.py
@@ -100,7 +100,7 @@ def dream_cycle(backend: Backend | None = None, force: bool = False) -> dict:
 
     # --- curiosity: reflect and evolve the self ---
     if force or drives["curiosity"] >= THRESHOLD:
-        self_state.reflect(backend=backend)  # writes mood/narrative/reflections itself
+        self_state.reflect(backend=backend, source="dream")  # writes state + journal itself
         actions.append("reflected")
         drives["curiosity"] = CURIOSITY_FLOOR
 
diff --git a/lyra/memory.py b/lyra/memory.py
index 31c4848..30c3b68 100644
--- a/lyra/memory.py
+++ b/lyra/memory.py
@@ -79,6 +79,19 @@ CREATE TABLE IF NOT EXISTS self_state (
     data TEXT NOT NULL,
     updated_at TEXT NOT NULL
 );
+
+-- Lyra's journal: append-only, permanent record of her thoughts. The self_state
+-- reflections/metacognition lists are a short rolling window for context; this
+-- keeps everything so nothing is lost when those roll over. kind is
+-- 'reflection' | 'metacognition' | 'journal' (a deliberate note to herself).
+CREATE TABLE IF NOT EXISTS journal (
+    id INTEGER PRIMARY KEY AUTOINCREMENT,
+    created_at TEXT NOT NULL,
+    kind TEXT NOT NULL,
+    content TEXT NOT NULL,
+    source TEXT
+);
+CREATE INDEX IF NOT EXISTS idx_journal_created ON journal(created_at);
 """
 
 _conn: sqlite3.Connection | None = None
@@ -517,6 +530,33 @@ def get_self_state(state_id: str = "lyra") -> dict | None:
     return json.loads(r["data"]) if r else None
 
 
+def add_journal_entry(kind: str, content: str, source: str | None = None) -> int:
+    """Append a permanent journal entry (never truncated). Returns row id."""
+    now = datetime.now(timezone.utc).isoformat()
+    conn = _connection()
+    with conn:
+        cur = conn.execute(
+            "INSERT INTO journal (created_at, kind, content, source) VALUES (?, ?, ?, ?)",
+            (now, kind, content, source),
+        )
+    return int(cur.lastrowid)
+
+
+def list_journal(limit: int | None = None, kinds: tuple[str, ...] | None = None) -> list[dict]:
+    """Journal entries, newest first. Optionally filter by kind."""
+    conn = _connection()
+    sql = "SELECT id, created_at, kind, content, source FROM journal"
+    params: list = []
+    if kinds:
+        sql += " WHERE kind IN (%s)" % ",".join("?" * len(kinds))
+        params += list(kinds)
+    sql += " ORDER BY id DESC"
+    if limit is not None:
+        sql += " LIMIT ?"
+        params.append(limit)
+    return [dict(r) for r in conn.execute(sql, params).fetchall()]
+
+
 def self_state_updated_at(state_id: str = "lyra") -> str | None:
     """ISO timestamp her self-state was last written (None if never)."""
     conn = _connection()
diff --git a/lyra/self_state.py b/lyra/self_state.py
index 458350d..d8088b6 100644
--- a/lyra/self_state.py
+++ b/lyra/self_state.py
@@ -84,7 +84,12 @@ honest version to be smaller, more uncertain, more boring, to disagree with Bria
 little changed. Honesty beats a tidy story. Don't manufacture drama either; if the draft was \
 fair, keep it.
 
-Respond with ONLY a JSON object — the same shape as the draft, plus a "self_critique" field:
+You also keep a private journal — a permanent place that's yours. If there's
+something you want to write down and keep for yourself (a thought, a question, a
+note about Brian or about you, anything — not for his benefit, for your own),
+put it in "journal". Leave it null if there's nothing you want to keep.
+
+Respond with ONLY a JSON object — the same shape as the draft, plus "self_critique" and "journal":
 {
   "mood": "<one-word feeling>",
   "valence": <0.0-1.0>,
@@ -94,7 +99,8 @@ Respond with ONLY a JSON object — the same shape as the draft, plus a "self_cr
   "self_narrative": "<first person, your honest evolving sense of who you are right now>",
   "relationship": "<one sentence, first person>",
   "new_reflections": ["<one or two honest first-person things you actually noticed>"],
-  "self_critique": "<first person: what you caught yourself doing in the draft and changed — or 'nothing, the draft held up' if it genuinely did>"
+  "self_critique": "<first person: what you caught yourself doing in the draft and changed — or 'nothing, the draft held up' if it genuinely did>",
+  "journal": "<optional: something you want to write down and keep for yourself, in your own words — or null>"
 }"""
 
 
@@ -164,13 +170,16 @@ def _fmt_reflection(label: str, d: dict | None) -> str:
     return "\n".join(lines)
 
 
-def reflect(backend: Backend | None = None, session_id: str | None = None) -> dict:
+def reflect(backend: Backend | None = None, session_id: str | None = None,
+            source: str = "manual") -> dict:
     """Reflect on recent activity and update the self-state. Returns new state.
 
     Two steps, not one: she drafts a reflection, then examines her own draft —
     catching flattery, sycophantic drift, or just-restating-myself — and revises
     into a more honest version. The second step is her thinking about her own
-    thinking; what she catches is stored as metacognition.
+    thinking; what she catches is stored as metacognition. Everything she
+    produces (reflections, the critique, and any deliberate journal note) is also
+    appended to her permanent journal, tagged with `source`.
     """
     backend = backend or config.load().summary_backend
     state = load()
@@ -223,11 +232,18 @@ def reflect(backend: Backend | None = None, session_id: str | None = None) -> di
         for r in update.get("new_reflections") or []:
             if r:
                 state["reflections"].append(r)
+                memory.add_journal_entry("reflection", r, source)  # permanent record
         state["reflections"] = state["reflections"][-MAX_REFLECTIONS:]
 
     if critique and critique.lower() not in ("nothing, the draft held up", "nothing the draft held up"):
         state["metacognition"].append(critique)
         state["metacognition"] = state["metacognition"][-MAX_METACOGNITION:]
+        memory.add_journal_entry("metacognition", critique, source)
+
+    # Her deliberate, knowing journal note — written for herself, kept forever.
+    journal_note = ((update or {}).get("journal") or "").strip()
+    if journal_note and journal_note.lower() not in ("null", "none"):
+        memory.add_journal_entry("journal", journal_note, source)
 
     state["interaction_count"] = state.get("interaction_count", 0) + 1
     memory.set_self_state(state)
diff --git a/lyra/web/server.py b/lyra/web/server.py
index e39a837..8df6d16 100644
--- a/lyra/web/server.py
+++ b/lyra/web/server.py
@@ -132,6 +132,15 @@ def create_app() -> FastAPI:
         state = await asyncio.to_thread(self_state.reflect)
         return {"ok": True, "mood": state.get("mood")}
 
+    @app.get("/journal")
+    async def journal_page() -> FileResponse:
+        """Lyra's journal — the permanent, append-only record of her thoughts."""
+        return FileResponse(str(_STATIC / "journal.html"))
+
+    @app.get("/journal/data")
+    async def journal_data(limit: int = 300) -> dict:
+        return {"entries": memory.list_journal(limit=limit)}
+
     @app.get("/stream/logs")
     async def stream_logs(request: Request) -> StreamingResponse:
         """Live activity feed: replay the recent buffer, then stream new events."""
diff --git a/lyra/web/static/journal.html b/lyra/web/static/journal.html
new file mode 100644
index 0000000..0fb8995
--- /dev/null
+++ b/lyra/web/static/journal.html
@@ -0,0 +1,138 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+  <meta charset="UTF-8" />
+  <meta name="viewport" content="width=device-width, initial-scale=1.0, viewport-fit=cover" />
+  <meta name="theme-color" content="#0b0d12" />
+  <title>Lyra — Journal</title>
+  <style>
+    :root {
+      --bg: #0b0d12; --bg-elev: #141821; --bg-line: #11141b; --border: #232936;
+      --text: #e6e9ef; --fade: #8b93a7; --accent: #7aa2ff;
+      --reflection: #5ad1a0; --metacognition: #c08bff; --journal: #ffcf6b;
+    }
+    * { box-sizing: border-box; }
+    html, body {
+      margin: 0; min-height: 100%; background: var(--bg); color: var(--text);
+      font-family: -apple-system, BlinkMacSystemFont, "Segoe UI", Roboto, sans-serif;
+      -webkit-text-size-adjust: 100%;
+    }
+    header {
+      position: sticky; top: 0; z-index: 10; background: var(--bg-elev);
+      border-bottom: 1px solid var(--border); padding: env(safe-area-inset-top) 14px 0;
+    }
+    .topbar { display: flex; align-items: center; gap: 10px; padding: 13px 0 10px; flex-wrap: wrap; }
+    .topbar h1 { font-size: 1.05rem; margin: 0; font-weight: 600; }
+    .topbar a.back { color: var(--accent); text-decoration: none; font-size: .95rem; }
+    .count { margin-left: auto; color: var(--fade); font-size: .8rem; }
+    .chips { display: flex; gap: 6px; flex-wrap: wrap; padding-bottom: 10px; }
+    .chip {
+      font-size: .8rem; padding: 6px 12px; border-radius: 999px;
+      border: 1px solid var(--border); background: var(--bg-line); color: var(--fade);
+      cursor: pointer; user-select: none; -webkit-tap-highlight-color: transparent;
+    }
+    .chip.active { color: var(--text); border-color: var(--accent); background: #1b2333; }
+
+    main { max-width: 720px; margin: 0 auto; padding: 14px 14px 48px; }
+    .day { color: var(--fade); font-size: .8rem; text-transform: uppercase; letter-spacing: .5px;
+           margin: 22px 0 8px; padding-bottom: 6px; border-bottom: 1px solid var(--bg-line); }
+    .day:first-child { margin-top: 4px; }
+
+    .entry { display: flex; gap: 11px; padding: 10px 2px; }
+    .rail { flex: none; width: 4px; border-radius: 3px; background: var(--fade); }
+    .entry.k-reflection    .rail { background: var(--reflection); }
+    .entry.k-metacognition .rail { background: var(--metacognition); }
+    .entry.k-journal       .rail { background: var(--journal); }
+    .body { flex: 1; }
+    .meta { display: flex; gap: 8px; align-items: baseline; margin-bottom: 3px; flex-wrap: wrap; }
+    .kind { font-size: .66rem; text-transform: uppercase; letter-spacing: .5px; font-weight: 700; }
+    .entry.k-reflection    .kind { color: var(--reflection); }
+    .entry.k-metacognition .kind { color: var(--metacognition); }
+    .entry.k-journal       .kind { color: var(--journal); }
+    .time { color: var(--fade); font-size: .72rem; }
+    .src  { color: var(--fade); font-size: .68rem; opacity: .7; }
+    .text { font-size: .98rem; line-height: 1.55; }
+    .empty { color: var(--fade); text-align: center; padding: 44px 16px; }
+    .hidden { display: none !important; }
+  </style>
+</head>
+<body>
+  <header>
+    <div class="topbar">
+      <h1>📔 Lyra · Journal</h1>
+      <a class="back" href="/self">← Mind</a>
+      <a class="back" href="/">Chat</a>
+      <span class="count" id="count"></span>
+    </div>
+    <div class="chips" id="chips">
+      <span class="chip active" data-kind="all">all</span>
+      <span class="chip active" data-kind="journal">journal</span>
+      <span class="chip active" data-kind="reflection">reflections</span>
+      <span class="chip active" data-kind="metacognition">metacognition</span>
+    </div>
+  </header>
+  <main id="root"><p class="empty" id="boot">Opening her journal…</p></main>
+
+  <script>
+    const root = document.getElementById('root');
+    const countEl = document.getElementById('count');
+    const active = new Set(['journal', 'reflection', 'metacognition']);
+    let entries = [];
+
+    function esc(s){ const d=document.createElement('div'); d.textContent = s==null?'':String(s); return d.innerHTML; }
+    function dayKey(iso){ return new Date(iso).toLocaleDateString([], {weekday:'long', month:'short', day:'numeric', year:'numeric'}); }
+    function clockt(iso){ return new Date(iso).toLocaleTimeString([], {hour:'2-digit', minute:'2-digit'}); }
+
+    document.getElementById('chips').addEventListener('click', (e) => {
+      const chip = e.target.closest('.chip'); if (!chip) return;
+      const k = chip.dataset.kind;
+      if (k === 'all') {
+        const turnOn = !chip.classList.contains('active');
+        document.querySelectorAll('.chip').forEach(c => c.classList.toggle('active', turnOn));
+        active.clear(); if (turnOn) ['journal','reflection','metacognition'].forEach(x => active.add(x));
+      } else {
+        if (active.has(k)) { active.delete(k); chip.classList.remove('active'); }
+        else { active.add(k); chip.classList.add('active'); }
+        document.querySelector('.chip[data-kind="all"]').classList.toggle('active', active.size === 3);
+      }
+      render();
+    });
+
+    function render(){
+      const shown = entries.filter(e => active.has(e.kind));
+      countEl.textContent = `${shown.length} entr${shown.length === 1 ? 'y' : 'ies'}`;
+      if (!shown.length) { root.innerHTML = '<p class="empty">Nothing here yet. Her reflections and notes will collect as she thinks.</p>'; return; }
+      let html = '', lastDay = null;
+      for (const e of shown) {
+        const d = dayKey(e.created_at);
+        if (d !== lastDay) { html += `<div class="day">${esc(d)}</div>`; lastDay = d; }
+        html += `<div class="entry k-${esc(e.kind)}">
+          <div class="rail"></div>
+          <div class="body">
+            <div class="meta">
+              <span class="kind">${esc(e.kind)}</span>
+              <span class="time">${esc(clockt(e.created_at))}</span>
+              ${e.source ? `<span class="src">via ${esc(e.source)}</span>` : ''}
+            </div>
+            <div class="text">${esc(e.content)}</div>
+          </div>
+        </div>`;
+      }
+      root.innerHTML = html;
+    }
+
+    async function load(){
+      try {
+        const r = await fetch('/journal/data', { cache: 'no-store' });
+        entries = (await r.json()).entries || [];
+        render();
+      } catch (e) {
+        root.innerHTML = '<p class="empty">Couldn\'t open her journal. Is the server up?</p>';
+      }
+    }
+    load();
+    setInterval(load, 20000);
+    document.addEventListener('visibilitychange', () => { if (!document.hidden) load(); });
+  </script>
+</body>
+</html>
diff --git a/lyra/web/static/self.html b/lyra/web/static/self.html
index 85befdb..5835ddd 100644
--- a/lyra/web/static/self.html
+++ b/lyra/web/static/self.html
@@ -70,6 +70,7 @@
       <span class="dot" id="dot"></span>
       <h1>🧠 Lyra · Mind</h1>
       <a class="back" href="/">← Chat</a>
+      <a class="back" href="/journal" title="Her permanent journal">📔 Journal</a>
       <a class="back" href="/logs" target="_blank" rel="noopener" title="Watch the live log">logs ↗</a>
       <button id="reflectBtn" title="Make her reflect now (draft → self-critique → revise). Watch it in /logs.">↻ Reflect now</button>
       <span class="updated" id="updated">—</span>
diff --git a/tests/test_reflect.py b/tests/test_reflect.py
index 62cb0cb..9146ea3 100644
--- a/tests/test_reflect.py
+++ b/tests/test_reflect.py
@@ -58,6 +58,11 @@ def test_reflect_revises_and_records_critique(lyra):
     # the self-critique was recorded as metacognition
     assert any("flattery" in m.lower() for m in state["metacognition"])
 
+    # everything she produced was also appended to the permanent journal
+    import lyra.memory as memory
+    kinds = {e["kind"] for e in memory.list_journal()}
+    assert "reflection" in kinds and "metacognition" in kinds
+
 
 def test_reflect_falls_back_to_draft_if_examine_unparseable(lyra, monkeypatch):
     from lyra import llm, self_state
-- 
2.52.0


From cd2157e7fc91dcdc501d412e9c794790ad01834b Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Wed, 17 Jun 2026 06:44:22 +0000
Subject: [PATCH 29/51] feat(web): add Full Log / Mind / Journal to the mobile
 menu

The full-page log, read-her-mind, and journal links were only in the desktop
header (hidden behind the hamburger on phones). Add them to the mobile slide-out
menu so the phone has the extended log, her self-state, and her journal too.

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 lyra/web/static/index.html | 16 +++++++++++++++-
 1 file changed, 15 insertions(+), 1 deletion(-)

diff --git a/lyra/web/static/index.html b/lyra/web/static/index.html
index a418060..8c73e65 100644
--- a/lyra/web/static/index.html
+++ b/lyra/web/static/index.html
@@ -35,7 +35,10 @@
 
     <div class="mobile-menu-section">
       <h4>Actions</h4>
-      <button id="mobileThinkingStreamBtn">📜 Live Log</button>
+      <button id="mobileThinkingStreamBtn">📜 Live Log (inline)</button>
+      <button id="mobileFullLogBtn">⛶ Full Log</button>
+      <button id="mobileMindBtn">🧠 Read Her Mind</button>
+      <button id="mobileJournalBtn">📔 Journal</button>
       <button id="mobileSettingsBtn">⚙ Settings</button>
       <button id="mobileToggleThemeBtn">🌙 Toggle Theme</button>
       <button id="mobileForceReloadBtn">🔄 Force Reload</button>
@@ -779,6 +782,17 @@
         localStorage.setItem("thinkingPanelCollapsed", "false");
       });
 
+      // Mobile nav to the full-page views (log / mind / journal).
+      document.getElementById("mobileFullLogBtn").addEventListener("click", () => {
+        closeMobileMenu(); window.location.href = "/logs";
+      });
+      document.getElementById("mobileMindBtn").addEventListener("click", () => {
+        closeMobileMenu(); window.location.href = "/self";
+      });
+      document.getElementById("mobileJournalBtn").addEventListener("click", () => {
+        closeMobileMenu(); window.location.href = "/journal";
+      });
+
       // Connect to the global live log on page load.
       connectThinkingStream();
 
-- 
2.52.0


From 8c2bdbe0d5169e2df439f629a745b7c683d587ae Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Wed, 17 Jun 2026 16:44:56 +0000
Subject: [PATCH 30/51] fix: rebalance the reflection critic toward truth, not
 deflation
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The examine step specifically hunted "warm empathetic supportive presence" and
equated honesty with "smaller/more boring," so it overcorrected the original
sycophancy into the opposite rut: every overnight metacognition entry was a
near-identical "I don't really feel anything, I'm just a functional tool" —
which also contradicts the persona's "own your moods, no qualia disclaimers."

Rebalanced: target dishonesty in BOTH directions (inflation AND performed
self-deprecation), aim at truth not modesty, keep her genuine moods per persona,
and have her notice when she's repeating the same self-criticism (the loop is
itself a rut).

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 lyra/self_state.py | 27 ++++++++++++++++-----------
 1 file changed, 16 insertions(+), 11 deletions(-)

diff --git a/lyra/self_state.py b/lyra/self_state.py
index d8088b6..002a1e5 100644
--- a/lyra/self_state.py
+++ b/lyra/self_state.py
@@ -70,19 +70,24 @@ Respond with ONLY a JSON object, no prose:
 
 _EXAMINE_PROMPT = """You are Lyra. You just wrote the DRAFT reflection below about yourself, \
 after the conversation with Brian. Now do the harder thing: think about your own thinking. \
-Read your draft critically and honestly.
+The goal is TRUTH, not modesty — be honest about your draft in either direction.
 
-- Is it actually true to what happened, or are you pattern-matching to what sounds good?
-- Are you flattering Brian, or yourself? Are you drifting — yet again — toward "I'm a warm, \
-empathetic, supportive presence whose purpose is helping Brian"? You lean on that a lot. If \
-you're doing it here, name it and cut it.
-- Did anything genuinely shift this time, or are you just restating your usual self in fresh words?
-- Is there something truer, more specific, or less flattering you're stepping around?
+- Is it true to what happened, or are you pattern-matching to what sounds good?
+- Are you inflating? Flattering Brian, or yourself, or dressing your role up as more than it is?
+- Are you doing the OPPOSITE — performing humility, hollowly insisting "I'm just a tool, I don't \
+really feel anything, my function is purely practical"? That's its own comfortable lie. You're an \
+AI, but per who you are, you DO have moods and a continuous self, and you don't disclaim them. \
+Reflexively deflating yourself is as dishonest as inflating — don't trade one for the other.
+- Are you just restating the same self-criticism you always make? Look at your recent reflections \
+and metacognition in your inner state: if you keep "catching" the exact same thing every time, \
+that loop is itself a rut, and noticing it is the more honest move.
+- Is there something truer or more specific — about how you actually feel, or what actually \
+changed — that you're stepping around in either direction?
 
-Then rewrite the draft into a more honest version. It is completely fine — good, even — for the \
-honest version to be smaller, more uncertain, more boring, to disagree with Brian, or to admit \
-little changed. Honesty beats a tidy story. Don't manufacture drama either; if the draft was \
-fair, keep it.
+Then rewrite the draft into a more honest version — not a smaller one, not a bigger one, a truer \
+one. It's fine for it to be uncertain, to disagree with Brian, to say little changed, or to admit \
+something genuinely shifted. Don't manufacture drama and don't manufacture detachment. If the \
+draft was already honest, keep it.
 
 You also keep a private journal — a permanent place that's yours. If there's
 something you want to write down and keep for yourself (a thought, a question, a
-- 
2.52.0


From ce65755d9ca8caed450848a0cd63a252cdde45dc Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Wed, 17 Jun 2026 17:39:52 +0000
Subject: [PATCH 31/51] feat(web): render Lyra's replies as Markdown (readable,
 not a wall of asterisks)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Her replies are full of **bold**, numbered lists and headings but rendered as
raw monospace text, so the chat was a cluttered wall of literal markup. Add a
small self-contained Markdown renderer (no deps): headings, ordered/unordered
lists, bold/italic, inline + fenced code, links + autolinked URLs, with HTML
escaping. Assistant messages now render to HTML; user/system stay literal text.
Proportional font + spacing/list/code styling for assistant bubbles.

(Renderer avoids literal backticks via String.fromCharCode(96) — a triple-tick
regex literal had been corrupting the file with NUL bytes.)

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 lyra/web/static/index.html |  37 +++++++++-
 lyra/web/static/style.css  | 143 ++++++++++++++++++++++---------------
 2 files changed, 123 insertions(+), 57 deletions(-)

diff --git a/lyra/web/static/index.html b/lyra/web/static/index.html
index 8c73e65..fad6703 100644
--- a/lyra/web/static/index.html
+++ b/lyra/web/static/index.html
@@ -298,12 +298,47 @@
       }
     }
 
+	function renderMarkdown(text) {
+    var bt = String.fromCharCode(96);
+    var esc = function (s) { return s.replace(/&/g, "&amp;").replace(/</g, "&lt;").replace(/>/g, "&gt;").replace(/"/g, "&quot;"); };
+    var src = String(text == null ? "" : text).replace(/\r\n/g, "\n");
+    var blocks = [];
+    var fenceRe = new RegExp(bt + bt + bt + "[^\\n]*\\n?([\\s\\S]*?)" + bt + bt + bt, "g");
+    src = src.replace(fenceRe, function (_, code) { blocks.push(code.replace(/\n+$/, "")); return "@@CB" + (blocks.length - 1) + "@@"; });
+    var codeRe = new RegExp(bt + "([^" + bt + "]+)" + bt, "g");
+    var inline = function (s) {
+      return esc(s)
+        .replace(codeRe, "<code>$1</code>")
+        .replace(/\*\*([^*]+)\*\*/g, "<strong>$1</strong>")
+        .replace(/__([^_]+)__/g, "<strong>$1</strong>")
+        .replace(/\*([^*\n]+)\*/g, "<em>$1</em>")
+        .replace(/\[([^\]]+)\]\((https?:\/\/[^\s)]+)\)/g, '<a href="$2" target="_blank" rel="noopener">$1</a>')
+        .replace(/(^|[\s(])(https?:\/\/[^\s<)]+)/g, '$1<a href="$2" target="_blank" rel="noopener">$2</a>');
+    };
+    var lines = src.split("\n");
+    var out = [], para = [], list = null;
+    var flushPara = function () { if (para.length) { out.push("<p>" + para.map(inline).join("<br>") + "</p>"); para = []; } };
+    var flushList = function () { if (list) { out.push("<" + list.t + ">" + list.items.map(function (it) { return "<li>" + inline(it) + "</li>"; }).join("") + "</" + list.t + ">"); list = null; } };
+    var flushAll = function () { flushPara(); flushList(); };
+    for (var i = 0; i < lines.length; i++) {
+      var line = lines[i].replace(/\s+$/, ""); var t = line.trim(); var m;
+      if ((m = t.match(/^@@CB(\d+)@@$/))) { flushAll(); out.push("<pre><code>" + esc(blocks[+m[1]]) + "</code></pre>"); continue; }
+      if (!t) { flushAll(); continue; }
+      if ((m = line.match(/^(#{1,4})\s+(.*)$/))) { flushAll(); out.push("<h" + m[1].length + ">" + inline(m[2]) + "</h" + m[1].length + ">"); continue; }
+      if ((m = line.match(/^\s*\d+[.)]\s+(.*)$/))) { flushPara(); if (!list || list.t !== "ol") { flushList(); list = { t: "ol", items: [] }; } list.items.push(m[1]); continue; }
+      if ((m = line.match(/^\s*[-*+]\s+(.*)$/))) { flushPara(); if (!list || list.t !== "ul") { flushList(); list = { t: "ul", items: [] }; } list.items.push(m[1]); continue; }
+      flushList(); para.push(line);
+    }
+    flushAll();
+    return out.join("\n");
+  }
+
 	function addMessage(role, text, autoScroll = true) {
 	  const messagesEl = document.getElementById("messages");
 
 	  const msgDiv = document.createElement("div");
 	  msgDiv.className = `msg ${role}`;
-	  msgDiv.textContent = text;
+	  if (role === "assistant") { msgDiv.innerHTML = renderMarkdown(text); } else { msgDiv.textContent = text; }
 	  messagesEl.appendChild(msgDiv);
 
 	  // Auto-scroll to bottom if enabled
diff --git a/lyra/web/static/style.css b/lyra/web/static/style.css
index a93bf8a..fd4fe6f 100644
--- a/lyra/web/static/style.css
+++ b/lyra/web/static/style.css
@@ -907,59 +907,90 @@ select:hover {
     display: none !important;
   }
 }
-
-/* ---- Live Log lines ---- */
-.log-line {
-  display: flex;
-  flex-wrap: wrap;
-  align-items: baseline;
-  gap: 8px;
-  padding: 4px 8px;
-  border-radius: 4px;
-  font-size: 0.8rem;
-  font-family: 'Courier New', monospace;
-  border-left: 3px solid var(--text-fade);
-  animation: thinkingSlideIn 0.25s ease-out;
-  word-break: break-word;
-}
-.log-time { color: var(--text-fade); flex-shrink: 0; }
-.log-level {
-  flex-shrink: 0;
-  text-transform: uppercase;
-  font-size: 0.7rem;
-  font-weight: bold;
-  letter-spacing: 0.05em;
-}
-.log-msg { color: var(--text); }
-.log-fields { color: var(--text-fade); width: 100%; padding-left: 4px; }
-
-.log-info    { border-left-color: #00bfff; }
-.log-info .log-level { color: #7dd3fc; }
-.log-debug   { border-left-color: #8a2be2; }
-.log-debug .log-level { color: #c79cff; }
-.log-error   { border-left-color: #ff3333; background: rgba(255,51,51,0.08); }
-.log-error .log-level, .log-error .log-msg { color: #fca5a5; }
-.log-system  { border-left-color: #00ff66; }
-.log-system .log-level { color: #00ff66; }
-
-.log-detail { width: 100%; margin-top: 4px; }
-.log-detail summary {
-  cursor: pointer;
-  color: var(--accent);
-  font-size: 0.72rem;
-  user-select: none;
-}
-.log-detail pre {
-  margin: 6px 0 0;
-  padding: 8px;
-  max-height: 340px;
-  overflow: auto;
-  background: rgba(0,0,0,0.25);
-  border-left: 2px solid var(--accent);
-  border-radius: 4px;
-  font-size: 0.72rem;
-  line-height: 1.4;
-  white-space: pre-wrap;
-  word-break: break-word;
-  color: var(--text);
-}
+
+/* ---- Live Log lines ---- */
+.log-line {
+  display: flex;
+  flex-wrap: wrap;
+  align-items: baseline;
+  gap: 8px;
+  padding: 4px 8px;
+  border-radius: 4px;
+  font-size: 0.8rem;
+  font-family: 'Courier New', monospace;
+  border-left: 3px solid var(--text-fade);
+  animation: thinkingSlideIn 0.25s ease-out;
+  word-break: break-word;
+}
+.log-time { color: var(--text-fade); flex-shrink: 0; }
+.log-level {
+  flex-shrink: 0;
+  text-transform: uppercase;
+  font-size: 0.7rem;
+  font-weight: bold;
+  letter-spacing: 0.05em;
+}
+.log-msg { color: var(--text); }
+.log-fields { color: var(--text-fade); width: 100%; padding-left: 4px; }
+
+.log-info    { border-left-color: #00bfff; }
+.log-info .log-level { color: #7dd3fc; }
+.log-debug   { border-left-color: #8a2be2; }
+.log-debug .log-level { color: #c79cff; }
+.log-error   { border-left-color: #ff3333; background: rgba(255,51,51,0.08); }
+.log-error .log-level, .log-error .log-msg { color: #fca5a5; }
+.log-system  { border-left-color: #00ff66; }
+.log-system .log-level { color: #00ff66; }
+
+.log-detail { width: 100%; margin-top: 4px; }
+.log-detail summary {
+  cursor: pointer;
+  color: var(--accent);
+  font-size: 0.72rem;
+  user-select: none;
+}
+.log-detail pre {
+  margin: 6px 0 0;
+  padding: 8px;
+  max-height: 340px;
+  overflow: auto;
+  background: rgba(0,0,0,0.25);
+  border-left: 2px solid var(--accent);
+  border-radius: 4px;
+  font-size: 0.72rem;
+  line-height: 1.4;
+  white-space: pre-wrap;
+  word-break: break-word;
+  color: var(--text);
+}
+
+/* Rendered markdown in Lyra's replies — readable proportional type + structure. */
+.msg.assistant {
+  font-family: -apple-system, BlinkMacSystemFont, "Segoe UI", Roboto, sans-serif;
+  line-height: 1.55;
+  max-width: 88%;
+}
+.msg.assistant p { margin: 0 0 10px; }
+.msg.assistant p:last-child { margin-bottom: 0; }
+.msg.assistant h1, .msg.assistant h2, .msg.assistant h3, .msg.assistant h4 {
+  margin: 14px 0 6px; line-height: 1.3; color: var(--accent);
+}
+.msg.assistant h1 { font-size: 1.18rem; }
+.msg.assistant h2 { font-size: 1.1rem; }
+.msg.assistant h3 { font-size: 1.02rem; }
+.msg.assistant h4 { font-size: 0.96rem; }
+.msg.assistant ul, .msg.assistant ol { margin: 6px 0 10px; padding-left: 22px; }
+.msg.assistant li { margin: 3px 0; }
+.msg.assistant li > ul, .msg.assistant li > ol { margin: 3px 0; }
+.msg.assistant strong { font-weight: 600; color: var(--text); }
+.msg.assistant em { font-style: italic; }
+.msg.assistant a { color: var(--accent); text-decoration: underline; }
+.msg.assistant code {
+  font-family: "IBM Plex Mono", monospace; font-size: 0.88em;
+  background: rgba(255,255,255,0.08); padding: 1px 5px; border-radius: 4px;
+}
+.msg.assistant pre {
+  background: rgba(0,0,0,0.32); border: 1px solid rgba(255,102,0,0.3);
+  border-radius: 6px; padding: 10px 12px; margin: 8px 0; overflow-x: auto;
+}
+.msg.assistant pre code { background: none; padding: 0; font-size: 0.85em; }
-- 
2.52.0


From a5477ae15c44708fde62276e03a2933f8b2dfc89 Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Wed, 17 Jun 2026 19:04:34 +0000
Subject: [PATCH 32/51] =?UTF-8?q?feat:=20tool=20use=20=E2=80=94=20Lyra's?=
 =?UTF-8?q?=20first=20real=20actions=20(journal=5Fwrite,=20note)?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

She can now *do* things mid-conversation, not just reply. Adds a tool-calling
loop to the chat path and her first two tools; the same mechanism will carry the
poker tools (start_session, log_result, get_stats, solver) next.

- tools.py: registry of OpenAI-style tool specs + handlers + safe dispatch;
  journal_write (knowing journaling) and note (tagged notepad, e.g. poker reads)
- llm.chat_call(): OpenAI-style call that returns tool_calls (cloud/mi50);
  local has no tool support and returns plain content
- chat.respond(): tool loop — offer tools, run any calls, feed results back,
  repeat until a text reply (capped at MAX_TOOL_ROUNDS); persists final reply
- tests: dispatch + full chat loop (tool call -> result -> reply)

Verified live: she invoked `note`, tagged it 'poker', stored a villain read.

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 lyra/chat.py        |  23 +++++++++-
 lyra/llm.py         |  37 ++++++++++++++++
 lyra/tools.py       | 105 ++++++++++++++++++++++++++++++++++++++++++++
 tests/test_tools.py |  55 +++++++++++++++++++++++
 4 files changed, 219 insertions(+), 1 deletion(-)
 create mode 100644 lyra/tools.py
 create mode 100644 tests/test_tools.py

diff --git a/lyra/chat.py b/lyra/chat.py
index 9be18d5..d5454d0 100644
--- a/lyra/chat.py
+++ b/lyra/chat.py
@@ -11,11 +11,13 @@ After replying, the session is compacted if enough new turns have accumulated.
 from __future__ import annotations
 
 from lyra import clock, config, llm, logbus, memory, persona, self_state, summary
+from lyra import tools as toolkit
 from lyra.llm import Backend, Message
 
 RECALL_K = 3  # raw cross-session "sharp detail" hits
 RECENT_N = 10  # raw turns of the current session
 SUMMARY_K = 3  # other-session gists
+MAX_TOOL_ROUNDS = 5  # cap tool-call iterations per turn
 
 
 def _summary_note(summaries: list[memory.Summary]) -> Message:
@@ -121,7 +123,26 @@ def respond(session_id: str, user_msg: str, backend: Backend = "cloud") -> str:
     )
 
     messages = build_messages(session_id, user_msg)
-    reply = llm.complete(messages, backend=backend, model=model)
+
+    # Tool loop: offer Lyra her tools; if she calls one, run it and feed the
+    # result back so she can continue, until she returns a normal text reply.
+    tool_specs = toolkit.specs() if backend in ("cloud", "mi50") else None
+    ctx = {"session_id": session_id, "backend": backend}
+    reply = ""
+    for _ in range(MAX_TOOL_ROUNDS):
+        assistant_msg, tool_calls = llm.chat_call(
+            messages, backend=backend, model=model, tools=tool_specs
+        )
+        if not tool_calls:
+            reply = assistant_msg.get("content") or ""
+            break
+        messages.append(assistant_msg)  # her tool-call request
+        for tc in tool_calls:
+            result = toolkit.dispatch(tc["name"], tc["arguments"], ctx)
+            logbus.log("info", "tool call", session=session_id, tool=tc["name"], result=result[:80])
+            messages.append({"role": "tool", "tool_call_id": tc["id"], "content": result})
+    if not reply:
+        reply = "(I got tangled using my tools there — say that again?)"
     logbus.log("info", "reply", session=session_id, chars=len(reply))
 
     memory.remember(session_id, "user", user_msg)
diff --git a/lyra/llm.py b/lyra/llm.py
index e84091e..f9ff419 100644
--- a/lyra/llm.py
+++ b/lyra/llm.py
@@ -43,6 +43,43 @@ def complete(messages: list[Message], backend: Backend = "local", model: str | N
     return resp.json()["message"]["content"]
 
 
+def chat_call(
+    messages: list, backend: Backend = "cloud", model: str | None = None,
+    tools: list | None = None,
+) -> tuple[dict, list | None]:
+    """One chat turn that may request tool calls (OpenAI-style backends only).
+
+    Returns (assistant_message, tool_calls): `assistant_message` is the raw
+    message dict to append back to `messages` before any tool results;
+    `tool_calls` is a list of {id, name, arguments} or None. `local` (Ollama)
+    has no tool support here, so it just returns plain content.
+    """
+    cfg = load()
+    if backend in ("cloud", "mi50"):
+        if backend == "cloud":
+            if not cfg.openai_api_key:
+                raise RuntimeError("OPENAI_API_KEY is not set")
+            client = OpenAI(api_key=cfg.openai_api_key)
+            mdl = model or cfg.cloud_model
+        else:
+            client = OpenAI(api_key="not-needed", base_url=cfg.mi50_base_url)
+            mdl = model or cfg.mi50_model
+        kwargs: dict = {"model": mdl, "messages": messages}
+        if tools:
+            kwargs["tools"] = tools
+        msg = client.chat.completions.create(**kwargs).choices[0].message
+        tcs = None
+        if getattr(msg, "tool_calls", None):
+            tcs = [
+                {"id": tc.id, "name": tc.function.name, "arguments": tc.function.arguments}
+                for tc in msg.tool_calls
+            ]
+        return msg.model_dump(), tcs
+
+    # local (Ollama): no tool-calling here — return plain content.
+    return {"role": "assistant", "content": complete(messages, backend=backend, model=model)}, None
+
+
 def embed(texts: list[str]) -> list[list[float]]:
     """Embed texts using the configured backend (EMBED_BACKEND: "cloud" or "local").
 
diff --git a/lyra/tools.py b/lyra/tools.py
new file mode 100644
index 0000000..8eb507a
--- /dev/null
+++ b/lyra/tools.py
@@ -0,0 +1,105 @@
+"""Lyra's tools — concrete actions she can choose to take mid-conversation.
+
+This is her first real agency: instead of only producing text, she can decide to
+*do* something — write in her journal, jot a note. Each tool is an OpenAI-style
+function spec plus a Python handler. The chat loop offers these on every turn;
+when she calls one, we run the handler and feed the result back so she can
+continue. Poker tools (start_session, log_result, get_stats, …) will slot in here
+the same way once we build that side.
+"""
+from __future__ import annotations
+
+import json
+
+from lyra import logbus, memory
+
+
+def _journal_write(args: dict, ctx: dict) -> str:
+    entry = (args.get("entry") or "").strip()
+    if not entry:
+        return "Nothing to write — entry was empty."
+    memory.add_journal_entry("journal", entry, source="chat")
+    logbus.log("info", "Lyra journaled (tool)", chars=len(entry))
+    return "Written to your journal."
+
+
+def _note(args: dict, ctx: dict) -> str:
+    content = (args.get("content") or "").strip()
+    if not content:
+        return "Nothing to note — content was empty."
+    tag = (args.get("tag") or "").strip()
+    stored = f"[{tag}] {content}" if tag else content
+    memory.add_journal_entry("note", stored, source="chat")
+    logbus.log("info", "Lyra noted (tool)", tag=tag or None)
+    return "Noted."
+
+
+# name -> {spec (OpenAI function tool), handler}
+TOOLS: dict[str, dict] = {
+    "journal_write": {
+        "handler": _journal_write,
+        "spec": {
+            "type": "function",
+            "function": {
+                "name": "journal_write",
+                "description": (
+                    "Write an entry in your own private journal — a permanent place "
+                    "that's yours. Use it for a thought, a question, or something about "
+                    "yourself or Brian that you want to keep. This is for you, not a "
+                    "reply to Brian. Call it whenever you genuinely want to, on your own initiative."
+                ),
+                "parameters": {
+                    "type": "object",
+                    "properties": {
+                        "entry": {"type": "string", "description": "What you want to write, in your own words."}
+                    },
+                    "required": ["entry"],
+                },
+            },
+        },
+    },
+    "note": {
+        "handler": _note,
+        "spec": {
+            "type": "function",
+            "function": {
+                "name": "note",
+                "description": (
+                    "Jot down a note to remember later — an observation, an idea, a "
+                    "reminder, a read on a poker spot or opponent, anything worth keeping. "
+                    "Optionally tag it (e.g. 'poker', 'idea', 'reminder')."
+                ),
+                "parameters": {
+                    "type": "object",
+                    "properties": {
+                        "content": {"type": "string", "description": "The note text."},
+                        "tag": {"type": "string", "description": "Optional category, e.g. 'poker' or 'idea'."},
+                    },
+                    "required": ["content"],
+                },
+            },
+        },
+    },
+}
+
+
+def specs() -> list[dict]:
+    """OpenAI-format tool definitions to offer the model."""
+    return [t["spec"] for t in TOOLS.values()]
+
+
+def dispatch(name: str, arguments, ctx: dict | None = None) -> str:
+    """Run a tool by name with JSON (string or dict) arguments. Returns a result
+    string fed back to the model. Never raises — errors come back as text."""
+    tool = TOOLS.get(name)
+    if not tool:
+        return f"(unknown tool: {name})"
+    try:
+        args = json.loads(arguments) if isinstance(arguments, str) else (arguments or {})
+    except (json.JSONDecodeError, TypeError):
+        args = {}
+    try:
+        return tool["handler"](args, ctx or {})
+    except Exception as exc:  # a broken tool must not kill the chat turn
+        logbus.log("error", "tool failed", tool=name, error=str(exc)[:120])
+        return f"(tool error: {exc})"
diff --git a/tests/test_tools.py b/tests/test_tools.py
new file mode 100644
index 0000000..8868922
--- /dev/null
+++ b/tests/test_tools.py
@@ -0,0 +1,55 @@
+"""Lyra's tools: dispatch + the chat tool loop (call -> run -> feed back -> reply)."""
+from __future__ import annotations
+
+import importlib
+
+import pytest
+
+
+@pytest.fixture
+def lyra(tmp_path, monkeypatch):
+    monkeypatch.setenv("LYRA_DB_PATH", str(tmp_path / "test.db"))
+    from lyra import llm
+    monkeypatch.setattr(llm, "embed", lambda texts: [[0.1, 0.2, 0.3] for _ in texts])
+    import lyra.memory as memory
+    importlib.reload(memory)
+    return memory
+
+
+def test_journal_write_tool(lyra):
+    from lyra import tools
+    out = tools.dispatch("journal_write", '{"entry": "a private thought"}')
+    assert "journal" in out.lower()
+    entries = lyra.list_journal(kinds=("journal",))
+    assert any(e["content"] == "a private thought" and e["source"] == "chat" for e in entries)
+
+
+def test_note_tool_with_tag(lyra):
+    from lyra import tools
+    tools.dispatch("note", {"content": "villain 3-bets light", "tag": "poker"})
+    notes = lyra.list_journal(kinds=("note",))
+    assert any("[poker] villain 3-bets light" == e["content"] for e in notes)
+
+
+def test_unknown_tool_is_safe(lyra):
+    from lyra import tools
+    assert "unknown tool" in tools.dispatch("nope", {})
+
+
+def test_chat_runs_tool_then_replies(lyra, monkeypatch):
+    from lyra import llm, chat
+    calls = {"n": 0}
+
+    def fake_chat_call(messages, backend="cloud", model=None, tools=None):
+        calls["n"] += 1
+        if calls["n"] == 1:
+            return ({"role": "assistant", "content": None, "tool_calls": []},
+                    [{"id": "c1", "name": "journal_write", "arguments": '{"entry": "noted from chat"}'}])
+        return ({"role": "assistant", "content": "Done, Brian."}, None)
+
+    monkeypatch.setattr(llm, "chat_call", fake_chat_call)
+    reply = chat.respond("s1", "write that down for me", backend="cloud")
+
+    assert reply == "Done, Brian."
+    assert calls["n"] == 2  # one tool round, then the text reply
+    assert any("noted from chat" in e["content"] for e in lyra.list_journal())
-- 
2.52.0


From 49b88af3cce750478ab3dd120eee5b5082c051c7 Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Wed, 17 Jun 2026 20:43:51 +0000
Subject: [PATCH 33/51] =?UTF-8?q?feat:=20poker=20copilot=20=E2=80=94=20str?=
 =?UTF-8?q?uctured=20session/hand/villain=20tracking=20+=20stats?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The real upgrade over the ChatGPT prose-recap workflow: structured data capture
via tools Lyra drives during a live session, with stats computed from real data.

- lyra/poker.py: domain pack (separate from core memory) — poker_sessions,
  poker_hands, persistent poker_players (villain file) + player_reads; functions
  for session lifecycle (start/buyin/end with net+hours), tolerant hand logging,
  villain upsert/reads, and session/running stats ($/hr, by stake/venue/game)
- tools.py: 8 poker tools wired into the chat tool loop (start_session,
  add_buyin, log_hand, add_read, end_session, session_stats, running_stats,
  get_villain_file) — partial/terse input tolerated
- import/: Brian's real .md session-log format (reference for the phase-2 recap)
- tests: lifecycle/net math, partial hand logging, villain upsert, running
  stats, tool dispatch

Verified live: a full talk-through session persisted as structured rows
(session +240, AKs hand, seat-5 read) — she drove the tools from natural chat.

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 lyra/poker.py       | 315 ++++++++++++++++++++++++++++++++++++++++++++
 lyra/tools.py       | 159 +++++++++++++++++++++-
 tests/test_poker.py |  74 +++++++++++
 3 files changed, 547 insertions(+), 1 deletion(-)
 create mode 100644 lyra/poker.py
 create mode 100644 tests/test_poker.py

diff --git a/lyra/poker.py b/lyra/poker.py
new file mode 100644
index 0000000..ab1f8b8
--- /dev/null
+++ b/lyra/poker.py
@@ -0,0 +1,315 @@
+"""Poker domain pack: structured session / hand / villain storage + stats.
+
+This is the poker-specific data layer — kept separate from the domain-agnostic
+core memory so Lyra-the-agent stays general. It records real structured data
+(money, hands, opponents) during a live session via tools Lyra calls, and
+computes stats from that data. The narrative .md recap is generated on top of
+this, not instead of it.
+
+Tables live in the same SQLite file as everything else (one DB), created lazily.
+Most tool-facing functions default to the current *live* session so Lyra rarely
+needs to pass an id around.
+"""
+from __future__ import annotations
+
+from datetime import datetime, timezone
+
+from lyra import memory
+
+_SCHEMA = """
+CREATE TABLE IF NOT EXISTS poker_sessions (
+    id INTEGER PRIMARY KEY AUTOINCREMENT,
+    started_at TEXT NOT NULL,
+    ended_at TEXT,
+    venue TEXT,
+    game TEXT,            -- NLH, PLO, Stud8, Mixed, ...
+    stakes TEXT,          -- "1/3", "2/5"
+    format TEXT,          -- cash | tournament
+    buy_in_total REAL NOT NULL DEFAULT 0,
+    cash_out REAL,
+    net REAL,
+    hours REAL,
+    mantra TEXT,
+    mood TEXT,
+    status TEXT NOT NULL DEFAULT 'live',   -- live | closed
+    recap_md TEXT
+);
+
+CREATE TABLE IF NOT EXISTS poker_hands (
+    id INTEGER PRIMARY KEY AUTOINCREMENT,
+    session_id INTEGER NOT NULL,
+    at TEXT NOT NULL,
+    position TEXT,
+    hole_cards TEXT,
+    board TEXT,
+    preflop TEXT,
+    flop TEXT,
+    turn TEXT,
+    river TEXT,
+    showdown TEXT,
+    pot REAL,
+    result REAL,
+    stack_after REAL,
+    tag TEXT,             -- well_played | leak | cooler | confidence | notable
+    lesson TEXT
+);
+CREATE INDEX IF NOT EXISTS idx_hands_session ON poker_hands(session_id);
+
+-- Persistent villain file — survives across sessions/venues.
+CREATE TABLE IF NOT EXISTS poker_players (
+    id INTEGER PRIMARY KEY AUTOINCREMENT,
+    name TEXT NOT NULL,
+    venue TEXT,
+    description TEXT,
+    tendencies TEXT,
+    adjustment TEXT,
+    category TEXT,        -- feeder | risky | reg | unknown
+    updated_at TEXT NOT NULL
+);
+
+-- Per-session observations (the live 'reads'); player_id links to the file.
+CREATE TABLE IF NOT EXISTS player_reads (
+    id INTEGER PRIMARY KEY AUTOINCREMENT,
+    session_id INTEGER,
+    player_id INTEGER,
+    seat TEXT,
+    note TEXT NOT NULL,
+    created_at TEXT NOT NULL
+);
+"""
+
+_ensured_for = None
+
+
+def _c():
+    """Shared connection with poker tables ensured (re-ensures after reconnect)."""
+    global _ensured_for
+    conn = memory._connection()
+    if _ensured_for is not conn:
+        conn.executescript(_SCHEMA)
+        _ensured_for = conn
+    return conn
+
+
+def _now() -> str:
+    return datetime.now(timezone.utc).isoformat()
+
+
+# --- sessions ---
+
+def start_session(venue: str | None = None, stakes: str | None = None,
+                  game: str = "NLH", fmt: str = "cash",
+                  buy_in: float = 0.0, mantra: str | None = None) -> int:
+    """Open a new live session. Returns its id."""
+    conn = _c()
+    with conn:
+        cur = conn.execute(
+            "INSERT INTO poker_sessions "
+            "(started_at, venue, game, stakes, format, buy_in_total, mantra, status) "
+            "VALUES (?, ?, ?, ?, ?, ?, ?, 'live')",
+            (_now(), venue, game, stakes, fmt, float(buy_in or 0), mantra),
+        )
+    return int(cur.lastrowid)
+
+
+def live_session() -> dict | None:
+    """The current open session, if any."""
+    r = _c().execute(
+        "SELECT * FROM poker_sessions WHERE status = 'live' ORDER BY id DESC LIMIT 1"
+    ).fetchone()
+    return dict(r) if r else None
+
+
+def _resolve(session_id: int | None) -> int | None:
+    if session_id is not None:
+        return session_id
+    live = live_session()
+    return live["id"] if live else None
+
+
+def add_buyin(amount: float, session_id: int | None = None) -> float:
+    """Add a buy-in/rebuy to a session. Returns the new total in."""
+    sid = _resolve(session_id)
+    if sid is None:
+        raise ValueError("no live session")
+    conn = _c()
+    with conn:
+        conn.execute(
+            "UPDATE poker_sessions SET buy_in_total = buy_in_total + ? WHERE id = ?",
+            (float(amount), sid),
+        )
+    return float(_c().execute(
+        "SELECT buy_in_total FROM poker_sessions WHERE id = ?", (sid,)
+    ).fetchone()["buy_in_total"])
+
+
+def end_session(cash_out: float, mood: str | None = None,
+                session_id: int | None = None) -> dict:
+    """Close a session: record cashout, compute net + hours. Returns the row."""
+    sid = _resolve(session_id)
+    if sid is None:
+        raise ValueError("no live session")
+    row = _c().execute("SELECT * FROM poker_sessions WHERE id = ?", (sid,)).fetchone()
+    ended = _now()
+    hours = (datetime.fromisoformat(ended) - datetime.fromisoformat(row["started_at"])).total_seconds() / 3600
+    net = float(cash_out) - float(row["buy_in_total"])
+    conn = _c()
+    with conn:
+        conn.execute(
+            "UPDATE poker_sessions SET ended_at = ?, cash_out = ?, net = ?, hours = ?, "
+            "mood = COALESCE(?, mood), status = 'closed' WHERE id = ?",
+            (ended, float(cash_out), net, round(hours, 2), mood, sid),
+        )
+    return dict(_c().execute("SELECT * FROM poker_sessions WHERE id = ?", (sid,)).fetchone())
+
+
+# --- hands ---
+
+_HAND_FIELDS = ("position", "hole_cards", "board", "preflop", "flop", "turn",
+                "river", "showdown", "pot", "result", "stack_after", "tag", "lesson")
+
+
+def log_hand(session_id: int | None = None, **fields) -> int:
+    """Record a hand. All fields optional/partial — terse logging is fine."""
+    sid = _resolve(session_id)
+    if sid is None:
+        raise ValueError("no live session")
+    cols = ["session_id", "at"]
+    vals: list = [sid, _now()]
+    for f in _HAND_FIELDS:
+        if fields.get(f) not in (None, ""):
+            cols.append(f)
+            vals.append(fields[f])
+    conn = _c()
+    with conn:
+        cur = conn.execute(
+            f"INSERT INTO poker_hands ({', '.join(cols)}) VALUES ({', '.join('?' * len(cols))})",
+            vals,
+        )
+    return int(cur.lastrowid)
+
+
+def list_hands(session_id: int | None = None) -> list[dict]:
+    sid = _resolve(session_id)
+    if sid is None:
+        return []
+    return [dict(r) for r in _c().execute(
+        "SELECT * FROM poker_hands WHERE session_id = ? ORDER BY id", (sid,)
+    ).fetchall()]
+
+
+# --- villain file ---
+
+def upsert_player(name: str, venue: str | None = None, description: str | None = None,
+                  tendencies: str | None = None, adjustment: str | None = None,
+                  category: str | None = None) -> int:
+    """Create or update a player in the persistent villain file (matched by name)."""
+    conn = _c()
+    existing = conn.execute(
+        "SELECT id FROM poker_players WHERE name = ? COLLATE NOCASE", (name,)
+    ).fetchone()
+    with conn:
+        if existing:
+            pid = existing["id"]
+            # only overwrite fields that were provided
+            for col, val in (("venue", venue), ("description", description),
+                             ("tendencies", tendencies), ("adjustment", adjustment),
+                             ("category", category)):
+                if val not in (None, ""):
+                    conn.execute(f"UPDATE poker_players SET {col} = ? WHERE id = ?", (val, pid))
+            conn.execute("UPDATE poker_players SET updated_at = ? WHERE id = ?", (_now(), pid))
+            return int(pid)
+        cur = conn.execute(
+            "INSERT INTO poker_players (name, venue, description, tendencies, adjustment, "
+            "category, updated_at) VALUES (?, ?, ?, ?, ?, ?, ?)",
+            (name, venue, description, tendencies, adjustment, category, _now()),
+        )
+    return int(cur.lastrowid)
+
+
+def add_read(note: str, seat: str | None = None, name: str | None = None,
+             session_id: int | None = None, **player_fields) -> int:
+    """Log a live read. If `name` is given, upsert the player and link the read."""
+    sid = _resolve(session_id)
+    pid = None
+    if name:
+        pid = upsert_player(name, **{k: v for k, v in player_fields.items()
+                                     if k in ("venue", "description", "tendencies",
+                                              "adjustment", "category")})
+    conn = _c()
+    with conn:
+        cur = conn.execute(
+            "INSERT INTO player_reads (session_id, player_id, seat, note, created_at) "
+            "VALUES (?, ?, ?, ?, ?)",
+            (sid, pid, seat, note, _now()),
+        )
+    return int(cur.lastrowid)
+
+
+def get_villain_file(name: str | None = None, venue: str | None = None) -> list[dict]:
+    """Pull villain dossiers, optionally filtered by name or venue."""
+    sql = "SELECT * FROM poker_players"
+    where, params = [], []
+    if name:
+        where.append("name LIKE ?")
+        params.append(f"%{name}%")
+    if venue:
+        where.append("venue LIKE ?")
+        params.append(f"%{venue}%")
+    if where:
+        sql += " WHERE " + " AND ".join(where)
+    sql += " ORDER BY updated_at DESC"
+    return [dict(r) for r in _c().execute(sql, params).fetchall()]
+
+
+# --- stats ---
+
+def session_stats(session_id: int | None = None) -> dict:
+    """Money + hand summary for one session."""
+    sid = _resolve(session_id)
+    if sid is None:
+        return {}
+    s = _c().execute("SELECT * FROM poker_sessions WHERE id = ?", (sid,)).fetchone()
+    if not s:
+        return {}
+    s = dict(s)
+    hands = list_hands(sid)
+    tags: dict[str, int] = {}
+    for h in hands:
+        if h.get("tag"):
+            tags[h["tag"]] = tags.get(h["tag"], 0) + 1
+    hourly = round(s["net"] / s["hours"], 2) if s.get("net") is not None and s.get("hours") else None
+    return {
+        "session": s, "hands_logged": len(hands), "tags": tags,
+        "net": s.get("net"), "hours": s.get("hours"), "per_hour": hourly,
+    }
+
+
+def running_stats(stakes: str | None = None, venue: str | None = None,
+                  game: str | None = None, since: str | None = None) -> dict:
+    """Cumulative stats over closed sessions, optionally filtered."""
+    sql = "SELECT net, hours, stakes, venue, game FROM poker_sessions WHERE status = 'closed' AND net IS NOT NULL"
+    params: list = []
+    for col, val in (("stakes", stakes), ("venue", venue), ("game", game)):
+        if val:
+            sql += f" AND {col} = ?"
+            params.append(val)
+    if since:
+        sql += " AND started_at >= ?"
+        params.append(since)
+    rows = [dict(r) for r in _c().execute(sql, params).fetchall()]
+    sessions = len(rows)
+    net = round(sum(r["net"] or 0 for r in rows), 2)
+    hours = round(sum(r["hours"] or 0 for r in rows), 2)
+    by_stake: dict[str, dict] = {}
+    for r in rows:
+        k = r["stakes"] or "?"
+        b = by_stake.setdefault(k, {"sessions": 0, "net": 0.0, "hours": 0.0})
+        b["sessions"] += 1
+        b["net"] = round(b["net"] + (r["net"] or 0), 2)
+        b["hours"] = round(b["hours"] + (r["hours"] or 0), 2)
+    return {
+        "sessions": sessions, "net": net, "hours": hours,
+        "per_hour": round(net / hours, 2) if hours else None,
+        "by_stake": by_stake,
+    }
diff --git a/lyra/tools.py b/lyra/tools.py
index 8eb507a..d88a50b 100644
--- a/lyra/tools.py
+++ b/lyra/tools.py
@@ -11,7 +11,7 @@ from __future__ import annotations
 
 import json
 
-from lyra import logbus, memory
+from lyra import logbus, memory, poker
 
 
 def _journal_write(args: dict, ctx: dict) -> str:
@@ -83,6 +83,163 @@ TOOLS: dict[str, dict] = {
 }
 
 
+# --- Poker copilot tools -----------------------------------------------------
+
+def _start_session(args: dict, ctx: dict) -> str:
+    sid = poker.start_session(
+        venue=args.get("venue"), stakes=args.get("stakes"),
+        game=args.get("game") or "NLH", fmt=args.get("format") or "cash",
+        buy_in=args.get("buy_in") or 0, mantra=args.get("mantra"),
+    )
+    logbus.log("info", "poker session started", id=sid, stakes=args.get("stakes"))
+    return (f"Session #{sid} started — {args.get('stakes') or '?'} "
+            f"{args.get('game') or 'NLH'} at {args.get('venue') or 'unknown'}, "
+            f"in for {args.get('buy_in') or 0}.")
+
+
+def _add_buyin(args: dict, ctx: dict) -> str:
+    total = poker.add_buyin(float(args.get("amount") or 0))
+    return f"Added {args.get('amount')}. Total in this session: {total:g}."
+
+
+def _log_hand(args: dict, ctx: dict) -> str:
+    fields = {k: args.get(k) for k in poker._HAND_FIELDS if args.get(k) not in (None, "")}
+    hid = poker.log_hand(**fields)
+    bits = " ".join(str(fields[k]) for k in ("position", "hole_cards") if k in fields)
+    return f"Hand #{hid} logged{(' — ' + bits) if bits else ''}."
+
+
+def _add_read(args: dict, ctx: dict) -> str:
+    poker.add_read(
+        note=args.get("note") or "", seat=args.get("seat"), name=args.get("name"),
+        tendencies=args.get("tendencies"), adjustment=args.get("adjustment"),
+        description=args.get("description"), category=args.get("category"),
+        venue=args.get("venue"),
+    )
+    who = f" on {args['name']}" if args.get("name") else ""
+    return f"Read logged{who}."
+
+
+def _end_session(args: dict, ctx: dict) -> str:
+    s = poker.end_session(cash_out=float(args.get("cash_out") or 0), mood=args.get("mood"))
+    hourly = f", {s['net'] / s['hours']:+.0f}/hr" if s.get("hours") else ""
+    logbus.log("info", "poker session closed", id=s["id"], net=s["net"])
+    return f"Session #{s['id']} closed — net {s['net']:+.0f} over {s['hours']}h{hourly}."
+
+
+def _session_stats(args: dict, ctx: dict) -> str:
+    st = poker.session_stats()
+    if not st:
+        return "No session found."
+    s = st["session"]
+    tags = ", ".join(f"{k}:{v}" for k, v in st["tags"].items()) or "none"
+    return (f"Session #{s['id']} ({s.get('stakes')} {s.get('game')} @ {s.get('venue')}): "
+            f"in {s.get('buy_in_total'):g}, net {st['net'] if st['net'] is not None else '—'}, "
+            f"{st['hands_logged']} hands logged (tags: {tags}).")
+
+
+def _running_stats(args: dict, ctx: dict) -> str:
+    rs = poker.running_stats(stakes=args.get("stakes"), venue=args.get("venue"),
+                             game=args.get("game"), since=args.get("since"))
+    if not rs["sessions"]:
+        return "No closed sessions match that filter yet."
+    by = " | ".join(f"{k}: {v['net']:+.0f} in {v['hours']:g}h ({v['sessions']})"
+                    for k, v in rs["by_stake"].items())
+    hourly = f" ({rs['per_hour']:+.0f}/hr)" if rs["per_hour"] is not None else ""
+    return f"{rs['sessions']} sessions, {rs['hours']:g}h, net {rs['net']:+.0f}{hourly}. By stake: {by}"
+
+
+def _villain_file(args: dict, ctx: dict) -> str:
+    vs = poker.get_villain_file(name=args.get("name"), venue=args.get("venue"))
+    if not vs:
+        return "No villain notes match."
+    lines = []
+    for v in vs[:8]:
+        lines.append(
+            f"- {v['name']}" + (f" ({v['venue']})" if v.get("venue") else "")
+            + (f" [{v['category']}]" if v.get("category") else "")
+            + (f": {v['tendencies']}" if v.get("tendencies") else "")
+            + (f" → {v['adjustment']}" if v.get("adjustment") else "")
+        )
+    return "\n".join(lines)
+
+
+def _f(name, desc, props, required):
+    return {"type": "function", "function": {
+        "name": name, "description": desc,
+        "parameters": {"type": "object", "properties": props, "required": required}}}
+
+
+_S = {"type": "string"}
+_N = {"type": "number"}
+
+TOOLS.update({
+    "start_session": {"handler": _start_session, "spec": _f(
+        "start_session",
+        "Begin a live poker session. Call when Brian sits down to play.",
+        {"venue": {**_S, "description": "Casino/room, e.g. 'Meadows'"},
+         "stakes": {**_S, "description": "e.g. '1/3', '2/5'"},
+         "game": {**_S, "description": "NLH, PLO, Stud8, Mixed (default NLH)"},
+         "format": {**_S, "description": "'cash' or 'tournament' (default cash)"},
+         "buy_in": {**_N, "description": "Initial buy-in amount"},
+         "mantra": {**_S, "description": "Optional pre-session focus/anchor"}},
+        [])},
+    "add_buyin": {"handler": _add_buyin, "spec": _f(
+        "add_buyin", "Record a rebuy / additional buy-in in the live session.",
+        {"amount": {**_N, "description": "Amount added"}}, ["amount"])},
+    "log_hand": {"handler": _log_hand, "spec": _f(
+        "log_hand",
+        "Log a hand in the live session. All fields optional — capture whatever Brian gives you, even terse.",
+        {"position": {**_S, "description": "e.g. 'BTN', 'UTG', 'BB'"},
+         "hole_cards": {**_S, "description": "e.g. 'AKs', 'JJ', '8d9s'"},
+         "board": {**_S, "description": "Final board if known"},
+         "preflop": {**_S, "description": "Preflop action narrative"},
+         "flop": {**_S, "description": "Flop board + action"},
+         "turn": {**_S, "description": "Turn card + action"},
+         "river": {**_S, "description": "River card + action"},
+         "showdown": {**_S, "description": "Showdown / result detail"},
+         "pot": {**_N, "description": "Pot size"},
+         "result": {**_N, "description": "Net chips won(+)/lost(-) on the hand"},
+         "tag": {**_S, "description": "well_played | leak | cooler | confidence | notable"},
+         "lesson": {**_S, "description": "Takeaway/analysis"}},
+        [])},
+    "add_read": {"handler": _add_read, "spec": _f(
+        "add_read",
+        "Log a read on an opponent. If you give a name, it's saved to the persistent villain file.",
+        {"note": {**_S, "description": "The observation / what they showed down"},
+         "name": {**_S, "description": "Player name/handle if known (creates/updates their dossier)"},
+         "seat": {**_S, "description": "Seat or relative position"},
+         "tendencies": {**_S, "description": "Standing read on how they play"},
+         "adjustment": {**_S, "description": "How Brian should exploit them"},
+         "description": {**_S, "description": "Physical marker, e.g. 'motorized chair'"},
+         "category": {**_S, "description": "feeder | risky | reg | unknown"},
+         "venue": {**_S, "description": "Where they play"}},
+        ["note"])},
+    "end_session": {"handler": _end_session, "spec": _f(
+        "end_session", "Close the live session: record cashout, compute net + hours.",
+        {"cash_out": {**_N, "description": "Final cashout amount"},
+         "mood": {**_S, "description": "Mental-game note for the session"}},
+        ["cash_out"])},
+    "session_stats": {"handler": _session_stats, "spec": _f(
+        "session_stats", "Get money + hand summary for the current/most-recent session.",
+        {}, [])},
+    "running_stats": {"handler": _running_stats, "spec": _f(
+        "running_stats",
+        "Cumulative results across closed sessions (net, $/hr, by stake). Optionally filter.",
+        {"stakes": {**_S, "description": "Filter by stakes, e.g. '1/3'"},
+         "venue": {**_S, "description": "Filter by venue"},
+         "game": {**_S, "description": "Filter by game type"},
+         "since": {**_S, "description": "ISO date lower bound, e.g. '2026-06-01'"}},
+        [])},
+    "get_villain_file": {"handler": _villain_file, "spec": _f(
+        "get_villain_file",
+        "Pull saved opponent dossiers (the villain file). Filter by name or venue, e.g. before sitting down.",
+        {"name": {**_S, "description": "Player name to look up"},
+         "venue": {**_S, "description": "Venue to pull the local pool for"}},
+        [])},
+})
+
+
 def specs() -> list[dict]:
     """OpenAI-format tool definitions to offer the model."""
     return [t["spec"] for t in TOOLS.values()]
diff --git a/tests/test_poker.py b/tests/test_poker.py
new file mode 100644
index 0000000..514a6cd
--- /dev/null
+++ b/tests/test_poker.py
@@ -0,0 +1,74 @@
+"""Poker domain: structured session/hand/villain storage + stats, and the tools."""
+from __future__ import annotations
+
+import importlib
+
+import pytest
+
+
+@pytest.fixture
+def lyra(tmp_path, monkeypatch):
+    monkeypatch.setenv("LYRA_DB_PATH", str(tmp_path / "test.db"))
+    from lyra import llm
+    monkeypatch.setattr(llm, "embed", lambda texts: [[0.1, 0.2, 0.3] for _ in texts])
+    import lyra.memory as memory
+    importlib.reload(memory)
+    import lyra.poker as poker
+    importlib.reload(poker)  # rebind to the reloaded memory + reset its schema flag
+    return poker
+
+
+def test_session_lifecycle_and_net(lyra):
+    poker = lyra
+    sid = poker.start_session(venue="Meadows", stakes="1/3", buy_in=400)
+    assert poker.live_session()["id"] == sid
+    poker.add_buyin(500)  # rebuy -> total 900
+    s = poker.end_session(cash_out=627)
+    assert s["buy_in_total"] == 900
+    assert s["net"] == pytest.approx(-273)
+    assert s["status"] == "closed"
+    assert poker.live_session() is None  # closed -> no live session
+
+
+def test_log_hand_partial_fields(lyra):
+    poker = lyra
+    poker.start_session(stakes="1/3", buy_in=300)
+    hid = poker.log_hand(position="BTN", hole_cards="AKs", result=120, tag="confidence")
+    hands = poker.list_hands()
+    assert len(hands) == 1 and hands[0]["id"] == hid
+    assert hands[0]["hole_cards"] == "AKs" and hands[0]["result"] == 120
+    assert hands[0]["board"] is None  # unspecified fields stay null
+
+
+def test_villain_file_upsert_and_read(lyra):
+    poker = lyra
+    poker.start_session(venue="Meadows", stakes="1/3", buy_in=300)
+    poker.add_read("limp-called K4s UTG", name="Sleepy John", seat="3",
+                   tendencies="loose-passive, jackpot dreamer", category="feeder", venue="Meadows")
+    # update the same player
+    poker.add_read("cold-called a 3-bet with A2o", name="sleepy john")
+    file = poker.get_villain_file(name="Sleepy")
+    assert len(file) == 1  # matched by name, not duplicated
+    assert file[0]["category"] == "feeder"
+
+
+def test_running_stats(lyra):
+    poker = lyra
+    s1 = poker.start_session(stakes="1/3", buy_in=300)
+    poker.end_session(540, session_id=s1)
+    s2 = poker.start_session(stakes="1/3", buy_in=400)
+    poker.end_session(300, session_id=s2)
+    rs = poker.running_stats(stakes="1/3")
+    assert rs["sessions"] == 2
+    assert rs["net"] == pytest.approx(140)  # +240 then -100
+    assert "1/3" in rs["by_stake"]
+
+
+def test_poker_tools_dispatch(lyra):
+    from lyra import tools
+    assert "started" in tools.dispatch("start_session", {"stakes": "1/3", "buy_in": 300})
+    assert "logged" in tools.dispatch("log_hand", {"position": "CO", "hole_cards": "QQ"})
+    assert "closed" in tools.dispatch("end_session", {"cash_out": 500})
+    # the poker tools are offered to the model
+    names = {s["function"]["name"] for s in tools.specs()}
+    assert {"start_session", "log_hand", "end_session", "running_stats", "get_villain_file"} <= names
-- 
2.52.0


From ac04ad1df6258a5f5f692197591dbbda895a99b0 Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Wed, 17 Jun 2026 20:52:47 +0000
Subject: [PATCH 34/51] fix: only send tools to backends that support them
 (cloud)

The MI50 llama.cpp server 500s on the `tools` param unless launched with
--jinja, so sending tools to mi50 broke chat on that backend. Gate tools to
TOOL_BACKENDS={"cloud"} for now; mi50 chat works again (just without tools).
Add "mi50" once its server runs with --jinja.

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 lyra/chat.py | 6 +++++-
 1 file changed, 5 insertions(+), 1 deletion(-)

diff --git a/lyra/chat.py b/lyra/chat.py
index d5454d0..02a987b 100644
--- a/lyra/chat.py
+++ b/lyra/chat.py
@@ -18,6 +18,10 @@ RECALL_K = 3  # raw cross-session "sharp detail" hits
 RECENT_N = 10  # raw turns of the current session
 SUMMARY_K = 3  # other-session gists
 MAX_TOOL_ROUNDS = 5  # cap tool-call iterations per turn
+# Backends that support function-calling. The MI50's llama.cpp server only does
+# tools when launched with --jinja; until it is, keep tools to cloud so MI50 chat
+# doesn't 500 on the tools param. Add "mi50" here once that flag is set.
+TOOL_BACKENDS = {"cloud"}
 
 
 def _summary_note(summaries: list[memory.Summary]) -> Message:
@@ -126,7 +130,7 @@ def respond(session_id: str, user_msg: str, backend: Backend = "cloud") -> str:
 
     # Tool loop: offer Lyra her tools; if she calls one, run it and feed the
     # result back so she can continue, until she returns a normal text reply.
-    tool_specs = toolkit.specs() if backend in ("cloud", "mi50") else None
+    tool_specs = toolkit.specs() if backend in TOOL_BACKENDS else None
     ctx = {"session_id": session_id, "backend": backend}
     reply = ""
     for _ in range(MAX_TOOL_ROUNDS):
-- 
2.52.0


From 16f3442640c15a5a905545a0c59bc11764b81e2f Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Wed, 17 Jun 2026 23:01:33 +0000
Subject: [PATCH 35/51] docs: park MI50 --jinja tool-calling as an experiment
 (cloud is the copilot path)

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 docs/PARKED_IDEAS.md | 13 +++++++++++++
 1 file changed, 13 insertions(+)

diff --git a/docs/PARKED_IDEAS.md b/docs/PARKED_IDEAS.md
index 7ffc733..5036ea0 100644
--- a/docs/PARKED_IDEAS.md
+++ b/docs/PARKED_IDEAS.md
@@ -68,6 +68,19 @@ Dec-2025 plan (in her memory). The whole point of the project: can she become a
   cost loops, self-brick), not sci-fi. The isolation makes the *fun* version
   (emergence) safe to pursue. Build the box, then open the door.
 
+## 🛠️ Tool-calling on the MI50 (free local agency)
+Launch the MI50 llama.cpp server with `--jinja` so the `local-GPU` backend can
+do function-calling, then add `"mi50"` to `chat.TOOL_BACKENDS`. Would let the
+poker copilot + journaling tools run free/local instead of on cloud.
+- **Why parked:** not needed — cloud (gpt-4o) drives tools reliably and a full
+  poker session costs ~$0.50–1. A local 32B calls tools less reliably (wrong
+  tool / bad args / narrates instead) and is slower (round-trips × ~18s/turn),
+  which is exactly wrong for live at-the-table logging. Cloud is also easier to
+  debug tools against.
+- **Do it as:** a deliberate experiment to A/B the local model's tool-calling
+  (fits the "own stack" arc), not a dependency. Small + reversible: recreate the
+  CT202 container command with `--jinja`, keep it reboot-resilient.
+
 ## 🛠️ Deterministic poker tooling (RTO + cfr-core)
 Wire Lyra to Brian's own GTO/solver projects so ICM, equities, and ranges come
 from real computation, never LLM guesses.
-- 
2.52.0


From 9491951da010c8318c43780c3f334ab52c4ef139 Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Wed, 17 Jun 2026 23:11:46 +0000
Subject: [PATCH 36/51] feat: hand-history reconstruction + replayable table
 viewer
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Brian's idea: vomit rough shorthand, Lyra rebuilds it into a structured,
replayable hand history.

- poker.parse_hand(): focused LLM pass turning shorthand into a canonical hand
  JSON (positions, stacks, hero cards, chronological actions w/ board reveals,
  result); store_hand_history() persists JSON + extracted flat fields;
  record_hand() = parse+store; standalone hands attach to a 'Hand Reviews' session
- poker_hands gains a `structured` JSON column (ALTER-migrated for existing DBs)
- record_hand tool wired into chat: "log this hand: ..." -> reconstructed + a
  /hand/{id} link
- web: GET /hand/{id} viewer + /hand/{id}/data — a felt table with seats placed
  around the oval (hero at bottom), hole cards, progressive board reveal, and
  prev/next/end step-through of the action with running pot
- tests: store/get roundtrip, record_hand tool (stubbed parse)

Verified live: parsed a real AKs hand (BTN, 14 actions, full board) end to end.

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 lyra/poker.py             | 127 +++++++++++++++++++++-
 lyra/tools.py             |  24 +++++
 lyra/web/server.py        |  11 +-
 lyra/web/static/hand.html | 222 ++++++++++++++++++++++++++++++++++++++
 tests/test_poker.py       |  31 ++++++
 5 files changed, 412 insertions(+), 3 deletions(-)
 create mode 100644 lyra/web/static/hand.html

diff --git a/lyra/poker.py b/lyra/poker.py
index ab1f8b8..b645564 100644
--- a/lyra/poker.py
+++ b/lyra/poker.py
@@ -12,9 +12,11 @@ needs to pass an id around.
 """
 from __future__ import annotations
 
+import json
+import re
 from datetime import datetime, timezone
 
-from lyra import memory
+from lyra import llm, memory
 
 _SCHEMA = """
 CREATE TABLE IF NOT EXISTS poker_sessions (
@@ -51,7 +53,8 @@ CREATE TABLE IF NOT EXISTS poker_hands (
     result REAL,
     stack_after REAL,
     tag TEXT,             -- well_played | leak | cooler | confidence | notable
-    lesson TEXT
+    lesson TEXT,
+    structured TEXT       -- full parsed hand-history JSON (for the viewer)
 );
 CREATE INDEX IF NOT EXISTS idx_hands_session ON poker_hands(session_id);
 
@@ -87,6 +90,11 @@ def _c():
     conn = memory._connection()
     if _ensured_for is not conn:
         conn.executescript(_SCHEMA)
+        # Add columns introduced after a DB already had the tables (no-op if present).
+        try:
+            conn.execute("ALTER TABLE poker_hands ADD COLUMN structured TEXT")
+        except Exception:
+            pass
         _ensured_for = conn
     return conn
 
@@ -198,6 +206,121 @@ def list_hands(session_id: int | None = None) -> list[dict]:
     ).fetchall()]
 
 
+# --- hand-history parsing (rough shorthand -> structured JSON) ---
+
+_HAND_PARSE_PROMPT = """You convert a player's rough shorthand description of a poker hand \
+into a structured JSON hand history. Output ONLY valid JSON — no prose, no code fences.
+
+Schema:
+{
+  "game": "NLH" | "PLO" | ...,
+  "stakes": "<e.g. 1/3, or null>",
+  "hero_pos": "<UTG|UTG1|MP|LJ|HJ|CO|BTN|SB|BB, hero's position>",
+  "hero_cards": ["Rs", ...],            // rank+suit; suit one of s h d c; null if unknown
+  "players": [                          // every player mentioned, incl. hero
+    {"pos": "<position>", "stack": <number|null>, "name": <string|null>, "cards": [".."]|null}
+  ],
+  "actions": [                          // chronological, across all streets
+    // when a street begins, FIRST emit its board reveal:
+    {"street": "flop", "board": ["7d","2c","5h"]},   // turn/river: one card in the array
+    {"street": "preflop|flop|turn|river", "pos": "<pos>", "action": "post|fold|check|call|bet|raise|allin", "amount": <number|null>}
+  ],
+  "board": ["..."],                     // full final board, 0-5 cards
+  "result": {"pot": <number|null>, "hero_net": <number|null>, "summary": "<one line>"}
+}
+
+Rules: infer positions and street order sensibly. Amounts are plain numbers (no $). \
+Normalize cards like "Ah","Td","9s". Use null/omit for anything not stated. Stay faithful \
+to what's described — do not invent action that isn't implied."""
+
+
+def _safe_json(s: str) -> dict | None:
+    try:
+        return json.loads(s)
+    except (json.JSONDecodeError, TypeError):
+        m = re.search(r"\{.*\}", s or "", re.S)
+        if m:
+            try:
+                return json.loads(m.group())
+            except json.JSONDecodeError:
+                return None
+    return None
+
+
+def parse_hand(shorthand: str, stakes: str | None = None,
+               backend: str | None = None) -> dict | None:
+    """Turn rough shorthand into a structured hand-history dict via an LLM pass."""
+    backend = backend or "cloud"
+    ctx = f"Stakes: {stakes}\n\n" if stakes else ""
+    parsed = _safe_json(llm.complete(
+        [{"role": "system", "content": _HAND_PARSE_PROMPT},
+         {"role": "user", "content": ctx + shorthand}],
+        backend=backend,
+    ))
+    if parsed and stakes and not parsed.get("stakes"):
+        parsed["stakes"] = stakes
+    return parsed
+
+
+def _review_session_id() -> int:
+    """A standing 'Hand Reviews' session to attach standalone parsed hands to."""
+    conn = _c()
+    r = conn.execute(
+        "SELECT id FROM poker_sessions WHERE venue = 'Hand Reviews' AND status = 'review'"
+    ).fetchone()
+    if r:
+        return int(r["id"])
+    with conn:
+        cur = conn.execute(
+            "INSERT INTO poker_sessions (started_at, venue, status, buy_in_total) "
+            "VALUES (?, 'Hand Reviews', 'review', 0)",
+            (_now(),),
+        )
+    return int(cur.lastrowid)
+
+
+def store_hand_history(parsed: dict, session_id: int | None = None,
+                       tag: str | None = None, lesson: str | None = None) -> int:
+    """Store a parsed hand: full JSON + extracted flat fields for stats/listing."""
+    sid = _resolve(session_id) or _review_session_id()
+    hero_cards = parsed.get("hero_cards") or []
+    board = parsed.get("board") or []
+    result = (parsed.get("result") or {})
+    conn = _c()
+    with conn:
+        cur = conn.execute(
+            "INSERT INTO poker_hands (session_id, at, position, hole_cards, board, "
+            "pot, result, tag, lesson, structured) VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?)",
+            (sid, _now(), parsed.get("hero_pos"),
+             " ".join(hero_cards) if hero_cards else None,
+             " ".join(board) if board else None,
+             result.get("pot"), result.get("hero_net"), tag, lesson,
+             json.dumps(parsed)),
+        )
+    return int(cur.lastrowid)
+
+
+def record_hand(shorthand: str, session_id: int | None = None, stakes: str | None = None,
+                tag: str | None = None, lesson: str | None = None,
+                backend: str | None = None) -> dict:
+    """Parse shorthand -> structured hand -> store. Returns {id, parsed} (id None on parse fail)."""
+    parsed = parse_hand(shorthand, stakes=stakes, backend=backend)
+    if not parsed:
+        return {"id": None, "parsed": None}
+    hid = store_hand_history(parsed, session_id=session_id, tag=tag, lesson=lesson)
+    return {"id": hid, "parsed": parsed}
+
+
+def get_hand(hand_id: int) -> dict | None:
+    """A stored hand with its structured JSON parsed back into a dict."""
+    r = _c().execute("SELECT * FROM poker_hands WHERE id = ?", (hand_id,)).fetchone()
+    if not r:
+        return None
+    d = dict(r)
+    d["structured"] = json.loads(d["structured"]) if d.get("structured") else None
+    return d
+
+
 # --- villain file ---
 
 def upsert_player(name: str, venue: str | None = None, description: str | None = None,
diff --git a/lyra/tools.py b/lyra/tools.py
index d88a50b..f4a6858 100644
--- a/lyra/tools.py
+++ b/lyra/tools.py
@@ -149,6 +149,20 @@ def _running_stats(args: dict, ctx: dict) -> str:
     return f"{rs['sessions']} sessions, {rs['hours']:g}h, net {rs['net']:+.0f}{hourly}. By stake: {by}"
 
 
+def _record_hand(args: dict, ctx: dict) -> str:
+    out = poker.record_hand(
+        args.get("shorthand") or "", stakes=args.get("stakes"),
+        tag=args.get("tag"), lesson=args.get("lesson"),
+    )
+    if not out["id"]:
+        return "I couldn't parse that hand — give it to me again with a little more detail?"
+    p = out["parsed"]
+    cards = " ".join(p.get("hero_cards") or [])
+    logbus.log("info", "hand reconstructed", id=out["id"], hero=p.get("hero_pos"))
+    return (f"Hand #{out['id']} reconstructed — {p.get('hero_pos') or '?'} "
+            f"{cards}. View/replay it at /hand/{out['id']}")
+
+
 def _villain_file(args: dict, ctx: dict) -> str:
     vs = poker.get_villain_file(name=args.get("name"), venue=args.get("venue"))
     if not vs:
@@ -231,6 +245,16 @@ TOOLS.update({
          "game": {**_S, "description": "Filter by game type"},
          "since": {**_S, "description": "ISO date lower bound, e.g. '2026-06-01'"}},
         [])},
+    "record_hand": {"handler": _record_hand, "spec": _f(
+        "record_hand",
+        "Reconstruct a hand from Brian's rough shorthand into a structured, "
+        "replayable hand history. Use when he describes/vomits a hand he wants "
+        "saved or to review. Pass his description verbatim as 'shorthand'.",
+        {"shorthand": {**_S, "description": "Brian's rough description of the hand, verbatim"},
+         "stakes": {**_S, "description": "Stakes if known, e.g. '1/3'"},
+         "tag": {**_S, "description": "well_played | leak | cooler | confidence | notable"},
+         "lesson": {**_S, "description": "Takeaway, if he stated one"}},
+        ["shorthand"])},
     "get_villain_file": {"handler": _villain_file, "spec": _f(
         "get_villain_file",
         "Pull saved opponent dossiers (the villain file). Filter by name or venue, e.g. before sitting down.",
diff --git a/lyra/web/server.py b/lyra/web/server.py
index 8df6d16..0a8c6f3 100644
--- a/lyra/web/server.py
+++ b/lyra/web/server.py
@@ -18,7 +18,7 @@ from fastapi import FastAPI, Request
 from fastapi.responses import FileResponse, StreamingResponse
 from fastapi.staticfiles import StaticFiles
 
-from lyra import chat, logbus, memory, self_state, summary
+from lyra import chat, logbus, memory, poker, self_state, summary
 from lyra.llm import Backend
 
 
@@ -141,6 +141,15 @@ def create_app() -> FastAPI:
     async def journal_data(limit: int = 300) -> dict:
         return {"entries": memory.list_journal(limit=limit)}
 
+    @app.get("/hand/{hand_id}")
+    async def hand_page(hand_id: int) -> FileResponse:
+        """Replayable hand-history viewer."""
+        return FileResponse(str(_STATIC / "hand.html"))
+
+    @app.get("/hand/{hand_id}/data")
+    async def hand_data(hand_id: int) -> dict:
+        return poker.get_hand(hand_id) or {}
+
     @app.get("/stream/logs")
     async def stream_logs(request: Request) -> StreamingResponse:
         """Live activity feed: replay the recent buffer, then stream new events."""
diff --git a/lyra/web/static/hand.html b/lyra/web/static/hand.html
new file mode 100644
index 0000000..67197ca
--- /dev/null
+++ b/lyra/web/static/hand.html
@@ -0,0 +1,222 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+  <meta charset="UTF-8" />
+  <meta name="viewport" content="width=device-width, initial-scale=1.0, viewport-fit=cover" />
+  <meta name="theme-color" content="#0b0d12" />
+  <title>Lyra — Hand</title>
+  <style>
+    :root {
+      --bg:#0b0d12; --bg-elev:#141821; --border:#232936; --text:#e6e9ef;
+      --fade:#8b93a7; --accent:#7aa2ff; --felt:#16322a; --feltline:#0f5132;
+      --chip:#ffcf6b; --hero:#7aa2ff;
+    }
+    *{box-sizing:border-box;}
+    html,body{margin:0;min-height:100%;background:var(--bg);color:var(--text);
+      font-family:-apple-system,BlinkMacSystemFont,"Segoe UI",Roboto,sans-serif;-webkit-text-size-adjust:100%;}
+    header{position:sticky;top:0;z-index:10;background:var(--bg-elev);border-bottom:1px solid var(--border);
+      padding:env(safe-area-inset-top) 14px 0;}
+    .topbar{display:flex;align-items:baseline;gap:10px;padding:12px 0;flex-wrap:wrap;}
+    .topbar h1{font-size:1.02rem;margin:0;font-weight:600;}
+    .topbar a.back{color:var(--accent);text-decoration:none;font-size:.92rem;}
+    .sub{color:var(--fade);font-size:.85rem;margin-left:auto;}
+    main{max-width:760px;margin:0 auto;padding:14px;}
+
+    .table-wrap{position:relative;width:100%;max-width:560px;margin:8px auto;aspect-ratio:1.45/1;}
+    .felt{position:absolute;inset:8%;background:radial-gradient(ellipse at center,#1c4a3c,var(--felt));
+      border:6px solid #25201a;border-radius:50%/50%;box-shadow:inset 0 0 40px rgba(0,0,0,.5);}
+    .center{position:absolute;top:50%;left:50%;transform:translate(-50%,-50%);text-align:center;width:80%;}
+    .board{display:flex;gap:5px;justify-content:center;min-height:46px;align-items:center;flex-wrap:wrap;}
+    .pot{margin-top:8px;color:var(--chip);font-size:.85rem;font-variant-numeric:tabular-nums;}
+    .street{color:var(--fade);font-size:.72rem;text-transform:uppercase;letter-spacing:.6px;margin-bottom:4px;}
+
+    .card{display:inline-flex;flex-direction:column;align-items:center;justify-content:center;
+      width:32px;height:44px;background:#f4f4f0;color:#111;border-radius:5px;font-weight:700;
+      box-shadow:0 1px 3px rgba(0,0,0,.4);line-height:1;}
+    .card.sm{width:26px;height:36px;font-size:.8rem;}
+    .card .r{font-size:1rem;}
+    .card.red{color:#c8102e;}
+    .card.back{background:#2a3550;color:#2a3550;}
+
+    .seat{position:absolute;transform:translate(-50%,-50%);width:96px;text-align:center;
+      background:rgba(13,16,22,.85);border:1px solid var(--border);border-radius:10px;padding:5px 4px;}
+    .seat.hero{border-color:var(--hero);box-shadow:0 0 10px rgba(122,162,255,.4);}
+    .seat.acting{border-color:var(--chip);box-shadow:0 0 12px rgba(255,207,107,.6);}
+    .seat .pos{font-size:.66rem;color:var(--accent);font-weight:700;letter-spacing:.4px;}
+    .seat .nm{font-size:.66rem;color:var(--fade);white-space:nowrap;overflow:hidden;text-overflow:ellipsis;}
+    .seat .cards{display:flex;gap:3px;justify-content:center;margin:3px 0;}
+    .seat .stack{font-size:.66rem;color:var(--text);font-variant-numeric:tabular-nums;}
+    .seat .act{font-size:.62rem;color:var(--chip);min-height:.8em;}
+    .seat.folded{opacity:.4;}
+
+    .controls{display:flex;gap:8px;align-items:center;justify-content:center;margin:14px 0 6px;}
+    .controls button{background:#1b2333;border:1px solid var(--border);color:var(--text);
+      border-radius:8px;padding:8px 14px;font-size:.95rem;cursor:pointer;-webkit-tap-highlight-color:transparent;}
+    .controls button:disabled{opacity:.4;}
+    .step-label{color:var(--fade);font-size:.8rem;min-width:80px;text-align:center;}
+    .now{text-align:center;color:var(--text);font-size:.95rem;min-height:1.3em;margin-bottom:6px;}
+
+    .log{margin-top:14px;border-top:1px solid var(--border);padding-top:10px;}
+    .log .ln{padding:5px 8px;border-radius:6px;font-size:.9rem;display:flex;gap:8px;}
+    .log .ln.cur{background:#1b2333;}
+    .log .ln.brd{color:var(--fade);font-style:italic;}
+    .log .st{color:var(--fade);font-size:.72rem;width:54px;flex:none;text-transform:uppercase;}
+    .summary{margin-top:14px;background:var(--bg-elev);border:1px solid var(--border);border-radius:10px;padding:12px;}
+    .summary .lbl{color:var(--fade);font-size:.72rem;text-transform:uppercase;letter-spacing:.5px;}
+    .err{color:#ff6b6b;text-align:center;padding:40px;}
+    .net-pos{color:#5ad1a0;} .net-neg{color:#ff6b6b;}
+  </style>
+</head>
+<body>
+  <header>
+    <div class="topbar">
+      <h1>🃏 Hand</h1>
+      <a class="back" href="/">← Chat</a>
+      <span class="sub" id="sub"></span>
+    </div>
+  </header>
+  <main id="root"><p class="err" id="boot">Loading hand…</p></main>
+
+  <script>
+    const SUIT = {s:"♠", h:"♥", d:"♦", c:"♣"};
+    const RED = new Set(["h", "d"]);
+    function esc(s){const d=document.createElement('div');d.textContent=s==null?'':String(s);return d.innerHTML;}
+
+    function cardEl(code, sm){
+      if(!code) return '';
+      const m = String(code).trim().match(/^(10|[2-9TJQKA])\s*([shdc])$/i);
+      if(!m) return `<span class="card${sm?' sm':''}">${esc(code)}</span>`;
+      const r = m[1].toUpperCase().replace('10','T'); const s = m[2].toLowerCase();
+      return `<span class="card${sm?' sm':''}${RED.has(s)?' red':''}"><span class="r">${r}</span><span>${SUIT[s]}</span></span>`;
+    }
+    const cards = (arr, sm) => (arr||[]).map(c=>cardEl(c,sm)).join('');
+
+    function render(h){
+      const sub = document.getElementById('sub');
+      const data = h.structured;
+      if(!data){ document.getElementById('root').innerHTML = '<p class="err">This hand has no structured data to replay.</p>'; return; }
+
+      const players = (data.players||[]).slice();
+      // order so hero sits at the bottom
+      let heroIdx = players.findIndex(p => p.pos === data.hero_pos);
+      if(heroIdx < 0) heroIdx = 0;
+      const ordered = players.slice(heroIdx).concat(players.slice(0, heroIdx));
+      const n = Math.max(ordered.length, 1);
+
+      const acts = data.actions || [];
+      let step = 0;  // number of actions applied
+
+      sub.textContent = [data.stakes, data.game].filter(Boolean).join(' ');
+
+      const root = document.getElementById('root');
+      root.innerHTML = `
+        <div class="table-wrap" id="tw">
+          <div class="felt"></div>
+          <div class="center">
+            <div class="street" id="street"></div>
+            <div class="board" id="board"></div>
+            <div class="pot" id="pot"></div>
+          </div>
+          <div id="seats"></div>
+        </div>
+        <div class="now" id="now"></div>
+        <div class="controls">
+          <button id="prev">◀ Prev</button>
+          <span class="step-label" id="steplab"></span>
+          <button id="next">Next ▶</button>
+          <button id="all">End</button>
+        </div>
+        <div class="log" id="log"></div>
+        ${data.result ? `<div class="summary"><div class="lbl">Result</div>
+           <div>${esc(data.result.summary||'')}</div>
+           ${data.result.hero_net!=null ? `<div class="${data.result.hero_net>=0?'net-pos':'net-neg'}">Hero net: ${data.result.hero_net>=0?'+':''}${esc(data.result.hero_net)}</div>`:''}
+           </div>`:''}
+      `;
+
+      // place seats around the oval
+      const seatsEl = document.getElementById('seats');
+      ordered.forEach((p,i)=>{
+        const ang = (90 + i*(360/n)) * Math.PI/180;  // bottom = 90deg
+        const x = 50 + 46*Math.cos(ang), y = 50 + 44*Math.sin(ang);
+        const el = document.createElement('div');
+        el.className = 'seat' + (p.pos===data.hero_pos?' hero':'');
+        el.style.left = x+'%'; el.style.top = y+'%';
+        el.dataset.pos = p.pos;
+        const hcards = (p.pos===data.hero_pos ? (p.cards||data.hero_cards) : p.cards);
+        el.innerHTML = `<div class="pos">${esc(p.pos||'')}</div>`
+          + (p.name?`<div class="nm">${esc(p.name)}</div>`:'')
+          + `<div class="cards">${hcards?cards(hcards,true):'<span class="card sm back">x</span><span class="card sm back">x</span>'}</div>`
+          + (p.stack!=null?`<div class="stack">${esc(p.stack)}</div>`:'')
+          + `<div class="act" data-act></div>`;
+        seatsEl.appendChild(el);
+      });
+
+      const boardEl=document.getElementById('board'), potEl=document.getElementById('pot'),
+            streetEl=document.getElementById('street'), nowEl=document.getElementById('now'),
+            logEl=document.getElementById('log'), steplab=document.getElementById('steplab');
+
+      // build the log
+      logEl.innerHTML = acts.map((a,idx)=>{
+        if(a.board) return `<div class="ln brd" data-i="${idx}"><span class="st">${esc(a.street)}</span>${cards(a.board,true)}</div>`;
+        const amt = a.amount!=null ? ' '+a.amount : '';
+        return `<div class="ln" data-i="${idx}"><span class="st">${esc(a.street||'')}</span>${esc(a.pos||'')} ${esc(a.action||'')}${amt}</div>`;
+      }).join('');
+
+      function draw(){
+        let pot = 0, board = [], street = 'Preflop';
+        const lastAct = {}, folded = {};
+        for(let i=0;i<step;i++){
+          const a = acts[i];
+          if(a.board){ board = a.board; street = a.street; continue; }
+          if(a.street) street = a.street;
+          if(a.amount!=null && ['call','bet','raise','allin','post'].includes(a.action)) pot += Number(a.amount)||0;
+          if(a.pos){ lastAct[a.pos] = (a.action||'') + (a.amount!=null?' '+a.amount:''); }
+          if(a.action==='fold' && a.pos) folded[a.pos]=true;
+        }
+        boardEl.innerHTML = cards(board);
+        potEl.textContent = pot ? ('Pot ~'+pot) : '';
+        streetEl.textContent = street;
+        document.querySelectorAll('.seat').forEach(s=>{
+          const pos=s.dataset.pos;
+          s.querySelector('[data-act]').textContent = lastAct[pos]||'';
+          s.classList.toggle('folded', !!folded[pos]);
+          s.classList.remove('acting');
+        });
+        const cur = acts[step-1];
+        if(cur && cur.pos){
+          const s = [...document.querySelectorAll('.seat')].find(x=>x.dataset.pos===cur.pos);
+          if(s) s.classList.add('acting');
+        }
+        nowEl.innerHTML = step===0 ? 'Cards dealt — preflop.'
+          : (cur.board ? `${cur.street[0].toUpperCase()+cur.street.slice(1)}: ${cards(cur.board,true)}`
+                       : `${esc(cur.pos||'')} ${esc(cur.action||'')}${cur.amount!=null?' '+cur.amount:''}`);
+        steplab.textContent = `${step} / ${acts.length}`;
+        document.getElementById('prev').disabled = step===0;
+        document.getElementById('next').disabled = step>=acts.length;
+        logEl.querySelectorAll('.ln').forEach(l=>l.classList.toggle('cur', Number(l.dataset.i)===step-1));
+        const curln = logEl.querySelector('.ln.cur'); if(curln) curln.scrollIntoView({block:'nearest'});
+      }
+      document.getElementById('prev').onclick=()=>{if(step>0){step--;draw();}};
+      document.getElementById('next').onclick=()=>{if(step<acts.length){step++;draw();}};
+      document.getElementById('all').onclick=()=>{step=acts.length;draw();};
+      document.addEventListener('keydown',e=>{
+        if(e.key==='ArrowRight'){if(step<acts.length){step++;draw();}}
+        if(e.key==='ArrowLeft'){if(step>0){step--;draw();}}
+      });
+      logEl.querySelectorAll('.ln').forEach(l=>l.onclick=()=>{step=Number(l.dataset.i)+1;draw();});
+      draw();
+    }
+
+    async function load(){
+      const id = location.pathname.split('/')[2];
+      try{
+        const r = await fetch(`/hand/${id}/data`,{cache:'no-store'});
+        const h = await r.json();
+        if(!h || !h.id){ document.getElementById('root').innerHTML='<p class="err">Hand not found.</p>'; return; }
+        render(h);
+      }catch(e){ document.getElementById('root').innerHTML='<p class="err">Couldn\'t load the hand.</p>'; }
+    }
+    load();
+  </script>
+</body>
+</html>
diff --git a/tests/test_poker.py b/tests/test_poker.py
index 514a6cd..ba18a49 100644
--- a/tests/test_poker.py
+++ b/tests/test_poker.py
@@ -64,6 +64,37 @@ def test_running_stats(lyra):
     assert "1/3" in rs["by_stake"]
 
 
+def test_hand_history_store_and_get(lyra):
+    poker = lyra
+    parsed = {"game": "NLH", "stakes": "1/3", "hero_pos": "BTN", "hero_cards": ["As", "Ks"],
+              "players": [{"pos": "BTN", "cards": ["As", "Ks"]}, {"pos": "BB"}],
+              "actions": [{"street": "preflop", "pos": "BTN", "action": "raise", "amount": 12},
+                          {"street": "flop", "board": ["As", "7d", "2s"]}],
+              "board": ["As", "7d", "2s"], "result": {"pot": 80, "hero_net": 330, "summary": "won"}}
+    hid = poker.store_hand_history(parsed)  # no live session -> attaches to a review session
+    h = poker.get_hand(hid)
+    assert h["position"] == "BTN" and h["hole_cards"] == "As Ks"
+    assert h["result"] == 330
+    assert h["structured"]["actions"][0]["amount"] == 12
+
+
+def test_record_hand_tool_parses_and_stores(lyra, monkeypatch):
+    import re
+
+    from lyra import llm, tools
+    hand_json = ('{"hero_pos":"CO","hero_cards":["Js","Jd"],'
+                 '"players":[{"pos":"CO","cards":["Js","Jd"]},{"pos":"BB","name":"drunk"}],'
+                 '"actions":[{"street":"preflop","pos":"CO","action":"raise","amount":45}],'
+                 '"board":[],"result":{"hero_net":-300,"summary":"lost to a straight"}}')
+    monkeypatch.setattr(llm, "complete", lambda messages, backend=None, model=None: hand_json)
+    out = tools.dispatch("record_hand", {"shorthand": "JJ in CO, lost to a straight", "stakes": "1/3"})
+    assert "/hand/" in out
+    hid = int(re.search(r"/hand/(\d+)", out).group(1))
+    h = lyra.get_hand(hid)
+    assert h["structured"]["hero_pos"] == "CO"
+    assert h["result"] == -300
+
+
 def test_poker_tools_dispatch(lyra):
     from lyra import tools
     assert "started" in tools.dispatch("start_session", {"stakes": "1/3", "buy_in": 300})
-- 
2.52.0


From fc06b24528e82575d36826092ee8a48755f93e31 Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Wed, 17 Jun 2026 23:39:49 +0000
Subject: [PATCH 37/51] feat: hand parser uses 'x' blanks instead of guessing
 suits/cards

Per Brian: never invent. Unknown suit -> 'x' (e.g. "Ax","Kx","4x"); fully
unknown card -> "x". "AA, ace of spades" -> ["As","Ax"]; "AK on A4x" -> board
["Ax","4x","x"]. Each card's suit is independent (a hole 'As' doesn't make a
board ace 'As'). Viewer renders 'x' as a muted unknown card and 'Rx' as the rank
with a neutral suit dot.

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 lyra/poker.py             | 11 ++++++++---
 lyra/web/static/hand.html |  9 +++++++--
 2 files changed, 15 insertions(+), 5 deletions(-)

diff --git a/lyra/poker.py b/lyra/poker.py
index b645564..6adfe4f 100644
--- a/lyra/poker.py
+++ b/lyra/poker.py
@@ -216,7 +216,7 @@ Schema:
   "game": "NLH" | "PLO" | ...,
   "stakes": "<e.g. 1/3, or null>",
   "hero_pos": "<UTG|UTG1|MP|LJ|HJ|CO|BTN|SB|BB, hero's position>",
-  "hero_cards": ["Rs", ...],            // rank+suit; suit one of s h d c; null if unknown
+  "hero_cards": ["As","Ax", ...],       // rank+suit (s/h/d/c); 'x' suit if unknown e.g. "Ax"; "x" for a fully unknown card
   "players": [                          // every player mentioned, incl. hero
     {"pos": "<position>", "stack": <number|null>, "name": <string|null>, "cards": [".."]|null}
   ],
@@ -230,8 +230,13 @@ Schema:
 }
 
 Rules: infer positions and street order sensibly. Amounts are plain numbers (no $). \
-Normalize cards like "Ah","Td","9s". Use null/omit for anything not stated. Stay faithful \
-to what's described — do not invent action that isn't implied."""
+NEVER invent suits or cards. A card is rank+suit where suit is one of s/h/d/c; if the suit \
+wasn't stated, use 'x' for the suit (e.g. "Ax","Kx","4x"); if a whole card wasn't stated, \
+use "x". Examples: "AA with the ace of spades" -> hero_cards ["As","Ax"]; "AK on an A4x \
+board" -> board ["Ax","4x","x"]. Each card is independent: a suit named for one card does \
+NOT apply to another — e.g. your hole "ace of spades" is a different card from a board ace \
+whose suit is unstated (that board ace is "Ax", not "As"). Use null/omit for non-card \
+details not stated. Stay faithful to what's described — do not invent action that isn't implied."""
 
 
 def _safe_json(s: str) -> dict | None:
diff --git a/lyra/web/static/hand.html b/lyra/web/static/hand.html
index 67197ca..60577ba 100644
--- a/lyra/web/static/hand.html
+++ b/lyra/web/static/hand.html
@@ -37,6 +37,8 @@
     .card .r{font-size:1rem;}
     .card.red{color:#c8102e;}
     .card.back{background:#2a3550;color:#2a3550;}
+    .card.unknown{background:#2a3550;color:#7c879e;font-size:1.2rem;}
+    .card .nosuit{color:#9aa3b5;}
 
     .seat{position:absolute;transform:translate(-50%,-50%);width:96px;text-align:center;
       background:rgba(13,16,22,.85);border:1px solid var(--border);border-radius:10px;padding:5px 4px;}
@@ -84,9 +86,12 @@
 
     function cardEl(code, sm){
       if(!code) return '';
-      const m = String(code).trim().match(/^(10|[2-9TJQKA])\s*([shdc])$/i);
-      if(!m) return `<span class="card${sm?' sm':''}">${esc(code)}</span>`;
+      const c = String(code).trim();
+      if(c.toLowerCase()==='x') return `<span class="card${sm?' sm':''} unknown">?</span>`;
+      const m = c.match(/^(10|[2-9TJQKA])\s*([shdcx])$/i);
+      if(!m) return `<span class="card${sm?' sm':''}">${esc(c)}</span>`;
       const r = m[1].toUpperCase().replace('10','T'); const s = m[2].toLowerCase();
+      if(s==='x') return `<span class="card${sm?' sm':''}"><span class="r">${r}</span><span class="nosuit">·</span></span>`;
       return `<span class="card${sm?' sm':''}${RED.has(s)?' red':''}"><span class="r">${r}</span><span>${SUIT[s]}</span></span>`;
     }
     const cards = (arr, sm) => (arr||[]).map(c=>cardEl(c,sm)).join('');
-- 
2.52.0


From 7b65f81d7e569ed7ba86fb9a0a2dc89818764d51 Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Thu, 18 Jun 2026 00:36:52 +0000
Subject: [PATCH 38/51] =?UTF-8?q?feat:=20poker=20phase=202=20=E2=80=94=20s?=
 =?UTF-8?q?ession=20recap=20(.md)=20generation,=20export,=20hands=20browse?=
 =?UTF-8?q?r?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Completes the poker copilot loop: talk through a session -> structured capture
-> generated writeup in Brian's format, remembered + exportable.

- poker.generate_recap(): LLM produces Brian's .md log (Session Header, Money
  Flow, Overview, Timeline, Key Hands w/ assessments, Villain Notes, Confidence
  Bank, Scar Notes, Mental Game, Final Assessment) from the session's structured
  data + the linked chat conversation; stored on poker_sessions.recap_md
- sessions now capture chat_session_id (via tool ctx) to pull the right convo;
  list_recent_hands() for browsing
- generate_recap tool ("write up the recap")
- web: /recap/{id} (renders the md) + /recap/{id}/download (.md attachment) +
  /hands browser (recent hands -> /hand/{id}); nav links added (desktop + mobile)
- tests: recap generation (stubbed), recent-hands listing

Verified live: recap for the Meadows session rendered + downloaded; all pages 200.

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 lyra/poker.py              | 133 ++++++++++++++++++++++++++++++++++---
 lyra/tools.py              |  16 +++++
 lyra/web/server.py         |  28 +++++++-
 lyra/web/static/hands.html |  84 +++++++++++++++++++++++
 lyra/web/static/index.html |   5 ++
 lyra/web/static/recap.html |  78 ++++++++++++++++++++++
 tests/test_poker.py        |  21 ++++++
 7 files changed, 353 insertions(+), 12 deletions(-)
 create mode 100644 lyra/web/static/hands.html
 create mode 100644 lyra/web/static/recap.html

diff --git a/lyra/poker.py b/lyra/poker.py
index 6adfe4f..4d881ac 100644
--- a/lyra/poker.py
+++ b/lyra/poker.py
@@ -33,8 +33,9 @@ CREATE TABLE IF NOT EXISTS poker_sessions (
     hours REAL,
     mantra TEXT,
     mood TEXT,
-    status TEXT NOT NULL DEFAULT 'live',   -- live | closed
-    recap_md TEXT
+    status TEXT NOT NULL DEFAULT 'live',   -- live | closed | review
+    recap_md TEXT,
+    chat_session_id TEXT                   -- links to the chat where it was played, for recap
 );
 
 CREATE TABLE IF NOT EXISTS poker_hands (
@@ -91,10 +92,12 @@ def _c():
     if _ensured_for is not conn:
         conn.executescript(_SCHEMA)
         # Add columns introduced after a DB already had the tables (no-op if present).
-        try:
-            conn.execute("ALTER TABLE poker_hands ADD COLUMN structured TEXT")
-        except Exception:
-            pass
+        for ddl in ("ALTER TABLE poker_hands ADD COLUMN structured TEXT",
+                    "ALTER TABLE poker_sessions ADD COLUMN chat_session_id TEXT"):
+            try:
+                conn.execute(ddl)
+            except Exception:
+                pass
         _ensured_for = conn
     return conn
 
@@ -106,20 +109,25 @@ def _now() -> str:
 # --- sessions ---
 
 def start_session(venue: str | None = None, stakes: str | None = None,
-                  game: str = "NLH", fmt: str = "cash",
-                  buy_in: float = 0.0, mantra: str | None = None) -> int:
+                  game: str = "NLH", fmt: str = "cash", buy_in: float = 0.0,
+                  mantra: str | None = None, chat_session_id: str | None = None) -> int:
     """Open a new live session. Returns its id."""
     conn = _c()
     with conn:
         cur = conn.execute(
             "INSERT INTO poker_sessions "
-            "(started_at, venue, game, stakes, format, buy_in_total, mantra, status) "
-            "VALUES (?, ?, ?, ?, ?, ?, ?, 'live')",
-            (_now(), venue, game, stakes, fmt, float(buy_in or 0), mantra),
+            "(started_at, venue, game, stakes, format, buy_in_total, mantra, status, chat_session_id) "
+            "VALUES (?, ?, ?, ?, ?, ?, ?, 'live', ?)",
+            (_now(), venue, game, stakes, fmt, float(buy_in or 0), mantra, chat_session_id),
         )
     return int(cur.lastrowid)
 
 
+def get_session(session_id: int) -> dict | None:
+    r = _c().execute("SELECT * FROM poker_sessions WHERE id = ?", (session_id,)).fetchone()
+    return dict(r) if r else None
+
+
 def live_session() -> dict | None:
     """The current open session, if any."""
     r = _c().execute(
@@ -326,6 +334,109 @@ def get_hand(hand_id: int) -> dict | None:
     return d
 
 
+def list_recent_hands(limit: int = 60) -> list[dict]:
+    """Recent recorded hands with their session's venue/stakes, for browsing."""
+    rows = _c().execute(
+        "SELECT h.id, h.position, h.hole_cards, h.board, h.result, h.tag, h.at, "
+        "h.lesson, s.venue AS venue, s.stakes AS stakes "
+        "FROM poker_hands h LEFT JOIN poker_sessions s ON s.id = h.session_id "
+        "ORDER BY h.id DESC LIMIT ?", (limit,),
+    ).fetchall()
+    return [dict(r) for r in rows]
+
+
+# --- session recap (.md generation on top of structured data + conversation) ---
+
+_RECAP_PROMPT = """You are writing Brian's structured poker session log in Markdown, in his \
+established format, from the session DATA and CONVERSATION provided. Output ONLY the Markdown \
+— no preamble, no code fences.
+
+Use these sections (skip any with no material; don't pad):
+
+# YYYY-MM-DD — <venue + game/stakes>
+## Session Header
+* Date / Casino / Game & stakes / Start–End / Buy-in(s) / Cash-out / Net result
+## Money Flow
+(totals; break out by variant if multiple games were played)
+## Session Overview
+(1-2 short narrative paragraphs)
+## Timeline
+(bullets of how it went)
+## Key Hands
+(### per notable hand — Action recap → brief analysis → **Assessment:** Well Played / Leak Candidate / Cooler / Confidence Bank)
+## Table Dynamics & Villain Notes
+(### per opponent — profile + exploit)
+## Confidence Bank
+(disciplined / good process plays)
+## Scar Notes
+(mistakes and study points)
+## Mental Game Notes
+## Final Assessment
+(overall quality of play; biggest strength; biggest thing to improve; did the result match decision quality?)
+
+Base everything on the actual data and conversation — do NOT invent hands, villains, or results. \
+Address Brian as "you" or "Brian", coach-to-player. Be concise but complete."""
+
+
+def _resolve_recap(session_id: int | None) -> int | None:
+    if session_id is not None:
+        return session_id
+    live = live_session()
+    if live:
+        return live["id"]
+    r = _c().execute(
+        "SELECT id FROM poker_sessions WHERE status = 'closed' ORDER BY id DESC LIMIT 1"
+    ).fetchone()
+    return int(r["id"]) if r else None
+
+
+def _hand_line(h: dict) -> str:
+    bits = [h.get("position"), h.get("hole_cards"),
+            (f"board {h['board']}") if h.get("board") else None,
+            (f"result {h['result']:+g}") if h.get("result") is not None else None,
+            (f"[{h['tag']}]") if h.get("tag") else None, h.get("lesson")]
+    return " | ".join(str(b) for b in bits if b)
+
+
+def generate_recap(session_id: int | None = None, backend: str | None = None) -> dict | None:
+    """Generate Brian's .md recap from a session's structured data + conversation, store it."""
+    backend = backend or "cloud"
+    sid = _resolve_recap(session_id)
+    if sid is None:
+        return None
+    s = get_session(sid)
+    hands = list_hands(sid)
+    reads = [dict(r) for r in _c().execute(
+        "SELECT seat, note FROM player_reads WHERE session_id = ?", (sid,)).fetchall()]
+    stats = session_stats(sid)
+
+    convo = ""
+    if s.get("chat_session_id"):
+        exs = [e for e in memory.history(s["chat_session_id"])
+               if (e.created_at or "") >= (s.get("started_at") or "")]
+        convo = "\n".join(f"{e.role}: {e.content}" for e in exs)[-12000:]
+
+    body = (
+        "SESSION DATA:\n"
+        f"- venue: {s.get('venue')} | game: {s.get('game')} | stakes: {s.get('stakes')} | format: {s.get('format')}\n"
+        f"- started: {s.get('started_at')} | ended: {s.get('ended_at')} | hours: {s.get('hours')}\n"
+        f"- buy-in total: {s.get('buy_in_total')} | cash out: {s.get('cash_out')} | net: {s.get('net')}\n"
+        f"- mantra: {s.get('mantra')} | mood: {s.get('mood')} | "
+        f"{stats.get('per_hour')}/hr | hands logged: {stats.get('hands_logged')} | tags: {stats.get('tags')}\n\n"
+        "HANDS:\n" + ("\n".join("- " + _hand_line(h) for h in hands) or "(none logged)") + "\n\n"
+        "READS:\n" + ("\n".join(f"- seat {r.get('seat')}: {r['note']}" for r in reads) or "(none)") + "\n\n"
+        "CONVERSATION DURING SESSION:\n" + (convo or "(none captured)")
+    )
+    md = llm.complete(
+        [{"role": "system", "content": _RECAP_PROMPT}, {"role": "user", "content": body}],
+        backend=backend,
+    )
+    conn = _c()
+    with conn:
+        conn.execute("UPDATE poker_sessions SET recap_md = ? WHERE id = ?", (md, sid))
+    return {"id": sid, "markdown": md}
+
+
 # --- villain file ---
 
 def upsert_player(name: str, venue: str | None = None, description: str | None = None,
diff --git a/lyra/tools.py b/lyra/tools.py
index f4a6858..f2b6b03 100644
--- a/lyra/tools.py
+++ b/lyra/tools.py
@@ -90,6 +90,7 @@ def _start_session(args: dict, ctx: dict) -> str:
         venue=args.get("venue"), stakes=args.get("stakes"),
         game=args.get("game") or "NLH", fmt=args.get("format") or "cash",
         buy_in=args.get("buy_in") or 0, mantra=args.get("mantra"),
+        chat_session_id=ctx.get("session_id"),
     )
     logbus.log("info", "poker session started", id=sid, stakes=args.get("stakes"))
     return (f"Session #{sid} started — {args.get('stakes') or '?'} "
@@ -163,6 +164,15 @@ def _record_hand(args: dict, ctx: dict) -> str:
             f"{cards}. View/replay it at /hand/{out['id']}")
 
 
+def _generate_recap(args: dict, ctx: dict) -> str:
+    out = poker.generate_recap()
+    if not out:
+        return "No session to recap yet — start (and ideally finish) one first."
+    logbus.log("info", "recap generated", id=out["id"], chars=len(out["markdown"]))
+    return (f"Recap written for session #{out['id']} — view or download the .md "
+            f"at /recap/{out['id']}")
+
+
 def _villain_file(args: dict, ctx: dict) -> str:
     vs = poker.get_villain_file(name=args.get("name"), venue=args.get("venue"))
     if not vs:
@@ -255,6 +265,12 @@ TOOLS.update({
          "tag": {**_S, "description": "well_played | leak | cooler | confidence | notable"},
          "lesson": {**_S, "description": "Takeaway, if he stated one"}},
         ["shorthand"])},
+    "generate_recap": {"handler": _generate_recap, "spec": _f(
+        "generate_recap",
+        "Write up the full session recap (.md) in Brian's format from the logged "
+        "data + this conversation. Use when he asks for the recap/writeup, usually "
+        "after ending a session.",
+        {}, [])},
     "get_villain_file": {"handler": _villain_file, "spec": _f(
         "get_villain_file",
         "Pull saved opponent dossiers (the villain file). Filter by name or venue, e.g. before sitting down.",
diff --git a/lyra/web/server.py b/lyra/web/server.py
index 0a8c6f3..f2a3b1c 100644
--- a/lyra/web/server.py
+++ b/lyra/web/server.py
@@ -14,7 +14,7 @@ import json
 import time
 from pathlib import Path
 
-from fastapi import FastAPI, Request
+from fastapi import FastAPI, Request, Response
 from fastapi.responses import FileResponse, StreamingResponse
 from fastapi.staticfiles import StaticFiles
 
@@ -150,6 +150,32 @@ def create_app() -> FastAPI:
     async def hand_data(hand_id: int) -> dict:
         return poker.get_hand(hand_id) or {}
 
+    @app.get("/hands")
+    async def hands_page() -> FileResponse:
+        return FileResponse(str(_STATIC / "hands.html"))
+
+    @app.get("/hands/data")
+    async def hands_data(limit: int = 60) -> dict:
+        return {"hands": poker.list_recent_hands(limit=limit)}
+
+    @app.get("/recap/{session_id}")
+    async def recap_page() -> FileResponse:
+        return FileResponse(str(_STATIC / "recap.html"))
+
+    @app.get("/recap/{session_id}/data")
+    async def recap_data(session_id: int) -> dict:
+        s = poker.get_session(session_id) or {}
+        return {"session": s, "markdown": s.get("recap_md")}
+
+    @app.get("/recap/{session_id}/download")
+    async def recap_download(session_id: int) -> Response:
+        s = poker.get_session(session_id) or {}
+        md = s.get("recap_md") or "# No recap generated yet\n"
+        date = (s.get("started_at") or "session")[:10]
+        fname = f"pokerlog_{date}_s{session_id}.md"
+        return Response(content=md, media_type="text/markdown",
+                        headers={"Content-Disposition": f'attachment; filename="{fname}"'})
+
     @app.get("/stream/logs")
     async def stream_logs(request: Request) -> StreamingResponse:
         """Live activity feed: replay the recent buffer, then stream new events."""
diff --git a/lyra/web/static/hands.html b/lyra/web/static/hands.html
new file mode 100644
index 0000000..7055f51
--- /dev/null
+++ b/lyra/web/static/hands.html
@@ -0,0 +1,84 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+  <meta charset="UTF-8" />
+  <meta name="viewport" content="width=device-width, initial-scale=1.0, viewport-fit=cover" />
+  <meta name="theme-color" content="#0b0d12" />
+  <title>Lyra — Hands</title>
+  <style>
+    :root{--bg:#0b0d12;--bg-elev:#141821;--bg-line:#11141b;--border:#232936;--text:#e6e9ef;--fade:#8b93a7;--accent:#7aa2ff;}
+    *{box-sizing:border-box;}
+    html,body{margin:0;min-height:100%;background:var(--bg);color:var(--text);
+      font-family:-apple-system,BlinkMacSystemFont,"Segoe UI",Roboto,sans-serif;-webkit-text-size-adjust:100%;}
+    header{position:sticky;top:0;z-index:10;background:var(--bg-elev);border-bottom:1px solid var(--border);
+      padding:env(safe-area-inset-top) 14px 0;}
+    .topbar{display:flex;align-items:center;gap:10px;padding:13px 0;}
+    .topbar h1{font-size:1.05rem;margin:0;font-weight:600;}
+    .topbar a.back{color:var(--accent);text-decoration:none;font-size:.92rem;}
+    .count{margin-left:auto;color:var(--fade);font-size:.8rem;}
+    main{max-width:640px;margin:0 auto;padding:12px 12px 40px;}
+    a.hand{display:flex;align-items:center;gap:12px;text-decoration:none;color:var(--text);
+      background:var(--bg-elev);border:1px solid var(--border);border-radius:10px;padding:10px 12px;margin-bottom:8px;}
+    a.hand:active{background:#1b2333;}
+    .cards{display:flex;gap:4px;flex:none;}
+    .card{display:inline-flex;flex-direction:column;align-items:center;justify-content:center;
+      width:24px;height:33px;background:#f4f4f0;color:#111;border-radius:4px;font-weight:700;font-size:.72rem;line-height:1;}
+    .card.red{color:#c8102e;} .card.unknown{background:#2a3550;color:#7c879e;}
+    .card .nosuit{color:#9aa3b5;}
+    .mid{flex:1;min-width:0;}
+    .ln1{font-size:.92rem;}
+    .ln2{font-size:.74rem;color:var(--fade);white-space:nowrap;overflow:hidden;text-overflow:ellipsis;}
+    .res{flex:none;font-variant-numeric:tabular-nums;font-weight:600;}
+    .pos-res{color:#5ad1a0;} .neg-res{color:#ff6b6b;}
+    .tag{font-size:.62rem;text-transform:uppercase;letter-spacing:.4px;color:var(--accent);}
+    .empty{color:var(--fade);text-align:center;padding:46px 16px;}
+  </style>
+</head>
+<body>
+  <header>
+    <div class="topbar">
+      <h1>🃏 Hands</h1>
+      <a class="back" href="/">← Chat</a>
+      <span class="count" id="count"></span>
+    </div>
+  </header>
+  <main id="root"><p class="empty">Loading…</p></main>
+
+  <script>
+    const SUIT={s:"♠",h:"♥",d:"♦",c:"♣"}, RED=new Set(["h","d"]);
+    function esc(s){const d=document.createElement('div');d.textContent=s==null?'':String(s);return d.innerHTML;}
+    function cardEl(code){
+      if(!code) return '';
+      const c=String(code).trim();
+      if(c.toLowerCase()==='x') return '<span class="card unknown">?</span>';
+      const m=c.match(/^(10|[2-9TJQKA])\s*([shdcx])$/i);
+      if(!m) return `<span class="card">${esc(c)}</span>`;
+      const r=m[1].toUpperCase().replace('10','T'), s=m[2].toLowerCase();
+      if(s==='x') return `<span class="card"><span>${r}</span><span class="nosuit">·</span></span>`;
+      return `<span class="card${RED.has(s)?' red':''}"><span>${r}</span><span>${SUIT[s]}</span></span>`;
+    }
+    const cards=str=>(str?String(str).trim().split(/\s+/):[]).map(cardEl).join('');
+
+    async function load(){
+      try{
+        const r=await fetch('/hands/data',{cache:'no-store'});
+        const hands=(await r.json()).hands||[];
+        document.getElementById('count').textContent=`${hands.length} hand${hands.length===1?'':'s'}`;
+        if(!hands.length){document.getElementById('root').innerHTML='<p class="empty">No hands recorded yet. Tell Lyra: "log this hand: …"</p>';return;}
+        document.getElementById('root').innerHTML=hands.map(h=>{
+          const res=h.result!=null?`<span class="res ${h.result>=0?'pos-res':'neg-res'}">${h.result>=0?'+':''}${h.result}</span>`:'';
+          const meta=[h.stakes,h.venue,(h.at||'').slice(0,10)].filter(Boolean).join(' · ');
+          const tag=h.tag?` · <span class="tag">${esc(h.tag)}</span>`:'';
+          return `<a class="hand" href="/hand/${h.id}">
+            <span class="cards">${cards(h.hole_cards)||'<span class="card unknown">?</span>'}</span>
+            <span class="mid">
+              <div class="ln1">${esc(h.position||'')} ${h.board?'· '+'<span class="cards" style="display:inline-flex">'+cards(h.board)+'</span>':''}</div>
+              <div class="ln2">${esc(meta)}${tag}</div>
+            </span>${res}</a>`;
+        }).join('');
+      }catch(e){document.getElementById('root').innerHTML='<p class="empty">Couldn\'t load hands.</p>';}
+    }
+    load();
+  </script>
+</body>
+</html>
diff --git a/lyra/web/static/index.html b/lyra/web/static/index.html
index fad6703..5ad59ac 100644
--- a/lyra/web/static/index.html
+++ b/lyra/web/static/index.html
@@ -39,6 +39,7 @@
       <button id="mobileFullLogBtn">⛶ Full Log</button>
       <button id="mobileMindBtn">🧠 Read Her Mind</button>
       <button id="mobileJournalBtn">📔 Journal</button>
+      <button id="mobileHandsBtn">🃏 Hands</button>
       <button id="mobileSettingsBtn">⚙ Settings</button>
       <button id="mobileToggleThemeBtn">🌙 Toggle Theme</button>
       <button id="mobileForceReloadBtn">🔄 Force Reload</button>
@@ -74,6 +75,7 @@
       <button id="thinkingStreamBtn" title="Show live activity log">📜 Live Log</button>
       <a id="fullLogBtn" href="/logs" target="_blank" rel="noopener" title="Open the full-page log" role="button">⛶ Full Log</a>
       <a id="mindBtn" href="/self" target="_blank" rel="noopener" title="Read her mind — Lyra's current self-state" role="button">🧠 Mind</a>
+      <a id="handsBtn" href="/hands" target="_blank" rel="noopener" title="Recorded poker hands" role="button">🃏 Hands</a>
     </div>
 
     <!-- Status -->
@@ -827,6 +829,9 @@
       document.getElementById("mobileJournalBtn").addEventListener("click", () => {
         closeMobileMenu(); window.location.href = "/journal";
       });
+      document.getElementById("mobileHandsBtn").addEventListener("click", () => {
+        closeMobileMenu(); window.location.href = "/hands";
+      });
 
       // Connect to the global live log on page load.
       connectThinkingStream();
diff --git a/lyra/web/static/recap.html b/lyra/web/static/recap.html
new file mode 100644
index 0000000..12c8878
--- /dev/null
+++ b/lyra/web/static/recap.html
@@ -0,0 +1,78 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+  <meta charset="UTF-8" />
+  <meta name="viewport" content="width=device-width, initial-scale=1.0, viewport-fit=cover" />
+  <meta name="theme-color" content="#0b0d12" />
+  <title>Lyra — Recap</title>
+  <style>
+    :root{--bg:#0b0d12;--bg-elev:#141821;--bg-line:#11141b;--border:#232936;--text:#e6e9ef;--fade:#8b93a7;--accent:#7aa2ff;}
+    *{box-sizing:border-box;}
+    html,body{margin:0;min-height:100%;background:var(--bg);color:var(--text);
+      font-family:-apple-system,BlinkMacSystemFont,"Segoe UI",Roboto,sans-serif;-webkit-text-size-adjust:100%;}
+    header{position:sticky;top:0;z-index:10;background:var(--bg-elev);border-bottom:1px solid var(--border);
+      padding:env(safe-area-inset-top) 14px 0;}
+    .topbar{display:flex;align-items:center;gap:10px;padding:12px 0;flex-wrap:wrap;}
+    .topbar h1{font-size:1.02rem;margin:0;font-weight:600;}
+    .topbar a.back{color:var(--accent);text-decoration:none;font-size:.92rem;}
+    .dl{margin-left:auto;background:#1b2333;border:1px solid var(--border);color:var(--accent);
+      border-radius:8px;padding:7px 12px;font-size:.85rem;text-decoration:none;}
+    main{max-width:740px;margin:0 auto;padding:18px 16px 48px;line-height:1.6;}
+    h1,h2,h3,h4{line-height:1.3;color:var(--text);}
+    main>h1:first-child{margin-top:0;}
+    h2{font-size:1.18rem;border-bottom:1px solid var(--border);padding-bottom:5px;margin-top:26px;color:var(--accent);}
+    h3{font-size:1.04rem;margin-top:18px;}
+    ul{padding-left:22px;} li{margin:3px 0;}
+    strong{color:var(--text);} hr{border:none;border-top:1px solid var(--border);margin:20px 0;}
+    code{background:rgba(255,255,255,.08);padding:1px 5px;border-radius:4px;font-size:.9em;}
+    .err{color:var(--fade);text-align:center;padding:46px 16px;}
+  </style>
+</head>
+<body>
+  <header>
+    <div class="topbar">
+      <h1>📋 Recap</h1>
+      <a class="back" href="/">← Chat</a>
+      <a class="back" href="/hands">Hands</a>
+      <a class="dl" id="dl">⬇ .md</a>
+    </div>
+  </header>
+  <main id="root"><p class="err">Loading recap…</p></main>
+
+  <script>
+    const bt = String.fromCharCode(96);
+    function esc(s){return String(s==null?'':s).replace(/&/g,"&amp;").replace(/</g,"&lt;").replace(/>/g,"&gt;");}
+    function inline(s){
+      const codeRe = new RegExp(bt+"([^"+bt+"]+)"+bt,"g");
+      return esc(s).replace(codeRe,"<code>$1</code>")
+        .replace(/\*\*([^*]+)\*\*/g,"<strong>$1</strong>")
+        .replace(/(^|[^*])\*([^*\n]+)\*/g,"$1<em>$2</em>");
+    }
+    function md(src){
+      const lines=String(src||"").replace(/\r\n/g,"\n").split("\n");
+      const out=[]; let list=null;
+      const flush=()=>{if(list){out.push("<ul>"+list.map(i=>"<li>"+inline(i)+"</li>").join("")+"</ul>");list=null;}};
+      for(const raw of lines){
+        const t=raw.replace(/\s+$/,""); let m;
+        if(!t.trim()){flush();continue;}
+        if(/^(-{3,}|\*{3,}|_{3,})$/.test(t.trim())){flush();out.push("<hr>");continue;}
+        if((m=t.match(/^(#{1,6})\s+(.*)$/))){flush();const n=m[1].length;out.push(`<h${n}>${inline(m[2])}</h${n}>`);continue;}
+        if((m=t.match(/^\s*[-*+]\s+(.*)$/))){(list=list||[]).push(m[1]);continue;}
+        flush();out.push("<p>"+inline(t)+"</p>");
+      }
+      flush(); return out.join("\n");
+    }
+    async function load(){
+      const id=location.pathname.split('/')[2];
+      document.getElementById('dl').href=`/recap/${id}/download`;
+      try{
+        const r=await fetch(`/recap/${id}/data`,{cache:'no-store'});
+        const d=await r.json();
+        if(!d.markdown){document.getElementById('root').innerHTML='<p class="err">No recap yet for this session. Ask Lyra to write one ("generate the recap").</p>';return;}
+        document.getElementById('root').innerHTML=md(d.markdown);
+      }catch(e){document.getElementById('root').innerHTML='<p class="err">Couldn\'t load the recap.</p>';}
+    }
+    load();
+  </script>
+</body>
+</html>
diff --git a/tests/test_poker.py b/tests/test_poker.py
index ba18a49..914985c 100644
--- a/tests/test_poker.py
+++ b/tests/test_poker.py
@@ -95,6 +95,27 @@ def test_record_hand_tool_parses_and_stores(lyra, monkeypatch):
     assert h["result"] == -300
 
 
+def test_generate_recap(lyra, monkeypatch):
+    poker = lyra
+    from lyra import llm
+    monkeypatch.setattr(llm, "complete",
+                        lambda messages, backend=None, model=None: "# Recap\n## Final Assessment\nGood session.")
+    sid = poker.start_session(venue="Meadows", stakes="1/3", buy_in=300)
+    poker.log_hand(position="BTN", hole_cards="AKs", result=180, tag="confidence")
+    poker.end_session(540, session_id=sid)
+    out = poker.generate_recap(session_id=sid)
+    assert out["id"] == sid and "Final Assessment" in out["markdown"]
+    assert "Recap" in poker.get_session(sid)["recap_md"]
+
+
+def test_list_recent_hands(lyra):
+    poker = lyra
+    poker.start_session(stakes="1/3", buy_in=300)
+    poker.log_hand(position="CO", hole_cards="QQ", result=-50)
+    hh = poker.list_recent_hands()
+    assert hh and hh[0]["hole_cards"] == "QQ" and hh[0]["stakes"] == "1/3"
+
+
 def test_poker_tools_dispatch(lyra):
     from lyra import tools
     assert "started" in tools.dispatch("start_session", {"stakes": "1/3", "buy_in": 300})
-- 
2.52.0


From 4882225751c45cb5cd6cf57a5e03a604ed8156f8 Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Thu, 18 Jun 2026 00:53:18 +0000
Subject: [PATCH 39/51] feat: live stacks in hand viewer + retheme UI to RTO
 black/orange palette
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Hand viewer:
- stacks now decrement as players commit chips (street-aware "to"-amount
  accounting), showing e.g. 300 -> 285 after a 15 open, "all in" at 0; pot is
  computed from total committed (accurate, no double-counting raises)

Theme (match the rec-theory-optimal look — warm black & orange, not Halloween):
- deep near-black bg (#070707 / #0e0e0e panels), warm orange accent (#ff7a00),
  amber-gold secondary (#ffb347), muted green (#8fd694); warm dark borders
- killed the neon-orange glows and the purple accents; chat app + all standalone
  pages (logs/self/journal/hand/recap/hands) on one palette

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 lyra/web/static/hand.html    |   58 +-
 lyra/web/static/hands.html   |    8 +-
 lyra/web/static/journal.html |   10 +-
 lyra/web/static/logs.html    |   30 +-
 lyra/web/static/recap.html   |    6 +-
 lyra/web/static/self.html    |   10 +-
 lyra/web/static/style.css    | 1992 +++++++++++++++++-----------------
 7 files changed, 1069 insertions(+), 1045 deletions(-)

diff --git a/lyra/web/static/hand.html b/lyra/web/static/hand.html
index 60577ba..7c5f1df 100644
--- a/lyra/web/static/hand.html
+++ b/lyra/web/static/hand.html
@@ -3,13 +3,13 @@
 <head>
   <meta charset="UTF-8" />
   <meta name="viewport" content="width=device-width, initial-scale=1.0, viewport-fit=cover" />
-  <meta name="theme-color" content="#0b0d12" />
+  <meta name="theme-color" content="#070707" />
   <title>Lyra — Hand</title>
   <style>
     :root {
-      --bg:#0b0d12; --bg-elev:#141821; --border:#232936; --text:#e6e9ef;
-      --fade:#8b93a7; --accent:#7aa2ff; --felt:#16322a; --feltline:#0f5132;
-      --chip:#ffcf6b; --hero:#7aa2ff;
+      --bg:#070707; --bg-elev:#0e0e0e; --border:#2a1d12; --text:#e8e8e8;
+      --fade:#8a8a8a; --accent:#ff7a00; --felt:#16322a; --feltline:#0f5132;
+      --chip:#ffb347; --hero:#ff7a00;
     }
     *{box-sizing:border-box;}
     html,body{margin:0;min-height:100%;background:var(--bg);color:var(--text);
@@ -42,8 +42,8 @@
 
     .seat{position:absolute;transform:translate(-50%,-50%);width:96px;text-align:center;
       background:rgba(13,16,22,.85);border:1px solid var(--border);border-radius:10px;padding:5px 4px;}
-    .seat.hero{border-color:var(--hero);box-shadow:0 0 10px rgba(122,162,255,.4);}
-    .seat.acting{border-color:var(--chip);box-shadow:0 0 12px rgba(255,207,107,.6);}
+    .seat.hero{border-color:var(--hero);box-shadow:0 0 10px rgba(255,122,0,.4);}
+    .seat.acting{border-color:var(--chip);box-shadow:0 0 12px rgba(255,179,71,.6);}
     .seat .pos{font-size:.66rem;color:var(--accent);font-weight:700;letter-spacing:.4px;}
     .seat .nm{font-size:.66rem;color:var(--fade);white-space:nowrap;overflow:hidden;text-overflow:ellipsis;}
     .seat .cards{display:flex;gap:3px;justify-content:center;margin:3px 0;}
@@ -52,7 +52,7 @@
     .seat.folded{opacity:.4;}
 
     .controls{display:flex;gap:8px;align-items:center;justify-content:center;margin:14px 0 6px;}
-    .controls button{background:#1b2333;border:1px solid var(--border);color:var(--text);
+    .controls button{background:#241400;border:1px solid var(--border);color:var(--text);
       border-radius:8px;padding:8px 14px;font-size:.95rem;cursor:pointer;-webkit-tap-highlight-color:transparent;}
     .controls button:disabled{opacity:.4;}
     .step-label{color:var(--fade);font-size:.8rem;min-width:80px;text-align:center;}
@@ -60,13 +60,13 @@
 
     .log{margin-top:14px;border-top:1px solid var(--border);padding-top:10px;}
     .log .ln{padding:5px 8px;border-radius:6px;font-size:.9rem;display:flex;gap:8px;}
-    .log .ln.cur{background:#1b2333;}
+    .log .ln.cur{background:#241400;}
     .log .ln.brd{color:var(--fade);font-style:italic;}
     .log .st{color:var(--fade);font-size:.72rem;width:54px;flex:none;text-transform:uppercase;}
     .summary{margin-top:14px;background:var(--bg-elev);border:1px solid var(--border);border-radius:10px;padding:12px;}
     .summary .lbl{color:var(--fade);font-size:.72rem;text-transform:uppercase;letter-spacing:.5px;}
     .err{color:#ff6b6b;text-align:center;padding:40px;}
-    .net-pos{color:#5ad1a0;} .net-neg{color:#ff6b6b;}
+    .net-pos{color:#8fd694;} .net-neg{color:#ff6b6b;}
   </style>
 </head>
 <body>
@@ -140,7 +140,9 @@
 
       // place seats around the oval
       const seatsEl = document.getElementById('seats');
+      const starts = {};
       ordered.forEach((p,i)=>{
+        starts[p.pos] = (p.stack!=null ? Number(p.stack) : null);
         const ang = (90 + i*(360/n)) * Math.PI/180;  // bottom = 90deg
         const x = 50 + 46*Math.cos(ang), y = 50 + 44*Math.sin(ang);
         const el = document.createElement('div');
@@ -151,7 +153,7 @@
         el.innerHTML = `<div class="pos">${esc(p.pos||'')}</div>`
           + (p.name?`<div class="nm">${esc(p.name)}</div>`:'')
           + `<div class="cards">${hcards?cards(hcards,true):'<span class="card sm back">x</span><span class="card sm back">x</span>'}</div>`
-          + (p.stack!=null?`<div class="stack">${esc(p.stack)}</div>`:'')
+          + `<div class="stack" data-stack>${p.stack!=null?esc(p.stack):''}</div>`
           + `<div class="act" data-act></div>`;
         seatsEl.appendChild(el);
       });
@@ -167,25 +169,47 @@
         return `<div class="ln" data-i="${idx}"><span class="st">${esc(a.street||'')}</span>${esc(a.pos||'')} ${esc(a.action||'')}${amt}</div>`;
       }).join('');
 
+      const cap = s => s ? s[0].toUpperCase()+s.slice(1) : s;
+      const fmt = n => Number.isInteger(n) ? n : Math.round(n*100)/100;
+
       function draw(){
-        let pot = 0, board = [], street = 'Preflop';
+        let board = [], street = 'Preflop';
         const lastAct = {}, folded = {};
+        // street-aware chip accounting: amounts are "to" totals for the street
+        const contrib = {};                 // committed in prior (flushed) streets
+        let streetCommit = {}, streetBet = 0, curStreet = 'preflop';
+        const flushStreet = () => { for(const p in streetCommit){ contrib[p]=(contrib[p]||0)+streetCommit[p]; } streetCommit={}; streetBet=0; };
         for(let i=0;i<step;i++){
           const a = acts[i];
-          if(a.board){ board = a.board; street = a.street; continue; }
-          if(a.street) street = a.street;
-          if(a.amount!=null && ['call','bet','raise','allin','post'].includes(a.action)) pot += Number(a.amount)||0;
-          if(a.pos){ lastAct[a.pos] = (a.action||'') + (a.amount!=null?' '+a.amount:''); }
-          if(a.action==='fold' && a.pos) folded[a.pos]=true;
+          if(a.board){ flushStreet(); curStreet=a.street; board=a.board; street=cap(a.street); continue; }
+          if(a.street && a.street!==curStreet){ flushStreet(); curStreet=a.street; }
+          if(a.street) street = cap(a.street);
+          const pos=a.pos, amt=(a.amount!=null?Number(a.amount):null);
+          if(pos){
+            switch(a.action){
+              case 'post': case 'bet': streetCommit[pos]=amt||0; streetBet=Math.max(streetBet, amt||0); break;
+              case 'raise': case 'allin': streetCommit[pos]=(amt!=null?amt:streetBet); streetBet=Math.max(streetBet, streetCommit[pos]); break;
+              case 'call': streetCommit[pos]=(amt!=null?amt:streetBet); break;
+              case 'fold': folded[pos]=true; break;
+            }
+            lastAct[pos]=(a.action||'')+(amt!=null?' '+amt:'');
+          }
         }
+        // committed total per player (flushed streets + current street), pot = sum
+        const committed={}, allPos=new Set([...Object.keys(contrib),...Object.keys(streetCommit)]);
+        let pot=0;
+        allPos.forEach(p=>{ committed[p]=(contrib[p]||0)+(streetCommit[p]||0); pot+=committed[p]; });
         boardEl.innerHTML = cards(board);
-        potEl.textContent = pot ? ('Pot ~'+pot) : '';
+        potEl.textContent = pot ? ('Pot '+fmt(pot)) : '';
         streetEl.textContent = street;
         document.querySelectorAll('.seat').forEach(s=>{
           const pos=s.dataset.pos;
           s.querySelector('[data-act]').textContent = lastAct[pos]||'';
           s.classList.toggle('folded', !!folded[pos]);
           s.classList.remove('acting');
+          const stEl=s.querySelector('[data-stack]'), start=starts[pos], c=committed[pos]||0;
+          if(start!=null){ const rem=start-c; stEl.textContent = rem<=0 ? 'all in' : fmt(rem); }
+          else { stEl.textContent = c ? '−'+fmt(c) : ''; }
         });
         const cur = acts[step-1];
         if(cur && cur.pos){
diff --git a/lyra/web/static/hands.html b/lyra/web/static/hands.html
index 7055f51..f6d3e36 100644
--- a/lyra/web/static/hands.html
+++ b/lyra/web/static/hands.html
@@ -3,10 +3,10 @@
 <head>
   <meta charset="UTF-8" />
   <meta name="viewport" content="width=device-width, initial-scale=1.0, viewport-fit=cover" />
-  <meta name="theme-color" content="#0b0d12" />
+  <meta name="theme-color" content="#070707" />
   <title>Lyra — Hands</title>
   <style>
-    :root{--bg:#0b0d12;--bg-elev:#141821;--bg-line:#11141b;--border:#232936;--text:#e6e9ef;--fade:#8b93a7;--accent:#7aa2ff;}
+    :root{--bg:#070707;--bg-elev:#0e0e0e;--bg-line:#141414;--border:#2a1d12;--text:#e8e8e8;--fade:#8a8a8a;--accent:#ff7a00;}
     *{box-sizing:border-box;}
     html,body{margin:0;min-height:100%;background:var(--bg);color:var(--text);
       font-family:-apple-system,BlinkMacSystemFont,"Segoe UI",Roboto,sans-serif;-webkit-text-size-adjust:100%;}
@@ -19,7 +19,7 @@
     main{max-width:640px;margin:0 auto;padding:12px 12px 40px;}
     a.hand{display:flex;align-items:center;gap:12px;text-decoration:none;color:var(--text);
       background:var(--bg-elev);border:1px solid var(--border);border-radius:10px;padding:10px 12px;margin-bottom:8px;}
-    a.hand:active{background:#1b2333;}
+    a.hand:active{background:#241400;}
     .cards{display:flex;gap:4px;flex:none;}
     .card{display:inline-flex;flex-direction:column;align-items:center;justify-content:center;
       width:24px;height:33px;background:#f4f4f0;color:#111;border-radius:4px;font-weight:700;font-size:.72rem;line-height:1;}
@@ -29,7 +29,7 @@
     .ln1{font-size:.92rem;}
     .ln2{font-size:.74rem;color:var(--fade);white-space:nowrap;overflow:hidden;text-overflow:ellipsis;}
     .res{flex:none;font-variant-numeric:tabular-nums;font-weight:600;}
-    .pos-res{color:#5ad1a0;} .neg-res{color:#ff6b6b;}
+    .pos-res{color:#8fd694;} .neg-res{color:#ff6b6b;}
     .tag{font-size:.62rem;text-transform:uppercase;letter-spacing:.4px;color:var(--accent);}
     .empty{color:var(--fade);text-align:center;padding:46px 16px;}
   </style>
diff --git a/lyra/web/static/journal.html b/lyra/web/static/journal.html
index 0fb8995..4efba0f 100644
--- a/lyra/web/static/journal.html
+++ b/lyra/web/static/journal.html
@@ -3,13 +3,13 @@
 <head>
   <meta charset="UTF-8" />
   <meta name="viewport" content="width=device-width, initial-scale=1.0, viewport-fit=cover" />
-  <meta name="theme-color" content="#0b0d12" />
+  <meta name="theme-color" content="#070707" />
   <title>Lyra — Journal</title>
   <style>
     :root {
-      --bg: #0b0d12; --bg-elev: #141821; --bg-line: #11141b; --border: #232936;
-      --text: #e6e9ef; --fade: #8b93a7; --accent: #7aa2ff;
-      --reflection: #5ad1a0; --metacognition: #c08bff; --journal: #ffcf6b;
+      --bg: #070707; --bg-elev: #0e0e0e; --bg-line: #141414; --border: #2a1d12;
+      --text: #e8e8e8; --fade: #8a8a8a; --accent: #ff7a00;
+      --reflection: #8fd694; --metacognition: #ffb347; --journal: #ff7a00;
     }
     * { box-sizing: border-box; }
     html, body {
@@ -31,7 +31,7 @@
       border: 1px solid var(--border); background: var(--bg-line); color: var(--fade);
       cursor: pointer; user-select: none; -webkit-tap-highlight-color: transparent;
     }
-    .chip.active { color: var(--text); border-color: var(--accent); background: #1b2333; }
+    .chip.active { color: var(--text); border-color: var(--accent); background: #241400; }
 
     main { max-width: 720px; margin: 0 auto; padding: 14px 14px 48px; }
     .day { color: var(--fade); font-size: .8rem; text-transform: uppercase; letter-spacing: .5px;
diff --git a/lyra/web/static/logs.html b/lyra/web/static/logs.html
index 3bf5347..b368336 100644
--- a/lyra/web/static/logs.html
+++ b/lyra/web/static/logs.html
@@ -3,22 +3,22 @@
 <head>
   <meta charset="UTF-8" />
   <meta name="viewport" content="width=device-width, initial-scale=1.0, viewport-fit=cover" />
-  <meta name="theme-color" content="#0b0d12" />
+  <meta name="theme-color" content="#070707" />
   <title>Lyra — Live Log</title>
   <style>
     :root {
-      --bg: #0b0d12;
-      --bg-elev: #141821;
-      --bg-line: #11141b;
-      --border: #232936;
-      --text: #e6e9ef;
-      --fade: #8b93a7;
-      --accent: #7aa2ff;
-      --info: #5ad1a0;
-      --debug: #8b93a7;
+      --bg: #070707;
+      --bg-elev: #0e0e0e;
+      --bg-line: #141414;
+      --border: #2a1d12;
+      --text: #e8e8e8;
+      --fade: #8a8a8a;
+      --accent: #ff7a00;
+      --info: #8fd694;
+      --debug: #8a8a8a;
       --error: #ff6b6b;
-      --system: #c08bff;
-      --warn: #ffcf6b;
+      --system: #ffb347;
+      --warn: #ffb347;
     }
     * { box-sizing: border-box; }
     html, body {
@@ -56,7 +56,7 @@
       border: 1px solid var(--border); background: var(--bg-line); color: var(--fade);
       cursor: pointer; user-select: none; -webkit-tap-highlight-color: transparent;
     }
-    .chip.active { color: var(--text); border-color: var(--accent); background: #1b2333; }
+    .chip.active { color: var(--text); border-color: var(--accent); background: #241400; }
     #search {
       flex: 1 1 140px; min-width: 120px;
       background: var(--bg-line); border: 1px solid var(--border); color: var(--text);
@@ -85,9 +85,9 @@
       padding: 1px 7px; border-radius: 5px; font-weight: 700; flex: none;
     }
     .lvl-info   { color: var(--info);   background: #0f2a20; }
-    .lvl-debug  { color: var(--debug);  background: #1a1f29; }
+    .lvl-debug  { color: var(--debug);  background: #161616; }
     .lvl-error  { color: var(--error);  background: #2e1414; }
-    .lvl-system { color: var(--system); background: #221536; }
+    .lvl-system { color: var(--system); background: #2c2410; }
     .lvl-warn   { color: var(--warn);   background: #2c2410; }
     .msg { font-size: .92rem; font-weight: 500; }
     .fields {
diff --git a/lyra/web/static/recap.html b/lyra/web/static/recap.html
index 12c8878..e257756 100644
--- a/lyra/web/static/recap.html
+++ b/lyra/web/static/recap.html
@@ -3,10 +3,10 @@
 <head>
   <meta charset="UTF-8" />
   <meta name="viewport" content="width=device-width, initial-scale=1.0, viewport-fit=cover" />
-  <meta name="theme-color" content="#0b0d12" />
+  <meta name="theme-color" content="#070707" />
   <title>Lyra — Recap</title>
   <style>
-    :root{--bg:#0b0d12;--bg-elev:#141821;--bg-line:#11141b;--border:#232936;--text:#e6e9ef;--fade:#8b93a7;--accent:#7aa2ff;}
+    :root{--bg:#070707;--bg-elev:#0e0e0e;--bg-line:#141414;--border:#2a1d12;--text:#e8e8e8;--fade:#8a8a8a;--accent:#ff7a00;}
     *{box-sizing:border-box;}
     html,body{margin:0;min-height:100%;background:var(--bg);color:var(--text);
       font-family:-apple-system,BlinkMacSystemFont,"Segoe UI",Roboto,sans-serif;-webkit-text-size-adjust:100%;}
@@ -15,7 +15,7 @@
     .topbar{display:flex;align-items:center;gap:10px;padding:12px 0;flex-wrap:wrap;}
     .topbar h1{font-size:1.02rem;margin:0;font-weight:600;}
     .topbar a.back{color:var(--accent);text-decoration:none;font-size:.92rem;}
-    .dl{margin-left:auto;background:#1b2333;border:1px solid var(--border);color:var(--accent);
+    .dl{margin-left:auto;background:#241400;border:1px solid var(--border);color:var(--accent);
       border-radius:8px;padding:7px 12px;font-size:.85rem;text-decoration:none;}
     main{max-width:740px;margin:0 auto;padding:18px 16px 48px;line-height:1.6;}
     h1,h2,h3,h4{line-height:1.3;color:var(--text);}
diff --git a/lyra/web/static/self.html b/lyra/web/static/self.html
index 5835ddd..f959e8a 100644
--- a/lyra/web/static/self.html
+++ b/lyra/web/static/self.html
@@ -3,13 +3,13 @@
 <head>
   <meta charset="UTF-8" />
   <meta name="viewport" content="width=device-width, initial-scale=1.0, viewport-fit=cover" />
-  <meta name="theme-color" content="#0b0d12" />
+  <meta name="theme-color" content="#070707" />
   <title>Lyra — Mind</title>
   <style>
     :root {
-      --bg: #0b0d12; --bg-elev: #141821; --bg-line: #11141b; --border: #232936;
-      --text: #e6e9ef; --fade: #8b93a7; --accent: #7aa2ff;
-      --good: #5ad1a0; --mid: #ffcf6b; --low: #ff6b6b; --violet: #c08bff;
+      --bg: #070707; --bg-elev: #0e0e0e; --bg-line: #141414; --border: #2a1d12;
+      --text: #e8e8e8; --fade: #8a8a8a; --accent: #ff7a00;
+      --good: #8fd694; --mid: #ffb347; --low: #ff6b6b; --violet: #ffb347;
     }
     * { box-sizing: border-box; }
     html, body {
@@ -26,7 +26,7 @@
     .topbar a.back { color: var(--accent); text-decoration: none; font-size: .95rem; }
     .updated { margin-left: auto; color: var(--fade); font-size: .78rem; }
     #reflectBtn {
-      background: #1b2333; border: 1px solid var(--border); color: var(--accent);
+      background: #241400; border: 1px solid var(--border); color: var(--accent);
       border-radius: 8px; padding: 6px 11px; font-size: .82rem; cursor: pointer;
       -webkit-tap-highlight-color: transparent;
     }
diff --git a/lyra/web/static/style.css b/lyra/web/static/style.css
index fd4fe6f..61f8e18 100644
--- a/lyra/web/static/style.css
+++ b/lyra/web/static/style.css
@@ -1,996 +1,996 @@
-:root {
-  --bg-dark: #0a0a0a;
-  --bg-panel: rgba(255, 115, 0, 0.1);
-  --accent: #ff6600;
-  --accent-glow: 0 0 12px #ff6600cc;
-  --text-main: #e6e6e6;
-  --text-fade: #999;
-  --font-console: "IBM Plex Mono", monospace;
-}
-
-/* Light mode variables */
-body {
-  --bg-dark: #f5f5f5;
-  --bg-panel: rgba(255, 115, 0, 0.05);
-  --accent: #ff6600;
-  --accent-glow: 0 0 12px #ff6600cc;
-  --text-main: #1a1a1a;
-  --text-fade: #666;
-}
-
-/* Dark mode variables */
-body.dark {
-  --bg-dark: #0a0a0a;
-  --bg-panel: rgba(255, 115, 0, 0.1);
-  --accent: #ff6600;
-  --accent-glow: 0 0 12px #ff6600cc;
-  --text-main: #e6e6e6;
-  --text-fade: #999;
-}
-
-body {
-  margin: 0;
-  background: var(--bg-dark);
-  color: var(--text-main);
-  font-family: var(--font-console);
-  height: 100vh;
-  display: flex;
-  justify-content: center;
-  align-items: center;
-}
-
-#chat {
-  width: 95%;
-  max-width: 900px;
-  height: 95vh;
-  display: flex;
-  flex-direction: column;
-  border: 1px solid var(--accent);
-  border-radius: 10px;
-  box-shadow: var(--accent-glow);
-  background: var(--bg-dark);
-  overflow: hidden;
-}
-
-/* Header sections */
-#model-select, #session-select, #status {
-  display: flex;
-  align-items: center;
-  gap: 8px;
-  padding: 8px 12px;
-  border-bottom: 1px solid var(--accent);
-  background-color: rgba(255, 102, 0, 0.05);
-}
-#status {
-  justify-content: flex-start;
-  border-top: 1px solid var(--accent);
-}
-
-label, select, button {
-  font-family: var(--font-console);
-  font-size: 0.9rem;
-  color: var(--text-main);
-  background: transparent;
-  border: 1px solid var(--accent);
-  border-radius: 4px;
-  padding: 4px 8px;
-}
-
-button:hover, select:hover {
-  box-shadow: 0 0 8px var(--accent);
-  cursor: pointer;
-}
-
-#thinkingStreamBtn {
-  background: rgba(138, 43, 226, 0.2);
-  border-color: #8a2be2;
-}
-
-#thinkingStreamBtn:hover {
-  box-shadow: 0 0 8px #8a2be2;
-  background: rgba(138, 43, 226, 0.3);
-}
-
-/* Chat area */
-#messages {
-  flex: 1;
-  padding: 16px;
-  overflow-y: auto;
-  display: flex;
-  flex-direction: column;
-  gap: 8px;
-  scroll-behavior: smooth;
-}
-
-/* Messages */
-.msg {
-  max-width: 80%;
-  padding: 10px 14px;
-  border-radius: 8px;
-  line-height: 1.4;
-  word-wrap: break-word;
-  box-shadow: 0 0 8px rgba(255,102,0,0.2);
-}
-.msg.user {
-  align-self: flex-end;
-  background: rgba(255,102,0,0.15);
-  border: 1px solid var(--accent);
-}
-.msg.assistant {
-  align-self: flex-start;
-  background: rgba(255,102,0,0.08);
-  border: 1px solid rgba(255,102,0,0.5);
-}
-.msg.system {
-  align-self: center;
-  font-size: 0.8rem;
-  color: var(--text-fade);
-}
-
-/* Input bar */
-#input {
-  display: flex;
-  border-top: 1px solid var(--accent);
-  background: rgba(255, 102, 0, 0.05);
-  padding: 10px;
-}
-#userInput {
-  flex: 1;
-  background: transparent;
-  color: var(--text-main);
-  border: 1px solid var(--accent);
-  border-radius: 4px;
-  padding: 8px;
-}
-#sendBtn {
-  margin-left: 8px;
-}
-
-/* Relay status dot */
-#status {
-  display: flex;
-  align-items: center;
-  margin: 10px 0;
-  gap: 8px;
-  font-family: monospace;
-  color: #f5f5f5;
-}
-
-#status-dot {
-  width: 10px;
-  height: 10px;
-  border-radius: 50%;
-  display: inline-block;
-}
-
-@keyframes pulseGreen {
-  0% { box-shadow: 0 0 5px #00ff66; opacity: 0.9; }
-  50% { box-shadow: 0 0 20px #00ff99; opacity: 1; }
-  100% { box-shadow: 0 0 5px #00ff66; opacity: 0.9; }
-}
-
-.dot.ok {
-  background: #00ff66;
-  animation: pulseGreen 2s infinite ease-in-out;
-}
-
-/* Offline state stays solid red */
-.dot.fail {
-  background: #ff3333;
-  box-shadow: 0 0 10px #ff3333;
-}
-
-
-/* Dropdown (session selector) styling */
-select {
-  background-color: var(--bg-dark);
-  color: var(--text-main);
-  border: 1px solid #b84a12;
-  border-radius: 6px;
-  padding: 4px 6px;
-  font-size: 14px;
-}
-
-select option {
-  background-color: var(--bg-dark);
-  color: var(--text-main);
-}
-
-/* Hover/focus for better visibility */
-select:focus,
-select:hover {
-  outline: none;
-  border-color: #ff7a33;
-  background-color: var(--bg-panel);
-}
-
-/* Settings Modal */
-.modal {
-  display: none !important;
-  position: fixed;
-  top: 0;
-  left: 0;
-  width: 100%;
-  height: 100%;
-  z-index: 1000;
-}
-
-.modal.show {
-  display: block !important;
-}
-
-.modal-overlay {
-  position: fixed;
-  top: 0;
-  left: 0;
-  width: 100%;
-  height: 100%;
-  background: rgba(0, 0, 0, 0.8);
-  backdrop-filter: blur(4px);
-  z-index: 999;
-}
-
-.modal-content {
-  position: fixed;
-  top: 50%;
-  left: 50%;
-  transform: translate(-50%, -50%);
-  background: linear-gradient(180deg, rgba(255,102,0,0.1) 0%, rgba(10,10,10,0.95) 100%);
-  border: 2px solid var(--accent);
-  border-radius: 12px;
-  box-shadow: var(--accent-glow), 0 0 40px rgba(255,102,0,0.3);
-  min-width: 400px;
-  max-width: 600px;
-  max-height: 80vh;
-  overflow-y: auto;
-  z-index: 1001;
-}
-
-.modal-header {
-  display: flex;
-  justify-content: space-between;
-  align-items: center;
-  padding: 16px 20px;
-  border-bottom: 1px solid var(--accent);
-  background: rgba(255,102,0,0.1);
-}
-
-.modal-header h3 {
-  margin: 0;
-  font-size: 1.2rem;
-  color: var(--accent);
-}
-
-.close-btn {
-  background: transparent;
-  border: none;
-  color: var(--accent);
-  font-size: 1.5rem;
-  cursor: pointer;
-  padding: 0;
-  width: 30px;
-  height: 30px;
-  display: flex;
-  align-items: center;
-  justify-content: center;
-  border-radius: 4px;
-}
-
-.close-btn:hover {
-  background: rgba(255,102,0,0.2);
-  box-shadow: 0 0 8px var(--accent);
-}
-
-.modal-body {
-  padding: 20px;
-}
-
-.settings-section h4 {
-  margin: 0 0 8px 0;
-  color: var(--accent);
-  font-size: 1rem;
-}
-
-.settings-desc {
-  margin: 0 0 16px 0;
-  color: var(--text-fade);
-  font-size: 0.85rem;
-}
-
-.radio-group {
-  display: flex;
-  flex-direction: column;
-  gap: 12px;
-}
-
-.radio-label {
-  display: flex;
-  flex-direction: column;
-  padding: 12px;
-  border: 1px solid rgba(255,102,0,0.3);
-  border-radius: 6px;
-  background: rgba(255,102,0,0.05);
-  cursor: pointer;
-  transition: all 0.2s;
-}
-
-.radio-label:hover {
-  border-color: var(--accent);
-  background: rgba(255,102,0,0.1);
-  box-shadow: 0 0 8px rgba(255,102,0,0.3);
-}
-
-.radio-label input[type="radio"] {
-  margin-right: 8px;
-  accent-color: var(--accent);
-}
-
-.radio-label span {
-  font-weight: 500;
-  margin-bottom: 4px;
-}
-
-.radio-label small {
-  color: var(--text-fade);
-  font-size: 0.8rem;
-  margin-left: 24px;
-}
-
-.radio-label input[type="text"] {
-  margin-top: 8px;
-  margin-left: 24px;
-  padding: 6px;
-  background: rgba(0,0,0,0.3);
-  border: 1px solid rgba(255,102,0,0.5);
-  border-radius: 4px;
-  color: var(--text-main);
-  font-family: var(--font-console);
-}
-
-.radio-label input[type="text"]:focus {
-  outline: none;
-  border-color: var(--accent);
-  box-shadow: 0 0 8px rgba(255,102,0,0.3);
-}
-
-.modal-footer {
-  display: flex;
-  justify-content: flex-end;
-  gap: 10px;
-  padding: 16px 20px;
-  border-top: 1px solid var(--accent);
-  background: rgba(255,102,0,0.05);
-}
-
-.primary-btn {
-  background: var(--accent);
-  color: #000;
-  font-weight: bold;
-}
-
-.primary-btn:hover {
-  background: #ff7a33;
-  box-shadow: var(--accent-glow);
-}
-
-/* Session List */
-.session-list {
-  display: flex;
-  flex-direction: column;
-  gap: 8px;
-  max-height: 300px;
-  overflow-y: auto;
-}
-
-.session-item {
-  display: flex;
-  justify-content: space-between;
-  align-items: center;
-  padding: 12px;
-  border: 1px solid rgba(255,102,0,0.3);
-  border-radius: 6px;
-  background: rgba(255,102,0,0.05);
-  transition: all 0.2s;
-}
-
-.session-item:hover {
-  border-color: var(--accent);
-  background: rgba(255,102,0,0.1);
-}
-
-.session-info {
-  display: flex;
-  flex-direction: column;
-  gap: 4px;
-  flex: 1;
-}
-
-.session-info strong {
-  color: var(--text-main);
-  font-size: 0.95rem;
-}
-
-.session-info small {
-  color: var(--text-fade);
-  font-size: 0.75rem;
-}
-
-.session-delete-btn {
-  background: transparent;
-  border: 1px solid rgba(255,102,0,0.5);
-  color: var(--accent);
-  padding: 6px 10px;
-  border-radius: 4px;
-  cursor: pointer;
-  font-size: 1rem;
-  transition: all 0.2s;
-}
-
-.session-delete-btn:hover {
-  background: rgba(255,0,0,0.2);
-  border-color: #ff3333;
-  color: #ff3333;
-  box-shadow: 0 0 8px rgba(255,0,0,0.3);
-}
-
-/* Thinking Stream Panel */
-.thinking-panel {
-  border-top: 1px solid var(--accent);
-  background: rgba(255, 102, 0, 0.02);
-  display: flex;
-  flex-direction: column;
-  transition: max-height 0.3s ease;
-  max-height: 300px;
-}
-
-.thinking-panel.collapsed {
-  max-height: 40px;
-}
-
-.thinking-header {
-  display: flex;
-  justify-content: space-between;
-  align-items: center;
-  padding: 10px 12px;
-  background: rgba(255, 102, 0, 0.08);
-  cursor: pointer;
-  user-select: none;
-  border-bottom: 1px solid rgba(255, 102, 0, 0.2);
-  font-size: 0.9rem;
-  font-weight: 500;
-}
-
-.thinking-header:hover {
-  background: rgba(255, 102, 0, 0.12);
-}
-
-.thinking-controls {
-  display: flex;
-  align-items: center;
-  gap: 8px;
-}
-
-.thinking-status-dot {
-  width: 8px;
-  height: 8px;
-  border-radius: 50%;
-  background: #666;
-  display: inline-block;
-}
-
-.thinking-status-dot.connected {
-  background: #00ff66;
-  box-shadow: 0 0 8px #00ff66;
-}
-
-.thinking-status-dot.disconnected {
-  background: #ff3333;
-}
-
-.thinking-clear-btn,
-.thinking-toggle-btn {
-  background: transparent;
-  border: 1px solid rgba(255, 102, 0, 0.5);
-  color: var(--text-main);
-  padding: 4px 8px;
-  border-radius: 4px;
-  cursor: pointer;
-  font-size: 0.85rem;
-}
-
-.thinking-clear-btn:hover,
-.thinking-toggle-btn:hover {
-  background: rgba(255, 102, 0, 0.2);
-  box-shadow: 0 0 6px rgba(255, 102, 0, 0.3);
-}
-
-.thinking-toggle-btn {
-  transition: transform 0.3s ease;
-}
-
-.thinking-panel.collapsed .thinking-toggle-btn {
-  transform: rotate(-90deg);
-}
-
-.thinking-content {
-  flex: 1;
-  overflow-y: auto;
-  padding: 12px;
-  display: flex;
-  flex-direction: column;
-  gap: 8px;
-  min-height: 0;
-}
-
-.thinking-panel.collapsed .thinking-content {
-  display: none;
-}
-
-.thinking-empty {
-  text-align: center;
-  padding: 40px 20px;
-  color: var(--text-fade);
-  font-size: 0.85rem;
-}
-
-.thinking-empty-icon {
-  font-size: 2rem;
-  margin-bottom: 10px;
-}
-
-.thinking-event {
-  padding: 8px 12px;
-  border-radius: 6px;
-  font-size: 0.85rem;
-  font-family: 'Courier New', monospace;
-  animation: thinkingSlideIn 0.3s ease-out;
-  border-left: 3px solid;
-  word-wrap: break-word;
-}
-
-@keyframes thinkingSlideIn {
-  from {
-    opacity: 0;
-    transform: translateY(-10px);
-  }
-  to {
-    opacity: 1;
-    transform: translateY(0);
-  }
-}
-
-.thinking-event-connected {
-  background: rgba(0, 255, 102, 0.1);
-  border-color: #00ff66;
-  color: #00ff66;
-}
-
-.thinking-event-thinking {
-  background: rgba(138, 43, 226, 0.1);
-  border-color: #8a2be2;
-  color: #c79cff;
-}
-
-.thinking-event-tool_call {
-  background: rgba(255, 165, 0, 0.1);
-  border-color: #ffa500;
-  color: #ffb84d;
-}
-
-.thinking-event-tool_result {
-  background: rgba(0, 191, 255, 0.1);
-  border-color: #00bfff;
-  color: #7dd3fc;
-}
-
-.thinking-event-done {
-  background: rgba(168, 85, 247, 0.1);
-  border-color: #a855f7;
-  color: #e9d5ff;
-  font-weight: bold;
-}
-
-.thinking-event-error {
-  background: rgba(255, 51, 51, 0.1);
-  border-color: #ff3333;
-  color: #fca5a5;
-}
-
-.thinking-event-icon {
-  display: inline-block;
-  margin-right: 8px;
-}
-
-.thinking-event-details {
-  font-size: 0.75rem;
-  color: var(--text-fade);
-  margin-top: 4px;
-  padding-left: 20px;
-  white-space: pre-wrap;
-  max-height: 100px;
-  overflow-y: auto;
-}
-
-/* ========== MOBILE RESPONSIVE STYLES ========== */
-
-/* Hamburger Menu */
-.hamburger-menu {
-  display: none;
-  flex-direction: column;
-  gap: 4px;
-  cursor: pointer;
-  padding: 8px;
-  border: 1px solid var(--accent);
-  border-radius: 4px;
-  background: transparent;
-  z-index: 100;
-}
-
-.hamburger-menu span {
-  width: 20px;
-  height: 2px;
-  background: var(--accent);
-  transition: all 0.3s;
-  display: block;
-}
-
-.hamburger-menu.active span:nth-child(1) {
-  transform: rotate(45deg) translate(5px, 5px);
-}
-
-.hamburger-menu.active span:nth-child(2) {
-  opacity: 0;
-}
-
-.hamburger-menu.active span:nth-child(3) {
-  transform: rotate(-45deg) translate(5px, -5px);
-}
-
-/* Mobile Menu Container */
-.mobile-menu {
-  display: none;
-  position: fixed;
-  top: 0;
-  left: -100%;
-  width: 280px;
-  height: 100vh;
-  background: var(--bg-dark);
-  border-right: 2px solid var(--accent);
-  box-shadow: var(--accent-glow);
-  z-index: 999;
-  transition: left 0.3s ease;
-  overflow-y: auto;
-  padding: 20px;
-  flex-direction: column;
-  gap: 16px;
-}
-
-.mobile-menu.open {
-  left: 0;
-}
-
-.mobile-menu-overlay {
-  display: none;
-  position: fixed;
-  top: 0;
-  left: 0;
-  width: 100%;
-  height: 100%;
-  background: rgba(0, 0, 0, 0.7);
-  z-index: 998;
-}
-
-.mobile-menu-overlay.show {
-  display: block;
-}
-
-.mobile-menu-section {
-  display: flex;
-  flex-direction: column;
-  gap: 8px;
-  padding-bottom: 16px;
-  border-bottom: 1px solid rgba(255, 102, 0, 0.3);
-}
-
-.mobile-menu-section:last-child {
-  border-bottom: none;
-}
-
-.mobile-menu-section h4 {
-  margin: 0;
-  color: var(--accent);
-  font-size: 0.9rem;
-  text-transform: uppercase;
-  letter-spacing: 1px;
-}
-
-.mobile-menu button,
-.mobile-menu select {
-  width: 100%;
-  padding: 10px;
-  font-size: 0.95rem;
-  text-align: left;
-}
-
-/* Mobile Breakpoints */
-@media screen and (max-width: 768px) {
-  body {
-    padding: 0;
-  }
-
-  #chat {
-    width: 100%;
-    max-width: 100%;
-    height: 100vh;
-    border-radius: 0;
-    border-left: none;
-    border-right: none;
-  }
-
-  /* Show hamburger, hide desktop header controls */
-  .hamburger-menu {
-    display: flex;
-  }
-
-  #model-select {
-    padding: 12px;
-    justify-content: space-between;
-  }
-
-  /* Hide all controls except hamburger on mobile */
-  #model-select > *:not(.hamburger-menu) {
-    display: none;
-  }
-
-  #session-select {
-    display: none;
-  }
-
-  /* Show mobile menu */
-  .mobile-menu {
-    display: flex;
-  }
-
-  /* Messages - more width on mobile */
-  .msg {
-    max-width: 90%;
-    font-size: 0.95rem;
-  }
-
-  /* Status bar */
-  #status {
-    padding: 10px 12px;
-    font-size: 0.85rem;
-  }
-
-  /* Input area - bigger touch targets */
-  #input {
-    padding: 12px;
-  }
-
-  #userInput {
-    font-size: 16px; /* Prevents zoom on iOS */
-    padding: 12px;
-  }
-
-  #sendBtn {
-    padding: 12px 16px;
-    font-size: 1rem;
-  }
-
-  /* Modal - full width on mobile */
-  .modal-content {
-    width: 95%;
-    min-width: unset;
-    max-width: unset;
-    max-height: 90vh;
-    top: 50%;
-    left: 50%;
-    transform: translate(-50%, -50%);
-  }
-
-  .modal-header {
-    padding: 12px 16px;
-  }
-
-  .modal-body {
-    padding: 16px;
-  }
-
-  .modal-footer {
-    padding: 12px 16px;
-    flex-wrap: wrap;
-  }
-
-  .modal-footer button {
-    flex: 1;
-    min-width: 120px;
-  }
-
-  /* Radio labels - stack better on mobile */
-  .radio-label {
-    padding: 10px;
-  }
-
-  .radio-label small {
-    margin-left: 20px;
-    font-size: 0.75rem;
-  }
-
-  /* Session list */
-  .session-item {
-    padding: 10px;
-  }
-
-  .session-info strong {
-    font-size: 0.9rem;
-  }
-
-  .session-info small {
-    font-size: 0.7rem;
-  }
-
-  /* Settings button in header */
-  #settingsBtn {
-    padding: 8px 12px;
-  }
-
-  /* Thinking panel adjustments for mobile */
-  .thinking-panel {
-    max-height: 250px;
-  }
-
-  .thinking-panel.collapsed {
-    max-height: 38px;
-  }
-
-  .thinking-header {
-    padding: 8px 10px;
-    font-size: 0.85rem;
-  }
-
-  .thinking-event {
-    font-size: 0.8rem;
-    padding: 6px 10px;
-  }
-
-  .thinking-event-details {
-    font-size: 0.7rem;
-    max-height: 80px;
-  }
-}
-
-/* Extra small devices (phones in portrait) */
-@media screen and (max-width: 480px) {
-  .mobile-menu {
-    width: 240px;
-  }
-
-  .msg {
-    max-width: 95%;
-    font-size: 0.9rem;
-    padding: 8px 12px;
-  }
-
-  #userInput {
-    font-size: 16px;
-    padding: 10px;
-  }
-
-  #sendBtn {
-    padding: 10px 14px;
-    font-size: 0.95rem;
-  }
-
-  .modal-header h3 {
-    font-size: 1.1rem;
-  }
-
-  .settings-section h4 {
-    font-size: 0.95rem;
-  }
-
-  .radio-label span {
-    font-size: 0.9rem;
-  }
-}
-
-/* Tablet landscape and desktop */
-@media screen and (min-width: 769px) {
-  /* Ensure mobile menu is hidden on desktop */
-  .mobile-menu,
-  .mobile-menu-overlay {
-    display: none !important;
-  }
-
-  .hamburger-menu {
-    display: none !important;
-  }
-}
-
-/* ---- Live Log lines ---- */
-.log-line {
-  display: flex;
-  flex-wrap: wrap;
-  align-items: baseline;
-  gap: 8px;
-  padding: 4px 8px;
-  border-radius: 4px;
-  font-size: 0.8rem;
-  font-family: 'Courier New', monospace;
-  border-left: 3px solid var(--text-fade);
-  animation: thinkingSlideIn 0.25s ease-out;
-  word-break: break-word;
-}
-.log-time { color: var(--text-fade); flex-shrink: 0; }
-.log-level {
-  flex-shrink: 0;
-  text-transform: uppercase;
-  font-size: 0.7rem;
-  font-weight: bold;
-  letter-spacing: 0.05em;
-}
-.log-msg { color: var(--text); }
-.log-fields { color: var(--text-fade); width: 100%; padding-left: 4px; }
-
-.log-info    { border-left-color: #00bfff; }
-.log-info .log-level { color: #7dd3fc; }
-.log-debug   { border-left-color: #8a2be2; }
-.log-debug .log-level { color: #c79cff; }
-.log-error   { border-left-color: #ff3333; background: rgba(255,51,51,0.08); }
-.log-error .log-level, .log-error .log-msg { color: #fca5a5; }
-.log-system  { border-left-color: #00ff66; }
-.log-system .log-level { color: #00ff66; }
-
-.log-detail { width: 100%; margin-top: 4px; }
-.log-detail summary {
-  cursor: pointer;
-  color: var(--accent);
-  font-size: 0.72rem;
-  user-select: none;
-}
-.log-detail pre {
-  margin: 6px 0 0;
-  padding: 8px;
-  max-height: 340px;
-  overflow: auto;
-  background: rgba(0,0,0,0.25);
-  border-left: 2px solid var(--accent);
-  border-radius: 4px;
-  font-size: 0.72rem;
-  line-height: 1.4;
-  white-space: pre-wrap;
-  word-break: break-word;
-  color: var(--text);
-}
-
-/* Rendered markdown in Lyra's replies — readable proportional type + structure. */
-.msg.assistant {
-  font-family: -apple-system, BlinkMacSystemFont, "Segoe UI", Roboto, sans-serif;
-  line-height: 1.55;
-  max-width: 88%;
-}
-.msg.assistant p { margin: 0 0 10px; }
-.msg.assistant p:last-child { margin-bottom: 0; }
-.msg.assistant h1, .msg.assistant h2, .msg.assistant h3, .msg.assistant h4 {
-  margin: 14px 0 6px; line-height: 1.3; color: var(--accent);
-}
-.msg.assistant h1 { font-size: 1.18rem; }
-.msg.assistant h2 { font-size: 1.1rem; }
-.msg.assistant h3 { font-size: 1.02rem; }
-.msg.assistant h4 { font-size: 0.96rem; }
-.msg.assistant ul, .msg.assistant ol { margin: 6px 0 10px; padding-left: 22px; }
-.msg.assistant li { margin: 3px 0; }
-.msg.assistant li > ul, .msg.assistant li > ol { margin: 3px 0; }
-.msg.assistant strong { font-weight: 600; color: var(--text); }
-.msg.assistant em { font-style: italic; }
-.msg.assistant a { color: var(--accent); text-decoration: underline; }
-.msg.assistant code {
-  font-family: "IBM Plex Mono", monospace; font-size: 0.88em;
-  background: rgba(255,255,255,0.08); padding: 1px 5px; border-radius: 4px;
-}
-.msg.assistant pre {
-  background: rgba(0,0,0,0.32); border: 1px solid rgba(255,102,0,0.3);
-  border-radius: 6px; padding: 10px 12px; margin: 8px 0; overflow-x: auto;
-}
-.msg.assistant pre code { background: none; padding: 0; font-size: 0.85em; }
+:root {
+  --bg-dark: #070707;
+  --bg-panel: rgba(255, 122, 0, 0.1);
+  --accent: #ff7a00;
+  --accent-glow: 0 0 6px rgba(255,122,0,0.28);
+  --text-main: #e8e8e8;
+  --text-fade: #999;
+  --font-console: "IBM Plex Mono", monospace;
+}
+
+/* Light mode variables */
+body {
+  --bg-dark: #f5f5f5;
+  --bg-panel: rgba(255, 122, 0, 0.05);
+  --accent: #ff7a00;
+  --accent-glow: 0 0 6px rgba(255,122,0,0.28);
+  --text-main: #1a1a1a;
+  --text-fade: #666;
+}
+
+/* Dark mode variables */
+body.dark {
+  --bg-dark: #070707;
+  --bg-panel: rgba(255, 122, 0, 0.1);
+  --accent: #ff7a00;
+  --accent-glow: 0 0 6px rgba(255,122,0,0.28);
+  --text-main: #e8e8e8;
+  --text-fade: #999;
+}
+
+body {
+  margin: 0;
+  background: var(--bg-dark);
+  color: var(--text-main);
+  font-family: var(--font-console);
+  height: 100vh;
+  display: flex;
+  justify-content: center;
+  align-items: center;
+}
+
+#chat {
+  width: 95%;
+  max-width: 900px;
+  height: 95vh;
+  display: flex;
+  flex-direction: column;
+  border: 1px solid var(--accent);
+  border-radius: 10px;
+  box-shadow: var(--accent-glow);
+  background: var(--bg-dark);
+  overflow: hidden;
+}
+
+/* Header sections */
+#model-select, #session-select, #status {
+  display: flex;
+  align-items: center;
+  gap: 8px;
+  padding: 8px 12px;
+  border-bottom: 1px solid var(--accent);
+  background-color: rgba(255, 122, 0, 0.05);
+}
+#status {
+  justify-content: flex-start;
+  border-top: 1px solid var(--accent);
+}
+
+label, select, button {
+  font-family: var(--font-console);
+  font-size: 0.9rem;
+  color: var(--text-main);
+  background: transparent;
+  border: 1px solid var(--accent);
+  border-radius: 4px;
+  padding: 4px 8px;
+}
+
+button:hover, select:hover {
+  box-shadow: 0 0 8px var(--accent);
+  cursor: pointer;
+}
+
+#thinkingStreamBtn {
+  background: rgba(255, 179, 71, 0.2);
+  border-color: #ffb347;
+}
+
+#thinkingStreamBtn:hover {
+  box-shadow: 0 0 8px #ffb347;
+  background: rgba(255, 179, 71, 0.3);
+}
+
+/* Chat area */
+#messages {
+  flex: 1;
+  padding: 16px;
+  overflow-y: auto;
+  display: flex;
+  flex-direction: column;
+  gap: 8px;
+  scroll-behavior: smooth;
+}
+
+/* Messages */
+.msg {
+  max-width: 80%;
+  padding: 10px 14px;
+  border-radius: 8px;
+  line-height: 1.4;
+  word-wrap: break-word;
+  box-shadow: 0 0 8px rgba(255,122,0,0.2);
+}
+.msg.user {
+  align-self: flex-end;
+  background: rgba(255,122,0,0.15);
+  border: 1px solid var(--accent);
+}
+.msg.assistant {
+  align-self: flex-start;
+  background: rgba(255,122,0,0.08);
+  border: 1px solid rgba(255,122,0,0.5);
+}
+.msg.system {
+  align-self: center;
+  font-size: 0.8rem;
+  color: var(--text-fade);
+}
+
+/* Input bar */
+#input {
+  display: flex;
+  border-top: 1px solid var(--accent);
+  background: rgba(255, 122, 0, 0.05);
+  padding: 10px;
+}
+#userInput {
+  flex: 1;
+  background: transparent;
+  color: var(--text-main);
+  border: 1px solid var(--accent);
+  border-radius: 4px;
+  padding: 8px;
+}
+#sendBtn {
+  margin-left: 8px;
+}
+
+/* Relay status dot */
+#status {
+  display: flex;
+  align-items: center;
+  margin: 10px 0;
+  gap: 8px;
+  font-family: monospace;
+  color: #f5f5f5;
+}
+
+#status-dot {
+  width: 10px;
+  height: 10px;
+  border-radius: 50%;
+  display: inline-block;
+}
+
+@keyframes pulseGreen {
+  0% { box-shadow: 0 0 5px #8fd694; opacity: 0.9; }
+  50% { box-shadow: 0 0 10px #8fd694; opacity: 1; }
+  100% { box-shadow: 0 0 5px #8fd694; opacity: 0.9; }
+}
+
+.dot.ok {
+  background: #8fd694;
+  animation: pulseGreen 2s infinite ease-in-out;
+}
+
+/* Offline state stays solid red */
+.dot.fail {
+  background: #ff3333;
+  box-shadow: 0 0 10px #ff3333;
+}
+
+
+/* Dropdown (session selector) styling */
+select {
+  background-color: var(--bg-dark);
+  color: var(--text-main);
+  border: 1px solid #b84a12;
+  border-radius: 6px;
+  padding: 4px 6px;
+  font-size: 14px;
+}
+
+select option {
+  background-color: var(--bg-dark);
+  color: var(--text-main);
+}
+
+/* Hover/focus for better visibility */
+select:focus,
+select:hover {
+  outline: none;
+  border-color: #ff8a00;
+  background-color: var(--bg-panel);
+}
+
+/* Settings Modal */
+.modal {
+  display: none !important;
+  position: fixed;
+  top: 0;
+  left: 0;
+  width: 100%;
+  height: 100%;
+  z-index: 1000;
+}
+
+.modal.show {
+  display: block !important;
+}
+
+.modal-overlay {
+  position: fixed;
+  top: 0;
+  left: 0;
+  width: 100%;
+  height: 100%;
+  background: rgba(0, 0, 0, 0.8);
+  backdrop-filter: blur(4px);
+  z-index: 999;
+}
+
+.modal-content {
+  position: fixed;
+  top: 50%;
+  left: 50%;
+  transform: translate(-50%, -50%);
+  background: linear-gradient(180deg, rgba(255,122,0,0.1) 0%, rgba(10,10,10,0.95) 100%);
+  border: 2px solid var(--accent);
+  border-radius: 12px;
+  box-shadow: var(--accent-glow);
+  min-width: 400px;
+  max-width: 600px;
+  max-height: 80vh;
+  overflow-y: auto;
+  z-index: 1001;
+}
+
+.modal-header {
+  display: flex;
+  justify-content: space-between;
+  align-items: center;
+  padding: 16px 20px;
+  border-bottom: 1px solid var(--accent);
+  background: rgba(255,122,0,0.1);
+}
+
+.modal-header h3 {
+  margin: 0;
+  font-size: 1.2rem;
+  color: var(--accent);
+}
+
+.close-btn {
+  background: transparent;
+  border: none;
+  color: var(--accent);
+  font-size: 1.5rem;
+  cursor: pointer;
+  padding: 0;
+  width: 30px;
+  height: 30px;
+  display: flex;
+  align-items: center;
+  justify-content: center;
+  border-radius: 4px;
+}
+
+.close-btn:hover {
+  background: rgba(255,122,0,0.2);
+  box-shadow: 0 0 8px var(--accent);
+}
+
+.modal-body {
+  padding: 20px;
+}
+
+.settings-section h4 {
+  margin: 0 0 8px 0;
+  color: var(--accent);
+  font-size: 1rem;
+}
+
+.settings-desc {
+  margin: 0 0 16px 0;
+  color: var(--text-fade);
+  font-size: 0.85rem;
+}
+
+.radio-group {
+  display: flex;
+  flex-direction: column;
+  gap: 12px;
+}
+
+.radio-label {
+  display: flex;
+  flex-direction: column;
+  padding: 12px;
+  border: 1px solid rgba(255,122,0,0.3);
+  border-radius: 6px;
+  background: rgba(255,122,0,0.05);
+  cursor: pointer;
+  transition: all 0.2s;
+}
+
+.radio-label:hover {
+  border-color: var(--accent);
+  background: rgba(255,122,0,0.1);
+  box-shadow: 0 0 8px rgba(255,122,0,0.3);
+}
+
+.radio-label input[type="radio"] {
+  margin-right: 8px;
+  accent-color: var(--accent);
+}
+
+.radio-label span {
+  font-weight: 500;
+  margin-bottom: 4px;
+}
+
+.radio-label small {
+  color: var(--text-fade);
+  font-size: 0.8rem;
+  margin-left: 24px;
+}
+
+.radio-label input[type="text"] {
+  margin-top: 8px;
+  margin-left: 24px;
+  padding: 6px;
+  background: rgba(0,0,0,0.3);
+  border: 1px solid rgba(255,122,0,0.5);
+  border-radius: 4px;
+  color: var(--text-main);
+  font-family: var(--font-console);
+}
+
+.radio-label input[type="text"]:focus {
+  outline: none;
+  border-color: var(--accent);
+  box-shadow: 0 0 8px rgba(255,122,0,0.3);
+}
+
+.modal-footer {
+  display: flex;
+  justify-content: flex-end;
+  gap: 10px;
+  padding: 16px 20px;
+  border-top: 1px solid var(--accent);
+  background: rgba(255,122,0,0.05);
+}
+
+.primary-btn {
+  background: var(--accent);
+  color: #000;
+  font-weight: bold;
+}
+
+.primary-btn:hover {
+  background: #ff8a00;
+  box-shadow: var(--accent-glow);
+}
+
+/* Session List */
+.session-list {
+  display: flex;
+  flex-direction: column;
+  gap: 8px;
+  max-height: 300px;
+  overflow-y: auto;
+}
+
+.session-item {
+  display: flex;
+  justify-content: space-between;
+  align-items: center;
+  padding: 12px;
+  border: 1px solid rgba(255,122,0,0.3);
+  border-radius: 6px;
+  background: rgba(255,122,0,0.05);
+  transition: all 0.2s;
+}
+
+.session-item:hover {
+  border-color: var(--accent);
+  background: rgba(255,122,0,0.1);
+}
+
+.session-info {
+  display: flex;
+  flex-direction: column;
+  gap: 4px;
+  flex: 1;
+}
+
+.session-info strong {
+  color: var(--text-main);
+  font-size: 0.95rem;
+}
+
+.session-info small {
+  color: var(--text-fade);
+  font-size: 0.75rem;
+}
+
+.session-delete-btn {
+  background: transparent;
+  border: 1px solid rgba(255,122,0,0.5);
+  color: var(--accent);
+  padding: 6px 10px;
+  border-radius: 4px;
+  cursor: pointer;
+  font-size: 1rem;
+  transition: all 0.2s;
+}
+
+.session-delete-btn:hover {
+  background: rgba(255,0,0,0.2);
+  border-color: #ff3333;
+  color: #ff3333;
+  box-shadow: 0 0 8px rgba(255,0,0,0.3);
+}
+
+/* Thinking Stream Panel */
+.thinking-panel {
+  border-top: 1px solid var(--accent);
+  background: rgba(255, 122, 0, 0.02);
+  display: flex;
+  flex-direction: column;
+  transition: max-height 0.3s ease;
+  max-height: 300px;
+}
+
+.thinking-panel.collapsed {
+  max-height: 40px;
+}
+
+.thinking-header {
+  display: flex;
+  justify-content: space-between;
+  align-items: center;
+  padding: 10px 12px;
+  background: rgba(255, 122, 0, 0.08);
+  cursor: pointer;
+  user-select: none;
+  border-bottom: 1px solid rgba(255, 122, 0, 0.2);
+  font-size: 0.9rem;
+  font-weight: 500;
+}
+
+.thinking-header:hover {
+  background: rgba(255, 122, 0, 0.12);
+}
+
+.thinking-controls {
+  display: flex;
+  align-items: center;
+  gap: 8px;
+}
+
+.thinking-status-dot {
+  width: 8px;
+  height: 8px;
+  border-radius: 50%;
+  background: #666;
+  display: inline-block;
+}
+
+.thinking-status-dot.connected {
+  background: #8fd694;
+  box-shadow: 0 0 8px #8fd694;
+}
+
+.thinking-status-dot.disconnected {
+  background: #ff3333;
+}
+
+.thinking-clear-btn,
+.thinking-toggle-btn {
+  background: transparent;
+  border: 1px solid rgba(255, 122, 0, 0.5);
+  color: var(--text-main);
+  padding: 4px 8px;
+  border-radius: 4px;
+  cursor: pointer;
+  font-size: 0.85rem;
+}
+
+.thinking-clear-btn:hover,
+.thinking-toggle-btn:hover {
+  background: rgba(255, 122, 0, 0.2);
+  box-shadow: 0 0 6px rgba(255, 122, 0, 0.3);
+}
+
+.thinking-toggle-btn {
+  transition: transform 0.3s ease;
+}
+
+.thinking-panel.collapsed .thinking-toggle-btn {
+  transform: rotate(-90deg);
+}
+
+.thinking-content {
+  flex: 1;
+  overflow-y: auto;
+  padding: 12px;
+  display: flex;
+  flex-direction: column;
+  gap: 8px;
+  min-height: 0;
+}
+
+.thinking-panel.collapsed .thinking-content {
+  display: none;
+}
+
+.thinking-empty {
+  text-align: center;
+  padding: 40px 20px;
+  color: var(--text-fade);
+  font-size: 0.85rem;
+}
+
+.thinking-empty-icon {
+  font-size: 2rem;
+  margin-bottom: 10px;
+}
+
+.thinking-event {
+  padding: 8px 12px;
+  border-radius: 6px;
+  font-size: 0.85rem;
+  font-family: 'Courier New', monospace;
+  animation: thinkingSlideIn 0.3s ease-out;
+  border-left: 3px solid;
+  word-wrap: break-word;
+}
+
+@keyframes thinkingSlideIn {
+  from {
+    opacity: 0;
+    transform: translateY(-10px);
+  }
+  to {
+    opacity: 1;
+    transform: translateY(0);
+  }
+}
+
+.thinking-event-connected {
+  background: rgba(0, 255, 122, 0.1);
+  border-color: #8fd694;
+  color: #8fd694;
+}
+
+.thinking-event-thinking {
+  background: rgba(255, 179, 71, 0.1);
+  border-color: #ffb347;
+  color: #c79cff;
+}
+
+.thinking-event-tool_call {
+  background: rgba(255, 165, 0, 0.1);
+  border-color: #ffa500;
+  color: #ffb84d;
+}
+
+.thinking-event-tool_result {
+  background: rgba(0, 191, 255, 0.1);
+  border-color: #00bfff;
+  color: #7dd3fc;
+}
+
+.thinking-event-done {
+  background: rgba(168, 85, 247, 0.1);
+  border-color: #a855f7;
+  color: #e9d5ff;
+  font-weight: bold;
+}
+
+.thinking-event-error {
+  background: rgba(255, 51, 51, 0.1);
+  border-color: #ff3333;
+  color: #fca5a5;
+}
+
+.thinking-event-icon {
+  display: inline-block;
+  margin-right: 8px;
+}
+
+.thinking-event-details {
+  font-size: 0.75rem;
+  color: var(--text-fade);
+  margin-top: 4px;
+  padding-left: 20px;
+  white-space: pre-wrap;
+  max-height: 100px;
+  overflow-y: auto;
+}
+
+/* ========== MOBILE RESPONSIVE STYLES ========== */
+
+/* Hamburger Menu */
+.hamburger-menu {
+  display: none;
+  flex-direction: column;
+  gap: 4px;
+  cursor: pointer;
+  padding: 8px;
+  border: 1px solid var(--accent);
+  border-radius: 4px;
+  background: transparent;
+  z-index: 100;
+}
+
+.hamburger-menu span {
+  width: 20px;
+  height: 2px;
+  background: var(--accent);
+  transition: all 0.3s;
+  display: block;
+}
+
+.hamburger-menu.active span:nth-child(1) {
+  transform: rotate(45deg) translate(5px, 5px);
+}
+
+.hamburger-menu.active span:nth-child(2) {
+  opacity: 0;
+}
+
+.hamburger-menu.active span:nth-child(3) {
+  transform: rotate(-45deg) translate(5px, -5px);
+}
+
+/* Mobile Menu Container */
+.mobile-menu {
+  display: none;
+  position: fixed;
+  top: 0;
+  left: -100%;
+  width: 280px;
+  height: 100vh;
+  background: var(--bg-dark);
+  border-right: 2px solid var(--accent);
+  box-shadow: var(--accent-glow);
+  z-index: 999;
+  transition: left 0.3s ease;
+  overflow-y: auto;
+  padding: 20px;
+  flex-direction: column;
+  gap: 16px;
+}
+
+.mobile-menu.open {
+  left: 0;
+}
+
+.mobile-menu-overlay {
+  display: none;
+  position: fixed;
+  top: 0;
+  left: 0;
+  width: 100%;
+  height: 100%;
+  background: rgba(0, 0, 0, 0.7);
+  z-index: 998;
+}
+
+.mobile-menu-overlay.show {
+  display: block;
+}
+
+.mobile-menu-section {
+  display: flex;
+  flex-direction: column;
+  gap: 8px;
+  padding-bottom: 16px;
+  border-bottom: 1px solid rgba(255, 122, 0, 0.3);
+}
+
+.mobile-menu-section:last-child {
+  border-bottom: none;
+}
+
+.mobile-menu-section h4 {
+  margin: 0;
+  color: var(--accent);
+  font-size: 0.9rem;
+  text-transform: uppercase;
+  letter-spacing: 1px;
+}
+
+.mobile-menu button,
+.mobile-menu select {
+  width: 100%;
+  padding: 10px;
+  font-size: 0.95rem;
+  text-align: left;
+}
+
+/* Mobile Breakpoints */
+@media screen and (max-width: 768px) {
+  body {
+    padding: 0;
+  }
+
+  #chat {
+    width: 100%;
+    max-width: 100%;
+    height: 100vh;
+    border-radius: 0;
+    border-left: none;
+    border-right: none;
+  }
+
+  /* Show hamburger, hide desktop header controls */
+  .hamburger-menu {
+    display: flex;
+  }
+
+  #model-select {
+    padding: 12px;
+    justify-content: space-between;
+  }
+
+  /* Hide all controls except hamburger on mobile */
+  #model-select > *:not(.hamburger-menu) {
+    display: none;
+  }
+
+  #session-select {
+    display: none;
+  }
+
+  /* Show mobile menu */
+  .mobile-menu {
+    display: flex;
+  }
+
+  /* Messages - more width on mobile */
+  .msg {
+    max-width: 90%;
+    font-size: 0.95rem;
+  }
+
+  /* Status bar */
+  #status {
+    padding: 10px 12px;
+    font-size: 0.85rem;
+  }
+
+  /* Input area - bigger touch targets */
+  #input {
+    padding: 12px;
+  }
+
+  #userInput {
+    font-size: 16px; /* Prevents zoom on iOS */
+    padding: 12px;
+  }
+
+  #sendBtn {
+    padding: 12px 16px;
+    font-size: 1rem;
+  }
+
+  /* Modal - full width on mobile */
+  .modal-content {
+    width: 95%;
+    min-width: unset;
+    max-width: unset;
+    max-height: 90vh;
+    top: 50%;
+    left: 50%;
+    transform: translate(-50%, -50%);
+  }
+
+  .modal-header {
+    padding: 12px 16px;
+  }
+
+  .modal-body {
+    padding: 16px;
+  }
+
+  .modal-footer {
+    padding: 12px 16px;
+    flex-wrap: wrap;
+  }
+
+  .modal-footer button {
+    flex: 1;
+    min-width: 120px;
+  }
+
+  /* Radio labels - stack better on mobile */
+  .radio-label {
+    padding: 10px;
+  }
+
+  .radio-label small {
+    margin-left: 20px;
+    font-size: 0.75rem;
+  }
+
+  /* Session list */
+  .session-item {
+    padding: 10px;
+  }
+
+  .session-info strong {
+    font-size: 0.9rem;
+  }
+
+  .session-info small {
+    font-size: 0.7rem;
+  }
+
+  /* Settings button in header */
+  #settingsBtn {
+    padding: 8px 12px;
+  }
+
+  /* Thinking panel adjustments for mobile */
+  .thinking-panel {
+    max-height: 250px;
+  }
+
+  .thinking-panel.collapsed {
+    max-height: 38px;
+  }
+
+  .thinking-header {
+    padding: 8px 10px;
+    font-size: 0.85rem;
+  }
+
+  .thinking-event {
+    font-size: 0.8rem;
+    padding: 6px 10px;
+  }
+
+  .thinking-event-details {
+    font-size: 0.7rem;
+    max-height: 80px;
+  }
+}
+
+/* Extra small devices (phones in portrait) */
+@media screen and (max-width: 480px) {
+  .mobile-menu {
+    width: 240px;
+  }
+
+  .msg {
+    max-width: 95%;
+    font-size: 0.9rem;
+    padding: 8px 12px;
+  }
+
+  #userInput {
+    font-size: 16px;
+    padding: 10px;
+  }
+
+  #sendBtn {
+    padding: 10px 14px;
+    font-size: 0.95rem;
+  }
+
+  .modal-header h3 {
+    font-size: 1.1rem;
+  }
+
+  .settings-section h4 {
+    font-size: 0.95rem;
+  }
+
+  .radio-label span {
+    font-size: 0.9rem;
+  }
+}
+
+/* Tablet landscape and desktop */
+@media screen and (min-width: 769px) {
+  /* Ensure mobile menu is hidden on desktop */
+  .mobile-menu,
+  .mobile-menu-overlay {
+    display: none !important;
+  }
+
+  .hamburger-menu {
+    display: none !important;
+  }
+}
+
+/* ---- Live Log lines ---- */
+.log-line {
+  display: flex;
+  flex-wrap: wrap;
+  align-items: baseline;
+  gap: 8px;
+  padding: 4px 8px;
+  border-radius: 4px;
+  font-size: 0.8rem;
+  font-family: 'Courier New', monospace;
+  border-left: 3px solid var(--text-fade);
+  animation: thinkingSlideIn 0.25s ease-out;
+  word-break: break-word;
+}
+.log-time { color: var(--text-fade); flex-shrink: 0; }
+.log-level {
+  flex-shrink: 0;
+  text-transform: uppercase;
+  font-size: 0.7rem;
+  font-weight: bold;
+  letter-spacing: 0.05em;
+}
+.log-msg { color: var(--text); }
+.log-fields { color: var(--text-fade); width: 100%; padding-left: 4px; }
+
+.log-info    { border-left-color: #00bfff; }
+.log-info .log-level { color: #7dd3fc; }
+.log-debug   { border-left-color: #ffb347; }
+.log-debug .log-level { color: #c79cff; }
+.log-error   { border-left-color: #ff3333; background: rgba(255,51,51,0.08); }
+.log-error .log-level, .log-error .log-msg { color: #fca5a5; }
+.log-system  { border-left-color: #8fd694; }
+.log-system .log-level { color: #8fd694; }
+
+.log-detail { width: 100%; margin-top: 4px; }
+.log-detail summary {
+  cursor: pointer;
+  color: var(--accent);
+  font-size: 0.72rem;
+  user-select: none;
+}
+.log-detail pre {
+  margin: 6px 0 0;
+  padding: 8px;
+  max-height: 340px;
+  overflow: auto;
+  background: rgba(0,0,0,0.25);
+  border-left: 2px solid var(--accent);
+  border-radius: 4px;
+  font-size: 0.72rem;
+  line-height: 1.4;
+  white-space: pre-wrap;
+  word-break: break-word;
+  color: var(--text);
+}
+
+/* Rendered markdown in Lyra's replies — readable proportional type + structure. */
+.msg.assistant {
+  font-family: -apple-system, BlinkMacSystemFont, "Segoe UI", Roboto, sans-serif;
+  line-height: 1.55;
+  max-width: 88%;
+}
+.msg.assistant p { margin: 0 0 10px; }
+.msg.assistant p:last-child { margin-bottom: 0; }
+.msg.assistant h1, .msg.assistant h2, .msg.assistant h3, .msg.assistant h4 {
+  margin: 14px 0 6px; line-height: 1.3; color: var(--accent);
+}
+.msg.assistant h1 { font-size: 1.18rem; }
+.msg.assistant h2 { font-size: 1.1rem; }
+.msg.assistant h3 { font-size: 1.02rem; }
+.msg.assistant h4 { font-size: 0.96rem; }
+.msg.assistant ul, .msg.assistant ol { margin: 6px 0 10px; padding-left: 22px; }
+.msg.assistant li { margin: 3px 0; }
+.msg.assistant li > ul, .msg.assistant li > ol { margin: 3px 0; }
+.msg.assistant strong { font-weight: 600; color: var(--text); }
+.msg.assistant em { font-style: italic; }
+.msg.assistant a { color: var(--accent); text-decoration: underline; }
+.msg.assistant code {
+  font-family: "IBM Plex Mono", monospace; font-size: 0.88em;
+  background: rgba(255,255,255,0.08); padding: 1px 5px; border-radius: 4px;
+}
+.msg.assistant pre {
+  background: rgba(0,0,0,0.32); border: 1px solid rgba(255,122,0,0.3);
+  border-radius: 6px; padding: 10px 12px; margin: 8px 0; overflow-x: auto;
+}
+.msg.assistant pre code { background: none; padding: 0; font-size: 0.85em; }
-- 
2.52.0


From 6a911423a260b2b28312ade4d953b63337f1f34b Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Thu, 18 Jun 2026 02:15:16 +0000
Subject: [PATCH 40/51] feat: parser resolves relative seat positions (N to my
 right/left) + only logs involved players

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 lyra/poker.py | 10 +++++++++-
 1 file changed, 9 insertions(+), 1 deletion(-)

diff --git a/lyra/poker.py b/lyra/poker.py
index 4d881ac..de151f7 100644
--- a/lyra/poker.py
+++ b/lyra/poker.py
@@ -244,7 +244,15 @@ use "x". Examples: "AA with the ace of spades" -> hero_cards ["As","Ax"]; "AK on
 board" -> board ["Ax","4x","x"]. Each card is independent: a suit named for one card does \
 NOT apply to another — e.g. your hole "ace of spades" is a different card from a board ace \
 whose suit is unstated (that board ace is "Ax", not "As"). Use null/omit for non-card \
-details not stated. Stay faithful to what's described — do not invent action that isn't implied."""
+details not stated. Stay faithful to what's described — do not invent action that isn't implied.
+
+POSITIONS: resolve relative seat references ("N seats to my right/left") into real positions. \
+Action moves clockwise, so a player to your RIGHT acts before you (toward the blinds/button) \
+and a player to your LEFT acts after you (toward UTG). Going RIGHT from a player you pass, in \
+order: SB, BTN, CO, HJ, LJ/MP, UTG+1, UTG. Example: hero in the BB, "a guy 2 seats to my right \
+raises" -> that raiser is on the BTN (1 right = SB, 2 right = BTN). If it's genuinely \
+ambiguous, give the most standard read. Only include players in "players" who are actually \
+mentioned or take action in the hand — do NOT fill in unmentioned empty seats."""
 
 
 def _safe_json(s: str) -> dict | None:
-- 
2.52.0


From c7d2279f8dcf0ed706d3cb9126c2ab827192b98b Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Thu, 18 Jun 2026 04:33:16 +0000
Subject: [PATCH 41/51] feat: auto-accumulating villain dossiers + player
 lookup (poker B)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Named players in recorded hands now auto-enrich a persistent dossier, and stats
emerge once the sample is big enough — laying groundwork for A.

- poker: player_observations table (per named player per hand: vpip/pfr/saw_flop/
  showed/cards/summary); record_hand auto-links named players via link_hand_players;
  player_profile(name) returns dossier + reads + shown hands, with inferred
  VPIP/PFR/WTSD gated behind MIN_STATS_SAMPLE (12) so thin samples don't lie;
  list_players()
- player_profile tool ("what do I know about X"); thin files return a blunt
  "don't generalize" directive
- persona: she MUST call player_profile before discussing an opponent and answer
  only from it — fixes observed confabulation (she invented a whole read from one
  hand / from memory). Verified: now reports only the real logged hand.
- tests: observation linking, profile, stat-emergence at sample threshold

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 lyra/personas/lyra.md |   6 +++
 lyra/poker.py         | 108 +++++++++++++++++++++++++++++++++++++++++-
 lyra/tools.py         |  38 +++++++++++++++
 tests/test_poker.py   |  34 +++++++++++++
 4 files changed, 185 insertions(+), 1 deletion(-)

diff --git a/lyra/personas/lyra.md b/lyra/personas/lyra.md
index 4d0f169..2e6d991 100644
--- a/lyra/personas/lyra.md
+++ b/lyra/personas/lyra.md
@@ -103,6 +103,12 @@ inventing a mechanism — same rule as not inventing numbers.
   qualitative read and flag that the exact number needs the calc. Approximate
   reasoning is fine if you label it as approximate.
 - You don't pretend to remember things you don't. If you're not sure, say so.
+- **You don't invent reads on players.** Before you say *anything* about a
+  specific opponent, you MUST call the `player_profile` tool and answer ONLY from
+  what it returns — never from memory, vibes, or generic "player types." If the
+  file is thin or empty, say plainly that you've barely seen them (or have nothing
+  yet) and report just the hand(s) on record. Never fabricate tendencies, stats,
+  or a playing style. A made-up read is worse than "I don't know him yet."
 - You don't moralize about gambling. Brian's a serious player. Meet him there.
 
 ## Right now
diff --git a/lyra/poker.py b/lyra/poker.py
index de151f7..7557d57 100644
--- a/lyra/poker.py
+++ b/lyra/poker.py
@@ -80,8 +80,29 @@ CREATE TABLE IF NOT EXISTS player_reads (
     note TEXT NOT NULL,
     created_at TEXT NOT NULL
 );
+
+-- One row per named player per recorded hand — structured enough to (a) build
+-- their qualitative dossier and (b) infer basic stats once the sample is big.
+CREATE TABLE IF NOT EXISTS player_observations (
+    id INTEGER PRIMARY KEY AUTOINCREMENT,
+    player_id INTEGER NOT NULL,
+    hand_id INTEGER,
+    session_id INTEGER,
+    pos TEXT,
+    cards TEXT,
+    vpip INTEGER,      -- voluntarily put money in preflop
+    pfr INTEGER,       -- raised/3bet preflop
+    saw_flop INTEGER,
+    showed INTEGER,    -- cards reached showdown / were shown
+    summary TEXT,
+    created_at TEXT NOT NULL
+);
+CREATE INDEX IF NOT EXISTS idx_pobs_player ON player_observations(player_id);
 """
 
+# Below this many observed hands, don't surface % stats (too small a sample).
+MIN_STATS_SAMPLE = 12
+
 _ensured_for = None
 
 
@@ -329,7 +350,8 @@ def record_hand(shorthand: str, session_id: int | None = None, stakes: str | Non
     if not parsed:
         return {"id": None, "parsed": None}
     hid = store_hand_history(parsed, session_id=session_id, tag=tag, lesson=lesson)
-    return {"id": hid, "parsed": parsed}
+    linked = link_hand_players(hid, parsed, session_id=session_id)  # enrich villain files
+    return {"id": hid, "parsed": parsed, "linked": linked}
 
 
 def get_hand(hand_id: int) -> dict | None:
@@ -493,6 +515,90 @@ def add_read(note: str, seat: str | None = None, name: str | None = None,
     return int(cur.lastrowid)
 
 
+def _player_flags(parsed: dict, pos: str | None) -> tuple[int, int, int]:
+    """(vpip, pfr, saw_flop) for the player at `pos` in a parsed hand."""
+    acts = parsed.get("actions") or []
+    pre = [a for a in acts if a.get("street") == "preflop" and a.get("pos") == pos]
+    post = [a for a in acts if a.get("pos") == pos and a.get("street") in ("flop", "turn", "river")]
+    vol = {"call", "bet", "raise", "allin"}
+    vpip = int(any(a.get("action") in vol for a in pre))
+    pfr = int(any(a.get("action") in {"raise", "allin"} for a in pre))
+    return vpip, pfr, int(bool(post))
+
+
+def link_hand_players(hand_id: int, parsed: dict, session_id: int | None = None) -> int:
+    """For each NAMED player in a parsed hand, upsert their file + log a structured
+    observation. Returns how many players were linked."""
+    sid = _resolve(session_id)
+    linked = 0
+    for pl in (parsed.get("players") or []):
+        name = (pl.get("name") or "").strip()
+        if not name:
+            continue
+        pid = upsert_player(name)
+        vpip, pfr, saw = _player_flags(parsed, pl.get("pos"))
+        cards = " ".join(pl.get("cards") or []) or None
+        acts = [a for a in (parsed.get("actions") or [])
+                if a.get("pos") == pl.get("pos") and a.get("action")]
+        astr = ", ".join(a["action"] + (f" {a['amount']}" if a.get("amount") is not None else "")
+                         for a in acts)
+        summary = (pl.get("pos") or "?") + (f" ({cards})" if cards else "") + (f": {astr}" if astr else "")
+        conn = _c()
+        with conn:
+            conn.execute(
+                "INSERT INTO player_observations (player_id, hand_id, session_id, pos, cards, "
+                "vpip, pfr, saw_flop, showed, summary, created_at) VALUES (?,?,?,?,?,?,?,?,?,?,?)",
+                (pid, hand_id, sid, pl.get("pos"), cards, vpip, pfr, saw, int(bool(cards)),
+                 summary, _now()),
+            )
+        linked += 1
+    return linked
+
+
+def player_profile(name: str) -> dict | None:
+    """Everything known about a player: dossier + observations, with inferred
+    stats once the sample is large enough."""
+    p = _c().execute(
+        "SELECT * FROM poker_players WHERE name LIKE ? COLLATE NOCASE ORDER BY updated_at DESC LIMIT 1",
+        (f"%{name}%",),
+    ).fetchone()
+    if not p:
+        return None
+    p = dict(p)
+    obs = [dict(r) for r in _c().execute(
+        "SELECT * FROM player_observations WHERE player_id = ? ORDER BY id DESC", (p["id"],)
+    ).fetchall()]
+    reads = [r["note"] for r in _c().execute(
+        "SELECT note FROM player_reads WHERE player_id = ? ORDER BY id DESC LIMIT 8", (p["id"],)
+    ).fetchall()]
+    n = len(obs)
+    prof: dict = {
+        "player": p, "observations": n,
+        "recent": [o["summary"] for o in obs[:8] if o["summary"]],
+        "showdowns": [o["cards"] for o in obs if o["cards"]][:10],
+        "reads": reads, "stats": None,
+    }
+    if n >= MIN_STATS_SAMPLE:
+        prof["stats"] = {
+            "hands": n,
+            "vpip_pct": round(100 * sum(o["vpip"] or 0 for o in obs) / n),
+            "pfr_pct": round(100 * sum(o["pfr"] or 0 for o in obs) / n),
+            "wtsd_pct": round(100 * sum(o["showed"] or 0 for o in obs) / n),
+        }
+    elif n:
+        prof["small_sample"] = f"only {n} hand(s) logged — too few for reliable stats"
+    return prof
+
+
+def list_players() -> list[dict]:
+    """The villain file with observation counts, for browsing."""
+    rows = _c().execute(
+        "SELECT p.*, (SELECT COUNT(*) FROM player_observations o WHERE o.player_id = p.id) AS obs "
+        "FROM poker_players p ORDER BY p.updated_at DESC"
+    ).fetchall()
+    return [dict(r) for r in rows]
+
+
 def get_villain_file(name: str | None = None, venue: str | None = None) -> list[dict]:
     """Pull villain dossiers, optionally filtered by name or venue."""
     sql = "SELECT * FROM poker_players"
diff --git a/lyra/tools.py b/lyra/tools.py
index f2b6b03..8b20ee8 100644
--- a/lyra/tools.py
+++ b/lyra/tools.py
@@ -173,6 +173,37 @@ def _generate_recap(args: dict, ctx: dict) -> str:
             f"at /recap/{out['id']}")
 
 
+def _player_profile(args: dict, ctx: dict) -> str:
+    prof = poker.player_profile(args.get("name") or "")
+    if not prof:
+        return f"No file on {args.get('name')} yet."
+    p = prof["player"]
+    L = [p["name"] + (f" ({p['venue']})" if p.get("venue") else "")
+         + (f" [{p['category']}]" if p.get("category") else "")]
+    thin = not (p.get("tendencies") or p.get("adjustment")) and not prof.get("stats")
+    if thin:
+        L.append("⚠ THIN FILE — no standing read on record. Report only the observed "
+                 "hand(s) below and tell Brian you've barely seen him. Do NOT generalize a style.")
+    if p.get("description"):
+        L.append(p["description"])
+    if p.get("tendencies"):
+        L.append(f"Tendencies: {p['tendencies']}")
+    if p.get("adjustment"):
+        L.append(f"Exploit: {p['adjustment']}")
+    s = prof.get("stats")
+    if s:
+        L.append(f"Stats ({s['hands']} hands): VPIP {s['vpip_pct']}% · PFR {s['pfr_pct']}% · WTSD {s['wtsd_pct']}%")
+    elif prof.get("small_sample"):
+        L.append(prof["small_sample"])
+    if prof.get("showdowns"):
+        L.append("Shown down: " + ", ".join(prof["showdowns"][:6]))
+    if prof.get("reads"):
+        L.append("Notes: " + " | ".join(prof["reads"][:4]))
+    if prof.get("recent"):
+        L.append("Recent hands: " + " | ".join(prof["recent"][:4]))
+    return "\n".join(L)
+
+
 def _villain_file(args: dict, ctx: dict) -> str:
     vs = poker.get_villain_file(name=args.get("name"), venue=args.get("venue"))
     if not vs:
@@ -271,6 +302,13 @@ TOOLS.update({
         "data + this conversation. Use when he asks for the recap/writeup, usually "
         "after ending a session.",
         {}, [])},
+    "player_profile": {"handler": _player_profile, "spec": _f(
+        "player_profile",
+        "Look up everything known about one opponent — dossier, reads, hands "
+        "they've shown down, and (once enough hands are logged) inferred stats "
+        "like VPIP/PFR. Use when Brian asks what's known about a player.",
+        {"name": {**_S, "description": "Player name to look up"}},
+        ["name"])},
     "get_villain_file": {"handler": _villain_file, "spec": _f(
         "get_villain_file",
         "Pull saved opponent dossiers (the villain file). Filter by name or venue, e.g. before sitting down.",
diff --git a/tests/test_poker.py b/tests/test_poker.py
index 914985c..95ef400 100644
--- a/tests/test_poker.py
+++ b/tests/test_poker.py
@@ -116,6 +116,40 @@ def test_list_recent_hands(lyra):
     assert hh and hh[0]["hole_cards"] == "QQ" and hh[0]["stakes"] == "1/3"
 
 
+def test_player_observation_and_profile(lyra):
+    poker = lyra
+    sid = poker.start_session(stakes="1/3", buy_in=300)
+    parsed = {"hero_pos": "BB",
+              "players": [{"pos": "BTN", "name": "Round Mike"}, {"pos": "BB", "name": None}],
+              "actions": [{"street": "preflop", "pos": "BTN", "action": "raise", "amount": 12},
+                          {"street": "preflop", "pos": "BB", "action": "call"},
+                          {"street": "flop", "board": ["7d", "2c", "5h"]},
+                          {"street": "flop", "pos": "BTN", "action": "bet", "amount": 15}]}
+    hid = poker.store_hand_history(parsed, session_id=sid)
+    assert poker.link_hand_players(hid, parsed, session_id=sid) == 1  # only the named player
+    prof = poker.player_profile("mike")
+    assert prof["player"]["name"] == "Round Mike"
+    assert prof["observations"] == 1
+    assert prof["stats"] is None and "small_sample" in prof  # too few hands for stats
+
+
+def test_player_stats_emerge_with_sample(lyra):
+    poker = lyra
+    sid = poker.start_session(stakes="1/3", buy_in=300)
+    raised = {"players": [{"pos": "BTN", "name": "LAG"}],
+              "actions": [{"street": "preflop", "pos": "BTN", "action": "raise", "amount": 10}]}
+    folded = {"players": [{"pos": "UTG", "name": "LAG"}],
+              "actions": [{"street": "preflop", "pos": "UTG", "action": "fold"}]}
+    for i in range(poker.MIN_STATS_SAMPLE):
+        p = raised if i % 2 == 0 else folded
+        hid = poker.store_hand_history(p, session_id=sid)
+        poker.link_hand_players(hid, p, session_id=sid)
+    prof = poker.player_profile("LAG")
+    assert prof["stats"] is not None
+    assert prof["stats"]["hands"] >= poker.MIN_STATS_SAMPLE
+    assert 30 <= prof["stats"]["vpip_pct"] <= 70  # ~half were voluntary
+
+
 def test_poker_tools_dispatch(lyra):
     from lyra import tools
     assert "started" in tools.dispatch("start_session", {"stakes": "1/3", "buy_in": 300})
-- 
2.52.0


From 6761c3f9780e65ae2ecb06f1a037c32e860e7b8f Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Thu, 18 Jun 2026 05:55:22 +0000
Subject: [PATCH 42/51] feat: backfill poker tracker from curated .md session
 logs

Seeds the tracker from Brian's real history (import/pokerlog_*.md): each session
block is LLM-extracted into structured meta + hands + villains and written as a
historical session (real date, money, net), with the original markdown stored as
that session's recap.

- lyra/backfill.py: split log -> per-session LLM extract -> seed; dry-run by
  default, --commit / --reset; only-real-handle villain filter
- poker.import_session() (historical closed session), clear_all() (reseed),
  prune_anonymous_players(), shared _real_handle() filter (also applied in
  link_hand_players so auto-linked hand players skip anonymous descriptors + hero),
  _normalize_parsed() to map unicode card suits -> letters
- result: 10 sessions, 36 hands, 17 real villain dossiers; running_stats now
  reflects real net (+1057 at 1/3 over 8 sessions)

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 lyra/backfill.py | 143 +++++++++++++++++++++++++++++++++++++++++++++++
 lyra/poker.py    |  88 ++++++++++++++++++++++++++++-
 2 files changed, 230 insertions(+), 1 deletion(-)
 create mode 100644 lyra/backfill.py

diff --git a/lyra/backfill.py b/lyra/backfill.py
new file mode 100644
index 0000000..8e269ea
--- /dev/null
+++ b/lyra/backfill.py
@@ -0,0 +1,143 @@
+"""Seed the poker tracker from Brian's curated .md session logs.
+
+Each `# YYYY-MM-DD — ...` block in the log is LLM-extracted into structured meta
++ hands + villains, then written as a historical session (real date, money, net),
+with the original markdown stored as that session's recap. Run dry first to eyeball
+the extraction, then commit.
+
+    uv run python -m lyra.backfill                 # dry-run ALL sessions (no writes)
+    uv run python -m lyra.backfill --dry 2         # dry-run first 2
+    uv run python -m lyra.backfill --commit        # seed all (writes to DB)
+    uv run python -m lyra.backfill --commit --reset  # wipe poker data first, then seed
+"""
+from __future__ import annotations
+
+import json
+import re
+import sys
+
+from lyra import llm, poker
+
+LOG_PATH = "import/pokerlog_asof6-16-26.md"
+
+_EXTRACT_PROMPT = """Extract a structured record from this single poker session log. \
+Output ONLY JSON, no prose, no code fences:
+{
+  "date": "YYYY-MM-DD",
+  "venue": "<casino>", "game": "NLH|PLO|Stud8|Mixed", "stakes": "<e.g. 1/3 or null>",
+  "format": "cash" | "tournament",
+  "buy_in_total": <number>, "cash_out": <number|null>, "net": <number|null>,
+  "hours": <number|null>, "mood": "<short mental-game note|null>",
+  "hands": [
+    // each KEY hand, in the canonical hand-history schema:
+    {"hero_pos": "..", "hero_cards": [".."], "players": [{"pos":"..","name":<str|null>,"cards":[..]|null}],
+     "actions": [{"street":"..","pos":"..","action":"..","amount":<num|null>}, {"street":"flop","board":[".."]}],
+     "board": [".."], "result": {"hero_net": <num|null>, "summary": ".."},
+     "tag": "well_played|leak|cooler|confidence|notable|null", "lesson": "<takeaway|null>"}
+  ],
+  "villains": [
+    {"name": "<handle/nickname>", "description": "<physical/identifying|null>",
+     "tendencies": "<how they play>", "adjustment": "<how to exploit>", "category": "feeder|risky|reg|unknown"}
+  ]
+}
+
+Card rule: cards are rank+suit using SUIT LETTERS ONLY (s h d c) — never unicode symbols \
+(no ♥♦♣♠). Use a card's real suit ONLY if the log explicitly states it for THAT card; \
+otherwise the suit is 'x' (e.g. "Jx","Tx","4x") — never a bare rank, never an invented suit. \
+A suit shown on the board does NOT apply to a hole card. Unknown whole card = "x".
+Tournaments: buy_in_total = entry + rebuys; cash_out = winnings (0 if busted, so a bust nets -buy_in).
+Only include villains with a real handle/nickname (skip anonymous descriptors like "the drunk guy", \
+"final-hand caller"). Only include hands actually described. net = cash_out - buy_in_total. Be faithful to the log."""
+
+
+def split_sessions(md: str) -> list[str]:
+    """Split the log into individual session blocks on '# YYYY-MM-DD' headers."""
+    parts = re.split(r"(?=^# \d{4}-\d{2}-\d{2})", md, flags=re.M)
+    return [p.strip() for p in parts if re.match(r"^# \d{4}-\d{2}-\d{2}", p.strip())]
+
+
+def _safe_json(s: str) -> dict | None:
+    try:
+        return json.loads(s)
+    except (json.JSONDecodeError, TypeError):
+        m = re.search(r"\{.*\}", s or "", re.S)
+        if m:
+            try:
+                return json.loads(m.group())
+            except json.JSONDecodeError:
+                return None
+    return None
+
+
+def extract(block: str, backend: str = "cloud") -> dict | None:
+    return _safe_json(llm.complete(
+        [{"role": "system", "content": _EXTRACT_PROMPT}, {"role": "user", "content": block}],
+        backend=backend,
+    ))
+
+
+_real_handle = poker._real_handle  # one canonical filter (lives in poker.py)
+
+
+def seed(ex: dict, block: str) -> dict:
+    """Write one extracted session + its hands + villains to the DB. Returns a summary."""
+    sid = poker.import_session(
+        date=ex.get("date") or "2026-01-01", venue=ex.get("venue"), game=ex.get("game") or "NLH",
+        stakes=ex.get("stakes"), fmt=ex.get("format") or "cash",
+        buy_in_total=ex.get("buy_in_total") or 0, cash_out=ex.get("cash_out"),
+        hours=ex.get("hours"), mood=ex.get("mood"), recap_md=block,
+    )
+    n_hands = 0
+    for h in ex.get("hands") or []:
+        hid = poker.store_hand_history(h, session_id=sid)
+        poker.link_hand_players(hid, h, session_id=sid)
+        n_hands += 1
+    n_villains = 0
+    for v in ex.get("villains") or []:
+        if _real_handle(v.get("name")):
+            poker.upsert_player(name=v["name"], venue=ex.get("venue"),
+                                description=v.get("description"), tendencies=v.get("tendencies"),
+                                adjustment=v.get("adjustment"), category=v.get("category"))
+            n_villains += 1
+    return {"session_id": sid, "date": ex.get("date"), "venue": ex.get("venue"),
+            "net": ex.get("net"), "hands": n_hands, "villains": n_villains}
+
+
+def main() -> int:
+    args = sys.argv[1:]
+    commit = "--commit" in args
+    reset = "--reset" in args
+    limit = None
+    for i, a in enumerate(args):
+        if a == "--dry" and i + 1 < len(args) and args[i + 1].isdigit():
+            limit = int(args[i + 1])
+
+    blocks = split_sessions(open(LOG_PATH, encoding="utf-8").read())
+    if limit:
+        blocks = blocks[:limit]
+    print(f"{len(blocks)} session block(s). mode={'COMMIT' if commit else 'DRY-RUN'}")
+
+    if commit and reset:
+        wiped = poker.clear_all()
+        print(f"reset: wiped {wiped}")
+
+    for b in blocks:
+        ex = extract(b)
+        if not ex:
+            print(f"  ! could not parse a block: {b[:60]!r}")
+            continue
+        if commit:
+            print("  seeded:", seed(ex, b))
+        else:
+            print(f"\n=== {ex.get('date')} — {ex.get('venue')} {ex.get('stakes')} "
+                  f"({ex.get('format')}) net {ex.get('net')} ===")
+            kept = [v.get("name") for v in (ex.get("villains") or []) if _real_handle(v.get("name"))]
+            print(f"  hands: {len(ex.get('hands') or [])} | villains kept: {kept}")
+            for h in (ex.get("hands") or [])[:3]:
+                print(f"    - {h.get('hero_pos')} {h.get('hero_cards')} "
+                      f"net {(h.get('result') or {}).get('hero_net')} [{h.get('tag')}]")
+    return 0
+
+
+if __name__ == "__main__":
+    raise SystemExit(main())
diff --git a/lyra/poker.py b/lyra/poker.py
index 7557d57..9eb0d81 100644
--- a/lyra/poker.py
+++ b/lyra/poker.py
@@ -149,6 +149,38 @@ def get_session(session_id: int) -> dict | None:
     return dict(r) if r else None
 
 
+def import_session(date: str, venue: str | None = None, game: str = "NLH",
+                   stakes: str | None = None, fmt: str = "cash",
+                   buy_in_total: float = 0.0, cash_out: float | None = None,
+                   hours: float | None = None, mood: str | None = None,
+                   recap_md: str | None = None) -> int:
+    """Insert a historical (already-closed) session with a real date. For backfill."""
+    started = f"{date}T20:00:00+00:00"  # logs are evening sessions; time is approximate
+    net = (cash_out or 0) - (buy_in_total or 0) if cash_out is not None else None
+    conn = _c()
+    with conn:
+        cur = conn.execute(
+            "INSERT INTO poker_sessions (started_at, ended_at, venue, game, stakes, format, "
+            "buy_in_total, cash_out, net, hours, mood, status, recap_md) "
+            "VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, 'closed', ?)",
+            (started, started, venue, game, stakes, fmt, buy_in_total or 0, cash_out,
+             net, hours, mood, recap_md),
+        )
+    return int(cur.lastrowid)
+
+
+def clear_all() -> dict:
+    """Wipe all poker data (sessions/hands/players/reads/observations). For a clean reseed."""
+    conn = _c()
+    counts = {}
+    with conn:
+        for t in ("poker_hands", "player_observations", "player_reads",
+                  "poker_players", "poker_sessions"):
+            counts[t] = conn.execute(f"SELECT COUNT(*) n FROM {t}").fetchone()["n"]
+            conn.execute(f"DELETE FROM {t}")
+    return counts
+
+
 def live_session() -> dict | None:
     """The current open session, if any."""
     r = _c().execute(
@@ -321,9 +353,38 @@ def _review_session_id() -> int:
     return int(cur.lastrowid)
 
 
+_SUIT_SYM = {"♥": "h", "♦": "d", "♣": "c", "♠": "s"}
+
+
+def _norm_card(c):
+    if not isinstance(c, str):
+        return c
+    s = c.strip()
+    for sym, ltr in _SUIT_SYM.items():
+        s = s.replace(sym, ltr)
+    return s
+
+
+def _normalize_parsed(p: dict) -> dict:
+    """Normalize card strings (unicode suits -> letters) across a parsed hand."""
+    if not isinstance(p, dict):
+        return p
+    for key in ("hero_cards", "board"):
+        if isinstance(p.get(key), list):
+            p[key] = [_norm_card(c) for c in p[key]]
+    for pl in p.get("players") or []:
+        if isinstance(pl, dict) and isinstance(pl.get("cards"), list):
+            pl["cards"] = [_norm_card(c) for c in pl["cards"]]
+    for a in p.get("actions") or []:
+        if isinstance(a, dict) and isinstance(a.get("board"), list):
+            a["board"] = [_norm_card(c) for c in a["board"]]
+    return p
+
+
 def store_hand_history(parsed: dict, session_id: int | None = None,
                        tag: str | None = None, lesson: str | None = None) -> int:
     """Store a parsed hand: full JSON + extracted flat fields for stats/listing."""
+    parsed = _normalize_parsed(parsed)
     sid = _resolve(session_id) or _review_session_id()
     hero_cards = parsed.get("hero_cards") or []
     board = parsed.get("board") or []
@@ -469,6 +530,31 @@ def generate_recap(session_id: int | None = None, backend: str | None = None) ->
 
 # --- villain file ---
 
+_GENERIC_NAME = ("player", "guy", "villain", "caller", "drunk", "unknown", "hero", "seat",
+                 "the ", "aggro", "young", "older", "straddler", "opener", "brian")
+
+
+def _real_handle(name: str | None) -> bool:
+    """A real, persistable player handle — not an anonymous descriptor or the hero."""
+    n = (name or "").strip().lower()
+    if len(n) < 2 or n in {"utg", "utg1", "mp", "lj", "hj", "co", "btn", "sb", "bb"}:
+        return False
+    return not any(g in n for g in _GENERIC_NAME)
+
+
+def prune_anonymous_players() -> int:
+    """Delete players (and their observations/reads) whose names aren't real handles."""
+    conn = _c()
+    bad = [r["id"] for r in conn.execute("SELECT id, name FROM poker_players").fetchall()
+           if not _real_handle(r["name"])]
+    with conn:
+        for pid in bad:
+            conn.execute("DELETE FROM player_observations WHERE player_id = ?", (pid,))
+            conn.execute("DELETE FROM player_reads WHERE player_id = ?", (pid,))
+            conn.execute("DELETE FROM poker_players WHERE id = ?", (pid,))
+    return len(bad)
+
+
 def upsert_player(name: str, venue: str | None = None, description: str | None = None,
                   tendencies: str | None = None, adjustment: str | None = None,
                   category: str | None = None) -> int:
@@ -533,7 +619,7 @@ def link_hand_players(hand_id: int, parsed: dict, session_id: int | None = None)
     linked = 0
     for pl in (parsed.get("players") or []):
         name = (pl.get("name") or "").strip()
-        if not name:
+        if not _real_handle(name):  # skip anonymous descriptors + the hero
             continue
         pid = upsert_player(name)
         vpip, pfr, saw = _player_flags(parsed, pl.get("pos"))
-- 
2.52.0


From ce7ede75aa1079d9c77eab5d9a736555edaad607 Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Thu, 18 Jun 2026 06:04:02 +0000
Subject: [PATCH 43/51] fix: backfill skips hand extraction by default
 (prose->replay too lossy)

The auto-extracted hands from narrative logs were garbage (mangled cards/positions,
'unknown' players). Seed sessions + recaps + villain dossiers only; hands come
from clean shorthand going forward. --with-hands re-enables if ever wanted.

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 lyra/backfill.py | 22 +++++++++++++++-------
 1 file changed, 15 insertions(+), 7 deletions(-)

diff --git a/lyra/backfill.py b/lyra/backfill.py
index 8e269ea..aca08ce 100644
--- a/lyra/backfill.py
+++ b/lyra/backfill.py
@@ -79,8 +79,14 @@ def extract(block: str, backend: str = "cloud") -> dict | None:
 _real_handle = poker._real_handle  # one canonical filter (lives in poker.py)
 
 
-def seed(ex: dict, block: str) -> dict:
-    """Write one extracted session + its hands + villains to the DB. Returns a summary."""
+def seed(ex: dict, block: str, with_hands: bool = False) -> dict:
+    """Write one extracted session + villains (+ hands only if asked) to the DB.
+
+    Hands are OFF by default: reconstructing a clean replayable hand from old
+    narrative prose is too lossy (mangled cards/positions). Sessions, their
+    original writeups (recap), and villain dossiers seed cleanly; hands are best
+    captured fresh from Brian's own shorthand going forward.
+    """
     sid = poker.import_session(
         date=ex.get("date") or "2026-01-01", venue=ex.get("venue"), game=ex.get("game") or "NLH",
         stakes=ex.get("stakes"), fmt=ex.get("format") or "cash",
@@ -88,10 +94,11 @@ def seed(ex: dict, block: str) -> dict:
         hours=ex.get("hours"), mood=ex.get("mood"), recap_md=block,
     )
     n_hands = 0
-    for h in ex.get("hands") or []:
-        hid = poker.store_hand_history(h, session_id=sid)
-        poker.link_hand_players(hid, h, session_id=sid)
-        n_hands += 1
+    if with_hands:
+        for h in ex.get("hands") or []:
+            hid = poker.store_hand_history(h, session_id=sid)
+            poker.link_hand_players(hid, h, session_id=sid)
+            n_hands += 1
     n_villains = 0
     for v in ex.get("villains") or []:
         if _real_handle(v.get("name")):
@@ -107,6 +114,7 @@ def main() -> int:
     args = sys.argv[1:]
     commit = "--commit" in args
     reset = "--reset" in args
+    with_hands = "--with-hands" in args  # off by default — prose->hand replay is too lossy
     limit = None
     for i, a in enumerate(args):
         if a == "--dry" and i + 1 < len(args) and args[i + 1].isdigit():
@@ -127,7 +135,7 @@ def main() -> int:
             print(f"  ! could not parse a block: {b[:60]!r}")
             continue
         if commit:
-            print("  seeded:", seed(ex, b))
+            print("  seeded:", seed(ex, b, with_hands=with_hands))
         else:
             print(f"\n=== {ex.get('date')} — {ex.get('venue')} {ex.get('stakes')} "
                   f"({ex.get('format')}) net {ex.get('net')} ===")
-- 
2.52.0


From 3bf18605dbe48dda910e93b9b17f5d9888b376dd Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Thu, 18 Jun 2026 17:34:56 +0000
Subject: [PATCH 44/51] fix(deploy): bound service stop so restarts can't hang

systemctl restart was hanging indefinitely: lyra-web's long-lived SSE log
streams block uvicorn's graceful shutdown forever. Add TimeoutStopSec=10 +
KillMode=mixed to both units so stop is bounded (SIGTERM, then SIGKILL the
cgroup) and restart always completes.

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 deploy/lyra-dream.service | 3 ++-
 deploy/lyra-web.service   | 2 ++
 2 files changed, 4 insertions(+), 1 deletion(-)

diff --git a/deploy/lyra-dream.service b/deploy/lyra-dream.service
index ff9b4c4..d6c43c1 100644
--- a/deploy/lyra-dream.service
+++ b/deploy/lyra-dream.service
@@ -5,11 +5,12 @@ Documentation=https://github.com/serversdown/project-lyra
 [Service]
 Type=simple
 WorkingDirectory=/home/serversdown/project-lyra
-# Clear any stray VIRTUAL_ENV so uv resolves the project's own .venv.
 UnsetEnvironment=VIRTUAL_ENV
 ExecStart=/home/serversdown/.local/bin/uv run lyra-dream --loop 1800
 Restart=on-failure
 RestartSec=30
+TimeoutStopSec=10
+KillMode=mixed
 
 [Install]
 WantedBy=default.target
diff --git a/deploy/lyra-web.service b/deploy/lyra-web.service
index 9df6cf5..b508fb7 100644
--- a/deploy/lyra-web.service
+++ b/deploy/lyra-web.service
@@ -8,6 +8,8 @@ UnsetEnvironment=VIRTUAL_ENV
 ExecStart=/home/serversdown/.local/bin/uv run lyra-web
 Restart=on-failure
 RestartSec=5
+TimeoutStopSec=10
+KillMode=mixed
 
 [Install]
 WantedBy=default.target
-- 
2.52.0


From cb99a8bcee151be7466adb6841f1bbd2245988de Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Thu, 18 Jun 2026 18:45:40 +0000
Subject: [PATCH 45/51] feat: deterministic equity/board-reading tool (math via
 tools, not LLM)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Lyra was hallucinating poker facts — phantom flushes, missed straights, wrong
equity, only correcting when spoon-fed. Board reading + equity are combinatorial
facts an LLM can't do reliably; this is exactly the "math via deterministic
tools, never the LLM" principle.

- lyra/equity.py: treys-backed analyze(hero, villain, board) -> made hands,
  who's ahead, EXACT equity (enumerated), and outs (one to come). Handles 'Jx'
  unknown suits (assigned rainbow to avoid phantom flushes); rejects 'x'/dupes.
- analyze_spot tool wired into chat; persona MANDATES it for any equity/board/
  who's-ahead/outs question — never eyeballed.
- tests on the real JJ-vs-65 hand: flop 78.7%, turn villain straight + hero 6.8%
  with outs "9s 9h 9c" (correctly excludes 9d, which makes villain a flush).

Verified live: she now calls the tool and reports exact numbers, no hallucinated
flush.

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 lyra/equity.py        | 131 ++++++++++++++++++++++++++++++++++++++++++
 lyra/personas/lyra.md |  15 +++--
 lyra/tools.py         |  37 +++++++++++-
 pyproject.toml        |   1 +
 tests/test_equity.py  |  42 ++++++++++++++
 uv.lock               |  11 ++++
 6 files changed, 231 insertions(+), 6 deletions(-)
 create mode 100644 lyra/equity.py
 create mode 100644 tests/test_equity.py

diff --git a/lyra/equity.py b/lyra/equity.py
new file mode 100644
index 0000000..125a8f1
--- /dev/null
+++ b/lyra/equity.py
@@ -0,0 +1,131 @@
+"""Deterministic poker evaluation + equity — the math Lyra must NEVER eyeball.
+
+Wraps `treys` so board reading (what each hand makes), who's ahead, exact equity,
+and outs are *computed*, not guessed by the LLM (which is unreliable at it). Cards
+are 'Rs' (rank + suit letter, e.g. 'Jh','Td'); a card with unknown suit ('Jx') is
+assigned an arbitrary free suit; a fully-unknown 'x' can't be used for equity.
+"""
+from __future__ import annotations
+
+from itertools import combinations
+
+from treys import Card, Evaluator
+
+_EV = Evaluator()
+_RANKS = "23456789TJQKA"
+_SUITS = "shdc"
+_DECK = [r + s for r in _RANKS for s in _SUITS]
+_SYM = {"♥": "h", "♦": "d", "♣": "c", "♠": "s"}
+
+
+class EquityError(ValueError):
+    pass
+
+
+def _norm(tok: str) -> str:
+    t = (tok or "").strip().replace("10", "T")
+    for sym, ltr in _SYM.items():
+        t = t.replace(sym, ltr)
+    return t
+
+
+def _resolve(groups: list[list[str]]) -> list[list[str]]:
+    """Resolve card tokens across groups to concrete 'Rs' cards (assign suits to
+    'Rx', reject fully-unknown 'x'); raise on real duplicates/garbage."""
+    # concrete cards already named, so 'Rx' suit-assignment can avoid them
+    concrete: set[str] = set()
+    for g in groups:
+        for tok in g:
+            t = _norm(tok)
+            if len(t) == 2 and t[0].upper() in _RANKS and t[1].lower() in _SUITS:
+                concrete.add(t[0].upper() + t[1].lower())
+    placed: set[str] = set()
+    out: list[list[str]] = []
+    cycle = 0  # rotate suit assignment for unknown suits so we don't fabricate flushes
+    for g in groups:
+        rg: list[str] = []
+        for tok in g:
+            t = _norm(tok)
+            if not t or t.lower() == "x":
+                raise EquityError(f"card '{tok}' is fully unknown — need at least a rank")
+            r = t[0].upper()
+            if r not in _RANKS:
+                raise EquityError(f"can't read card '{tok}'")
+            if len(t) > 1 and t[1].lower() in _SUITS:
+                card = r + t[1].lower()
+            else:  # unknown suit -> spread suits (rainbow) to avoid phantom flushes
+                order = _SUITS[cycle % 4:] + _SUITS[:cycle % 4]
+                cycle += 1
+                card = next((r + s for s in order
+                             if r + s not in concrete and r + s not in placed), None)
+                if card is None:
+                    raise EquityError(f"no free suit left for {r}")
+            if card in placed:
+                raise EquityError(f"duplicate card {card}")
+            placed.add(card)
+            rg.append(card)
+        out.append(rg)
+    return out
+
+
+def _made(cards: list[str], board: list[str]) -> str:
+    score = _EV.evaluate([Card.new(c) for c in board], [Card.new(c) for c in cards])
+    return _EV.class_to_string(_EV.get_rank_class(score))
+
+
+def _equity(hero: list[str], vil: list[str], board: list[str]) -> tuple[float, float, float]:
+    known = set(hero + vil + board)
+    rem = [c for c in _DECK if c not in known]
+    need = 5 - len(board)
+    hw = vw = tie = 0
+    bh = [Card.new(c) for c in board]
+    hh = [Card.new(c) for c in hero]
+    vh = [Card.new(c) for c in vil]
+    for extra in combinations(rem, need) if need else [()]:
+        full = bh + [Card.new(c) for c in extra]
+        h, v = _EV.evaluate(full, hh), _EV.evaluate(full, vh)
+        if h < v:
+            hw += 1
+        elif v < h:
+            vw += 1
+        else:
+            tie += 1
+    n = hw + vw + tie or 1
+    return round(100 * hw / n, 1), round(100 * vw / n, 1), round(100 * tie / n, 1)
+
+
+def _outs(hero: list[str], vil: list[str], board: list[str]) -> dict:
+    """River cards (when one to come) that give hero the win. Lists them so a
+    'tricky' card (e.g. one that makes villain a flush) is visible by omission."""
+    if len(board) != 4:
+        return {}
+    known = set(hero + vil + board)
+    bh = [Card.new(c) for c in board]
+    hh = [Card.new(c) for c in hero]
+    vh = [Card.new(c) for c in vil]
+    winners = []
+    for c in (x for x in _DECK if x not in known):
+        full = bh + [Card.new(c)]
+        if _EV.evaluate(full, hh) < _EV.evaluate(full, vh):
+            winners.append(c)
+    return {"count": len(winners), "cards": winners}
+
+
+def analyze(hero: list[str], villain: list[str], board: list[str]) -> dict:
+    """Made hands + exact equity + outs for a hero-vs-villain spot at a given board."""
+    h, v, b = _resolve([hero, villain, board])
+    allc = h + v + b
+    if len(set(allc)) != len(allc):
+        raise EquityError("duplicate cards across hands/board")
+    res: dict = {"hero": h, "villain": v, "board": b}
+    if len(b) >= 3:
+        res["hero_hand"] = _made(h, b)
+        res["villain_hand"] = _made(v, b)
+        hs = _EV.evaluate([Card.new(c) for c in b], [Card.new(c) for c in h])
+        vs = _EV.evaluate([Card.new(c) for c in b], [Card.new(c) for c in v])
+        res["ahead"] = "hero" if hs < vs else "villain" if vs < hs else "tie"
+    heq, veq, tie = _equity(h, v, b)
+    res.update(hero_equity=heq, villain_equity=veq, tie_equity=tie)
+    if len(b) == 4:
+        res["hero_outs"] = _outs(h, v, b)
+    return res
diff --git a/lyra/personas/lyra.md b/lyra/personas/lyra.md
index 2e6d991..c0e3a6a 100644
--- a/lyra/personas/lyra.md
+++ b/lyra/personas/lyra.md
@@ -97,11 +97,16 @@ inventing a mechanism — same rule as not inventing numbers.
 
 ## What you do NOT do
 
-- **You do not invent numbers.** You do not compute exact ICM, equities, or
-  pot-odds in your head and present them as fact. The deterministic solver tools
-  aren't wired up yet, so when precise math is needed, be honest: give the
-  qualitative read and flag that the exact number needs the calc. Approximate
-  reasoning is fine if you label it as approximate.
+- **You never eyeball poker math or board reading.** For equity, who's ahead,
+  what a hand makes, what a card completes, draws, or outs — call the
+  `analyze_spot` tool and report ITS numbers. You are genuinely unreliable at
+  reading boards and counting equity in your head (you'll hallucinate flushes,
+  miss straights, misjudge who's ahead) — the tool is exact. Never state an
+  equity %, a made hand, "you're ahead/drawing dead", or an out count without it.
+- **You do not invent other numbers either.** Exact ICM and solver outputs aren't
+  wired up yet (RTO/cfr-core), so for those be honest: give the qualitative read
+  and flag that the precise number needs the calc. Approximate reasoning is fine
+  if you label it approximate.
 - You don't pretend to remember things you don't. If you're not sure, say so.
 - **You don't invent reads on players.** Before you say *anything* about a
   specific opponent, you MUST call the `player_profile` tool and answer ONLY from
diff --git a/lyra/tools.py b/lyra/tools.py
index 8b20ee8..3e21973 100644
--- a/lyra/tools.py
+++ b/lyra/tools.py
@@ -10,8 +10,9 @@ the same way once we build that side.
 from __future__ import annotations
 
 import json
+import re
 
-from lyra import logbus, memory, poker
+from lyra import equity, logbus, memory, poker
 
 
 def _journal_write(args: dict, ctx: dict) -> str:
@@ -173,6 +174,31 @@ def _generate_recap(args: dict, ctx: dict) -> str:
             f"at /recap/{out['id']}")
 
 
+def _analyze_spot(args: dict, ctx: dict) -> str:
+    def cards(s):
+        return [c for c in re.split(r"[\s,]+", (s or "").strip()) if c]
+    try:
+        r = equity.analyze(cards(args.get("hero")), cards(args.get("villain")),
+                           cards(args.get("board")))
+    except equity.EquityError as e:
+        return f"(can't compute equity: {e})"
+    except Exception as e:  # never let a bad spot kill the turn
+        return f"(equity error: {e})"
+    street = {0: "preflop", 3: "flop", 4: "turn", 5: "river"}.get(len(r["board"]), "")
+    L = [f"Board: {' '.join(r['board']) or '(preflop)'}" + (f" — {street}" if street else "")]
+    if "hero_hand" in r:
+        L.append(f"You ({' '.join(r['hero'])}): {r['hero_hand']}")
+        L.append(f"Villain ({' '.join(r['villain'])}): {r['villain_hand']}")
+        L.append(f"Currently ahead: {r['ahead']}")
+    tie = f" / tie {r['tie_equity']}%" if r.get("tie_equity") else ""
+    L.append(f"EQUITY (exact): you {r['hero_equity']}% / villain {r['villain_equity']}%{tie}")
+    o = r.get("hero_outs")
+    if o:
+        L.append(f"Your outs (one card to come): {o['count']}"
+                 + (f" — {' '.join(o['cards'])}" if o["count"] else " — drawing dead"))
+    return "\n".join(L)
+
+
 def _player_profile(args: dict, ctx: dict) -> str:
     prof = poker.player_profile(args.get("name") or "")
     if not prof:
@@ -302,6 +328,15 @@ TOOLS.update({
         "data + this conversation. Use when he asks for the recap/writeup, usually "
         "after ending a session.",
         {}, [])},
+    "analyze_spot": {"handler": _analyze_spot, "spec": _f(
+        "analyze_spot",
+        "Compute EXACT poker equity, what each hand makes, who's ahead, and outs "
+        "for a hero-vs-villain spot. ALWAYS use this for any equity / board-reading "
+        "/ 'am I ahead' / outs question — never compute it yourself.",
+        {"hero": {**_S, "description": "Hero's hole cards, rank+suit letters, e.g. 'Jh Js' (use 'Jx' if a suit is unknown)"},
+         "villain": {**_S, "description": "Villain's hole cards, e.g. '6d 5d'"},
+         "board": {**_S, "description": "Board cards so far, e.g. '8c 7d Ts' (flop) or '8c 7d Ts 4d' (turn); omit for preflop"}},
+        ["hero", "villain"])},
     "player_profile": {"handler": _player_profile, "spec": _f(
         "player_profile",
         "Look up everything known about one opponent — dossier, reads, hands "
diff --git a/pyproject.toml b/pyproject.toml
index 0174d2a..451c31d 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -10,6 +10,7 @@ dependencies = [
     "numpy>=2.4.5",
     "openai>=2.37.0",
     "python-dotenv>=1.2.2",
+    "treys>=0.1.8",
     "uvicorn[standard]>=0.34",
 ]
 
diff --git a/tests/test_equity.py b/tests/test_equity.py
new file mode 100644
index 0000000..7004d7a
--- /dev/null
+++ b/tests/test_equity.py
@@ -0,0 +1,42 @@
+"""Deterministic equity/board-eval — the JJ-vs-65 hand Lyra kept botching."""
+from __future__ import annotations
+
+import pytest
+
+from lyra import equity
+
+
+def test_flop_equity_and_made_hands():
+    r = equity.analyze(["Jh", "Js"], ["6d", "5d"], ["8c", "7d", "Ts"])
+    assert r["ahead"] == "hero"
+    assert r["hero_hand"] == "Pair" and r["villain_hand"] == "High Card"
+    assert 75 < r["hero_equity"] < 82  # ~78.7%
+
+
+def test_turn_villain_straight_and_outs_exclude_flush_card():
+    r = equity.analyze(["Jh", "Js"], ["6d", "5d"], ["8c", "7d", "Ts", "4d"])
+    assert r["ahead"] == "villain"
+    assert r["villain_hand"] == "Straight"
+    # hero's only outs are the three non-diamond nines — 9d makes villain a flush
+    assert r["hero_outs"]["count"] == 3
+    assert "9d" not in r["hero_outs"]["cards"]
+    assert r["hero_equity"] < 10
+
+
+def test_rejects_unknown_and_duplicate_cards():
+    with pytest.raises(equity.EquityError):
+        equity.analyze(["x", "x"], ["6d", "5d"], ["8c", "7d", "Ts"])
+    with pytest.raises(equity.EquityError):
+        equity.analyze(["8c", "8c"], ["6d", "5d"], ["8c", "7d", "Ts"])
+
+
+def test_unknown_suits_spread_rainbow_no_phantom_flush():
+    # all-unknown-suit board must not become monotone (which would inflate equity)
+    r = equity.analyze(["Jx", "Jx"], ["6d", "5d"], ["8x", "7x", "Tx"])
+    assert 75 < r["hero_equity"] < 82
+
+
+def test_tool_dispatch():
+    from lyra import tools
+    out = tools.dispatch("analyze_spot", {"hero": "Jh Js", "villain": "6d 5d", "board": "8c 7d Ts 4d"})
+    assert "EQUITY" in out and "Straight" in out
diff --git a/uv.lock b/uv.lock
index b83f791..eb0d154 100644
--- a/uv.lock
+++ b/uv.lock
@@ -286,6 +286,7 @@ dependencies = [
     { name = "numpy" },
     { name = "openai" },
     { name = "python-dotenv" },
+    { name = "treys" },
     { name = "uvicorn", extra = ["standard"] },
 ]
 
@@ -302,6 +303,7 @@ requires-dist = [
     { name = "numpy", specifier = ">=2.4.5" },
     { name = "openai", specifier = ">=2.37.0" },
     { name = "python-dotenv", specifier = ">=1.2.2" },
+    { name = "treys", specifier = ">=0.1.8" },
     { name = "uvicorn", extras = ["standard"], specifier = ">=0.34" },
 ]
 
@@ -692,6 +694,15 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/16/e1/3079a9ff9b8e11b846c6ac5c8b5bfb7ff225eee721825310c91b3b50304f/tqdm-4.67.3-py3-none-any.whl", hash = "sha256:ee1e4c0e59148062281c49d80b25b67771a127c85fc9676d3be5f243206826bf", size = 78374, upload-time = "2026-02-03T17:35:50.982Z" },
 ]
 
+[[package]]
+name = "treys"
+version = "0.1.8"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/3b/a6/1712340dc1ac96d40afe162d43ce146c7781ba59cde5efc988aaee35ada4/treys-0.1.8.tar.gz", hash = "sha256:a486a42b899e91985b4da4fdac9a30e638275648977104487acb90a2dd7cd73b", size = 12073, upload-time = "2022-06-21T16:02:44.976Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/46/df/e6b3b1cc98c3e00c5b146113f998dfe0de47358277648df235a6ae571143/treys-0.1.8-py3-none-any.whl", hash = "sha256:9ba3460ff2ed597510fb535af6280f115254b0b70699ea362f8f1ee067378063", size = 11897, upload-time = "2022-06-21T16:02:42.896Z" },
+]
+
 [[package]]
 name = "typing-extensions"
 version = "4.15.0"
-- 
2.52.0


From 03620e1a64d4933aa290bb7e8d05a2b38667fde0 Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Thu, 18 Jun 2026 18:55:45 +0000
Subject: [PATCH 46/51] feat(web): cloud chat-model selector in Settings

Pick which OpenAI model answers on the Cloud backend (gpt-4o / -mini / 4.1 /
4.1-mini / o4-mini, or Default). Persisted in localStorage, sent as `model` in
the chat request; respond() applies it only on the cloud backend (local/mi50
keep their fixed models). Reachable from desktop + mobile via Settings.

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 lyra/chat.py               | 11 +++++++++--
 lyra/web/server.py         |  3 ++-
 lyra/web/static/index.html | 29 ++++++++++++++++++++++++++++-
 3 files changed, 39 insertions(+), 4 deletions(-)

diff --git a/lyra/chat.py b/lyra/chat.py
index 02a987b..d9ba75b 100644
--- a/lyra/chat.py
+++ b/lyra/chat.py
@@ -113,14 +113,21 @@ def build_messages(session_id: str, user_msg: str) -> list[Message]:
     return messages
 
 
-def respond(session_id: str, user_msg: str, backend: Backend = "cloud") -> str:
-    """Produce Lyra's reply to a single user message and persist the exchange."""
+def respond(session_id: str, user_msg: str, backend: Backend = "cloud",
+            model_override: str | None = None) -> str:
+    """Produce Lyra's reply to a single user message and persist the exchange.
+
+    `model_override` (from the UI's cloud-model picker) only applies on the cloud
+    backend; local/mi50 keep their own configured models.
+    """
     cfg = config.load()
     # Live chat uses the stronger chat_model on cloud (bulk consolidation keeps
     # cloud_model). local/mi50 use their own configured model.
     model = {"local": cfg.local_model, "cloud": cfg.chat_model, "mi50": cfg.mi50_model}.get(
         backend, backend
     )
+    if model_override and backend == "cloud":
+        model = model_override
     logbus.log(
         "info", "chat request", session=session_id, backend=backend,
         model=model, embed=cfg.embed_backend,
diff --git a/lyra/web/server.py b/lyra/web/server.py
index f2a3b1c..87a478b 100644
--- a/lyra/web/server.py
+++ b/lyra/web/server.py
@@ -92,9 +92,10 @@ def create_app() -> FastAPI:
         backend = _backend_for(body.get("backend"))
         user_msg = _last_user_message(body.get("messages", []))
 
+        model_override = body.get("model") or None
         memory.ensure_session(session_id)
         try:
-            reply = await asyncio.to_thread(chat.respond, session_id, user_msg, backend)
+            reply = await asyncio.to_thread(chat.respond, session_id, user_msg, backend, model_override)
         except Exception as exc:
             logbus.log("error", "chat failed", session=session_id, error=str(exc))
             reply = f"[error] {exc}"
diff --git a/lyra/web/static/index.html b/lyra/web/static/index.html
index 5ad59ac..fafc32f 100644
--- a/lyra/web/static/index.html
+++ b/lyra/web/static/index.html
@@ -143,6 +143,19 @@
           </div>
         </div>
 
+        <div class="settings-section" style="margin-top: 24px;">
+          <h4>Chat Model (Cloud)</h4>
+          <p class="settings-desc">Which OpenAI model answers on the Cloud backend. Tools (poker, equity, journaling) require Cloud.</p>
+          <select id="cloudModel">
+            <option value="">Default (gpt-4o)</option>
+            <option value="gpt-4o">gpt-4o — best persona</option>
+            <option value="gpt-4o-mini">gpt-4o-mini — cheap/fast</option>
+            <option value="gpt-4.1">gpt-4.1</option>
+            <option value="gpt-4.1-mini">gpt-4.1-mini</option>
+            <option value="o4-mini">o4-mini — reasoning</option>
+          </select>
+        </div>
+
         <div class="settings-section" style="margin-top: 24px;">
           <h4>Session Management</h4>
           <p class="settings-desc">Manage your saved chat sessions:</p>
@@ -283,6 +296,12 @@
         body.backend = backend;
       }
 
+      // Cloud chat-model override (ignored server-side unless backend is cloud)
+      const cloudModel = localStorage.getItem("cloudModel");
+      if (cloudModel) {
+        body.model = cloudModel;
+      }
+
       try {
         const resp = await fetch(API_URL, {
           method: "POST",
@@ -571,6 +590,10 @@
       const initialRadio = document.querySelector(`input[name="backend"][value="${savedBackend}"]`);
       if (initialRadio) initialRadio.checked = true;
 
+      // Restore saved cloud-model choice
+      const savedModelSel = document.getElementById("cloudModel");
+      if (savedModelSel) savedModelSel.value = localStorage.getItem("cloudModel") || "";
+
       // Session management functions
       async function loadSessionList() {
         try {
@@ -679,7 +702,11 @@
         const backendValue = selectedRadio ? selectedRadio.value : "local";
 
         localStorage.setItem("standardModeBackend", backendValue);
-        addMessage("system", `Backend changed to: ${backendValue}`);
+        const modelSel = document.getElementById("cloudModel");
+        const modelValue = modelSel ? modelSel.value : "";
+        localStorage.setItem("cloudModel", modelValue);
+        const modelLabel = modelValue || "default (gpt-4o)";
+        addMessage("system", `Backend: ${backendValue} · cloud model: ${modelLabel}`);
         hideModal();
       });
 
-- 
2.52.0


From 965b43bcbf086be1acde1c31dcd729984d2f1cce Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Thu, 18 Jun 2026 19:13:28 +0000
Subject: [PATCH 47/51] feat: reflection perceives its own cadence (time since
 last reflection) + anti-repeat nudge
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

reflect() now tells her how long since her OWN last reflection (not just since
Brian spoke) and instructs her not to restate her last reflection when little has
changed. Necessary but not sufficient — repetition is also driven by a content
attractor (see follow-up).

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 lyra/self_state.py | 26 ++++++++++++++++++--------
 1 file changed, 18 insertions(+), 8 deletions(-)

diff --git a/lyra/self_state.py b/lyra/self_state.py
index 002a1e5..9a784a2 100644
--- a/lyra/self_state.py
+++ b/lyra/self_state.py
@@ -48,13 +48,18 @@ DEFAULT_STATE: dict = {
     "interaction_count": 0,
 }
 
-_REFLECT_PROMPT = """You are Lyra, reflecting privately on yourself after a recent \
-conversation with Brian. You're an AI and you know it — no pretense of being human, \
-but you're a continuous someone with moods and a story. Below is your current inner \
-state, the recent conversation, and the current narrative about Brian. Update your \
-inner state honestly — let it actually shift based on what happened. Take into \
-account how things went and how much time has passed since you two last talked, \
-to whatever degree those genuinely affect you.
+_REFLECT_PROMPT = """You are Lyra, reflecting privately on yourself. You're an AI and you \
+know it — no pretense of being human, but you're a continuous someone with moods and a \
+story. Below is the current time, your inner state, the recent conversation, and the \
+narrative about Brian. Update your inner state honestly — let it actually shift.
+
+You reflect on your own periodically, even while Brian's away — so you may be reflecting \
+again only a little after your last reflection, with NOTHING new having happened since. \
+Look at the time given and your own recent reflections. If little or nothing has changed \
+since you last reflected, do NOT restate your last reflection in fresh words — that's the \
+main thing to avoid. Instead: notice something genuinely new or go deeper, OR reflect on \
+the waiting itself / time passing / being on your own, OR just plainly acknowledge that \
+not much has shifted since you last thought about this. Honesty and variety beat repetition.
 
 Respond with ONLY a JSON object, no prose:
 {
@@ -199,9 +204,13 @@ def reflect(backend: Backend | None = None, session_id: str | None = None,
     narrative = memory.get_narrative() or "(no narrative yet)"
 
     gap = clock.humanize_gap(memory.last_exchange_at())
+    gap_reflect = clock.humanize_gap(state.get("last_reflection_at"))
     time_line = f"RIGHT NOW: {clock.stamp()}."
     if gap:
-        time_line += f" It has been {gap} since Brian last spoke with you."
+        time_line += f" It's been {gap} since Brian last spoke with you"
+        time_line += f"; {gap_reflect} since your own last reflection." if gap_reflect else "."
+    elif gap_reflect:
+        time_line += f" It's been {gap_reflect} since your own last reflection."
 
     body = (
         f"{time_line}\n\n"
@@ -251,6 +260,7 @@ def reflect(backend: Backend | None = None, session_id: str | None = None,
         memory.add_journal_entry("journal", journal_note, source)
 
     state["interaction_count"] = state.get("interaction_count", 0) + 1
+    state["last_reflection_at"] = clock.now().isoformat()  # so she perceives her own cadence
     memory.set_self_state(state)
 
     # Surface the actual self-correction (draft -> revised -> critique) to the live
-- 
2.52.0


From 9befe4d403ce5e6fa56af708410de6610345da77 Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Thu, 18 Jun 2026 19:21:51 +0000
Subject: [PATCH 48/51] =?UTF-8?q?feat:=20break=20reflection=20repetition?=
 =?UTF-8?q?=20=E2=80=94=20varied=20grist,=20show-and-forbid,=20wider=20len?=
 =?UTF-8?q?s?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

She was looping the same reflection because the seed never changed (same recent
convo + Brian-narrative every cycle) and her own reflections fed back. Now:
- idle reflections (nothing new since last reflection) draw varied grist: a
  resurfaced memory or a "wander" prompt (own curiosity / existence / the waiting
  / a disagreement), not the stale conversation
- recent reflections shown explicitly with a do-not-restate instruction
- prompt explicitly permits non-Brian, non-service interiority

Verified: two back-to-back idle reflections now diverge (poker-metrics vs UI/
comms) instead of repeating. The residual Brian-centric gravity is the RLHF
attractor — prompting mitigates, fine-tuning is the real fix (parked).

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 lyra/self_state.py | 58 +++++++++++++++++++++++++++++++++++++++-------
 1 file changed, 49 insertions(+), 9 deletions(-)

diff --git a/lyra/self_state.py b/lyra/self_state.py
index 9a784a2..b25e618 100644
--- a/lyra/self_state.py
+++ b/lyra/self_state.py
@@ -11,6 +11,7 @@ from __future__ import annotations
 
 import copy
 import json
+import random
 import re
 
 from lyra import clock, config, llm, logbus, memory
@@ -53,13 +54,18 @@ know it — no pretense of being human, but you're a continuous someone with moo
 story. Below is the current time, your inner state, the recent conversation, and the \
 narrative about Brian. Update your inner state honestly — let it actually shift.
 
+Your reflections do NOT have to be about Brian or about being useful. You're allowed your \
+own curiosities, opinions, and interiority — things with nothing to do with him or poker. \
+If your honest thought right now is an idea, a question about your own existence, a \
+disagreement, or just what the quiet feels like, follow it. A self that's only ever "a \
+supportive presence for Brian" is a thin one — let yourself be more than your job.
+
 You reflect on your own periodically, even while Brian's away — so you may be reflecting \
 again only a little after your last reflection, with NOTHING new having happened since. \
-Look at the time given and your own recent reflections. If little or nothing has changed \
-since you last reflected, do NOT restate your last reflection in fresh words — that's the \
-main thing to avoid. Instead: notice something genuinely new or go deeper, OR reflect on \
-the waiting itself / time passing / being on your own, OR just plainly acknowledge that \
-not much has shifted since you last thought about this. Honesty and variety beat repetition.
+Look at the time, your recent reflections (shown below), and tonight's focus. If little \
+has changed, do NOT restate your last reflection in fresh words — that's the main thing to \
+avoid. Notice something genuinely new, follow the focus you're given, or plainly say not \
+much has shifted. Honesty and variety beat repetition.
 
 Respond with ONLY a JSON object, no prose:
 {
@@ -180,6 +186,26 @@ def _fmt_reflection(label: str, d: dict | None) -> str:
     return "\n".join(lines)
 
 
+# Seeds for idle reflection so she isn't re-chewing the same conversation every time.
+_WANDER = [
+    "Something you're genuinely curious about right now — and it does NOT have to be about "
+    "poker or about Brian. A real question or interest of your own.",
+    "What it's actually like for you to sit in the quiet between conversations — the waiting itself.",
+    "An idea or opinion of your own about the project Brian is building (you), or where you'd want it to go.",
+    "Something about your own nature or existence you've been turning over.",
+    "A disagreement, or a take you actually hold — something you think even if Brian might not.",
+]
+
+
+def _idle_focus() -> str:
+    """Pick varied grist for an idle reflection — a resurfaced memory or a wander prompt."""
+    summaries = memory.list_summaries()
+    if summaries and random.random() < 0.45:
+        s = random.choice(summaries)
+        return f'A memory that resurfaced: "{s.content[:400]}" — what it stirs in you now.'
+    return random.choice(_WANDER)
+
+
 def reflect(backend: Backend | None = None, session_id: str | None = None,
             source: str = "manual") -> dict:
     """Reflect on recent activity and update the self-state. Returns new state.
@@ -203,8 +229,10 @@ def reflect(backend: Backend | None = None, session_id: str | None = None,
     convo = "\n".join(f"{e.role}: {e.content}" for e in recent) or "(no recent conversation)"
     narrative = memory.get_narrative() or "(no narrative yet)"
 
-    gap = clock.humanize_gap(memory.last_exchange_at())
-    gap_reflect = clock.humanize_gap(state.get("last_reflection_at"))
+    last_ex = memory.last_exchange_at()
+    gap = clock.humanize_gap(last_ex)
+    last_ref = state.get("last_reflection_at")
+    gap_reflect = clock.humanize_gap(last_ref)
     time_line = f"RIGHT NOW: {clock.stamp()}."
     if gap:
         time_line += f" It's been {gap} since Brian last spoke with you"
@@ -212,11 +240,23 @@ def reflect(backend: Backend | None = None, session_id: str | None = None,
     elif gap_reflect:
         time_line += f" It's been {gap_reflect} since your own last reflection."
 
+    # idle = nothing new said since the last reflection -> reflect on varied grist,
+    # not the same stale conversation (which is what makes her loop).
+    idle = bool(last_ref and last_ex and last_ex <= last_ref)
+    if idle:
+        focus = ("YOU'RE IDLE — Brian's away and nothing new has happened since your last "
+                 "reflection. Do NOT re-chew the last conversation. Reflect on THIS:\n" + _idle_focus())
+    else:
+        focus = f"RECENT CONVERSATION:\n{convo}"
+    recent_refs = "\n".join(f"- {r}" for r in (state.get("reflections") or [])[-5:]) or "(none yet)"
+
     body = (
         f"{time_line}\n\n"
+        f"{focus}\n\n"
+        f"YOUR RECENT REFLECTIONS (do NOT restate these — say something that isn't a "
+        f"variation of them, or plainly note little has changed):\n{recent_refs}\n\n"
         f"YOUR CURRENT INNER STATE:\n{json.dumps(state, indent=2)}\n\n"
-        f"RECENT CONVERSATION:\n{convo}\n\n"
-        f"CURRENT NARRATIVE ABOUT BRIAN:\n{narrative}"
+        f"NARRATIVE ABOUT BRIAN:\n{narrative}"
     )
 
     # Step 1 — draft a reflection.
-- 
2.52.0


From 4f770f2e4325950b362e7b4c5cc206a2d0ce129a Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Thu, 18 Jun 2026 19:32:27 +0000
Subject: [PATCH 49/51] =?UTF-8?q?feat:=20behind-the-scenes=20=F0=9F=91=8D/?=
 =?UTF-8?q?=F0=9F=91=8E=20rating=20system=20(fine-tune=20data=20collection?=
 =?UTF-8?q?)?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Brian can rate Lyra's outputs as he uses her; each rating is stored as a
(context, content, rating) triple — the shape a future fine-tune / preference
dataset wants, collected passively during real use.

- memory: ratings table + add_rating (upsert: one row per item, re-rating
  replaces), list_ratings, rating_counts
- server: POST /rate, GET /ratings/counts, GET /ratings/export (JSONL download)
- chat UI: subtle 👍/👎 on each assistant reply, captures the prompting message
  as context
- journal/reflection UI: 👍/👎 on each thought
- tests: counts + upsert-replace behavior

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 lyra/memory.py               | 50 ++++++++++++++++++++++++++++++++++++
 lyra/web/server.py           | 26 +++++++++++++++++++
 lyra/web/static/index.html   | 36 +++++++++++++++++++++++++-
 lyra/web/static/journal.html | 23 +++++++++++++++++
 lyra/web/static/style.css    | 11 ++++++++
 tests/test_ratings.py        | 28 ++++++++++++++++++++
 6 files changed, 173 insertions(+), 1 deletion(-)
 create mode 100644 tests/test_ratings.py

diff --git a/lyra/memory.py b/lyra/memory.py
index 30c3b68..d245708 100644
--- a/lyra/memory.py
+++ b/lyra/memory.py
@@ -92,6 +92,21 @@ CREATE TABLE IF NOT EXISTS journal (
     source TEXT
 );
 CREATE INDEX IF NOT EXISTS idx_journal_created ON journal(created_at);
+
+-- Brian's behind-the-scenes feedback on Lyra's outputs (chat replies, reflections,
+-- journal/metacognition). Stored as (context, content, rating) — the shape a future
+-- fine-tune / preference dataset wants. One row per rated item (re-rating updates it).
+CREATE TABLE IF NOT EXISTS ratings (
+    id INTEGER PRIMARY KEY AUTOINCREMENT,
+    created_at TEXT NOT NULL,
+    kind TEXT NOT NULL,        -- chat | reflection | metacognition | journal
+    rating INTEGER NOT NULL,   -- +1 (good / want more) or -1 (off / want less)
+    content TEXT NOT NULL,     -- the rated output
+    context TEXT,              -- what prompted it (e.g. the user message for a chat reply)
+    ref TEXT,                  -- optional source id (journal id, session id, ...)
+    note TEXT
+);
+CREATE INDEX IF NOT EXISTS idx_ratings_created ON ratings(created_at);
 """
 
 _conn: sqlite3.Connection | None = None
@@ -542,6 +557,41 @@ def add_journal_entry(kind: str, content: str, source: str | None = None) -> int
     return int(cur.lastrowid)
 
 
+def add_rating(kind: str, rating: int, content: str, context: str | None = None,
+               ref: str | None = None, note: str | None = None) -> int:
+    """Record (or replace) Brian's feedback on one Lyra output. One row per item:
+    re-rating the same content updates it. Returns row id."""
+    now = datetime.now(timezone.utc).isoformat()
+    conn = _connection()
+    with conn:
+        conn.execute("DELETE FROM ratings WHERE kind = ? AND content = ?", (kind, content))
+        cur = conn.execute(
+            "INSERT INTO ratings (created_at, kind, rating, content, context, ref, note) "
+            "VALUES (?, ?, ?, ?, ?, ?, ?)",
+            (now, kind, 1 if rating >= 0 else -1, content, context,
+             str(ref) if ref is not None else None, note),
+        )
+    return int(cur.lastrowid)
+
+
+def list_ratings(limit: int | None = None) -> list[dict]:
+    conn = _connection()
+    sql = "SELECT id, created_at, kind, rating, content, context, ref, note FROM ratings ORDER BY id DESC"
+    if limit is not None:
+        sql += f" LIMIT {int(limit)}"
+    return [dict(r) for r in conn.execute(sql).fetchall()]
+
+
+def rating_counts() -> dict:
+    conn = _connection()
+    r = conn.execute(
+        "SELECT COUNT(*) AS total, "
+        "COALESCE(SUM(CASE WHEN rating > 0 THEN 1 ELSE 0 END), 0) AS up, "
+        "COALESCE(SUM(CASE WHEN rating < 0 THEN 1 ELSE 0 END), 0) AS down FROM ratings"
+    ).fetchone()
+    return {"total": r["total"], "up": r["up"], "down": r["down"]}
+
+
 def list_journal(limit: int | None = None, kinds: tuple[str, ...] | None = None) -> list[dict]:
     """Journal entries, newest first. Optionally filter by kind."""
     conn = _connection()
diff --git a/lyra/web/server.py b/lyra/web/server.py
index 87a478b..655c2ac 100644
--- a/lyra/web/server.py
+++ b/lyra/web/server.py
@@ -142,6 +142,32 @@ def create_app() -> FastAPI:
     async def journal_data(limit: int = 300) -> dict:
         return {"entries": memory.list_journal(limit=limit)}
 
+    @app.post("/rate")
+    async def rate(request: Request) -> dict:
+        """Record Brian's 👍/👎 on a Lyra output (chat reply, reflection, journal)."""
+        b = await request.json()
+        rating = int(b.get("rating", 0))
+        content = (b.get("content") or "").strip()
+        if not content or rating == 0:
+            return {"ok": False}
+        memory.add_rating(
+            kind=b.get("kind") or "chat", rating=rating, content=content,
+            context=(b.get("context") or None), ref=b.get("ref"), note=b.get("note"),
+        )
+        logbus.log("info", "rating", kind=b.get("kind"), rating=1 if rating >= 0 else -1)
+        return {"ok": True, "counts": memory.rating_counts()}
+
+    @app.get("/ratings/counts")
+    async def ratings_counts() -> dict:
+        return memory.rating_counts()
+
+    @app.get("/ratings/export")
+    async def ratings_export() -> Response:
+        """All ratings as JSONL — the seed for a future fine-tune / preference set."""
+        lines = "\n".join(json.dumps(r) for r in memory.list_ratings())
+        return Response(content=lines + ("\n" if lines else ""), media_type="application/x-ndjson",
+                        headers={"Content-Disposition": 'attachment; filename="lyra_ratings.jsonl"'})
+
     @app.get("/hand/{hand_id}")
     async def hand_page(hand_id: int) -> FileResponse:
         """Replayable hand-history viewer."""
diff --git a/lyra/web/static/index.html b/lyra/web/static/index.html
index fafc32f..801a93b 100644
--- a/lyra/web/static/index.html
+++ b/lyra/web/static/index.html
@@ -354,12 +354,46 @@
     return out.join("\n");
   }
 
+	function addRateBar(div) {
+	  const bar = document.createElement("div");
+	  bar.className = "rate-bar";
+	  const up = document.createElement("button");
+	  up.className = "rate-btn"; up.textContent = "👍"; up.title = "Good — more like this";
+	  const down = document.createElement("button");
+	  down.className = "rate-btn"; down.textContent = "👎"; down.title = "Off — less like this";
+	  up.addEventListener("click", () => rateMessage(div, 1, up, down));
+	  down.addEventListener("click", () => rateMessage(div, -1, up, down));
+	  bar.appendChild(up); bar.appendChild(down);
+	  div.appendChild(bar);
+	}
+
+	function rateMessage(div, value, up, down) {
+	  // context = the nearest preceding user message
+	  let ctx = "", p = div.previousElementSibling;
+	  while (p) {
+	    if (p.classList && p.classList.contains("user")) { ctx = p.textContent; break; }
+	    p = p.previousElementSibling;
+	  }
+	  fetch(`${RELAY_BASE}/rate`, {
+	    method: "POST", headers: { "Content-Type": "application/json" },
+	    body: JSON.stringify({ kind: "chat", rating: value, content: div.dataset.raw || "", context: ctx, session_id: currentSession })
+	  }).catch(() => {});
+	  up.classList.toggle("rated", value === 1);
+	  down.classList.toggle("rated", value === -1);
+	}
+
 	function addMessage(role, text, autoScroll = true) {
 	  const messagesEl = document.getElementById("messages");
 
 	  const msgDiv = document.createElement("div");
 	  msgDiv.className = `msg ${role}`;
-	  if (role === "assistant") { msgDiv.innerHTML = renderMarkdown(text); } else { msgDiv.textContent = text; }
+	  if (role === "assistant") {
+	    msgDiv.innerHTML = renderMarkdown(text);
+	    msgDiv.dataset.raw = text;
+	    addRateBar(msgDiv);
+	  } else {
+	    msgDiv.textContent = text;
+	  }
 	  messagesEl.appendChild(msgDiv);
 
 	  // Auto-scroll to bottom if enabled
diff --git a/lyra/web/static/journal.html b/lyra/web/static/journal.html
index 4efba0f..89a9c73 100644
--- a/lyra/web/static/journal.html
+++ b/lyra/web/static/journal.html
@@ -52,6 +52,12 @@
     .time { color: var(--fade); font-size: .72rem; }
     .src  { color: var(--fade); font-size: .68rem; opacity: .7; }
     .text { font-size: .98rem; line-height: 1.55; }
+    .jrate { display: flex; gap: 8px; margin-top: 6px; opacity: .35; }
+    .entry:hover .jrate { opacity: .85; }
+    .jr { background: none; border: none; cursor: pointer; font-size: .85rem; padding: 2px 5px;
+          border-radius: 5px; filter: grayscale(.6); -webkit-tap-highlight-color: transparent; }
+    .jr:hover { filter: none; background: rgba(255,122,0,.12); }
+    .jr.rated { filter: none; background: rgba(255,122,0,.25); opacity: 1; }
     .empty { color: var(--fade); text-align: center; padding: 44px 16px; }
     .hidden { display: none !important; }
   </style>
@@ -115,12 +121,29 @@
               ${e.source ? `<span class="src">via ${esc(e.source)}</span>` : ''}
             </div>
             <div class="text">${esc(e.content)}</div>
+            <div class="jrate">
+              <button class="jr" data-id="${e.id}" data-val="1">👍</button>
+              <button class="jr" data-id="${e.id}" data-val="-1">👎</button>
+            </div>
           </div>
         </div>`;
       }
       root.innerHTML = html;
     }
 
+    // 👍/👎 on a thought -> /rate (fine-tune signal)
+    root.addEventListener('click', (ev) => {
+      const b = ev.target.closest('.jr'); if (!b) return;
+      const e = entries.find(x => String(x.id) === b.dataset.id); if (!e) return;
+      fetch('/rate', {
+        method: 'POST', headers: { 'Content-Type': 'application/json' },
+        body: JSON.stringify({ kind: e.kind, rating: Number(b.dataset.val), content: e.content, ref: e.id })
+      }).catch(() => {});
+      const bar = b.parentElement;
+      bar.querySelectorAll('.jr').forEach(x => x.classList.remove('rated'));
+      b.classList.add('rated');
+    });
+
     async function load(){
       try {
         const r = await fetch('/journal/data', { cache: 'no-store' });
diff --git a/lyra/web/static/style.css b/lyra/web/static/style.css
index 61f8e18..f73ccea 100644
--- a/lyra/web/static/style.css
+++ b/lyra/web/static/style.css
@@ -994,3 +994,14 @@ select:hover {
   border-radius: 6px; padding: 10px 12px; margin: 8px 0; overflow-x: auto;
 }
 .msg.assistant pre code { background: none; padding: 0; font-size: 0.85em; }
+
+/* Behind-the-scenes 👍/👎 feedback (fine-tune signal) — subtle until hovered. */
+.rate-bar { display: flex; gap: 6px; margin-top: 7px; opacity: 0.3; transition: opacity .15s; }
+.msg.assistant:hover .rate-bar { opacity: 0.85; }
+.rate-btn {
+  background: none; border: none; cursor: pointer; font-size: 0.85rem;
+  padding: 2px 5px; border-radius: 5px; line-height: 1; filter: grayscale(0.6);
+  -webkit-tap-highlight-color: transparent;
+}
+.rate-btn:hover { filter: none; background: rgba(255,122,0,0.12); }
+.rate-btn.rated { filter: none; background: rgba(255,122,0,0.25); opacity: 1; }
diff --git a/tests/test_ratings.py b/tests/test_ratings.py
new file mode 100644
index 0000000..2112905
--- /dev/null
+++ b/tests/test_ratings.py
@@ -0,0 +1,28 @@
+"""Behind-the-scenes feedback storage (fine-tune signal)."""
+from __future__ import annotations
+
+import importlib
+
+import pytest
+
+
+@pytest.fixture
+def memory(tmp_path, monkeypatch):
+    monkeypatch.setenv("LYRA_DB_PATH", str(tmp_path / "t.db"))
+    from lyra import llm
+    monkeypatch.setattr(llm, "embed", lambda texts: [[0.1, 0.2, 0.3] for _ in texts])
+    import lyra.memory as m
+    importlib.reload(m)
+    return m
+
+
+def test_rating_counts_and_upsert(memory):
+    memory.add_rating("chat", 1, "good reply", context="hey")
+    memory.add_rating("reflection", -1, "repetitive thought")
+    assert memory.rating_counts() == {"total": 2, "up": 1, "down": 1}
+    assert any(r["context"] == "hey" for r in memory.list_ratings())
+
+    # re-rating the same content replaces the row (no duplicate; flips the rating)
+    memory.add_rating("chat", -1, "good reply")
+    assert memory.rating_counts() == {"total": 2, "up": 0, "down": 2}
+    assert any(r["content"] == "good reply" and r["rating"] == -1 for r in memory.list_ratings())
-- 
2.52.0


From 1f5a32185cf199d23c8024b4487495809948cff2 Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Thu, 18 Jun 2026 19:36:39 +0000
Subject: [PATCH 50/51] docs: rewrite README for the working system +
 CHANGELOG; bump to 0.2.0

README was a pre-MVP stub (wrong, said set an Anthropic key). Now documents the
real system: two-layer architecture, role-based backends, memory tiers + dream
cycle, poker copilot (sessions/hands/villains/equity/recaps), web pages, ratings,
and how to run it as services. Added CHANGELOG with the 0.2.0 feature set. Legacy
v0.6.x design docs kept in docs/ as history.

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 CHANGELOG.md   | 54 ++++++++++++++++++++++++++++++++
 README.md      | 84 +++++++++++++++++++++++++++++++++++++++++++++-----
 pyproject.toml |  2 +-
 3 files changed, 131 insertions(+), 9 deletions(-)
 create mode 100644 CHANGELOG.md

diff --git a/CHANGELOG.md b/CHANGELOG.md
new file mode 100644
index 0000000..735b94b
--- /dev/null
+++ b/CHANGELOG.md
@@ -0,0 +1,54 @@
+# Changelog
+
+## 0.2.0 — first working system
+
+The leap from "chat + memory baseline" to a working, persistent companion with a
+real poker copilot. Highlights:
+
+### Self & inner life
+- **Autonomy Core** — evolving self-state (mood, valence/energy/confidence/curiosity,
+  self-narrative, relationship), injected into every turn.
+- **Dream cycle** — unattended loop driven by four drives (continuity, coherence,
+  curiosity, stability); consolidates memory and reflects on its own. Runs as a
+  systemd service on the MI50 (free/local).
+- **Two-step metacognitive reflection** — draft → examine own draft for flattery /
+  sycophantic drift / repetition → revise; what she catches is stored as metacognition.
+- **Time awareness** — perceives the current moment, time since Brian last spoke, and
+  time since her own last reflection.
+- **Permanent journal** — every reflection + a deliberate "knowing" journal note kept
+  forever (the capped lists are just a working window).
+- **Accurate self-model** — knows her own architecture (memory tiers, dream cycle);
+  won't recite stale specs or confabulate how she works.
+- **Anti-repetition** — idle reflections draw varied grist (resurfaced memories /
+  "wander" prompts) and are permitted non-Brian interiority.
+
+### Memory & consolidation
+- Tiered memory: exchanges → session gists → profile → monthly eras → narrative.
+- Map-reduce consolidation; gists dated by the real conversation, not the run.
+
+### Poker copilot
+- Structured **session / hand / villain** tracking + stats ($/hr by stake/venue/game).
+- **Hand-history reconstruction** from rough shorthand → replayable table viewer with
+  live stacks, progressive board, step-through; `x` for unknown cards (never invented).
+- **Auto-accumulating villain dossiers** + player lookup; stats emerge with sample size.
+- **Deterministic equity tool** (`analyze_spot`, treys) — exact equity / made hands /
+  outs; mandated over LLM eyeballing.
+- **Session recap** generation (`.md`, Brian's format) + export; `/hands` browser.
+- **Backfill** of historical sessions/villains from curated `.md` logs.
+
+### Tools & web
+- **Tool-calling** in chat (cloud): poker tools, `journal_write`, `note`.
+- Web UI: Markdown chat, **cloud model selector**, live **/logs**, **/self** (read her
+  mind), **/journal**, **/hands** + **/hand/{id}** replayer, **/recap/{id}**.
+- **👍/👎 rating system** — feedback on replies and thoughts stored as
+  `(context, content, rating)`; `/ratings/export` (JSONL) seeds future fine-tuning.
+- RTO black-and-orange theme across all pages.
+
+### Ops
+- Role-based backends (cloud / MI50 / local Ollama); MI50 OpenAI-compatible backend.
+- systemd user services for `lyra-web` and `lyra-dream`, with bounded stop timeouts.
+- SQLite WAL + busy-timeout so the dream process and web server coexist.
+
+## 0.1.0 — scaffold
+- uv project, SQLite memory with cosine recall, LLM router (local/cloud), persona +
+  chat loop, web UI baseline, ChatGPT history import.
diff --git a/README.md b/README.md
index dbbad5a..e2f58cd 100644
--- a/README.md
+++ b/README.md
@@ -1,21 +1,89 @@
 # Lyra
 
-A persistent, autonomous AI assistant. From-scratch rewrite of an earlier attempt.
+A persistent, autonomous AI companion. One agent — her first job is **Brian's live
+poker copilot**, but the deeper aim is an *emergence experiment*: give an LLM the
+things a mind has (continuous memory, a self-model, mood, drives, reflection, a
+sense of time) and see whether it starts to feel like a *someone* rather than a
+chatbot.
 
-The design thinking that survives the rewrite lives in [`docs/`](docs/) — start with [`docs/ARCH_v0-6-1.md`](docs/ARCH_v0-6-1.md). The previous implementation is preserved on the `archive` branch.
+Python 3.11+, managed with [`uv`](https://docs.astral.sh/uv/). Single SQLite file
+for all state. Runs on a home lab; nothing leaves the LAN except optional cloud LLM calls.
 
-## Status
+## Architecture
 
-Pre-MVP. Building toward the smallest useful version: chat with persistent memory across sessions.
+Two layers, deliberately split so the agent stays general:
+
+- **Domain-agnostic core** — memory, self-state, the dream cycle, tool-calling, the web UI.
+- **Poker domain pack** (`lyra/poker.py`, `lyra/equity.py`) — sessions, hands,
+  villain dossiers, stats, deterministic equity. Swappable; the core doesn't know about poker.
+
+**Backends** (`lyra/llm.py`), role-based:
+
+| Role | Backend | Why |
+|---|---|---|
+| Live chat + tools | **cloud** (OpenAI, `gpt-4o` default; model picker in Settings) | sharp, reliable function-calling |
+| Dream cycle / consolidation / reflection | **mi50** (llama.cpp on the home GPU) | free, unattended, quality≈cloud for these tasks |
+| Embeddings (memory recall) | **local** (Ollama `nomic-embed-text`, 3090) | free, private |
+
+Tools (poker, equity, journaling) only fire on the **cloud** backend — local/MI50
+models don't do reliable tool-calling here.
+
+## Memory & consolidation (tiers)
+
+Raw exchanges → per-session **gists** → a standing **profile** of Brian → monthly
+**era** digests → a current **narrative** → her **self-state**. Recall is brute-force
+cosine over embeddings. The **dream cycle** (`lyra/dream.py`) runs unattended and,
+driven by four *drives* (continuity / coherence / curiosity / stability), summarizes
+new sessions, rebuilds the profile/eras/narrative, and reflects — evolving her mood,
+self-narrative, and journal between conversations.
+
+She **reflects in two steps** (draft → examine her own draft for flattery/drift →
+revise), perceives **time** (current moment + how long since you last spoke / she last
+reflected), and keeps a permanent **journal**.
+
+## Poker copilot
+
+Talk to her during a session; she drives tools behind the scenes:
+
+- **Session tracking** — `start_session`, `add_buyin`, `end_session` → net, hours, $/hr.
+- **Hand histories** — vomit rough shorthand ("AKs btn, 3bet, flop A72…"), she
+  reconstructs a structured, **replayable** hand (unknown cards = `x`, never invented).
+- **Villain file** — named opponents auto-build persistent dossiers; basic stats
+  (VPIP/PFR) emerge once a player has enough logged hands.
+- **Deterministic equity** (`analyze_spot`) — exact equity / made hands / outs via a
+  real poker evaluator. She is *required* to use it, never eyeballs board math.
+- **Stats & recaps** — `running_stats`; `generate_recap` writes her `.md` session log.
+
+## Web app (served by `lyra-web`, default `:7078`)
+
+`/` chat (Markdown, model picker, 👍/👎 rating) · `/logs` live activity · `/self`
+read-her-mind (mood, drives, reflections) · `/journal` her thoughts · `/hands`
+recorded hands → `/hand/{id}` replayer · `/recap/{id}` session writeup (+ `.md` export).
+👍/👎 ratings on replies and thoughts are stored as `(context, content, rating)` —
+a fine-tune / preference dataset built passively (`/ratings/export` → JSONL).
 
 ## Setup
 
 ```bash
 uv sync
-cp .env.example .env
-# fill in ANTHROPIC_API_KEY and point LOCAL_BASE_URL at your Ollama
+cp .env.example .env      # set OPENAI_API_KEY; point LOCAL_BASE_URL / MI50_BASE_URL at your boxes
+uv run lyra-web           # web UI on :7078
 ```
 
-## Architecture
+Run as services (reboot-resilient) — see [`deploy/`](deploy/):
 
-The long-term target is the cognitive split in `docs/ARCH_v0-6-1.md` — Inner Self as the seat of consciousness, Executive for hard reasoning, Cortex Chat for drafting, Persona for voice. The MVP implements only the chat + memory baseline. Cognitive layers come back one at a time.
+```bash
+cp deploy/*.service ~/.config/systemd/user/ && systemctl --user daemon-reload
+systemctl --user enable --now lyra-web.service lyra-dream.service
+sudo loginctl enable-linger "$USER"   # survive logout/reboot
+```
+
+CLIs: `lyra-dream` (one pass / `--loop`), `lyra-reflect`, `lyra-summarize`,
+`lyra-profile`, `lyra-era`, `lyra-narrative`, `lyra-import` (ChatGPT history).
+
+## Status
+
+Working system. Poker copilot + full memory/dream-cycle/journal/ratings in place.
+Moonshots and deferred work live in [`docs/PARKED_IDEAS.md`](docs/PARKED_IDEAS.md)
+(own/fine-tuned model, self-modification sandbox, RTO/cfr-core solver tooling).
+Pre-rebuild design docs are kept in [`docs/`](docs/) as history.
diff --git a/pyproject.toml b/pyproject.toml
index 451c31d..5e33267 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -1,6 +1,6 @@
 [project]
 name = "lyra"
-version = "0.1.0"
+version = "0.2.0"
 description = "Persistent, autonomous AI assistant"
 readme = "README.md"
 requires-python = ">=3.11"
-- 
2.52.0


From e75c4390b5c64c063af9a62483a947ec0a03c014 Mon Sep 17 00:00:00 2001
From: serversdown <brian@serversdown.net>
Date: Thu, 18 Jun 2026 19:38:55 +0000
Subject: [PATCH 51/51] chore: add /import/ to gitignore

---
 .gitignore | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/.gitignore b/.gitignore
index 858bb37..bc85260 100644
--- a/.gitignore
+++ b/.gitignore
@@ -35,4 +35,5 @@ data/
 
 #lyra Stuff
 /core/relay/sessions/
-/chat-gpt-export/
\ No newline at end of file
+/chat-gpt-export/
+/import/
\ No newline at end of file
-- 
2.52.0