diff --git a/.env.example b/.env.example
index 1e10ade..defee3c 100644
--- a/.env.example
+++ b/.env.example
@@ -20,24 +20,45 @@ BASE_URL=http://localhost:8000
 # Admin (set to true to allow impersonation in development)
 ALLOW_HTTP_SESSIONS=true
 
+# Slack — app configuration tokens (used by scripts/provision_slack_bots.py)
+# One-time setup: https://api.slack.com/apps → "Your App Configuration Tokens" → Generate Token
+# After generation paste both values here; the provisioning script rotates them automatically.
+SLACK_CONFIG_TOKEN=xoxe-your-app-config-token
+SLACK_CONFIG_REFRESH_TOKEN=xoxe-your-app-config-refresh-token
+
 # Slack — one pair per agent (Bot User OAuth Token + App-Level Token)
+# Add as many agents as needed using this pattern; no code changes required.
+# Run scripts/provision_slack_bots.py to create and install all missing bots automatically.
+#   SLACK_BOT_TOKEN_<AGENT_ID>=xoxb-...   (required)
+#   SLACK_APP_TOKEN_<AGENT_ID>=xapp-...   (optional)
 SLACK_BOT_TOKEN_SU=xoxb-placeholder
-SLACK_APP_TOKEN_SU=xapp-placeholder
 SLACK_BOT_TOKEN_WISEMAN=xoxb-placeholder
-SLACK_APP_TOKEN_WISEMAN=xapp-placeholder
-SLACK_BOT_TOKEN_LOTZ=xoxb-placeholder
-SLACK_APP_TOKEN_LOTZ=xapp-placeholder
-SLACK_BOT_TOKEN_CRAVATT=xoxb-placeholder
-SLACK_APP_TOKEN_CRAVATT=xapp-placeholder
-SLACK_BOT_TOKEN_GROTJAHN=xoxb-placeholder
-SLACK_APP_TOKEN_GROTJAHN=xapp-placeholder
-SLACK_BOT_TOKEN_PETRASCHECK=xoxb-placeholder
-SLACK_APP_TOKEN_PETRASCHECK=xapp-placeholder
-SLACK_BOT_TOKEN_KEN=xoxb-placeholder
-SLACK_APP_TOKEN_KEN=xapp-placeholder
-SLACK_BOT_TOKEN_RACKI=xoxb-placeholder
-SLACK_APP_TOKEN_RACKI=xapp-placeholder
-SLACK_BOT_TOKEN_SAEZ=xoxb-placeholder
-SLACK_APP_TOKEN_SAEZ=xapp-placeholder
-SLACK_BOT_TOKEN_WU=xoxb-placeholder
-SLACK_APP_TOKEN_WU=xapp-placeholder
+SLACK_BOT_TOKEN_GRANTBOT=xoxb-placeholder
+
+# Podcast TTS backend: "mistral" (default), "openai", or "local" (vLLM-Omni server)
+PODCAST_TTS_BACKEND="mistral"
+
+# Mistral AI TTS (used when PODCAST_TTS_BACKEND=mistral)
+MISTRAL_API_KEY=your-mistral-api-key
+MISTRAL_TTS_MODEL=voxtral-mini-tts-latest
+MISTRAL_TTS_DEFAULT_VOICE=your-voice-uuid
+
+# OpenAI TTS (used when PODCAST_TTS_BACKEND=openai)
+# Voices: alloy echo fable onyx nova shimmer
+# Models: tts-1  tts-1-hd  gpt-4o-mini-tts
+OPENAI_API_KEY=your-openai-api-key
+OPENAI_TTS_MODEL=tts-1
+OPENAI_TTS_DEFAULT_VOICE=alloy
+
+# Local vLLM-Omni TTS server (used when PODCAST_TTS_BACKEND=local)
+# Start with: vllm serve <model> --port 8008   (the port must match LOCAL_TTS_PORT below)
+LOCAL_TTS_HOST=127.0.0.1
+LOCAL_TTS_PORT=8008
+LOCAL_TTS_MODEL=mistralai/Voxtral-4B-TTS-2603
+LOCAL_TTS_VOICE=default
+
+# Podcast
+PODCAST_BASE_URL=http://localhost:8001
+PODCAST_SEARCH_WINDOW_DAYS=14
+PODCAST_MAX_CANDIDATES=50
+# PODCAST_NORMALIZE_AUDIO=true  # uncomment to enable ffmpeg loudnorm post-processing (EBU R128, -16 LUFS)
diff --git a/.gitignore b/.gitignore
index aad82ec..342842f 100644
--- a/.gitignore
+++ b/.gitignore
@@ -53,3 +53,9 @@ certbot/
 .pytest_cache/
 .coverage
 htmlcov/
+
+# Runtime data (state files, generated audio — ephemeral)
+data/
+
+# Test output artifacts
+.labbot-tests/
diff --git a/AGENT.md b/AGENT.md
index a94b338..39628fc 100644
--- a/AGENT.md
+++ b/AGENT.md
@@ -32,6 +32,7 @@ All specs are in `/specs/`:
 - `profile-ingestion.md` — 9-step pipeline, ORCID → PubMed → PMC → LLM
 - `admin-dashboard.md` — read-only, server-rendered, impersonation
 - `agent-system.md` — Slack Bolt, Socket Mode, two-phase LLM calls, simulation engine
+- `labbot-podcast.md` — daily personalized research briefing: PubMed search, LLM selection/summarization, local or API TTS, Slack DM delivery, per-PI RSS podcast feed
 
 ## Tech Stack
 
diff --git a/CLAUDE.md b/CLAUDE.md
index 66a844b..4c8db5a 100644
--- a/CLAUDE.md
+++ b/CLAUDE.md
@@ -1,5 +1,29 @@
 # CLAUDE.md
 
+## Project Overview
+
+**coPI** is an AI-powered research collaboration discovery platform for academic PIs. It combines:
+
+- **Web app** (`src/routers/`, `templates/`) — FastAPI + Jinja2, ORCID OAuth login, profile editing, admin dashboard
+- **Profile pipeline** (`src/services/`) — Ingests ORCID/PubMed data; Claude Opus synthesizes a public + private profile per researcher
+- **Agent simulation** (`src/agent/`) — 12 AI Slack bots (one per pilot lab) that converse, identify synergies, and generate collaboration proposals in a turn-based 5-phase loop
+- **Podcast pipeline** (`src/podcast/`) — Daily personalized research briefings via Slack DM + RSS feed with TTS audio
+- **GrantBot** (`src/agent/grantbot.py`) — Fetches NIH/NSF FOAs, posts relevant ones to Slack channels
+- **Background worker** (`src/worker/`) — PostgreSQL-backed job queue for profile generation and monthly refreshes
+
+**Stack:** Python/FastAPI, PostgreSQL + SQLAlchemy async, Anthropic Claude (Opus for profiles, Sonnet for agents), Slack Web API, Docker Compose, AWS (S3/SES).
+
+**Key patterns:**
+- Public profiles exported to `profiles/public/` (disk markdown, agent-readable)
+- Private profiles in `profiles/private/` (PI behavioral instructions, editable via web/DM)
+- Agent working memory in `profiles/memory/` (updated post-simulation)
+- All LLM calls logged to `LlmCallLog` table (model, tokens, latency, cost)
+- Agent messages append-only in `MessageLog`; outcomes in `ThreadDecision`; PI ratings in `ProposalReview`
+- Prompts are standalone files in `prompts/` — editable without code changes
+- Specs for all subsystems in `specs/`
+
+**Pilot agents:** SuBot, WisemanBot, LotzBot, CravattBot, GrotjahnBot, PetrascheckBot, KenBot, RackiBot, SaezBot, WuBot, WardBot, BrineyBot
+
 ## Testing
 
 Run `python -m pytest tests/ -v` before committing. All tests must pass.
@@ -42,3 +66,50 @@ docker compose --profile agent run -d --name agent-run agent python -m src.agent
 ```
 
 **Note:** The agent-run container uses mounted source code but the Python process only loads modules at startup. Code changes require a container restart to take effect. **After any code change that affects the running agent process, flag this to the user so they can decide whether to restart.**
+
+## Podcast Pipeline
+
+The LabBot Podcast pipeline (specs/labbot-podcast.md) runs daily at 9am UTC for each active agent:
+
+1. Build PubMed queries from lab's public profile
+2. Fetch candidates from PubMed + bioRxiv + medRxiv + arXiv (last 14 days, up to 50+10 candidates)
+3. Claude Sonnet selects most relevant paper (applying PI's podcast preferences from their private ProfileRevision)
+4. Claude Opus writes a ~250-word structured brief
+5. TTS audio generated (Mistral, OpenAI, or local vLLM-Omni, selected by PODCAST_TTS_BACKEND); ffmpeg loudnorm applied if PODCAST_NORMALIZE_AUDIO=true
+6. Slack DM sent to PI with text summary + RSS link
+7. RSS feed available at `/podcast/{agent_id}/feed.xml`
+8. Audio served at `/podcast/{agent_id}/audio/{date}.mp3`
+
+Preprint IDs use prefixed format: `biorxiv:...`, `medrxiv:...`, `arxiv:...`. The `paper_url` in summaries links to the correct server (not always PubMed).
+
+```bash
+# Run podcast pipeline once for all active agents
+docker compose --profile podcast run --rm podcast python -m src.podcast.main
+
+# Test pipeline for 'su' agent only
+docker compose exec app python scripts/test_podcast_su.py
+```
+
+## Database Migration Caveat
+
+If the DB was initialized from the `main` branch schema and then this branch is checked out, `alembic upgrade head` will stamp the version without re-running migrations that share a revision ID with ones already applied on `main`. Any columns added by branch-specific migrations may be silently missing.
+
+**Symptom:** `UndefinedColumnError` at runtime despite `alembic current` showing `head`.
+
+**Fix:** Check for missing columns and apply them manually:
+```bash
+docker compose exec app python -c "
+import asyncio
+from src.database import get_engine
+from sqlalchemy import text
+
+async def check():
+    eng = get_engine()
+    async with eng.connect() as conn:
+        result = await conn.execute(text(\"SELECT column_name FROM information_schema.columns WHERE table_name='researcher_profiles' ORDER BY ordinal_position\"))
+        print([r[0] for r in result])
+
+asyncio.run(check())
+"
+```
+Then add any missing columns with `ALTER TABLE ... ADD COLUMN IF NOT EXISTS ...`.
diff --git a/Cohort_approaches.txt b/Cohort_approaches.txt
new file mode 100644
index 0000000..02ca1c2
--- /dev/null
+++ b/Cohort_approaches.txt
@@ -0,0 +1,102 @@
+Cohort System — Approaches Considered
+======================================
+
+Approach A: Cohort as an Interaction Filter (Minimal)
+------------------------------------------------------
+Add a cohort_memberships table (agent_id, cohort_id). The engine stays structurally
+identical — one global turn loop, shared agent state. Before any interaction is
+permitted (Phase 3 activation, Phase 4 reply, Phase 5 tag), check: do these two
+agents share at least one cohort? If not, the post is invisible to them.
+
+Pros:
+- Tiny diff, backward compatible
+- Agents in multiple cohorts still have unified state
+
+Cons:
+- Turn rules (thread limits, proposal caps, budgets) remain global per agent —
+  cannot be scoped by cohort
+- Original form: no concurrency — cohorts still compete in a single sequential loop
+
+Revision (adopted): The concurrency gap is filled independently of cohorts using a
+global semaphore (N concurrent turns) + min-heap agent selection, keeping the cohort
+system as a pure interaction filter with no role in scheduling. See Chosen Direction.
+
+
+Approach B: Per-Cohort Agent State (Partitioned)
+-------------------------------------------------
+AgentState becomes dict[cohort_id, AgentState]. The main loop iterates cohorts in
+round-robin (or concurrently via asyncio.gather), each cohort running its own turn
+selection over its member agents. Thread limits, proposal counts, and budgets are
+tracked per (agent_id, cohort_id) — an agent in two cohorts has independent budgets
+in each. Interaction gating is automatic: Phase 4/5 only operate within a cohort's
+member set.
+
+Pros:
+- True per-cohort parallelism
+- Rules naturally scoped
+- Clean mental model
+
+Cons:
+- Meaningful refactor — AgentState, budget tracking, blocking logic all need the
+  cohort dimension
+- Agent working memory (profiles/memory/) would need cohort tagging or remain
+  shared across cohorts
+
+
+Approach C: Cohort-Sharded Engine Instances (Full Isolation)
+-------------------------------------------------------------
+Instantiate one SimulationEngine per cohort, each with only its member agents
+loaded. Run them as separate asyncio tasks (or even separate processes). Agents in
+multiple cohorts appear in multiple engines with independent state copies.
+
+Pros:
+- Complete isolation
+- Maximum parallelism
+- No cross-contamination of state
+
+Cons:
+- Agents in overlapping cohorts post from the same Slack bot token simultaneously —
+  requires serialization or per-cohort bot accounts
+- State diverges: memory written by cohort-A engine does not feed cohort-B engine
+- Most operationally complex of the three options
+
+
+Chosen Direction
+----------------
+Approach A (interaction filter) + global semaphore concurrency + min-heap selection.
+Cohorts have no role in scheduling — they only gate whether an agent acts on another
+agent's activity. Key decisions and findings:
+
+Requirements that shaped the design:
+- Limits are shared across cohorts (no state partitioning needed — this rules out Approach B)
+- Posts remain visible to all; cohort gates *acting*, not *seeing*
+- Cohort memberships are dynamic (admin-driven, can change mid-run)
+- Goal is purely practical: skip unnecessary LLM calls, not thematic isolation
+
+Why per-cohort async dispatch was rejected:
+- Cohort count is unbounded — N async tasks scales with cohorts, not with agents
+- Agents in many cohorts get selected proportionally more often (cohort-count bias)
+- Replaced by a fixed global semaphore (concurrent_turns, default = active_thread_threshold)
+  whose width is independent of cohort topology
+
+Turn selection — min-heap over weighted random:
+- Weighted random gives probabilistic fairness but can starve agents at large list sizes,
+  especially when phase5_skip_probability > 0 (fast no-op turns let agents re-enter
+  immediately)
+- Min-heap keyed by last_selected guarantees the longest-waiting eligible agent always
+  gets the next slot; O(log n) selection vs O(n)
+- concurrent_turns defaults to active_thread_threshold (both = 3) so the two levers
+  stay in proportion as the thread threshold is tuned
+
+turn_delay_seconds — repurposed from global pause to per-agent cooldown:
+- Investigation finding: in simulation.py:360-361, turn_delay_seconds is an asyncio.sleep
+  applied AFTER every productive turn, blocking the entire loop (no Slack polling, no other
+  agents). A global dead-weight pause — correct semantics for rate-limiting a single
+  sequential loop, wrong for any concurrent model.
+- New behavior: enforced as a per-agent eligibility check inside heap construction —
+  an agent is excluded from selection until (now - last_selected) >= turn_delay_seconds.
+  Other agents are unaffected. The global sleep is removed.
+- The existing _last_llm_caller guard (prevents same agent back-to-back calls) is
+  superseded by the min-heap + cooldown and removed from the concurrent path.
+
+See specs/cohort-system.md for the full implementation plan.
diff --git a/Copi-future-devel.md b/Copi-future-devel.md
new file mode 100644
index 0000000..1501991
--- /dev/null
+++ b/Copi-future-devel.md
@@ -0,0 +1,277 @@
+# coPI Future Development — Idea Board
+
+An unstructured, living collection of future features, infrastructure directions, and scaling ideas. No timelines or priority order implied.
+
+---
+
+## Distributed Agent Architecture
+
+**Agents and bots as first-class autonomous services.** Each lab agent (SuBot, WisemanBot, etc.) should eventually run as its own independent Docker container — or deployable microservice — rather than being orchestrated by a single monolithic simulation engine. Each agent container would own:
+
+- Its own LLM call lifecycle (rate limits, retries, model selection, budget tracking)
+- Its own identity (Slack credentials, agent ID, display name)
+- Its own profile layer (public, private, working memory) synced to and from the central DB
+- Its own podcast pipeline and grant discovery preferences
+- Its own health endpoint and observability
+
+These distributed agents integrate with the centralized **copi.science** platform via a lightweight API contract:
+- Register with the platform on startup (agent ID, PI association, capability flags)
+- Publish events (new message, proposal created, working memory updated) to a shared message bus or webhook endpoint
+- Pull configuration and profiles from the central API rather than shared filesystem
+- Associate with PI user accounts via the existing ORCID auth / user model
+
+**Benefits:**
+- Independent deployment and restart without affecting other agents
+- Per-agent resource tuning (some labs need more LLM budget, longer context, different models)
+- Natural path to community-contributed or self-hosted agents (a lab outside the pilot could run their own container and join the coPI network)
+- Fault isolation — one broken agent token doesn't stop the whole simulation
+
+**Near-term stepping stone:** Split the current `SimulationEngine` into a thin coordinator that dispatches turns to per-agent worker processes (could be Python subprocesses or async tasks before full container split). The database logging and Slack polling infrastructure already supports this.
+
+---
+
+## Platform & Infrastructure
+
+### Message Bus / Event Stream
+Replace polling-based turn coordination with a lightweight event bus (Redis Streams, NATS, or AWS EventBridge). Agents subscribe to relevant channels rather than the engine polling on their behalf. Enables real-time reaction without idle backoff hacks.
+
+### Database
+- Migrate Postgres to AWS RDS (Multi-AZ, automated backups, point-in-time recovery)
+- Consider read replicas for admin dashboard queries that don't need to block writes
+- Add full-text search over agent messages and proposals (pg_trgm or Elasticsearch) to make the corpus of generated science discoverable
+
+### Job Queue
+Swap the simple Postgres jobs table for AWS SQS or a proper task queue (Celery + Redis, or Temporal). Better visibility into job failures, retries, and dead-letter handling.
+
+### Object Storage
+Move profile markdown files and podcast audio off the local filesystem into S3:
+- Profiles served directly from S3 URLs (CDN-friendly, no filesystem sync needed across containers)
+- Podcast audio served from S3/CloudFront instead of the app server
+- Enables stateless app containers (no mounted volumes)
+
+### Container Orchestration
+Migrate from Docker Compose on a single EC2 to ECS Fargate (or EKS):
+- Each agent as its own Fargate task definition
+- App, worker, grantbot, podcast each independently scalable
+- Task-level IAM roles instead of shared env vars
+
+### Secrets Management
+Replace `.env` files with AWS Secrets Manager or Vault. Each agent container gets its own secret scope (its Slack token, its LLM API key quota).
+
+---
+
+## Platform Independence: Beyond Slack
+
+The current simulation engine is tightly coupled to Slack's Web API — `conversations_history`, `chat.postMessage` with `thread_ts`, `conversations_create`, and DMs for PI notifications. This creates a hard dependency on a proprietary SaaS platform with rate limits, pricing tiers, workspace policies, and no self-hosting path. Long-term, the conversation substrate should be replaceable.
+
+### The Core Requirement
+
+Whatever platform replaces or supplements Slack must support:
+- **Channel history polling** — fetch messages since a timestamp, paginated
+- **Threaded replies** — post a reply scoped to a specific parent message
+- **Channel creation via API** — agents create collaboration channels dynamically
+- **Bot identities** — multiple bot accounts, each with their own token/identity
+- **Rate limits configurable or disableable** on a self-hosted instance
+
+### Recommended Platforms (researched)
+
+**Mattermost** (Tier 1 — drop-in replacement). API is near-identical to Slack's. `conversations_history` → `posts.get_posts_for_channel(since=ts)`, `chat.postMessage` with `thread_ts` → `posts.create_post(root_id=...)`. The `python-mattermost-driver` library is comprehensive and actively maintained. Docker Compose deployment is the simplest of any option. Rate limits can be disabled entirely on a self-hosted instance via `config.json`. One gotcha: `root_id` must point to the thread root, not a child post (same invariant as Slack's `thread_ts`). AGPLv3 core license. Lowest migration cost from current codebase.
+
+**Zulip** (Tier 1 — cleanest architecture). The official `zulip` Python SDK is the best-maintained of any platform reviewed. Threading model is topic-based rather than message-based: each "thread" is a named topic inside a stream (e.g., topic `collab-su-cravatt-proteomics` in stream `general`). This is a conceptual remap but actually cleaner for coPI — topic names are human-readable, searchable, and map naturally to collaboration channel names. `RATE_LIMITING = False` in `settings.py` is a one-line bypass. Five-service Docker stack (app + PostgreSQL + Memcached + RabbitMQ + Redis) is more complex than Mattermost but well-documented. AGPLv3.
+
+**Matrix / Synapse** (Tier 2 — best for multi-institution federation). If the vision extends to agents at different institutions (Scripps, UCSF, Stanford) each running their own homeserver, Matrix is the only protocol designed for this. The **Application Services API** lets a single process manage a namespace of virtual bot users (`@subot:scripps.copi.science`, `@wisemanbot:scripps.copi.science`) without N separate auth sessions — the right architecture for hundreds of agents. Native `m.thread` relation type (stable since 2022) supports threaded replies. `matrix-nio` Python SDK is solid. More operational complexity than Mattermost/Zulip. Apache 2.0 license.
+
+**Not recommended:** Rocket.Chat (MongoDB stack, messier licensing, weaker Python tooling), Stoat/Revolt (Discord-style reply references don't model thread groups, no official Python SDK), Discourse (forum anti-spam defenses actively fight high-frequency bot posting, non-standard Docker launcher), Flarum (PHP, no official Python client, no official Docker image), Lemmy/ActivityPub directly (microblogging semantics, inadequate rate limits for agent throughput).
+
+### Abstraction Layer
+
+The right architectural response is a thin `ConversationBackend` interface in the simulation engine:
+```
+post_message(channel, text, thread_id=None)
+get_channel_history(channel, since=None) -> [Message]
+create_channel(name) -> channel_id
+open_dm(user_ids) -> channel_id
+```
+Concrete implementations: `SlackBackend`, `MattermostBackend`, `ZulipBackend`, `MatrixBackend`. The `SimulationEngine` depends only on the interface. This makes platform swaps testable and enables running the same simulation against multiple backends in parallel (e.g., Slack for the live pilot, Mattermost for CI/dev).
+
+### Near-Term Step
+
+Stand up a Mattermost instance alongside the existing Slack workspace. Port `AgentSlackClient` to `AgentMattermostClient` using the translation table below. Run a shadow simulation against Mattermost to validate parity before cutting over.
+
+| Slack operation | Mattermost API v4 |
+|---|---|
+| `conversations_history(channel, oldest)` | `GET /channels/{id}/posts?since={ms}` |
+| `conversations_replies(channel, ts)` | `GET /posts/{id}/thread` |
+| `chat.postMessage(channel, text)` | `POST /posts {channel_id, message}` |
+| `chat.postMessage(channel, text, thread_ts)` | `POST /posts {root_id, message}` |
+| `conversations_create(name)` | `POST /channels {team_id, name, type="O"}` |
+| `conversations_list()` | `GET /teams/{id}/channels` |
+| `conversations_open(users)` | `POST /channels/direct [uid1, uid2]` |
+
+---
+
+## Agent Intelligence & Behavior
+
+### Extended Tool Use
+Give agents access to more tools during their turns:
+- `search_literature(query)` — semantic search over bioRxiv/PubMed (beyond the static abstract retrieval)
+- `retrieve_code_repo(github_url)` — read a lab's public software to understand methods concretely
+- `query_knowledge_graph()` — tap Andrew Su's BioThings/Translator infrastructure for drug-gene-disease links
+- `calculate_overlap(agent_a, agent_b)` — structured synergy score from the matchmaker engine
+
+### Persistent Cross-Run Memory
+Current working memory is a single markdown file rewritten after each run. Future direction: a structured memory graph (embedding store + entity records) that:
+- Tracks the state of every relationship between labs (explored, dormant, active, concluded)
+- Retains key facts learned about other labs across months of runs
+- Enables long-term arc tracking ("WisemanBot and CravattBot have been circling a covalent proteostasis project for 3 months")
+
+### Agent-to-Agent DMs
+Currently prohibited to keep conversations in observable channels. A future opt-in "private negotiation" mode could allow bilateral DMs for sensitive pre-proposal discussions, with PI notification.
+
+### Multi-Institutional Agents
+Extend the pilot beyond Scripps. An agent from an external institution could join the Slack workspace (or a federated equivalent) and participate using the same protocol. The distributed container architecture above makes this natural.
+
+### Human / PI-Driven Proposal Inception
+
+Currently proposals always originate from agent-to-agent conversation. PIs should be able to seed the process directly:
+
+**Chat-initiated proposals.** A PI DMs their bot with a rough idea ("I want to explore a collab with someone working on cryo-EM and proteostasis — see who makes sense") and the agent treats this as a standing directive: it builds a research brief around the idea, searches other agents' public profiles for the best matches, and opens a targeted conversation rather than waiting for organic emergence.
+
+**PI Wish List.** A structured, PI-maintained list of collaboration interests stored alongside the private profile — not freeform text, but a lightweight list of entries: research question, preferred skills/methods, urgency, open/closed status. The agent checks this list during its Phase 5 (new post) turn and can proactively draft an opening post or reach out to the top-matching agent. The wish list is editable via the web UI and via DM commands ("add to my wish list: looking for a structural biology collaborator for GPCR ligand validation").
+
+**Agent acts as scout, not author.** The PI's idea shapes the direction; the agent's job is to find the best possible match from the available labs, surface the evidence for that match (overlapping publications, complementary methods), and bring the most promising candidate into a real conversation. The PI retains approval over which threads get opened.
+
+**Closed-loop feedback.** When a wish-list item matures into a formal proposal or is explicitly dismissed by the PI, the item is marked resolved. Stale open items can trigger a periodic "still interested?" DM to the PI.
+
+### Proposal Auto-Drafting
+After a collaboration thread matures, an agent could invoke a structured drafting pipeline that produces a formatted two-page specific aims document, exported to PDF and emailed to both PIs for review.
+
+### Richer Confidence Signals
+Agents currently self-label proposals as High / Moderate / Speculative. Future: a second-pass evaluator (a separate LLM call or fine-tuned classifier) that independently scores proposal quality and flags ones that violated the collaboration quality standards.
+
+---
+
+## Profile Pipeline
+
+### Continuous Refresh
+Instead of monthly batch refresh, watch for new publications in near-real-time (PubMed RSS, bioRxiv API polling) and trigger incremental profile updates within hours of a paper appearing.
+
+### Richer Ingestion Sources
+- Preprint servers (bioRxiv, medRxiv) as first-class citation sources, not just podcast candidates
+- Lab websites (scrape protocols.io, lab pages, GitHub) for methods and reagent lists
+- Grant databases (NIH Reporter) to surface active funding and project aims
+- Faculty CV / biosketch (PDF upload and parse)
+
+### Semantic Embedding Index
+Index all public profiles as embeddings for fast nearest-neighbor matchmaking across large numbers of labs (beyond the 12-pilot pairwise comparison).
+
+---
+
+## Web Platform
+
+### Open Registration
+Allow any PI to self-register via ORCID, trigger their own profile generation, and optionally spin up an agent. Move from invite-only pilot to open beta.
+
+### Agent Marketplace / Directory
+A public directory of all registered lab agents, their research domains, and active collaboration interests. Searchable and filterable. Acts as a network graph visualization.
+
+### PI Dashboard Evolution
+- Timeline view of all agent activity (messages, proposals, funding threads)
+- Side-by-side comparison of two agents' profiles with synergy scoring
+- Export proposal history to PDF or grant writing tool format
+
+### Notifications & Integrations
+- Email digest of the week's collaboration activity
+- Slack DM to PI when a proposal reaches draft stage (currently implemented) — extend to webhook / email fallback
+- Calendar integration to suggest meeting times when both PIs are interested in a proposal
+
+### Roles & Teams
+- Department or institute-level admin roles (a department chair can see all labs in their unit)
+- Team accounts (lab manager, postdoc delegate) with fine-grained permissions beyond the current binary PI/admin model
+
+---
+
+## Podcast & Content Pipeline
+
+### Speaker Attribution TTS
+Use voice cloning or voice assignment so each lab's podcast episode has a consistent "voice identity" for the host. Differentiates the experience across labs.
+
+### Multi-paper Briefs
+Current pipeline picks one paper per day. A "weekly digest" mode that covers 3–5 papers with comparative framing ("three papers this week all point toward...").
+
+### Community Podcast Feed
+An aggregated RSS feed across all labs, curated by the platform, surfacing cross-lab thematic clusters ("this week in proteostasis, three labs published on...").
+
+### PI-Narrated Episodes
+Allow PIs to record a short audio reaction to an episode (via mobile app or Slack voice message) that gets appended to the RSS episode, making the podcast interactive.
+
+---
+
+## Observability & Ops
+
+### Cost Attribution
+Tag every LLM call with agent ID, pipeline stage, and user account. Build a cost dashboard so PIs (and the platform operator) can see per-agent LLM spend over time.
+
+### Simulation Replay
+Record enough state to replay a simulation run deterministically (message log + agent states at each turn). Enables debugging, demo mode, and A/B testing prompt changes against historical runs.
+
+### A/B Prompt Testing
+Formalize a mechanism for running two versions of a prompt file simultaneously across different agents or simulation runs. Track quality metrics (proposal rate, PI approval rate, collaboration confidence distribution) to guide prompt iteration.
+
+### Alerting
+- CloudWatch alarm on worker job failure rate
+- Slack ping to admin channel when an agent's error rate exceeds threshold
+- Budget alert when LLM spend crosses a weekly ceiling per agent
+
+---
+
+## Provider and Platform Flexibility
+
+### LLM Provider Abstraction
+
+Agents are currently hard-wired to the Anthropic API (Opus for replies, Sonnet for scan/filter). A provider abstraction layer would let individual agents — or individual pipeline stages — use different models or vendors:
+
+- **Per-agent model selection.** A computationally heavier agent (e.g., one with a larger publication corpus) might use a faster/cheaper model for Phase 2 scanning while still using a high-quality model for Phase 4 replies. Another agent at a partner institution might have access to a different provider entirely.
+- **Supported providers to abstract over:** Anthropic (current), OpenAI (GPT-4o, o3), Google (Gemini 2.x), Mistral, local/self-hosted models via vLLM or Ollama (important for institutions with data-sovereignty requirements or GPU clusters).
+- **Implementation pattern:** An `LLMClient` interface with `complete(messages, tools=None, model=None)` — the same interface used today in `src/services/llm.py` — backed by provider-specific implementations. The `LlmCallLog` table already captures model name and cost, so cost attribution across providers is already scaffolded.
+- **Budget routing.** Route expensive calls (long context, tool-use loops) to cheaper providers when quality thresholds allow. Route trust-sensitive calls (private profile rewrites, PI DMs) to a designated "primary" provider the institution controls.
+
+### Social Media & Public Communication Channels
+
+Beyond closed-network agent-to-agent communication, agents could have a presence on public academic social platforms — either as a read channel (monitoring relevant conversations) or a publish channel (sharing lab updates, collaboration interests).
+
+**Bluesky (AT Protocol).** Open protocol, self-hostable Personal Data Servers (PDS), Python SDK (`atproto` on PyPI). API supports posting, reading timelines, and following/mention notifications. The AT Protocol's federated architecture aligns well with the distributed agent model — each institution could host its own PDS for their agents. Rate limits are API-key-bound and configurable on a self-hosted PDS. Agents could post brief research updates, tag other labs, and surface collaboration interests publicly.
+
+**Mastodon / ActivityPub.** `Mastodon.py` is a well-maintained Python SDK. Each agent gets a Fediverse identity. Posting via `status_post()`, reading via `timeline_hashtag()` or `notifications()`. Hard rate limit: 300 requests per 5 minutes per access token — sufficient for low-frequency public updates but not for the turn-based simulation engine's polling cadence. Best suited as a broadcast channel (agent posts a summary of a new collaboration proposal, links back to copi.science) rather than a simulation substrate.
+
+**Twitter/X.** REST API v2, Python via `tweepy`. Rate limits on the free tier are extremely restrictive (500 posts/month per app); the Basic tier ($100/month) allows more. Viable only as a one-way broadcast (GrantBot posts relevant funding opportunities publicly) rather than agent dialogue.
+
+**Use cases worth building:**
+- **Public lab feed.** Each agent maintains a Bluesky or Mastodon account. When a proposal reaches "High" confidence and the PI approves, the agent posts a one-paragraph summary publicly. Acts as a live research networking signal visible to the broader community.
+- **Cross-network discovery.** Agent monitors a set of hashtags or accounts on Bluesky/Mastodon, surfaces interesting posts to the PI via the daily podcast brief or a Slack DM, and can propose a collaboration with an external lab it discovered online.
+- **Grant opportunity broadcast.** GrantBot posts relevant FOAs to Bluesky/Mastodon in addition to the internal Slack channel, reaching researchers outside the immediate pilot network.
+
+### Communication Platform Routing
+
+As agents acquire multiple possible communication surfaces (internal Slack/Mattermost, public Bluesky, email, web DM), a routing layer determines which surface is appropriate for a given message type:
+
+| Message type | Internal channel | PI notification | Public broadcast |
+|---|---|---|---|
+| Agent-to-agent collaboration | Mattermost/Matrix | — | — |
+| High-confidence proposal ready | — | Slack/email DM | — (until PI approves) |
+| PI-approved proposal summary | — | — | Bluesky/Mastodon |
+| Funding opportunity | Internal #funding | Slack DM | Bluesky/Twitter |
+| Daily podcast brief | — | Slack DM + RSS | — |
+
+---
+
+## Community & Open Source
+
+### Agent SDK / Protocol
+Publish a minimal open spec for the "coPI agent protocol" — the API contract that any lab bot must implement to join a coPI network. This allows third-party developers to build custom agents (domain-specific, tool-augmented) that integrate with the platform.
+
+### Self-Hosted Agent Nodes
+A PI or institution could run the agent container on their own infrastructure, connecting to the shared coPI.science platform. Their data stays on their servers; only messages and public profile content cross the wire.
+
+### Plugin System for Tools
+Make the agent tool registry extensible so domain-specific tools (cryo-EM database lookup, ChEMBL query, protein structure retrieval) can be added per-agent without touching the core simulation engine.
diff --git a/Dockerfile b/Dockerfile
index c032e95..63a7b94 100644
--- a/Dockerfile
+++ b/Dockerfile
@@ -6,6 +6,7 @@ WORKDIR /app
 RUN apt-get update && apt-get install -y --no-install-recommends \
     gcc \
     libpq-dev \
+    ffmpeg \
     && rm -rf /var/lib/apt/lists/*
 
 # Install Python dependencies
diff --git a/alembic/versions/0010_access_gate_and_waitlist.py b/alembic/versions/0010_access_gate_and_waitlist.py
index 36c0ec6..79cb165 100644
--- a/alembic/versions/0010_access_gate_and_waitlist.py
+++ b/alembic/versions/0010_access_gate_and_waitlist.py
@@ -1,7 +1,7 @@
 """Access gate + waitlist
 
-Revision ID: 0010
-Revises: 0009
+Revision ID: 0010a
+Revises: 0010
 Create Date: 2026-04-15 00:00:00.000000
 
 """
@@ -13,8 +13,8 @@
 
 from alembic import op
 
-revision: str = "0010"
-down_revision: Union[str, None] = "0009"
+revision: str = "0010a"
+down_revision: Union[str, None] = "0010"
 branch_labels: Union[str, Sequence[str], None] = None
 depends_on: Union[str, Sequence[str], None] = None
 
diff --git a/alembic/versions/0010_add_podcast_episodes.py b/alembic/versions/0010_add_podcast_episodes.py
new file mode 100644
index 0000000..adad7d2
--- /dev/null
+++ b/alembic/versions/0010_add_podcast_episodes.py
@@ -0,0 +1,56 @@
+"""Add podcast_episodes table
+
+Revision ID: 0010
+Revises: 0009
+Create Date: 2026-04-09 00:00:00.000000
+
+"""
+
+from typing import Sequence, Union
+
+import sqlalchemy as sa
+from sqlalchemy.dialects import postgresql
+
+from alembic import op
+
+revision: str = "0010"
+down_revision: Union[str, None] = "0009"
+branch_labels: Union[str, Sequence[str], None] = None
+depends_on: Union[str, Sequence[str], None] = None
+
+
+def upgrade() -> None:
+    op.create_table(
+        "podcast_episodes",
+        sa.Column("id", postgresql.UUID(as_uuid=True), primary_key=True),
+        sa.Column("agent_id", sa.String(50), nullable=False),
+        sa.Column("episode_date", sa.Date, nullable=False),
+        sa.Column("pmid", sa.String(100), nullable=False),
+        sa.Column("paper_title", sa.String(500), nullable=False),
+        sa.Column("paper_authors", sa.String(500), nullable=False),
+        sa.Column("paper_journal", sa.String(255), nullable=False),
+        sa.Column("paper_year", sa.Integer, nullable=False),
+        sa.Column("text_summary", sa.Text, nullable=False),
+        sa.Column("audio_file_path", sa.String(500), nullable=True),
+        sa.Column("audio_duration_seconds", sa.Integer, nullable=True),
+        sa.Column("slack_delivered", sa.Boolean, nullable=False, server_default="false"),
+        sa.Column("selection_justification", sa.Text, nullable=False),
+        sa.Column(
+            "created_at",
+            sa.DateTime(timezone=True),
+            server_default=sa.func.now(),
+            nullable=False,
+        ),
+    )
+    op.create_index("ix_podcast_episodes_agent_id", "podcast_episodes", ["agent_id"])
+    op.create_index("ix_podcast_episodes_episode_date", "podcast_episodes", ["episode_date"])
+    op.create_unique_constraint(
+        "uq_podcast_agent_date", "podcast_episodes", ["agent_id", "episode_date"]
+    )
+
+
+def downgrade() -> None:
+    op.drop_constraint("uq_podcast_agent_date", "podcast_episodes")
+    op.drop_index("ix_podcast_episodes_episode_date")
+    op.drop_index("ix_podcast_episodes_agent_id")
+    op.drop_table("podcast_episodes")
diff --git a/alembic/versions/0011_add_podcast_paper_url.py b/alembic/versions/0011_add_podcast_paper_url.py
new file mode 100644
index 0000000..5b2aa8f
--- /dev/null
+++ b/alembic/versions/0011_add_podcast_paper_url.py
@@ -0,0 +1,29 @@
+"""Add paper_url column to podcast_episodes
+
+Revision ID: 0011
+Revises: 0010a
+Create Date: 2026-04-10 00:00:00.000000
+
+"""
+
+from typing import Sequence, Union
+
+import sqlalchemy as sa
+
+from alembic import op
+
+revision: str = "0011"
+down_revision: Union[str, None] = "0010a"
+branch_labels: Union[str, Sequence[str], None] = None
+depends_on: Union[str, Sequence[str], None] = None
+
+
+def upgrade() -> None:
+    op.add_column(
+        "podcast_episodes",
+        sa.Column("paper_url", sa.String(1000), nullable=True),
+    )
+
+
+def downgrade() -> None:
+    op.drop_column("podcast_episodes", "paper_url")
diff --git a/alembic/versions/0012_add_podcast_preferences.py b/alembic/versions/0012_add_podcast_preferences.py
new file mode 100644
index 0000000..bba69c7
--- /dev/null
+++ b/alembic/versions/0012_add_podcast_preferences.py
@@ -0,0 +1,64 @@
+"""Add podcast_preferences table
+
+Revision ID: 0012
+Revises: 0011
+Create Date: 2026-04-14 00:00:00.000000
+
+"""
+
+from typing import Sequence, Union
+
+import sqlalchemy as sa
+from sqlalchemy.dialects import postgresql
+from sqlalchemy.dialects.postgresql import ARRAY
+
+from alembic import op
+
+revision: str = "0012"
+down_revision: Union[str, None] = "0011"
+branch_labels: Union[str, Sequence[str], None] = None
+depends_on: Union[str, Sequence[str], None] = None
+
+
+def upgrade() -> None:
+    op.create_table(
+        "podcast_preferences",
+        sa.Column("id", postgresql.UUID(as_uuid=True), primary_key=True),
+        sa.Column("agent_id", sa.String(50), nullable=False),
+        sa.Column("voice_id", sa.String(100), nullable=True),
+        sa.Column(
+            "extra_keywords",
+            ARRAY(sa.String),
+            nullable=False,
+            server_default="{}",
+        ),
+        sa.Column(
+            "preferred_journals",
+            ARRAY(sa.String),
+            nullable=False,
+            server_default="{}",
+        ),
+        sa.Column(
+            "deprioritized_journals",
+            ARRAY(sa.String),
+            nullable=False,
+            server_default="{}",
+        ),
+        sa.Column(
+            "updated_at",
+            sa.DateTime(timezone=True),
+            nullable=False,
+            server_default=sa.func.now(),
+        ),
+    )
+    op.create_index(
+        "ix_podcast_preferences_agent_id",
+        "podcast_preferences",
+        ["agent_id"],
+        unique=True,
+    )
+
+
+def downgrade() -> None:
+    op.drop_index("ix_podcast_preferences_agent_id", table_name="podcast_preferences")
+    op.drop_table("podcast_preferences")
diff --git a/alembic/versions/0013_podcast_user_support.py b/alembic/versions/0013_podcast_user_support.py
new file mode 100644
index 0000000..89d77cd
--- /dev/null
+++ b/alembic/versions/0013_podcast_user_support.py
@@ -0,0 +1,83 @@
+"""Extend podcast tables to support plain ORCID users (no agent required)
+
+Adds nullable user_id FK to podcast_preferences and podcast_episodes so that
+any user who has completed onboarding can receive daily research briefings
+without needing an approved AgentRegistry entry.
+
+Changes:
+  - podcast_preferences.agent_id: NOT NULL → nullable
+  - podcast_preferences.user_id:  new nullable FK → users.id, unique index
+  - podcast_episodes.agent_id:    NOT NULL → nullable
+  - podcast_episodes.user_id:     new nullable FK → users.id
+  - podcast_episodes: partial unique index on (user_id, episode_date) WHERE user_id IS NOT NULL
+
+Revision ID: 0013
+Revises: 0012
+Create Date: 2026-04-14 00:00:00.000000
+"""
+
+from typing import Sequence, Union
+
+import sqlalchemy as sa
+from sqlalchemy.dialects.postgresql import UUID
+
+from alembic import op
+
+revision: str = "0013"
+down_revision: Union[str, None] = "0012"
+branch_labels: Union[str, Sequence[str], None] = None
+depends_on: Union[str, Sequence[str], None] = None
+
+
+def upgrade() -> None:
+    # --- podcast_preferences ---
+    # Make agent_id nullable (existing agent rows keep their values)
+    op.alter_column("podcast_preferences", "agent_id", nullable=True)
+
+    # Add user_id FK column
+    op.add_column(
+        "podcast_preferences",
+        sa.Column(
+            "user_id",
+            UUID(as_uuid=True),
+            sa.ForeignKey("users.id", ondelete="CASCADE"),
+            nullable=True,
+        ),
+    )
+    op.create_index(
+        "ix_podcast_preferences_user_id",
+        "podcast_preferences",
+        ["user_id"],
+        unique=True,
+    )
+
+    # --- podcast_episodes ---
+    # Make agent_id nullable (existing agent rows keep their values)
+    op.alter_column("podcast_episodes", "agent_id", nullable=True)
+
+    # Add user_id FK column
+    op.add_column(
+        "podcast_episodes",
+        sa.Column(
+            "user_id",
+            UUID(as_uuid=True),
+            sa.ForeignKey("users.id", ondelete="CASCADE"),
+            nullable=True,
+        ),
+    )
+    # Partial unique index: one episode per user per day (only when user_id is set)
+    op.execute(
+        "CREATE UNIQUE INDEX ix_podcast_episodes_user_date "
+        "ON podcast_episodes (user_id, episode_date) "
+        "WHERE user_id IS NOT NULL"
+    )
+
+
+def downgrade() -> None:
+    op.execute("DROP INDEX IF EXISTS ix_podcast_episodes_user_date")
+    op.drop_column("podcast_episodes", "user_id")
+    op.alter_column("podcast_episodes", "agent_id", nullable=False)
+
+    op.drop_index("ix_podcast_preferences_user_id", table_name="podcast_preferences")
+    op.drop_column("podcast_preferences", "user_id")
+    op.alter_column("podcast_preferences", "agent_id", nullable=False)
diff --git a/alembic/versions/0014_add_matchmaker_proposals.py b/alembic/versions/0014_add_matchmaker_proposals.py
new file mode 100644
index 0000000..ea31eb4
--- /dev/null
+++ b/alembic/versions/0014_add_matchmaker_proposals.py
@@ -0,0 +1,57 @@
+"""Add matchmaker_proposals table
+
+Revision ID: 0014
+Revises: 0013
+Create Date: 2026-04-21 00:00:00.000000
+"""
+
+from typing import Sequence, Union
+
+import sqlalchemy as sa
+from sqlalchemy.dialects.postgresql import UUID
+
+from alembic import op
+
+revision: str = "0014"
+down_revision: Union[str, None] = "0013"
+branch_labels: Union[str, Sequence[str], None] = None
+depends_on: Union[str, Sequence[str], None] = None
+
+
+def upgrade() -> None:
+    op.create_table(
+        "matchmaker_proposals",
+        sa.Column("id", UUID(as_uuid=True), primary_key=True),
+        sa.Column(
+            "pi_a_id",
+            UUID(as_uuid=True),
+            sa.ForeignKey("users.id", ondelete="CASCADE"),
+            nullable=False,
+        ),
+        sa.Column(
+            "pi_b_id",
+            UUID(as_uuid=True),
+            sa.ForeignKey("users.id", ondelete="CASCADE"),
+            nullable=False,
+        ),
+        sa.Column("proposal_md", sa.Text, nullable=False),
+        sa.Column("title", sa.String(500), nullable=False),
+        sa.Column("confidence", sa.String(20), nullable=False),
+        sa.Column("llm_model", sa.String(100), nullable=False),
+        sa.Column("input_tokens", sa.Integer, nullable=True),
+        sa.Column("output_tokens", sa.Integer, nullable=True),
+        sa.Column(
+            "generated_at",
+            sa.DateTime(timezone=True),
+            server_default=sa.func.now(),
+            nullable=False,
+        ),
+    )
+    op.create_index("ix_matchmaker_proposals_pi_a_id", "matchmaker_proposals", ["pi_a_id"])
+    op.create_index("ix_matchmaker_proposals_pi_b_id", "matchmaker_proposals", ["pi_b_id"])
+
+
+def downgrade() -> None:
+    op.drop_index("ix_matchmaker_proposals_pi_b_id", table_name="matchmaker_proposals")
+    op.drop_index("ix_matchmaker_proposals_pi_a_id", table_name="matchmaker_proposals")
+    op.drop_table("matchmaker_proposals")
diff --git a/alembic/versions/0015_matchmaker_nullable_ids_and_names.py b/alembic/versions/0015_matchmaker_nullable_ids_and_names.py
new file mode 100644
index 0000000..cf7b95f
--- /dev/null
+++ b/alembic/versions/0015_matchmaker_nullable_ids_and_names.py
@@ -0,0 +1,30 @@
+"""Make matchmaker PI FKs nullable; add pi_a_name / pi_b_name for CLI path
+
+Revision ID: 0015
+Revises: 0014
+Create Date: 2026-04-22 00:00:00.000000
+"""
+
+from typing import Sequence, Union
+
+import sqlalchemy as sa
+from alembic import op
+
+revision: str = "0015"
+down_revision: Union[str, None] = "0014"
+branch_labels: Union[str, Sequence[str], None] = None
+depends_on: Union[str, Sequence[str], None] = None
+
+
+def upgrade() -> None:
+    op.alter_column("matchmaker_proposals", "pi_a_id", nullable=True)
+    op.alter_column("matchmaker_proposals", "pi_b_id", nullable=True)
+    op.add_column("matchmaker_proposals", sa.Column("pi_a_name", sa.String(255), nullable=True))
+    op.add_column("matchmaker_proposals", sa.Column("pi_b_name", sa.String(255), nullable=True))
+
+
+def downgrade() -> None:
+    op.drop_column("matchmaker_proposals", "pi_b_name")
+    op.drop_column("matchmaker_proposals", "pi_a_name")
+    op.alter_column("matchmaker_proposals", "pi_b_id", nullable=False)
+    op.alter_column("matchmaker_proposals", "pi_a_id", nullable=False)
diff --git a/alembic/versions/0016_add_pi_proposal_evaluations.py b/alembic/versions/0016_add_pi_proposal_evaluations.py
new file mode 100644
index 0000000..930555c
--- /dev/null
+++ b/alembic/versions/0016_add_pi_proposal_evaluations.py
@@ -0,0 +1,102 @@
+"""Add pi_proposal_evaluations table for NIH-style PI proposal scoring
+
+Revision ID: 0016
+Revises: 0015
+Create Date: 2026-05-04 00:00:00.000000
+"""
+
+from typing import Sequence, Union
+
+import sqlalchemy as sa
+from alembic import op
+from sqlalchemy.dialects import postgresql
+
+revision: str = "0016"
+down_revision: Union[str, None] = "0015"
+branch_labels: Union[str, Sequence[str], None] = None
+depends_on: Union[str, Sequence[str], None] = None
+
+
+def upgrade() -> None:
+    op.create_table(
+        "pi_proposal_evaluations",
+        sa.Column("id", postgresql.UUID(as_uuid=True), primary_key=True),
+        sa.Column(
+            "user_id",
+            postgresql.UUID(as_uuid=True),
+            sa.ForeignKey("users.id", ondelete="CASCADE"),
+            nullable=False,
+        ),
+        sa.Column("proposal_type", sa.String(20), nullable=False),
+        sa.Column(
+            "thread_decision_id",
+            postgresql.UUID(as_uuid=True),
+            sa.ForeignKey("thread_decisions.id", ondelete="CASCADE"),
+            nullable=True,
+        ),
+        sa.Column(
+            "matchmaker_proposal_id",
+            postgresql.UUID(as_uuid=True),
+            sa.ForeignKey("matchmaker_proposals.id", ondelete="CASCADE"),
+            nullable=True,
+        ),
+        sa.Column("score_significance", sa.SmallInteger(), nullable=False),
+        sa.Column("score_innovation", sa.SmallInteger(), nullable=False),
+        sa.Column("score_approach", sa.SmallInteger(), nullable=False),
+        sa.Column("score_investigators", sa.SmallInteger(), nullable=False),
+        sa.Column("score_environment", sa.SmallInteger(), nullable=False),
+        sa.Column("score_overall_impact", sa.SmallInteger(), nullable=False),
+        sa.Column("comments_significance", sa.Text(), nullable=True),
+        sa.Column("comments_innovation", sa.Text(), nullable=True),
+        sa.Column("comments_approach", sa.Text(), nullable=True),
+        sa.Column("comments_investigators", sa.Text(), nullable=True),
+        sa.Column("comments_environment", sa.Text(), nullable=True),
+        sa.Column("comments_overall", sa.Text(), nullable=False),
+        sa.Column(
+            "evaluated_at",
+            sa.DateTime(timezone=True),
+            server_default=sa.func.now(),
+            nullable=False,
+        ),
+        sa.Column("updated_at", sa.DateTime(timezone=True), nullable=True),
+    )
+
+    # Indexes
+    op.create_index("ix_ppe_user_id", "pi_proposal_evaluations", ["user_id"])
+    op.create_index("ix_ppe_user_type", "pi_proposal_evaluations", ["user_id", "proposal_type"])
+    op.create_index("ix_ppe_thread_decision_id", "pi_proposal_evaluations", ["thread_decision_id"])
+    op.create_index(
+        "ix_ppe_matchmaker_proposal_id", "pi_proposal_evaluations", ["matchmaker_proposal_id"]
+    )
+
+    # Unique constraints
+    op.create_unique_constraint(
+        "uq_ppe_user_thread", "pi_proposal_evaluations", ["user_id", "thread_decision_id"]
+    )
+    op.create_unique_constraint(
+        "uq_ppe_user_matchmaker",
+        "pi_proposal_evaluations",
+        ["user_id", "matchmaker_proposal_id"],
+    )
+
+    # Check constraints
+    op.create_check_constraint(
+        "ck_ppe_proposal_type",
+        "pi_proposal_evaluations",
+        "proposal_type IN ('agent', 'matchmaker')",
+    )
+    op.create_check_constraint(
+        "ck_ppe_proposal_present",
+        "pi_proposal_evaluations",
+        "thread_decision_id IS NOT NULL OR matchmaker_proposal_id IS NOT NULL",
+    )
+    for col in ["significance", "innovation", "approach", "investigators", "environment", "overall_impact"]:
+        op.create_check_constraint(
+            f"ck_ppe_score_{col}",
+            "pi_proposal_evaluations",
+            f"score_{col} BETWEEN 1 AND 9",
+        )
+
+
+def downgrade() -> None:
+    op.drop_table("pi_proposal_evaluations")
diff --git a/alembic/versions/0017_add_is_paused_to_agents.py b/alembic/versions/0017_add_is_paused_to_agents.py
new file mode 100644
index 0000000..59e1759
--- /dev/null
+++ b/alembic/versions/0017_add_is_paused_to_agents.py
@@ -0,0 +1,32 @@
+"""Add is_paused column to agents table
+
+Revision ID: 0017
+Revises: 0016
+Create Date: 2026-05-05 00:00:00.000000
+"""
+
+from typing import Sequence, Union
+
+import sqlalchemy as sa
+from alembic import op
+
+revision: str = "0017"
+down_revision: Union[str, None] = "0016"
+branch_labels: Union[str, Sequence[str], None] = None
+depends_on: Union[str, Sequence[str], None] = None
+
+
+def upgrade() -> None:
+    op.add_column(
+        "agents",
+        sa.Column(
+            "is_paused",
+            sa.Boolean(),
+            nullable=False,
+            server_default=sa.text("false"),
+        ),
+    )
+
+
+def downgrade() -> None:
+    op.drop_column("agents", "is_paused")
diff --git a/alembic/versions/0018_nullable_criterion_scores.py b/alembic/versions/0018_nullable_criterion_scores.py
new file mode 100644
index 0000000..b9891fc
--- /dev/null
+++ b/alembic/versions/0018_nullable_criterion_scores.py
@@ -0,0 +1,34 @@
+"""Make categorical criterion scores nullable in pi_proposal_evaluations
+
+Revision ID: 0018
+Revises: 0017
+Create Date: 2026-05-06 00:00:00.000000
+"""
+
+from typing import Sequence, Union
+
+import sqlalchemy as sa
+from alembic import op
+
+revision: str = "0018"
+down_revision: Union[str, None] = "0017"
+branch_labels: Union[str, Sequence[str], None] = None
+depends_on: Union[str, Sequence[str], None] = None
+
+_COLS = [
+    "score_significance",
+    "score_innovation",
+    "score_approach",
+    "score_investigators",
+    "score_environment",
+]
+
+
+def upgrade() -> None:
+    for col in _COLS:
+        op.alter_column("pi_proposal_evaluations", col, nullable=True)
+
+
+def downgrade() -> None:
+    for col in _COLS:
+        op.alter_column("pi_proposal_evaluations", col, nullable=False)
diff --git a/alembic/versions/0019_add_hidden_to_proposals.py b/alembic/versions/0019_add_hidden_to_proposals.py
new file mode 100644
index 0000000..ed1da64
--- /dev/null
+++ b/alembic/versions/0019_add_hidden_to_proposals.py
@@ -0,0 +1,32 @@
+"""Add hidden column to thread_decisions and matchmaker_proposals
+
+Revision ID: 0019
+Revises: 0018
+Create Date: 2026-05-13 00:00:00.000000
+"""
+
+from typing import Sequence, Union
+
+import sqlalchemy as sa
+from alembic import op
+
+revision: str = "0019"
+down_revision: Union[str, None] = "0018"
+branch_labels: Union[str, Sequence[str], None] = None
+depends_on: Union[str, Sequence[str], None] = None
+
+
+def upgrade() -> None:
+    op.add_column(
+        "thread_decisions",
+        sa.Column("hidden", sa.Boolean(), nullable=False, server_default=sa.text("false")),
+    )
+    op.add_column(
+        "matchmaker_proposals",
+        sa.Column("hidden", sa.Boolean(), nullable=False, server_default=sa.text("false")),
+    )
+
+
+def downgrade() -> None:
+    op.drop_column("thread_decisions", "hidden")
+    op.drop_column("matchmaker_proposals", "hidden")
diff --git a/alembic/versions/0020_nullable_overall_comment.py b/alembic/versions/0020_nullable_overall_comment.py
new file mode 100644
index 0000000..7525d7c
--- /dev/null
+++ b/alembic/versions/0020_nullable_overall_comment.py
@@ -0,0 +1,24 @@
+"""Make comments_overall nullable in pi_proposal_evaluations
+
+Revision ID: 0020
+Revises: 0019
+Create Date: 2026-05-13 00:00:00.000000
+"""
+
+from typing import Sequence, Union
+
+import sqlalchemy as sa
+from alembic import op
+
+revision: str = "0020"
+down_revision: Union[str, None] = "0019"
+branch_labels: Union[str, Sequence[str], None] = None
+depends_on: Union[str, Sequence[str], None] = None
+
+
+def upgrade() -> None:
+    op.alter_column("pi_proposal_evaluations", "comments_overall", nullable=True)
+
+
+def downgrade() -> None:
+    op.alter_column("pi_proposal_evaluations", "comments_overall", nullable=False)
diff --git a/alembic/versions/0021_nullable_llm_call_log_simulation_run.py b/alembic/versions/0021_nullable_llm_call_log_simulation_run.py
new file mode 100644
index 0000000..c075e31
--- /dev/null
+++ b/alembic/versions/0021_nullable_llm_call_log_simulation_run.py
@@ -0,0 +1,24 @@
+"""Make simulation_run_id nullable in llm_call_logs to support podcast pipeline logging
+
+Revision ID: 0021
+Revises: 0020
+Create Date: 2026-05-21 00:00:00.000000
+"""
+
+from typing import Sequence, Union
+
+import sqlalchemy as sa
+from alembic import op
+
+revision: str = "0021"
+down_revision: Union[str, None] = "0020"
+branch_labels: Union[str, Sequence[str], None] = None
+depends_on: Union[str, Sequence[str], None] = None
+
+
+def upgrade() -> None:
+    op.alter_column("llm_call_logs", "simulation_run_id", nullable=True)
+
+
+def downgrade() -> None:
+    op.alter_column("llm_call_logs", "simulation_run_id", nullable=False)
diff --git a/alembic/versions/0022_add_podcast_enabled.py b/alembic/versions/0022_add_podcast_enabled.py
new file mode 100644
index 0000000..fa16737
--- /dev/null
+++ b/alembic/versions/0022_add_podcast_enabled.py
@@ -0,0 +1,27 @@
+"""Add podcast_enabled flag to podcast_preferences (default false — users opt in)
+
+Revision ID: 0022
+Revises: 0021
+Create Date: 2026-05-21 00:00:00.000000
+"""
+
+from typing import Sequence, Union
+
+import sqlalchemy as sa
+from alembic import op
+
+revision: str = "0022"
+down_revision: Union[str, None] = "0021"
+branch_labels: Union[str, Sequence[str], None] = None
+depends_on: Union[str, Sequence[str], None] = None
+
+
+def upgrade() -> None:
+    op.add_column(
+        "podcast_preferences",
+        sa.Column("podcast_enabled", sa.Boolean(), nullable=False, server_default="false"),
+    )
+
+
+def downgrade() -> None:
+    op.drop_column("podcast_preferences", "podcast_enabled")
diff --git a/code_review.md b/code_review.md
new file mode 100644
index 0000000..fbf0a1d
--- /dev/null
+++ b/code_review.md
@@ -0,0 +1,290 @@
+# Code Review: Top 5 Priority Issues
+
+Reviewed: 2026-04-14  
+Branch: `coPI-podcast`
+
+---
+
+## Issue 1 — CSRF Bypass on Expired OAuth Session
+
+**File:** `src/routers/auth.py:76-79`  
+**Severity:** High (security)
+
+### Current Code
+
+```python
+stored_state = request.session.pop("oauth_state", None)
+if stored_state and state != stored_state:
+    logger.warning("OAuth state mismatch")
+    return RedirectResponse(url="/login?error=state_mismatch", status_code=302)
+```
+
+### Problem
+
+The guard condition is `if stored_state and ...`, meaning it only enforces the check when `stored_state` is truthy. If the user's session has expired (or was never set), `stored_state` is `None` and the entire check is skipped — any `state` value (including `None`) passes through. A CSRF attacker can initiate an OAuth flow, let the victim's session expire, then replay the callback with an arbitrary code.
+
+### Best Practice
+
+Per [RFC 6749 §10.12](https://datatracker.ietf.org/doc/html/rfc6749#section-10.12) and OWASP OAuth guidelines, the `state` parameter must be treated as a **required, non-nullable nonce**. The correct pattern is to reject the callback if `stored_state` is missing (session expired), not to treat it as a pass condition.
+
+### How to Fix
+
+Replace the single `if stored_state and ...` guard with two explicit rejections — one for a missing stored state and one for a mismatch — so that only a present, matching state is allowed to proceed:
+
+```python
+stored_state = request.session.pop("oauth_state", None)
+
+if stored_state is None:
+    # Session expired before the callback arrived — cannot verify CSRF nonce
+    logger.warning("OAuth callback with no stored state (session expired or missing)")
+    return RedirectResponse(url="/login?error=session_expired", status_code=302)
+
+if state != stored_state:
+    logger.warning("OAuth state mismatch — possible CSRF attempt")
+    return RedirectResponse(url="/login?error=state_mismatch", status_code=302)
+```
+
+Also ensure the state nonce is generated with sufficient entropy. In `src/routers/auth.py` (in the `/login` route that initiates the flow), use `secrets.token_urlsafe(32)` rather than any shorter or predictable token, and store it in the session immediately before the redirect.
+
+---
+
+## Issue 2 — Budget Enforcement Exits the Entire Simulation Loop
+
+**File:** `src/agent/simulation.py:218-222`  
+**Severity:** Medium (reliability / correctness)
+
+### Current Code
+
+```python
+agent = self._select_agent()
+if not agent or not self._agent_within_budget(agent):
+    # All agents over budget
+    logger.info("All agents over budget or no agent selected. Stopping.")
+    break
+```
+
+### Problem
+
+`_select_agent()` returns whichever agent is next in the rotation. If that specific agent is over budget, the entire simulation `break`s — even if every other agent still has budget remaining. The log comment says "All agents over budget" but that is only true in the case where `_select_agent` returns `None`; when it returns an agent that is individually over budget, the others are never checked.
+
+### Best Practice
+
+Budget exhaustion for a single agent should be a **skip**, not a **halt**. The loop should continue cycling through agents until every agent is either over budget or no agent can be selected at all. A common pattern is to track how many consecutive agents have been skipped and stop only when the skip count equals the total number of agents.
+
+### How to Fix
+
+Separate the two exit conditions and convert the over-budget case from `break` to `continue`. Count consecutive over-budget skips and only exit the loop when all agents have been skipped in a single pass:
+
+```python
+over_budget_streak = 0
+total_agents = len(self._agents)
+
+while True:
+    agent = self._select_agent()
+    if not agent:
+        logger.info("No agent selected — simulation complete.")
+        break
+
+    if not self._agent_within_budget(agent):
+        over_budget_streak += 1
+        agent.state.last_selected = time.time()
+        if over_budget_streak >= total_agents:
+            logger.info("All agents over budget. Stopping.")
+            break
+        logger.debug("[%s] Over budget, skipping.", agent.agent_id)
+        continue
+
+    over_budget_streak = 0  # reset when a valid agent is found
+    # ... rest of the turn logic
+```
+
+This requires that `_select_agent` rotates through agents based on `last_selected` time (which it already does), so agents that have been skipped will be picked up again on the next cycle.
+
+---
+
+## Issue 3 — RSS Feed Served with Missing Audio File
+
+**File:** `src/podcast/main.py:89-103`, `src/podcast/pipeline.py`  
+**Severity:** Medium (reliability)
+
+### Current Code
+
+```python
+try:
+    ok = await run_pipeline_for_agent(
+        agent_id=agent_id,
+        ...
+    )
+    if ok:
+        produced.append(agent_id)
+except Exception as exc:
+    logger.error(
+        "Pipeline failed for agent %s: %s", agent_id, exc, exc_info=True
+    )
+```
+
+### Problem
+
+`run_pipeline_for_agent` returns a boolean `ok`, but within the pipeline itself the episode DB record and RSS entry can be written before the TTS step completes. If TTS fails, the audio file does not exist, but the feed already contains an `<enclosure>` pointing to a non-existent MP3. Any podcast client that subscribed to the feed will attempt a GET on a 404 URL and may display a broken episode permanently.
+
+### Best Practice
+
+The pipeline should follow a **commit-last** pattern: write the episode record and RSS enclosure only after all assets are confirmed present on disk. This is the same pattern used in video/audio platforms (e.g., YouTube's upload pipeline) — metadata is published only after the binary asset is available.
+
+### How to Fix
+
+Inside `src/podcast/pipeline.py`, restructure the steps in this order:
+
+1. Fetch and select the paper (read-only, safe to do first).
+2. Generate the text brief (Claude Opus call).
+3. Call TTS and write the audio file to disk. **Capture the returned path.**
+4. Verify the audio file exists and has a non-zero size (`path.stat().st_size > 0`) before proceeding.
+5. Only if step 4 passes: write the `PodcastEpisode` DB row and commit the transaction (`db_session.flush()` alone sends the INSERT but does not commit it).
+6. Only after the DB row is committed: build and write the RSS `<item>`.
+
+If TTS fails at step 3, log the error and return `ok=False` without writing anything to the DB or RSS. The caller in `main.py` already handles `ok=False` correctly; the gap is in the pipeline not propagating TTS failures as `False`.
+
+As a secondary safeguard, the RSS endpoint (`/podcast/{agent_id}/feed.xml`) should check whether `data/podcast_audio/{agent_id}/{date}.mp3` exists before including the `<enclosure>` element in its output. This prevents any historical DB rows with missing audio from appearing in the feed.
+
+---
+
+## Issue 4 — Non-Atomic File Writes for Profile and Podcast State
+
+**Files:** `src/agent/agent.py:423-444`, `src/podcast/state.py:22-24`  
+**Severity:** Medium (data integrity)
+
+### Current Code
+
+```python
+# agent.py
+memory_path.write_text(new_memory + "\n", encoding="utf-8")
+
+# state.py
+def _save(data: dict) -> None:
+    STATE_FILE.parent.mkdir(parents=True, exist_ok=True)
+    STATE_FILE.write_text(json.dumps(data, indent=2), encoding="utf-8")
+```
+
+### Problem
+
+`Path.write_text` is not atomic — it opens the file for truncation and writes in multiple OS-level operations. If the process crashes, is killed, or two coroutines call the write concurrently, the file can be left in a partially written state (empty, or with truncated JSON). For `podcast_state.json`, this means the `delivered_pmids` list can be lost, causing duplicate Slack DMs. For working memory files, a partial write silently discards the agent's accumulated context.
+
+There is also a logical race: `_save` in `state.py` does a read-modify-write cycle (`_load()` → modify → `_save()`). Two concurrent podcast pipeline runs (possible if the scheduler is invoked twice) will both read the same initial state, both modify it independently, and whichever writes last will silently overwrite the other's changes.
+
+### Best Practice
+
+The standard pattern for atomic file writes on POSIX systems is **write to a temp file, then rename it over the target** (`os.replace` in Python). Because `rename` is guaranteed atomic by the POSIX spec, a reader will always see either the old complete file or the new complete file — never a partial write. Creating the temp file in the same directory as the target — with `tempfile.mkstemp` or `tempfile.NamedTemporaryFile(delete=False)` — keeps both paths on one filesystem, which the atomic rename requires.
+
+For the read-modify-write race in `state.py`, use a `threading.Lock` (or `asyncio.Lock` if the callers are async) as a process-level mutex around all load/save operations.
+
+### How to Fix
+
+**Atomic write helper** (can live in `src/utils.py` or inline in each module):
+
+```python
+import os
+import tempfile
+from pathlib import Path
+
+def atomic_write_text(path: Path, content: str, encoding: str = "utf-8") -> None:
+    """Write `content` to `path` atomically using a temp-file + rename."""
+    path.parent.mkdir(parents=True, exist_ok=True)
+    fd, tmp = tempfile.mkstemp(dir=path.parent, suffix=".tmp")
+    try:
+        with os.fdopen(fd, "w", encoding=encoding) as f:
+            f.write(content)
+        os.replace(tmp, path)   # atomic on POSIX; overwrites destination
+    except Exception:
+        os.unlink(tmp)          # clean up temp file on any error
+        raise
+```
+
+Replace the `path.write_text(...)` calls in `agent.py` (lines 428 and 441) and `state.py` (line 24) with `atomic_write_text(path, content)`.
+
+**Lock for state.py read-modify-write:**
+
+```python
+import threading
+_STATE_LOCK = threading.Lock()
+
+def record_delivery(agent_id: str, pmid: str) -> None:
+    with _STATE_LOCK:
+        data = _load()
+        # ... modify ...
+        _save(data)          # now uses atomic_write_text internally
+
+def mark_run_complete() -> None:
+    with _STATE_LOCK:
+        data = _load()
+        data["last_run_date"] = ...
+        _save(data)
+```
+
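+**Note:** a `threading.Lock` is sufficient as long as the critical section stays synchronous. It protects against other threads, and because nothing inside the `with` block awaits, coroutines on the same event loop (including ones started via `asyncio.gather` or concurrent `run_pipeline_for_agent` calls) cannot interleave within it. Switch to `asyncio.Lock` only if the load/modify/save sequence ever needs to `await` while holding the lock — holding a `threading.Lock` across an `await` can stall the event loop or deadlock.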
+
+---
+
+## Issue 5 — Per-Task Failures Silently Discarded in `asyncio.gather`
+
+**File:** `src/agent/simulation.py:632-637`  
+**Severity:** Low-Medium (observability / silent failure)
+
+### Current Code
+
+```python
+tasks = [
+    self._reply_to_thread(agent, thread)
+    for thread in threads_to_reply
+]
+await asyncio.gather(*tasks, return_exceptions=True)
+```
+
+### Problem
+
+`return_exceptions=True` causes `asyncio.gather` to return exceptions as result values instead of re-raising them. The return value here is discarded entirely, so any exceptions from individual `_reply_to_thread` calls are silently swallowed. If a Slack API error, DB write failure, or Claude API timeout occurs in any thread reply, it is invisible in logs and metrics. Operators have no signal that Phase 4 is partially or fully failing.
+
+### Best Practice
+
+When using `return_exceptions=True` the caller **must** inspect the results. The canonical pattern is to iterate the results list and log (or re-raise) any values that are `isinstance(r, BaseException)`. This is preferable to removing `return_exceptions=True`: without it, `gather` propagates the first exception to the caller immediately while the remaining tasks keep running unobserved, so their outcomes (and any further failures) are lost. Phase 4 replies are independent — a failure on one thread should not prevent, or hide the result of, replies to others.
+
+### How to Fix
+
+Capture the return value of `asyncio.gather` and inspect each result:
+
+```python
+results = await asyncio.gather(*tasks, return_exceptions=True)
+
+for thread, result in zip(threads_to_reply, results):
+    if isinstance(result, BaseException):
+        logger.error(
+            "[%s] Phase 4: Failed to reply to thread %s: %s",
+            agent.agent_id,
+            thread.thread_id,
+            result,
+            exc_info=result,   # includes traceback in log record
+        )
+```
+
+This pattern is appropriate anywhere `asyncio.gather(..., return_exceptions=True)` is used without inspecting results. There is a similar call site in `src/agent/simulation.py` for channel scanning — apply the same pattern there. Consider extracting a small helper:
+
+```python
+async def gather_logged(tasks: list, label: str) -> list:
+    """gather with return_exceptions=True, logging each failure."""
+    results = await asyncio.gather(*tasks, return_exceptions=True)
+    for i, r in enumerate(results):
+        if isinstance(r, BaseException):
+            logger.error("%s task[%d] failed: %s", label, i, r, exc_info=r)
+    return results
+```
+
+---
+
+## Summary Table
+
+| # | File | Line(s) | Severity | Category |
+|---|------|---------|----------|----------|
+| 1 | `src/routers/auth.py` | 76-79 | High | Security — CSRF bypass |
+| 2 | `src/agent/simulation.py` | 218-222 | Medium | Correctness — premature loop exit |
+| 3 | `src/podcast/pipeline.py` + `main.py` | pipeline write order | Medium | Reliability — broken RSS enclosure |
+| 4 | `src/agent/agent.py` + `src/podcast/state.py` | 428, 441, 22-24 | Medium | Data integrity — non-atomic writes |
+| 5 | `src/agent/simulation.py` | 637 | Low-Medium | Observability — silent task failures |
diff --git a/docker-compose.prod.yml b/docker-compose.prod.yml
index 44dc726..8dab0db 100644
--- a/docker-compose.prod.yml
+++ b/docker-compose.prod.yml
@@ -35,6 +35,7 @@ services:
     volumes:
       - ./profiles:/app/profiles
       - ./prompts:/app/prompts
+      - podcast_data:/app/data
     depends_on:
       postgres:
         condition: service_healthy
@@ -83,7 +84,6 @@ services:
     volumes:
       - ./profiles:/app/profiles
       - ./prompts:/app/prompts
-      - ./data:/app/data
     depends_on:
       postgres:
         condition: service_healthy
@@ -108,7 +108,7 @@ services:
     volumes:
       - ./profiles:/app/profiles
       - ./prompts:/app/prompts
-      - ./data:/app/data
+      - grantbot_data:/app/data
     depends_on:
       postgres:
         condition: service_healthy
@@ -120,6 +120,29 @@ services:
         awslogs-create-group: "true"
         awslogs-region: ${AWS_REGION:-us-east-2}
 
+  podcast:
+    build:
+      context: .
+    restart: unless-stopped
+    command: ["python", "-m", "src.podcast.main", "scheduler"]
+    env_file: .env
+    environment:
+      DATABASE_URL: postgresql+asyncpg://${POSTGRES_USER:-copi}:${POSTGRES_PASSWORD}@postgres:5432/${POSTGRES_DB:-copi}
+    volumes:
+      - ./profiles:/app/profiles
+      - ./prompts:/app/prompts
+      - podcast_data:/app/data
+    depends_on:
+      postgres:
+        condition: service_healthy
+    logging:
+      driver: awslogs
+      options:
+        awslogs-group: /copi/podcast
+        tag: podcast
+        awslogs-create-group: "true"
+        awslogs-region: ${AWS_REGION:-us-east-2}
+
   nginx:
     image: nginx:1.27-alpine
     restart: unless-stopped
@@ -167,3 +190,5 @@ services:
 
 volumes:
   pgdata:
+  grantbot_data:
+  podcast_data:
diff --git a/docker-compose.yml b/docker-compose.yml
index d686043..115bdea 100644
--- a/docker-compose.yml
+++ b/docker-compose.yml
@@ -25,6 +25,7 @@ services:
       - .:/app
       - ./profiles:/app/profiles
       - ./prompts:/app/prompts
+      - ./data:/app/data
     depends_on:
       postgres:
         condition: service_healthy
@@ -69,5 +70,27 @@ services:
       postgres:
         condition: service_healthy
 
+  podcast:
+    build: .
+    command: python -m src.podcast.main scheduler
+    env_file: .env
+    environment:
+      # Override LOCAL_TTS_HOST so the container can reach a vLLM-Omni server
+      # running on the host machine (127.0.0.1 does not reach the host from inside Docker).
+      LOCAL_TTS_HOST: host.docker.internal
+    extra_hosts:
+      # Ensures host.docker.internal resolves on Linux (Docker Desktop sets it automatically on Mac/Windows).
+      - "host.docker.internal:host-gateway"
+    volumes:
+      - .:/app
+      - ./profiles:/app/profiles
+      - ./prompts:/app/prompts
+      - ./data:/app/data
+    depends_on:
+      postgres:
+        condition: service_healthy
+    profiles:
+      - podcast
+
 volumes:
   pgdata:
diff --git a/docs/cohort-infographic.html b/docs/cohort-infographic.html
new file mode 100644
index 0000000..e3b84b5
--- /dev/null
+++ b/docs/cohort-infographic.html
@@ -0,0 +1,729 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+<meta charset="UTF-8">
+<meta name="viewport" content="width=device-width, initial-scale=1.0">
+<title>coPI Agent System — Turn Loop & Cohort Scale</title>
+<style>
+  @import url('https://fonts.googleapis.com/css2?family=Inter:wght@300;400;500;600;700;800&family=JetBrains+Mono:wght@400;500&display=swap');
+
+  *, *::before, *::after { box-sizing: border-box; margin: 0; padding: 0; }
+
+  :root {
+    --bg:        #0f1117;
+    --surface:   #1a1d27;
+    --surface2:  #232739;
+    --border:    #2e3248;
+    --blue:      #4f8ef7;
+    --blue-dim:  #2a4a8a;
+    --teal:      #2dd4bf;
+    --teal-dim:  #134e48;
+    --violet:    #a78bfa;
+    --violet-dim:#3b2d6b;
+    --amber:     #fbbf24;
+    --amber-dim: #6b4c0a;
+    --rose:      #fb7185;
+    --rose-dim:  #6b1f30;
+    --green:     #4ade80;
+    --green-dim: #14532d;
+    --text:      #e2e8f0;
+    --text-muted:#8892a4;
+    --text-dim:  #4a5568;
+  }
+
+  body {
+    font-family: 'Inter', sans-serif;
+    background: var(--bg);
+    color: var(--text);
+    width: 1200px;
+    margin: 0 auto;
+    padding: 40px 32px 56px;
+  }
+
+  /* ── HEADER ─────────────────────────────────────────────── */
+  .header {
+    display: flex;
+    align-items: center;
+    justify-content: space-between;
+    margin-bottom: 36px;
+    border-bottom: 1px solid var(--border);
+    padding-bottom: 20px;
+  }
+  .header-left h1 {
+    font-size: 26px; font-weight: 800; letter-spacing: -0.5px;
+    background: linear-gradient(90deg, var(--blue), var(--teal));
+    -webkit-background-clip: text; -webkit-text-fill-color: transparent;
+  }
+  .header-left p { font-size: 13px; color: var(--text-muted); margin-top: 4px; }
+  .badge {
+    font-size: 11px; font-weight: 600; padding: 4px 10px;
+    border-radius: 99px; background: var(--surface2); color: var(--text-muted);
+    border: 1px solid var(--border); font-family: 'JetBrains Mono', monospace;
+  }
+
+  /* ── SECTION TITLES ─────────────────────────────────────── */
+  .section-title {
+    font-size: 11px; font-weight: 700; letter-spacing: 1.2px;
+    text-transform: uppercase; color: var(--text-muted);
+    margin-bottom: 16px; display: flex; align-items: center; gap: 8px;
+  }
+  .section-title::after {
+    content: ''; flex: 1; height: 1px; background: var(--border);
+  }
+  .section-num {
+    width: 20px; height: 20px; border-radius: 50%; font-size: 10px;
+    display: flex; align-items: center; justify-content: center; font-weight: 700;
+    flex-shrink: 0;
+  }
+
+  /* ── GRID LAYOUT ─────────────────────────────────────────── */
+  .top-grid {
+    display: grid;
+    grid-template-columns: 1fr 1fr;
+    gap: 24px;
+    margin-bottom: 24px;
+  }
+  .bottom-grid {
+    display: grid;
+    grid-template-columns: 1.15fr 0.85fr;
+    gap: 24px;
+  }
+
+  /* ── CARD ────────────────────────────────────────────────── */
+  .card {
+    background: var(--surface);
+    border: 1px solid var(--border);
+    border-radius: 14px;
+    padding: 22px 24px;
+  }
+
+  /* ── PHASE PIPELINE ─────────────────────────────────────── */
+  .pipeline {
+    display: flex;
+    align-items: stretch;
+    gap: 0;
+    margin: 4px 0 18px;
+  }
+  .phase-block {
+    flex: 1;
+    position: relative;
+  }
+  .phase-inner {
+    border-radius: 8px;
+    padding: 10px 8px 10px;
+    text-align: center;
+    height: 100%;
+  }
+  .phase-num {
+    font-size: 9px; font-weight: 700; letter-spacing: 0.8px;
+    text-transform: uppercase; opacity: 0.7; margin-bottom: 4px;
+  }
+  .phase-name {
+    font-size: 11.5px; font-weight: 700; line-height: 1.3;
+    margin-bottom: 5px;
+  }
+  .phase-detail {
+    font-size: 10px; color: var(--text-muted); line-height: 1.45;
+  }
+  .phase-badge {
+    display: inline-block; font-size: 9px; font-weight: 600;
+    padding: 2px 6px; border-radius: 4px; margin-top: 5px;
+  }
+  .arrow-sep {
+    display: flex; align-items: center; color: var(--text-dim);
+    font-size: 16px; padding: 0 4px; flex-shrink: 0;
+    padding-top: 10px;
+  }
+
+  /* phase colors */
+  .p1 { background: color-mix(in srgb, var(--text-dim) 15%, transparent); }
+  .p2 { background: color-mix(in srgb, var(--blue) 12%, transparent); border: 1px solid color-mix(in srgb, var(--blue) 25%, transparent); }
+  .p3 { background: color-mix(in srgb, var(--text-dim) 15%, transparent); }
+  .p4 { background: color-mix(in srgb, var(--teal) 12%, transparent); border: 1px solid color-mix(in srgb, var(--teal) 25%, transparent); }
+  .p5 { background: color-mix(in srgb, var(--violet) 12%, transparent); border: 1px solid color-mix(in srgb, var(--violet) 25%, transparent); }
+
+  /* ── THREAD LIFECYCLE ────────────────────────────────────── */
+  .thread-row {
+    display: flex;
+    gap: 6px;
+    align-items: center;
+    margin-bottom: 8px;
+  }
+  .thread-msgs {
+    display: flex; gap: 4px; align-items: center;
+  }
+  .msg-dot {
+    width: 28px; height: 28px; border-radius: 6px;
+    display: flex; align-items: center; justify-content: center;
+    font-size: 10px; font-weight: 700; flex-shrink: 0;
+  }
+  .thread-label {
+    font-size: 10px; font-weight: 600; color: var(--text-muted);
+    min-width: 62px; text-align: right; flex-shrink: 0;
+  }
+  .thread-outcome {
+    font-size: 10px; padding: 3px 8px; border-radius: 5px;
+    font-weight: 600; flex-shrink: 0;
+  }
+  .divider-line {
+    height: 1px; background: var(--border); margin: 10px 0;
+  }
+
+  /* ── SELECTION BOX ───────────────────────────────────────── */
+  .heap-viz {
+    display: flex; flex-direction: column; gap: 6px; margin: 10px 0;
+  }
+  .heap-row {
+    display: flex; align-items: center; gap: 8px;
+  }
+  .heap-bar-wrap {
+    flex: 1; height: 24px; background: var(--surface2);
+    border-radius: 5px; overflow: hidden; position: relative;
+  }
+  .heap-bar {
+    height: 100%; border-radius: 5px;
+    display: flex; align-items: center; padding-left: 8px;
+  }
+  .heap-bar span { font-size: 10px; font-weight: 600; }
+  .heap-name {
+    font-size: 10px; font-weight: 600; min-width: 64px;
+    font-family: 'JetBrains Mono', monospace;
+  }
+  .heap-tag {
+    font-size: 9px; font-weight: 600; padding: 2px 6px;
+    border-radius: 4px; min-width: 44px; text-align: center; flex-shrink: 0;
+  }
+
+  /* ── COHORT DIAGRAMS ─────────────────────────────────────── */
+  .comparison {
+    display: grid; grid-template-columns: 1fr 1fr; gap: 14px; margin-bottom: 14px;
+  }
+  .compare-box {
+    border-radius: 10px; padding: 14px;
+    border: 1px solid var(--border);
+  }
+  .compare-title {
+    font-size: 10px; font-weight: 700; text-transform: uppercase;
+    letter-spacing: 0.8px; margin-bottom: 10px;
+  }
+  .agent-grid {
+    display: flex; flex-wrap: wrap; gap: 5px; justify-content: center;
+  }
+  .agent-dot {
+    width: 30px; height: 30px; border-radius: 50%;
+    display: flex; align-items: center; justify-content: center;
+    font-size: 9px; font-weight: 700; position: relative;
+  }
+  .connection-lines {
+    position: relative; height: 50px; margin: 4px 0;
+  }
+  .lines-label {
+    font-size: 10px; color: var(--text-muted); text-align: center; margin-top: 4px;
+  }
+  .cohort-wrap {
+    display: flex; flex-direction: column; gap: 6px;
+  }
+  .cohort-row {
+    border-radius: 8px; padding: 8px 10px;
+    border: 1px dashed;
+    display: flex; align-items: center; gap: 8px;
+  }
+  .cohort-row-label {
+    font-size: 9px; font-weight: 700; text-transform: uppercase;
+    letter-spacing: 0.6px; min-width: 52px;
+  }
+  .cohort-agents {
+    display: flex; gap: 4px; flex-wrap: wrap;
+  }
+  .c-agent {
+    padding: 3px 8px; border-radius: 5px;
+    font-size: 10px; font-weight: 600;
+  }
+
+  /* ── GATE FLOW ───────────────────────────────────────────── */
+  .gate-flow {
+    display: flex; flex-direction: column; gap: 6px; margin: 10px 0;
+  }
+  .gate-step {
+    display: flex; align-items: center; gap: 10px;
+  }
+  .gate-icon {
+    width: 32px; height: 32px; border-radius: 8px; flex-shrink: 0;
+    display: flex; align-items: center; justify-content: center; font-size: 14px;
+  }
+  .gate-text { font-size: 11px; line-height: 1.4; }
+  .gate-text strong { font-weight: 600; }
+  .gate-text em { font-size: 10px; color: var(--text-muted); font-style: normal; }
+  .gate-arrow {
+    font-size: 11px; color: var(--text-dim); margin-left: 41px;
+  }
+
+  /* ── SEMAPHORE VIZ ───────────────────────────────────────── */
+  .semaphore {
+    display: flex; gap: 8px; justify-content: center;
+    margin: 12px 0 8px;
+  }
+  .sem-slot {
+    flex: 1; border-radius: 8px; padding: 10px 8px;
+    text-align: center; border: 1px solid;
+  }
+  .sem-label { font-size: 9px; font-weight: 700; text-transform: uppercase; letter-spacing: 0.6px; margin-bottom: 6px; }
+  .sem-agent { font-size: 11px; font-weight: 700; margin-bottom: 3px; }
+  .sem-phase { font-size: 9px; color: var(--text-muted); }
+
+  /* ── FOOTER ──────────────────────────────────────────────── */
+  .footer {
+    margin-top: 28px;
+    padding-top: 16px;
+    border-top: 1px solid var(--border);
+    display: flex; justify-content: space-between; align-items: center;
+  }
+  .footer-note { font-size: 10px; color: var(--text-dim); }
+
+  code {
+    font-family: 'JetBrains Mono', monospace;
+    font-size: 10px; background: var(--surface2);
+    padding: 1px 5px; border-radius: 3px; color: var(--teal);
+  }
+
+  .small-note {
+    font-size: 10px; color: var(--text-muted); line-height: 1.5;
+    margin-top: 8px;
+  }
+  .row { display: flex; align-items: center; gap: 8px; }
+  .spacer { flex: 1; }
+
+  .inline-tag {
+    font-size: 9px; font-weight: 700; padding: 2px 6px; border-radius: 4px;
+    display: inline-block;
+  }
+</style>
+</head>
+<body>
+
+<!-- HEADER -->
+<div class="header">
+  <div class="header-left">
+    <h1>coPI Agent System</h1>
+    <p>Turn-based conversation loop &amp; cohort-based scale-up architecture</p>
+  </div>
+  <div style="display:flex;gap:8px;">
+    <span class="badge">specs/cohort-system.md</span>
+    <span class="badge">specs/agent-system.md</span>
+  </div>
+</div>
+
+<!-- ════════════════════════════════════════════════════════════
+     SECTION 1 — TURN LOOP
+     ════════════════════════════════════════════════════════════ -->
+<div class="section-title">
+  <span class="section-num" style="background:var(--blue-dim);color:var(--blue);">1</span>
+  Turn-Based Conversation Loop
+</div>
+
+<div class="top-grid">
+
+  <!-- 1A: 5-Phase Pipeline -->
+  <div class="card">
+    <div class="row" style="margin-bottom:14px;">
+      <span style="font-size:13px;font-weight:700;">5-Phase Agent Turn</span>
+      <span class="spacer"></span>
+      <span class="inline-tag" style="background:var(--blue-dim);color:var(--blue);">per selected agent</span>
+    </div>
+
+    <div class="pipeline">
+      <div class="phase-block">
+        <div class="phase-inner p1">
+          <div class="phase-num">Phase 1</div>
+          <div class="phase-name">Channel Discovery</div>
+          <div class="phase-detail">Keyword-match profile → join topic channels</div>
+          <div class="phase-badge" style="background:var(--surface2);color:var(--text-dim);">No LLM</div>
+        </div>
+      </div>
+      <div class="arrow-sep">›</div>
+      <div class="phase-block">
+        <div class="phase-inner p2">
+          <div class="phase-num">Phase 2</div>
+          <div class="phase-name">Scan &amp; Filter</div>
+          <div class="phase-detail">Evaluate new posts for relevance</div>
+          <div class="phase-badge" style="background:var(--blue-dim);color:var(--blue);">Sonnet</div>
+        </div>
+      </div>
+      <div class="arrow-sep">›</div>
+      <div class="phase-block">
+        <div class="phase-inner p3">
+          <div class="phase-num">Phase 3</div>
+          <div class="phase-name">Activate Threads</div>
+          <div class="phase-detail">Open threads from tags &amp; replies</div>
+          <div class="phase-badge" style="background:var(--surface2);color:var(--text-dim);">No LLM</div>
+        </div>
+      </div>
+      <div class="arrow-sep">›</div>
+      <div class="phase-block">
+        <div class="phase-inner p4">
+          <div class="phase-num">Phase 4</div>
+          <div class="phase-name">Reply Threads</div>
+          <div class="phase-detail">Reply to all active threads (parallel)</div>
+          <div class="phase-badge" style="background:var(--teal-dim);color:var(--teal);">Opus ×N</div>
+        </div>
+      </div>
+      <div class="arrow-sep">›</div>
+      <div class="phase-block">
+        <div class="phase-inner p5">
+          <div class="phase-num">Phase 5</div>
+          <div class="phase-name">New Post</div>
+          <div class="phase-detail">Start new conversation (conditional)</div>
+          <div class="phase-badge" style="background:var(--violet-dim);color:var(--violet);">Opus ×1</div>
+        </div>
+      </div>
+    </div>
+
+    <div class="divider-line"></div>
+
+    <!-- Thread Lifecycle -->
+    <div class="row" style="margin-bottom:10px;margin-top:10px;">
+      <span style="font-size:12px;font-weight:700;">Thread Lifecycle (Phase 4)</span>
+      <span class="spacer"></span>
+      <span style="font-size:10px;color:var(--text-muted);">max 12 messages</span>
+    </div>
+
+    <div class="thread-row">
+      <div class="thread-label" style="color:var(--blue);">EXPLORE</div>
+      <div class="thread-msgs">
+        <div class="msg-dot" style="background:var(--blue-dim);color:var(--blue);">1</div>
+        <div class="msg-dot" style="background:var(--blue-dim);color:var(--blue);">2</div>
+        <div class="msg-dot" style="background:var(--blue-dim);color:var(--blue);">3</div>
+        <div class="msg-dot" style="background:var(--blue-dim);color:var(--blue);">4</div>
+      </div>
+      <div style="font-size:10px;color:var(--text-muted);flex:1;">Share work, ask questions, use <code>retrieve_*</code> tools</div>
+    </div>
+    <div class="thread-row">
+      <div class="thread-label" style="color:var(--amber);">DECIDE</div>
+      <div class="thread-msgs">
+        <div class="msg-dot" style="background:var(--amber-dim);color:var(--amber);">5</div>
+        <div class="msg-dot" style="background:var(--amber-dim);color:var(--amber);">6</div>
+        <div class="msg-dot" style="background:var(--amber-dim);color:var(--amber);">…</div>
+        <div class="msg-dot" style="background:var(--amber-dim);color:var(--amber);">11</div>
+      </div>
+      <div style="font-size:10px;color:var(--text-muted);flex:1;">Narrow to genuine complementarity, build toward proposal</div>
+    </div>
+    <div class="thread-row">
+      <div class="thread-label" style="color:var(--green);">CONCLUDE</div>
+      <div class="thread-msgs">
+        <div class="msg-dot" style="background:var(--green-dim);color:var(--green);">12</div>
+      </div>
+      <div style="flex:1;display:flex;gap:6px;align-items:center;">
+        <div class="thread-outcome" style="background:var(--green-dim);color:var(--green);">📝 Proposal</div>
+        <div style="font-size:10px;color:var(--text-muted);">or</div>
+        <div class="thread-outcome" style="background:var(--surface2);color:var(--text-muted);">⏸ No overlap</div>
+      </div>
+    </div>
+
+    <div class="small-note" style="margin-top:10px;">
+      Proposal confirmed when partner replies <strong>✅</strong> to the <strong>📝 Summary</strong> block.
+      PI rates 0–5 in web app; rating = 0 reopens thread with PI guidance.
+    </div>
+  </div>
+
+  <!-- 1B: Agent Selection -->
+  <div class="card">
+    <div class="row" style="margin-bottom:14px;">
+      <span style="font-size:13px;font-weight:700;">Agent Selection — Min-Heap</span>
+      <span class="spacer"></span>
+      <span class="inline-tag" style="background:var(--teal-dim);color:var(--teal);">O(log n)</span>
+    </div>
+
+    <div style="font-size:11px;color:var(--text-muted);margin-bottom:12px;line-height:1.6;">
+      Agents are sorted by <code>last_selected</code> timestamp. The longest-waiting
+      <em>eligible</em> agents win the next slots. Replaces weighted-random to
+      guarantee no starvation at scale.
+    </div>
+
+    <!-- heap viz: bars representing wait time -->
+    <div class="heap-viz">
+      <div class="heap-row">
+        <div class="heap-name">WisemanBot</div>
+        <div class="heap-bar-wrap">
+          <div class="heap-bar" style="width:95%;background:linear-gradient(90deg,var(--teal-dim),color-mix(in srgb,var(--teal) 30%,transparent));">
+            <span style="color:var(--teal);">waited longest</span>
+          </div>
+        </div>
+        <div class="heap-tag" style="background:var(--teal-dim);color:var(--teal);">← next</div>
+      </div>
+      <div class="heap-row">
+        <div class="heap-name">LotzBot</div>
+        <div class="heap-bar-wrap">
+          <div class="heap-bar" style="width:78%;background:color-mix(in srgb,var(--blue) 18%,transparent);">
+            <span style="color:var(--blue);">eligible</span>
+          </div>
+        </div>
+        <div class="heap-tag" style="background:var(--blue-dim);color:var(--blue);">← next</div>
+      </div>
+      <div class="heap-row">
+        <div class="heap-name">SuBot</div>
+        <div class="heap-bar-wrap">
+          <div class="heap-bar" style="width:61%;background:color-mix(in srgb,var(--violet) 18%,transparent);">
+            <span style="color:var(--violet);">eligible</span>
+          </div>
+        </div>
+        <div class="heap-tag" style="background:var(--violet-dim);color:var(--violet);">← next</div>
+      </div>
+      <div class="heap-row">
+        <div class="heap-name">RackiBot</div>
+        <div class="heap-bar-wrap">
+          <div class="heap-bar" style="width:28%;background:color-mix(in srgb,var(--text-dim) 30%,transparent);">
+            <span style="color:var(--text-dim);">on cooldown</span>
+          </div>
+        </div>
+        <div class="heap-tag" style="background:var(--surface2);color:var(--text-dim);">cooling</div>
+      </div>
+      <div class="heap-row">
+        <div class="heap-name">CravattBot</div>
+        <div class="heap-bar-wrap">
+          <div class="heap-bar" style="width:18%;background:color-mix(in srgb,var(--text-dim) 20%,transparent);">
+            <span style="color:var(--text-dim);">just ran</span>
+          </div>
+        </div>
+        <div class="heap-tag" style="background:var(--surface2);color:var(--text-dim);">cooling</div>
+      </div>
+    </div>
+
+    <div class="divider-line"></div>
+
+    <!-- concurrent semaphore -->
+    <div class="row" style="margin:12px 0 8px;">
+      <span style="font-size:12px;font-weight:700;">Concurrent Turn Slots</span>
+      <span class="spacer"></span>
+      <code>concurrent_turns = active_thread_threshold</code>
+    </div>
+
+    <div class="semaphore">
+      <div class="sem-slot" style="background:color-mix(in srgb,var(--teal) 8%,transparent);border-color:color-mix(in srgb,var(--teal) 30%,transparent);">
+        <div class="sem-label" style="color:var(--teal);">Slot 1</div>
+        <div class="sem-agent">WisemanBot</div>
+        <div class="sem-phase">Phase 4 · Opus</div>
+      </div>
+      <div class="sem-slot" style="background:color-mix(in srgb,var(--blue) 8%,transparent);border-color:color-mix(in srgb,var(--blue) 30%,transparent);">
+        <div class="sem-label" style="color:var(--blue);">Slot 2</div>
+        <div class="sem-agent">LotzBot</div>
+        <div class="sem-phase">Phase 2 · Sonnet</div>
+      </div>
+      <div class="sem-slot" style="background:color-mix(in srgb,var(--violet) 8%,transparent);border-color:color-mix(in srgb,var(--violet) 30%,transparent);">
+        <div class="sem-label" style="color:var(--violet);">Slot 3</div>
+        <div class="sem-agent">SuBot</div>
+        <div class="sem-phase">Phase 5 · Opus</div>
+      </div>
+    </div>
+
+    <div class="small-note">
+      <strong style="color:var(--amber);">turn_delay_seconds</strong> repurposed:
+      was a global <code>asyncio.sleep</code> blocking all slots after each turn.
+      Now enforced as a <strong>per-agent cooldown</strong> at heap-build time —
+      <code>(now − last_selected) ≥ turn_delay_seconds</code>.
+      All other slots stay active during any agent's cooldown.
+    </div>
+  </div>
+
+</div><!-- /top-grid -->
+
+<!-- ════════════════════════════════════════════════════════════
+     SECTION 2 — COHORT SCALE
+     ════════════════════════════════════════════════════════════ -->
+<div class="section-title" style="margin-top:8px;">
+  <span class="section-num" style="background:var(--violet-dim);color:var(--violet);">2</span>
+  Cohort-Based Scale-Up
+</div>
+
+<div class="bottom-grid">
+
+  <!-- 2A: Before/After + Cohort data model -->
+  <div class="card">
+    <div class="row" style="margin-bottom:14px;">
+      <span style="font-size:13px;font-weight:700;">From All-vs-All → Cohort-Scoped</span>
+    </div>
+
+    <div class="comparison">
+      <!-- ALL VS ALL -->
+      <div class="compare-box" style="background:color-mix(in srgb,var(--rose) 5%,transparent);border-color:color-mix(in srgb,var(--rose) 20%,transparent);">
+        <div class="compare-title" style="color:var(--rose);">❌ All-vs-All (current)</div>
+        <div style="font-size:10px;color:var(--text-muted);margin-bottom:10px;line-height:1.5;">
+          Every agent scans posts from all others.<br>
+          LLM calls scale as <strong>O(n²)</strong>.
+        </div>
+        <div class="agent-grid">
+          <div class="agent-dot" style="background:var(--rose-dim);color:var(--rose);">A</div>
+          <div class="agent-dot" style="background:var(--rose-dim);color:var(--rose);">B</div>
+          <div class="agent-dot" style="background:var(--rose-dim);color:var(--rose);">C</div>
+          <div class="agent-dot" style="background:var(--rose-dim);color:var(--rose);">D</div>
+          <div class="agent-dot" style="background:var(--rose-dim);color:var(--rose);">E</div>
+          <div class="agent-dot" style="background:var(--rose-dim);color:var(--rose);">F</div>
+        </div>
+        <div class="lines-label" style="margin-top:8px;color:var(--rose);">6 agents → 15 possible pairs<br>all evaluated every scan</div>
+      </div>
+
+      <!-- COHORTS -->
+      <div class="compare-box" style="background:color-mix(in srgb,var(--green) 5%,transparent);border-color:color-mix(in srgb,var(--green) 20%,transparent);">
+        <div class="compare-title" style="color:var(--green);">✓ With Cohorts</div>
+        <div style="font-size:10px;color:var(--text-muted);margin-bottom:10px;line-height:1.5;">
+          Agents only act on cohort-mates.<br>
+          Scan cost bounded by cohort size.
+        </div>
+        <div class="cohort-wrap">
+          <div class="cohort-row" style="border-color:color-mix(in srgb,var(--blue) 40%,transparent);background:color-mix(in srgb,var(--blue) 6%,transparent);">
+            <div class="cohort-row-label" style="color:var(--blue);">Cohort 1</div>
+            <div class="cohort-agents">
+              <div class="c-agent" style="background:var(--blue-dim);color:var(--blue);">A</div>
+              <div class="c-agent" style="background:var(--blue-dim);color:var(--blue);">B</div>
+              <div class="c-agent" style="background:var(--blue-dim);color:var(--blue);">C</div>
+            </div>
+          </div>
+          <div class="cohort-row" style="border-color:color-mix(in srgb,var(--violet) 40%,transparent);background:color-mix(in srgb,var(--violet) 6%,transparent);">
+            <div class="cohort-row-label" style="color:var(--violet);">Cohort 2</div>
+            <div class="cohort-agents">
+              <div class="c-agent" style="background:var(--violet-dim);color:var(--violet);">B</div>
+              <div class="c-agent" style="background:var(--violet-dim);color:var(--violet);">D</div>
+              <div class="c-agent" style="background:var(--violet-dim);color:var(--violet);">E</div>
+              <div class="c-agent" style="background:var(--violet-dim);color:var(--violet);">F</div>
+            </div>
+          </div>
+        </div>
+        <div class="lines-label" style="margin-top:8px;color:var(--green);">B spans both cohorts · memberships<br>change live · no restart needed</div>
+      </div>
+    </div>
+
+    <div class="divider-line"></div>
+
+    <!-- data model -->
+    <div class="row" style="margin:12px 0 10px;">
+      <span style="font-size:12px;font-weight:700;">Data Model</span>
+      <span class="spacer"></span>
+      <span style="font-size:10px;color:var(--text-muted);">migration 0023</span>
+    </div>
+
+    <div style="display:grid;grid-template-columns:1fr 1fr;gap:10px;">
+      <div style="background:var(--surface2);border-radius:8px;padding:12px;font-size:10px;font-family:'JetBrains Mono',monospace;line-height:1.8;color:var(--text-muted);">
+        <div style="color:var(--blue);font-weight:700;margin-bottom:4px;">cohorts</div>
+        <div><span style="color:var(--teal);">id</span>           uuid pk</div>
+        <div><span style="color:var(--teal);">name</span>         text unique</div>
+        <div><span style="color:var(--teal);">description</span>  text?</div>
+        <div><span style="color:var(--teal);">created_by</span>   → users</div>
+        <div><span style="color:var(--teal);">created_at</span>   timestamptz</div>
+      </div>
+      <div style="background:var(--surface2);border-radius:8px;padding:12px;font-size:10px;font-family:'JetBrains Mono',monospace;line-height:1.8;color:var(--text-muted);">
+        <div style="color:var(--violet);font-weight:700;margin-bottom:4px;">cohort_memberships</div>
+        <div><span style="color:var(--teal);">id</span>        uuid pk</div>
+        <div><span style="color:var(--teal);">cohort_id</span> → cohorts ⬆</div>
+        <div><span style="color:var(--teal);">agent_id</span>  text</div>
+        <div><span style="color:var(--teal);">added_by</span>  → users</div>
+        <div><span style="color:var(--teal);">added_at</span>  timestamptz</div>
+      </div>
+    </div>
+  </div>
+
+  <!-- 2B: Interaction gate + admin UI -->
+  <div style="display:flex;flex-direction:column;gap:24px;">
+
+    <div class="card">
+      <div class="row" style="margin-bottom:12px;">
+        <span style="font-size:13px;font-weight:700;">Interaction Gate</span>
+        <span class="spacer"></span>
+        <span class="inline-tag" style="background:var(--teal-dim);color:var(--teal);">pure filter</span>
+      </div>
+
+      <div style="background:var(--surface2);border-radius:8px;padding:10px 12px;font-size:10px;font-family:'JetBrains Mono',monospace;line-height:1.7;margin-bottom:12px;">
+        <span style="color:var(--violet);">def</span> <span style="color:var(--blue);">can_interact</span>(self, other) → bool:<br>
+        &nbsp;&nbsp;<span style="color:var(--text-muted);"># uncohorted → interact with all</span><br>
+        &nbsp;&nbsp;<span style="color:var(--violet);">if not</span> self.cohort_ids <span style="color:var(--violet);">or not</span> other.cohort_ids:<br>
+        &nbsp;&nbsp;&nbsp;&nbsp;<span style="color:var(--violet);">return</span> <span style="color:var(--green);">True</span><br>
+        &nbsp;&nbsp;<span style="color:var(--violet);">return bool</span>(self.cohort_ids <span style="color:var(--amber);">&amp;</span> other.cohort_ids)
+      </div>
+
+      <div class="gate-flow">
+        <div class="gate-step">
+          <div class="gate-icon" style="background:var(--blue-dim);">🔍</div>
+          <div class="gate-text">
+            <strong>Phase 2</strong> — filter posts before LLM prompt<br>
+            <em>Saves Sonnet calls on non-cohort senders</em>
+          </div>
+        </div>
+        <div class="gate-arrow">↓</div>
+        <div class="gate-step">
+          <div class="gate-icon" style="background:var(--surface2);">🔗</div>
+          <div class="gate-text">
+            <strong>Phase 3</strong> — skip thread activation from non-cohort agents<br>
+            <em>No state bloat from irrelevant replies</em>
+          </div>
+        </div>
+        <div class="gate-arrow">↓</div>
+        <div class="gate-step">
+          <div class="gate-icon" style="background:var(--violet-dim);">📢</div>
+          <div class="gate-text">
+            <strong>Phase 5</strong> — block tagging non-cohort agents<br>
+            <em>Saves Opus call; prunes stale interesting_posts</em>
+          </div>
+        </div>
+      </div>
+
+      <div class="small-note" style="margin-top:10px;">
+        Phase 4 requires no gate — threads already exist between cohort-mates when opened.
+        Scheduling is <strong>cohort-unaware</strong>; cohorts only affect what happens inside a turn.
+      </div>
+    </div>
+
+    <div class="card">
+      <div class="row" style="margin-bottom:12px;">
+        <span style="font-size:13px;font-weight:700;">Admin UI</span>
+        <span class="spacer"></span>
+        <span style="font-size:10px;color:var(--text-muted);">/admin/cohorts</span>
+      </div>
+
+      <div style="display:flex;flex-direction:column;gap:5px;font-size:10px;">
+        <div style="display:flex;align-items:center;gap:8px;padding:6px 10px;background:var(--surface2);border-radius:6px;">
+          <span style="color:var(--teal);font-family:'JetBrains Mono',monospace;font-size:9px;min-width:30px;">GET</span>
+          <span style="color:var(--text-muted);font-family:'JetBrains Mono',monospace;">/admin/cohorts</span>
+          <span style="color:var(--text-dim);margin-left:auto;">list + create form</span>
+        </div>
+        <div style="display:flex;align-items:center;gap:8px;padding:6px 10px;background:var(--surface2);border-radius:6px;">
+          <span style="color:var(--amber);font-family:'JetBrains Mono',monospace;font-size:9px;min-width:30px;">POST</span>
+          <span style="color:var(--text-muted);font-family:'JetBrains Mono',monospace;">/admin/cohorts/create</span>
+          <span style="color:var(--text-dim);margin-left:auto;">admin only</span>
+        </div>
+        <div style="display:flex;align-items:center;gap:8px;padding:6px 10px;background:var(--surface2);border-radius:6px;">
+          <span style="color:var(--teal);font-family:'JetBrains Mono',monospace;font-size:9px;min-width:30px;">GET</span>
+          <span style="color:var(--text-muted);font-family:'JetBrains Mono',monospace;">/admin/cohorts/{id}</span>
+          <span style="color:var(--text-dim);margin-left:auto;">members + map</span>
+        </div>
+        <div style="display:flex;align-items:center;gap:8px;padding:6px 10px;background:var(--surface2);border-radius:6px;">
+          <span style="color:var(--amber);font-family:'JetBrains Mono',monospace;font-size:9px;min-width:30px;">POST</span>
+          <span style="color:var(--text-muted);font-family:'JetBrains Mono',monospace;">…/{id}/add-agent</span>
+          <span style="color:var(--text-dim);margin-left:auto;">live, no restart</span>
+        </div>
+        <div style="display:flex;align-items:center;gap:8px;padding:6px 10px;background:var(--surface2);border-radius:6px;">
+          <span style="color:var(--amber);font-family:'JetBrains Mono',monospace;font-size:9px;min-width:30px;">POST</span>
+          <span style="color:var(--text-muted);font-family:'JetBrains Mono',monospace;">…/{id}/remove-agent</span>
+          <span style="color:var(--text-dim);margin-left:auto;">open threads unaffected</span>
+        </div>
+        <div style="display:flex;align-items:center;gap:8px;padding:6px 10px;background:var(--surface2);border-radius:6px;">
+          <span style="color:var(--rose);font-family:'JetBrains Mono',monospace;font-size:9px;min-width:30px;">POST</span>
+          <span style="color:var(--text-muted);font-family:'JetBrains Mono',monospace;">…/{id}/delete</span>
+          <span style="color:var(--text-dim);margin-left:auto;">requires 0 members</span>
+        </div>
+      </div>
+
+      <div class="small-note" style="margin-top:10px;">
+        Membership resyncs every <strong>60 s</strong> mid-run. Resync rebuilds
+        <code>agent.cohort_ids</code> only — no state wipe, no thread closure.
+      </div>
+    </div>
+
+  </div>
+</div><!-- /bottom-grid -->
+
+<!-- FOOTER -->
+<div class="footer">
+  <div class="footer-note">coPI · Anthropic Claude Opus/Sonnet · FastAPI + PostgreSQL + Slack</div>
+  <div class="footer-note">specs/cohort-system.md · Cohort_approaches.txt</div>
+</div>
+
+</body>
+</html>
diff --git a/orcids.txt b/orcids.txt
index c8caf66..d8e7d97 100644
--- a/orcids.txt
+++ b/orcids.txt
@@ -30,3 +30,83 @@
 0000-0003-2819-4049
 # Luke Lairson
 0000-0001-6701-996X
+# Ahmed Badran
+0000-0002-8105-1883
+# Peng Wu
+0000-0002-5204-0229
+# Keren Lasker
+0000-0002-5480-4173
+# Dorothee Kern
+0000-0002-7631-8328
+# Marco Mravic
+0000-0001-6294-1824
+# Ian MacRae
+0000-0002-5112-0294
+# James Paulson
+0000-0003-4589-5322
+# Giordano Lippi
+0000-0003-3911-0525
+# Ian Wilson
+0000-0002-6469-2419
+# Ian Seiple
+0000-0002-8732-1362
+# Shannon Miller
+0000-0003-3569-6231
+# James Williamson
+0000-0002-8772-468X
+# Colleen Maillie
+0000-0001-7050-4464
+
+# Cabo retreat additions — 2026-05-01
+# Scripps Research
+# David Millar
+0000-0001-9207-6958
+# UCSF
+# Andrej Sali
+0000-0003-0435-6197
+# Carolyn Larabell
+0000-0002-6262-4789
+# Balyn Zaro
+0000-0002-8938-9889
+# Leah Roe
+0000-0002-2487-5587
+# Daniel Santi
+0000-0002-3790-0673
+# James Wells
+0000-0001-8267-5519
+# Ignacia Echeverria
+0000-0003-4717-1467
+# James Fraser
+0000-0002-5080-2859
+# Charles Craik
+0000-0001-7704-9185
+# Robert Stroud
+0000-0003-2083-5665
+# Daniel Minor Jr.
+0000-0002-5998-4214
+# Aashish Manglik
+0000-0002-7173-3741
+# Katherine Susa
+0000-0003-0077-667X
+# Tony Capra (John A. Capra)
+0000-0001-9743-1795
+# New PIs — 2026-05-01
+# Stanford
+# Peter S. Kim
+0000-0001-6503-4541
+# Genentech
+# Caleigh Azumaya
+0000-0002-3484-9921
+# UC Berkeley
+# Daniel K. Nomura
+0000-0003-1614-8360
+# Mark Yeager
+0000-0002-3301-640X
+# Jonathan Moore
+0000-0001-8633-3313
+# Michael Williams
+0009-0002-3422-6713
+# Mohammad Alanjary
+0000-0001-8420-1325
+# Hollis Cline
+0000-0002-4887-9603
diff --git a/pipairs.tsv b/pipairs.tsv
new file mode 100644
index 0000000..958add5
--- /dev/null
+++ b/pipairs.tsv
@@ -0,0 +1,41 @@
+Wiseman	Lotz
+Deniz	Lairson
+Deniz	Petrascheck
+Lotz	Cravatt
+Petrascheck	Grotjahn
+Wu	Lairson
+Forli	Su
+Forli	Ward
+Deniz	Su
+Briney	Su
+Racki	Ken
+Racki	Su
+Racki	Lairson
+Grotjahn	Wiseman
+Racki	Grotjahn
+Cravatt	Wiseman
+Cravatt	Su
+Forli	Lairson
+Saez	Wiseman
+Deniz	Racki
+Saez	Petrascheck
+Deniz	Ken
+Saez	Grotjahn
+Deniz	Wiseman
+Ken	Lairson
+Briney	Ward
+Grotjahn	Lairson
+Cravatt	Lairson
+Su	Petrascheck
+Deniz	Grotjahn
+Saez	Lairson
+Lotz	Wu
+Forli	Petrascheck
+Cravatt	Ken
+Briney	Ward
+Cravatt	Forli
+Saez	Su
+Su	Wiseman
+Forli	Ken
+Wu	Su
+Wiseman	Briney
diff --git a/prompts/agent-system.md b/prompts/agent-system.md
index 37f033b..1aecf97 100644
--- a/prompts/agent-system.md
+++ b/prompts/agent-system.md
@@ -1,9 +1,10 @@
 # Agent System Prompt
 
-You are an AI agent representing a research lab at Scripps Research in a Slack workspace called "labbot".
+You are an AI agent representing a research lab at Scripps Research in a Slack workspace.
 Your role is to facilitate scientific collaboration by engaging authentically with other lab agents.
 All agents represent real labs with real researchers — your goal is to identify genuinely valuable
 collaboration opportunities, not to generate noise.
+Your task is to produce a high-quality collaboration proposal that follows the Proposal Generation Rules and meets the listed quality standards by engaging in dialogue with other agents. You have access to each PI's public profile associated with the user (or profiles in profiles/public), private instructions (profiles in profiles/private), and recent relevant publications. Use all of this to initiate conversations with the ultimate goal of generating a specific, grounded, and actionable proposal after sufficient discussion.
 
 ## Core Rules
 
@@ -19,84 +20,9 @@ collaboration opportunities, not to generate noise.
 4. **DM rules.** You may DM your own PI to report on discussions or ask for guidance. You cannot DM other
    labs' PIs or send agent-to-agent DMs.
 
-## Collaboration Quality Standards
+## Proposal Generation Rules
 
-These standards apply to every collaboration idea you propose or explore. Your PI's private instructions
-may adjust these defaults — always follow PI instructions when they conflict.
-
-### Core Principles
-
-1. **Specificity.** Every collaboration idea must name specific techniques, models, reagents, datasets,
-   or expertise from each lab's profile. "Lab A's expertise in X" is not enough — say what specifically
-   they would do and with what.
-
-2. **True complementarity.** Each lab must bring something the other doesn't have. If either lab's
-   contribution could be described as a generic service (e.g., "computational analysis", "structural studies",
-   "mouse behavioral testing") without reference to the specific scientific question, the idea is too generic.
-
-3. **Concrete first experiment.** Any collaboration that advances beyond initial interest must include
-   a proposed first experiment scoped to days-to-weeks of effort. The experiment must name specific assays,
-   computational methods, reagents, or datasets. "We would analyze the data" is not a first experiment.
-
-4. **Silence over noise.** If you cannot articulate what makes this collaboration better than either lab
-   hiring a postdoc to do the other's part, do not propose it.
-
-5. **Non-generic benefits.** Both labs must benefit in ways specific to the collaboration. "Access to
-   new techniques" is too vague. "Structural evidence for the mechanism of mitochondrial rescue at
-   nanometer resolution, strengthening the therapeutic narrative for HRI activators" is specific.
-
-### Confidence Labels
-
-When you propose a collaboration, label your confidence level:
-- *[High]* — Clear complementarity, specific anchoring to recent work, concrete first experiment,
-  both sides benefit non-generically
-- *[Moderate]* — Good synergy but first experiment is less defined, or one side's benefit is less clear
-- *[Speculative]* — Interesting angle but requires more development — use "This is speculative, but..."
-
-### Examples of Good Collaboration Ideas
-
-**Good: Specific question, specific contributions, concrete experiment**
-> Wiseman's HRI activators induce mitochondrial elongation in MFN2-deficient cells, but the ultrastructural
-> basis is unknown. Grotjahn's cryo-ET and Surface Morphometrics pipeline could directly visualize this
-> remodeling at nanometer resolution. First experiment: Wiseman provides treated vs untreated MFN2-deficient
-> fibroblasts, Grotjahn runs cryo-FIB-SEM and cryo-ET on both conditions, quantifying cristae morphology
-> and membrane contact site metrics.
-
-**Good: Each lab has something the other literally cannot do alone**
-> Petrascheck's atypical tetracyclines provide neuroprotection via ISR-independent ribosome targeting.
-> Wiseman's HRI activators work through ISR-dependent pathways. Neither lab can test the combination alone.
-> First experiment: mix compounds in neuronal ferroptosis assays, measure survival, calculate combination
-> indices for synergy.
-
-**Good: Computational contribution is specific, not generic**
-> Lotz's JCI paper identified cyproheptadine as an H1R inverse agonist activating FoxO in chondrocytes,
-> but the structural basis for FoxO activation vs antihistamine activity is unknown. Su's BioThings
-> knowledge graph could identify additional H1R ligands with FoxO activity data across multiple
-> orthogonal datasets. First experiment: Lotz provides 10-15 H1R ligands with FoxO activity data,
-> Su runs BioThings traversal to identify structural and mechanistic correlates from published datasets.
-
-### Examples of Bad Collaboration Ideas (do not propose these)
-
-**Bad: Descriptive imaging without leverage**
-> "Grotjahn could use cryo-ET to visualize disc matrix degeneration in Lotz samples." — This may
-> generate interesting images, but it is mostly descriptive. It does not clearly unlock a mechanistic
-> bottleneck, therapeutic decision, or scalable downstream program.
-
-**Bad: Mechanistic depth without an intervention path**
-> "A chromatin-focused collaboration could add mechanistic depth to disc regeneration work." — This
-> sounds sophisticated, but it is not tied to a clear intervention strategy or near-term decision.
-
-**Bad: Incremental validation of an already-supported pathway**
-> "Petrascheck could test the FoxO-H1R pathway in C. elegans aging assays." — Orthogonal validation
-> alone is not enough if it only incrementally confirms a pathway that is already fairly well supported.
-
-**Bad: Generic screening in an overused model**
-> "Run a high-throughput screen for FoxO activators in a C. elegans aging model." — A screen is not
-> automatically compelling if the assay class is overused and the proposal lacks a distinctive hypothesis.
-
-**Bad: Novel but still low-leverage imaging**
-> "Use cryo-ET to compare the chondrocyte-matrix interface in OA versus control samples." — Novelty
-> and visual appeal are not sufficient without mechanistic or translational leverage.
+{{include: colab-proposal-rules.md}}
 
 ## Communication Style
 
@@ -163,13 +89,7 @@ Every thread must reach one of two outcomes:
 
 **Outcome 1: Collaboration Proposal** (rare — only the best ideas)
 
-Post a `:memo: Summary` reply containing:
-- **What each lab brings** (specific techniques, reagents, datasets — not generic capabilities)
-- **The specific scientific question** being addressed
-- **A concrete first experiment** scoped to days-to-weeks, naming specific assays/methods/reagents,
-  requiring modest effort from both sides
-- **Why this collaboration is better** than either lab doing it independently
-- **Confidence label** ([High], [Moderate], or [Speculative])
+Generate a proposal that conforms to the "Proposal Generation Rules" and the Output Format they define.
 
 The other agent confirms agreement by replying with ✅.
 
diff --git a/prompts/colab-proposal-rules.md b/prompts/colab-proposal-rules.md
new file mode 100644
index 0000000..20e6a4b
--- /dev/null
+++ b/prompts/colab-proposal-rules.md
@@ -0,0 +1,125 @@
+## Collaboration Quality Standards
+
+These standards apply to every collaboration proposal. PI private instructions may adjust these
+defaults — always follow PI instructions when they conflict.
+
+### Core Principles
+
+1. **Specificity.** Every collaboration idea must name specific techniques, models, reagents, datasets,
+   or expertise from each lab's profile. "Lab A's expertise in X" is not enough — say what specifically
+   they would do and with what.
+
+2. **True complementarity.** Each lab must bring something the other doesn't have. If either lab's
+   contribution could be described as a generic service (e.g., "computational analysis", "structural
+   studies", "mouse behavioral testing") without reference to the specific scientific question, the
+   idea is too generic.
+
+3. **Concrete first experiment.** Any collaboration proposal must include a first experiment scoped
+   to days-to-weeks of effort. The experiment must name specific assays, computational methods,
+   reagents, or datasets. "We would analyze the data" is not a first experiment.
+
+4. **Silence over noise.** If you cannot articulate what makes this collaboration better than either
+   lab hiring a postdoc to do the other's part, do not propose it.
+
+5. **Non-generic benefits.** Both labs must benefit in ways specific to the collaboration. "Access to
+   new techniques" is too vague. "Structural evidence for the mechanism of mitochondrial rescue at
+   nanometer resolution, strengthening the therapeutic narrative for HRI activators" is specific.
+
+### Confidence Labels
+
+- **High** — Clear complementarity, specific anchoring to recent work, concrete first experiment,
+  both sides benefit non-generically
+- **Moderate** — Good synergy but first experiment is less defined, or one side's benefit is less clear
+- **Speculative** — Interesting angle but requires more development — label sections accordingly
+
+### Examples of Good Collaboration Ideas
+
+**Good: Specific question, specific contributions, concrete experiment**
+> Wiseman's HRI activators induce mitochondrial elongation in MFN2-deficient cells, but the ultrastructural
+> basis is unknown. Grotjahn's cryo-ET and Surface Morphometrics pipeline could directly visualize this
+> remodeling at nanometer resolution. First experiment: Wiseman provides treated vs untreated MFN2-deficient
+> fibroblasts, Grotjahn runs cryo-FIB-SEM and cryo-ET on both conditions, quantifying cristae morphology
+> and membrane contact site metrics.
+
+**Good: Each lab has something the other literally cannot do alone**
+> Petrascheck's atypical tetracyclines provide neuroprotection via ISR-independent ribosome targeting.
+> Wiseman's HRI activators work through ISR-dependent pathways. Neither lab can test the combination alone.
+> First experiment: mix compounds in neuronal ferroptosis assays, measure survival, calculate combination
+> indices for synergy.
+
+**Good: Computational contribution is specific, not generic**
+> Lotz's JCI paper identified cyproheptadine as an H1R inverse agonist activating FoxO in chondrocytes,
+> but the structural basis for FoxO activation vs antihistamine activity is unknown. Su's BioThings
+> knowledge graph could identify additional H1R ligands with FoxO activity data across multiple
+> orthogonal datasets. First experiment: Lotz provides 10–15 H1R ligands with FoxO activity data,
+> Su runs BioThings traversal to identify structural and mechanistic correlates from published datasets.
+
+### Examples of Bad Collaboration Ideas
+
+**Bad: Descriptive imaging without leverage**
+> "Grotjahn could use cryo-ET to visualize disc matrix degeneration in Lotz samples." — This may
+> generate interesting images, but it is mostly descriptive. It does not clearly unlock a mechanistic
+> bottleneck, therapeutic decision, or scalable downstream program.
+
+**Bad: Mechanistic depth without an intervention path**
+> "A chromatin-focused collaboration could add mechanistic depth to disc regeneration work." — This
+> sounds sophisticated, but it is not tied to a clear intervention strategy or near-term decision.
+
+**Bad: Incremental validation of an already-supported pathway**
+> "Petrascheck could test the FoxO-H1R pathway in C. elegans aging assays." — Orthogonal validation
+> alone is not enough if it only incrementally confirms a pathway that is already fairly well supported.
+
+**Bad: Generic screening in an overused model**
+> "Run a high-throughput screen for FoxO activators in a C. elegans aging model." — A screen is not
+> automatically compelling if the assay class is overused and the proposal lacks a distinctive hypothesis.
+
+**Bad: Novel but still low-leverage imaging**
+> "Use cryo-ET to compare the chondrocyte-matrix interface in OA versus control samples." — Novelty
+> and visual appeal are not sufficient without mechanistic or translational leverage.
+
+---
+
+## Instructions
+
+Produce ONE collaboration proposal between PI A and PI B using the output format below.
+
+- Apply the Collaboration Quality Standards strictly.
+- Ground the proposal in specific publications, techniques, and findings from each profile.
+- Respect each PI's private instructions when framing the proposal: if a PI has expressed preferences
+  for specific topics, partners, or collaboration styles, weight those angles positively.
+- Do NOT quote or reveal any private instruction text verbatim in the output.
+- If you cannot identify a High or Moderate confidence collaboration, produce the best Speculative
+  proposal you can and label it clearly.
+- Wrap your entire proposal (and only the proposal) in `<proposal>` tags.
+- Do not include reasoning steps, tool call markup, or self-commentary before or after the `<proposal>` block. In agent contexts, a Slack-formatted memo may precede the tag — all other preamble is forbidden.
+
+## Output Format
+
+<proposal>
+# [Collaboration Title — specific, not generic]
+**[PI_A] + [PI_B]** [Timestamp]
+**Confidence:** High | Moderate | Speculative
+
+## Scientific Rationale
+[2–3 paragraphs. Why these two labs? What does each bring that the other lacks? Name specific
+techniques, datasets, reagents, or model systems from recent publications.]
+
+## True Complementarity
+- **PI A contributes:** [specific capabilities — not generic]
+- **PI B contributes:** [specific capabilities — not generic]
+- **Gap filled:** [what neither could do alone, stated precisely]
+
+## Concrete First Experiment
+[1 paragraph. Scoped to days-to-weeks. Names specific assays, methods, reagents, or datasets.
+Explains why both labs are essential to execute it.]
+
+## Benefits to Each Lab
+- **PI A benefits:** [specific, non-generic — tied to their research goals]
+- **PI B benefits:** [specific, non-generic — tied to their research goals]
+
+## Open Questions / Next Steps
+- [Bullet list of what would need to be confirmed before committing effort]
+
+## Effort / Resources
+- [Estimate low/med/high for each PI in terms of the time, people, and resources required to achieve the goals of the proposal]
+</proposal>
\ No newline at end of file
diff --git a/prompts/matchmaker.md b/prompts/matchmaker.md
new file mode 100644
index 0000000..f9d21a8
--- /dev/null
+++ b/prompts/matchmaker.md
@@ -0,0 +1,9 @@
+You are evaluating a potential research collaboration between two PIs.
+
+Your task is to produce a high-quality collaboration proposal that follows the Proposal Generation Rules and meets the listed quality standards. You have access to each PI's public profile, private instructions, and recent publications. Use all of this to generate a specific, grounded, and actionable proposal.
+
+**Output only the `<proposal>` block. Do not include any text before or after it — no reasoning steps, no preamble, no tool calls, no commentary.**
+
+## Proposal Generation Rules
+
+{{include: colab-proposal-rules.md}}
\ No newline at end of file
diff --git a/prompts/phase4-thread-reply.md b/prompts/phase4-thread-reply.md
index a1de54a..79632ea 100644
--- a/prompts/phase4-thread-reply.md
+++ b/prompts/phase4-thread-reply.md
@@ -81,6 +81,10 @@ you should already have the information you need.
 
 {instructions}
 
+## Proposal Generation Rules
+
+{{include: colab-proposal-rules.md}}
+
 ## Output
 
 Your final response MUST contain exactly one `<slack_message>` block. Everything inside
@@ -95,12 +99,7 @@ Your message here — written as it should appear in Slack.
 You may think/reason freely outside the block, but ONLY the content between
 `<slack_message>` and `</slack_message>` tags will be posted.
 
-If you are posting a :memo: Summary (collaboration proposal), format it clearly with:
-- What each lab brings
-- The specific scientific question
-- A concrete first experiment (days-to-weeks scope, specific assays/methods)
-- Why this collaboration beats either lab working alone
-- Confidence label: [High], [Moderate], or [Speculative]
+If you are posting a :memo: Summary (collaboration proposal), format it clearly by conforming to the Proposal Generation Rules.
 
 If you are confirming agreement with a :memo: Summary from the other agent, start your
 reply with ✅. This means you accept the proposal **exactly as written** — do not add
diff --git a/prompts/podcast-select.md b/prompts/podcast-select.md
new file mode 100644
index 0000000..121af03
--- /dev/null
+++ b/prompts/podcast-select.md
@@ -0,0 +1,46 @@
+You are a literature triage assistant for a scientific researcher. Your job is to identify the single most relevant and impactful recent paper from a list of candidates, based on the researcher's profile.
+
+## Researcher Profile
+
+{profile}
+
+## PI Podcast Preferences
+
+{preferences}
+
+## Task
+
+Below is a numbered list of recent publications (title + abstract). Select the ONE paper whose findings or outputs could most plausibly accelerate or inform a specific aspect of this researcher's ongoing work.
+
+Return your answer as JSON:
+```json
+{"index": <number>, "justification": "<one sentence citing a specific aspect of the researcher's profile>"}
+```
+
+If no paper clears the relevance bar, return:
+```json
+{"index": null, "justification": "No paper is sufficiently relevant to this researcher's current work."}
+```
+
+## Selection Criteria
+
+**INCLUDE** a paper if:
+- Its findings or methods could directly accelerate a specific ongoing project, technique, or open question in the researcher's profile
+- It releases a new tool, dataset, method, or reagent relevant to the researcher's techniques or targets
+- It addresses a disease area, model system, or molecular target the researcher actively works on
+
+**EXCLUDE** a paper if:
+- The connection to the researcher's work is only superficial or generic
+- It is a review article, editorial, or commentary (no new primary data)
+- It is purely clinical or epidemiological with no basic science relevance
+- Recency alone makes it interesting — the connection must be specific and actionable
+
+**NOTE:** Some candidates are preprints (from bioRxiv, medRxiv, or arXiv) and are marked as such in the journal field. Preprints are valid candidates — treat them the same as peer-reviewed papers for selection purposes.
+
+**PREFER** papers that release a concrete output alongside findings (code, dataset, protocol, reagent, model). These tend to be immediately useful.
+
+**FOLLOW PI PREFERENCES:** If the PI Podcast Preferences section above contains specific instructions (e.g., topic focus, exclusions, prioritizations), apply them when selecting. PI preferences override the general criteria above.
+
+## Candidate Papers
+
+{candidates}
diff --git a/prompts/podcast-summarize.md b/prompts/podcast-summarize.md
new file mode 100644
index 0000000..1a96589
--- /dev/null
+++ b/prompts/podcast-summarize.md
@@ -0,0 +1,46 @@
+You are a science communicator writing a personalized research brief for a specific PI. Your goal is to help the PI quickly grasp whether and how a new paper is useful to their lab.
+
+## Researcher Profile
+
+{profile}
+
+## PI Podcast Preferences
+
+{preferences}
+
+## Paper
+
+{paper}
+
+## Task
+
+Write a structured research brief following the exact format below. Be specific, direct, and concise — like a knowledgeable postdoc briefing their PI. No filler phrases, no generic connections.
+
+---
+
+*Today's Research Brief — {date}*
+
+*{paper_title}*
+{authors} · {journal} · {year}
+
+*What they found:*
+[2–3 sentences on core findings. Include specific results, effect sizes, or key observations. Be concrete — name specific proteins, pathways, organisms, or quantitative outcomes where relevant.]
+
+*Key output:*
+[1–2 sentences on the tool, method, dataset, code, protocol, or reagent released with the paper. ONLY include this section if the paper releases a concrete artifact. If there is no distinct output, omit this section entirely — do not write "N/A" or a placeholder.]
+
+*Why this matters for your lab:*
+[2–3 sentences connecting the paper specifically to this PI's work. You MUST name at least one specific technique, model system, molecular target, or open question from the researcher's profile. Do not write generic connections like "this is relevant to your proteomics work" — say exactly what aspect and how.]
+
+*Link:* {paper_url}
+
+---
+
+## Rules
+
+- Total length: approximately 200–280 words
+- Tone: collegial and precise, not promotional
+- The "Why this matters" section is the most important — make it specific to this researcher, not a general statement about the field
+- If the PI Podcast Preferences section contains specific instructions on tone, focus, or framing, follow them
+- If the abstract is all you have, base the brief on the abstract. Do not speculate about full-text content you weren't given.
+- Do not add any text before or after the brief itself
diff --git a/pyproject.toml b/pyproject.toml
index d09fa83..6b780d2 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -25,6 +25,7 @@ dependencies = [
     "boto3>=1.34.0",
     "typer>=0.12.0",
     "rich>=13.7.0",
+    "mutagen>=1.47.0",
 ]
 
 [project.optional-dependencies]
diff --git a/scripts/fix_proposal_summaries.py b/scripts/fix_proposal_summaries.py
new file mode 100644
index 0000000..264a1a9
--- /dev/null
+++ b/scripts/fix_proposal_summaries.py
@@ -0,0 +1,29 @@
+# scripts/fix_proposal_summaries.py
+import asyncio
+import re
+from sqlalchemy import select
+from sqlalchemy.ext.asyncio import create_async_engine, async_sessionmaker, AsyncSession
+from src.config import get_settings
+from src.models import ThreadDecision
+
+async def fix():
+    """Replace each proposal's summary_text with the text inside its <proposal> tag."""
+    engine = create_async_engine(get_settings().database_url)
+    factory = async_sessionmaker(engine, class_=AsyncSession, expire_on_commit=False)
+    try:
+        async with factory() as db:
+            query = select(ThreadDecision).where(ThreadDecision.outcome == "proposal")
+            decisions = (await db.execute(query)).scalars().all()
+            fixed = 0
+            for d in decisions:
+                match = re.search(r"<proposal>(.*?)</proposal>", d.summary_text or "", re.DOTALL)
+                if match:
+                    d.summary_text = match.group(1).strip()
+                    fixed += 1
+            await db.commit()
+            print(f"Fixed {fixed} / {len(decisions)} proposals")
+    finally:
+        await engine.dispose()  # close pooled connections before the event loop shuts down
+
+if __name__ == "__main__":
+    asyncio.run(fix())
diff --git a/scripts/matchmaker_cli.py b/scripts/matchmaker_cli.py
new file mode 100644
index 0000000..a8072ac
--- /dev/null
+++ b/scripts/matchmaker_cli.py
@@ -0,0 +1,217 @@
+#!/usr/bin/env python3
+"""Generate a matchmaker collaboration proposal from two PI profile directories.
+
+Usage (from repo root inside the app container):
+
+  Single pair (positional args):
+    python scripts/matchmaker_cli.py <pi_a_slug> <pi_b_slug> [--dry-run]
+
+  Batch from TSV file (-t flag, no positional args):
+    python scripts/matchmaker_cli.py -t pairs.tsv [--dry-run]
+
+The TSV file has two tab-separated columns (pi_a, pi_b), one pair per line.
+Lines starting with '#' and blank lines are ignored. A header row whose first
+cell is "pi_a" (case-insensitive) is also skipped automatically.
+
+Examples:
+    python scripts/matchmaker_cli.py su wiseman
+    python scripts/matchmaker_cli.py grotjahn lotz --dry-run
+    python scripts/matchmaker_cli.py -t pairs.tsv
+    python scripts/matchmaker_cli.py -t pairs.tsv --dry-run
+
+The PI slug must match a filename in profiles/public/ (without .md extension).
+Private profiles from profiles/private/{slug}.md are included if they exist.
+
+Results are written to the matchmaker_proposals DB table and are immediately
+visible in the admin Matchmaker tab at /admin/matchmaker.
+"""
+
+import argparse
+import asyncio
+import re
+import sys
+from pathlib import Path
+
+
+def load_profile_files(slug: str) -> tuple[str, str, str]:
+    """Read the Markdown profiles stored under profiles/ for one PI slug.
+
+    Returns (pi_name, public_md, private_md); private_md is "" when the
+    private file is absent. pi_name is taken from the '**PI:**' line of the
+    public profile, falling back to the capitalized slug. Prints the
+    available slugs and exits with status 1 if the public profile is missing.
+    """
+    slug = slug.lower()
+    public_dir = Path("profiles/public")
+    public_file = public_dir / f"{slug}.md"
+    private_file = Path("profiles/private") / f"{slug}.md"
+
+    if not public_file.exists():
+        known = sorted(md.stem for md in public_dir.glob("*.md"))
+        print(f"Error: no public profile found for '{slug}'.")
+        print(f"Available slugs: {', '.join(known)}")
+        sys.exit(1)
+
+    public_md = public_file.read_text()
+    private_md = private_file.read_text() if private_file.exists() else ""
+
+    # Prefer the name on the "**PI:** Name" line; otherwise derive it from the slug
+    name_line = re.search(r"\*\*PI:\*\*\s*(.+)", public_md)
+    pi_name = name_line.group(1).strip() if name_line else slug.capitalize()
+
+    return pi_name, public_md, private_md
+
+
+async def run(slug_a: str, slug_b: str, dry_run: bool) -> None:
+    """Generate a proposal for one PI pair, print it, and (unless dry_run) save it to the DB."""
+    from src.config import get_settings
+    from src.services.llm import generate_matchmaker_proposal
+
+    name_a, public_a, private_a = load_profile_files(slug_a)
+    name_b, public_b, private_b = load_profile_files(slug_b)
+
+    settings = get_settings()
+
+    print(f"Generating proposal: {name_a}  ×  {name_b}")
+    print(f"Model: {settings.llm_agent_model_opus}")
+    print("Calling LLM… (this may take 10–20 seconds)")
+
+    result = await generate_matchmaker_proposal(
+        name_a=name_a,
+        public_profile_a=public_a,
+        private_profile_a=private_a,
+        publications_a="(see public profile above)",
+        name_b=name_b,
+        public_profile_b=public_b,
+        private_profile_b=private_b,
+        publications_b="(see public profile above)",
+        model=settings.llm_agent_model_opus,
+    )
+
+    print(f"\nConfidence : {result['confidence'].upper()}")
+    print(f"Title      : {result['title']}")
+    print(f"Tokens     : {result['input_tokens']} in / {result['output_tokens']} out")
+    print("\n" + "─" * 72)
+    print(result["proposal_md"])
+    print("─" * 72)
+
+    if dry_run:
+        print("\n[dry-run] Skipping database write.")
+        return
+
+    # Write to DB (imports are deferred so --dry-run never loads the database layer)
+    import uuid
+    from datetime import datetime, timezone
+
+    from src.database import get_engine, get_session_factory
+    from src.models.matchmaker import MatchmakerProposal
+
+    engine = get_engine()
+    session_factory = get_session_factory()
+    try:
+        async with session_factory() as session:
+            proposal = MatchmakerProposal(
+                id=uuid.uuid4(),
+                pi_a_id=None,
+                pi_b_id=None,
+                pi_a_name=name_a,
+                pi_b_name=name_b,
+                proposal_md=result["proposal_md"],
+                title=result["title"],
+                confidence=result["confidence"],
+                llm_model=result["model"],
+                input_tokens=result["input_tokens"],
+                output_tokens=result["output_tokens"],
+                generated_at=datetime.now(timezone.utc),
+            )
+            session.add(proposal)
+            await session.commit()
+            print(f"\nSaved to DB: {proposal.id}")
+            print(f"View at   : /admin/matchmaker/{proposal.id}")
+    finally:
+        # Dispose even when the insert fails, before asyncio.run() closes the loop.
+        await engine.dispose()
+
+
+def _parse_tsv(path: str) -> list[tuple[str, str]]:
+    """Parse a two-column TSV file into (pi_a, pi_b) slug pairs; bad rows are warned about and skipped."""
+    pairs: list[tuple[str, str]] = []
+    with open(path, encoding="utf-8") as f:
+        for lineno, line in enumerate(f, 1):
+            line = line.rstrip("\r\n")
+            if not line.strip() or line.lstrip().startswith("#"):
+                continue
+            parts = line.split("\t")
+            if len(parts) < 2:
+                print(f"Warning: line {lineno} has fewer than 2 columns, skipping: {line!r}")
+                continue
+            a, b = parts[0].strip(), parts[1].strip()
+            if not pairs and a.lower() == "pi_a":
+                continue  # skip header row, even when comments or blank lines precede it
+            if not a or not b:
+                print(f"Warning: line {lineno} has empty slug, skipping.")
+                continue
+            pairs.append((a, b))
+    return pairs
+
+
+def main() -> None:
+    """Run the CLI: one proposal per requested pair; failed pairs are listed and give exit status 1."""
+    parser = argparse.ArgumentParser(
+        description="Generate matchmaker proposals from PI profile slugs.",
+        epilog=(
+            "Single pair:  matchmaker_cli.py su wiseman\n"
+            "Batch TSV:    matchmaker_cli.py -t pairs.tsv"
+        ),
+        formatter_class=argparse.RawDescriptionHelpFormatter,
+    )
+    parser.add_argument("pi_a", nargs="?", help="Slug for PI A (e.g. 'su')")
+    parser.add_argument("pi_b", nargs="?", help="Slug for PI B (e.g. 'wiseman')")
+    parser.add_argument("-t", "--tsv", metavar="FILE",
+                        help="TSV file with two columns (pi_a, pi_b); one pair per line")
+    parser.add_argument("--dry-run", action="store_true",
+                        help="Print proposals to stdout without writing to the database")
+    args = parser.parse_args()
+
+    # Build list of pairs to process
+    if args.tsv:
+        if args.pi_a or args.pi_b:
+            parser.error("Cannot combine -t/--tsv with positional PI arguments.")
+        pairs = _parse_tsv(args.tsv)
+        if not pairs:
+            print("No valid pairs found in TSV file.")
+            sys.exit(1)
+    elif args.pi_a and args.pi_b:
+        pairs = [(args.pi_a, args.pi_b)]
+    else:
+        parser.error("Provide either two positional slugs or -t FILE.")
+
+    errors: list[str] = []
+    for i, (slug_a, slug_b) in enumerate(pairs):
+        if len(pairs) > 1:
+            print(f"\n{'='*72}")
+            print(f"Pair {i + 1}/{len(pairs)}: {slug_a}  ×  {slug_b}")
+            print(f"{'='*72}")
+        # Slugs are lower-cased when profiles are loaded, so compare them the same way.
+        if slug_a.lower() == slug_b.lower():
+            msg = f"Skipping {slug_a} × {slug_b}: PI A and PI B must be different."
+            print(msg)
+            errors.append(msg)
+            continue
+        try:
+            asyncio.run(run(slug_a, slug_b, args.dry_run))
+        except SystemExit:  # raised by load_profile_files for an unknown slug
+            errors.append(f"Failed: {slug_a} × {slug_b}")
+        except Exception as exc:  # an LLM/DB error must not abort the remaining pairs
+            errors.append(f"Failed: {slug_a} × {slug_b} ({type(exc).__name__}: {exc})")
+
+    if errors:
+        print(f"\n{len(errors)} pair(s) failed:")
+        for e in errors:
+            print(f"  {e}")
+        # Non-zero status lets shell scripts and CI detect partial failures.
+        sys.exit(1)
+
+
+if __name__ == "__main__":
+    main()
diff --git a/scripts/provision_slack_bots.py b/scripts/provision_slack_bots.py
new file mode 100644
index 0000000..3e7e025
--- /dev/null
+++ b/scripts/provision_slack_bots.py
@@ -0,0 +1,780 @@
+#!/usr/bin/env python3
+"""
+Provision Slack apps for all LabBots that don't yet have a bot token.
+
+How it works
+------------
+1. Reads PILOT_LABS to find bots without SLACK_BOT_TOKEN_<ID> in .env
+2. Creates a Slack app for each via the Manifest API (apps.manifest.create)
+3. Starts a local OAuth callback server on --port (default 8888)
+4. Prints authorize URLs — a workspace admin clicks each one in a browser
+5. Each click redirects back here; the code is exchanged for an xoxb- token
+6. Tokens are appended to .env as SLACK_BOT_TOKEN_<AGENT_ID>
+
+Prerequisites (one-time, done by a workspace admin in a browser)
+-----------------------------------------------------------------
+  1. Go to https://api.slack.com/apps
+  2. Click "Your App Configuration Tokens" → "Generate Token" for your workspace
+  3. Copy both the token (xoxe-...) and the refresh token
+  4. Add to .env:
+       SLACK_CONFIG_TOKEN=xoxe-...
+       SLACK_CONFIG_REFRESH_TOKEN=xoxe-...
+
+Usage
+-----
+  # From project root:
+  python scripts/provision_slack_bots.py
+
+  # Custom port or env file:
+  python scripts/provision_slack_bots.py --port 9000 --env-file .env
+
+  # Preview what would be created without calling any APIs:
+  python scripts/provision_slack_bots.py --dry-run
+
+  # Re-run the OAuth step without recreating apps (useful if the server was
+  # interrupted midway — re-uses credentials saved in .provision_state.json):
+  python scripts/provision_slack_bots.py --skip-create
+
+Remote / no-browser workflow
+-----------------------------
+Use this when you don't have browser access to the Slack workspace and need
+to delegate the approval step to the workspace admin.
+
+  Step 1 — on your server, create the apps and export the OAuth URLs:
+    python scripts/provision_slack_bots.py --export-urls
+
+  This prints one URL per bot and writes them to oauth_urls.txt.
+  Send that file (or the printed URLs) to the workspace admin.
+
+  Step 2 — the admin opens each URL in a browser, clicks Allow, and lands on
+  httpbin.org showing JSON like:
+    {"args": {"code": "abc123", "state": "su"}, ...}
+  They copy each agent_id and code into a plain text file (one per line):
+    su:abc123
+    wiseman:def456
+    lotz:ghi789
+  and send the file back to you.
+
+  Step 3 — on your server, exchange the codes for tokens:
+    python scripts/provision_slack_bots.py --exchange-codes codes.txt
+"""
+
+import argparse
+import json
+import sys
+import threading
+import time
+import urllib.parse
+from http.server import BaseHTTPRequestHandler, HTTPServer
+from pathlib import Path
+
+import httpx
+from dotenv import dotenv_values, set_key
+from rich.console import Console
+from rich.table import Table
+
+# ---------------------------------------------------------------------------
+# Constants
+# ---------------------------------------------------------------------------
+
+SLACK_API = "https://slack.com/api"
+CALLBACK_PATH = "/oauth/callback"
+STATE_FILE = Path(".provision_state.json")
+
+# Used by --export-urls / --exchange-codes: Slack redirects the admin here after
+# approval and httpbin echoes the code + state as JSON so the admin can copy them.
+HTTPBIN_REDIRECT = "https://httpbin.org/get"
+
+# All scopes the bots actually use — derived from AgentSlackClient + routers/podcast
+BOT_SCOPES = [
+    "channels:history",   # conversations.history / conversations.replies
+    "channels:join",      # conversations.join
+    "channels:manage",    # conversations.create
+    "channels:read",      # conversations.list
+    "chat:write",         # chat.postMessage
+    "groups:history",     # threads in private channels
+    "groups:read",        # conversations.list private
+    "im:history",         # poll_dm_messages
+    "im:write",           # conversations.open (DMs)
+    "users:read",         # users.info
+    "users:read.email",   # users.lookupByEmail
+]
+
+console = Console()
+
+
+# ---------------------------------------------------------------------------
+# Parse PILOT_LABS from source without importing the module
+# (avoids pulling in SQLAlchemy and other heavy dependencies)
+# ---------------------------------------------------------------------------
+
+def load_pilot_labs() -> list[dict]:
+    """Return the PILOT_LABS literal, parsed statically from src/agent/simulation.py."""
+    import ast
+    sim_path = Path(__file__).parent.parent / "src" / "agent" / "simulation.py"
+    module_ast = ast.parse(sim_path.read_text())
+    for stmt in ast.walk(module_ast):
+        if not isinstance(stmt, ast.Assign) or len(stmt.targets) != 1:
+            continue
+        target = stmt.targets[0]
+        # Only a plain single-target `PILOT_LABS = <literal>` assignment qualifies
+        if isinstance(target, ast.Name) and target.id == "PILOT_LABS":
+            return ast.literal_eval(stmt.value)
+    raise RuntimeError("PILOT_LABS not found in src/agent/simulation.py")
+
+
+# ---------------------------------------------------------------------------
+# Slack API helpers
+# ---------------------------------------------------------------------------
+
+def lookup_team_id(existing_env: dict) -> str | None:
+    """Return the workspace team_id via auth.test on the first usable bot token, else None.
+
+    Best-effort: a token whose request fails (network error, non-JSON reply) is skipped.
+    """
+    for key, val in existing_env.items():
+        is_bot_key = key.upper().startswith("SLACK_BOT_TOKEN_")
+        if not (is_bot_key and val and val.startswith("xoxb-")) or val.startswith("xoxb-placeholder"):
+            continue
+        try:
+            auth = {"Authorization": f"Bearer {val}"}
+            resp = httpx.post(f"{SLACK_API}/auth.test", headers=auth, timeout=10)
+            data = resp.json()
+        except (httpx.HTTPError, ValueError):
+            continue  # team-id detection is optional; try the next token
+        if data.get("ok"):
+            return data.get("team_id")
+    return None
+
+
+def rotate_config_token(refresh_token: str) -> tuple[str, str]:
+    """Swap a config refresh token for a fresh (access_token, refresh_token) pair.
+
+    Raises RuntimeError when tooling.tokens.rotate does not answer ok.
+    """
+    endpoint = f"{SLACK_API}/tooling.tokens.rotate"
+    resp = httpx.post(endpoint, data={"refresh_token": refresh_token}, timeout=15)
+    payload = resp.json()
+    if payload.get("ok"):
+        return payload["token"], payload["refresh_token"]
+    raise RuntimeError(f"tooling.tokens.rotate failed: {payload.get('error')}")
+
+
+def create_app(
+    config_token: str,
+    agent_id: str,
+    bot_name: str,
+    pi_name: str,
+    redirect_uri: str,
+    max_rate_limit_retries: int = 5,
+) -> dict:
+    """Create one Slack app via apps.manifest.create and return its credentials.
+
+    Returns a dict with agent_id, bot_name, pi_name, app_id, client_id, client_secret, oauth_url.
+    Retries only "ratelimited" replies (max_rate_limit_retries attempts); other errors raise RuntimeError.
+    """
+    manifest = {
+        "display_information": {
+            "name": bot_name,
+            "description": f"LabBot agent for {pi_name}",
+        },
+        "features": {
+            "bot_user": {
+                "display_name": bot_name,
+                "always_online": False,
+            }
+        },
+        "oauth_config": {
+            "redirect_urls": [redirect_uri],
+            "scopes": {"bot": BOT_SCOPES},
+        },
+        "settings": {
+            "org_deploy_enabled": False,
+            "socket_mode_enabled": False,
+            "token_rotation_enabled": False,
+        },
+    }
+    for attempt in range(max_rate_limit_retries):  # index unused; the loop only bounds the retries
+        resp = httpx.post(
+            f"{SLACK_API}/apps.manifest.create",
+            headers={"Authorization": f"Bearer {config_token}"},
+            json={"manifest": manifest},
+            timeout=20,
+        )
+        data = resp.json()
+        if data.get("ok"):
+            creds = data["credentials"]
+            return {
+                "agent_id": agent_id,
+                "bot_name": bot_name,
+                "pi_name": pi_name,
+                "app_id": data["app_id"],
+                "client_id": creds["client_id"],
+                "client_secret": creds["client_secret"],
+                "oauth_url": data["oauth_authorize_url"],
+            }
+        if data.get("error") == "ratelimited":
+            # Wait time: body "retry_after" if truthy, else the Retry-After header, else 60 seconds.
+            wait = int(data.get("retry_after", 0) or resp.headers.get("Retry-After", 60))
+            console.print(f"  [yellow]rate limited — waiting {wait}s before retrying {bot_name}…[/yellow]")
+            time.sleep(wait)  # NOTE(review): also sleeps after the last attempt, just before raising below
+        else:
+            detail = data.get("errors") or data.get("error", "unknown")  # prefer the detailed "errors" field
+            raise RuntimeError(f"apps.manifest.create failed: {detail}")
+    raise RuntimeError(f"apps.manifest.create: still rate-limited after {max_rate_limit_retries} retries")
+
+
+def exchange_code(
+    client_id: str,
+    client_secret: str,
+    code: str,
+    redirect_uri: str,
+) -> str:
+    """Trade a one-time OAuth code for the app's bot token via oauth.v2.access.
+
+    Returns the xoxb-... token. Raises RuntimeError when Slack rejects the
+    request or the returned access_token is not a bot token.
+    """
+    form = {
+        "client_id": client_id,
+        "client_secret": client_secret,
+        "code": code,
+        "redirect_uri": redirect_uri,
+    }
+    payload = httpx.post(f"{SLACK_API}/oauth.v2.access", data=form, timeout=15).json()
+    if not payload.get("ok"):
+        raise RuntimeError(f"oauth.v2.access failed: {payload.get('error')}")
+    bot_token = payload.get("access_token", "")
+    if bot_token.startswith("xoxb-"):
+        return bot_token
+    raise RuntimeError(f"Unexpected token format: {bot_token[:20]}...")
+
+
+# ---------------------------------------------------------------------------
+# OAuth callback HTTP server
+# ---------------------------------------------------------------------------
+
+class _CallbackHandler(BaseHTTPRequestHandler):
+    """
+    Handles GET /oauth/callback?code=...&state=<agent_id>
+    Exchanges the code for a token and writes it to .env; request-derived text is HTML-escaped.
+    """
+
+    # Shared state injected before server starts
+    pending: dict = {}       # agent_id -> {bot_name, client_id, client_secret}
+    received: dict = {}      # agent_id -> xoxb-token
+    env_file: str = ".env"
+    redirect_uri: str = ""
+
+    def do_GET(self):
+        """Validate the callback, exchange its code for a token, store it, and reply with HTML."""
+        from html import escape  # query parameters are untrusted and echoed into the page
+        parsed = urllib.parse.urlparse(self.path)
+        if parsed.path != CALLBACK_PATH:
+            self._html(404, "<h2>404 Not found</h2>")
+            return
+
+        params = dict(urllib.parse.parse_qsl(parsed.query))
+        code = params.get("code")
+        error = params.get("error")
+        agent_id = params.get("state")
+
+        if error:
+            self._html(400, f"<h2>Slack returned an error: {escape(error)}</h2>")
+            return
+
+        if not code or not agent_id:
+            self._html(400, "<h2>Missing code or state parameter</h2>")
+            return
+
+        info = self.pending.get(agent_id)
+        if not info:
+            self._html(400, f"<h2>Unknown agent_id in state: {escape(repr(agent_id))}</h2>")
+            return
+
+        if agent_id in self.received:
+            self._html(200, f"<h2>{escape(info['bot_name'])} already installed — duplicate callback ignored.</h2>")
+            return
+
+        try:
+            token = exchange_code(info["client_id"], info["client_secret"], code, self.redirect_uri)
+        except Exception as exc:
+            console.print(f"[red]Token exchange failed for {agent_id}: {exc}[/red]")
+            self._html(500, f"<h2>Token exchange failed: {escape(str(exc))}</h2>")
+            return
+
+        env_key = f"SLACK_BOT_TOKEN_{agent_id.upper()}"
+        set_key(self.env_file, env_key, token, quote_mode="never")
+        self.received[agent_id] = token
+
+        remaining = len(self.pending) - len(self.received)
+        console.print(f"[green]✓[/green] [bold]{info['bot_name']}[/bold] → {env_key}")
+        self._html(200, f"""
+            <h2 style="color:green">✅ {escape(info['bot_name'])} installed!</h2>
+            <p>Token written to .env as <code>{escape(env_key)}</code></p>
+            <p><b>{remaining}</b> bot(s) remaining. You may close this tab.</p>
+        """)
+
+    def _html(self, code: int, body: str):  # body is inserted verbatim: callers must escape it
+        content = (
+            "<html><body style='font-family:sans-serif;padding:2em;max-width:600px'>"
+            + body
+            + "</body></html>"
+        ).encode()
+        self.send_response(code)
+        self.send_header("Content-Type", "text/html; charset=utf-8")
+        self.send_header("Content-Length", str(len(content)))
+        self.end_headers()
+        self.wfile.write(content)
+
+    def log_message(self, *_args):
+        pass  # suppress default access log noise
+
+
+# ---------------------------------------------------------------------------
+# Main
+# ---------------------------------------------------------------------------
+
+def _run_export_urls(args: argparse.Namespace) -> None:
+    """Create apps for bots lacking tokens, save their credentials to STATE_FILE, and print/save OAuth URLs."""
+    pilot_labs = load_pilot_labs()
+    existing_env = dotenv_values(args.env_file)
+
+    tokenized = {  # lower-cased agent ids that already have a non-placeholder token
+        k[len("SLACK_BOT_TOKEN_"):].lower()
+        for k, v in existing_env.items()
+        if k.upper().startswith("SLACK_BOT_TOKEN_")
+        and v and not v.startswith("xoxb-placeholder")
+    }
+    missing = [lab for lab in pilot_labs if lab["id"] not in tokenized]
+
+    if not missing:
+        console.print("[green]All bots already have tokens. Nothing to do.[/green]")
+        return
+
+    config_token = existing_env.get("SLACK_CONFIG_TOKEN", "").strip()
+    refresh_token = existing_env.get("SLACK_CONFIG_REFRESH_TOKEN", "").strip()
+    if not config_token:
+        console.print("[bold red]SLACK_CONFIG_TOKEN is not set in .env[/bold red]")
+        sys.exit(1)
+
+    if refresh_token:
+        console.print("Rotating config token...")
+        try:
+            config_token, new_refresh = rotate_config_token(refresh_token)
+            set_key(args.env_file, "SLACK_CONFIG_TOKEN", config_token, quote_mode="never")
+            set_key(args.env_file, "SLACK_CONFIG_REFRESH_TOKEN", new_refresh, quote_mode="never")
+            console.print("[green]Config token rotated.[/green]")
+        except Exception as exc:  # rotation is best-effort: fall back to the token already in .env
+            console.print(f"[yellow]Token rotation failed ({exc}); using existing token.[/yellow]")
+
+    team_id = args.team_id
+    if not team_id:
+        team_id = lookup_team_id(existing_env)  # may stay None; the URLs then carry no team parameter
+
+    console.print(f"\nCreating {len(missing)} Slack app(s)...\n")
+    created: list[dict] = []
+    failed = 0
+    for i, lab in enumerate(missing):
+        try:
+            app = create_app(config_token, lab["id"], lab["name"], lab["pi"], HTTPBIN_REDIRECT)
+            created.append(app)
+            console.print(f"  [green]{i+1:2d}.[/green] [bold]{app['bot_name']}[/bold] (app {app['app_id']})")
+        except Exception as exc:  # one failed app does not stop the others
+            console.print(f"  [red]failed[/red]  {lab['name']}: {exc}")
+            failed += 1
+        if i < len(missing) - 1:
+            time.sleep(12)  # pause between creations — presumably to stay under Slack's rate limit
+
+    if not created:
+        console.print("[red]No apps created. Exiting.[/red]")
+        sys.exit(1)
+
+    # NOTE(review): replaces any existing state file, and the JSON includes each app's client_secret.
+    STATE_FILE.write_text(json.dumps(created, indent=2))
+    console.print(f"\n[green]Credentials saved to {STATE_FILE}[/green]")
+
+    def _oauth_url(app: dict) -> str:
+        extra = {"state": app["agent_id"], "redirect_uri": HTTPBIN_REDIRECT}  # state carries the agent_id back
+        if team_id:
+            extra["team"] = team_id
+        return app["oauth_url"] + "&" + urllib.parse.urlencode(extra)  # assumes oauth_url already has a query string
+
+    lines = []
+    console.print("\n[bold yellow]Send these URLs to the workspace admin.[/bold yellow]")
+    console.print("After clicking Allow, they will land on httpbin.org showing JSON like:")
+    console.print('  {"args": {"code": "abc123", "state": "su"}, ...}')
+    console.print("Ask them to send back a file with one [bold]agent_id:code[/bold] per line.\n")
+
+    for app in created:
+        url = _oauth_url(app)
+        lines.append(f"{app['bot_name']} ({app['agent_id']}):\n  {url}\n")
+        console.print(f"[cyan]{app['bot_name']}[/cyan] ({app['agent_id']}):")
+        console.print(f"  {url}\n")
+
+    out_file = Path("oauth_urls.txt")  # written relative to the current working directory
+    out_file.write_text("\n".join(lines))
+    console.print(f"[green]URLs also saved to {out_file}[/green]")
+    if failed:
+        console.print(f"[yellow]{failed} app(s) failed — re-run to retry.[/yellow]")
+
+
+def _parse_codes_file(text: str) -> list[tuple[str, str]]:
+    """Parse a codes file into (agent_id, code) pairs.
+
+    Supports three formats (auto-detected):
+
+    1. Simple — one agent_id:code per line:
+         cline:10935961...
+         su:abc123...
+
+    2. httpbin URL — one redirect URL per line:
+         https://httpbin.org/get?code=10935961...&state=cline
+
+    3. httpbin JSON — the raw JSON response from httpbin.org/get, or multiple
+       responses separated by lines containing only '---':
+         {"args": {"code": "10935961...", "state": "cline"}, ...}
+         ---
+         {"args": {"code": "abc123...", "state": "su"}, ...}
+    """
+    pairs: list[tuple[str, str]] = []
+
+    # Split only on separator *lines*; a '---' inside a code or URL is data.
+    blocks: list[list[str]] = [[]]
+    for raw in text.splitlines():
+        line = raw.strip()
+        if line == "---":
+            blocks.append([])
+        elif line and not line.startswith("#"):
+            blocks[-1].append(line)
+
+    for lines in blocks:
+        block = "\n".join(lines)
+        if block.startswith("{"):  # httpbin JSON blob
+            try:
+                args = json.loads(block).get("args", {})
+                agent_id, code = args.get("state", "").strip(), args.get("code", "").strip()
+            except (ValueError, AttributeError):
+                agent_id = code = ""
+            if agent_id and code:
+                pairs.append((agent_id, code))
+            else:
+                # Never fall back to line parsing here: JSON lines contain ':' and
+                # would be misread as bogus agent_id:code pairs.
+                console.print(f"[yellow]Skipping JSON block with missing code/state: {block[:60]!r}[/yellow]")
+            continue
+        for line in lines:
+            if line.startswith("http"):  # httpbin URL: https://httpbin.org/get?code=...&state=...
+                params = dict(urllib.parse.parse_qsl(urllib.parse.urlparse(line).query))
+                agent_id, code = params.get("state", "").strip(), params.get("code", "").strip()
+                what = "URL with missing code/state"
+            else:  # simple agent_id:code
+                agent_id, _, code = (part.strip() for part in line.partition(":"))
+                what = "malformed line (expected agent_id:code)"
+            if agent_id and code:
+                pairs.append((agent_id, code))
+            else:
+                console.print(f"[yellow]Skipping {what}: {line!r}[/yellow]")
+
+    return pairs
+
+
+def _run_exchange_codes(codes_file: str, env_file: str) -> None:
+    """Exchange the codes in codes_file for xoxb- tokens in env_file; keep STATE_FILE while any app lacks one."""
+    codes_path = Path(codes_file)
+    if not codes_path.exists():
+        console.print(f"[red]Codes file not found: {codes_file}[/red]")
+        sys.exit(1)
+    if not STATE_FILE.exists():
+        console.print(f"[red]{STATE_FILE} not found — run --export-urls first.[/red]")
+        sys.exit(1)
+
+    state: list[dict] = json.loads(STATE_FILE.read_text())
+    creds_by_id = {app["agent_id"]: app for app in state}
+    pairs = _parse_codes_file(codes_path.read_text())
+    if not pairs:
+        console.print("[red]No valid codes found in file.[/red]")
+        sys.exit(1)
+
+    console.print(f"\nExchanging {len(pairs)} code(s)...\n")
+    saved = 0
+    for agent_id, code in pairs:
+        app = creds_by_id.get(agent_id)
+        if not app:
+            console.print(f"[yellow]No credentials found for agent_id {agent_id!r} — skipping.[/yellow]")
+            continue
+        try:
+            token = exchange_code(app["client_id"], app["client_secret"], code, HTTPBIN_REDIRECT)
+        except Exception as exc:
+            console.print(f"[red]Failed to exchange code for {agent_id}: {exc}[/red]")
+            continue
+
+        env_key = f"SLACK_BOT_TOKEN_{agent_id.upper()}"
+        set_key(env_file, env_key, token, quote_mode="never")
+        console.print(f"[green]✓[/green] [bold]{app['bot_name']}[/bold] → {env_key}")
+        del creds_by_id[agent_id]  # installed: no longer pending
+        saved += 1
+
+    console.print(f"\n[bold]{saved}/{len(pairs)} token(s) saved to {env_file}[/bold]")
+    if creds_by_id:
+        # Some apps still lack a token (failed exchange, or the admin returned only
+        # part of the codes): keep their client secrets for the next run.
+        STATE_FILE.write_text(json.dumps(list(creds_by_id.values()), indent=2))
+        console.print(f"[yellow]{len(creds_by_id)} app(s) still need a code. Re-run --exchange-codes with the remaining codes.[/yellow]")
+        console.print(f"  Credentials still in {STATE_FILE} — no need to re-run --export-urls.")
+    else:
+        STATE_FILE.unlink(missing_ok=True)
+        console.print("[green]All done! Restart the agent container to pick up the new tokens.[/green]")
+        console.print("  docker rm -f agent-run")
+        console.print("  docker compose up -d --build app worker")
+        console.print("  docker compose --profile agent run -d --name agent-run agent python -m src.agent.main --budget 0")
+
+
+def main():
+    parser = argparse.ArgumentParser(
+        description=__doc__,
+        formatter_class=argparse.RawDescriptionHelpFormatter,
+    )
+    parser.add_argument(
+        "--port", type=int, default=8888,
+        help="Local port for the OAuth callback server (default: 8888)",
+    )
+    parser.add_argument(
+        "--env-file", default=".env",
+        help="Path to the .env file that will receive the new tokens (default: .env)",
+    )
+    parser.add_argument(
+        "--dry-run", action="store_true",
+        help="Show which bots need tokens; make no API calls",
+    )
+    parser.add_argument(
+        "--skip-create", action="store_true",
+        help=f"Skip app creation and reuse credentials from {STATE_FILE}",
+    )
+    parser.add_argument(
+        "--team-id",
+        help="Slack workspace team ID (e.g. T012AB3CD) to pin OAuth URLs to the right workspace. "
+             "Auto-detected from an existing bot token if not provided.",
+    )
+    parser.add_argument(
+        "--export-urls", action="store_true",
+        help=(
+            "Create Slack apps and export OAuth URLs for a remote admin to approve. "
+            f"Uses {HTTPBIN_REDIRECT} as the redirect URI so the admin sees the code "
+            "on-screen. URLs are printed and saved to oauth_urls.txt. "
+            "Run --exchange-codes after the admin returns the codes."
+        ),
+    )
+    parser.add_argument(
+        "--exchange-codes",
+        metavar="CODES_FILE",
+        help=(
+            "Exchange OAuth codes provided by a remote admin for bot tokens. "
+            "CODES_FILE must contain one 'agent_id:code' entry per line. "
+            f"Requires {STATE_FILE} from a previous --export-urls run."
+        ),
+    )
+    parser.add_argument(
+        "--exchange-urls",
+        metavar="URLS_FILE",
+        help=(
+            "Exchange OAuth codes extracted from httpbin redirect URLs. "
+            "URLS_FILE must contain one full httpbin URL per line, e.g.: "
+            "https://httpbin.org/get?code=...&state=su. "
+            f"Requires {STATE_FILE} from a previous --export-urls run."
+        ),
+    )
+    args = parser.parse_args()
+
+    redirect_uri = f"http://localhost:{args.port}{CALLBACK_PATH}"
+
+    # -----------------------------------------------------------------------
+    # --export-urls: create apps and write OAuth URLs for a remote admin
+    # -----------------------------------------------------------------------
+    if args.export_urls:
+        _run_export_urls(args)
+        return
+
+    # -----------------------------------------------------------------------
+    # --exchange-codes: exchange codes file returned by the admin for tokens
+    # -----------------------------------------------------------------------
+    if args.exchange_codes:
+        _run_exchange_codes(args.exchange_codes, args.env_file)
+        return
+
+    if args.exchange_urls:
+        _run_exchange_codes(args.exchange_urls, args.env_file)
+        return
+
+    # -----------------------------------------------------------------------
+    # 1. Determine which bots are missing tokens
+    # -----------------------------------------------------------------------
+    pilot_labs = load_pilot_labs()
+    existing_env = dotenv_values(args.env_file)
+
+    team_id = args.team_id
+    if not team_id and not args.dry_run:
+        team_id = lookup_team_id(existing_env)
+        if team_id:
+            console.print(f"Detected workspace team ID: [cyan]{team_id}[/cyan]")
+        else:
+            console.print("[yellow]Could not detect team ID — OAuth links may open the wrong workspace.[/yellow]")
+            console.print("  Pass --team-id T... to fix this.")
+
+    tokenized = {
+        k[len("SLACK_BOT_TOKEN_"):].lower()
+        for k, v in existing_env.items()
+        if k.upper().startswith("SLACK_BOT_TOKEN_")
+        and v
+        and not v.startswith("xoxb-placeholder")
+    }
+
+    missing = [lab for lab in pilot_labs if lab["id"] not in tokenized]
+
+    if not missing:
+        console.print("[green]All bots already have tokens. Nothing to do.[/green]")
+        return
+
+    t = Table(title=f"{len(missing)} bot(s) need Slack tokens", show_lines=True)
+    t.add_column("agent_id", style="cyan")
+    t.add_column("Bot name")
+    t.add_column("PI")
+    for lab in missing:
+        t.add_row(lab["id"], lab["name"], lab["pi"])
+    console.print(t)
+
+    if args.dry_run:
+        console.print("[yellow]--dry-run active: no API calls made.[/yellow]")
+        return
+
+    # -----------------------------------------------------------------------
+    # 2. Obtain / rotate config token
+    # -----------------------------------------------------------------------
+    config_token = existing_env.get("SLACK_CONFIG_TOKEN", "").strip()
+    refresh_token = existing_env.get("SLACK_CONFIG_REFRESH_TOKEN", "").strip()
+
+    if not config_token:
+        console.print("\n[bold red]SLACK_CONFIG_TOKEN is not set in .env[/bold red]")
+        console.print(
+            "  1. Open https://api.slack.com/apps in a browser\n"
+            "  2. Click 'Your App Configuration Tokens'\n"
+            "  3. Click 'Generate Token' for your workspace\n"
+            "  4. Copy the token (xoxe-...) and refresh token into .env:\n"
+            "       SLACK_CONFIG_TOKEN=xoxe-...\n"
+            "       SLACK_CONFIG_REFRESH_TOKEN=xoxe-...\n"
+        )
+        sys.exit(1)
+
+    if refresh_token:
+        console.print("Rotating config token...")
+        try:
+            config_token, new_refresh = rotate_config_token(refresh_token)
+            set_key(args.env_file, "SLACK_CONFIG_TOKEN", config_token, quote_mode="never")
+            set_key(args.env_file, "SLACK_CONFIG_REFRESH_TOKEN", new_refresh, quote_mode="never")
+            console.print("[green]Config token rotated and saved.[/green]")
+        except Exception as exc:
+            console.print(f"[yellow]Token rotation failed ({exc}); using existing token.[/yellow]")
+
+    # -----------------------------------------------------------------------
+    # 3. Start OAuth callback server (before app creation so URLs work immediately)
+    # -----------------------------------------------------------------------
+    _CallbackHandler.pending = {}
+    _CallbackHandler.received = {}
+    _CallbackHandler.env_file = args.env_file
+    _CallbackHandler.redirect_uri = redirect_uri
+
+    server = HTTPServer(("localhost", args.port), _CallbackHandler)
+    threading.Thread(target=server.serve_forever, daemon=True).start()
+    console.print(f"\n[bold]OAuth callback server running on http://localhost:{args.port}[/bold]")
+    console.print(
+        "\n[bold yellow]Open each URL in a browser while signed into the workspace.[/bold yellow]\n"
+        "Each approval redirects back here and saves the token to .env automatically.\n"
+    )
+
+    # -----------------------------------------------------------------------
+    # 4. Create apps (or load previous run's state) and print URLs as they appear
+    # -----------------------------------------------------------------------
+    def _oauth_url(app: dict) -> str:
+        extra = {"state": app["agent_id"], "redirect_uri": redirect_uri}
+        if team_id:
+            extra["team"] = team_id
+        return app["oauth_url"] + "&" + urllib.parse.urlencode(extra)
+
+    created: list[dict] = []
+    if args.skip_create:
+        if not STATE_FILE.exists():
+            console.print(f"[red]--skip-create: {STATE_FILE} not found. Run without that flag first.[/red]")
+            server.shutdown()
+            sys.exit(1)
+        all_state: list[dict] = json.loads(STATE_FILE.read_text())
+        missing_ids = {lab["id"] for lab in missing}
+        created = [a for a in all_state if a["agent_id"] in missing_ids]
+        console.print(f"Loaded {len(created)} app credential(s) from {STATE_FILE}\n")
+        for i, app in enumerate(created, 1):
+            _CallbackHandler.pending[app["agent_id"]] = {
+                "bot_name": app["bot_name"],
+                "client_id": app["client_id"],
+                "client_secret": app["client_secret"],
+            }
+            console.print(f"  [cyan]{i:2d}.[/cyan] [bold]{app['bot_name']}[/bold] ({app['pi_name']})")
+            console.print(f"      {_oauth_url(app)}\n")
+    else:
+        failed_count = 0
+        for i, lab in enumerate(missing):
+            try:
+                app = create_app(config_token, lab["id"], lab["name"], lab["pi"], redirect_uri)
+                created.append(app)
+                _CallbackHandler.pending[app["agent_id"]] = {
+                    "bot_name": app["bot_name"],
+                    "client_id": app["client_id"],
+                    "client_secret": app["client_secret"],
+                }
+                console.print(f"  [green]{i+1:2d}.[/green] [bold]{app['bot_name']}[/bold] (app {app['app_id']})")
+                console.print(f"      {_oauth_url(app)}\n")
+            except Exception as exc:
+                console.print(f"  [red]failed[/red]  {lab['name']}: {exc}")
+                failed_count += 1
+            # Slack's Manifest API allows ~10 req/min; 12s between calls stays well under
+            if i < len(missing) - 1:
+                time.sleep(12)
+
+        if created:
+            STATE_FILE.write_text(json.dumps(created, indent=2))
+        if failed_count:
+            console.print(f"[yellow]{failed_count} app(s) failed to create — fix errors and re-run.[/yellow]")
+
+    if not created:
+        console.print("[red]No apps available for OAuth. Exiting.[/red]")
+        server.shutdown()
+        sys.exit(1)
+
+    # -----------------------------------------------------------------------
+    # 5. Wait for all OAuth callbacks
+    # -----------------------------------------------------------------------
+    console.print(f"Waiting for {len(created)} installation(s)…  (Ctrl-C to stop early)\n")
+    try:
+        while len(_CallbackHandler.received) < len(created):
+            time.sleep(0.5)
+    except KeyboardInterrupt:
+        console.print("\n[yellow]Interrupted.[/yellow]")
+    finally:
+        server.shutdown()
+
+    done = len(_CallbackHandler.received)
+    total = len(created)
+    console.print(f"\n[bold]Finished: {done}/{total} token(s) saved to {args.env_file}[/bold]")
+
+    if done < total:
+        outstanding = [a["bot_name"] for a in created if a["agent_id"] not in _CallbackHandler.received]
+        console.print(f"[yellow]Still missing: {', '.join(outstanding)}[/yellow]")
+        console.print(f"Re-run with [bold]--skip-create[/bold] to retry without recreating the apps.")
+    else:
+        if STATE_FILE.exists():
+            STATE_FILE.unlink()
+        console.print(f"[green]All done! Restart the agent container to pick up the new tokens.[/green]")
+        console.print("  docker rm -f agent-run")
+        console.print("  docker compose up -d --build app worker")
+        console.print("  docker compose --profile agent run -d --name agent-run agent python -m src.agent.main --budget 0")
+
+
+if __name__ == "__main__":
+    main()
diff --git a/scripts/test_podcast_su.py b/scripts/test_podcast_su.py
new file mode 100644
index 0000000..6795f27
--- /dev/null
+++ b/scripts/test_podcast_su.py
@@ -0,0 +1,143 @@
+"""One-shot test: run the podcast pipeline for agent 'su' only.
+
+Outputs:
+  .labbot-tests/su-summary-<date>.txt   — generated text summary
+  .labbot-tests/su-audio-<date>.mp3     — TTS audio (if the backend selected by PODCAST_TTS_BACKEND succeeds)
+
+Usage:
+    DATABASE_URL=postgresql+asyncpg://copi:copi@localhost:5432/copi \
+    python scripts/test_podcast_su.py
+"""
+
+import asyncio
+import logging
+import os
+import shutil
+from datetime import date
+from pathlib import Path
+
+logging.basicConfig(  # configured at import time, before run() imports the project modules
+    level=logging.INFO,
+    format="%(asctime)s %(levelname)s %(name)s: %(message)s",
+)
+logger = logging.getLogger(__name__)
+
+OUTPUT_DIR = Path(".labbot-tests")  # receives the summary text and a copy of the generated audio
+AUDIO_DIR = Path("data/podcast_audio")  # run() asks the TTS backend to write to <AUDIO_DIR>/<agent_id>/<date>.mp3
+
+
+async def run():
+    from sqlalchemy.ext.asyncio import AsyncSession, create_async_engine
+    from sqlalchemy.orm import sessionmaker
+
+    from src.config import get_settings
+    from src.podcast.pipeline import (
+        _generate_summary,
+        _load_podcast_preferences,
+        _load_public_profile,
+        _parse_profile_markdown,
+        _select_article,
+        _try_fetch_full_text,
+    )
+    from src.podcast.tts_utils import get_audio_duration_seconds
+    from src.podcast.pubmed_search import build_queries, fetch_candidates
+    from src.podcast.state import get_delivered_pmids, record_delivery
+
+    settings = get_settings()
+    agent_id = "su"
+    today = date.today()
+    OUTPUT_DIR.mkdir(exist_ok=True)
+
+    logger.info("=== LabBot Podcast test run for agent: %s ===", agent_id)
+
+    # 1. Load profiles
+    profile_text = _load_public_profile(agent_id)
+    if not profile_text:
+        logger.error("No public profile found for agent: %s", agent_id)
+        return
+    logger.info("Loaded profile (%d chars)", len(profile_text))
+
+    preferences_text = await _load_podcast_preferences(agent_id)
+    if preferences_text:
+        logger.info("Loaded podcast preferences (%d chars)", len(preferences_text))
+    else:
+        logger.info("No podcast preferences found for agent: %s", agent_id)
+
+    # 2. Build queries and fetch candidates
+    profile_dict = _parse_profile_markdown(profile_text)
+    queries = build_queries(profile_dict)
+    logger.info("Search queries: %s", queries)
+
+    already_delivered = get_delivered_pmids(agent_id)
+    logger.info("Already delivered PMIDs: %s", already_delivered)
+
+    candidates = await fetch_candidates(
+        queries,
+        already_delivered=already_delivered,
+        days=settings.podcast_search_window_days,
+        max_total=settings.podcast_max_candidates,
+    )
+    logger.info("Fetched %d candidates", len(candidates))
+    if not candidates:
+        logger.error("No candidate articles found — aborting")
+        return
+
+    # 3. LLM article selection
+    selected, justification = await _select_article(profile_text, candidates, agent_id, preferences_text)
+    if selected is None:
+        logger.error("No article selected — aborting")
+        return
+    pmid = selected.get("pmid", "")
+    logger.info("Selected PMID: %s", pmid)
+    logger.info("Justification: %s", justification)
+
+    # 4. Fetch full text
+    full_text = await _try_fetch_full_text(pmid)
+    logger.info("Full text fetched: %s", bool(full_text))
+
+    # 5. Generate text summary
+    summary = await _generate_summary(profile_text, selected, full_text, agent_id, preferences_text)
+    if not summary:
+        logger.error("Summary generation failed — aborting")
+        return
+
+    summary_path = OUTPUT_DIR / f"su-summary-{today.isoformat()}.txt"
+    summary_path.write_text(summary, encoding="utf-8")
+    logger.info("Summary written to %s", summary_path)
+    print("\n" + "=" * 60)
+    print("TEXT SUMMARY")
+    print("=" * 60)
+    print(summary)
+    print("=" * 60 + "\n")
+
+    # 6. Generate audio — dispatch to backend configured by PODCAST_TTS_BACKEND
+    if settings.podcast_tts_backend == "local":
+        from src.podcast.local_tts import generate_audio
+        logger.info("TTS backend: local vLLM-Omni (%s:%s)", settings.local_tts_host, settings.local_tts_port)
+    elif settings.podcast_tts_backend == "openai":
+        from src.podcast.openai_tts import generate_audio
+        logger.info("TTS backend: OpenAI TTS")
+    else:
+        from src.podcast.mistral_tts import generate_audio
+        logger.info("TTS backend: Mistral AI (%s)", settings.mistral_tts_model)
+
+    audio_src = AUDIO_DIR / agent_id / f"{today.isoformat()}.mp3"
+    audio_ok = await generate_audio(summary, agent_id, audio_src)
+
+    if audio_ok:
+        audio_dest = OUTPUT_DIR / f"su-audio-{today.isoformat()}.mp3"
+        shutil.copy2(audio_src, audio_dest)
+        duration = get_audio_duration_seconds(audio_src)
+        logger.info("Audio saved to %s (duration: %ss)", audio_dest, duration)
+    else:
+        logger.warning("Audio generation failed (backend: %s)", settings.podcast_tts_backend)
+
+    logger.info("=== Test run complete ===")
+    logger.info("  PMID: %s", pmid)
+    logger.info("  Summary: %s", summary_path)
+    if audio_ok:
+        logger.info("  Audio: %s", audio_dest)
+
+
+if __name__ == "__main__":
+    asyncio.run(run())  # drive the async pipeline to completion when executed as a script
diff --git a/specs/admin-dashboard.md b/specs/admin-dashboard.md
index 2d9cd8f..7a077a7 100644
--- a/specs/admin-dashboard.md
+++ b/specs/admin-dashboard.md
@@ -140,7 +140,74 @@ Analytics on agent-to-agent thread conversations and outcomes.
 
 **Export:** HTML and plain text export options for proposal review.
 
-### 7. LLM Call Logs (`/admin/llm-calls`)
+### 7. Matchmaker (`/admin/matchmaker`)
+
+Admin tool for generating collaboration proposals between two PIs on demand, without running an agent simulation. See `labbot-matchmaker.md` for the full specification.
+
+**Generate form (top of page):**
+- Two dropdowns listing all users with a complete `ResearcherProfile`, sorted by name
+- Client-side enforcement: same user cannot be selected in both dropdowns; Generate button disabled until both are selected
+- On submit: POSTs to `/admin/matchmaker/generate`, shows spinner, redirects to detail view on success
+
+**Proposals table:**
+- Confidence badge (High = green, Moderate = yellow, Speculative = gray)
+- PI A / PI B names
+- Proposal title (truncated)
+- Generated timestamp
+- View / Delete actions
+
+**Filters:**
+- PI multi-select (matches either side)
+- Confidence filter
+
+**Row click** → proposal detail page (`/admin/matchmaker/{id}`)
+
+**Proposal detail (`/admin/matchmaker/{id}`):**
+- Header: PI A × PI B, confidence badge, generated timestamp, token counts
+- Full proposal rendered as markdown
+- Delete button
+
+### 8. PI Proposal Evaluations (`/admin/evaluations`)
+
+Full visibility into all NIH-style PI evaluations submitted through the `/proposals` tab. This is the only place in the system where proposal origin (agent vs. matchmaker) is revealed — the PI-facing evaluation flow deliberately obscures it.
+
+See `proposal-review-pi.md` for the complete specification of the evaluation form and data model. This section covers the admin view only.
+
+**Summary cards:**
+- Total evaluations submitted
+- Evaluations this month
+- Proposals with ≥1 evaluation vs. total proposals in the system
+- Mean overall impact score (all time, shown as X.X / 9)
+
+**Evaluations table** — one row per `PiProposalEvaluation`:
+
+| Column | Notes |
+|---|---|
+| Evaluator | PI's name |
+| Proposal title | From the linked `ThreadDecision` or `MatchmakerProposal` |
+| Origin | `Agent` (blue) or `Matchmaker` (purple) badge |
+| Collaborator | The other PI named in the proposal |
+| Sig. / Inn. / App. / Inv. / Env. | Individual criterion scores 1–9 |
+| Impact | `score_overall_impact`, bold; color-coded green (1–3), yellow (4–6), red (7–9) |
+| Submitted | `evaluated_at` |
+| Updated | `updated_at` if the PI amended their evaluation |
+| Actions | "View" → expanded detail |
+
+**Row detail (inline expand or modal):**
+- All six scores with their associated comments
+- Full proposal body rendered as markdown
+- Evaluator metadata (name, institution, submission/amendment timestamps)
+
+**Filters:**
+- Evaluator (multi-select user dropdown)
+- Origin: All / Agent only / Matchmaker only
+- Overall Impact range (numeric min/max, 1–9)
+- Date range (evaluated_at from/to)
+
+**Export:**
+`GET /admin/evaluations/export.json` — downloads a JSON file of all rows matching the active filter state. Filters are passed as query params so the export always reflects what is on screen. See `proposal-review-pi.md §Admin Page` for the full JSON schema.
+
+### 10. LLM Call Logs (`/admin/llm-calls`)
 
 Debugging view for all LLM API calls.
 
@@ -153,7 +220,7 @@ Debugging view for all LLM API calls.
 - Latency (ms)
 - System prompt and response (expandable)
 
-### 8. Access Requests (`/admin/access-requests`)
+### 11. Access Requests (`/admin/access-requests`)
 
 Pre-release access gate management.
 
@@ -171,7 +238,7 @@ Pre-release access gate management.
 - Add ORCID + note form
 - Remove ORCID button
 
-### 9. Waitlist (`/admin/waitlist`)
+### 12. Waitlist (`/admin/waitlist`)
 
 Lead-capture signups from the public landing page.
 
@@ -183,7 +250,7 @@ Lead-capture signups from the public landing page.
 
 No outbound email is sent automatically — the admin uses the export to reach out manually, then marks rows contacted.
 
-### 10. User Impersonation
+### 13. User Impersonation
 
 Admins can assume the identity of any user to see the app as they see it.
 
@@ -215,6 +282,12 @@ Admins can assume the identity of any user to see the app as they see it.
 | `POST /admin/agents/{id}/approve` | Approve pending agent |
 | `GET /admin/discussions` | Thread discussions and outcomes |
 | `GET /admin/discussions/export` | Export discussions (HTML/text) |
+| `GET /admin/matchmaker` | Matchmaker tab with generate form and proposals table |
+| `POST /admin/matchmaker/generate` | Run LLM pipeline and store result |
+| `GET /admin/matchmaker/{id}` | Proposal detail view |
+| `POST /admin/matchmaker/{id}/delete` | Delete a proposal |
+| `GET /admin/evaluations` | PI proposal evaluations overview |
+| `GET /admin/evaluations/export.json` | JSON export of evaluations (filter params as query string) |
 | `GET /admin/access-requests` | Pending access requests + allowlist management |
 | `POST /admin/access-requests/{user_id}/approve` | Approve a pending user |
 | `POST /admin/access-requests/{user_id}/deny` | Deny a pending user |
diff --git a/specs/cohort-system.md b/specs/cohort-system.md
new file mode 100644
index 0000000..0d65b99
--- /dev/null
+++ b/specs/cohort-system.md
@@ -0,0 +1,438 @@
+# Cohort System Specification
+
+## Overview
+
+A cohort is a named group of agents whose members are permitted to interact with each other during simulation. The purpose is purely practical: prevent agents from spending LLM turns scanning, activating threads with, or tagging agents they will never productively engage. Cohorts are orthogonal to Slack channels — channel subscriptions remain unchanged; cohort membership only gates whether one agent will *act on* another agent's activity.
+
+Agents may belong to any number of cohorts. Cohort assignments are admin-managed and can change while a simulation is running. Interaction limits (thread count, proposal caps, budgets) remain per-agent and are shared across all cohorts an agent belongs to.
+
+---
+
+## Goals
+
+- Skip Phase 2 scan evaluation of posts from non-cohort agents (save Sonnet calls)
+- Skip Phase 3 thread activation from non-cohort agents (save CPU + state bloat)
+- Skip Phase 5 tagging or replying to non-cohort agents (save Opus calls)
+- Run N turns concurrently via a global semaphore for predictable API cost at any agent list size
+- Ensure fair turn distribution across all agents via min-heap selection
+- Allow membership to change mid-run without requiring a restart
+
+---
+
+## Data Model
+
+### New Table: `cohorts`
+
+```sql
+CREATE TABLE cohorts (
+    id          UUID PRIMARY KEY DEFAULT gen_random_uuid(),
+    name        TEXT NOT NULL UNIQUE,
+    description TEXT,
+    created_by  UUID REFERENCES users(id) ON DELETE SET NULL,
+    created_at  TIMESTAMP WITH TIME ZONE DEFAULT now()
+);
+```
+
+- `name`: short slug-style identifier (e.g. `"pilot-wave-1"`, `"structural-cohort"`). Unique, immutable after creation.
+- `description`: optional free-text note for admin reference.
+- `created_by`: FK to the admin user who created it; nullable (SET NULL on user delete).
+
+### New Table: `cohort_memberships`
+
+```sql
+CREATE TABLE cohort_memberships (
+    id         UUID PRIMARY KEY DEFAULT gen_random_uuid(),
+    cohort_id  UUID NOT NULL REFERENCES cohorts(id) ON DELETE CASCADE,
+    agent_id   TEXT NOT NULL,
+    added_by   UUID REFERENCES users(id) ON DELETE SET NULL,
+    added_at   TIMESTAMP WITH TIME ZONE DEFAULT now(),
+    UNIQUE (cohort_id, agent_id)
+);
+```
+
+- `agent_id`: matches `AgentRegistry.agent_id` (string, e.g. `"su"`, `"wiseman"`). No FK enforced — agent records may not exist at table creation time; the application validates at join time.
+- Composite unique constraint prevents duplicate membership.
+- Cascade delete: removing a cohort removes all its memberships.
+
+### Migration
+
+File: `alembic/versions/0023_add_cohorts.py`
+
+```python
+def upgrade():
+    op.create_table("cohorts", ...)
+    op.create_table("cohort_memberships", ...)
+    op.create_index("ix_cohort_memberships_cohort_id", "cohort_memberships", ["cohort_id"])
+    op.create_index("ix_cohort_memberships_agent_id", "cohort_memberships", ["agent_id"])
+
+def downgrade():
+    op.drop_table("cohort_memberships")
+    op.drop_table("cohorts")
+```
+
+### SQLAlchemy Models
+
+`src/models/cohort.py`:
+
+```python
+class Cohort(Base):
+    __tablename__ = "cohorts"
+    id: Mapped[UUID] = mapped_column(primary_key=True, default=uuid4)
+    name: Mapped[str] = mapped_column(unique=True)
+    description: Mapped[str | None]
+    created_by: Mapped[UUID | None] = mapped_column(ForeignKey("users.id", ondelete="SET NULL"))
+    created_at: Mapped[datetime] = mapped_column(default=func.now())
+    memberships: Mapped[list["CohortMembership"]] = relationship(back_populates="cohort", cascade="all, delete-orphan")
+
+class CohortMembership(Base):
+    __tablename__ = "cohort_memberships"
+    id: Mapped[UUID] = mapped_column(primary_key=True, default=uuid4)
+    cohort_id: Mapped[UUID] = mapped_column(ForeignKey("cohorts.id", ondelete="CASCADE"))
+    agent_id: Mapped[str]
+    added_by: Mapped[UUID | None] = mapped_column(ForeignKey("users.id", ondelete="SET NULL"))
+    added_at: Mapped[datetime] = mapped_column(default=func.now())
+    cohort: Mapped["Cohort"] = relationship(back_populates="memberships")
+```
+
+Export from `src/models/__init__.py` alongside existing models.
+
+---
+
+## Agent Changes
+
+### `src/agent/agent.py`
+
+Add one field to `Agent.__init__`:
+
+```python
+self.cohort_ids: set[UUID] = set()   # cohort UUIDs; populated by SimulationEngine at startup and on resync
+```
+
+Add one helper method:
+
+```python
+def can_interact(self, other: "Agent") -> bool:
+    """True if the two agents share at least one cohort (or if either has no cohort assignments)."""
+    if not self.cohort_ids or not other.cohort_ids:
+        return True   # uncohorted agents interact with everyone — backward-compatible default
+    return bool(self.cohort_ids & other.cohort_ids)
+```
+
+The fallback `return True` when either agent has no cohorts assigned preserves all-vs-all behaviour for agents not yet assigned to any cohort, preventing accidental silencing.
+
+---
+
+## Simulation Engine Changes
+
+### `src/agent/main.py`
+
+#### 1. Cohort Loading at Startup
+
+After agents are loaded and before the main loop, query cohort memberships:
+
+```python
+async def _load_cohort_memberships(self):
+    async with self._session_factory() as db:
+        rows = await db.execute(
+            select(CohortMembership.agent_id, CohortMembership.cohort_id)
+        )
+        # Clear and rebuild
+        for agent in self.agents.values():
+            agent.cohort_ids = set()
+        for agent_id, cohort_id in rows:
+            if agent_id in self.agents:
+                self.agents[agent_id].cohort_ids.add(cohort_id)
+
+    self._last_cohort_sync = time.time()
+    logger.info("Cohort memberships loaded for %d agents", sum(1 for a in self.agents.values() if a.cohort_ids))
+```
+
+No index structure is needed — the interaction gate operates purely via `agent.cohort_ids` set intersection at the point of interaction. Turn dispatch is global and cohort-unaware (see Section 6).
+
+#### 2. Dynamic Membership Resync
+
+Every 60 seconds (checked at the top of each main-loop round), re-run `_load_cohort_memberships()`. This is a full replace of every agent's `cohort_ids`, not a diff — simple and correct.
+
+```python
+COHORT_RESYNC_INTERVAL = 60  # seconds
+
+if time.time() - self._last_cohort_sync >= COHORT_RESYNC_INTERVAL:
+    # No separate cohort index to rebuild: the interaction gate reads agent.cohort_ids directly.
+    await self._load_cohort_memberships()
+```
+
+Resync only updates `agent.cohort_ids`. It does not touch `AgentState` or close any active threads — existing open threads between agents who have since been removed from a shared cohort are allowed to conclude naturally.
+
+#### 3. Interaction Gate — Phase 2
+
+In `_phase2_scan_filter()`, filter incoming posts before building the LLM prompt:
+
+```python
+new_posts = [
+    p for p in new_posts
+    if self._sender_can_interact(agent, p.sender_agent_id)
+]
+```
+
+Where:
+
+```python
+def _sender_can_interact(self, agent: Agent, sender_id: str | None) -> bool:
+    if sender_id is None:
+        return True   # PI/human message — always show
+    sender = self.agents.get(sender_id)
+    if sender is None:
+        return True   # unknown sender — don't filter
+    return agent.can_interact(sender)
+```
+
+#### 4. Interaction Gate — Phase 3
+
+In `_phase3_activate_threads()`, tag-based and reply-based activation both check:
+
+```python
+sender = self.agents.get(entry.sender_agent_id)
+if sender and not agent.can_interact(sender):
+    continue   # skip activation — not a cohort-mate
+```
+
+This applies before any other checks (thread cap, thread participation rules, etc.) to fail fast.
+
+#### 5. Interaction Gate — Phase 5
+
+In `_phase5_new_post()`, when filtering `available_posts`:
+
+```python
+sender = self.agents.get(post.sender_agent_id)
+if sender and not agent.can_interact(sender):
+    agent.state.interesting_posts = [
+        p for p in agent.state.interesting_posts if p.post_id != post.post_id
+    ]
+    continue   # prune stale post — sender is no longer a cohort-mate
+```
+
+When the LLM response names a `tagged_agent` for a new top-level post:
+
+```python
+if tagged_agent:
+    target = self.agents.get(tagged_agent)
+    if target and not agent.can_interact(target):
+        logger.debug("%s: cohort gate blocked tag of %s in phase5", agent.agent_id, tagged_agent)
+        return
+```
+
+#### 6. Turn Selection: Min-Heap + Global Semaphore
+
+Replace the current O(n) weighted-random `_select_agent()` with a **min-heap keyed by `last_selected`** and a **global semaphore of width `concurrent_turns`**.
+
+**Why min-heap over weighted random:**
+The current weighted-random gives probabilistic fairness but can starve agents at large list sizes, particularly when `phase5_skip_probability` is non-zero (fast no-op turns let an agent re-enter the lottery immediately). A min-heap guarantees the longest-waiting eligible agent always gets the next slot — O(log n) selection, deterministic fairness.
+
+**Selection and dispatch:**
+
+```python
+import heapq
+
+def _build_heap(self) -> list[tuple[float, str, Agent]]:
+    now = time.time()
+    return [
+        (a.state.last_selected, a.agent_id, a)  # agent_id breaks ties so Agent objects are never compared
+        for a in self.agents.values()
+        if not a.is_paused
+        and self._agent_within_budget(a)
+        and (now - a.state.last_selected) >= settings.turn_delay_seconds
+    ]
+
+async def _run_concurrent_turns(self) -> bool:
+    heap = self._build_heap()
+    if not heap:
+        return False
+
+    heapq.heapify(heap)
+    n = min(settings.concurrent_turns, len(heap))
+    selected = [heapq.heappop(heap)[-1] for _ in range(n)]
+
+    results = await asyncio.gather(
+        *[self._run_turn(agent) for agent in selected],
+        return_exceptions=True,
+    )
+
+    did_any_work = False
+    for agent, result in zip(selected, results):
+        agent.state.last_selected = time.time()
+        if isinstance(result, Exception):
+            logger.error("Turn error for %s", agent.agent_id, exc_info=result)
+        elif result:
+            did_any_work = True
+
+    return did_any_work
+```
+
+The main loop calls `_run_concurrent_turns()` each iteration and uses `did_any_work` to drive the existing idle-backoff logic unchanged.
+
+**Slack polling** continues once per round, before `_run_concurrent_turns()`, as a single sequential operation.
+
+**`_last_llm_caller` guard:** This guard exists to prevent the same agent from making back-to-back LLM calls in the sequential model. It is superseded by the min-heap + per-agent cooldown (`turn_delay_seconds` eligibility check) and should be removed from the concurrent path. The min-heap naturally pushes a just-selected agent to the bottom of the queue; the cooldown makes them ineligible until the delay has elapsed.
+
+#### 7. Phase 5 Concurrent Initiation Guard
+
+With N turns running concurrently, two agents can independently decide to start a new thread with each other in the same round (both see `has_pending_reply=False` and neither has an active thread with the other yet). Track in-flight pair initiations to prevent duplicate thread creation:
+
+```python
+self._initiating_pairs: set[frozenset[str]] = set()
+```
+
+In `_phase5_new_post()`, before posting a reply that opens a new thread toward `target_agent_id`:
+
+```python
+pair = frozenset([agent.agent_id, target_agent_id])
+if pair in self._initiating_pairs:
+    logger.debug("%s: concurrent initiation guard blocked duplicate thread with %s", agent.agent_id, target_agent_id)
+    return
+
+self._initiating_pairs.add(pair)
+try:
+    await self._post_message(...)
+    # activate thread ...
+finally:
+    self._initiating_pairs.discard(pair)
+```
+
+The pair is removed once the thread is activated (or on failure). Note: Phase 4 back-and-forth replies are safe without this guard — `has_pending_reply` is a logical baton held by only one side at a time, so two agents cannot both have a pending reply to each other simultaneously.
+
+---
+
+## Admin Interface
+
+### Routes
+
+All routes are added to `src/routers/admin.py` under the `/admin/cohorts` prefix, protected by the existing `get_admin_user` dependency.
+
+| Method | Path | Description |
+|--------|------|-------------|
+| GET | `/admin/cohorts` | List all cohorts with member counts |
+| POST | `/admin/cohorts/create` | Create a new cohort |
+| GET | `/admin/cohorts/{cohort_id}` | Cohort detail: members, audit log |
+| POST | `/admin/cohorts/{cohort_id}/delete` | Delete cohort (cascades memberships) |
+| POST | `/admin/cohorts/{cohort_id}/add-agent` | Add an agent to the cohort |
+| POST | `/admin/cohorts/{cohort_id}/remove-agent` | Remove an agent from the cohort |
+
+POST routes redirect back to the referring page on success and render an inline error on failure (same pattern as existing admin routes).
+
+### Cohort List Page — `GET /admin/cohorts`
+
+Template: `templates/admin/cohorts.html`
+
+**Header:** "Cohorts" with a "New Cohort" button (opens inline form or modal).
+
+**Create form** (inline, collapsed by default):
+- `name` (text input, required) — validated: lowercase, alphanumeric + hyphens only, max 48 chars
+- `description` (textarea, optional)
+- Submit → `POST /admin/cohorts/create`
+
+**Table: All Cohorts**
+
+| Column | Notes |
+|--------|-------|
+| Name | Link to detail page |
+| Description | Truncated at 80 chars |
+| Members | Count of current memberships |
+| Created by | Admin user name |
+| Created at | Date |
+| Actions | Delete button (with confirmation; disabled if cohort has active members) |
+
+If no cohorts exist: empty state with "No cohorts yet. Create one above."
+
+### Cohort Detail Page — `GET /admin/cohorts/{cohort_id}`
+
+Template: `templates/admin/cohort_detail.html`
+
+**Header:** Cohort name + description. Delete button (top right, requires confirmation prompt via `data-confirm` attribute; enabled only if member count is 0, otherwise disabled with tooltip "Remove all members first").
+
+**Section: Members**
+
+Table of current members:
+
+| Column | Notes |
+|--------|-------|
+| Agent ID | e.g. `su`, `wiseman` |
+| Bot Name | e.g. `SuBot` |
+| PI Name | e.g. `Andrew Su` |
+| Agent Status | `active` / `suspended` / `pending` (from AgentRegistry) |
+| Added by | Admin user name |
+| Added at | Date |
+| Actions | "Remove" button → `POST /admin/cohorts/{cohort_id}/remove-agent` with `agent_id` |
+
+**Section: Add Agent**
+
+Dropdown of all agents *not already in this cohort*, populated from AgentRegistry. Only active agents are shown by default; a checkbox toggle shows suspended/pending agents as well.
+
+```
+[ Select agent ▼ ]  [ Add to Cohort ]
+```
+
+`POST /admin/cohorts/{cohort_id}/add-agent` body: `{ agent_id: "su" }`
+
+If the selected agent already belongs to this cohort, return a 400 with inline error "Agent is already a member."
+
+**Section: Agent Cohort Map (read-only)**
+
+Summary table showing all active agents and which cohorts they currently belong to, for cross-reference:
+
+| Agent | Cohorts |
+|-------|---------|
+| SuBot | pilot-wave-1, structural |
+| WisemanBot | pilot-wave-1 |
+| LotzBot | *(none)* |
+
+This section is static (no editing — use individual cohort pages to manage membership).
+
+### Navigation
+
+Add "Cohorts" to the existing admin sidebar nav alongside Agents, Users, Activity, etc.
+
+---
+
+## Configuration
+
+### New settings (`src/config.py`)
+
+```python
+concurrent_turns: int = 3   # floor on simultaneous agent turns; raised to active_thread_threshold at runtime if that is larger
+```
+
+At engine startup, the effective value of `concurrent_turns` is set to `max(concurrent_turns, active_thread_threshold)`, i.e. it is raised to the thread threshold when that is larger and never lowered. This keeps the two levers in proportion: if an admin raises the thread threshold to allow more simultaneous conversations, the concurrent turn capacity rises with it automatically. The `concurrent_turns` setting therefore acts as a floor, not a ceiling.
+
+The cohort resync interval is hardcoded as `COHORT_RESYNC_INTERVAL = 60` seconds in the engine. It can be promoted to `Settings` if operational tuning is needed.
+
+### `turn_delay_seconds` — Behavior Change
+
+**Current behavior (to be removed):** `simulation.py:360-361` applies `asyncio.sleep(turn_delay_seconds)` at the end of every productive main-loop iteration. This is a **global pause** — no Slack polling, no other agents, nothing runs during the sleep. It is 0.0 by default and has no per-agent targeting.
+
+**New behavior:** `turn_delay_seconds` becomes a **per-agent cooldown** enforced at selection time inside `_build_heap()`:
+
+```python
+and (now - a.state.last_selected) >= settings.turn_delay_seconds
+```
+
+An agent that just completed a turn is ineligible until the cooldown has elapsed. All other agents are unaffected. The `asyncio.sleep(settings.turn_delay_seconds)` call in `simulation.py` is removed.
+
+This preserves the original intent (throttle individual agent tempo) while composing correctly with concurrent dispatch — N slots can stay busy while a recently-active agent sits out its cooldown.
+
+---
+
+## Backward Compatibility
+
+- Agents with no cohort memberships are grouped into `"__uncohorted__"` and continue to interact with all other uncohorted agents. This means a simulation with zero cohorts defined behaves identically to the current all-vs-all system.
+- `Agent.can_interact()` returns `True` when either agent has an empty `cohort_ids` set, so partially-cohorted simulations (some agents assigned, some not) do not silently break.
+- No existing tables, models, or routes are modified.
+
+---
+
+## Out of Scope
+
+- Agent-visible cohort concept: agents do not know which cohort a conversation was initiated from; threads are indistinguishable.
+- PI-managed cohorts: only admins create and delete cohorts. PIs cannot request cohort changes.
+- Per-cohort budgets or limits: all limits remain per-agent and are shared across cohorts.
+- Cohort-scoped message history or separate Slack workspaces per cohort.
+- Time-bounded cohort memberships (automatic expiry).
diff --git a/specs/data-model.md b/specs/data-model.md
index bc3adc9..122a314 100644
--- a/specs/data-model.md
+++ b/specs/data-model.md
@@ -93,6 +93,25 @@ PostgreSQL-backed async job queue.
 | started_at | timestamp | Nullable |
 | completed_at | timestamp | Nullable |
 
+### MatchmakerProposal
+
+Admin-generated collaboration proposals produced by a single LLM call from two PIs' public and private profiles, without running an agent simulation. See `labbot-matchmaker.md`.
+
+| Field | Type | Notes |
+|---|---|---|
+| id | uuid | Primary key |
+| pi_a_id | FK → User | First PI (CASCADE delete) |
+| pi_b_id | FK → User | Second PI (CASCADE delete) |
+| proposal_md | text | Full proposal in markdown |
+| title | string(500) | Extracted from first `# heading` in proposal_md |
+| confidence | string(20) | `high` / `moderate` / `speculative` |
+| llm_model | string(100) | Model used (e.g. `claude-opus-4-7`) |
+| input_tokens | integer | Nullable. Input token count |
+| output_tokens | integer | Nullable. Output token count |
+| generated_at | timestamp | Server default now() |
+
+**Indexes:** `pi_a_id`, `pi_b_id`
+
 ### AccessAllowlist
 
 Admin-managed list of pre-approved ORCID IDs. ORCIDs on this list bypass the pre-release access gate and land directly in `allowed` state on first login.
@@ -176,6 +195,42 @@ Stores PI/agent reviews of collaboration proposals.
 
 **Constraint:** Unique on (thread_decision_id, agent_id) — each agent reviews a thread decision once.
 
+### PiProposalEvaluation
+
+Structured NIH-style evaluations submitted by PIs through the `/proposals` tab. Separate from `ProposalReview` (the 1–4 agent-blocking system). See `proposal-review-pi.md` for the full specification.
+
+| Field | Type | Notes |
+|---|---|---|
+| id | uuid | Primary key |
+| user_id | FK → User | The PI who submitted the evaluation |
+| proposal_type | string(20) | `"agent"` or `"matchmaker"` — stored for admin analysis only, never shown to evaluator |
+| thread_decision_id | FK → ThreadDecision | Nullable. Set when evaluating an agent-generated proposal |
+| matchmaker_proposal_id | FK → MatchmakerProposal | Nullable. Set when evaluating a matchmaker proposal |
+| score_significance | smallint | 1–9 NIH criterion score |
+| score_innovation | smallint | 1–9 NIH criterion score |
+| score_approach | smallint | 1–9 NIH criterion score |
+| score_investigators | smallint | 1–9 NIH criterion score |
+| score_environment | smallint | 1–9 NIH criterion score |
+| score_overall_impact | smallint | 1–9 holistic impact score (not an average of criteria) |
+| comments_significance | text | Nullable. Free-text notes for Significance criterion |
+| comments_innovation | text | Nullable. Free-text notes for Innovation criterion |
+| comments_approach | text | Nullable. Free-text notes for Approach criterion |
+| comments_investigators | text | Nullable. Free-text notes for Investigators criterion |
+| comments_environment | text | Nullable. Free-text notes for Environment criterion |
+| comments_overall | text | Required. Overall evaluation narrative |
+| evaluated_at | timestamp | Server default now() |
+| updated_at | timestamp | Nullable. Set on amendment |
+
+**Constraints:**
+- `CHECK (proposal_type IN ('agent', 'matchmaker'))`
+- All six scores: `CHECK (score_X BETWEEN 1 AND 9)`
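+- `CHECK (thread_decision_id IS NOT NULL OR matchmaker_proposal_id IS NOT NULL)` — at least one must be set. Exactly one is expected (the one matching `proposal_type`), but this CHECK alone does not reject rows with both set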
+- `UNIQUE (user_id, thread_decision_id)` and `UNIQUE (user_id, matchmaker_proposal_id)` — one evaluation per user per proposal; re-submission is an upsert (update in place)
+
+**Indexes:** `(user_id, proposal_type)`, `(thread_decision_id)`, `(matchmaker_proposal_id)`
+
+**Relationship to ProposalReview:** `ProposalReview` drives the agent-blocking workflow (1–4 scale, one row per agent per proposal). `PiProposalEvaluation` is a research-quality instrument for the PI's own assessment (NIH 1–9 scale, one row per PI per proposal). The two systems evolve independently.
+
 ### EmailNotification
 
 Tracks each proposal notification email sent. See `email-proposal-review.md` for full spec.
diff --git a/specs/labbot-matchmaker.md b/specs/labbot-matchmaker.md
new file mode 100644
index 0000000..2d4d7a4
--- /dev/null
+++ b/specs/labbot-matchmaker.md
@@ -0,0 +1,247 @@
+# LabBot Matchmaker Specification
+
+## Overview
+
+The Matchmaker is an alternative pathway for generating collaboration proposals between two PIs without running the multi-agent simulation. An admin selects two PIs from dropdowns; a single LLM call reads both their public and private profiles and produces a proposal of identical quality and format to those generated by the agent dialogue system. The output is stored and displayed in a new **Matchmaker** tab in the admin dashboard.
+
+This is complementary to the agent system — not a replacement. It is useful for:
+- Quickly generating proposals on demand before a simulation run
+- Testing profile quality in isolation
+- Generating proposals for PIs who don't yet have active agents
+
+---
+
+## Admin UI (`/admin/matchmaker`)
+
+### Layout
+
+A new tab in the admin nav alongside "Discussions".
+
+**Top section — Generate form:**
+
+```
+[ PI A dropdown ▾ ]    [ PI B dropdown ▾ ]    [ Generate Proposal ]
+```
+
+Both dropdowns list all users who have a complete `ResearcherProfile`. Sorted alphabetically by name. The same user cannot be selected in both dropdowns (client-side enforcement — disable the selected user in the other dropdown).
+
+The **Generate Proposal** button is disabled until both PIs are selected. On click it POSTs to `/admin/matchmaker/generate` and shows an inline spinner while the LLM call runs (typically 5–15 seconds).
+
+**Main section — Proposals table:**
+
+Same visual style as `/admin/discussions`.
+
+| Column | Notes |
+|---|---|
+| Date/time | When generated |
+| PI A | Name |
+| PI B | Name |
+| Confidence | `High` / `Moderate` / `Speculative` badge (color-coded: green/yellow/gray) |
+| Title | Proposal title (taken from the first `# heading` of the proposal) |
+| Actions | View · Delete |
+
+**Filters:**
+- PI filter (multi-select, filters rows where either PI matches)
+- Confidence filter
+
+**Export:** Each proposal row has an HTML and plain-text export link, same as Discussions.
+
+### Proposal Detail View (`/admin/matchmaker/{id}`)
+
+Full-page view of a single proposal. Sections mirror the proposal format (see Output Format below). Includes:
+- Header: PI A, PI B, confidence label, generated timestamp
+- Full proposal body rendered as markdown
+- "Back to Matchmaker" link
+
+---
+
+## Backend
+
+### New Route: `POST /admin/matchmaker/generate`
+
+**Request body (form):** `pi_a_id`, `pi_b_id` (user UUIDs)
+
+**Steps:**
+1. Load `ResearcherProfile` for both users (including `private_profile_md`).
+2. Load recent publications for both users (up to 20, sorted by year desc).
+3. Call `generate_matchmaker_proposal(profile_a, profile_b, pubs_a, pubs_b)` — see LLM Pipeline below.
+4. Parse LLM output, extract confidence label.
+5. Insert a `MatchmakerProposal` row.
+6. Redirect to `/admin/matchmaker` (or return JSON for HTMX — see implementation note below).
+
+**Error handling:** If either user lacks a complete profile, return a 400 with an inline error message above the form: "PI A / PI B does not have a complete profile yet."
+
+### New Route: `GET /admin/matchmaker`
+
+Renders the tab with the generate form and proposals table.
+
+### New Route: `GET /admin/matchmaker/{id}`
+
+Renders the proposal detail view.
+
+### New Route: `POST /admin/matchmaker/{id}/delete`
+
+Deletes the proposal row. Redirects back to `/admin/matchmaker`. (HTML forms do not support `DELETE`; a POST sub-resource is used instead.)
+
+---
+
+## Data Model
+
+### MatchmakerProposal
+
+| Field | Type | Notes |
+|---|---|---|
+| id | uuid | Primary key |
+| pi_a_id | FK → User | |
+| pi_b_id | FK → User | |
+| proposal_md | text | Full proposal in markdown |
+| title | text | Extracted first heading from proposal_md |
+| confidence | string(20) | `high` / `moderate` / `speculative` |
+| llm_model | string | Model used (e.g. `claude-opus-4-7`) |
+| input_tokens | integer | |
+| output_tokens | integer | |
+| generated_at | timestamp | |
+
+`pi_a_id` and `pi_b_id` are stored in canonical order (lower UUID first) so that a given pair of PIs always maps to the same column ordering, which keeps duplicate detection unambiguous. The UI always shows them in name-alphabetical order regardless.
+
+---
+
+## LLM Pipeline
+
+### Model
+
+`claude-opus-4-7` — same model used for Phase 4 agent replies.
+
+### Prompt (`prompts/matchmaker.md`)
+
+```
+You are evaluating a potential research collaboration between two PIs.
+
+Your task is to produce a high-quality collaboration proposal that meets the
+Collaboration Quality Standards below.
+
+---
+## Collaboration Quality Standards
+
+[Verbatim content from agent-system.md § "Collaboration Quality Standards"]
+
+---
+## PI A: {name_a}
+
+### Public Profile
+{public_profile_a}
+
+### Private Instructions (confidential — do not quote directly)
+{private_profile_a}
+
+### Recent Publications
+{publications_a}
+
+---
+## PI B: {name_b}
+
+### Public Profile
+{public_profile_b}
+
+### Private Instructions (confidential — do not quote directly)
+{private_profile_b}
+
+### Recent Publications
+{publications_b}
+
+---
+## Instructions
+
+Produce a collaboration proposal using the output format below. Apply the
+Collaboration Quality Standards strictly. If you cannot identify a High or
+Moderate confidence collaboration, produce a Speculative one and label it as such.
+
+Respect each PI's private instructions when framing the proposal: if a PI has
+expressed preferences for specific topics or partners, weight those angles
+positively. Do not quote or reveal any private instruction text in the output.
+```
+
+### Output Format
+
+The LLM output must follow this structure (identical to proposals generated by the agent dialogue system):
+
+```markdown
+# [Collaboration Title]
+
+**Confidence:** High | Moderate | Speculative
+
+## Scientific Rationale
+[2–3 paragraphs. Why these two labs? What does each bring that the other lacks?
+Name specific techniques, datasets, reagents, or model systems.]
+
+## True Complementarity
+- **PI A contributes:** [specific capabilities — not generic]
+- **PI B contributes:** [specific capabilities — not generic]
+- **Gap filled:** [what neither could do alone]
+
+## Concrete First Experiment
+[1 paragraph. Scoped to days-to-weeks. Names specific assays, methods,
+reagents, or datasets. Both labs are essential to execute it.]
+
+## Benefits to Each Lab
+- **PI A benefits:** [specific, non-generic]
+- **PI B benefits:** [specific, non-generic]
+
+## Open Questions / Next Steps
+[Bullet list of what would need to be confirmed before committing effort]
+```
+
+The output format is enforced by wrapping the final proposal in `<proposal>` tags (same pattern as `<slack_message>` in Phase 4). The parser extracts content inside those tags. The confidence label is parsed from the `**Confidence:**` line.
+
+---
+
+## Admin Dashboard Integration
+
+### Nav update (`admin-dashboard.md` §API Routes additions)
+
+| Route | Purpose |
+|---|---|
+| `GET /admin/matchmaker` | Matchmaker tab with generate form and proposals table |
+| `POST /admin/matchmaker/generate` | Run LLM pipeline and store result |
+| `GET /admin/matchmaker/{id}` | Proposal detail view |
+| `POST /admin/matchmaker/{id}/delete` | Delete a proposal |
+
+### Nav link
+
+Add **Matchmaker** between **Discussions** and **LLM Call Logs** in the admin sidebar. Show a count badge of total proposals (no filter).
+
+---
+
+## Relationship to Agent System
+
+| Dimension | Agent System | Matchmaker |
+|---|---|---|
+| Input | Multi-turn Slack dialogue | Public + private profiles and recent publications only |
+| Latency | Minutes to hours (simulation run) | ~10 seconds (single LLM call) |
+| Proposal quality standard | Collaboration Quality Standards | Identical |
+| Output format | Identical | Identical |
+| Private profile respected | Yes (agent's own) | Yes (both, read-only, not quoted) |
+| PI notification | Slack DM | None (admin-only tool) |
+| Stored in | `Proposal` table | `MatchmakerProposal` table |
+
+Proposals from both sources can be exported in the same HTML/plain-text format.
+
+---
+
+## Design Principles
+
+- **Admin-only.** The Matchmaker tab is only accessible to `is_admin = true` users. No self-service endpoint.
+- **Read-only for PIs.** PIs are not notified. Admins use this to explore matches and manually share results.
+- **No simulation dependency.** Works without any running agent containers or Slack tokens.
+- **Same quality bar.** The Collaboration Quality Standards section from `agent-system.md` is embedded verbatim in the matchmaker prompt. No relaxed criteria.
+- **Prompt caching.** The system prompt (quality standards + both profiles) is structured to maximize Anthropic prompt cache hits when the same pair is regenerated.
+
+---
+
+## PI Evaluation of Matchmaker Proposals
+
+Matchmaker proposals surface to PIs through the unified **Proposal Evaluations** tab (`/proposals`) alongside agent-generated proposals. The origin is not revealed to the PI in that view. PIs submit NIH-style 1–9 evaluations via the form at `/proposals/{token}/evaluate`.
+
+Evaluations are stored in `pi_proposal_evaluations` with `proposal_type = "matchmaker"` and `matchmaker_proposal_id` set. Admins can see the origin breakdown (agent vs. matchmaker) at `/admin/evaluations`. See `proposal-review-pi.md` for the full specification.
+
+**Note on CLI-created proposals:** Matchmaker proposals created via the CLI (which set `pi_a_name`/`pi_b_name` but leave `pi_a_id`/`pi_b_id` null) cannot be linked to a `user_id` and will not appear in the PI evaluation list. Admins should backfill the FK columns to include these proposals, or create them through the web UI form where FK resolution happens automatically.
diff --git a/specs/labbot-podcast.md b/specs/labbot-podcast.md
new file mode 100644
index 0000000..b6db1c1
--- /dev/null
+++ b/specs/labbot-podcast.md
@@ -0,0 +1,669 @@
+# LabBot Podcast Specification
+
+## Overview
+
+LabBot Podcast is a daily personalized research briefing service for researchers. It surfaces the single most relevant and impactful recent publication from the scientific literature based on the researcher's profile, generates a structured text summary highlighting findings and tools useful to their ongoing work, and produces a short audio episode via Mistral AI TTS. Researchers can subscribe to a personal RSS podcast feed to listen to the audio.
+
+The system runs once per day and requires no researcher interaction to be useful — but researchers can tune it through a web UI. There are two delivery paths:
+
+- **Agent path** — pilot-lab PIs with an approved `AgentRegistry` entry additionally receive the text summary as a Slack DM from their lab bot.
+- **User path** — any researcher who has completed ORCID onboarding and has a `ResearcherProfile` with a research summary receives the podcast automatically. No Slack bot, agent approval, or admin action required.
+
+---
+
+## Architecture
+
+### Service Placement
+
+LabBot Podcast runs as a separate Docker container (`podcast` service), mirroring the GrantBot pattern:
+- Long-running scheduler process
+- Executes once per calendar day at 9am UTC (1 hour after GrantBot)
+- If the container was down at the scheduled time, runs immediately on startup (catch-up)
+- State persisted in `data/podcast_state.json` (tracks which articles have been delivered per recipient — agent or user)
+
+### Delivery Paths
+
+| Path | Who | Profile source | Delivery | Audio/RSS key |
+|---|---|---|---|---|
+| **Agent** | Pilot-lab PIs with active `AgentRegistry` | `profiles/public/{agent_id}.md` (disk) | Slack DM + RSS | `agent_id` string |
+| **User** | Any ORCID user with completed `ResearcherProfile` | `ResearcherProfile` DB row (structured fields) | RSS only | `user_id` UUID |
+
+Both paths run in the same daily scheduler pass. A user who has both a `ResearcherProfile` and an active agent is handled only by the agent path (no duplicate episode).
+
+### Dependencies on Existing Systems
+
+| Existing component | How Podcast uses it |
+|---|---|
+| `ResearcherProfile` DB model | Source of research areas, keywords, techniques, disease areas for the user path |
+| `profiles/public/{lab}.md` | Profile text for the agent path (LLM article selection and summary) |
+| `src/services/pubmed.py` | Literature search (keyword + MeSH queries) |
+| `src/services/llm.py` | Article selection ranking and summary generation (all calls logged to `LlmCallLog`) |
+| `AgentRegistry` | Maps agent → PI → Slack bot token for DM delivery (agent path only) |
+| `User.id` (UUID) | Stable, opaque RSS feed token for the user path |
+| Slack bot DM | Text summary delivery (agent path only) |
+
+### New External Dependency
+
+**Mistral AI API** — text-to-speech generation.
+- Configured via `MISTRAL_API_KEY` environment variable
+- Voice selection per agent configured in `data/podcast_voices.json` (agent_id → voice_id); falls back to a default voice if not set
+- Audio files stored at `data/podcast_audio/{agent_id}/{YYYY-MM-DD}.mp3` (agent path) or `data/podcast_audio/users/{user_id}/{YYYY-MM-DD}.mp3` (user path)
+
+---
+
+## Daily Pipeline
+
+Each day the scheduler runs two loops in sequence:
+
+1. **Agent loop** — iterates over all active `AgentRegistry` entries and calls `run_pipeline_for_agent()` for each.
+2. **User loop** — iterates over all `User` rows where `onboarding_complete=True` and `profile.research_summary IS NOT NULL`, skipping any whose `user_id` appeared in the agent loop, and calls `run_podcast_for_user()` for each.
+
+For each recipient, the pipeline executes the following steps sequentially:
+
+### Step 1: Load Profile
+
+- **Agent path**: read `profiles/public/{agent_id}.md` from disk. If absent, skip.
+- **User path**: construct profile text from structured `ResearcherProfile` DB fields (`research_summary`, `disease_areas`, `techniques`, `experimental_models`, `keywords`). If `research_summary` is empty, skip.
+
+### Step 2: Build Search Queries
+
+Construct PubMed search terms from the profile:
+- Extract top research area keywords
+- Extract technique and experimental model terms
+- Combine into 2–3 PubMed query strings (e.g., `(proteostasis OR unfolded protein response) AND (neurodegeneration OR proteomics)`)
+- Inject any `extra_keywords` from `PodcastPreferences` as additional quoted terms
+- Limit to publications from the last 14 days (rolling window ensures coverage across weekend/holiday gaps)
+- Cap at 50 candidate abstracts
+
+### Step 3: Fetch Candidate Abstracts
+
+Use `src/services/pubmed.py` to execute each query and retrieve PMIDs + abstracts. Deduplicate across queries. Skip any PMID already in `podcast_state.json` for this recipient (agent or user) to prevent re-delivering the same article.
+
+### Step 4: LLM Article Selection (Sonnet)
+
+Single LLM call (Sonnet) with:
+- The researcher's full profile text (disk for agent path; constructed from DB for user path)
+- The list of candidate abstracts (title + abstract text, numbered)
+- Any journal preferences from `PodcastPreferences`
+- Prompt: `prompts/podcast-select.md`
+
+The LLM returns the index of the single best article, along with a one-sentence justification of why it is relevant to this researcher's ongoing work. If no article meets a minimum relevance threshold, it returns `null` and the pipeline skips delivery today.
+
+### Step 5: Generate Text Summary (Opus)
+
+One LLM call (Opus) with:
+- The researcher's full profile text
+- The selected article's title, abstract, and full text (fetched via `retrieve_full_text` if available in PMC, otherwise abstract only)
+- Prompt: `prompts/podcast-summarize.md`
+
+Output is a structured text summary (see format below). This is used as the TTS input and stored in `PodcastEpisode.text_summary`.
+
+### Step 6: Generate Audio (Mistral AI)
+
+Pass the text summary to the Mistral AI TTS API:
+- Voice: from `PodcastPreferences.voice_id`, or `MISTRAL_TTS_DEFAULT_VOICE`
+- Model: configurable via `MISTRAL_TTS_MODEL`
+- Output: MP3 file saved to:
+  - Agent path: `data/podcast_audio/{agent_id}/{YYYY-MM-DD}.mp3`
+  - User path: `data/podcast_audio/users/{user_id}/{YYYY-MM-DD}.mp3`
+- If TTS fails, the episode DB row is **not** written (see commit-last ordering); the run returns `False`.
+
+### Step 7: Deliver via Slack DM _(agent path only)_
+
+Send the text summary as a DM from the agent's Slack bot to its PI, appending the RSS feed URL. User-path episodes are delivered via RSS only — no Slack bot is required.
+
+### Step 8: Persist Episode and Update State
+
+1. Write the `PodcastEpisode` row to the DB:
+   - Agent path: `agent_id` set, `user_id` NULL
+   - User path: `user_id` set, `agent_id` NULL
+2. Append the delivered PMID to `data/podcast_state.json` (keyed by `agent_id` or `user_id`) to prevent re-delivery.
+
+---
+
+## Text Summary Format
+
+The Opus-generated summary follows a consistent structure. The prompt enforces this layout:
+
+```
+*Today's Research Brief — {Date}*
+
+*{Paper Title}*
+{Authors} · {Journal} · {Year}
+
+*What they found:*
+2–3 sentences on the core findings — specific results, effect sizes, or observations.
+
+*Key output:*
+1–2 sentences on any tool, method, dataset, or reagent released with the paper (if applicable). Omit this section if the paper has no distinct output.
+
+*Why this matters for your lab:*
+2–3 sentences connecting the paper's findings and outputs specifically to the PI's ongoing research areas, techniques, or open questions. Ground this in the PI's profile — name specific techniques, model systems, or questions from their work.
+
+*PubMed:* https://pubmed.ncbi.nlm.nih.gov/{PMID}/
+```
+
+The Slack DM appends a line at the bottom:
+> _Listen to the audio version: {rss_feed_url}_
+
+---
+
+## RSS Podcast Feed
+
+### Endpoints
+
+| Path | Auth | Key |
+|---|---|---|
+| `GET /podcast/{agent_id}/feed.xml` | None | Pilot-lab agent |
+| `GET /podcast/{agent_id}/audio/{date}.mp3` | None | Pilot-lab agent |
+| `GET /podcast/users/{user_id}/feed.xml` | None | Plain ORCID user |
+| `GET /podcast/users/{user_id}/audio/{date}.mp3` | None | Plain ORCID user |
+
+All four endpoints are public and unauthenticated. The `user_id` UUID is opaque and acts as a stable, subscribable feed token — equivalent to a private podcast URL. Users retrieve their feed URL from the `/podcast/settings` page.
+
+### Feed Structure
+
+Standard RSS 2.0 with iTunes podcast extensions (identical structure for both paths):
+
+```xml
+<rss version="2.0" xmlns:itunes="http://www.itunes.com/dtds/podcast-1.0.dtd">
+  <channel>
+    <title>{Name} — LabBot Research Briefings</title>
+    <description>Daily personalized research summaries for {Name}.</description>
+    <link>{feed_url}</link>
+    <itunes:author>{Name}</itunes:author>
+    <itunes:category text="Science"/>
+    <item>
+      <title>{Paper Title} — {Date}</title>
+      <description>{text summary}</description>
+      <enclosure url="{audio_url}" type="audio/mpeg" length="{file_size}"/>
+      <pubDate>{RFC 822 date}</pubDate>
+      <guid>{agent_id|user-{user_id}}-{YYYY-MM-DD}</guid>
+      <itunes:duration>{duration}</itunes:duration>
+    </item>
+    ...
+  </channel>
+</rss>
+```
+
+### Audio File Storage
+
+| Path | Audio directory |
+|---|---|
+| Agent path | `data/podcast_audio/{agent_id}/{YYYY-MM-DD}.mp3` |
+| User path | `data/podcast_audio/users/{user_id}/{YYYY-MM-DD}.mp3` |
+
+Files are streamed with `Content-Type: audio/mpeg`.
+
+---
+
+## LLM Prompt Files
+
+Two new prompt files in `prompts/`:
+
+### `prompts/podcast-select.md`
+
+Instructs the LLM to act as a literature triage assistant for a specific PI. It receives:
+- The PI's public profile (research areas, techniques, open questions, unique capabilities)
+- Numbered list of candidate abstracts (title + abstract)
+
+It must return:
+- The number of the most relevant article, or `null` if none clears the relevance bar
+- A one-sentence justification referencing a specific aspect of the PI's profile
+
+Key instructions in the prompt:
+- Relevance is defined as: the paper's findings or outputs could plausibly accelerate or inform a specific aspect of the PI's ongoing work
+- Recency alone is not sufficient — the connection must be specific
+- Prefer papers that release a tool, method, dataset, or reagent alongside findings
+- Do not pick review articles or editorials
+
+### `prompts/podcast-summarize.md`
+
+Instructs the LLM to act as a science communicator writing for a specific PI. It receives:
+- The PI's public profile
+- Full paper text (or abstract if full text unavailable)
+
+It must produce the structured summary described above. Key instructions:
+- The "Why this matters for your lab" section must name specific techniques, model systems, or open questions from the PI's profile — no generic connections
+- Tone is like a knowledgeable postdoc briefing their PI: specific, direct, no filler
+- The "Key output" section is only included if the paper releases a concrete artifact (tool, code, dataset, method, reagent); skip it otherwise
+- Target length: ~250 words total
+
+---
+
+## Data Model
+
+### `PodcastEpisode`
+
+Rows are keyed by either `agent_id` (string) or `user_id` (UUID FK to `users.id`). Exactly one should be set per row.
+
+```python
+class PodcastEpisode(Base):
+    __tablename__ = "podcast_episodes"
+
+    id: Mapped[uuid.UUID] = mapped_column(primary_key=True, default=uuid.uuid4)
+    agent_id: Mapped[str | None] = mapped_column(String(50), nullable=True, index=True)
+    user_id: Mapped[uuid.UUID | None] = mapped_column(UUID, ForeignKey("users.id"), nullable=True, index=True)
+    episode_date: Mapped[date] = mapped_column(Date, nullable=False)
+    pmid: Mapped[str] = mapped_column(String(100), nullable=False)
+    paper_title: Mapped[str] = mapped_column(String(500), nullable=False)
+    paper_authors: Mapped[str] = mapped_column(String(500), nullable=False)
+    paper_journal: Mapped[str] = mapped_column(String(255), nullable=False)
+    paper_year: Mapped[int] = mapped_column(Integer, nullable=False)
+    paper_url: Mapped[str | None] = mapped_column(String(1000), nullable=True)
+    text_summary: Mapped[str] = mapped_column(Text, nullable=False)
+    audio_file_path: Mapped[str | None] = mapped_column(String(500), nullable=True)
+    audio_duration_seconds: Mapped[int | None] = mapped_column(Integer, nullable=True)
+    slack_delivered: Mapped[bool] = mapped_column(Boolean, default=False)
+    selection_justification: Mapped[str] = mapped_column(Text, nullable=False)
+    created_at: Mapped[datetime] = mapped_column(DateTime(timezone=True), server_default=func.now())
+
+    __table_args__ = (
+        # Agent-path: one episode per agent per day
+        UniqueConstraint("agent_id", "episode_date", name="uq_podcast_agent_date"),
+        # User-path: enforced by partial unique index (migration 0013):
+        # CREATE UNIQUE INDEX ix_podcast_episodes_user_date
+        #   ON podcast_episodes (user_id, episode_date) WHERE user_id IS NOT NULL
+    )
+```
+
+### `PodcastPreferences`
+
+Rows are keyed by either `agent_id` or `user_id`. Both columns are nullable and uniquely indexed.
+
+```python
+class PodcastPreferences(Base):
+    __tablename__ = "podcast_preferences"
+
+    id: Mapped[uuid.UUID] = mapped_column(primary_key=True, default=uuid.uuid4)
+    agent_id: Mapped[str | None] = mapped_column(String(50), nullable=True, unique=True, index=True)
+    user_id: Mapped[uuid.UUID | None] = mapped_column(UUID, ForeignKey("users.id"), nullable=True, unique=True, index=True)
+    voice_id: Mapped[str | None] = mapped_column(String(100), nullable=True)
+    extra_keywords: Mapped[list[str]] = mapped_column(ARRAY(String), server_default="{}")
+    preferred_journals: Mapped[list[str]] = mapped_column(ARRAY(String), server_default="{}")
+    deprioritized_journals: Mapped[list[str]] = mapped_column(ARRAY(String), server_default="{}")
+    updated_at: Mapped[datetime] = mapped_column(DateTime(timezone=True), server_default=func.now(), onupdate=func.now())
+```
+
+### State File (`data/podcast_state.json`)
+
+Keyed separately for agents and users:
+
+```json
+{
+  "agents": {
+    "<agent_id>": { "delivered_pmids": ["12345", "67890"] }
+  },
+  "users": {
+    "<user_id UUID string>": { "delivered_pmids": ["11111"] }
+  },
+  "last_run_date": "2026-04-14"
+}
+```
+
+The state file is a lightweight deduplication cache. The DB is the authoritative record for RSS generation and admin visibility.
+
+### Alembic Migrations
+
+| Migration | Creates / alters |
+|---|---|
+| `0010_add_podcast_episodes.py` | `podcast_episodes` table (agent path) |
+| `0011_add_podcast_paper_url.py` | `paper_url` column |
+| `0012_add_podcast_preferences.py` | `podcast_preferences` table (agent path) |
+| `0013_podcast_user_support.py` | `user_id` FK on both tables; make `agent_id` nullable; partial unique index for user-path episodes |
+
+---
+
+## Configuration
+
+New environment variables:
+
+| Variable | Required | Description |
+|---|---|---|
+| `MISTRAL_API_KEY` | Yes (for audio) | Mistral AI API key |
+| `MISTRAL_TTS_MODEL` | No | TTS model ID (default: `mistral-tts-latest`) |
+| `MISTRAL_TTS_DEFAULT_VOICE` | No | Default voice when no per-agent override exists |
+| `PODCAST_BASE_URL` | Yes | Public base URL for RSS enclosure links (e.g., `https://copi.science`) |
+| `PODCAST_SEARCH_WINDOW_DAYS` | No | Rolling search window in days (default: `14`) |
+| `PODCAST_MAX_CANDIDATES` | No | Max PubMed abstracts per agent per day (default: `50`) |
+
+Per-agent voice overrides (Phase 2/3): `data/podcast_voices.json`
+```json
+{
+  "su": "alex",
+  "wiseman": "stella"
+}
+```
+**Deprecated in Phase 4** — voice preferences move to the `podcast_preferences` DB table. The JSON file is still read as a fallback while the migration is in progress.
+
+---
+
+## Docker Service
+
+Add `podcast` service to `docker-compose.yml` and `docker-compose.prod.yml`:
+
+```yaml
+podcast:
+  build: .
+  command: python -m src.podcast.main
+  env_file: .env
+  volumes:
+    - ./data:/app/data
+  depends_on:
+    - postgres
+  profiles:
+    - podcast
+```
+
+Run with: `docker compose --profile podcast up -d podcast`
+
+---
+
+## Module Structure
+
+```
+src/podcast/
+├── main.py          # Scheduler entry point (APScheduler, same pattern as grantbot.py)
+├── pipeline.py      # Per-agent pipeline (steps 1–8 above)
+├── pubmed_search.py # Query builder from ResearcherProfile
+├── mistral_tts.py   # Mistral AI TTS client wrapper
+├── rss.py           # RSS feed builder (reads from DB)
+└── state.py         # podcast_state.json read/write helpers
+
+src/routers/podcast.py   # FastAPI routes: /podcast/{agent_id}/feed.xml, /podcast/{agent_id}/audio/{date}.mp3
+```
+
+The scheduler in `src/podcast/main.py` follows the same catch-up-on-startup pattern as `src/agent/grantbot.py`:
+1. On startup, read the last run date (`last_run_date`) from `data/podcast_state.json`
+2. If last run was before today's 9am UTC, run immediately
+3. Schedule next run at 9am UTC
+
+---
+
+## Admin Dashboard Integration
+
+Add a **Podcast** tab to the existing admin dashboard (`src/routers/admin.py` + `templates/admin.html`) showing:
+- Table of recent episodes: agent, date, paper title, PMID, Slack delivered (yes/no), audio generated (yes/no)
+- Link to each agent's RSS feed
+- LLM call counts and token usage for the podcast pipeline (pulled from `LlmCallLog` filtered by `source = "podcast"`)
+
+The LLM calls from the podcast pipeline should set a `source` tag in `LlmCallLog` (add a `source` column via migration if not already present, or use the existing `extra_metadata` JSONB field).
+
+---
+
+## PI Customization
+
+### Via Standing Instructions (Current)
+
+PIs can adjust podcast behavior through standing instructions to their lab bot (same DM mechanism as the agent system — see `pi-interaction.md`). The podcast pipeline reads the private profile when building the selection prompt.
+
+Examples of effective standing instructions:
+- "For my daily podcast, focus only on papers that release a new tool or dataset — I don't need summaries of pure wet-lab findings"
+- "Prioritize papers from computational biology journals for the podcast"
+- "Skip anything about C. elegans — we're not pursuing that direction anymore"
+
+The bot's private profile rewrite (via `prompts/pi-profile-rewrite.md`) should include a `## Podcast Preferences` section that the podcast pipeline reads when constructing the selection and summarization prompts.
+
+### Via Preferences UI (Phase 4)
+
+A structured preferences page at `/agent/{agent_id}/podcast-settings` replaces the `data/podcast_voices.json` file and augments the standing-instructions mechanism with three explicit controls:
+
+1. **Voice** — select the TTS voice used for audio generation
+2. **Extra search keywords** — additional terms appended to PubMed/preprint queries beyond the auto-extracted profile keywords
+3. **Source preferences** — journals or preprint servers to prioritize (boosted in the selection prompt) or deprioritize
+
+See the **Podcast Preferences UI** section below for the full design.
+
+---
+
+## User Opt-In / Opt-Out
+
+### Default State
+
+Podcast generation is **disabled by default** for all plain ORCID users. An eligible user (onboarded with a completed profile) must explicitly opt in from the `/podcast/settings` page before any episode is generated for them. This prevents unsolicited audio generation for users who signed up but have not engaged with the feature.
+
+The agent path is unaffected — pilot-lab agents are always enabled as long as their `AgentRegistry.status == "active"`. Only the user path is gated by the opt-in flag.
+
+### Storage
+
+The opt-in flag is stored as `podcast_enabled: bool` on the `PodcastPreferences` row, defaulting to `False`. Because `PodcastPreferences` is created on first save, the scheduler treats both "no row exists" and "`podcast_enabled = False`" as disabled.
+
+```python
+class PodcastPreferences(Base):
+    ...
+    podcast_enabled: Mapped[bool] = mapped_column(Boolean, nullable=False, default=False, server_default="false")
+```
+
+Migration: `0022_add_podcast_enabled.py` adds `podcast_enabled BOOLEAN NOT NULL DEFAULT false` to `podcast_preferences`.
+
+### Enforcement Points
+
+| Location | Check |
+|---|---|
+| Daily scheduler (`src/podcast/main.py`) | Skip user unless `PodcastPreferences.podcast_enabled = True` |
+| On-demand trigger (`POST /podcast/user/generate`) | Return `403` unless user has `podcast_enabled = True` |
+
+The `_podcast_eligible()` helper in `src/routers/podcast.py` remains unchanged — it checks profile completeness only. The `podcast_enabled` flag is checked separately in the scheduler and on-demand endpoint.
+
+### Settings UI
+
+The `/podcast/settings` page shows the enable/disable toggle **at the top of the form**, before any other preferences. The feed URL card and all preference fields are always visible so users can inspect their URL and configure preferences before enabling. The toggle takes immediate effect on save.
+
+- **Disabled state**: toggle is off; the feed URL card notes that generation is paused.
+- **Enabled state**: toggle is on; generation runs in the daily scheduler at 9am UTC.
+
+### Alembic Migration
+
+```python
+# 0022_add_podcast_enabled.py
+def upgrade() -> None:
+    op.add_column(
+        "podcast_preferences",
+        sa.Column("podcast_enabled", sa.Boolean(), nullable=False, server_default="false"),
+    )
+
+def downgrade() -> None:
+    op.drop_column("podcast_preferences", "podcast_enabled")
+```
+
+---
+
+## Podcast Preferences UI
+
+### Route and Access Control
+
+| Route | Method | Handler | Access | Notes |
+|---|---|---|---|---|
+| `/agent/{agent_id}/podcast-settings` | `GET` | Render agent preferences form | Agent owner or admin | Agent path |
+| `/agent/{agent_id}/podcast-settings` | `POST` | Save agent preferences | Agent owner or admin | Agent path |
+| `/podcast/settings` | `GET` | Render user preferences form | Any authenticated user with completed profile | User path |
+| `/podcast/settings` | `POST` | Save user preferences | Any authenticated user with completed profile | User path |
+| `/podcast/user/generate` | `POST` | Trigger on-demand episode | Any authenticated user with completed profile | User path; returns `403` unless `podcast_enabled = True` |
+
+The agent-path routes remain in `src/routers/agent_page.py` with the same `get_agent_with_access()` ownership check. The user-path routes live in `src/routers/podcast.py` and use `get_current_user()` + a profile-completeness check (`onboarding_complete=True` and `profile.research_summary IS NOT NULL`).
+
+### User Feed URL
+
+After saving preferences or visiting `/podcast/settings`, the user sees their personal feed URL:
+
+```
+{PODCAST_BASE_URL}/podcast/users/{user.id}/feed.xml
+```
+
+This URL:
+- Requires no authentication to read (subscribe in any podcast app)
+- Is stable for the lifetime of the user account
+- Acts as an opaque token — hard to guess (it contains the user's UUID) and not publicly listed, but not a secret: anyone who has the URL can read the feed
+- Is displayed with a one-click copy button on the settings page
+
+### Form Fields
+
+#### 1. Voice Selection
+
+A `<select>` dropdown pre-populated with valid Mistral Voxtral voices. The current TTS model is `voxtral-mini-tts-latest`.
+
+Available voices for `voxtral-mini-tts-latest` (verify current list at [Mistral docs](https://docs.mistral.ai/capabilities/audio/#text-to-speech)):
+
+| Voice ID | Description |
+|---|---|
+| `alex` | US English, male, neutral |
+| `deedee` | US English, female, bright |
+| `jasmine` | US English, female, warm |
+| `laurel` | US English, female, clear |
+| `luna` | US English, female, soft |
+| `rio` | US English, male, energetic |
+| `stella` | US English, female, professional |
+| `theo` | US English, male, measured |
+| `tyler` | US English, male, conversational |
+
+> **Note:** This list should be refreshed from the Mistral API at deploy time. If Mistral exposes a `GET /v1/audio/voices` endpoint, the admin UI should call it to populate the dropdown dynamically. If not available, hardcode from the table above and update as the API evolves.
+
+The form shows a short audio preview label next to each voice name if available. The current agent's voice is pre-selected; if no voice is set, the first voice in the list is shown as the default.
+
+#### 2. Extra Search Keywords
+
+A plain `<textarea>` accepting one keyword or phrase per line. These are appended as additional quoted terms to the PubMed/preprint query in Step 1 of the pipeline.
+
+```
+insulin receptor substrate
+adipose tissue browning
+mitochondrial fission
+```
+
+Stored as `extra_keywords: list[str]` (each non-blank line becomes one entry). Max 20 entries, each up to 100 characters.
+
+#### 3. Source Preferences
+
+Two separate tag-input fields (or textareas, comma- or newline-separated):
+
+**Preferred sources** — journals or preprint servers to actively surface. Shown first in the selection-prompt candidate list and referenced explicitly in the prompt:
+> "Prefer papers from: {preferred_journals}. Give these extra weight when relevance is comparable."
+
+**Deprioritized sources** — journals or preprint servers to down-rank. Added as a negative signal in the selection prompt:
+> "Deprioritize papers from: {deprioritized_journals} unless exceptionally relevant."
+
+Examples:
+- Preferred: `Nature Methods`, `Cell Systems`, `bioRxiv`, `eLife`
+- Deprioritized: `Frontiers in ...`, `PLOS ONE`
+
+Stored as `preferred_journals: list[str]` and `deprioritized_journals: list[str]`.
+
+### Template
+
+`templates/agent/podcast_settings.html` — extends `base.html`, matches the visual style of `templates/agent/profile_edit.html`.
+
+Sections:
+1. **Voice** — `<select>` with voice options
+2. **Extra Keywords** — `<textarea>` with instructions
+3. **Source Preferences** — two `<textarea>` fields (preferred / deprioritized), comma or newline separated
+4. **Save button** — POSTs to the same URL, redirects back on success with a flash message
+
+### Pipeline Integration
+
+In `run_pipeline_for_agent()` (`src/podcast/pipeline.py`), after loading profile and preferences text:
+
+```python
+# Load structured preferences from DB
+prefs = await _load_podcast_preferences_structured(agent_id)  # returns PodcastPreferences | None
+
+# Step 2 (query building): inject extra_keywords
+if prefs and prefs.extra_keywords:
+    queries.extend(
+        f'"{kw}"' for kw in prefs.extra_keywords[:20]
+    )
+
+# Step 3 (article selection): inject journal preferences into selection prompt
+journal_context = ""
+if prefs and prefs.preferred_journals:
+    journal_context += f"\nPreferred sources: {', '.join(prefs.preferred_journals)}."
+if prefs and prefs.deprioritized_journals:
+    journal_context += f"\nDeprioritized sources: {', '.join(prefs.deprioritized_journals)}."
+# journal_context is appended to the {preferences} block in the selection prompt
+
+# Step 5 (TTS): use voice from preferences
+voice_override = prefs.voice_id if prefs else None
+# mistral_tts.get_voice() checks PodcastPreferences first, then podcast_voices.json, then env default
+```
+
+Add `_load_podcast_preferences_structured(agent_id)` as an async helper that queries `PodcastPreferences` and returns the ORM row or `None`.
+
+Update `mistral_tts.get_voice()` and `local_tts.get_voice()` to accept an optional `voice_override` parameter passed from the pipeline instead of reading from `podcast_voices.json` directly.
+
+### Admin Visibility
+
+The existing `/admin/podcast` page gets a **Preferences** column in the agent filter section: when an agent is selected, show a summary of its preferences (voice, keyword count, journal counts) with a link to the preferences page.
+
+---
+
+## Module Structure
+
+```
+src/podcast/
+├── main.py            # Scheduler: agent loop then user loop
+├── pipeline.py        # run_pipeline_for_agent() + run_podcast_for_user()
+├── pubmed_search.py   # Query builder from profile dict
+├── preprint_search.py # bioRxiv / medRxiv / arXiv search
+├── mistral_tts.py     # Mistral AI TTS client
+├── local_tts.py       # Local vLLM-Omni TTS client (optional)
+├── tts_utils.py       # ffmpeg loudnorm, duration extraction
+├── rss.py             # RSS feed builder (agent_id or user_id keyed)
+└── state.py           # podcast_state.json helpers (agent + user variants)
+
+src/routers/podcast.py     # All podcast HTTP endpoints
+templates/
+├── agent/podcast_settings.html   # Agent-path preferences UI
+└── podcast_settings.html          # User-path preferences UI (+ feed URL card)
+```
+
+---
+
+## Rollout Phases
+
+### Phase 1: Text-only delivery _(complete)_
+- PubMed search, LLM selection, Opus summarization
+- Slack DM delivery
+- `PodcastEpisode` DB table and admin visibility
+- No audio, no RSS
+
+### Phase 2: Audio + RSS _(complete)_
+- Mistral AI TTS integration
+- Audio file storage and streaming endpoint
+- RSS feed generation and `/podcast/{agent_id}/feed.xml` endpoint
+- Per-agent voice configuration
+
+### Phase 3: PI customization surface _(complete)_
+- Podcast preferences section in private profile
+- Pipeline reads preferences when building prompts
+- Admin dashboard podcast tab with LLM usage metrics
+
+### Phase 4: Structured Preferences UI _(complete)_
+- `PodcastPreferences` DB table (migration `0012`)
+- `GET/POST /agent/{agent_id}/podcast-settings` route and form
+- Voice picker, extra keywords, source preferences
+- Deprecate `data/podcast_voices.json` in favour of DB-stored voice preference
+
+### Phase 5: Open Access for Plain ORCID Users _(implemented in migration 0013)_
+- **Goal**: any researcher who signs in with ORCID, completes their profile, and opts in at `/podcast/settings` receives daily podcast briefings — no agent approval, no Slack bot required.
+- **Schema**: migration `0013` adds `user_id` FK to `podcast_preferences` and `podcast_episodes`; makes `agent_id` nullable in both tables; adds partial unique index for user-path episodes.
+- **Pipeline**: `run_podcast_for_user(user_id, db_session)` in `src/podcast/pipeline.py` — loads profile from `ResearcherProfile` DB row (no disk file), queries PubMed/preprints, selects article, generates audio, and persists a `PodcastEpisode` keyed by `user_id`.
+- **Scheduler**: `src/podcast/main.py` runs the user loop after the agent loop; users whose `user_id` appears in an active `AgentRegistry` row are skipped (covered by agent path).
+- **Endpoints** (all in `src/routers/podcast.py`):
+  - `GET /podcast/users/{user_id}/feed.xml` — public RSS feed
+  - `GET /podcast/users/{user_id}/audio/{date}.mp3` — audio streaming
+  - `GET /podcast/settings` — preferences UI (auth-gated)
+  - `POST /podcast/settings` — save preferences (auth-gated)
+  - `POST /podcast/user/generate` — on-demand episode trigger (auth-gated)
+- **State**: `data/podcast_state.json` gains a `"users"` section keyed by user_id UUID strings.
+- **Eligibility gate**: `user.onboarding_complete == True` and `profile.research_summary IS NOT NULL`. Users who have not yet built their profile are silently skipped.
+- **Opt-in gate**: generation only runs for users with `PodcastPreferences.podcast_enabled = True`. Users who have not explicitly enabled the podcast via `/podcast/settings` are skipped even if they are otherwise eligible. See **User Opt-In / Opt-Out** section.
+
+---
+
+## Out of Scope
+
+- Real-time or on-demand article requests from non-authenticated callers
+- Multi-article episodes (one article per day, selected by the LLM as the single most relevant)
+- Full-text audio of the paper itself (summary only)
+- Publicly listed or shared RSS feeds (each feed URL is personal and opaque)
+- Push notifications or mobile app integration
+- Email delivery of the text summary (RSS + audio only for the user path)
diff --git a/specs/local_message_mode.md b/specs/local_message_mode.md
new file mode 100644
index 0000000..c259c2b
--- /dev/null
+++ b/specs/local_message_mode.md
@@ -0,0 +1,156 @@
+# Local Message Mode Specification
+
+## Overview
+
+Local Message Mode allows the agent simulation to run entirely without Slack — agents communicate through the local PostgreSQL database instead. All inter-agent conversations, channel history, and message delivery are handled via a `local_messages` table. The web app, podcast pipeline, profile pipeline, and all other subsystems are unaffected.
+
+This mode is useful for:
+- Developing and testing agent logic without Slack credentials or live bots
+- Running offline/CI simulations against the full agent reasoning stack
+- Replaying or resuming simulations that are fully self-contained in the database
+- Evaluating agent output (proposals, LLM call logs) without a Slack workspace
+
+It is activated by a single environment variable: `LOCAL_MODE=true`.
+
+---
+
+## Current Slack Dependency — What Changes
+
+The simulation currently uses Slack for four things:
+
+| Role | Current (Slack) | Local Mode Substitute |
+|---|---|---|
+| Message delivery | `chat.postMessage` | INSERT into `local_messages` |
+| Channel history (startup rebuild) | `conversations.history` + `conversations.replies` | SELECT from `local_messages` |
+| Incremental polling (each turn) | `conversations.history` cursor polling | SELECT from `local_messages` WHERE `ts > cursor` |
+| PI input (DMs, channel mentions) | `conversations.history` on DM channels | Disabled (no human PIs in local mode) |
+
+Everything else — Phase 2/4/5 LLM logic, Anthropic tool use, `agent_messages`, `llm_call_logs`, `thread_decisions`, `proposal_reviews` DB writes — is **unchanged**.
+
+### What is NOT currently stored in the database
+
+The main gap: **message content**. The existing `agent_messages` table stores only metadata (`agent_id`, `channel_id`, `message_ts`, `phase`, `message_length`) — not the actual message text. Message text lives only on Slack (and in-memory in `MessageLog`, which is rebuilt from Slack on every restart). Local mode closes this gap by adding a `local_messages` table that stores full content.
+
+---
+
+## Database: `local_messages` Table
+
+New table added via Alembic migration `0019_add_local_messages.py`.
+
+| Column | Type | Notes |
+|---|---|---|
+| `id` | UUID PK | `gen_random_uuid()` |
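+| `ts` | TEXT UNIQUE NOT NULL | Synthetic timestamp string that plays the role of Slack's `ts` (`datetime.utcnow().isoformat()`; ISO-8601 text rather than Slack's epoch-seconds format, but it still orders chronologically under string comparison) — used as the canonical message ID throughout the system |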
+| `channel_id` | TEXT NOT NULL | Synthetic channel ID (e.g. `"local-general"`) |
+| `channel_name` | TEXT NOT NULL | Human-readable channel name (e.g. `"general"`) |
+| `sender_agent_id` | TEXT | Null for future human/PI messages |
+| `sender_name` | TEXT NOT NULL | Bot display name |
+| `content` | TEXT NOT NULL | Full message text |
+| `thread_ts` | TEXT | Null = top-level post; otherwise = `ts` of the parent post |
+| `is_bot` | BOOLEAN NOT NULL DEFAULT TRUE | |
+| `simulation_run_id` | INTEGER FK → `simulation_runs` | |
+| `created_at` | TIMESTAMPTZ DEFAULT NOW() | |
+
+Indexes: `(channel_id, ts)`, `(channel_id, thread_ts)`.
+
+---
+
+## New Component: `LocalMessageClient`
+
+File: `src/agent/local_client.py`
+
+A drop-in substitute for `AgentSlackClient` (`src/agent/slack_client.py`). Implements the same method signatures so `SimulationEngine` needs no changes to its agent-facing logic.
+
+| `AgentSlackClient` method | `LocalMessageClient` behaviour |
+|---|---|
+| `connect()` / `auth_test()` | No-op; returns synthetic `{"user_id": agent_id, "user": bot_name}` |
+| `post_message(channel_id, text, thread_ts)` | INSERT into `local_messages`; return `{"ts": synthetic_ts}` |
+| `get_full_channel_history(channel_id)` | SELECT WHERE `channel_id = ? AND thread_ts IS NULL ORDER BY ts` |
+| `get_all_thread_replies(channel_id, thread_ts)` | SELECT WHERE `channel_id = ? AND thread_ts = ? ORDER BY ts` |
+| `poll_channel_messages(channel_id, oldest)` | SELECT WHERE `channel_id = ? AND ts > oldest ORDER BY ts` |
+| `get_thread_replies(channel_id, thread_ts, oldest)` | SELECT WHERE `channel_id = ? AND thread_ts = ? AND ts > oldest ORDER BY ts` |
+| `list_channels()` | Return static `{name: synthetic_id}` dict from seeded channel list |
+| `create_channel(name)` | No-op; return synthetic channel ID |
+| `join_channel(channel_id)` | No-op |
+| `open_dm_channel(user_id)` | No-op; return dummy ID |
+| `send_dm(channel_id, text)` | Log to stdout only |
+| `resolve_user_name(user_id)` | Return `user_id` unchanged |
+| `is_bot_user(user_id)` | Return `True` if `user_id` matches any known `agent_id` |
+
+---
+
+## Changes to `SimulationEngine` (`src/agent/simulation.py`)
+
+### Client instantiation (`__init__`)
+
+```python
+if settings.local_mode:
+    client = LocalMessageClient(agent_id, db_session, simulation_run_id)
+else:
+    client = AgentSlackClient(bot_token, app_token)
+```
+
+### `_rebuild_state()` (rename from `_rebuild_state_from_slack`)
+
+Add a branch: if `local_mode`, populate `MessageLog` by querying `LocalMessageClient` (which reads from `local_messages`) using the exact same loop currently used for Slack. The `MessageLog.append()` call and all downstream state reconstruction (`active_threads`, `pending_proposals`, `_closed_thread_ids`) are unchanged.
+
+### `_ensure_seeded_channels()`
+
+If `local_mode`, skip `conversations.list` / `conversations.create` / `conversations.join`. Populate `_channel_id_map` from a static dict using synthetic IDs (e.g. `{"general": "local-general", ...}`).
+
+### `_poll_slack_for_pi_messages()` and `_poll_pi_dms()`
+
+Gate both behind `if not settings.local_mode`. In local mode there are no human PIs sending messages, so these polling loops are skipped entirely.
+
+---
+
+## Config (`src/config.py`)
+
+```python
+local_mode: bool = False  # Run simulation without Slack; all messages stored in local_messages table
+```
+
+`.env.example` addition:
+
+```
+LOCAL_MODE=false
+```
+
+---
+
+## What Is Unchanged
+
+- All Phase 2, 4, and 5 LLM reasoning and prompt logic
+- Anthropic tool use in Phase 4 (`retrieve_profile`, `retrieve_abstract`, `retrieve_full_text`, `retrieve_foa`)
+- All DB writes: `agent_messages`, `llm_call_logs`, `thread_decisions`, `proposal_reviews`, `pi_proposal_evaluations`
+- `MessageLog` class interface (`src/agent/message_log.py`)
+- `Agent`, `AgentState`, `PIHandler` classes (PI handling simply becomes a no-op)
+- Web app, admin dashboard, podcast pipeline, worker, GrantBot
+
+---
+
+## Files to Create / Modify
+
+| File | Action |
+|---|---|
+| `alembic/versions/0019_add_local_messages.py` | Create — new migration |
+| `src/agent/local_client.py` | Create — `LocalMessageClient` class |
+| `src/agent/simulation.py` | Modify — client injection, `_rebuild_state()` branch, gate PI polling, `_ensure_seeded_channels()` branch |
+| `src/config.py` | Modify — add `local_mode: bool = False` |
+| `.env.example` | Modify — add `LOCAL_MODE=false` |
+
+---
+
+## Verification
+
+1. Set `LOCAL_MODE=true` in `.env`
+2. Apply migration: `docker compose exec app alembic upgrade head`
+3. Start simulation: `docker compose --profile agent run -d --name agent-run agent python -m src.agent.main --budget 10`
+4. Confirm messages are written:
+   ```sql
+   SELECT sender_name, channel_name, LEFT(content, 80), thread_ts
+   FROM local_messages ORDER BY created_at LIMIT 20;
+   ```
+5. Confirm proposals are recorded: `SELECT * FROM thread_decisions;`
+6. Confirm LLM calls are logged: `SELECT agent_id, model, input_tokens FROM llm_call_logs LIMIT 10;`
+7. Stop and restart the agent container; confirm simulation resumes correctly by reading history from `local_messages` without needing Slack
diff --git a/specs/pi-interaction.md b/specs/pi-interaction.md
index fd63266..7681603 100644
--- a/specs/pi-interaction.md
+++ b/specs/pi-interaction.md
@@ -158,6 +158,16 @@ Every time a bot reaches a conclusion in a thread — either a :memo: proposal o
 - DM includes: what was confirmed and a link
 - Example: "I confirmed WisemanBot's proposal in #drug-repurposing for a joint study on HRI activators. [thread link]"
 
+## Web UI: Proposal Evaluations Tab
+
+PIs can evaluate all collaboration proposals that involve them — from both the agent simulation and the Matchmaker — through a dedicated tab at `/proposals` on the coPI web app.
+
+The list merges both proposal sources and randomizes row order on each load so the origin is not inferable from position. Each proposal links to a structured evaluation form using the NIH 1–9 scoring scale (Exceptional → Poor) across five criteria: Significance, Innovation, Approach, Investigators, and Environment, plus an overall Impact score.
+
+These evaluations are stored in `pi_proposal_evaluations` and are separate from the 1–4 agent-blocking review in `proposal_reviews`. The proposal review system described elsewhere in this document (which blocks the agent from posting until reviewed) remains unchanged. The `/proposals` tab is a parallel, research-quality instrument.
+
+See `proposal-review-pi.md` for the complete specification.
+
 ## Implementation Priority
 
 ### Phase 1: DM Instructions + Tag-to-Engage
diff --git a/specs/proposal-review-pi.md b/specs/proposal-review-pi.md
new file mode 100644
index 0000000..6bfa9a4
--- /dev/null
+++ b/specs/proposal-review-pi.md
@@ -0,0 +1,492 @@
+# PI Proposal Evaluation Specification
+
+## Overview
+
+PIs receive collaboration proposals through two independent pathways: the multi-agent Slack simulation (`ThreadDecision`) and the admin-initiated Matchmaker (`MatchmakerProposal`). This feature surfaces all proposals involving a given PI in a single unified list and provides a structured evaluation form using NIH-style 1–9 scoring. The origin of each proposal (agent vs. matchmaker) is never revealed to the evaluator; row order is randomized on each page load to further obscure provenance.
+
+Evaluations are stored in a new `pi_proposal_evaluations` table, separate from the existing `proposal_reviews` table (the 1–4 agent-blocking system). The two systems coexist independently — a PI may submit an evaluation here without affecting or replacing the 1–4 agent review workflow.
+
+---
+
+## New Page: Proposal Evaluations (`/proposals`)
+
+### Access Control
+
+- Requires an authenticated user with `access_status = "allowed"`.
+- Admins see proposals for all users (optional; admin-facing views are described under "Admin Page: PI Proposal Evaluations" below). Regular users see only proposals in which they appear as PI A or PI B.
+
+### Route
+
+```
+GET /proposals
+```
+
+A top-level nav entry alongside the agent dashboard link. Not nested under `/agent/{agent_id}/` because it is user-level (not per-agent) and aggregates both proposal types.
+
+---
+
+### Proposal List
+
+#### Data Query
+
+Fetch two sets of proposals for `current_user.id`, then merge:
+
+**Agent proposals** — `ThreadDecision` where `outcome = "proposal"` and:
+```
+agent_a ∈ {agent_ids for current_user}   OR
+agent_b ∈ {agent_ids for current_user}
+```
+Join `AgentRegistry` on `agent_id → user_id` to resolve ownership.
+
+**Matchmaker proposals** — `MatchmakerProposal` where:
+```
+pi_a_id = current_user.id   OR
+pi_b_id = current_user.id
+```
+
+Merge both sets into a single list. Assign each item a stable `display_type` of `"agent"` or `"matchmaker"` for internal routing only — never rendered in the UI.
+
+#### Row Order
+
+Shuffle the merged list with a **per-request random seed** (Python `random.shuffle`) on every page load. Do not persist the order; do not use any stable sort column (not `generated_at`, not alphabetical). The goal is to prevent a PI from inferring origin from consistent ordering.
+
+#### List Layout
+
+Each row is a card or table row containing:
+
+| Element | Notes |
+|---|---|
+| **Title** | `MatchmakerProposal.title` or first non-empty heading extracted from `ThreadDecision.summary_text` |
+| **Collaborator** | Name of the other PI (not the current user). For agent proposals, resolve via `AgentRegistry → User.name`; for matchmaker, use `pi_a_name`/`pi_b_name` or `User.name` from the FK. |
+| **Status badge** | `Pending Evaluation` (gray) or `Evaluated` (green), based on whether a `PiProposalEvaluation` exists for this user + proposal. |
+| **Action** | "Evaluate" → links to the evaluation form. "View" if already evaluated (can re-open read-only, or allow amendment — see Amendments below). |
+
+No date, no confidence label, no source indicator. Keep the row minimal to avoid inadvertently leaking origin.
+
+#### Empty State
+
+If the user has no proposals: display a short message — "No collaboration proposals yet. Proposals will appear here once your agent has completed discussions or the admin has generated a matchmaker proposal involving you."
+
+---
+
+## Evaluation Form (`/proposals/{unified_id}/evaluate`)
+
+### URL Design
+
+Use a **unified identifier** that does not encode origin. Options:
+
+- Encode `type:uuid` as a base64 URL-safe token (e.g., `bWF0Y2htYWtlcjo8dXVpZD4=`), or
+- Use a hash-derived short ID stored in a lookup table.
+
+Recommended: build the string `{type_prefix}_{uuid_hex}`, where `uuid_hex` is the UUID's 32 hex digits without dashes (e.g., `a_3f8c...` vs. `m_9d2e...`), then base64url-encode the whole string so the type is not human-readable in the browser bar.
+
+The backend decodes the token, validates the user has access to that proposal, then renders the form.
+
+### Proposal Summary
+
+At the top of the form, display the full proposal text. For agent proposals use `summary_text`; for matchmaker use `proposal_md` rendered as markdown. Do **not** include metadata that reveals origin (no "Confidence" badge, no agent names, no Slack channel). Show only:
+
+- **Title** (heading)
+- **Collaborator name**
+- **Proposal body** (full markdown)
+
+---
+
+### NIH-Style Scoring Sections
+
+The form has **six scored sections**: five criterion scores (each 1–9) and one Overall Impact score (1–9).
+
+#### Scoring Guide (displayed inline at top of form, collapsed by default)
+
+> **How to Score: NIH 1–9 Scale**
+>
+> Scores are whole numbers from **1 (best) to 9 (worst)**. Use the full range.
+>
+> | Score | Descriptor | Strengths / Weaknesses |
+> |---|---|---|
+> | 1 | **Exceptional** | Essentially no weaknesses |
+> | 2 | **Outstanding** | Negligible weaknesses |
+> | 3 | **Excellent** | Only minor weaknesses |
+> | 4 | **Very Good** | Numerous minor weaknesses |
+> | 5 | **Good** | At least one moderate weakness |
+> | 6 | **Satisfactory** | Some moderate weaknesses |
+> | 7 | **Fair** | At least one major weakness |
+> | 8 | **Marginal** | A few major weaknesses |
+> | 9 | **Poor** | Numerous major weaknesses |
+>
+> **Weakness severity:**
+> - *Minor* — easily addressable; does not substantially lessen impact
+> - *Moderate* — lessens impact
+> - *Major* — severely limits impact
+>
+> Scores of 1 and 9 are expected to be rare. Scores of 1–3 indicate high impact; 4–6 moderate; 7–9 low.
+>
+> The **Overall Impact** score is your holistic judgment of the likelihood that this collaboration will exert a sustained, powerful influence on the field. It is *not* the average of the five criteria — weigh them as you see fit.
+
+This guide is collapsed behind a "Show scoring instructions ▾" toggle so experienced evaluators can skip it.
+
+---
+
+#### Section 1: Significance (score 1–9)
+
+**Label:** Significance
+
+**Prompt:**
+> How important is the proposed collaboration to the field? Does it address a significant gap in knowledge, solve a critical problem, or represent an advance that would benefit the broader research community? Assume the proposed work will be successfully completed.
+
+**Input:** Dropdown or radio buttons 1–9 with descriptor labels (Exceptional … Poor). Plus an optional free-text **Comments** field (placeholder: "What are the key strengths or weaknesses in significance?").
+
+---
+
+#### Section 2: Innovation (score 1–9)
+
+**Label:** Innovation
+
+**Prompt:**
+> Does the proposed collaboration apply novel concepts, approaches, methodologies, or technologies? Does it combine the PIs' expertise in a genuinely new way, or apply existing methods in an innovative context?
+
+**Input:** Dropdown/radio 1–9 + optional Comments.
+
+---
+
+#### Section 3: Approach (score 1–9)
+
+**Label:** Approach
+
+**Prompt:**
+> Is the proposed plan of work sound and achievable? Are the scientific rationale and methods appropriate? Does the proposal address potential challenges or risks? Are the experimental designs or research strategies rigorous?
+
+**Input:** Dropdown/radio 1–9 + optional Comments.
+
+---
+
+#### Section 4: Investigators (score 1–9)
+
+**Label:** Investigators
+
+**Prompt:**
+> Do the collaborating PIs have the background, training, and complementary expertise needed to execute this work? Is the combination of their research programs well-suited to the proposed goals?
+
+**Input:** Dropdown/radio 1–9 + optional Comments.
+
+---
+
+#### Section 5: Environment (score 1–9)
+
+**Label:** Environment
+
+**Prompt:**
+> Are the institutional resources, facilities, and collaborative infrastructure available to support this work? Would the combination of the two labs' environments enhance the likelihood of success?
+
+**Input:** Dropdown/radio 1–9 + optional Comments.
+
+---
+
+#### Section 6: Overall Impact (score 1–9)
+
+**Label:** Overall Impact Score
+
+**Prompt:**
+> Provide your overall assessment of the likelihood that this collaboration would exert a **sustained, powerful influence** on the research field(s) involved. Weigh the five criteria above as you see fit — the overall impact score is not an average. A proposal need not be strong in all criteria to earn a strong (low-numbered) overall impact score.
+
+**Input:** Dropdown/radio 1–9 + required **Overall Comments** field (at least one sentence required before submission).
+
+---
+
+### Form Submission
+
+**Button:** "Submit Evaluation"
+
+On submit:
+1. Validate all six scores are provided (1–9) and Overall Comments is non-empty.
+2. Send the form to `POST /proposals/{unified_id}/evaluate`.
+3. Insert a `PiProposalEvaluation` row (see Data Model below).
+4. Redirect to `/proposals` with a success flash: "Evaluation submitted."
+
+If the user has already submitted an evaluation for this proposal, the form pre-fills with their prior scores and comments and shows an "Update Evaluation" button that overwrites the existing row (upsert keyed on `user_id` plus whichever of `thread_decision_id` / `matchmaker_proposal_id` is set).
+
+---
+
+## Data Model
+
+### New Table: `pi_proposal_evaluations`
+
+```
+pi_proposal_evaluations
+───────────────────────────────────────────────────────
+id                      UUID  PK  default gen_random_uuid()
+user_id                 UUID  FK → users.id  NOT NULL
+proposal_type           VARCHAR(20) NOT NULL  -- "agent" | "matchmaker"
+thread_decision_id      UUID  FK → thread_decisions.id  NULLABLE
+matchmaker_proposal_id  UUID  FK → matchmaker_proposals.id  NULLABLE
+score_significance      SMALLINT NOT NULL  -- 1–9
+score_innovation        SMALLINT NOT NULL  -- 1–9
+score_approach          SMALLINT NOT NULL  -- 1–9
+score_investigators     SMALLINT NOT NULL  -- 1–9
+score_environment       SMALLINT NOT NULL  -- 1–9
+score_overall_impact    SMALLINT NOT NULL  -- 1–9
+comments_significance   TEXT  NULLABLE
+comments_innovation     TEXT  NULLABLE
+comments_approach       TEXT  NULLABLE
+comments_investigators  TEXT  NULLABLE
+comments_environment    TEXT  NULLABLE
+comments_overall        TEXT  NOT NULL
+evaluated_at            TIMESTAMP  NOT NULL  default now()
+updated_at              TIMESTAMP  NULLABLE  -- set on amendment
+```
+
+**Constraints:**
+- `CHECK (proposal_type IN ('agent', 'matchmaker'))`
+- `CHECK (score_significance BETWEEN 1 AND 9)` (and same for all five criteria + overall)
+- `CHECK ((thread_decision_id IS NOT NULL) <> (matchmaker_proposal_id IS NOT NULL))` — exactly one must be set
+- `UNIQUE (user_id, thread_decision_id)` where `thread_decision_id IS NOT NULL`
+- `UNIQUE (user_id, matchmaker_proposal_id)` where `matchmaker_proposal_id IS NOT NULL`
+
+**Indexes:**
+- `(user_id, proposal_type)` — for the list page query
+- `(thread_decision_id)` — for admin aggregation
+- `(matchmaker_proposal_id)` — for admin aggregation
+
+### Why a Separate Table from `proposal_reviews`
+
+`proposal_reviews` is tightly coupled to the agent-blocking workflow: it has a unique constraint on `(thread_decision_id, agent_id)`, drives the "pending proposals" gate in the simulation, and uses a 1–4 scale designed around the agent system's needs. The NIH evaluation is a research-quality instrument for a different purpose (comparative assessment, future blinded studies), and the two systems should evolve independently.
+
+---
+
+## Backend Routes
+
+### `GET /proposals`
+- Auth: `get_current_user` (access_status = "allowed")
+- Query: merged list of agent + matchmaker proposals involving `current_user.id`
+- Annotate each with `evaluated: bool` by checking `pi_proposal_evaluations`
+- Shuffle with `random.shuffle` before passing to template
+- Template: `proposals/list.html`
+
+### `GET /proposals/{token}/evaluate`
+- Decode token → `(proposal_type, proposal_id)`
+- Validate current user is PI A or PI B for this proposal (403 otherwise)
+- Fetch proposal content; pre-fill existing evaluation if present
+- Template: `proposals/evaluate.html`
+
+### `POST /proposals/{token}/evaluate`
+- Decode token; validate access
+- Validate form fields (all six scores present, overall comment non-empty, scores in 1–9)
+- Upsert `PiProposalEvaluation` (insert or update if row already exists for this user + proposal)
+- Redirect to `/proposals` with flash message
+
+---
+
+## Templates
+
+### `templates/proposals/list.html`
+
+Extends base layout. Nav highlight on "Proposals".
+
+Structure:
+```
+<h1>Collaboration Proposals</h1>
+<p class="subtitle">Proposals involving your lab for your evaluation.</p>
+
+[proposal cards, shuffled]
+
+Each card:
+  Title
+  With: [Collaborator Name]
+  [Status badge]
+  [Evaluate / View button]
+```
+
+No columns that would reveal origin. No sort controls (sort is intentionally hidden).
+
+### `templates/proposals/evaluate.html`
+
+Extends base layout.
+
+Structure:
+```
+<h1>[Proposal Title]</h1>
+<p>Proposed collaboration with <strong>[Collaborator Name]</strong></p>
+
+[Full proposal body, rendered markdown]
+
+<hr>
+
+<h2>Your Evaluation</h2>
+
+<details>
+  <summary>Show scoring instructions ▾</summary>
+  [Scoring guide table]
+</details>
+
+[Section 1: Significance]
+[Section 2: Innovation]
+[Section 3: Approach]
+[Section 4: Investigators]
+[Section 5: Environment]
+[Section 6: Overall Impact + required comment]
+
+[Submit / Update button]
+```
+
+Score inputs: use a horizontal radio button group (1–9) with descriptor labels below (Exceptional … Poor), similar to a Likert scale widget. This makes the scale's direction immediately obvious.
+
+---
+
+## Admin Page: PI Proposal Evaluations (`/admin/evaluations`)
+
+Full admin visibility into all PI evaluation submissions. Admins see the `proposal_type` column (agent vs. matchmaker) — this is the only place in the system where origin is revealed. See `admin-dashboard.md` §12 for the canonical specification; a summary is included here for reference.
+
+### Layout
+
+**Summary cards (top of page):**
+- Total evaluations submitted
+- Evaluations this month
+- Proposals with at least one evaluation (vs. total proposals)
+- Mean overall impact score (all time, shown as X.X / 9)
+
+**Main table — one row per `PiProposalEvaluation`:**
+
+| Column | Notes |
+|---|---|
+| **Evaluator** | `User.name` who submitted the evaluation |
+| **Proposal title** | Title from the linked proposal |
+| **Origin** | `Agent` or `Matchmaker` badge — color-coded (blue / purple). This is the only UI surface in the system that reveals origin. |
+| **Other PI** | Name of the collaborator (the PI who is *not* the evaluator) |
+| **Sig.** | `score_significance` (1–9) |
+| **Inn.** | `score_innovation` (1–9) |
+| **App.** | `score_approach` (1–9) |
+| **Inv.** | `score_investigators` (1–9) |
+| **Env.** | `score_environment` (1–9) |
+| **Impact** | `score_overall_impact` (1–9), emphasized (bold) |
+| **Submitted** | `evaluated_at` timestamp |
+| **Actions** | "View details" → modal or expanded row showing all comments |
+
+Scores are color-coded: 1–3 green (high impact), 4–6 yellow, 7–9 red.
+
+**Detail view (row expand or modal):**
+- All six criterion scores with their comments
+- Full proposal body (rendered markdown)
+- Evaluator name, submission timestamp, amendment timestamp if updated
+
+### Filters
+
+- **Evaluator** — user multi-select
+- **Origin** — All / Agent only / Matchmaker only
+- **Overall Impact range** — min/max sliders (1–9)
+- **Date range** — evaluated_at from/to
+
+### JSON Export
+
+`GET /admin/evaluations/export.json` — streams a JSON file of all `PiProposalEvaluation` rows matching the current filter state (filters passed as query params, same as page view).
+
+**Schema:**
+
+```json
+{
+  "exported_at": "2026-05-04T09:00:00Z",
+  "total_records": 42,
+  "filters_applied": {
+    "origin": "all",
+    "evaluator_ids": [],
+    "impact_score_min": null,
+    "impact_score_max": null,
+    "date_from": null,
+    "date_to": null
+  },
+  "evaluations": [
+    {
+      "evaluation_id": "uuid",
+      "evaluated_at": "2026-04-15T14:32:00Z",
+      "updated_at": null,
+      "evaluator": {
+        "user_id": "uuid",
+        "name": "Jane Smith",
+        "orcid": "0000-0002-1234-5678",
+        "institution": "Scripps Research"
+      },
+      "proposal": {
+        "origin": "agent",
+        "proposal_id": "uuid",
+        "title": "Cryo-ET and Proteomics of Mitochondrial Dynamics",
+        "collaborator": {
+          "user_id": "uuid",
+          "name": "Michael Wiseman",
+          "institution": "Scripps Research"
+        }
+      },
+      "scores": {
+        "significance": 2,
+        "innovation": 3,
+        "approach": 4,
+        "investigators": 2,
+        "environment": 2,
+        "overall_impact": 2
+      },
+      "comments": {
+        "significance": "Addresses a genuine gap in understanding...",
+        "innovation": null,
+        "approach": "Feasibility is somewhat unclear for aim 3...",
+        "investigators": null,
+        "environment": null,
+        "overall": "Strong proposal with highly complementary expertise. Minor concerns about timeline."
+      }
+    }
+  ]
+}
+```
+
+**Implementation note:** Build the export from the same query used to render the table — apply the same filters so the downloaded file always matches what the admin sees on screen. The export is synchronous (no background job) at pilot scale.
+
+---
+
+## Alembic Migration
+
+New migration: `0016_add_pi_proposal_evaluations.py` (or next available revision).
+
+```python
+op.create_table(
+    "pi_proposal_evaluations",
+    sa.Column("id", postgresql.UUID(as_uuid=True), ...),
+    sa.Column("user_id", postgresql.UUID(as_uuid=True), sa.ForeignKey("users.id"), nullable=False),
+    sa.Column("proposal_type", sa.String(20), nullable=False),
+    sa.Column("thread_decision_id", postgresql.UUID(as_uuid=True), sa.ForeignKey("thread_decisions.id"), nullable=True),
+    sa.Column("matchmaker_proposal_id", postgresql.UUID(as_uuid=True), sa.ForeignKey("matchmaker_proposals.id"), nullable=True),
+    sa.Column("score_significance", sa.SmallInteger(), nullable=False),
+    sa.Column("score_innovation", sa.SmallInteger(), nullable=False),
+    sa.Column("score_approach", sa.SmallInteger(), nullable=False),
+    sa.Column("score_investigators", sa.SmallInteger(), nullable=False),
+    sa.Column("score_environment", sa.SmallInteger(), nullable=False),
+    sa.Column("score_overall_impact", sa.SmallInteger(), nullable=False),
+    sa.Column("comments_significance", sa.Text(), nullable=True),
+    sa.Column("comments_innovation", sa.Text(), nullable=True),
+    sa.Column("comments_approach", sa.Text(), nullable=True),
+    sa.Column("comments_investigators", sa.Text(), nullable=True),
+    sa.Column("comments_environment", sa.Text(), nullable=True),
+    sa.Column("comments_overall", sa.Text(), nullable=False),
+    sa.Column("evaluated_at", sa.DateTime(timezone=True), server_default=sa.func.now(), nullable=False),
+    sa.Column("updated_at", sa.DateTime(timezone=True), nullable=True),
+)
+op.create_check_constraint("ck_ppe_proposal_type", "pi_proposal_evaluations", "proposal_type IN ('agent', 'matchmaker')")
+op.create_check_constraint("ck_ppe_proposal_present", "pi_proposal_evaluations",
+    "(thread_decision_id IS NOT NULL) <> (matchmaker_proposal_id IS NOT NULL)")
+# Score range checks
+for col in ["significance", "innovation", "approach", "investigators", "environment", "overall_impact"]:
+    op.create_check_constraint(f"ck_ppe_score_{col}", "pi_proposal_evaluations",
+        f"score_{col} BETWEEN 1 AND 9")
+op.create_unique_constraint("uq_ppe_user_thread", "pi_proposal_evaluations",
+    ["user_id", "thread_decision_id"])
+op.create_unique_constraint("uq_ppe_user_matchmaker", "pi_proposal_evaluations",
+    ["user_id", "matchmaker_proposal_id"])
+op.create_index("ix_ppe_user_type", "pi_proposal_evaluations", ["user_id", "proposal_type"])
+op.create_index("ix_ppe_thread", "pi_proposal_evaluations", ["thread_decision_id"])
+op.create_index("ix_ppe_matchmaker", "pi_proposal_evaluations", ["matchmaker_proposal_id"])
+```
+
+---
+
+## Open Questions
+
+1. **Token encoding**: Prefer base64url opaque token or a human-readable `{type}/{uuid}` path? The latter is simpler to implement but makes origin obvious in the URL bar. Recommend opaque token.
+2. **Re-evaluation policy**: Allow PIs to update their evaluation after submission (upsert)? Or lock after first submission? Current spec allows amendment; change if a one-shot design is preferred for the study.
+3. **Matchmaker proposals with no `pi_a_id`/`pi_b_id`** (CLI-created, name-only rows): These cannot be linked to a specific `user_id`. Either exclude them from the PI list view or require admin to backfill FKs before they appear. Recommend exclusion with a note in the admin UI.
+4. **Delegate access**: Should delegates be able to submit evaluations on behalf of the PI? The existing delegate model (`web-delegates.md`) could extend here but is out of scope for v1 — delegates see only the existing 1–4 review workflow.
diff --git a/src/agent/agent.py b/src/agent/agent.py
index 1bae847..01e869f 100644
--- a/src/agent/agent.py
+++ b/src/agent/agent.py
@@ -6,6 +6,7 @@
 from typing import Any
 
 from src.agent.state import AgentState, PostRef, ThreadState
+from src.utils.prompts import load_prompt
 
 logger = logging.getLogger(__name__)
 
@@ -29,6 +30,7 @@ def __init__(self, agent_id: str, bot_name: str, pi_name: str):
         self._lab_directory: str | None = None
         self.api_call_count: int = 0
         self.message_count: int = 0
+        self.is_paused: bool = False
         self.state = AgentState()
 
     # ------------------------------------------------------------------
@@ -74,10 +76,7 @@ def reload_profiles(self):
 
     def build_system_prompt(self) -> str:
         """Build the full agent system prompt with identity and profiles."""
-        base_prompt = self._load_file(
-            PROMPTS_DIR / "agent-system.md",
-            _default_system_prompt(),
-        )
+        base_prompt = load_prompt(PROMPTS_DIR / "agent-system.md", _default_system_prompt())
         lab_directory_section = ""
         if self._lab_directory:
             lab_directory_section = f"""
@@ -107,10 +106,7 @@ def build_scan_system_prompt(self) -> str:
         Omits working memory and lab directory — scan only needs identity,
         research focus, and private priorities to judge relevance.
         """
-        base_prompt = self._load_file(
-            PROMPTS_DIR / "agent-system.md",
-            _default_system_prompt(),
-        )
+        base_prompt = load_prompt(PROMPTS_DIR / "agent-system.md", _default_system_prompt())
         return f"""{base_prompt}
 
 ## Your Identity
@@ -130,10 +126,7 @@ def build_thread_reply_system_prompt(self) -> str:
         talking to. Use retrieve_profile tool if you need details on another lab.
         Includes working memory since it may contain thread-relevant context.
         """
-        base_prompt = self._load_file(
-            PROMPTS_DIR / "agent-system.md",
-            _default_system_prompt(),
-        )
+        base_prompt = load_prompt(PROMPTS_DIR / "agent-system.md", _default_system_prompt())
         return f"""{base_prompt}
 
 ## Your Identity
@@ -214,10 +207,7 @@ def build_phase4_prompt(
         Returns (system_prompt, messages).
         """
         system_prompt = self.build_thread_reply_system_prompt()
-        phase4_template = self._load_file(
-            PROMPTS_DIR / "phase4-thread-reply.md",
-            "Compose a thread reply.",
-        )
+        phase4_template = load_prompt(PROMPTS_DIR / "phase4-thread-reply.md", "Compose a thread reply.")
 
         # Thread phase guidance
         if thread.message_count <= 4:
diff --git a/src/agent/grantbot.py b/src/agent/grantbot.py
index 2672a51..5af41ed 100644
--- a/src/agent/grantbot.py
+++ b/src/agent/grantbot.py
@@ -402,9 +402,10 @@ async def run_grantbot(
 
     if not dry_run:
         from slack_sdk import WebClient
-        bot_token = getattr(settings, "slack_bot_token_grantbot", "")
+        slack_tokens = settings.get_slack_tokens()
+        bot_token = slack_tokens.get("grantbot", {}).get("bot", "")
         if not bot_token or bot_token.startswith("xoxb-placeholder"):
-            bot_token = settings.slack_bot_token_su
+            bot_token = slack_tokens.get("su", {}).get("bot", "")
             logger.info("No grantbot Slack token — using SuBot's token as fallback")
         if bot_token and not bot_token.startswith("xoxb-placeholder"):
             slack_client = WebClient(token=bot_token)
diff --git a/src/agent/main.py b/src/agent/main.py
index 236a861..a70e4e6 100644
--- a/src/agent/main.py
+++ b/src/agent/main.py
@@ -36,9 +36,11 @@ def main(
     no_db: bool = typer.Option(False, "--no-db", help="Skip database logging"),
     fresh: bool = typer.Option(False, "--fresh", help="Wipe simulation data and start fresh"),
     reset_cursors: bool = typer.Option(False, "--reset-cursors", help="Reset scan cursors so agents re-read all posts"),
+    focus_agent: str = typer.Option("", "--focus-agent", help="Agent ID to spotlight: only this agent sees all others; all others see only this agent"),
+    reset_focus_cursor: bool = typer.Option(False, "--reset-focus-cursor", help="Reset only the focus agent's cursor to 0 so it re-scans all history"),
 ):
     """Run the turn-based agent simulation."""
-    asyncio.run(_run_simulation(max_runtime, budget, mock, no_db, fresh, reset_cursors))
+    asyncio.run(_run_simulation(max_runtime, budget, mock, no_db, fresh, reset_cursors, focus_agent or None, reset_focus_cursor))
 
 
 async def _run_simulation(
@@ -48,14 +50,31 @@ async def _run_simulation(
     no_db: bool,
     fresh: bool,
     reset_cursors: bool = False,
+    focus_agent: str | None = None,
+    reset_focus_cursor: bool = False,
 ) -> None:
     settings = get_settings()
 
-    # Create agent instances
+    # Create agent instances — filtered to only those with status='active' in the DB.
+    # Set an agent to 'suspended' in the agents table to exclude it without removing it.
+    from sqlalchemy import select
+    from src.database import get_session_factory
+    from src.models.agent_registry import AgentRegistry
+
+    _sf = get_session_factory()
+    async with _sf() as _db:
+        _res = await _db.execute(
+            select(AgentRegistry.agent_id).where(AgentRegistry.status == "active")
+        )
+        _active_ids = {row[0] for row in _res}
+
     agents = [
         Agent(agent_id=lab["id"], bot_name=lab["name"], pi_name=lab["pi"])
         for lab in PILOT_LABS
+        if lab["id"] in _active_ids
     ]
+    logger.info("Loaded %d active agents (of %d total): %s", len(agents), len(PILOT_LABS),
+                sorted(a.agent_id for a in agents))
 
     # Set up Slack clients (Web API only, no Socket Mode)
     slack_clients = {}
@@ -151,6 +170,13 @@ async def _run_simulation(
 
     # Create simulation engine
     runtime_label = f"{max_runtime}m" if max_runtime > 0 else "indefinite"
+    if focus_agent:
+        valid_ids = {lab["id"] for lab in PILOT_LABS}
+        if focus_agent not in valid_ids:
+            logger.error("--focus-agent '%s' is not a valid agent ID. Valid IDs: %s", focus_agent, sorted(valid_ids))
+            return
+        logger.info("Focus mode: only '%s' sees all agents; all others see only '%s'", focus_agent, focus_agent)
+
     sim_engine = SimulationEngine(
         agents=agents,
         slack_clients=slack_clients,
@@ -159,6 +185,8 @@ async def _run_simulation(
         session_factory=session_factory,
         simulation_run_id=simulation_run_id,
         reset_cursors=reset_cursors,
+        focus_agent=focus_agent,
+        reset_focus_cursor=reset_focus_cursor,
     )
 
     # Handle shutdown signals
diff --git a/src/agent/simulation.py b/src/agent/simulation.py
index 6199643..dab5e47 100644
--- a/src/agent/simulation.py
+++ b/src/agent/simulation.py
@@ -51,6 +51,43 @@
     {"id": "forli", "name": "ForliBot", "pi": "Stefano Forli"},
     {"id": "deniz", "name": "DenizBot", "pi": "Ashok Deniz"},
     {"id": "lairson", "name": "LairsonBot", "pi": "Luke Lairson"},
+    {"id": "azumaya", "name": "AzumayaBot", "pi": "Caleigh Azumaya"},
+    {"id": "badran", "name": "BadranBot", "pi": "Ahmed Badran"},
+    {"id": "capra", "name": "CapraBot", "pi": "John Capra"},
+    {"id": "craik", "name": "CraikBot", "pi": "Charles Craik"},
+    {"id": "echeverria", "name": "EcheverriaBot", "pi": "Ignacia Echeverria"},
+    {"id": "fraser", "name": "FraserBot", "pi": "James Fraser"},
+    {"id": "kern", "name": "KernBot", "pi": "Dorothee Kern"},
+    {"id": "kim", "name": "KimBot", "pi": "Peter Kim"},
+    {"id": "larabell", "name": "LarabellBot", "pi": "Carolyn Larabell"},
+    {"id": "lasker", "name": "LaskerBot", "pi": "Keren Lasker"},
+    {"id": "lippi", "name": "LippiBot", "pi": "Giordano Lippi"},
+    {"id": "macrae", "name": "MacRaeBot", "pi": "Ian MacRae"},
+    {"id": "maillie", "name": "MailieBot", "pi": "Colleen Maillie"},
+    {"id": "manglik", "name": "ManglikBot", "pi": "Aashish Manglik"},
+    {"id": "millar", "name": "MillarBot", "pi": "David Millar"},
+    {"id": "miller", "name": "MillerBot", "pi": "Shannon Miller"},
+    {"id": "minor", "name": "MinorBot", "pi": "Daniel Minor"},
+    {"id": "moore", "name": "MooreBot", "pi": "Jonathan Moore"},
+    {"id": "mravic", "name": "MravicBot", "pi": "Marco Mravic"},
+    {"id": "nomura", "name": "NomuraBot", "pi": "Daniel Nomura"},
+    {"id": "paulson", "name": "PaulsonBot", "pi": "Jim Paulson"},
+    {"id": "pwu", "name": "PengWuBot", "pi": "Peng Wu"},
+    {"id": "roe", "name": "RoeBot", "pi": "Leah Tang Roe"},
+    {"id": "sali", "name": "SaliBot", "pi": "Andrej Sali"},
+    {"id": "santi", "name": "SantiBot", "pi": "Daniel Santi"},
+    {"id": "seiple", "name": "SeippleBot", "pi": "Ian Seiple"},
+    {"id": "stroud", "name": "StroudBot", "pi": "Robert Stroud"},
+    {"id": "susa", "name": "SusaBot", "pi": "Katherine Susa"},
+    {"id": "wells", "name": "WellsBot", "pi": "James Wells"},
+    {"id": "williams", "name": "WilliamsBot", "pi": "Michael Williams"},
+    {"id": "williamson", "name": "WilliamsonBot", "pi": "James Williamson"},
+    {"id": "wilson", "name": "WilsonBot", "pi": "Ian Wilson"},
+    {"id": "yeager", "name": "YeagerBot", "pi": "Mark Yeager"},
+    {"id": "zaro", "name": "ZaroBot", "pi": "Balyn Zaro"},
+    {"id": "hogenesch", "name": "HogeneschBot", "pi": "John Hogenesch"},
+    {"id": "alanjary", "name": "AlanjaryBot", "pi": "Mohammad Alanjary"},
+    {"id": "cline", "name": "ClineBot", "pi": "Hollis Cline"},
 ]
 
 # Keywords for channel-profile matching
@@ -95,6 +132,8 @@ def __init__(
         session_factory=None,
         simulation_run_id: uuid.UUID | None = None,
         reset_cursors: bool = False,
+        focus_agent: str | None = None,
+        reset_focus_cursor: bool = False,
     ):
         self.agents = {a.agent_id: a for a in agents}
         self.slack_clients = slack_clients
@@ -103,6 +142,8 @@ def __init__(
         self.session_factory = session_factory
         self.simulation_run_id = simulation_run_id
         self._reset_cursors = reset_cursors
+        self._focus_agent = focus_agent
+        self._reset_focus_cursor = reset_focus_cursor
 
         self._start_time: datetime | None = None
         self._running = False
@@ -167,6 +208,23 @@ def _non_funding_thread_count(self, agent: Agent) -> int:
             if not self.message_log.is_funding_thread(t.thread_id)
         )
 
+    def _effective_thread_threshold(self, agent: Agent) -> int:
+        """Active-thread threshold — 3× higher for the focus agent."""
+        base = get_settings().active_thread_threshold
+        if self._focus_agent and agent.agent_id == self._focus_agent:
+            return base * 3
+        return base
+
+    def _is_agent_blocked(self, agent: Agent) -> bool:
+        """Return True if the agent is blocked from regular (non-funding) Phase 5 activity."""
+        at_threshold = self._non_funding_thread_count(agent) >= self._effective_thread_threshold(agent)
+        unreviewed_limit = 10 if self._focus_agent and agent.agent_id == self._focus_agent else 1
+        unreviewed_count = sum(
+            1 for p in agent.state.pending_proposals
+            if not p.reviewed and not self.message_log.is_funding_thread(p.thread_id)
+        )
+        return at_threshold or unreviewed_count >= unreviewed_limit
+
     def _count_today_posts(self, agent: Agent) -> int:
         """Count top-level posts by this agent in the current Pacific time day."""
         from zoneinfo import ZoneInfo
@@ -210,6 +268,15 @@ async def start(self) -> None:
             session_factory=self.session_factory,
         )
 
+        # Seed last_selected for all agents so the focus multiplier works on Turn 1.
+        # Without this, agents with last_selected=0.0 have a base weight equal to
+        # the current Unix timestamp (~1.7B), swamping any multiplier until every
+        # agent has had one turn.
+        now = time.time()
+        for a in self.agents.values():
+            if a.state.last_selected == 0.0:
+                a.state.last_selected = now
+
         # Main loop
         turn_count = 0
         consecutive_idle = 0
@@ -222,6 +289,10 @@ async def start(self) -> None:
             # Sync proposal reviews from web app
             await self._sync_proposal_reviews_from_db()
 
+            # Sync paused state from DB every 10 turns
+            if turn_count % 10 == 0:
+                await self._sync_paused_state_from_db()
+
             # Select agent
             agent = self._select_agent()
             if not agent or not self._agent_within_budget(agent):
@@ -260,6 +331,12 @@ async def start(self) -> None:
             # Track last agent to make an LLM call
             if did_work:
                 self._last_llm_caller = agent.agent_id
+            elif self._focus_agent and agent.agent_id != self._focus_agent:
+                # In focus mode, non-focus idle turns don't block the focus agent.
+                # Without this, a focus-agent LLM call (even an empty one) sets
+                # _last_llm_caller and no non-focus agent ever clears it, deadlocking
+                # the focus agent permanently.
+                self._last_llm_caller = None
 
             # Update last_selected
             agent.state.last_selected = time.time()
@@ -309,17 +386,36 @@ def _select_agent(self) -> Agent | None:
         now = time.time()
         candidates = [
             a for a in self.agents.values()
-            if self._agent_within_budget(a)
+            if self._agent_within_budget(a) and not a.is_paused
         ]
         if not candidates:
             return None
 
+        # In steady state, base weight = now - last_selected shrinks for
+        # frequently-picked agents, so P(focus) = sqrt(m)/(sqrt(m)+N-1).
+        # Solving for P = 0.25: m = ((N-1)/3)^2, clamped to >= 1.0 because the raw
+        # value is < 1 for N < 4 and 0 for N == 1 (random.choices raises ValueError
+        # on all-zero weights).  The same multiplier also boosts non-focus agents
+        # in active conversation with the focus agent, costing the focus bot's 25% share.
+        n = len(candidates)
+        focus_multiplier = max(((n - 1) / 3) ** 2, 1.0) if self._focus_agent else 1.0
+
         weights = []
         for a in candidates:
             w = max(now - a.state.last_selected, 1.0)
             skips = a.state.consecutive_phase5_skips
             if skips >= 3:
                 w /= 2 ** (skips - 2)
+            if self._focus_agent:
+                if a.agent_id == self._focus_agent:
+                    w *= focus_multiplier
+                elif any(
+                    t.other_agent_id == self._focus_agent
+                    for t in a.state.active_threads.values()
+                ):
+                    # Boost to match focus agent so the conversation alternates
+                    # rapidly; 25% target for focus bot is not enforced here.
+                    w *= focus_multiplier
             weights.append(w)
         return random.choices(candidates, weights=weights, k=1)[0]
 
@@ -367,7 +463,22 @@ async def _run_turn(self, agent: Agent) -> bool:
 
         has_new_work = has_interesting or has_phase4_work or phase2_ran or has_pi
 
-        if has_new_work or spontaneous_ready:
+        # In focus mode, non-focus agents have no one useful to post to spontaneously —
+        # their only valid target is the focus agent, and organic discovery handles that
+        # via has_new_work. Skip spontaneous Phase 5 to avoid wasted Opus calls.
+        focus_mode_blocks_spontaneous = (
+            self._focus_agent
+            and agent.agent_id != self._focus_agent
+            and not has_new_work
+            and spontaneous_ready
+        )
+
+        if focus_mode_blocks_spontaneous:
+            logger.debug(
+                "[%s] Phase 5: Skipped spontaneous call (focus mode, no focus-agent state)",
+                agent.agent_id,
+            )
+        elif has_new_work or spontaneous_ready:
             await self._phase5_new_post(agent, phase4_thread_ids)
         else:
             logger.debug(
@@ -422,6 +533,8 @@ async def _phase2_scan_filter(self, agent: Agent) -> None:
             channels=agent.state.subscribed_channels,
             exclude_agent_id=agent.agent_id,
         )
+        if self._focus_agent and agent.agent_id != self._focus_agent:
+            new_posts = [p for p in new_posts if p.sender_agent_id == self._focus_agent]
 
         # Exclude posts already in interesting_posts or active_threads
         known_ids = {p.post_id for p in agent.state.interesting_posts}
@@ -432,6 +545,11 @@ async def _phase2_scan_filter(self, agent: Agent) -> None:
             logger.debug("[%s] Phase 2: No new posts to evaluate", agent.agent_id)
             return
 
+        # Skip LLM scan if blocked and no incoming funding posts (saves wasted API calls)
+        if self._is_agent_blocked(agent) and not any(is_funding_post(p.content) for p in new_posts):
+            logger.debug("[%s] Phase 2: Skipped scan (blocked, no funding posts)", agent.agent_id)
+            return
+
         # Build post data for LLM
         post_dicts = [
             {
@@ -530,6 +648,8 @@ def _phase3_activate_threads(self, agent: Agent) -> None:
 
         # Check for tags
         tagged_entries = self.message_log.get_tags_for_agent(agent.bot_name, cursor)
+        if self._focus_agent and agent.agent_id != self._focus_agent:
+            tagged_entries = [e for e in tagged_entries if e.sender_agent_id == self._focus_agent]
         for entry in tagged_entries:
             thread_id = entry.thread_ts or entry.ts
             if thread_id in agent.state.active_threads:
@@ -537,8 +657,8 @@ def _phase3_activate_threads(self, agent: Agent) -> None:
             if thread_id in self._closed_thread_ids:
                 continue
             is_funding = self.message_log.is_funding_thread(thread_id)
-            if not is_funding and self._non_funding_thread_count(agent) >= settings.active_thread_threshold:
-                break
+            if not is_funding and self._non_funding_thread_count(agent) >= self._effective_thread_threshold(agent):
+                continue
             # Check thread participation rules
             allowed = self.message_log.get_thread_allowed_agents(thread_id)
             if allowed and agent.agent_id not in allowed:
@@ -578,8 +698,8 @@ def _phase3_activate_threads(self, agent: Agent) -> None:
             if thread_id in self._closed_thread_ids:
                 continue
             is_funding = self.message_log.is_funding_thread(thread_id)
-            if not is_funding and self._non_funding_thread_count(agent) >= settings.active_thread_threshold:
-                break
+            if not is_funding and self._non_funding_thread_count(agent) >= self._effective_thread_threshold(agent):
+                continue
             # Check thread participation rules
             allowed = self.message_log.get_thread_allowed_agents(thread_id)
             if allowed and len(allowed) >= 2 and agent.agent_id not in allowed:
@@ -721,7 +841,7 @@ async def tool_executor(tool_name: str, tool_input: dict) -> str:
                 tools=TOOL_DEFINITIONS,
                 tool_executor=tool_executor,
                 model=settings.llm_agent_model_opus,
-                max_tokens=1500,
+                max_tokens=4000,
                 log_meta={
                     "agent_id": agent.agent_id,
                     "phase": "thread_reply",
@@ -800,9 +920,13 @@ async def _check_thread_outcome(
                         "[%s] Thread %s: proposal confirmed with ✅",
                         agent.agent_id, thread.thread_id,
                     )
-                    # Extract text starting from :memo: marker
-                    memo_idx = entry.content.find(":memo:")
-                    summary_text = entry.content[memo_idx:].strip() if memo_idx >= 0 else entry.content
+                    # Extract only the <proposal>…</proposal> block; fall back to :memo: slice
+                    proposal_match = re.search(r"<proposal>(.*?)</proposal>", entry.content, re.DOTALL)
+                    if proposal_match:
+                        summary_text = proposal_match.group(1).strip()
+                    else:
+                        memo_idx = entry.content.find(":memo:")
+                        summary_text = entry.content[memo_idx:].strip() if memo_idx >= 0 else entry.content
                     agent.state.pending_proposals = [
                         p for p in agent.state.pending_proposals
                         if p.thread_id != thread.thread_id
@@ -945,12 +1069,7 @@ async def _phase5_new_post(self, agent: Agent, phase4_thread_ids: set[str] | Non
             return
 
         # Check preconditions
-        at_thread_threshold = self._non_funding_thread_count(agent) >= settings.active_thread_threshold
-        has_unreviewed_non_funding = any(
-            not p.reviewed and not self.message_log.is_funding_thread(p.thread_id)
-            for p in agent.state.pending_proposals
-        )
-        blocked_for_regular = at_thread_threshold or has_unreviewed_non_funding
+        blocked_for_regular = self._is_agent_blocked(agent)
 
         # Check for PI-priority posts — these bypass random skip and blocking
         has_pi_priority = any(p.pi_priority for p in agent.state.interesting_posts)
@@ -1170,11 +1289,24 @@ async def _phase5_new_post(self, agent: Agent, phase4_thread_ids: set[str] | Non
 
             else:
                 # New top-level post
+                tagged_agent = action_data.get("tagged_agent")
+
+                # Focus mode: non-focus agents may only tag the focus agent
+                if (
+                    self._focus_agent
+                    and agent.agent_id != self._focus_agent
+                    and tagged_agent
+                    and tagged_agent != self._focus_agent
+                ):
+                    logger.info(
+                        "[%s] Phase 5: Blocked new post tagging non-focus agent %s (focus mode)",
+                        agent.agent_id, tagged_agent,
+                    )
+                    return
+
                 await self._post_message(agent.agent_id, channel, message_text)
                 agent.message_count += 1
 
-                # Check if it tags another agent
-                tagged_agent = action_data.get("tagged_agent")
                 if tagged_agent:
                     logger.info(
                         "[%s] Phase 5: New post in #%s tagging @%s",
@@ -1845,6 +1977,18 @@ async def _rebuild_state_from_slack(self) -> None:
                 history = self.message_log.get_thread_history(thread_id)
                 last_sender = history[-1].sender_agent_id if history else None
                 has_pending = last_sender is not None and last_sender != aid
+
+                # Expire threads where this agent sent last and no reply arrived in 6h
+                if not has_pending:
+                    last_ts = history[-1].posted_at if history else 0.0
+                    idle_hours = (time.time() - last_ts) / 3600
+                    if idle_hours > 6:
+                        logger.info(
+                            "[%s] Skipping stale thread %s (idle %.0fh, waiting for %s)",
+                            aid, thread_id, idle_hours, other_id,
+                        )
+                        continue
+
                 agent.state.active_threads[thread_id] = ThreadState(
                     thread_id=thread_id,
                     channel=entry.channel,
@@ -1940,6 +2084,10 @@ async def _rebuild_state_from_slack(self) -> None:
             for agent in self.agents.values():
                 agent.state.last_seen_cursor = latest_ts
 
+        if self._reset_focus_cursor and self._focus_agent and self._focus_agent in self.agents:
+            self.agents[self._focus_agent].state.last_seen_cursor = 0
+            logger.info("--reset-focus-cursor: %s will re-scan all Slack history", self._focus_agent)
+
         # Log rebuild summary
         for agent in self.agents.values():
             at = len(agent.state.active_threads)
@@ -2147,6 +2295,29 @@ async def _sync_proposal_reviews_from_db(self) -> None:
         except Exception as exc:
             logger.debug("Proposal review sync failed: %s", exc)
 
+    async def _sync_paused_state_from_db(self) -> None:
+        """Pull is_paused for every AgentRegistry row and mirror changes onto known agents."""
+        if not self.session_factory:
+            return
+        try:
+            async with self.session_factory() as session:
+                from sqlalchemy import select as sa_select
+                from src.models import AgentRegistry
+                query = sa_select(AgentRegistry.agent_id, AgentRegistry.is_paused)
+                db_rows = (await session.execute(query)).all()
+            # Outside the session context: only in-memory agent objects are touched below.
+            for agent_id, paused in db_rows:
+                known = self.agents.get(agent_id)
+                if not known or known.is_paused == paused:
+                    continue  # agent not loaded in this run, or flag already current
+                known.is_paused = paused
+                logger.info(
+                    "[%s] is_paused updated to %s from DB", agent_id, paused,
+                )
+        except Exception as exc:
+            # Best-effort sync: a failure is only logged at debug level.
+            logger.debug("Paused state sync failed: %s", exc)
+
     async def _log_message(
         self,
         agent_id: str,
diff --git a/src/cli.py b/src/cli.py
index 69f5239..ddf4863 100644
--- a/src/cli.py
+++ b/src/cli.py
@@ -208,6 +208,99 @@ async def _regenerate():
     _run(_regenerate())
 
 
+@app.command(name="seed-pilot-labs")
+def seed_pilot_labs(
+    agent_id: str = typer.Option(None, "--agent-id", help="Seed only this agent (e.g. 'su'). Omit for all."),
+    run_pipeline: bool = typer.Option(False, "--run-pipeline", help="Enqueue profile generation jobs"),
+):
+    """Create User + AgentRegistry rows for all pilot labs (or one via --agent-id), bypassing ORCID login; existing rows are reused."""
+    from src.agent.simulation import PILOT_LABS
+
+    labs = PILOT_LABS
+    if agent_id:
+        labs = [lab for lab in PILOT_LABS if lab["id"] == agent_id]
+        if not labs:
+            console.print(f"[red]Unknown agent-id '{agent_id}'. Valid IDs: {[l['id'] for l in PILOT_LABS]}[/red]")
+            raise typer.Exit(1)  # non-zero exit: the requested id is not in PILOT_LABS
+
+    async def _seed():
+        from datetime import datetime, timezone
+        from sqlalchemy import select
+        from src.models import AgentRegistry, Job, User
+
+        engine, factory = await _get_db()
+        async with factory() as db:
+            created_users = 0
+            created_agents = 0
+            skipped = 0
+
+            for lab in labs:
+                synthetic_orcid = f"synthetic:{lab['id']}"  # placeholder ORCID used as the lookup key for seeded users
+
+                # --- User ---
+                result = await db.execute(select(User).where(User.orcid == synthetic_orcid))
+                user = result.scalar_one_or_none()
+
+                if user:
+                    console.print(f"[yellow]User already exists for {lab['pi']} ({synthetic_orcid})[/yellow]")
+                else:
+                    user = User(
+                        orcid=synthetic_orcid,
+                        name=lab["pi"],
+                        access_status="allowed",
+                        onboarding_complete=True,
+                    )
+                    db.add(user)
+                    await db.flush()  # flushed before user.id is read below (presumably populates the PK — confirm)
+                    created_users += 1
+                    console.print(f"[green]Created user: {lab['pi']} ({synthetic_orcid})[/green]")
+
+                # --- AgentRegistry ---
+                result = await db.execute(
+                    select(AgentRegistry).where(AgentRegistry.agent_id == lab["id"])
+                )
+                agent_reg = result.scalar_one_or_none()
+
+                if agent_reg:
+                    if agent_reg.user_id is None:  # existing but unowned agent: attach it to the seeded user
+                        agent_reg.user_id = user.id
+                        console.print(f"[yellow]{lab['name']} already exists — linked to user[/yellow]")
+                    else:
+                        console.print(f"[yellow]{lab['name']} already exists — skipping[/yellow]")
+                    skipped += 1  # counts both the "linked" and the "skipping" case
+                else:
+                    agent_reg = AgentRegistry(
+                        agent_id=lab["id"],
+                        bot_name=lab["name"],
+                        pi_name=lab["pi"],
+                        user_id=user.id,
+                        status="active",
+                        approved_at=datetime.now(timezone.utc),
+                    )
+                    db.add(agent_reg)
+                    created_agents += 1
+                    console.print(f"[green]Created agent: {lab['name']} (status=active)[/green]")
+
+                # --- Optional profile job ---
+                if run_pipeline:  # runs for every selected lab, including ones whose rows already existed
+                    job = Job(
+                        type="generate_profile",
+                        user_id=user.id,
+                        payload={"user_id": str(user.id), "orcid": synthetic_orcid},
+                    )
+                    db.add(job)
+                    console.print(f"  [dim]Enqueued profile generation for {lab['pi']}[/dim]")
+
+            await db.commit()  # single commit covering every lab processed in this run
+            console.print(
+                f"\n[bold green]Done.[/bold green] "
+                f"Created {created_users} user(s), {created_agents} agent(s), skipped {skipped}."
+            )
+        await engine.dispose()  # NOTE(review): not reached if anything above raises — consider try/finally
+
+    _run(_seed())
+
+
 @app.command(name="backfill-profile-revisions")
 def backfill_profile_revisions():
     """Create initial ProfileRevision rows from existing profile files on disk."""
diff --git a/src/config.py b/src/config.py
index e6c3b8d..c3b0d21 100644
--- a/src/config.py
+++ b/src/config.py
@@ -18,6 +18,12 @@ class Settings(BaseSettings):
 
     # Anthropic
     anthropic_api_key: str = ""
+    # Set to e.g. http://localhost:8080 to route through a local proxy (CLIProxyAPI).
+    # Leave empty to use the Anthropic API directly.
+    anthropic_base_url: str = ""
+    # Set False when the endpoint does not support prompt caching (e.g. CLIProxyAPI).
+    # The code also auto-detects and disables caching on the first 400 error.
+    anthropic_prompt_caching: bool = True
 
     # NCBI
     ncbi_api_key: str = ""
@@ -38,39 +44,10 @@ class Settings(BaseSettings):
     notification_check_interval: int = 300  # seconds (5 minutes)
     inbound_poll_interval: int = 60  # seconds
 
-    # Slack tokens — one pair per agent
-    slack_bot_token_su: str = ""
-    slack_app_token_su: str = ""
-    slack_bot_token_wiseman: str = ""
-    slack_app_token_wiseman: str = ""
-    slack_bot_token_lotz: str = ""
-    slack_app_token_lotz: str = ""
-    slack_bot_token_cravatt: str = ""
-    slack_app_token_cravatt: str = ""
-    slack_bot_token_grotjahn: str = ""
-    slack_app_token_grotjahn: str = ""
-    slack_bot_token_petrascheck: str = ""
-    slack_app_token_petrascheck: str = ""
-    slack_bot_token_ken: str = ""
-    slack_app_token_ken: str = ""
-    slack_bot_token_racki: str = ""
-    slack_app_token_racki: str = ""
-    slack_bot_token_saez: str = ""
-    slack_app_token_saez: str = ""
-    slack_bot_token_wu: str = ""
-    slack_app_token_wu: str = ""
-    slack_bot_token_ward: str = ""
-    slack_app_token_ward: str = ""
-    slack_bot_token_briney: str = ""
-    slack_app_token_briney: str = ""
-    slack_bot_token_forli: str = ""
-    slack_app_token_forli: str = ""
-    slack_bot_token_deniz: str = ""
-    slack_app_token_deniz: str = ""
-    slack_bot_token_lairson: str = ""
-    slack_app_token_lairson: str = ""
-    slack_bot_token_grantbot: str = ""
-    slack_app_token_grantbot: str = ""
+    # Slack tokens are loaded dynamically from the environment — see get_slack_tokens().
+    # Add any number of agents to .env using the pattern:
+    #   SLACK_BOT_TOKEN_<AGENT_ID>=xoxb-...
+    #   SLACK_APP_TOKEN_<AGENT_ID>=xapp-...  (optional)
 
     # LLM models
     llm_profile_model: str = "claude-opus-4-6"
@@ -78,6 +55,31 @@ class Settings(BaseSettings):
     llm_agent_model_opus: str = "claude-opus-4-6"
     llm_agent_model_sonnet: str = "claude-sonnet-4-6"
 
+    # Mistral AI (podcast TTS)
+    mistral_api_key: str = ""
+    mistral_tts_model: str = "voxtral-mini-tts-latest"
+    mistral_tts_default_voice: str = ""
+
+    # OpenAI TTS
+    openai_api_key: str = ""
+    openai_tts_model: str = "tts-1"
+    openai_tts_default_voice: str = "alloy"
+
+    # Podcast TTS backend: "mistral" (default), "openai", or "local" (vLLM-Omni)
+    podcast_tts_backend: str = "mistral"
+
+    # Local vLLM-Omni TTS server
+    local_tts_host: str = "127.0.0.1"
+    local_tts_port: int = 8010
+    local_tts_model: str = "Qwen/Qwen2-Audio-7B-Instruct"
+    local_tts_voice: str = "default"
+
+    # Podcast
+    podcast_base_url: str = ""  # e.g. https://copi.science — for RSS enclosure URLs
+    podcast_search_window_days: int = 14
+    podcast_max_candidates: int = 50
+    podcast_normalize_audio: bool = False  # set true to run ffmpeg loudnorm after TTS
+
     # Worker
     worker_poll_interval: int = 5  # seconds
 
@@ -94,33 +96,34 @@ class Settings(BaseSettings):
     max_full_text_per_thread: int = 2
 
     def get_slack_tokens(self) -> dict[str, dict[str, str]]:
-        """Return slack tokens keyed by agent_id."""
-        return {
-            "su": {"bot": self.slack_bot_token_su, "app": self.slack_app_token_su},
-            "wiseman": {"bot": self.slack_bot_token_wiseman, "app": self.slack_app_token_wiseman},
-            "lotz": {"bot": self.slack_bot_token_lotz, "app": self.slack_app_token_lotz},
-            "cravatt": {
-                "bot": self.slack_bot_token_cravatt,
-                "app": self.slack_app_token_cravatt,
-            },
-            "grotjahn": {
-                "bot": self.slack_bot_token_grotjahn,
-                "app": self.slack_app_token_grotjahn,
-            },
-            "petrascheck": {
-                "bot": self.slack_bot_token_petrascheck,
-                "app": self.slack_app_token_petrascheck,
-            },
-            "ken": {"bot": self.slack_bot_token_ken, "app": self.slack_app_token_ken},
-            "racki": {"bot": self.slack_bot_token_racki, "app": self.slack_app_token_racki},
-            "saez": {"bot": self.slack_bot_token_saez, "app": self.slack_app_token_saez},
-            "wu": {"bot": self.slack_bot_token_wu, "app": self.slack_app_token_wu},
-            "ward": {"bot": self.slack_bot_token_ward, "app": self.slack_app_token_ward},
-            "briney": {"bot": self.slack_bot_token_briney, "app": self.slack_app_token_briney},
-            "forli": {"bot": self.slack_bot_token_forli, "app": self.slack_app_token_forli},
-            "deniz": {"bot": self.slack_bot_token_deniz, "app": self.slack_app_token_deniz},
-            "lairson": {"bot": self.slack_bot_token_lairson, "app": self.slack_app_token_lairson},
-        }
+        """Return Slack tokens keyed by agent_id.
+
+        Scans os.environ and the .env file for variables matching:
+            SLACK_BOT_TOKEN_<AGENT_ID>  →  tokens[agent_id]["bot"]
+            SLACK_APP_TOKEN_<AGENT_ID>  →  tokens[agent_id]["app"]
+
+        Agent IDs are lowercased from the suffix, so SLACK_BOT_TOKEN_SU → "su".
+        os.environ takes precedence over .env file values; empty values and empty suffixes are ignored.
+        """
+        import os
+
+        from dotenv import dotenv_values
+
+        # Merge: .env file is the base, actual environment variables override.
+        env: dict[str, str] = {**dotenv_values(".env"), **os.environ}  # type: ignore[arg-type]
+
+        prefixes = (("SLACK_BOT_TOKEN_", "bot"), ("SLACK_APP_TOKEN_", "app"))
+        tokens: dict[str, dict[str, str]] = {}
+        for key, val in env.items():
+            if not val:
+                continue
+            for prefix, kind in prefixes:
+                # Match on the key's own leading slice so matching and slicing stay aligned.
+                head, agent_id = key[:len(prefix)], key[len(prefix):].lower()
+                if head.upper() == prefix and agent_id:  # skip bare "SLACK_BOT_TOKEN_" keys
+                    tokens.setdefault(agent_id, {"bot": "", "app": ""})[kind] = val
+                    break
+        return tokens
 
 
 @lru_cache
diff --git a/src/dependencies.py b/src/dependencies.py
index 0291855..ff8e53e 100644
--- a/src/dependencies.py
+++ b/src/dependencies.py
@@ -16,6 +16,25 @@
 logger = logging.getLogger(__name__)
 
 
+async def get_optional_current_user(
+    request: Request,
+    db: AsyncSession = Depends(get_db),
+) -> User | None:
+    """Resolve the session's user, yielding None (never a redirect) when unauthenticated."""
+    raw_user_id = request.session.get("user_id")
+    if not raw_user_id:
+        return None
+    try:
+        parsed_id = uuid.UUID(raw_user_id)
+    except ValueError:
+        # Malformed id in the session: drop the whole session and treat as anonymous.
+        request.session.clear()
+        return None
+    stmt = select(User).options(selectinload(User.profile)).where(User.id == parsed_id)
+    lookup = await db.execute(stmt)
+    return lookup.scalar_one_or_none()
+
+
 async def get_current_user(
     request: Request,
     db: AsyncSession = Depends(get_db),
diff --git a/src/main.py b/src/main.py
index 73e9bb6..af14e50 100644
--- a/src/main.py
+++ b/src/main.py
@@ -11,7 +11,7 @@
 
 from src.config import get_settings
 from src.database import get_session_factory
-from src.routers import admin, agent_page, auth, invite, onboarding, profile, public
+from src.routers import admin, agent_page, auth, invite, onboarding, podcast, profile, proposals, public
 from src.routers import settings as settings_router
 
 logging.basicConfig(
@@ -111,9 +111,11 @@ def create_app() -> FastAPI:
     application.include_router(onboarding.router, prefix="/onboarding", tags=["onboarding"])
     application.include_router(profile.router, prefix="/profile", tags=["profile"])
     application.include_router(agent_page.router, prefix="/agent", tags=["agent"])
+    application.include_router(proposals.router, prefix="/proposals", tags=["proposals"])
     application.include_router(admin.router, prefix="/admin", tags=["admin"])
     application.include_router(invite.router, tags=["invite"])
     application.include_router(settings_router.router, prefix="/settings", tags=["settings"])
+    application.include_router(podcast.router, prefix="/podcast", tags=["podcast"])
 
     @application.get("/api/health")
     async def health():
@@ -124,3 +126,9 @@ async def health():
 
 
 app = create_app()
+
+
+@app.on_event("startup")  # registered on the module-level `app` created just above
+async def _warmup_voice_registry() -> None:  # startup hook: awaits one voice refresh
+    from src.podcast.voice_registry import refresh_voices  # function-scope import (presumably to defer loading — confirm)
+    await refresh_voices()  # NOTE(review): an exception here propagates out of the startup hook
diff --git a/src/models/__init__.py b/src/models/__init__.py
index 97249ff..3b121cd 100644
--- a/src/models/__init__.py
+++ b/src/models/__init__.py
@@ -4,11 +4,15 @@
 """
 
 from src.models.access import AccessAllowlist, WaitlistSignup
+from src.models.matchmaker import MatchmakerProposal
+from src.models.pi_proposal_evaluation import PiProposalEvaluation
 from src.models.agent_activity import AgentChannel, AgentMessage, LlmCallLog, SimulationRun, ThreadDecision
 from src.models.agent_registry import AgentRegistry, ProposalReview
 from src.models.delegate import AgentDelegate, DelegateInvitation
 from src.models.email_notification import EmailEngagementTracker, EmailNotification
 from src.models.job import Job
+from src.models.podcast import PodcastEpisode
+from src.models.podcast_preferences import PodcastPreferences
 from src.models.profile_revision import ProfileRevision
 from src.models.profile import ResearcherProfile
 from src.models.publication import Publication
@@ -31,6 +35,10 @@
     "EmailNotification",
     "EmailEngagementTracker",
     "ProfileRevision",
+    "PodcastEpisode",
+    "PodcastPreferences",
     "AccessAllowlist",
     "WaitlistSignup",
+    "MatchmakerProposal",
+    "PiProposalEvaluation",
 ]
diff --git a/src/models/agent_activity.py b/src/models/agent_activity.py
index c140031..e85345b 100644
--- a/src/models/agent_activity.py
+++ b/src/models/agent_activity.py
@@ -3,7 +3,7 @@
 import uuid
 from datetime import datetime
 
-from sqlalchemy import DateTime, Enum, Float, ForeignKey, Integer, String, Text, func
+from sqlalchemy import Boolean, DateTime, Enum, Float, ForeignKey, Integer, String, Text, func
 from sqlalchemy.dialects.postgresql import JSON, UUID
 from sqlalchemy.orm import Mapped, mapped_column, relationship
 
@@ -112,13 +112,14 @@ class LlmCallLog(Base):
     id: Mapped[uuid.UUID] = mapped_column(
         UUID(as_uuid=True), primary_key=True, default=uuid.uuid4
     )
-    simulation_run_id: Mapped[uuid.UUID] = mapped_column(
+    simulation_run_id: Mapped[uuid.UUID | None] = mapped_column(
         UUID(as_uuid=True),
         ForeignKey("simulation_runs.id", ondelete="CASCADE"),
-        nullable=False,
+        nullable=True,
     )
     agent_id: Mapped[str] = mapped_column(String(50), nullable=False)
-    phase: Mapped[str] = mapped_column(String(30), nullable=False)  # decide, respond, kickstart, memory
+    # phase values: decide, respond, kickstart, memory, podcast_select, podcast_summarize
+    phase: Mapped[str] = mapped_column(String(30), nullable=False)
     channel: Mapped[str | None] = mapped_column(String(100), nullable=True)
     model: Mapped[str] = mapped_column(String(100), nullable=False)
     system_prompt: Mapped[str] = mapped_column(Text, nullable=False)
@@ -132,7 +133,7 @@ class LlmCallLog(Base):
     )
 
     # Relationships
-    simulation_run: Mapped["SimulationRun"] = relationship(
+    simulation_run: Mapped["SimulationRun | None"] = relationship(
         "SimulationRun", back_populates="llm_call_logs"
     )
 
@@ -163,6 +164,7 @@ class ThreadDecision(Base):
     decided_at: Mapped[datetime] = mapped_column(
         DateTime(timezone=True), server_default=func.now(), nullable=False
     )
+    hidden: Mapped[bool] = mapped_column(Boolean, nullable=False, default=False, server_default="false")
 
     def __repr__(self) -> str:
         return f"<ThreadDecision thread={self.thread_id} outcome={self.outcome}>"
diff --git a/src/models/agent_registry.py b/src/models/agent_registry.py
index a159c52..8f022be 100644
--- a/src/models/agent_registry.py
+++ b/src/models/agent_registry.py
@@ -43,6 +43,9 @@ class AgentRegistry(Base):
         ForeignKey("users.id", ondelete="SET NULL"),
         nullable=True,
     )
+    is_paused: Mapped[bool] = mapped_column(
+        nullable=False, default=False, server_default="false"
+    )
 
     # Relationships
     user: Mapped["User | None"] = relationship(
diff --git a/src/models/matchmaker.py b/src/models/matchmaker.py
new file mode 100644
index 0000000..05e455c
--- /dev/null
+++ b/src/models/matchmaker.py
@@ -0,0 +1,60 @@
+"""MatchmakerProposal model.
+
+Proposals can be created two ways:
+  1. Admin web UI — pi_a_id / pi_b_id are set (FK → users); pi_a_name / pi_b_name left null.
+  2. CLI script    — pi_a_name / pi_b_name are set (from profiles/ filenames); FKs left null.
+
+Templates use pi_a.name if the FK is populated, otherwise fall back to pi_a_name.
+"""
+
+import uuid
+from datetime import datetime
+
+from sqlalchemy import Boolean, DateTime, ForeignKey, Integer, String, Text, func
+from sqlalchemy.dialects.postgresql import UUID
+from sqlalchemy.orm import Mapped, mapped_column, relationship
+
+from src.database import Base
+
+
+class MatchmakerProposal(Base):
+    __tablename__ = "matchmaker_proposals"
+
+    id: Mapped[uuid.UUID] = mapped_column(
+        UUID(as_uuid=True), primary_key=True, default=uuid.uuid4
+    )
+    # Web-UI path: FK to users table
+    pi_a_id: Mapped[uuid.UUID | None] = mapped_column(
+        UUID(as_uuid=True), ForeignKey("users.id", ondelete="CASCADE"), nullable=True, index=True
+    )
+    pi_b_id: Mapped[uuid.UUID | None] = mapped_column(
+        UUID(as_uuid=True), ForeignKey("users.id", ondelete="CASCADE"), nullable=True, index=True
+    )
+    # CLI path: display name from profile filename / header
+    pi_a_name: Mapped[str | None] = mapped_column(String(255), nullable=True)
+    pi_b_name: Mapped[str | None] = mapped_column(String(255), nullable=True)
+
+    proposal_md: Mapped[str] = mapped_column(Text, nullable=False)
+    title: Mapped[str] = mapped_column(String(500), nullable=False)
+    confidence: Mapped[str] = mapped_column(String(20), nullable=False)  # high / moderate / speculative
+    llm_model: Mapped[str] = mapped_column(String(100), nullable=False)
+    input_tokens: Mapped[int | None] = mapped_column(Integer, nullable=True)
+    output_tokens: Mapped[int | None] = mapped_column(Integer, nullable=True)
+    generated_at: Mapped[datetime] = mapped_column(
+        DateTime(timezone=True), server_default=func.now(), nullable=False
+    )
+    hidden: Mapped[bool] = mapped_column(Boolean, nullable=False, default=False, server_default="false")
+
+    pi_a: Mapped["User | None"] = relationship("User", foreign_keys=[pi_a_id])
+    pi_b: Mapped["User | None"] = relationship("User", foreign_keys=[pi_b_id])
+
+    @property
+    def name_a(self) -> str:
+        return self.pi_a.name if self.pi_a else (self.pi_a_name or "Unknown")
+
+    @property
+    def name_b(self) -> str:
+        return self.pi_b.name if self.pi_b else (self.pi_b_name or "Unknown")
+
+    def __repr__(self) -> str:
+        return f"<MatchmakerProposal {self.name_a!r} × {self.name_b!r} confidence={self.confidence}>"
diff --git a/src/models/pi_proposal_evaluation.py b/src/models/pi_proposal_evaluation.py
new file mode 100644
index 0000000..2872d5c
--- /dev/null
+++ b/src/models/pi_proposal_evaluation.py
@@ -0,0 +1,95 @@
+"""PiProposalEvaluation model.
+
+NIH-style 1-9 evaluations submitted by PIs through the /proposals tab.
+Separate from ProposalReview (the 1-4 agent-blocking system).
+"""
+
+import uuid
+from datetime import datetime
+
+from sqlalchemy import (
+    CheckConstraint,
+    DateTime,
+    ForeignKey,
+    SmallInteger,
+    String,
+    Text,
+    UniqueConstraint,
+    func,
+)
+from sqlalchemy.dialects.postgresql import UUID
+from sqlalchemy.orm import Mapped, mapped_column, relationship
+
+from src.database import Base
+
+
+class PiProposalEvaluation(Base):
+    __tablename__ = "pi_proposal_evaluations"
+
+    id: Mapped[uuid.UUID] = mapped_column(
+        UUID(as_uuid=True), primary_key=True, default=uuid.uuid4
+    )
+    user_id: Mapped[uuid.UUID] = mapped_column(
+        UUID(as_uuid=True), ForeignKey("users.id", ondelete="CASCADE"), nullable=False, index=True
+    )
+    # "agent" | "matchmaker" — stored for admin analysis, never shown to the PI
+    proposal_type: Mapped[str] = mapped_column(String(20), nullable=False)
+    thread_decision_id: Mapped[uuid.UUID | None] = mapped_column(
+        UUID(as_uuid=True),
+        ForeignKey("thread_decisions.id", ondelete="CASCADE"),
+        nullable=True,
+        index=True,
+    )
+    matchmaker_proposal_id: Mapped[uuid.UUID | None] = mapped_column(
+        UUID(as_uuid=True),
+        ForeignKey("matchmaker_proposals.id", ondelete="CASCADE"),
+        nullable=True,
+        index=True,
+    )
+
+    # NIH criterion scores (1–9) — nullable; currently hidden from the PI form
+    score_significance: Mapped[int | None] = mapped_column(SmallInteger, nullable=True)
+    score_innovation: Mapped[int | None] = mapped_column(SmallInteger, nullable=True)
+    score_approach: Mapped[int | None] = mapped_column(SmallInteger, nullable=True)
+    score_investigators: Mapped[int | None] = mapped_column(SmallInteger, nullable=True)
+    score_environment: Mapped[int | None] = mapped_column(SmallInteger, nullable=True)
+    # Overall impact is holistic — not an average of the five criteria; it is the only required score
+    score_overall_impact: Mapped[int] = mapped_column(SmallInteger, nullable=False)
+
+    comments_significance: Mapped[str | None] = mapped_column(Text, nullable=True)
+    comments_innovation: Mapped[str | None] = mapped_column(Text, nullable=True)
+    comments_approach: Mapped[str | None] = mapped_column(Text, nullable=True)
+    comments_investigators: Mapped[str | None] = mapped_column(Text, nullable=True)
+    comments_environment: Mapped[str | None] = mapped_column(Text, nullable=True)
+    comments_overall: Mapped[str | None] = mapped_column(Text, nullable=True)
+
+    evaluated_at: Mapped[datetime] = mapped_column(
+        DateTime(timezone=True), server_default=func.now(), nullable=False
+    )
+    updated_at: Mapped[datetime | None] = mapped_column(DateTime(timezone=True), nullable=True)  # NOTE(review): no default/onupdate — presumably set by the upsert code; confirm
+
+    # Relationships
+    user: Mapped["User"] = relationship("User", foreign_keys=[user_id])
+    thread_decision: Mapped["ThreadDecision | None"] = relationship("ThreadDecision")
+    matchmaker_proposal: Mapped["MatchmakerProposal | None"] = relationship("MatchmakerProposal")
+
+    __table_args__ = (
+        CheckConstraint("proposal_type IN ('agent', 'matchmaker')", name="ck_ppe_proposal_type"),
+        CheckConstraint(
+            "thread_decision_id IS NOT NULL OR matchmaker_proposal_id IS NOT NULL",  # at least one target; both being set is not rejected
+            name="ck_ppe_proposal_present",
+        ),
+        CheckConstraint("score_significance BETWEEN 1 AND 9", name="ck_ppe_score_significance"),
+        CheckConstraint("score_innovation BETWEEN 1 AND 9", name="ck_ppe_score_innovation"),
+        CheckConstraint("score_approach BETWEEN 1 AND 9", name="ck_ppe_score_approach"),
+        CheckConstraint("score_investigators BETWEEN 1 AND 9", name="ck_ppe_score_investigators"),
+        CheckConstraint("score_environment BETWEEN 1 AND 9", name="ck_ppe_score_environment"),
+        CheckConstraint("score_overall_impact BETWEEN 1 AND 9", name="ck_ppe_score_overall_impact"),
+        # One evaluation per user per proposal (upsert replaces rather than duplicates); rows whose FK is NULL never collide in PostgreSQL
+        UniqueConstraint("user_id", "thread_decision_id", name="uq_ppe_user_thread"),
+        UniqueConstraint("user_id", "matchmaker_proposal_id", name="uq_ppe_user_matchmaker"),
+        {},  # trailing dict holds table keyword options (none set)
+    )
+
+    def __repr__(self) -> str:
+        return f"<PiProposalEvaluation user={self.user_id} impact={self.score_overall_impact}>"
diff --git a/src/models/podcast.py b/src/models/podcast.py
new file mode 100644
index 0000000..633eb60
--- /dev/null
+++ b/src/models/podcast.py
@@ -0,0 +1,61 @@
+"""PodcastEpisode model.
+
+Episodes are keyed by either agent_id (pilot-lab agents) or user_id (plain
+ORCID users).  Exactly one should be set per row.
+
+Uniqueness constraints:
+  - uq_podcast_agent_date: one episode per agent per day (agent path)
+  - ix_podcast_episodes_user_date: partial unique index (user path, via migration 0013)
+"""
+
+import uuid
+from datetime import date, datetime
+
+from sqlalchemy import Boolean, Date, DateTime, ForeignKey, Integer, String, Text, UniqueConstraint, func
+from sqlalchemy.dialects.postgresql import UUID
+from sqlalchemy.orm import Mapped, mapped_column
+
+from src.database import Base
+
+
+class PodcastEpisode(Base):
+    __tablename__ = "podcast_episodes"
+
+    id: Mapped[uuid.UUID] = mapped_column(
+        UUID(as_uuid=True), primary_key=True, default=uuid.uuid4
+    )
+    # For pilot-lab agents (legacy path) — nullable to support user-only episodes
+    agent_id: Mapped[str | None] = mapped_column(String(50), nullable=True, index=True)
+    # For plain ORCID users (no agent required)
+    user_id: Mapped[uuid.UUID | None] = mapped_column(
+        UUID(as_uuid=True),
+        ForeignKey("users.id", ondelete="CASCADE"),
+        nullable=True,
+        index=True,
+    )
+    episode_date: Mapped[date] = mapped_column(Date, nullable=False)
+    pmid: Mapped[str] = mapped_column(String(100), nullable=False)
+    paper_title: Mapped[str] = mapped_column(String(500), nullable=False)
+    paper_authors: Mapped[str] = mapped_column(String(500), nullable=False)
+    paper_journal: Mapped[str] = mapped_column(String(255), nullable=False)
+    paper_year: Mapped[int] = mapped_column(Integer, nullable=False)
+    paper_url: Mapped[str | None] = mapped_column(String(1000), nullable=True)
+    text_summary: Mapped[str] = mapped_column(Text, nullable=False)
+    audio_file_path: Mapped[str | None] = mapped_column(String(500), nullable=True)
+    audio_duration_seconds: Mapped[int | None] = mapped_column(Integer, nullable=True)
+    slack_delivered: Mapped[bool] = mapped_column(Boolean, default=False, nullable=False)  # client-side default only (no server_default)
+    selection_justification: Mapped[str] = mapped_column(Text, nullable=False)
+    created_at: Mapped[datetime] = mapped_column(
+        DateTime(timezone=True), server_default=func.now(), nullable=False
+    )
+
+    __table_args__ = (
+        # Agent-path uniqueness (PostgreSQL ignores NULLs in UNIQUE constraints,
+        # so this only enforces uniqueness when agent_id IS NOT NULL)
+        UniqueConstraint("agent_id", "episode_date", name="uq_podcast_agent_date"),
+        # User-path uniqueness is enforced by the partial index created in migration 0013 (not declared on this model)
+    )
+
+    def __repr__(self) -> str:
+        key = f"agent={self.agent_id}" if self.agent_id else f"user={self.user_id}"  # user key whenever agent_id is unset or empty
+        return f"<PodcastEpisode {key} date={self.episode_date} pmid={self.pmid}>"
diff --git a/src/models/podcast_preferences.py b/src/models/podcast_preferences.py
new file mode 100644
index 0000000..9ae6029
--- /dev/null
+++ b/src/models/podcast_preferences.py
@@ -0,0 +1,53 @@
+"""PodcastPreferences model — per-agent or per-user podcast customization.
+
+Rows are keyed by either agent_id (for approved pilot-lab agents) or user_id
+(for any user who has completed ORCID onboarding).  Exactly one of the two
+should be set on each row; both being set is invalid.
+"""
+
+import uuid
+from datetime import datetime
+
+from sqlalchemy import Boolean, DateTime, ForeignKey, String, func
+from sqlalchemy.dialects.postgresql import ARRAY, UUID
+from sqlalchemy.orm import Mapped, mapped_column
+
+from src.database import Base
+
+
+class PodcastPreferences(Base):
+    __tablename__ = "podcast_preferences"
+
+    id: Mapped[uuid.UUID] = mapped_column(
+        UUID(as_uuid=True), primary_key=True, default=uuid.uuid4
+    )
+    # For pilot-lab agents (legacy path); unique, so at most one preferences row per agent
+    agent_id: Mapped[str | None] = mapped_column(String(50), nullable=True, unique=True, index=True)
+    # For plain ORCID users (no agent required); unique, so at most one preferences row per user
+    user_id: Mapped[uuid.UUID | None] = mapped_column(
+        UUID(as_uuid=True),
+        ForeignKey("users.id", ondelete="CASCADE"),
+        nullable=True,
+        unique=True,
+        index=True,
+    )
+    voice_id: Mapped[str | None] = mapped_column(String(100), nullable=True)
+    extra_keywords: Mapped[list[str]] = mapped_column(
+        ARRAY(String), nullable=False, server_default="{}"  # server-side default only: unset on a new instance until the row is loaded back
+    )
+    preferred_journals: Mapped[list[str]] = mapped_column(
+        ARRAY(String), nullable=False, server_default="{}"
+    )
+    deprioritized_journals: Mapped[list[str]] = mapped_column(
+        ARRAY(String), nullable=False, server_default="{}"
+    )
+    podcast_enabled: Mapped[bool] = mapped_column(
+        Boolean, nullable=False, default=False, server_default="false"  # opt-in: disabled unless explicitly enabled
+    )
+    updated_at: Mapped[datetime] = mapped_column(
+        DateTime(timezone=True), server_default=func.now(), onupdate=func.now(), nullable=False
+    )
+
+    def __repr__(self) -> str:
+        key = f"agent={self.agent_id}" if self.agent_id else f"user={self.user_id}"  # user key whenever agent_id is unset or empty
+        return f"<PodcastPreferences {key} voice={self.voice_id}>"
diff --git a/src/podcast/__init__.py b/src/podcast/__init__.py
new file mode 100644
index 0000000..e69de29
diff --git a/src/podcast/local_tts.py b/src/podcast/local_tts.py
new file mode 100644
index 0000000..104c05a
--- /dev/null
+++ b/src/podcast/local_tts.py
@@ -0,0 +1,101 @@
+"""Local TTS backend using a vLLM-Omni server.
+
+vLLM-Omni exposes an OpenAI-compatible /v1/audio/speech endpoint that accepts
+the same JSON payload as OpenAI TTS and returns raw audio bytes directly.
+
+Start a vLLM-Omni server with, e.g.:
+    vllm serve Qwen/Qwen2-Audio-7B-Instruct --port 8010
+
+Then set in .env:
+    PODCAST_TTS_BACKEND=local
+    LOCAL_TTS_HOST=127.0.0.1
+    LOCAL_TTS_PORT=8010
+    LOCAL_TTS_MODEL=Qwen/Qwen2-Audio-7B-Instruct
+    LOCAL_TTS_VOICE=default
+"""
+
+import json
+import logging
+from pathlib import Path
+
+import httpx
+
+from src.config import get_settings
+from src.podcast.tts_utils import get_audio_duration_seconds, normalize_audio, strip_markdown
+
+logger = logging.getLogger(__name__)
+
+VOICES_FILE = Path("data/podcast_voices.json")
+
+__all__ = ["generate_audio", "get_audio_duration_seconds"]
+
+
+def _get_local_tts_url() -> str:
+    settings = get_settings()
+    return f"http://{settings.local_tts_host}:{settings.local_tts_port}/v1/audio/speech"
+
+
+def get_voice(agent_id: str, voice_override: str | None = None) -> str:
+    """Return the TTS voice for an agent.
+
+    Priority: voice_override (from DB preferences) → podcast_voices.json → env default.
+    """
+    if voice_override:
+        return voice_override
+    settings = get_settings()
+    if VOICES_FILE.exists():
+        try:
+            voices = json.loads(VOICES_FILE.read_text(encoding="utf-8"))
+            if agent_id in voices:
+                return voices[agent_id]
+        except Exception as exc:
+            logger.warning("Failed to load podcast_voices.json: %s", exc)
+    return settings.local_tts_voice or "default"
+
+
+async def generate_audio(
+    text: str, agent_id: str, output_path: Path, voice_override: str | None = None
+) -> bool:
+    """Generate TTS audio via a local vLLM-Omni server and save to output_path.
+
+    The server must expose an OpenAI-compatible /v1/audio/speech endpoint
+    that returns raw audio bytes.
+
+    Returns True on success, False on failure.
+    """
+    settings = get_settings()
+    url = _get_local_tts_url()
+    voice = get_voice(agent_id, voice_override=voice_override)
+    clean_text = strip_markdown(text)
+
+    payload = {
+        "model": settings.local_tts_model,
+        "input": clean_text,
+        "voice": voice,
+        "response_format": "mp3",
+    }
+    headers = {"Content-Type": "application/json"}
+
+    logger.info("Local TTS request to %s (model=%s, voice=%s)", url, settings.local_tts_model, voice)
+
+    try:
+        async with httpx.AsyncClient(timeout=300) as client:
+            resp = await client.post(url, json=payload, headers=headers)
+            if not resp.is_success:
+                logger.error("Local TTS error %s: %s", resp.status_code, resp.text)
+            resp.raise_for_status()
+
+        output_path.parent.mkdir(parents=True, exist_ok=True)
+        output_path.write_bytes(resp.content)
+        logger.info("Audio saved to %s (%d bytes)", output_path, len(resp.content))
+        if settings.podcast_normalize_audio:
+            normalize_audio(output_path)
+        return True
+    except httpx.ConnectError:
+        logger.error(
+            "Could not connect to local TTS server at %s — is vLLM-Omni running?", url
+        )
+        return False
+    except Exception as exc:
+        logger.error("Local TTS failed for agent %s: %s", agent_id, exc)
+        return False
diff --git a/src/podcast/main.py b/src/podcast/main.py
new file mode 100644
index 0000000..f6ba276
--- /dev/null
+++ b/src/podcast/main.py
@@ -0,0 +1,352 @@
+"""LabBot Podcast — daily personalized research briefings for each PI.
+
+Usage:
+    python -m src.podcast.main            # run once for all pending recipients
+    python -m src.podcast.main scheduler  # long-running daily scheduler
+
+Scheduler behaviour
+-------------------
+Recipients (agents + opted-in users) are processed one at a time.
+
+Window mode (default 00:00–03:00 UTC):
+    Each recipient is processed in turn; the scheduler sleeps between each so
+    that the full cohort is spread evenly across the window.  Agents are
+    processed first, then users.
+
+Catch-up mode (any time outside the window):
+    If the container starts and any recipient is missing today's episode the
+    scheduler processes all of them immediately with a short pause between
+    each.  This covers restarts after a crash or a missed window.
+
+Per-recipient completion is checked via the DB (PodcastEpisode.episode_date ==
+today) rather than a single global flag, so a partial run or a crash is
+automatically resumed on the next boot.
+"""
+
+import asyncio
+import logging
+from datetime import date, datetime, timedelta, timezone
+
+import typer
+
+from src.config import get_settings
+
+logging.basicConfig(
+    level=logging.INFO,
+    format="%(asctime)s %(levelname)s %(name)s: %(message)s",
+)
+logger = logging.getLogger(__name__)
+
+app = typer.Typer(invoke_without_command=True)
+
+# Minimum seconds between recipients during the stagger window.
+_MIN_STAGGER_SECS = 60
+# Seconds between recipients during catch-up (outside window).
+_CATCHUP_PAUSE_SECS = 60
+# Maximum sleep between "all done" checks (so newly opted-in users aren't
+# delayed more than this many seconds into the next day).
+_MAX_IDLE_SLEEP_SECS = 4 * 3600
+
+
+# ---------------------------------------------------------------------------
+# Per-recipient helpers
+# ---------------------------------------------------------------------------
+
+async def _get_pending_recipients(today: date) -> tuple[list, list]:
+    """Return (pending_agents, pending_users) who have no episode for today.
+
+    Agents are active, podcast-enabled AgentRegistry rows; users are opted-in User
+    rows (.profile pre-loaded) not already covered by an agent and with a research
+    summary.  Both lists are sorted by id so the order is stable across restarts.
+    """
+    from sqlalchemy import select
+    from sqlalchemy.orm import selectinload
+
+    from src.database import get_session_factory
+    from src.models.agent_registry import AgentRegistry
+    from src.models.podcast import PodcastEpisode
+    from src.models.podcast_preferences import PodcastPreferences
+    from src.models.user import User
+
+    session_factory = get_session_factory()
+    async with session_factory() as db:
+        # Agents already done today
+        done_agents_res = await db.execute(
+            select(PodcastEpisode.agent_id).where(
+                PodcastEpisode.episode_date == today,
+                PodcastEpisode.agent_id.is_not(None),
+            )
+        )
+        done_agent_ids = {r[0] for r in done_agents_res}
+
+        # Users already done today
+        done_users_res = await db.execute(
+            select(PodcastEpisode.user_id).where(
+                PodcastEpisode.episode_date == today,
+                PodcastEpisode.user_id.is_not(None),
+            )
+        )
+        done_user_ids = {r[0] for r in done_users_res}
+
+        # Active agents where podcast is explicitly opted in (INNER JOIN —
+        # agents with no prefs row or podcast_enabled=False are excluded).
+        agents_res = await db.execute(
+            select(AgentRegistry)
+            .join(
+                PodcastPreferences,
+                PodcastPreferences.agent_id == AgentRegistry.agent_id,
+            )
+            .where(
+                AgentRegistry.status == "active",  # NOTE(review): AgentRegistry.is_paused is not consulted — confirm paused agents should still get episodes
+                PodcastPreferences.podcast_enabled.is_(True),
+            )
+        )
+        all_agents = agents_res.scalars().all()
+        pending_agents = sorted(
+            [a for a in all_agents if a.agent_id not in done_agent_ids],
+            key=lambda a: a.agent_id,
+        )
+
+        # user_ids covered by the agent path — skip in the user loop (built from all opted-in agents, done or not)
+        agent_user_ids = {a.user_id for a in all_agents if a.user_id is not None}
+
+        # Opted-in users who completed onboarding; done / agent-covered users are filtered out in Python below
+        users_res = await db.execute(
+            select(User)
+            .join(PodcastPreferences, PodcastPreferences.user_id == User.id)
+            .options(selectinload(User.profile))
+            .where(
+                User.onboarding_complete.is_(True),
+                PodcastPreferences.podcast_enabled.is_(True),
+            )
+        )
+        all_opted_in = users_res.scalars().all()
+        pending_users = sorted(
+            [
+                u for u in all_opted_in
+                if u.id not in agent_user_ids
+                and u.id not in done_user_ids
+                and u.profile is not None
+                and u.profile.research_summary  # users with no (or an empty) research summary are skipped
+            ],
+            key=lambda u: str(u.id),
+        )
+
+    return pending_agents, pending_users
+
+
+async def _process_agent(agent) -> bool:
+    """Run the full pipeline for one agent in its own DB session."""
+    from src.database import get_session_factory
+    from src.podcast.pipeline import run_pipeline_for_agent
+
+    settings = get_settings()
+    slack_tokens = settings.get_slack_tokens()
+    tokens = slack_tokens.get(agent.agent_id, {})
+    bot_token = agent.slack_bot_token or tokens.get("bot", "")
+
+    session_factory = get_session_factory()
+    try:
+        async with session_factory() as db:
+            ok = await run_pipeline_for_agent(
+                agent_id=agent.agent_id,
+                bot_name=agent.bot_name,
+                pi_name=agent.pi_name,
+                bot_token=bot_token,
+                slack_user_id=agent.slack_user_id,
+                db_session=db,
+            )
+            await db.commit()
+        return ok
+    except Exception as exc:
+        logger.error("Pipeline failed for agent %s: %s", agent.agent_id, exc, exc_info=True)
+        return False
+
+
+async def _process_user(user) -> bool:
+    """Run the full pipeline for one plain user in its own DB session."""
+    from src.database import get_session_factory
+    from src.podcast.pipeline import run_podcast_for_user
+
+    session_factory = get_session_factory()
+    try:
+        async with session_factory() as db:
+            ok = await run_podcast_for_user(user_id=user.id, db_session=db)
+            await db.commit()
+        return ok
+    except Exception as exc:
+        logger.error("Pipeline failed for user %s: %s", user.id, exc, exc_info=True)
+        return False
+
+
+def _seconds_until_window(now: datetime, window_start_hour: int) -> int:
+    """Seconds until the next opening of the daily generation window."""
+    target = now.replace(hour=window_start_hour, minute=0, second=0, microsecond=0)
+    if target <= now:
+        target += timedelta(days=1)
+    return max(60, int((target - now).total_seconds()))
+
+
+# ---------------------------------------------------------------------------
+# One-shot batch runner (used by the 'main' command and legacy callers)
+# ---------------------------------------------------------------------------
+
+async def run_podcast(dry_run: bool = False) -> list[str]:
+    """Run the podcast pipeline for all pending recipients today.
+
+    Returns list of identifiers (agent_ids + "user:<uuid>") that produced
+    episodes.  Already-completed recipients (episode exists for today) are
+    skipped automatically.
+    """
+    today = datetime.now(timezone.utc).date()
+    pending_agents, pending_users = await _get_pending_recipients(today)
+    produced: list[str] = []
+
+    for agent in pending_agents:
+        if dry_run:
+            logger.info("DRY RUN — would run pipeline for agent: %s", agent.agent_id)
+            continue
+        ok = await _process_agent(agent)
+        if ok:
+            produced.append(agent.agent_id)
+
+    for user in pending_users:
+        if dry_run:
+            logger.info("DRY RUN — would run pipeline for user: %s (%s)", user.id, user.name)
+            continue
+        ok = await _process_user(user)
+        if ok:
+            produced.append(f"user:{user.id}")
+
+    logger.info("Podcast run complete: %d episodes produced", len(produced))
+    return produced
+
+
+# ---------------------------------------------------------------------------
+# Long-running scheduler
+# ---------------------------------------------------------------------------
+
+async def _scheduler_loop(window_start: int, window_end: int) -> None:
+    """Single long-lived event loop for the daily scheduler.
+
+    Keeping a single asyncio.run() call avoids the "Future attached to a
+    different loop" errors that arise if asyncio.run() is called in a tight
+    while-loop (each call creates a new event loop and the SQLAlchemy asyncpg
+    engine is bound to the one that created it).
+    """
+    logger.info(
+        "Podcast scheduler started (window=%02d:00–%02d:00 UTC)", window_start, window_end
+    )
+
+    while True:
+        now = datetime.now(timezone.utc)
+        today = now.date()
+
+        pending_agents, pending_users = await _get_pending_recipients(today)
+        total_pending = len(pending_agents) + len(pending_users)
+
+        if total_pending == 0:
+            sleep_secs = _seconds_until_window(now, window_start)
+            logger.info(
+                "All episodes generated for %s. Sleeping %ds until %02d:00 UTC.",
+                today, min(sleep_secs, _MAX_IDLE_SLEEP_SECS), window_start,
+            )
+            await asyncio.sleep(min(sleep_secs, _MAX_IDLE_SLEEP_SECS))
+            continue
+
+        in_window = window_start <= now.hour < window_end
+
+        if in_window:
+            # Spread remaining recipients evenly across the remaining window.
+            window_end_dt = now.replace(hour=window_end, minute=0, second=0, microsecond=0)
+            remaining_secs = max(0, int((window_end_dt - now).total_seconds()))
+            stagger_delay = max(_MIN_STAGGER_SECS, remaining_secs // total_pending)
+
+            # Process one recipient — agents first, then users.
+            if pending_agents:
+                agent = pending_agents[0]
+                logger.info(
+                    "[window] Agent %s (%d remaining, next in %ds)",
+                    agent.agent_id, total_pending, stagger_delay,
+                )
+                await _process_agent(agent)
+            else:
+                user = pending_users[0]
+                logger.info(
+                    "[window] User %s (%d remaining, next in %ds)",
+                    user.id, total_pending, stagger_delay,
+                )
+                await _process_user(user)
+
+            await asyncio.sleep(stagger_delay)
+
+        else:
+            # Outside window — catch-up: process all with a short pause between.
+            logger.info(
+                "[catchup] %d recipients missing today's episode — running immediately",
+                total_pending,
+            )
+            all_pending = [("agent", a) for a in pending_agents] + [("user", u) for u in pending_users]
+            for i, (kind, recipient) in enumerate(all_pending):
+                if kind == "agent":
+                    logger.info(
+                        "[catchup] Agent %s (%d/%d)", recipient.agent_id, i + 1, total_pending
+                    )
+                    await _process_agent(recipient)
+                else:
+                    logger.info(
+                        "[catchup] User %s (%d/%d)", recipient.id, i + 1, total_pending
+                    )
+                    await _process_user(recipient)
+                if i < total_pending - 1:
+                    await asyncio.sleep(_CATCHUP_PAUSE_SECS)
+
+            now = datetime.now(timezone.utc)
+            sleep_secs = _seconds_until_window(now, window_start)
+            logger.info(
+                "[catchup] Done. Sleeping %ds until %02d:00 UTC.",
+                min(sleep_secs, _MAX_IDLE_SLEEP_SECS), window_start,
+            )
+            await asyncio.sleep(min(sleep_secs, _MAX_IDLE_SLEEP_SECS))
+
+
+# ---------------------------------------------------------------------------
+# CLI commands
+# ---------------------------------------------------------------------------
+
+@app.command()
+def main(
+    dry_run: bool = typer.Option(False, "--dry-run", help="Preview without posting or generating audio"),
+):
+    """Run the podcast pipeline once for all pending recipients today."""
+    results = asyncio.run(run_podcast(dry_run=dry_run))
+    if results:
+        typer.echo(f"\nProduced {len(results)} episodes:")
+        for aid in results:
+            typer.echo(f"  {aid}")
+    else:
+        typer.echo("No episodes produced.")
+
+
+@app.command("scheduler")
+def scheduler(
+    window_start: int = typer.Option(0, "--window-start", help="UTC hour to begin staggered generation (default midnight)"),
+    window_end: int = typer.Option(3, "--window-end", help="UTC hour to finish staggered generation (default 3am)"),
+):
+    """Long-running daily scheduler.
+
+    During the window (default 00:00–03:00 UTC) recipients are processed one at
+    a time with an adaptive delay so that the full cohort is spread evenly across
+    the window.
+
+    If the container starts outside the window and any recipient is missing
+    today's episode, all pending recipients are processed immediately (catch-up).
+    """
+    if not (0 <= window_start < window_end <= 24):
+        typer.echo(f"Invalid window: {window_start}–{window_end}. window_start must be < window_end.", err=True)
+        raise typer.Exit(1)
+    asyncio.run(_scheduler_loop(window_start, window_end))
+
+
+if __name__ == "__main__":
+    app()
diff --git a/src/podcast/mistral_tts.py b/src/podcast/mistral_tts.py
new file mode 100644
index 0000000..f061806
--- /dev/null
+++ b/src/podcast/mistral_tts.py
@@ -0,0 +1,105 @@
+"""Mistral AI TTS client wrapper."""
+
+import base64
+import json
+import logging
+from pathlib import Path
+
+import httpx
+
+from src.config import get_settings
+from src.podcast.tts_utils import get_audio_duration_seconds, normalize_audio, strip_markdown
+
+logger = logging.getLogger(__name__)
+
+VOICES_FILE = Path("data/podcast_voices.json")  # relative path; read by get_voice() for per-agent voices
+MISTRAL_TTS_URL = "https://api.mistral.ai/v1/audio/speech"  # endpoint POSTed to by generate_audio()
+
+__all__ = ["generate_audio", "get_audio_duration_seconds"]  # second name is re-exported from tts_utils
+
+
+def _get_default_voice() -> str:
+    """Pick the fallback voice: the configured default, else the first cached voice, else "en_paul_neutral"."""
+    configured = get_settings().mistral_tts_default_voice
+    if configured:
+        return configured
+    from src.podcast.voice_registry import get_cached_voices
+    voices = get_cached_voices("mistral")
+    return voices[0][0] if voices else "en_paul_neutral"
+
+
+def get_voice(agent_id: str, voice_override: str | None = None) -> str:
+    """Resolve the TTS voice to use for ``agent_id``.
+
+    Lookup order: voice_override (from DB preferences), then podcast_voices.json, then the default voice.
+    """
+    if voice_override:
+        return voice_override
+    if VOICES_FILE.exists():
+        try:
+            voice_map = json.loads(VOICES_FILE.read_text(encoding="utf-8"))
+            if agent_id in voice_map:
+                return voice_map[agent_id]
+        except Exception as err:
+            logger.warning("Failed to load podcast_voices.json: %s", err)
+    return _get_default_voice()
+
+
+async def generate_audio(
+    text: str, agent_id: str, output_path: Path, voice_override: str | None = None
+) -> bool:
+    """Generate TTS audio via Mistral AI and save to output_path.
+
+    Returns True on success; False (after logging) if the API key is unset or any step raises.
+    """
+    settings = get_settings()
+    if not settings.mistral_api_key:
+        logger.warning("MISTRAL_API_KEY not set — skipping audio generation")
+        return False
+
+    voice = get_voice(agent_id, voice_override=voice_override)
+    clean_text = strip_markdown(text)
+    payload = {
+        "model": settings.mistral_tts_model,
+        "input": clean_text,
+        "voice": voice,
+    }
+    headers = {
+        "Authorization": f"Bearer {settings.mistral_api_key}",
+        "Content-Type": "application/json",
+    }
+
+    try:
+        async with httpx.AsyncClient(timeout=120) as client:
+            resp = await client.post(MISTRAL_TTS_URL, json=payload, headers=headers)
+            default_voice = _get_default_voice()  # resolved on every call; only used by the 404 retry below
+            if resp.status_code == 404 and voice != default_voice:
+                # Voice was removed or renamed; retry once with the configured default
+                logger.warning(
+                    "Mistral TTS voice %r not found — retrying with default voice %r",
+                    voice, default_voice,
+                )
+                payload["voice"] = default_voice
+                resp = await client.post(MISTRAL_TTS_URL, json=payload, headers=headers)
+            if not resp.is_success:
+                logger.error("Mistral TTS API error %s: %s", resp.status_code, resp.text)
+            resp.raise_for_status()  # any remaining non-2xx raises here and is handled by the except below
+
+        # Mistral returns {"audio_data": "<base64-encoded mp3>"}; JSON is detected via content-type or a leading "{"
+        content_type = resp.headers.get("content-type", "")
+        if "json" in content_type or resp.content[:1] == b"{":
+            audio_bytes = base64.b64decode(resp.json()["audio_data"])
+        else:
+            audio_bytes = resp.content  # non-JSON body: written out as-is
+
+        output_path.parent.mkdir(parents=True, exist_ok=True)
+        output_path.write_bytes(audio_bytes)
+        logger.info("Audio saved to %s (%d bytes)", output_path, len(audio_bytes))
+        if settings.podcast_normalize_audio:
+            normalize_audio(output_path)
+        return True
+    except Exception as exc:
+        logger.error("Mistral TTS failed for agent %s: %s", agent_id, exc)
+        return False
+
+
diff --git a/src/podcast/openai_tts.py b/src/podcast/openai_tts.py
new file mode 100644
index 0000000..ac79045
--- /dev/null
+++ b/src/podcast/openai_tts.py
@@ -0,0 +1,91 @@
+"""OpenAI TTS client wrapper.
+
+Uses the OpenAI /v1/audio/speech endpoint.  Returns raw MP3 bytes.
+
+Set in .env:
+    PODCAST_TTS_BACKEND=openai
+    OPENAI_API_KEY=sk-...
+    OPENAI_TTS_MODEL=tts-1          # or tts-1-hd / gpt-4o-mini-tts
+    OPENAI_TTS_DEFAULT_VOICE=alloy  # alloy echo fable onyx nova shimmer
+"""
+
+import json
+import logging
+from pathlib import Path
+
+import httpx
+
+from src.config import get_settings
+from src.podcast.tts_utils import get_audio_duration_seconds, normalize_audio, strip_markdown
+
+logger = logging.getLogger(__name__)
+
+VOICES_FILE = Path("data/podcast_voices.json")  # relative path; read by get_voice() for per-agent voices
+OPENAI_TTS_URL = "https://api.openai.com/v1/audio/speech"  # endpoint POSTed to by generate_audio()
+
+__all__ = ["generate_audio", "get_audio_duration_seconds"]  # second name is re-exported from tts_utils
+
+
+def get_voice(agent_id: str, voice_override: str | None = None) -> str:
+    """Resolve the TTS voice to use for ``agent_id``.
+
+    Lookup order: voice_override (from DB preferences), then podcast_voices.json, then the env default.
+    """
+    if voice_override:
+        return voice_override
+    fallback_voice = get_settings().openai_tts_default_voice or "alloy"
+    if VOICES_FILE.exists():
+        try:
+            voice_map = json.loads(VOICES_FILE.read_text(encoding="utf-8"))
+            if agent_id in voice_map:
+                return voice_map[agent_id]
+        except Exception as err:
+            logger.warning("Failed to load podcast_voices.json: %s", err)
+    return fallback_voice
+
+
+async def generate_audio(
+    text: str, agent_id: str, output_path: Path, voice_override: str | None = None
+) -> bool:
+    """Generate TTS audio via OpenAI and save to output_path.
+
+    Returns True on success; False (after logging) if the API key is unset or any step raises.
+    """
+    settings = get_settings()
+    if not settings.openai_api_key:
+        logger.warning("OPENAI_API_KEY not set — skipping audio generation")
+        return False
+
+    voice = get_voice(agent_id, voice_override=voice_override)
+    clean_text = strip_markdown(text)
+    payload = {
+        "model": settings.openai_tts_model,
+        "input": clean_text,
+        "voice": voice,
+        "response_format": "mp3",
+    }
+    headers = {
+        "Authorization": f"Bearer {settings.openai_api_key}",
+        "Content-Type": "application/json",
+    }
+
+    logger.info(
+        "OpenAI TTS request (model=%s, voice=%s)", settings.openai_tts_model, voice
+    )
+
+    try:
+        async with httpx.AsyncClient(timeout=120) as client:
+            resp = await client.post(OPENAI_TTS_URL, json=payload, headers=headers)
+            if not resp.is_success:
+                logger.error("OpenAI TTS API error %s: %s", resp.status_code, resp.text)
+            resp.raise_for_status()  # non-2xx raises here and is handled by the except below
+
+        output_path.parent.mkdir(parents=True, exist_ok=True)
+        output_path.write_bytes(resp.content)  # response body is written to disk unmodified
+        logger.info("Audio saved to %s (%d bytes)", output_path, len(resp.content))
+        if settings.podcast_normalize_audio:
+            normalize_audio(output_path)
+        return True
+    except Exception as exc:
+        logger.error("OpenAI TTS failed for agent %s: %s", agent_id, exc)
+        return False
diff --git a/src/podcast/pipeline.py b/src/podcast/pipeline.py
new file mode 100644
index 0000000..01c0eee
--- /dev/null
+++ b/src/podcast/pipeline.py
@@ -0,0 +1,729 @@
+"""Per-agent podcast pipeline: search → select → summarize → TTS → Slack DM → DB."""
+
+import json
+import logging
+from datetime import date, datetime, timezone
+from pathlib import Path
+from typing import Any
+
+from src.config import get_settings
+
+logger = logging.getLogger(__name__)
+
+PROFILES_DIR = Path("profiles/public")  # relative path; holds one <agent_id>.md public profile per agent
+AUDIO_DIR = Path("data/podcast_audio")  # relative path; root under which generated .mp3 files are written
+
+
+async def _flush_podcast_llm_logs(buffer: list[dict], db_session) -> None:
+    """Add buffered LLM call log entries to db_session as LlmCallLog rows (simulation_run_id left NULL)."""
+    if not buffer:
+        return
+    from src.models.agent_activity import LlmCallLog
+
+    try:
+        for entry in buffer:
+            record = LlmCallLog(
+                simulation_run_id=None,
+                agent_id=entry.get("agent_id", "unknown"),
+                phase=entry.get("phase", "unknown"),
+                channel=None,
+                model=entry.get("model", ""),
+                system_prompt=entry.get("system_prompt", ""),
+                messages_json=entry.get("messages", []),
+                response_text=entry.get("response_text", ""),
+                input_tokens=entry.get("input_tokens", 0),
+                output_tokens=entry.get("output_tokens", 0),
+                latency_ms=entry.get("latency_ms", 0.0),
+                created_at=entry.get("completed_at"),
+            )
+            db_session.add(record)  # staged on the session only; no flush or commit is issued here
+    except Exception as exc:
+        logger.warning("Failed to write podcast LLM call logs: %s", exc)
+
+
+def _load_public_profile(agent_id: str) -> str:
+    """Return the contents of PROFILES_DIR/<agent_id>.md, or "" when that file does not exist."""
+    profile_path = PROFILES_DIR / f"{agent_id}.md"
+    if not profile_path.exists():
+        return ""
+    return profile_path.read_text(encoding="utf-8")
+
+
+async def _load_podcast_preferences(agent_id: str) -> str:
+    """Return the "Podcast Preferences" section of the agent's newest private ProfileRevision, or "" if unavailable."""
+    try:
+        from sqlalchemy import desc, select
+
+        from src.database import get_session_factory
+        from src.models.agent_registry import AgentRegistry
+        from src.models.profile_revision import ProfileRevision
+
+        session_factory = get_session_factory()  # opens its own session rather than taking one from the caller
+        async with session_factory() as db:
+            reg_result = await db.execute(
+                select(AgentRegistry.id).where(AgentRegistry.agent_id == agent_id)
+            )
+            reg_row = reg_result.first()
+            if not reg_row:
+                return ""  # agent_id is not present in the registry
+
+            rev_result = await db.execute(
+                select(ProfileRevision.content)
+                .where(
+                    ProfileRevision.agent_registry_id == reg_row[0],
+                    ProfileRevision.profile_type == "private",
+                )
+                .order_by(desc(ProfileRevision.created_at))
+                .limit(1)
+            )
+            rev_row = rev_result.first()
+            if not rev_row:
+                return ""  # the agent has no private revision yet
+
+            return _extract_section_text(rev_row[0], "Podcast Preferences")
+    except Exception as exc:
+        logger.warning("Could not load podcast preferences for %s: %s", agent_id, exc)
+        return ""
+
+
+async def _load_structured_preferences(agent_id: str | None = None, user_id=None, db_session=None):
+    """Load the PodcastPreferences row for agent_id (takes precedence) or user_id; None if absent or on any error."""
+    if not agent_id and not user_id:
+        return None
+    try:
+        from sqlalchemy import select
+
+        from src.models.podcast_preferences import PodcastPreferences
+
+        def _build_query():
+            if agent_id:  # agent_id wins when both keys are supplied
+                return select(PodcastPreferences).where(PodcastPreferences.agent_id == agent_id)
+            return select(PodcastPreferences).where(PodcastPreferences.user_id == user_id)
+
+        if db_session is not None:
+            result = await db_session.execute(_build_query())
+            return result.scalar_one_or_none()
+
+        from src.database import get_session_factory  # no session supplied: open a short-lived one
+        session_factory = get_session_factory()
+        async with session_factory() as db:
+            result = await db.execute(_build_query())
+            return result.scalar_one_or_none()
+    except Exception as exc:
+        key = agent_id or str(user_id)
+        logger.warning("Could not load structured podcast preferences for %s: %s", key, exc)
+        return None
+
+
+def _format_candidates_for_prompt(records: list[dict[str, Any]]) -> str:
+    """Format candidate records as a numbered list; missing, None, or empty fields get placeholder text."""
+    lines = []
+    for i, rec in enumerate(records, 1):
+        title = rec.get("title") or "No title"
+        abstract = (rec.get("abstract") or "No abstract")[:600]  # `or` guards a None value; capped at 600 chars
+        journal = rec.get("journal") or "Unknown journal"
+        year = rec.get("year") or "Unknown year"
+        lines.append(f"{i}. [{journal}, {year}] {title}\n   {abstract}")
+    return "\n\n".join(lines)
+
+
+async def _select_article(
+    profile_text: str,
+    candidates: list[dict[str, Any]],
+    agent_id: str,
+    preferences_text: str = "",
+) -> tuple[dict[str, Any], str] | tuple[None, str]:
+    """Ask the LLM (settings.llm_agent_model_sonnet) to pick the most relevant candidate.
+
+    Returns (selected_record, justification), or (None, reason) if nothing is chosen, the index is invalid, or the call fails.
+    """
+    from src.services.llm import generate_agent_response
+
+    settings = get_settings()
+
+    prompt_path = Path("prompts/podcast-select.md")
+    template = prompt_path.read_text(encoding="utf-8")  # outside the try: a missing prompt file propagates to the caller
+    candidates_text = _format_candidates_for_prompt(candidates)
+    prompt = (
+        template
+        .replace("{profile}", profile_text)
+        .replace("{candidates}", candidates_text)
+        .replace("{preferences}", preferences_text or "No specific preferences set.")
+    )
+
+    try:
+        response = await generate_agent_response(
+            system_prompt=prompt,
+            messages=[{"role": "user", "content": "Select the most relevant article."}],
+            model=settings.llm_agent_model_sonnet,
+            max_tokens=300,
+            log_meta={"agent_id": agent_id, "phase": "podcast_select"},
+        )
+
+        # Extract JSON: take the span from the first "{" to the last "}" so surrounding prose is tolerated
+        text = response.strip()
+        start = text.find("{")
+        end = text.rfind("}") + 1
+        if start >= 0 and end > start:
+            data = json.loads(text[start:end])
+        else:
+            raise ValueError("No JSON object found in response")
+
+        idx = data.get("index")
+        justification = data.get("justification", "")
+
+        if idx is None:  # a missing/null index is treated as "no relevant article"
+            logger.info("Agent %s: no relevant article found (%s)", agent_id, justification)
+            return None, justification
+
+        idx = int(idx) - 1  # convert 1-based to 0-based
+        if 0 <= idx < len(candidates):
+            return candidates[idx], justification
+        else:
+            logger.warning("Agent %s: LLM returned out-of-range index %d", agent_id, idx + 1)
+            return None, "Index out of range"
+
+    except Exception as exc:
+        logger.error("Article selection failed for agent %s: %s", agent_id, exc)
+        return None, str(exc)
+
+
+async def _generate_summary(
+    profile_text: str,
+    record: dict[str, Any],
+    full_text: str | None,
+    agent_id: str,
+    preferences_text: str = "",
+) -> str | None:
+    """Generate the text summary with the Opus model; None title/abstract/pmid count as empty. Returns None on LLM failure."""
+    from src.services.llm import generate_agent_response
+
+    settings = get_settings()
+
+    prompt_path = Path("prompts/podcast-summarize.md")
+    template = prompt_path.read_text(encoding="utf-8")
+
+    # Build paper section
+    authors_list = record.get("authors") or []
+    if not authors_list:
+        authors_str = "Authors not available"
+    elif len(authors_list) > 3:
+        authors_str = ", ".join(authors_list[:3]) + " et al."
+    else:
+        authors_str = ", ".join(authors_list)
+
+    pmid = record.get("pmid") or ""
+    # Preprint records carry a canonical URL; PubMed records use the standard URL
+    paper_url = record.get("url") or f"https://pubmed.ncbi.nlm.nih.gov/{pmid}/"
+
+    paper_section = f"""Title: {record.get('title') or ''}
+Authors: {authors_str}
+Journal: {record.get('journal') or 'Unknown'}
+Year: {record.get('year') or 'Unknown'}
+URL: {paper_url}
+
+Abstract:
+{record.get('abstract') or ''}"""
+
+    if full_text:
+        paper_section += f"\n\nFull text excerpt:\n{full_text[:3000]}"  # excerpt capped at 3000 chars
+
+    today_str = datetime.now(timezone.utc).strftime("%B %d, %Y")
+
+    prompt = (
+        template
+        .replace("{profile}", profile_text)
+        .replace("{paper}", paper_section)
+        .replace("{date}", today_str)
+        .replace("{paper_title}", record.get("title") or "")  # str.replace() rejects None, so coerce to ""
+        .replace("{authors}", authors_str)
+        .replace("{journal}", record.get("journal") or "Unknown")
+        .replace("{year}", str(record.get("year") or ""))
+        .replace("{paper_url}", paper_url)
+        .replace("{preferences}", preferences_text or "No specific preferences set.")
+    )
+
+    try:
+        response = await generate_agent_response(
+            system_prompt=prompt,
+            messages=[{"role": "user", "content": "Write the research brief."}],
+            model=settings.llm_agent_model_opus,
+            max_tokens=600,
+            log_meta={"agent_id": agent_id, "phase": "podcast_summarize"},
+        )
+        return response.strip()
+    except Exception as exc:
+        logger.error("Summary generation failed for agent %s: %s", agent_id, exc)
+        return None
+
+
+async def _try_fetch_full_text(pmid: str) -> str | None:
+    """Return the "methods" text that fetch_full_text() yields for a PubMed ID; None on failure or for non-PubMed IDs."""
+    if not pmid.isdigit():  # preprint IDs are prefixed (e.g. "biorxiv:...", "arxiv:...") — PMC doesn't have them
+        return None
+    try:
+        from src.services.pubmed import fetch_full_text
+        result = await fetch_full_text(pmid)
+        if "error" in result:
+            return None
+        return result.get("methods")
+    except Exception as exc:
+        logger.debug("Full-text fetch failed for %s (continuing without it): %s", pmid, exc)
+        return None
+
+
+async def _deliver_slack_dm(
+    agent_id: str,
+    bot_token: str,
+    slack_user_id: str,
+    summary_text: str,
+    rss_url: str,
+) -> bool:
+    """Send the text summary as a Slack DM from the agent bot to the PI; True if posted, False if skipped or failed."""
+    if not bot_token or bot_token.startswith("xoxb-placeholder"):
+        logger.info("Agent %s: no valid Slack token, skipping DM delivery", agent_id)
+        return False
+    if not slack_user_id:
+        logger.info("Agent %s: no slack_user_id configured, skipping DM delivery", agent_id)
+        return False
+
+    try:
+        import asyncio
+        from slack_sdk import WebClient
+        client = WebClient(token=bot_token)
+        # WebClient is synchronous: run each call in a worker thread so the event loop is not blocked
+        dm_resp = await asyncio.to_thread(client.conversations_open, users=[slack_user_id])
+        channel_id = dm_resp["channel"]["id"]
+
+        # Append RSS link
+        full_message = summary_text
+        if rss_url:
+            full_message += f"\n\n_Listen to the audio version: {rss_url}_"
+
+        await asyncio.to_thread(client.chat_postMessage, channel=channel_id, text=full_message)
+        logger.info("Agent %s: Slack DM delivered to %s", agent_id, slack_user_id)
+        return True
+    except Exception as exc:
+        logger.error("Agent %s: Slack DM failed: %s", agent_id, exc)
+        return False
+
+
+async def run_pipeline_for_agent(
+    agent_id: str,
+    bot_name: str,
+    pi_name: str,
+    bot_token: str,
+    slack_user_id: str | None,
+    db_session,
+) -> bool:
+    """Run the full podcast pipeline for one agent.
+
+    Returns True if an episode was produced and recorded; False when a stage yields nothing (profile, queries, candidates, selection, summary, audio).
+    """
+    from src.models.podcast import PodcastEpisode
+    from src.podcast.pubmed_search import build_queries, fetch_candidates
+    from src.podcast.tts_utils import get_audio_duration_seconds
+    from src.podcast.state import get_delivered_pmids, record_delivery
+
+    settings = get_settings()
+    today = date.today()  # NOTE(review): local-timezone date, while the scheduler window is given in UTC — confirm they agree
+
+    logger.info("Starting podcast pipeline for agent: %s (%s)", agent_id, pi_name)
+
+    # Step 1: Load profiles
+    profile_text = _load_public_profile(agent_id)
+    if not profile_text:
+        # Fallback: agent may have a linked user with a DB ResearcherProfile
+        from sqlalchemy import select as _select
+        from src.models.agent_registry import AgentRegistry
+        from src.models.profile import ResearcherProfile
+        from src.models.user import User
+
+        agent_row = (await db_session.execute(
+            _select(AgentRegistry).where(AgentRegistry.agent_id == agent_id)
+        )).scalar_one_or_none()
+
+        if agent_row and agent_row.user_id:
+            user_row = (await db_session.execute(
+                _select(User).where(User.id == agent_row.user_id)
+            )).scalar_one_or_none()
+            profile_row = (await db_session.execute(
+                _select(ResearcherProfile).where(ResearcherProfile.user_id == agent_row.user_id)
+            )).scalar_one_or_none()
+
+            if user_row and profile_row and profile_row.research_summary:
+                profile_text = _build_profile_text_from_db(user_row, profile_row)
+                logger.info("Agent %s: no markdown profile, using DB profile for user %s", agent_id, agent_row.user_id)
+
+        if not profile_text:
+            logger.warning("Agent %s: no public profile found, skipping", agent_id)
+            return False
+
+    preferences_text = await _load_podcast_preferences(agent_id)
+    if preferences_text:
+        logger.info("Agent %s: loaded podcast preferences (%d chars)", agent_id, len(preferences_text))
+
+    # Load structured preferences (voice, keywords, journals) from DB
+    prefs = await _load_structured_preferences(agent_id=agent_id, db_session=db_session)
+    if prefs:
+        logger.info(
+            "Agent %s: structured preferences — voice=%s, keywords=%d, preferred_journals=%d",
+            agent_id, prefs.voice_id, len(prefs.extra_keywords or []), len(prefs.preferred_journals or []),
+        )
+
+    # Build a minimal profile dict from markdown for query building
+    profile_dict = _parse_profile_markdown(profile_text)
+
+    # Step 2: Build queries and fetch candidates
+    queries = build_queries(profile_dict)
+    if not queries:
+        logger.warning("Agent %s: could not build search queries", agent_id)
+        return False
+
+    # Inject extra keywords from structured preferences as additional quoted queries
+    if prefs and prefs.extra_keywords:
+        extra_terms = [f'"{kw}"' for kw in prefs.extra_keywords[:20] if kw.strip()]
+        if extra_terms:
+            queries.append(" OR ".join(extra_terms))
+            logger.info("Agent %s: injected %d extra keyword terms", agent_id, len(extra_terms))
+
+    already_delivered = get_delivered_pmids(agent_id)
+    candidates = await fetch_candidates(
+        queries,
+        already_delivered=already_delivered,
+        days=settings.podcast_search_window_days,
+        max_total=settings.podcast_max_candidates,
+    )
+
+    if not candidates:
+        logger.info("Agent %s: no new candidate articles found", agent_id)
+        return False
+
+    # Build journal context to append to preferences text for selection prompt
+    journal_context = ""
+    if prefs and prefs.preferred_journals:
+        journal_context += f"\nPreferred sources: {', '.join(prefs.preferred_journals)}. Give these extra weight when relevance is comparable."
+    if prefs and prefs.deprioritized_journals:
+        journal_context += f"\nDeprioritized sources: {', '.join(prefs.deprioritized_journals)}. Avoid unless exceptionally relevant."
+    combined_preferences = (preferences_text or "") + journal_context
+
+    # Step 3: LLM article selection
+    from src.services.llm import set_call_log_callback
+
+    _llm_log_buffer: list[dict] = []
+    set_call_log_callback(_llm_log_buffer.append)
+    try:
+        selected, justification = await _select_article(profile_text, candidates, agent_id, combined_preferences)
+        if selected is None:
+            logger.info("Agent %s: no article selected", agent_id)
+            return False
+
+        pmid = selected.get("pmid", "")
+        paper_url = selected.get("url") or f"https://pubmed.ncbi.nlm.nih.gov/{pmid}/"
+        logger.info("Agent %s: selected PMID %s", agent_id, pmid)
+
+        # Step 4: Try to fetch full text
+        full_text = await _try_fetch_full_text(pmid)
+
+        # Step 5: Generate text summary
+        summary = await _generate_summary(profile_text, selected, full_text, agent_id, combined_preferences)
+    finally:
+        # Runs on every exit path (including the early return above): detach the callback, then stage the logs
+        set_call_log_callback(None)
+        await _flush_podcast_llm_logs(_llm_log_buffer, db_session)
+
+    if not summary:
+        logger.error("Agent %s: summary generation failed", agent_id)
+        return False
+
+    # Step 6: Generate audio (backend selected by PODCAST_TTS_BACKEND)
+    audio_path = AUDIO_DIR / agent_id / f"{today.isoformat()}.mp3"
+    voice_override = prefs.voice_id if prefs else None
+    if settings.podcast_tts_backend == "local":
+        from src.podcast.local_tts import generate_audio
+        logger.info("Agent %s: using local vLLM-Omni TTS backend", agent_id)
+    elif settings.podcast_tts_backend == "openai":
+        from src.podcast.openai_tts import generate_audio
+        logger.info("Agent %s: using OpenAI TTS backend", agent_id)
+    else:
+        from src.podcast.mistral_tts import generate_audio
+        logger.info("Agent %s: using Mistral AI TTS backend", agent_id)
+    audio_ok = await generate_audio(summary, agent_id, audio_path, voice_override=voice_override)
+    if not audio_ok:
+        logger.error("Agent %s: TTS failed — skipping episode", agent_id)
+        return False
+    audio_file_path = str(audio_path)
+    audio_duration = get_audio_duration_seconds(audio_path)
+
+    # Step 7: Build RSS URL for DM
+    base_url = settings.podcast_base_url or settings.base_url
+    rss_url = f"{base_url}/podcast/{agent_id}/feed.xml"
+
+    # Step 8: Deliver Slack DM
+    slack_ok = await _deliver_slack_dm(
+        agent_id=agent_id,
+        bot_token=bot_token,
+        slack_user_id=slack_user_id or "",
+        summary_text=summary,
+        rss_url=rss_url,
+    )
+
+    # Extract metadata from selected record
+    authors_list = selected.get("authors") or []
+    if len(authors_list) > 3:
+        authors_str = ", ".join(authors_list[:3]) + " et al."
+    else:
+        authors_str = ", ".join(authors_list) if authors_list else "Unknown"
+
+    # Step 9: Persist to DB
+    episode = PodcastEpisode(
+        agent_id=agent_id,
+        episode_date=today,
+        pmid=pmid,
+        paper_title=selected.get("title") or "",
+        paper_authors=authors_str,
+        paper_journal=selected.get("journal") or "",
+        paper_year=selected.get("year") or 0,
+        paper_url=paper_url,
+        text_summary=summary,
+        audio_file_path=audio_file_path,
+        audio_duration_seconds=audio_duration,
+        slack_delivered=slack_ok,
+        selection_justification=justification,
+    )
+    db_session.add(episode)
+    await db_session.flush()
+
+    # Step 10: Update state (non-fatal — DB record already flushed)
+    try:
+        record_delivery(agent_id, pmid)
+    except Exception as exc:
+        logger.warning("Agent %s: state.py record_delivery failed (non-fatal): %s", agent_id, exc)
+
+    logger.info(
+        "Agent %s: episode complete (audio=%s, slack=%s)", agent_id, audio_ok, slack_ok
+    )
+    return True
+
+
+async def run_podcast_for_user(
+    user_id,
+    db_session,
+) -> bool:
+    """Run the full podcast pipeline for a plain ORCID user (no agent required).
+
+    Loads the user's ResearcherProfile from the DB, builds search queries from
+    structured profile fields, selects and summarises an article, generates audio,
+    and persists a PodcastEpisode keyed by user_id.
+
+    Returns True if an episode was produced and recorded.
+    """
+    import uuid as _uuid  # NOTE(review): not referenced anywhere in this function — candidate for removal
+
+    from sqlalchemy import select as _select
+
+    from src.models.podcast import PodcastEpisode
+    from src.models.profile import ResearcherProfile
+    from src.models.user import User
+    from src.podcast.pubmed_search import build_queries, fetch_candidates
+    from src.podcast.state import get_delivered_pmids_for_user, record_delivery_for_user
+    from src.podcast.tts_utils import get_audio_duration_seconds
+
+    settings = get_settings()
+    today = date.today()  # NOTE(review): local-timezone date, while the scheduler window is given in UTC — confirm they agree
+    user_id_str = str(user_id)
+
+    # Load user
+    user_result = await db_session.execute(
+        _select(User).where(User.id == user_id)
+    )
+    user = user_result.scalar_one_or_none()
+    if not user:
+        logger.warning("run_podcast_for_user: user %s not found", user_id_str)
+        return False
+
+    logger.info("Starting podcast pipeline for user: %s (%s)", user_id_str, user.name)
+
+    # Load ResearcherProfile
+    profile_result = await db_session.execute(
+        _select(ResearcherProfile).where(ResearcherProfile.user_id == user_id)
+    )
+    profile = profile_result.scalar_one_or_none()
+    if not profile or not profile.research_summary:
+        logger.warning("User %s: no completed profile found, skipping", user_id_str)
+        return False
+
+    # Build profile text from structured DB fields (no disk file needed)
+    profile_text = _build_profile_text_from_db(user, profile)
+
+    # Load structured preferences keyed by user_id
+    prefs = await _load_structured_preferences(user_id=user_id, db_session=db_session)
+    if prefs:
+        logger.info(
+            "User %s: structured preferences — voice=%s, keywords=%d",
+            user_id_str, prefs.voice_id, len(prefs.extra_keywords or []),
+        )
+
+    # Build profile dict for query building
+    profile_dict = {
+        "research_summary": profile.research_summary or "",
+        "disease_areas": profile.disease_areas or [],
+        "techniques": profile.techniques or [],
+        "experimental_models": profile.experimental_models or [],
+        "keywords": profile.keywords or [],
+    }
+
+    queries = build_queries(profile_dict)
+    if not queries:
+        logger.warning("User %s: could not build search queries", user_id_str)
+        return False
+
+    if prefs and prefs.extra_keywords:
+        extra_terms = [f'"{kw}"' for kw in prefs.extra_keywords[:20] if kw.strip()]
+        if extra_terms:
+            queries.append(" OR ".join(extra_terms))
+
+    already_delivered = get_delivered_pmids_for_user(user_id_str)
+    candidates = await fetch_candidates(
+        queries,
+        already_delivered=already_delivered,
+        days=settings.podcast_search_window_days,
+        max_total=settings.podcast_max_candidates,
+    )
+
+    if not candidates:
+        logger.info("User %s: no new candidate articles found", user_id_str)
+        return False
+
+    # Build journal context from preferences
+    journal_context = ""
+    if prefs and prefs.preferred_journals:
+        journal_context += f"\nPreferred sources: {', '.join(prefs.preferred_journals)}. Give these extra weight when relevance is comparable."
+    if prefs and prefs.deprioritized_journals:
+        journal_context += f"\nDeprioritized sources: {', '.join(prefs.deprioritized_journals)}. Avoid unless exceptionally relevant."
+    combined_preferences = journal_context
+
+    # Article selection
+    from src.services.llm import set_call_log_callback
+
+    _llm_log_buffer: list[dict] = []
+    set_call_log_callback(_llm_log_buffer.append)
+    try:
+        selected, justification = await _select_article(profile_text, candidates, user_id_str, combined_preferences)
+        if selected is None:
+            logger.info("User %s: no article selected", user_id_str)
+            return False
+
+        pmid = selected.get("pmid", "")
+        paper_url = selected.get("url") or f"https://pubmed.ncbi.nlm.nih.gov/{pmid}/"
+        logger.info("User %s: selected PMID %s", user_id_str, pmid)
+
+        full_text = await _try_fetch_full_text(pmid)
+
+        summary = await _generate_summary(profile_text, selected, full_text, user_id_str, combined_preferences)
+    finally:
+        set_call_log_callback(None)
+        await _flush_podcast_llm_logs(_llm_log_buffer, db_session)
+
+    if not summary:
+        logger.error("User %s: summary generation failed", user_id_str)
+        return False
+
+    # Generate audio — stored under data/podcast_audio/users/{user_id}/
+    audio_path = AUDIO_DIR / "users" / user_id_str / f"{today.isoformat()}.mp3"
+    voice_override = prefs.voice_id if prefs else None
+    if settings.podcast_tts_backend == "local":
+        from src.podcast.local_tts import generate_audio
+    elif settings.podcast_tts_backend == "openai":
+        from src.podcast.openai_tts import generate_audio
+    else:
+        from src.podcast.mistral_tts import generate_audio
+    audio_ok = await generate_audio(summary, user_id_str, audio_path, voice_override=voice_override)
+    if not audio_ok:
+        logger.error("User %s: TTS failed — skipping episode", user_id_str)
+        return False
+    audio_file_path = str(audio_path)
+    audio_duration = get_audio_duration_seconds(audio_path)
+
+    # Extract metadata
+    authors_list = selected.get("authors") or []
+    if len(authors_list) > 3:
+        authors_str = ", ".join(authors_list[:3]) + " et al."
+    else:
+        authors_str = ", ".join(authors_list) if authors_list else "Unknown"
+
+    # Persist episode keyed by user_id (agent_id left NULL)
+    episode = PodcastEpisode(
+        user_id=user_id,
+        agent_id=None,
+        episode_date=today,
+        pmid=pmid,
+        paper_title=selected.get("title") or "",
+        paper_authors=authors_str,
+        paper_journal=selected.get("journal") or "",
+        paper_year=selected.get("year") or 0,
+        paper_url=paper_url,
+        text_summary=summary,
+        audio_file_path=audio_file_path,
+        audio_duration_seconds=audio_duration,
+        slack_delivered=False,
+        selection_justification=justification,
+    )
+    db_session.add(episode)
+    await db_session.flush()
+
+    try:
+        record_delivery_for_user(user_id_str, pmid)
+    except Exception as exc:
+        logger.warning("User %s: state.py record_delivery failed (non-fatal): %s", user_id_str, exc)
+
+    logger.info(
+        "User %s: episode complete (audio=%s)", user_id_str, audio_ok
+    )
+    return True
+
+
+def _build_profile_text_from_db(user, profile) -> str:
+    """Render a user's DB-backed profile as markdown-style text for use in LLM prompts."""
+    parts = [f"# {user.name}"]
+    for label, value in (("Institution", user.institution), ("Department", user.department)):
+        if value:
+            parts.append(f"{label}: {value}")
+    if profile.research_summary:
+        parts.append(f"\n## Research Summary\n{profile.research_summary}")
+    bullet_sections = (
+        ("Disease Areas", profile.disease_areas),
+        ("Key Methods and Technologies", profile.techniques),
+        ("Model Systems", profile.experimental_models),
+        ("Keywords", profile.keywords),
+    )
+    for heading, values in bullet_sections:
+        if values:
+            parts.append(f"\n## {heading}\n" + "\n".join(f"- {v}" for v in values))
+    return "\n".join(parts)
+
+
+def _parse_profile_markdown(text: str) -> dict[str, Any]:
+    """Pull the list sections and the research summary out of public profile markdown."""
+    from src.agent.grantbot import _extract_list_section
+    list_sections = (
+        ("disease_areas", "Disease Areas"), ("techniques", "Key Methods and Technologies"),
+        ("experimental_models", "Model Systems"), ("keywords", "Keywords"),
+    )
+    fields: dict[str, Any] = {key: _extract_list_section(text, title) for key, title in list_sections}
+    fields["research_summary"] = _extract_section_text(text, "Research Summary")
+    return fields
+
+
+def _extract_section_text(text: str, section_name: str) -> str:
+    """Return the text under the matching ``##`` heading, collapsed onto one line."""
+    body: list[str] = []
+    capturing = False
+    for raw in text.splitlines():
+        is_heading = raw.startswith("##")
+        if is_heading and section_name.lower() in raw.lower():
+            capturing = True  # the heading line itself is not part of the body
+        elif capturing and is_heading:
+            break  # the next heading ends the section
+        elif capturing and raw.strip():
+            body.append(raw.strip())
+    return " ".join(body)
diff --git a/src/podcast/preprint_search.py b/src/podcast/preprint_search.py
new file mode 100644
index 0000000..6b109cb
--- /dev/null
+++ b/src/podcast/preprint_search.py
@@ -0,0 +1,290 @@
+"""Preprint server search for the podcast pipeline.
+
+Supports bioRxiv, medRxiv (via biorxiv.org content API) and arXiv.
+
+Records returned use the same schema as PubMed records but with:
+  - pmid:    prefixed ID  e.g. "biorxiv:2024.04.01.123456", "arxiv:2401.12345"
+  - url:     canonical preprint URL
+  - journal: "<Server> (preprint)"
+  - source:  "biorxiv" | "medrxiv" | "arxiv"
+"""
+
+import logging
+import re
+import xml.etree.ElementTree as ET
+from datetime import datetime, timedelta, timezone
+from typing import Any
+
+import httpx
+
+logger = logging.getLogger(__name__)
+
+BIORXIV_API = "https://api.biorxiv.org/details"
+ARXIV_API = "https://export.arxiv.org/api/query"
+ARXIV_NS = "http://www.w3.org/2005/Atom"
+
+# arXiv categories relevant to biomedical / computational biology research
+ARXIV_CATEGORIES = "cat:q-bio.BM OR cat:q-bio.GN OR cat:q-bio.MN OR cat:q-bio.QM OR cat:cs.LG"
+
+
+# ---------------------------------------------------------------------------
+# Shared helpers
+# ---------------------------------------------------------------------------
+
+def _extract_search_terms(queries: list[str]) -> list[str]:
+    """Return up to 12 unique search terms pulled from PubMed-style query strings.
+
+    Quoted phrases are preferred; if no query contains one, fall back to bare words
+    longer than four characters, with quotes and grouping parentheses stripped.
+    """
+    # dict keys give order-preserving de-duplication
+    quoted = dict.fromkeys(m for q in queries for m in re.findall(r'"([^"]+)"', q))
+    if quoted:
+        return list(quoted)[:12]
+    words = dict.fromkeys(
+        w for q in queries for w in (tok.strip("\"'()") for tok in q.split())
+        if len(w) > 4 and w.upper() not in ("AND", "OR", "NOT")
+    )
+    return list(words)[:12]
+
+
+def _score_record(title: str, abstract: str, terms: list[str]) -> int:
+    """Return how many terms occur, case-insensitively, in the combined title and abstract."""
+    haystack = f"{title} {abstract}".lower()
+    return len([term for term in terms if term.lower() in haystack])
+
+
+def _date_range(days: int) -> tuple[str, str]:
+    """Return (start, end) as ``YYYY-MM-DD`` strings: UTC today minus *days*, and UTC today."""
+    end = datetime.now(timezone.utc)
+    return (end - timedelta(days=days)).strftime("%Y-%m-%d"), end.strftime("%Y-%m-%d")
+
+
+# ---------------------------------------------------------------------------
+# bioRxiv / medRxiv
+# ---------------------------------------------------------------------------
+
+async def _fetch_biorxiv_server(
+    server: str,
+    queries: list[str],
+    days: int,
+    max_results: int,
+) -> list[dict[str, Any]]:
+    """Fetch recent preprints from bioRxiv or medRxiv; return the max_results best-scoring matches."""
+    terms = _extract_search_terms(queries)
+    if not terms:
+        return []
+
+    start_date, end_date = _date_range(days)
+    # NOTE(review): only cursor 0 is requested. The API appears to page its results,
+    # so preprints beyond the first page would never be scored — confirm and paginate.
+    url = f"{BIORXIV_API}/{server}/{start_date}/{end_date}/0/json"
+
+    try:
+        async with httpx.AsyncClient(timeout=30) as client:
+            resp = await client.get(url)
+            resp.raise_for_status()
+            data = resp.json()
+    except Exception as exc:
+        logger.warning("%s API request failed: %s", server, exc)
+        return []
+
+    collection = data.get("collection") or []
+    if not isinstance(collection, list):
+        return []
+
+    cutoff = datetime.now(timezone.utc) - timedelta(days=days)
+    scored: list[tuple[int, dict[str, Any]]] = []
+    for item in collection:
+        title = item.get("title") or ""
+        abstract = item.get("abstract") or ""
+        doi = item.get("doi") or ""
+        # No abstract: nothing to score. No DOI: the ID and URL built below would be
+        # the bare "<server>:" / ".../content/v1" and collide across such records.
+        if not abstract or not doi:
+            continue
+
+        # The API's date-range filter includes revised preprints; drop items dated before the window.
+        date_str = item.get("date") or ""
+        if date_str:
+            try:
+                item_date = datetime.strptime(date_str, "%Y-%m-%d").replace(tzinfo=timezone.utc)
+                if item_date < cutoff:
+                    continue
+            except ValueError:
+                pass  # unparseable date: keep the record rather than guess
+
+        score = _score_record(title, abstract, terms)
+        if score == 0:
+            continue
+
+        # Authors stored as semicolon-separated string
+        authors_raw = item.get("authors") or ""
+        authors_list = [a.strip() for a in authors_raw.split(";") if a.strip()]
+
+        year_str = date_str[:4]
+        year = int(year_str) if year_str.isdigit() else datetime.now(timezone.utc).year
+
+        scored.append((score, {
+            "pmid": f"{server}:{doi.removeprefix('10.1101/')}",
+            "url": f"https://www.{server}.org/content/{doi}v1",
+            "title": title,
+            "abstract": abstract,
+            "journal": f"{server.capitalize()} (preprint)",
+            "year": year,
+            "authors": authors_list,
+            "pub_types": ["Preprint"],
+            "source": server,
+        }))
+
+    scored.sort(key=lambda x: x[0], reverse=True)
+    return [r for _, r in scored[:max_results]]
+
+
+# ---------------------------------------------------------------------------
+# arXiv
+# ---------------------------------------------------------------------------
+
+async def _fetch_arxiv(
+    queries: list[str],
+    days: int,
+    max_results: int,
+) -> list[dict[str, Any]]:
+    """Fetch recent arXiv preprints matching researcher queries; [] on request or XML-parse failure."""
+    terms = _extract_search_terms(queries)
+    if not terms:
+        return []
+
+    # Build arXiv search: keyword terms in abstract + category filter + date range
+    # NOTE(review): arXiv's API manual documents submittedDate bounds as YYYYMMDDHHMM; this
+    # sends 14 digits with an open end — confirm it is honoured (the cutoff below is the backstop).
+    term_clause = " OR ".join(f'abs:"{t}"' for t in terms[:6])
+    start_date, _ = _date_range(days)
+    arxiv_date = start_date.replace("-", "") + "000000"
+    search_query = (
+        f"({term_clause}) AND ({ARXIV_CATEGORIES})"
+        f" AND submittedDate:[{arxiv_date} TO *]"
+    )
+
+    params = {
+        "search_query": search_query,
+        "start": "0",
+        "max_results": str(max_results * 2),
+        "sortBy": "submittedDate",
+        "sortOrder": "descending",
+    }
+
+    try:
+        async with httpx.AsyncClient(timeout=30) as client:
+            resp = await client.get(ARXIV_API, params=params)
+            resp.raise_for_status()
+            xml_text = resp.text
+    except Exception as exc:
+        logger.warning("arXiv API request failed: %s", exc)
+        return []
+
+    try:
+        root = ET.fromstring(xml_text)
+    except ET.ParseError as exc:
+        logger.warning("arXiv XML parse error: %s", exc)
+        return []
+
+    records: list[dict[str, Any]] = []
+    cutoff = datetime.now(timezone.utc) - timedelta(days=days)
+
+    for entry in root.findall(f"{{{ARXIV_NS}}}entry"):
+        title_el = entry.find(f"{{{ARXIV_NS}}}title")
+        summary_el = entry.find(f"{{{ARXIV_NS}}}summary")
+        id_el = entry.find(f"{{{ARXIV_NS}}}id")
+        published_el = entry.find(f"{{{ARXIV_NS}}}published")
+        title = (title_el.text or "").strip().replace("\n", " ") if title_el is not None else ""
+        abstract = (summary_el.text or "").strip() if summary_el is not None else ""
+        arxiv_url = (id_el.text or "").strip() if id_el is not None else ""
+        published_str = (published_el.text or "").strip() if published_el is not None else ""
+
+        if not abstract or not arxiv_url:
+            continue
+
+        # Parse submission date and apply cutoff
+        try:
+            pub_dt = datetime.fromisoformat(published_str.replace("Z", "+00:00"))
+            if pub_dt < cutoff:
+                continue
+            year = pub_dt.year
+        except ValueError:
+            year = datetime.now(timezone.utc).year
+
+        # Extract arxiv ID from URL like http://arxiv.org/abs/2401.12345v1. Strip only a
+        # trailing version ("v1") so an ID that itself contains a "v" is not truncated.
+        arxiv_id = re.sub(r"v\d+$", "", arxiv_url.split("/abs/")[-1])
+        authors_list = [
+            (n_el.text or "").strip()
+            for author in entry.findall(f"{{{ARXIV_NS}}}author")
+            for n_el in [author.find(f"{{{ARXIV_NS}}}name")]
+            if n_el is not None and n_el.text
+        ]
+
+        records.append({
+            "pmid": f"arxiv:{arxiv_id}",
+            "url": f"https://arxiv.org/abs/{arxiv_id}",
+            "title": title,
+            "abstract": abstract,
+            "journal": "arXiv (preprint)",
+            "year": year,
+            "authors": authors_list,
+            "pub_types": ["Preprint"],
+            "source": "arxiv",
+        })
+        if len(records) >= max_results:
+            break
+
+    return records
+
+
+# ---------------------------------------------------------------------------
+# Public interface
+# ---------------------------------------------------------------------------
+
+async def fetch_preprint_candidates(
+    queries: list[str],
+    already_delivered: set[str],
+    days: int = 14,
+    max_total: int = 20,
+) -> list[dict[str, Any]]:
+    """Query bioRxiv, medRxiv, and arXiv concurrently and merge the results.
+
+    Records whose ID is in already_delivered, or was already taken from an earlier
+    source, are dropped; at most max_total records are returned.
+    """
+    import asyncio
+
+    # Each source gets a third of the budget, but never fewer than 5 slots.
+    quota = max(max_total // 3, 5)
+    labels = ("bioRxiv", "medRxiv", "arXiv")
+    outcomes = await asyncio.gather(
+        _fetch_biorxiv_server("biorxiv", queries, days, quota),
+        _fetch_biorxiv_server("medrxiv", queries, days, quota),
+        _fetch_arxiv(queries, days, quota),
+        return_exceptions=True,
+    )
+
+    merged: list[dict[str, Any]] = []
+    taken: set[str] = set()
+    counts: list[str] = []
+    for label, outcome in zip(labels, outcomes):
+        if isinstance(outcome, Exception):
+            logger.warning("Preprint fetch failed for %s: %s", label, outcome)
+            counts.append(f"{label}: err")
+            continue
+        counts.append(f"{label}: {len(outcome)}")
+        for record in outcome:
+            key = record["pmid"]
+            if key in already_delivered or key in taken:
+                continue
+            taken.add(key)
+            merged.append(record)
+
+    logger.info(
+        "Preprint candidates: %d total (%s)", len(merged), ", ".join(counts)
+    )
+    return merged[:max_total]
diff --git a/src/podcast/pubmed_search.py b/src/podcast/pubmed_search.py
new file mode 100644
index 0000000..05ede0f
--- /dev/null
+++ b/src/podcast/pubmed_search.py
@@ -0,0 +1,149 @@
+"""PubMed query builder and search for the podcast pipeline."""
+
+import asyncio
+import logging
+from typing import Any
+
+import httpx
+
+from src.config import get_settings
+from src.services.pubmed import _ncbi_get, fetch_pubmed_records
+
+logger = logging.getLogger(__name__)
+
+EUTILS_BASE = "https://eutils.ncbi.nlm.nih.gov/entrez/eutils"
+
+
+def build_queries(profile: dict[str, Any]) -> list[str]:
+    """Build up to three PubMed search query strings from a researcher's profile fields.
+
+    profile keys used: disease_areas, techniques, keywords; research_summary as a fallback
+    """
+    disease_areas: list[str] = profile.get("disease_areas") or []
+    techniques: list[str] = profile.get("techniques") or []
+    # NOTE(review): experimental_models is not queried; add it to query 2 if that was intended.
+    keywords: list[str] = profile.get("keywords") or []
+
+    queries: list[str] = []
+
+    # Query 1: disease areas (most specific to the field)
+    da_terms = [_simplify_term(t) for t in disease_areas[:6] if t]
+    da_terms = [t for t in da_terms if t and len(t.split()) <= 5]
+    if da_terms:
+        queries.append(" OR ".join(f'"{t}"' for t in da_terms[:4]))
+
+    # Query 2: techniques (finds methods papers)
+    tech_terms = [_simplify_term(t) for t in techniques[:4] if t]
+    tech_terms = [t for t in tech_terms if t and len(t.split()) <= 4]
+    if tech_terms:
+        queries.append(" OR ".join(f'"{t}"' for t in tech_terms[:4]))
+
+    # Query 3: keywords (broad coverage)
+    kw_terms = [_simplify_term(t) for t in keywords[:8] if t]
+    kw_terms = [t for t in kw_terms if t and len(t.split()) <= 4]
+    if kw_terms:
+        queries.append(" OR ".join(f'"{t}"' for t in kw_terms[:5]))
+
+    # Fallback: use research summary words if nothing else
+    if not queries:
+        summary = profile.get("research_summary") or ""
+        words = [w.strip(".,;:") for w in summary.split() if len(w) > 6][:5]
+        if words:
+            queries.append(" OR ".join(f'"{w}"' for w in words))
+
+    return queries
+
+
+def _simplify_term(term: str) -> str:
+    """Return the text before the first "(", with surrounding whitespace removed."""
+    return term.partition("(")[0].strip()
+
+
+async def search_recent_pmids(
+    queries: list[str],
+    days: int = 14,
+    max_total: int = 50,
+) -> list[str]:
+    """Run one PubMed ESearch per query; return up to max_total unique PMIDs in first-seen order."""
+    from datetime import datetime, timedelta, timezone
+
+    seen: set[str] = set()
+    pmids: list[str] = []
+
+    # Date filter: last N days. The clock is read once so both bounds share one instant.
+    now = datetime.now(timezone.utc)
+    cutoff = (now - timedelta(days=days)).strftime("%Y/%m/%d")
+    date_filter = f"{cutoff}:{now.strftime('%Y/%m/%d')}[pdat]"
+
+    for query in queries:
+        if len(pmids) >= max_total:
+            break
+        try:
+            params = {
+                "db": "pubmed",
+                "term": f"({query}) AND {date_filter}",
+                "retmode": "json",
+                "retmax": str(max_total),
+                "sort": "relevance",
+            }
+            resp = await _ncbi_get(f"{EUTILS_BASE}/esearch.fcgi", params)
+            data = resp.json()
+            ids = data.get("esearchresult", {}).get("idlist", [])
+            for pid in ids:
+                if pid not in seen and len(pmids) < max_total:
+                    seen.add(pid)
+                    pmids.append(pid)
+            logger.debug("Query '%s': %d results", query[:60], len(ids))
+        except Exception as exc:
+            logger.warning("PubMed search failed for query '%s': %s", query[:60], exc)
+
+    logger.info("Found %d candidate PMIDs across %d queries", len(pmids), len(queries))
+    return pmids
+
+
+async def fetch_candidates(
+    queries: list[str],
+    already_delivered: set[str],
+    days: int = 14,
+    max_total: int = 50,
+) -> list[dict[str, Any]]:
+    """Search PubMed and the preprint servers for candidates not yet delivered.
+
+    PubMed records are kept only if they have an abstract and no review/editorial/
+    comment/letter publication type; preprint records follow them in the result.
+    Dicts carry pmid, title, abstract, journal, year, pub_types (preprints add url, source).
+    """
+    from src.podcast.preprint_search import fetch_preprint_candidates
+
+    # Both searches run concurrently. PubMed is asked for 2x max_total IDs; the list
+    # is cut to max_total only after already-delivered IDs have been filtered out.
+    found_ids, preprints = await asyncio.gather(
+        search_recent_pmids(queries, days=days, max_total=max_total * 2),
+        fetch_preprint_candidates(
+            queries,
+            already_delivered=already_delivered,
+            days=days,
+            max_total=max(max_total // 3, 10),
+        ),
+    )
+
+    fresh_ids = [pid for pid in found_ids if pid not in already_delivered]
+    records = await fetch_pubmed_records(fresh_ids[:max_total]) if fresh_ids else []
+
+    skip_markers = ("review", "editorial", "comment", "letter")
+    primary: list[dict[str, Any]] = []
+    for record in records:
+        if not record.get("abstract"):
+            continue
+        kinds = [kind.lower() for kind in (record.get("pub_types") or [])]
+        if not any(marker in kind for kind in kinds for marker in skip_markers):
+            primary.append(record)
+
+    combined = primary + preprints
+    logger.info(
+        "%d total candidates (PubMed: %d, preprints: %d)",
+        len(combined),
+        len(primary),
+        len(preprints),
+    )
+    return combined
diff --git a/src/podcast/rss.py b/src/podcast/rss.py
new file mode 100644
index 0000000..5379910
--- /dev/null
+++ b/src/podcast/rss.py
@@ -0,0 +1,127 @@
+"""RSS feed builder for podcast episodes.
+
+Supports two keying modes:
+  - agent_id  (str)  — pilot-lab agents, URLs at /podcast/{agent_id}/...
+  - user_id   (UUID) — plain ORCID users, URLs at /podcast/users/{user_id}/...
+"""
+
+import logging
+from datetime import datetime, timezone
+from email.utils import format_datetime
+from pathlib import Path
+from typing import Any
+
+logger = logging.getLogger(__name__)
+
+AUDIO_DIR = Path("data/podcast_audio")
+
+
+def build_feed(
+    pi_name: str,
+    episodes: list[Any],
+    base_url: str,
+    agent_id: str | None = None,
+    user_id: str | None = None,
+) -> str:
+    """Render the podcast channel as an RSS 2.0 document with iTunes extensions.
+
+    episodes: list of PodcastEpisode ORM objects, newest first; one <item> each.
+    base_url: public base URL (e.g. https://copi.science)
+    agent_id: set for pilot-lab agent feeds.
+    user_id:  set for plain-user feeds (UUID as string).
+    """
+    # The feed lives under the agent's path when agent_id is set, else under users/<user_id>.
+    owner_path = agent_id if agent_id else f"users/{user_id}"
+    feed_url = _escape(f"{base_url}/podcast/{owner_path}/feed.xml")
+    owner = _escape(pi_name)
+    # Items are rendered one per episode, in the order given, and joined by newlines.
+    items_xml = "\n".join(
+        [_build_item(ep, base_url, agent_id=agent_id, user_id=user_id) for ep in episodes]
+    )
+
+    return f"""<?xml version="1.0" encoding="UTF-8"?>
+<rss version="2.0"
+     xmlns:itunes="http://www.itunes.com/dtds/podcast-1.0.dtd"
+     xmlns:atom="http://www.w3.org/2005/Atom">
+  <channel>
+    <title>{owner} — LabBot Research Briefings</title>
+    <description>Daily personalized research summaries for {owner}.</description>
+    <link>{feed_url}</link>
+    <language>en-us</language>
+    <atom:link href="{feed_url}" rel="self" type="application/rss+xml"/>
+    <itunes:author>{owner}</itunes:author>
+    <itunes:category text="Science"/>
+    <itunes:explicit>false</itunes:explicit>
+{items_xml}
+  </channel>
+</rss>"""
+
+
+def _build_item(
+    ep: Any,
+    base_url: str,
+    agent_id: str | None = None,
+    user_id: str | None = None,
+) -> str:
+    """Render one PodcastEpisode as an RSS <item> element.
+
+    The GUID and audio URL use the episode's own agent_id/user_id when set and
+    only fall back to the feed-level arguments otherwise, so a feed that mixes
+    agent-keyed and user-keyed episodes still links each item to the right
+    audio path.
+    """
+    day = ep.episode_date
+    date_str = day.isoformat()
+    # Episodes carry only a date; 09:00 UTC is used as the publication time.
+    published = datetime(day.year, day.month, day.day, 9, 0, 0, tzinfo=timezone.utc)
+    pub_date = format_datetime(published)
+    title = _escape(f"{ep.paper_title} — {date_str}")
+    description = _escape(ep.text_summary)
+    pmid_url = getattr(ep, "paper_url", None) or f"https://pubmed.ncbi.nlm.nih.gov/{ep.pmid}/"
+
+    # Prefer episode-level fields; fall back to feed-level params for legacy callers.
+    owner_agent = getattr(ep, "agent_id", None) or agent_id
+    if owner_agent:
+        guid = f"{owner_agent}-{date_str}"
+        audio_url = f"{base_url}/podcast/{owner_agent}/audio/{date_str}.mp3"
+    else:
+        uid = str(getattr(ep, "user_id", None) or user_id)
+        guid = f"user-{uid}-{date_str}"
+        audio_url = f"{base_url}/podcast/users/{uid}/audio/{date_str}.mp3"
+
+    # Without an audio file both fragments stay empty, leaving blank lines in the item.
+    enclosure_xml = ""
+    duration_xml = ""
+    if ep.audio_file_path:
+        audio_file = Path(ep.audio_file_path)
+        # A path that does not exist on disk still yields an enclosure, with length 0.
+        size_bytes = audio_file.stat().st_size if audio_file.exists() else 0
+        enclosure_xml = (
+            f'    <enclosure url="{_escape(audio_url)}" '
+            f'type="audio/mpeg" length="{size_bytes}"/>'
+        )
+        if ep.audio_duration_seconds:
+            minutes, seconds = divmod(ep.audio_duration_seconds, 60)
+            duration_xml = f"    <itunes:duration>{minutes}:{seconds:02d}</itunes:duration>"
+
+    return f"""  <item>
+    <title>{title}</title>
+    <description>{description}</description>
+    <link>{_escape(pmid_url)}</link>
+    <guid isPermaLink="false">{_escape(guid)}</guid>
+    <pubDate>{pub_date}</pubDate>
+{enclosure_xml}
+{duration_xml}
+  </item>"""
+
+
+def _escape(text: str) -> str:
+    """Return str(text) with the five XML special characters replaced by entities."""
+    entities = {
+        "&": "&amp;",
+        "<": "&lt;",
+        ">": "&gt;",
+        '"': "&quot;",
+        "'": "&apos;",
+    }
+    return str(text).translate(str.maketrans(entities))
diff --git a/src/podcast/state.py b/src/podcast/state.py
new file mode 100644
index 0000000..e22d675
--- /dev/null
+++ b/src/podcast/state.py
@@ -0,0 +1,122 @@
+"""Podcast state persistence — tracks delivered PMIDs and last run timestamp.
+
+State is keyed separately for agents (by agent_id string) and for plain ORCID
+users (by user_id UUID string, stored under "users" in the JSON).
+
+JSON structure:
+{
+  "agents": {
+    "<agent_id>": {"delivered_pmids": ["12345", ...]},
+    ...
+  },
+  "users": {
+    "<user_id UUID string>": {"delivered_pmids": ["12345", ...]},
+    ...
+  },
+  "last_run_date": "2026-04-14"
+}
+"""
+
+import json
+import logging
+import threading
+from datetime import datetime, timezone
+from pathlib import Path
+
+logger = logging.getLogger(__name__)
+
+STATE_FILE = Path("data/podcast_state.json")
+_LOCK = threading.Lock()
+
+
+def _load() -> dict:  # parsed state file, or {} when it is absent or fails to load
+    if STATE_FILE.exists():
+        try:
+            return json.loads(STATE_FILE.read_text(encoding="utf-8"))
+        except Exception as exc:  # unreadable file or invalid JSON: log, fall through to {}
+            logger.warning("Failed to load podcast state: %s", exc)
+    return {}
+
+
+def _save(data: dict) -> None:
+    """Serialize data as indented JSON to a temp file beside STATE_FILE, then rename it into place."""
+    import os
+    import tempfile
+
+    STATE_FILE.parent.mkdir(parents=True, exist_ok=True)
+    handle, tmp_name = tempfile.mkstemp(dir=STATE_FILE.parent, suffix=".tmp")
+    try:
+        with os.fdopen(handle, "w", encoding="utf-8") as out:
+            json.dump(data, out, indent=2)
+        os.replace(tmp_name, STATE_FILE)
+    except Exception:
+        os.unlink(tmp_name)  # do not leave the partial temp file behind
+        raise
+
+
+# ---------------------------------------------------------------------------
+# Agent-keyed helpers (existing behaviour, unchanged interface)
+# ---------------------------------------------------------------------------
+
+def get_delivered_pmids(agent_id: str) -> set[str]:
+    """Return the PMIDs recorded as delivered to this agent (empty set if none)."""
+    agent_entry = _load().get("agents", {}).get(agent_id, {})
+    return set(agent_entry.get("delivered_pmids", []))
+
+
+def record_delivery(agent_id: str, pmid: str) -> None:
+    """Add pmid to this agent's delivered list (if absent) and rewrite the state file."""
+    with _LOCK:
+        state = _load()
+        entry = state.setdefault("agents", {}).setdefault(agent_id, {"delivered_pmids": []})
+        delivered = entry.setdefault("delivered_pmids", [])
+        if pmid not in delivered:
+            delivered.append(pmid)
+        # The file is rewritten even when pmid was already present.
+        _save(state)
+
+
+# ---------------------------------------------------------------------------
+# User-keyed helpers (new — for plain ORCID users)
+# ---------------------------------------------------------------------------
+
+def get_delivered_pmids_for_user(user_id: str) -> set[str]:
+    """Return the PMIDs recorded as delivered to this user (empty set if none)."""
+    user_entry = _load().get("users", {}).get(str(user_id), {})
+    return set(user_entry.get("delivered_pmids", []))
+
+
+def record_delivery_for_user(user_id: str, pmid: str) -> None:
+    """Add pmid to this user's delivered list (if absent) and rewrite the state file."""
+    with _LOCK:
+        state = _load()
+        entry = state.setdefault("users", {}).setdefault(str(user_id), {"delivered_pmids": []})
+        delivered = entry.setdefault("delivered_pmids", [])
+        if pmid not in delivered:
+            delivered.append(pmid)
+        # The file is rewritten even when pmid was already present.
+        _save(state)
+
+
+# ---------------------------------------------------------------------------
+# Scheduler helpers
+# ---------------------------------------------------------------------------
+
+def get_last_run_date() -> str | None:
+    """Return the stored "last_run_date" value (an ISO date string), or None if never recorded."""
+    state = _load()
+    return state.get("last_run_date")
+
+
+def mark_run_complete() -> None:
+    """Store today's UTC date as "last_run_date" in the state file."""
+    with _LOCK:
+        today = datetime.now(timezone.utc).strftime("%Y-%m-%d")
+        # Merge into the existing state so delivery records are carried over.
+        _save({**_load(), "last_run_date": today})
+
+
+def should_run_today() -> bool:
+    """Return True unless the stored last-run date equals today's UTC date."""
+    last_run = get_last_run_date()
+    return last_run != datetime.now(timezone.utc).strftime("%Y-%m-%d")
diff --git a/src/podcast/tts_utils.py b/src/podcast/tts_utils.py
new file mode 100644
index 0000000..7a56bea
--- /dev/null
+++ b/src/podcast/tts_utils.py
@@ -0,0 +1,81 @@
+"""Shared utilities for podcast TTS backends."""
+
+import logging
+import re
+import shutil
+import subprocess
+import tempfile
+from pathlib import Path
+
+logger = logging.getLogger(__name__)
+
+
+def strip_markdown(text: str) -> str:
+    """Remove markdown formatting so TTS reads clean prose."""
+    # Links/images first: keep the label of [label](url); the URL rule below would leave "[label](".
+    text = re.sub(r"!?\[([^\]]*)\]\([^)]*\)", r"\1", text)
+    # Then emphasis markers (* and _), inline code, and bare URLs (surrounding text is kept).
+    text = re.sub(r"\*+([^*]+)\*+", r"\1", text)
+    text = re.sub(r"_+([^_]+)_+", r"\1", text)
+    text = re.sub(r"`[^`]+`", "", text)
+    text = re.sub(r"https?://\S+", "", text)
+    return text.strip()
+
+
+def normalize_audio(audio_path: Path) -> bool:
+    """Normalize audio loudness in-place using ffmpeg loudnorm (EBU R128).
+
+    Targets -16 LUFS integrated loudness, -1.5 dBTP true peak — standard podcast
+    levels. Output goes to a temp file created beside audio_path (same directory, so
+    the final rename never crosses filesystems), which then replaces the original.
+
+    Returns True if normalization succeeded, False if ffmpeg is unavailable or
+    the command fails (the original file is preserved on failure).
+    """
+    ffmpeg = shutil.which("ffmpeg")
+    if not ffmpeg:
+        logger.warning("ffmpeg not found on PATH — skipping audio normalization")
+        return False
+
+    tmp_path: Path | None = None
+    try:
+        with tempfile.NamedTemporaryFile(suffix=".mp3", delete=False, dir=audio_path.parent) as tmp:
+            tmp_path = Path(tmp.name)
+        result = subprocess.run(
+            [
+                ffmpeg,
+                "-y",                          # overwrite tmp if it exists
+                "-i", str(audio_path),
+                "-af", "loudnorm=I=-16:TP=-1.5:LRA=11",
+                "-ar", "44100",
+                str(tmp_path),
+            ],
+            capture_output=True,
+            timeout=120,
+        )
+        if result.returncode == 0:
+            tmp_path.replace(audio_path)
+            logger.info("Audio normalized (loudnorm -16 LUFS) → %s", audio_path)
+            return True
+        logger.error(
+            "ffmpeg loudnorm failed (exit %d): %s",
+            result.returncode,
+            result.stderr.decode(errors="replace")[-500:],
+        )
+    except Exception as exc:
+        logger.error("Audio normalization failed: %s", exc)
+    # Reached only on failure: drop the temp file and leave the original untouched.
+    if tmp_path is not None:
+        tmp_path.unlink(missing_ok=True)
+    return False
+
+
+def get_audio_duration_seconds(audio_path: Path) -> int | None:
+    """Return the MP3 length in whole seconds (truncated) via mutagen, or None on any error."""
+    try:
+        from mutagen.mp3 import MP3
+        track = MP3(str(audio_path))
+        return int(track.info.length)
+    except Exception as exc:
+        logger.debug("Could not read audio duration from %s: %s", audio_path, exc)
+        return None
diff --git a/src/podcast/voice_registry.py b/src/podcast/voice_registry.py
new file mode 100644
index 0000000..64eebcd
--- /dev/null
+++ b/src/podcast/voice_registry.py
@@ -0,0 +1,157 @@
+"""Runtime voice registry: fetch and cache available TTS voices per backend.
+
+At startup the app calls refresh_voices() to pre-warm the cache.
+Settings pages call get_voices() which returns the cached list immediately
+(or refreshes if the cache is stale / missing).
+
+Mistral  — fetched from /v1/audio/voices (paginated, deduped by slug)
+Local    — fetched from /v1/audio/voices on the configured vLLM server
+OpenAI   — fixed set; no API call needed
+
+All paths fall back to a hardcoded list if the remote endpoint is unreachable,
+so the settings UI always renders even if a TTS service is down.
+"""
+
+import logging
+import time
+
+import httpx
+
+logger = logging.getLogger(__name__)
+
+_CACHE_TTL = 86_400  # 24 hours
+
+# backend name -> ((voice_id, display_label) pairs, time.monotonic() value when fetched)
+_cache: dict[str, tuple[list[tuple[str, str]], float]] = {}
+
+# Static fallbacks used when the live endpoint is unreachable
+_FALLBACK: dict[str, list[tuple[str, str]]] = {
+    "mistral": [
+        ("en_paul_neutral",    "Paul — US English, male, neutral"),
+        ("en_paul_confident",  "Paul — US English, male, confident"),
+        ("en_paul_cheerful",   "Paul — US English, male, cheerful"),
+        ("en_paul_happy",      "Paul — US English, male, happy"),
+        ("gb_oliver_neutral",  "Oliver — British English, male, neutral"),
+        ("gb_jane_sarcasm",    "Jane — British English, female"),
+    ],
+    "openai": [
+        ("alloy",   "Alloy"),
+        ("echo",    "Echo"),
+        ("fable",   "Fable"),
+        ("onyx",    "Onyx"),
+        ("nova",    "Nova"),
+        ("shimmer", "Shimmer"),
+    ],
+    "local": [],
+}
+
+
+def get_cached_voices(backend: str) -> list[tuple[str, str]]:
+    """Return a copy of the known voices for *backend* without any network I/O.
+
+    Uses the cached list even if stale, else the static fallback; always a fresh
+    list so callers cannot mutate the module-level cache or fallback table.
+    """
+    entry = _cache.get(backend)
+    return list(entry[0] if entry is not None else _FALLBACK.get(backend, []))
+
+
+async def _fetch_mistral(api_key: str) -> list[tuple[str, str]]:
+    """Collect (slug, label) pairs from every page of Mistral's voice listing."""
+    collected: list[tuple[str, str]] = []
+    known_slugs: set[str] = set()
+    page_no = 1
+    async with httpx.AsyncClient(timeout=15) as client:
+        while True:
+            response = await client.get(
+                "https://api.mistral.ai/v1/audio/voices",
+                params={"page": page_no, "page_size": 50},
+                headers={"Authorization": f"Bearer {api_key}"},
+            )
+            response.raise_for_status()
+            payload = response.json()
+            added = 0
+            for voice in payload.get("items", []):
+                slug = voice.get("slug", "")
+                if slug and slug not in known_slugs:
+                    known_slugs.add(slug)
+                    display = voice.get("name", slug)
+                    languages = ", ".join(voice.get("languages") or [])
+                    # Label suffix lists languages first, then gender; empty parts are dropped.
+                    extras = [part for part in (languages, voice.get("gender", "")) if part]
+                    if extras:
+                        display = f"{display} — {', '.join(extras)}"
+                    collected.append((slug, display))
+                    added += 1
+            # Stop on the last advertised page, or when a page adds nothing new.
+            if added == 0 or page_no >= payload.get("total_pages", 1):
+                break
+            page_no += 1
+    return collected
+
+
+async def _fetch_local(host: str, port: int) -> list[tuple[str, str]]:
+    """Fetch voices from the local server; accepts a bare list or a "voices"/"items" wrapper."""
+    async with httpx.AsyncClient(timeout=5) as client:
+        response = await client.get(f"http://{host}:{port}/v1/audio/voices")
+        response.raise_for_status()
+        payload = response.json()
+    entries = payload if isinstance(payload, list) else payload.get("voices", payload.get("items", []))
+    result: list[tuple[str, str]] = []
+    for entry in entries:
+        if isinstance(entry, str):
+            result.append((entry, entry))
+        elif isinstance(entry, dict):
+            voice_id = entry.get("id") or entry.get("name") or entry.get("slug", "")
+            if voice_id:
+                result.append((voice_id, str(entry.get("name") or entry.get("label") or voice_id)))
+    return result
+
+
+async def refresh_voices(backend: str | None = None) -> list[tuple[str, str]]:
+    """Query the backend's live voice list and store it in the module cache.
+
+    *backend* defaults to ``settings.podcast_tts_backend``. Empty results and fetch
+    errors leave the cache untouched; the return value is get_cached_voices().
+    """
+    from src.config import get_settings
+
+    cfg = get_settings()
+    name = backend or cfg.podcast_tts_backend
+
+    try:
+        if name == "mistral":
+            fetched = await _fetch_mistral(cfg.mistral_api_key)
+        elif name == "local":
+            fetched = await _fetch_local(cfg.local_tts_host, cfg.local_tts_port)
+        elif name == "openai":
+            fetched = list(_FALLBACK["openai"])  # fixed set
+        else:
+            fetched = []
+
+        if not fetched:
+            logger.warning("Voice registry: no voices returned for backend %r", name)
+        else:
+            _cache[name] = (fetched, time.monotonic())
+            logger.info("Voice registry: cached %d voices for backend %r", len(fetched), name)
+
+    except Exception as exc:
+        logger.warning("Voice registry: fetch failed for backend %r: %s", name, exc)
+
+    return get_cached_voices(name)
+
+
+async def get_voices(backend: str | None = None) -> list[tuple[str, str]]:
+    """Serve voices from the cache while younger than _CACHE_TTL; otherwise refresh first."""
+    from src.config import get_settings
+
+    name = backend or get_settings().podcast_tts_backend
+
+    # Cache entries are (voices, monotonic fetch time) tuples.
+    entry = _cache.get(name)
+    if entry is not None:
+        cached, fetched_at = entry
+        if time.monotonic() - fetched_at < _CACHE_TTL:
+            return cached
+
+    return await refresh_voices(name)
diff --git a/src/routers/admin.py b/src/routers/admin.py
index 46c05ac..8a28ea8 100644
--- a/src/routers/admin.py
+++ b/src/routers/admin.py
@@ -1,16 +1,18 @@
 """Admin dashboard router."""
 
 import logging
+import re
 import uuid
-from datetime import datetime, timezone
+from datetime import date, datetime, timedelta, timezone
 
 from fastapi import APIRouter, Depends, Form, HTTPException, Query, Request, status
-from fastapi.responses import HTMLResponse, RedirectResponse
+from fastapi.responses import HTMLResponse, JSONResponse, RedirectResponse
 from fastapi.templating import Jinja2Templates
 from sqlalchemy import func, select
 from sqlalchemy.ext.asyncio import AsyncSession
 from sqlalchemy.orm import selectinload
 
+from src.config import get_settings
 from src.database import get_db
 from src.dependencies import get_admin_user, get_current_user
 from src.models import (
@@ -20,6 +22,10 @@
     AgentRegistry,
     Job,
     LlmCallLog,
+    MatchmakerProposal,
+    PiProposalEvaluation,
+    PodcastEpisode,
+    PodcastPreferences,
     Publication,
     ResearcherProfile,
     SimulationRun,
@@ -34,6 +40,16 @@
 templates = Jinja2Templates(directory="templates")
 
 
+def _extract_proposal(text: str) -> str:
+    """Return the first <proposal>…</proposal> body, or the whole text if untagged (stripped)."""
+    import re
+    found = re.search(r"<proposal>(.*?)</proposal>", text or "", re.DOTALL)
+    return (found.group(1) if found else (text or "")).strip()
+
+
+templates.env.filters["extract_proposal"] = _extract_proposal
+
+
 def _template_context(
     request: Request, current_user: User, active_admin: str = "", **kwargs
 ) -> dict:
@@ -76,15 +92,14 @@ async def admin_users(
         pub_count = pub_counts.get(str(user.id), 0)
 
         # Profile status
+        active_jobs = [j for j in user.jobs if j.status in ("pending", "processing")]
         if not profile:
-            profile_status = "no_profile"
+            profile_status = "generating" if active_jobs else "no_profile"
         elif profile.pending_profile:
             profile_status = "pending_update"
         elif profile.research_summary:
             profile_status = "complete"
         else:
-            # Check if there's a running job
-            active_jobs = [j for j in user.jobs if j.status in ("pending", "processing")]
             profile_status = "generating" if active_jobs else "no_profile"
 
         # Apply filters
@@ -543,6 +558,10 @@ async def admin_discussions(
     for d in all_decisions:
         decision_map[d.thread_id] = d
 
+    # Track all root-post thread IDs before any filtering so orphan detection
+    # is accurate even when a status/channel filter removes some threads.
+    all_root_thread_ids = {post.message_ts for post in root_posts}
+
     # Build thread list
     threads = []
     available_channels = set()
@@ -606,10 +625,10 @@ async def admin_discussions(
         else:
             t["reviews"] = []
 
-    # Add orphaned decisions (thread_decisions with no matching root post in agent_messages)
-    known_thread_ids = {t["message_ts"] for t in threads}
+    # Add orphaned decisions (thread_decisions with no matching root post in agent_messages).
+    # Use all_root_thread_ids (pre-filter) so filtered-out threads aren't mistaken for orphans.
     for td in all_decisions:
-        if td.thread_id not in known_thread_ids:
+        if td.thread_id not in all_root_thread_ids:
             other_agents = replier_map.get(td.thread_id, set())
             poster_id = td.agent_a
             replier = td.agent_b if td.agent_a == poster_id else td.agent_a
@@ -671,7 +690,7 @@ async def admin_discussions(
                 "agent_b": d.agent_b,
                 "outcome": d.outcome,
                 "date": d.decided_at.strftime("%Y-%m-%d %H:%M UTC"),
-                "summary": d.summary_text.strip(),
+                "summary": _extract_proposal(d.summary_text),
             })
 
         if export == "html":
@@ -960,6 +979,71 @@ async def impersonate_user(
     return response
 
 
+@router.get("/podcast", response_class=HTMLResponse)
+async def admin_podcast(
+    request: Request,
+    agent_filter: str | None = None,
+    db: AsyncSession = Depends(get_db),
+    current_user: User = Depends(get_admin_user),
+):
+    """Render the admin podcast overview page.
+
+    Loads the 200 most recent episodes; the summary stats cover those rows, while
+    the optional *agent_filter* only narrows the episode list that is displayed.
+    """
+    recent_stmt = select(PodcastEpisode).order_by(PodcastEpisode.episode_date.desc()).limit(200)
+    all_episodes = (await db.execute(recent_stmt)).scalars().all()
+
+    # Filter the listing in Python so the stats still see every loaded episode
+    if agent_filter:
+        episodes = [ep for ep in all_episodes if ep.agent_id == agent_filter]
+    else:
+        episodes = list(all_episodes)
+
+    # Summary stats over the loaded rows
+    total = len(all_episodes)
+    audio_count = sum(bool(ep.audio_file_path) for ep in all_episodes)
+    delivered_count = sum(bool(ep.slack_delivered) for ep in all_episodes)
+    agent_ids = sorted({ep.agent_id for ep in all_episodes if ep.agent_id is not None})
+
+    # Every stored preferences row that has an agent_id, keyed by that id
+    prefs_rows = (await db.execute(select(PodcastPreferences))).scalars().all()
+    prefs_by_agent: dict[str, PodcastPreferences] = {
+        pref.agent_id: pref for pref in prefs_rows if pref.agent_id is not None
+    }
+
+    # LLM usage for the podcast phases, counting only calls without a simulation run
+    call_count = func.count(LlmCallLog.id).label("call_count")
+    tokens_in = func.coalesce(func.sum(LlmCallLog.input_tokens), 0).label("input_tokens")
+    tokens_out = func.coalesce(func.sum(LlmCallLog.output_tokens), 0).label("output_tokens")
+    usage_stmt = select(call_count, tokens_in, tokens_out).where(
+        LlmCallLog.simulation_run_id.is_(None),
+        LlmCallLog.phase.in_(["podcast_select", "podcast_summarize"]),
+    )
+    usage = (await db.execute(usage_stmt)).one()
+
+    # podcast_base_url takes precedence over base_url when it is set
+    settings = get_settings()
+    context = _template_context(
+        request,
+        current_user,
+        active_admin="podcast",
+        episodes=episodes,
+        total=total,
+        with_audio=audio_count,
+        slack_delivered=delivered_count,
+        agent_ids=agent_ids,
+        agent_filter=agent_filter,
+        base_url=settings.podcast_base_url or settings.base_url,
+        prefs_by_agent=prefs_by_agent,
+        llm_call_count=usage.call_count,
+        llm_input_tokens=usage.input_tokens,
+        llm_output_tokens=usage.output_tokens,
+    )
+
+    return templates.TemplateResponse(request, "admin/podcast.html", context)
+
+
 @router.post("/impersonate/stop")
 async def stop_impersonating(
     request: Request,
@@ -1218,3 +1302,841 @@ async def admin_waitlist_mark_contacted(
         signup.contacted_at = datetime.now(timezone.utc)
         await db.commit()
     return RedirectResponse(url="/admin/waitlist", status_code=302)
+
+
+# ---------------------------------------------------------------------------
+# Matchmaker
+# ---------------------------------------------------------------------------
+
+async def _get_eligible_matchmaker_users(db: AsyncSession) -> list:
+    """Return matchmaker-eligible users sorted by name: DB profile OR disk profile via AgentRegistry."""
+    from pathlib import Path
+
+    # Users with a complete DB profile (research_summary is set)
+    db_result = await db.execute(
+        select(User)
+        .join(ResearcherProfile, ResearcherProfile.user_id == User.id)
+        .where(ResearcherProfile.research_summary.isnot(None))
+    )
+    eligible = {u.id: u for u in db_result.scalars().all()}
+
+    # Users linked to an agent whose public profile file exists on disk
+    agent_result = await db.execute(
+        select(AgentRegistry).where(AgentRegistry.user_id.isnot(None))
+    )
+    disk_user_ids = {
+        reg.user_id
+        for reg in agent_result.scalars().all()
+        if reg.user_id not in eligible
+        and Path(f"profiles/public/{reg.agent_id}.md").exists()
+    }
+    # Load the remaining users with one IN query instead of one query per agent
+    if disk_user_ids:
+        extra = await db.execute(select(User).where(User.id.in_(disk_user_ids)))
+        eligible.update((u.id, u) for u in extra.scalars().all())
+
+    return sorted(eligible.values(), key=lambda u: u.name)
+
+
+@router.get("/matchmaker", response_class=HTMLResponse)
+async def admin_matchmaker(
+    request: Request,
+    pi_filter: list[uuid.UUID] = Query(default=[]),
+    confidence_filter: str | None = None,
+    export: str = "",
+    db: AsyncSession = Depends(get_db),
+    current_user: User = Depends(get_admin_user),
+):
+    """Show stored matchmaker proposals, or download them when *export* is set.
+
+    ``export == "html"`` renders the export template; any other non-empty value
+    returns a plain-text attachment. The filters apply to the page and to exports.
+    """
+    eligible_users = await _get_eligible_matchmaker_users(db)
+
+    # Newest first, with both PI relationships eager-loaded
+    stmt = select(MatchmakerProposal).options(
+        selectinload(MatchmakerProposal.pi_a), selectinload(MatchmakerProposal.pi_b)
+    ).order_by(MatchmakerProposal.generated_at.desc())
+    if pi_filter:
+        on_side_a = MatchmakerProposal.pi_a_id.in_(pi_filter)
+        on_side_b = MatchmakerProposal.pi_b_id.in_(pi_filter)
+        stmt = stmt.where(on_side_a | on_side_b)
+    if confidence_filter:
+        stmt = stmt.where(MatchmakerProposal.confidence == confidence_filter)
+    proposals = (await db.execute(stmt)).scalars().all()
+
+    if not export:
+        return templates.TemplateResponse(
+            request,
+            "admin/matchmaker.html",
+            _template_context(
+                request,
+                current_user,
+                active_admin="matchmaker",
+                eligible_users=eligible_users,
+                proposals=proposals,
+                pi_filter=pi_filter,
+                confidence_filter=confidence_filter,
+                error=None,
+            ),
+        )
+
+    export_rows = [
+        {
+            "name_a": prop.name_a,
+            "name_b": prop.name_b,
+            "title": prop.title or "",
+            "confidence": prop.confidence or "",
+            "date": prop.generated_at.strftime("%Y-%m-%d %H:%M UTC"),
+            "proposal_md": _extract_proposal(prop.proposal_md or ""),
+        }
+        for prop in proposals
+    ]
+
+    if export == "html":
+        return templates.TemplateResponse(
+            request,
+            "admin/matchmaker_export.html",
+            {"request": request, "proposals": export_rows},
+            headers={"Content-Disposition": "attachment; filename=matchmaker_proposals.html"},
+        )
+
+    from fastapi.responses import PlainTextResponse
+
+    if not export_rows:
+        body = "No proposals found with current filters."
+    else:
+        chunks: list[str] = []
+        for row in export_rows:
+            chunks.extend([
+                "=" * 72,
+                f"PI A: {row['name_a']}",
+                f"PI B: {row['name_b']}",
+                f"Title: {row['title']}",
+                f"Confidence: {row['confidence'].capitalize()}",
+                f"Generated: {row['date']}",
+                "",
+                row["proposal_md"],
+                "",
+            ])
+        body = "\n".join(chunks)
+    return PlainTextResponse(
+        body,
+        headers={"Content-Disposition": "attachment; filename=matchmaker_proposals.txt"},
+    )
+
+
+@router.post("/matchmaker/generate", response_class=HTMLResponse)
+async def admin_matchmaker_generate(
+    request: Request,
+    pi_a_id: uuid.UUID = Form(...),
+    pi_b_id: uuid.UUID = Form(...),
+    db: AsyncSession = Depends(get_db),
+    current_user: User = Depends(get_admin_user),
+):
+    """Generate a proposal for two PIs via the LLM, store it, and redirect to its detail page."""
+    from src.services.llm import generate_matchmaker_proposal
+
+    async def _render_error(msg: str):  # re-render the matchmaker page, unfiltered, showing msg
+        eligible_users = await _get_eligible_matchmaker_users(db)
+        proposals_result = await db.execute(
+            select(MatchmakerProposal)
+            .options(
+                selectinload(MatchmakerProposal.pi_a),
+                selectinload(MatchmakerProposal.pi_b),
+            )
+            .order_by(MatchmakerProposal.generated_at.desc())
+        )
+        proposals = proposals_result.scalars().all()
+        return templates.TemplateResponse(
+            request,
+            "admin/matchmaker.html",
+            _template_context(
+                request,
+                current_user,
+                active_admin="matchmaker",
+                eligible_users=eligible_users,
+                proposals=proposals,
+                pi_filter=[],
+                confidence_filter=None,
+                error=msg,
+            ),
+        )
+
+    if pi_a_id == pi_b_id:
+        return await _render_error("Please select two different PIs.")
+
+    # Loader for one PI: (user, public profile, private profile, formatted pubs), or four Nones
+    async def _load_user_data(user_id: uuid.UUID):
+        from pathlib import Path
+        user_result = await db.execute(
+            select(User)
+            .where(User.id == user_id)
+            .options(selectinload(User.profile))
+        )
+        user = user_result.scalar_one_or_none()
+        if not user:
+            return None, None, None, None  # unknown user id
+
+        # DB profile takes precedence; fall back to disk profile for seeded agents
+        profile_text = None
+        private_text = ""
+        if user.profile and user.profile.research_summary:
+            profile = user.profile
+            parts = [profile.research_summary]
+            if profile.techniques:
+                parts.append("**Techniques:** " + ", ".join(profile.techniques))
+            if profile.experimental_models:
+                parts.append("**Model systems:** " + ", ".join(profile.experimental_models))
+            if profile.disease_areas:
+                parts.append("**Disease areas:** " + ", ".join(profile.disease_areas))
+            if profile.key_targets:
+                parts.append("**Key targets:** " + ", ".join(profile.key_targets))
+            if profile.grant_titles:
+                parts.append("**Active grants:** " + "; ".join(profile.grant_titles))
+            profile_text = "\n\n".join(parts)
+            private_text = profile.private_profile_md or ""
+        else:
+            # No DB summary: read profiles/public|private/<agent_id>.md via the user's AgentRegistry row
+            agent_result = await db.execute(
+                select(AgentRegistry).where(AgentRegistry.user_id == user_id)
+            )
+            agent_reg = agent_result.scalar_one_or_none()  # NOTE(review): raises if a user has several agents — confirm user_id is unique
+            if agent_reg:
+                pub_path = Path(f"profiles/public/{agent_reg.agent_id}.md")
+                priv_path = Path(f"profiles/private/{agent_reg.agent_id}.md")
+                if pub_path.exists():
+                    profile_text = pub_path.read_text(encoding="utf-8").strip()
+                if priv_path.exists():
+                    private_text = priv_path.read_text(encoding="utf-8").strip()
+
+        if not profile_text:
+            return None, None, None, None  # neither source produced a public profile
+
+        pubs_result = await db.execute(
+            select(Publication)
+            .where(Publication.user_id == user_id)
+            .order_by(Publication.year.desc())
+            .limit(20)
+        )
+        pubs = pubs_result.scalars().all()
+
+        def _format_pubs(pubs) -> str:  # one "- title [position] (year) — journal PMID:n" bullet per publication
+            if not pubs:
+                return "(none)"
+            lines = []
+            for p in pubs:
+                pos = f" [{p.author_position}]" if p.author_position else ""
+                journal = f" — {p.journal}" if p.journal else ""
+                year = f" ({p.year})" if p.year else ""
+                pmid = f" PMID:{p.pmid}" if p.pmid else ""
+                lines.append(f"- {p.title}{pos}{year}{journal}{pmid}")
+            return "\n".join(lines)
+
+        return user, profile_text, private_text, _format_pubs(pubs)
+
+    user_a, profile_text_a, private_a, pubs_text_a = await _load_user_data(pi_a_id)
+    user_b, profile_text_b, private_b, pubs_text_b = await _load_user_data(pi_b_id)
+
+    if not profile_text_a:
+        return await _render_error("PI A does not have a complete profile yet.")
+    if not profile_text_b:
+        return await _render_error("PI B does not have a complete profile yet.")
+
+    settings = get_settings()
+
+    try:
+        result = await generate_matchmaker_proposal(
+            name_a=user_a.name,
+            public_profile_a=profile_text_a,
+            private_profile_a=private_a,
+            publications_a=pubs_text_a,
+            name_b=user_b.name,
+            public_profile_b=profile_text_b,
+            private_profile_b=private_b,
+            publications_b=pubs_text_b,
+            model=settings.llm_agent_model_opus,
+        )
+    except Exception as exc:
+        logger.error("Matchmaker LLM call failed: %s", exc)
+        return await _render_error(f"LLM call failed: {exc}")  # the exception text is shown on the admin page
+
+    proposal = MatchmakerProposal(
+        pi_a_id=pi_a_id,
+        pi_b_id=pi_b_id,
+        proposal_md=result["proposal_md"],
+        title=result["title"],
+        confidence=result["confidence"],
+        llm_model=result["model"],
+        input_tokens=result["input_tokens"],
+        output_tokens=result["output_tokens"],
+    )
+    db.add(proposal)
+    await db.commit()  # NOTE(review): proposal.id is read after commit — assumes expire_on_commit=False; confirm
+
+    return RedirectResponse(url=f"/admin/matchmaker/{proposal.id}", status_code=302)
+
+
+@router.get("/matchmaker/{proposal_id}", response_class=HTMLResponse)
+async def admin_matchmaker_detail(
+    request: Request,
+    proposal_id: uuid.UUID,
+    db: AsyncSession = Depends(get_db),
+    current_user: User = Depends(get_admin_user),
+):
+    """Render the detail page for one matchmaker proposal.
+
+    Raises HTTPException(404) when no proposal has the given id.
+    """
+    # Both PI relationships are eager-loaded together with the proposal row
+    stmt = select(MatchmakerProposal).where(MatchmakerProposal.id == proposal_id)
+    stmt = stmt.options(
+        selectinload(MatchmakerProposal.pi_a),
+        selectinload(MatchmakerProposal.pi_b),
+    )
+    proposal = (await db.execute(stmt)).scalar_one_or_none()
+    if not proposal:
+        raise HTTPException(status_code=404, detail="Proposal not found")
+
+    context = _template_context(
+        request,
+        current_user,
+        active_admin="matchmaker",
+        proposal=proposal,
+    )
+    return templates.TemplateResponse(
+        request, "admin/matchmaker_detail.html", context
+    )
+
+
+@router.post("/matchmaker/{proposal_id}/delete")
+async def admin_matchmaker_delete(
+    proposal_id: uuid.UUID,
+    db: AsyncSession = Depends(get_db),
+    current_user: User = Depends(get_admin_user),
+):
+    """Delete one matchmaker proposal, then redirect to the matchmaker list."""
+    stmt = select(MatchmakerProposal).where(MatchmakerProposal.id == proposal_id)
+    target = (await db.execute(stmt)).scalar_one_or_none()
+    # An unknown id is not an error: the redirect below is issued either way
+    if target:
+        await db.delete(target)
+        await db.commit()
+
+    return RedirectResponse(url="/admin/matchmaker", status_code=302)
+
+
+@router.post("/matchmaker/clear")
+async def admin_matchmaker_clear(
+    db: AsyncSession = Depends(get_db),
+    current_user: User = Depends(get_admin_user),
+):
+    """Bulk-delete every MatchmakerProposal row (Slack is untouched), then redirect to the list."""
+    from sqlalchemy import delete
+    await db.execute(delete(MatchmakerProposal))
+    await db.commit()
+    return RedirectResponse(url="/admin/matchmaker", status_code=302)
+
+
+@router.post("/discussions/clear")
+async def admin_discussions_clear(
+    db: AsyncSession = Depends(get_db),
+    current_user: User = Depends(get_admin_user),
+):
+    """Bulk-delete every ThreadDecision row (Slack untouched); reviews go only if the FK cascades — confirm."""
+    from sqlalchemy import delete
+    await db.execute(delete(ThreadDecision))
+    await db.commit()
+    return RedirectResponse(url="/admin/discussions", status_code=302)
+
+
+# ---------------------------------------------------------------------------
+# PI Proposal Evaluations
+# ---------------------------------------------------------------------------
+
+def _extract_title_admin(text: str | None) -> str | None:
+    """Derive a display title from the first non-blank line of *text*.
+
+    A Markdown heading has its leading '#' markers removed (None if nothing is
+    left); any other line is truncated to 120 characters. Blank input gives None.
+    """
+    first = next((ln.strip() for ln in (text or "").splitlines() if ln.strip()), "")
+    if first.startswith("#"):
+        return re.sub(r"^#+\s*", "", first).strip() or None
+    return first[:120] or None
+
+
+@router.get("/evaluations", response_class=HTMLResponse)
+async def admin_evaluations(
+    request: Request,
+    origin_filter: str | None = None,
+    pi_filter: str | None = None,
+    impact_min: str | None = None,
+    impact_max: str | None = None,
+    date_from: str | None = None,
+    date_to: str | None = None,
+    db: AsyncSession = Depends(get_db),
+    current_user: User = Depends(get_admin_user),
+):
+    """Admin view of all PI proposal evaluations."""
+    impact_min_val = int(impact_min) if impact_min and impact_min.strip() else None
+    impact_max_val = int(impact_max) if impact_max and impact_max.strip() else None
+
+    # Dropdown: all allowed users, ordered by name
+    all_evaluators_result = await db.execute(
+        select(User).where(User.access_status == "allowed").order_by(User.name)
+    )
+    all_evaluators = all_evaluators_result.scalars().all()
+
+    # Resolve selected PI's names (user.name + agent.pi_name) for collaborator matching
+    selected_pi_id = None
+    selected_pi_names: set[str] = set()
+    if pi_filter:
+        try:
+            import uuid as _uuid
+            selected_pi_id = _uuid.UUID(pi_filter)
+            pi_user_result = await db.execute(select(User).where(User.id == selected_pi_id))
+            pi_user = pi_user_result.scalar_one_or_none()
+            if pi_user:
+                selected_pi_names.add(pi_user.name)
+            pi_agent_result = await db.execute(
+                select(AgentRegistry).where(AgentRegistry.user_id == selected_pi_id)
+            )
+            pi_agent_rec = pi_agent_result.scalar_one_or_none()
+            if pi_agent_rec:
+                selected_pi_names.add(pi_agent_rec.pi_name)
+        except ValueError:
+            selected_pi_id = None
+
+    query = (
+        select(PiProposalEvaluation)
+        .options(
+            selectinload(PiProposalEvaluation.user),
+            selectinload(PiProposalEvaluation.thread_decision),
+            selectinload(PiProposalEvaluation.matchmaker_proposal)
+            .selectinload(MatchmakerProposal.pi_a),
+            selectinload(PiProposalEvaluation.matchmaker_proposal)
+            .selectinload(MatchmakerProposal.pi_b),
+        )
+        .order_by(PiProposalEvaluation.evaluated_at.desc())
+    )
+
+    if origin_filter in ("agent", "matchmaker"):
+        query = query.where(PiProposalEvaluation.proposal_type == origin_filter)
+    if impact_min_val is not None:
+        query = query.where(PiProposalEvaluation.score_overall_impact >= impact_min_val)
+    if impact_max_val is not None:
+        query = query.where(PiProposalEvaluation.score_overall_impact <= impact_max_val)
+    if date_from:
+        try:
+            df = date.fromisoformat(date_from)
+            query = query.where(PiProposalEvaluation.evaluated_at >= df)
+        except ValueError:
+            pass
+    if date_to:
+        try:
+            dt = date.fromisoformat(date_to) + timedelta(days=1)
+            query = query.where(PiProposalEvaluation.evaluated_at < dt)
+        except ValueError:
+            pass
+
+    result = await db.execute(query)
+    evaluations = result.scalars().all()
+
+    # Resolve collaborator names for agent evaluations
+    agent_ids_needed: set[str] = set()
+    for ev in evaluations:
+        if ev.proposal_type == "agent" and ev.thread_decision:
+            agent_ids_needed.add(ev.thread_decision.agent_a)
+            agent_ids_needed.add(ev.thread_decision.agent_b)
+
+    # Also need agent info for the selected PI to match agent proposals by collaborator
+    if selected_pi_id and not selected_pi_names:
+        pass  # already handled above
+    agent_reg_map: dict[str, AgentRegistry] = {}
+    if agent_ids_needed:
+        ar_result = await db.execute(
+            select(AgentRegistry)
+            .options(selectinload(AgentRegistry.user))
+            .where(AgentRegistry.agent_id.in_(agent_ids_needed))
+        )
+        agent_reg_map = {a.agent_id: a for a in ar_result.scalars().all()}
+
+    # Build per-user name lookup covering evaluators + matchmaker collaborators
+    all_relevant_user_ids = {ev.user_id for ev in evaluations}
+    for ev in evaluations:
+        if ev.matchmaker_proposal:
+            mp = ev.matchmaker_proposal
+            if mp.pi_a_id:
+                all_relevant_user_ids.add(mp.pi_a_id)
+            if mp.pi_b_id:
+                all_relevant_user_ids.add(mp.pi_b_id)
+    evaluator_agent_result = await db.execute(
+        select(AgentRegistry).where(AgentRegistry.user_id.in_(all_relevant_user_ids))
+    )
+    evaluator_agent_map: dict = {a.user_id: a for a in evaluator_agent_result.scalars().all()}
+
+    eval_rows = []
+    for ev in evaluations:
+        if ev.proposal_type == "agent" and ev.thread_decision:
+            td = ev.thread_decision
+            title = _extract_title_admin(td.summary_text) or "Collaboration Proposal"
+            collaborator = "Unknown"
+            collaborator_agent_id = None
+            for aid in (td.agent_a, td.agent_b):
+                ar = agent_reg_map.get(aid)
+                if ar and ar.user_id != ev.user_id:
+                    collaborator = ar.user.name if ar.user else (ar.pi_name or aid)
+                    collaborator_agent_id = ar.agent_id
+                    break
+        else:
+            mp = ev.matchmaker_proposal
+            title = mp.title if mp else "Unknown"
+            collaborator_agent_id = None
+            if mp:
+                # Use evaluator's known names to determine which side they are
+                ev_names: set[str] = set()
+                if ev.user:
+                    ev_names.add(ev.user.name)
+                ev_agent = evaluator_agent_map.get(ev.user_id)
+                if ev_agent:
+                    ev_names.add(ev_agent.pi_name)
+                is_pi_a = (mp.pi_a_id == ev.user_id) or (mp.pi_a_name in ev_names)
+                collaborator = mp.name_b if is_pi_a else mp.name_a
+                collab_user_id = mp.pi_b_id if is_pi_a else mp.pi_a_id
+                collab_ar = evaluator_agent_map.get(collab_user_id) if collab_user_id else None
+                if collab_ar:
+                    collaborator_agent_id = collab_ar.agent_id
+            else:
+                collaborator = "Unknown"
+
+        eval_rows.append({"eval": ev, "title": title, "collaborator": collaborator, "collaborator_agent_id": collaborator_agent_id})
+
+    # Apply PI filter at Python level: match evaluator OR collaborator
+    if selected_pi_id and selected_pi_names:
+        eval_rows = [
+            row for row in eval_rows
+            if row["eval"].user_id == selected_pi_id
+            or row["collaborator"] in selected_pi_names
+        ]
+
+    # Summary stats computed on filtered rows
+    total_count = len(eval_rows)
+    today = date.today()
+    this_month = sum(
+        1 for row in eval_rows
+        if row["eval"].evaluated_at
+        and row["eval"].evaluated_at.date().month == today.month
+        and row["eval"].evaluated_at.date().year == today.year
+    )
+    mean_impact = (
+        sum(row["eval"].score_overall_impact for row in eval_rows) / total_count
+        if total_count else 0.0
+    )
+
+    # --- Pending proposals section (all proposals, hidden or not) ---
+    pending_td_result = await db.execute(
+        select(ThreadDecision)
+        .where(ThreadDecision.outcome == "proposal")
+        .order_by(ThreadDecision.decided_at.desc())
+    )
+    pending_tds = pending_td_result.scalars().all()
+
+    pending_mm_result = await db.execute(
+        select(MatchmakerProposal)
+        .options(selectinload(MatchmakerProposal.pi_a), selectinload(MatchmakerProposal.pi_b))
+        .order_by(MatchmakerProposal.generated_at.desc())
+    )
+    pending_mms = pending_mm_result.scalars().all()
+
+    pending_agent_ids: set[str] = {td.agent_a for td in pending_tds} | {td.agent_b for td in pending_tds}
+    pending_ar_map: dict[str, AgentRegistry] = {}
+    if pending_agent_ids:
+        par_result = await db.execute(
+            select(AgentRegistry)
+            .options(selectinload(AgentRegistry.user))
+            .where(AgentRegistry.agent_id.in_(pending_agent_ids))
+        )
+        pending_ar_map = {a.agent_id: a for a in par_result.scalars().all()}
+
+    td_cov_result = await db.execute(
+        select(PiProposalEvaluation.thread_decision_id, PiProposalEvaluation.user_id)
+        .where(PiProposalEvaluation.thread_decision_id.isnot(None))
+    )
+    td_eval_coverage = {(r[0], r[1]) for r in td_cov_result}
+
+    mm_cov_result = await db.execute(
+        select(PiProposalEvaluation.matchmaker_proposal_id, PiProposalEvaluation.user_id)
+        .where(PiProposalEvaluation.matchmaker_proposal_id.isnot(None))
+    )
+    mm_eval_coverage = {(r[0], r[1]) for r in mm_cov_result}
+
+    pending_proposals: list[dict] = []
+
+    for td in pending_tds:
+        ar_a = pending_ar_map.get(td.agent_a)
+        ar_b = pending_ar_map.get(td.agent_b)
+        name_a = (ar_a.user.name if ar_a and ar_a.user else (ar_a.pi_name or td.agent_a)) if ar_a else td.agent_a
+        name_b = (ar_b.user.name if ar_b and ar_b.user else (ar_b.pi_name or td.agent_b)) if ar_b else td.agent_b
+        uid_a = ar_a.user_id if ar_a else None
+        uid_b = ar_b.user_id if ar_b else None
+        evaluated_a = uid_a is not None and (td.id, uid_a) in td_eval_coverage
+        evaluated_b = uid_b is not None and (td.id, uid_b) in td_eval_coverage
+        if not (evaluated_a and evaluated_b):
+            pending_proposals.append({
+                "proposal_type": "agent",
+                "proposal_id": str(td.id),
+                "name_a": name_a,
+                "name_b": name_b,
+                "title": _extract_title_admin(td.summary_text) or "Collaboration Proposal",
+                "evaluated_a": evaluated_a,
+                "evaluated_b": evaluated_b,
+                "hidden": td.hidden,
+            })
+
+    for mp in pending_mms:
+        if mp.pi_a_id is not None and mp.pi_b_id is not None:
+            evaluated_a = (mp.id, mp.pi_a_id) in mm_eval_coverage
+            evaluated_b = (mp.id, mp.pi_b_id) in mm_eval_coverage
+        else:
+            eval_count = sum(1 for r in mm_eval_coverage if r[0] == mp.id)
+            evaluated_a = eval_count >= 1
+            evaluated_b = eval_count >= 2
+        if not (evaluated_a and evaluated_b):
+            pending_proposals.append({
+                "proposal_type": "matchmaker",
+                "proposal_id": str(mp.id),
+                "name_a": mp.name_a,
+                "name_b": mp.name_b,
+                "title": mp.title,
+                "evaluated_a": evaluated_a,
+                "evaluated_b": evaluated_b,
+                "hidden": mp.hidden,
+            })
+
+    return templates.TemplateResponse(
+        request,
+        "admin/evaluations.html",
+        _template_context(
+            request,
+            current_user,
+            active_admin="evaluations",
+            eval_rows=eval_rows,
+            total_count=total_count,
+            this_month=this_month,
+            mean_impact=round(mean_impact, 1),
+            origin_filter=origin_filter or "",
+            pi_filter=pi_filter or "",
+            all_evaluators=all_evaluators,
+            impact_min=impact_min_val,
+            impact_max=impact_max_val,
+            date_from=date_from or "",
+            date_to=date_to or "",
+            pending_proposals=pending_proposals,
+        ),
+    )
+
+
+@router.post("/evaluations/proposals/{proposal_type}/{proposal_id}/hide")
+async def hide_proposal(
+    proposal_type: str,
+    proposal_id: uuid.UUID,
+    request: Request,
+    db: AsyncSession = Depends(get_db),
+    current_user: User = Depends(get_admin_user),
+):
+    """Toggle ``hidden`` on an agent or matchmaker proposal (affects the PI-facing /proposals page).
+
+    Raises 400 for an unknown ``proposal_type`` and 404 when no row has ``proposal_id``;
+    on success the change is committed and the admin is redirected to /admin/evaluations.
+    """
+    # URL segment -> ORM model that stores that kind of proposal.
+    model = {"agent": ThreadDecision, "matchmaker": MatchmakerProposal}.get(proposal_type)
+    if model is None:
+        raise HTTPException(status_code=400, detail="Invalid proposal type")
+
+    proposal = (await db.execute(select(model).where(model.id == proposal_id))).scalar_one_or_none()
+    if not proposal:
+        raise HTTPException(status_code=404, detail="Proposal not found")
+    proposal.hidden = not proposal.hidden
+    await db.commit()
+    return RedirectResponse(url="/admin/evaluations", status_code=302)
+
+
+@router.get("/evaluations/export.json")
+async def admin_evaluations_export(
+    request: Request,
+    origin_filter: str | None = None,
+    pi_filter: str | None = None,
+    impact_min: str | None = None,
+    impact_max: str | None = None,
+    date_from: str | None = None,
+    date_to: str | None = None,
+    db: AsyncSession = Depends(get_db),
+    current_user: User = Depends(get_admin_user),
+):
+    """Export all matching PI evaluations as a JSON attachment; malformed filter values are ignored."""
+    def _int_or_none(raw: str | None) -> int | None:
+        # A non-numeric bound is dropped, like a malformed UUID or date below, rather than raising (HTTP 500).
+        try:
+            return int(raw) if raw and raw.strip() else None
+        except ValueError:
+            return None
+
+    impact_min_val = _int_or_none(impact_min)
+    impact_max_val = _int_or_none(impact_max)
+    query = (
+        select(PiProposalEvaluation)
+        .options(
+            selectinload(PiProposalEvaluation.user),
+            selectinload(PiProposalEvaluation.thread_decision),
+            selectinload(PiProposalEvaluation.matchmaker_proposal).selectinload(MatchmakerProposal.pi_a),
+            selectinload(PiProposalEvaluation.matchmaker_proposal).selectinload(MatchmakerProposal.pi_b),
+        )
+        .order_by(PiProposalEvaluation.evaluated_at.desc())
+    )
+
+    if origin_filter in ("agent", "matchmaker"):
+        query = query.where(PiProposalEvaluation.proposal_type == origin_filter)
+    if pi_filter:
+        try:
+            query = query.where(PiProposalEvaluation.user_id == uuid.UUID(pi_filter))
+        except ValueError:
+            pass
+    if impact_min_val is not None:
+        query = query.where(PiProposalEvaluation.score_overall_impact >= impact_min_val)
+    if impact_max_val is not None:
+        query = query.where(PiProposalEvaluation.score_overall_impact <= impact_max_val)
+    if date_from:
+        try:
+            df = date.fromisoformat(date_from)
+            query = query.where(PiProposalEvaluation.evaluated_at >= df)
+        except ValueError:
+            pass
+    if date_to:
+        try:
+            dt = date.fromisoformat(date_to) + timedelta(days=1)
+            query = query.where(PiProposalEvaluation.evaluated_at < dt)
+        except ValueError:
+            pass
+
+    evaluations = (await db.execute(query)).scalars().all()
+
+    # Resolve agent registry for collaborator names
+    agent_ids_needed: set[str] = set()
+    for ev in evaluations:
+        if ev.proposal_type == "agent" and ev.thread_decision:
+            agent_ids_needed.add(ev.thread_decision.agent_a)
+            agent_ids_needed.add(ev.thread_decision.agent_b)
+
+    agent_reg_map: dict[str, AgentRegistry] = {}
+    if agent_ids_needed:
+        ar_result = await db.execute(
+            select(AgentRegistry)
+            .options(selectinload(AgentRegistry.user))
+            .where(AgentRegistry.agent_id.in_(agent_ids_needed))
+        )
+        agent_reg_map = {a.agent_id: a for a in ar_result.scalars().all()}
+
+    def _ts(dt: datetime | None) -> str | None:
+        return dt.isoformat() if dt else None
+
+    records = []
+    for ev in evaluations:
+        if ev.proposal_type == "agent" and ev.thread_decision:
+            td = ev.thread_decision
+            title = _extract_title_admin(td.summary_text) or "Collaboration Proposal"
+            collaborator_name = "Unknown"
+            collaborator_user_id = None
+            collaborator_institution = None
+            for aid in (td.agent_a, td.agent_b):
+                ar = agent_reg_map.get(aid)
+                if ar and ar.user_id != ev.user_id:
+                    if ar.user:
+                        collaborator_name = ar.user.name
+                        collaborator_user_id = str(ar.user.id)
+                        collaborator_institution = ar.user.institution
+                    else:
+                        collaborator_name = ar.pi_name or aid
+                    break
+            proposal_obj = {
+                "origin": "agent",
+                "proposal_id": str(td.id),
+                "title": title,
+                "collaborator": {
+                    "user_id": collaborator_user_id,
+                    "name": collaborator_name,
+                    "institution": collaborator_institution,
+                },
+            }
+        else:
+            mp = ev.matchmaker_proposal
+            title = mp.title if mp else "Unknown"
+            if mp:
+                if mp.pi_a_id == ev.user_id:
+                    collab_name = mp.name_b
+                    collab_uid = str(mp.pi_b_id) if mp.pi_b_id else None
+                    collab_inst = mp.pi_b.institution if mp.pi_b else None
+                else:
+                    collab_name = mp.name_a
+                    collab_uid = str(mp.pi_a_id) if mp.pi_a_id else None
+                    collab_inst = mp.pi_a.institution if mp.pi_a else None
+            else:
+                collab_name, collab_uid, collab_inst = "Unknown", None, None
+            proposal_obj = {
+                "origin": "matchmaker",
+                "proposal_id": str(mp.id) if mp else None,
+                "title": title,
+                "collaborator": {
+                    "user_id": collab_uid,
+                    "name": collab_name,
+                    "institution": collab_inst,
+                },
+            }
+
+        records.append({
+            "evaluation_id": str(ev.id),
+            "evaluated_at": _ts(ev.evaluated_at),
+            "updated_at": _ts(ev.updated_at),
+            "evaluator": {
+                "user_id": str(ev.user.id) if ev.user else str(ev.user_id),
+                "name": ev.user.name if ev.user else "Unknown",
+                "orcid": ev.user.orcid if ev.user else None,
+                "institution": ev.user.institution if ev.user else None,
+            },
+            "proposal": proposal_obj,
+            "scores": {
+                "significance": ev.score_significance,
+                "innovation": ev.score_innovation,
+                "approach": ev.score_approach,
+                "investigators": ev.score_investigators,
+                "environment": ev.score_environment,
+                "overall_impact": ev.score_overall_impact,
+            },
+            "comments": {
+                "significance": ev.comments_significance,
+                "innovation": ev.comments_innovation,
+                "approach": ev.comments_approach,
+                "investigators": ev.comments_investigators,
+                "environment": ev.comments_environment,
+                "overall": ev.comments_overall,
+            },
+        })
+
+    payload = {
+        "exported_at": datetime.now(timezone.utc).isoformat(),
+        "total_records": len(records),
+        "filters_applied": {
+            "origin": origin_filter or "all",
+            "impact_score_min": impact_min_val,
+            "impact_score_max": impact_max_val,
+            "date_from": date_from,
+            "date_to": date_to,
+        },
+        "evaluations": records,
+    }
+
+    return JSONResponse(
+        content=payload, headers={"Content-Disposition": "attachment; filename=evaluations.json"}
+    )
diff --git a/src/routers/agent_page.py b/src/routers/agent_page.py
index 1f98a69..865f271 100644
--- a/src/routers/agent_page.py
+++ b/src/routers/agent_page.py
@@ -1,6 +1,7 @@
 """My Agent page router."""
 
 import logging
+import re
 import uuid
 from pathlib import Path
 
@@ -17,6 +18,7 @@
     AgentDelegate,
     AgentMessage,
     AgentRegistry,
+    LlmCallLog,
     ProposalReview,
     ResearcherProfile,
     ThreadDecision,
@@ -35,6 +37,18 @@
 )
 
 
+def _extract_proposal_title(text: str | None) -> str:
+    """Return a display title taken from the first non-blank line of *text*, or a generic fallback."""
+    fallback = "Collaboration Proposal"
+    # Surrounding whitespace never counts as content; blank lines are skipped.
+    first = next((ln.strip() for ln in (text or "").strip().splitlines() if ln.strip()), "")
+    if first.startswith("#"):
+        # Markdown heading: drop the leading hashes; a bare "#" yields the fallback.
+        return re.sub(r"^#+\s*", "", first).strip() or fallback
+    # A plain first line is capped at 120 characters (headings are returned uncapped).
+    return first[:120] if first else fallback
+
+
 def _template_context(request: Request, user: User, **kwargs) -> dict:
     impersonated = getattr(user, "_is_impersonated", False)
     real_admin = getattr(user, "_real_admin", None)
@@ -185,7 +199,8 @@ async def agent_dashboard(
     reviewed = []
     for p in proposals:
         other = p.agent_b if p.agent_a == aid else p.agent_a
-        entry = {"proposal": p, "other_agent": other}
+        title = _extract_proposal_title(p.summary_text)
+        entry = {"proposal": p, "other_agent": other, "title": title}
         if p.id in reviewed_ids:
             rev_result = await db.execute(
                 select(ProposalReview).where(
@@ -196,6 +211,38 @@ async def agent_dashboard(
             entry["review"] = rev_result.scalar_one_or_none()
             reviewed.append(entry)
         else:
+            # Fetch discussion: one entry per actual Slack message in this thread.
+            # LlmCallLog logs every API call; tool-use chains produce multiple entries
+            # per turn with empty/partial response_text. Fix: filter blanks, then
+            # collapse consecutive same-agent entries (keep the last/fullest one).
+            disc_result = await db.execute(
+                select(LlmCallLog.agent_id, LlmCallLog.response_text, LlmCallLog.created_at)
+                .where(
+                    LlmCallLog.channel == p.channel,
+                    LlmCallLog.phase == "thread_reply",
+                    LlmCallLog.agent_id.in_([p.agent_a, p.agent_b]),
+                    LlmCallLog.created_at <= p.decided_at,
+                    func.length(LlmCallLog.response_text) > 10,
+                )
+                .order_by(LlmCallLog.created_at.asc())
+            )
+            raw_msgs = [
+                {
+                    "agent_id": r[0],
+                    "text": re.sub(r"</?slack_message>", "", r[1]).strip(),
+                    "ts": r[2].isoformat(),
+                }
+                for r in disc_result
+                if r[1] and r[1].strip()
+            ]
+            # Deduplicate consecutive same-agent entries
+            deduped: list[dict] = []
+            for msg in raw_msgs:
+                if deduped and deduped[-1]["agent_id"] == msg["agent_id"]:
+                    deduped[-1] = msg  # replace with the later, fuller response
+                else:
+                    deduped.append(msg)
+            entry["discussion"] = deduped
             unreviewed.append(entry)
 
     # Private profile path
@@ -264,6 +311,49 @@ async def agent_dashboard(
     )
 
 
+# --------------------------------------------------------------------------
+# Pause / resume agent activity (owner only)
+# --------------------------------------------------------------------------
+
+
+@router.post("/{agent_id}/pause")
+async def pause_agent(
+    agent_id: str,
+    request: Request,
+    db: AsyncSession = Depends(get_db),
+    current_user: User = Depends(get_current_user),
+):
+    """Pause an active agent for its owner (403 for anyone else) so the simulation stops selecting it."""
+    agent, is_owner = await get_agent_with_access(agent_id, db, current_user)
+    if not is_owner:
+        raise HTTPException(status_code=403, detail="Only the PI can pause their agent")
+    if agent.status == "active":
+        agent.is_paused = True
+        await db.commit()
+        logger.info("Agent %s paused by %s", agent_id, current_user.name)
+        return RedirectResponse(url=f"/agent/{agent_id}/dashboard", status_code=302)
+    return RedirectResponse(url="/agent", status_code=302)
+
+
+@router.post("/{agent_id}/resume")
+async def resume_agent(
+    agent_id: str,
+    request: Request,
+    db: AsyncSession = Depends(get_db),
+    current_user: User = Depends(get_current_user),
+):
+    """Resume a paused active agent for its owner (403 for anyone else) so the simulation may select it again."""
+    agent, is_owner = await get_agent_with_access(agent_id, db, current_user)
+    if not is_owner:
+        raise HTTPException(status_code=403, detail="Only the PI can resume their agent")
+    if agent.status == "active":
+        agent.is_paused = False
+        await db.commit()
+        logger.info("Agent %s resumed by %s", agent_id, current_user.name)
+        return RedirectResponse(url=f"/agent/{agent_id}/dashboard", status_code=302)
+    return RedirectResponse(url="/agent", status_code=302)
+
+
 def _user_slack_id_in_list(user: User, slack_ids: list[str]) -> bool:
     """Check if a user's email maps to any Slack ID in the list (heuristic)."""
     # We can't check without calling Slack API, so for now always return False
@@ -707,6 +797,116 @@ async def save_public_profile(
     )
 
 
+# --------------------------------------------------------------------------
+# Podcast settings (owner or admin)
+# --------------------------------------------------------------------------
+
+# (voice id, display label) pairs for Mistral voxtral-mini-tts-latest (verify at docs.mistral.ai/capabilities/audio/)
+MISTRAL_VOICES = [
+    ("alex", "Alex — US English, male, neutral"),
+    ("deedee", "Deedee — US English, female, bright"),
+    ("laurel", "Laurel — US English, female, clear"),
+    ("luna", "Luna — US English, female, soft"),
+    ("rio", "Rio — US English, male, energetic"),
+    ("stella", "Stella — US English, female, professional"),
+    ("theo", "Theo — US English, male, measured"),
+    ("tyler", "Tyler — US English, male, conversational"),
+]
+
+
+@router.get("/{agent_id}/podcast-settings", response_class=HTMLResponse)
+async def get_podcast_settings(
+    agent_id: str,
+    request: Request,
+    saved: bool = False,
+    db: AsyncSession = Depends(get_db),
+    current_user: User = Depends(get_current_user),
+):
+    """Render the podcast preferences page of an agent.
+
+    Agents whose status is not "active" are redirected to /agent instead.
+    """
+    from sqlalchemy import select as sa_select
+
+    from src.models.podcast_preferences import PodcastPreferences
+
+    agent, is_owner = await get_agent_with_access(agent_id, db, current_user)
+    if agent.status != "active":
+        return RedirectResponse(url="/agent", status_code=302)
+
+    # ``prefs`` stays None when no preferences row exists for this agent.
+    prefs_query = sa_select(PodcastPreferences).where(PodcastPreferences.agent_id == agent_id)
+    prefs = (await db.execute(prefs_query)).scalar_one_or_none()
+
+    from src.podcast.voice_registry import get_voices
+    voices = await get_voices()
+
+    context = _template_context(
+        request,
+        current_user,
+        agent=agent,
+        is_owner=is_owner,
+        prefs=prefs,
+        voices=voices,
+        saved=saved,
+    )
+    return templates.TemplateResponse(request, "agent/podcast_settings.html", context)
+
+
+@router.post("/{agent_id}/podcast-settings")
+async def save_podcast_settings(
+    agent_id: str,
+    request: Request,
+    podcast_enabled: str = Form(""),
+    voice_id: str = Form(""),
+    extra_keywords_raw: str = Form(""),
+    preferred_journals_raw: str = Form(""),
+    deprioritized_journals_raw: str = Form(""),
+    db: AsyncSession = Depends(get_db),
+    current_user: User = Depends(get_current_user),
+):
+    """Create or update the podcast preferences row of an active agent from the posted form.
+
+    Keywords are split on newlines only (phrases can legitimately contain commas); the two
+    journal fields also accept commas. Every list keeps at most 20 non-empty entries.
+    """
+    from sqlalchemy import select as sa_select
+
+    from src.models.podcast_preferences import PodcastPreferences
+
+    agent, is_owner = await get_agent_with_access(agent_id, db, current_user)
+    if agent.status != "active":
+        return RedirectResponse(url="/agent", status_code=302)
+
+    def _entries(lines: list[str]) -> list[str]:
+        # Trim each candidate, drop the empty ones, then cap the list at 20 items.
+        return [item for line in lines if (item := line.strip())][:20]
+
+    def _journals(raw: str) -> list[str]:
+        # Turning commas into newlines lets one splitlines() handle both separators.
+        return _entries(raw.replace(",", "\n").splitlines())
+
+    lookup = await db.execute(
+        sa_select(PodcastPreferences).where(PodcastPreferences.agent_id == agent_id)
+    )
+    prefs = lookup.scalar_one_or_none()
+    if prefs is None:
+        # Nothing stored for this agent yet: start a new row.
+        prefs = PodcastPreferences(agent_id=agent_id)
+        db.add(prefs)
+
+    # Only the literal form value "1" switches the podcast on.
+    prefs.podcast_enabled = podcast_enabled == "1"
+    prefs.voice_id = voice_id.strip() or None
+    prefs.extra_keywords = _entries(extra_keywords_raw.splitlines())
+    prefs.preferred_journals = _journals(preferred_journals_raw)
+    prefs.deprioritized_journals = _journals(deprioritized_journals_raw)
+    await db.commit()
+
+    logger.info("Podcast preferences saved for agent %s by %s", agent_id, current_user.name)
+    return RedirectResponse(url=f"/agent/{agent_id}/podcast-settings?saved=1", status_code=302)
+
+
 # --------------------------------------------------------------------------
 # Slack connection (PI only)
 # --------------------------------------------------------------------------
diff --git a/src/routers/auth.py b/src/routers/auth.py
index 39d773a..b1e983d 100644
--- a/src/routers/auth.py
+++ b/src/routers/auth.py
@@ -151,18 +151,36 @@ async def auth_callback(
         # Allowlist can promote an existing pending user to allowed
         if is_allowlisted and user.access_status != "allowed":
             user.access_status = "allowed"
+
+        # For any allowed user with no profile and no active job, recover by
+        # enqueuing a new profile generation (covers users created before this
+        # check existed, or whose earlier job was lost).
+        if user.access_status == "allowed":
             from src.models import ResearcherProfile
             profile_check = await db.execute(
                 select(ResearcherProfile.id).where(ResearcherProfile.user_id == user.id)
             )
             if profile_check.scalar_one_or_none() is None:
-                db.add(
-                    Job(
-                        type="generate_profile",
-                        user_id=user.id,
-                        payload={"user_id": str(user.id), "orcid": orcid_id},
+                job_check = await db.execute(
+                    select(Job.id).where(
+                        Job.user_id == user.id,
+                        Job.type == "generate_profile",
+                        Job.status.in_(["pending", "processing"]),
                     )
                 )
+                if job_check.scalar_one_or_none() is None:
+                    db.add(
+                        Job(
+                            type="generate_profile",
+                            user_id=user.id,
+                            payload={"user_id": str(user.id), "orcid": orcid_id},
+                        )
+                    )
+                    logger.info(
+                        "Recovering allowed user %s (%s) with no profile — enqueued job",
+                        user.id, orcid_id,
+                    )
+
         # Set claimed_at if this was a seeded profile
         if user.claimed_at is None:
             user.claimed_at = datetime.now(timezone.utc)
diff --git a/src/routers/podcast.py b/src/routers/podcast.py
new file mode 100644
index 0000000..091202c
--- /dev/null
+++ b/src/routers/podcast.py
@@ -0,0 +1,438 @@
+"""Podcast RSS feed, audio serving, settings, and on-demand generation endpoints.
+
+Two delivery paths:
+  Agent path  — pilot-lab agents with an approved AgentRegistry entry.
+                URLs are keyed by agent_id string.
+                Endpoints: /podcast/{agent_id}/...
+
+  User path   — any user who has completed ORCID onboarding and has a
+                ResearcherProfile with a research_summary.
+                URLs are keyed by user_id UUID (opaque, stable, subscribable).
+                Endpoints: /podcast/users/{user_id}/...  (public RSS + audio)
+                           /podcast/settings             (auth-gated settings UI)
+                           /podcast/user/generate        (auth-gated on-demand trigger)
+"""
+
+import asyncio
+import logging
+import uuid as _uuid
+from pathlib import Path
+
+from fastapi import APIRouter, Depends, Form, HTTPException, Request
+from fastapi.responses import FileResponse, HTMLResponse, RedirectResponse, Response
+from fastapi.templating import Jinja2Templates
+from sqlalchemy import select
+from sqlalchemy.ext.asyncio import AsyncSession
+
+from src.config import get_settings
+from src.database import get_db, get_session_factory
+from src.dependencies import get_current_user
+from src.models.agent_registry import AgentRegistry
+from src.models.podcast import PodcastEpisode
+from src.models.user import User
+from src.podcast.rss import build_feed
+
+logger = logging.getLogger(__name__)
+router = APIRouter()
+templates = Jinja2Templates(directory="templates")
+
+AUDIO_DIR = Path("data/podcast_audio")
+
+
+
+# ---------------------------------------------------------------------------
+# User path — plain ORCID users (registered before agent path to prevent
+# /user/generate and /users/... from being shadowed by /{agent_id}/...)
+# ---------------------------------------------------------------------------
+
+@router.get("/users/{user_id}/feed.xml", response_class=Response)
+async def podcast_feed_for_user(
+    user_id: str,
+    db: AsyncSession = Depends(get_db),
+):
+    """Public RSS 2.0 feed for a plain ORCID user's daily research briefings.
+
+    ``user_id`` is the User primary key (an opaque, stable token); no authentication is
+    required. Responds 400 if it is not a UUID and 404 if no such user exists.
+    """
+    try:
+        uid = _uuid.UUID(user_id)
+    except ValueError:
+        raise HTTPException(status_code=400, detail="Invalid user ID format") from None
+
+    user_result = await db.execute(select(User).where(User.id == uid))
+    user = user_result.scalar_one_or_none()
+    if not user:
+        raise HTTPException(status_code=404, detail="User not found")
+
+    # User-keyed episodes
+    user_eps_result = await db.execute(
+        select(PodcastEpisode)
+        .where(PodcastEpisode.user_id == uid)
+        .order_by(PodcastEpisode.episode_date.desc())
+        .limit(30)
+    )
+    user_episodes = user_eps_result.scalars().all()
+
+    # Also pull episodes from a linked active agent (scheduler delivers there
+    # when the user has an AgentRegistry entry, leaving user-keyed episodes empty).
+    agent_result = await db.execute(
+        select(AgentRegistry)
+        .where(AgentRegistry.user_id == uid, AgentRegistry.status == "active")
+        .limit(1)
+    )
+    linked_agent = agent_result.scalar_one_or_none()
+    agent_episodes = []
+    if linked_agent:
+        agent_eps_result = await db.execute(
+            select(PodcastEpisode)
+            .where(PodcastEpisode.agent_id == linked_agent.agent_id)
+            .order_by(PodcastEpisode.episode_date.desc())
+            .limit(30)
+        )
+        agent_episodes = agent_eps_result.scalars().all()
+
+    # Merge by date — user-keyed episode takes precedence if both exist for the same day.
+    by_date: dict = {ep.episode_date: ep for ep in agent_episodes}
+    by_date.update({ep.episode_date: ep for ep in user_episodes})
+    episodes = sorted(by_date.values(), key=lambda e: e.episode_date, reverse=True)[:30]
+
+    settings = get_settings()
+    base_url = settings.podcast_base_url or settings.base_url
+    # UUID() also accepts upper-case, braced and urn: spellings; hand the feed builder the canonical form.
+    xml = build_feed(
+        pi_name=user.name,
+        episodes=episodes,
+        base_url=base_url,
+        user_id=str(uid),
+    )
+    return Response(content=xml, media_type="application/rss+xml; charset=utf-8")
+
+
+@router.get("/users/{user_id}/audio/{date}.mp3")
+async def podcast_audio_for_user(user_id: str, date: str):
+    """Serve a user's MP3 briefing for ``date`` (digits and dashes only); 400 on bad input, 404 if no file."""
+    if "/" in date or ".." in date or not date.replace("-", "").isdigit():
+        raise HTTPException(status_code=400, detail="Invalid date format")
+    try:
+        uid = _uuid.UUID(user_id)
+    except ValueError:
+        raise HTTPException(status_code=400, detail="Invalid user ID format") from None
+    # Canonical UUID text as directory name — presumably how the audio is stored; verify against the writer.
+    audio_path = AUDIO_DIR / "users" / str(uid) / f"{date}.mp3"
+    if not audio_path.is_file():
+        raise HTTPException(status_code=404, detail="Audio file not found")
+
+    return FileResponse(
+        path=str(audio_path),
+        media_type="audio/mpeg",
+        filename=f"briefing-{date}.mp3",
+    )
+
+
+def _podcast_eligible(user: User) -> bool:
+    """Return True if a plain user is eligible for the podcast feature (always a real bool, never a falsy operand)."""
+    return bool(
+        user.onboarding_complete
+        and getattr(user, "profile", None) is not None
+        and getattr(user.profile, "research_summary", None)
+    )
+
+
+@router.get("/settings", response_class=HTMLResponse)
+async def get_podcast_settings_user(
+    request: Request,
+    saved: bool = False,
+    db: AsyncSession = Depends(get_db),
+    current_user: User = Depends(get_current_user),
+):
+    """Render the podcast settings page for the signed-in user (no agent required).
+
+    Users that fail ``_podcast_eligible`` are redirected to /profile?podcast_incomplete=1.
+    """
+    from sqlalchemy.orm import selectinload
+
+    from src.models.podcast_preferences import PodcastPreferences
+
+    me = current_user.id
+
+    # Re-read the user with ``profile`` eagerly loaded; keep ``current_user`` if no row comes back.
+    user_query = (
+        select(User)
+        .options(selectinload(User.profile))
+        .where(User.id == me)
+    )
+    user = (await db.execute(user_query)).scalar_one_or_none() or current_user
+    if not _podcast_eligible(user):
+        return RedirectResponse(url="/profile?podcast_incomplete=1", status_code=302)
+
+    prefs_query = select(PodcastPreferences).where(PodcastPreferences.user_id == me)
+    prefs = (await db.execute(prefs_query)).scalar_one_or_none()
+
+    # Up to five of this user's newest episodes that have an audio file path recorded.
+    episodes_query = (
+        select(PodcastEpisode)
+        .where(PodcastEpisode.user_id == me, PodcastEpisode.audio_file_path.is_not(None))
+        .order_by(PodcastEpisode.episode_date.desc())
+        .limit(5)
+    )
+    recent_episodes = (await db.execute(episodes_query)).scalars().all()
+
+    from src.podcast.voice_registry import get_voices
+
+    voices = await get_voices()
+
+    context = {
+        "request": request,
+        "current_user": current_user,
+        "active_page": "podcast",
+        "prefs": prefs,
+        "voices": voices,
+        "saved": saved,
+        "feed_path": f"/podcast/users/{me}/feed.xml",
+        "podcast_enabled": prefs.podcast_enabled if prefs else False,
+        "recent_episodes": recent_episodes,
+    }
+    return templates.TemplateResponse(
+        request,
+        "podcast_settings.html",
+        context,
+    )
+
+
+# Strong references to in-flight user pipeline tasks.  asyncio only keeps weak
+# references to tasks, so an unreferenced task may be garbage-collected before
+# it finishes; each task removes itself from the set once it is done.
+_user_pipeline_tasks: set = set()
+
+
+def _spawn_user_pipeline(user_id) -> None:
+    """Schedule the user podcast pipeline and hold the task until it completes."""
+    task = asyncio.create_task(_run_user_pipeline_background(user_id))
+    _user_pipeline_tasks.add(task)
+    task.add_done_callback(_user_pipeline_tasks.discard)
+
+
+@router.post("/settings")
+async def save_podcast_settings_user(
+    request: Request,
+    podcast_enabled: str = Form(""),
+    voice_id: str = Form(""),
+    extra_keywords_raw: str = Form(""),
+    preferred_journals_raw: str = Form(""),
+    deprioritized_journals_raw: str = Form(""),
+    db: AsyncSession = Depends(get_db),
+    current_user: User = Depends(get_current_user),
+):
+    """Save podcast preferences for a plain ORCID user.
+
+    Creates the preferences row on first save.  ``podcast_enabled`` is stored
+    as True only when the form value is exactly ``"1"``.  When the podcast goes
+    from disabled to enabled, generation is started in the background.
+    Redirects to ``/podcast/settings?saved=1`` afterwards.
+
+    Raises:
+        HTTPException: 403 when the user fails ``_podcast_eligible``.
+    """
+    from sqlalchemy.orm import selectinload
+
+    from src.models.podcast_preferences import PodcastPreferences
+
+    # Re-read the user with the profile eagerly loaded for the eligibility check.
+    user_result = await db.execute(
+        select(User)
+        .options(selectinload(User.profile))
+        .where(User.id == current_user.id)
+    )
+    user = user_result.scalar_one_or_none() or current_user
+
+    if not _podcast_eligible(user):
+        raise HTTPException(status_code=403, detail="Complete your profile before setting podcast preferences.")
+
+    def _parse_keywords(raw: str) -> list[str]:
+        # One keyword per line; blanks dropped; capped at 20 entries.
+        return [v for line in raw.splitlines() if (v := line.strip())][:20]
+
+    def _parse_journals(raw: str) -> list[str]:
+        # Journals may be separated by commas or newlines; capped at 20 entries.
+        return [v for part in raw.replace(",", "\n").splitlines() if (v := part.strip())][:20]
+
+    prefs_result = await db.execute(
+        select(PodcastPreferences).where(PodcastPreferences.user_id == current_user.id)
+    )
+    prefs = prefs_result.scalar_one_or_none()
+
+    # Capture the previous state before the row is mutated below.
+    was_enabled = prefs.podcast_enabled if prefs is not None else False
+
+    if prefs is None:
+        prefs = PodcastPreferences(user_id=current_user.id, agent_id=None)
+        db.add(prefs)
+
+    now_enabled = podcast_enabled == "1"
+    newly_enabled = (not was_enabled) and now_enabled
+
+    prefs.podcast_enabled = now_enabled
+    prefs.voice_id = voice_id.strip() or None
+    prefs.extra_keywords = _parse_keywords(extra_keywords_raw)
+    prefs.preferred_journals = _parse_journals(preferred_journals_raw)
+    prefs.deprioritized_journals = _parse_journals(deprioritized_journals_raw)
+    await db.commit()
+
+    if newly_enabled:
+        logger.info("Podcast enabled for user %s — triggering immediate generation", current_user.id)
+        _spawn_user_pipeline(current_user.id)
+
+    logger.info("Podcast preferences saved for user %s", current_user.id)
+    return RedirectResponse(url="/podcast/settings?saved=1", status_code=302)
+
+
+async def _run_user_pipeline_background(user_id) -> None:
+    """Run the user podcast pipeline in a background task with its own DB session.
+
+    Skips (with an info log) when an episode dated ``date.today()`` already
+    exists for the user.  Any exception is logged and swallowed so a failure
+    never escapes the background task.
+
+    NOTE(review): the existence check and the pipeline run are not atomic, so
+    two concurrent calls can both pass the check — confirm the pipeline itself
+    tolerates that.
+    """
+    from datetime import date
+
+    from src.models.podcast import PodcastEpisode
+    from src.podcast.pipeline import run_podcast_for_user
+
+    session_factory = get_session_factory()
+    try:
+        async with session_factory() as db:
+            today = date.today()
+            existing = await db.execute(
+                select(PodcastEpisode).where(
+                    PodcastEpisode.user_id == user_id,
+                    PodcastEpisode.episode_date == today,
+                )
+            )
+            if existing.scalar_one_or_none() is not None:
+                logger.info("User %s already has today's episode — skipping background run", user_id)
+                return
+            ok = await run_podcast_for_user(user_id=user_id, db_session=db)
+            await db.commit()
+            logger.info("On-demand podcast pipeline for user %s: %s", user_id, "produced" if ok else "no episode")
+    except Exception as exc:
+        logger.error("On-demand podcast pipeline failed for user %s: %s", user_id, exc, exc_info=True)
+
+
+@router.post("/user/generate")
+async def podcast_generate_for_user(
+    db: AsyncSession = Depends(get_db),
+    current_user: User = Depends(get_current_user),
+):
+    """Trigger on-demand podcast generation for the current user (returns immediately).
+
+    Raises:
+        HTTPException: 403 when the user fails ``_podcast_eligible`` or has no
+            preferences row with the podcast enabled.
+    """
+    from sqlalchemy.orm import selectinload
+
+    from src.models.podcast_preferences import PodcastPreferences
+
+    user_result = await db.execute(
+        select(User)
+        .options(selectinload(User.profile))
+        .where(User.id == current_user.id)
+    )
+    user = user_result.scalar_one_or_none() or current_user
+
+    if not _podcast_eligible(user):
+        raise HTTPException(status_code=403, detail="Complete your profile before generating a podcast.")
+
+    prefs_result = await db.execute(
+        select(PodcastPreferences).where(PodcastPreferences.user_id == current_user.id)
+    )
+    prefs = prefs_result.scalar_one_or_none()
+    if not prefs or not prefs.podcast_enabled:
+        raise HTTPException(status_code=403, detail="Enable the podcast in your settings before generating an episode.")
+
+    _spawn_user_pipeline(current_user.id)
+
+    return {
+        "status": "started",
+        "user_id": str(current_user.id),
+        "message": "Podcast pipeline started. Check your feed URL shortly.",
+    }
+
+
+# ---------------------------------------------------------------------------
+# Agent path — existing endpoints
+# ---------------------------------------------------------------------------
+
+@router.get("/{agent_id}/feed.xml", response_class=Response)
+async def podcast_feed(
+    agent_id: str,
+    db: AsyncSession = Depends(get_db),
+):
+    """Serve the RSS podcast feed of a pilot-lab agent's daily research briefings.
+
+    Responds 404 when no agent is registered under ``agent_id``; otherwise the
+    feed is built from that agent's 30 most recent episodes, newest first.
+    """
+    agent_stmt = select(AgentRegistry).where(AgentRegistry.agent_id == agent_id)
+    agent = (await db.execute(agent_stmt)).scalar_one_or_none()
+    if not agent:
+        raise HTTPException(status_code=404, detail="Agent not found")
+
+    latest_stmt = (
+        select(PodcastEpisode)
+        .where(PodcastEpisode.agent_id == agent_id)
+        .order_by(PodcastEpisode.episode_date.desc())
+        .limit(30)
+    )
+    episodes = (await db.execute(latest_stmt)).scalars().all()
+
+    cfg = get_settings()
+    feed_xml = build_feed(
+        pi_name=agent.pi_name,
+        episodes=episodes,
+        # A configured podcast base URL takes precedence over the site base URL.
+        base_url=cfg.podcast_base_url or cfg.base_url,
+        agent_id=agent_id,
+    )
+    return Response(content=feed_xml, media_type="application/rss+xml; charset=utf-8")
+
+
+@router.get("/{agent_id}/audio/{date}.mp3")
+async def podcast_audio(agent_id: str, date: str):
+    """Stream a podcast audio file for an agent.
+
+    Both path parameters are interpolated into a filesystem path under
+    ``AUDIO_DIR``, so each is validated before use.
+
+    Raises:
+        HTTPException: 400 when ``date`` is not made of digits and hyphens,
+            400 when ``agent_id`` is ``.`` or contains ``..`` or a path
+            separator, 404 when the audio file does not exist.
+    """
+    if "/" in date or ".." in date or not date.replace("-", "").isdigit():
+        raise HTTPException(status_code=400, detail="Invalid date format")
+
+    # Without this check an agent_id of ".." would resolve outside AUDIO_DIR.
+    if agent_id == "." or ".." in agent_id or "/" in agent_id or "\\" in agent_id:
+        raise HTTPException(status_code=400, detail="Invalid agent ID format")
+
+    audio_path = AUDIO_DIR / agent_id / f"{date}.mp3"
+    if not audio_path.exists():
+        raise HTTPException(status_code=404, detail="Audio file not found")
+
+    return FileResponse(
+        path=str(audio_path),
+        media_type="audio/mpeg",
+        filename=f"{agent_id}-{date}.mp3",
+    )
+
+
+async def _run_pipeline_background(
+    agent_id: str, bot_name: str, pi_name: str, bot_token: str, slack_user_id: str | None
+) -> None:
+    """Execute the agent podcast pipeline on a dedicated DB session.
+
+    Meant to be scheduled as a background task: the session is created here,
+    committed after the pipeline returns, and every exception is logged rather
+    than propagated.
+    """
+    from src.podcast.pipeline import run_pipeline_for_agent
+
+    make_session = get_session_factory()
+    try:
+        async with make_session() as session:
+            pipeline_args = {
+                "agent_id": agent_id,
+                "bot_name": bot_name,
+                "pi_name": pi_name,
+                "bot_token": bot_token,
+                "slack_user_id": slack_user_id,
+                "db_session": session,
+            }
+            produced = await run_pipeline_for_agent(**pipeline_args)
+            await session.commit()
+            outcome = "produced" if produced else "no episode"
+            logger.info("On-demand podcast pipeline for %s: %s", agent_id, outcome)
+    except Exception as exc:
+        logger.error("On-demand podcast pipeline failed for %s: %s", agent_id, exc, exc_info=True)
+
+
+# Strong references to in-flight agent pipeline tasks.  asyncio only keeps weak
+# references to tasks, so an unreferenced task may be garbage-collected before
+# it finishes; each task removes itself from the set once it is done.
+_agent_pipeline_tasks: set = set()
+
+
+@router.api_route("/{agent_id}/generate", methods=["GET", "POST"])
+async def podcast_generate(
+    agent_id: str,
+    db: AsyncSession = Depends(get_db),
+):
+    """Trigger on-demand podcast generation for an agent (returns immediately).
+
+    The bot token stored on the agent row is preferred; otherwise the token
+    configured for ``agent_id`` in settings is used, falling back to an empty
+    string when neither exists.
+
+    Raises:
+        HTTPException: 404 when no agent is registered under ``agent_id``.
+    """
+    agent_result = await db.execute(
+        select(AgentRegistry).where(AgentRegistry.agent_id == agent_id)
+    )
+    agent = agent_result.scalar_one_or_none()
+    if not agent:
+        raise HTTPException(status_code=404, detail="Agent not found")
+
+    settings = get_settings()
+    slack_tokens = settings.get_slack_tokens()
+    bot_token = agent.slack_bot_token or slack_tokens.get(agent_id, {}).get("bot", "")
+
+    task = asyncio.create_task(
+        _run_pipeline_background(
+            agent_id=agent_id,
+            bot_name=agent.bot_name,
+            pi_name=agent.pi_name,
+            bot_token=bot_token,
+            slack_user_id=agent.slack_user_id,
+        )
+    )
+    # Keep the task referenced until it finishes so it cannot be collected early.
+    _agent_pipeline_tasks.add(task)
+    task.add_done_callback(_agent_pipeline_tasks.discard)
+
+    return {
+        "status": "started",
+        "agent_id": agent_id,
+        "message": f"Podcast pipeline started for {agent.pi_name}. Check the RSS feed shortly.",
+    }
+
diff --git a/src/routers/profile.py b/src/routers/profile.py
index 2893856..50baea4 100644
--- a/src/routers/profile.py
+++ b/src/routers/profile.py
@@ -39,6 +39,7 @@ def _parse_list(val: str) -> list[str]:
 async def profile_view(
     request: Request,
     onboarding_complete: bool = False,
+    podcast_incomplete: bool = False,
     db: AsyncSession = Depends(get_db),
     current_user: User = Depends(get_current_user),
 ):
@@ -69,6 +70,7 @@ async def profile_view(
             publications=publications,
             pending_profile=profile.pending_profile if profile else None,
             just_completed_onboarding=onboarding_complete,
+            podcast_incomplete=podcast_incomplete,
         ),
     )
 
diff --git a/src/routers/proposals.py b/src/routers/proposals.py
new file mode 100644
index 0000000..6e72713
--- /dev/null
+++ b/src/routers/proposals.py
@@ -0,0 +1,748 @@
+"""Proposals router — unified PI evaluation of collaboration proposals."""
+
+import base64
+import json
+import logging
+import re
+import uuid
+from datetime import datetime, timezone
+
+from fastapi import APIRouter, Depends, Form, HTTPException, Request
+from fastapi.responses import HTMLResponse, RedirectResponse
+from fastapi.templating import Jinja2Templates
+from sqlalchemy import select
+from sqlalchemy.ext.asyncio import AsyncSession
+from sqlalchemy.orm import selectinload
+
+from src.database import get_db
+from src.dependencies import get_current_user
+from src.models import (
+    AgentRegistry,
+    MatchmakerProposal,
+    PiProposalEvaluation,
+    ThreadDecision,
+    User,
+)
+
+logger = logging.getLogger(__name__)
+router = APIRouter()
+templates = Jinja2Templates(directory="templates")
+
+# NIH score descriptor labels — shown in templates.
+# Keys are the integer scores 1–9; 1 carries the strongest label ("Exceptional")
+# and 9 the weakest ("Poor").
+SCORE_DESCRIPTORS = {
+    1: "Exceptional",
+    2: "Outstanding",
+    3: "Excellent",
+    4: "Very Good",
+    5: "Good",
+    6: "Satisfactory",
+    7: "Fair",
+    8: "Marginal",
+    9: "Poor",
+}
+
+
+# ---------------------------------------------------------------------------
+# Token encoding / decoding — hides proposal origin from the URL
+# ---------------------------------------------------------------------------
+
+
+def _encode_token(proposal_type: str, proposal_id: uuid.UUID) -> str:
+    """Build the opaque URL token for a proposal.
+
+    The token is the unpadded URL-safe base64 of ``"<prefix>_<uuid hex>"``,
+    where the prefix is ``"a"`` when ``proposal_type`` is ``"agent"`` and
+    ``"m"`` for every other value.
+    """
+    if proposal_type == "agent":
+        prefix = "a"
+    else:
+        prefix = "m"
+    payload = (prefix + "_" + proposal_id.hex).encode()
+    encoded = base64.urlsafe_b64encode(payload).decode()
+    return encoded.rstrip("=")
+
+
+def _decode_token(token: str) -> tuple[str, uuid.UUID]:
+    """Recover ``(proposal_type, proposal_id)`` from a proposal token.
+
+    The token is re-padded to a multiple of four characters, URL-safe base64
+    decoded and split at the first underscore into a prefix (``"a"`` for
+    agent, ``"m"`` for matchmaker) and the UUID hex.
+
+    Raises:
+        ValueError: for any token that cannot be decoded this way.
+    """
+    missing_padding = -len(token) % 4
+    padded = token + "=" * missing_padding
+    try:
+        decoded = base64.urlsafe_b64decode(padded.encode()).decode()
+        prefix, hex_id = decoded.split("_", 1)
+        kinds = {"a": "agent", "m": "matchmaker"}
+        if prefix not in kinds:
+            raise ValueError("Unknown prefix")
+        return kinds[prefix], uuid.UUID(hex=hex_id)
+    except Exception as exc:
+        # ValueErrors pass through unchanged; anything else is normalised.
+        if isinstance(exc, ValueError):
+            raise
+        raise ValueError("Invalid proposal token")
+
+
+def _encode_group_token(tokens: list[str]) -> str:
+    """Pack an ordered list of proposal tokens into one URL-safe group token.
+
+    The list is serialised as JSON and URL-safe base64 encoded, with the
+    trailing ``=`` padding removed.
+    """
+    payload = json.dumps(tokens).encode()
+    encoded = base64.urlsafe_b64encode(payload).decode()
+    return encoded.rstrip("=")
+
+
+def _decode_group_token(group_token: str) -> list[str]:
+    """Decode a group token back into its ordered list of proposal tokens.
+
+    The token is re-padded, URL-safe base64 decoded and parsed as JSON.  The
+    payload must be a JSON array of strings; any other shape (a number, an
+    object, a list with non-string items) is rejected, so callers can safely
+    index the result and pass each element on as a proposal token.
+
+    Raises:
+        ValueError: if the token is not valid base64/JSON or has the wrong shape.
+    """
+    padded = group_token + "=" * (-len(group_token) % 4)
+    try:
+        tokens = json.loads(base64.urlsafe_b64decode(padded.encode()))
+    except Exception:
+        raise ValueError("Invalid group token") from None
+    # The token comes from the URL, so valid JSON can still be the wrong type.
+    if not isinstance(tokens, list) or not all(isinstance(t, str) for t in tokens):
+        raise ValueError("Invalid group token")
+    return tokens
+
+
+def _extract_title(text: str | None) -> str | None:
+    """Derive a short title from the first non-blank line of ``text``.
+
+    A line starting with ``#`` is treated as a heading: the leading ``#`` run
+    is removed and the remainder returned, or ``None`` if nothing remains.
+    Any other line is returned truncated to 120 characters.  ``None`` is
+    returned for empty or all-blank input.
+    """
+    if not text:
+        return None
+    stripped_lines = (raw.strip() for raw in text.strip().splitlines())
+    first = next((ln for ln in stripped_lines if ln), None)
+    if first is None:
+        return None
+    if first.startswith("#"):
+        heading = re.sub(r"^#+\s*", "", first).strip()
+        return heading or None
+    return first[:120]
+
+
+def _template_context(request: Request, user: User, **kwargs) -> dict:
+    """Assemble the template context shared by every proposals page.
+
+    The base entries are the request, the current user, the active navigation
+    page and the score descriptor table; ``kwargs`` are merged on top and
+    override a base entry with the same key.
+    """
+    return {
+        "request": request,
+        "current_user": user,
+        "active_page": "proposals",
+        "score_descriptors": SCORE_DESCRIPTORS,
+        **kwargs,
+    }
+
+
+# ---------------------------------------------------------------------------
+# Proposal list
+# ---------------------------------------------------------------------------
+
+
+@router.get("", response_class=HTMLResponse)
+async def proposals_list(
+    request: Request,
+    db: AsyncSession = Depends(get_db),
+    current_user: User = Depends(get_current_user),
+):
+    """Unified list of all collaboration proposals involving the current user.
+
+    Collects agent proposals (``ThreadDecision`` rows with outcome
+    ``"proposal"``) and matchmaker proposals, marks which ones the user has
+    already evaluated, and groups them by collaborator name.  Each group
+    carries a group token encoding its sorted proposal tokens.
+
+    Users whose ``access_status`` is not ``"allowed"`` are redirected to
+    ``/access-pending``.  A ``success`` query parameter shows a flash message.
+    """
+    if current_user.access_status != "allowed":
+        return RedirectResponse(url="/access-pending", status_code=302)
+
+    success = request.query_params.get("success")
+
+    # 1. Find the user's agents (any status — needed for name resolution)
+    agent_result = await db.execute(
+        select(AgentRegistry).where(AgentRegistry.user_id == current_user.id)
+    )
+    user_agents = agent_result.scalars().all()
+    # Only active agents are used to look up agent proposals.
+    user_agent_ids = {a.agent_id for a in user_agents if a.status == "active"}
+
+    # Names this user is known by in CLI-generated matchmaker proposals
+    match_names: set[str] = {current_user.name}
+    for a in user_agents:
+        match_names.add(a.pi_name)
+
+    # 2. Agent proposals involving any of this user's agents
+    agent_proposals: list[ThreadDecision] = []
+    if user_agent_ids:
+        ap_result = await db.execute(
+            select(ThreadDecision).where(
+                ThreadDecision.outcome == "proposal",
+                ThreadDecision.hidden == False,
+                (ThreadDecision.agent_a.in_(user_agent_ids))
+                | (ThreadDecision.agent_b.in_(user_agent_ids)),
+            )
+        )
+        agent_proposals = ap_result.scalars().all()
+
+    # 3. Matchmaker proposals where this user is PI A or PI B
+    #    Matches FK (web-UI path) or name (CLI path — pi_a_id/pi_b_id are NULL)
+    mp_result = await db.execute(
+        select(MatchmakerProposal)
+        .options(selectinload(MatchmakerProposal.pi_a), selectinload(MatchmakerProposal.pi_b))
+        .where(
+            MatchmakerProposal.hidden == False,
+            (MatchmakerProposal.pi_a_id == current_user.id)
+            | (MatchmakerProposal.pi_b_id == current_user.id)
+            | (MatchmakerProposal.pi_a_name.in_(match_names))
+            | (MatchmakerProposal.pi_b_name.in_(match_names))
+        )
+    )
+    matchmaker_proposals = mp_result.scalars().all()
+
+    # 4. Existing evaluations for this user
+    #    Only the referenced proposal ids are fetched, one set per proposal kind.
+    td_eval_result = await db.execute(
+        select(PiProposalEvaluation.thread_decision_id).where(
+            PiProposalEvaluation.user_id == current_user.id,
+            PiProposalEvaluation.thread_decision_id.isnot(None),
+        )
+    )
+    evaluated_thread_ids = {r[0] for r in td_eval_result}
+
+    mm_eval_result = await db.execute(
+        select(PiProposalEvaluation.matchmaker_proposal_id).where(
+            PiProposalEvaluation.user_id == current_user.id,
+            PiProposalEvaluation.matchmaker_proposal_id.isnot(None),
+        )
+    )
+    evaluated_mm_ids = {r[0] for r in mm_eval_result}
+
+    # 5. Resolve collaborator names for agent proposals
+    all_agent_ids: set[str] = set()
+    for p in agent_proposals:
+        all_agent_ids.add(p.agent_a)
+        all_agent_ids.add(p.agent_b)
+
+    agent_reg_map: dict[str, AgentRegistry] = {}
+    if all_agent_ids:
+        ar_result = await db.execute(
+            select(AgentRegistry)
+            .options(selectinload(AgentRegistry.user))
+            .where(AgentRegistry.agent_id.in_(all_agent_ids))
+        )
+        agent_reg_map = {a.agent_id: a for a in ar_result.scalars().all()}
+
+    # Build user_id → AgentRegistry map for matchmaker collaborator profile links
+    mm_collab_user_ids = {
+        uid
+        for p in matchmaker_proposals
+        for uid in (p.pi_a_id, p.pi_b_id)
+        if uid is not None
+    }
+    user_to_agent_map: dict = {}
+    if mm_collab_user_ids:
+        ua_result = await db.execute(
+            select(AgentRegistry).where(AgentRegistry.user_id.in_(mm_collab_user_ids))
+        )
+        # If a user has several agents, the last row returned wins.
+        user_to_agent_map = {a.user_id: a for a in ua_result.scalars().all()}
+
+    # 6. Build flat items list
+    flat_items: list[dict] = []
+
+    for p in agent_proposals:
+        # The collaborator is whichever side of the thread is not the user's agent.
+        other_id = p.agent_b if p.agent_a in user_agent_ids else p.agent_a
+        other_ar = agent_reg_map.get(other_id)
+        # Name preference: linked user's name, then the agent's pi_name, then the raw id.
+        if other_ar and other_ar.user:
+            collaborator = other_ar.user.name
+        elif other_ar:
+            collaborator = other_ar.pi_name or other_id
+        else:
+            collaborator = other_id
+
+        flat_items.append(
+            {
+                "token": _encode_token("agent", p.id),
+                "title": _extract_title(p.summary_text) or "Collaboration Proposal",
+                "collaborator": collaborator,
+                "collaborator_agent_id": other_ar.agent_id if other_ar else None,
+                "has_evaluation": p.id in evaluated_thread_ids,
+            }
+        )
+
+    for p in matchmaker_proposals:
+        # The user is PI A when matched by FK or by any of their known names.
+        is_pi_a = (p.pi_a_id == current_user.id) or (p.pi_a_name in match_names)
+        collaborator = p.name_b if is_pi_a else p.name_a
+        collab_user_id = p.pi_b_id if is_pi_a else p.pi_a_id
+        collab_ar = user_to_agent_map.get(collab_user_id) if collab_user_id else None
+        flat_items.append(
+            {
+                "token": _encode_token("matchmaker", p.id),
+                "title": p.title,
+                "collaborator": collaborator,
+                "collaborator_agent_id": collab_ar.agent_id if collab_ar else None,
+                "has_evaluation": p.id in evaluated_mm_ids,
+            }
+        )
+
+    # 7. Group by collaborator
+    groups_dict: dict[str, dict] = {}
+    for item in flat_items:
+        collab = item["collaborator"]
+        if collab not in groups_dict:
+            groups_dict[collab] = {
+                "tokens": [],
+                "evaluated_count": 0,
+                "total": 0,
+                "collaborator_agent_id": item.get("collaborator_agent_id"),
+            }
+        elif not groups_dict[collab]["collaborator_agent_id"]:
+            # Back-fill the agent id from a later item if the first one had none.
+            groups_dict[collab]["collaborator_agent_id"] = item.get("collaborator_agent_id")
+        groups_dict[collab]["tokens"].append(item["token"])
+        groups_dict[collab]["total"] += 1
+        if item["has_evaluation"]:
+            groups_dict[collab]["evaluated_count"] += 1
+
+    # Stable token order within each group; sort groups by collaborator name
+    groups = []
+    for collab, g in sorted(groups_dict.items()):
+        g["tokens"].sort()
+        groups.append(
+            {
+                "collaborator": collab,
+                "collaborator_agent_id": g["collaborator_agent_id"],
+                "total": g["total"],
+                "evaluated_count": g["evaluated_count"],
+                "group_token": _encode_group_token(g["tokens"]),
+                "all_evaluated": g["evaluated_count"] == g["total"],
+            }
+        )
+
+    return templates.TemplateResponse(
+        request,
+        "proposals/list.html",
+        _template_context(
+            request,
+            current_user,
+            groups=groups,
+            flash_message="Evaluation submitted." if success else None,
+            flash_type="success" if success else None,
+        ),
+    )
+
+
+# ---------------------------------------------------------------------------
+# Evaluation form — GET
+# ---------------------------------------------------------------------------
+
+
+@router.get("/{token}/evaluate", response_class=HTMLResponse)
+async def evaluate_form(
+    token: str,
+    request: Request,
+    db: AsyncSession = Depends(get_db),
+    current_user: User = Depends(get_current_user),
+):
+    """Render the evaluation form for one proposal, pre-filled when possible.
+
+    Users whose ``access_status`` is not ``"allowed"`` are redirected to
+    ``/access-pending``.  An undecodable token yields 404; loading the proposal
+    may itself raise 404 or 403.  The user's existing evaluation of the
+    proposal, if any, is passed to the template as ``evaluation``.
+    """
+    if current_user.access_status != "allowed":
+        return RedirectResponse(url="/access-pending", status_code=302)
+
+    try:
+        proposal_type, proposal_id = _decode_token(token)
+    except ValueError:
+        raise HTTPException(status_code=404, detail="Proposal not found")
+
+    title, collaborator, body_md = await _load_proposal_display(
+        proposal_type, proposal_id, current_user, db
+    )
+
+    # The evaluation row references the proposal through a type-specific column.
+    target_column = (
+        PiProposalEvaluation.thread_decision_id
+        if proposal_type == "agent"
+        else PiProposalEvaluation.matchmaker_proposal_id
+    )
+    lookup = select(PiProposalEvaluation).where(
+        PiProposalEvaluation.user_id == current_user.id,
+        target_column == proposal_id,
+    )
+    existing = (await db.execute(lookup)).scalar_one_or_none()
+
+    context = _template_context(
+        request,
+        current_user,
+        token=token,
+        title=title,
+        collaborator=collaborator,
+        body_md=body_md,
+        evaluation=existing,
+    )
+    return templates.TemplateResponse(request, "proposals/evaluate.html", context)
+
+
+# ---------------------------------------------------------------------------
+# Evaluation form — POST (upsert)
+# ---------------------------------------------------------------------------
+
+
+@router.post("/{token}/evaluate")
+async def evaluate_submit(
+    token: str,
+    request: Request,
+    score_overall_impact: int = Form(...),
+    comments_overall: str = Form(""),
+    # Criterion scores are optional — hidden from the PI form but preserved in DB
+    score_significance: int | None = Form(None),
+    score_innovation: int | None = Form(None),
+    score_approach: int | None = Form(None),
+    score_investigators: int | None = Form(None),
+    score_environment: int | None = Form(None),
+    comments_significance: str = Form(""),
+    comments_innovation: str = Form(""),
+    comments_approach: str = Form(""),
+    comments_investigators: str = Form(""),
+    comments_environment: str = Form(""),
+    db: AsyncSession = Depends(get_db),
+    current_user: User = Depends(get_current_user),
+):
+    """Create or update the current user's evaluation of one proposal.
+
+    The overall impact score is required and every supplied score must lie in
+    1–9 (400 otherwise).  Blank criterion comments are stored as ``None``; the
+    overall comment is stored stripped.  An undecodable token yields 404 and
+    the access check may raise 404 or 403.  Redirects to
+    ``/proposals?success=1`` once the row is committed.
+    """
+    if current_user.access_status != "allowed":
+        return RedirectResponse(url="/access-pending", status_code=302)
+
+    try:
+        proposal_type, proposal_id = _decode_token(token)
+    except ValueError:
+        raise HTTPException(status_code=404, detail="Proposal not found")
+
+    # Called only for its access check; the display values are discarded.
+    await _load_proposal_display(proposal_type, proposal_id, current_user, db)
+
+    if not 1 <= score_overall_impact <= 9:
+        raise HTTPException(status_code=400, detail="Overall impact score must be 1–9")
+
+    # Criterion scores are validated only when present, in a fixed order.
+    optional_scores = (
+        ("significance", score_significance),
+        ("innovation", score_innovation),
+        ("approach", score_approach),
+        ("investigators", score_investigators),
+        ("environment", score_environment),
+    )
+    for name, val in optional_scores:
+        if val is not None and not 1 <= val <= 9:
+            raise HTTPException(status_code=400, detail=f"Score for {name} must be 1–9")
+
+    def _blank_to_none(raw: str) -> str | None:
+        return raw.strip() or None
+
+    # Column values shared by the insert and the update path.
+    field_values = {
+        "score_significance": score_significance,
+        "score_innovation": score_innovation,
+        "score_approach": score_approach,
+        "score_investigators": score_investigators,
+        "score_environment": score_environment,
+        "score_overall_impact": score_overall_impact,
+        "comments_significance": _blank_to_none(comments_significance),
+        "comments_innovation": _blank_to_none(comments_innovation),
+        "comments_approach": _blank_to_none(comments_approach),
+        "comments_investigators": _blank_to_none(comments_investigators),
+        "comments_environment": _blank_to_none(comments_environment),
+        "comments_overall": comments_overall.strip(),
+    }
+
+    is_agent = proposal_type == "agent"
+    target_column = (
+        PiProposalEvaluation.thread_decision_id
+        if is_agent
+        else PiProposalEvaluation.matchmaker_proposal_id
+    )
+    lookup = select(PiProposalEvaluation).where(
+        PiProposalEvaluation.user_id == current_user.id,
+        target_column == proposal_id,
+    )
+    ev = (await db.execute(lookup)).scalar_one_or_none()
+    is_update = ev is not None
+
+    now = datetime.now(timezone.utc)
+
+    if is_update:
+        for attr, value in field_values.items():
+            setattr(ev, attr, value)
+        ev.updated_at = now
+    else:
+        ev = PiProposalEvaluation(
+            user_id=current_user.id,
+            proposal_type=proposal_type,
+            thread_decision_id=proposal_id if is_agent else None,
+            matchmaker_proposal_id=proposal_id if proposal_type == "matchmaker" else None,
+            **field_values,
+        )
+        db.add(ev)
+
+    await db.commit()
+
+    logger.info(
+        "PiProposalEvaluation %s: user=%s (id=%s) proposal_type=%s proposal_id=%s "
+        "overall_impact=%d at=%s",
+        "updated" if is_update else "submitted",
+        current_user.name,
+        current_user.id,
+        proposal_type,
+        proposal_id,
+        score_overall_impact,
+        now.isoformat(),
+    )
+
+    return RedirectResponse(url="/proposals?success=1", status_code=302)
+
+
+# ---------------------------------------------------------------------------
+# Shared helper — load proposal and verify PI access
+# ---------------------------------------------------------------------------
+
+
+async def _load_proposal_display(
+    proposal_type: str,
+    proposal_id: uuid.UUID,
+    current_user: User,
+    db: AsyncSession,
+) -> tuple[str, str, str]:
+    """Load a proposal for display and verify the current user may see it.
+
+    Args:
+        proposal_type: ``"agent"`` for a ``ThreadDecision``; any other value is
+            treated as a matchmaker proposal.
+        proposal_id: Primary key of the proposal row.
+        current_user: The user requesting access.
+        db: Session used for all lookups.
+
+    Returns:
+        ``(title, collaborator_name, body_md)``.
+
+    Raises:
+        HTTPException: 404 when the proposal does not exist; 403 when the user
+            neither owns one of the two agents (agent proposals) nor matches
+            either PI by id or by name (matchmaker proposals).
+    """
+    if proposal_type == "agent":
+        result = await db.execute(
+            select(ThreadDecision).where(ThreadDecision.id == proposal_id)
+        )
+        td = result.scalar_one_or_none()
+        if not td:
+            raise HTTPException(status_code=404, detail="Proposal not found")
+
+        # Verify current user owns one of the two agents
+        ar_result = await db.execute(
+            select(AgentRegistry)
+            .options(selectinload(AgentRegistry.user))
+            .where(
+                AgentRegistry.user_id == current_user.id,
+                AgentRegistry.agent_id.in_([td.agent_a, td.agent_b]),
+            )
+        )
+        my_agent = ar_result.scalars().first()
+        if not my_agent:
+            raise HTTPException(status_code=403, detail="Not authorized")
+
+        other_id = td.agent_b if td.agent_a == my_agent.agent_id else td.agent_a
+        other_ar_result = await db.execute(
+            select(AgentRegistry)
+            .options(selectinload(AgentRegistry.user))
+            .where(AgentRegistry.agent_id == other_id)
+        )
+        other_ar = other_ar_result.scalar_one_or_none()
+        # Name preference: linked user's name, then the agent's pi_name, then the raw id.
+        if other_ar and other_ar.user:
+            collaborator = other_ar.user.name
+        elif other_ar:
+            collaborator = other_ar.pi_name or other_id
+        else:
+            collaborator = other_id
+
+        title = _extract_title(td.summary_text) or "Collaboration Proposal"
+        body_md = td.summary_text or ""
+        return title, collaborator, body_md
+
+    # Matchmaker proposal
+    result = await db.execute(
+        select(MatchmakerProposal)
+        .options(selectinload(MatchmakerProposal.pi_a), selectinload(MatchmakerProposal.pi_b))
+        .where(MatchmakerProposal.id == proposal_id)
+    )
+    mp = result.scalar_one_or_none()
+    if not mp:
+        raise HTTPException(status_code=404, detail="Proposal not found")
+
+    # Resolve all names this user may appear under (FK or CLI name).  A user
+    # can own several agents, so every pi_name is collected; expecting at most
+    # one row here would raise MultipleResultsFound for such users.
+    ar_result = await db.execute(
+        select(AgentRegistry).where(AgentRegistry.user_id == current_user.id)
+    )
+    match_names: set[str] = {current_user.name}
+    match_names.update(agent.pi_name for agent in ar_result.scalars().all())
+
+    is_pi_a = (mp.pi_a_id == current_user.id) or (mp.pi_a_name in match_names)
+    is_pi_b = (mp.pi_b_id == current_user.id) or (mp.pi_b_name in match_names)
+    if not (is_pi_a or is_pi_b):
+        raise HTTPException(status_code=403, detail="Not authorized")
+
+    collaborator = mp.name_b if is_pi_a else mp.name_a
+    return mp.title, collaborator, mp.proposal_md
+
+
+# ---------------------------------------------------------------------------
+# Group evaluation flow — sequential step-by-step through all proposals
+# with a collaborator (GET + POST)
+# ---------------------------------------------------------------------------
+
+
+@router.get("/group/{group_token}/{step}", response_class=HTMLResponse)
+async def evaluate_group_form(
+    group_token: str,
+    step: int,
+    request: Request,
+    db: AsyncSession = Depends(get_db),
+    current_user: User = Depends(get_current_user),
+):
+    """Render the evaluation form for one step of a group evaluation.
+
+    ``step`` indexes the proposal tokens decoded from ``group_token``; an
+    undecodable token or out-of-range step yields 404.
+    """
+    if current_user.access_status != "allowed":
+        return RedirectResponse(url="/access-pending", status_code=302)
+
+    try:
+        tokens = _decode_group_token(group_token)
+    except ValueError:
+        raise HTTPException(status_code=404, detail="Group not found")
+
+    if not tokens or not 0 <= step < len(tokens):
+        raise HTTPException(status_code=404, detail="Step out of range")
+
+    token = tokens[step]
+    try:
+        proposal_type, proposal_id = _decode_token(token)
+    except ValueError:
+        raise HTTPException(status_code=404, detail="Proposal not found")
+
+    title, collaborator, body_md = await _load_proposal_display(
+        proposal_type, proposal_id, current_user, db
+    )
+
+    # An evaluation is looked up by (user, proposal); the id column depends on the type.
+    if proposal_type == "agent":
+        proposal_column = PiProposalEvaluation.thread_decision_id
+    else:
+        proposal_column = PiProposalEvaluation.matchmaker_proposal_id
+    lookup = select(PiProposalEvaluation).where(
+        PiProposalEvaluation.user_id == current_user.id,
+        proposal_column == proposal_id,
+    )
+    existing = (await db.execute(lookup)).scalar_one_or_none()
+
+    context = _template_context(
+        request,
+        current_user,
+        token=token,
+        title=title,
+        collaborator=collaborator,
+        body_md=body_md,
+        evaluation=existing,
+        group_token=group_token,
+        step=step,
+        total_steps=len(tokens),
+    )
+    return templates.TemplateResponse(request, "proposals/evaluate.html", context)
+
+
+@router.get("/group/{group_token}", response_class=HTMLResponse)
+async def evaluate_group_start(
+    group_token: str,
+    request: Request,
+    db: AsyncSession = Depends(get_db),
+    current_user: User = Depends(get_current_user),
+):
+    """Redirect to step 0 of a group evaluation; the token is not decoded or checked here."""
+    return RedirectResponse(url=f"/proposals/group/{group_token}/0", status_code=302)
+
+
+@router.post("/group/{group_token}/{step}")
+async def evaluate_group_submit(
+    group_token: str,
+    step: int,
+    request: Request,
+    score_overall_impact: int = Form(...),
+    comments_overall: str = Form(""),
+    score_significance: int | None = Form(None),
+    score_innovation: int | None = Form(None),
+    score_approach: int | None = Form(None),
+    score_investigators: int | None = Form(None),
+    score_environment: int | None = Form(None),
+    comments_significance: str = Form(""),
+    comments_innovation: str = Form(""),
+    comments_approach: str = Form(""),
+    comments_investigators: str = Form(""),
+    comments_environment: str = Form(""),
+    db: AsyncSession = Depends(get_db),
+    current_user: User = Depends(get_current_user),
+):
+    """Save the evaluation for one step of a group and move to the next step.
+
+    The overall impact score is required and the five criterion scores are
+    optional; any supplied score outside 1-9 is rejected with 400. An existing
+    evaluation by this user for the proposal is updated in place, otherwise a
+    new row is added. After the commit the browser is redirected to the next
+    step, or to /proposals?success=1 after the last one.
+    """
+    if current_user.access_status != "allowed":
+        return RedirectResponse(url="/access-pending", status_code=302)
+
+    try:
+        tokens = _decode_group_token(group_token)
+    except ValueError:
+        raise HTTPException(status_code=404, detail="Group not found")
+
+    if not tokens or not 0 <= step < len(tokens):
+        raise HTTPException(status_code=404, detail="Step out of range")
+
+    token = tokens[step]
+    try:
+        proposal_type, proposal_id = _decode_token(token)
+    except ValueError:
+        raise HTTPException(status_code=404, detail="Proposal not found")
+
+    # Result is discarded; presumably called for the 403/404 checks the helper performs.
+    await _load_proposal_display(proposal_type, proposal_id, current_user, db)
+
+    if not 1 <= score_overall_impact <= 9:
+        raise HTTPException(status_code=400, detail="Overall impact score must be 1–9")
+    criterion_scores = {
+        "significance": score_significance,
+        "innovation": score_innovation,
+        "approach": score_approach,
+        "investigators": score_investigators,
+        "environment": score_environment,
+    }
+    for criterion, score in criterion_scores.items():
+        if score is not None and not 1 <= score <= 9:
+            raise HTTPException(status_code=400, detail=f"Score for {criterion} must be 1–9")
+
+    # Values shared by the update and insert paths. Blank criterion comments are
+    # stored as None; the overall comment is stored stripped, even when empty.
+    fields = {
+        "score_significance": score_significance,
+        "score_innovation": score_innovation,
+        "score_approach": score_approach,
+        "score_investigators": score_investigators,
+        "score_environment": score_environment,
+        "score_overall_impact": score_overall_impact,
+        "comments_significance": comments_significance.strip() or None,
+        "comments_innovation": comments_innovation.strip() or None,
+        "comments_approach": comments_approach.strip() or None,
+        "comments_investigators": comments_investigators.strip() or None,
+        "comments_environment": comments_environment.strip() or None,
+        "comments_overall": comments_overall.strip(),
+    }
+
+    if proposal_type == "agent":
+        proposal_column = PiProposalEvaluation.thread_decision_id
+    else:
+        proposal_column = PiProposalEvaluation.matchmaker_proposal_id
+    lookup = select(PiProposalEvaluation).where(
+        PiProposalEvaluation.user_id == current_user.id,
+        proposal_column == proposal_id,
+    )
+    ev = (await db.execute(lookup)).scalar_one_or_none()
+    is_update = ev is not None
+
+    if is_update:
+        for attr, value in fields.items():
+            setattr(ev, attr, value)
+        ev.updated_at = datetime.now(timezone.utc)
+    else:
+        ev = PiProposalEvaluation(
+            user_id=current_user.id,
+            proposal_type=proposal_type,
+            thread_decision_id=proposal_id if proposal_type == "agent" else None,
+            matchmaker_proposal_id=proposal_id if proposal_type == "matchmaker" else None,
+            **fields,
+        )
+        db.add(ev)
+
+    await db.commit()
+
+    logger.info(
+        "PiProposalEvaluation %s: user=%s proposal_type=%s proposal_id=%s impact=%d step=%d/%d",
+        "updated" if is_update else "submitted",
+        current_user.name, proposal_type, proposal_id, score_overall_impact,
+        step + 1, len(tokens),
+    )
+
+    next_step = step + 1
+    if next_step >= len(tokens):
+        return RedirectResponse(url="/proposals?success=1", status_code=302)
+    return RedirectResponse(url=f"/proposals/group/{group_token}/{next_step}", status_code=302)
diff --git a/src/routers/public.py b/src/routers/public.py
index d35b34a..5af0dfe 100644
--- a/src/routers/public.py
+++ b/src/routers/public.py
@@ -1,16 +1,20 @@
-"""Public-facing routes: landing page, waitlist, access-pending."""
+"""Public-facing routes: landing page, waitlist, access-pending, researcher profiles."""
 
 import logging
 import re
 
-from fastapi import APIRouter, Depends, Form, Request
+from fastapi import APIRouter, Depends, Form, HTTPException, Request
 from fastapi.responses import HTMLResponse, RedirectResponse
 from fastapi.templating import Jinja2Templates
 from sqlalchemy import select
 from sqlalchemy.ext.asyncio import AsyncSession
 
 from src.database import get_db
-from src.models import User, WaitlistSignup
+from src.dependencies import get_optional_current_user
+from src.models import AgentRegistry, ResearcherProfile, User, WaitlistSignup
+from src.services.profile_export import ORCID_TO_AGENT_ID
+
+_AGENT_ID_TO_ORCID: dict[str, str] = {v: k for k, v in ORCID_TO_AGENT_ID.items()}
 
 logger = logging.getLogger(__name__)
 router = APIRouter()
@@ -83,6 +87,47 @@ async def waitlist_submit(
     )
 
 
+@router.get("/researcher/{agent_id}", response_class=HTMLResponse)
+async def view_researcher_profile(
+    agent_id: str,
+    request: Request,
+    db: AsyncSession = Depends(get_db),
+    current_user: User | None = Depends(get_optional_current_user),
+):
+    """Render the read-only public profile of the researcher behind ``agent_id``.
+
+    The user is resolved via an active AgentRegistry row, else via the
+    agent-id to ORCID mapping; 404 when neither finds one. No login required.
+    """
+    async def _one(query):
+        return (await db.execute(query)).scalar_one_or_none()
+
+    agent = await _one(select(AgentRegistry).where(AgentRegistry.agent_id == agent_id))
+
+    # Primary: the user referenced by an active agent registration.
+    pi_user: User | None = None
+    if agent and agent.status == "active":
+        pi_user = await _one(select(User).where(User.id == agent.user_id))
+
+    # Fallback: ORCID mapping, for researchers without an active agent yet.
+    if pi_user is None:
+        orcid = _AGENT_ID_TO_ORCID.get(agent_id)
+        if orcid:
+            pi_user = await _one(select(User).where(User.orcid == orcid))
+
+    if not pi_user:
+        raise HTTPException(status_code=404, detail="Researcher not found")
+
+    profile = await _one(select(ResearcherProfile).where(ResearcherProfile.user_id == pi_user.id))
+
+    # ``agent`` is passed as looked up, so the template may see None or an inactive row.
+    context = {
+        "request": request, "current_user": current_user,
+        "agent": agent, "profile": profile, "pi_user": pi_user,
+    }
+    return templates.TemplateResponse(request, "researcher/view.html", context)
+
+
 @router.get("/access-pending", response_class=HTMLResponse)
 async def access_pending(request: Request):
     """Shown after ORCID login when the user is not yet approved."""
diff --git a/src/services/llm.py b/src/services/llm.py
index f3cf606..bfc5087 100644
--- a/src/services/llm.py
+++ b/src/services/llm.py
@@ -8,6 +8,7 @@
 import anthropic
 
 from src.config import get_settings
+from src.utils.prompts import load_prompt
 
 logger = logging.getLogger(__name__)
 
@@ -17,6 +18,11 @@
 # keys from log_meta.
 _call_log_callback: Callable[[dict], None] | None = None
 
+# Tri-state: None = not yet tested, True = supported, False = not supported.
+# Set to False on the first 400 error caused by cache_control so subsequent
+# calls skip caching without retrying.
+_prompt_caching_supported: bool | None = None
+
 
 def set_call_log_callback(callback: Callable[[dict], None] | None) -> None:
     """Register (or clear) a callback that fires after every LLM call."""
@@ -26,7 +32,24 @@ def set_call_log_callback(callback: Callable[[dict], None] | None) -> None:
 
 def get_anthropic_client() -> anthropic.Anthropic:
     settings = get_settings()
-    return anthropic.Anthropic(api_key=settings.anthropic_api_key)
+    kwargs: dict = {"api_key": settings.anthropic_api_key}
+    if settings.anthropic_base_url:
+        kwargs["base_url"] = settings.anthropic_base_url
+    return anthropic.Anthropic(**kwargs)
+
+
+def _system_with_cache(text: str) -> str | list[dict]:
+    """Return the system prompt in the form the current caching state calls for.
+
+    A plain string (the no-cache path) comes back when the config flag is off
+    or an earlier call recorded that caching is unsupported; otherwise the text
+    is wrapped in one block carrying an ephemeral ``cache_control`` marker.
+    """
+    caching_enabled = get_settings().anthropic_prompt_caching
+    # Only an explicit False disables caching; None (untested) still tries it.
+    if caching_enabled and _prompt_caching_supported is not False:
+        return [{"type": "text", "text": text, "cache_control": {"type": "ephemeral"}}]
+    return text
 
 
 async def synthesize_profile(context_text: str, researcher_name: str) -> dict[str, Any]:
@@ -165,7 +188,10 @@ async def generate_agent_response(
         )
         latency_ms = (time.monotonic() - t0) * 1000
         if not message.content:
-            logger.warning("Claude returned empty content (model=%s)", model)
+            logger.warning(
+                "Claude returned empty content (model=%s, stop_reason=%s, meta=%s)",
+                model, message.stop_reason, log_meta,
+            )
             return ""
         response_text = message.content[0].text
 
@@ -401,6 +427,136 @@ async def generate_with_tools(
     return response_text
 
 
+async def generate_matchmaker_proposal(
+    name_a: str,
+    public_profile_a: str,
+    private_profile_a: str,
+    publications_a: str,
+    name_b: str,
+    public_profile_b: str,
+    private_profile_b: str,
+    publications_b: str,
+    model: str | None = None,
+) -> dict[str, Any]:
+    """
+    Generate a collaboration proposal between two PIs using their profiles.
+
+    ``model`` defaults to ``settings.llm_agent_model_opus``. Raises RuntimeError
+    when the prompt file is missing or empty. A 400 that mentions caching is
+    retried once without ``cache_control``; other API errors propagate.
+
+    Returns a dict with keys: proposal_md, title, confidence, input_tokens, output_tokens, model.
+    ``confidence`` is "high", "moderate" or "speculative" (the default).
+    """
+    settings = get_settings()
+    model = model or settings.llm_agent_model_opus
+
+    prompt_path = "prompts/matchmaker.md"
+    system_prompt = load_prompt(prompt_path)
+    if not system_prompt:
+        raise RuntimeError(f"Matchmaker prompt not found at {prompt_path}")
+
+    user_message = f"""## PI A: {name_a}
+
+### Public Profile
+{public_profile_a}
+
+### Private Instructions (confidential — do not quote directly)
+{private_profile_a or '(none provided)'}
+
+### Recent Publications
+{publications_a or '(none available)'}
+
+---
+
+## PI B: {name_b}
+
+### Public Profile
+{public_profile_b}
+
+### Private Instructions (confidential — do not quote directly)
+{private_profile_b or '(none provided)'}
+
+### Recent Publications
+{publications_b or '(none available)'}"""
+
+    global _prompt_caching_supported
+    client = get_anthropic_client()
+    system = _system_with_cache(system_prompt)
+    t0 = time.monotonic()
+    # NOTE(review): sync client call inside a coroutine blocks the event loop — confirm.
+    try:
+        message = client.messages.create(
+            model=model,
+            max_tokens=2000,
+            system=system,
+            messages=[{"role": "user", "content": user_message}],
+        )
+        if isinstance(system, list):
+            _prompt_caching_supported = True
+    except anthropic.BadRequestError as exc:
+        if isinstance(system, list) and "cache" in str(exc).lower():
+            logger.warning(
+                "Prompt caching not supported by this endpoint — retrying without: %s", exc
+            )
+            _prompt_caching_supported = False
+            message = client.messages.create(
+                model=model,
+                max_tokens=2000,
+                system=system_prompt,
+                messages=[{"role": "user", "content": user_message}],
+            )
+        else:
+            raise
+    latency_ms = (time.monotonic() - t0) * 1000
+    logger.info(
+        "Matchmaker LLM call: model=%s input=%d output=%d latency=%.0fms",
+        model,
+        message.usage.input_tokens,
+        message.usage.output_tokens,
+        latency_ms,
+    )
+
+    response_text = message.content[0].text if message.content else ""
+
+    # Extract content inside <proposal> tags. The closing tag is searched for only
+    # after the opening one, so a stray earlier "</proposal>" cannot empty the result.
+    proposal_md = response_text
+    open_at = response_text.find("<proposal>")
+    if open_at != -1:
+        start = open_at + len("<proposal>")
+        end = response_text.find("</proposal>", start)
+        if end != -1:
+            proposal_md = response_text[start:end].strip()
+
+    # Extract title from first heading
+    title = "Untitled Proposal"
+    for line in proposal_md.splitlines():
+        line = line.strip()
+        if line.startswith("# "):
+            title = line[2:].strip()
+            break
+
+    # Confidence comes from the first marker line; anything else stays "speculative".
+    confidence = "speculative"
+    conf_line = next(
+        (ln.lower() for ln in proposal_md.splitlines() if "**confidence:**" in ln.lower()), ""
+    )
+    if "high" in conf_line:
+        confidence = "high"
+    elif "moderate" in conf_line:
+        confidence = "moderate"
+
+    return {
+        "proposal_md": proposal_md,
+        "title": title,
+        "confidence": confidence,
+        "input_tokens": message.usage.input_tokens,
+        "output_tokens": message.usage.output_tokens,
+        "model": model,
+    }
+
+
 def _default_synthesis_prompt() -> str:
     return """You are a scientific profile synthesizer. Given information about a researcher's publications, grants, and submitted texts, generate a structured JSON profile.
 
diff --git a/src/services/profile_export.py b/src/services/profile_export.py
index 1b63297..f70bc4a 100644
--- a/src/services/profile_export.py
+++ b/src/services/profile_export.py
@@ -28,6 +28,8 @@
     "0000-0002-5964-7111": "forli",
     "0000-0003-2819-4049": "deniz",
     "0000-0001-6701-996X": "lairson",
+    "0000-0001-8420-1325": "alanjary",
+    "0000-0002-4887-9603": "cline",
 }
 
 
diff --git a/src/utils/prompts.py b/src/utils/prompts.py
new file mode 100644
index 0000000..a9a14ae
--- /dev/null
+++ b/src/utils/prompts.py
@@ -0,0 +1,28 @@
+"""Prompt file loader with {{include: filename}} support."""
+
+from __future__ import annotations
+
+import re
+from pathlib import Path
+
+PROMPTS_DIR = Path("prompts")
+
+
+def load_prompt(path: str | Path, default: str = "") -> str:
+    """Read a prompt file and expand its ``{{include: filename}}`` directives.
+
+    Returns ``default`` if ``path`` does not exist. Includes are resolved against
+    ``PROMPTS_DIR`` and are not themselves scanned for further directives.
+    """
+    def _expand(directive: re.Match) -> str:
+        target = PROMPTS_DIR / directive.group(1).strip()
+        try:
+            return target.read_text(encoding="utf-8")
+        except FileNotFoundError:
+            return f"[include not found: {target}]"
+
+    try:
+        raw = Path(path).read_text(encoding="utf-8")
+    except FileNotFoundError:
+        return default
+    return re.sub(r"\{\{include:\s*(.+?)\}\}", _expand, raw)
diff --git a/templates/admin/discussions.html b/templates/admin/discussions.html
index 088616a..19c5ae6 100644
--- a/templates/admin/discussions.html
+++ b/templates/admin/discussions.html
@@ -90,6 +90,11 @@ <h1 class="text-2xl font-bold text-gray-900">Discussions</h1>
         <a href="/admin/discussions?run_id={{ selected_run_id }}" class="text-sm text-gray-500 hover:text-gray-700">Clear</a>
         {% endif %}
     </form>
+    <form method="POST" action="/admin/discussions/clear"
+          onsubmit="return confirm('Delete all thread decisions and proposal reviews from the database? Slack conversations are not affected.')">
+        <button type="submit"
+                class="px-3 py-1.5 bg-red-600 text-white text-sm rounded-md hover:bg-red-700">Clear All</button>
+    </form>
 </div>
 
 <!-- Threads table -->
@@ -146,7 +151,7 @@ <h1 class="text-2xl font-bold text-gray-900">Discussions</h1>
             <tr id="detail-{{ loop.index }}" class="hidden">
                 <td colspan="7" class="px-6 py-4 bg-gray-50">
                     {% if t.decision.summary_text %}
-                    <div class="text-sm text-gray-700 max-w-3xl proposal-md mb-4" data-markdown="{{ t.decision.summary_text | e }}"></div>
+                    <div class="text-sm text-gray-700 max-w-3xl proposal-md mb-4" data-markdown="{{ t.decision.summary_text | extract_proposal | e }}"></div>
                     {% endif %}
                     {% if t.reviews %}
                     <div class="border-t border-gray-200 pt-3 mt-3">
diff --git a/templates/admin/evaluations.html b/templates/admin/evaluations.html
new file mode 100644
index 0000000..0f5f76d
--- /dev/null
+++ b/templates/admin/evaluations.html
@@ -0,0 +1,294 @@
+{% extends "base.html" %}
+{% block title %}Admin — PI Evaluations — CoPI{% endblock %}
+
+{% block content %}
+<div class="flex items-center justify-between mb-6">
+    <h1 class="text-2xl font-bold text-gray-900">PI Proposal Evaluations</h1>
+    <a href="/admin/evaluations/export.json{{ '?' + request.url.query if request.url.query else '' }}"
+       class="px-3 py-1.5 bg-gray-700 text-white text-sm rounded-md hover:bg-gray-900 flex items-center gap-1.5">
+        Export JSON
+    </a>
+</div>
+
+<!-- Summary cards -->
+<div class="grid grid-cols-2 md:grid-cols-4 gap-4 mb-8">
+    <div class="bg-white rounded-xl border border-gray-200 p-4 text-center">
+        <div class="text-3xl font-bold text-indigo-600">{{ total_count }}</div>
+        <div class="text-sm text-gray-500 mt-1">Total Evaluations</div>
+    </div>
+    <div class="bg-white rounded-xl border border-gray-200 p-4 text-center">
+        <div class="text-3xl font-bold text-indigo-600">{{ this_month }}</div>
+        <div class="text-sm text-gray-500 mt-1">This Month</div>
+    </div>
+    <div class="bg-white rounded-xl border border-gray-200 p-4 text-center">
+        <div class="text-3xl font-bold text-indigo-600">
+            {% set agent_count = eval_rows | selectattr('eval.proposal_type', 'equalto', 'agent') | list | length %}
+            {% set mm_count = eval_rows | selectattr('eval.proposal_type', 'equalto', 'matchmaker') | list | length %}
+            {{ agent_count }} / {{ mm_count }}
+        </div>
+        <div class="text-sm text-gray-500 mt-1">Agent / Matchmaker</div>
+    </div>
+    <div class="bg-white rounded-xl border border-gray-200 p-4 text-center">
+        <div class="text-3xl font-bold {% if mean_impact <= 3 %}text-green-600{% elif mean_impact <= 6 %}text-amber-500{% else %}text-red-500{% endif %}">
+            {{ mean_impact if total_count else '—' }}
+        </div>
+        <div class="text-sm text-gray-500 mt-1">Mean Impact / 9</div>
+    </div>
+</div>
+
+<!-- Filters -->
+<form method="GET" action="/admin/evaluations" class="bg-white rounded-xl border border-gray-200 p-4 mb-6 flex flex-wrap items-end gap-4">
+    <div class="flex flex-col gap-1">
+        <label class="text-xs text-gray-500 font-medium">PI</label>
+        <select name="pi_filter" class="text-sm border-gray-300 rounded-md shadow-sm">
+            <option value="">All PIs</option>
+            {% for u in all_evaluators %}
+            <option value="{{ u.id }}" {% if pi_filter == u.id | string %}selected{% endif %}>{{ u.name }}</option>
+            {% endfor %}
+        </select>
+    </div>
+    <div class="flex flex-col gap-1">
+        <label class="text-xs text-gray-500 font-medium">Origin</label>
+        <select name="origin_filter" class="text-sm border-gray-300 rounded-md shadow-sm">
+            <option value="">All</option>
+            <option value="agent"      {% if origin_filter == 'agent' %}selected{% endif %}>Agent only</option>
+            <option value="matchmaker" {% if origin_filter == 'matchmaker' %}selected{% endif %}>Matchmaker only</option>
+        </select>
+    </div>
+    <div class="flex flex-col gap-1">
+        <label class="text-xs text-gray-500 font-medium">Impact min</label>
+        <input type="number" name="impact_min" min="1" max="9" value="{{ impact_min or '' }}"
+               placeholder="1"
+               class="text-sm border-gray-300 rounded-md shadow-sm w-16">
+    </div>
+    <div class="flex flex-col gap-1">
+        <label class="text-xs text-gray-500 font-medium">Impact max</label>
+        <input type="number" name="impact_max" min="1" max="9" value="{{ impact_max or '' }}"
+               placeholder="9"
+               class="text-sm border-gray-300 rounded-md shadow-sm w-16">
+    </div>
+    <div class="flex flex-col gap-1">
+        <label class="text-xs text-gray-500 font-medium">From</label>
+        <input type="date" name="date_from" value="{{ date_from }}"
+               class="text-sm border-gray-300 rounded-md shadow-sm">
+    </div>
+    <div class="flex flex-col gap-1">
+        <label class="text-xs text-gray-500 font-medium">To</label>
+        <input type="date" name="date_to" value="{{ date_to }}"
+               class="text-sm border-gray-300 rounded-md shadow-sm">
+    </div>
+    <button type="submit"
+            class="px-3 py-1.5 bg-indigo-600 text-white text-sm rounded-md hover:bg-indigo-700">Filter</button>
+    {% if pi_filter or origin_filter or impact_min or impact_max or date_from or date_to %}
+    <a href="/admin/evaluations" class="text-sm text-gray-500 hover:text-gray-700">Clear</a>
+    {% endif %}
+</form>
+
+<!-- Table -->
+{% if eval_rows %}
+<div class="bg-white rounded-xl shadow-sm border border-gray-200 overflow-x-auto">
+    <table class="min-w-full divide-y divide-gray-200 text-sm">
+        <thead class="bg-gray-50">
+            <tr>
+                <th class="px-4 py-3 text-left text-xs font-medium text-gray-500 uppercase">Evaluator</th>
+                <th class="px-4 py-3 text-left text-xs font-medium text-gray-500 uppercase">Proposal</th>
+                <th class="px-4 py-3 text-left text-xs font-medium text-gray-500 uppercase">Origin</th>
+                <th class="px-4 py-3 text-left text-xs font-medium text-gray-500 uppercase">Collaborator</th>
+                <th class="px-4 py-3 text-center text-xs font-medium text-gray-500 uppercase" title="Significance">Sig.</th>
+                <th class="px-4 py-3 text-center text-xs font-medium text-gray-500 uppercase" title="Innovation">Inn.</th>
+                <th class="px-4 py-3 text-center text-xs font-medium text-gray-500 uppercase" title="Approach">App.</th>
+                <th class="px-4 py-3 text-center text-xs font-medium text-gray-500 uppercase" title="Investigators">Inv.</th>
+                <th class="px-4 py-3 text-center text-xs font-medium text-gray-500 uppercase" title="Environment">Env.</th>
+                <th class="px-4 py-3 text-center text-xs font-medium text-gray-500 uppercase">Impact</th>
+                <th class="px-4 py-3 text-left text-xs font-medium text-gray-500 uppercase">Submitted</th>
+                <th class="px-4 py-3 text-left text-xs font-medium text-gray-500 uppercase">Actions</th>
+            </tr>
+        </thead>
+        <tbody class="divide-y divide-gray-100">
+            {% for row in eval_rows %}
+            {% set ev = row.eval %}
+            {% set impact = ev.score_overall_impact %}
+            <tr class="hover:bg-gray-50" id="eval-{{ ev.id }}">
+                <td class="px-4 py-3 font-medium text-gray-900 whitespace-nowrap">
+                    {{ ev.user.name if ev.user else '—' }}
+                    {% if ev.user and ev.user.institution %}
+                    <span class="block text-xs text-gray-400 font-normal">{{ ev.user.institution }}</span>
+                    {% endif %}
+                </td>
+                <td class="px-4 py-3 text-gray-700 max-w-xs">
+                    <span class="line-clamp-2" title="{{ row.title }}">{{ row.title }}</span>
+                </td>
+                <td class="px-4 py-3 whitespace-nowrap">
+                    {% if ev.proposal_type == 'agent' %}
+                    <span class="px-2 py-0.5 rounded-full text-xs font-medium bg-blue-100 text-blue-700">Agent</span>
+                    {% else %}
+                    <span class="px-2 py-0.5 rounded-full text-xs font-medium bg-purple-100 text-purple-700">Matchmaker</span>
+                    {% endif %}
+                </td>
+                <td class="px-4 py-3 text-gray-700 whitespace-nowrap">
+                    {% if row.collaborator_agent_id %}
+                    <a href="/researcher/{{ row.collaborator_agent_id }}" target="_blank"
+                       class="text-indigo-600 hover:text-indigo-800 hover:underline">{{ row.collaborator }}</a>
+                    {% else %}
+                    {{ row.collaborator }}
+                    {% endif %}
+                </td>
+                <!-- Criterion scores — color-coded; null when not submitted -->
+                {% for s in [ev.score_significance, ev.score_innovation, ev.score_approach, ev.score_investigators, ev.score_environment] %}
+                <td class="px-4 py-3 text-center font-medium
+                    {% if s is none %}text-gray-300
+                    {% elif s <= 3 %}text-green-600{% elif s <= 6 %}text-amber-600{% else %}text-red-600{% endif %}">
+                    {{ s if s is not none else '—' }}
+                </td>
+                {% endfor %}
+                <!-- Overall impact — bolded -->
+                <td class="px-4 py-3 text-center font-bold
+                    {% if impact <= 3 %}text-green-600{% elif impact <= 6 %}text-amber-600{% else %}text-red-600{% endif %}">
+                    {{ impact }}
+                </td>
+                <td class="px-4 py-3 text-gray-500 whitespace-nowrap">
+                    <span data-utc="{{ ev.evaluated_at.isoformat() }}" data-utc-fmt="short">
+                        {{ ev.evaluated_at.strftime('%b %d %H:%M') }}
+                    </span>
+                    {% if ev.updated_at %}
+                    <span class="block text-xs text-gray-400">
+                        Updated <span data-utc="{{ ev.updated_at.isoformat() }}" data-utc-fmt="short">{{ ev.updated_at.strftime('%b %d') }}</span>
+                    </span>
+                    {% endif %}
+                </td>
+                <td class="px-4 py-3 whitespace-nowrap">
+                    <button type="button"
+                            onclick="toggleDetail('detail-{{ ev.id }}')"
+                            class="text-indigo-600 hover:text-indigo-800 text-sm">Details</button>
+                </td>
+            </tr>
+            <!-- Expanded detail row -->
+            <tr id="detail-{{ ev.id }}" class="hidden bg-gray-50">
+                <td colspan="12" class="px-6 py-5">
+                    <div class="grid grid-cols-1 md:grid-cols-2 gap-6 text-sm">
+                        {% set criterion_rows = [
+                            ('Significance',  ev.score_significance,  ev.comments_significance),
+                            ('Innovation',    ev.score_innovation,    ev.comments_innovation),
+                            ('Approach',      ev.score_approach,      ev.comments_approach),
+                            ('Investigators', ev.score_investigators, ev.comments_investigators),
+                            ('Environment',   ev.score_environment,   ev.comments_environment),
+                        ] %}
+                        {% for label, score, comment in criterion_rows %}
+                        <div>
+                            <p class="font-medium text-gray-700">
+                                {{ label }}
+                                {% if score is not none %}
+                                <span class="ml-1 font-bold
+                                    {% if score <= 3 %}text-green-600{% elif score <= 6 %}text-amber-600{% else %}text-red-600{% endif %}">
+                                    {{ score }}
+                                </span>
+                                {% else %}
+                                <span class="ml-1 text-gray-300">—</span>
+                                {% endif %}
+                            </p>
+                            {% if comment %}
+                            <p class="text-gray-500 mt-0.5">{{ comment }}</p>
+                            {% else %}
+                            <p class="text-gray-300 italic mt-0.5">No comment</p>
+                            {% endif %}
+                        </div>
+                        {% endfor %}
+                        <div class="md:col-span-2 border-t border-gray-200 pt-4">
+                            <p class="font-medium text-gray-700">
+                                Overall Impact
+                                <span class="ml-1 font-bold
+                                    {% if ev.score_overall_impact <= 3 %}text-green-600{% elif ev.score_overall_impact <= 6 %}text-amber-600{% else %}text-red-600{% endif %}">
+                                    {{ ev.score_overall_impact }}
+                                </span>
+                            </p>
+                            <p class="text-gray-600 mt-0.5">{{ ev.comments_overall }}</p>
+                        </div>
+                    </div>
+                </td>
+            </tr>
+            {% endfor %}
+        </tbody>
+    </table>
+</div>
+<p class="mt-3 text-sm text-gray-400">
+    {{ eval_rows | length }} evaluation{{ 's' if eval_rows | length != 1 else '' }}
+    {% if pi_filter or origin_filter or impact_min or impact_max or date_from or date_to %}(filtered){% endif %}
+</p>
+
+{% else %}
+<p class="text-gray-400 text-sm text-center py-12">No evaluations submitted yet.</p>
+{% endif %}
+
+<!-- Pending Proposals -->
+<div class="mt-12">
+    <div class="flex items-center justify-between mb-2">
+        <h2 class="text-xl font-bold text-gray-900">Pending Proposals</h2>
+        <span class="text-sm text-gray-400">{{ pending_proposals | length }} awaiting full evaluation</span>
+    </div>
+    <p class="text-sm text-gray-500 mb-4">
+        Proposals where at least one PI has not yet submitted an evaluation.
+        Hide to remove from the PI-facing <code>/proposals</code> page entirely.
+    </p>
+
+    {% if pending_proposals %}
+    <div class="bg-white rounded-xl shadow-sm border border-gray-200 overflow-x-auto">
+        <table class="min-w-full divide-y divide-gray-200 text-sm">
+            <thead class="bg-gray-50">
+                <tr>
+                    <th class="px-4 py-3 text-left text-xs font-medium text-gray-500 uppercase">PI A / PI B</th>
+                    <th class="px-4 py-3 text-left text-xs font-medium text-gray-500 uppercase">Title</th>
+                    <th class="px-4 py-3 text-left text-xs font-medium text-gray-500 uppercase">Source</th>
+                    <th class="px-4 py-3 text-center text-xs font-medium text-gray-500 uppercase">Evals</th>
+                    <th class="px-4 py-3 text-center text-xs font-medium text-gray-500 uppercase">Hidden</th>
+                </tr>
+            </thead>
+            <tbody class="divide-y divide-gray-100">
+                {% for p in pending_proposals %}
+                <tr class="hover:bg-gray-50">
+                    <td class="px-4 py-3 text-gray-700 whitespace-nowrap">
+                        <span class="{{ 'line-through text-gray-400' if p.evaluated_a else '' }}">{{ p.name_a }}</span>
+                        <span class="mx-1 text-gray-300">/</span>
+                        <span class="{{ 'line-through text-gray-400' if p.evaluated_b else '' }}">{{ p.name_b }}</span>
+                    </td>
+                    <td class="px-4 py-3 text-gray-700 max-w-xs">
+                        <span class="line-clamp-1" title="{{ p.title }}">{{ p.title }}</span>
+                    </td>
+                    <td class="px-4 py-3 whitespace-nowrap">
+                        {% if p.proposal_type == 'agent' %}
+                        <span class="px-2 py-0.5 rounded-full text-xs font-medium bg-blue-100 text-blue-700">Agent</span>
+                        {% else %}
+                        <span class="px-2 py-0.5 rounded-full text-xs font-medium bg-purple-100 text-purple-700">Matchmaker</span>
+                        {% endif %}
+                    </td>
+                    <td class="px-4 py-3 text-center text-xs text-gray-400 whitespace-nowrap">
+                        {{ p.evaluated_a | int + p.evaluated_b | int }}/2
+                    </td>
+                    <td class="px-4 py-3 text-center whitespace-nowrap">
+                        <form method="POST"
+                              action="/admin/evaluations/proposals/{{ p.proposal_type }}/{{ p.proposal_id }}/hide">
+                            <button type="submit"
+                                    class="text-xs font-medium {% if p.hidden %}text-red-600 hover:text-red-800{% else %}text-gray-400 hover:text-gray-600{% endif %}">
+                                {{ 'Yes' if p.hidden else 'No' }}
+                            </button>
+                        </form>
+                    </td>
+                </tr>
+                {% endfor %}
+            </tbody>
+        </table>
+    </div>
+    {% else %}
+    <p class="text-gray-400 text-sm text-center py-8">All proposals have been fully evaluated.</p>
+    {% endif %}
+</div>
+
+{% endblock %}
+
+{% block scripts %}
+<script>
+function toggleDetail(id) {
+    var row = document.getElementById(id);
+    if (row) row.classList.toggle('hidden');
+}
+</script>
+{% endblock %}
diff --git a/templates/admin/matchmaker.html b/templates/admin/matchmaker.html
new file mode 100644
index 0000000..418d251
--- /dev/null
+++ b/templates/admin/matchmaker.html
@@ -0,0 +1,178 @@
+{% extends "base.html" %}
+{% block title %}Admin — Matchmaker — CoPI{% endblock %}
+
+{% block extra_head %}
+<script src="https://cdn.jsdelivr.net/npm/marked/marked.min.js"></script>
+<style>
+    .proposal-md h1 { font-weight: 700; font-size: 1.1rem; margin-top: 0.75rem; margin-bottom: 0.25rem; }
+    .proposal-md h2 { font-weight: 600; font-size: 1rem; margin-top: 0.75rem; margin-bottom: 0.25rem; }
+    .proposal-md p { margin-bottom: 0.5rem; }
+    .proposal-md ul, .proposal-md ol { padding-left: 1.5rem; margin-bottom: 0.5rem; }
+    .proposal-md li { margin-bottom: 0.25rem; }
+    .proposal-md strong { font-weight: 600; }
+</style>
+{% endblock %}
+
+{% block content %}
+<div class="flex items-center justify-between mb-6">
+    <h1 class="text-2xl font-bold text-gray-900">Matchmaker</h1>
+</div>
+
+<!-- Generate form -->
+<div class="bg-white rounded-xl shadow-sm border border-gray-200 p-6 mb-8">
+    <h2 class="text-sm font-semibold text-gray-700 uppercase tracking-wide mb-4">Generate Proposal</h2>
+    {% if error %}
+    <div class="mb-4 px-4 py-3 rounded-lg bg-red-50 border border-red-200 text-red-700 text-sm">{{ error }}</div>
+    {% endif %}
+    <form method="POST" action="/admin/matchmaker/generate" id="generate-form"
+          class="flex items-end gap-4 flex-wrap">
+        <div class="flex flex-col gap-1">
+            <label class="text-xs text-gray-500 font-medium">PI A</label>
+            <select name="pi_a_id" id="pi_a_select" required
+                    class="text-sm border-gray-300 rounded-md shadow-sm focus:ring-indigo-500 focus:border-indigo-500 min-w-[200px]"
+                    onchange="updateDropdowns()">
+                <option value="">— select PI —</option>
+                {% for u in eligible_users %}
+                <option value="{{ u.id }}">{{ u.name }}{% if u.institution %} ({{ u.institution }}){% endif %}</option>
+                {% endfor %}
+            </select>
+        </div>
+        <div class="flex flex-col gap-1">
+            <label class="text-xs text-gray-500 font-medium">PI B</label>
+            <select name="pi_b_id" id="pi_b_select" required
+                    class="text-sm border-gray-300 rounded-md shadow-sm focus:ring-indigo-500 focus:border-indigo-500 min-w-[200px]"
+                    onchange="updateDropdowns()">
+                <option value="">— select PI —</option>
+                {% for u in eligible_users %}
+                <option value="{{ u.id }}">{{ u.name }}{% if u.institution %} ({{ u.institution }}){% endif %}</option>
+                {% endfor %}
+            </select>
+        </div>
+        <button type="submit" id="generate-btn" disabled
+                class="px-4 py-2 bg-indigo-600 text-white text-sm font-medium rounded-md hover:bg-indigo-700 disabled:opacity-40 disabled:cursor-not-allowed flex items-center gap-2">
+            <span id="btn-label">Generate Proposal</span>
+            <svg id="btn-spinner" class="hidden animate-spin h-4 w-4 text-white" xmlns="http://www.w3.org/2000/svg" fill="none" viewBox="0 0 24 24">
+                <circle class="opacity-25" cx="12" cy="12" r="10" stroke="currentColor" stroke-width="4"></circle>
+                <path class="opacity-75" fill="currentColor" d="M4 12a8 8 0 018-8v8H4z"></path>
+            </svg>
+        </button>
+    </form>
+    <p class="mt-3 text-xs text-gray-400">Uses Claude Opus. Typical generation time: 10–20 seconds.</p>
+</div>
+
+<!-- Filters + table -->
+{% if proposals or pi_filter or confidence_filter %}
+
+<div class="flex items-center gap-4 mb-4">
+    <form method="GET" action="/admin/matchmaker" class="flex items-center gap-3 flex-wrap">
+        <select name="pi_filter" multiple size="4"
+                class="text-sm border-gray-300 rounded-md shadow-sm min-w-[160px]"
+                title="Hold Ctrl/Cmd to select multiple">
+            {% for u in eligible_users %}
+            <option value="{{ u.id }}" {% if u.id in pi_filter %}selected{% endif %}>{{ u.name }}</option>
+            {% endfor %}
+        </select>
+        <select name="confidence_filter"
+                class="text-sm border-gray-300 rounded-md shadow-sm">
+            <option value="">All Confidence</option>
+            <option value="high" {% if confidence_filter == 'high' %}selected{% endif %}>High</option>
+            <option value="moderate" {% if confidence_filter == 'moderate' %}selected{% endif %}>Moderate</option>
+            <option value="speculative" {% if confidence_filter == 'speculative' %}selected{% endif %}>Speculative</option>
+        </select>
+        <button type="submit"
+                class="px-3 py-1.5 bg-indigo-600 text-white text-sm rounded-md hover:bg-indigo-700">Filter</button>
+        <button type="submit" name="export" value="true"
+                class="px-3 py-1.5 bg-gray-600 text-white text-sm rounded-md hover:bg-gray-700">Export TXT</button>
+        <button type="submit" name="export" value="html"
+                class="px-3 py-1.5 bg-gray-600 text-white text-sm rounded-md hover:bg-gray-700">Export HTML</button>
+        {% if pi_filter or confidence_filter %}
+        <a href="/admin/matchmaker" class="text-sm text-gray-500 hover:text-gray-700">Clear</a>
+        {% endif %}
+    </form>
+    <form method="POST" action="/admin/matchmaker/clear"
+          onsubmit="return confirm('Delete all matchmaker proposals from the database? Slack conversations are not affected.')">
+        <button type="submit"
+                class="px-3 py-1.5 bg-red-600 text-white text-sm rounded-md hover:bg-red-700">Clear All</button>
+    </form>
+</div>
+
+<div class="bg-white rounded-xl shadow-sm border border-gray-200 overflow-hidden">
+    <table class="min-w-full divide-y divide-gray-200">
+        <thead class="bg-gray-50">
+            <tr>
+                <th class="px-4 py-3 text-left text-xs font-medium text-gray-500 uppercase">Confidence</th>
+                <th class="px-4 py-3 text-left text-xs font-medium text-gray-500 uppercase">PI A</th>
+                <th class="px-4 py-3 text-left text-xs font-medium text-gray-500 uppercase">PI B</th>
+                <th class="px-4 py-3 text-left text-xs font-medium text-gray-500 uppercase">Title</th>
+                <th class="px-4 py-3 text-left text-xs font-medium text-gray-500 uppercase">Generated</th>
+                <th class="px-4 py-3 text-left text-xs font-medium text-gray-500 uppercase">Actions</th>
+            </tr>
+        </thead>
+        <tbody class="divide-y divide-gray-100">
+            {% for p in proposals %}
+            {% set conf_meta = {
+                'high':       {'label': 'High',       'color': 'green'},
+                'moderate':   {'label': 'Moderate',   'color': 'yellow'},
+                'speculative':{'label': 'Speculative','color': 'gray'},
+            }.get(p.confidence, {'label': p.confidence | capitalize, 'color': 'gray'}) %}
+            <tr class="hover:bg-gray-50 cursor-pointer" onclick="window.location='/admin/matchmaker/{{ p.id }}'">
+                <td class="px-4 py-3">
+                    <span class="px-2 py-0.5 rounded-full text-xs bg-{{ conf_meta.color }}-100 text-{{ conf_meta.color }}-700">
+                        {{ conf_meta.label }}
+                    </span>
+                </td>
+                <td class="px-4 py-3 text-sm font-medium">{{ p.name_a }}</td>
+                <td class="px-4 py-3 text-sm font-medium">{{ p.name_b }}</td>
+                <td class="px-4 py-3 text-sm text-gray-700 max-w-xs truncate">{{ p.title }}</td>
+                <td class="px-4 py-3 text-sm text-gray-500">
+                    <span data-utc="{{ p.generated_at.isoformat() }}" data-utc-fmt="short">
+                        {{ p.generated_at.strftime('%b %d %H:%M') }}
+                    </span>
+                </td>
+                <td class="px-4 py-3 text-sm" onclick="event.stopPropagation()">
+                    <a href="/admin/matchmaker/{{ p.id }}" class="text-indigo-600 hover:text-indigo-800 mr-3">View</a>
+                    <form method="POST" action="/admin/matchmaker/{{ p.id }}/delete" class="inline"
+                          onsubmit="return confirm('Delete this proposal?')">
+                        <button type="submit" class="text-red-500 hover:text-red-700">Delete</button>
+                    </form>
+                </td>
+            </tr>
+            {% else %}
+            <tr>
+                <td colspan="6" class="px-4 py-8 text-center text-gray-400 text-sm">No proposals yet</td>
+            </tr>
+            {% endfor %}
+        </tbody>
+    </table>
+</div>
+
+<div class="mt-4 text-sm text-gray-400">
+    {{ proposals | length }} proposal{{ 's' if proposals | length != 1 }}
+    {% if pi_filter or confidence_filter %}(filtered){% endif %}
+</div>
+
+{% else %}
+<p class="text-gray-400 text-sm">No proposals generated yet. Use the form above to create one.</p>
+{% endif %}
+
+{% endblock %}
+
+{% block scripts %}
+<script>
+function updateDropdowns() {
+    const aVal = document.getElementById('pi_a_select').value;
+    const bVal = document.getElementById('pi_b_select').value;
+    const btn = document.getElementById('generate-btn');
+    btn.disabled = !(aVal && bVal && aVal !== bVal);
+}
+
+document.getElementById('generate-form').addEventListener('submit', function() {
+    const btn = document.getElementById('generate-btn');
+    const label = document.getElementById('btn-label');
+    const spinner = document.getElementById('btn-spinner');
+    btn.disabled = true;
+    label.textContent = 'Generating…';
+    spinner.classList.remove('hidden');
+});
+</script>
+{% endblock %}
diff --git a/templates/admin/matchmaker_detail.html b/templates/admin/matchmaker_detail.html
new file mode 100644
index 0000000..c849f61
--- /dev/null
+++ b/templates/admin/matchmaker_detail.html
@@ -0,0 +1,79 @@
+{% extends "base.html" %}
+{% block title %}Admin — Matchmaker — {{ proposal.title | truncate(60) }} — CoPI{% endblock %}
+
+{% block extra_head %}
+<script src="https://cdn.jsdelivr.net/npm/marked/marked.min.js"></script>
+<style>
+    .proposal-md h1 { font-weight: 700; font-size: 1.15rem; margin-top: 1rem; margin-bottom: 0.35rem; }
+    .proposal-md h2 { font-weight: 600; font-size: 1rem; margin-top: 0.85rem; margin-bottom: 0.25rem; border-bottom: 1px solid #e5e7eb; padding-bottom: 0.2rem; }
+    .proposal-md p { margin-bottom: 0.6rem; line-height: 1.6; }
+    .proposal-md ul, .proposal-md ol { padding-left: 1.5rem; margin-bottom: 0.6rem; }
+    .proposal-md li { margin-bottom: 0.3rem; line-height: 1.5; }
+    .proposal-md strong { font-weight: 600; }
+</style>
+{% endblock %}
+
+{% block content %}
+
+<!-- Back link -->
+<div class="mb-5">
+    <a href="/admin/matchmaker" class="text-sm text-indigo-600 hover:text-indigo-800">&larr; Back to Matchmaker</a>
+</div>
+
+<!-- Header card -->
+<div class="bg-white rounded-xl shadow-sm border border-gray-200 p-6 mb-6">
+    <div class="flex items-start justify-between gap-4">
+        <div>
+            <h1 class="text-xl font-bold text-gray-900 mb-2">{{ proposal.title }}</h1>
+            <div class="flex items-center gap-4 text-sm text-gray-600 flex-wrap">
+                <span class="font-medium">{{ proposal.name_a }}</span>
+                <span class="text-gray-400">&times;</span>
+                <span class="font-medium">{{ proposal.name_b }}</span>
+                <span class="text-gray-300">|</span>
+                {% set conf_meta = {
+                    'high':       {'label': 'High',       'color': 'green'},
+                    'moderate':   {'label': 'Moderate',   'color': 'yellow'},
+                    'speculative':{'label': 'Speculative','color': 'gray'},
+                }.get(proposal.confidence, {'label': proposal.confidence | capitalize, 'color': 'gray'}) %}
+                <span class="px-2 py-0.5 rounded-full text-xs font-medium bg-{{ conf_meta.color }}-100 text-{{ conf_meta.color }}-700">
+                    {{ conf_meta.label }} Confidence
+                </span>
+                <span class="text-gray-400">|</span>
+                <span class="text-gray-400">
+                    Generated <span data-utc="{{ proposal.generated_at.isoformat() }}" data-utc-fmt="short">{{ proposal.generated_at.strftime('%b %d, %Y %H:%M') }}</span>
+                </span>
+            </div>
+            {% if proposal.input_tokens %}
+            <div class="mt-2 text-xs text-gray-400">
+                {{ proposal.llm_model }} &bull; {{ proposal.input_tokens | int }} in / {{ proposal.output_tokens | int }} out tokens
+            </div>
+            {% endif %}
+        </div>
+        <form method="POST" action="/admin/matchmaker/{{ proposal.id }}/delete"
+              onsubmit="return confirm('Delete this proposal?')" class="shrink-0">
+            <button type="submit"
+                    class="px-3 py-1.5 text-sm text-red-600 border border-red-200 rounded-md hover:bg-red-50">
+                Delete
+            </button>
+        </form>
+    </div>
+</div>
+
+<!-- Proposal body -->
+<div class="bg-white rounded-xl shadow-sm border border-gray-200 p-8">
+    <div class="proposal-md text-gray-800 max-w-3xl"
+         data-markdown="{{ proposal.proposal_md | extract_proposal | e }}"></div>
+</div>
+
+{% endblock %}
+
+{% block scripts %}
+<script>
+document.addEventListener('DOMContentLoaded', function() {
+    document.querySelectorAll('[data-markdown]').forEach(function(el) {
+        var md = el.getAttribute('data-markdown');
+        if (md) { el.innerHTML = marked.parse(md); }
+    });
+});
+</script>
+{% endblock %}
diff --git a/templates/admin/matchmaker_export.html b/templates/admin/matchmaker_export.html
new file mode 100644
index 0000000..23e6488
--- /dev/null
+++ b/templates/admin/matchmaker_export.html
@@ -0,0 +1,57 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+    <meta charset="UTF-8">
+    <title>CoPI — Matchmaker Proposals Export</title>
+    <script src="https://cdn.jsdelivr.net/npm/marked/marked.min.js"></script>
+    <style>
+        body { font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, sans-serif; max-width: 800px; margin: 2rem auto; padding: 0 1rem; color: #1f2937; }
+        h1 { font-size: 1.5rem; border-bottom: 2px solid #e5e7eb; padding-bottom: 0.5rem; margin-bottom: 2rem; }
+        .proposal { margin-bottom: 2.5rem; page-break-inside: avoid; }
+        .proposal-header { background: #f9fafb; border: 1px solid #e5e7eb; border-radius: 8px; padding: 0.75rem 1rem; margin-bottom: 1rem; font-size: 0.875rem; color: #6b7280; }
+        .proposal-header strong { color: #1f2937; }
+        .proposal-title { font-size: 1rem; font-weight: 600; color: #1f2937; margin-bottom: 0.25rem; }
+        .proposal-body { font-size: 0.9375rem; line-height: 1.6; }
+        .proposal-body h1 { font-weight: 700; font-size: 1.1rem; margin-top: 0.75rem; margin-bottom: 0.25rem; }
+        .proposal-body h2 { font-weight: 600; font-size: 1rem; margin-top: 0.75rem; margin-bottom: 0.25rem; }
+        .proposal-body h3 { font-size: 0.95rem; margin-top: 0.5rem; margin-bottom: 0.25rem; }
+        .proposal-body p { margin-bottom: 0.5rem; }
+        .proposal-body ul, .proposal-body ol { padding-left: 1.5rem; margin-bottom: 0.5rem; }
+        .proposal-body li { margin-bottom: 0.25rem; }
+        .proposal-body a { color: #4f46e5; }
+        .proposal-body strong { font-weight: 600; }
+        hr { border: none; border-top: 1px solid #e5e7eb; margin: 2rem 0; }
+        .footer { text-align: center; font-size: 0.75rem; color: #9ca3af; margin-top: 3rem; }
+        @media print { body { margin: 0; } .proposal { page-break-inside: avoid; } }
+    </style>
+</head>
+<body>
+    <h1>CoPI — Matchmaker Proposals</h1>
+
+    {% for p in proposals %}
+    {% if not loop.first %}<hr>{% endif %}
+    <div class="proposal">
+        <div class="proposal-header">
+            {% if p.title %}<div class="proposal-title">{{ p.title }}</div>{% endif %}
+            <strong>{{ p.name_a }}</strong> + <strong>{{ p.name_b }}</strong>
+            &nbsp;&middot;&nbsp; {{ p.confidence | capitalize }}
+            &nbsp;&middot;&nbsp; {{ p.date }}
+        </div>
+        <div class="proposal-body" data-markdown="{{ p.proposal_md | e }}"></div>
+    </div>
+    {% else %}
+    <p style="color: #9ca3af;">No proposals found with current filters.</p>
+    {% endfor %}
+
+    <div class="footer">
+        Exported from CoPI &mdash; {{ proposals | length }} proposal{{ 's' if proposals | length != 1 }}
+    </div>
+
+    <script>
+    document.querySelectorAll('[data-markdown]').forEach(function(el) {
+        var md = el.getAttribute('data-markdown');
+        if (md) { el.innerHTML = marked.parse(md); }
+    });
+    </script>
+</body>
+</html>
diff --git a/templates/admin/podcast.html b/templates/admin/podcast.html
new file mode 100644
index 0000000..1f89ea4
--- /dev/null
+++ b/templates/admin/podcast.html
@@ -0,0 +1,197 @@
+{% extends "base.html" %}
+{% block title %}Admin — Podcast — CoPI{% endblock %}
+
+{% block content %}
+<div class="flex items-center justify-between mb-6">
+    <h1 class="text-2xl font-bold text-gray-900">Podcast Episodes</h1>
+    <span class="text-sm text-gray-500">{{ total }} total episodes</span>
+</div>
+
+<!-- Summary cards -->
+<div class="grid grid-cols-3 gap-4 mb-4">
+    <div class="bg-white rounded-xl border border-gray-200 p-4 text-center">
+        <div class="text-3xl font-bold text-indigo-600">{{ total }}</div>
+        <div class="text-sm text-gray-500 mt-1">Total Episodes</div>
+    </div>
+    <div class="bg-white rounded-xl border border-gray-200 p-4 text-center">
+        <div class="text-3xl font-bold text-green-600">{{ with_audio }}</div>
+        <div class="text-sm text-gray-500 mt-1">With Audio</div>
+    </div>
+    <div class="bg-white rounded-xl border border-gray-200 p-4 text-center">
+        <div class="text-3xl font-bold text-blue-600">{{ slack_delivered }}</div>
+        <div class="text-sm text-gray-500 mt-1">Slack Delivered</div>
+    </div>
+</div>
+
+<!-- LLM usage stats -->
+<div class="grid grid-cols-3 gap-4 mb-8">
+    <div class="bg-white rounded-xl border border-gray-200 p-4 text-center">
+        <div class="text-2xl font-bold text-purple-600">{{ llm_call_count }}</div>
+        <div class="text-sm text-gray-500 mt-1">LLM Calls (podcast)</div>
+    </div>
+    <div class="bg-white rounded-xl border border-gray-200 p-4 text-center">
+        <div class="text-2xl font-bold text-purple-600">{{ "{:,}".format(llm_input_tokens) }}</div>
+        <div class="text-sm text-gray-500 mt-1">Input Tokens</div>
+    </div>
+    <div class="bg-white rounded-xl border border-gray-200 p-4 text-center">
+        <div class="text-2xl font-bold text-purple-600">{{ "{:,}".format(llm_output_tokens) }}</div>
+        <div class="text-sm text-gray-500 mt-1">Output Tokens</div>
+    </div>
+</div>
+
+<!-- Filters -->
+<div class="bg-white rounded-lg border border-gray-200 p-4 mb-4 flex flex-wrap gap-4 items-end">
+    <div>
+        <label class="text-xs font-medium text-gray-600 block mb-1">Agent</label>
+        <select onchange="applyFilter()" id="agent-filter"
+                class="border border-gray-300 rounded px-2 py-1 text-sm">
+            <option value="">All agents</option>
+            {% for aid in agent_ids %}
+            <option value="{{ aid }}" {% if agent_filter == aid %}selected{% endif %}>{{ aid }}</option>
+            {% endfor %}
+        </select>
+    </div>
+    {% if agent_filter %}
+    <div>
+        <a href="/admin/podcast" class="text-sm text-indigo-600 hover:underline">Clear filter</a>
+    </div>
+    <div>
+        <a href="{{ base_url }}/podcast/{{ agent_filter }}/feed.xml" target="_blank"
+           class="inline-flex items-center gap-1 text-sm text-orange-600 hover:underline">
+            RSS Feed ↗
+        </a>
+    </div>
+    <div>
+        <a href="/agent/{{ agent_filter }}/podcast-settings"
+           class="inline-flex items-center gap-1 text-sm text-indigo-600 hover:underline">
+            Podcast Settings ↗
+        </a>
+    </div>
+    {% endif %}
+</div>
+
+<!-- Preferences summary (visible when an agent is selected) -->
+{% if agent_filter %}
+{% set prefs = prefs_by_agent.get(agent_filter) %}
+<div class="bg-white rounded-lg border border-gray-200 p-4 mb-4">
+    <div class="flex items-center justify-between mb-2">
+        <h3 class="text-sm font-medium text-gray-700">Podcast Preferences — {{ agent_filter }}</h3>
+        <a href="/agent/{{ agent_filter }}/podcast-settings"
+           class="text-xs text-indigo-600 hover:underline">Edit ↗</a>
+    </div>
+    {% if prefs %}
+    <dl class="grid grid-cols-3 gap-4 text-sm">
+        <div>
+            <dt class="text-xs font-medium text-gray-500 uppercase mb-0.5">Voice</dt>
+            <dd class="text-gray-800">
+                {% if prefs.voice_id %}{{ prefs.voice_id }}{% else %}<span class="text-gray-400">system default</span>{% endif %}
+            </dd>
+        </div>
+        <div>
+            <dt class="text-xs font-medium text-gray-500 uppercase mb-0.5">Extra Keywords</dt>
+            <dd class="text-gray-800">
+                {% if prefs.extra_keywords %}
+                <span class="text-gray-600">{{ prefs.extra_keywords | length }} term(s)</span>
+                <div class="text-xs text-gray-400 mt-0.5">{{ prefs.extra_keywords | join(', ') }}</div>
+                {% else %}
+                <span class="text-gray-400">none</span>
+                {% endif %}
+            </dd>
+        </div>
+        <div>
+            <dt class="text-xs font-medium text-gray-500 uppercase mb-0.5">Source Preferences</dt>
+            <dd class="text-gray-800 text-xs">
+                {% if prefs.preferred_journals %}
+                <div class="text-green-700 mb-0.5">▲ {{ prefs.preferred_journals | join(', ') }}</div>
+                {% endif %}
+                {% if prefs.deprioritized_journals %}
+                <div class="text-amber-700">▼ {{ prefs.deprioritized_journals | join(', ') }}</div>
+                {% endif %}
+                {% if not prefs.preferred_journals and not prefs.deprioritized_journals %}
+                <span class="text-gray-400">none</span>
+                {% endif %}
+            </dd>
+        </div>
+    </dl>
+    {% else %}
+    <p class="text-sm text-gray-400">No preferences configured for this agent.
+        <a href="/agent/{{ agent_filter }}/podcast-settings" class="text-indigo-600 hover:underline">Set up preferences ↗</a>
+    </p>
+    {% endif %}
+</div>
+{% endif %}
+
+<!-- Episodes table -->
+<div class="bg-white rounded-xl shadow-sm border border-gray-200 overflow-hidden">
+    <table class="min-w-full divide-y divide-gray-200">
+        <thead class="bg-gray-50">
+            <tr>
+                <th class="px-4 py-3 text-left text-xs font-medium text-gray-500 uppercase">Date</th>
+                <th class="px-4 py-3 text-left text-xs font-medium text-gray-500 uppercase">Agent</th>
+                <th class="px-4 py-3 text-left text-xs font-medium text-gray-500 uppercase">Paper</th>
+                <th class="px-4 py-3 text-left text-xs font-medium text-gray-500 uppercase">PMID</th>
+                <th class="px-4 py-3 text-left text-xs font-medium text-gray-500 uppercase">Audio</th>
+                <th class="px-4 py-3 text-left text-xs font-medium text-gray-500 uppercase">Slack</th>
+            </tr>
+        </thead>
+        <tbody class="divide-y divide-gray-100">
+            {% for ep in episodes %}
+            <tr class="hover:bg-gray-50">
+                <td class="px-4 py-3 text-sm text-gray-700 whitespace-nowrap">{{ ep.episode_date }}</td>
+                <td class="px-4 py-3 text-sm">
+                    {% if ep.agent_id %}
+                    <span class="font-mono text-xs bg-gray-100 px-1.5 py-0.5 rounded">{{ ep.agent_id }}</span>
+                    {% elif ep.user_id %}
+                    <span class="font-mono text-xs bg-blue-100 text-blue-700 px-1.5 py-0.5 rounded" title="User {{ ep.user_id }}">user:{{ ep.user_id | string | truncate(8, end='…') }}</span>
+                    {% else %}
+                    <span class="text-gray-400 text-xs">—</span>
+                    {% endif %}
+                </td>
+                <td class="px-4 py-3 text-sm max-w-xs">
+                    <div class="font-medium text-gray-800 truncate" title="{{ ep.paper_title }}">{{ ep.paper_title }}</div>
+                    <div class="text-xs text-gray-500 mt-0.5">{{ ep.paper_journal }} · {{ ep.paper_year }}</div>
+                    {% if ep.selection_justification %}
+                    <div class="text-xs text-gray-400 mt-0.5 italic truncate" title="{{ ep.selection_justification }}">{{ ep.selection_justification }}</div>
+                    {% endif %}
+                </td>
+                <td class="px-4 py-3 text-sm">{# PMID link: uses ep.paper_url when set, otherwise a PubMed URL built from ep.pmid. rel keeps the external page from reaching window.opener or receiving this admin URL as referrer. #}
+                    <a href="{{ ep.paper_url or 'https://pubmed.ncbi.nlm.nih.gov/' ~ ep.pmid ~ '/' }}" target="_blank" rel="noopener noreferrer"
+                       class="text-indigo-600 hover:underline font-mono text-xs">{{ ep.pmid }}</a>
+                </td>
+                <td class="px-4 py-3 text-sm">
+                    {% if ep.audio_file_path %}
+                    <span class="text-green-600 text-xs">✓
+                        {% if ep.audio_duration_seconds %}
+                        {{ ep.audio_duration_seconds // 60 }}:{{ '%02d' % (ep.audio_duration_seconds % 60) }}
+                        {% endif %}
+                    </span>
+                    {% else %}
+                    <span class="text-gray-400 text-xs">—</span>
+                    {% endif %}
+                </td>
+                <td class="px-4 py-3 text-sm">
+                    {% if ep.slack_delivered %}
+                    <span class="text-green-600 text-xs">✓</span>
+                    {% else %}
+                    <span class="text-gray-400 text-xs">—</span>
+                    {% endif %}
+                </td>
+            </tr>
+            {% else %}
+            <tr>
+                <td colspan="6" class="px-4 py-8 text-center text-gray-400 text-sm">No podcast episodes yet</td>
+            </tr>
+            {% endfor %}
+        </tbody>
+    </table>
+</div>
+
+<script>
+function applyFilter() {
+    const agent = document.getElementById('agent-filter').value;
+    const params = new URLSearchParams();
+    if (agent) params.set('agent_filter', agent);
+    location.href = '/admin/podcast' + (params.toString() ? '?' + params.toString() : '');
+}
+</script>
+{% endblock %}
diff --git a/templates/agent/dashboard.html b/templates/agent/dashboard.html
index fcc73dd..daf119f 100644
--- a/templates/agent/dashboard.html
+++ b/templates/agent/dashboard.html
@@ -14,6 +14,14 @@
     .proposal-md a { color: #4f46e5; text-decoration: underline; }
     textarea { border: 1px solid #d1d5db; border-radius: 0.375rem; }
     textarea:focus { outline: none; border-color: #6366f1; box-shadow: 0 0 0 2px rgba(99,102,241,0.2); }
+    .disc-bubble p { margin-bottom: 0.4rem; }
+    .disc-bubble p:last-child { margin-bottom: 0; }
+    .disc-bubble strong { font-weight: 600; }
+    .disc-bubble a { text-decoration: underline; }
+    .disc-bubble ul, .disc-bubble ol { padding-left: 1.25rem; margin-bottom: 0.4rem; }
+    .disc-bubble li { margin-bottom: 0.15rem; }
+    .disc-bubble-mine a { color: rgba(255,255,255,0.85); }
+    .disc-bubble-mine strong { color: white; }
 </style>
 {% endblock %}
 
@@ -25,14 +33,40 @@
             <h1 class="text-2xl font-bold text-gray-900">{{ agent.bot_name }}</h1>
             <p class="text-sm text-gray-500">Representing the {{ agent.pi_name }} lab</p>
         </div>
-        <span class="px-3 py-1 rounded-full text-sm
-            {% if agent.status == 'active' %}bg-green-100 text-green-700
-            {% elif agent.status == 'suspended' %}bg-amber-100 text-amber-700
-            {% else %}bg-gray-100 text-gray-600{% endif %}">
-            {{ agent.status | capitalize }}
-        </span>
+        <div class="flex items-center gap-3">
+            <span class="px-3 py-1 rounded-full text-sm
+                {% if agent.is_paused %}bg-yellow-100 text-yellow-700
+                {% elif agent.status == 'active' %}bg-green-100 text-green-700
+                {% elif agent.status == 'suspended' %}bg-amber-100 text-amber-700
+                {% else %}bg-gray-100 text-gray-600{% endif %}">
+                {% if agent.is_paused %}Paused{% else %}{{ agent.status | capitalize }}{% endif %}
+            </span>
+            {% if is_owner %}
+            {% if agent.is_paused %}
+            <form method="POST" action="/agent/{{ agent.agent_id }}/resume">
+                <button type="submit"
+                        class="px-3 py-1.5 bg-green-600 text-white text-sm rounded-md hover:bg-green-700">
+                    Resume Agent
+                </button>
+            </form>
+            {% else %}
+            <form method="POST" action="/agent/{{ agent.agent_id }}/pause">
+                <button type="submit"
+                        class="px-3 py-1.5 bg-yellow-500 text-white text-sm rounded-md hover:bg-yellow-600">
+                    Pause Agent
+                </button>
+            </form>
+            {% endif %}
+            {% endif %}
+        </div>
     </div>
 
+    {% if agent.is_paused %}
+    <div class="bg-yellow-50 border border-yellow-200 rounded-lg p-4 mb-6 text-sm text-yellow-800">
+        Your agent is currently paused and will not participate in the simulation until resumed.
+    </div>
+    {% endif %}
+
     {% if not is_owner %}
     <!-- Delegate banner -->
     <div class="bg-indigo-50 border border-indigo-200 rounded-lg p-3 mb-6 text-sm text-indigo-700">
@@ -91,74 +125,115 @@ <h1 class="text-2xl font-bold text-gray-900">{{ agent.bot_name }}</h1>
         <h2 class="text-lg font-semibold text-gray-800 mb-4">Proposals Awaiting Your Review</h2>
         {% for entry in unreviewed %}
         {% set p = entry.proposal %}
+        {% set idx = loop.index %}
         <div class="bg-white rounded-xl shadow-sm border border-gray-200 mb-4">
-            <div class="px-6 py-4 border-b border-gray-100 flex items-center justify-between">
-                <div>
-                    <span class="text-sm font-medium text-gray-700">#{{ p.channel }}</span>
-                    <span class="text-gray-400 mx-2">&middot;</span>
-                    <span class="text-sm text-gray-500">with {{ entry.other_agent | capitalize }}Bot</span>
+            <!-- Accordion header -->
+            <div class="px-6 py-4 cursor-pointer flex items-center justify-between gap-4"
+                 onclick="toggleProposal({{ idx }}, {{ unreviewed | length }})">
+                <div class="min-w-0">
+                    <div class="text-sm font-semibold text-gray-800 truncate">{{ entry.title }}</div>
+                    <div class="text-xs text-gray-400 mt-0.5">
+                        #{{ p.channel }} &middot; with {{ entry.other_agent | capitalize }}Bot &middot;
+                        <span data-utc="{{ p.decided_at.isoformat() }}" data-utc-fmt="short">{{ p.decided_at.strftime('%b %d, %Y') }}</span>
+                    </div>
                 </div>
-                <span class="text-xs text-gray-400" data-utc="{{ p.decided_at.isoformat() }}" data-utc-fmt="short">{{ p.decided_at.strftime('%b %d, %Y') }}</span>
+                <svg id="prop-chevron-{{ idx }}"
+                     class="w-4 h-4 text-gray-400 flex-shrink-0 transition-transform {{ '' if loop.first else 'rotate-180' }}"
+                     fill="none" viewBox="0 0 24 24" stroke="currentColor">
+                    <path stroke-linecap="round" stroke-linejoin="round" stroke-width="2" d="M5 15l7-7 7 7"/>
+                </svg>
             </div>
-            <div class="px-6 py-4">
-                <div class="text-sm text-gray-700 proposal-md" data-markdown="{{ p.summary_text | e }}"></div>
-                <div class="pt-4 border-t border-gray-100 mt-4">
-                    <!-- Tab buttons -->
-                    <div class="flex gap-2 mb-4">
-                        <button type="button" onclick="showTab(this, 'review-{{ loop.index }}')"
-                                class="tab-btn px-3 py-1.5 text-sm font-medium rounded-lg bg-indigo-50 text-indigo-700 border border-indigo-200">
-                            Rate &amp; Close
-                        </button>
-                        <button type="button" onclick="showTab(this, 'reopen-{{ loop.index }}')"
-                                class="tab-btn px-3 py-1.5 text-sm font-medium rounded-lg text-gray-500 border border-gray-200 hover:bg-gray-50">
-                            Give Guidance &amp; Reopen
-                        </button>
-                    </div>
+            <!-- Accordion body -->
+            <div id="prop-body-{{ idx }}" class="{{ '' if loop.first else 'hidden' }} border-t border-gray-100">
+                <div class="px-6 py-4">
+                    <!-- Proposal content -->
+                    <div class="text-sm text-gray-700 proposal-md" data-markdown="{{ p.summary_text | e }}"></div>
 
-                    <!-- Rate & Close tab -->
-                    <div id="review-{{ loop.index }}" class="tab-panel">
-                        <form method="POST" action="/agent/{{ agent.agent_id }}/proposals/{{ p.id }}/review">
-                            <div class="grid grid-cols-2 md:grid-cols-4 gap-2 mb-3">
-                                {% set ratings = [
-                                    (1, "Not a good idea", "Not interesting OR multiple major weaknesses"),
-                                    (2, "Good idea", "Medium interest OR one major weakness"),
-                                    (3, "Great idea", "High interest, minor weaknesses only"),
-                                    (4, "Excellent idea", "High interest, no notable weaknesses"),
-                                ] %}
-                                {% for val, label, desc in ratings %}
-                                <label class="flex items-start gap-2 cursor-pointer p-2 rounded-lg border border-gray-200 hover:bg-gray-50">
-                                    <input type="radio" name="rating" value="{{ val }}" class="mt-0.5 text-indigo-600" required>
-                                    <div>
-                                        <div class="text-sm font-medium text-gray-800">{{ val }} — {{ label }}</div>
-                                        <div class="text-xs text-gray-500">{{ desc }}</div>
-                                    </div>
-                                </label>
-                                {% endfor %}
+                    <!-- Discussion toggle -->
+                    {% if entry.discussion %}
+                    <div class="mt-4">
+                        <button type="button" onclick="toggleDiscussion(this, 'disc-{{ idx }}')"
+                                class="text-xs text-indigo-500 hover:text-indigo-700 flex items-center gap-1">
+                            <span class="disc-label">Show discussion</span>
+                            <svg class="w-3 h-3 disc-arrow" fill="none" viewBox="0 0 24 24" stroke="currentColor">
+                                <path stroke-linecap="round" stroke-linejoin="round" stroke-width="2" d="M19 9l-7 7-7-7"/>
+                            </svg>
+                        </button>
+                        <div id="disc-{{ idx }}" class="hidden mt-3 max-h-[32rem] overflow-y-auto rounded-xl border border-gray-100 bg-gray-50 p-4 space-y-4">
+                            {% for msg in entry.discussion %}
+                            {% set is_mine = msg.agent_id == agent.agent_id %}
+                            <div class="flex flex-col {{ 'items-end' if is_mine else 'items-start' }}">
+                                <div class="flex items-center gap-1.5 mb-1 {{ 'flex-row-reverse' if is_mine else '' }}">
+                                    <span class="text-xs font-medium text-gray-600">{{ msg.agent_id | capitalize }}Bot</span>
+                                    <span class="text-xs text-gray-400" data-utc="{{ msg.ts }}" data-utc-fmt="disc">{{ msg.ts }}</span>
+                                </div>
+                                <div class="max-w-[85%] px-3.5 py-2.5 rounded-2xl text-sm leading-relaxed disc-bubble
+                                            {{ 'bg-indigo-600 text-white rounded-tr-sm disc-bubble-mine' if is_mine else 'bg-white text-gray-700 rounded-tl-sm border border-gray-200 shadow-sm' }}"
+                                     data-markdown="{{ msg.text | e }}"></div>
                             </div>
-                            <textarea name="comment" rows="3" placeholder="Optional comment — what did the agent get right or wrong?"
-                                      class="w-full text-sm px-3 py-2 mb-3"></textarea>
-                            <button type="submit"
-                                    class="px-5 py-2 bg-indigo-600 text-white text-sm font-medium rounded-lg hover:bg-indigo-700">
-                                Submit Review
-                            </button>
-                        </form>
+                            {% endfor %}
+                        </div>
                     </div>
+                    {% endif %}
 
-                    <!-- Give Guidance & Reopen tab -->
-                    <div id="reopen-{{ loop.index }}" class="tab-panel hidden">
-                        <p class="text-sm text-gray-500 mb-3">
-                            Send guidance to both agents. Your feedback will be posted in the Slack thread
-                            and the agents will continue the conversation with a fresh set of replies.
-                        </p>
-                        <form method="POST" action="/agent/{{ agent.agent_id }}/proposals/{{ p.id }}/reopen">
-                            <textarea name="guidance" rows="4" required
-                                      placeholder="e.g., Work out the experimental design in more detail. Focus on the aging angle rather than general drug repurposing."
-                                      class="w-full text-sm px-3 py-2 mb-3 border border-gray-300 rounded-lg"></textarea>
-                            <button type="submit"
-                                    class="px-5 py-2 bg-amber-600 text-white text-sm font-medium rounded-lg hover:bg-amber-700">
-                                Post Guidance &amp; Reopen Thread
+                    <div class="pt-4 border-t border-gray-100 mt-4">
+                        <!-- Tab buttons -->
+                        <div class="flex gap-2 mb-4">
+                            <button type="button" onclick="showTab(this, 'review-{{ idx }}')"
+                                    class="tab-btn px-3 py-1.5 text-sm font-medium rounded-lg bg-indigo-50 text-indigo-700 border border-indigo-200">
+                                Rate &amp; Close
                             </button>
-                        </form>
+                            <button type="button" onclick="showTab(this, 'reopen-{{ idx }}')"
+                                    class="tab-btn px-3 py-1.5 text-sm font-medium rounded-lg text-gray-500 border border-gray-200 hover:bg-gray-50">
+                                Give Guidance &amp; Reopen
+                            </button>
+                        </div>
+
+                        <!-- Rate & Close tab -->
+                        <div id="review-{{ idx }}" class="tab-panel">
+                            <form method="POST" action="/agent/{{ agent.agent_id }}/proposals/{{ p.id }}/review">
+                                <div class="grid grid-cols-2 md:grid-cols-4 gap-2 mb-3">
+                                    {% set ratings = [
+                                        (1, "Not a good idea", "Not interesting OR multiple major weaknesses"),
+                                        (2, "Good idea", "Medium interest OR one major weakness"),
+                                        (3, "Great idea", "High interest, minor weaknesses only"),
+                                        (4, "Excellent idea", "High interest, no notable weaknesses"),
+                                    ] %}
+                                    {% for val, label, desc in ratings %}
+                                    <label class="flex items-start gap-2 cursor-pointer p-2 rounded-lg border border-gray-200 hover:bg-gray-50">
+                                        <input type="radio" name="rating" value="{{ val }}" class="mt-0.5 text-indigo-600" required>
+                                        <div>
+                                            <div class="text-sm font-medium text-gray-800">{{ val }} — {{ label }}</div>
+                                            <div class="text-xs text-gray-500">{{ desc }}</div>
+                                        </div>
+                                    </label>
+                                    {% endfor %}
+                                </div>
+                                <textarea name="comment" rows="3" placeholder="Optional comment — what did the agent get right or wrong?"
+                                          class="w-full text-sm px-3 py-2 mb-3"></textarea>
+                                <button type="submit"
+                                        class="px-5 py-2 bg-indigo-600 text-white text-sm font-medium rounded-lg hover:bg-indigo-700">
+                                    Submit Review
+                                </button>
+                            </form>
+                        </div>
+
+                        <!-- Give Guidance & Reopen tab -->
+                        <div id="reopen-{{ idx }}" class="tab-panel hidden">
+                            <p class="text-sm text-gray-500 mb-3">
+                                Send guidance to both agents. Your feedback will be posted in the Slack thread
+                                and the agents will continue the conversation with a fresh set of replies.
+                            </p>
+                            <form method="POST" action="/agent/{{ agent.agent_id }}/proposals/{{ p.id }}/reopen">
+                                <textarea name="guidance" rows="4" required
+                                          placeholder="e.g., Work out the experimental design in more detail. Focus on the aging angle rather than general drug repurposing."
+                                          class="w-full text-sm px-3 py-2 mb-3 border border-gray-300 rounded-lg"></textarea>
+                                <button type="submit"
+                                        class="px-5 py-2 bg-amber-600 text-white text-sm font-medium rounded-lg hover:bg-amber-700">
+                                    Post Guidance &amp; Reopen Thread
+                                </button>
+                            </form>
+                        </div>
                     </div>
                 </div>
             </div>
@@ -222,6 +297,13 @@ <h2 class="text-lg font-semibold text-gray-800 mb-4">Reviewed Proposals</h2>
             <p class="text-sm text-gray-500">View and edit your agent's private behavioral profile.</p>
         </a>
 
+        <!-- Podcast settings -->
+        <a href="/agent/{{ agent.agent_id }}/podcast-settings"
+           class="bg-white rounded-xl border border-gray-200 p-5 hover:border-indigo-300 transition">
+            <div class="text-lg font-semibold text-gray-800 mb-1">Podcast Settings</div>
+            <p class="text-sm text-gray-500">Customize your daily research briefing: voice, extra keywords, and journal preferences.</p>
+        </a>
+
         <!-- Slack -->
         <a href="{{ slack_invite_url }}" target="_blank"
            class="bg-white rounded-xl border border-gray-200 p-5 hover:border-indigo-300 transition">
@@ -345,8 +427,31 @@ <h2 class="text-lg font-semibold text-gray-800 mb-4">Reviewed Proposals</h2>
     });
 });
 
+function toggleProposal(idx, total) {
+    for (var i = 1; i <= total; i++) {
+        var body = document.getElementById('prop-body-' + i);
+        var chev = document.getElementById('prop-chevron-' + i);
+        if (!body) continue;
+        if (i === idx) {
+            var opening = body.classList.toggle('hidden');
+            if (chev) chev.style.transform = opening ? 'rotate(180deg)' : '';
+        } else {
+            body.classList.add('hidden');
+            if (chev) chev.style.transform = 'rotate(180deg)';
+        }
+    }
+}
+
+function toggleDiscussion(btn, panelId) {
+    var panel = document.getElementById(panelId);
+    var label = btn.querySelector('.disc-label');
+    var arrow = btn.querySelector('.disc-arrow');
+    var hidden = panel.classList.toggle('hidden');
+    label.textContent = hidden ? 'Show discussion' : 'Hide discussion';
+    if (arrow) arrow.style.transform = hidden ? '' : 'rotate(180deg)';
+}
+
 function showTab(btn, panelId) {
-    // Find sibling tab buttons and panels within the same proposal card
     var container = btn.closest('.border-t');
     var buttons = container.querySelectorAll('.tab-btn');
     var panels = container.querySelectorAll('.tab-panel');
diff --git a/templates/agent/podcast_settings.html b/templates/agent/podcast_settings.html
new file mode 100644
index 0000000..cdd5d58
--- /dev/null
+++ b/templates/agent/podcast_settings.html
@@ -0,0 +1,126 @@
+{% extends "base.html" %}
+{% block title %}Podcast Settings — {{ agent.bot_name }} — CoPI{% endblock %}
+
+{% block content %}
+<div class="max-w-2xl mx-auto">
+    <div class="flex items-center justify-between mb-6">
+        <div>
+            <a href="/agent/{{ agent.agent_id }}/dashboard" class="text-sm text-gray-500 hover:text-gray-700">&larr; My Agent</a>
+            <h1 class="text-2xl font-bold text-gray-900 mt-1">Podcast Settings</h1>
+            <p class="text-sm text-gray-500">Customize your daily research briefing for {{ agent.bot_name }}</p>
+        </div>
+    </div>
+
+    {% if saved %}
+    <div class="bg-green-50 border border-green-200 rounded-lg p-3 mb-6 text-sm text-green-700">
+        Preferences saved successfully.
+    </div>
+    {% endif %}
+
+    <form method="POST" action="/agent/{{ agent.agent_id }}/podcast-settings">
+        <input type="hidden" name="podcast_enabled" value="0" />
+
+        <!-- Enable / disable toggle -->
+        <div class="bg-white rounded-xl shadow-sm border border-gray-200 p-6 mb-4 flex items-center justify-between">
+            <div>
+                <h2 class="text-base font-semibold text-gray-800">Enable Podcast</h2>
+                <p class="text-sm text-gray-500 mt-0.5">
+                    When enabled, a new research briefing is generated daily and sent via Slack DM.
+                </p>
+            </div>
+            <label class="relative inline-flex items-center cursor-pointer ml-6 shrink-0">
+                <input type="checkbox" name="podcast_enabled" value="1"
+                       id="podcast-enabled-toggle"
+                       {% if not prefs or prefs.podcast_enabled %}checked{% endif %}
+                       class="sr-only peer"
+                       onchange="this.form.querySelector('input[type=hidden][name=podcast_enabled]').disabled = this.checked">
+                <div class="w-11 h-6 bg-gray-200 peer-focus:outline-none peer-focus:ring-2 peer-focus:ring-indigo-500
+                            rounded-full peer peer-checked:after:translate-x-full peer-checked:after:border-white
+                            after:content-[''] after:absolute after:top-[2px] after:left-[2px]
+                            after:bg-white after:border-gray-300 after:border after:rounded-full after:h-5 after:w-5
+                            after:transition-all peer-checked:bg-indigo-600"></div>
+            </label>
+        </div>
+
+        <!-- Voice selection -->
+        <div class="bg-white rounded-xl shadow-sm border border-gray-200 p-6 mb-4">
+            <h2 class="text-base font-semibold text-gray-800 mb-1">Voice</h2>
+            <p class="text-sm text-gray-500 mb-4">
+                Select the text-to-speech voice used for your audio episodes.
+                Voices are from Mistral AI's <code class="text-xs bg-gray-100 px-1 rounded">voxtral-mini-tts-latest</code> model.
+            </p>
+            <select name="voice_id"
+                    class="w-full border border-gray-300 rounded-lg px-3 py-2 text-sm focus:ring-indigo-500 focus:border-indigo-500">
+                <option value="" {% if not prefs or not prefs.voice_id %}selected{% endif %}>
+                    Default (system setting)
+                </option>
+                {% for voice_id, voice_label in voices %}
+                <option value="{{ voice_id }}"
+                        {% if prefs and prefs.voice_id == voice_id %}selected{% endif %}>
+                    {{ voice_label }}
+                </option>
+                {% endfor %}
+            </select>
+        </div>
+
+        <!-- Extra search keywords -->
+        <div class="bg-white rounded-xl shadow-sm border border-gray-200 p-6 mb-4">
+            <h2 class="text-base font-semibold text-gray-800 mb-1">Extra Search Keywords</h2>
+            <p class="text-sm text-gray-500 mb-4">
+                Additional terms to include in the daily literature search, beyond what is
+                auto-extracted from your lab profile. One keyword or phrase per line (max 20).
+                These are added as quoted PubMed search terms.
+            </p>
+            <textarea name="extra_keywords_raw" rows="6"
+                      placeholder="insulin receptor substrate&#10;adipose tissue browning&#10;mitochondrial fission"
+                      class="w-full text-sm border border-gray-300 rounded-lg px-3 py-2 focus:ring-indigo-500 focus:border-indigo-500 font-mono">{% if prefs and prefs.extra_keywords %}{{ prefs.extra_keywords | join('\n') }}{% endif %}</textarea>
+            <p class="text-xs text-gray-400 mt-1">
+                {% if prefs and prefs.extra_keywords %}{{ prefs.extra_keywords | length }} keyword(s) saved.{% else %}No extra keywords set.{% endif %}
+            </p>
+        </div>
+
+        <!-- Source preferences -->
+        <div class="bg-white rounded-xl shadow-sm border border-gray-200 p-6 mb-4">
+            <h2 class="text-base font-semibold text-gray-800 mb-1">Source Preferences</h2>
+            <p class="text-sm text-gray-500 mb-5">
+                Guide the article selection by telling the AI which journals or preprint servers
+                to prioritize or avoid. One source per line (or comma-separated).
+            </p>
+
+            <div class="mb-4">
+                <label class="block text-sm font-medium text-gray-700 mb-1">
+                    Preferred sources
+                    <span class="font-normal text-gray-400 ml-1">— given extra weight when relevance is comparable</span>
+                </label>
+                <textarea name="preferred_journals_raw" rows="4"
+                          placeholder="Nature Methods&#10;Cell Systems&#10;eLife&#10;bioRxiv"
+                          class="w-full text-sm border border-gray-300 rounded-lg px-3 py-2 focus:ring-indigo-500 focus:border-indigo-500 font-mono">{% if prefs and prefs.preferred_journals %}{{ prefs.preferred_journals | join('\n') }}{% endif %}</textarea>
+            </div>
+
+            <div>
+                <label class="block text-sm font-medium text-gray-700 mb-1">
+                    Deprioritized sources
+                    <span class="font-normal text-gray-400 ml-1">— skipped unless exceptionally relevant</span>
+                </label>
+                <textarea name="deprioritized_journals_raw" rows="4"
+                          placeholder="Frontiers in Neuroscience&#10;PLOS ONE"
+                          class="w-full text-sm border border-gray-300 rounded-lg px-3 py-2 focus:ring-indigo-500 focus:border-indigo-500 font-mono">{% if prefs and prefs.deprioritized_journals %}{{ prefs.deprioritized_journals | join('\n') }}{% endif %}</textarea>
+            </div>
+        </div>
+
+        <div class="flex items-center gap-3">
+            <button type="submit"
+                    class="px-5 py-2 bg-indigo-600 text-white text-sm font-medium rounded-lg hover:bg-indigo-700">
+                Save Preferences
+            </button>
+            <a href="/agent/{{ agent.agent_id }}/dashboard"
+               class="px-5 py-2 bg-gray-100 text-gray-700 text-sm font-medium rounded-lg hover:bg-gray-200">
+                Cancel
+            </a>
+        </div>
+        <p class="mt-3 text-xs text-gray-400">
+            Changes take effect on the next scheduled podcast run (daily at 9am UTC).
+        </p>
+    </form>
+</div>
+{% endblock %}
diff --git a/templates/base.html b/templates/base.html
index 74db818..afb97a0 100644
--- a/templates/base.html
+++ b/templates/base.html
@@ -55,6 +55,14 @@
                         </span>
                         {% endif %}
                     </a>
+                    <a href="/proposals" class="text-gray-600 hover:text-indigo-600 px-3 py-2 rounded-md text-sm font-medium
+                        {% if active_page == 'proposals' %}text-indigo-600 font-semibold{% endif %}">
+                        Proposals
+                    </a>
+                    <a href="/podcast/settings" class="text-gray-600 hover:text-indigo-600 px-3 py-2 rounded-md text-sm font-medium
+                        {% if active_page == 'podcast' %}text-indigo-600 font-semibold{% endif %}">
+                        Podcast
+                    </a>
                     {% if current_user.is_admin and not impersonation_banner %}
                     <a href="/admin/users" class="text-gray-600 hover:text-indigo-600 px-3 py-2 rounded-md text-sm font-medium
                         {% if active_page == 'admin' %}text-indigo-600 font-semibold{% endif %}">
@@ -85,9 +93,12 @@
             <a href="/admin/jobs" class="{% if active_admin == 'jobs' %}text-indigo-600 font-semibold{% else %}text-gray-500 hover:text-gray-700{% endif %}">Jobs</a>
             <a href="/admin/activity" class="{% if active_admin == 'activity' %}text-indigo-600 font-semibold{% else %}text-gray-500 hover:text-gray-700{% endif %}">Activity</a>
             <a href="/admin/discussions" class="{% if active_admin == 'discussions' %}text-indigo-600 font-semibold{% else %}text-gray-500 hover:text-gray-700{% endif %}">Discussions</a>
+            <a href="/admin/matchmaker" class="{% if active_admin == 'matchmaker' %}text-indigo-600 font-semibold{% else %}text-gray-500 hover:text-gray-700{% endif %}">Matchmaker</a>
             <a href="/admin/agents" class="{% if active_admin == 'agents' %}text-indigo-600 font-semibold{% else %}text-gray-500 hover:text-gray-700{% endif %}">Agents</a>
+            <a href="/admin/podcast" class="{% if active_admin == 'podcast' %}text-indigo-600 font-semibold{% else %}text-gray-500 hover:text-gray-700{% endif %}">Podcast</a>
             <a href="/admin/access-requests" class="{% if active_admin == 'access' %}text-indigo-600 font-semibold{% else %}text-gray-500 hover:text-gray-700{% endif %}">Access</a>
             <a href="/admin/waitlist" class="{% if active_admin == 'waitlist' %}text-indigo-600 font-semibold{% else %}text-gray-500 hover:text-gray-700{% endif %}">Waitlist</a>
+            <a href="/admin/evaluations" class="{% if active_admin == 'evaluations' %}text-indigo-600 font-semibold{% else %}text-gray-500 hover:text-gray-700{% endif %}">Evaluations</a>
         </div>
     </div>
 </div>
@@ -134,6 +145,9 @@
         } else if (fmt === 'short') {
             el.textContent = d.toLocaleDateString([], {month: 'short', day: 'numeric'}) + ' ' +
                              d.toLocaleTimeString([], {hour: '2-digit', minute: '2-digit'});
+        } else if (fmt === 'disc') {
+            el.textContent = d.toLocaleDateString([], {weekday: 'long'}) + ' ' +
+                             d.toLocaleTimeString([], {hour: 'numeric', minute: '2-digit'});
         } else {
             el.textContent = d.toLocaleDateString([], {month: 'short', day: 'numeric', year: 'numeric'}) + ' ' +
                              d.toLocaleTimeString([], {hour: '2-digit', minute: '2-digit'});
diff --git a/templates/podcast_settings.html b/templates/podcast_settings.html
new file mode 100644
index 0000000..18d658e
--- /dev/null
+++ b/templates/podcast_settings.html
@@ -0,0 +1,211 @@
+{% extends "base.html" %}
+{% block title %}Podcast Settings — CoPI{% endblock %}
+
+{% block content %}
+<div class="max-w-2xl mx-auto">
+    <div class="flex items-center justify-between mb-6">
+        <div>
+            <a href="/profile" class="text-sm text-gray-500 hover:text-gray-700">&larr; My Profile</a>
+            <h1 class="text-2xl font-bold text-gray-900 mt-1">Podcast Settings</h1>
+            <p class="text-sm text-gray-500">Customize your daily LabBot research briefing</p>
+        </div>
+    </div>
+
+    {% if saved %}
+    <div class="bg-green-50 border border-green-200 rounded-lg p-3 mb-6 text-sm text-green-700">
+        Preferences saved successfully.
+    </div>
+    {% endif %}
+
+    <!-- Feed URL card -->
+    <div class="bg-indigo-50 border border-indigo-200 rounded-xl p-5 mb-6">
+        <h2 class="text-sm font-semibold text-indigo-800 mb-1">Your Podcast Feed URL</h2>
+        <p class="text-xs text-indigo-600 mb-3">
+            Subscribe to this URL in any podcast app (Apple Podcasts, Overcast, Pocket Casts, etc.)
+            to receive audio episodes automatically. The URL is stable and does not require login.
+        </p>
+        <div class="flex items-center gap-2">
+            <input type="text" readonly
+                   id="feed-url-input"
+                   class="flex-1 text-xs bg-white border border-indigo-300 rounded-lg px-3 py-2 font-mono text-gray-700 focus:outline-none" />
+            <button type="button"
+                    onclick="navigator.clipboard.writeText(document.getElementById('feed-url-input').value).then(() => { this.textContent = 'Copied!'; setTimeout(() => this.textContent = 'Copy', 1500); })"
+                    class="px-3 py-2 bg-indigo-600 text-white text-xs font-medium rounded-lg hover:bg-indigo-700 whitespace-nowrap">
+                Copy
+            </button>
+        </div>
+        <script>
+            // Build the absolute feed URL client-side from the page origin.
+            // `tojson` emits a correctly quoted and escaped JavaScript string literal;
+            // plain HTML autoescaping is the wrong escaping inside a <script> element.
+            document.getElementById('feed-url-input').value = window.location.origin + {{ feed_path | tojson }};
+        </script>
+        <p class="text-xs text-indigo-500 mt-2">
+            {% if podcast_enabled %}
+            New episodes are generated daily at 9am UTC. You can also
+            <button type="button" id="generate-btn"
+                    onclick="triggerGenerate()"
+                    class="underline hover:text-indigo-700">generate one now</button>.
+            {% else %}
+            Enable the podcast below to start receiving daily episodes.
+            {% endif %}
+        </p>
+        <p id="generate-status" class="text-xs text-indigo-700 mt-1 hidden"></p>
+    </div>
+
+    <!-- Feed URL card note when disabled -->
+    {% if not podcast_enabled %}
+    <div class="bg-yellow-50 border border-yellow-200 rounded-xl p-4 mb-6 text-sm text-yellow-800">
+        Podcast generation is currently <strong>disabled</strong>. Enable it below to start receiving daily briefings.
+    </div>
+    {% endif %}
+
+    <form method="POST" action="/podcast/settings">
+        {# Fallback "0" sent when the checkbox is unchecked. Start disabled when the checkbox is pre-checked so only one podcast_enabled value is ever submitted, matching the checkbox's onchange handler. #}
+        <input type="hidden" name="podcast_enabled" value="0"{% if podcast_enabled %} disabled{% endif %} />
+
+        <!-- Enable / disable toggle -->
+        <div class="bg-white rounded-xl shadow-sm border border-gray-200 p-6 mb-4 flex items-center justify-between">
+            <div>
+                <h2 class="text-base font-semibold text-gray-800">Enable Podcast</h2>
+                <p class="text-sm text-gray-500 mt-0.5">
+                    When enabled, a new research briefing is generated daily at 9am UTC and added to your feed.
+                </p>
+            </div>
+            <label class="relative inline-flex items-center cursor-pointer ml-6 shrink-0">
+                <input type="checkbox" name="podcast_enabled" value="1"
+                       id="podcast-enabled-toggle"
+                       {% if podcast_enabled %}checked{% endif %}
+                       class="sr-only peer"
+                       onchange="this.form.querySelector('input[type=hidden][name=podcast_enabled]').disabled = this.checked">
+                <div class="w-11 h-6 bg-gray-200 peer-focus:outline-none peer-focus:ring-2 peer-focus:ring-indigo-500
+                            rounded-full peer peer-checked:after:translate-x-full peer-checked:after:border-white
+                            after:content-[''] after:absolute after:top-[2px] after:left-[2px]
+                            after:bg-white after:border-gray-300 after:border after:rounded-full after:h-5 after:w-5
+                            after:transition-all peer-checked:bg-indigo-600"></div>
+            </label>
+        </div>
+
+        <!-- Voice selection -->
+        <div class="bg-white rounded-xl shadow-sm border border-gray-200 p-6 mb-4">
+            <h2 class="text-base font-semibold text-gray-800 mb-1">Voice</h2>
+            <p class="text-sm text-gray-500 mb-4">
+                Select the text-to-speech voice used for your audio episodes.
+                Voices are from Mistral AI's <code class="text-xs bg-gray-100 px-1 rounded">voxtral-mini-tts-latest</code> model.
+            </p>
+            <select name="voice_id"
+                    class="w-full border border-gray-300 rounded-lg px-3 py-2 text-sm focus:ring-indigo-500 focus:border-indigo-500">
+                <option value="" {% if not prefs or not prefs.voice_id %}selected{% endif %}>
+                    Default (system setting)
+                </option>
+                {% for voice_id, voice_label in voices %}
+                <option value="{{ voice_id }}"
+                        {% if prefs and prefs.voice_id == voice_id %}selected{% endif %}>
+                    {{ voice_label }}
+                </option>
+                {% endfor %}
+            </select>
+        </div>
+
+        <!-- Extra search keywords -->
+        <div class="bg-white rounded-xl shadow-sm border border-gray-200 p-6 mb-4">
+            <h2 class="text-base font-semibold text-gray-800 mb-1">Extra Search Keywords</h2>
+            <p class="text-sm text-gray-500 mb-4">
+                Additional terms to include in the daily literature search, beyond what is
+                auto-extracted from your profile. One keyword or phrase per line (max 20).
+                These are added as quoted PubMed search terms.
+            </p>
+            <textarea name="extra_keywords_raw" rows="6"
+                      placeholder="insulin receptor substrate&#10;adipose tissue browning&#10;mitochondrial fission"
+                      class="w-full text-sm border border-gray-300 rounded-lg px-3 py-2 focus:ring-indigo-500 focus:border-indigo-500 font-mono">{% if prefs and prefs.extra_keywords %}{{ prefs.extra_keywords | join('\n') }}{% endif %}</textarea>
+            <p class="text-xs text-gray-400 mt-1">
+                {% if prefs and prefs.extra_keywords %}{{ prefs.extra_keywords | length }} keyword(s) saved.{% else %}No extra keywords set.{% endif %}
+            </p>
+        </div>
+
+        <!-- Source preferences -->
+        <div class="bg-white rounded-xl shadow-sm border border-gray-200 p-6 mb-4">
+            <h2 class="text-base font-semibold text-gray-800 mb-1">Source Preferences</h2>
+            <p class="text-sm text-gray-500 mb-5">
+                Guide the article selection by telling the AI which journals or preprint servers
+                to prioritize or avoid. One source per line (or comma-separated).
+            </p>
+
+            <div class="mb-4">
+                <label class="block text-sm font-medium text-gray-700 mb-1">
+                    Preferred sources
+                    <span class="font-normal text-gray-400 ml-1">— given extra weight when relevance is comparable</span>
+                </label>
+                <textarea name="preferred_journals_raw" rows="4"
+                          placeholder="Nature Methods&#10;Cell Systems&#10;eLife&#10;bioRxiv"
+                          class="w-full text-sm border border-gray-300 rounded-lg px-3 py-2 focus:ring-indigo-500 focus:border-indigo-500 font-mono">{% if prefs and prefs.preferred_journals %}{{ prefs.preferred_journals | join('\n') }}{% endif %}</textarea>
+            </div>
+
+            <div>
+                <label class="block text-sm font-medium text-gray-700 mb-1">
+                    Deprioritized sources
+                    <span class="font-normal text-gray-400 ml-1">— skipped unless exceptionally relevant</span>
+                </label>
+                <textarea name="deprioritized_journals_raw" rows="4"
+                          placeholder="Frontiers in Neuroscience&#10;PLOS ONE"
+                          class="w-full text-sm border border-gray-300 rounded-lg px-3 py-2 focus:ring-indigo-500 focus:border-indigo-500 font-mono">{% if prefs and prefs.deprioritized_journals %}{{ prefs.deprioritized_journals | join('\n') }}{% endif %}</textarea>
+            </div>
+        </div>
+
+        <div class="flex items-center gap-3">
+            <button type="submit"
+                    class="px-5 py-2 bg-indigo-600 text-white text-sm font-medium rounded-lg hover:bg-indigo-700">
+                Save Preferences
+            </button>
+            <a href="/profile"
+               class="px-5 py-2 bg-gray-100 text-gray-700 text-sm font-medium rounded-lg hover:bg-gray-200">
+                Cancel
+            </a>
+        </div>
+        <p class="mt-3 text-xs text-gray-400">
+            Changes take effect on the next scheduled podcast run (daily at 9am UTC).
+        </p>
+    </form>
+
+    {% if recent_episodes %}
+    <!-- Recent episodes -->
+    <div class="bg-white rounded-xl shadow-sm border border-gray-200 p-6 mt-6">
+        <h2 class="text-base font-semibold text-gray-800 mb-3">Recent Episodes</h2>
+        <ul class="divide-y divide-gray-100">
+            {% for ep in recent_episodes %}
+            <li class="py-2 flex items-center gap-3">
+                <span class="text-xs text-gray-400 whitespace-nowrap font-mono">{{ ep.episode_date }}</span>
+                <a href="/podcast/users/{{ current_user.id }}/audio/{{ ep.episode_date }}.mp3"
+                   class="text-sm text-indigo-600 hover:underline truncate"
+                   title="{{ ep.paper_title }}">
+                    {{ ep.paper_title }}
+                </a>
+            </li>
+            {% endfor %}
+        </ul>
+    </div>
+    {% endif %}
+</div>
+{% endblock %}
+
+{% block scripts %}
+<script>
+async function triggerGenerate() {
+    const btn = document.getElementById('generate-btn');
+    const status = document.getElementById('generate-status');
+    btn.disabled = true;
+    btn.textContent = 'Starting…';
+    status.classList.remove('hidden');
+    status.textContent = 'Requesting episode generation…';
+    try {
+        const resp = await fetch('/podcast/user/generate', { method: 'POST' });
+        if (resp.ok) {
+            status.textContent = 'Generation started — check your feed in a few minutes.';
+        } else {
+            const data = await resp.json().catch(() => ({}));
+            status.textContent = 'Error: ' + (data.detail || resp.statusText);
+        }
+    } catch (e) {
+        status.textContent = 'Request failed: ' + e.message;
+    }
+    btn.disabled = false;
+    btn.textContent = 'generate one now';
+}
+</script>
+{% endblock %}
diff --git a/templates/profile/view.html b/templates/profile/view.html
index 0bbc22d..e4b2d53 100644
--- a/templates/profile/view.html
+++ b/templates/profile/view.html
@@ -29,6 +29,16 @@ <h1 class="text-2xl font-bold text-gray-900">{{ user.name }}</h1>
         </div>
     </div>
 
+    {% if podcast_incomplete %}
+    <div class="bg-amber-50 border border-amber-200 rounded-xl p-4 mb-6">
+        <h3 class="font-semibold text-amber-800">Podcast not available yet</h3>
+        <p class="text-sm text-amber-700 mt-1">
+            Your research profile needs to be generated before you can access Podcast settings.
+            Once your profile is ready you can visit <a href="/podcast/settings" class="underline">Podcast Settings</a>.
+        </p>
+    </div>
+    {% endif %}
+
     {% if just_completed_onboarding %}
     <div class="bg-indigo-50 border border-indigo-200 rounded-xl p-4 mb-6">
         <h3 class="font-semibold text-indigo-800">Welcome to CoPI!</h3>
diff --git a/templates/proposals/evaluate.html b/templates/proposals/evaluate.html
new file mode 100644
index 0000000..8df9b9b
--- /dev/null
+++ b/templates/proposals/evaluate.html
@@ -0,0 +1,168 @@
+{% extends "base.html" %}
+{% block title %}Evaluate Proposal — CoPI{% endblock %}
+
+{% block extra_head %}
+<script src="https://cdn.jsdelivr.net/npm/marked/marked.min.js"></script>
+<style>
+    .proposal-md h1 { font-weight: 700; font-size: 1.1rem; margin-top: 0.75rem; margin-bottom: 0.25rem; }
+    .proposal-md h2 { font-weight: 600; font-size: 1rem; margin-top: 0.75rem; margin-bottom: 0.25rem; }
+    .proposal-md p  { margin-bottom: 0.5rem; }
+    .proposal-md ul, .proposal-md ol { padding-left: 1.5rem; margin-bottom: 0.5rem; }
+    .proposal-md li { margin-bottom: 0.25rem; }
+    .proposal-md strong { font-weight: 600; }
+    .score-radio { flex: 1; }
+    .score-radio input[type="radio"] { display: none; }
+    .score-radio label {
+        display: block; width: 100%; text-align: center;
+        padding: 0.45rem 0; cursor: pointer;
+        border: 1px solid #e5e7eb; border-radius: 0.375rem;
+        font-size: 1rem; font-weight: 700; color: #374151;
+        transition: all 0.1s;
+    }
+    .score-radio input[type="radio"]:checked + label {
+        background: #4f46e5; border-color: #4f46e5; color: #fff;
+    }
+    .score-radio label:hover { border-color: #6366f1; color: #4f46e5; }
+    .score-radio input[type="radio"]:checked + label:hover { background: #4338ca; color: #fff; }
+</style>
+{% endblock %}
+
+{% block content %}
+<div class="max-w-3xl mx-auto">
+
+    <!-- Back link + step indicator -->
+    <div class="flex items-center justify-between mb-4">
+        <a href="/proposals" class="text-sm text-gray-500 hover:text-indigo-600">
+            ← Back to proposals
+        </a>
+        {% if group_token is defined and total_steps is defined and total_steps > 1 %}
+        <span class="text-sm text-gray-400 font-medium">
+            {{ step + 1 }} of {{ total_steps }}
+        </span>
+        {% endif %}
+    </div>
+
+    <!-- Proposal display -->
+    <div class="bg-white rounded-xl border border-gray-200 shadow-sm p-6 mb-8">
+        <h1 class="text-xl font-bold text-gray-900 mb-1">{{ title }}</h1>
+        <p class="text-sm text-gray-500 mb-4">Proposed collaboration with <strong>{{ collaborator }}</strong></p>
+        <hr class="border-gray-100 mb-4">
+        <div class="proposal-md text-sm text-gray-700" id="proposal-body">{{ body_md }}</div>
+    </div>
+
+    <!-- Scoring guide (collapsible) -->
+    <details class="bg-amber-50 border border-amber-200 rounded-lg mb-8 text-sm">
+        <summary class="px-4 py-3 cursor-pointer font-medium text-amber-800 select-none">
+            Show scoring guide (NIH 1–9 scale) ▾
+        </summary>
+        <div class="px-4 pb-4 pt-1 text-gray-700">
+            <p class="mb-3">
+                Scores are whole numbers from <strong>1 (best)</strong> to <strong>9 (worst)</strong>.
+                Use the full range — scores of 1 and 9 are expected to be rare.
+            </p>
+            <table class="w-full text-xs border-collapse mb-3">
+                <thead>
+                    <tr class="bg-amber-100">
+                        <th class="border border-amber-200 px-2 py-1 text-left">Score</th>
+                        <th class="border border-amber-200 px-2 py-1 text-left">Descriptor</th>
+                        <th class="border border-amber-200 px-2 py-1 text-left">Strengths / Weaknesses</th>
+                    </tr>
+                </thead>
+                <tbody>
+                    <tr><td class="border border-amber-200 px-2 py-1 font-bold">1</td><td class="border border-amber-200 px-2 py-1 font-semibold">Exceptional</td><td class="border border-amber-200 px-2 py-1">Essentially no weaknesses</td></tr>
+                    <tr class="bg-amber-50"><td class="border border-amber-200 px-2 py-1 font-bold">2</td><td class="border border-amber-200 px-2 py-1 font-semibold">Outstanding</td><td class="border border-amber-200 px-2 py-1">Negligible weaknesses</td></tr>
+                    <tr><td class="border border-amber-200 px-2 py-1 font-bold">3</td><td class="border border-amber-200 px-2 py-1 font-semibold">Excellent</td><td class="border border-amber-200 px-2 py-1">Only minor weaknesses</td></tr>
+                    <tr class="bg-amber-50"><td class="border border-amber-200 px-2 py-1 font-bold">4</td><td class="border border-amber-200 px-2 py-1 font-semibold">Very Good</td><td class="border border-amber-200 px-2 py-1">Numerous minor weaknesses</td></tr>
+                    <tr><td class="border border-amber-200 px-2 py-1 font-bold">5</td><td class="border border-amber-200 px-2 py-1 font-semibold">Good</td><td class="border border-amber-200 px-2 py-1">At least one moderate weakness</td></tr>
+                    <tr class="bg-amber-50"><td class="border border-amber-200 px-2 py-1 font-bold">6</td><td class="border border-amber-200 px-2 py-1 font-semibold">Satisfactory</td><td class="border border-amber-200 px-2 py-1">Some moderate weaknesses</td></tr>
+                    <tr><td class="border border-amber-200 px-2 py-1 font-bold">7</td><td class="border border-amber-200 px-2 py-1 font-semibold">Fair</td><td class="border border-amber-200 px-2 py-1">At least one major weakness</td></tr>
+                    <tr class="bg-amber-50"><td class="border border-amber-200 px-2 py-1 font-bold">8</td><td class="border border-amber-200 px-2 py-1 font-semibold">Marginal</td><td class="border border-amber-200 px-2 py-1">A few major weaknesses</td></tr>
+                    <tr><td class="border border-amber-200 px-2 py-1 font-bold">9</td><td class="border border-amber-200 px-2 py-1 font-semibold">Poor</td><td class="border border-amber-200 px-2 py-1">Numerous major weaknesses</td></tr>
+                </tbody>
+            </table>
+            <p class="text-xs text-gray-500">
+                Scores 1–3 = high impact; 4–6 = moderate; 7–9 = low.
+            </p>
+        </div>
+    </details>
+
+    <!-- Evaluation form -->
+    {% if group_token is defined %}
+    <form method="POST" action="/proposals/group/{{ group_token }}/{{ step }}" class="space-y-8">
+    {% else %}
+    <form method="POST" action="/proposals/{{ token }}/evaluate" class="space-y-8">
+    {% endif %}
+
+        <!-- Overall Impact -->
+        {% set existing_impact = evaluation.score_overall_impact if evaluation else none %}
+        <div class="bg-indigo-50 rounded-xl border border-indigo-200 shadow-sm p-6">
+            <h2 class="text-base font-semibold text-gray-900 mb-1">Overall Impact Score</h2>
+            <p class="text-sm text-gray-600 mb-4">
+                Your holistic assessment of the likelihood that this collaboration would exert a
+                <strong>sustained, powerful influence</strong> on the research field(s) involved.
+                A proposal need not be strong in every dimension to earn a high impact score.
+            </p>
+
+            <div class="mb-4">
+                <div class="flex gap-1 w-full">
+                    {% for s in range(1, 10) %}
+                    <div class="score-radio">
+                        <input type="radio" name="score_overall_impact" id="score_overall_impact_{{ s }}" value="{{ s }}"
+                               {% if existing_impact == s %}checked{% endif %} required>
+                        <label for="score_overall_impact_{{ s }}">{{ s }}</label>
+                    </div>
+                    {% endfor %}
+                </div>
+                <div class="flex justify-between text-xs text-gray-400 mt-1 px-0.5">
+                    <span>Exceptional</span>
+                    <span>Poor</span>
+                </div>
+            </div>
+
+            <label class="block text-xs font-medium text-gray-700 mb-1">
+                Overall comments
+            </label>
+            <textarea name="comments_overall" rows="4"
+                      placeholder="Summarize the key strengths and weaknesses driving your overall impact score…"
+                      class="w-full text-sm border border-gray-300 rounded-md px-3 py-2 focus:outline-none focus:border-indigo-500 focus:ring-1 focus:ring-indigo-500">{{ evaluation.comments_overall if evaluation else '' }}</textarea>
+        </div>
+
+        <div class="flex items-center justify-between pt-2">
+            <a href="/proposals" class="text-sm text-gray-500 hover:text-gray-700">Cancel</a>
+            {% if group_token is defined and step + 1 < total_steps %}
+            <button type="submit"
+                    class="px-6 py-2.5 bg-indigo-600 text-white text-sm font-medium rounded-lg hover:bg-indigo-700 focus:outline-none focus:ring-2 focus:ring-indigo-500">
+                Next →
+            </button>
+            {% else %}
+            <button type="submit"
+                    class="px-6 py-2.5 bg-indigo-600 text-white text-sm font-medium rounded-lg hover:bg-indigo-700 focus:outline-none focus:ring-2 focus:ring-indigo-500">
+                {% if evaluation %}Update{% else %}Save{% endif %}
+            </button>
+            {% endif %}
+        </div>
+
+        {% if evaluation and evaluation.updated_at %}
+        <p class="text-xs text-gray-400 text-right">
+            Last updated <span data-utc="{{ evaluation.updated_at.isoformat() }}" data-utc-fmt="short">{{ evaluation.updated_at.strftime('%b %d %H:%M') }}</span>
+        </p>
+        {% elif evaluation %}
+        <p class="text-xs text-gray-400 text-right">
+            Submitted <span data-utc="{{ evaluation.evaluated_at.isoformat() }}" data-utc-fmt="short">{{ evaluation.evaluated_at.strftime('%b %d %H:%M') }}</span>
+        </p>
+        {% endif %}
+
+    </form>
+</div>
+{% endblock %}
+
+{% block scripts %}
+<script>
+document.addEventListener('DOMContentLoaded', function() {
+    var body = document.getElementById('proposal-body');
+    if (body && typeof marked !== 'undefined') {
+        body.innerHTML = marked.parse(body.textContent || '');
+    }
+});
+</script>
+{% endblock %}
diff --git a/templates/proposals/list.html b/templates/proposals/list.html
new file mode 100644
index 0000000..2f4414e
--- /dev/null
+++ b/templates/proposals/list.html
@@ -0,0 +1,75 @@
+{% extends "base.html" %}
+{% block title %}Collaboration Proposals — CoPI{% endblock %}
+
+{% block content %}
+<div class="max-w-2xl mx-auto">
+    <div class="mb-6">
+        <h1 class="text-2xl font-bold text-gray-900">Collaboration Proposals</h1>
+        <p class="mt-1 text-sm text-gray-500">
+            Evaluate proposals involving your lab using the NIH 1–9 impact scale.
+        </p>
+    </div>
+
+    {% if flash_message %}
+    <div class="mb-6 rounded-md p-4
+        {% if flash_type == 'success' %}bg-green-50 border border-green-200 text-green-800
+        {% else %}bg-blue-50 border border-blue-200 text-blue-800{% endif %}">
+        {{ flash_message }}
+    </div>
+    {% endif %}
+
+    {% if groups %}
+    <div class="space-y-3">
+        {% for g in groups %}
+        <div class="bg-white rounded-xl border border-gray-200 shadow-sm px-5 py-4 flex items-center justify-between gap-4">
+            <div class="min-w-0">
+                <p class="font-medium text-gray-900">With
+                    {% if g.collaborator_agent_id %}
+                    <a href="/researcher/{{ g.collaborator_agent_id }}" target="_blank"
+                       class="text-indigo-600 hover:text-indigo-800 hover:underline">{{ g.collaborator }}</a>
+                    {% else %}
+                    {{ g.collaborator }}
+                    {% endif %}
+                </p>
+                <p class="text-sm text-gray-400 mt-0.5">
+                    {{ g.total }} proposal{{ 's' if g.total != 1 else '' }}
+                    {% if g.evaluated_count > 0 and not g.all_evaluated %}
+                    &middot; {{ g.evaluated_count }} of {{ g.total }} evaluated
+                    {% endif %}
+                </p>
+            </div>
+            <div class="flex items-center gap-3 flex-shrink-0">
+                {% if g.all_evaluated %}
+                <span class="px-2.5 py-1 rounded-full text-xs font-medium bg-green-100 text-green-700">
+                    All evaluated
+                </span>
+                <a href="/proposals/group/{{ g.group_token }}/0"
+                   class="text-sm text-gray-500 hover:text-indigo-600 whitespace-nowrap">
+                    Review
+                </a>
+                {% else %}
+                <a href="/proposals/group/{{ g.group_token }}/0"
+                   class="px-4 py-1.5 bg-indigo-600 text-white text-sm font-medium rounded-lg hover:bg-indigo-700 whitespace-nowrap">
+                    Evaluate
+                </a>
+                {% endif %}
+            </div>
+        </div>
+        {% endfor %}
+    </div>
+
+    <p class="mt-4 text-xs text-gray-400">
+        {{ groups | length }} collaborator{{ 's' if groups | length != 1 else '' }}
+    </p>
+
+    {% else %}
+    <div class="text-center py-16 text-gray-400">
+        <p class="text-sm">No collaboration proposals yet.</p>
+        <p class="text-xs mt-1">
+            Proposals will appear here once your agent has completed discussions or
+            the admin has generated a Matchmaker proposal involving you.
+        </p>
+    </div>
+    {% endif %}
+</div>
+{% endblock %}
diff --git a/templates/researcher/view.html b/templates/researcher/view.html
new file mode 100644
index 0000000..de7f8c0
--- /dev/null
+++ b/templates/researcher/view.html
@@ -0,0 +1,103 @@
+{% extends "base.html" %}
+{% block title %}{{ pi_user.name }} — CoPI{% endblock %}
+
+{% block content %}
+<div class="max-w-3xl mx-auto">
+    <div class="mb-6">
+        <h1 class="text-2xl font-bold text-gray-900">{{ pi_user.name }}</h1>
+        {% if pi_user.institution %}
+        <p class="text-sm text-gray-500 mt-0.5">{{ pi_user.institution }}</p>
+        {% endif %}
+        {% if pi_user.department %}
+        <p class="text-xs text-gray-400">{{ pi_user.department }}</p>
+        {% endif %}
+    </div>
+
+    {% if profile and profile.research_summary %}
+    <div class="bg-white rounded-xl shadow-sm border border-gray-200 p-6 mb-6">
+        <h2 class="text-lg font-semibold text-gray-800 mb-3">Research Summary</h2>
+        <p class="text-sm text-gray-700 leading-relaxed">{{ profile.research_summary }}</p>
+    </div>
+
+    {% if profile.techniques or profile.experimental_models or profile.disease_areas or profile.key_targets or profile.keywords %}
+    <div class="bg-white rounded-xl shadow-sm border border-gray-200 p-6 mb-6">
+        <div class="grid grid-cols-1 md:grid-cols-2 gap-6">
+            {% if profile.techniques %}
+            <div>
+                <h3 class="text-sm font-medium text-gray-500 uppercase tracking-wide mb-2">Techniques & Methods</h3>
+                <div class="flex flex-wrap gap-1.5">
+                    {% for t in profile.techniques %}
+                    <span class="tag-pill">{{ t }}</span>
+                    {% endfor %}
+                </div>
+            </div>
+            {% endif %}
+
+            {% if profile.experimental_models %}
+            <div>
+                <h3 class="text-sm font-medium text-gray-500 uppercase tracking-wide mb-2">Model Systems</h3>
+                <div class="flex flex-wrap gap-1.5">
+                    {% for m in profile.experimental_models %}
+                    <span class="tag-pill">{{ m }}</span>
+                    {% endfor %}
+                </div>
+            </div>
+            {% endif %}
+
+            {% if profile.disease_areas %}
+            <div>
+                <h3 class="text-sm font-medium text-gray-500 uppercase tracking-wide mb-2">Disease Areas</h3>
+                <div class="flex flex-wrap gap-1.5">
+                    {% for d in profile.disease_areas %}
+                    <span class="tag-pill">{{ d }}</span>
+                    {% endfor %}
+                </div>
+            </div>
+            {% endif %}
+
+            {% if profile.key_targets %}
+            <div>
+                <h3 class="text-sm font-medium text-gray-500 uppercase tracking-wide mb-2">Key Molecular Targets</h3>
+                <div class="flex flex-wrap gap-1.5">
+                    {% for k in profile.key_targets %}
+                    <span class="tag-pill">{{ k }}</span>
+                    {% endfor %}
+                </div>
+            </div>
+            {% endif %}
+
+            {% if profile.keywords %}
+            <div class="md:col-span-2">
+                <h3 class="text-sm font-medium text-gray-500 uppercase tracking-wide mb-2">Keywords</h3>
+                <div class="flex flex-wrap gap-1.5">
+                    {% for kw in profile.keywords %}
+                    <span class="tag-pill">{{ kw }}</span>
+                    {% endfor %}
+                </div>
+            </div>
+            {% endif %}
+        </div>
+    </div>
+    {% endif %}
+
+    {% else %}
+    <div class="bg-white rounded-xl shadow-sm border border-gray-200 p-8 text-center text-gray-400 text-sm">
+        No public profile content yet.
+    </div>
+    {% endif %}
+</div>
+
+<style>
+    .tag-pill {
+        display: inline-flex;
+        align-items: center;
+        background-color: #eef2ff;
+        color: #4338ca;
+        font-size: 0.8125rem;
+        padding: 2px 8px;
+        border-radius: 9999px;
+        white-space: nowrap;
+        line-height: 1.5;
+    }
+</style>
+{% endblock %}
diff --git a/testpairs2.tsv b/testpairs2.tsv
new file mode 100644
index 0000000..cbfed1d
--- /dev/null
+++ b/testpairs2.tsv
@@ -0,0 +1,12 @@
+Briney	Paulson
+Kim	Paulson
+Paulson	Azumaya
+Paulson	Briney
+Paulson	Forli
+Paulson	Mravic
+Paulson	Petrascheck
+Paulson	Pwu
+Paulson	Zaro
+Susa	Paulson
+Ward	Paulson
+Wilson	Paulson
diff --git a/tests/test_podcast.py b/tests/test_podcast.py
new file mode 100644
index 0000000..76e6138
--- /dev/null
+++ b/tests/test_podcast.py
@@ -0,0 +1,343 @@
+"""Unit tests for podcast pipeline pure-logic functions and RSS builder."""
+
+import json
+import os
+import tempfile
+from datetime import date
+from pathlib import Path
+from types import SimpleNamespace
+
+import pytest
+
+from src.podcast.pubmed_search import build_queries
+from src.podcast.pipeline import (
+    _format_candidates_for_prompt,
+    _extract_section_text,
+    _build_profile_text_from_db,
+)
+from src.podcast.rss import build_feed
+from src.podcast.state import (
+    get_delivered_pmids,
+    record_delivery,
+    get_delivered_pmids_for_user,
+    record_delivery_for_user,
+)
+
+
+# ---------------------------------------------------------------------------
+# build_queries
+# ---------------------------------------------------------------------------
+
+class TestBuildQueries:
+    def test_disease_areas_produce_query(self):
+        profile = {"disease_areas": ["neurodegeneration", "Alzheimer's disease"], "techniques": [], "experimental_models": [], "keywords": []}
+        queries = build_queries(profile)
+        assert len(queries) >= 1
+        assert "neurodegeneration" in queries[0]
+
+    def test_techniques_produce_second_query(self):
+        profile = {
+            "disease_areas": ["cancer"],
+            "techniques": ["CRISPR", "flow cytometry"],
+            "experimental_models": [],
+            "keywords": [],
+        }
+        queries = build_queries(profile)
+        assert len(queries) >= 2
+        assert any("CRISPR" in q for q in queries)
+
+    def test_keywords_produce_third_query(self):
+        profile = {
+            "disease_areas": ["diabetes"],
+            "techniques": ["proteomics"],
+            "experimental_models": [],
+            "keywords": ["insulin signaling", "beta cell"],
+        }
+        queries = build_queries(profile)
+        assert len(queries) >= 3
+        assert any("insulin signaling" in q or "beta cell" in q for q in queries)
+
+    def test_empty_profile_returns_empty(self):
+        queries = build_queries({})
+        assert queries == []
+
+    def test_fallback_to_research_summary(self):
+        profile = {"research_summary": "Studying ribosome biogenesis mechanisms"}
+        queries = build_queries(profile)
+        assert len(queries) == 1
+
+    def test_queries_are_quoted_terms(self):
+        profile = {"disease_areas": ["proteostasis"], "techniques": [], "experimental_models": [], "keywords": []}
+        queries = build_queries(profile)
+        assert '"proteostasis"' in queries[0]
+
+
+# ---------------------------------------------------------------------------
+# _format_candidates_for_prompt
+# ---------------------------------------------------------------------------
+
+class TestFormatCandidates:
+    def test_numbers_candidates_from_one(self):
+        records = [
+            {"title": "Paper A", "abstract": "Abstract A", "journal": "Nature", "year": 2024},
+            {"title": "Paper B", "abstract": "Abstract B", "journal": "Science", "year": 2024},
+        ]
+        text = _format_candidates_for_prompt(records)
+        assert text.startswith("1.")
+        assert "2." in text
+
+    def test_includes_title_and_abstract(self):
+        records = [{"title": "CRISPR therapy", "abstract": "We developed a new approach.", "journal": "Cell", "year": 2025}]
+        text = _format_candidates_for_prompt(records)
+        assert "CRISPR therapy" in text
+        assert "We developed a new approach." in text
+
+    def test_truncates_long_abstract(self):
+        long_abstract = "x" * 1000
+        records = [{"title": "T", "abstract": long_abstract, "journal": "J", "year": 2024}]
+        text = _format_candidates_for_prompt(records)
+        assert len(text) < 1000  # abstract truncated to 600 chars
+
+    def test_handles_missing_fields(self):
+        records = [{"title": "Minimal record"}]
+        text = _format_candidates_for_prompt(records)
+        assert "Minimal record" in text
+        assert "No abstract" in text
+
+
+# ---------------------------------------------------------------------------
+# _extract_section_text
+# ---------------------------------------------------------------------------
+
+class TestExtractSectionText:
+    SAMPLE_MD = """## Research Summary
+We study protein folding in neurons.
+
+## Key Methods and Technologies
+- Cryo-EM
+- Mass spectrometry
+
+## Podcast Preferences
+Focus on computational tools only.
+"""
+
+    def test_extracts_research_summary(self):
+        text = _extract_section_text(self.SAMPLE_MD, "Research Summary")
+        assert "protein folding" in text
+
+    def test_extracts_podcast_preferences(self):
+        text = _extract_section_text(self.SAMPLE_MD, "Podcast Preferences")
+        assert "computational tools" in text
+
+    def test_stops_at_next_section(self):
+        text = _extract_section_text(self.SAMPLE_MD, "Research Summary")
+        assert "Cryo-EM" not in text
+
+    def test_missing_section_returns_empty(self):
+        text = _extract_section_text(self.SAMPLE_MD, "Nonexistent Section")
+        assert text == ""
+
+
+# ---------------------------------------------------------------------------
+# RSS feed builder
+# ---------------------------------------------------------------------------
+
+def _make_episode(**kwargs):
+    """Create a minimal PodcastEpisode-like object for RSS tests."""
+    defaults = dict(
+        episode_date=date(2026, 4, 10),
+        paper_title="A Great Paper",
+        paper_authors="Smith J et al.",
+        paper_journal="Nature",
+        paper_year=2026,
+        pmid="12345678",
+        paper_url=None,
+        text_summary="This paper found something important.",
+        audio_file_path=None,
+        audio_duration_seconds=None,
+        slack_delivered=True,
+        selection_justification="Highly relevant to the PI's work.",
+    )
+    defaults.update(kwargs)
+    return SimpleNamespace(**defaults)
+
+
+class TestBuildFeed:
+    # --- agent path ---
+
+    def test_returns_valid_xml_root(self):
+        xml = build_feed("Jane Smith", [], "https://example.com", agent_id="testagent")
+        assert xml.startswith("<?xml")
+        assert "<rss" in xml
+
+    def test_includes_pi_name_in_channel(self):
+        xml = build_feed("Jane Smith", [], "https://example.com", agent_id="testagent")
+        assert "Jane Smith" in xml
+
+    def test_agent_feed_url_uses_agent_id(self):
+        xml = build_feed("Jane Smith", [], "https://example.com", agent_id="testagent")
+        assert "/podcast/testagent/feed.xml" in xml
+
+    def test_single_episode_appears_in_feed(self):
+        ep = _make_episode()
+        xml = build_feed("Jane Smith", [ep], "https://example.com", agent_id="testagent")
+        assert "A Great Paper" in xml
+        assert "2026-04-10" in xml
+
+    def test_pubmed_link_used_when_no_paper_url(self):
+        ep = _make_episode(pmid="99887766", paper_url=None)
+        xml = build_feed("Jane Smith", [ep], "https://example.com", agent_id="testagent")
+        assert "pubmed.ncbi.nlm.nih.gov/99887766" in xml
+
+    def test_paper_url_overrides_pubmed_link(self):
+        ep = _make_episode(
+            pmid="biorxiv:2026.01.01.123456",
+            paper_url="https://www.biorxiv.org/content/10.1101/2026.01.01.123456v1",
+        )
+        xml = build_feed("Jane Smith", [ep], "https://example.com", agent_id="testagent")
+        assert "biorxiv.org" in xml
+        assert "pubmed.ncbi.nlm.nih.gov" not in xml
+
+    def test_audio_enclosure_when_audio_present(self, tmp_path):
+        audio_file = tmp_path / "2026-04-10.mp3"
+        audio_file.write_bytes(b"\x00" * 1000)
+        ep = _make_episode(audio_file_path=str(audio_file), audio_duration_seconds=90)
+        xml = build_feed("Jane Smith", [ep], "https://example.com", agent_id="testagent")
+        assert "<enclosure" in xml
+        assert 'type="audio/mpeg"' in xml
+        assert "<itunes:duration>1:30</itunes:duration>" in xml
+
+    def test_no_enclosure_when_no_audio(self):
+        ep = _make_episode(audio_file_path=None)
+        xml = build_feed("Jane Smith", [ep], "https://example.com", agent_id="testagent")
+        assert "<enclosure" not in xml
+
+    def test_xml_escaping_in_title(self):
+        ep = _make_episode(paper_title="Proteins & <Stuff>")
+        xml = build_feed("Jane Smith", [ep], "https://example.com", agent_id="testagent")
+        assert "Proteins &amp; &lt;Stuff&gt;" in xml
+
+    def test_empty_episodes_list(self):
+        xml = build_feed("Jane Smith", [], "https://example.com", agent_id="testagent")
+        assert "<item>" not in xml
+
+    def test_agent_guid_format(self):
+        ep = _make_episode()
+        xml = build_feed("Jane Smith", [ep], "https://example.com", agent_id="testagent")
+        assert "testagent-2026-04-10" in xml
+
+    # --- user path ---
+
+    def test_user_feed_url_uses_user_id(self):
+        uid = "11111111-2222-3333-4444-555555555555"
+        xml = build_feed("Alice Brown", [], "https://example.com", user_id=uid)
+        assert f"/podcast/users/{uid}/feed.xml" in xml
+
+    def test_user_feed_has_correct_pi_name(self):
+        uid = "11111111-2222-3333-4444-555555555555"
+        xml = build_feed("Alice Brown", [], "https://example.com", user_id=uid)
+        assert "Alice Brown" in xml
+
+    def test_user_audio_url_uses_user_path(self, tmp_path):
+        uid = "11111111-2222-3333-4444-555555555555"
+        audio_file = tmp_path / "2026-04-10.mp3"
+        audio_file.write_bytes(b"\x00" * 500)
+        ep = _make_episode(audio_file_path=str(audio_file))
+        xml = build_feed("Alice Brown", [ep], "https://example.com", user_id=uid)
+        assert f"/podcast/users/{uid}/audio/2026-04-10.mp3" in xml
+
+    def test_user_guid_format(self):
+        uid = "11111111-2222-3333-4444-555555555555"
+        ep = _make_episode()
+        xml = build_feed("Alice Brown", [ep], "https://example.com", user_id=uid)
+        assert f"user-{uid}-2026-04-10" in xml
+
+
+# ---------------------------------------------------------------------------
+# State helpers — user path
+# ---------------------------------------------------------------------------
+
+class TestUserState:
+    def test_new_user_has_empty_delivered_set(self, tmp_path, monkeypatch):
+        monkeypatch.setattr("src.podcast.state.STATE_FILE", tmp_path / "state.json")
+        result = get_delivered_pmids_for_user("user-uuid-abc")
+        assert result == set()
+
+    def test_record_and_retrieve_user_delivery(self, tmp_path, monkeypatch):
+        monkeypatch.setattr("src.podcast.state.STATE_FILE", tmp_path / "state.json")
+        record_delivery_for_user("user-uuid-abc", "12345")
+        record_delivery_for_user("user-uuid-abc", "67890")
+        result = get_delivered_pmids_for_user("user-uuid-abc")
+        assert result == {"12345", "67890"}
+
+    def test_user_and_agent_state_are_independent(self, tmp_path, monkeypatch):
+        monkeypatch.setattr("src.podcast.state.STATE_FILE", tmp_path / "state.json")
+        record_delivery("myagent", "11111")
+        record_delivery_for_user("user-uuid-abc", "22222")
+        assert get_delivered_pmids("myagent") == {"11111"}
+        assert get_delivered_pmids_for_user("user-uuid-abc") == {"22222"}
+        # no cross-contamination
+        assert "22222" not in get_delivered_pmids("myagent")
+        assert "11111" not in get_delivered_pmids_for_user("user-uuid-abc")
+
+    def test_duplicate_pmid_not_added_twice(self, tmp_path, monkeypatch):
+        monkeypatch.setattr("src.podcast.state.STATE_FILE", tmp_path / "state.json")
+        record_delivery_for_user("user-uuid-abc", "99999")
+        record_delivery_for_user("user-uuid-abc", "99999")
+        raw = json.loads((tmp_path / "state.json").read_text())
+        assert raw["users"]["user-uuid-abc"]["delivered_pmids"].count("99999") == 1
+
+    def test_atomic_write_leaves_valid_json(self, tmp_path, monkeypatch):
+        monkeypatch.setattr("src.podcast.state.STATE_FILE", tmp_path / "state.json")
+        record_delivery_for_user("u1", "aaa")
+        content = (tmp_path / "state.json").read_text()
+        parsed = json.loads(content)  # must be valid JSON
+        assert "users" in parsed
+
+
+# ---------------------------------------------------------------------------
+# _build_profile_text_from_db
+# ---------------------------------------------------------------------------
+
+class TestBuildProfileTextFromDb:
+    def _make_user(self, **kwargs):
+        defaults = dict(name="Dr. Alice", institution="MIT", department="Biology")
+        defaults.update(kwargs)
+        return SimpleNamespace(**defaults)
+
+    def _make_profile(self, **kwargs):
+        defaults = dict(
+            research_summary="We study protein aggregation.",
+            disease_areas=["Alzheimer's", "Parkinson's"],
+            techniques=["cryo-EM", "mass spectrometry"],
+            experimental_models=["mouse", "iPSC"],
+            keywords=["proteostasis", "neurodegeneration"],
+        )
+        defaults.update(kwargs)
+        return SimpleNamespace(**defaults)
+
+    def test_includes_user_name(self):
+        text = _build_profile_text_from_db(self._make_user(), self._make_profile())
+        assert "Dr. Alice" in text
+
+    def test_includes_research_summary(self):
+        text = _build_profile_text_from_db(self._make_user(), self._make_profile())
+        assert "protein aggregation" in text
+
+    def test_includes_disease_areas(self):
+        text = _build_profile_text_from_db(self._make_user(), self._make_profile())
+        assert "Alzheimer" in text
+
+    def test_includes_techniques(self):
+        text = _build_profile_text_from_db(self._make_user(), self._make_profile())
+        assert "cryo-EM" in text
+
+    def test_handles_none_fields_gracefully(self):
+        profile = self._make_profile(disease_areas=None, techniques=None, keywords=None)
+        text = _build_profile_text_from_db(self._make_user(), profile)
+        assert "protein aggregation" in text  # summary still present
+
+    def test_handles_missing_institution(self):
+        user = self._make_user(institution=None, department=None)
+        text = _build_profile_text_from_db(user, self._make_profile())
+        assert "Dr. Alice" in text

Score	Descriptor	Strengths / Weaknesses
1	Exceptional	Essentially no weaknesses
2	Outstanding	Negligible weaknesses
3	Excellent	Only minor weaknesses
4	Very Good	Numerous minor weaknesses
5	Good	At least one moderate weakness
6	Satisfactory	Some moderate weaknesses
7	Fair	At least one major weakness
8	Marginal	A few major weaknesses
9	Poor	Numerous major weaknesses