From 705807e2866021b88c027c935fc20df01bb20e54 Mon Sep 17 00:00:00 2001
From: Keysat <licensing@keysat.xyz>
Date: Sat, 13 Jun 2026 13:35:53 -0500
Subject: [PATCH] Add internal-meetings pipeline and post-hoc speaker tools

---
 public/job-output-view.html               |  330 +++
 server/audio-meta.js                      |  171 ++
 server/chunk-buffer.js                    |  142 ++
 server/chunked-analyze.js                 | 1256 ++++++++++++
 server/job-stats.js                       |  323 +++
 server/jobs.js                            |  219 ++
 server/meeting-extras.js                  |  376 ++++
 server/meeting-speaker-edits.js           |  359 ++++
 server/output-store.js                    |  163 ++
 server/post-cluster-polish.js             |  655 ++++++
 server/routes/internal-meetings.js        | 2225 +++++++++++++++++++++
 server/speaker-clustering.js              |  624 ++++++
 server/test/meeting-speaker-edits.test.js |  269 +++
 server/test/polish-speaker-labels.test.js |   60 +
 server/test/speaker-clustering.test.js    |  203 ++
 15 files changed, 7375 insertions(+)
 create mode 100644 public/job-output-view.html
 create mode 100644 server/audio-meta.js
 create mode 100644 server/chunk-buffer.js
 create mode 100644 server/chunked-analyze.js
 create mode 100644 server/job-stats.js
 create mode 100644 server/jobs.js
 create mode 100644 server/meeting-extras.js
 create mode 100644 server/meeting-speaker-edits.js
 create mode 100644 server/output-store.js
 create mode 100644 server/post-cluster-polish.js
 create mode 100644 server/routes/internal-meetings.js
 create mode 100644 server/speaker-clustering.js
 create mode 100644 server/test/meeting-speaker-edits.test.js
 create mode 100644 server/test/polish-speaker-labels.test.js
 create mode 100644 server/test/speaker-clustering.test.js
diff --git a/public/job-output-view.html b/public/job-output-view.html
new file mode 100644
index 0000000..11c712e
--- /dev/null
+++ b/public/job-output-view.html
@@ -0,0 +1,330 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+  <meta charset="UTF-8" />
+  <meta name="viewport" content="width=device-width, initial-scale=1.0" />
+  <title>Job output — Recap Relay</title>
+  <!--
+    Stand-alone render of a stored job's transcript + analysis JSON.
+    Loaded by the operator's dashboard "View" link on a Jobs row.
+
+    Visual style: mirror of Recap's results panel (two-pane —
+    topic list on the left, transcript on the right, click a topic
+    to jump to its timestamp range in the transcript). Sourced from
+    Recap's index.html .chunk + .transcript-line styling so changes
+    there stay aesthetically aligned here.
+
+    Data source: GET /admin/job-output/:id returns
+      {
+        job_id, batch_id, source, saved_at,
+        transcript: "[MM:SS] line\n[MM:SS] line...",
+        analysis:  { sections: [{ title, summary, startIndex, endIndex }] } | null
+        analysis_raw_text: string | null  // when JSON-parse failed
+        meta:      { title, media_url, audio_seconds, ... }
+      }
+  -->
+  <style>
+    :root {
+      --bg: #0a0e1a;
+      --panel: #111827;
+      --panel-2: #1e293b;
+      --line: #1e293b;
+      --line-2: #334155;
+      --fg: #e2e8f0;
+      --fg-dim: #94a3b8;
+      --fg-faint: #64748b;
+      --accent: #818cf8;
+      --accent-soft: #a5b4fc;
+      --good: #4ade80;
+      --bad: #fca5a5;
+    }
+    * { box-sizing: border-box; }
+    body {
+      margin: 0; padding: 0;
+      background: var(--bg); color: var(--fg);
+      font-family: -apple-system, BlinkMacSystemFont, "Segoe UI", Helvetica, Arial, sans-serif;
+      font-size: 13px; line-height: 1.55;
+      min-height: 100vh;
+    }
+    a { color: var(--accent-soft); text-decoration: none; }
+    a:hover { text-decoration: underline; }
+
+    .header {
+      padding: 14px 24px;
+      background: var(--panel);
+      border-bottom: 1px solid var(--line);
+      display: flex; align-items: center; gap: 16px; flex-wrap: wrap;
+    }
+    .header h1 {
+      margin: 0; font-size: 16px; font-weight: 700;
+      color: var(--fg); max-width: 800px;
+      overflow: hidden; text-overflow: ellipsis; white-space: nowrap;
+    }
+    .header .meta { font-size: 11px; color: var(--fg-faint); }
+    .header .meta strong { color: var(--fg-dim); }
+    .header .pill {
+      display: inline-block; padding: 2px 8px; border-radius: 999px;
+      font-size: 10px; font-weight: 700; text-transform: uppercase;
+      letter-spacing: 0.04em;
+      background: rgba(129,140,248,0.18); color: var(--accent-soft);
+    }
+
+    .split { display: flex; min-height: calc(100vh - 60px); }
+    .left {
+      flex: 0 0 42%; max-width: 42%;
+      border-right: 1px solid var(--line);
+      overflow-y: auto;
+      padding: 16px;
+      background: var(--bg);
+    }
+    .right {
+      flex: 1; min-width: 0;
+      overflow-y: auto;
+      padding: 16px;
+      background: var(--panel);
+    }
+    @media (max-width: 900px) {
+      .split { flex-direction: column; }
+      .left, .right { flex: none; max-width: 100%; border-right: none; }
+      .left { border-bottom: 1px solid var(--line); max-height: 50vh; }
+    }
+
+    /* Topic / chunk card */
+    .chunk {
+      padding: 12px 14px; margin-bottom: 8px;
+      background: var(--panel); border: 1px solid var(--line);
+      border-radius: 10px; cursor: pointer;
+      transition: border-color 0.15s, background 0.15s;
+    }
+    .chunk:hover { border-color: var(--accent); }
+    .chunk.active {
+      border-color: var(--accent);
+      background: rgba(129,140,248,0.06);
+      box-shadow: 0 2px 16px rgba(129,140,248,0.10);
+    }
+    .chunk-title {
+      font-size: 13px; font-weight: 700; color: var(--fg);
+      margin-bottom: 4px;
+    }
+    .chunk-time {
+      font-size: 10px; color: var(--fg-faint);
+      font-variant-numeric: tabular-nums; margin-left: 6px;
+      font-weight: 500;
+    }
+    .chunk-summary {
+      font-size: 12px; color: var(--fg-dim); line-height: 1.5;
+    }
+
+    /* Transcript pane */
+    .transcript-line {
+      display: flex; gap: 10px; padding: 4px 8px;
+      border-radius: 6px; line-height: 1.6;
+      scroll-margin-top: 80px;
+    }
+    .transcript-line.hl { background: rgba(129,140,248,0.10); }
+    .ts-badge {
+      flex: 0 0 auto;
+      font-family: "SF Mono", Menlo, monospace;
+      font-size: 11px; color: var(--accent-soft);
+      min-width: 56px;
+    }
+    .ts-text { flex: 1; font-size: 13px; color: var(--fg); }
+
+    .empty {
+      padding: 40px 20px; text-align: center;
+      color: var(--fg-faint); font-size: 13px;
+    }
+    .error {
+      padding: 20px; background: var(--panel);
+      border: 1px solid var(--bad); border-radius: 10px;
+      color: var(--bad); margin: 20px;
+    }
+    pre.raw {
+      background: var(--panel); padding: 12px;
+      border: 1px solid var(--line); border-radius: 8px;
+      overflow: auto; font-size: 11px; color: var(--fg-dim);
+      max-height: 300px; white-space: pre-wrap;
+    }
+  </style>
+</head>
+<body>
+  <div id="root">
+    <div class="empty">Loading job output…</div>
+  </div>
+
+  <script>
+    // Strip script tags + on-event attrs from any HTML the data
+    // accidentally contains. Transcript + analysis text comes from
+    // Gemini / Parakeet so it's unlikely to contain malicious HTML
+    // but escape it anyway — we're rendering server data in an
+    // admin context.
+    function esc(s) {
+      if (s == null) return "";
+      return String(s)
+        .replace(/&/g, "&amp;")
+        .replace(/</g, "&lt;")
+        .replace(/>/g, "&gt;")
+        .replace(/"/g, "&quot;");
+    }
+
+    // Parse "[MM:SS] text" or "[H:MM:SS] text" lines into entries
+    // with offset-seconds + text. Mirrors Recap's parser so the
+    // analysis startIndex/endIndex map onto the same entry indices.
+    function parseTimestampedTranscript(text) {
+      if (!text) return [];
+      const entries = [];
+      const re = /^\s*\[(\d+):(\d{2})(?::(\d{2}))?\]\s*(.*)$/;
+      for (const line of String(text).split(/\r?\n/)) {
+        const m = line.match(re);
+        if (!m) continue;
+        const hasHours = m[3] !== undefined;
+        const offset = hasHours
+          ? parseInt(m[1], 10) * 3600 + parseInt(m[2], 10) * 60 + parseInt(m[3], 10)
+          : parseInt(m[1], 10) * 60 + parseInt(m[2], 10);
+        entries.push({ offset, text: m[4].trim() });
+      }
+      return entries;
+    }
+
+    function formatTime(sec) {
+      sec = Math.max(0, Math.round(sec || 0));
+      const h = Math.floor(sec / 3600);
+      const m = Math.floor((sec % 3600) / 60);
+      const s = sec % 60;
+      const pad = (n) => String(n).padStart(2, "0");
+      return h > 0 ? `${h}:${pad(m)}:${pad(s)}` : `${m}:${pad(s)}`;
+    }
+
+    function getJobIdFromURL() {
+      const u = new URL(location.href);
+      return u.searchParams.get("id") || "";
+    }
+
+    async function load() {
+      const root = document.getElementById("root");
+      const jobId = getJobIdFromURL();
+      if (!jobId) {
+        root.innerHTML = '<div class="error">Missing ?id=&lt;job_id&gt; in URL.</div>';
+        return;
+      }
+      let data;
+      try {
+        const r = await fetch("/admin/job-output/" + encodeURIComponent(jobId));
+        if (r.status === 404) {
+          root.innerHTML = '<div class="error">No stored output for job <code>' + esc(jobId) + '</code>. The output may have been deleted, or this job ran before output-storage was enabled.</div>';
+          return;
+        }
+        if (!r.ok) throw new Error("HTTP " + r.status);
+        data = await r.json();
+      } catch (err) {
+        root.innerHTML = '<div class="error">Failed to load: ' + esc(err?.message || err) + '</div>';
+        return;
+      }
+      render(data);
+    }
+
+    function render(data) {
+      const root = document.getElementById("root");
+      const meta = data.meta || {};
+      const entries = parseTimestampedTranscript(data.transcript || "");
+      const sections = (data.analysis && Array.isArray(data.analysis.sections))
+        ? data.analysis.sections
+        : null;
+
+      // Header block — title, source, models, batch link back to dashboard.
+      const sourceLabel = data.source === "admin-test"
+        ? '<span class="pill">Test run</span>'
+        : (data.source === "admin-test-shared-tx" ? '<span class="pill">Shared TX</span>' : '');
+      const headerHTML =
+        '<div class="header">' +
+          '<h1>' + esc(meta.title || meta.media_url || data.job_id) + '</h1>' +
+          sourceLabel +
+          '<div class="meta">' +
+            (meta.media_url ? '<a href="' + esc(meta.media_url) + '" target="_blank" rel="noopener">source ↗</a> &middot; ' : '') +
+            (meta.audio_seconds ? '<strong>' + formatTime(meta.audio_seconds) + '</strong> audio &middot; ' : '') +
+            (meta.transcribe_backend ? 'TX: <strong>' + esc(meta.transcribe_model || meta.transcribe_backend) + '</strong> &middot; ' : '') +
+            (meta.analyze_backend ? 'AN: <strong>' + esc(meta.analyze_model || meta.analyze_backend) + '</strong>' : '') +
+          '</div>' +
+          '<div style="margin-left:auto;"><a href="/" title="Back to dashboard">← Dashboard</a></div>' +
+        '</div>';
+
+      // Empty states.
+      if (entries.length === 0) {
+        root.innerHTML = headerHTML +
+          '<div class="empty">No transcript text was saved for this job.</div>';
+        return;
+      }
+
+      // Left pane: topic list.
+      let leftHTML = '<div class="left" id="topics-pane">';
+      if (!sections || sections.length === 0) {
+        leftHTML += '<div class="empty">No analysis sections were saved for this job.';
+        if (data.analysis_raw_text) {
+          leftHTML += '<pre class="raw" style="text-align:left; margin-top: 12px;">' + esc(data.analysis_raw_text.slice(0, 4000)) + '</pre>';
+        }
+        leftHTML += '</div>';
+      } else {
+        sections.forEach((s, i) => {
+          const startIdx = Math.max(0, Math.min(s.startIndex || 0, entries.length - 1));
+          const startTs = entries[startIdx]?.offset || 0;
+          const endIdx = Math.max(startIdx, Math.min(s.endIndex || 0, entries.length - 1));
+          const endTs = entries[endIdx]?.offset || 0;
+          leftHTML +=
+            '<div class="chunk" data-section-idx="' + i + '" data-start="' + startIdx + '" onclick="onChunkClick(' + i + ')">' +
+              '<div class="chunk-title">' +
+                esc(s.title || "(untitled)") +
+                '<span class="chunk-time">' + formatTime(startTs) + ' — ' + formatTime(endTs) + '</span>' +
+              '</div>' +
+              '<div class="chunk-summary">' + esc(s.summary || "") + '</div>' +
+            '</div>';
+        });
+      }
+      leftHTML += '</div>';
+
+      // Right pane: transcript.
+      let rightHTML = '<div class="right" id="transcript-pane">';
+      entries.forEach((e, i) => {
+        rightHTML +=
+          '<div class="transcript-line" id="entry-' + i + '">' +
+            '<span class="ts-badge">' + formatTime(e.offset) + '</span>' +
+            '<span class="ts-text">' + esc(e.text) + '</span>' +
+          '</div>';
+      });
+      rightHTML += '</div>';
+
+      root.innerHTML = headerHTML + '<div class="split">' + leftHTML + rightHTML + '</div>';
+
+      // Expose for click handlers.
+      window._entries = entries;
+      window._sections = sections;
+    }
+
+    // Click a topic in the left pane: scroll the matching entry into
+    // view on the right pane and apply a highlight band over the
+    // section's entry range. Highlight clears after a couple seconds.
+    function onChunkClick(sectionIdx) {
+      const sections = window._sections;
+      if (!sections || !sections[sectionIdx]) return;
+      // Mark active chunk visually.
+      document.querySelectorAll(".chunk.active").forEach((el) => el.classList.remove("active"));
+      const chunkEl = document.querySelector('.chunk[data-section-idx="' + sectionIdx + '"]');
+      if (chunkEl) chunkEl.classList.add("active");
+
+      const s = sections[sectionIdx];
+      const start = Math.max(0, s.startIndex || 0);
+      const end = Math.max(start, s.endIndex || start);
+      // Scroll the start entry into view in the transcript pane.
+      const target = document.getElementById("entry-" + start);
+      if (target) target.scrollIntoView({ behavior: "smooth", block: "start" });
+      // Highlight the section's range; clear prior highlights first.
+      document.querySelectorAll(".transcript-line.hl").forEach((el) => el.classList.remove("hl"));
+      for (let i = start; i <= end; i++) {
+        const el = document.getElementById("entry-" + i);
+        if (el) el.classList.add("hl");
+      }
+    }
+
+    load();
+  </script>
+</body>
+</html>
diff --git a/server/audio-meta.js b/server/audio-meta.js
new file mode 100644
index 0000000..7c7ed68
--- /dev/null
+++ b/server/audio-meta.js
@@ -0,0 +1,171 @@
+// Wrapper around ffprobe for getting the playable duration of an
+// audio file. Used by the transcribe routes to record audio_seconds
+// alongside each audit entry, so the dashboard can normalize wall-
+// clock duration to "ms per minute of audio" — a backend-agnostic
+// speed benchmark.
+//
+// Returns the duration in seconds (float), or null if ffprobe fails
+// or the file isn't probeable. Never throws — best-effort metadata
+// shouldn't break the request that needs it.
+
+import { execFile } from "child_process";
+import { promisify } from "util";
+import fs from "fs/promises";
+import os from "os";
+import path from "path";
+
+const execFileAsync = promisify(execFile);
+
+// NOTE: there is intentionally NO default chunk size export here.
+// The canonical default lives in server/config.js
+// (`relay_hardware_tx_chunk_minutes` and `relay_gemini_tx_chunk_minutes`)
+// and flows down through createHardwareBackend / createGeminiBackend
+// to splitAudioFile. Removed in v0.2.32 so there's exactly one place
+// to change the default — the Settings tab in the dashboard.
+
+// Runs ffprobe on a file path. Returns seconds, or null on any failure.
+export async function getAudioDurationSeconds(filePath) {
+  if (!filePath) return null;
+  try {
+    // -v error: silence everything except hard errors
+    // -show_entries format=duration: just the duration float
+    // -of default=noprint_wrappers=1:nokey=1: bare number, no labels
+    const { stdout } = await execFileAsync(
+      "ffprobe",
+      [
+        "-v",
+        "error",
+        "-show_entries",
+        "format=duration",
+        "-of",
+        "default=noprint_wrappers=1:nokey=1",
+        filePath,
+      ],
+      { timeout: 10_000 }
+    );
+    const seconds = parseFloat(stdout.trim());
+    if (!Number.isFinite(seconds) || seconds <= 0) return null;
+    return seconds;
+  } catch {
+    return null;
+  }
+}
+
+// Split an audio file into fixed-length chunks via ffmpeg. Returns
+// an array of { filePath, startSeconds, durationSeconds, index }
+// ordered by startSeconds. Uses -acodec copy so it's lossless and
+// fast (no re-encoding pass). Returns an empty array if the audio
+// is shorter than chunkSeconds — caller should just send the
+// original file in that case.
+//
+// Used by the hardware backend to keep Parakeet calls within memory
+// limits on long audio. The relay's audit log later records audio_seconds
+// for the WHOLE file (not per-chunk) so the dashboard's
+// "ms per minute of audio" benchmark stays meaningful.
+export async function splitAudioFile({
+  inputPath,
+  outputDir,
+  chunkSeconds,
+  overlapSeconds = 0,
+}) {
+  if (!Number.isFinite(chunkSeconds) || chunkSeconds <= 0) {
+    throw new Error("splitAudioFile: chunkSeconds is required (no default — pass an explicit value from config)");
+  }
+  if (
+    !Number.isFinite(overlapSeconds) ||
+    overlapSeconds < 0 ||
+    overlapSeconds >= chunkSeconds
+  ) {
+    // Overlap must be smaller than chunk size or the loop never
+    // advances. 0 is fine (no overlap, original behavior).
+    overlapSeconds = 0;
+  }
+  const duration = await getAudioDurationSeconds(inputPath);
+  if (!duration || duration <= chunkSeconds) return [];
+  const chunks = [];
+  let startSec = 0;
+  let i = 0;
+  const ext = path.extname(inputPath).replace(/^\./, "") || "mp3";
+  // Advance step = chunkSeconds - overlap. Each chunk still has
+  // length up to chunkSeconds; consecutive chunks share `overlap`
+  // seconds at their boundary. The caller's stitching code dedupes
+  // by dropping the overlapping prefix from chunk N+1 (and all
+  // subsequent chunks).
+  const advanceStep = chunkSeconds - overlapSeconds;
+  while (startSec < duration) {
+    const chunkPath = path.join(outputDir, `chunk_${i}.${ext}`);
+    const segLen = Math.min(chunkSeconds, duration - startSec);
+    try {
+      await execFileAsync(
+        "ffmpeg",
+        [
+          "-y",
+          "-i",
+          inputPath,
+          "-ss",
+          String(startSec),
+          "-t",
+          String(segLen),
+          "-acodec",
+          "copy",
+          chunkPath,
+        ],
+        { timeout: 120_000 }
+      );
+    } catch (err) {
+      // `-acodec copy` fails on some containers/streams that don't
+      // start on a keyframe at the cut point. Retry with re-encoding,
+      // which always works at the cost of CPU time.
+      await execFileAsync(
+        "ffmpeg",
+        [
+          "-y",
+          "-i",
+          inputPath,
+          "-ss",
+          String(startSec),
+          "-t",
+          String(segLen),
+          chunkPath,
+        ],
+        { timeout: 180_000 }
+      );
+    }
+    chunks.push({
+      filePath: chunkPath,
+      startSeconds: startSec,
+      durationSeconds: segLen,
+      // Boundary marker: timestamps strictly less than this value
+      // are duplicates of the prior chunk's tail (overlap region).
+      // Caller dedupes by dropping output before this boundary.
+      // For chunk 0 this equals startSec (no prior chunk), so the
+      // boundary check is a no-op.
+      overlapBoundarySec: i === 0 ? startSec : startSec + overlapSeconds,
+      index: i,
+    });
+    startSec += advanceStep;
+    i++;
+  }
+  return chunks;
+}
+
+// Convenience wrapper for callers holding the audio in memory (the
+// /relay/transcribe route receives multipart uploads as buffers).
+// Writes a temp file, probes, cleans up. Cheaper than re-streaming
+// through ffprobe's stdin which doesn't always handle every format
+// reliably.
+export async function getAudioDurationSecondsFromBuffer(buffer) {
+  if (!buffer || !buffer.length) return null;
+  const tmpFile = path.join(
+    os.tmpdir(),
+    `relay-probe-${Date.now()}-${Math.random().toString(36).slice(2, 8)}`
+  );
+  try {
+    await fs.writeFile(tmpFile, buffer);
+    return await getAudioDurationSeconds(tmpFile);
+  } catch {
+    return null;
+  } finally {
+    fs.unlink(tmpFile).catch(() => {});
+  }
+}
diff --git a/server/chunk-buffer.js b/server/chunk-buffer.js
new file mode 100644
index 0000000..685b65f
--- /dev/null
+++ b/server/chunk-buffer.js
@@ -0,0 +1,142 @@
+// Chunk-buffer state used by the pipelined-analyze path in
+// routes/summarize-url.js. The hardware backend fires
+// onChunkComplete(chunkData) as each transcribe chunk finishes;
+// this buffer:
+//   - drains chunks in INDEX ORDER (chunks may arrive out of order
+//     when concurrency > 1; we hold them in `pending` until the
+//     next-expected index lands so dedup against the prior chunk's
+//     overlap boundary is deterministic)
+//   - dedupes each new chunk's segments against the prior chunk's
+//     overlapBoundarySec — same logic that runs at end-of-transcribe
+//     in hardware.js, but applied incrementally so analyze can read
+//     a clean, no-duplicates segment view per window
+//   - tracks coveredEndSec (the maximum global timestamp the deduped
+//     buffer extends to, considering ONLY in-order chunks)
+//   - lets the analyze workers await `waitForTime(targetSec)` and
+//     query `getSegments(startSec, endSec)` to build per-window
+//     analyze inputs as soon as the required chunks are in
+//
+// Failure modes:
+//   - A chunk fails entirely → its segments are empty / undefined.
+//     The buffer still advances nextExpected past it so later chunks
+//     aren't stuck behind. The window covering that chunk's range
+//     gets a shorter transcript and may yield no sections (or fewer
+//     than expected). Downstream stitcher tolerates gaps.
+//   - waitForTime can wait forever if the relevant chunk index
+//     never arrives. Caller is responsible for racing this against
+//     the transcribe Promise so a transcribe failure unblocks all
+//     pending waiters via reject.
+
+export function createChunkBuffer() {
+  return {
+    // Sparse staging area for chunks that arrived out of index order.
+    pending: new Map(),
+    // Drained, deduped, sorted-by-start segments. Append-only.
+    segments: [],
+    // Index of the next chunk we're waiting on to drain.
+    nextExpected: 0,
+    // Total chunk count, populated on the first onChunkComplete call.
+    totalChunks: null,
+    // Greatest global end-time covered by drained chunks. NOT just
+    // max(pending) — out-of-order pending chunks don't count until
+    // their predecessors land, so dedup is consistent.
+    coveredEndSec: 0,
+    // The previous chunk's overlap boundary in GLOBAL seconds.
+    // Segments in the next chunk with start < this are duplicates of
+    // segments already in the prior chunk's tail and get dropped.
+    prevOverlapBoundary: 0,
+    // Async waiters: { targetSec, resolve, reject }
+    waiters: [],
+    // Set true on terminal failure so future waiters reject immediately
+    // instead of hanging.
+    failed: false,
+    failedReason: null,
+
+    add(chunkData) {
+      if (this.failed) return;
+      if (chunkData == null) return;
+      if (this.totalChunks == null && Number.isInteger(chunkData.totalChunks)) {
+        this.totalChunks = chunkData.totalChunks;
+      }
+      this.pending.set(chunkData.chunkIndex, chunkData);
+      // Drain consecutive chunks starting from nextExpected
+      while (this.pending.has(this.nextExpected)) {
+        const c = this.pending.get(this.nextExpected);
+        this.pending.delete(this.nextExpected);
+        const segs = Array.isArray(c.segments) ? c.segments : [];
+        // Dedup against the global overlap boundary set by the prior
+        // chunk. Same predicate hardware.js uses at end-of-transcribe
+        // for the global stitch: `seg.start >= prevOverlapBoundary`.
+        for (const s of segs) {
+          if ((s.start || 0) >= this.prevOverlapBoundary) {
+            this.segments.push(s);
+          }
+        }
+        // overlapBoundarySec from audio-meta.js is ALREADY a global
+        // timestamp (= startSec + overlapSeconds at chunking time),
+        // NOT a chunk-relative offset. The earlier `c.startSeconds +
+        // c.overlapBoundarySec` double-counted: chunk 1 ended up
+        // with prevOverlapBoundary=570 instead of 300, chunk 2
+        // 1110 instead of 570, and by chunk 3+ the boundary had
+        // outrun every subsequent chunk's segments — all dropped.
+        // Symptom: window 1 received only ~30% of the segments it
+        // should have, windows 2-6 received zero. Matches the
+        // formula hardware.js uses at end-of-transcribe (with
+        // offsetSeconds=0 for summarize-url callers).
+        this.prevOverlapBoundary = c.overlapBoundarySec || 0;
+        const endHere = (c.startSeconds || 0) + (c.durationSeconds || 0);
+        if (endHere > this.coveredEndSec) this.coveredEndSec = endHere;
+        this.nextExpected += 1;
+      }
+      this.checkWaiters();
+    },
+
+    checkWaiters() {
+      const stillWaiting = [];
+      for (const w of this.waiters) {
+        if (this.coveredEndSec >= w.targetSec) {
+          w.resolve();
+        } else {
+          stillWaiting.push(w);
+        }
+      }
+      this.waiters = stillWaiting;
+    },
+
+    // Block until coveredEndSec reaches targetSec. Rejects with the
+    // failedReason if the buffer is poisoned by a transcribe failure.
+    waitForTime(targetSec) {
+      if (this.failed) return Promise.reject(this.failedReason);
+      if (this.coveredEndSec >= targetSec) return Promise.resolve();
+      return new Promise((resolve, reject) =>
+        this.waiters.push({ targetSec, resolve, reject })
+      );
+    },
+
+    // Snapshot the segments covering [startSec, endSec). Caller gets
+    // a fresh array safe to mutate.
+    getSegments(startSec, endSec) {
+      const out = [];
+      for (const s of this.segments) {
+        const t = s.start || 0;
+        if (t >= startSec && t < endSec) out.push(s);
+      }
+      return out;
+    },
+
+    // Mark the buffer dead so all current + future waiters reject.
+    // Called when transcribe throws — without this, runPipelinedAnalysis
+    // workers would hang forever waiting for a window that'll never
+    // become ready.
+    fail(reason) {
+      this.failed = true;
+      this.failedReason = reason instanceof Error
+        ? reason
+        : new Error(String(reason || "transcribe failed"));
+      for (const w of this.waiters) {
+        try { w.reject(this.failedReason); } catch {}
+      }
+      this.waiters = [];
+    },
+  };
+}
diff --git a/server/chunked-analyze.js b/server/chunked-analyze.js
new file mode 100644
index 0000000..7af2493
--- /dev/null
+++ b/server/chunked-analyze.js
@@ -0,0 +1,1256 @@
+// Chunked topic-analysis for the relay's test-run worker. Mirrors the
+// approach in `/Users/macpro/Projects/recap/server/chunked-analyze.js`
+// (Recap app) but adapted for the relay:
+//
+//   1. Input is the relay's bracketed-text transcript (the same format
+//      that gets saved to the output store), not a structured `entries`
+//      array. A small parser converts the bracketed text back into
+//      { offset, text } entries before windowing.
+//
+//   2. Each window emits its OWN audit-log row (pipeline="analyze",
+//      with window_idx + window_count fields), so the Jobs table's
+//      "AN windows" column reflects real parallel window count and
+//      `analyze_ms` becomes the sum-of-windows (total backend work).
+//      Per-window `audio_seconds` = window BODY seconds so per-row
+//      rate stats (s/audio-min) divide by the right denominator.
+//
+//   3. Single backend, single model per call. The recap-app version
+//      walks a model-fallback chain per window; the relay only ever
+//      runs one model per benchmark permutation, so no fallback loop.
+//
+//   4. No abort signal / jobId threading — the relay's test-run worker
+//      manages cancellation at a higher level via job state.
+//
+// Tunables (window body, overlap, concurrency, cutoff) are passed in
+// from the test-run worker, which sources them from the live-reloaded
+// /data/config/relay-config.json. No hardcoded defaults here — the
+// caller MUST supply explicit values, sourced from one canonical place
+// (server/config.js defaultConfig()).
+//
+// Public entry point: `runChunkedAnalysis()` at the bottom.
+
+import { recordCall } from "./audit-log.js";
+import {
+  sortAndDedupeTranscript,
+  mergeShortEntries,
+} from "./backends/gemini.js";
+
+// ─────────────────────────────────────────────────────────────────────
+// Bracketed-transcript → entries parser
+// ─────────────────────────────────────────────────────────────────────
+// Both the Gemini backend and the Hardware backend produce transcripts
+// in the shape:
+//
+//   [MM:SS] First caption line.
+//   [MM:SS] Next caption line.
+//   [H:MM:SS] (with hour for >60-min videos)
+//
+// We parse those bracketed timestamps back into entries so the
+// windowing logic (which is offset-aware) can plan time-based windows.
+// Lines without a leading bracket are appended to the previous entry's
+// text (handles wrapped lines).
+
+const TIMESTAMP_RE = /^\[(\d{1,2}):(\d{2})(?::(\d{2}))?\]\s*(.*)$/;
+
+// Parse "[MM:SS] text" / "[H:MM:SS] text" lines into { offset, text }
+// entries, where offset is the timestamp in whole seconds.
+export function parseBracketedTranscript(text) {
+  if (!text || typeof text !== "string") return [];
+  const entries = [];
+  for (const rawLine of text.split(/\r?\n/)) {
+    const match = TIMESTAMP_RE.exec(rawLine);
+    if (match === null) {
+      // Continuation line: fold it into the previous entry. Anything
+      // before the first timestamped line (e.g. a header) is discarded.
+      const tail = rawLine.trim();
+      const prev = entries[entries.length - 1];
+      if (prev && tail) prev.text = prev.text ? `${prev.text} ${tail}` : tail;
+      continue;
+    }
+    // Two fields mean MM:SS, three mean H:MM:SS; folding base-60 from
+    // the left handles both shapes.
+    const [, first, second, third, rest] = match;
+    const fields = [first, second, third]
+      .filter((field) => field !== undefined)
+      .map((field) => parseInt(field, 10));
+    const offset = fields.reduce((total, value) => total * 60 + value, 0);
+    entries.push({ offset, text: (rest || "").trim() });
+  }
+  return entries;
+}
+
+// Format seconds as "H:MM:SS" (one hour or more) or "M:SS" (under an
+// hour). No brackets are added and the leading field is not zero-padded.
+// Input is floored; negative, NaN or missing input formats as "0:00".
+function fmtTimestamp(secs) {
+  const total = Math.max(0, Math.floor(secs || 0));
+  const two = (value) => String(value).padStart(2, "0");
+  const hours = Math.floor(total / 3600);
+  const minutes = Math.floor(total / 60) % 60;
+  return hours > 0 ? `${hours}:${two(minutes)}:${two(total % 60)}` : `${minutes}:${two(total % 60)}`;
+}
+
+// ─────────────────────────────────────────────────────────────────────
+// Window planning — same algorithm as recap-app's planAnalysisWindows
+// ─────────────────────────────────────────────────────────────────────
+// Returns array of windows, each: { startIdx, endIdx, bodyStartIdx,
+// startSec, bodyStartSec, bodyEndSec }. We carry the second-domain
+// values forward (not just entry-index) so the audit row's per-window
+// audio_seconds can be set to the body length exactly.
+
+export function planAnalysisWindows(entries, { bodySeconds, overlapSeconds, cutoffSeconds }) {
+  // Plan the analysis windows for `entries` (assumed sorted by offset).
+  // Returns [] for no entries, and one whole-transcript window when the
+  // total length is <= cutoffSeconds. Otherwise emits one window per
+  // bodySeconds stride, each widened by overlapSeconds on both sides.
+  // Throws RangeError if chunking is needed and bodySeconds is not a
+  // positive finite number (a zero stride would never terminate).
+  if (!entries.length) return [];
+  const lastEntry = entries[entries.length - 1];
+  const totalSec = (lastEntry.offset || 0) + (lastEntry.duration || 0);
+  if (totalSec <= cutoffSeconds) {
+    return [
+      {
+        startIdx: 0,
+        endIdx: entries.length - 1,
+        bodyStartIdx: 0,
+        startSec: 0,
+        bodyStartSec: 0,
+        bodyEndSec: totalSec,
+      },
+    ];
+  }
+  if (!Number.isFinite(bodySeconds) || bodySeconds <= 0) {
+    throw new RangeError("planAnalysisWindows: bodySeconds must be a positive finite number");
+  }
+  const windows = [];
+  let bodyStartSec = 0;
+  // `<=`, not `<`: an entry sitting exactly at totalSec (reachable when
+  // overlapSeconds is 0 or via the gap jump below) still needs a window.
+  while (bodyStartSec <= totalSec) {
+    const bodyEndSec = Math.min(totalSec, bodyStartSec + bodySeconds);
+    const windowEndSec = bodyStartSec + bodySeconds + overlapSeconds;
+    const bodyStartIdx = firstEntryAtOrAfter(entries, bodyStartSec);
+    if (bodyStartIdx >= entries.length) break; // no entries left
+    // Gap handling: when the next entry lies beyond this window (e.g. a
+    // truncated TX chunk left a hole), jump the body cursor to that
+    // entry's stride boundary instead of stopping.
+    const nextEntryOffset = entries[bodyStartIdx].offset || 0;
+    if (nextEntryOffset >= windowEndSec) {
+      bodyStartSec = Math.max(
+        bodyStartSec + bodySeconds,
+        Math.floor(nextEntryOffset / bodySeconds) * bodySeconds
+      );
+      continue;
+    }
+    const overlapWithPriorSec = Math.max(0, bodyStartSec - overlapSeconds);
+    const startIdx = firstEntryAtOrAfter(entries, overlapWithPriorSec);
+    const endIdx = lastEntryBefore(entries, windowEndSec);
+    if (endIdx < bodyStartIdx) {
+      // Defensive: the gap check should prevent this; advance anyway.
+      bodyStartSec += bodySeconds;
+      continue;
+    }
+    // Second-domain bounds ride along so callers can size the body.
+    windows.push({ startIdx, endIdx, bodyStartIdx, startSec: overlapWithPriorSec, bodyStartSec, bodyEndSec });
+    if (endIdx >= entries.length - 1) break;
+    bodyStartSec += bodySeconds;
+  }
+  return windows;
+}
+
+export function firstEntryAtOrAfter(entries, sec) {
+  // Index of the first entry whose offset (missing offset counts as 0)
+  // is >= sec, or entries.length when no entry qualifies.
+  const found = entries.findIndex((entry) => (entry.offset || 0) >= sec);
+  return found === -1 ? entries.length : found;
+}
+
+export function lastEntryBefore(entries, sec) {
+  // Index of the last entry in the leading run whose offset (missing
+  // counts as 0) is < sec, or -1 when the first entry is not. The scan
+  // stops at the first entry at/after sec; later ones are not examined.
+  let count = 0;
+  while (count < entries.length && (entries[count].offset || 0) < sec) count += 1;
+  return count - 1;
+}
+
+// Map a time in seconds to an entry index. An entry "contains" the time
+// when offset <= sec <= offset + duration (missing fields count as 0).
+// If the scan reaches an entry that starts after `sec` without finding a
+// containing one, the nearer of that entry and its predecessor (by
+// offset distance, ties to the predecessor) is returned. Times past the
+// last entry clamp to the final index. Returns -1 only for empty input.
+export function canonicalIndexForOffset(entries, sec) {
+  if (!entries.length) return -1;
+  const startOf = (index) => entries[index].offset || 0;
+  for (let i = 0; i < entries.length; i++) {
+    const begin = startOf(i);
+    const end = begin + (entries[i].duration || 0);
+    if (begin <= sec && sec <= end) return i;
+    // Still at or before `sec`: keep scanning.
+    if (!(begin > sec)) continue;
+    // First entry already starts after `sec`: nothing earlier to weigh.
+    if (i === 0) return 0;
+    const distToPrev = sec - startOf(i - 1);
+    const distToNext = begin - sec;
+    return distToPrev <= distToNext ? i - 1 : i;
+  }
+  return entries.length - 1;
+}
+
+// ─────────────────────────────────────────────────────────────────────
+// Per-window prompt builder
+// ─────────────────────────────────────────────────────────────────────
+// Same shape as the test-run worker's original single-shot prompt,
+// but emitted per-window slice. Includes the entry's offset prefix so
+// the model can use timestamps when picking section boundaries.
+
+// Default analyze-prompt template. Four template variables get
+// interpolated at request time:
+//   {{windowMin}}      — window length in minutes (derived from entries)
+//   {{targetSections}} — count target string ("1 section" / "1-2 sections" / ...)
+//   {{maxIndex}}       — windowEntries.length - 1, used in the completeness
+//                        constraint so the model is told the exact valid
+//                        index range it must cover. NEW in this version
+//                        alongside the numbered-line transcript format.
+//   {{transcript}}     — the numbered + timestamped transcript text for the
+//                        window, formatted as `[N] (MM:SS) text` per line
+//                        (was `[MM:SS] text` before; switched to match the
+//                        Recap-app's direct-to-Gemini path which produces
+//                        much better section coverage because the model
+//                        can read indices off the input rather than count
+//                        bracketed lines internally).
+// Operator-editable via the dashboard's Settings tab. The variable
+// names MUST be preserved across edits; the validation in
+// /admin/settings PUT checks that the prompt still contains
+// {{transcript}} and the "JSON" output instruction.
+export const DEFAULT_ANALYZE_PROMPT_TEMPLATE = `You are analyzing a ~{{windowMin}}-minute section of a longer transcript. Your job is to identify natural topic boundaries and group the transcript into discussion-based sections — aim for {{targetSections}}.
+
+TRANSCRIPT (each line is numbered with a timestamp):
+{{transcript}}
+
+INSTRUCTIONS:
+1. Read the entire transcript carefully.
+2. Identify where the discussion naturally shifts from one topic to another.
+3. Group consecutive transcript segments by topic. Some sections may be short (a quick aside) and some may be long (an extended deep-dive). Let the content dictate the length.
+4. For each section, write:
+   - A short, specific topic title (3-8 words)
+   - A 1-3 sentence summary of what's discussed
+   - The start and end segment indices (inclusive), counted as the bracketed [N] number at the start of each transcript line above.
+
+IMPORTANT:
+- Sections must be chronological and non-overlapping.
+- Every segment index from 0 to {{maxIndex}} must belong to exactly one section.
+- startIndex of section N+1 must equal endIndex of section N plus 1.
+- Create as many or as few sections as the content naturally requires — but lean toward broad, substantive topics rather than minute-by-minute breakdowns. A natural topic that spans several minutes of dialogue should be one section, not several.
+- Titles should be descriptive and specific, not generic like "Introduction" unless it truly is one.
+
+Respond with ONLY valid JSON in this exact format, no other text:
+{
+  "sections": [
+    {
+      "title": "Brief Topic Title",
+      "summary": "1-3 sentence summary of this discussion section.",
+      "startIndex": 0,
+      "endIndex": 15
+    }
+  ]
+}`;
+
+// Pick the target-total-sections value for a given total audio
+// duration. Buckets are half-open minute ranges, e.g. "30_60" covers
+// [30, 60). A bucket whose configured value is missing, non-numeric or
+// not > 0 falls back to that same bucket's built-in default.
+function pickTargetTotalSections(totalAudioSec, totalsByBucket) {
+  // [exclusive upper bound in minutes, config key, built-in default]
+  const buckets = [
+    [30, "under_30", 6],
+    [60, "30_60", 8],
+    [90, "60_90", 9],
+    [120, "90_120", 10],
+    [150, "120_150", 11],
+    [180, "150_180", 12],
+  ];
+  const totalMin = (totalAudioSec || 0) / 60;
+  const [, key, fallback] = buckets.find(([limit]) => totalMin < limit) || [Infinity, "over_180", 12];
+  const configured = Number(totalsByBucket?.[key]);
+  return Number.isFinite(configured) && configured > 0 ? configured : fallback;
+}
+
+// Compute the per-window section target from the total-target bucket
+// and the window/audio geometry. Returns
+//   { average, label, target_total }
+// where `average` is the numeric per-window figure, `label` is the
+// string spliced into the prompt, and `target_total` is the bucket
+// value chosen by pickTargetTotalSections().
+//
+// Label rules:
+//   - average <= 1.2            → "1 section"
+//   - whole-number average      → "around N sections"
+//   - fractional average (2.5)  → "2–3 sections" (floor–ceil), giving
+//     the model latitude instead of a confusing fractional count.
+//
+// Edge cases:
+//   - totalAudioSec missing, 0 or negative → average 1, "1 section".
+//   - windowSec missing or under 60 is treated as 60.
+//   - The window count is clamped to >= 1, so a window at least as
+//     long as the audio receives the full target.
+export function computePerWindowTarget({ totalAudioSec, windowSec, totalsByBucket }) {
+  const targetTotal = pickTargetTotalSections(totalAudioSec, totalsByBucket);
+  if (!totalAudioSec || totalAudioSec <= 0) {
+    return { average: 1, label: "1 section", target_total: targetTotal };
+  }
+  // Effective number of windows the audio spans, never below one and
+  // never computed from a window shorter than a minute.
+  const effectiveWindowSec = Math.max(60, windowSec || 60);
+  const windowCount = Math.max(1, totalAudioSec / effectiveWindowSec);
+  const average = targetTotal / windowCount;
+  // Prompt-facing wording for the average; floor/ceil bracket a
+  // fractional value into a short range.
+  const describe = () => {
+    if (average <= 1.2) return "1 section";
+    const low = Math.max(1, Math.floor(average));
+    const high = Math.max(low, Math.ceil(average));
+    return low === high ? `around ${low} sections` : `${low}–${high} sections`;
+  };
+  return { average, label: describe(), target_total: targetTotal };
+}
+
+function buildWindowPrompt(windowEntries, promptOverride, targetTotalsByBucket, totalAudioSec) {
+  // Build the analyze prompt for one window by filling the template's
+  // {{windowMin}}, {{targetSections}}, {{maxIndex}} and {{transcript}}
+  // placeholders. `promptOverride` is used when it is a non-blank
+  // string; otherwise DEFAULT_ANALYZE_PROMPT_TEMPLATE applies.
+  // Returns the finished prompt string.
+  //
+  // Numbered + timestamped transcript format. Each line is
+  //   [N] (M:SS or H:MM:SS) text
+  // where N is the entry's position within THIS window (not its
+  // global position in the full transcript).
+  //
+  // Why numbered: the model is asked to emit startIndex/endIndex
+  // for each section. If indices aren't shown in the input, the
+  // model has to count bracketed-timestamp lines and frequently
+  // hallucinates out-of-range values. Showing indices makes the
+  // contract explicit.
+  const transcriptText = windowEntries
+    .map((e, i) => `[${i}] (${fmtTimestamp(e.offset)}) ${e.text}`)
+    .join("\n");
+  // Window length in seconds (last entry's offset minus first's),
+  // used to scale the suggested section count. The per-window target
+  // also depends on the TOTAL audio duration — see
+  // computePerWindowTarget().
+  const windowSec = windowEntries.length > 1
+    ? (windowEntries[windowEntries.length - 1].offset || 0) - (windowEntries[0].offset || 0)
+    : 0;
+  const windowMin = Math.max(1, Math.round(windowSec / 60));
+  // Max valid index = last entry's position in this window's slice,
+  // so the prompt can state the exact range (0..maxIndex) to cover.
+  const maxIndex = Math.max(0, windowEntries.length - 1);
+  // Per-window section target, derived from the total-audio bucket.
+  // With totalAudioSec missing or 0 the label falls back to "1 section".
+  const targetCalc = computePerWindowTarget({
+    totalAudioSec,
+    windowSec,
+    totalsByBucket: targetTotalsByBucket || {},
+  });
+  const targetSections = targetCalc.label;
+  const template = (typeof promptOverride === "string" && promptOverride.trim())
+    ? promptOverride
+    : DEFAULT_ANALYZE_PROMPT_TEMPLATE;
+  // Simple {{var}} interpolation, dependency-free. Unknown {{var}}
+  // tokens pass through as-is so an operator typo stays visible.
+  //
+  // Replacements are supplied as FUNCTIONS, not strings: a string
+  // replacement is scanned for `$$`, `$&`, `` $` `` and `$'` patterns,
+  // so transcript text such as "$$" would be collapsed to "$" and "$'"
+  // would splice the rest of the template into the transcript. A
+  // function's return value is inserted verbatim.
+  const fill = (text, token, value) => text.replaceAll(token, () => value);
+  let prompt = fill(template, "{{windowMin}}", String(windowMin));
+  prompt = fill(prompt, "{{targetSections}}", targetSections);
+  prompt = fill(prompt, "{{maxIndex}}", String(maxIndex));
+  // {{transcript}} goes last so placeholder-like text inside the
+  // transcript itself is never interpolated by an earlier pass.
+  return fill(prompt, "{{transcript}}", transcriptText);
+}
+
+// Parse a model response into `{ sections: [...] }`. The first ``` or
+// ```json fenced block is unwrapped when present. Returns null on failure.
+function safeParseSections(text) {
+  if (!text || typeof text !== "string") return null;
+  const trimmed = text.trim();
+  const fenced = /```(?:json)?\s*([\s\S]*?)```/.exec(trimmed);
+  try {
+    const candidate = JSON.parse(fenced ? fenced[1].trim() : trimmed);
+    if (candidate && Array.isArray(candidate.sections)) return candidate;
+  } catch {
+    // Unparseable JSON falls through to the null result below.
+  }
+  return null;
+}
+
+// ─────────────────────────────────────────────────────────────────────
+// Stitcher
+// ─────────────────────────────────────────────────────────────────────
+// Combines per-window section lists into a single ordered list of
+// non-overlapping sections referencing entries by their position in
+// the FULL entries array. Same algorithm as recap-app's stitcher:
+// each window N owns sections whose globalStart falls before
+// window(N+1).bodyStartIdx. Last window has no successor → keep all.
+
+export function stitchAnalysisResults(results) {
+  // Merges per-window results into one sorted, non-overlapping section
+  // list with GLOBAL entry indices. Entries of `results` that are
+  // missing or not `ok` are skipped. Returns a new array of
+  // { startIndex, endIndex, title, summary }.
+  //
+  // Section payloads come straight from model JSON, so they are
+  // validated here: a non-object section is skipped (it used to throw
+  // and abort the whole stitch), and indices are coerced with Number()
+  // so a quoted index like "3" is added to the window offset instead
+  // of being string-concatenated onto it. Sections whose indices are
+  // not finite numbers are skipped.
+  const toIndex = (value) => Number(value ?? 0);
+  const out = [];
+  for (let i = 0; i < results.length; i++) {
+    const r = results[i];
+    if (!r || !r.ok) continue;
+    const next = results[i + 1];
+    const nextBody =
+      next && next.window ? next.window.bodyStartIdx : Infinity;
+    const offset = r.window.startIdx;
+    // Cap each section's endIndex to this window's own range. Without
+    // this clamp, a model that emits an out-of-range endIndex (e.g.
+    // endIndex: 9999) yields a section extending far past the window's
+    // actual end. r.window.endIdx is the last entry index this
+    // window's transcript actually contains.
+    const windowMaxEndIdx = r.window.endIdx;
+    for (const s of r.sections) {
+      if (!s || typeof s !== "object") continue;
+      const globalStart = offset + toIndex(s.startIndex);
+      const rawGlobalEnd = offset + toIndex(s.endIndex);
+      if (!Number.isFinite(globalStart) || !Number.isFinite(rawGlobalEnd)) continue;
+      const globalEnd = Math.min(rawGlobalEnd, windowMaxEndIdx);
+      // Ownership: sections starting in the next window's body belong
+      // to that window.
+      if (globalStart >= nextBody) continue;
+      // Skip sections that the clamp pushed below startIndex —
+      // these were degenerate to begin with (the model emitted
+      // start > end) and the clamp can't recover them.
+      if (globalEnd < globalStart) continue;
+      out.push({
+        startIndex: globalStart,
+        endIndex: globalEnd,
+        title: s.title,
+        summary: s.summary,
+      });
+    }
+  }
+  // Dedup with containment handling:
+  //   1. Sort by startIndex ASC, tiebreak endIndex ASC, so when two
+  //      sections share a start the smaller one comes first and is
+  //      popped by the trim in step 3.
+  //   2. Walk left-to-right tracking the largest endIndex accepted so
+  //      far ("maxEndSeen"). A section with endIndex <= maxEndSeen is
+  //      fully contained in something already accepted — drop it.
+  //   3. For partial overlap (current.startIndex <= previous.endIndex),
+  //      trim the previous section's endIndex back to
+  //      current.startIndex - 1. If that makes it degenerate, pop it.
+  out.sort(
+    (a, b) => a.startIndex - b.startIndex || a.endIndex - b.endIndex
+  );
+  const deduped = [];
+  let maxEndSeen = -1;
+  for (const s of out) {
+    if (s.endIndex < s.startIndex) continue;
+    if (s.endIndex <= maxEndSeen) continue;
+    const prev = deduped[deduped.length - 1];
+    if (prev && prev.endIndex >= s.startIndex) {
+      prev.endIndex = s.startIndex - 1;
+      if (prev.endIndex < prev.startIndex) {
+        deduped.pop();
+      }
+    }
+    deduped.push(s);
+    if (s.endIndex > maxEndSeen) maxEndSeen = s.endIndex;
+  }
+  return deduped;
+}
+
+// ─────────────────────────────────────────────────────────────────────
+// Public entry point
+// ─────────────────────────────────────────────────────────────────────
+// Runs chunked analysis end-to-end:
+//
+//   transcriptText (bracketed [MM:SS] format)
+//     → entries[]
+//     → windows[]
+//     → analyze each window in parallel (bounded concurrency)
+//     → audit per-window
+//     → stitch sections into final list
+//
+// Each window emits an audit row with pipeline="analyze",
+// audio_seconds=windowBodySeconds, window_idx=N, window_count=K,
+// duration_ms=this window's analyze wall time, status="success"|"error".
+// On error, the per-window row records the error message AND the
+// overall run continues — failed windows are dropped from stitching
+// (with a warning) rather than aborting the whole job.
+//
+// Returns:
+//   {
+//     text: "<JSON string with .sections>",  // for downstream parity
+//     model: dominantModelName,
+//     usage: null,
+//     attempts: { windows: N, failed: K },
+//   }
+// or throws when ALL windows failed.
+
+export async function runChunkedAnalysis({
+  transcriptText,
+  backend,
+  // Audit-row metadata (passed through to each per-window recordCall):
+  pipelineBackend, // "gemini" | "hardware"
+  jobId,
+  batchId,
+  mediaUrl,
+  title,
+  installId,
+  // Audit-only — paired with install_id on every per-window recordCall
+  // so license-pool aggregations on the dashboard see this work. Pure
+  // forensic field; credits.js isn't called from here.
+  licenseFingerprint = null,
+  source,
+  // Cost helper — caller passes a function (model, usage) → costDetails
+  // because gemini.js's cost calculator is gemini-specific. Returns
+  // { input_tokens, output_tokens, thinking_tokens, cost_usd }; hardware
+  // path passes a no-op helper that returns zeros.
+  computeCostDetails,
+  // Tunables (all required, no hardcoded defaults here):
+  bodySeconds,
+  overlapSeconds,
+  concurrency,
+  cutoffSeconds,
+  // Operator-editable analyze prompt template (Settings tab).
+  // Empty/missing falls back to DEFAULT_ANALYZE_PROMPT_TEMPLATE.
+  // Same applies to both Gemini and operator-hardware analyze paths.
+  analyzePromptOverride = "",
+  // Operator-editable section-count target totals per VIDEO duration
+  // bucket. Shape: { under_30, "30_60", "60_90", "90_120", "120_150",
+  // "150_180", over_180 } — each is a NUMBER (target total sections
+  // for a video in that duration bucket). The relay computes a
+  // per-window average by dividing by num_windows and formats it
+  // into {{targetSections}}. See computePerWindowTarget() in this
+  // file for the math + label formatting. Missing/non-numeric
+  // buckets fall back to hardcoded defaults (6/8/9/10/11/12/12).
+  targetTotalsByBucket = null,
+  // Total audio duration in seconds — required for the per-window
+  // target math. Pulled by the worker from getAudioDurationSeconds()
+  // and threaded through. If omitted (legacy callers), the prompt
+  // emits "1 section" as a defensive fallback.
+  totalAudioSec = 0,
+  // Optional: called once per window AS SOON AS its sections are
+  // available (out of order, since windows resolve in parallel). The
+  // callback receives the window's BODY-OWNED sections — the ones
+  // the final stitcher will keep. Each section carries GLOBAL indices
+  // (into the full entries array) so the caller can render them in
+  // place without further translation. Used by /relay/summarize-url
+  // to push window_complete SSE events to the connected Recap client
+  // as windows arrive, so the user sees topics appearing in real time
+  // instead of waiting for the whole pipeline to finish.
+  onWindowComplete = null,
+}) {
+  const entries = parseBracketedTranscript(transcriptText);
+  if (entries.length === 0) {
+    // Edge case: empty transcript. Record one failed analyze row so
+    // the Jobs table shows what happened, then throw.
+    await recordCall({
+      install_id: installId,
+      license_fingerprint: licenseFingerprint,
+      tier: "core",
+      pipeline: "analyze",
+      backend: pipelineBackend,
+      model: null,
+      status: "error",
+      duration_ms: 0,
+      audio_seconds: 0,
+      cost_usd: 0,
+      job_id: jobId,
+      batch_id: batchId,
+      source,
+      media_url: mediaUrl,
+      title: title || null,
+      error: "transcript empty — nothing to analyze",
+      window_idx: 0,
+      window_count: 1,
+    });
+    throw new Error("transcript empty — nothing to analyze");
+  }
+  const windows = planAnalysisWindows(entries, {
+    bodySeconds,
+    overlapSeconds,
+    cutoffSeconds,
+  });
+  if (windows.length === 0) {
+    throw new Error("planAnalysisWindows produced no windows (unexpected)");
+  }
+
+  // Each window's audio_seconds = its BODY duration. This matches what
+  // the per-row rate stats SHOULD divide by, since a window analyzes a
+  // body+overlap span but only the body contributes to the stitched
+  // output. Last window's body is clamped to the transcript end.
+  const results = new Array(windows.length);
+  let nextIdx = 0;
+
+  async function worker() {
+    while (true) {
+      const my = nextIdx++;
+      if (my >= windows.length) return;
+      const w = windows[my];
+      const windowEntries = entries.slice(w.startIdx, w.endIdx + 1);
+      const prompt = buildWindowPrompt(
+        windowEntries,
+        analyzePromptOverride,
+        targetTotalsByBucket,
+        totalAudioSec
+      );
+      const bodySec = Math.max(0, w.bodyEndSec - w.bodyStartSec);
+      const winStart = Date.now();
+      try {
+        // Per-window analyze with up to 3 attempts on invalid-JSON /
+        // exception. Analyze is by far the cheapest pipeline phase
+        // (a few seconds per window vs 30+ seconds for transcribe),
+        // so being aggressive about retries is essentially free —
+        // worst-case wall time for a failing window goes from ~5s to
+        // ~15s, which is still trivial compared to the 30+ minute
+        // transcribe phase for long content.
+        //
+        // The relay also now passes `responseMimeType:
+        // "application/json"` on the analyze call (see gemini.js
+        // analyzeText), so Gemini decoder-enforces valid JSON output
+        // — invalid-JSON failures from prose preamble / markdown
+        // fence wrapping / truncated brace should be eliminated
+        // entirely on Gemini. The retry loop here is now mostly
+        // defense for the hardware (Gemma) path which has no
+        // equivalent decoder-side guarantee, plus capacity blips.
+        const MAX_ATTEMPTS = 3;
+        let r = null;
+        let parsed = null;
+        let lastAttemptErr = null;
+        for (let attempt = 0; attempt < MAX_ATTEMPTS; attempt++) {
+          try {
+            r = await backend.analyzeText({ prompt });
+            parsed = safeParseSections(r.text);
+            if (parsed) {
+              lastAttemptErr = null;
+              break;
+            }
+            lastAttemptErr = "invalid JSON in window response";
+          } catch (innerErr) {
+            r = null;
+            parsed = null;
+            lastAttemptErr = (innerErr?.message || String(innerErr)).slice(0, 280);
+          }
+          if (attempt < MAX_ATTEMPTS - 1) {
+            console.warn(
+              `[chunked-analyze] window ${my + 1}/${windows.length} attempt ${attempt + 1} failed (${lastAttemptErr}) — retrying`
+            );
+          }
+        }
+        const dur = Date.now() - winStart;
+        if (!parsed) {
+          // All attempts failed — record one audit row, drop from
+          // stitching, continue the run. The stitcher will skip this
+          // window's body region; the summarize-url credit gate will
+          // refuse to charge because anyWindowFailed becomes true.
+          results[my] = { window: w, ok: false, error: new Error(lastAttemptErr || "analyze failed") };
+          await recordCall({
+            install_id: installId,
+            license_fingerprint: licenseFingerprint,
+            tier: "core",
+            pipeline: "analyze",
+            backend: pipelineBackend,
+            model: r?.model || null,
+            status: "error",
+            duration_ms: dur,
+            audio_seconds: bodySec,
+            cost_usd: 0,
+            job_id: jobId,
+            batch_id: batchId,
+            source,
+            media_url: mediaUrl,
+            title: title || null,
+            error: (lastAttemptErr || "analyze failed") + " (after " + MAX_ATTEMPTS + " attempts)",
+            window_idx: my,
+            window_count: windows.length,
+            window_body_seconds: bodySec,
+          });
+          continue;
+        }
+        const costDetails = computeCostDetails(r.model, r.usage);
+        results[my] = {
+          window: w,
+          ok: true,
+          sections: parsed.sections,
+          model: r.model,
+        };
+        await recordCall({
+          install_id: installId,
+          license_fingerprint: licenseFingerprint,
+          tier: "core",
+          pipeline: "analyze",
+          backend: pipelineBackend,
+          model: r.model || null,
+          status: "success",
+          duration_ms: dur,
+          audio_seconds: bodySec,
+          job_id: jobId,
+          batch_id: batchId,
+          source,
+          media_url: mediaUrl,
+          title: title || null,
+          window_idx: my,
+          window_count: windows.length,
+          window_body_seconds: bodySec,
+          ...costDetails,
+        });
+        // Streaming callback: emit this window's body-owned sections
+        // as soon as they arrive. Uses the same ownership rule as the
+        // final stitcher (window N owns sections starting before
+        // window N+1's body), but computed locally with just this
+        // window's planned position — the next window's bodyStartIdx
+        // is known from the plan even if that window hasn't finished.
+        if (onWindowComplete) {
+          const next = windows[my + 1];
+          const nextBodyIdx = next ? next.bodyStartIdx : Infinity;
+          const offset = w.startIdx;
+          // Same endIndex clamp as stitchAnalysisResults — a model
+          // that emits an out-of-range endIndex would otherwise
+          // produce a streaming partial-section spanning way past
+          // this window's transcript range. The final stitch
+          // re-clamps, but if the SSE client renders partials
+          // incrementally it'd briefly show the inflated bounds.
+          const windowMaxEndIdx = w.endIdx;
+          const owned = [];
+          for (const s of parsed.sections) {
+            const globalStart = offset + (s.startIndex ?? 0);
+            const rawGlobalEnd = offset + (s.endIndex ?? 0);
+            const globalEnd = Math.min(rawGlobalEnd, windowMaxEndIdx);
+            if (globalStart >= nextBodyIdx) continue;
+            if (globalEnd < globalStart) continue;
+            owned.push({
+              startIndex: globalStart,
+              endIndex: globalEnd,
+              title: s.title,
+              summary: s.summary,
+            });
+          }
+          try {
+            onWindowComplete({
+              windowIdx: my,
+              totalWindows: windows.length,
+              ownedSections: owned,
+              windowBodySeconds: bodySec,
+              model: r.model || null,
+              durationMs: dur,
+            });
+          } catch (cbErr) {
+            // Streaming is best-effort — don't fail the analyze loop
+            // if a callback throws (e.g. the SSE client disconnected
+            // mid-window).
+            console.warn(
+              `[chunked-analyze] onWindowComplete callback failed: ${cbErr?.message || cbErr}`
+            );
+          }
+        }
+      } catch (err) {
+        const dur = Date.now() - winStart;
+        results[my] = { window: w, ok: false, error: err };
+        await recordCall({
+          install_id: installId,
+          license_fingerprint: licenseFingerprint,
+          tier: "core",
+          pipeline: "analyze",
+          backend: pipelineBackend,
+          model: null,
+          status: "error",
+          duration_ms: dur,
+          audio_seconds: bodySec,
+          cost_usd: 0,
+          job_id: jobId,
+          batch_id: batchId,
+          source,
+          media_url: mediaUrl,
+          title: title || null,
+          error: (err?.message || String(err)).slice(0, 400),
+          window_idx: my,
+          window_count: windows.length,
+          window_body_seconds: bodySec,
+        });
+      }
+    }
+  }
+
+  const workerPromises = Array.from(
+    { length: Math.min(concurrency, windows.length) },
+    worker
+  );
+  await Promise.all(workerPromises);
+
+  const succeeded = results.filter((r) => r && r.ok);
+  const failed = results.filter((r) => r && !r.ok);
+  if (succeeded.length === 0) {
+    throw new Error(
+      `All ${results.length} analyze windows failed. First error: ${
+        failed[0]?.error?.message || "unknown"
+      }`
+    );
+  }
+
+  const stitched = stitchAnalysisResults(results);
+  // Aggregate model attribution: dominant successful model.
+  const modelTally = new Map();
+  for (const r of results) {
+    if (!r.ok || !r.model) continue;
+    modelTally.set(r.model, (modelTally.get(r.model) || 0) + 1);
+  }
+  const dominantModel =
+    [...modelTally.entries()].sort((a, b) => b[1] - a[1])[0]?.[0] || null;
+
+  return {
+    text: JSON.stringify({ sections: stitched }),
+    model: dominantModel,
+    usage: null,
+    attempts: { windows: results.length, failed: failed.length },
+  };
+}
+
+// ─────────────────────────────────────────────────────────────────────
+// Pipelined analyze (Phase 2 of the streaming UX work).
+//
+// Lets analyze windows fire AS SOON AS their required transcribe
+// chunks have completed, in parallel with later chunks still being
+// transcribed. The wall-time savings are modest for short content
+// where transcribe dwarfs analyze (a 94-min video here: ~12s of
+// analyze that can hide under transcribe), but the user-perceived
+// improvement is dramatic — first topics render at T=~80s instead
+// of T=~160s, because they don't have to wait for transcribe of
+// minute 80-94 to start drawing the first window's topics.
+//
+// Design:
+//   1. Caller pre-plans windows by AUDIO TIME (not entries — entries
+//      don't exist yet).
+//   2. Caller provides a `getReadySegments(startSec, endSec)`
+//      function that returns the transcribe segments currently
+//      buffered for that time range (each { start, end, text }). It
+//      is only called after `waitForTime` (step 3) has resolved.
+//   3. Caller provides a `waitForTime(targetEndSec) → Promise<void>`
+//      that resolves when transcribe has covered up to targetEndSec.
+//   4. Each window's worker awaits its required time then calls
+//      analyzeOneWindow with the window's text. Workers run as a
+//      bounded concurrent pool same as runChunkedAnalysis.
+//   5. Section indices that come back from each window are LOCAL to
+//      that window's entry slice. The caller is responsible for
+//      mapping them to GLOBAL entry indices after transcribe fully
+//      completes (when the canonical entries array exists).
+// ─────────────────────────────────────────────────────────────────────
+
+// Pre-plan analyze windows from total audio duration alone. Same
+// math as planAnalysisWindows but returns ONLY time fields (no
+// entry indices) — entries aren't built yet during pipelining.
+// Returns [] for a missing/non-positive duration, one window when
+// totalAudioSec <= cutoffSeconds, otherwise bodySeconds-sized
+// windows padded by overlapSeconds on each side (clamped to the
+// audio range). Throws RangeError when windowing is needed but
+// bodySeconds is not a positive finite number — the loop below
+// could otherwise never advance.
+export function planWindowsByDuration({
+  totalAudioSec,
+  bodySeconds,
+  overlapSeconds,
+  cutoffSeconds,
+}) {
+  if (!totalAudioSec || totalAudioSec <= 0) return [];
+  // Single-shot fast path for short audio.
+  if (totalAudioSec <= cutoffSeconds) {
+    return [
+      {
+        idx: 0,
+        startSec: 0,
+        bodyStartSec: 0,
+        bodyEndSec: totalAudioSec,
+        windowEndSec: totalAudioSec,
+      },
+    ];
+  }
+  if (!Number.isFinite(bodySeconds) || bodySeconds <= 0) {
+    throw new RangeError(
+      `planWindowsByDuration: bodySeconds must be a positive number, got ${bodySeconds}`
+    );
+  }
+  // A missing or negative overlap means "no overlap".
+  const overlap = Number.isFinite(overlapSeconds) ? Math.max(0, overlapSeconds) : 0;
+  const windows = [];
+  for (let start = 0; start < totalAudioSec; start += bodySeconds) {
+    windows.push({
+      idx: windows.length,
+      startSec: Math.max(0, start - overlap),
+      bodyStartSec: start,
+      bodyEndSec: Math.min(totalAudioSec, start + bodySeconds),
+      windowEndSec: Math.min(totalAudioSec, start + bodySeconds + overlap),
+    });
+  }
+  return windows;
+}
+
+// Single-window analyze with the same retry + audit semantics
+// runChunkedAnalysis uses internally (up to 3 attempts; an attempt
+// fails when analyzeText throws or the response doesn't parse).
+//
+// Returns: { ok: true, sections, model, durationMs } or
+// { ok: false, error }. One audit row is recorded per call,
+// including the empty-window early exit (duration and cost 0).
+export async function analyzeOneWindow({
+  windowEntries,
+  windowIdx,
+  windowCount,
+  windowBodySec,
+  windowStartSec,
+  windowEndSec,
+  backend,
+  // Audit / accounting params:
+  pipelineBackend,
+  jobId,
+  batchId,
+  mediaUrl,
+  title,
+  installId,
+  licenseFingerprint = null,
+  source,
+  computeCostDetails,
+  // Prompt params:
+  analyzePromptOverride = "",
+  targetTotalsByBucket = null,
+  totalAudioSec = 0,
+}) {
+  // Fields shared by every audit row this call can write.
+  const auditCommon = {
+    install_id: installId,
+    license_fingerprint: licenseFingerprint,
+    tier: "core",
+    pipeline: "analyze",
+    backend: pipelineBackend,
+    audio_seconds: windowBodySec,
+    job_id: jobId,
+    batch_id: batchId,
+    source,
+    media_url: mediaUrl,
+    title: title || null,
+    window_idx: windowIdx,
+    window_count: windowCount,
+    window_body_seconds: windowBodySec,
+  };
+  if (!windowEntries || windowEntries.length === 0) {
+    const err = new Error(
+      `analyzeOneWindow window ${windowIdx + 1} has no entries — audio gap or pre-cutoff window`
+    );
+    // No backend call was made; still audit it so job stats see the failed window.
+    await recordCall({ ...auditCommon, model: null, status: "error", duration_ms: 0, cost_usd: 0, error: err.message });
+    return { ok: false, error: err };
+  }
+  const prompt = buildWindowPrompt(
+    windowEntries,
+    analyzePromptOverride,
+    targetTotalsByBucket,
+    totalAudioSec
+  );
+  const winStart = Date.now();
+  const MAX_ATTEMPTS = 3;
+  let r = null;
+  let parsed = null;
+  let lastAttemptErr = null;
+  for (let attempt = 0; attempt < MAX_ATTEMPTS; attempt++) {
+    try {
+      r = await backend.analyzeText({ prompt });
+      parsed = safeParseSections(r.text);
+      if (parsed) {
+        lastAttemptErr = null;
+        break;
+      }
+      lastAttemptErr = "invalid JSON in window response";
+    } catch (innerErr) {
+      r = null;
+      parsed = null;
+      lastAttemptErr = (innerErr?.message || String(innerErr)).slice(0, 280);
+    }
+    if (attempt < MAX_ATTEMPTS - 1) {
+      console.warn(
+        `[chunked-analyze] window ${windowIdx + 1}/${windowCount} attempt ${attempt + 1} failed (${lastAttemptErr}) — retrying`
+      );
+    }
+  }
+  const dur = Date.now() - winStart;
+  if (!parsed) {
+    await recordCall({
+      ...auditCommon,
+      model: r?.model || null,
+      status: "error",
+      duration_ms: dur,
+      cost_usd: 0,
+      error: (lastAttemptErr || "analyze failed") + " (after " + MAX_ATTEMPTS + " attempts)",
+    });
+    return { ok: false, error: new Error(lastAttemptErr || "analyze failed") };
+  }
+  const costDetails = computeCostDetails(r.model, r.usage);
+  await recordCall({
+    ...auditCommon,
+    model: r.model || null,
+    status: "success",
+    duration_ms: dur,
+    input_tokens: costDetails.input_tokens || 0,
+    output_tokens: costDetails.output_tokens || 0,
+    thinking_tokens: costDetails.thinking_tokens || 0,
+    cost_usd: costDetails.cost_usd || 0,
+  });
+  return { ok: true, sections: parsed.sections, model: r.model, durationMs: dur };
+}
+
+// Run analyze in pipelined mode, fired window-by-window as transcribe
+// chunks become available. See block comment above for the design.
+//
+// Inputs:
+//   audioDurationSec   — total audio seconds (used to pre-plan windows)
+//   waitForTime(sec)   — async; resolves when transcribe has covered
+//                        the audio up through `sec`
+//   getReadySegments(startSec, endSec) — returns the deduped segments
+//                        currently buffered for that time range (each
+//                        { start, end, text } with global timestamps).
+//                        Called per window AFTER waitForTime resolves.
+//   concurrency        — max simultaneous analyze windows
+//   onWindowComplete   — fired per window (same shape as
+//                        runChunkedAnalysis's callback) with WINDOW-
+//                        LOCAL section indices. Caller maps to global
+//                        indices at end of pipeline.
+//   ...                — all the audit + tunable params analyzeOneWindow
+//                        needs
+//
+// Returns:
+//   {
+//     windowResults: [{ window, ok, sections, model, windowEntries }],
+//     dominantModel,
+//     attempts: { windows, failed },
+//   }
+// where each windowEntries is the entries slice that window analyzed
+// (for the caller's later index-remapping).
+export async function runPipelinedAnalysis({
+  audioDurationSec,
+  waitForTime,
+  getReadySegments,
+  bodySeconds,
+  overlapSeconds,
+  cutoffSeconds,
+  concurrency,
+  onWindowComplete,
+  // Pass-through to analyzeOneWindow:
+  backend,
+  pipelineBackend,
+  jobId,
+  batchId,
+  mediaUrl,
+  title,
+  installId,
+  licenseFingerprint = null,
+  source,
+  computeCostDetails,
+  analyzePromptOverride = "",
+  targetTotalsByBucket = null,
+}) {
+  const windows = planWindowsByDuration({
+    totalAudioSec: audioDurationSec,
+    bodySeconds,
+    overlapSeconds,
+    cutoffSeconds,
+  });
+  if (windows.length === 0) {
+    throw new Error(
+      "planWindowsByDuration produced no windows — audioDurationSec missing or zero"
+    );
+  }
+
+  const results = new Array(windows.length);
+  let nextIdx = 0;
+  async function worker() {
+    while (true) {
+      const my = nextIdx++;
+      if (my >= windows.length) return;
+      const w = windows[my];
+      // Wait until transcribe has covered this window's full time
+      // range (including the overlap tail).
+      await waitForTime(w.windowEndSec);
+      // Extract segments in [w.startSec, w.windowEndSec). The caller
+      // is responsible for deduping at addChunk time so we don't
+      // see duplicates here.
+      const segments = getReadySegments(w.startSec, w.windowEndSec);
+      // Two-pass cleanup matching what hardware.js applies to the
+      // FULL stitched transcript: sortAndDedupeTranscript +
+      // mergeShortEntries collapses adjacent short Parakeet
+      // segments into thought-sized lines.
+      const rawBracketed = segmentsToBracketedText(segments);
+      const mergedBracketed = mergeShortEntries(
+        sortAndDedupeTranscript(rawBracketed)
+      );
+      const windowEntries = parseBracketedTranscript(mergedBracketed);
+      // Diagnostic so we can see per-window readiness in operator
+      // logs WITHOUT depending on audit-row inspection. Reveals
+      // empty-window or huge-entry-count issues that cause silent
+      // analyzeOneWindow failures.
+      console.log(
+        `[pipelined-analyze] window ${my + 1}/${windows.length}: ${segments.length} segments → ${windowEntries.length} merged entries · time [${w.startSec}s-${w.windowEndSec}s]`
+      );
+      const bodySec = Math.max(0, w.bodyEndSec - w.bodyStartSec);
+      const winResult = await analyzeOneWindow({
+        windowEntries,
+        windowIdx: my,
+        windowCount: windows.length,
+        windowBodySec: bodySec,
+        windowStartSec: w.startSec,
+        windowEndSec: w.windowEndSec,
+        backend,
+        pipelineBackend,
+        jobId,
+        batchId,
+        mediaUrl,
+        title,
+        installId,
+        licenseFingerprint,
+        source,
+        computeCostDetails,
+        analyzePromptOverride,
+        targetTotalsByBucket,
+        totalAudioSec: audioDurationSec,
+      });
+      results[my] = { window: w, windowEntries, ...winResult };
+      // Per-window outcome log so operator sees what actually
+      // happened beyond "X/Y windows failed" rollup. Failure log
+      // includes the underlying error so we can diagnose JSON
+      // validation, model 4xx, network, etc. without grepping
+      // the audit DB.
+      if (winResult.ok) {
+        const dur = ((winResult.durationMs || 0) / 1000).toFixed(1);
+        console.log(
+          `[pipelined-analyze] window ${my + 1}/${windows.length} ok in ${dur}s — ${(winResult.sections || []).length} sections`
+        );
+      } else {
+        const errMsg = winResult.error?.message || String(winResult.error || "unknown");
+        console.warn(
+          `[pipelined-analyze] window ${my + 1}/${windows.length} FAILED — ${errMsg.slice(0, 280)}`
+        );
+      }
+      // Emit per-window streaming event with WINDOW-LOCAL indices.
+      // The caller (summarize-url) will re-emit as a global-indexed
+      // event after the post-transcribe canonical-entries build.
+      //
+      // OWNED-SECTION FILTERING: each window's transcript range
+      // [startSec, windowEndSec] OVERLAPS BOTH the prior AND the
+      // next window. Without symmetric filtering, sections in the
+      // prior-overlap region (this window's view picked them up
+      // even though the prior window owns that body region) emit
+      // alongside the prior window's version → overlapping
+      // timestamps in the streaming UI. Symmetric filter: emit
+      // ONLY sections whose start time falls in this window's
+      // EXCLUSIVE body region [bodyStartSec, nextBodyStartSec).
+      // First window: bodyStartSec=0 → no lower bound.
+      // Last window: no next → no upper bound. The final stitcher
+      // still sees the FULL unfiltered section set (results[my]
+      // keeps everything), so any topic that crosses a body
+      // boundary and is missed by both adjacent windows in their
+      // body region still surfaces at result-event time.
+      const nextWindow = windows[my + 1];
+      const ownedFloorSec = w.bodyStartSec || 0;
+      const ownedCutoffSec = nextWindow
+        ? nextWindow.bodyStartSec
+        : Infinity;
+      const ownedSections = winResult.ok
+        ? (winResult.sections || []).filter((s) => {
+            const startEntry = windowEntries[s.startIndex];
+            if (!startEntry) return false;
+            const startSec = startEntry.offset || 0;
+            return startSec >= ownedFloorSec && startSec < ownedCutoffSec;
+          })
+        : [];
+      if (onWindowComplete && winResult.ok) {
+        try {
+          onWindowComplete({
+            windowIdx: my,
+            totalWindows: windows.length,
+            window: w,
+            windowEntries,
+            ownedSections,
+            windowBodySeconds: bodySec,
+            model: winResult.model || null,
+            durationMs: winResult.durationMs || 0,
+          });
+        } catch (cbErr) {
+          console.warn(
+            `[pipelined-analyze] onWindowComplete callback failed: ${cbErr?.message || cbErr}`
+          );
+        }
+      }
+    }
+  }
+  // Always run at least one worker: a missing, zero or NaN concurrency
+  // would otherwise start none and report zero failures for zero work.
+  const workerCount = Math.max(1, Math.min(Math.floor(concurrency) || 1, windows.length));
+  const workers = Array.from({ length: workerCount }, worker);
+  await Promise.all(workers);
+
+  const failed = results.filter((r) => r && !r.ok);
+  const dominantModel = (() => {
+    const tally = new Map();
+    for (const r of results) {
+      if (!r || !r.ok || !r.model) continue;
+      tally.set(r.model, (tally.get(r.model) || 0) + 1);
+    }
+    return [...tally.entries()].sort((a, b) => b[1] - a[1])[0]?.[0] || null;
+  })();
+  return {
+    windowResults: results,
+    dominantModel,
+    attempts: { windows: results.length, failed: failed.length },
+  };
+}
+
+// Helper: convert an array of { start, end, text } segments into
+// the bracketed [M:SS] / [H:MM:SS] text the analyze prompt + parser
+// expect: one line per segment, ordered by start time. Segments
+// whose text is empty or whitespace-only are dropped.
+function segmentsToBracketedText(segments) {
+  if (!segments || segments.length === 0) return "";
+  const pad = (n) => n.toString().padStart(2, "0");
+  // Drop blank segments BEFORE stamping: a stamped line is never
+  // empty, so a length filter applied afterwards removes nothing
+  // and blank segments would leak through as text-less lines.
+  const spoken = segments.filter((s) => (s?.text || "").trim().length > 0);
+  // filter() returned a copy, so sorting here can't reorder the
+  // caller's array. Sort by start in case it arrived unsorted.
+  spoken.sort((a, b) => (a.start || 0) - (b.start || 0));
+  return spoken
+    .map((s) => {
+      // Use H:MM:SS when the segment's time is in the 2nd hour or
+      // beyond. An unconditional [MM:SS] would produce [106:30] for
+      // a 1:46:30 timestamp — 3-digit minutes are REJECTED by
+      // parseBracketedTranscript's regex (/^\[(\d{1,2}):(\d{2}).../),
+      // so every transcript line past minute 100 would be silently
+      // dropped. H:MM:SS is what the parser's optional 3rd capture
+      // group accepts.
+      const sec = Math.floor(s.start || 0);
+      const h = Math.floor(sec / 3600);
+      const m = Math.floor((sec % 3600) / 60);
+      const ss = sec % 60;
+      const stamp = h > 0 ? `${h}:${pad(m)}:${pad(ss)}` : `${m}:${pad(ss)}`;
+      return `[${stamp}] ${s.text.trim()}`;
+    })
+    .join("\n");
+}
diff --git a/server/job-stats.js b/server/job-stats.js
new file mode 100644
index 0000000..ddc0833
--- /dev/null
+++ b/server/job-stats.js
@@ -0,0 +1,323 @@
+// Per-job aggregation over the relay's audit log. The audit log
+// records ONE row per relay call (transcribe or analyze); a single
+// summary job typically produces 1 transcribe row + N analyze rows
+// (one per chunked-analyze window). This module groups those rows by
+// X-Recap-Job-Id and computes per-video stats the dashboard renders
+// as a sortable / filterable table.
+//
+// The aggregation is computed on the fly from the in-memory entries
+// array — no separate persistence. A typical 30-day window has a few
+// thousand audit rows; grouping is O(n) and well under 10 ms.
+//
+// Output row shape (one per job_id, plus a synthetic row for
+// orphaned entries with no job_id):
+//   {
+//     job_id:            string | null
+//     started_at:        ms-epoch (earliest ts across the job's rows)
+//     completed_at:      ms-epoch (latest ts)
+//     install_id:        short string
+//     tier:              "core" | "pro" | "max" | null
+//     media_url:         string | null      // from the transcribe row
+//     title:             string | null      // ditto
+//     audio_seconds:     number | null      // from transcribe row
+//     audio_bytes:       number | null      // ditto (bytes downloaded
+//                                              by the relay for transcribe-url)
+//     transcribe_status: "success" | "partial" | "error" | "refused" | "missing"
+//     transcribe_backend: "gemini" | "hardware" | null
+//     transcribe_model:   string | null
+//     transcribe_ms:      number | null
+//     download_ms:        number | null
+//     chunk_count:        number | null     // transcribe-side audio chunks
+//     analyze_windows_total:    number     // count of analyze rows
+//     analyze_windows_success:  number
+//     analyze_windows_failed:   number
+//     analyze_backend:   string | null    // dominant backend across analyze rows
+//     analyze_model:     string | null    // dominant model across analyze rows
+//     analyze_ms:        number          // sum of analyze duration_ms
+//     overall_status:    "success" | "partial" | "failed"
+//     wall_time_ms:      completed_at - started_at
+//     cost_usd:          number (sum across all rows)
+//     errors:            string[]        // concatenated short error strings
+//     // Derived metrics — pre-computed so the UI can sort by them:
+//     transcribe_ms_per_min:  number | null   // transcribe_ms / (audio_seconds/60)
+//     transcribe_ms_per_mb:   number | null   // transcribe_ms / (audio_bytes / 1MB)
+//     download_ms_per_mb:     number | null
+//     analyze_ms_per_min:     number | null
+//     analyze_ms_per_mb:      number | null
+//   }
+
+const MB = 1024 * 1024;
+
+export function aggregateJobs(entries, opts = {}) {
+  // Group by job_id. An entry without a job_id gets its own singleton
+  // group (helps debug orphan calls); the sequence number keeps two
+  // orphans recorded in the same millisecond from merging.
+  const groups = new Map();
+  let orphanSeq = 0;
+  for (const e of entries) {
+    const key = e.job_id || `_orphan_${e.ts}_${orphanSeq++}`;
+    if (!groups.has(key)) groups.set(key, []);
+    groups.get(key).push(e);
+  }
+
+  // Optional Set of job_ids with stored output JSONs, passed in by
+  // the route layer so the aggregator never touches the filesystem.
+  // Drives each row's has_output flag (always false without a Set).
+  const outputIdSet = opts.outputIdSet instanceof Set ? opts.outputIdSet : null;
+
+  const out = [];
+  for (const [key, rows] of groups) {
+    const row = aggregateOne(key, rows);
+    row.has_output = outputIdSet ? outputIdSet.has(row.job_id) : false;
+    out.push(row);
+  }
+  // Newest first by started_at.
+  out.sort((a, b) => b.started_at - a.started_at);
+  return out;
+}
+
+function aggregateOne(key, rows) {
+  // Folds one job's audit rows into a single dashboard stats row.
+  rows.sort((a, b) => a.ts - b.ts);
+  // ts in each audit row is when recordCall() fired — i.e., when the
+  // work for that row COMPLETED, not when it started. A row's start
+  // is recovered as ts - duration_ms - download_ms (duration_ms does
+  // NOT include the download, which TX rows report separately and
+  // which can be 30-60s on a long YouTube fetch).
+  //
+  // Job start = the EARLIEST such start across ALL rows, not just
+  // the first row's: rows are ordered by completion time, so when
+  // analyze windows run while transcribe is still in flight an
+  // analyze row can sort ahead of the transcribe row that actually
+  // began the job. Including the download keeps wall_time matching
+  // the operator's formula: WALL ≈ DL + TX + AN_wall.
+  let startedAt = Infinity;
+  for (const r of rows) {
+    const rowStart =
+      r.ts - (Number(r.duration_ms) || 0) - (Number(r.download_ms) || 0);
+    if (rowStart < startedAt) startedAt = rowStart;
+  }
+  const completedAt = rows[rows.length - 1].ts;
+
+  const tx = rows.find((r) => r.pipeline === "transcribe");
+  const analyzeRows = rows.filter((r) => r.pipeline === "analyze");
+
+  const analyzeSuccess = analyzeRows.filter((r) => r.status === "success");
+  const analyzeFailed = analyzeRows.filter((r) => r.status !== "success");
+  const analyzeMs = analyzeRows.reduce(
+    (s, r) => s + (Number(r.duration_ms) || 0),
+    0
+  );
+  // Analyze wall time: elapsed clock time from when the FIRST window
+  // started to when the LAST window finished. For a 1-batch parallel
+  // analyze (all N windows fire concurrently), this ≈ the slowest
+  // single window's duration. For multi-batch (N > concurrency, e.g.
+  // 10 windows at concurrency 8 → 2 sequential batches), this spans
+  // both batches including any gap. Computed from end-ts minus
+  // start-ts (where start-ts = row.ts - row.duration_ms) so it's
+  // an accurate measured value, not a predicted one.
+  let analyzeWallMs = null;
+  if (analyzeRows.length > 0) {
+    let minStart = Infinity;
+    let maxEnd = -Infinity;
+    for (const r of analyzeRows) {
+      const end = Number(r.ts) || 0;
+      const dur = Number(r.duration_ms) || 0;
+      const start = end - dur;
+      if (start < minStart) minStart = start;
+      if (end > maxEnd) maxEnd = end;
+    }
+    analyzeWallMs = maxEnd - minStart;
+  }
+  const analyzeDominantBackend = dominant(
+    analyzeSuccess.map((r) => r.backend)
+  );
+  const analyzeDominantModel = dominant(analyzeSuccess.map((r) => r.model));
+
+  const errors = rows
+    .filter((r) => r.error)
+    .map((r) => `${r.pipeline}: ${String(r.error).slice(0, 160)}`);
+
+  const txStatus = tx ? tx.status : "missing";
+  let overall;
+  if (txStatus === "error" || txStatus === "refused" || txStatus === "missing") {
+    overall = "failed";
+  } else if (txStatus === "partial") {
+    // TX produced a truncated transcript (chunks hit the output-token
+    // cap). Mark the whole job partial regardless of analyze status —
+    // the analysis was performed against incomplete input, so even
+    // a "success" on analyze rows is misleading.
+    overall = "partial";
+  } else if (analyzeRows.length === 0) {
+    // Transcribe succeeded but no analyze rows — could be in flight,
+    // or the client never called /relay/analyze (uses local model).
+    overall = "success";
+  } else if (analyzeSuccess.length === analyzeRows.length) {
+    overall = "success";
+  } else if (analyzeSuccess.length > 0) {
+    overall = "partial";
+  } else {
+    overall = "failed";
+  }
+
+  const cost = rows.reduce((s, r) => s + (Number(r.cost_usd) || 0), 0);
+
+  // Use `??` (nullish-coalesce) — NOT `||` — so a legitimate 0 isn't
+  // treated as missing data. The test-run worker writes duration_ms=0
+  // historically (pre-fix) on cache-hit siblings; even though the new
+  // worker writes a non-zero shared wall-time, old audit rows from
+  // earlier benchmark batches still live in the NDJSON and we want
+  // those rendered correctly rather than collapsed to "—".
+  const audioSec = tx?.audio_seconds ?? null;
+  const audioBytes = tx?.audio_bytes ?? null;
+  const txMs = tx?.duration_ms ?? null;
+  const downloadMs = tx?.download_ms ?? null;
+  // TX backend compute time = sum of per-chunk wall-times. Distinct
+  // from txMs which is the outer parallel-fan-out wall-time.
+  //   single-chunk: txMsSum ≈ txMs (one chunk, one duration)
+  //   N-chunks at concurrency C: txMsSum ≈ N × per-chunk-duration
+  //                              txMs    ≈ ⌈N/C⌉ × per-chunk-duration
+  // Falls back to txMs (the wall-time) when chunk_durations_ms is
+  // absent — old audit rows from before v0.2.41 don't have it.
+  const chunkDurationsArr = Array.isArray(tx?.chunk_durations_ms) ? tx.chunk_durations_ms : null;
+  const txMsSum = chunkDurationsArr
+    ? chunkDurationsArr.reduce((s, d) => s + (Number(d) || 0), 0)
+    : txMs;
+
+  const audioMinutes = audioSec ? audioSec / 60 : null;
+  const audioMb = audioBytes ? audioBytes / MB : null;
+
+  // batch_id and source are stamped per audit row by the test-run
+  // path; use the first non-null we see so dashboard filters work
+  // regardless of which row gets read first in a multi-row job.
+  const batchId = rows.find((r) => r.batch_id)?.batch_id || null;
+  const source = rows.find((r) => r.source)?.source || null;
+
+  return {
+    job_id: key.startsWith("_orphan_") ? null : key,
+    started_at: startedAt,
+    completed_at: completedAt,
+    install_id: tx?.install_id || rows[0].install_id || null,
+    tier: tx?.tier || rows[0].tier || null,
+    media_url: tx?.media_url || null,
+    title: tx?.title || null,
+    batch_id: batchId,
+    source: source,
+    audio_seconds: audioSec,
+    audio_bytes: audioBytes,
+    transcribe_status: txStatus,
+    transcribe_backend: tx?.backend || null,
+    transcribe_model: tx?.model || null,
+    // transcribe_ms = outer wall-time of the whole TX phase (the
+    // value the operator perceives as "how long did transcribe
+    // take"). transcribe_ms_sum = total backend compute across all
+    // chunks (drives cost; equals N × wall when N chunks run truly
+    // sequentially, equals wall when single-chunk). For Gemini at
+    // concurrency 12 over 3 chunks: wall ≈ 60s, sum ≈ 180s.
+    transcribe_ms: txMs,
+    transcribe_ms_sum: txMsSum,
+    download_ms: downloadMs,
+    chunk_count: tx?.chunk_count ?? null,
+    analyze_windows_total: analyzeRows.length,
+    analyze_windows_success: analyzeSuccess.length,
+    analyze_windows_failed: analyzeFailed.length,
+    analyze_backend: analyzeDominantBackend,
+    analyze_model: analyzeDominantModel,
+    // analyze_ms = SUM of per-window durations (total backend compute,
+    // useful for cost). analyze_wall_time_ms = ELAPSED time from
+    // first window start to last window end (the time a user actually
+    // waits for the analyze phase). The two diverge when N windows
+    // run in parallel: a 10-window 100s-per-window job has analyze_ms
+    // = 1000s but analyze_wall_time_ms ≈ 100s (single batch) or
+    // ≈ 200s (two sequential batches at concurrency 5).
+    analyze_ms: analyzeMs,
+    analyze_wall_time_ms: analyzeWallMs,
+    overall_status: overall,
+    wall_time_ms: completedAt - startedAt,
+    cost_usd: cost,
+    errors,
+    // Derived rate metrics:
+    transcribe_ms_per_min: audioMinutes && txMs ? txMs / audioMinutes : null,
+    transcribe_ms_per_mb: audioMb && txMs ? txMs / audioMb : null,
+    download_ms_per_mb: audioMb && downloadMs ? downloadMs / audioMb : null,
+    analyze_ms_per_min: audioMinutes && analyzeMs ? analyzeMs / audioMinutes : null,
+    analyze_wall_ms_per_min: audioMinutes && analyzeWallMs ? analyzeWallMs / audioMinutes : null,
+    analyze_ms_per_mb: audioMb && analyzeMs ? analyzeMs / audioMb : null,
+  };
+}
+
+// Return the value that occurs most often in `values`, skipping
+// falsy entries; when counts tie, the value seen first wins, and
+// an input with no truthy values yields null. Used to attribute a
+// single backend/model to a job whose rows might disagree.
+function dominant(values) {
+  const tally = Array.from(values).reduce((acc, item) => {
+    if (item) acc.set(item, (acc.get(item) ?? 0) + 1);
+    return acc;
+  }, new Map());
+  // Map iterates in insertion order and the comparison is strict,
+  // so an equal count never displaces an earlier winner.
+  let winner = null;
+  let winnerHits = 0;
+  tally.forEach((hits, candidate) => {
+    if (hits <= winnerHits) return;
+    winner = candidate;
+    winnerHits = hits;
+  });
+  return winner;
+}
+
+// Roll aggregated jobs up into the dashboard's top-of-page summary
+// cards: status counts, success rate, median timings and totals.
+// "partial" jobs count toward success_rate alongside "success";
+// an empty job list reports success_rate 1 and null medians.
+export function summarizeJobs(jobs) {
+  const total = jobs.length;
+  let success = 0;
+  let partial = 0;
+  let failed = 0;
+  let totalCost = 0;
+  let totalAudioSec = 0;
+  // Single pass over the jobs; the sums accumulate in list order.
+  // Jobs with any other overall_status are counted in `total` only.
+  for (const job of jobs) {
+    switch (job.overall_status) {
+      case "success":
+        success += 1;
+        break;
+      case "partial":
+        partial += 1;
+        break;
+      case "failed":
+        failed += 1;
+        break;
+    }
+    totalCost += job.cost_usd || 0;
+    totalAudioSec += job.audio_seconds || 0;
+  }
+  // Median of one numeric field; non-finite values are ignored and
+  // an empty sample yields null.
+  const medianOf = (field) =>
+    median(jobs.map((job) => job[field]).filter(Number.isFinite));
+  return {
+    total,
+    success,
+    partial,
+    failed,
+    success_rate: total === 0 ? 1 : (success + partial) / total,
+    median_wall_time_ms: medianOf("wall_time_ms"),
+    median_transcribe_ms_per_min: medianOf("transcribe_ms_per_min"),
+    median_analyze_ms_per_min: medianOf("analyze_ms_per_min"),
+    total_cost_usd: totalCost,
+    total_audio_hours: totalAudioSec / 3600,
+  };
+}
+
+function median(arr) {
+  // Median (mean of the two middle values for even lengths); null if empty.
+  const count = arr.length;
+  if (!count) return null;
+  const ordered = arr.slice().sort((x, y) => x - y);
+  const upper = Math.trunc(count / 2);
+  return count % 2 ? ordered[upper] : (ordered[upper - 1] + ordered[upper]) / 2;
+}
diff --git a/server/jobs.js b/server/jobs.js
new file mode 100644
index 0000000..7ef5d61
--- /dev/null
+++ b/server/jobs.js
@@ -0,0 +1,219 @@
+// In-memory background-job tracker. Used by /relay/transcribe-url
+// (and any future long-running endpoint) so the request that kicks
+// off the work returns immediately with a job_id, and the client
+// polls /relay/jobs/{id} to find out when it's done.
+//
+// Rationale: synchronous HTTP responses for multi-minute transcribes
+// are fragile. Any intermediate proxy / load balancer / NAT in the
+// path will drop the connection after some idle/total timeout (often
+// 100s–10min), failing the whole job mid-flight even though the
+// relay backend is working fine. Async jobs sidestep all of that:
+// the long-running work happens off the request path and the client
+// polls short, cheap requests until done.
+//
+// Storage is in-process memory. Restart-survivability is a known
+// gap — a relay restart mid-job loses that job's state, and the
+// client will keep re-polling until it gives up. Acceptable for v1
+// at small relay scale; the audit log already captures every
+// completed call so the operator has a paper trail either way.
+// Migrate to SQLite if/when restart-resilience becomes important.
+//
+// Each job is { id, kind, install_id, status, started_at, updated_at,
+//   completed_at?, progress?, result?, error?, error_internal?, metadata, events }
+// status: "queued" | "running" | "complete" | "failed"
+
+import { randomUUID } from "crypto";
+import { sanitizeErrorForClient } from "./sanitize-error.js";
+
+// All in-memory; lost on restart. Keyed by job id.
+const jobs = new Map();
+
+// Cap how long jobs hang around so the map doesn't grow unbounded.
+// Once a client has polled and seen "complete", it'll stop polling —
+// keeping the record 24h gives slow / retried clients a generous
+// window. pruneExpired() ages a job from completed_at, else updated_at / started_at.
+const RETENTION_MS = 24 * 60 * 60 * 1000;
+
+// Register a new background job in the in-memory map and return the
+// live record (status "queued"). Expired jobs are pruned first.
+export function createJob({ kind, installId, metadata = {} }) {
+  pruneExpired();
+  const id = randomUUID();
+  const createdAt = Date.now();
+  // Event log: jobs that stream incremental results over SSE (e.g.
+  // /relay/summarize-url) append { type, data, ts } records here so a
+  // client that connects late can replay what it missed.
+  const events = [];
+  const job = {
+    id,
+    kind,
+    install_id: installId,
+    status: "queued",
+    started_at: createdAt,
+    updated_at: createdAt,
+    completed_at: null,
+    progress: null,
+    result: null,
+    error: null,
+    metadata,
+    events,
+  };
+  // Live subscriber callbacks. Defined non-enumerable (and
+  // non-writable) on purpose so the set is never serialized and never
+  // leaks into snapshotJobs() or HTTP responses.
+  Object.defineProperty(job, "subscribers", {
+    enumerable: false,
+    writable: false,
+    value: new Set(),
+  });
+  jobs.set(id, job);
+  return job;
+}
+
+// Record an event on a job and fan it out to live SSE subscribers.
+// Used by /relay/summarize-url's background worker to emit
+// per-window progress as it streams in from runChunkedAnalysis.
+// Event shape: { type, data, ts } — type is "window_complete" |
+//   "transcribe_complete" | "done" | "error" | "progress", data is
+//   the event payload and ts is ms-epoch.
+// Subscribers receive ONLY the new event; new subscribers should
+// replay job.events themselves on connect. Unknown ids are ignored.
+export function appendEvent(jobId, type, data) {
+  const job = jobs.get(jobId);
+  if (!job) return;
+  const ts = Date.now();
+  const event = { type, data, ts };
+  job.events.push(event);
+  job.updated_at = ts;
+  // Bound the log at 1000 entries (typical jobs emit 10-20) by
+  // dropping the oldest one, so a runaway job can't blow memory.
+  if (job.events.length > 1000) job.events.shift();
+  job.subscribers.forEach((notify) => {
+    try {
+      notify(event);
+    } catch (err) {
+      console.warn(`[jobs] subscriber callback failed: ${err?.message || err}`);
+    }
+  });
+}
+
+// Subscribe `callback` to live events from a job. Returns null when
+// the job no longer exists; otherwise returns an unsubscribe
+// function. The caller MUST call it (e.g., on SSE connection
+// close) or the job record will hold on to the callback closure
+// for as long as the job is retained.
+export function subscribeToJob(jobId, callback) {
+  const target = jobs.get(jobId);
+  if (!target) return null;
+  const { subscribers } = target;
+  subscribers.add(callback);
+  return () => void subscribers.delete(callback);
+}
+
+export function getJob(jobId) {
+  pruneExpired(); // evict expired records first so a stale job reads as null
+  return jobs.get(jobId) ?? null;
+}
+
+// Move a job into the "running" state and refresh updated_at.
+// Unknown job ids are a no-op.
+export function markRunning(jobId) {
+  const record = jobs.get(jobId);
+  if (record) Object.assign(record, { status: "running", updated_at: Date.now() });
+}
+
+// Store a progress message (stringified, capped at 200 chars) and
+// refresh updated_at. Unknown job ids are a no-op.
+export function setProgress(jobId, message) {
+  const record = jobs.get(jobId);
+  if (record) Object.assign(record, { progress: String(message).slice(0, 200), updated_at: Date.now() });
+}
+
+// Mark a job complete, store its result and emit the terminal
+// "done" event. Unknown job ids are a no-op.
+//
+// job.result keeps the FULL envelope exactly as passed (the caller
+// decides its shape — typically { result: {...inner...},
+// credit_charged, tier }) so internal consumers that read
+// job.result directly still see the wrapped form.
+//
+// The "done" event carries the INNER result instead: when the
+// envelope is an object with a `result` key that key is unwrapped,
+// otherwise the value passes through unchanged. credit_charged and
+// tier travel alongside as siblings so an SSE consumer can update
+// its balance display without digging into the result body.
+//
+// Why unwrap: Recap-app's SSE handler does `finalResult =
+// data.result` and then reads `finalResult.title`. With the wrapped
+// envelope that read came back undefined, so library entries
+// persisted as "Untitled" even though the relay had extracted the
+// real title via yt-dlp. The audit log reads the local `title`
+// variable directly and was unaffected, which made the bug look
+// like a Recap-side issue.
+export function markComplete(jobId, envelope) {
+  const job = jobs.get(jobId);
+  if (!job) return;
+  const finishedAt = Date.now();
+  job.status = "complete";
+  job.result = envelope;
+  job.completed_at = finishedAt;
+  job.updated_at = finishedAt;
+  const isWrapped =
+    Boolean(envelope) && typeof envelope === "object" && "result" in envelope;
+  appendEvent(jobId, "done", {
+    result: isWrapped ? envelope.result : envelope,
+    credit_charged: envelope?.credit_charged,
+    tier: envelope?.tier,
+  });
+}
+
+// Mark a job failed and emit the terminal "error" event — SSE
+// clients close on it and surface the error to the user. Unknown
+// job ids are a no-op.
+//
+// The message is sanitized here, at the source, so EVERY surface
+// that reads job.error (SSE error event, the per-job GET endpoints,
+// etc.) gets client-safe wording without each call site having to
+// remember to sanitize. The raw operator-internal text (capped at
+// 500 chars) stays on job.error_internal for the admin dashboard +
+// audit log; snapshotJobs exposes both fields.
+export function markFailed(jobId, errorMessage) {
+  const job = jobs.get(jobId);
+  if (!job) return;
+  job.status = "failed";
+  job.error_internal = String(errorMessage || "unknown error").slice(0, 500);
+  job.error = sanitizeErrorForClient(job.error_internal).slice(0, 500);
+  job.updated_at = job.completed_at = Date.now();
+  appendEvent(jobId, "error", { error: job.error });
+}
+
+// Plain-object summary of every retained job (expired ones are
+// pruned first). Result bodies are left out; has_result only flags
+// their presence. Both error variants are exposed — the admin
+// dashboard consumes this and can prefer error_internal for operator
+// diagnosis (full backend / spark-control wording intact; it falls
+// back to `error` when no internal text was recorded). External
+// callers should always read `error` (sanitized).
+export function snapshotJobs() {
+  pruneExpired();
+  const rows = [];
+  for (const job of jobs.values()) {
+    const { id, kind, install_id, status, started_at } = job;
+    const { updated_at, completed_at, progress, error } = job;
+    const has_result = job.result != null;
+    const error_internal = job.error_internal || error;
+    const head = { id, kind, install_id, status, started_at, updated_at, completed_at, progress };
+    rows.push({ ...head, has_result, error, error_internal });
+  }
+  return rows;
+}
+
+// Evict every job whose most recent timestamp (completed_at, else
+// updated_at, else started_at) is older than RETENTION_MS.
+function pruneExpired() {
+  const cutoff = Date.now() - RETENTION_MS;
+  jobs.forEach((job, id) => {
+    const lastTouched = job.completed_at || job.updated_at || job.started_at;
+    if (lastTouched && lastTouched < cutoff) jobs.delete(id);
+  });
+}
diff --git a/server/meeting-extras.js b/server/meeting-extras.js
new file mode 100644
index 0000000..cfc5c90
--- /dev/null
+++ b/server/meeting-extras.js
@@ -0,0 +1,376 @@
+// Phase 2 of Path 2A — meeting extras analysis.
+//
+// Runs a single LLM pass AFTER transcribe → diarize → cluster →
+// analyze → name-inference → summary-polish complete. Pulls out five
+// categories of structured information that operators consistently
+// want at the top of an internal meeting recap:
+//   - tldr            : 2-4 sentence executive summary + the primary speakers
+//   - decisions       : what was agreed on (with the offset where it was settled)
+//   - action_items    : who owes what, by when (best-effort due_hint)
+//   - open_questions  : questions raised that didn't get resolved
+//   - key_quotes      : notable statements worth surfacing verbatim
+//
+// Decisions, action items and key quotes carry a `supporting_offset`
+// (or `offset`) in seconds so the dashboard can render a clickable
+// jump to that transcript line. Each item also carries speaker IDs
+// (cluster ids like Speaker_A) so the renderer can show the speaker's
+// colored chip + display name, and so an operator-rename or per-line
+// override propagates here too.
+//
+// Returns (tldr is null when the model omits it):
+//   { tldr:           { summary, primary_speakers[] },
+//     decisions:      [{ statement, agreed_by[], supporting_offset }],
+//     action_items:   [{ description, owner, due_hint, supporting_offset }],
+//     open_questions: [{ question, raised_by, answered }],
+//     key_quotes:     [{ speaker, offset, quote, why_notable }],
+//   }
+//
+// or null on total failure. Failure is non-fatal — the meeting still
+// saves with rec.extras = null and the dashboard just hides the
+// extras section.
+
+import { recordCall } from "./audit-log.js";
+
+const EXTRAS_MAX_ATTEMPTS = 3; // total backend.analyzeText tries per meeting (first call + retries)
+// Default prompt; its {{placeholders}} are substituted by fillTemplate() inside runMeetingExtras.
+export const DEFAULT_MEETING_EXTRAS_PROMPT_TEMPLATE = `You are extracting structured information from an internal team meeting transcript. The transcript below has been pre-tagged with speaker labels like [A], [B], [C] (anonymous voice-clustering labels) and inferred real names where available.
+
+MEETING METADATA:
+- Title: {{title}}
+- Duration: {{duration}}
+
+{{operatorContext}}SPEAKERS (from voice clustering, with operator-confirmed names where present):
+{{speakerRoster}}
+
+TOPIC SUMMARIES (already produced — for context only, do not duplicate):
+{{topics}}
+
+TRANSCRIPT (each line is "[<letter> <MM:SS>] text"):
+{{transcript}}
+
+INSTRUCTIONS:
+Extract FIVE categories of information from the meeting. Return EMPTY ARRAYS for categories that don't apply — do NOT invent items.
+
+1. TLDR — A 2-4 sentence executive summary of the entire meeting: what it was about, the key discussion arc, and the bottom-line outcome. Write in past tense, third person. Keep it dense — every clause should carry information. Skip pleasantries and procedural opening/closing chatter. If a meeting was genuinely substanceless (a 3-minute check-in, audio test, etc.), write one factual descriptor sentence instead of padding. This is the only required category — even the most trivial meeting gets a one-sentence TLDR.
+   - summary: the 2-4 sentence executive summary
+   - primary_speakers: array of Speaker_X ids who drove the conversation (the 1-3 people most central to the discussion, in rough order of contribution). Empty array if unclear.
+
+2. DECISIONS — Things explicitly decided / agreed during the meeting. Include only clear commitments ("we will do X", "let's go with Y"), not casual mentions. For each:
+   - statement: the decision in one sentence
+   - agreed_by: array of Speaker_X ids who explicitly agreed (use the chip-letter notation, e.g. ["Speaker_A", "Speaker_C"]). Empty array if unclear.
+   - supporting_offset: integer SECONDS where this decision was made (use the [<letter> <MM:SS>] timestamp from the most relevant transcript line — convert MM:SS to total seconds)
+
+3. ACTION_ITEMS — Specific commitments where someone said they would do something. Include only explicit ownership ("I'll send the doc", "Matt will follow up"), not vague "someone should...". For each:
+   - description: the action in imperative form
+   - owner: the Speaker_X id of the person taking it on (e.g. "Speaker_A"), or null if unclear
+   - due_hint: the deadline as a string if mentioned ("by Friday", "end of week", "before next call"), or null
+   - supporting_offset: integer seconds where the commitment was made
+
+4. OPEN_QUESTIONS — Questions raised that were NOT clearly answered during the meeting. Skip rhetorical questions and questions that got direct answers. For each:
+   - question: the question, rephrased to be self-contained
+   - raised_by: the Speaker_X id who asked (or null if unclear)
+   - answered: false (always — if it was answered, don't include it)
+
+5. KEY_QUOTES — Statements worth surfacing verbatim because they are pivotal, particularly insightful, or capture a strong opinion. Limit to 3-6 quotes max. Skip filler and conversational text. For each:
+   - speaker: the Speaker_X id of the speaker
+   - offset: integer seconds where the quote occurs
+   - quote: the verbatim quote (trim to the substantive sentence, 4-30 words)
+   - why_notable: one short clause on why this is worth surfacing
+
+Be conservative across all five. Better to return an empty array (or for TLDR, a single factual sentence) than to fabricate. A 5-minute small-talk call may legitimately have 0 decisions, 0 action items, 0 open questions, 0 key quotes — but it still gets a TLDR.
+
+Respond with ONLY valid JSON in this exact shape, no other text:
+{
+  "tldr": {"summary": "...", "primary_speakers": ["Speaker_A", "Speaker_B"]},
+  "decisions": [{"statement": "...", "agreed_by": ["Speaker_A"], "supporting_offset": 123}],
+  "action_items": [{"description": "...", "owner": "Speaker_B", "due_hint": "by Friday", "supporting_offset": 234}],
+  "open_questions": [{"question": "...", "raised_by": "Speaker_C", "answered": false}],
+  "key_quotes": [{"speaker": "Speaker_A", "offset": 345, "quote": "...", "why_notable": "..."}]
+}`;
+
+// Fill {{key}} from OWN keys of `vars`; inherited names (e.g. {{constructor}}) and unknown keys stay as {{key}}.
+function fillTemplate(template, vars) {
+  const has = (key) => Object.prototype.hasOwnProperty.call(vars, key);
+  return String(template || "").replace(/\{\{\s*(\w+)\s*\}\}/g, (_m, key) => (has(key) ? String(vars[key]) : `{{${key}}}`));
+}
+
+// Humanize seconds as "1h 2m 3s", "2m 3s" or "3s" (fractions floored; falsy or negative input gives "0s").
+function formatDuration(seconds) {
+  const whole = Math.max(0, Math.floor(seconds || 0));
+  const hours = Math.floor(whole / 3600);
+  const minutes = Math.floor((whole % 3600) / 60);
+  const tail = `${whole % 60}s`;
+  if (hours > 0) return `${hours}h ${minutes}m ${tail}`;
+  return minutes > 0 ? `${minutes}m ${tail}` : tail;
+}
+
+// Render segments as prompt lines "[<letter> <M:SS>] text", skipping
+// blank ones. <letter> is the suffix of a Speaker_<LETTERS> label
+// ("?" otherwise); minutes are neither padded nor wrapped at 60.
+function formatLabeledTranscript(segments) {
+  if (!Array.isArray(segments) || segments.length === 0) return "";
+  return segments
+    .map((seg) => {
+      const body = (seg.text || "").trim();
+      if (!body) return null;
+      const label = /^Speaker_([A-Z]+)$/.exec(String(seg.speaker || ""));
+      const whole = Math.floor(seg.start || 0);
+      const stamp = `${Math.floor(whole / 60)}:${String(whole % 60).padStart(2, "0")}`;
+      return `[${label ? label[1] : "?"} ${stamp}] ${body}`;
+    })
+    .filter((line) => line !== null)
+    .join("\n");
+}
+
+// Trim a too-large transcript by keeping the head and tail — the
+// opening (introductions, agenda) and closing (wrap-up, next steps)
+// are where most extras-worthy content lives. Each half gives up 50
+// chars so the result, marker included, stays within maxChars. When
+// that leaves no room (maxChars <= 101) fall back to a plain head
+// cut: a zero/negative `half` would make the slices return MORE text.
+function capTranscript(text, maxChars) {
+  if (text.length <= maxChars) return text;
+  const half = Math.floor(maxChars / 2) - 50;
+  if (half <= 0) return text.slice(0, Math.max(0, maxChars));
+  return `${text.slice(0, half)}\n\n…[middle truncated for prompt length]…\n\n${text.slice(-half)}`;
+}
+
+// Parse and sanitize the extras JSON returned by the LLM.
+//
+// Accepts raw JSON or JSON wrapped in a ``` / ```json fence. Returns
+// null when the text is empty, not a string, not parseable, or does
+// not parse to an object. Otherwise every category is coerced to a
+// known shape: malformed entries are dropped (they never fail the
+// whole pass), strings are trimmed and length-capped, speaker ids
+// must match Speaker_<LETTERS>, offsets become non-negative integers
+// (or null), and each list is capped (20 decisions, 30 action items,
+// 20 open questions, 10 key quotes).
+function safeParseExtras(text) {
+  if (!text || typeof text !== "string") return null;
+  const fenced = text.trim().match(/```(?:json)?\s*([\s\S]*?)```/);
+  const payload = fenced ? fenced[1].trim() : text.trim();
+  let parsed;
+  try {
+    parsed = JSON.parse(payload);
+  } catch {
+    return null;
+  }
+  if (!parsed || typeof parsed !== "object") return null;
+
+  // Field-level coercion helpers shared by all categories.
+  const isSpeakerId = (v) => typeof v === "string" && /^Speaker_[A-Z]+$/.test(v);
+  const speakerOrNull = (v) => (isSpeakerId(v) ? v : null);
+  const speakerList = (v, max) => (Array.isArray(v) ? v.filter((x) => isSpeakerId(x)).slice(0, max) : []);
+  const trimmed = (v) => (typeof v === "string" ? v.trim() : "");
+  const offsetOrNull = (v) => (Number.isFinite(v) ? Math.max(0, Math.floor(v)) : null);
+  // Map every object entry through `build`, drop rejects, cap the list.
+  const collect = (list, max, build) =>
+    (Array.isArray(list) ? list : [])
+      .map((item) => (item && typeof item === "object" ? build(item) : null))
+      .filter(Boolean)
+      .slice(0, max);
+
+  // TLDR is a single object, not a list. It stays null when missing,
+  // malformed or blank so the renderer can show "TLDR unavailable"
+  // rather than a fabricated summary.
+  let tldr = null;
+  const rawTldr = parsed.tldr;
+  if (rawTldr && typeof rawTldr === "object" && !Array.isArray(rawTldr)) {
+    const summary = trimmed(rawTldr.summary);
+    if (summary) {
+      tldr = {
+        summary: summary.slice(0, 800),
+        primary_speakers: speakerList(rawTldr.primary_speakers, 5),
+      };
+    }
+  }
+
+  const decisions = collect(parsed.decisions, 20, (d) => {
+    const statement = trimmed(d.statement);
+    if (!statement) return null;
+    return {
+      statement: statement.slice(0, 400),
+      agreed_by: speakerList(d.agreed_by, 10),
+      supporting_offset: offsetOrNull(d.supporting_offset),
+    };
+  });
+  const action_items = collect(parsed.action_items, 30, (a) => {
+    const description = trimmed(a.description);
+    if (!description) return null;
+    return {
+      description: description.slice(0, 400),
+      owner: speakerOrNull(a.owner),
+      due_hint: trimmed(a.due_hint).slice(0, 80) || null,
+      supporting_offset: offsetOrNull(a.supporting_offset),
+    };
+  });
+  const open_questions = collect(parsed.open_questions, 20, (q) => {
+    const question = trimmed(q.question);
+    if (!question) return null;
+    return {
+      question: question.slice(0, 400),
+      raised_by: speakerOrNull(q.raised_by),
+      answered: q.answered === true,
+    };
+  });
+  const key_quotes = collect(parsed.key_quotes, 10, (q) => {
+    const quote = trimmed(q.quote);
+    if (!quote) return null;
+    return {
+      speaker: speakerOrNull(q.speaker),
+      offset: offsetOrNull(q.offset),
+      quote: quote.slice(0, 400),
+      why_notable: trimmed(q.why_notable).slice(0, 200),
+    };
+  });
+
+  return { tldr, decisions, action_items, open_questions, key_quotes };
+}
+
+// Run the single-pass "meeting extras" LLM extraction for one meeting. Resolves to the
+// sanitized extras object, or null when there is no backend, no transcript segments, or
+// every attempt failed. Each run that reaches the LLM writes one audit row via recordCall.
+export async function runMeetingExtras({
+  title,
+  audioSec,
+  speakers,
+  speakerNames,
+  transcriptSegments,
+  topics, // array of { title, summary, startTime } from analyze-then-polish
+  promptOverride = "", // a non-blank string replaces DEFAULT_MEETING_EXTRAS_PROMPT_TEMPLATE
+  // Operator-supplied hints (internal meetings only): participantHints
+  // is a CSV-ish string of expected attendees, operatorNotes free-form
+  // prose on who said what. Both are rendered as soft hints to verify
+  // against the transcript; when both are empty no OPERATOR HINTS block appears.
+  participantHints = "",
+  operatorNotes = "",
+  backend,
+  pipelineBackend,
+  jobId,
+  installId,
+  licenseFingerprint = null,
+  source,
+  computeCostDetails,
+}) {
+  if (!backend) return null;
+  if (!Array.isArray(transcriptSegments) || transcriptSegments.length === 0) return null;
+
+  // Build speaker roster — Speaker_A (chip A, 12m 34s, "Matt Hill")
+  const speakerLetters = Object.keys(speakers || {})
+    .filter((k) => /^Speaker_[A-Z]+$/.test(k))
+    .sort();
+  const speakerRoster = speakerLetters
+    .map((k) => {
+      const stats = speakers[k] || {};
+      const secs = Math.round(stats.total_speaking_seconds || 0);
+      const mins = Math.floor(secs / 60);
+      const rem = secs % 60;
+      const timeStr = mins > 0 ? `${mins}m ${rem}s` : `${rem}s`;
+      const letter = k.replace("Speaker_", "");
+      const name = speakerNames && speakerNames[k] ? `"${speakerNames[k]}"` : "(unknown)";
+      return `- ${k} (chip [${letter}], ${timeStr} speaking, ${stats.turns || 0} turns): ${name}`;
+    })
+    .join("\n");
+
+  const topicsBlock = Array.isArray(topics) && topics.length
+    ? topics
+        .map((t, i) => {
+          const startSec = t.startTime || 0;
+          const mm = Math.floor(startSec / 60);
+          const ss = Math.floor(startSec % 60);
+          const tStr = `${mm}:${String(ss).padStart(2, "0")}`;
+          return `${i + 1}. [${tStr}] ${t.title || "(untitled)"} — ${t.summary || ""}`;
+        })
+        .join("\n")
+    : "(no topics)";
+
+  const fullTranscript = formatLabeledTranscript(transcriptSegments);
+  const cappedTranscript = capTranscript(fullTranscript, 25000); // head + tail only once past 25,000 chars
+
+  // Compose the OPERATOR HINTS block — same shape as the name-inference
+  // pipeline for consistent framing across both passes. Empty when no hints.
+  const hintsParts = [];
+  if (participantHints && String(participantHints).trim()) {
+    hintsParts.push(
+      `Possible participants in this meeting (operator-supplied — may be incomplete):\n${String(participantHints).trim()}`,
+    );
+  }
+  if (operatorNotes && String(operatorNotes).trim()) {
+    const trimmed = String(operatorNotes).trim().slice(0, 4000);
+    hintsParts.push(
+      `Operator notes (may describe who said what — use as soft context, verify against the transcript before extracting decisions / action items / quotes):\n${trimmed}`,
+    );
+  }
+  const operatorContextBlock = hintsParts.length
+    ? `OPERATOR HINTS (treat as suggestions only — verify against the transcript):\n\n${hintsParts.join("\n\n")}\n\n`
+    : "";
+
+  const templateSource =
+    typeof promptOverride === "string" && promptOverride.trim()
+      ? promptOverride
+      : DEFAULT_MEETING_EXTRAS_PROMPT_TEMPLATE;
+  const prompt = fillTemplate(templateSource, {
+    title: title || "(untitled)",
+    duration: formatDuration(audioSec),
+    operatorContext: operatorContextBlock,
+    speakerRoster: speakerRoster || "(no speakers identified)",
+    topics: topicsBlock,
+    transcript: cappedTranscript || "(empty)",
+  });
+
+  const t0 = Date.now();
+  let r = null;
+  let parsed = null;
+  let lastErr = null;
+  for (let attempt = 0; attempt < EXTRAS_MAX_ATTEMPTS; attempt++) {
+    try {
+      r = await backend.analyzeText({ prompt });
+      parsed = safeParseExtras(r.text);
+      if (parsed) {
+        lastErr = null;
+        break;
+      }
+      lastErr = "invalid JSON in extras response";
+    } catch (err) {
+      lastErr = (err?.message || String(err)).slice(0, 280);
+      r = null; // a thrown attempt leaves no response, so the audit row reports model: null
+    }
+    if (attempt < EXTRAS_MAX_ATTEMPTS - 1) {
+      console.warn(
+        `[meeting-extras] attempt ${attempt + 1} failed (${lastErr}) — retrying`
+      );
+    }
+  }
+  const dur = Date.now() - t0; // wall time across every attempt
+  const cost = // only a successful attempt's usage is costed; failed runs are logged at zero
+    parsed && r
+      ? computeCostDetails(r.model, r.usage)
+      : { input_tokens: 0, output_tokens: 0, thinking_tokens: 0, cost_usd: 0 };
+  await recordCall({
+    install_id: installId,
+    license_fingerprint: licenseFingerprint,
+    tier: "core",
+    pipeline: "meeting_extras",
+    backend: pipelineBackend,
+    model: r?.model || null,
+    status: parsed ? "success" : "error",
+    duration_ms: dur,
+    audio_seconds: 0,
+    job_id: jobId,
+    batch_id: null,
+    source,
+    media_url: null,
+    error: parsed ? null : lastErr || "extras analysis failed",
+    ...cost,
+  });
+  if (!parsed) {
+    console.warn(
+      `[meeting-extras] all ${EXTRAS_MAX_ATTEMPTS} attempts failed (${lastErr}) — extras unavailable`
+    );
+    return null;
+  }
+  console.log(
+    `[meeting-extras] extracted ${parsed.tldr ? "tldr + " : "(no tldr) + "}${parsed.decisions.length} decision(s), ${parsed.action_items.length} action(s), ${parsed.open_questions.length} question(s), ${parsed.key_quotes.length} quote(s) in ${(dur / 1000).toFixed(1)}s`
+  );
+  return parsed;
+}
diff --git a/server/meeting-speaker-edits.js b/server/meeting-speaker-edits.js
new file mode 100644
index 0000000..0d446f8
--- /dev/null
+++ b/server/meeting-speaker-edits.js
@@ -0,0 +1,359 @@
+// Post-hoc speaker edits for saved internal meetings.
+//
+// Two operator tools that mutate a saved meeting record in place,
+// without re-uploading audio or hitting Spark Control:
+//
+//   mergeSpeakersInRecord  — fold one or more clusters that diarization
+//                            mistakenly split apart into a single speaker.
+//   reclusterMeetingRecord — re-run the cross-chunk voice clustering at a
+//                            new strictness threshold to separate two
+//                            people who were over-merged into one cluster.
+//                            Pure offline re-clustering off the persisted
+//                            per-chunk fingerprints (rec.diarization).
+//
+// Both must keep the FOUR places a speaker label lives in sync:
+//   1. rec.transcript_segments[].speaker
+//   2. rec.chunks[].entries[].speaker  (+ .speaker_override)
+//   3. rec.speakers          (per-cluster stats map)
+//   4. rec.extras            (tldr.primary_speakers, decisions.agreed_by,
+//                             action_items.owner, key_quotes.speaker)
+// plus rec.speaker_names (display-name map).
+
+import {
+  clusterSpeakers,
+  assignSpeakersToSegments,
+} from "./speaker-clustering.js";
+
+// ─── Entry speaker backfill ─────────────────────────────────────────
+// Re-derive each chunk entry's speaker from rec.transcript_segments by
+// timestamp. Used (a) on load to repair pre-diarization records and
+// (b) after a re-cluster re-stamps the segments. By default it only
+// fills entries that LACK a speaker (the load-path use); pass
+// { force: true } to re-stamp every entry (the re-cluster use, after
+// the old labels have been cleared).
+//
+// Matching mirrors the pipeline's original offset→segment logic
+// (internal-meetings.js build path): exact floored-start, then a
+// containing segment within ±0.5s, then nearest preceding within 5s.
+//
+// Mutates rec in place and returns nothing. An entry with no matching
+// labeled segment keeps whatever speaker fields it already had. Null
+// holes in rec.chunks, chunk.entries or rec.transcript_segments are
+// skipped instead of aborting the whole pass with a TypeError.
+export function backfillEntrySpeakers(rec, { force = false } = {}) {
+  if (!rec || !Array.isArray(rec.chunks) || !Array.isArray(rec.transcript_segments)) {
+    return;
+  }
+  if (!force) {
+    // Load-path fast exit: nothing to do when every entry is labeled.
+    const needsBackfill = rec.chunks.some((c) =>
+      Array.isArray(c?.entries) && c.entries.some((e) => !e || !e.speaker)
+    );
+    if (!needsBackfill) return;
+  }
+
+  // Sorted copy (filter() already copies) so the scans below can stop
+  // early; the record's own segment order is left untouched.
+  const segs = rec.transcript_segments
+    .filter((seg) => seg && typeof seg === "object")
+    .sort((a, b) => (a.start || 0) - (b.start || 0));
+
+  // First segment seen for each whole-second start.
+  const byFlooredStart = new Map();
+  for (const seg of segs) {
+    const k = Math.floor(seg.start || 0);
+    if (!byFlooredStart.has(k)) byFlooredStart.set(k, seg);
+  }
+
+  const pickSpeaker = (t) => {
+    // 1. Exact hit on the floored start second.
+    const exact = byFlooredStart.get(t);
+    if (exact && exact.speaker) return exact;
+    // 2. First labeled segment whose span, padded by 0.5s, contains t.
+    for (const seg of segs) {
+      if ((seg.start || 0) > t + 5) break;
+      if ((seg.start || 0) - 0.5 <= t && t <= (seg.end || 0) + 0.5) {
+        if (seg.speaker) return seg;
+      }
+    }
+    // 3. Nearest labeled segment starting at or before t, within 5s.
+    let bestPrev = null;
+    let bestDist = Infinity;
+    for (const seg of segs) {
+      if ((seg.start || 0) > t) break;
+      const dist = t - (seg.start || 0);
+      if (dist < bestDist && seg.speaker) {
+        bestDist = dist;
+        bestPrev = seg;
+      }
+    }
+    if (bestPrev && bestDist <= 5) return bestPrev;
+    return null;
+  };
+
+  for (const chunk of rec.chunks) {
+    if (!Array.isArray(chunk?.entries)) continue;
+    for (const entry of chunk.entries) {
+      // The needsBackfill probe above already treats null entries as
+      // possible; they have nothing to stamp, so skip them here too.
+      if (!entry || typeof entry !== "object") continue;
+      if (!force && entry.speaker) continue;
+      const t = entry.offset || 0;
+      const found = pickSpeaker(t);
+      if (found && found.speaker) {
+        entry.speaker = found.speaker;
+        entry.speaker_confidence = found.speaker_confidence ?? null;
+        entry.speaker_uncertain = !!found.speaker_uncertain;
+      }
+    }
+  }
+}
+
+// ─── Merge speakers ─────────────────────────────────────────────────
+// Fold each cluster in `absorbed` into `survivor`. Rewrites every label
+// reference, sums the stats, inherits the absorbed display name only
+// when the survivor has none, and rewrites extras attributions.
+// Remaining letters are intentionally NOT renumbered — that would
+// cascade through speaker_names + per-line overrides for no real gain.
+//
+// Params:
+//   rec      — saved meeting record; mutated in place.
+//   survivor — id (string) of the cluster that remains; must be an own
+//              key of rec.speakers.
+//   absorbed — array of ids to fold into the survivor (duplicates are
+//              ignored); each must be an own key of rec.speakers and
+//              differ from the survivor.
+//
+// Returns { changed, speakers, speaker_names } where `changed` counts
+// the segment / entry / override labels that were rewritten.
+// Throws a BAD_REQUEST-coded error (see badRequest) on invalid input;
+// all validation happens before the record is touched.
+export function mergeSpeakersInRecord(rec, survivor, absorbed) {
+  if (!rec || typeof rec !== "object") {
+    throw badRequest("record required");
+  }
+  const speakers = rec.speakers && typeof rec.speakers === "object" ? rec.speakers : {};
+  const absorbList = Array.isArray(absorbed) ? [...new Set(absorbed)] : [];
+
+  // Ids are caller-supplied, so only OWN string keys of the roster
+  // count. A bare `speakers[id]` lookup also accepts inherited names
+  // such as "constructor", which would then have stats merged into
+  // Object itself; a non-string id would pass the lookup through key
+  // coercion yet never match the string labels rewritten below.
+  const isSpeaker = (id) =>
+    typeof id === "string" &&
+    Object.prototype.hasOwnProperty.call(speakers, id) &&
+    Boolean(speakers[id]);
+
+  if (!isSpeaker(survivor)) {
+    throw badRequest("survivor must be an existing speaker id");
+  }
+  if (absorbList.length === 0) {
+    throw badRequest("absorbed must list at least one speaker id");
+  }
+  for (const x of absorbList) {
+    if (x === survivor) throw badRequest("cannot merge a speaker into itself");
+    if (!isSpeaker(x)) throw badRequest(`unknown speaker id: ${String(x)}`);
+  }
+  // The loop above guarantees the survivor is not in the absorbed
+  // set, so no further "survivor must remain" check is needed.
+
+  const absorbedSet = new Set(absorbList);
+  let changed = 0;
+
+  // 1. transcript_segments
+  for (const seg of rec.transcript_segments || []) {
+    if (seg && absorbedSet.has(seg.speaker)) {
+      seg.speaker = survivor;
+      changed += 1;
+    }
+  }
+
+  // 2. chunk entries (+ per-line overrides)
+  for (const chunk of rec.chunks || []) {
+    for (const entry of chunk.entries || []) {
+      if (!entry) continue;
+      if (absorbedSet.has(entry.speaker)) {
+        entry.speaker = survivor;
+        changed += 1;
+      }
+      if (absorbedSet.has(entry.speaker_override)) {
+        entry.speaker_override = survivor;
+        changed += 1;
+      }
+    }
+  }
+
+  // 3. stats + display name
+  rec.speaker_names = rec.speaker_names && typeof rec.speaker_names === "object"
+    ? rec.speaker_names
+    : {};
+  for (const x of absorbList) {
+    mergeStats(speakers[survivor], speakers[x]);
+    delete speakers[x];
+    // Survivor inherits the absorbed name only if it has none of its own.
+    if (!rec.speaker_names[survivor] && rec.speaker_names[x]) {
+      rec.speaker_names[survivor] = rec.speaker_names[x];
+    }
+    if (x in rec.speaker_names) delete rec.speaker_names[x];
+  }
+
+  // 4. extras attributions
+  remapExtrasSpeakers(rec.extras, (id) => (absorbedSet.has(id) ? survivor : id));
+
+  rec.meta = rec.meta || {};
+  rec.meta.speakers_merged_at = Date.now();
+
+  return { changed, speakers: rec.speakers, speaker_names: rec.speaker_names };
+}
+
+// ─── Re-cluster (re-run diarization) ────────────────────────────────
+// Offline re-run of the cross-chunk clustering over the fingerprints
+// persisted in rec.diarization, at a caller-chosen threshold (plus the
+// optional suppression knobs in opts). Every segment and entry is
+// re-stamped, and the attribution data that no longer lines up with
+// the new clusters (display names, per-line overrides, extras speaker
+// tags) is wiped so the operator re-labels from scratch. No LLM calls.
+//
+// opts: { threshold, anchorMinSpeakingSec, smallClusterMaxSpeakingSec,
+//         uncertainMarginPct } — all forwarded to clusterSpeakers as-is.
+//
+// Returns { speakers, clusterCount, threshold }. Throws an error with
+// code "NO_FINGERPRINTS" when the record carries no usable fingerprints,
+// and a BAD_REQUEST error when rec is not an object.
+export function reclusterMeetingRecord(rec, opts = {}) {
+  if (!rec || typeof rec !== "object") throw badRequest("record required");
+
+  const diar = Array.isArray(rec.diarization) ? rec.diarization : [];
+
+  // Only chunks flagged ok contribute fingerprints.
+  let fingerprintTotal = 0;
+  for (const d of diar) {
+    if (d && d.ok) fingerprintTotal += Object.keys(d.fingerprints || {}).length;
+  }
+  if (fingerprintTotal === 0) {
+    const noFingerprints = new Error(
+      "this meeting has no saved voice fingerprints — it predates fingerprint capture or was processed with diarization off, so it can't be re-clustered"
+    );
+    noFingerprints.code = "NO_FINGERPRINTS";
+    throw noFingerprints;
+  }
+
+  const {
+    threshold,
+    anchorMinSpeakingSec,
+    smallClusterMaxSpeakingSec,
+    uncertainMarginPct,
+  } = opts;
+  const clustering = clusterSpeakers(diar, threshold, {
+    anchorMinSpeakingSec,
+    smallClusterMaxSpeakingSec,
+    uncertainMarginPct,
+  });
+  const { globalMap, uncertaintyMap, speakers, clusterCount } = clustering;
+
+  // Step 1: stamp the flat segment list from the fresh clustering.
+  if (Array.isArray(rec.transcript_segments)) {
+    assignSpeakersToSegments(rec.transcript_segments, diar, globalMap, uncertaintyMap);
+  }
+
+  // Step 2: blank every entry's speaker fields (and drop any per-line
+  // override), then re-derive them from the segments stamped above.
+  for (const chunk of rec.chunks || []) {
+    for (const entry of chunk.entries || []) {
+      if (!entry) continue;
+      entry.speaker = null;
+      entry.speaker_confidence = null;
+      entry.speaker_uncertain = false;
+      if ("speaker_override" in entry) {
+        delete entry.speaker_override;
+      }
+    }
+  }
+  backfillEntrySpeakers(rec, { force: true });
+
+  // Step 3: install the new roster and discard stale names/attributions.
+  rec.speakers = speakers;
+  rec.speaker_names = {};
+  resetExtrasSpeakers(rec.extras);
+
+  // NOTE(review): the recorded threshold is the clamped value, while
+  // clusterSpeakers above received the raw opts.threshold — confirm the
+  // two agree for out-of-range or missing input.
+  const recordedThreshold = clampPct(threshold);
+  rec.meta = rec.meta || {};
+  rec.meta.reclustered_at = Date.now();
+  rec.meta.recluster_threshold = recordedThreshold;
+  rec.meta.polish_done = false;
+
+  return { speakers, clusterCount, threshold: rec.meta.recluster_threshold };
+}
+
+// ─── Apply re-polished summaries ────────────────────────────────────
+// Write the output of a re-polish pass back into a saved record:
+//   - rec.analysis.sections is replaced with polishedSections
+//     (rec.analysis is created when absent or not an object);
+//   - each rec.chunks[].summary is refreshed from the section that
+//     shares its title.
+// Sections with the same title form a queue that chunks consume in
+// order; once a queue is exhausted, later chunks with that title reuse
+// its last summary. Non-string titles are treated as "". Empty
+// summaries never overwrite a chunk. Chunk entries and per-line
+// overrides are not touched.
+//
+// Returns the number of chunk summaries whose text actually changed
+// (0 when rec is not an object or polishedSections is not an array).
+export function applyPolishedSummaries(rec, polishedSections) {
+  const usable = rec && typeof rec === "object" && Array.isArray(polishedSections);
+  if (!usable) return 0;
+
+  const hasAnalysis = rec.analysis && typeof rec.analysis === "object";
+  if (hasAnalysis) {
+    rec.analysis.sections = polishedSections;
+  } else {
+    rec.analysis = { sections: polishedSections };
+  }
+
+  const titleOf = (item) => (item && typeof item.title === "string" ? item.title : "");
+
+  // title → summaries, in the order the sections were given.
+  const queues = new Map();
+  for (const section of polishedSections) {
+    const title = titleOf(section);
+    const text = section && typeof section.summary === "string" ? section.summary : "";
+    const queue = queues.get(title);
+    if (queue) {
+      queue.push(text);
+    } else {
+      queues.set(title, [text]);
+    }
+  }
+
+  // title → how many chunks with that title have been served so far.
+  const cursor = new Map();
+  let changed = 0;
+  for (const chunk of rec.chunks || []) {
+    if (!chunk) continue;
+    const title = titleOf(chunk);
+    const queue = queues.get(title);
+    if (!queue || queue.length === 0) continue;
+
+    const position = cursor.get(title) || 0;
+    cursor.set(title, position + 1);
+
+    const next = queue[Math.min(position, queue.length - 1)];
+    if (next && chunk.summary !== next) {
+      chunk.summary = next;
+      changed += 1;
+    }
+  }
+  return changed;
+}
+
+// ─── helpers ────────────────────────────────────────────────────────
+
+// Build (but do not throw) an Error carrying code "BAD_REQUEST";
+// callers in this file throw the returned value.
+function badRequest(message) {
+  return Object.assign(new Error(message), { code: "BAD_REQUEST" });
+}
+
+// Normalize a strictness threshold to a whole percent in [50, 95].
+// Anything that is not a finite number (or a numeric string) yields
+// the default 70. null, "", blank strings, booleans and arrays are
+// treated as "not provided": Number() would coerce most of them to 0,
+// which used to be clamped to 50 instead of falling back to 70.
+function clampPct(v) {
+  const provided =
+    typeof v === "number" || (typeof v === "string" && v.trim() !== "");
+  const n = provided ? Number(v) : NaN;
+  if (!Number.isFinite(n)) return 70;
+  return Math.max(50, Math.min(95, Math.round(n)));
+}
+
+// Fold the per-cluster stats of `from` into `into`, mutating `into`.
+//   turns, total_speaking_seconds, fingerprint_count — summed (speaking
+//     time is rounded to one decimal);
+//   mean_confidence — weighted by turns when both sides have a numeric
+//     value (plain average if neither has any turns); otherwise
+//     whichever side has one, else null;
+//   chunks_appeared_in — the larger of the two, a safe approximation
+//     since the raw per-cluster chunk sets aren't retained.
+// Does nothing when either argument is missing.
+function mergeStats(into, from) {
+  if (!into || !from) return;
+
+  const numberOrNull = (v) => (typeof v === "number" ? v : null);
+  const intoTurns = into.turns || 0;
+  const fromTurns = from.turns || 0;
+  const intoConf = numberOrNull(into.mean_confidence);
+  const fromConf = numberOrNull(from.mean_confidence);
+
+  let blended;
+  if (intoConf === null) {
+    blended = fromConf; // may itself be null
+  } else if (fromConf === null) {
+    blended = intoConf;
+  } else {
+    const totalTurns = intoTurns + fromTurns;
+    blended =
+      totalTurns > 0
+        ? (intoConf * intoTurns + fromConf * fromTurns) / totalTurns
+        : (intoConf + fromConf) / 2;
+  }
+
+  const seconds = (into.total_speaking_seconds || 0) + (from.total_speaking_seconds || 0);
+
+  into.turns = intoTurns + fromTurns;
+  into.total_speaking_seconds = Math.round(seconds * 10) / 10;
+  into.fingerprint_count = (into.fingerprint_count || 0) + (from.fingerprint_count || 0);
+  into.chunks_appeared_in = Math.max(into.chunks_appeared_in || 0, from.chunks_appeared_in || 0);
+  into.mean_confidence = blended;
+}
+
+// Pass every speaker id stored in the extras block through `map`
+// (old id → new id), editing extras in place. List-valued fields
+// (tldr.primary_speakers, decisions[].agreed_by) are de-duplicated
+// after mapping; single-valued fields (action_items[].owner,
+// key_quotes[].speaker) are mapped only when currently truthy.
+// A missing or non-object extras is a no-op.
+function remapExtrasSpeakers(extras, map) {
+  const usable = extras && typeof extras === "object";
+  if (!usable) return;
+
+  const remapList = (ids) => dedupe(ids.map(map));
+
+  const { tldr } = extras;
+  if (tldr && Array.isArray(tldr.primary_speakers)) {
+    tldr.primary_speakers = remapList(tldr.primary_speakers);
+  }
+
+  for (const decision of arr(extras.decisions)) {
+    if (!Array.isArray(decision.agreed_by)) continue;
+    decision.agreed_by = remapList(decision.agreed_by);
+  }
+
+  for (const item of arr(extras.action_items)) {
+    if (item.owner) {
+      item.owner = map(item.owner);
+    }
+  }
+
+  for (const quote of arr(extras.key_quotes)) {
+    if (quote.speaker) {
+      quote.speaker = map(quote.speaker);
+    }
+  }
+}
+
+// Blank out every speaker attribution in the extras block while
+// leaving its text alone: list fields become [], single fields become
+// null. Used by re-cluster, where cluster identities change and the
+// old ids would be meaningless. A missing or non-object extras is a
+// no-op.
+function resetExtrasSpeakers(extras) {
+  const usable = extras && typeof extras === "object";
+  if (!usable) return;
+
+  if (extras.tldr) {
+    extras.tldr.primary_speakers = [];
+  }
+  for (const decision of arr(extras.decisions)) {
+    decision.agreed_by = [];
+  }
+  for (const item of arr(extras.action_items)) {
+    item.owner = null;
+  }
+  for (const quote of arr(extras.key_quotes)) {
+    quote.speaker = null;
+  }
+}
+
+// Return v unchanged when it is an array, otherwise a fresh empty
+// array, so callers can iterate optional list fields unconditionally.
+function arr(v) {
+  if (Array.isArray(v)) return v;
+  return [];
+}
+
+// Copy of `list` with repeated values removed, keeping first-seen order.
+function dedupe(list) {
+  const unique = new Set(list);
+  return Array.from(unique);
+}
diff --git a/server/output-store.js b/server/output-store.js
new file mode 100644
index 0000000..1811dfd
--- /dev/null
+++ b/server/output-store.js
@@ -0,0 +1,163 @@
+// Per-job output storage. After a transcribe + analyze cycle
+// completes, the worker calls saveJobOutput() to persist the
+// transcript + analysis JSON to /data/relay-outputs/<job_id>.json.
+// The operator dashboard surfaces these as a "View" link per job
+// that opens a Recap-style two-pane render in a new tab.
+//
+// Storage policy:
+//   - Test-run jobs (source = "admin-test") are ALWAYS saved
+//   - Real-user jobs are saved only when relay_save_user_outputs
+//     is true in the operator config (default false for privacy)
+//
+// Storage format (per file):
+//   {
+//     job_id: string
+//     batch_id: string | null
+//     source: "admin-test" | null
+//     saved_at: ms-epoch
+//     transcript: string ("[MM:SS] line\n[MM:SS] line...")
+//     analysis: { sections: [{title, summary, startIndex, endIndex}, ...] }
+//     meta: {
+//       title, media_url, audio_seconds, audio_bytes,
+//       transcribe_backend, transcribe_model,
+//       analyze_backend, analyze_model,
+//       transcribe_ms, analyze_ms, wall_time_ms,
+//       captions_mode
+//     }
+//   }
+//
+// Files are simple JSON — no index, no DB. Listing scans the dir;
+// deletion just rm's the file. Cheap up to thousands of entries; if
+// the operator hits scale, swap in a SQLite index without changing
+// the on-disk format.
+
+import fs from "fs/promises";
+import path from "path";
+
+// Directory the per-job JSON files live in. This default is replaced
+// by initOutputStore(), which points it at <dataDir>/relay-outputs.
+let outputDir = "/data/relay-outputs";
+
+// Point the store at <dataDir>/relay-outputs and make sure that
+// directory exists (created recursively with mode 0o700). A mkdir
+// failure is only logged; the target path is logged either way.
+export async function initOutputStore({ dataDir }) {
+  outputDir = path.join(dataDir, "relay-outputs");
+  await fs.mkdir(outputDir, { recursive: true, mode: 0o700 }).catch((err) => {
+    console.warn(`[output-store] mkdir failed: ${err?.message || err}`);
+  });
+  console.log(`[output-store] writing to ${outputDir}`);
+}
+
+// Map a job id to its file path inside the output directory. Every
+// character outside [a-zA-Z0-9_-] is dropped first, so the id cannot
+// carry path separators or dots that would escape the directory even
+// if the upstream ID generator changes. Throws Error("invalid job_id")
+// when nothing is left after filtering.
+function pathFor(jobId) {
+  const cleaned = String(jobId || "").replace(/[^a-zA-Z0-9_-]/g, "");
+  if (cleaned.length === 0) {
+    throw new Error("invalid job_id");
+  }
+  const fileName = `${cleaned}.json`;
+  return path.join(outputDir, fileName);
+}
+
+// Persist one job's transcript + analysis as pretty-printed JSON
+// (file mode 0o600). The stored object starts with job_id and
+// saved_at; payload keys are spread afterwards, so a payload that
+// carries either key overrides it. Best-effort: any failure (bad id,
+// write error) is logged and swallowed — the audit log remains the
+// source of truth for whether the job ran.
+export async function saveJobOutput(jobId, payload) {
+  try {
+    const target = pathFor(jobId);
+    const record = { job_id: jobId, saved_at: Date.now(), ...payload };
+    await fs.writeFile(target, JSON.stringify(record, null, 2), { mode: 0o600 });
+  } catch (err) {
+    const reason = err?.message || err;
+    console.warn(`[output-store] save failed for ${jobId}: ${reason}`);
+  }
+}
+
+// Load and parse one job's stored output. Resolves to null when the
+// file is missing (the route layer should turn that into a 404) and
+// also on any other failure — invalid id, read error, unparsable
+// JSON — in which case a warning is logged first.
+export async function getJobOutput(jobId) {
+  try {
+    const text = await fs.readFile(pathFor(jobId), "utf8");
+    return JSON.parse(text);
+  } catch (err) {
+    if (err.code !== "ENOENT") {
+      const reason = err?.message || err;
+      console.warn(`[output-store] read failed for ${jobId}: ${reason}`);
+    }
+    return null;
+  }
+}
+
+// List the ids that have a stored output, using a single directory
+// read — no file bodies are opened. The Jobs table only needs a
+// has_output boolean per row, which the caller can derive from this
+// list. Each id is the file name with its ".json" suffix removed.
+// Resolves to [] when the directory is missing, and also (after
+// logging a warning) on any other read failure.
+export async function listJobOutputIds() {
+  let names;
+  try {
+    names = await fs.readdir(outputDir);
+  } catch (err) {
+    if (err.code !== "ENOENT") {
+      console.warn(
+        `[output-store] list failed: ${err?.message || err}`
+      );
+    }
+    return [];
+  }
+  const suffix = ".json";
+  const ids = [];
+  for (const name of names) {
+    if (name.endsWith(suffix)) ids.push(name.slice(0, -suffix.length));
+  }
+  return ids;
+}
+
+// Remove one job's stored output. Resolves true once the file has
+// been unlinked and false when it did not exist; any other failure
+// (including an invalid id) is rethrown to the caller.
+export async function deleteJobOutput(jobId) {
+  try {
+    await fs.unlink(pathFor(jobId));
+  } catch (err) {
+    if (err.code === "ENOENT") {
+      return false;
+    }
+    throw err;
+  }
+  return true;
+}
+
+// Bulk delete. Accepts either an array of job_ids or { all: true }
+// (which wins when both are given). Calling with no argument is
+// treated like an empty request.
+//
+// Returns { deleted, missing } for caller reporting:
+//   deleted — files actually removed;
+//   missing — (jobIds mode only) ids that were not removed, whether
+//             the file was absent or the delete failed. Failed deletes
+//             stay in this bucket to keep the return shape stable, but
+//             they are now logged instead of being swallowed silently.
+export async function bulkDeleteOutputs({ jobIds, all } = {}) {
+  // Best-effort single delete: never rejects, logs real failures.
+  const tryDelete = async (id) => {
+    try {
+      return await deleteJobOutput(id);
+    } catch (err) {
+      console.warn(
+        `[output-store] delete failed for ${id}: ${err?.message || err}`
+      );
+      return false;
+    }
+  };
+
+  let deleted = 0;
+  let missing = 0;
+  if (all) {
+    const ids = await listJobOutputIds();
+    for (const id of ids) {
+      if (await tryDelete(id)) deleted++;
+    }
+    return { deleted, missing };
+  }
+  if (!Array.isArray(jobIds)) return { deleted: 0, missing: 0 };
+  for (const id of jobIds) {
+    if (await tryDelete(id)) deleted++;
+    else missing++;
+  }
+  return { deleted, missing };
+}
+
+// Aggregate stats for the dashboard "Stored outputs" mini-panel.
+// Resolves to { count, total_bytes }: count is the number of *.json
+// files in the output directory and total_bytes the sum of their
+// sizes. A file whose stat fails still counts but adds no bytes.
+// A missing directory yields zeros; any other directory-read failure
+// yields zeros plus an `error` message.
+export async function getStoredOutputsSummary() {
+  let names;
+  try {
+    names = await fs.readdir(outputDir);
+  } catch (err) {
+    if (err.code === "ENOENT") return { count: 0, total_bytes: 0 };
+    return { count: 0, total_bytes: 0, error: err?.message };
+  }
+
+  const jsonNames = names.filter((name) => name.endsWith(".json"));
+  let bytes = 0;
+  for (const name of jsonNames) {
+    // Deliberately best-effort: a file can vanish between the
+    // directory read and the stat.
+    const info = await fs.stat(path.join(outputDir, name)).catch(() => null);
+    if (info) bytes += info.size;
+  }
+  return { count: jsonNames.length, total_bytes: bytes };
+}
diff --git a/server/post-cluster-polish.js b/server/post-cluster-polish.js
new file mode 100644
index 0000000..40329d3
--- /dev/null
+++ b/server/post-cluster-polish.js
@@ -0,0 +1,655 @@
+// Post-cluster polish pass: after transcribe + diarize + clustering
+// have produced a speaker-labeled transcript, AND after pipelined
+// analyze has produced section objects (titles + summaries), run a
+// two-stage LLM pass that:
+//
+//   Stage 1 — Global name inference. One LLM call with the
+//     speaker-labeled transcript + episode metadata (channel name,
+//     title, description) → JSON map { Speaker_A: "Matt Hill",
+//     Speaker_B: "Sarah Jones", Speaker_C: null }. The "_C: null"
+//     case is essential: when the LLM can't confidently identify a
+//     speaker, it must return null instead of guessing.
+//
+//   Stage 2 — Per-window summary polish. N parallel LLM calls, one
+//     per analyze window. Each call sees that window's sections
+//     (original summaries) + that window's transcript with speaker
+//     labels + the global name map from Stage 1, and rewrites each
+//     section's SUMMARY to attribute statements to specific
+//     speakers ("Matt Hill explains..." vs "the discussion
+//     centers..."). Section TITLES and start/end indices are kept
+//     unchanged — polish only touches summary text.
+//
+// Why two stages: name inference benefits from the FULL transcript
+// view (name introductions like "welcome Matt" tend to appear in
+// window 1 but Matt keeps speaking throughout); per-window polish
+// benefits from parallelism (matches the existing analyze pattern).
+// Running them as one batched call would either lose parallelism
+// or send the full transcript N times.
+//
+// Failure modes:
+//   - Stage 1 returns invalid JSON → all names default to null;
+//     Stage 2 still runs and produces "Speaker A explains..." etc.
+//   - Stage 2 fails for a particular window → keep the original
+//     analyze summary for that window's sections. Per-window
+//     failure shouldn't kill the whole polish.
+//   - Both stages fail → fall back to the unpolished analyzeResult.
+//     The caller sees the same output as a polish-disabled run.
+//
+// Cost: Stage 1 ~5-10s; Stage 2 ~10-15s (parallel); total ~15-25s
+// added to end of pipeline. On a 200s pipelined pipeline that's a
+// ~10% slowdown for the speaker-attribution UX win.
+
+import { recordCall } from "./audit-log.js";
+
+// Attempt caps for the two polish stages (Stage 1 = global name
+// inference, Stage 2 = per-window summary polish).
+// NOTE(review): the retry loops that read these sit outside this
+// view — confirm how a failed attempt is counted there.
+const STAGE_1_MAX_ATTEMPTS = 3;
+const STAGE_2_MAX_ATTEMPTS = 3;
+
+// ─── Default prompts (operator-editable via Settings tab) ───────────
+//
+// Same three-layer override pattern as the analyze + transcribe
+// prompts: per-session operator override → operator-promoted default
+// → these hardcoded defaults. Both are validated on save —
+// `DEFAULT_NAME_INFERENCE_PROMPT_TEMPLATE` must contain {{transcript}}
+// and JSON output instructions; `DEFAULT_SUMMARY_POLISH_PROMPT_TEMPLATE`
+// must contain {{sections}} and JSON output instructions. Template
+// variables (interpolated at request time):
+//
+// Name inference prompt:
+//   {{channel}}        — operator-supplied or yt-dlp-extracted channel name
+//   {{title}}          — episode/video title
+//   {{description}}    — episode description (capped at 800 chars)
+//   {{speakerStats}}   — pre-formatted block listing each speaker's
+//                        chip letter, total speaking time, turn count
+//   {{transcript}}     — speaker-labeled bracketed transcript, capped
+//                        at 25k chars (middle truncated when over)
+//   {{speakerKeys}}    — JSON-schema-friendly key list for the
+//                        response shape (one line per Speaker_X)
+//
+// Summary polish prompt:
+//   {{speakerRoster}}  — pre-formatted block listing each speaker
+//                        with their inferred name (or "(unknown)")
+//                        and stats
+//   {{transcript}}     — this window's slice of the labeled transcript
+//   {{sections}}       — pre-formatted block listing each section
+//                        with title + original summary + time range
+//
+// Hardcoded default for the Stage 1 (name inference) prompt.
+// Besides the variables listed above, the template also carries an
+// {{operatorContext}} slot. It sits directly in front of the
+// "SPEAKER STATISTICS" heading with no newline of its own, so the
+// value substituted there has to end with its own blank line (or be
+// empty). NOTE(review): presumably this is the OPERATOR HINTS block
+// that instructions 1 and 6 refer to — confirm where it is composed.
+export const DEFAULT_NAME_INFERENCE_PROMPT_TEMPLATE = `You are identifying real-world speaker names in an interview/podcast/meeting transcript. The transcript below has been pre-tagged with speaker labels like [A], [B], [C] — these are anonymous labels assigned by voice clustering. Your job: infer the real names of each speaker from contextual clues in the transcript.
+
+EPISODE METADATA:
+- Channel/show: {{channel}}
+- Episode title: {{title}}
+- Description: {{description}}
+
+{{operatorContext}}SPEAKER STATISTICS (cluster output):
+{{speakerStats}}
+
+TRANSCRIPT (each line is "[<letter> <MM:SS>] text"):
+{{transcript}}
+
+INSTRUCTIONS:
+1. For each Speaker_X in the speaker statistics, infer the real name from contextual clues:
+   - Direct introductions ("welcome Matt", "I'm joined by Sarah")
+   - Self-introductions ("my name is", "I'm Sarah, founder of...")
+   - References between speakers ("what do you think Matt?", "as Sarah was saying")
+   - Channel name or episode title hints
+   - Operator hints in the OPERATOR HINTS section above, IF PRESENT — but see rule 6 for how to weight those.
+2. Use the speaker statistics to help — the host typically speaks more turns; guests speak less.
+3. Use first + last name if confidently identifiable. Use first name only if that's all you have.
+4. RETURN null IF YOU CANNOT CONFIDENTLY IDENTIFY THE SPEAKER. Do not guess. A null is better than a wrong name.
+5. For brief speakers (under 30s of speaking time, e.g. an intro music VO or a passing comment) it's expected that you'll often return null.
+6. WEIGHTING OPERATOR HINTS: When an OPERATOR HINTS section appears above, treat it as informed suggestion, NOT authoritative truth. The operator may have listed people who turned out not to speak, omitted people who did, or guessed wrong on who matches which voice. ALWAYS verify hints against the transcript. Specifically:
+   - A name in the hints is only a candidate; if the transcript provides no signal that THIS Speaker_X is that person, return null instead of guessing.
+   - If the transcript clearly identifies a speaker as someone NOT in the hints, use the transcript's name.
+   - If the hints describe what each named person did ("Steve gave the update, John asked questions"), use that as a soft signal for mapping names to chip letters, but still verify with the transcript before committing.
+   - It is better to leave a speaker as null than to confidently map a hint to the wrong chip letter.
+
+Respond with ONLY valid JSON in this exact format, no other text:
+{
+  "speakers": {
+{{speakerKeys}}
+  }
+}`;
+
+// Hardcoded default for the Stage 2 (per-window summary polish)
+// prompt. Placeholders: {{speakerRoster}}, {{transcript}},
+// {{sections}}. The model is asked to reply with
+// { "sections": [{ "index", "summary" }] } — summaries only, with
+// titles and indices left as given.
+export const DEFAULT_SUMMARY_POLISH_PROMPT_TEMPLATE = `You wrote section summaries for a podcast/interview transcript window. We've now identified the speakers via voice clustering and (where possible) inferred their real names. Your job: rewrite each section's SUMMARY to attribute statements to specific speakers where it improves clarity, naturalness, and information density.
+
+SPEAKERS (from voice clustering across the full episode):
+{{speakerRoster}}
+
+WINDOW TRANSCRIPT (this window's slice; each line is labeled with the speaker's name, or a chip letter when their name is unknown):
+{{transcript}}
+
+ORIGINAL SECTIONS IN THIS WINDOW (re-write the summary of each):
+{{sections}}
+
+INSTRUCTIONS:
+1. The SPEAKERS roster and the WINDOW TRANSCRIPT are the AUTHORITATIVE source of who said what. The ORIGINAL summaries were written in an earlier pass and may attribute statements to OUTDATED or WRONG speaker names — your job includes CORRECTING those.
+2. Rewrite each section's SUMMARY so every speaker attribution matches the transcript + roster. If an original summary credits a statement to a person who, per the transcript, was actually said by someone else, REPLACE the name with the correct one. Never keep a name that does not appear in the roster.
+3. Use real names when available ("Matt Hill explains..."); fall back to a chip letter only for a speaker who has no name ("Speaker A explains...").
+4. Keep summaries 1-3 sentences — same length range as the original.
+5. KEEP THE TITLE EXACTLY AS GIVEN. Do not rewrite titles.
+6. Return the sections in the SAME ORDER as given, with the SAME INDEX numbers in the array.
+7. If a section is primarily one speaker, lean into their name ("Matt explains..."). If it is back-and-forth, name both ("Matt and Sarah debate...").
+8. If the transcript for a section genuinely has no speaker signal, keep the original summary's wording — but still fix or drop any name in it that conflicts with the roster. DO NOT invent attribution that the transcript does not support.
+
+Respond with ONLY valid JSON in this exact format:
+{
+  "sections": [
+    { "index": 0, "summary": "Polished summary text..." },
+    { "index": 1, "summary": "..." }
+  ]
+}
+
+Return only the sections in this window. Use the same indices as the input ([0], [1], ...). Only the summary field — title and indices stay as given.`;
+
+// Substitute {{key}} placeholders in a template (whitespace inside
+// the braces is allowed). Unknown keys are left as the literal
+// {{key}} so an operator's edit that drops a variable doesn't crash
+// the run — the model just sees the placeholder.
+//
+// Only OWN properties of `vars` count as known keys: an `in` check
+// would also match inherited names, so a template containing
+// {{toString}} or {{constructor}} would be filled with native
+// function source. A missing or non-object `vars` is treated as {}.
+// Values are stringified with String(); a null/undefined template
+// yields "".
+function fillTemplate(template, vars) {
+  const values = vars && typeof vars === "object" ? vars : {};
+  return String(template || "").replace(/\{\{\s*(\w+)\s*\}\}/g, (_match, key) => {
+    return Object.prototype.hasOwnProperty.call(values, key)
+      ? String(values[key])
+      : `{{${key}}}`;
+  });
+}
+
+// Build a transcript representation with speaker labels prefixed.
+// Each line: `[A 0:08] So Matt, tell us how you got started…`
+//   - The bracketed prefix is `[<label> <MM:SS>]`
+//   - <label> is the speaker chip letter (Speaker_A → A) by default;
+//     when the segment has no speaker (gap, unmatched), uses "?" — the
+//     model is instructed to ignore those lines for name inference.
+//   - When opts.speakerNames is provided (the SUMMARY-POLISH pass), a
+//     named speaker is labeled with their RESOLVED name instead of the
+//     letter (`[Matt 0:08] …`). This matters for the re-polish flow: the
+//     operator's corrected names land directly on every transcript line,
+//     so the polish model attributes to the right person without having
+//     to resolve chip letters through the roster — and without trusting
+//     any stale names already baked into the original summaries. The
+//     name-INFERENCE pass deliberately omits speakerNames (it's inferring
+//     them) so it still sees plain chip letters.
+//
+// opts:
+//   startSec / endSec — keep only segments with startSec <= start < endSec
+//                       (defaults: no lower / upper bound)
+//   speakerNames      — map Speaker_X → display name
+//
+// Returns the lines joined with "\n" ("" for a non-array or empty
+// input). Segments with blank text, and null holes in the list, are
+// skipped. Square brackets are stripped from a name so it cannot break
+// the `[label time]` prefix; the result is trimmed AFTER stripping, and
+// a name with nothing left falls back to the chip letter instead of
+// producing an empty label.
+export function formatSpeakerLabeledTranscript(segments, opts = {}) {
+  if (!Array.isArray(segments) || segments.length === 0) return "";
+  const options = opts && typeof opts === "object" ? opts : {};
+  const startSec = options.startSec != null ? options.startSec : -Infinity;
+  const endSec = options.endSec != null ? options.endSec : Infinity;
+  const speakerNames =
+    options.speakerNames && typeof options.speakerNames === "object"
+      ? options.speakerNames
+      : null;
+  const lines = [];
+  for (const s of segments) {
+    if (!s) continue;
+    const t = s.start || 0;
+    if (t < startSec || t >= endSec) continue;
+    const text = (s.text || "").trim();
+    if (!text) continue;
+    let label = "?";
+    const m = String(s.speaker || "").match(/^Speaker_([A-Z]+)$/);
+    if (m) {
+      label = m[1];
+      // Prefer the operator-corrected name when we have a usable one.
+      if (speakerNames) {
+        const nm = speakerNames[s.speaker];
+        if (typeof nm === "string") {
+          const cleaned = nm.replace(/[\[\]]/g, "").trim();
+          if (cleaned) label = cleaned;
+        }
+      }
+    }
+    const sec = Math.floor(t);
+    const mm = Math.floor(sec / 60);
+    const ss = sec % 60;
+    lines.push(`[${label} ${mm}:${String(ss).padStart(2, "0")}] ${text}`);
+  }
+  return lines.join("\n");
+}
+
+// ─── Stage 1: global speaker name inference ─────────────────────────
+//
+// Returns: { Speaker_A: "Matt Hill" | null, Speaker_B: ..., ... }
+// On total failure returns an object with all values null so Stage 2
+// can still run and produce generic speaker-attributed summaries
+// ("Speaker A explains...").
+export async function runNameInference({
+  speakers, // map from clusterSpeakers (Speaker_A → stats)
+  transcriptSegments, // array of { start, end, text, speaker } with speakers attached
+  channelHint = "",
+  titleHint = "",
+  descriptionHint = "",
+  // Operator-editable prompt override (Settings → LLM prompts).
+  // Three-layer resolution at the caller: per-session override →
+  // operator-promoted default → DEFAULT_NAME_INFERENCE_PROMPT_TEMPLATE.
+  // Empty string means "use the hardcoded default" inside this fn.
+  promptOverride = "",
+  // Free-form operator context — internal meetings path uses this to
+  // pass participant hints + notes that the LLM should treat as
+  // suggestions, not authoritative truth. Empty string → no
+  // OPERATOR HINTS block appears in the rendered prompt. The block
+  // is composed here (not by the caller) so the warning language
+  // stays consistent across pipelines.
+  participantHints = "",
+  operatorNotes = "",
+  backend,
+  // audit params
+  pipelineBackend,
+  jobId,
+  batchId,
+  mediaUrl,
+  installId,
+  licenseFingerprint = null,
+  source,
+  computeCostDetails,
+}) {
+  const speakerLetters = Object.keys(speakers || {})
+    .filter((k) => /^Speaker_[A-Z]+$/.test(k))
+    .sort();
+  // Build the null-default map up front so any early-return path
+  // still returns the right shape.
+  const nullMap = Object.fromEntries(speakerLetters.map((k) => [k, null]));
+  if (speakerLetters.length === 0) return nullMap;
+
+  // For name inference we send the WHOLE labeled transcript (no
+  // time window). Cap at ~25k chars to stay well inside Qwen3.6's
+  // context window — for very long content we'd truncate the
+  // middle; in practice 25k chars ≈ 200 minutes of transcript so
+  // this only bites on very long podcasts.
+  const fullLabeledTranscript = formatSpeakerLabeledTranscript(transcriptSegments);
+  const cappedTranscript =
+    fullLabeledTranscript.length > 25000
+      ? fullLabeledTranscript.slice(0, 12500) + "\n\n…[middle truncated for prompt length]…\n\n" + fullLabeledTranscript.slice(-12500)
+      : fullLabeledTranscript;
+
+  // Speaker stats block — gives the model a sense of who speaks
+  // how much, which helps it map names confidently.
+  const speakerStatsBlock = speakerLetters
+    .map((k) => {
+      const stats = speakers[k] || {};
+      const secs = Math.round(stats.total_speaking_seconds || 0);
+      const mins = Math.floor(secs / 60);
+      const rem = secs % 60;
+      const timeStr = mins > 0 ? `${mins}m ${rem}s` : `${rem}s`;
+      const letter = k.replace("Speaker_", "");
+      return `- ${k} (chip "${letter}"): ${timeStr} of speaking time, ${stats.turns || 0} turns`;
+    })
+    .join("\n");
+
+  const speakerKeysBlock = speakerLetters
+    .map((k, i) => `    "${k}": "Real Name or null"${i < speakerLetters.length - 1 ? "," : ""}`)
+    .join("\n");
+
+  // Compose the OPERATOR HINTS block. Renders only when at least one
+  // of participantHints / operatorNotes is non-empty. The wrapping
+  // heading + warning language lives here (not in the template) so
+  // operator-edited prompt overrides can't accidentally drop the
+  // "treat as suggestions" framing — the LLM always sees it when
+  // the block is present.
+  const hintsParts = [];
+  if (participantHints && String(participantHints).trim()) {
+    hintsParts.push(
+      `Possible participants in this conversation (operator-supplied — may be incomplete or include people who don't actually speak):\n${String(participantHints).trim()}`,
+    );
+  }
+  if (operatorNotes && String(operatorNotes).trim()) {
+    // Cap notes at 4000 chars to leave room for the transcript in
+    // the prompt window. Mid-truncate is fine — notes are usually
+    // short.
+    const trimmed = String(operatorNotes).trim().slice(0, 4000);
+    hintsParts.push(
+      `Operator notes on the conversation (may describe what each named participant did — use as a soft signal for mapping names to chip letters):\n${trimmed}`,
+    );
+  }
+  const operatorContextBlock = hintsParts.length
+    ? `OPERATOR HINTS (treat as suggestions only — verify against the transcript before assigning names):\n\n${hintsParts.join("\n\n")}\n\n`
+    : "";
+
+  const templateSource =
+    typeof promptOverride === "string" && promptOverride.trim()
+      ? promptOverride
+      : DEFAULT_NAME_INFERENCE_PROMPT_TEMPLATE;
+  const prompt = fillTemplate(templateSource, {
+    channel: channelHint || "(unknown)",
+    title: titleHint || "(unknown)",
+    description: (descriptionHint || "").slice(0, 800) || "(none)",
+    operatorContext: operatorContextBlock,
+    speakerStats: speakerStatsBlock,
+    transcript: cappedTranscript,
+    speakerKeys: speakerKeysBlock,
+  });
+
+  const t0 = Date.now();
+  let lastErr = null;
+  let r = null;
+  let parsed = null;
+  for (let attempt = 0; attempt < STAGE_1_MAX_ATTEMPTS; attempt++) {
+    try {
+      r = await backend.analyzeText({ prompt });
+      parsed = safeParseSpeakers(r.text, speakerLetters);
+      if (parsed) {
+        lastErr = null;
+        break;
+      }
+      lastErr = "invalid JSON in name-inference response";
+    } catch (err) {
+      lastErr = (err?.message || String(err)).slice(0, 280);
+      r = null;
+    }
+    if (attempt < STAGE_1_MAX_ATTEMPTS - 1) {
+      console.warn(
+        `[polish/names] attempt ${attempt + 1} failed (${lastErr}) — retrying`
+      );
+    }
+  }
+  const dur = Date.now() - t0;
+  const cost = parsed && r ? computeCostDetails(r.model, r.usage) : { input_tokens: 0, output_tokens: 0, thinking_tokens: 0, cost_usd: 0 };
+  await recordCall({
+    install_id: installId,
+    license_fingerprint: licenseFingerprint,
+    tier: "core",
+    pipeline: "polish_names",
+    backend: pipelineBackend,
+    model: r?.model || null,
+    status: parsed ? "success" : "error",
+    duration_ms: dur,
+    audio_seconds: 0,
+    job_id: jobId,
+    batch_id: batchId,
+    source,
+    media_url: mediaUrl,
+    error: parsed ? null : (lastErr || "name inference failed"),
+    ...cost,
+  });
+  if (!parsed) {
+    console.warn(
+      `[polish/names] all ${STAGE_1_MAX_ATTEMPTS} attempts failed (${lastErr}) — falling back to null names`
+    );
+    return nullMap;
+  }
+  const filled = { ...nullMap };
+  for (const k of speakerLetters) {
+    const v = parsed[k];
+    if (typeof v === "string" && v.trim() && v.trim().toLowerCase() !== "null") {
+      filled[k] = v.trim();
+    }
+  }
+  const namedCount = Object.values(filled).filter((v) => v).length;
+  console.log(
+    `[polish/names] inferred ${namedCount}/${speakerLetters.length} speakers in ${(dur / 1000).toFixed(1)}s`
+  );
+  return filled;
+}
+
+function safeParseSpeakers(text, expectedKeys) {
+  if (!text || typeof text !== "string") return null;
+  // Strip optional code fence wrapping.
+  let s = text.trim();
+  const fence = s.match(/```(?:json)?\s*([\s\S]*?)```/);
+  if (fence) s = fence[1].trim();
+  let parsed;
+  try {
+    parsed = JSON.parse(s);
+  } catch {
+    return null;
+  }
+  const speakers = parsed?.speakers;
+  if (!speakers || typeof speakers !== "object") return null;
+  // Require all expected keys present (null values OK)
+  for (const k of expectedKeys) {
+    if (!(k in speakers)) return null;
+  }
+  return speakers;
+}
+
+// ─── Stage 2: per-window summary polish ─────────────────────────────
+//
+// `sections` is the FULL stitched section list with global entry
+// indices (output of stitchAnalysisResults). We need per-window
+// groupings to fire N parallel LLM calls — each call sees only the
+// sections within its window's time range so the prompt stays
+// bounded.
+//
+// `windows` is the planned-windows array (each w.bodyStartSec /
+// w.bodyEndSec) — used to assign sections to windows and to slice
+// the transcript for the prompt.
+//
+// `canonicalEntries` is the parsed transcript (the same array
+// stitcher uses for indexing). We need it to convert section
+// startIndex/endIndex into time ranges for grouping.
+//
+// Returns: the section list with polished summaries applied to shallow
+// copies (the caller's array/objects are not mutated). Sections whose
+// polish failed keep their summary. Indices and titles NEVER change.
+export async function runSummaryPolish({
+  sections,
+  canonicalEntries,
+  windows,
+  transcriptSegments,
+  speakerNames,
+  speakerStats,
+  // Operator-editable polish prompt override. Same three-layer
+  // resolution at caller as the name-inference override.
+  promptOverride = "",
+  backend,
+  concurrency,
+  // audit params
+  pipelineBackend,
+  jobId,
+  batchId,
+  mediaUrl,
+  installId,
+  licenseFingerprint = null,
+  source,
+  computeCostDetails,
+}) {
+  if (!Array.isArray(sections) || sections.length === 0) return sections;
+  if (!Array.isArray(windows) || windows.length === 0) return sections;
+  if (!Array.isArray(canonicalEntries) || canonicalEntries.length === 0) return sections;
+
+  // Group sections by window — assign each section to the window
+  // whose body contains its start time. Sections whose start time
+  // falls before any window's body (shouldn't happen in practice)
+  // get assigned to window 0.
+  const sectionsByWindow = windows.map(() => []);
+  for (const sec of sections) {
+    const startEntry = canonicalEntries[sec.startIndex];
+    if (!startEntry) continue;
+    const startSec = startEntry.offset || 0;
+    let assigned = -1;
+    for (let i = 0; i < windows.length; i++) {
+      const w = windows[i];
+      const nextW = windows[i + 1];
+      const upper = nextW ? nextW.bodyStartSec : Infinity;
+      if (startSec >= (w.bodyStartSec || 0) && startSec < upper) {
+        assigned = i;
+        break;
+      }
+    }
+    if (assigned < 0) assigned = 0;
+    sectionsByWindow[assigned].push(sec);
+  }
+
+  // Build a speaker-roster block reused across all window prompts.
+  const speakerRoster = Object.entries(speakerNames || {})
+    .filter(([k]) => /^Speaker_[A-Z]+$/.test(k))
+    .sort()
+    .map(([k, name]) => {
+      const letter = k.replace("Speaker_", "");
+      const stats = speakerStats?.[k] || {};
+      const secs = Math.round(stats.total_speaking_seconds || 0);
+      const mins = Math.floor(secs / 60);
+      const rem = secs % 60;
+      const timeStr = mins > 0 ? `${mins}m ${rem}s` : `${rem}s`;
+      const nameLabel = name ? `"${name}"` : "(unknown name)";
+      return `- ${k} (chip [${letter}], ${timeStr} speaking, ${stats.turns || 0} turns): ${nameLabel}`;
+    })
+    .join("\n");
+
+  // Per-window worker — runs one LLM call to polish all sections
+  // assigned to that window. Returns a Map<sectionIndex,
+  // newSummary> covering only the sections it successfully rewrote.
+  const worker = async (windowIdx) => {
+    const w = windows[windowIdx];
+    const winSections = sectionsByWindow[windowIdx];
+    if (winSections.length === 0) return new Map();
+
+    const winStartSec = w.startSec || 0;
+    const winEndSec = w.windowEndSec || (w.bodyEndSec || 0);
+    const windowTranscript = formatSpeakerLabeledTranscript(transcriptSegments, {
+      startSec: winStartSec,
+      endSec: winEndSec,
+      // Label lines with the corrected names so attributions in the
+      // rewritten summaries follow the operator's roster, not whatever
+      // (possibly stale) names the original summaries were written with.
+      speakerNames,
+    });
+
+    // Format each section for the prompt. We carry the section's
+    // ORIGINAL position in `sections` via `__origIdx` so the worker
+    // can map polished summaries back to the right slot.
+    const sectionsBlock = winSections
+      .map((sec, i) => {
+        const startEntry = canonicalEntries[sec.startIndex];
+        const endEntry = canonicalEntries[sec.endIndex];
+        const tStart = startEntry ? (startEntry.offset || 0) : 0;
+        const tEnd = endEntry ? (endEntry.offset || 0) : 0;
+        const tStartStr = fmtMmSs(tStart);
+        const tEndStr = fmtMmSs(tEnd);
+        return `[${i}] Title: "${sec.title}" (${tStartStr}-${tEndStr})\n    Original summary: ${sec.summary}`;
+      })
+      .join("\n\n");
+
+    const templateSource =
+      typeof promptOverride === "string" && promptOverride.trim()
+        ? promptOverride
+        : DEFAULT_SUMMARY_POLISH_PROMPT_TEMPLATE;
+    const prompt = fillTemplate(templateSource, {
+      speakerRoster: speakerRoster || "(no speakers identified)",
+      transcript: windowTranscript || "(empty)",
+      sections: sectionsBlock,
+    });
+
+    const t0 = Date.now();
+    let r = null;
+    let parsed = null;
+    let lastErr = null;
+    for (let attempt = 0; attempt < STAGE_2_MAX_ATTEMPTS; attempt++) {
+      try {
+        r = await backend.analyzeText({ prompt });
+        parsed = safeParsePolishedSections(r.text, winSections.length);
+        if (parsed) {
+          lastErr = null;
+          break;
+        }
+        lastErr = "invalid JSON in polish response";
+      } catch (err) {
+        lastErr = (err?.message || String(err)).slice(0, 280);
+        r = null;
+      }
+      if (attempt < STAGE_2_MAX_ATTEMPTS - 1) {
+        console.warn(
+          `[polish/window ${windowIdx + 1}/${windows.length}] attempt ${attempt + 1} failed (${lastErr}) — retrying`
+        );
+      }
+    }
+    const dur = Date.now() - t0;
+    const cost = parsed && r ? computeCostDetails(r.model, r.usage) : { input_tokens: 0, output_tokens: 0, thinking_tokens: 0, cost_usd: 0 };
+    await recordCall({
+      install_id: installId,
+      license_fingerprint: licenseFingerprint,
+      tier: "core",
+      pipeline: "polish_summaries",
+      backend: pipelineBackend,
+      model: r?.model || null,
+      status: parsed ? "success" : "error",
+      duration_ms: dur,
+      audio_seconds: 0,
+      job_id: jobId,
+      batch_id: batchId,
+      source,
+      media_url: mediaUrl,
+      error: parsed ? null : (lastErr || "polish failed"),
+      window_idx: windowIdx,
+      window_count: windows.length,
+      ...cost,
+    });
+    if (!parsed) {
+      console.warn(
+        `[polish/window ${windowIdx + 1}/${windows.length}] all attempts failed (${lastErr}) — keeping original summaries`
+      );
+      return new Map();
+    }
+    // Map polish output back to the original sections by their
+    // win-local index. Build a Map<orig-section-position-in-array,
+    // newSummary>.
+    const out = new Map();
+    for (const p of parsed) {
+      const localIdx = p.index;
+      if (!Number.isInteger(localIdx) || localIdx < 0 || localIdx >= winSections.length) continue;
+      const newSummary = (p.summary || "").trim();
+      if (!newSummary) continue;
+      const sec = winSections[localIdx];
+      const origIdx = sections.indexOf(sec);
+      if (origIdx >= 0) out.set(origIdx, newSummary);
+    }
+    console.log(
+      `[polish/window ${windowIdx + 1}/${windows.length}] polished ${out.size}/${winSections.length} sections in ${(dur / 1000).toFixed(1)}s`
+    );
+    return out;
+  };
+
+  // Concurrent worker pool (same shape as runPipelinedAnalysis).
+  let nextIdx = 0;
+  const updates = new Map();
+  async function poolWorker() {
+    while (true) {
+      const my = nextIdx++;
+      if (my >= windows.length) return;
+      const result = await worker(my);
+      for (const [k, v] of result) updates.set(k, v);
+    }
+  }
+  const pool = Array.from(
+    { length: Math.min(concurrency || 4, windows.length) },
+    poolWorker
+  );
+  await Promise.all(pool);
+
+  // Apply polished summaries onto a shallow copy of sections so the
+  // caller's reference doesn't mutate unexpectedly.
+  const polished = sections.map((sec, i) => {
+    const newSummary = updates.get(i);
+    return newSummary ? { ...sec, summary: newSummary } : sec;
+  });
+  console.log(
+    `[polish] applied ${updates.size}/${sections.length} polished summaries`
+  );
+  return polished;
+}
+
+function safeParsePolishedSections(text, maxIndex) {
+  if (!text || typeof text !== "string") return null;
+  let s = text.trim();
+  const fence = s.match(/```(?:json)?\s*([\s\S]*?)```/);
+  if (fence) s = fence[1].trim();
+  let parsed;
+  try {
+    parsed = JSON.parse(s);
+  } catch {
+    return null;
+  }
+  const arr = parsed?.sections;
+  if (!Array.isArray(arr)) return null;
+  // Validate each entry has {index: int, summary: string} and indices
+  // are in-range.
+  const valid = [];
+  for (const item of arr) {
+    if (!item || typeof item !== "object") continue;
+    if (!Number.isInteger(item.index)) continue;
+    if (item.index < 0 || item.index >= maxIndex) continue;
+    if (typeof item.summary !== "string" || !item.summary.trim()) continue;
+    valid.push(item);
+  }
+  return valid.length > 0 ? valid : null;
+}
+
+function fmtMmSs(seconds) {
+  const s = Math.max(0, Math.floor(seconds || 0));
+  const h = Math.floor(s / 3600);
+  const m = Math.floor((s % 3600) / 60);
+  const sec = s % 60;
+  const pad = (n) => n.toString().padStart(2, "0");
+  return h > 0 ? `${h}:${pad(m)}:${pad(sec)}` : `${m}:${pad(sec)}`;
+}
diff --git a/server/routes/internal-meetings.js b/server/routes/internal-meetings.js
new file mode 100644
index 0000000..8f84471
--- /dev/null
+++ b/server/routes/internal-meetings.js
@@ -0,0 +1,2225 @@
+// Internal team meeting processing — Path 2A Phase 1.
+//
+// Operator-only endpoint family. Accepts an uploaded audio file
+// (mp3 / m4a / wav / etc), runs the SAME hardware pipeline that
+// /relay/v1/summarize-url uses for YouTube/podcast content
+// (transcribe → diarize → cluster → analyze → post-cluster polish),
+// and saves the result to /data/internal-meetings/<id>.json.
+//
+// Differences from summarize-url:
+//   - No download step (caller already has the file)
+//   - No license / credit accounting (operator-owned compute)
+//   - No Recaps-app envelope (results live on the relay, not in a
+//     user library — Path 2B will migrate them into per-user
+//     libraries once multi-tenant Recaps lands)
+//   - Saved JSON is downloadable + markdown-renderable so the
+//     operator can feed transcripts to other tools without
+//     re-running the pipeline
+//
+// All routes mount under /admin/internal-meetings/* and inherit
+// the admin-session-cookie auth gate from the parent admin router.
+// No public exposure.
+
+import express from "express";
+import multer from "multer";
+import fs from "fs/promises";
+import path from "path";
+import os from "os";
+import { randomUUID } from "crypto";
+
+import { getConfigSnapshot } from "../config.js";
+import { resolveHardwareConfig } from "../hardware-config.js";
+import { createHardwareBackend } from "../backends/hardware.js";
+import {
+  runPipelinedAnalysis,
+  parseBracketedTranscript,
+  firstEntryAtOrAfter,
+  lastEntryBefore,
+  canonicalIndexForOffset,
+  stitchAnalysisResults,
+  planWindowsByDuration,
+} from "../chunked-analyze.js";
+import { createChunkBuffer } from "../chunk-buffer.js";
+import {
+  runNameInference,
+  runSummaryPolish,
+} from "../post-cluster-polish.js";
+import { runMeetingExtras } from "../meeting-extras.js";
+import {
+  backfillEntrySpeakers,
+  mergeSpeakersInRecord,
+  reclusterMeetingRecord,
+  applyPolishedSummaries,
+} from "../meeting-speaker-edits.js";
+import { acquireHardwareSlot } from "../hardware-queue.js";
+import { getAudioDurationSeconds } from "../audio-meta.js";
+import {
+  createJob,
+  appendEvent,
+  subscribeToJob,
+  getJob,
+  markRunning,
+  setProgress,
+  markComplete,
+  markFailed,
+} from "../jobs.js";
+
+// Upload size cap — generous enough for a 4-hour meeting at 192kbps
+// mp3 (~345MB) but rejects bigger uploads to avoid disk-fill DoS.
+const MAX_UPLOAD_BYTES = 500 * 1024 * 1024; // 500 MiB (524,288,000 bytes)
+
+// Storage dir for completed meetings: the "internal-meetings" folder under dataDir.
+function meetingsDir(dataDir) {
+  return path.join(dataDir, "internal-meetings");
+}
+
+async function ensureMeetingsDir(dataDir) {
+  await fs.mkdir(meetingsDir(dataDir), { recursive: true }).catch(() => {});
+}
+
+// ─── Storage layer ──────────────────────────────────────────────────
+
+async function saveMeeting(dataDir, id, record) {
+  await ensureMeetingsDir(dataDir);
+  const filePath = path.join(meetingsDir(dataDir), `${id}.json`);
+  await fs.writeFile(filePath, JSON.stringify(record, null, 2), {
+    mode: 0o600,
+  });
+}
+
+async function loadMeeting(dataDir, id) {
+  const filePath = path.join(meetingsDir(dataDir), `${id}.json`);
+  try {
+    const raw = await fs.readFile(filePath, "utf8");
+    const rec = JSON.parse(raw);
+    // Retroactive chunk-contiguity backfill must run BEFORE the
+    // speaker backfill, because contiguity adds entries that the
+    // speaker backfill then needs to label. Both are no-ops when
+    // the saved record was already produced by the post-v0.2.107
+    // pipeline (entries are contiguous + speaker fields populated).
+    backfillChunkContiguity(rec);
+    backfillEntrySpeakers(rec);
+    return rec;
+  } catch {
+    return null;
+  }
+}
+
+// Reslice each chunk's entries to fill gaps the LLM analyze pass
+// left between section boundaries. The original v0.2.103-v0.2.106
+// pipeline saved chunks with strict LLM startIndex/endIndex slices,
+// which dropped entries the model classified as "between topics"
+// (filler, brief transitions). On a 3-min meeting that meant
+// users saw topic 2 with one statement and 46-second timestamp
+// gaps between consecutive topics.
+//
+// Fix on read: re-derive canonical entries from rec.transcript,
+// match each saved chunk's first/last entry by (offset, text-prefix)
+// to find its canonical index range, then extend ranges to be
+// contiguous (chunk 0 → entry 0, chunk N's end → chunk N+1's start
+// minus 1, last chunk → end of transcript) and rewrite entries
+// from the extended slice. Section titles and summaries stay
+// untouched — only the entries[] gets refilled.
+function backfillChunkContiguity(rec) { // mutates rec.chunks[*].entries / startTime in place; returns nothing
+  if (!rec || !Array.isArray(rec.chunks) || rec.chunks.length === 0) return;
+  if (typeof rec.transcript !== "string" || !rec.transcript) return;
+
+  const allEntries = parseBracketedTranscript(rec.transcript);
+  if (allEntries.length === 0) return;
+
+  // Quick exit: treat the record as already contiguous when the chunks
+  // together hold at least as many entries as the canonical transcript.
+  // This is a count-only heuristic: it does not check that the saved
+  // entries match the canonical ones, nor that consecutive chunks abut
+  // without a gap.
+  const savedEntryCount = rec.chunks.reduce(
+    (n, c) => n + (Array.isArray(c.entries) ? c.entries.length : 0),
+    0
+  );
+  if (savedEntryCount >= allEntries.length) return;
+
+  const matchEntry = (saved) => { // → canonical index of a saved entry, or -1 when none matches
+    if (!saved) return -1;
+    const t = saved.offset || 0;
+    const txt = (saved.text || "").slice(0, 24); // 24-char text prefix disambiguates equal offsets
+    let fallback = -1; // first entry with the same offset but a different text prefix
+    for (let i = 0; i < allEntries.length; i++) {
+      const off = allEntries[i].offset || 0;
+      if (off !== t) {
+        if (off > t + 2) break; // early stop — presumably relies on entries being in ascending offset order
+        continue;
+      }
+      const a = (allEntries[i].text || "").slice(0, 24);
+      if (a === txt) return i;
+      if (fallback < 0) fallback = i;
+    }
+    return fallback;
+  };
+
+  const ranges = [];
+  for (const chunk of rec.chunks) {
+    const entries = Array.isArray(chunk.entries) ? chunk.entries : [];
+    if (entries.length === 0) continue; // chunks without entries are left untouched
+    const firstIdx = matchEntry(entries[0]);
+    const lastIdx = matchEntry(entries[entries.length - 1]);
+    if (firstIdx < 0 || lastIdx < 0 || lastIdx < firstIdx) continue; // unmatched chunks are left untouched
+    ranges.push({ chunk, firstIdx, lastIdx });
+  }
+  if (ranges.length === 0) return;
+  ranges.sort((a, b) => a.firstIdx - b.firstIdx);
+
+  // Extend ranges to cover every canonical entry: the first starts at 0, each ends no earlier than just before the next starts, the last runs to the end.
+  ranges[0].firstIdx = 0;
+  for (let i = 0; i + 1 < ranges.length; i++) {
+    ranges[i].lastIdx = Math.max(
+      ranges[i].lastIdx,
+      ranges[i + 1].firstIdx - 1
+    );
+  }
+  ranges[ranges.length - 1].lastIdx = allEntries.length - 1;
+
+  // Rewrite each chunk's entries from its extended slice. Speaker
+  // attribution (speaker / speaker_confidence / speaker_uncertain) is
+  // carried over from the chunk's previous entries, matched by
+  // offset + 16-char text prefix, whenever the prior entry had a speaker.
+  for (const r of ranges) {
+    const priorByKey = new Map();
+    for (const e of r.chunk.entries || []) {
+      const k = `${e.offset || 0}|${(e.text || "").slice(0, 16)}`;
+      priorByKey.set(k, e); // on a key collision the later entry wins
+    }
+    const slice = allEntries.slice(r.firstIdx, r.lastIdx + 1).map((e) => {
+      const k = `${e.offset || 0}|${(e.text || "").slice(0, 16)}`;
+      const prior = priorByKey.get(k);
+      if (prior && prior.speaker) {
+        return {
+          ...e,
+          speaker: prior.speaker,
+          speaker_confidence: prior.speaker_confidence ?? null,
+          speaker_uncertain: !!prior.speaker_uncertain,
+        };
+      }
+      return { ...e };
+    });
+    r.chunk.entries = slice;
+    r.chunk.startTime = slice[0]?.offset || 0; // keep startTime in step with the new first entry
+  }
+}
+
+async function listMeetings(dataDir) {
+  await ensureMeetingsDir(dataDir);
+  const dir = meetingsDir(dataDir);
+  let files = [];
+  try {
+    files = await fs.readdir(dir);
+  } catch {
+    return [];
+  }
+  const out = [];
+  for (const f of files) {
+    if (!f.endsWith(".json")) continue;
+    try {
+      const raw = await fs.readFile(path.join(dir, f), "utf8");
+      const rec = JSON.parse(raw);
+      out.push({
+        id: rec.id,
+        title: rec.title || "(untitled)",
+        created_at: rec.created_at,
+        audio_seconds: rec.audio_seconds || 0,
+        topic_count: Array.isArray(rec.chunks) ? rec.chunks.length : 0,
+        speaker_count: rec.speakers ? Object.keys(rec.speakers).length : 0,
+      });
+    } catch {
+      // skip malformed files
+    }
+  }
+  // Most-recent first
+  out.sort((a, b) => (b.created_at || 0) - (a.created_at || 0));
+  return out;
+}
+
+async function deleteMeeting(dataDir, id) {
+  const filePath = path.join(meetingsDir(dataDir), `${id}.json`);
+  try {
+    await fs.unlink(filePath);
+    return true;
+  } catch {
+    return false;
+  }
+}
+
+// ─── Markdown formatter ─────────────────────────────────────────────
+// Converts a saved meeting record into a human-readable markdown doc
+// suitable for downloading + feeding to other LLMs / sharing.
+
+function formatTimestamp(secs) {
+  const s = Math.max(0, Math.floor(secs || 0));
+  const h = Math.floor(s / 3600);
+  const m = Math.floor((s % 3600) / 60);
+  const sec = s % 60;
+  const pad = (n) => n.toString().padStart(2, "0");
+  return h > 0 ? `${h}:${pad(m)}:${pad(sec)}` : `${m}:${pad(sec)}`;
+}
+
+function speakerDisplayName(speakerId, speakerNames) {
+  if (!speakerId) return "Unknown";
+  if (speakerId === "Speaker_Unknown") return "Unknown";
+  const inferred = speakerNames && speakerNames[speakerId];
+  if (typeof inferred === "string" && inferred.trim()) return inferred.trim();
+  const m = String(speakerId).match(/^Speaker_([A-Z]+)$/);
+  return m ? `Speaker ${m[1]}` : speakerId;
+}
+
+export function meetingToMarkdown(rec) {
+  if (!rec) return "";
+  const lines = [];
+  lines.push(`# ${rec.title || "Untitled meeting"}`);
+  lines.push("");
+
+  const dateStr = rec.created_at
+    ? new Date(rec.created_at).toLocaleString("en-US", {
+        dateStyle: "long",
+        timeStyle: "short",
+      })
+    : "(unknown)";
+  lines.push(`**Processed:** ${dateStr}`);
+  if (rec.audio_seconds) {
+    lines.push(`**Duration:** ${formatTimestamp(rec.audio_seconds)}`);
+  }
+  if (Array.isArray(rec.participants) && rec.participants.length) {
+    lines.push(`**Participant hints:** ${rec.participants.join(", ")}`);
+  }
+
+  // Speaker roster
+  if (rec.speakers && Object.keys(rec.speakers).length) {
+    lines.push("");
+    lines.push("## Speakers");
+    lines.push("");
+    const entries = Object.entries(rec.speakers).sort((a, b) => {
+      if (a[0] === "Speaker_Unknown") return 1;
+      if (b[0] === "Speaker_Unknown") return -1;
+      return a[0].localeCompare(b[0]);
+    });
+    for (const [id, stats] of entries) {
+      const display = speakerDisplayName(id, rec.speaker_names);
+      const secs = Math.round(stats.total_speaking_seconds || 0);
+      const turns = stats.turns || 0;
+      lines.push(`- **${display}** — ${formatTimestamp(secs)} speaking, ${turns} turn${turns !== 1 ? "s" : ""}`);
+    }
+  }
+
+  // Phase 2 extras (decisions / action items / open questions /
+  // key quotes). Rendered ABOVE the topics so the reader sees the
+  // most actionable content first. Empty categories collapse;
+  // entire block hides when no extras exist.
+  if (rec.extras) {
+    const x = rec.extras;
+    const tldr = x.tldr && typeof x.tldr === "object" ? x.tldr : null;
+    const decs = Array.isArray(x.decisions) ? x.decisions : [];
+    const acts = Array.isArray(x.action_items) ? x.action_items : [];
+    const qs = Array.isArray(x.open_questions) ? x.open_questions : [];
+    const quotes = Array.isArray(x.key_quotes) ? x.key_quotes : [];
+    const speakerNamesMd = rec.speaker_names || {};
+    const renderSpeakerMd = (sid) =>
+      sid ? speakerDisplayName(sid, speakerNamesMd) : "";
+    if (tldr && typeof tldr.summary === "string" && tldr.summary.trim()) {
+      lines.push("");
+      lines.push("## TL;DR");
+      lines.push("");
+      lines.push(tldr.summary.trim());
+      if (Array.isArray(tldr.primary_speakers) && tldr.primary_speakers.length) {
+        const names = tldr.primary_speakers.map(renderSpeakerMd).filter(Boolean);
+        if (names.length) {
+          lines.push("");
+          lines.push(`_Primary speakers: ${names.join(", ")}_`);
+        }
+      }
+    }
+    if (decs.length) {
+      lines.push("");
+      lines.push("## Decisions");
+      lines.push("");
+      for (const d of decs) {
+        const ts = d.supporting_offset != null ? ` [${formatTimestamp(d.supporting_offset)}]` : "";
+        const agreed = (d.agreed_by || []).map(renderSpeakerMd).filter(Boolean);
+        const agreedStr = agreed.length ? ` — agreed by ${agreed.join(", ")}` : "";
+        lines.push(`- ${d.statement}${ts}${agreedStr}`);
+      }
+    }
+    if (acts.length) {
+      lines.push("");
+      lines.push("## Action items");
+      lines.push("");
+      for (const a of acts) {
+        const ts = a.supporting_offset != null ? ` [${formatTimestamp(a.supporting_offset)}]` : "";
+        const owner = a.owner ? ` — ${renderSpeakerMd(a.owner)}` : "";
+        const due = a.due_hint ? ` (due: ${a.due_hint})` : "";
+        lines.push(`- ${a.description}${ts}${owner}${due}`);
+      }
+    }
+    if (qs.length) {
+      lines.push("");
+      lines.push("## Open questions");
+      lines.push("");
+      for (const q of qs) {
+        const by = q.raised_by ? ` — raised by ${renderSpeakerMd(q.raised_by)}` : "";
+        lines.push(`- ${q.question}${by}`);
+      }
+    }
+    if (quotes.length) {
+      lines.push("");
+      lines.push("## Key quotes");
+      lines.push("");
+      for (const q of quotes) {
+        const ts = q.offset != null ? ` [${formatTimestamp(q.offset)}]` : "";
+        const sp = q.speaker ? ` — ${renderSpeakerMd(q.speaker)}` : "";
+        const why = q.why_notable ? ` _(${q.why_notable})_` : "";
+        lines.push(`- "${q.quote}"${ts}${sp}${why}`);
+      }
+    }
+  }
+
+  // Topics + per-topic transcript chunks
+  if (Array.isArray(rec.chunks) && rec.chunks.length) {
+    lines.push("");
+    lines.push("## Topics");
+    lines.push("");
+    rec.chunks.forEach((chunk, i) => {
+      const start = formatTimestamp(chunk.startTime || 0);
+      // Adjacent display: end = next chunk's start so consecutive
+      // topics appear contiguous; last chunk extends to full audio.
+      let endSec;
+      if (i + 1 < rec.chunks.length) {
+        endSec = rec.chunks[i + 1].startTime || 0;
+      } else if (rec.audio_seconds) {
+        endSec = rec.audio_seconds;
+      } else if (chunk.entries && chunk.entries.length > 0) {
+        endSec = chunk.entries[chunk.entries.length - 1].offset || 0;
+      } else {
+        endSec = chunk.startTime || 0;
+      }
+      const end = formatTimestamp(endSec);
+      lines.push(`### ${i + 1}. ${chunk.title || "(untitled topic)"} (${start} — ${end})`);
+      lines.push("");
+      lines.push(chunk.summary || "");
+      if (Array.isArray(chunk.entries) && chunk.entries.length) {
+        lines.push("");
+        lines.push("<details><summary>Transcript</summary>");
+        lines.push("");
+        for (const entry of chunk.entries) {
+          const t = formatTimestamp(entry.offset || 0);
+          // Operator override wins (same convention as the .html
+          // and dashboard renderers).
+          const effSpeaker = entry.speaker_override || entry.speaker;
+          const who = effSpeaker
+            ? speakerDisplayName(effSpeaker, rec.speaker_names)
+            : null;
+          if (who) {
+            lines.push(`- **[${t}] ${who}:** ${entry.text || ""}`);
+          } else {
+            lines.push(`- **[${t}]** ${entry.text || ""}`);
+          }
+        }
+        lines.push("");
+        lines.push("</details>");
+      }
+      lines.push("");
+    });
+  }
+
+  // Full unattributed transcript at the bottom — useful for grep'ing
+  // and as a clean LLM-input form. Always emitted so downloads are
+  // self-contained.
+  if (rec.transcript) {
+    lines.push("");
+    lines.push("## Full transcript (bracketed)");
+    lines.push("");
+    lines.push("```");
+    lines.push(rec.transcript);
+    lines.push("```");
+  }
+
+  return lines.join("\n");
+}
+
+// ─── HTML formatter ─────────────────────────────────────────────────
+// Produces a fully self-contained HTML page that renders the meeting
+// in the same Recaps-style layout as the dashboard's detail view —
+// title, summary stats, speaker legend, topic cards with native
+// <details>-driven expandable transcript lines, and the full bracketed
+// transcript at the bottom. Includes inlined CSS so it's shareable as
+// a single file (email attachment, drag-into-browser, link from a
+// shared drive, etc.) and a print-friendly fallback.
+//
+// Phase-2 extras (`rec.extras`: TL;DR / Decisions / Action Items /
+// Open Questions / Key Quotes) are rendered above the topics by
+// renderExtrasHtml; when there are none, that section is omitted.
+
+// Escapes a value for interpolation into HTML text or a quoted
+// attribute. null/undefined become ""; anything else is stringified
+// first. The five characters & < > " ' are replaced by entities.
+function htmlEsc(s) {
+  const raw = s == null ? "" : s;
+  // Single pass over the string, so an "&" introduced by one of the
+  // entities is never escaped a second time.
+  return String(raw).replace(/[&<>"']/g, (ch) => {
+    switch (ch) {
+      case "&":
+        return "&amp;";
+      case "<":
+        return "&lt;";
+      case ">":
+        return "&gt;";
+      case '"':
+        return "&quot;";
+      default:
+        return "&#39;";
+    }
+  });
+}
+
+// Chip colors ({ bg, fg, bd }) for a speaker id. Mirrors
+// dashboard.html's meetingsSpeakerChipColor so a speaker keeps the
+// same color across the dashboard, .md, and .html.
+//
+// "Speaker_Unknown" is always slate. Ids shaped like Speaker_<LETTERS>
+// are read as a spreadsheet-style column number (A=1 … Z=26, AA=27 …)
+// and cycled through the eight swatches; any other id is treated
+// like Speaker_A.
+function speakerChipColor(id) {
+  const slate = { bg: "rgba(100,116,139,0.18)", fg: "#cbd5e1", bd: "rgba(100,116,139,0.35)" };
+  if (id === "Speaker_Unknown") return slate;
+
+  const swatches = [
+    { bg: "rgba(239,68,68,0.18)",  fg: "#fca5a5", bd: "rgba(239,68,68,0.35)" },
+    { bg: "rgba(59,130,246,0.18)", fg: "#93c5fd", bd: "rgba(59,130,246,0.35)" },
+    { bg: "rgba(34,197,94,0.18)",  fg: "#86efac", bd: "rgba(34,197,94,0.35)" },
+    { bg: "rgba(245,158,11,0.18)", fg: "#fcd34d", bd: "rgba(245,158,11,0.35)" },
+    { bg: "rgba(168,85,247,0.18)", fg: "#d8b4fe", bd: "rgba(168,85,247,0.35)" },
+    { bg: "rgba(14,165,233,0.18)", fg: "#7dd3fc", bd: "rgba(14,165,233,0.35)" },
+    { bg: "rgba(236,72,153,0.18)", fg: "#f9a8d4", bd: "rgba(236,72,153,0.35)" },
+    slate,
+  ];
+
+  const parsed = /^Speaker_([A-Z]+)$/.exec(String(id || ""));
+  const letters = parsed ? parsed[1] : "A";
+  // charCode - 64 maps "A" → 1; the trailing -1 makes the index zero-based.
+  const ordinal = Array.from(letters).reduce(
+    (acc, ch) => acc * 26 + (ch.charCodeAt(0) - 64),
+    0
+  ) - 1;
+  return swatches[((ordinal % 8) + 8) % 8];
+}
+
+// Short text shown inside a speaker chip.
+//
+//   - "Speaker_Unknown"            → "?"
+//   - id has a non-blank name in   → upper-cased initials: one initial
+//     `speakerNames`                 for a single word, first + last
+//                                    word's initials otherwise
+//   - id shaped Speaker_<LETTERS>  → the letters ("A", "AB", …)
+//   - anything else                → "?"
+//
+// `speakerNames` may be null/undefined; non-string entries are ignored.
+function speakerChipLabel(id, speakerNames) {
+  if (id === "Speaker_Unknown") return "?";
+
+  const rawName = speakerNames ? speakerNames[id] : null;
+  const name = typeof rawName === "string" ? rawName.trim() : "";
+  if (name) {
+    // Take the initial by code point rather than UTF-16 unit, so a
+    // name starting with an astral character (emoji, mathematical
+    // letters, …) doesn't produce a lone surrogate in the chip.
+    const initialOf = (word) => String.fromCodePoint(word.codePointAt(0));
+    const words = name.split(/\s+/).filter(Boolean);
+    const first = initialOf(words[0]);
+    if (words.length === 1) return first.toUpperCase();
+    return (first + initialOf(words[words.length - 1])).toUpperCase();
+  }
+
+  const m = String(id).match(/^Speaker_([A-Z]+)$/);
+  return m ? m[1] : "?";
+}
+
+// Builds the colored chip <span> for one speaker attribution.
+// Returns "" when there is no speaker id. A trailing "?" is appended
+// to the label when the attribution is flagged `uncertain` or its
+// numeric `confidence` is below 0.5; the tooltip carries the full
+// display name (or a fixed explanation for Speaker_Unknown).
+function renderChipHtml(speakerId, confidence, uncertain, speakerNames) {
+  if (!speakerId) return "";
+
+  const tint = speakerChipColor(speakerId);
+  const shortLabel = speakerChipLabel(speakerId, speakerNames);
+  const lowConfidence = typeof confidence === "number" && confidence < 0.5;
+  const flagged = uncertain || lowConfidence;
+  const chipText = shortLabel + (flagged ? "?" : "");
+  const displayName = speakerDisplayName(speakerId, speakerNames);
+
+  let tooltip;
+  if (speakerId === "Speaker_Unknown") {
+    tooltip = "Unknown speaker (brief utterance, no anchor match)";
+  } else if (flagged) {
+    tooltip = displayName + " — best-guess attribution";
+  } else {
+    tooltip = displayName;
+  }
+
+  const style = `background:${tint.bg};color:${tint.fg};border-color:${tint.bd};`;
+  return `<span class="chip" style="${style}" title="${htmlEsc(tooltip)}">${htmlEsc(chipText)}</span>`;
+}
+
+// Renders the Phase 2 extras block for the self-contained .html
+// download. Mirrors the dashboard's renderMeetingExtras layout — an
+// always-visible TL;DR callout followed by four collapsible sections
+// (Decisions / Action items / Open questions / Key quotes), each item
+// with inline speaker chips + timestamp tags. Timestamps in the
+// downloaded file are NOT clickable (static HTML); they're shown as
+// styled tags for visual parity with the dashboard.
+//
+// Parameters:
+//   extras        the record's `extras` object (may be null/undefined)
+//   speakerNames  speaker id → display name map, passed through to the
+//                 chip/label helpers
+//
+// Returns the <section class="extras"> markup, or "" when nothing
+// would be rendered (so the page never carries an empty section).
+// Malformed data is tolerated rather than thrown on: lists that are
+// not arrays count as empty, non-object items are skipped, and falsy
+// speaker ids are dropped from chip lists.
+function renderExtrasHtml(extras, speakerNames) {
+  if (!extras) return "";
+  const tldr = extras.tldr && typeof extras.tldr === "object" ? extras.tldr : null;
+  // Keep only object items: a stray null in model output would
+  // otherwise throw on the first property read and sink the download.
+  const rows = (value) =>
+    Array.isArray(value) ? value.filter((item) => item && typeof item === "object") : [];
+  const decs = rows(extras.decisions);
+  const acts = rows(extras.action_items);
+  const qs = rows(extras.open_questions);
+  const quotes = rows(extras.key_quotes);
+
+  const sepHtml = '<span class="sep"> · </span>';
+
+  // Timestamp tag; "" for null or non-finite offsets.
+  const tsTag = (sec) => {
+    if (sec == null || !Number.isFinite(sec)) return "";
+    return `<span class="ts-tag">${htmlEsc(formatTimestamp(sec))}</span>`;
+  };
+  const inlineChip = (sid) => {
+    if (!sid) return "";
+    const c = speakerChipColor(sid);
+    const label = speakerChipLabel(sid, speakerNames);
+    const full = sid === "Speaker_Unknown" ? "Unknown" : speakerDisplayName(sid, speakerNames);
+    return (
+      `<span class="inline-chip">` +
+        `<span class="chip" style="background:${c.bg};color:${c.fg};border-color:${c.bd};">${htmlEsc(label)}</span>` +
+        `<span class="inline-name">${htmlEsc(full)}</span>` +
+      `</span>`
+    );
+  };
+  // Separator-joined chips for a list of speaker ids. Non-arrays are
+  // treated as empty and blank chips dropped so no separator dangles.
+  const chipList = (ids) =>
+    (Array.isArray(ids) ? ids : [])
+      .map((sid) => inlineChip(sid))
+      .filter(Boolean)
+      .join(sepHtml);
+
+  const section = (label, items, render, emoji) => {
+    if (!items.length) return "";
+    return (
+      `<details class="extras-section" open>` +
+        `<summary>` +
+          `<span class="extras-title">${emoji} ${htmlEsc(label)}</span>` +
+          `<span class="extras-count">· ${items.length}</span>` +
+        `</summary>` +
+        `<div class="extras-body">` + items.map((item) => render(item)).join("") + `</div>` +
+      `</details>`
+    );
+  };
+
+  const renderDecision = (d) => {
+    const agreed = chipList(d.agreed_by);
+    return (
+      `<div class="extras-item">` +
+        `<div class="extras-text">${htmlEsc(d.statement || "")}</div>` +
+        `<div class="extras-meta">` +
+          tsTag(d.supporting_offset) +
+          (agreed ? `<span class="meta-label">agreed by:</span>${agreed}` : "") +
+        `</div>` +
+      `</div>`
+    );
+  };
+  const renderAction = (a) => (
+    `<div class="extras-item">` +
+      `<div class="extras-text">${htmlEsc(a.description || "")}</div>` +
+      `<div class="extras-meta">` +
+        tsTag(a.supporting_offset) +
+        (a.owner ? `<span class="meta-label">owner:</span>${inlineChip(a.owner)}` : "") +
+        (a.due_hint ? `<span class="meta-due">due: ${htmlEsc(a.due_hint)}</span>` : "") +
+      `</div>` +
+    `</div>`
+  );
+  const renderQuestion = (q) => (
+    `<div class="extras-item">` +
+      `<div class="extras-text">${htmlEsc(q.question || "")}</div>` +
+      (q.raised_by ? `<div class="extras-meta"><span class="meta-label">raised by:</span>${inlineChip(q.raised_by)}</div>` : "") +
+    `</div>`
+  );
+  const renderQuote = (q) => (
+    `<div class="extras-item">` +
+      `<div class="extras-quote">"${htmlEsc(q.quote || "")}"</div>` +
+      `<div class="extras-meta">` +
+        tsTag(q.offset) +
+        (q.speaker ? inlineChip(q.speaker) : "") +
+        (q.why_notable ? `<span class="meta-due">— ${htmlEsc(q.why_notable)}</span>` : "") +
+      `</div>` +
+    `</div>`
+  );
+
+  // TLDR — highlighted callout above the four collapsibles. Always
+  // visible (not in a <details>) because it's meant as the first
+  // read. Only rendered when there is a non-blank summary string.
+  let tldrHtml = "";
+  if (tldr && typeof tldr.summary === "string" && tldr.summary.trim()) {
+    const primaryChips = chipList(tldr.primary_speakers);
+    const primaryHtml = primaryChips
+      ? `<div class="tldr-meta"><span>primary speakers:</span>` +
+        primaryChips +
+        `</div>`
+      : "";
+    tldrHtml = (
+      `<div class="tldr">` +
+        `<div class="tldr-label">TL;DR</div>` +
+        `<div class="tldr-summary">${htmlEsc(tldr.summary)}</div>` +
+        primaryHtml +
+      `</div>`
+    );
+  }
+
+  const body =
+    tldrHtml +
+    section("Decisions", decs, renderDecision, "✓") +
+    section("Action items", acts, renderAction, "→") +
+    section("Open questions", qs, renderQuestion, "?") +
+    section("Key quotes", quotes, renderQuote, "❝");
+  // Decide on the rendered output, not the raw inputs: a tldr object
+  // without a usable summary must not leave an empty wrapper behind.
+  return body ? `<section class="extras">${body}</section>` : "";
+}
+
+// Builds the self-contained .html download for a meeting record.
+//
+// `rec` is the stored meeting record; the fields read here are
+// title, speaker_names, speakers, created_at, chunks, audio_seconds,
+// transcript and extras. Returns a complete HTML document string with
+// inlined CSS and the .md / .json serializations embedded as base64
+// data URLs. A falsy `rec` yields a minimal "Meeting not found." page.
+export function meetingToHtml(rec) {
+  if (!rec) return "<!doctype html><html><body><p>Meeting not found.</p></body></html>";
+
+  const title = rec.title || "Untitled meeting";
+  const speakerNames = rec.speaker_names || {};
+  // Legend order: alphabetical by speaker id, Speaker_Unknown last.
+  const speakerEntries = rec.speakers
+    ? Object.entries(rec.speakers).sort((a, b) => {
+        if (a[0] === "Speaker_Unknown") return 1;
+        if (b[0] === "Speaker_Unknown") return -1;
+        return a[0].localeCompare(b[0]);
+      })
+    : [];
+
+  const dateStr = rec.created_at
+    ? new Date(rec.created_at).toLocaleString("en-US", {
+        dateStyle: "medium",
+        timeStyle: "short",
+      })
+    : null;
+
+  const chunks = Array.isArray(rec.chunks) ? rec.chunks : [];
+  const metaParts = [];
+  if (rec.audio_seconds) metaParts.push(formatTimestamp(rec.audio_seconds));
+  metaParts.push(`${chunks.length} topic${chunks.length === 1 ? "" : "s"}`);
+  metaParts.push(`${speakerEntries.length} speaker${speakerEntries.length === 1 ? "" : "s"}`);
+  if (dateStr) metaParts.push(dateStr);
+
+  // ── Embed .md + .json as inline data URLs ──
+  // The shareable .html artifact carries the markdown and JSON
+  // serializations inside itself as base64 data URLs, so a recipient
+  // who downloads the .html (email attachment, shared drive, etc.)
+  // can grab either format without going back to the relay — the
+  // relay endpoints are admin-auth-gated anyway, so external
+  // recipients couldn't reach them. Self-contained = truly portable.
+  //
+  // Size overhead: base64 inflates ~33%, but the resulting blobs
+  // are still in the tens-of-KB range even for hour-long meetings.
+  // Done at HTML-build time so we don't recompute on every download
+  // click in the browser.
+  const safeFilenameBase = (title || "meeting")
+    .replace(/[^a-zA-Z0-9-_.]+/g, "-")
+    .slice(0, 80) || "meeting";
+  const mdContent = meetingToMarkdown(rec);
+  const jsonContent = JSON.stringify(rec, null, 2);
+  const mdDataUrl =
+    "data:text/markdown;charset=utf-8;base64," +
+    Buffer.from(mdContent, "utf8").toString("base64");
+  const jsonDataUrl =
+    "data:application/json;charset=utf-8;base64," +
+    Buffer.from(jsonContent, "utf8").toString("base64");
+
+  const legendHtml = speakerEntries.length
+    ? (
+      `<section class="legend"><div class="legend-label">Speakers</div><div class="legend-chips">` +
+      speakerEntries.map(([id, stats]) => {
+        const c = speakerChipColor(id);
+        const label = speakerChipLabel(id, speakerNames);
+        const full = speakerDisplayName(id, speakerNames);
+        // `stats` may be null for a speaker with no recorded totals;
+        // show 0 rather than throwing while building the legend.
+        const secs = Math.round(stats?.total_speaking_seconds || 0);
+        return (
+          `<span class="legend-chip">` +
+            `<span class="chip" style="background:${c.bg};color:${c.fg};border-color:${c.bd};">${htmlEsc(label)}</span>` +
+            `<span class="legend-name">${htmlEsc(full)}</span>` +
+            `<span class="legend-secs">· ${formatTimestamp(secs)}</span>` +
+          `</span>`
+        );
+      }).join("") +
+      `</div></section>`
+    )
+    : "";
+
+  const topicsHtml = chunks.length
+    ? chunks.map((chunk, i) => {
+      const start = formatTimestamp(chunk.startTime || 0);
+      // Adjacent display: end = next chunk's start so topic ranges
+      // appear visually contiguous. Last chunk extends to the full
+      // audio duration. Fallback to last entry's offset.
+      let endSec;
+      if (i + 1 < chunks.length) {
+        endSec = chunks[i + 1].startTime || 0;
+      } else if (rec.audio_seconds) {
+        endSec = rec.audio_seconds;
+      } else {
+        const lastEntry = chunk.entries && chunk.entries[chunk.entries.length - 1];
+        endSec = lastEntry ? (lastEntry.offset || 0) : (chunk.startTime || 0);
+      }
+      const end = formatTimestamp(endSec);
+      const lines = (chunk.entries || []).map((entry) => {
+        const t = formatTimestamp(entry.offset || 0);
+        // Effective speaker: operator override (set via the
+        // dashboard's click-to-reassign UI) wins over the original
+        // diarization attribution. Override-source not shown in
+        // the static HTML download.
+        const effectiveSpeaker = entry.speaker_override || entry.speaker;
+        const chip = renderChipHtml(
+          effectiveSpeaker,
+          entry.speaker_confidence,
+          entry.speaker_uncertain,
+          speakerNames
+        );
+        return (
+          `<div class="line">` +
+            `<span class="ts">${htmlEsc(t)}</span>` +
+            (chip || `<span class="chip chip-empty"></span>`) +
+            `<span class="text">${htmlEsc(entry.text || "")}</span>` +
+          `</div>`
+        );
+      }).join("");
+      return (
+        `<details class="topic">` +
+          `<summary>` +
+            `<div class="topic-head">` +
+              `<span class="topic-title">${i + 1}. ${htmlEsc(chunk.title || "(untitled)")}</span>` +
+              `<span class="topic-range">${htmlEsc(start)} — ${htmlEsc(end)}</span>` +
+            `</div>` +
+            `<div class="topic-summary">${htmlEsc(chunk.summary || "")}</div>` +
+          `</summary>` +
+          `<div class="topic-body">` +
+            (lines || `<div class="empty-lines">No transcript entries for this topic.</div>`) +
+          `</div>` +
+        `</details>`
+      );
+    }).join("")
+    : `<div class="empty">No topic data — analyze may have failed.</div>`;
+
+  const transcriptHtml = rec.transcript
+    ? (
+      `<details class="full-transcript">` +
+        `<summary>Full transcript (bracketed)</summary>` +
+        `<pre>${htmlEsc(rec.transcript)}</pre>` +
+      `</details>`
+    )
+    : "";
+
+  // Phase 2 extras (TL;DR / decisions / action items / open
+  // questions / key quotes). Renders above the topics block when
+  // present; renderExtrasHtml returns "" when `rec.extras` is missing
+  // or has nothing in it, which hides the block.
+  const extrasHtml = renderExtrasHtml(rec.extras, speakerNames);
+
+  const css = `
+    :root {
+      --bg: #0b1220;
+      --panel: #111827;
+      --line: rgba(148,163,184,0.18);
+      --fg: #e2e8f0;
+      --fg-dim: #cbd5e1;
+      --fg-faint: #94a3b8;
+      --accent: #60a5fa;
+    }
+    * { box-sizing: border-box; }
+    html, body {
+      margin: 0;
+      padding: 0;
+      background: var(--bg);
+      color: var(--fg);
+      font-family: -apple-system, BlinkMacSystemFont, "Segoe UI", Roboto, Helvetica, Arial, sans-serif;
+      font-size: 14px;
+      line-height: 1.5;
+    }
+    main {
+      max-width: 920px;
+      margin: 0 auto;
+      padding: 32px 24px 64px;
+    }
+    header { margin-bottom: 18px; }
+    h1 {
+      font-size: 22px;
+      font-weight: 600;
+      margin: 0 0 6px;
+      color: var(--fg);
+    }
+    .meta {
+      font-size: 12px;
+      color: var(--fg-dim);
+    }
+    .header-actions {
+      margin-top: 12px;
+      display: flex;
+      flex-wrap: wrap;
+      gap: 8px;
+    }
+    .dl-btn {
+      display: inline-block;
+      padding: 6px 12px;
+      background: transparent;
+      border: 1px solid var(--line);
+      border-radius: 5px;
+      color: var(--fg);
+      font-size: 12px;
+      font-weight: 500;
+      text-decoration: none;
+      cursor: pointer;
+      transition: border-color 0.15s, background 0.15s;
+    }
+    .dl-btn:hover {
+      border-color: var(--accent);
+      background: rgba(96,165,250,0.08);
+    }
+    @media print {
+      .header-actions { display: none; }
+    }
+    .legend {
+      background: rgba(15,23,42,0.5);
+      border: 1px solid var(--line);
+      border-radius: 8px;
+      padding: 10px 14px;
+      margin-bottom: 16px;
+    }
+    .legend-label {
+      font-size: 10px;
+      font-weight: 600;
+      color: var(--fg-faint);
+      text-transform: uppercase;
+      letter-spacing: 0.06em;
+      margin-bottom: 8px;
+    }
+    .legend-chips { display: flex; flex-wrap: wrap; gap: 8px; }
+    .legend-chip {
+      display: inline-flex;
+      align-items: center;
+      gap: 6px;
+      padding: 3px 10px;
+      background: rgba(255,255,255,0.03);
+      border: 1px solid var(--line);
+      border-radius: 16px;
+      font-size: 11px;
+    }
+    .legend-name { color: var(--fg); }
+    .legend-secs { color: var(--fg-faint); }
+    .chip {
+      display: inline-flex;
+      align-items: center;
+      justify-content: center;
+      min-width: 26px;
+      height: 18px;
+      padding: 0 6px;
+      font-size: 10px;
+      font-weight: 700;
+      border-radius: 4px;
+      flex-shrink: 0;
+      letter-spacing: 0.02em;
+      line-height: 1;
+      font-family: ui-monospace, Menlo, Consolas, monospace;
+      border: 1px solid;
+    }
+    .chip-empty { background: transparent; border-color: transparent; }
+    /* Phase 2 extras block — TLDR + decisions / action items /
+       open questions / key quotes. Sits above the topics list. */
+    .extras { display: flex; flex-direction: column; gap: 8px; margin-bottom: 16px; }
+    .tldr {
+      background: linear-gradient(135deg, rgba(96,165,250,0.08), rgba(15,23,42,0.5));
+      border: 1px solid var(--line);
+      border-left: 3px solid var(--accent);
+      border-radius: 8px;
+      padding: 12px 16px;
+    }
+    .tldr-label {
+      font-size: 10px;
+      font-weight: 600;
+      color: var(--accent);
+      text-transform: uppercase;
+      letter-spacing: 0.08em;
+      margin-bottom: 6px;
+    }
+    .tldr-summary { font-size: 13px; line-height: 1.6; color: var(--fg); }
+    .tldr-meta {
+      margin-top: 8px;
+      display: flex;
+      flex-wrap: wrap;
+      gap: 8px;
+      align-items: center;
+      font-size: 11px;
+      color: var(--fg-faint);
+    }
+    @media print {
+      .tldr { background: #f5f9ff; border-color: #cbd5e1; border-left-color: #2563eb; }
+      .tldr-label { color: #2563eb; }
+    }
+    details.extras-section {
+      background: var(--panel);
+      border: 1px solid var(--line);
+      border-radius: 8px;
+      overflow: hidden;
+    }
+    details.extras-section > summary {
+      padding: 10px 14px;
+      cursor: pointer;
+      list-style: none;
+      display: flex;
+      align-items: baseline;
+      gap: 8px;
+    }
+    details.extras-section > summary::-webkit-details-marker { display: none; }
+    .extras-title { font-size: 13px; font-weight: 600; color: var(--fg); }
+    .extras-count { font-size: 11px; color: var(--fg-faint); }
+    .extras-body {
+      border-top: 1px solid var(--line);
+      padding: 8px 14px 12px;
+      background: rgba(15,23,42,0.3);
+      display: flex;
+      flex-direction: column;
+      gap: 10px;
+    }
+    .extras-item { font-size: 12px; line-height: 1.55; color: var(--fg); }
+    .extras-text {}
+    .extras-quote {
+      font-style: italic;
+      border-left: 3px solid var(--line);
+      padding-left: 10px;
+    }
+    .extras-meta {
+      margin-top: 4px;
+      display: flex;
+      flex-wrap: wrap;
+      gap: 8px;
+      align-items: center;
+      font-size: 11px;
+      color: var(--fg-faint);
+    }
+    .meta-label { color: var(--fg-faint); }
+    .meta-due { color: var(--fg-dim); }
+    .sep { color: var(--fg-faint); }
+    .ts-tag {
+      display: inline-block;
+      padding: 1px 6px;
+      border: 1px solid var(--line);
+      border-radius: 4px;
+      color: var(--accent);
+      font-family: ui-monospace, Menlo, Consolas, monospace;
+      font-size: 10.5px;
+    }
+    .inline-chip { display: inline-flex; align-items: center; gap: 4px; }
+    .inline-chip .chip {
+      min-width: 22px;
+      height: 16px;
+      padding: 0 5px;
+      font-size: 9px;
+    }
+    .inline-name { font-size: 11px; color: var(--fg-dim); }
+    .topics { display: flex; flex-direction: column; gap: 10px; }
+    details.topic {
+      background: var(--panel);
+      border: 1px solid var(--line);
+      border-radius: 8px;
+      padding: 0;
+      overflow: hidden;
+    }
+    details.topic > summary {
+      padding: 12px 16px;
+      cursor: pointer;
+      list-style: none;
+    }
+    details.topic > summary::-webkit-details-marker { display: none; }
+    .topic-head {
+      display: flex;
+      align-items: baseline;
+      gap: 10px;
+    }
+    .topic-title { font-size: 13px; font-weight: 600; color: var(--fg); }
+    .topic-range {
+      font-size: 10.5px;
+      color: var(--fg-faint);
+      font-family: ui-monospace, Menlo, Consolas, monospace;
+    }
+    .topic-summary {
+      font-size: 12px;
+      color: var(--fg-dim);
+      line-height: 1.55;
+      margin-top: 6px;
+    }
+    .topic-body {
+      border-top: 1px solid var(--line);
+      padding: 8px 8px 12px;
+      background: rgba(15,23,42,0.3);
+    }
+    .line {
+      display: flex;
+      gap: 10px;
+      align-items: flex-start;
+      padding: 4px 8px;
+      font-size: 12px;
+      line-height: 1.55;
+      color: var(--fg);
+    }
+    .line .ts {
+      font-size: 11px;
+      color: var(--accent);
+      min-width: 54px;
+      padding-top: 2px;
+      font-family: ui-monospace, Menlo, Consolas, monospace;
+    }
+    .line .text { flex: 1; }
+    .empty-lines, .empty {
+      padding: 10px 14px;
+      font-size: 11px;
+      color: var(--fg-faint);
+    }
+    details.full-transcript {
+      margin-top: 24px;
+      background: var(--panel);
+      border: 1px solid var(--line);
+      border-radius: 8px;
+      padding: 12px 16px;
+    }
+    details.full-transcript > summary {
+      cursor: pointer;
+      font-size: 12px;
+      font-weight: 600;
+      color: var(--fg-dim);
+    }
+    details.full-transcript pre {
+      margin: 12px 0 0;
+      padding: 12px;
+      background: rgba(15,23,42,0.5);
+      border: 1px solid var(--line);
+      border-radius: 6px;
+      font-family: ui-monospace, Menlo, Consolas, monospace;
+      font-size: 11px;
+      line-height: 1.55;
+      color: var(--fg-dim);
+      white-space: pre-wrap;
+      word-break: break-word;
+      max-height: 60vh;
+      overflow: auto;
+    }
+    footer {
+      margin-top: 32px;
+      padding-top: 16px;
+      border-top: 1px solid var(--line);
+      font-size: 11px;
+      color: var(--fg-faint);
+      text-align: center;
+    }
+    /* Print styles — flatten dark theme for paper. The theme variables
+       are re-pointed first: most rules set their color/background via
+       var(), so overriding only html/body would leave light text on
+       white (and ".topic" alone loses to "details.topic"). */
+    @media print {
+      :root {
+        --bg: #fff;
+        --panel: #fff;
+        --line: #ddd;
+        --fg: #111;
+        --fg-dim: #444;
+        --fg-faint: #888;
+        --accent: #2563eb;
+      }
+      html, body { background: #fff; color: #111; }
+      .topic, .legend, details.full-transcript { background: #fff; border-color: #ddd; }
+      .extras-body, .topic-body, details.full-transcript pre { background: #fff; }
+      /* Don't clip the transcript to the on-screen scroll box. */
+      details.full-transcript pre { max-height: none; overflow: visible; }
+      /* Chip colors are inline styles tuned for the dark theme, so
+         !important is needed to make them legible on paper. */
+      .chip:not(.chip-empty) {
+        background: transparent !important;
+        color: #111 !important;
+        border-color: #888 !important;
+      }
+      .topic-summary, .legend-name, .meta { color: #444; }
+      .legend-secs, .topic-range, .empty-lines, .empty { color: #888; }
+      .line .ts { color: #2563eb; }
+      details { break-inside: avoid; }
+      details > summary { list-style: none; }
+      details, details > summary { display: block !important; }
+      details > summary + * { display: block !important; }
+    }
+  `;
+
+  return (
+    `<!doctype html>\n<html lang="en">\n<head>\n` +
+    `<meta charset="utf-8">\n` +
+    `<meta name="viewport" content="width=device-width, initial-scale=1">\n` +
+    `<title>${htmlEsc(title)}</title>\n` +
+    `<style>${css}</style>\n` +
+    `</head>\n<body>\n<main>\n` +
+    `<header>\n` +
+      `<h1>${htmlEsc(title)}</h1>\n` +
+      `<div class="meta">${htmlEsc(metaParts.join(" · "))}</div>\n` +
+      // Download buttons for the .md + .json siblings — embedded in
+      // the .html itself as base64 data URLs so they work entirely
+      // offline (no relay round-trip, no auth needed). Lets a
+      // recipient who got the .html grab any of the three formats
+      // without operator access.
+      `<div class="header-actions">\n` +
+        `<a class="dl-btn" href="${mdDataUrl}" download="${htmlEsc(safeFilenameBase)}.md">Download .md</a>\n` +
+        `<a class="dl-btn" href="${jsonDataUrl}" download="${htmlEsc(safeFilenameBase)}.json">Download .json</a>\n` +
+      `</div>\n` +
+    `</header>\n` +
+    legendHtml +
+    extrasHtml +
+    `<section class="topics">${topicsHtml}</section>\n` +
+    transcriptHtml +
+    `<footer>Generated by Recap Relay · Internal Meetings</footer>\n` +
+    `</main>\n</body>\n</html>\n`
+  );
+}
+
+// ─── Pipeline orchestrator ──────────────────────────────────────────
+// Runs the full hardware pipeline on an uploaded audio file. Mirrors
+// the relevant portion of summarize-url.js but without the URL
+// download / credit accounting / Recaps-app envelope layers.
+
+async function runMeetingPipeline({
+  dataDir,
+  jobId,
+  audioPath,
+  mimeType,
+  audioSec,
+  title,
+  participants,
+  notes = "",
+}) {
+  const cfg = await getConfigSnapshot();
+  const hw = await resolveHardwareConfig(cfg);
+  if (!hw.transcribe.url) {
+    throw new Error(
+      "hardware transcribe not available — Spark Control discovery isn't reporting a ready endpoint"
+    );
+  }
+
+  // ── Acquire hardware FIFO slot ──
+  const release = await acquireHardwareSlot({
+    jobId,
+    onWait: ({ position, activeJobId }) => {
+      appendEvent(jobId, "queued", {
+        position,
+        activeJobId: activeJobId || null,
+      });
+      setProgress(
+        jobId,
+        `queued — ${position} job(s) ahead on operator hardware`
+      );
+    },
+  });
+
+  try {
+    markRunning(jobId);
+    appendEvent(jobId, "progress", { message: "reading audio…" });
+
+    const audioBuf = await fs.readFile(audioPath);
+
+    // Build analyze backend up-front so the pipelined-analyze worker
+    // can fire windows as soon as their chunks arrive.
+    const analyzeBackend = createHardwareBackend({
+      parakeetBaseURL: hw.transcribe.url || "",
+      gemmaBaseURL: hw.analyze.url,
+      sparkControlBaseURL: hw.sparkBase || "",
+      parakeetModel: hw.transcribe.model || "",
+      gemmaModel: hw.analyze.model || "",
+      anMaxTokens: cfg.relay_hardware_an_max_tokens || 16000,
+    });
+
+    const bodyMin = cfg.relay_hardware_analyze_window_minutes || 18;
+    const overlapMin = cfg.relay_hardware_analyze_overlap_minutes || 2;
+    const anConcurrency = cfg.relay_hardware_analyze_concurrency || 8;
+    const cutoffMin = cfg.relay_analyze_cutoff_minutes || 25;
+    const targetTotalsByBucket = {
+      under_30: cfg.relay_analyze_total_sections_under_30,
+      "30_60": cfg.relay_analyze_total_sections_30_60,
+      "60_90": cfg.relay_analyze_total_sections_60_90,
+      "90_120": cfg.relay_analyze_total_sections_90_120,
+      "120_150": cfg.relay_analyze_total_sections_120_150,
+      "150_180": cfg.relay_analyze_total_sections_150_180,
+      over_180: cfg.relay_analyze_total_sections_over_180,
+    };
+    const analyzePromptOverride =
+      cfg.relay_analyze_prompt || cfg.relay_analyze_prompt_default || "";
+    const computeCostDetails = () => ({
+      input_tokens: 0,
+      output_tokens: 0,
+      thinking_tokens: 0,
+      cost_usd: 0,
+    });
+
+    const chunkBuffer = createChunkBuffer();
+    const pipelinedAnalyzePromise = runPipelinedAnalysis({
+      audioDurationSec: audioSec || 0,
+      waitForTime: (sec) => chunkBuffer.waitForTime(sec),
+      getReadySegments: (s, e) => chunkBuffer.getSegments(s, e),
+      bodySeconds: bodyMin * 60,
+      overlapSeconds: overlapMin * 60,
+      cutoffSeconds: cutoffMin * 60,
+      concurrency: anConcurrency,
+      backend: analyzeBackend,
+      pipelineBackend: "hardware",
+      jobId,
+      batchId: null,
+      mediaUrl: null,
+      title: title || null,
+      installId: "internal-meetings",
+      licenseFingerprint: null,
+      source: "internal-meetings",
+      computeCostDetails,
+      analyzePromptOverride,
+      targetTotalsByBucket,
+      onWindowComplete: (cb) => {
+        appendEvent(jobId, "window_complete", {
+          windowIdx: cb.windowIdx,
+          totalWindows: cb.totalWindows,
+          ownedSections: cb.ownedSections,
+          windowEntries: cb.windowEntries || undefined,
+          windowBodySeconds: cb.windowBodySeconds,
+          model: cb.model,
+          durationMs: cb.durationMs,
+        });
+        setProgress(
+          jobId,
+          `analyze window ${cb.windowIdx + 1}/${cb.totalWindows} done`
+        );
+      },
+    }).catch((err) => ({ __error: err }));
+
+    const transcribeBackend = createHardwareBackend({
+      parakeetBaseURL: hw.transcribe.url || "",
+      gemmaBaseURL: hw.analyze.url || "",
+      sparkControlBaseURL: hw.sparkBase || "",
+      parakeetModel: hw.transcribe.model || "",
+      gemmaModel: hw.analyze.model || "",
+      txChunkSeconds: (cfg.relay_hardware_tx_chunk_minutes || 5) * 60,
+      txChunkOverlapSeconds:
+        cfg.relay_hardware_tx_chunk_overlap_seconds ?? 30,
+      diarizationEnabled: !!cfg.relay_hardware_diarization_enabled,
+      clusterThresholdPct:
+        cfg.relay_hardware_voice_clustering_threshold ?? 70,
+      anchorMinSpeakingSec:
+        cfg.relay_hardware_anchor_min_speaking_sec ?? 30,
+      smallClusterMaxSpeakingSec:
+        cfg.relay_hardware_small_cluster_max_speaking_sec ?? 15,
+      uncertainMarginPct: cfg.relay_hardware_uncertain_margin_pct ?? 10,
+      txConcurrency: cfg.relay_hardware_tx_concurrency || 4,
+      anMaxTokens: cfg.relay_hardware_an_max_tokens || 16000,
+      onChunkComplete: (cd) => chunkBuffer.add(cd),
+    });
+
+    const txResult = await transcribeBackend.transcribeAudio({
+      audio: audioBuf,
+      mimeType,
+      offsetSeconds: 0,
+    });
+
+    appendEvent(jobId, "transcribe_complete", {
+      transcript: txResult.text || "",
+      model: txResult.model || null,
+      chunk_count: txResult.chunk_count ?? null,
+      audio_seconds: audioSec || null,
+    });
+
+    // Await the pipelined analyze.
+    const pipelinedRaw = await pipelinedAnalyzePromise;
+    if (pipelinedRaw && pipelinedRaw.__error) {
+      throw pipelinedRaw.__error;
+    }
+
+    // Remap window-local section indices to global canonical indices,
+    // mirroring summarize-url.js's post-pipeline stitch.
+    const canonicalEntries = parseBracketedTranscript(txResult.text || "");
+    const syntheticResults = (pipelinedRaw.windowResults || []).map((wr) => {
+      if (!wr || !wr.ok) return wr;
+      const w = wr.window;
+      const globalStartIdx = firstEntryAtOrAfter(canonicalEntries, w.startSec);
+      const globalBodyStartIdx = firstEntryAtOrAfter(
+        canonicalEntries,
+        w.bodyStartSec
+      );
+      const globalEndIdx = lastEntryBefore(
+        canonicalEntries,
+        w.windowEndSec + 0.5
+      );
+      if (
+        globalStartIdx >= canonicalEntries.length ||
+        globalEndIdx < globalStartIdx
+      ) {
+        return {
+          window: { startIdx: 0, endIdx: -1, bodyStartIdx: 0 },
+          ok: false,
+          error: new Error("pipelined window had no canonical entries"),
+        };
+      }
+      const remapped = [];
+      for (const s of wr.sections || []) {
+        const localStartEntry = wr.windowEntries?.[s.startIndex];
+        const localEndEntry = wr.windowEntries?.[s.endIndex];
+        if (!localStartEntry || !localEndEntry) continue;
+        const globalStart = canonicalIndexForOffset(
+          canonicalEntries,
+          localStartEntry.offset || 0
+        );
+        const globalEnd = canonicalIndexForOffset(
+          canonicalEntries,
+          localEndEntry.offset || 0
+        );
+        if (globalStart < 0 || globalEnd < 0) continue;
+        remapped.push({
+          startIndex: globalStart - globalStartIdx,
+          endIndex: globalEnd - globalStartIdx,
+          title: s.title,
+          summary: s.summary,
+        });
+      }
+      return {
+        window: {
+          startIdx: globalStartIdx,
+          endIdx: globalEndIdx,
+          bodyStartIdx: globalBodyStartIdx,
+        },
+        ok: true,
+        sections: remapped,
+        model: wr.model,
+      };
+    });
+    const stitched = stitchAnalysisResults(syntheticResults);
+    let analyzeResult = {
+      text: JSON.stringify({ sections: stitched }),
+      model: pipelinedRaw.dominantModel,
+      attempts: pipelinedRaw.attempts,
+    };
+
+    // ── Polish pass ──
+    let speakerNames = null;
+    const polishEnabled = cfg.relay_post_cluster_polish_enabled !== false;
+    const detectedSpeakerCount = Object.keys(txResult?.speakers || {}).length;
+    const parsedAnalysis = JSON.parse(analyzeResult.text);
+    const polishableSections = Array.isArray(parsedAnalysis.sections)
+      ? parsedAnalysis.sections
+      : null;
+    if (
+      polishEnabled &&
+      detectedSpeakerCount >= 2 &&
+      Array.isArray(txResult?.segments) &&
+      polishableSections &&
+      polishableSections.length > 0
+    ) {
+      appendEvent(jobId, "progress", { message: "polishing summaries…" });
+      try {
+        speakerNames = await runNameInference({
+          speakers: txResult.speakers,
+          transcriptSegments: txResult.segments,
+          channelHint: "",
+          titleHint: title || "",
+          // descriptionHint stays empty for internal meetings —
+          // we don't want to stuff participants into the "Description"
+          // metadata field where the LLM might read them as factual
+          // metadata about the meeting. They go through the explicit
+          // OPERATOR HINTS pathway instead, which the prompt warns
+          // the model to treat as suggestion-not-truth.
+          descriptionHint: "",
+          participantHints: Array.isArray(participants) && participants.length
+            ? participants.join(", ")
+            : "",
+          operatorNotes: notes || "",
+          backend: analyzeBackend,
+          pipelineBackend: "hardware",
+          jobId,
+          batchId: null,
+          mediaUrl: null,
+          installId: "internal-meetings",
+          licenseFingerprint: null,
+          source: "internal-meetings",
+          computeCostDetails,
+        });
+
+        const canonicalForPolish = parseBracketedTranscript(
+          txResult.text || ""
+        );
+        const { planWindowsByDuration } = await import("../chunked-analyze.js");
+        const windowsForPolish = planWindowsByDuration({
+          totalAudioSec: audioSec || 0,
+          bodySeconds: bodyMin * 60,
+          overlapSeconds: overlapMin * 60,
+          cutoffSeconds: cutoffMin * 60,
+        });
+        const polishedSections = await runSummaryPolish({
+          sections: polishableSections,
+          canonicalEntries: canonicalForPolish,
+          windows: windowsForPolish,
+          transcriptSegments: txResult.segments,
+          speakerNames,
+          speakerStats: txResult.speakers,
+          backend: analyzeBackend,
+          concurrency: anConcurrency,
+          pipelineBackend: "hardware",
+          jobId,
+          batchId: null,
+          mediaUrl: null,
+          installId: "internal-meetings",
+          licenseFingerprint: null,
+          source: "internal-meetings",
+          computeCostDetails,
+        });
+        analyzeResult = {
+          ...analyzeResult,
+          text: JSON.stringify({ sections: polishedSections }),
+        };
+      } catch (err) {
+        console.warn(
+          `[internal-meetings ${jobId.slice(0, 8)}] polish failed (keeping unpolished output): ${err?.message || err}`
+        );
+        speakerNames = null;
+      }
+    }
+
+    // Build the chunks shape Recaps-style rendering expects:
+    // chunks[i] = { title, summary, startTime, entries: [...] }
+    //
+    // Gap-absorbing slice: the LLM's analyze pass returns section
+    // ranges (startIndex/endIndex) that don't always cover every
+    // entry — short audio especially produces gaps where the model
+    // skipped over filler ("uh", "yeah, OK") between coherent
+    // topics. The naive slice(start, end+1) drops those orphaned
+    // entries entirely, so the user sees topic cards with one
+    // statement under a summary that clearly references more
+    // dialogue, and big un-rendered gaps between consecutive topic
+    // timestamps (e.g. 2:10 → 2:56 with nothing shown in between).
+    //
+    // We extend each chunk's end to one before the NEXT chunk's
+    // start (so consecutive topics are exactly adjacent), and the
+    // final chunk extends to the end of the transcript. Chunk 0
+    // backfills to entry 0 to absorb any opening preamble the LLM
+    // skipped. Result: every canonical entry lives in exactly one
+    // chunk's entries[], no transcript line is hidden, and topic
+    // ranges in the UI become contiguous.
+    //
+    // The LLM's original (uncovered) ranges stay in
+    // `analysis.sections` (saved with the record) for forensics —
+    // we only adjust the rendered `chunks`.
+    const finalAnalysis = JSON.parse(analyzeResult.text);
+    const sortedSections = (finalAnalysis.sections || [])
+      .slice()
+      .sort((a, b) => (a.startIndex ?? 0) - (b.startIndex ?? 0));
+    const lastEntryIdx = canonicalEntries.length - 1;
+    const chunks = sortedSections
+      .map((s, idx, arr) => {
+        let start = Math.max(0, s.startIndex ?? 0);
+        let end = Math.min(lastEntryIdx, s.endIndex ?? start);
+        // First chunk absorbs any pre-topic preamble.
+        if (idx === 0) start = 0;
+        // Non-final chunks extend to one before the next chunk's
+        // start. We take the MAX of (LLM-provided end, next-1) so
+        // we don't shrink a section the LLM intentionally made
+        // wider than the gap suggests.
+        if (idx + 1 < arr.length) {
+          const nextStart = arr[idx + 1].startIndex ?? canonicalEntries.length;
+          end = Math.max(end, Math.min(lastEntryIdx, nextStart - 1));
+        } else {
+          // Last section absorbs any trailing entries.
+          end = lastEntryIdx;
+        }
+        // Defensive clamps in case the LLM emitted backwards ranges.
+        if (end < start) end = start;
+        const slice = canonicalEntries.slice(start, end + 1);
+        return {
+          title: s.title,
+          summary: s.summary,
+          entries: slice,
+          startTime: slice[0]?.offset || 0,
+        };
+      })
+      .filter((c) => c.entries.length > 0);
+
+    // Attach speakers to each entry by timestamp match.
+    //
+    // Tricky bit: `entry.offset` came from parseBracketedTranscript,
+    // which extracted an INTEGER seconds value from a [m:ss] / [h:mm:ss]
+    // bracket. That bracket was originally emitted by formatMmSs in
+    // hardware.js using Math.floor(seg.start). So `entry.offset` is
+    // exactly Math.floor(sourceSegment.start). The segments' own
+    // `start` field still carries float precision.
+    //
+    // The earlier strict containment check (`seg.start <= t <= seg.end`)
+    // misses every entry where seg.start has a fractional part — e.g.
+    // seg.start=0.32 and t=0 fails because 0 < 0.32. That's why the
+    // detail view rendered no chips at all even though the speakers
+    // legend showed the diarized roster.
+    //
+    // Build a floored-start index for O(1) lookup, with a tolerant
+    // fallback for the rare cases where mergeShortEntries dropped a
+    // line.
+    if (Array.isArray(txResult.segments) && txResult.segments.length) {
+      const sortedSegs = txResult.segments
+        .slice()
+        .sort((a, b) => (a.start || 0) - (b.start || 0));
+      const segByFlooredStart = new Map();
+      for (const seg of sortedSegs) {
+        const k = Math.floor(seg.start || 0);
+        if (!segByFlooredStart.has(k)) segByFlooredStart.set(k, seg);
+      }
+      const pickSpeaker = (t) => {
+        // Primary: exact floored-start match — this is the segment
+        // that produced the bracket the entry was parsed from.
+        let found = segByFlooredStart.get(t);
+        if (found && found.speaker) return found;
+        // Secondary: containing segment (covers gaps where the
+        // bracket-source segment had no speaker but a neighboring
+        // diar segment does cover this timestamp).
+        for (const seg of sortedSegs) {
+          if ((seg.start || 0) > t + 5) break;
+          if ((seg.start || 0) - 0.5 <= t && t <= (seg.end || 0) + 0.5) {
+            if (seg.speaker) return seg;
+          }
+        }
+        // Tertiary: nearest preceding segment within 5s window.
+        let bestPrev = null;
+        let bestDist = Infinity;
+        for (const seg of sortedSegs) {
+          if ((seg.start || 0) > t) break;
+          const dist = t - (seg.start || 0);
+          if (dist < bestDist && seg.speaker) {
+            bestDist = dist;
+            bestPrev = seg;
+          }
+        }
+        if (bestPrev && bestDist <= 5) return bestPrev;
+        return null;
+      };
+      for (const chunk of chunks) {
+        for (const entry of chunk.entries) {
+          const t = entry.offset || 0;
+          const found = pickSpeaker(t);
+          if (found && found.speaker) {
+            entry.speaker = found.speaker;
+            entry.speaker_confidence = found.speaker_confidence ?? null;
+            entry.speaker_uncertain = !!found.speaker_uncertain;
+          }
+        }
+      }
+    }
+
+    const transcriptSegments = Array.isArray(txResult?.segments)
+      ? txResult.segments.map((s) => ({
+          start: s.start || 0,
+          end: s.end || 0,
+          text: s.text || "",
+          speaker: s.speaker || null,
+          speaker_confidence: s.speaker_confidence ?? null,
+          speaker_uncertain: !!s.speaker_uncertain,
+        }))
+      : null;
+
+    // ── Phase 2: Meeting extras ──
+    // Single LLM pass to pull out structured information operators
+    // want at the top of a meeting recap: decisions, action items,
+    // open questions, key quotes. Each item carries speaker IDs +
+    // offsets so the dashboard can render speaker chips and
+    // clickable timestamps that jump to the supporting transcript
+    // line. Failure is non-fatal — rec.extras stays null and the
+    // UI just hides the section.
+    const extrasEnabled = cfg.relay_meeting_extras_enabled !== false;
+    let extras = null;
+    if (extrasEnabled && Array.isArray(transcriptSegments) && transcriptSegments.length) {
+      appendEvent(jobId, "progress", { message: "extracting decisions + action items…" });
+      try {
+        extras = await runMeetingExtras({
+          title,
+          audioSec: audioSec || 0,
+          speakers: txResult.speakers || {},
+          speakerNames: speakerNames || {},
+          transcriptSegments,
+          topics: chunks.map((c) => ({
+            title: c.title,
+            summary: c.summary,
+            startTime: c.startTime,
+          })),
+          // Operator hints passed through to the extras prompt the
+          // same way they're passed to name-inference — explicit
+          // hints, framed in the prompt as suggestions, not truth.
+          participantHints: Array.isArray(participants) && participants.length
+            ? participants.join(", ")
+            : "",
+          operatorNotes: notes || "",
+          promptOverride: cfg.relay_meeting_extras_prompt || "",
+          backend: analyzeBackend,
+          pipelineBackend: "hardware",
+          jobId,
+          installId: "internal-meetings",
+          licenseFingerprint: null,
+          source: "internal-meetings",
+          computeCostDetails,
+        });
+      } catch (err) {
+        console.warn(
+          `[internal-meetings ${jobId.slice(0, 8)}] extras extraction failed (non-fatal): ${err?.message || err}`
+        );
+        extras = null;
+      }
+    }
+
+    // ── Save the record ──
+    // Note: `notes` from the upload form is intentionally NOT
+    // persisted here. Notes are LLM hints only — used by name-
+    // inference + extras at pipeline time, then dropped. They
+    // never appear in the dashboard detail view, the .md/.html/.json
+    // downloads, or any operator-readable artifact. The operator
+    // can write candid context ("Steve is the new guy still
+    // figuring stuff out", "John was angry about Q3") without
+    // worrying about it becoming part of a shareable meeting recap.
+    const record = {
+      id: jobId,
+      type: "internal-meeting",
+      title: title || "Untitled meeting",
+      participants: Array.isArray(participants) ? participants : [],
+      created_at: Date.now(),
+      audio_seconds: audioSec || 0,
+      transcript: txResult.text || "",
+      transcript_segments: transcriptSegments,
+      speakers: txResult.speakers || null,
+      speaker_names: speakerNames || null,
+      diarization: txResult.diarization || null,
+      chunks,
+      analysis: finalAnalysis,
+      extras,
+      meta: {
+        transcribe_model: txResult.model || null,
+        analyze_model: analyzeResult.model || null,
+        polish_done: !!speakerNames,
+        extras_done: !!extras,
+      },
+    };
+    await saveMeeting(dataDir, jobId, record);
+
+    markComplete(jobId, {
+      result: {
+        id: jobId,
+        title: record.title,
+        audio_seconds: record.audio_seconds,
+        topic_count: chunks.length,
+        speaker_count: Object.keys(record.speakers || {}).length,
+        named_speaker_count: speakerNames
+          ? Object.values(speakerNames).filter(Boolean).length
+          : 0,
+      },
+      credit_charged: 0,
+      tier: "operator",
+    });
+    console.log(
+      `[internal-meetings ${jobId.slice(0, 8)}] complete — ${chunks.length} topics, ${Object.keys(record.speakers || {}).length} speakers`
+    );
+  } finally {
+    release();
+    // ALWAYS delete the uploaded audio file after processing (success
+    // or failure). The relay never retains audio for internal
+    // meetings — same policy as the YouTube/podcast download path.
+    try {
+      await fs.unlink(audioPath);
+    } catch {}
+  }
+}
+
+// ─── Router ─────────────────────────────────────────────────────────
+
+export function internalMeetingsRouter({ dataDir }) {
+  const router = express.Router();
+
+  // Multer config: write uploads to OS tmp dir; we move/process and
+  // delete in the pipeline. memoryStorage would buffer the whole
+  // file in RAM — fine for short meetings, risky for 4-hour ones.
+  const upload = multer({
+    storage: multer.diskStorage({
+      destination: (_req, _file, cb) => {
+        fs.mkdtemp(path.join(os.tmpdir(), "relay-meeting-"))
+          .then((dir) => cb(null, dir))
+          .catch((err) => cb(err));
+      },
+      filename: (_req, file, cb) => {
+        // Preserve extension for mimeType detection downstream
+        const ext = path.extname(file.originalname || "") || ".bin";
+        cb(null, `upload${ext}`);
+      },
+    }),
+    limits: { fileSize: MAX_UPLOAD_BYTES },
+  });
+
+  // POST /admin/internal-meetings/upload
+  // multipart fields:
+  //   file         — audio (required)
+  //   title        — string (optional)
+  //   participants — CSV string of attendee names (optional, treated
+  //                  as HINTS only by the LLM)
+  //   notes        — free-form prose context for the LLM. Used by
+  //                  the name-inference + extras prompts as a soft
+  //                  signal for who-said-what attribution.
+  router.post("/upload", upload.single("file"), async (req, res) => {
+    const file = req.file;
+    if (!file) {
+      return res.status(400).json({ error: "no file uploaded" });
+    }
+    const title = (req.body?.title || "").toString().slice(0, 200);
+    const participantsCsv = (req.body?.participants || "").toString();
+    const participants = participantsCsv
+      .split(",")
+      .map((s) => s.trim())
+      .filter(Boolean)
+      .slice(0, 30); // soft cap
+    // Notes — free-form context the operator wants the LLM to factor
+    // in. Trimmed + clamped to 4000 chars (matches the cap in
+    // post-cluster-polish.js / meeting-extras.js so we don't store
+    // more than we'll ever send to the model). Empty string when
+    // not provided.
+    const notes = (req.body?.notes || "").toString().trim().slice(0, 4000);
+
+    // Probe audio duration up-front so the pipeline knows the
+    // window plan size. Falls back to 0 if probe fails (pipeline
+    // will single-shot in that case).
+    let audioSec = 0;
+    try {
+      audioSec = await getAudioDurationSeconds(file.path);
+    } catch (err) {
+      console.warn(
+        `[internal-meetings] duration probe failed for ${file.path}: ${err?.message || err}`
+      );
+    }
+
+    const job = createJob({
+      kind: "internal-meeting",
+      installId: "internal-meetings",
+      metadata: {
+        title,
+        participants,
+        notes,
+        audio_seconds: audioSec,
+        original_filename: file.originalname || null,
+        size_bytes: file.size,
+      },
+    });
+
+    console.log(
+      `[internal-meetings ${job.id.slice(0, 8)}] upload received — ${file.originalname || "(no name)"} ${Math.round((file.size || 0) / (1024 * 1024))}MB, ${Math.round(audioSec / 60)} min audio, title="${title}"${notes ? `, notes=${notes.length} chars` : ""}`
+    );
+
+    // Kick off the pipeline in the background. Don't await — we return
+    // the job ID immediately so the client can subscribe via SSE.
+    (async () => {
+      try {
+        await runMeetingPipeline({
+          dataDir,
+          jobId: job.id,
+          audioPath: file.path,
+          mimeType: file.mimetype || "audio/mpeg",
+          audioSec,
+          title,
+          participants,
+          notes,
+        });
+      } catch (err) {
+        const msg = (err?.message || String(err)).slice(0, 400);
+        markFailed(job.id, "meeting_failed: " + msg);
+        console.error(
+          `[internal-meetings ${job.id.slice(0, 8)}] worker crashed:`,
+          err
+        );
+      } finally {
+        // The upload sits alone in a per-request mkdtemp directory, so
+        // remove that directory on success AND failure (it used to leak
+        // on success). `force` tolerates an already-deleted audio file.
+        await fs
+          .rm(path.dirname(file.path), { recursive: true, force: true })
+          .catch((cleanupErr) => console.warn(`[internal-meetings ${job.id.slice(0, 8)}] temp cleanup failed: ${cleanupErr?.message || cleanupErr}`));
+      }
+    })();
+
+    res.json({
+      job_id: job.id,
+      title,
+      audio_seconds: audioSec,
+      participants,
+      notes,
+    });
+  });
+
+  // GET /admin/internal-meetings/jobs/:id/stream
+  // SSE stream of live progress events. Same event types
+  // summarize-url emits: progress, queued, transcribe_complete,
+  // window_complete, done, error.
+  router.get("/jobs/:id/stream", (req, res) => {
+    const job = getJob(req.params.id);
+    if (!job) {
+      res.status(404).json({ error: "no such job" });
+      return;
+    }
+    res.setHeader("Content-Type", "text/event-stream");
+    res.setHeader("Cache-Control", "no-cache, no-transform");
+    res.setHeader("Connection", "keep-alive");
+    res.flushHeaders?.();
+
+    // Best-effort SSE frame writer: serialize/write errors are swallowed.
+    function send(ev) {
+      try {
+        const payload = JSON.stringify(ev.data || {});
+        res.write(`event: ${ev.type}\ndata: ${payload}\n\n`);
+      } catch {}
+    }
+    const closeQuietly = () => {
+      try {
+        res.end();
+      } catch {}
+    };
+    // Replay the backlog so a late subscriber sees earlier events; an
+    // already-terminal job gets the replay and then the stream closes.
+    for (const past of job.events) send(past);
+    if (["complete", "failed"].includes(job.status)) {
+      res.end();
+      return;
+    }
+
+    const unsubscribe = subscribeToJob(job.id, (ev) => {
+      send(ev);
+      if (ev.type === "done" || ev.type === "error") closeQuietly();
+    });
+    req.on("close", () => {
+      try {
+        unsubscribe();
+      } catch {}
+    });
+  });
+
+  // GET /admin/internal-meetings/jobs/:id
+  router.get("/jobs/:id", (req, res) => {
+    const job = getJob(req.params.id);
+    if (!job) {
+      return res.status(404).json({ error: "no such job" });
+    }
+    // Respond with a fixed subset of the job's fields rather than
+    // the whole job object. Keys are emitted in the order listed
+    // here, matching the response shape clients already consume.
+    const exposed = [
+      "id", "kind", "status", "progress",
+      "started_at", "completed_at", "error", "result",
+    ];
+    res.json(Object.fromEntries(exposed.map((key) => [key, job[key]])));
+  });
+
+  // GET /admin/internal-meetings — list saved meetings
+  router.get("/", async (_req, res) => {
+    res.json({ meetings: await listMeetings(dataDir) });
+  });
+
+  // GET /admin/internal-meetings/:id — get full record JSON
+  router.get("/:id", async (req, res) => {
+    const rec = await loadMeeting(dataDir, req.params.id);
+    if (!rec) return res.status(404).json({ error: "not found" });
+    res.json(rec);
+  });
+
+  // GET /admin/internal-meetings/:id/markdown — markdown download
+  router.get("/:id/markdown", async (req, res) => {
+    const rec = await loadMeeting(dataDir, req.params.id);
+    if (!rec) {
+      return res.status(404).send("not found");
+    }
+    const body = meetingToMarkdown(rec);
+    // Download filename: every run of characters outside
+    // [a-zA-Z0-9-_.] collapses to one "-", capped at 80 chars.
+    const baseName = rec.title || "meeting";
+    const fileName = `${baseName.replace(/[^a-zA-Z0-9-_.]+/g, "-").slice(0, 80)}.md`;
+    res.setHeader("Content-Type", "text/markdown; charset=utf-8");
+    res.setHeader("Content-Disposition", `attachment; filename="${fileName}"`);
+    res.send(body);
+  });
+
+  // PATCH /admin/internal-meetings/:id/entries — per-line operator
+  // speaker re-assignment. Body shape:
+  //   { overrides: [{ chunk_idx, entry_idx, speaker_id }] }
+  // - speaker_id = a known cluster id ("Speaker_A", "Speaker_Unknown")
+  //   sets entry.speaker_override
+  // - speaker_id = "" CLEARS the override (reverts the line to its
+  //   original diarization-assigned speaker, if any)
+  //
+  // We persist the override as a separate field (entry.speaker_override)
+  // rather than overwriting entry.speaker so provenance is never
+  // destroyed — the original Sortformer attribution stays for
+  // debugging and so the operator can always revert. All downstream
+  // rendering (dashboard chips, .html / .md downloads) uses
+  // (entry.speaker_override || entry.speaker) so corrections show
+  // up everywhere.
+  //
+  // Why per-line and not just per-cluster: diarization on 4+
+  // speakers gets noisy in real meetings — similar voices get
+  // merged, mid-sentence speaker swaps get assigned to the wrong
+  // person, and the LLM name-inference compounds the issue when it
+  // confidently guesses the wrong person from limited context.
+  // Per-line override is the only knob that lets the operator
+  // perfectly correct the transcript without re-running anything
+  // upstream.
+  router.patch("/:id/entries", express.json(), async (req, res) => {
+    const rec = await loadMeeting(dataDir, req.params.id);
+    if (!rec) return res.status(404).json({ error: "not found" });
+    const overrides = req.body?.overrides;
+    if (!Array.isArray(overrides)) {
+      return res.status(400).json({ error: "overrides array required" });
+    }
+    // Assignable ids: every cluster key on the record plus the
+    // "Speaker_Unknown" bucket, which is always accepted.
+    const knownIds = new Set(Object.keys(rec.speakers || {}));
+    knownIds.add("Speaker_Unknown");
+    // Apply one override op in place; returns true only when the
+    // targeted entry actually changed. Malformed ops, out-of-range
+    // indices and unknown speaker ids are skipped silently.
+    const applyOverride = (op) => {
+      if (!op || typeof op !== "object") return false;
+      const { chunk_idx: ci, entry_idx: ei } = op;
+      if (!Number.isInteger(ci) || !Number.isInteger(ei)) return false;
+      if (ci < 0 || ei < 0) return false;
+      const entry = rec.chunks?.[ci]?.entries?.[ei];
+      if (!entry) return false;
+      const sid = typeof op.speaker_id === "string" ? op.speaker_id.trim() : "";
+      if (sid === "") {
+        // Blank id clears an existing override, if there is one.
+        if (!entry.speaker_override) return false;
+        delete entry.speaker_override;
+        return true;
+      }
+      if (!knownIds.has(sid) || entry.speaker_override === sid) return false;
+      entry.speaker_override = sid;
+      return true;
+    };
+    const changed = overrides.reduce((n, op) => n + (applyOverride(op) ? 1 : 0), 0);
+    if (changed > 0) {
+      rec.meta = rec.meta || {};
+      rec.meta.entries_edited_at = Date.now();
+      await saveMeeting(dataDir, req.params.id, rec);
+    }
+    res.json({ ok: true, changed });
+  });
+
+  // PATCH /admin/internal-meetings/:id/speakers — operator-driven
+  // speaker rename. Body: { speaker_names: { Speaker_A: "Matt", ... } }
+  // Persists into rec.speaker_names (the same field the polish-pass
+  // name inference writes). Markdown/HTML downloads and the
+  // dashboard speaker chips/legend pick this up immediately.
+  //
+  // Rationale: the LLM name inference is a best-guess from the first
+  // ~6 minutes of transcript context. On internal calls where
+  // participants speak each other's names rarely (or where the same
+  // first name is shared by two people), it gets things wrong. This
+  // endpoint lets the operator correct them after the fact. The
+  // change is a single field rewrite — no entry-rewriting, no
+  // re-clustering — because Speaker_X cluster IDs are stable; we
+  // just relabel the display name.
+  //
+  // Speaker MERGES (Speaker_A and Speaker_C are actually the same
+  // person) are a separate, harder change — they require rewriting
+  // every entry's .speaker and recomputing stats. Tracked as a
+  // follow-up; for now, two clusters with the same display name
+  // render with the same name on the legend but stay as distinct
+  // chips on the per-line attribution.
+  router.patch("/:id/speakers", express.json(), async (req, res) => {
+    const rec = await loadMeeting(dataDir, req.params.id);
+    if (!rec) return res.status(404).json({ error: "not found" });
+    const incoming = req.body?.speaker_names;
+    if (!incoming || typeof incoming !== "object") {
+      return res.status(400).json({ error: "speaker_names object required" });
+    }
+    // Edit a copy; the record is only reassigned when something changed.
+    // (typeof null is "object", and spreading null yields {}.)
+    const names =
+      typeof rec.speaker_names === "object" ? { ...rec.speaker_names } : {};
+    // Accept only keys shaped like cluster ids that also exist on
+    // this record; everything else in the payload is ignored. A
+    // blank or non-string value clears the stored name.
+    const clusterIdPattern = /^Speaker_[A-Z]+$/;
+    const knownIds = new Set(Object.keys(rec.speakers || {}));
+    let changed = 0;
+    for (const id of Object.keys(incoming)) {
+      if (!clusterIdPattern.test(id) || !knownIds.has(id)) continue;
+      const raw = incoming[id];
+      const label = typeof raw === "string" ? raw.trim().slice(0, 60) : "";
+      const previous = names[id];
+      if (label && previous !== label) {
+        names[id] = label;
+        changed += 1;
+      } else if (!label && previous) {
+        delete names[id];
+        changed += 1;
+      }
+    }
+    if (changed > 0) {
+      rec.speaker_names = names;
+      // Timestamp the operator edit on the record's meta.
+      rec.meta = rec.meta || {};
+      rec.meta.speaker_names_edited_at = Date.now();
+      await saveMeeting(dataDir, req.params.id, rec);
+    }
+    res.json({
+      ok: true,
+      changed,
+      speaker_names: names,
+    });
+  });
+
+  // PATCH /admin/internal-meetings/:id/merge-speakers — fold one or
+  // more clusters that diarization mistakenly split apart into a single
+  // speaker. Body: { survivor: "Speaker_A", absorbed: ["Speaker_C"] }.
+  // Rewrites every label reference (segments, entries, overrides),
+  // sums the per-cluster stats, and rewrites extras attributions. The
+  // survivor keeps its own display name (inheriting the absorbed name
+  // only if it had none). This is the inverse of a re-cluster: use it
+  // when ONE person was diarized as two; use re-cluster when TWO people
+  // were diarized as one.
+  router.patch("/:id/merge-speakers", express.json(), async (req, res) => {
+    const rec = await loadMeeting(dataDir, req.params.id);
+    if (!rec) {
+      return res.status(404).json({ error: "not found" });
+    }
+    const { survivor, absorbed } = req.body ?? {};
+    try {
+      // The record is persisted right after the merge call returns.
+      const merged = mergeSpeakersInRecord(rec, survivor, absorbed);
+      await saveMeeting(dataDir, req.params.id, rec);
+      res.json({ ok: true, ...merged });
+    } catch (err) {
+      if (err?.code === "BAD_REQUEST") return res.status(400).json({ error: err.message });
+      console.error(
+        `[internal-meetings] merge-speakers failed for ${req.params.id}: ${err?.message || err}`
+      );
+      res.status(500).json({ error: "merge failed" });
+    }
+  });
+
+  // POST /admin/internal-meetings/:id/recluster — re-run the cross-chunk
+  // voice clustering on the persisted per-chunk fingerprints at a new
+  // strictness threshold, to separate speakers that were over-merged
+  // into one cluster. Fully offline (no audio, no Spark Control). Body:
+  //   { threshold, anchorMinSpeakingSec?, smallClusterMaxSpeakingSec?,
+  //     uncertainMarginPct? }
+  // Unspecified suppression knobs fall back to the operator's global
+  // hardware defaults. Re-clustering changes cluster identity, so the
+  // inferred names, per-line overrides, and extras speaker tags are
+  // RESET — the operator re-labels via the legend afterward. Returns
+  // 400 when the meeting has no saved fingerprints (diarization was off
+  // or it predates fingerprint capture).
+  router.post("/:id/recluster", express.json(), async (req, res) => {
+    const rec = await loadMeeting(dataDir, req.params.id);
+    if (!rec) return res.status(404).json({ error: "not found" });
+    const cfg = await getConfigSnapshot();
+    // Only finite numbers and non-blank numeric strings count as
+    // "specified". Bare Number() coercion maps null, "" and [] to 0
+    // (and true to 1), which would silently replace the configured
+    // default with 0 when a client sends an empty knob.
+    const numOr = (v, fallback) => {
+      const n = typeof v === "string" && v.trim() !== "" ? Number(v) : v;
+      return typeof n === "number" && Number.isFinite(n) ? n : fallback;
+    };
+    try {
+      const body = req.body ?? {};
+      const defaults = {
+        threshold: cfg.relay_hardware_voice_clustering_threshold ?? 70,
+        anchorMinSpeakingSec: cfg.relay_hardware_anchor_min_speaking_sec ?? 30,
+        smallClusterMaxSpeakingSec: cfg.relay_hardware_small_cluster_max_speaking_sec ?? 15,
+        uncertainMarginPct: cfg.relay_hardware_uncertain_margin_pct ?? 10,
+      };
+      const options = Object.fromEntries(
+        Object.entries(defaults).map(([key, dflt]) => [key, numOr(body[key], dflt)])
+      );
+      const result = reclusterMeetingRecord(rec, options);
+      await saveMeeting(dataDir, req.params.id, rec);
+      res.json({
+        ok: true,
+        speakers: result.speakers,
+        cluster_count: result.clusterCount,
+        threshold: result.threshold,
+      });
+    } catch (err) {
+      if (err?.code === "NO_FINGERPRINTS") {
+        return res.status(400).json({ error: err.message, code: "NO_FINGERPRINTS" });
+      }
+      if (err?.code === "BAD_REQUEST") {
+        return res.status(400).json({ error: err.message });
+      }
+      console.error(
+        `[internal-meetings] recluster failed for ${req.params.id}: ${err?.message || err}`
+      );
+      res.status(500).json({ error: "recluster failed" });
+    }
+  });
+
+  // POST /admin/internal-meetings/:id/repolish — re-run the Phase-2 summary
+  // polish using the meeting's CURRENT speaker names. After the operator
+  // corrects names in the legend (or merges/re-runs detection) the topic
+  // summaries still credit the old names; this rewrites each one against the
+  // corrected roster. It does NOT re-infer names (rec.speaker_names is used
+  // as-is) or touch transcripts, entries, or per-line overrides. Needs the
+  // operator's analyze hardware online (LLM pass, one call per window).
+  router.post("/:id/repolish", express.json(), async (req, res) => {
+    const rec = await loadMeeting(dataDir, req.params.id);
+    if (!rec) return res.status(404).json({ error: "not found" });
+    if (!rec.analysis || !Array.isArray(rec.analysis.sections) || rec.analysis.sections.length === 0) {
+      return res.status(400).json({ error: "this meeting has no analysis sections to re-polish" });
+    }
+    if (typeof rec.transcript !== "string" || !rec.transcript.trim()) {
+      return res.status(400).json({ error: "this meeting has no transcript to polish against" });
+    }
+    const namedCount = Object.values(rec.speaker_names || {}).filter(
+      (v) => typeof v === "string" && v.trim()
+    ).length;
+    if (namedCount === 0) {
+      return res.status(400).json({
+        error: "no named speakers yet — rename speakers in the legend first, then re-polish",
+      });
+    }
+    try {
+      const cfg = await getConfigSnapshot();
+      const hw = await resolveHardwareConfig(cfg);
+      if (!hw.analyze || !hw.analyze.url) {
+        return res.status(503).json({
+          error: "analyze hardware not available — Spark Control isn't reporting a ready analyze endpoint",
+        });
+      }
+      const analyzeBackend = createHardwareBackend({
+        parakeetBaseURL: hw.transcribe.url || "",
+        gemmaBaseURL: hw.analyze.url,
+        sparkControlBaseURL: hw.sparkBase || "",
+        parakeetModel: hw.transcribe.model || "",
+        gemmaModel: hw.analyze.model || "",
+        anMaxTokens: cfg.relay_hardware_an_max_tokens || 16000,
+      });
+      // NOTE: "||" treats a configured 0 as unset, so 0 falls back to the default.
+      const bodyMin = cfg.relay_hardware_analyze_window_minutes || 18;
+      const overlapMin = cfg.relay_hardware_analyze_overlap_minutes || 2;
+      const cutoffMin = cfg.relay_analyze_cutoff_minutes || 25;
+      const anConcurrency = cfg.relay_hardware_analyze_concurrency || 8;
+      const windows = planWindowsByDuration({
+        totalAudioSec: rec.audio_seconds || 0,
+        bodySeconds: bodyMin * 60,
+        overlapSeconds: overlapMin * 60,
+        cutoffSeconds: cutoffMin * 60,
+      });
+      const canonicalEntries = parseBracketedTranscript(rec.transcript);
+      const polished = await runSummaryPolish({
+        sections: rec.analysis.sections,
+        canonicalEntries,
+        windows,
+        transcriptSegments: rec.transcript_segments || [],
+        speakerNames: rec.speaker_names || {},
+        speakerStats: rec.speakers || {},
+        backend: analyzeBackend,
+        concurrency: anConcurrency,
+        pipelineBackend: "hardware",
+        jobId: "repolish-" + req.params.id,
+        batchId: null,
+        mediaUrl: null,
+        installId: "internal-meetings",
+        licenseFingerprint: null,
+        source: "internal-meetings",
+        // Cost details are stubbed to all-zero for this run.
+        computeCostDetails: () => ({
+          input_tokens: 0,
+          output_tokens: 0,
+          thinking_tokens: 0,
+          cost_usd: 0,
+        }),
+      });
+      const changed = applyPolishedSummaries(rec, polished);
+      rec.meta = rec.meta || {};
+      rec.meta.repolished_at = Date.now();
+      rec.meta.polish_done = true;
+      await saveMeeting(dataDir, req.params.id, rec);
+      res.json({ ok: true, polished_count: changed });
+    } catch (err) {
+      console.error(
+        `[internal-meetings] repolish failed for ${req.params.id}: ${err?.message || err}`
+      );
+      res.status(500).json({ error: "re-polish failed: " + (err?.message || "unknown error") });
+    }
+  });
+
+  // GET /admin/internal-meetings/:id/html — the meeting as one
+  // self-contained HTML file: the same Recaps-style layout the dashboard
+  // uses, with CSS inlined so it is a single shareable artifact.
+  router.get("/:id/html", async (req, res) => {
+    const rec = await loadMeeting(dataDir, req.params.id);
+    if (!rec) return res.status(404).send("not found");
+    const html = meetingToHtml(rec);
+    // Filename-safe title: runs of characters outside [a-zA-Z0-9-_.]
+    // become "-", and the result is capped at 80 characters.
+    const rawTitle = rec.title || "meeting";
+    const safeTitle = rawTitle.replace(/[^a-zA-Z0-9-_.]+/g, "-").slice(0, 80);
+    // Either way the payload is HTML. ?inline=1 → render in-place (useful
+    // for clicking a saved link and reading it without forcing a
+    // download); anything else → add the attachment disposition.
+    res.setHeader("Content-Type", "text/html; charset=utf-8");
+    if (req.query.inline !== "1") {
+      res.setHeader(
+        "Content-Disposition",
+        `attachment; filename="${safeTitle}.html"`
+      );
+    }
+    res.send(html);
+  });
+
+  // GET /admin/internal-meetings/:id/download — raw JSON download
+  router.get("/:id/download", async (req, res) => {
+    const rec = await loadMeeting(dataDir, req.params.id);
+    if (!rec) return res.status(404).send("not found");
+    // Filename-safe title: disallowed character runs → "-", max 80 chars.
+    const rawTitle = rec.title || "meeting";
+    const safeTitle = rawTitle.replace(/[^a-zA-Z0-9-_.]+/g, "-").slice(0, 80);
+    const disposition = `attachment; filename="${safeTitle}.json"`;
+    res.setHeader("Content-Type", "application/json; charset=utf-8");
+    res.setHeader("Content-Disposition", disposition);
+    // Pretty-printed with a 2-space indent so the file reads well as-is.
+    const payload = JSON.stringify(rec, null, 2);
+    res.send(payload);
+  });
+
+  // DELETE /admin/internal-meetings/:id — 404 when deleteMeeting is falsy
+  router.delete("/:id", async (req, res) => {
+    const removed = await deleteMeeting(dataDir, req.params.id);
+    if (removed) return res.json({ deleted: true });
+    res.status(404).json({ error: "not found" });
+  });
+
+  return router;
+}
diff --git a/server/speaker-clustering.js b/server/speaker-clustering.js
new file mode 100644
index 0000000..c2b5fb3
--- /dev/null
+++ b/server/speaker-clustering.js
@@ -0,0 +1,624 @@
+// Cross-chunk speaker reconciliation for Phase 1D of the diarization
+// pipeline. Spark Control's /api/audio/diarize-chunk hands back
+// per-chunk speaker labels ("Speaker_0", "Speaker_1") that are local
+// to one chunk — Sortformer has no memory across calls, so Speaker_0
+// in chunk 5 might or might not be the same person as Speaker_0 in
+// chunk 6. The per-speaker 192-dim TitaNet voice embedding it also
+// returns IS persistent though, so we cluster fingerprints across
+// chunks via cosine similarity to recover the global speaker identity.
+//
+// Algorithm: average-linkage agglomerative clustering. Start with N
+// singleton clusters (one per fingerprint), repeatedly merge the
+// closest pair until no pair is closer than the operator-configured
+// threshold. Average-linkage was the choice over single/complete
+// because it's robust to outlier embeddings (one bad embedding from
+// a noisy chunk doesn't anchor or repel an entire cluster).
+//
+// Complexity: O(N³) where N = total fingerprints across all chunks.
+// Typical: 2 speakers × 21 chunks = 42 → ~74k ops, sub-millisecond.
+// Worst case for a 4-hour all-talk-show video: 6 speakers × 48 chunks
+// = ~288 → ~24M ops, still milliseconds in Node.
+//
+// Threshold convention: configured as INTEGER percentage 50-95
+// representing cosine similarity. 70 (= 0.70 sim) is NeMo's
+// recommended default for TitaNet embeddings. Internally we work
+// in cosine DISTANCE (= 1 - similarity) for the merge condition.
+
+// ─── Cosine similarity ──────────────────────────────────────────────
+// dot(a, b) / (||a|| * ||b||) for two equal-length number arrays.
+// Yields 0 (never NaN) when either input is missing, the lengths
+// differ, or either vector has zero magnitude.
+export function cosineSimilarity(a, b) {
+  if (!(a && b && a.length === b.length)) return 0;
+  let dotProduct = 0;
+  let sqNormA = 0;
+  let sqNormB = 0;
+  for (let k = 0; k < a.length; k += 1) {
+    dotProduct += a[k] * b[k];
+    sqNormA += a[k] * a[k];
+    sqNormB += b[k] * b[k];
+  }
+  const magnitude = Math.sqrt(sqNormA) * Math.sqrt(sqNormB);
+  return sqNormA && sqNormB ? dotProduct / magnitude : 0;
+}
+
+// ─── Cluster ID naming ──────────────────────────────────────────────
+// Maps a 0-based index to Speaker_A … Speaker_Z, Speaker_AA, Speaker_AB…
+// (spreadsheet-column style). The capital-letter suffix is deliberately
+// unlike the chunk-local "Speaker_0" / "Speaker_1" names Sortformer
+// uses, so the source of a label is obvious at a glance.
+function globalSpeakerLabel(index) {
+  const letters = [];
+  let remaining = index;
+  do {
+    letters.unshift(String.fromCharCode(65 + (remaining % 26)));
+    remaining = Math.floor(remaining / 26) - 1;
+  } while (remaining >= 0);
+  return `Speaker_${letters.join("")}`;
+}
+
+// ─── Agglomerative clustering (average linkage) ─────────────────────
+// Input: array of { key, vector, firstOrder } items. `key` is opaque to
+// the algorithm — it is only propagated into the returned cluster's
+// `members` list for the caller to map back to (chunkIdx, localLabel).
+// Pairs keep merging while their distance is <= distanceThreshold.
+//
+// Output: array of { members: [keys], vectors: [vecs], firstOrder },
+// sorted by the smallest firstOrder among each cluster's members —
+// keeps "Speaker_A" assigned to whoever spoke first across the audio.
+function agglomerativeCluster(items, distanceThreshold) {
+  if (items.length === 0) return [];
+  const clusters = items.map((it) => ({
+    members: [it.key],
+    vectors: [it.vector],
+    firstOrder: it.firstOrder, // preserve original input order for stable sort later
+  }));
+  // Nothing is cached: every pass recomputes the average-linkage
+  // distance for each remaining pair from the clusters' raw vectors,
+  // then merges the single closest pair (or stops at the threshold).
+  while (clusters.length > 1) {
+    let best = { dist: Infinity, i: -1, j: -1 };
+    for (let i = 0; i < clusters.length; i++) {
+      for (let j = i + 1; j < clusters.length; j++) {
+        const d = avgLinkageDistance(clusters[i], clusters[j]);
+        if (d < best.dist) {
+          best = { dist: d, i, j };
+        }
+      }
+    }
+    if (best.dist > distanceThreshold) break;
+    // Merge clusters[j] into clusters[i], remove clusters[j]
+    clusters[best.i].members.push(...clusters[best.j].members);
+    clusters[best.i].vectors.push(...clusters[best.j].vectors);
+    // Keep the earliest firstOrder so the merged cluster sorts to
+    // the position of its earliest-appearing member.
+    if (clusters[best.j].firstOrder < clusters[best.i].firstOrder) {
+      clusters[best.i].firstOrder = clusters[best.j].firstOrder;
+    }
+    clusters.splice(best.j, 1);
+  }
+  // Sort by first-appearance order so Speaker_A = whoever spoke first.
+  clusters.sort((a, b) => a.firstOrder - b.firstOrder);
+  return clusters;
+}
+
+// Mean cosine distance (1 - similarity) across every cross-cluster
+// vector pair; Infinity when either cluster contributes no vectors.
+function avgLinkageDistance(c1, c2) {
+  const pairCount = c1.vectors.length * c2.vectors.length;
+  if (!(pairCount > 0)) return Infinity;
+  let total = 0;
+  for (const u of c1.vectors) {
+    for (const w of c2.vectors) total += 1 - cosineSimilarity(u, w);
+  }
+  return total / pairCount;
+}
+
+// ─── Public: cluster per-chunk diarization → global speaker map ─────
+//
+// Input shape (one entry per chunk; failed/skipped chunks are
+// silently filtered):
+//   {
+//     ok: true, chunkIndex: 5, startSeconds: 1080,
+//     chunkOverlapBoundarySec: <number>,  // optional; segments starting
+//                                         // before it are left out of stats
+//     segments: [{ start, end, speaker_local, confidence }],
+//     speakers_local: ["Speaker_0", "Speaker_1"],
+//     fingerprints: { "Speaker_0": [192 floats], "Speaker_1": [192 floats] }
+//   }
+//
+// Returns:
+//   {
+//     globalMap: Map<"chunkIdx:localLabel", "Speaker_A">,
+//     uncertaintyMap: Map<"chunkIdx:localLabel", true>,  // reassigned keys
+//     speakers: {
+//       Speaker_A: { turns, total_speaking_seconds, mean_confidence,
+//                    chunks_appeared_in, fingerprint_count },
+//       ...
+//     },
+//     clusterCount: 2, thresholdSimilarity: 0.70
+//   }
+//
+// With no usable fingerprints (diarization off or all chunks failed)
+// the result is empty: { globalMap: empty, speakers: {}, ... }.
+// Post-cluster suppression tunables. After the initial agglomerative
+// cluster pass, walk the resulting clusters and re-categorize the
+// small ones to fix the "14 speakers detected when really only 2"
+// case Grant flagged on a 2h53m podcast. The clustering algorithm
+// itself stays strict (no false-positive merges); suppression is a
+// second pass that operates on cluster size + cross-cluster
+// similarity to catch the noise-induced spurious clusters.
+//
+//   anchor_min_speaking_sec — a cluster needs at least this much
+//   total speaking time to be considered an "anchor" (= a real
+//   speaker). Anchors keep their own global ID + colored chip.
+//
+//   small_cluster_max_speaking_sec — clusters with LESS than this
+//   are suppression candidates. Brief utterances are common false
+//   positives (background noise, crosstalk fragments, brief
+//   intros).
+//
+//   uncertain_margin_pct — a small cluster whose best similarity
+//   to any anchor is within this many percentage points of the
+//   main threshold gets REASSIGNED to that anchor and marked
+//   uncertain (chip shows "?"). Far-from-anchor small clusters
+//   become Speaker_Unknown.
+//
+// All three are operator-editable via Settings → Operator hardware.
+// Defaults are conservative — no false-positive merges into
+// anchors, just reassignment of small clusters that are PROBABLY
+// the anchor in noisy conditions. A real 30+ second second speaker
+// still gets their own chip; only brief flecks of similar voice get
+// pulled in.
+const DEFAULT_ANCHOR_MIN_SPEAKING_SEC = 30;
+const DEFAULT_SMALL_CLUSTER_MAX_SPEAKING_SEC = 15;
+const DEFAULT_UNCERTAIN_MARGIN_PCT = 10;
+
+// Mean cosine similarity between two clusters' vector sets: the
+// complement of avgLinkageDistance, so higher means more alike.
+function avgLinkageSimilarity(c1, c2) {
+  const distance = avgLinkageDistance(c1, c2);
+  return 1 - distance;
+}
+
+// Clamp an option value to an integer in [lo, hi]. Returns `fallback`
+// (unclamped) when the value is absent — undefined, null, or a blank
+// string, which Number() would coerce to 0 — or is not finite.
+function clampInt(v, fallback, lo, hi) {
+  if (v == null || (typeof v === "string" && v.trim() === "")) return fallback;
+  const n = Number(v);
+  if (!Number.isFinite(n)) return fallback;
+  const i = Math.round(n);
+  if (i < lo) return lo;
+  return i > hi ? hi : i;
+}
+
+export function clusterSpeakers(
+  chunkDiarization,
+  clusterThresholdPct = 70,
+  options = {}
+) {
+  // Cluster fingerprints into global speakers, then suppress small clusters.
+  // Use Number.isFinite-guarded fallback rather than the `|| 70`
+  // idiom — the latter substitutes 70 for ANY falsy value including
+  // 0 (a valid input we want to clamp to 50, not silently bump up).
+  const raw = Number(clusterThresholdPct);
+  const pct = Math.max(50, Math.min(95, Number.isFinite(raw) ? raw : 70));
+  const similarityThreshold = pct / 100;
+  const distanceThreshold = 1 - similarityThreshold;
+
+  // Operator-tunable suppression thresholds from `options`, with finite-
+  // guarded fallbacks to the conservative defaults. Clamped to the ranges
+  // admin.js SETTINGS_RANGES enforces on save, so a hand-edited
+  // relay-config.json with an out-of-range value still behaves sanely.
+  const anchorMinSec = clampInt(
+    options.anchorMinSpeakingSec,
+    DEFAULT_ANCHOR_MIN_SPEAKING_SEC,
+    5,
+    120
+  );
+  const smallMaxSec = clampInt(
+    options.smallClusterMaxSpeakingSec,
+    DEFAULT_SMALL_CLUSTER_MAX_SPEAKING_SEC,
+    1,
+    60
+  );
+  const uncertainMarginPct = clampInt(
+    options.uncertainMarginPct,
+    DEFAULT_UNCERTAIN_MARGIN_PCT,
+    0,
+    30
+  );
+  const uncertainSimThreshold = Math.max(
+    0,
+    similarityThreshold - uncertainMarginPct / 100
+  );
+
+  // Flatten fingerprints into the clustering input. Preserve insertion
+  // order so the first-appearance speaker gets Speaker_A.
+  const items = [];
+  let order = 0;
+  for (const d of chunkDiarization || []) {
+    if (!d || !d.ok || !d.fingerprints) continue;
+    for (const [localLabel, vector] of Object.entries(d.fingerprints)) {
+      if (!Array.isArray(vector) || vector.length === 0) continue;
+      items.push({
+        key: `${d.chunkIndex}:${localLabel}`,
+        vector,
+        firstOrder: order++,
+      });
+    }
+  }
+
+  if (items.length === 0) {
+    return {
+      globalMap: new Map(),
+      uncertaintyMap: new Map(),
+      speakers: {},
+      clusterCount: 0,
+      thresholdSimilarity: similarityThreshold,
+    };
+  }
+
+  const clusters = agglomerativeCluster(items, distanceThreshold);
+
+  // ─── First pass: compute speaking time per cluster ───────────────
+  // We need cluster sizes BEFORE building the global map so the
+  // suppression pass can identify anchors. Walk all diar segments, map
+  // each (chunkIdx, speaker_local) to its cluster index, and sum seg
+  // durations. NOTE: unlike the stats pass, no chunk-overlap dedup here.
+  const clusterIdxByMember = new Map();
+  for (let i = 0; i < clusters.length; i++) {
+    for (const memberKey of clusters[i].members) {
+      clusterIdxByMember.set(memberKey, i);
+    }
+  }
+  const totalSecsByCluster = new Array(clusters.length).fill(0);
+  for (const d of chunkDiarization || []) {
+    if (!d || !d.ok || !Array.isArray(d.segments)) continue;
+    for (const seg of d.segments) {
+      const key = `${d.chunkIndex}:${seg.speaker_local}`;
+      const ci = clusterIdxByMember.get(key);
+      if (ci === undefined) continue;
+      const dur = Math.max(0, (seg.end || 0) - (seg.start || 0));
+      totalSecsByCluster[ci] += dur;
+    }
+  }
+
+  // ─── Second pass: identify anchors + plan suppression ────────────
+  const isAnchorIdx = new Array(clusters.length).fill(false);
+  const anchorIdxs = [];
+  for (let i = 0; i < clusters.length; i++) {
+    if (totalSecsByCluster[i] >= anchorMinSec) {
+      isAnchorIdx[i] = true;
+      anchorIdxs.push(i);
+    }
+  }
+
+  // reassignTo: cluster idx → anchor cluster idx that absorbs it (its
+  // members get flagged uncertain). unknownClusters: cluster idxs
+  // whose members map to Speaker_Unknown. Non-anchor clusters in
+  // neither collection stay as their own speaker (large + low-sim —
+  // plausibly a real third+ speaker even if rare).
+  const reassignTo = new Map();
+  const unknownClusters = new Set();
+  if (anchorIdxs.length >= 1) {
+    for (let i = 0; i < clusters.length; i++) {
+      if (isAnchorIdx[i]) continue;
+      // Find best anchor by average cosine similarity
+      let bestAnchorIdx = -1;
+      let bestSim = -Infinity;
+      for (const ai of anchorIdxs) {
+        const sim = avgLinkageSimilarity(clusters[i], clusters[ai]);
+        if (sim > bestSim) {
+          bestSim = sim;
+          bestAnchorIdx = ai;
+        }
+      }
+      const totalSecs = totalSecsByCluster[i];
+      if (bestAnchorIdx >= 0 && bestSim >= uncertainSimThreshold) {
+        // Close-to-anchor (within uncertain_margin_pct of main
+        // threshold) → reassign to anchor with uncertainty. Applies
+        // to ANY non-anchor cluster; size is not checked here. Chip
+        // shows e.g. "MH?" so the user knows it is a best guess.
+        reassignTo.set(i, bestAnchorIdx);
+      } else if (totalSecs < smallMaxSec) {
+        // Small + far-from-anchor → Unknown. Brief noise / crosstalk /
+        // background voices that don't confidently match either main
+        // speaker. Merged into a single Speaker_Unknown pseudo-
+        // speaker so the legend doesn't fill with N "unidentified
+        // brief speaker" entries.
+        unknownClusters.add(i);
+      }
+      // else: large (>= smallMaxSec) + far-from-anchor → keep as own
+      // speaker. Plausibly a real third+ person who's distinct from
+      // the main anchors. Rare but possible.
+    }
+  }
+
+  // ─── Build the final cluster-label ordering ──────────────────────
+  // Order by first-appearance: whoever spoke first in the audio
+  // gets Speaker_A. Anchors + kept-as-own clusters get labels;
+  // reassigned + unknown clusters don't.
+  const ordered = [];
+  for (let i = 0; i < clusters.length; i++) {
+    if (reassignTo.has(i) || unknownClusters.has(i)) continue;
+    ordered.push({ idx: i, firstOrder: clusters[i].firstOrder });
+  }
+  ordered.sort((a, b) => a.firstOrder - b.firstOrder);
+  const labelByOrigIdx = new Map();
+  for (let j = 0; j < ordered.length; j++) {
+    labelByOrigIdx.set(ordered[j].idx, globalSpeakerLabel(j));
+  }
+  // Reassigned clusters inherit their anchor's label
+  for (const [i, ai] of reassignTo) {
+    const anchorLabel = labelByOrigIdx.get(ai);
+    if (anchorLabel) labelByOrigIdx.set(i, anchorLabel);
+  }
+
+  // ─── Build globalMap + uncertaintyMap ────────────────────────────
+  const globalMap = new Map();
+  const uncertaintyMap = new Map();
+  let hasUnknown = false;
+  for (let i = 0; i < clusters.length; i++) {
+    if (unknownClusters.has(i)) {
+      for (const memberKey of clusters[i].members) {
+        globalMap.set(memberKey, "Speaker_Unknown");
+        hasUnknown = true;
+      }
+      continue;
+    }
+    const label = labelByOrigIdx.get(i);
+    if (!label) continue;
+    const isReassigned = reassignTo.has(i);
+    for (const memberKey of clusters[i].members) {
+      globalMap.set(memberKey, label);
+      if (isReassigned) uncertaintyMap.set(memberKey, true);
+    }
+  }
+
+  // ─── Build the per-speaker summary ───────────────────────────────
+  const speakers = {};
+  const seenLabels = new Set([...labelByOrigIdx.values()]);
+  for (const label of seenLabels) {
+    speakers[label] = {
+      turns: 0,
+      total_speaking_seconds: 0,
+      mean_confidence: null,
+      chunks_appeared_in: 0,
+      fingerprint_count: 0,
+    };
+  }
+  if (hasUnknown) {
+    speakers["Speaker_Unknown"] = {
+      turns: 0,
+      total_speaking_seconds: 0,
+      mean_confidence: null,
+      chunks_appeared_in: 0,
+      fingerprint_count: 0,
+    };
+  }
+  // Accumulate fingerprint counts from clusters that contributed to
+  // each label. Reassigned clusters' fingerprints count toward
+  // their anchor's total.
+  for (let i = 0; i < clusters.length; i++) {
+    let targetLabel;
+    if (unknownClusters.has(i)) targetLabel = "Speaker_Unknown";
+    else targetLabel = labelByOrigIdx.get(i);
+    if (!targetLabel || !speakers[targetLabel]) continue;
+    speakers[targetLabel].fingerprint_count += clusters[i].members.length;
+  }
+
+  // Accumulate turns / speaking time / confidence by walking
+  // diarization segments through the globalMap.
+  //
+  // Two earlier bugs fixed here:
+  //
+  // 1. UNFINGERPRINTED SEGMENTS WERE SILENTLY DROPPED. The cluster-
+  //    index lookup only contains entries that have fingerprints —
+  //    but Sortformer routinely emits diar segments for speakers
+  //    whose voice TitaNet didn't aggregate a fingerprint for (very
+  //    brief utterances, soft speech, overlapped speech). Those
+  //    segments produced globalId === undefined and were dropped,
+  //    so the "total speech detected" totals understated reality
+  //    dramatically. A 1.5-hour call could show as "34% speech
+  //    detected" when in reality 70%+ of the audio was speech that
+  //    Sortformer found but TitaNet couldn't fingerprint. Now: an
+  //    unmapped segment falls through to Speaker_Unknown so the
+  //    time still gets accounted for. (The chip on the per-line
+  //    transcript still shows "?" for those segments — they just
+  //    aren't claimed by a wrong cluster.)
+  //
+  // 2. CHUNK-OVERLAP DOUBLE-COUNTING. Transcribe segments are
+  //    deduped at the chunk overlap boundary (handled in
+  //    hardware.js), but diar segments are not. Until this fix the
+  //    same speech in a 30s overlap zone got counted toward TWO
+  //    chunks, inflating speaker totals. Dedup here using the
+  //    chunk's overlapBoundarySec when present.
+  const confidenceSum = new Map();
+  const confidenceCount = new Map();
+  const chunksByLabel = new Map();
+
+  // Ensure Speaker_Unknown exists in speakers map before we attribute
+  // any unmapped time to it — the summary setup above may have created
+  // it already (via the unknownClusters path) or not (when no clusters
+  // were suppressed). Either way, we want it as a destination bucket.
+  if (!speakers["Speaker_Unknown"]) {
+    speakers["Speaker_Unknown"] = {
+      turns: 0,
+      total_speaking_seconds: 0,
+      mean_confidence: null,
+      chunks_appeared_in: 0,
+      fingerprint_count: 0,
+    };
+    hasUnknown = true;
+  }
+
+  for (const d of chunkDiarization || []) {
+    if (!d || !d.ok || !Array.isArray(d.segments)) continue;
+    // Chunk-overlap dedup: skip any segment whose GLOBAL start time
+    // sits in the prior chunk's tail (which this chunk overlapped).
+    // chunkOverlapBoundary is the global timestamp BEFORE which
+    // segments in this chunk are duplicates of the prior chunk's
+    // tail. Comes from the chunk planner (audio-meta.js) and is
+    // 0 for chunk 0 (no prior chunk → no dedup).
+    const chunkOverlapBoundary =
+      typeof d.chunkOverlapBoundarySec === "number"
+        ? d.chunkOverlapBoundarySec
+        : 0;
+    const labelsInThisChunk = new Set();
+    for (const seg of d.segments) {
+      if ((seg.start || 0) < chunkOverlapBoundary) continue;
+      let globalId = globalMap.get(`${d.chunkIndex}:${seg.speaker_local}`);
+      // Unmapped (no fingerprint produced for this speaker_local in
+      // this chunk) → bucket into Speaker_Unknown rather than drop.
+      if (!globalId || !speakers[globalId]) {
+        globalId = "Speaker_Unknown";
+      }
+      speakers[globalId].turns += 1;
+      const segDuration = Math.max(0, (seg.end || 0) - (seg.start || 0));
+      speakers[globalId].total_speaking_seconds += segDuration;
+      if (typeof seg.confidence === "number" && Number.isFinite(seg.confidence)) {
+        confidenceSum.set(globalId, (confidenceSum.get(globalId) || 0) + seg.confidence);
+        confidenceCount.set(globalId, (confidenceCount.get(globalId) || 0) + 1);
+      }
+      labelsInThisChunk.add(globalId);
+    }
+    for (const label of labelsInThisChunk) {
+      if (!chunksByLabel.has(label)) chunksByLabel.set(label, new Set());
+      chunksByLabel.get(label).add(d.chunkIndex);
+    }
+  }
+
+  // If Speaker_Unknown ended up with zero turns (no unmapped + no
+  // suppressed clusters contributed), drop it from the legend so we
+  // don't show "? Unknown 0:00" by default.
+  if (speakers["Speaker_Unknown"] && speakers["Speaker_Unknown"].turns === 0) {
+    delete speakers["Speaker_Unknown"];
+    hasUnknown = false;
+  }
+  for (const label of Object.keys(speakers)) {
+    if (confidenceCount.get(label)) {
+      speakers[label].mean_confidence =
+        confidenceSum.get(label) / confidenceCount.get(label);
+    }
+    speakers[label].chunks_appeared_in = (chunksByLabel.get(label) || new Set()).size;
+    speakers[label].total_speaking_seconds =
+      Math.round(speakers[label].total_speaking_seconds * 10) / 10;
+  }
+
+  // Logging: surface the suppression summary so operators can see
+  // what happened ("14 clusters → 2 anchors + 12 small/uncertain
+  // suppressed").
+  const reassignedCount = reassignTo.size;
+  const unknownClusterCount = unknownClusters.size;
+  const finalCount =
+    Object.keys(speakers).length - (hasUnknown ? 1 : 0);
+  console.log(
+    `[clustering] ${clusters.length} raw clusters → ${finalCount} primary + ` +
+      `${reassignedCount} reassigned (uncertain) + ${unknownClusterCount} unknown ` +
+      `(anchors >= ${anchorMinSec}s, uncertain margin ${uncertainMarginPct}%, ` +
+      `unknown < ${smallMaxSec}s)`
+  );
+
+  return {
+    globalMap,
+    uncertaintyMap,
+    speakers,
+    clusterCount: clusters.length,
+    thresholdSimilarity: similarityThreshold,
+  };
+}
+
+// ─── Public: stamp global speaker labels onto transcript segments ───
+//
+// For each merged transcript segment, sets `speaker` (global ID, e.g.
+// "Speaker_A"), `speaker_confidence` and `speaker_uncertain` from the
+// diarization segment containing its midpoint (largest overlap wins,
+// and a zero-length line still matches the segment that contains it).
+// With no containing segment, falls back to the diar segment with the
+// nearest midpoint within 5 seconds — beyond that the speaker is left
+// null so the frontend can render "(speaker unknown)" or drop the label.
+//
+// Mutates the segments in-place (and also returns the array) so
+// callers don't have to remember which they got.
+export function assignSpeakersToSegments(segments, chunkDiarization, globalMap, uncertaintyMap = null) {
+  if (!Array.isArray(segments) || segments.length === 0) return segments;
+  if (!globalMap || globalMap.size === 0) {
+    // Diarization didn't run / produced nothing — leave segments
+    // alone. Caller can detect this state via speakers === {}.
+    return segments;
+  }
+  // Flatten all per-chunk diar segments into one timeline annotated
+  // with the global speaker label + the suppression-uncertainty
+  // flag (set when a small cluster was reassigned to an anchor —
+  // chip will show "?" so the user knows attribution is best-guess).
+  const flatDiar = [];
+  for (const d of chunkDiarization || []) {
+    if (!d || !d.ok || !Array.isArray(d.segments)) continue;
+    for (const seg of d.segments) {
+      const memberKey = `${d.chunkIndex}:${seg.speaker_local}`;
+      const globalId = globalMap.get(memberKey);
+      if (!globalId) continue;
+      const uncertain = uncertaintyMap ? !!uncertaintyMap.get(memberKey) : false;
+      flatDiar.push({
+        start: seg.start || 0,
+        end: seg.end || 0,
+        speaker: globalId,
+        confidence: typeof seg.confidence === "number" ? seg.confidence : null,
+        uncertain,
+      });
+    }
+  }
+  flatDiar.sort((a, b) => a.start - b.start);
+
+  const NEAREST_FALLBACK_WINDOW_SEC = 5;
+
+  for (const e of segments) {
+    const mid = ((e.start || 0) + (e.end || 0)) / 2;
+    // Find segments that contain the midpoint
+    let containing = null;
+    let containingMostOverlap = -Infinity;
+    for (const d of flatDiar) {
+      if (d.start <= mid && mid <= d.end) {
+        // Prefer the largest overlap when several diar segments contain
+        // the midpoint (chunk overlap zones, choppy turns). The score
+        // starts at -Infinity so a zero-length line can still match.
+        const overlap =
+          Math.min(d.end, e.end || 0) - Math.max(d.start, e.start || 0);
+        if (overlap > containingMostOverlap) {
+          containing = d;
+          containingMostOverlap = overlap;
+        }
+      }
+    }
+    if (containing) {
+      e.speaker = containing.speaker;
+      e.speaker_confidence = containing.confidence;
+      e.speaker_uncertain = !!containing.uncertain;
+      continue;
+    }
+    // Fall back to nearest by midpoint distance (within window)
+    let nearest = null;
+    let nearestDist = Infinity;
+    for (const d of flatDiar) {
+      const dMid = (d.start + d.end) / 2;
+      const dist = Math.abs(dMid - mid);
+      if (dist < nearestDist) {
+        nearestDist = dist;
+        nearest = d;
+      }
+    }
+    if (nearest && nearestDist <= NEAREST_FALLBACK_WINDOW_SEC) {
+      e.speaker = nearest.speaker;
+      e.speaker_confidence = nearest.confidence;
+      e.speaker_uncertain = !!nearest.uncertain;
+    } else {
+      e.speaker = null;
+      e.speaker_confidence = null;
+      e.speaker_uncertain = false;
+    }
+  }
+
+  return segments;
+}
diff --git a/server/test/meeting-speaker-edits.test.js b/server/test/meeting-speaker-edits.test.js
new file mode 100644
index 0000000..6dce7b5
--- /dev/null
+++ b/server/test/meeting-speaker-edits.test.js
@@ -0,0 +1,269 @@
+// Unit tests for post-hoc speaker edits (merge + re-cluster) on saved
+// internal-meeting records.
+// Run via: node --test server/test/meeting-speaker-edits.test.js
+
+import { test } from "node:test";
+import assert from "node:assert/strict";
+import {
+  mergeSpeakersInRecord,
+  reclusterMeetingRecord,
+  backfillEntrySpeakers,
+  applyPolishedSummaries,
+} from "../meeting-speaker-edits.js";
+
+// Distinct synthetic 3-dim voice fingerprints (mirror speaker-clustering.test.js).
+const FP_A = (j = 0) => [1.0 + j * 0.01, 0.05 * j, 0]; // dominated by component 0; j adds small jitter
+const FP_B = (j = 0) => [0.05 * j, 1.0 + j * 0.01, 0]; // dominated by component 1; j adds small jitter
+
+// A 3-speaker record with labels spread across all four sync points; each call returns a fresh object.
+function makeMergeRecord() {
+  return {
+    id: "m1",
+    transcript_segments: [
+      { start: 0, end: 9, text: "a", speaker: "Speaker_A" },
+      { start: 10, end: 19, text: "b", speaker: "Speaker_B" },
+      { start: 20, end: 29, text: "c", speaker: "Speaker_C" },
+      { start: 30, end: 39, text: "c2", speaker: "Speaker_C" },
+    ],
+    chunks: [
+      {
+        title: "t",
+        summary: "s",
+        startTime: 0,
+        entries: [
+          { offset: 0, text: "a", speaker: "Speaker_A" },
+          { offset: 10, text: "b", speaker: "Speaker_B" },
+          { offset: 20, text: "c", speaker: "Speaker_C", speaker_override: "Speaker_C" },
+          { offset: 30, text: "c2", speaker: "Speaker_A", speaker_override: "Speaker_C" }, // speaker and override disagree
+        ],
+      },
+    ],
+    speakers: {
+      Speaker_A: { turns: 4, total_speaking_seconds: 40, mean_confidence: 0.8, chunks_appeared_in: 2, fingerprint_count: 2 },
+      Speaker_B: { turns: 2, total_speaking_seconds: 20, mean_confidence: 0.9, chunks_appeared_in: 1, fingerprint_count: 1 },
+      Speaker_C: { turns: 6, total_speaking_seconds: 18, mean_confidence: 0.6, chunks_appeared_in: 3, fingerprint_count: 3 },
+    },
+    speaker_names: { Speaker_A: "Matt", Speaker_B: "John" }, // Speaker_C has no name
+    extras: {
+      tldr: { summary: "x", primary_speakers: ["Speaker_A", "Speaker_C"] },
+      decisions: [{ statement: "d", agreed_by: ["Speaker_C", "Speaker_A"], supporting_offset: 5 }],
+      action_items: [{ description: "do", owner: "Speaker_C", supporting_offset: 6 }],
+      key_quotes: [{ speaker: "Speaker_C", offset: 7, quote: "q" }],
+    },
+    meta: {},
+  };
+}
+
+test("merge: collapses absorbed speaker across all four label locations", () => {
+  const rec = makeMergeRecord();
+  const out = mergeSpeakersInRecord(rec, "Speaker_A", ["Speaker_C"]); // survivor Speaker_A absorbs Speaker_C
+
+  // transcript_segments: both Speaker_C lines now read Speaker_A (rec is checked after the call, so it is mutated in place)
+  assert.deepEqual(
+    rec.transcript_segments.map((s) => s.speaker),
+    ["Speaker_A", "Speaker_B", "Speaker_A", "Speaker_A"]
+  );
+  // entries + per-line overrides
+  assert.deepEqual(
+    rec.chunks[0].entries.map((e) => e.speaker),
+    ["Speaker_A", "Speaker_B", "Speaker_A", "Speaker_A"]
+  );
+  assert.equal(rec.chunks[0].entries[2].speaker_override, "Speaker_A");
+  assert.equal(rec.chunks[0].entries[3].speaker_override, "Speaker_A");
+
+  // stats merged, Speaker_C gone
+  assert.ok(!("Speaker_C" in rec.speakers));
+  assert.equal(rec.speakers.Speaker_A.turns, 10); // 4 + 6
+  assert.equal(rec.speakers.Speaker_A.total_speaking_seconds, 58); // 40 + 18
+  assert.equal(rec.speakers.Speaker_A.fingerprint_count, 5); // 2 + 3
+  // turn-weighted mean confidence: (0.8*4 + 0.6*6) / 10 = 0.68
+  assert.ok(Math.abs(rec.speakers.Speaker_A.mean_confidence - 0.68) < 1e-9);
+
+  // names: survivor keeps its own, absorbed dropped
+  assert.equal(rec.speaker_names.Speaker_A, "Matt");
+  assert.ok(!("Speaker_C" in rec.speaker_names));
+
+  // extras remapped + deduped (fixture lists both Speaker_A and Speaker_C, which collapse to one entry)
+  assert.deepEqual(rec.extras.tldr.primary_speakers, ["Speaker_A"]);
+  assert.deepEqual(rec.extras.decisions[0].agreed_by, ["Speaker_A"]);
+  assert.equal(rec.extras.action_items[0].owner, "Speaker_A");
+  assert.equal(rec.extras.key_quotes[0].speaker, "Speaker_A");
+
+  assert.ok(rec.meta.speakers_merged_at > 0);
+  assert.equal(out.changed > 0, true);
+});
+
+test("merge: survivor with no name inherits the absorbed name", () => {
+  const rec = makeMergeRecord();
+  // Fixture names Speaker_B but not Speaker_C: drop the name on B and give C one, so survivor B has a name to inherit.
+  delete rec.speaker_names.Speaker_B;
+  rec.speaker_names.Speaker_C = "Carol";
+  mergeSpeakersInRecord(rec, "Speaker_B", ["Speaker_C"]);
+  assert.equal(rec.speaker_names.Speaker_B, "Carol");
+  assert.ok(!("Speaker_C" in rec.speaker_names));
+});
+
+test("merge: rejects invalid input", () => {
+  const rec = makeMergeRecord();
+  assert.throws(() => mergeSpeakersInRecord(rec, "Speaker_Z", ["Speaker_A"]), /survivor/); // survivor label not in the record
+  assert.throws(() => mergeSpeakersInRecord(rec, "Speaker_A", ["Speaker_A"]), /itself/); // survivor also listed as absorbed
+  assert.throws(() => mergeSpeakersInRecord(rec, "Speaker_A", ["Speaker_Z"]), /unknown/); // absorbed label not in the record
+  assert.throws(() => mergeSpeakersInRecord(rec, "Speaker_A", []), /at least one/); // empty absorb list
+});
+
+// A record carrying per-chunk fingerprints so re-clustering can run
+// fully offline. Two distinct voices (FP_A first, FP_B second) →
+// Speaker_A / Speaker_B by first-appearance order. Every existing label is "STALE".
+function makeReclusterRecord() {
+  return {
+    id: "r1",
+    transcript_segments: [
+      { start: 0, end: 9, text: "a", speaker: "STALE" },
+      { start: 10, end: 19, text: "b", speaker: "STALE" },
+      { start: 20, end: 29, text: "c", speaker: "STALE" },
+    ],
+    chunks: [
+      {
+        title: "t",
+        summary: "s",
+        startTime: 0,
+        entries: [
+          { offset: 0, text: "a", speaker: "STALE", speaker_override: "STALE" },
+          { offset: 10, text: "b", speaker: "STALE" },
+          { offset: 20, text: "c", speaker: "STALE" },
+        ],
+      },
+    ],
+    speakers: { STALE: { turns: 3, total_speaking_seconds: 30, mean_confidence: 0.5, chunks_appeared_in: 2, fingerprint_count: 3 } },
+    speaker_names: { STALE: "Wrong" },
+    extras: {
+      tldr: { summary: "x", primary_speakers: ["STALE"] },
+      decisions: [{ statement: "d", agreed_by: ["STALE"], supporting_offset: 5 }],
+      action_items: [{ description: "do", owner: "STALE", supporting_offset: 6 }],
+      key_quotes: [{ speaker: "STALE", offset: 7, quote: "q" }],
+    },
+    diarization: [
+      {
+        ok: true,
+        chunkIndex: 0,
+        segments: [
+          { start: 0, end: 10, speaker_local: "Speaker_0", confidence: 0.9 },
+          { start: 10, end: 20, speaker_local: "Speaker_1", confidence: 0.9 },
+        ],
+        fingerprints: { Speaker_0: FP_A(1), Speaker_1: FP_B(1) },
+      },
+      {
+        ok: true,
+        chunkIndex: 1,
+        segments: [{ start: 20, end: 30, speaker_local: "Speaker_0", confidence: 0.8 }],
+        fingerprints: { Speaker_0: FP_A(2) }, // FP_A again: same voice as Speaker_0 in chunk 0
+      },
+    ],
+    meta: { polish_done: true }, // the recluster test expects this to be reset to false
+  };
+}
+
+test("recluster: re-stamps segments + entries and resets stale data", () => {
+  const rec = makeReclusterRecord();
+  const out = reclusterMeetingRecord(rec, { threshold: 70 });
+
+  // Two distinct voices recovered (any "Speaker_Unknown" bucket is not counted).
+  assert.equal(out.speakers ? Object.keys(out.speakers).filter((k) => k !== "Speaker_Unknown").length : 0, 2);
+
+  // Segments re-stamped: FP_A group = Speaker_A (first), FP_B = Speaker_B.
+  assert.deepEqual(
+    rec.transcript_segments.map((s) => s.speaker),
+    ["Speaker_A", "Speaker_B", "Speaker_A"]
+  );
+  // Entries re-derived to match.
+  assert.deepEqual(
+    rec.chunks[0].entries.map((e) => e.speaker),
+    ["Speaker_A", "Speaker_B", "Speaker_A"]
+  );
+  // Per-line override cleared (the key is removed, not just set to null).
+  assert.ok(!("speaker_override" in rec.chunks[0].entries[0]));
+
+  // Stale attribution data reset.
+  assert.deepEqual(rec.speaker_names, {});
+  assert.deepEqual(rec.extras.tldr.primary_speakers, []);
+  assert.deepEqual(rec.extras.decisions[0].agreed_by, []);
+  assert.equal(rec.extras.action_items[0].owner, null);
+  assert.equal(rec.extras.key_quotes[0].speaker, null);
+  // Decision text preserved.
+  assert.equal(rec.extras.decisions[0].statement, "d");
+
+  assert.ok(rec.meta.reclustered_at > 0);
+  assert.equal(rec.meta.recluster_threshold, 70); // echoes the threshold passed in above
+  assert.equal(rec.meta.polish_done, false); // fixture started with polish_done: true
+});
+
+test("recluster: throws NO_FINGERPRINTS when none are saved", () => {
+  const rec = makeReclusterRecord();
+  rec.diarization = null; // case 1: no diarization data at all
+  assert.throws(() => reclusterMeetingRecord(rec, { threshold: 70 }), (e) => e.code === "NO_FINGERPRINTS");
+
+  const rec2 = makeReclusterRecord();
+  rec2.diarization = [{ ok: true, chunkIndex: 0, segments: [], fingerprints: {} }]; // case 2: chunk present, fingerprints empty
+  assert.throws(() => reclusterMeetingRecord(rec2, { threshold: 70 }), (e) => e.code === "NO_FINGERPRINTS");
+});
+
+test("applyPolishedSummaries: writes summaries to analysis + chunks, leaves entries", () => {
+  const rec = {
+    analysis: { sections: [
+      { title: "Intro", summary: "OLD intro", startIndex: 0, endIndex: 1 },
+      { title: "Plan", summary: "OLD plan", startIndex: 2, endIndex: 3 },
+    ] },
+    chunks: [
+      { title: "Intro", summary: "OLD intro", entries: [{ offset: 0, speaker: "Speaker_A", speaker_override: "Speaker_B" }] },
+      { title: "Plan", summary: "OLD plan", entries: [{ offset: 20, speaker: "Speaker_B" }] },
+    ],
+    meta: {},
+  };
+  const polished = [
+    { title: "Intro", summary: "Matt opens the standup", startIndex: 0, endIndex: 1 },
+    { title: "Plan", summary: "John lays out the Q3 plan", startIndex: 2, endIndex: 3 },
+  ];
+  const changed = applyPolishedSummaries(rec, polished); // rec is checked below, so it is mutated in place
+  assert.equal(changed, 2);
+  // analysis store updated
+  assert.equal(rec.analysis.sections[0].summary, "Matt opens the standup");
+  // chunk cards updated by title
+  assert.equal(rec.chunks[0].summary, "Matt opens the standup");
+  assert.equal(rec.chunks[1].summary, "John lays out the Q3 plan");
+  // entries + per-line override untouched (only summaries may change)
+  assert.equal(rec.chunks[0].entries[0].speaker, "Speaker_A");
+  assert.equal(rec.chunks[0].entries[0].speaker_override, "Speaker_B");
+});
+
+test("applyPolishedSummaries: duplicate titles map in order", () => {
+  const rec = {
+    analysis: { sections: [] }, // no analysis sections: only the chunk cards are checked
+    chunks: [
+      { title: "Discussion", summary: "old1", entries: [] },
+      { title: "Discussion", summary: "old2", entries: [] },
+    ],
+  };
+  const polished = [
+    { title: "Discussion", summary: "new1" },
+    { title: "Discussion", summary: "new2" },
+  ];
+  applyPolishedSummaries(rec, polished);
+  assert.equal(rec.chunks[0].summary, "new1"); // first "Discussion" chunk takes the first polished summary
+  assert.equal(rec.chunks[1].summary, "new2"); // second takes the second, not a repeat of the first
+});
+
+test("backfillEntrySpeakers force re-stamps already-labeled entries", () => {
+  const rec = {
+    transcript_segments: [
+      { start: 0, end: 9, text: "a", speaker: "Speaker_A" },
+      { start: 10, end: 19, text: "b", speaker: "Speaker_B" },
+    ],
+    chunks: [{ entries: [{ offset: 0, speaker: "OLD" }, { offset: 10, speaker: "OLD" }] }], // offsets equal the segment starts
+  };
+  // Without force, existing speakers are left alone.
+  backfillEntrySpeakers(rec);
+  assert.deepEqual(rec.chunks[0].entries.map((e) => e.speaker), ["OLD", "OLD"]);
+  // With force, they are re-derived from the segments.
+  backfillEntrySpeakers(rec, { force: true });
+  assert.deepEqual(rec.chunks[0].entries.map((e) => e.speaker), ["Speaker_A", "Speaker_B"]);
+});
diff --git a/server/test/polish-speaker-labels.test.js b/server/test/polish-speaker-labels.test.js
new file mode 100644
index 0000000..6c0441e
--- /dev/null
+++ b/server/test/polish-speaker-labels.test.js
@@ -0,0 +1,60 @@
+// Re-polish bug fix: the summary-polish pass must label each transcript
+// line with the operator's CORRECTED speaker name, so a re-polish after a
+// legend rename actually re-attributes statements to the new name (rather
+// than echoing the stale name baked into the original summaries).
+
+import { test, describe } from "node:test";
+import assert from "node:assert/strict";
+
+import { formatSpeakerLabeledTranscript } from "../post-cluster-polish.js";
+
+const SEGMENTS = [ // fixture shared by the first three tests below
+  { start: 5, speaker: "Speaker_A", text: "Let's get started." },
+  { start: 12, speaker: "Speaker_B", text: "Sounds good." },
+  { start: 20, speaker: "Speaker_C", text: "One more thing." }, // unnamed
+  { start: 30, speaker: "", text: "(crosstalk)" }, // no speaker
+];
+
+describe("formatSpeakerLabeledTranscript", () => {
+  test("without speakerNames: labels by chip letter (name-inference pass)", () => {
+    const out = formatSpeakerLabeledTranscript(SEGMENTS);
+    assert.match(out, /\[A 0:05\] Let's get started\./);
+    assert.match(out, /\[B 0:12\] Sounds good\./);
+    assert.match(out, /\[C 0:20\] One more thing\./);
+    // Segment with no speaker → "?" label.
+    assert.match(out, /\[\? 0:30\] \(crosstalk\)/);
+  });
+
+  test("with speakerNames: named speakers labeled by NAME, unnamed fall back to letter", () => {
+    const out = formatSpeakerLabeledTranscript(SEGMENTS, {
+      speakerNames: { Speaker_A: "Matt", Speaker_B: "Grant" },
+    });
+    assert.match(out, /\[Matt 0:05\] Let's get started\./);
+    assert.match(out, /\[Grant 0:12\] Sounds good\./);
+    // Speaker_C is absent from speakerNames → still the letter.
+    assert.match(out, /\[C 0:20\] One more thing\./);
+    // Crucially, the OLD letter labels for the named speakers are gone.
+    assert.doesNotMatch(out, /\[A 0:05\]/);
+    assert.doesNotMatch(out, /\[B 0:12\]/);
+  });
+
+  test("respects the time window (startSec/endSec)", () => {
+    const out = formatSpeakerLabeledTranscript(SEGMENTS, {
+      startSec: 10, // window is 10s..25s
+      endSec: 25,
+      speakerNames: { Speaker_A: "Matt" },
+    });
+    assert.doesNotMatch(out, /Let's get started/); // 0:05, before window
+    assert.match(out, /Sounds good/); // 0:12, in window
+    assert.match(out, /One more thing/); // 0:20, in window
+    assert.doesNotMatch(out, /crosstalk/); // 0:30, after window
+  });
+
+  test("strips brackets from a name so the [label] frame can't break", () => {
+    const out = formatSpeakerLabeledTranscript(
+      [{ start: 0, speaker: "Speaker_A", text: "hi" }],
+      { speakerNames: { Speaker_A: "Ma[t]t" } }, // expected to come out as "Matt"
+    );
+    assert.match(out, /\[Matt 0:00\] hi/);
+  });
+});
diff --git a/server/test/speaker-clustering.test.js b/server/test/speaker-clustering.test.js
new file mode 100644
index 0000000..4418ec3
--- /dev/null
+++ b/server/test/speaker-clustering.test.js
@@ -0,0 +1,203 @@
+// Unit tests for the Phase 1D speaker-clustering module.
+// Run via: node --test server/test/speaker-clustering.test.js
+
+import { test } from "node:test";
+import assert from "node:assert/strict";
+import {
+  cosineSimilarity,
+  clusterSpeakers,
+  assignSpeakersToSegments,
+} from "../speaker-clustering.js";
+
+// Synthetic 3-dim fingerprints — easier to reason about than 192-dim vectors.
+// "Person A" embeddings all point roughly toward [+1, 0, 0]
+// "Person B" embeddings all point roughly toward [0, +1, 0]
+// "Person C" embeddings (when present) point toward [0, 0, +1]
+const FP_A = (jitter = 0) => [1.0 + jitter * 0.01, 0.05 * jitter, 0];
+const FP_B = (jitter = 0) => [0.05 * jitter, 1.0 + jitter * 0.01, 0];
+const FP_C = (jitter = 0) => [0, 0, 1.0 + jitter * 0.01]; // jitter only rescales here; direction stays exactly on axis 2
+
+test("cosineSimilarity: identical vectors = 1", () => {
+  assert.equal(cosineSimilarity([1, 0, 0], [1, 0, 0]), 1);
+});
+
+test("cosineSimilarity: orthogonal vectors = 0", () => {
+  assert.equal(cosineSimilarity([1, 0, 0], [0, 1, 0]), 0);
+});
+
+test("cosineSimilarity: zero-magnitude input returns 0 (no NaN)", () => {
+  assert.equal(cosineSimilarity([0, 0, 0], [1, 1, 1]), 0); // dot / (|a| * |b|) would be 0 / 0 for a zero vector
+});
+
+test("clusterSpeakers: two distinct speakers across 3 chunks → 2 clusters", () => {
+  const chunkDiar = [
+    {
+      ok: true,
+      chunkIndex: 0,
+      segments: [],
+      fingerprints: { Speaker_0: FP_A(1), Speaker_1: FP_B(1) },
+    },
+    {
+      ok: true,
+      chunkIndex: 1,
+      segments: [],
+      fingerprints: { Speaker_0: FP_A(2), Speaker_1: FP_B(2) },
+    },
+    {
+      ok: true,
+      chunkIndex: 2,
+      segments: [],
+      fingerprints: { Speaker_0: FP_B(3), Speaker_1: FP_A(3) }, // labels flipped this chunk
+    },
+  ];
+  const { clusterCount, globalMap, speakers } = clusterSpeakers(chunkDiar, 70); // globalMap keys are "<chunkIndex>:<local label>"
+  assert.equal(clusterCount, 2, "should identify 2 distinct speakers");
+  // First speaker seen (chunk 0, Speaker_0 = FP_A) becomes Speaker_A
+  assert.equal(globalMap.get("0:Speaker_0"), "Speaker_A");
+  assert.equal(globalMap.get("0:Speaker_1"), "Speaker_B");
+  // Chunk 1 (same physical voices, same label assignment by SC)
+  assert.equal(globalMap.get("1:Speaker_0"), "Speaker_A");
+  assert.equal(globalMap.get("1:Speaker_1"), "Speaker_B");
+  // Chunk 2 has labels flipped — clustering should recover the truth
+  assert.equal(globalMap.get("2:Speaker_0"), "Speaker_B");
+  assert.equal(globalMap.get("2:Speaker_1"), "Speaker_A");
+  // One fingerprint per voice per chunk → fingerprint_count of 3 for each speaker
+  assert.equal(speakers.Speaker_A.fingerprint_count, 3);
+  assert.equal(speakers.Speaker_B.fingerprint_count, 3);
+});
+
+test("clusterSpeakers: three distinct speakers → 3 clusters", () => {
+  const chunkDiar = [
+    {
+      ok: true,
+      chunkIndex: 0,
+      segments: [],
+      fingerprints: { Speaker_0: FP_A(1), Speaker_1: FP_B(1) },
+    },
+    {
+      ok: true,
+      chunkIndex: 1,
+      segments: [],
+      fingerprints: { Speaker_0: FP_C(2), Speaker_1: FP_B(2) }, // Speaker_0 is now a third voice (FP_C), not FP_A
+    },
+  ];
+  const { clusterCount } = clusterSpeakers(chunkDiar, 70);
+  assert.equal(clusterCount, 3);
+});
+
+test("clusterSpeakers: empty input returns empty result", () => {
+  const out = clusterSpeakers([], 70);
+  assert.equal(out.clusterCount, 0);
+  assert.equal(out.globalMap.size, 0); // globalMap is still a Map, just empty
+  assert.deepEqual(out.speakers, {});
+});
+
+test("clusterSpeakers: all-failed-chunks input returns empty result", () => {
+  const out = clusterSpeakers([{ ok: false }, { ok: false }], 70); // no chunk has ok: true and none carries fingerprints
+  assert.equal(out.clusterCount, 0);
+});
+
+test("clusterSpeakers: threshold clamped to 50..95", () => {
+  const chunkDiar = [
+    {
+      ok: true,
+      chunkIndex: 0,
+      segments: [],
+      fingerprints: { Speaker_0: FP_A(1), Speaker_1: FP_B(1) },
+    },
+  ];
+  const lo = clusterSpeakers(chunkDiar, 0); // clamps to 50
+  assert.equal(lo.thresholdSimilarity, 0.5); // reported as a 0..1 fraction of the clamped percentage
+  const hi = clusterSpeakers(chunkDiar, 200); // clamps to 95
+  assert.equal(hi.thresholdSimilarity, 0.95);
+});
+
+test("clusterSpeakers: very strict threshold (95%) splits tightly-grouped voices", () => {
+  // Two hand-picked vectors with ~0.93 cosine similarity: above the 70% threshold (merge), below 95% (split).
+  const chunkDiar = [
+    {
+      ok: true,
+      chunkIndex: 0,
+      segments: [],
+      fingerprints: {
+        Speaker_0: [1.0, 0.0, 0.0],
+        // Same general direction but ~0.93 similarity — borderline.
+        Speaker_1: [0.93, 0.36, 0.06],
+      },
+    },
+  ];
+  const lenient = clusterSpeakers(chunkDiar, 70);
+  const strict = clusterSpeakers(chunkDiar, 95);
+  assert.equal(lenient.clusterCount, 1, "lenient should merge");
+  assert.equal(strict.clusterCount, 2, "strict should split");
+});
+
+test("clusterSpeakers: summary stats aggregate turns + speaking time", () => {
+  const chunkDiar = [
+    {
+      ok: true,
+      chunkIndex: 0,
+      segments: [
+        { start: 0, end: 10, speaker_local: "Speaker_0", confidence: 0.9 },
+        { start: 10, end: 25, speaker_local: "Speaker_1", confidence: 0.8 },
+        { start: 25, end: 30, speaker_local: "Speaker_0", confidence: 0.95 },
+      ],
+      fingerprints: { Speaker_0: FP_A(1), Speaker_1: FP_B(1) },
+    },
+  ];
+  const { speakers } = clusterSpeakers(chunkDiar, 70);
+  assert.equal(speakers.Speaker_A.turns, 2); // segments 0-10 and 25-30
+  assert.equal(speakers.Speaker_A.total_speaking_seconds, 15); // 10 + 5
+  assert.equal(speakers.Speaker_B.turns, 1); // segment 10-25
+  assert.equal(speakers.Speaker_B.total_speaking_seconds, 15);
+  assert.ok(Math.abs(speakers.Speaker_A.mean_confidence - 0.925) < 0.001); // (0.9 + 0.95) / 2
+});
+
+test("assignSpeakersToSegments: midpoint inside diar segment wins", () => {
+  const segments = [
+    { start: 0, end: 5, text: "hello" }, // midpoint 2.5
+    { start: 5, end: 10, text: "world" }, // midpoint 7.5
+  ];
+  const chunkDiar = [
+    {
+      ok: true,
+      chunkIndex: 0,
+      segments: [
+        { start: 0, end: 5, speaker_local: "Speaker_0", confidence: 0.9 },
+        { start: 5, end: 10, speaker_local: "Speaker_1", confidence: 0.85 },
+      ],
+      fingerprints: { Speaker_0: FP_A(1), Speaker_1: FP_B(1) },
+    },
+  ];
+  const { globalMap } = clusterSpeakers(chunkDiar, 70);
+  assignSpeakersToSegments(segments, chunkDiar, globalMap); // stamps speaker fields onto the segment objects in place
+  assert.equal(segments[0].speaker, "Speaker_A");
+  assert.equal(segments[1].speaker, "Speaker_B");
+  assert.equal(segments[0].speaker_confidence, 0.9);
+});
+
+test("assignSpeakersToSegments: nearest-fallback within 5s window", () => {
+  const segments = [
+    { start: 8, end: 12, text: "in between" }, // gap with no covering diar seg
+  ];
+  const chunkDiar = [
+    {
+      ok: true,
+      chunkIndex: 0,
+      segments: [
+        { start: 0, end: 5, speaker_local: "Speaker_0", confidence: 0.9 },
+      ],
+      fingerprints: { Speaker_0: FP_A(1) },
+    },
+  ];
+  const { globalMap } = clusterSpeakers(chunkDiar, 70);
+  assignSpeakersToSegments(segments, chunkDiar, globalMap);
+  // Distance is midpoint-to-midpoint: diar mid 2.5, transcript mid 10 → 7.5 > 5s window → speaker set to null
+  assert.equal(segments[0].speaker, null);
+});
+
+test("assignSpeakersToSegments: no diar data leaves segments unchanged", () => {
+  const segments = [{ start: 0, end: 5, text: "hello" }];
+  assignSpeakersToSegments(segments, [], new Map());
+  assert.equal(segments[0].speaker, undefined); // NOTE(review): expects undefined, not null — presumably an early return on empty diar data; confirm
+});