Files
ten31-transcripts/Ten31Transcripts/Recap/RecapEditModel.swift
T
Grant Gilliam c539b78a58 Configurable recap templates (categories per meeting type, in Settings)
Takeaways categories are no longer hardcoded — they're editable templates. A
template = the always-on TLDR + an ordered list of sections, each with a title, a
type (attributed items / bulleted list / paragraph), and an instruction (the prompt
text for that category). The analyzer assembles the LLM prompt FROM the template
and parses generically, so adding/removing/renaming a category needs zero code and
the output always renders.

- RecapTemplate / TemplateSection / SectionKind + TopicGranularity; built-in
  defaults (Internal Meeting, 1:1, Company/Sales Call), all editable.
- Generic extras: RecapExtras{tldr, primarySpeakers, sections:[RenderedSection]} +
  RecapItem{text,who,when,note} replaces the fixed MeetingExtras. Analyzer builds
  per-section sec_N fields + parses by kind; renderer + remap are generic.
- Topic granularity (coarse/auto/fine) answers 'should chunking be configurable' —
  it scales the target topic count; raw window sizes stay as tuned defaults.
- AppSettings persists templates + defaultTemplateId (seeded once). Settings gets a
  default-template picker + 'Manage…' → TemplatesView (CRUD, edit sections/
  instructions, set default, **Preview prompt** for full transparency).
- Recap editor gains a template picker; Regenerate uses the chosen template. Auto
  recap uses the default template.

54/54 XCTest (template prompt build, generic parse/remap/render updated).
2026-06-06 19:26:03 -05:00

179 lines
8.3 KiB
Swift

import Foundation
/// Editable view-model for one session's speaker corrections. Loads `speakers.json`
/// (+ optional `recap.json` and `cluster_fingerprints.json`), applies rename / merge
/// / per-segment reassignment, and on save rewrites `speakers.json`, re-renders
/// `transcript.md` + `recap.html`, and updates the voiceprint store (learning a voice
/// when an Unknown speaker is named).
@MainActor
final class RecapEditModel: ObservableObject {
let folder: URL
let title: String
private let voiceprints: VoiceprintStore
private let baseURL: String
private let skipTLS: Bool
private let base: SpeakersFile
private var recapFile: RecapFile?
private let clusterFingerprints: [String: [Float]]
private var originalSpeakers: [String]
private var renameOps: [(from: String, to: String)] = []
let templates: [RecapTemplate]
@Published var selectedTemplateId: String
@Published private(set) var segments: [SpeakersFile.Segment]
@Published private(set) var speakers: [String]
@Published private(set) var dirty = false
@Published private(set) var regenerating = false
@Published private(set) var hasRecap: Bool
@Published private(set) var status: String?
init?(folder: URL, voiceprints: VoiceprintStore, baseURL: String, skipTLS: Bool,
templates: [RecapTemplate], defaultTemplateId: String) {
let speakersURL = folder.appendingPathComponent("speakers.json")
guard let data = try? Data(contentsOf: speakersURL),
let file = try? JSONDecoder().decode(SpeakersFile.self, from: data),
!file.segments.isEmpty else { return nil }
self.folder = folder
self.voiceprints = voiceprints
self.baseURL = baseURL
self.skipTLS = skipTLS
self.templates = templates.isEmpty ? RecapTemplate.builtIns : templates
self.selectedTemplateId = (templates.contains { $0.id == defaultTemplateId } ? defaultTemplateId : templates.first?.id)
?? RecapTemplate.builtIns.first!.id
self.base = file
self.segments = file.segments
self.speakers = SpeakerEditing.orderedSpeakers(file.segments)
self.originalSpeakers = SpeakerEditing.orderedSpeakers(file.segments)
let rf = RecapFile.read(from: folder.appendingPathComponent("recap.json"))
self.recapFile = rf
self.hasRecap = rf != nil
self.clusterFingerprints = Self.loadFingerprints(folder.appendingPathComponent("cluster_fingerprints.json"))
self.title = rf?.title ?? file.app.capitalized + " call"
}
// MARK: - Edits
func rename(_ name: String, to newName: String) {
let to = newName.trimmingCharacters(in: .whitespacesAndNewlines)
guard !to.isEmpty, to != name else { return }
renameOps.append((from: name, to: to))
segments = SpeakerEditing.replaceSpeaker(name, with: to, in: segments)
refresh()
}
/// Merge is just a rename onto an existing speaker.
func merge(_ absorbed: String, into survivor: String) {
guard absorbed != survivor else { return }
renameOps.append((from: absorbed, to: survivor))
segments = SpeakerEditing.replaceSpeaker(absorbed, with: survivor, in: segments)
refresh()
}
func reassign(_ index: Int, to speaker: String) {
segments = SpeakerEditing.reassign(index, to: speaker, in: segments)
refresh()
}
private func refresh() {
speakers = SpeakerEditing.orderedSpeakers(segments)
dirty = true
status = nil
}
// MARK: - Save
/// Persist corrections: rewrite speakers.json, re-render the recap with names
/// remapped in place (fast, no LLM), and update voiceprints.
func save() {
let file = commitCorrections()
let net = SpeakerEditing.netNameMap(originals: originalSpeakers, ops: renameOps)
let result = recapFile.map { SpeakerEditing.remap($0.result, names: net) } ?? RecapResult(sections: [], extras: nil)
if recapFile != nil {
let rf = RecapFile(title: title, result: result)
recapFile = rf
try? rf.write(to: folder.appendingPathComponent("recap.json"))
}
try? RecapRenderer.write(file: file, result: result, title: title, to: folder)
rebaseline()
status = "Saved — recap.html & transcript.md updated."
}
/// Re-run the LLM analysis on the CORRECTED transcript, so summaries/extras are
/// freshly written with the corrected names (not just find-replaced). Commits the
/// corrections first; needs the gateway LLM (no-op message if unavailable).
func regenerate() async {
guard !regenerating else { return }
regenerating = true
status = "Regenerating recap…"
defer { regenerating = false }
let file = commitCorrections()
let template = templates.first { $0.id == selectedTemplateId } ?? templates.first ?? .internalMeeting
let llm = GatewayLLMClient(baseURL: baseURL, skipTLS: skipTLS)
guard let model = await llm.chatModelId() else {
status = "No language model on the gateway — saved corrections only."
rebaseline(); return
}
let analyzer = RecapAnalyzer(llm: llm, model: model)
guard let result = try? await analyzer.recap(file: file, template: template) else {
status = "Recap regeneration failed — corrections were saved."
rebaseline(); return
}
let rf = RecapFile(title: title, result: result)
recapFile = rf
hasRecap = true
try? rf.write(to: folder.appendingPathComponent("recap.json"))
try? RecapRenderer.write(file: file, result: result, title: title, to: folder)
rebaseline()
status = "Recap regenerated with corrected names."
}
/// Write the corrected speakers.json and reconcile the voiceprint store. Shared by
/// save() and regenerate(); does NOT clear renameOps (caller rebaselines after).
private func commitCorrections() -> SpeakersFile {
let file = SpeakersFile(sessionId: base.sessionId, app: base.app, durationSec: base.durationSec,
speakers: buildSpeakerList(), segments: segments, models: base.models)
try? file.write(to: folder.appendingPathComponent("speakers.json"))
let net = SpeakerEditing.netNameMap(originals: originalSpeakers, ops: renameOps)
let stored = voiceprints.knownVoiceprints()
for (orig, final) in net where !LabelMergeResponse.isUnknownName(final) {
let finalHasPrint = clusterFingerprints[final] != nil || stored[final] != nil
if finalHasPrint {
// Merge into an existing identity keep the survivor's print, drop the absorbed.
if !LabelMergeResponse.isUnknownName(orig) { voiceprints.merge(orig, into: final) }
} else if let vec = clusterFingerprints[orig] {
// Rename / name an Unknown learn this voice for the new name.
voiceprints.enroll(name: final, vector: vec)
if !LabelMergeResponse.isUnknownName(orig) { voiceprints.merge(orig, into: final) }
} else {
voiceprints.rename(orig, to: final)
}
}
return file
}
/// After a commit, the corrected names become the new baseline so further edits
/// map cleanly (and the now-baked-in recap isn't double-remapped).
private func rebaseline() {
originalSpeakers = SpeakerEditing.orderedSpeakers(segments)
renameOps.removeAll()
dirty = false
}
/// Speaker roster from the edited segments: keep the original source where the
/// name is unchanged; mark new (renamed/merged) names as user-set.
private func buildSpeakerList() -> [SpeakersFile.Speaker] {
let byName = Dictionary(base.speakers.map { ($0.name, $0) }, uniquingKeysWith: { a, _ in a })
return SpeakerEditing.orderedSpeakers(segments).map { name in
byName[name] ?? SpeakersFile.Speaker(name: name, source: "manual", overlapConfidence: nil, matchSimilarity: nil)
}
}
private static func loadFingerprints(_ url: URL) -> [String: [Float]] {
guard let data = try? Data(contentsOf: url),
let obj = try? JSONSerialization.jsonObject(with: data) as? [String: [Any]] else { return [:] }
return obj.mapValues { $0.compactMap { ($0 as? NSNumber)?.floatValue } }
}
}