863136aeec
Phase 2 (call detection): CallDetector using CoreAudio per-process mic attribution (anarlog technique) — robust start+stop for Zoom/Teams/Signal/Meet, ignoring our own recording; auto-record toggle. Built; pending live multi-app confirmation by the user. Phase 3 (visual timeline foundation): AppAdapter protocol + SpeakerObservation, TimelineBuilder (hysteresis/overlap/self-merge/aliases), VisualTimeline (schema 1.1), TextRecognizer (Vision OCR), FrameSampler + GridCallAnalyzer (name OCR + saturated-highlight active-speaker attribution), SignalAdapter, VisualObserver (window capture; frames released, never saved; minimized->visual_gap, idle != gap). Synthetic-frame tested; adapter geometry pending real Signal fixtures + live VisualObserver validation. Phase 5 (backend hand-off): SparkControlClient (multipart label-merge, sequential, TLS-skip, 503 Retry-After/413), SessionPackager (chunk plan + WAV slice + timeline slice/rebase), TranscriptAssembler + SpeakersFile, TranscriptPipeline. Validated END-TO-END against the live backend (chunk -> label-merge -> speakers.json). Phase 6 (voiceprints): VoiceprintStore (known_voiceprints, persist named fingerprints, skip Unknown). Wired: 'Send to backend' button + transcript status, auto-send toggle (default off) + self-name setting. All adversarial-review findings fixed. App + XCTest suite build; tests pass.
84 lines
3.1 KiB
Swift
84 lines
3.1 KiB
Swift
import SwiftUI
|
|
import AppKit
|
|
|
|
/// Settings panel (pushed from the menu-bar panel).
///
/// Renders a grouped form with five sections — backend, call detection,
/// transcription, output folder, and adapters — whose controls read and write
/// the `AppSettings` object supplied through the environment.
struct SettingsView: View {
    @EnvironmentObject private var settings: AppSettings

    var body: some View {
        Form {
            backendSection
            callDetectionSection
            transcriptionSection
            outputSection
            adaptersSection
        }
        .formStyle(.grouped)
        .frame(width: 320)
        .navigationTitle("Settings")
    }

    // MARK: - Sections

    /// Backend base URL and the TLS-verification switch.
    private var backendSection: some View {
        Section("SparkControl backend") {
            TextField("Base URL", text: $settings.backendBaseURL)
                .textFieldStyle(.roundedBorder)
            Toggle(
                "Skip TLS verification (self-signed cert)",
                isOn: $settings.skipTLSVerification
            )
        }
    }

    /// Auto-record switch plus a caption listing the detected apps.
    private var callDetectionSection: some View {
        Section("Call detection") {
            Toggle("Auto-record when a call is detected", isOn: $settings.autoRecordOnDetection)
            caption("Detects Zoom, Teams, Signal, and Google Meet (any browser).")
        }
    }

    /// The user's own name and the auto-send switch, with an explanatory caption.
    private var transcriptionSection: some View {
        Section("Transcription") {
            TextField("Your name", text: $settings.selfName)
                .textFieldStyle(.roundedBorder)
            Toggle("Auto-send recordings to backend", isOn: $settings.autoSendOnStop)
            caption("Your name labels the mic-VAD \"self\" spans. Auto-send transcribes each recording on stop.")
        }
    }

    /// Current output folder path (middle-truncated to one line) and a picker button.
    private var outputSection: some View {
        Section("Output") {
            HStack {
                Text(settings.outputFolderPath)
                    .lineLimit(1)
                    .truncationMode(.middle)
                    .foregroundStyle(.secondary)
                Spacer()
                Button("Choose…", action: chooseFolder)
            }
        }
    }

    /// One toggle per entry in `AppSettings.adapterKeys`.
    private var adaptersSection: some View {
        Section("Adapters") {
            caption("Inert in Phase 0 — these toggles only persist for now.")
            ForEach(AppSettings.adapterKeys, id: \.key) { entry in
                Toggle(entry.label, isOn: binding(for: entry.key))
            }
        }
    }

    // MARK: - Helpers

    /// Secondary-coloured, caption-sized explanatory text.
    ///
    /// Takes a `LocalizedStringKey` so that string literals passed here go
    /// through the same `Text` initializer as a literal written inline.
    private func caption(_ key: LocalizedStringKey) -> some View {
        Text(key)
            .font(.caption)
            .foregroundStyle(.secondary)
    }

    /// Builds a two-way binding onto `settings.adapterEnabled[key]`.
    ///
    /// - Parameter key: The adapter key to look up and store under.
    /// - Returns: A binding that reads `true` when no value is stored for `key`.
    private func binding(for key: String) -> Binding<Bool> {
        Binding<Bool>(
            get: {
                if let stored = settings.adapterEnabled[key] {
                    return stored
                }
                return true
            },
            set: { isEnabled in
                settings.adapterEnabled[key] = isEnabled
            }
        )
    }

    /// Shows a directory-only open panel and, when the user confirms a
    /// selection, stores the chosen folder's path in `settings.outputFolderPath`.
    private func chooseFolder() {
        let picker = NSOpenPanel()
        picker.prompt = "Choose"
        picker.directoryURL = settings.outputFolderURL
        picker.allowsMultipleSelection = false
        picker.canChooseFiles = false
        picker.canChooseDirectories = true

        // This runs from the transient MenuBarExtra(.window) popover of a
        // menu-bar accessory app. The asynchronous begin(...) API is used in
        // place of runModal() because a nested modal loop can let the popover
        // dismiss the panel out from under it. The app is activated first so
        // the panel comes to the front.
        NSApp.activate(ignoringOtherApps: true)
        picker.begin { result in
            if result == .OK, let chosen = picker.url {
                settings.outputFolderPath = chosen.path
            }
        }
    }
}
|