7e0759846f
Move the ~20 optional cluster knobs out of the StartOS "Configure Sparks"
action (now just the 4 required fields) and into a dashboard ⚙ Settings gear,
backed by a /data/app_settings.json overlay keyed by env-var names. One shared
mutable Settings instance + Settings.reload() applies edits live without a
restart; existing installs' values migrate automatically on first boot.
Also: support-service ports (parakeet/kokoro/embed/qdrant + vllm) are now
configurable, and GET /api/swap/lock no longer 404s (it was shadowed by the
/api/swap/{job_id} catch-all). WebhookNotifier is re-pointed on save so its
url/secret reload live too.
206 lines
9.1 KiB
Python
206 lines
9.1 KiB
Python
from __future__ import annotations
|
|
import logging
|
|
import os
|
|
from dataclasses import dataclass, fields
|
|
from pathlib import Path
|
|
from typing import Mapping
|
|
|
|
from . import app_settings
|
|
from .shellsafe import validate_container
|
|
|
|
log = logging.getLogger(__name__)
|
|
|
|
|
|
def _env(src: Mapping[str, str], name: str, default: str = "") -> str:
|
|
return src.get(name, default)
|
|
|
|
|
|
def _env_container(src: Mapping[str, str], name: str, default: str) -> str:
|
|
"""Resolve a container-name env var, validating it at the config boundary.
|
|
|
|
The value flows into `docker logs`/`docker exec` over SSH, so it's quoted at
|
|
the sink — but per the repo's two-layer convention it's also whitelist-checked
|
|
here. A malformed optional value falls back to `default` rather than crashing
|
|
daemon startup (mirrors `_env_int`)."""
|
|
val = src.get(name, "") or default
|
|
try:
|
|
return validate_container(val)
|
|
except ValueError:
|
|
log.warning("ignoring invalid %s=%r; using %r", name, val, default)
|
|
return default
|
|
|
|
|
|
def _env_set(src: Mapping[str, str], name: str) -> frozenset[str]:
|
|
"""Parse a comma-separated env var into a lowercased frozenset of keys.
|
|
|
|
Used by DISABLED_SERVICES so an adopter whose cluster doesn't run a given
|
|
support service can switch its tile + probes off entirely (rather than have
|
|
the probe hit whatever else listens on that port — e.g. a vLLM sharing
|
|
Parakeet's default 8000)."""
|
|
raw = src.get(name, "")
|
|
return frozenset(part.strip().lower() for part in raw.split(",") if part.strip())
|
|
|
|
|
|
def _env_int(src: Mapping[str, str], name: str, default: int) -> int:
|
|
"""Parse an int env var, falling back to `default` when unset, blank, or
|
|
malformed. Optional numeric fields arrive as an empty string when left blank,
|
|
so a bare int("") would crash daemon startup."""
|
|
try:
|
|
return int(src.get(name, "") or default)
|
|
except (TypeError, ValueError):
|
|
return default
|
|
|
|
|
|
def _resolve_models_yaml() -> str:
|
|
if env := os.environ.get("MODELS_YAML"):
|
|
return env
|
|
here = Path(__file__).resolve().parent # app/
|
|
candidates = [
|
|
here.parent / "models.yaml", # image/models.yaml (Docker)
|
|
here.parent.parent / "models.yaml", # <repo>/models.yaml (dev)
|
|
Path("/app/models.yaml"), # explicit container path
|
|
]
|
|
for p in candidates:
|
|
if p.exists():
|
|
return str(p)
|
|
return str(candidates[0]) # let load fail with a clear path
|
|
|
|
|
|
def _effective_env() -> dict[str, str]:
|
|
"""The env Settings is built from: process env first, the in-app settings
|
|
overlay on top. The overlay (the dashboard 'gear') is keyed by the same env
|
|
var names, so a knob set in the UI overrides the value the StartOS action
|
|
injected — while an un-touched knob keeps falling through to the action's
|
|
value, then to the code default. See app_settings."""
|
|
return {**os.environ, **app_settings.load_overlay()}
|
|
|
|
|
|
@dataclass
|
|
class Settings:
|
|
# NOTE: intentionally NOT frozen. There is exactly one Settings instance,
|
|
# shared by reference across every router closure and manager (build_router,
|
|
# self.settings = settings). `reload()` mutates it in place so a change saved
|
|
# via the in-app settings gear goes live for all of them without rebuilding
|
|
# the app — the only window of inconsistency is the microseconds it takes to
|
|
# reassign the fields, acceptable for a single-operator config save.
|
|
spark1_host: str
|
|
spark1_user: str
|
|
spark2_host: str
|
|
spark2_user: str
|
|
parakeet_host: str
|
|
parakeet_user: str
|
|
parakeet_container: str
|
|
kokoro_host: str
|
|
kokoro_user: str
|
|
kokoro_container: str
|
|
embed_host: str
|
|
embed_user: str
|
|
embed_container: str
|
|
qdrant_host: str
|
|
qdrant_user: str
|
|
qdrant_container: str
|
|
qdrant_collection: str
|
|
matrix_bridge_host: str
|
|
matrix_bridge_user: str
|
|
matrix_bridge_container: str
|
|
matrix_bridge_dir: str
|
|
matrix_bridge_branch: str
|
|
redaction_map_db: str
|
|
redaction_map_ttl: int
|
|
ssh_key_path: str
|
|
ssh_known_hosts: str
|
|
models_yaml: str
|
|
vllm_port: int
|
|
vllm_container: str
|
|
disabled_services: frozenset[str]
|
|
parakeet_port: int
|
|
kokoro_port: int
|
|
embed_port: int
|
|
qdrant_port: int
|
|
bind_port: int
|
|
open_webui_url: str
|
|
ngc_api_key: str
|
|
swap_webhook_url: str
|
|
swap_webhook_secret: str
|
|
|
|
@classmethod
|
|
def from_env(cls, src: Mapping[str, str] | None = None) -> "Settings":
|
|
src = _effective_env() if src is None else src
|
|
spark2_host = _env(src, "SPARK2_HOST")
|
|
spark2_user = _env(src, "SPARK2_USER")
|
|
# Parakeet (STT) and Kokoro (TTS) default to Spark 2 unless overridden.
|
|
return cls(
|
|
spark1_host=_env(src, "SPARK1_HOST"),
|
|
spark1_user=_env(src, "SPARK1_USER"),
|
|
spark2_host=spark2_host,
|
|
spark2_user=spark2_user,
|
|
parakeet_host=_env(src, "PARAKEET_HOST") or spark2_host,
|
|
parakeet_user=_env(src, "PARAKEET_USER") or spark2_user,
|
|
parakeet_container=_env(src, "PARAKEET_CONTAINER") or "parakeet-asr",
|
|
kokoro_host=_env(src, "KOKORO_HOST") or spark2_host,
|
|
kokoro_user=_env(src, "KOKORO_USER") or spark2_user,
|
|
kokoro_container=_env(src, "KOKORO_CONTAINER") or "kokoro-tts",
|
|
# Embeddings (spark-embed: bge-m3 dense + reranker) and Qdrant
|
|
# (vector storage) default to Spark 2 unless overridden.
|
|
embed_host=_env(src, "EMBED_HOST") or spark2_host,
|
|
embed_user=_env(src, "EMBED_USER") or spark2_user,
|
|
embed_container=_env(src, "EMBED_CONTAINER") or "spark-embed",
|
|
qdrant_host=_env(src, "QDRANT_HOST") or spark2_host,
|
|
qdrant_user=_env(src, "QDRANT_USER") or spark2_user,
|
|
qdrant_container=_env(src, "QDRANT_CONTAINER") or "qdrant",
|
|
qdrant_collection=_env(src, "QDRANT_COLLECTION", ""),
|
|
# matrix-bridge bot container, driven as its own SSH user (the owner
|
|
# of the ~/matrix-bridge git clone) so git/docker run unprivileged.
|
|
# The user is BLANK by default and set via the settings gear; leaving
|
|
# it blank reports the service as unconfigured, which hides the tile.
|
|
# That keeps the shared package portable — a deployment without the
|
|
# bot never shows a stray tile or a hardcoded username. Host defaults
|
|
# to Spark 2 (same box); container/dir/branch are sensible defaults.
|
|
matrix_bridge_host=_env(src, "MATRIX_BRIDGE_HOST") or spark2_host,
|
|
matrix_bridge_user=_env(src, "MATRIX_BRIDGE_USER"),
|
|
matrix_bridge_container=_env(src, "MATRIX_BRIDGE_CONTAINER") or "matrix-bridge",
|
|
matrix_bridge_dir=_env(src, "MATRIX_BRIDGE_DIR") or "~/matrix-bridge",
|
|
matrix_bridge_branch=_env(src, "MATRIX_BRIDGE_BRANCH") or "master",
|
|
# Redaction gateway pseudonym-map store (server-held de-anon key).
|
|
redaction_map_db=_env(src, "REDACTION_MAP_DB", "/data/redaction_maps.db"),
|
|
redaction_map_ttl=_env_int(src, "REDACTION_MAP_TTL", 7200),
|
|
ssh_key_path=_env(src, "SSH_KEY_PATH"),
|
|
ssh_known_hosts=_env(src, "SSH_KNOWN_HOSTS"),
|
|
models_yaml=_resolve_models_yaml(),
|
|
vllm_port=_env_int(src, "VLLM_PORT", 8888),
|
|
# Container name for the swappable vLLM on Spark 1. Defaults to the
|
|
# bundled launch-cluster.sh container; override if you named yours
|
|
# something else (the swap log-tail and pre-flight validator exec
|
|
# into it by name).
|
|
vllm_container=_env_container(src, "VLLM_CONTAINER", "vllm_node"),
|
|
# Built-in support-service keys (parakeet, kokoro, embeddings,
|
|
# qdrant) the deployment doesn't run — hidden from the dashboard and
|
|
# never probed.
|
|
disabled_services=_env_set(src, "DISABLED_SERVICES"),
|
|
parakeet_port=_env_int(src, "PARAKEET_PORT", 8000),
|
|
kokoro_port=_env_int(src, "KOKORO_PORT", 8880),
|
|
embed_port=_env_int(src, "EMBED_PORT", 8088),
|
|
qdrant_port=_env_int(src, "QDRANT_PORT", 6333),
|
|
bind_port=_env_int(src, "BIND_PORT", 9999),
|
|
open_webui_url=_env(src, "OPEN_WEBUI_URL", ""),
|
|
ngc_api_key=_env(src, "NGC_API_KEY", ""),
|
|
# Coordination layer: fire a swap-lifecycle webhook to this URL so
|
|
# downstream consumers re-point their model config on a swap. Blank
|
|
# ⇒ disabled. The optional secret HMAC-signs the body (X-Spark-Signature).
|
|
swap_webhook_url=_env(src, "SWAP_WEBHOOK_URL", ""),
|
|
swap_webhook_secret=_env(src, "SWAP_WEBHOOK_SECRET", ""),
|
|
)
|
|
|
|
def reload(self) -> None:
|
|
"""Recompute every field from the current env + settings overlay and
|
|
assign it onto this same instance, so all holders of the reference see
|
|
the change without an app restart. Called after the gear writes the
|
|
overlay (see server.post_settings)."""
|
|
fresh = Settings.from_env()
|
|
for f in fields(self):
|
|
setattr(self, f.name, getattr(fresh, f.name))
|
|
|
|
@property
|
|
def configured(self) -> bool:
|
|
return bool(self.spark1_host)
|