# File: ten31-signal-engine/seeds/sources.seed.yaml

# Source registry seed — handoff §7.3 (companies) + §7.4 (podcasts). VERIFY tickers/feeds at ingestion.
# `notes` flag backtest-era (2022-2023) coverage for §7.1, since some entities didn't exist yet.
# Podcast rss_url is left null (the key is simply omitted from the entry) where the real feed must
# still be resolved (some feeds truncate the back-catalog — resolution may need the show's archive
# feed or a YouTube back-catalog).
# Bitcoin-cluster podcasts are cluster_capped_low (§4.5 — most correlated with Ten31's own priors).
sources:
# ============================ COMPANIES (§7.3) ============================
# AI compute & hyperscalers. Every entry in this group is a `filing` source in cluster ai_tech.
- id: co-nvda
  name: NVIDIA
  kind: filing
  cluster: ai_tech
  ticker: NVDA
- id: co-googl
  name: Alphabet
  kind: filing
  cluster: ai_tech
  ticker: GOOGL
- id: co-msft
  name: Microsoft
  kind: filing
  cluster: ai_tech
  ticker: MSFT
- id: co-amzn
  name: Amazon
  kind: filing
  cluster: ai_tech
  ticker: AMZN
- id: co-meta
  name: Meta
  kind: filing
  cluster: ai_tech
  ticker: META
- id: co-avgo
  name: Broadcom
  kind: filing
  cluster: ai_tech
  ticker: AVGO
- id: co-tsm
  name: TSMC
  kind: filing
  cluster: ai_tech
  ticker: TSM
  notes: "Foreign filer — files 20-F/6-K, NOT 10-K/10-Q; override forms at ingest"
- id: co-crwv
  name: CoreWeave
  kind: filing
  cluster: ai_tech
  ticker: CRWV
  notes: "IPO 2025 — NO 2022-23 filings (backtest: absent, expected)"
- id: co-orcl
  name: Oracle
  kind: filing
  cluster: ai_tech
  ticker: ORCL
# Energy & power (the binding constraint). Every entry in this group is in cluster energy.
# Several notes record spin-off / listing dates that limit 2022-2023 backtest coverage.
- id: co-ceg
  name: Constellation Energy
  kind: filing
  cluster: energy
  ticker: CEG
  notes: "Spun from Exelon Feb 2022 — backtest-era coverage from 2022"
- id: co-vst
  name: Vistra
  kind: filing
  cluster: energy
  ticker: VST
- id: co-tln
  name: Talen Energy
  kind: filing
  cluster: energy
  ticker: TLN
  notes: "Relisted 2024 post-restructuring — thin pre-2024 public filings"
- id: co-gev
  name: GE Vernova
  kind: filing
  cluster: energy
  ticker: GEV
  notes: "Spun from GE Apr 2024 — pre-2024 power data is inside GE filings"
- id: co-nee
  name: NextEra Energy
  kind: filing
  cluster: energy
  ticker: NEE
- id: co-ccj
  name: Cameco
  kind: filing
  cluster: energy
  ticker: CCJ
  notes: "Foreign filer (Canada) — 40-F/6-K"
- id: co-vrt
  name: Vertiv
  kind: filing
  cluster: energy
  ticker: VRT
- id: co-pwr
  name: Quanta Services
  kind: filing
  cluster: energy
  ticker: PWR
  notes: "watch — grid/interconnect picks-and-shovels"
- id: co-oklo
  name: Oklo
  kind: filing
  cluster: energy
  ticker: OKLO
  notes: "watch; public 2024"
- id: co-smr
  name: NuScale Power
  kind: filing
  cluster: energy
  ticker: SMR
  notes: "watch"
# Mining <-> AI/HPC (the energy-compute seam). These miners are filed under cluster energy.
- id: co-corz
  name: Core Scientific
  kind: filing
  cluster: energy
  ticker: CORZ
  notes: "Ch.11 Dec 2022, relisted Jan 2024 — messy 2022-23 filings"
- id: co-iren
  name: IREN (Iris Energy)
  kind: filing
  cluster: energy
  ticker: IREN
  notes: "IPO Nov 2021 — backtest-era OK; foreign filer 20-F"
- id: co-wulf
  name: TeraWulf
  kind: filing
  cluster: energy
  ticker: WULF
  notes: "Public Dec 2021 — backtest-era OK"
- id: co-cifr
  name: Cipher Mining
  kind: filing
  cluster: energy
  ticker: CIFR
  notes: "Public Aug 2021 — backtest-era OK"
# Debasement <-> bitcoin (treasury/custody names). Every entry in this group is in cluster bitcoin.
- id: co-mstr
  name: Strategy (MicroStrategy)
  kind: filing
  cluster: bitcoin
  ticker: MSTR
- id: co-coin
  name: Coinbase
  kind: filing
  cluster: bitcoin
  ticker: COIN
- id: co-xyz
  name: Block
  kind: filing
  cluster: bitcoin
  ticker: XYZ
  notes: "Ticker SQ→XYZ (2025) — verify"
- id: co-hood
  name: Robinhood Markets
  kind: filing
  cluster: bitcoin
  ticker: HOOD
  notes: "Crypto/fintech broker — alongside COIN/XYZ. Public Jul 2021, backtest-era OK."
- id: co-xxi
  name: Twenty One
  kind: filing
  cluster: bitcoin
  ticker: XXI
  notes: "Formed 2025 — does not exist in backtest era"
# Major banks — general corpus plus the Battery incumbent-entry/supply axis.
# They sit in their own 'banks' cluster, giving genuine cross-cluster independence vs bitcoin.
- id: co-jpm
  name: JPMorgan Chase
  kind: filing
  cluster: banks
  ticker: JPM
- id: co-bac
  name: Bank of America
  kind: filing
  cluster: banks
  ticker: BAC
- id: co-c
  name: Citigroup
  kind: filing
  cluster: banks
  ticker: C
- id: co-wfc
  name: Wells Fargo
  kind: filing
  cluster: banks
  ticker: WFC
- id: co-gs
  name: Goldman Sachs
  kind: filing
  cluster: banks
  ticker: GS
  notes: "Battery incumbent-entry: executed ONE BTC-collateralized loan Apr-2022 (token, not at-scale)."
- id: co-ms
  name: Morgan Stanley
  kind: filing
  cluster: banks
  ticker: MS
# ============================ PODCASTS (§7.4) ============================
# Podcast entries carry a `role` code instead of a `ticker`. The codes seen in this registry are
# IND, DX, CB and none; their meanings are not spelled out in this file.
# Macro/monetary shows — every entry in this group is in cluster macro.
- id: pod-oddlots
  name: Odd Lots
  kind: podcast
  cluster: macro
  role: IND
  notes: "highest-independence cross-domain"
- id: pod-forwardguidance
  name: Forward Guidance
  kind: podcast
  cluster: macro
  role: DX
- id: pod-macrovoices
  name: Macro Voices
  kind: podcast
  cluster: macro
  role: DX
  notes: "energy-heavy"
- id: pod-grantwilliams
  name: The Grant Williams Podcast
  kind: podcast
  cluster: macro
  role: IND
- id: pod-monetarymatters
  name: Monetary Matters
  kind: podcast
  cluster: macro
  role: DX
  notes: "launched ~2024 — thin backtest-era coverage"
- id: pod-hiddenforces
  name: Hidden Forces
  kind: podcast
  cluster: macro
  role: IND
  notes: "highest-independence cross-domain"
# AI/tech shows. The first four entries are in cluster ai_tech; BG2 and a16z are listed under
# this heading but are assigned cluster vc_consensus.
- id: pod-dwarkesh
  name: Dwarkesh Podcast
  kind: podcast
  cluster: ai_tech
  role: DX
  notes: "launched ~2023 — partial backtest-era coverage; highest-independence"
# NOTE(review): the note below calls No Priors a VC-consensus source, yet its cluster is ai_tech
# (BG2 / a16z use cluster vc_consensus) — confirm which assignment is intended.
- id: pod-nopriors
  name: No Priors
  kind: podcast
  cluster: ai_tech
  role: DX
  notes: "VC-consensus cluster — discount internal convergence"
- id: pod-latentspace
  name: Latent Space
  kind: podcast
  cluster: ai_tech
  role: DX
  notes: "technical; launched ~2023"
- id: pod-cognitiverev
  name: Cognitive Revolution
  kind: podcast
  cluster: ai_tech
  role: DX
- id: pod-bg2
  name: BG2
  kind: podcast
  cluster: vc_consensus
  role: DX
  notes: "launched ~2023; mild Ten31 correlation; VC-consensus"
- id: pod-a16z
  name: a16z Podcast
  kind: podcast
  cluster: vc_consensus
  role: DX
  notes: "crypto correlation; VC-consensus"
# Energy shows — every entry in this group is in cluster energy.
- id: pod-catalyst
  name: Catalyst w/ Shayle Kann
  kind: podcast
  cluster: energy
  role: DX
- id: pod-columbiaenergy
  name: Columbia Energy Exchange
  kind: podcast
  cluster: energy
  role: DX
- id: pod-doomberg
  name: Doomberg
  kind: podcast
  cluster: energy
  role: IND
# Bitcoin shows (limited, capped low — §4.5). Both entries set cluster_capped_low: true.
- id: pod-bitcoinlayer
  name: The Bitcoin Layer
  kind: podcast
  cluster: bitcoin
  role: DX
  cluster_capped_low: true
  notes: "macro-literate"
- id: pod-whatbitcoindid
  name: What Bitcoin Did
  kind: podcast
  cluster: bitcoin
  # Quoted so it reads unmistakably as the literal string "none", not a YAML null.
  role: "none"
  cluster_capped_low: true
# Generalist shows. All-In is listed under this heading but is assigned cluster vc_consensus;
# the other two entries are in cluster generalist.
- id: pod-allin
  name: All-In
  kind: podcast
  cluster: vc_consensus
  role: CB
  notes: "consensus barometer"
- id: pod-iltb
  name: Invest Like the Best
  kind: podcast
  cluster: generalist
  role: DX
  notes: "cross-domain"
- id: pod-lex
  name: Lex Fridman
  kind: podcast
  cluster: generalist
  # Quoted so it reads unmistakably as the literal string "none", not a YAML null.
  role: "none"
  notes: "wide reach, variable"