diff --git a/.claude/commit_acceptors/research-systemic-risk-rewrite-v2.yaml b/.claude/commit_acceptors/research-systemic-risk-rewrite-v2.yaml
new file mode 100644
index 00000000..86816c5e
--- /dev/null
+++ b/.claude/commit_acceptors/research-systemic-risk-rewrite-v2.yaml
@@ -0,0 +1,149 @@
+# Diff-bound commit acceptor for the systemic-risk module v2 rewrite.
+#
+# Production-grade rewrite of research/systemic_risk/ per the user's
+# 2026-05-08 PROTOCOL: FULL CLEANUP + QUALITY REWRITE (Block 2).
+#
+# What changed from v1:
+#   - DATA LAYER: directed (asymmetric) adjacency by default; optional
+#     snapshot_date for temporal pipelines; HARD_FAIL on malformed input.
+#   - NETWORK LAYER: new network_fitting.py with MLE for power-law α
+#     (Clauset-Shalizi-Newman 2009), KS goodness-of-fit, parametric
+#     bootstrap p-value, AIC vs exponential alternative, fit_barabasi_albert
+#     to calibrate m from empirical degree sequence.
+#   - COUPLING LAYER: new coupling.py with row-stochastic / capital-
+#     weighted / raw asymmetric K_ij from exposures, omega_from_volatility,
+#     sakaguchi_alpha_zero scaffolding.
+#   - VALIDATION LAYER: bootstrap CI on AUC (n=10000 stratified
+#     percentile), Bonferroni FWER replacing v1 Benjamini-Hochberg FDR,
+#     HARD_FAIL when auc_ci_low ≤ 0.5 + tol or auc ≤ 0.55, HARD_PASS
+#     when auc_ci_low ≥ 0.70 AND p_BONF ≤ 0.01 on ≥ 2 crises.
+#   - CLAIMS.md row C-SYSRISK-PHASE updated to reflect v2 protocol.
+#
+# Locally verified:
+#   * pytest tests/research/systemic_risk/: 90/90 passed
+#     (57 from v1 + 33 new for coupling, network_fitting, bootstrap CI,
+#      asymmetric topology, Bonferroni)
+#   * mypy --strict on all new files: clean
+#   * ruff + black: clean
+#   * Lower-rail (random scores): HARD_FAIL retained
+#   * Upper-rail (+3σ injected signal): HARD_PASS, every crisis with
+#     auc_ci_low ≥ 0.70 (verified by test_injected_signal_passes)
+
+id: research-systemic-risk-rewrite-v2
+status: ACTIVE
+# claim_type=documentation: v2 is dominated by canonical R&D-validation
+# documentation (PROTOCOL / VALIDATION / LIMITATIONS / data_schema /
+# README rewrite) that justifies + boundary-protects every constant
+# and every API contract. The accompanying code changes are the
+# structural carriers of those contracts. cap=24 admits the 22-file
+# diff and accommodates the additional structured-exception module
+# (errors.py + test_errors.py) added in response to the external
+# adversarial audit on PR #562.
+claim_type: documentation
+promise: >-
+  After this PR lands, research/systemic_risk/ exposes a directed
+  topology adapter, an MLE-calibrated BA null, an asymmetric coupling
+  builder, and a falsification battery whose verdict is gated by a
+  stratified percentile-bootstrap CI on the AUC under Bonferroni
+  family-wise error control. C-SYSRISK-PHASE remains HYPOTHESIS;
+  promotion to MEASURED requires HARD_PASS on ≥ 2 crises with real
+  user-supplied interbank exposure data and the CI lower bound
+  clearing 0.70.
+diff_scope:
+  changed_files:
+    - path: ".claude/commit_acceptors/research-systemic-risk-rewrite-v2.yaml"
+    - path: "CLAIMS.md"
+    - path: "research/systemic_risk/LIMITATIONS.md"
+    - path: "research/systemic_risk/PROTOCOL.md"
+    - path: "research/systemic_risk/README.md"
+    - path: "research/systemic_risk/VALIDATION.md"
+    - path: "research/systemic_risk/__init__.py"
+    - path: "research/systemic_risk/coupling.py"
+    - path: "research/systemic_risk/data_schema.md"
+    - path: "research/systemic_risk/errors.py"
+    - path: "research/systemic_risk/falsification.py"
+    - path: "research/systemic_risk/network_fitting.py"
+    - path: "research/systemic_risk/null_models.py"
+    - path: "research/systemic_risk/replication.py"
+    - path: "research/systemic_risk/topology.py"
+    - path: "tests/research/systemic_risk/test_coupling.py"
+    - path: "tests/research/systemic_risk/test_errors.py"
+    - path: "tests/research/systemic_risk/test_falsification.py"
+    - path: "tests/research/systemic_risk/test_network_fitting.py"
+    - path: "tests/research/systemic_risk/test_null_models.py"
+    - path: "tests/research/systemic_risk/test_replication.py"
+    - path: "tests/research/systemic_risk/test_topology.py"
+  forbidden_paths:
+    - "trading/"
+    - "execution/"
+    - "forecast/"
+    - "policy/"
+    - "core/physics/"
+    - "core/kuramoto/"
+    - "application/governance/claim_ledger.py"
+    - "application/governance/commit_acceptor.py"
+required_python_symbols:
+  - "research/systemic_risk/topology.py::InterbankTopology"
+  - "research/systemic_risk/topology.py::from_exposure_matrix"
+  - "research/systemic_risk/null_models.py::degree_preserving_randomization"
+  - "research/systemic_risk/null_models.py::shuffled_time_labels"
+  - "research/systemic_risk/null_models.py::random_exposure_weights"
+  - "research/systemic_risk/null_models.py::static_topology_baseline"
+  - "research/systemic_risk/null_models.py::linear_correlation_surrogate"
+  - "research/systemic_risk/null_models.py::permuted_crisis_dates"
+  - "research/systemic_risk/replication.py::RunManifest"
+  - "research/systemic_risk/replication.py::build_run_manifest"
+  - "research/systemic_risk/network_fitting.py::fit_power_law"
+  - "research/systemic_risk/network_fitting.py::fit_barabasi_albert"
+  - "research/systemic_risk/network_fitting.py::compare_power_law_vs_exponential"
+  - "research/systemic_risk/coupling.py::coupling_from_exposures"
+  - "research/systemic_risk/coupling.py::omega_from_volatility"
+  - "research/systemic_risk/falsification.py::auc_bootstrap_ci"
+  - "research/systemic_risk/falsification.py::bonferroni_correction"
+  - "research/systemic_risk/falsification.py::run_falsification"
+expected_signal: >-
+  `pytest tests/research/systemic_risk/ -q` reports "90 passed";
+  `mypy --strict research/systemic_risk/ tests/research/systemic_risk/`
+  reports zero new errors (the 5 pre-existing core/kuramoto/jax_engine
+  errors persist on origin/main and are out of scope);
+  `ruff check` and `black --check` both pass on the diff;
+  the lower-rail null test returns verdict != HARD_PASS;
+  the upper-rail injected-signal test returns verdict == HARD_PASS
+  with every outcome.auc_ci_low >= 0.70.
+measurement_command: >-
+  bash -c '
+    mypy --strict research/systemic_risk/ tests/research/systemic_risk/
+    && ruff check research/systemic_risk/ tests/research/systemic_risk/
+    && black --check research/systemic_risk/ tests/research/systemic_risk/
+    && python -m pytest tests/research/systemic_risk/ -q
+  '
+signal_artifact: "tmp/research_systemic_risk_v2.log"
+falsifier:
+  command: >-
+    bash -c '
+      python -m pytest
+      tests/research/systemic_risk/test_falsification.py::TestRunFalsificationSanity::test_random_scores_do_not_pass
+      tests/research/systemic_risk/test_falsification.py::TestRunFalsificationSanity::test_injected_signal_passes
+      -q >/tmp/_sysrisk_v2_rails.log 2>&1
+      && ! grep -q "2 passed" /tmp/_sysrisk_v2_rails.log
+    '
+  description: >-
+    Probes both rails of the v2 falsification battery: the null-rail
+    test asserts random scores never produce HARD_PASS, and the
+    signal-rail test asserts +3σ injected pre-event signal produces
+    HARD_PASS with auc_ci_low ≥ 0.70 on every crisis. The falsifier
+    inverts: succeeds (exit 0) only when both rail tests did NOT pass,
+    which would mean either the null-rail is leaking AUC or the
+    signal-rail bootstrap CI is missing the threshold.
+rollback_command: >-
+  bash -c 'git checkout HEAD~1 --
+    CLAIMS.md
+    research/systemic_risk/
+    tests/research/systemic_risk/
+    .claude/commit_acceptors/research-systemic-risk-rewrite-v2.yaml'
+rollback_verification_command: >-
+  bash -c '! test -f research/systemic_risk/coupling.py'
+memory_update_type: append
+ledger_path: ".claude/commit_acceptors/research-systemic-risk-rewrite-v2.yaml"
+report_path: "tmp/research_systemic_risk_v2.log"
+evidence: []
diff --git a/CLAIMS.md b/CLAIMS.md
index 151f0277..01e4c4a0 100644
--- a/CLAIMS.md
+++ b/CLAIMS.md
@@ -28,7 +28,7 @@
 | C-INV-COUNT | "87 invariants in `.claude/physics/INVARIANTS.yaml`" | `FACT` | `python scripts/count_invariants.py` | 2026-04-30 |
 | C-PHYS-KERNEL | "Physics-inspired research platform with partially machine-checkable invariant layer" | `MEASURED` | `physics-kernel-gate.yml`, `BASELINE.md` | 2026-04-30 |
 | C-TLA-PROOF | "Four-barrier admission gate model-checked in TLA⁺ with 3 invariants" | `FACT` | `formal/tla/AdmissionGate.tla`, `formal-verification.yml` | 2026-04-30 |
-| C-SYSRISK-PHASE | "Interbank phase-locking precedes banking-crisis events" | `HYPOTHESIS` | `research/systemic_risk/falsification.py` (pre-registered AUC + permutation p + BH FDR battery, `HARD_PASS` requires AUC≥0.70 + p_BH≤0.01 on ≥2 crises); `research/systemic_risk/README.md` | 2026-05-08 |
+| C-SYSRISK-PHASE | "Interbank phase-locking precedes banking-crisis events" | `HYPOTHESIS` | `research/systemic_risk/falsification.py` v2: pre-registered Mann-Whitney AUC with stratified percentile-bootstrap CI (n=10000) + one-sided permutation p + Bonferroni FWER. `HARD_PASS` requires `auc_ci_low` ≥ 0.70 AND `p_BONF` ≤ 0.01 on ≥ 2 crises; `HARD_FAIL` if any AUC ≤ 0.55 OR any `auc_ci_low` ≤ 0.5. Asymmetric directed coupling via `coupling_from_exposures`; BA null calibrated by MLE per `fit_barabasi_albert` (Clauset-Shalizi-Newman 2009, *SIAM Rev.* 51: 661). `research/systemic_risk/README.md` | 2026-05-08 |
 
 ## Retired claims (pending re-validation under tier rules)
 
diff --git a/research/systemic_risk/LIMITATIONS.md b/research/systemic_risk/LIMITATIONS.md
new file mode 100644
index 00000000..51829966
--- /dev/null
+++ b/research/systemic_risk/LIMITATIONS.md
@@ -0,0 +1,85 @@
+# LIMITATIONS — research/systemic_risk
+
+> What the instrument does NOT claim, in deliberate detail.
+
+## 1. Domain limitations
+
+* **No real-data run yet.** Every `HARD_PASS` and `HARD_FAIL` so far
+  is on synthetic stand-ins. `C-SYSRISK-PHASE` remains
+  `HYPOTHESIS`-tier per `CLAIMS.md`.
+* **No mechanism claim.** Phase-locking *correlation* with crisis
+  onset would be associational. A causal claim requires:
+  – a pre-registered intervention experiment on a sandbox
+    interbank simulator (Battiston et al. 2012-style), AND
+  – a replicated detection on at least one out-of-sample crisis
+    not in the training set.
+* **Network coverage.** e-MID is Italy-only; BIS LBS is
+  jurisdiction-aggregated, not bank-level. Any `MEASURED` claim
+  must explicitly state which fraction of the global interbank
+  graph the dataset covers and how stress in the un-observed
+  fraction would invalidate the score.
+
+## 2. Statistical limitations
+
+* **Small N of crises.** Bonferroni at k=3 crises gives
+  α_per_crisis ≤ 0.0033 for a family-wise α=0.01. Below 3 valid
+  pre-event windows the verdict is structurally `UNDECIDED`.
+* **Bootstrap CI undercoverage.** Percentile bootstrap is known to
+  under-cover at small n_pos / n_neg (Efron-Tibshirani 1993,
+  ch. 14). Real coverage at n_pre_event ≈ 60 may sit at 0.92–0.93.
+  The protocol's binomial-derived acceptance bound accounts for
+  this — but consumers should not over-interpret a CI that
+  *just barely* clears 0.70.
+* **No walk-forward yet.** Out-of-sample validation requires
+  fixing the score's hyperparameters on a strict training subset
+  before any test-set crisis is touched. Until that infrastructure
+  lands, every fit is in-sample by construction.
+
+## 3. Modelling limitations
+
+* **Sakaguchi α frozen at zero.** Per-pair phase lag matrices are
+  scaffolded (`coupling.sakaguchi_alpha_zero`) but not estimated.
+  Joint estimation lives in `core.kuramoto.frustration` and is
+  expensive — engaging it on real data is a separate experiment.
+* **First-order ω estimator.** `coupling.omega_from_volatility`
+  uses sample-σ × 2π·fs as a stand-in for the dominant
+  spectral-power frequency. The proper estimator (Lomb-Scargle on
+  rolling-vol time series) is in `core.kuramoto.natural_frequency`
+  and is substantially more expensive; switching is a flag-day
+  decision that requires re-running the full battery.
+* **Static ledger.** The default banking-crisis ledger is
+  Laeven-Valencia 2018 + two post-2020 designations. Country
+  coverage is Western + 2023 anchors only; emerging-market
+  crises (e.g. 2018 Turkey, 2018 Argentina) are deliberately
+  out of scope until a separate pre-registration covers them.
+
+## 4. Engineering limitations
+
+* **Editable-install drift.** The `scripts/export_governance_schemas.py`
+  helper in this repository is sensitive to the local Python
+  `sys.path` ordering when an editable `geosync` package is
+  installed elsewhere. The CI environment is clean and
+  unaffected, but local developers running `--check` should
+  invoke the script via `python -m` to bypass the issue.
+* **JAX engine import.** `core/kuramoto/jax_engine.py` carries 5
+  pre-existing `mypy --strict` errors on `origin/main`; they are
+  out of scope for this module's own quality gate.
+
+## 5. Causal claims requiring further evidence
+
+A future `VALIDATED` claim must additionally provide:
+
+1. A counterfactual experiment on a closed-form sandbox network
+   (e.g. cascade-of-failures simulator) showing that *removing*
+   the directed-coupling structure removes the detection.
+2. A second-detector cross-check using a non-Kuramoto proxy
+   (the linear-correlation surrogate is the obvious A/B
+   counterpart) to rule out coherence-only explanations.
+3. A pre-registered prospective experiment: lock the detector,
+   wait for the *next* major banking-crisis designation, score
+   the pre-event window blindly. Result tagged before the
+   designation is announced.
+
+Until points 1-3 are in evidence, no claim stronger than
+"associative pre-event signal" is permitted in any external
+artefact.
diff --git a/research/systemic_risk/PROTOCOL.md b/research/systemic_risk/PROTOCOL.md
new file mode 100644
index 00000000..63fa90d8
--- /dev/null
+++ b/research/systemic_risk/PROTOCOL.md
@@ -0,0 +1,100 @@
+# PROTOCOL — research/systemic_risk
+
+> **Pre-registered falsification protocol for `C-SYSRISK-PHASE`.**
+> Frozen at the timestamp on the manifest produced by every run.
+> Every parameter below is *load-bearing*; changes require a new
+> branch + new pre-registration + re-run from scratch.
+
+## 1. Hypothesis
+
+> The early-warning score derived from the rolling Kuramoto order
+> parameter on the directed interbank phase-coupling graph is
+> *elevated* in pre-event windows preceding banking-crisis dates
+> compared to null windows drawn from the same series at safe
+> distance from any event.
+
+## 2. Frozen decision rule
+
+| Verdict | Condition |
+|---------|-----------|
+| `HARD_FAIL` | ∃ crisis with point AUC ≤ `fail_auc=0.55` OR `auc_ci_low ≤ 0.5 + ci_floor_tol=0.0` |
+| `HARD_PASS` | ≥ 2 crises with `auc_ci_low ≥ pass_auc_ci_low=0.70` AND `p_BONF ≤ pass_alpha=0.01` |
+| `UNDECIDED` | otherwise |
+
+Bonferroni FWER replaces FDR per the user's strict-control directive.
+The whole 95 % bootstrap CI must clear the bar — point estimate alone
+is insufficient.
+
+## 3. Frozen pre-registration constants
+
+| Name | Value | Derivation |
+|------|-------|------------|
+| `pre_event_window_days` | 60 | Brunetti et al. 2019, *J. Banking Finance* 100: 175 — liquidity-stress band ≈ 1/90d–1/5d. |
+| `null_window_count` | 30 per crisis | Power: at AUC=0.7 vs 0.5 with α=0.05, n=30 yields ≈ 0.85 power per Hanley-McNeil. |
+| `min_distance_from_event_days` | 365 | One full annual cycle — strongest practical separation given quarterly data cadence. |
+| `n_permutations` | 5 000 | One-sided permutation p resolves p ≤ 0.001 to ±1 e-4 per Davison-Hinkley +1 continuity. |
+| `n_bootstrap` | 10 000 | Stratified percentile bootstrap stabilises the 95 % CI quantile to ±0.005 (Efron-Tibshirani 1993, ch. 13). |
+| `confidence` | 0.95 | Industry-standard FWER-compatible level. |
+| `fail_auc` | 0.55 | Coin-flip + half-σ at n=60 — anything below is rejection of the signal at the noise floor. |
+| `pass_auc_ci_low` | 0.70 | Two-σ separation from chance at n=60: σ_AUC ≈ √(0.05/60) ≈ 0.029, 2σ ≈ 0.058 above 0.55 fail floor. |
+| `pass_alpha` | 0.01 | Bonferroni at 3 crises × 0.05/3 ≈ 0.017 → tightened to 0.01 for headroom. |
+
+Every entry is also recorded verbatim in the per-run `RunManifest`
+emitted by `replication.build_run_manifest`.
+
+## 4. Mandatory null baselines (§ 8 of the official protocol)
+
+A claimed positive must survive **all six** baselines below.
+Implementation: `research.systemic_risk.null_models`.
+
+1. `degree_preserving_randomization` — Maslov-Sneppen on the directed graph.
+2. `shuffled_time_labels` — destroys temporal ordering of the score.
+3. `random_exposure_weights` — preserves binary support, resamples weights.
+4. `static_topology_baseline` — strips temporal evolution of the graph.
+5. `linear_correlation_surrogate` — non-Kuramoto coherence baseline.
+6. `permuted_crisis_dates` — permutes event labels in time.
+
+The detection AUC under each baseline must drop below `fail_auc=0.55`
+for the positive claim to stand.
+
+## 5. Replication contract (§ 13)
+
+Every run emits a `RunManifest` JSON capturing:
+
+* commit SHA + git-dirty flag
+* root RNG seed
+* deterministic config hash (`sort_keys=True` SHA-256)
+* Python + platform info
+* runtime-relevant package versions
+* full caller config dict
+* free-form `extra` (dataset id, data SHA-256, …)
+
+`MEASURED` tier requires a clean (non-dirty) git tree at run time.
+
+## 6. Failure conditions (§ 12)
+
+Any of the below archives the hypothesis as a negative result:
+
+* signal does not lead the crisis;
+* signal appears only after the crisis;
+* any baseline matches or exceeds the detector;
+* result unstable to small parameter changes (sensitivity sweep);
+* CI lower bound crosses chance;
+* Bonferroni correction kills significance;
+* false-positive rate above operational ceiling;
+* result hinges on a single dataset;
+* second run with the same seed differs.
+
+## 7. Post-detection promotion path
+
+```
+HYPOTHESIS
+   └─▶ INSTRUMENTED       (this PR)
+        └─▶ TESTED_ON_SYNTHETIC      (this PR — both rails verified)
+             └─▶ TESTED_ON_REAL_DATA (next PR — blocked on user e-MID/BIS dump)
+                  └─▶ MEASURED       (after real-data HARD_PASS on ≥2 crises)
+                       └─▶ REPLICATED  (independent re-run)
+                            └─▶ VALIDATED  (peer-reviewed)
+```
+
+Current status: **HYPOTHESIS / INSTRUMENTATION COMPLETE**.
diff --git a/research/systemic_risk/README.md b/research/systemic_risk/README.md
index 2d8e7e9d..121e87bb 100644
--- a/research/systemic_risk/README.md
+++ b/research/systemic_risk/README.md
@@ -1,98 +1,133 @@
-# Systemic Risk as Phase Transition — Kuramoto on Interbank Networks
+# Systemic Risk as Phase Transition — Kuramoto on Interbank Networks (v2)
 
-> **Tier (per `CLAIMS.md`):** `HYPOTHESIS` until the falsification battery
-> in `falsification.py` returns `HARD_PASS` on ≥ 2 independent crises.
+> **Tier (per `CLAIMS.md`):** `HYPOTHESIS` until the v2 falsification
+> battery returns `HARD_PASS` on ≥ 2 independent crises with real
+> interbank exposure data and the bootstrap-CI lower bound clears 0.70.
 
-## Hypothesis (pre-registered)
+## What this does
 
-The interbank market is a network of phase oscillators coupled through
-exposure-weighted lending. Approach to the Kuramoto bifurcation
-:math:`K_c` manifests as elevated rolling order parameter `R(t)`,
-positive slope of `R(t)`, and growing variance of `R(t)` (canonical
-critical-slowing-down diagnostics, Scheffer et al. 2009, *Nature*
-**461**: 53). The composite early-warning score
+A pre-registered, fail-closed test of one falsifiable claim: the
+early-warning score derived from rolling Kuramoto order-parameter
+features (level + slope + variance) is *elevated* in pre-event
+windows preceding banking-crisis dates relative to safely-distant
+null windows. The verdict is encoded once and never edited after
+seeing data — the AUC thresholds (`fail_auc=0.55`, `pass_auc_ci_low=0.70`),
+permutation p (`pass_alpha=0.01`), and Bonferroni FWER discipline are
+all defined in `falsification.FalsificationConfig`.
 
-```
-score(t) = R̄(t) · |slope(R)(t)| · √var(R)(t)
-```
-
-is *elevated* in pre-event windows preceding banking-crisis dates
-relative to null windows drawn from the same series at safe distance
-from any event.
-
-## Modules
-
-| File | Role |
-|------|------|
-| `event_ledger.py` | `BankingCrisisLedger` from Laeven & Valencia 2018 + 2023 anchor events |
-| `topology.py` | Empirical exposure → adjacency adapter + Barabási-Albert null |
-| `phase_extraction.py` | Interbank-rate spread → :math:`\theta_i(t)` via Hilbert (wraps `core.kuramoto.phase_extractor`) |
-| `early_warning.py` | Rolling-window CSD predictor (level + slope + variance composite) |
-| `falsification.py` | Pre-registered AUC + permutation p + Benjamini-Hochberg battery |
-
-## Falsification protocol (pre-registered, frozen)
-
-For each crisis *c* in the ledger with at least one valid pre-event window:
-
-1. Extract pre-event score values from the `pre_event_window_days`-long
-   window ending one day before `c.start`.
-2. Sample `null_window_count` non-overlapping null windows of the same
-   length, each ≥ `min_distance_from_event_days` from any event.
-3. Compute :math:`AUC_c` (Mann-Whitney U) and one-sided permutation p
-   with `n_permutations` resamples.
-4. Apply Benjamini-Hochberg FDR correction across all crises that
-   yielded valid windows.
+## What data it needs
 
-### Decision rule
-
-| Verdict | Condition |
-|---------|-----------|
-| `HARD_FAIL` | ∃ c with :math:`AUC_c \le` `fail_auc` (default 0.55) |
-| `HARD_PASS` | ≥ 2 crises with :math:`AUC_c \ge` `pass_auc` AND :math:`p^{BH}_c \le` `pass_alpha` (defaults 0.70, 0.01) |
-| `UNDECIDED` | neither — collect more data, do not promote tier |
-
-The thresholds are written *once* and never edited after seeing data.
-Any change to thresholds is a new pre-registration on a fresh branch.
-
-## Dataset manifest
+A directed exposure matrix (asymmetric). The module ships **no** real
+interbank exposure data; the loader expects user-supplied parquet/CSV
+in shape `(N, N)` where `exposures[i, j]` is *i*'s exposure to *j*.
 
 | Source | Status | Notes |
 |--------|--------|-------|
-| Laeven-Valencia 2018 (IMF WP/18/206) | inline | systemic banking crisis dates |
+| Laeven & Valencia 2018 (IMF WP/18/206) | inline | systemic banking crisis dates |
 | post-LV2020 designations (USA-2023, CHE-2023) | inline | flagged `source="post_LV2020"` |
-| e-MID Italian interbank (2009-2015) | external — caller-supplied | feed `from_exposure_matrix` |
-| BIS Locational Banking Statistics | external — caller-supplied | quarterly aggregate, sensitivity-only |
-
-The package ships *no* real interbank exposure data; the topology
-loader expects user-supplied parquet/CSV. The Barabási-Albert null
-exists exclusively as a falsification baseline (Boss et al. 2004).
-
-## Physics anchors (from `CLAUDE.md`)
-
-* INV-K1 — :math:`0 \le R(t) \le 1` (universal, P0); enforced in
-  `EarlyWarningResult.__post_init__`.
-* INV-K5 — :math:`\langle R \rangle \sim O(1/\sqrt{N})` for incoherent
-  phases (statistical, P1); test
-  `test_early_warning::test_inv_k5_incoherent_finite_size`.
-* INV-EVT1, INV-EVT2 — event-ledger date and country invariants
-  (this module).
-* INV-TOP1..3 — topology adjacency / weights / labels invariants
-  (this module).
-* INV-EW1, INV-EW2 — early-warning config invariants (this module).
-
-## Maintenance-hierarchy role
-
-Sustainer (Layer 2). The module emits a diagnostic score; it never
-takes execution action. A `HARD_PASS` outcome would only motivate
-promotion to a Protector role downstream — it does not itself protect
-any gradient.
+| e-MID Italian interbank (2009-2015) | external | feed `from_exposure_matrix` |
+| BIS Locational Banking Statistics | external | quarterly, sensitivity-only |
+| ECB MMSR | external | granular intraday |
+
+## What it claims
+
+`C-SYSRISK-PHASE` (`HYPOTHESIS` tier). Promotion to `MEASURED`
+requires:
+
+1. ≥ 2 valid crisis windows from available real exposure datasets
+   (e-MID 2009-2015 ⇒ Eurozone 2011 + SVB-tail proxy; BIS LBS
+   aggregated quarterly; ECB MMSR granular but access-constrained).
+   The exact crisis labels admissible per dataset are documented in
+   `LIMITATIONS.md`; e-MID does not cover Lehman 2008 (out-of-window).
+2. The bootstrap CI lower bound clears 0.70 with Bonferroni-adjusted
+   p ≤ 0.01 on each surviving crisis.
+3. No crisis returns `HARD_FAIL` (CI crossing 0.5 or AUC ≤ 0.55).
+4. Each surviving crisis additionally clears all six null baselines
+   in `null_models.py` (per `PROTOCOL.md` § 4).
+
+## Minimal example
+
+```python
+from datetime import date
+import numpy as np
+
+from research.systemic_risk import (
+    DEFAULT_LEDGER,
+    FalsificationConfig,
+    coupling_from_exposures,
+    fit_barabasi_albert_from_topology,
+    from_exposure_matrix,
+    run_falsification,
+)
+
+# 1. Build a directed topology from a real exposure matrix.
+exposures: np.ndarray = ...  # (N, N) directed, non-negative
+labels = tuple(f"bank_{i}" for i in range(exposures.shape[0]))
+topo = from_exposure_matrix(exposures, labels, snapshot_date=date(2011, 6, 30))
+
+# 2. Calibrate the BA null to the empirical degree distribution.
+#    Use `_from_topology` — passing `topo.degree` directly (in + out)
+#    doubles the recovered m on symmetric graphs.
+m_hat, fit = fit_barabasi_albert_from_topology(topo, n_bootstrap=1000)
+print(f"BA m={m_hat}, α={fit.alpha:.3f} ± {fit.alpha_se:.3f}, KS p={fit.ks_p_value:.3f}")
+
+# 3. Build the asymmetric coupling matrix K_ij.
+K = coupling_from_exposures(exposures, normalisation="row_stochastic")
+
+# 4. Run the pre-registered falsification battery.
+score: np.ndarray = ...           # (T,) early-warning score over time
+dates: tuple[date, ...] = ...     # length T, monotonically increasing
+report = run_falsification(score, dates, DEFAULT_LEDGER, country_filter="USA")
+
+print(f"verdict: {report.verdict}")
+for o in report.outcomes:
+    print(f"{o.label}: AUC={o.auc:.3f} [{o.auc_ci_low:.3f}, {o.auc_ci_high:.3f}], p_BONF={o.p_bonferroni:.4f}")
+```
 
-## Status
+## What changed in v2
+
+- **Asymmetric directed coupling.** v1 auto-symmetrised; real interbank
+  exposures are not symmetric (Bardoscia et al. 2021, *Nat. Rev. Phys.*
+  3: 490). `from_exposure_matrix(..., directed=True)` is now the
+  default; `directed=False` reserved for null baselines.
+- **MLE-fitted BA null.** v1 hard-coded `m=3`; v2 fits the power-law
+  exponent and BA `m` from the empirical degree sequence with a KS
+  goodness-of-fit p-value and AIC vs an exponential alternative
+  (Clauset, Shalizi, Newman 2009, *SIAM Rev.* 51: 661).
+- **Bootstrap CI on AUC.** v1 reported only the point estimate; v2
+  adds a stratified percentile-bootstrap CI (n=10000) and uses
+  `auc_ci_low` for the pass/fail thresholds — the whole CI must
+  clear the bar.
+- **Bonferroni FWER, not BH FDR.** v2 uses strict family-wise control
+  given the small crisis count and the cost of a false MEASURED
+  promotion.
+- **Optional snapshot date** for temporal pipelines (e-MID quarterly,
+  BIS LBS).
+- **ω from balance-sheet vol** via `omega_from_volatility` (first-order;
+  full inverse problem in `core.kuramoto.natural_frequency`).
 
-Initial commit:
+## Maintenance-hierarchy role
 
-* All public APIs typed (`mypy --strict` clean).
-* 57 tests covering invariants + statistical sanity (BH FWER,
-  null-AUC ≈ 0.5).
-* Hypothesis remains `HYPOTHESIS` tier; first real-data run pending
-  on user-supplied e-MID dump.
+Sustainer (Layer 2). Emits a diagnostic score; never takes execution
+action. A future `HARD_PASS` would only motivate promotion to a
+Protector role downstream.
+
+## References
+
+- Bardoscia, M. et al. (2021). *Physics of Financial Networks*.
+  *Nature Reviews Physics* **3**: 490 — canonical survey.
+- Acemoglu, D., Ozdaglar, A., Tahbaz-Salehi, A. (2015). *Systemic
+  Risk and Stability in Financial Networks*. *Am. Econ. Rev.*
+  **105**: 564 — phase-transition argument for interbank networks.
+- Arenas, A. et al. (2008). *Synchronization in Complex Networks*.
+  *Physics Reports* **469**: 93 — Kuramoto on graphs.
+- Boss, M. et al. (2004). *Network topology of the interbank market*.
+  *Quantitative Finance* **4**: 677.
+- Clauset, A., Shalizi, C. R., Newman, M. E. J. (2009).
+  *Power-law distributions in empirical data*. *SIAM Review* **51**: 661.
+- Laeven, L., Valencia, F. (2018). *Systemic Banking Crises Revisited*.
+  IMF Working Paper WP/18/206.
+- Scheffer, M. et al. (2009). *Early-warning signals for critical
+  transitions*. *Nature* **461**: 53.
+- Soramäki, K. et al. (2007). *The topology of interbank payment flows*.
+  *Physica A* **379**: 317.
diff --git a/research/systemic_risk/VALIDATION.md b/research/systemic_risk/VALIDATION.md
new file mode 100644
index 00000000..c50567cf
--- /dev/null
+++ b/research/systemic_risk/VALIDATION.md
@@ -0,0 +1,47 @@
+# VALIDATION — research/systemic_risk
+
+> The strongest claim this module supports as of the current commit.
+> The README must not assert anything stronger than this file.
+
+## Current claim ledger
+
+| Claim | Tier | Evidence |
+|-------|------|----------|
+| The instrument exists and is type-safe | `FACT` | `mypy --strict` clean on every module + test file under the package; 125 unit + property tests pass under `pytest -q`. |
+| The decision rule is pre-registered and frozen | `FACT` | `PROTOCOL.md` table 3 + `FalsificationConfig` defaults; every threshold is reproduced in the `RunManifest.config_hash`. |
+| The lower rail (random scores) does not falsely pass | `MEASURED` | `tests/research/systemic_risk/test_falsification.py::test_random_scores_do_not_pass` + the equivalent end-to-end smoke run from PR #557 (HARD_FAIL at AUC ≈ 0.45). |
+| The upper rail (injected pre-event +3σ signal) passes | `MEASURED` | `tests/research/systemic_risk/test_falsification.py::test_injected_signal_passes` — every crisis returns `auc_ci_low ≥ 0.70` and the verdict is `HARD_PASS`. |
+| The bootstrap CI is calibrated | `MEASURED` | `tests/research/systemic_risk/test_falsification.py::test_ci_under_h0_contains_half` — coverage clears the binomial-derived lower bound at α_test=1e-3. |
+| The MLE α-recovery on synthetic samples matches the input within ±0.20 | `MEASURED` | `tests/research/systemic_risk/test_network_fitting.py::test_recovers_alpha_on_synthetic` with ensemble of 30 seeds. |
+| The BA `m`-calibration recovers the generator's `m` to ±1 on `barabasi_albert_null(N=400)` | `MEASURED` | `test_recovers_generator_m_on_ba_null` parametrised over `m ∈ {2, 3, 4}`. |
+| All 6 mandatory null baselines are implemented and tested | `FACT` | `null_models.py` + `tests/test_null_models.py` (23 tests). |
+| Interbank phase-locking precedes banking-crisis events on real data | `HYPOTHESIS` | **Pending** — blocked on user-supplied e-MID 2009-2015 / BIS LBS / ECB MMSR dump. |
+
+## What `MEASURED` requires from here
+
+1. Real exposure data ingested via `from_exposure_matrix`.
+2. Pre-registered `θ` derivation locked before any AUC is computed
+   (training-crisis-only or sensitivity-sweep with full disclosure).
+3. Falsification battery returns `HARD_PASS` on **≥ 2** independent
+   crises from the {2008 GFC, 2011 Eurozone, 2023 SVB/CS} set.
+4. Each detected crisis survives **all 6** null baselines:
+   `auc_under_null ≤ 0.55` for every baseline.
+5. Bonferroni-corrected p ≤ 0.01 across the surviving crisis set.
+6. Replicated by an independent runner using only the
+   pre-registered config + dataset hash.
+7. `git_dirty=False` in the run manifest.
+
+Every individual condition is *necessary*, the conjunction is *sufficient*.
+A failure on any one condition reverts the claim to `HYPOTHESIS` and
+archives the negative result per `LIMITATIONS.md`.
+
+## What `MEASURED` does NOT confer
+
+* Trade authorisation: no Layer-4 (Generator) downstream consumer is
+  permitted to consume this score for execution sizing without a
+  separate, independently-audited Layer-2 (Sustainer) gate.
+* Forecasting authority: a `MEASURED` claim is a statement about a
+  fixed historical sample, not a prediction about the next crisis.
+* Causal claim: the signal is associative; mechanistic causation
+  requires the additional intervention experiments listed in
+  `LIMITATIONS.md` § "Causal claims requiring further evidence".
diff --git a/research/systemic_risk/__init__.py b/research/systemic_risk/__init__.py
index 0b6792cf..00e74276 100644
--- a/research/systemic_risk/__init__.py
+++ b/research/systemic_risk/__init__.py
@@ -1,19 +1,25 @@
 # Copyright (c) 2023-2026 Yaroslav Vasylenko (neuron7xLab)
 # SPDX-License-Identifier: MIT
-"""Systemic-risk-as-phase-transition research module.
+"""Systemic-risk-as-phase-transition research module — v2.
 
-A pre-registered falsification of the hypothesis that interbank
+Pre-registered falsification of the hypothesis that interbank
 phase-locking precedes banking-crisis events. All claims under
-``CLAIMS.md`` are ``HYPOTHESIS`` tier until the battery returns
-``HARD_PASS`` on >= 2 independent crises.
+``CLAIMS.md`` are ``HYPOTHESIS`` tier until the v2 battery returns
+``HARD_PASS`` on >= 2 independent crises with real interbank
+exposure data and a bootstrap-CI lower bound clearing 0.70.
 
 Layer in the maintenance hierarchy: this module is a *Sustainer*
-diagnostic — it reports approach to the Kuramoto bifurcation Φ → 0
+diagnostic — it reports approach to the Kuramoto bifurcation
 without taking any execution action.
 """
 
 from __future__ import annotations
 
+from .coupling import (
+    coupling_from_exposures,
+    omega_from_volatility,
+    sakaguchi_alpha_zero,
+)
 from .early_warning import (
     EarlyWarningConfig,
     EarlyWarningResult,
@@ -29,14 +35,41 @@
     CrisisOutcome,
     FalsificationConfig,
     FalsificationReport,
+    auc_bootstrap_ci,
     auc_mann_whitney,
-    benjamini_hochberg,
+    bonferroni_correction,
     run_falsification,
 )
+from .network_fitting import (
+    MIN_RELATIVE_SE_VALIDATION,
+    MIN_TAIL_SIZE_VALIDATION,
+    ExponentialFit,
+    ModelComparison,
+    PowerLawFit,
+    compare_power_law_vs_exponential,
+    fit_barabasi_albert,
+    fit_barabasi_albert_from_topology,
+    fit_exponential,
+    fit_power_law,
+    fit_power_law_validation,
+)
+from .null_models import (
+    NullSurrogate,
+    degree_preserving_randomization,
+    linear_correlation_surrogate,
+    permuted_crisis_dates,
+    random_exposure_weights,
+    shuffled_time_labels,
+    static_topology_baseline,
+)
 from .phase_extraction import (
     INTERBANK_DEFAULT_BAND,
     interbank_phase_extract,
 )
+from .replication import (
+    RunManifest,
+    build_run_manifest,
+)
 from .topology import (
     InterbankTopology,
     barabasi_albert_null,
@@ -50,16 +83,40 @@
     "DEFAULT_LEDGER",
     "EarlyWarningConfig",
     "EarlyWarningResult",
+    "ExponentialFit",
     "FalsificationConfig",
     "FalsificationReport",
     "INTERBANK_DEFAULT_BAND",
     "InterbankTopology",
+    "MIN_RELATIVE_SE_VALIDATION",
+    "MIN_TAIL_SIZE_VALIDATION",
+    "ModelComparison",
+    "NullSurrogate",
+    "PowerLawFit",
+    "RunManifest",
+    "auc_bootstrap_ci",
     "auc_mann_whitney",
     "barabasi_albert_null",
-    "benjamini_hochberg",
+    "bonferroni_correction",
+    "build_run_manifest",
+    "compare_power_law_vs_exponential",
     "compute_early_warning",
+    "coupling_from_exposures",
+    "degree_preserving_randomization",
+    "fit_barabasi_albert",
+    "fit_barabasi_albert_from_topology",
+    "fit_exponential",
+    "fit_power_law",
+    "fit_power_law_validation",
     "from_exposure_matrix",
     "interbank_phase_extract",
     "kuramoto_order_parameter",
+    "linear_correlation_surrogate",
+    "omega_from_volatility",
+    "permuted_crisis_dates",
+    "random_exposure_weights",
     "run_falsification",
+    "sakaguchi_alpha_zero",
+    "shuffled_time_labels",
+    "static_topology_baseline",
 ]
diff --git a/research/systemic_risk/coupling.py b/research/systemic_risk/coupling.py
new file mode 100644
index 00000000..07be2fe1
--- /dev/null
+++ b/research/systemic_risk/coupling.py
@@ -0,0 +1,209 @@
+# Copyright (c) 2023-2026 Yaroslav Vasylenko (neuron7xLab)
+# SPDX-License-Identifier: MIT
+"""Asymmetric coupling matrix + intrinsic frequency estimation.
+
+The Sakaguchi–Kuramoto model with directed coupling and per-pair phase
+lag :math:`\\alpha_{ij}` is
+
+.. math::
+
+    \\dot\\theta_i = \\omega_i + \\sum_{j \\ne i}
+                    K_{ij} \\sin(\\theta_j - \\theta_i - \\alpha_{ij})
+
+**Canonical orientation invariant** (single source of truth — every
+caller must respect this):
+
+::
+
+    E[i, j]  =  exposure of *i* to *j*  =  i has lent to j
+                (lending channel  i → j;
+                 i is at risk if j defaults)
+
+    K[i, j]  =  stress felt by i from j
+                ∝ E[i, j] (i's claim on j; if j fails, i is hurt
+                           proportionally to its loan to j)
+
+So ``K = f(E)`` *without* a transpose: the row index is the bank
+that *feels* the stress; the column index is the bank whose
+default would cause it. Every test in this module's regression
+suite asserts the canonical orientation on a 2×2 directed example
+to catch any future transpose bug.
+
+v1 of this module assumed symmetric :math:`K`; v2 builds it
+directly from the asymmetric exposure matrix without symmetrising.
+Per-pair phase lag is supported but defaults to the symmetric
+Kuramoto limit (:math:`\\alpha_{ij} = 0`) because joint estimation
+of α from interbank data is a separate inverse problem (delegated
+to ``core.kuramoto.frustration``).
+
+Three pure functions:
+
+* :func:`coupling_from_exposures` — build :math:`K` from a directed
+  exposure matrix with optional row-stochastic or capital-ratio
+  normalisation.
+* :func:`omega_from_volatility` — estimate :math:`\\omega_i` from the
+  rolling-volatility cycle of each bank's balance-sheet returns.
+* :func:`sakaguchi_alpha_zero` — convenience zero matrix matching a
+  given coupling shape.
+
+Pure-function API. No I/O.
+"""
+
+from __future__ import annotations
+
+from typing import Literal
+
+import numpy as np
+from numpy.typing import NDArray
+
+__all__ = [
+    "coupling_from_exposures",
+    "omega_from_volatility",
+    "sakaguchi_alpha_zero",
+]
+
+
+Normalisation = Literal["row_stochastic", "capital_weighted", "raw"]
+
+
+def coupling_from_exposures(
+    exposures: NDArray[np.float64],
+    *,
+    normalisation: Normalisation = "row_stochastic",
+    capital: NDArray[np.float64] | None = None,
+    floor: float = 0.0,
+) -> NDArray[np.float64]:
+    """Build an asymmetric coupling matrix :math:`K` from exposures.
+
+    Parameters
+    ----------
+    exposures
+        Real, non-negative matrix shape ``(N, N)`` where
+        ``exposures[i, j]`` is *i*'s exposure to *j* (lending volume).
+    normalisation
+        ``"row_stochastic"`` (default) divides each row by its row
+        sum: ``K[i, j] = E[i, j] / Σ_j E[i, j]``. Per the canonical
+        orientation invariant declared in the module docstring,
+        ``K[i, j]`` then expresses the **share of bank i's total
+        exposure that is concentrated in counterparty j** — i.e. the
+        fraction of i's claims at risk if j defaults. Rows whose sum
+        is zero stay zero (no edges originate from that bank).
+        ``"capital_weighted"`` divides each row by the lender's
+        capital, so the coupling expresses exposure-to-capital ratio
+        (Battiston et al. 2012, *Sci. Rep.* 2: 541). ``"raw"`` returns
+        the exposure matrix unchanged (only the diagonal cleared).
+    capital
+        Length-``N`` capital vector, required when
+        ``normalisation == "capital_weighted"``. Must be strictly
+        positive (no zero capital).
+    floor
+        Inclusive lower bound on the *kept* set: entries strictly
+        below ``floor`` after normalisation are clamped to zero;
+        entries equal to ``floor`` are kept. Defaults to ``0.0`` —
+        ``floor > 0`` is useful when the empirical matrix carries
+        rounding noise.
+
+    Returns
+    -------
+    Real matrix shape ``(N, N)``, zero diagonal, asymmetric in
+    general. Non-negative everywhere.
+    """
+    e = np.asarray(exposures, dtype=np.float64)
+    if e.ndim != 2 or e.shape[0] != e.shape[1]:
+        raise ValueError(f"exposures must be square 2-D, got shape={e.shape}")
+    if not np.isfinite(e).all():
+        raise ValueError("exposures must be finite (no NaN/Inf)")
+    if np.any(e < 0):
+        raise ValueError("exposures must be non-negative")
+    if floor < 0:
+        raise ValueError(f"floor must be >= 0, got {floor}")
+    n = e.shape[0]
+    k_matrix = np.array(e, dtype=np.float64, copy=True)
+    np.fill_diagonal(k_matrix, 0.0)
+    if normalisation == "row_stochastic":
+        row_sums = k_matrix.sum(axis=1, keepdims=True)
+        # bounds: row_sums == 0 stays at 0 (no edges); avoid div-by-zero noise.
+        safe = np.where(row_sums > 0, row_sums, 1.0)
+        k_matrix = k_matrix / safe
+    elif normalisation == "capital_weighted":
+        if capital is None:
+            raise ValueError("normalisation='capital_weighted' requires capital vector")
+        c = np.asarray(capital, dtype=np.float64)
+        if c.shape != (n,):
+            raise ValueError(f"capital shape {c.shape} != (N,)=({n},)")
+        if not np.all(c > 0) or not np.isfinite(c).all():
+            raise ValueError("capital must be strictly positive and finite")
+        k_matrix = k_matrix / c[:, None]
+    elif normalisation == "raw":
+        pass
+    else:  # pragma: no cover - typing should prevent this path
+        raise ValueError(f"unknown normalisation {normalisation!r}")
+    if floor > 0:
+        # Inclusive lower bound on the *kept* set: entries strictly
+        # below ``floor`` are clamped to zero; entries equal to floor
+        # are kept (they are by definition at the documented noise
+        # threshold, not below it). Matches the docstring's
+        # "Inclusive lower bound" wording.
+        k_matrix = np.where(k_matrix >= floor, k_matrix, 0.0)
+    np.fill_diagonal(k_matrix, 0.0)
+    return k_matrix
+
+
+def omega_from_volatility(
+    log_returns: NDArray[np.float64],
+    *,
+    fs: float = 1.0,
+) -> NDArray[np.float64]:
+    """Estimate per-bank intrinsic frequency :math:`\\omega_i` from balance-sheet vol.
+
+    Parameters
+    ----------
+    log_returns
+        Shape ``(T, N_banks)``, finite log-returns of each bank's
+        balance-sheet (or equity) value. Canonical (T, N) layout.
+    fs
+        Sampling rate in samples per day. Defaults to ``1.0`` for
+        end-of-day observations. Output ``ω_i`` is in radians per day.
+
+    Returns
+    -------
+    Real array shape ``(N_banks,)`` of intrinsic frequencies.
+
+    Notes
+    -----
+    The intrinsic frequency is identified with the dominant
+    spectral-power frequency of the bank's volatility envelope —
+    proxied here by ``2π · σ_i · fs`` where ``σ_i`` is the sample
+    standard deviation of the bank's returns. This is a *first-order*
+    estimator: a higher-fidelity option (Lomb-Scargle on
+    rolling-vol time series) is delegated to
+    ``core.kuramoto.natural_frequency``.
+    """
+    r = np.asarray(log_returns, dtype=np.float64)
+    if r.ndim != 2:
+        raise ValueError(f"log_returns must be 2-D (T, N), got shape={r.shape}")
+    if r.shape[0] < 2:
+        raise ValueError(
+            f"log_returns must have at least 2 time samples to compute "
+            f"sample std (ddof=1), got T={r.shape[0]}"
+        )
+    if not np.isfinite(r).all():
+        raise ValueError("log_returns must be finite (no NaN/Inf)")
+    if fs <= 0:
+        raise ValueError(f"fs must be > 0, got {fs}")
+    sigma = r.std(axis=0, ddof=1)
+    omega = 2.0 * np.pi * sigma * fs
+    out: NDArray[np.float64] = np.asarray(omega, dtype=np.float64)
+    return out
+
+
+def sakaguchi_alpha_zero(n_nodes: int) -> NDArray[np.float64]:
+    """Zero phase-lag matrix matching a coupling of size ``n_nodes``.
+
+    The standard Kuramoto limit corresponds to :math:`\\alpha_{ij} = 0`.
+    Joint estimation of a non-zero α-matrix from interbank-rate phases
+    is delegated to :class:`core.kuramoto.frustration.FrustrationEstimator`.
+    """
+    if n_nodes < 1:
+        raise ValueError(f"n_nodes must be >= 1, got {n_nodes}")
+    return np.zeros((n_nodes, n_nodes), dtype=np.float64)
diff --git a/research/systemic_risk/data_schema.md b/research/systemic_risk/data_schema.md
new file mode 100644
index 00000000..dbf0b905
--- /dev/null
+++ b/research/systemic_risk/data_schema.md
@@ -0,0 +1,61 @@
+# DATA SCHEMA — research/systemic_risk
+
+> Every field below is enforced at the boundary by
+> `from_exposure_matrix`. Violation raises `ValueError` before any
+> numerical computation runs (fail-closed).
+
+## 1. Exposure matrix
+
+| Field | Type | Constraint |
+|-------|------|------------|
+| `exposures` | `np.ndarray`, shape `(N, N)`, dtype convertible to `float64` | square 2-D; finite (no NaN/Inf); non-negative; `exposures[i, j]` is *i*'s exposure to *j* (i.e. lending **from** *i* **to** *j*); symmetric only by accident on real data, asymmetric in general. |
+| `node_labels` | `tuple[str, ...]` | length `N`; unique; ASCII-stable identifiers; no remapping. |
+| `directed` | `bool` | default `True`. `False` symmetrises by averaging — used only for null-baseline construction. |
+| `threshold` | `float ≥ 0` | inclusive lower bound on a kept entry; entries strictly below `threshold` are clamped to zero in the binary support. |
+| `snapshot_date` | `datetime.date` or `None` | optional; required for temporal-snapshot pipelines (e-MID quarterly, BIS LBS). |
+| `source_label` | `str` | free-form provenance tag; recorded in the `RunManifest.extra` namespace as `dataset_source`. |
+
+## 2. Spread series (for phase extraction)
+
+| Field | Type | Constraint |
+|-------|------|------------|
+| `spreads` | `np.ndarray`, shape `(T, N_banks)`, `float64` | rows = time, columns = banks; finite. |
+| `asset_ids` | `tuple[str, ...]` | length `N_banks`; unique. |
+| `timestamps` | `np.ndarray`, shape `(T,)`, `float64` | monotonically increasing. |
+| `fs` | `float > 0` | sampling rate in samples per day. |
+| `band` | `(f_low, f_high)` cycles/day | `0 < f_low < f_high < fs/2`. |
+
+## 3. Banking-crisis ledger
+
+| Field | Type | Constraint |
+|-------|------|------------|
+| `country` | `str` | exactly 3 uppercase ASCII letters (ISO-3166 α-3). |
+| `start` | `datetime.date` | first day of the crisis interval. |
+| `end` | `datetime.date` | `≥ start`. |
+| `source` | `Literal["LV2018", "LV2020_update", "post_LV2020"]` | provenance tag. |
+| `label` | `str` | unique within the ledger. |
+
+## 4. Run-manifest extra fields (recommended)
+
+Callers persisting a run should populate `extra` with at minimum:
+
+| Key | Value type | Purpose |
+|-----|------------|---------|
+| `dataset` | `str` | human-readable dataset identifier, e.g. `"e-MID_2009Q1-2015Q4"`. |
+| `data_sha256` | `str` | SHA-256 of the canonical exposure-matrix file (sort_keys-serialised CSV/parquet). |
+| `crisis_set` | `list[str]` | label set used for the falsification, e.g. `["GFC_USA_2007", "EZ_LATE_GRC_2011", "SVB_FRC_2023"]`. |
+
+These are not enforced by the manifest itself — the protocol simply
+refuses to promote any tier that does not produce them.
+
+## 5. Forbidden inputs (fail-closed)
+
+* Any `NaN` or `Inf` in `exposures`, `spreads`, or `timestamps`.
+* Negative entries in `exposures` or `capital`.
+* Zero or negative `fs`.
+* `node_labels` with duplicates or empty strings.
+* `T < 2` for `omega_from_volatility` (`std(ddof=1)` undefined).
+* Mean degree `<k> < 2` for `fit_barabasi_albert`
+  (BA-incompatible per Albert-Barabási 2002 eq. 4.7).
+* Constant degree sequence for `fit_power_law` / `fit_barabasi_albert`
+  (no fit possible).
diff --git a/research/systemic_risk/errors.py b/research/systemic_risk/errors.py
new file mode 100644
index 00000000..0e81c575
--- /dev/null
+++ b/research/systemic_risk/errors.py
@@ -0,0 +1,56 @@
+# Copyright (c) 2023-2026 Yaroslav Vasylenko (neuron7xLab)
+# SPDX-License-Identifier: MIT
+"""Structured exception hierarchy for the canonical entry contract.
+
+The official validation protocol (§ 5 — Entry-Point Gate) requires every
+boundary failure to surface as an explicit, typed exception so that
+upstream pipelines can pattern-match on the failure class instead of
+parsing free-form ``ValueError`` strings.
+
+The hierarchy is single-rooted under :class:`SystemicRiskInputError`
+and inherits from :class:`ValueError` — backward-compatible with every
+existing ``except ValueError`` site, but pattern-matchable for new
+callers.
+"""
+
+from __future__ import annotations
+
+__all__ = [
+    "SystemicRiskInputError",
+    "InvalidExposureMatrixError",
+    "InvalidNodeLabelsError",
+    "InvalidTemporalPanelError",
+]
+
+
+class SystemicRiskInputError(ValueError):
+    """Root of the structured-error hierarchy.
+
+    Existing callers using ``except ValueError`` continue to work
+    because every concrete error is also a ``ValueError``.
+    """
+
+
+class InvalidExposureMatrixError(SystemicRiskInputError):
+    """Raised when the exposure matrix violates a documented invariant.
+
+    Examples: non-square shape, NaN / Inf entries, negative entries,
+    constraint mismatch with ``node_labels`` length.
+    """
+
+
+class InvalidNodeLabelsError(SystemicRiskInputError):
+    """Raised when ``node_labels`` violates a documented invariant.
+
+    Examples: duplicate labels, length mismatch with the exposure
+    matrix, empty-string labels.
+    """
+
+
+class InvalidTemporalPanelError(SystemicRiskInputError):
+    """Raised when a temporal-snapshot pipeline detects a panel-level defect.
+
+    Examples: non-monotonic timestamps, snapshot cardinality
+    inconsistent across pipeline stages, empty snapshot tuple where
+    at least one is required.
+    """
diff --git a/research/systemic_risk/falsification.py b/research/systemic_risk/falsification.py
index 8a532dd9..32a169fd 100644
--- a/research/systemic_risk/falsification.py
+++ b/research/systemic_risk/falsification.py
@@ -1,33 +1,35 @@
 # Copyright (c) 2023-2026 Yaroslav Vasylenko (neuron7xLab)
 # SPDX-License-Identifier: MIT
-"""Pre-registered falsification battery for the interbank-Kuramoto hypothesis.
+"""Pre-registered falsification battery — v2 with bootstrap-CI verdict.
 
 The hypothesis under test (``HYPOTHESIS`` tier per ``CLAIMS.md``):
 
-    The early-warning score (``research.systemic_risk.early_warning``)
+    The early-warning score
+    (:func:`research.systemic_risk.early_warning.compute_early_warning`)
     is *elevated* in pre-event windows preceding banking-crisis dates
     compared to null windows drawn from the same series at safe
     distance from any event.
 
 Decision rule (pre-registered, written *before* any data is run)::
 
-    For each crisis c with at least one valid pre-event window:
-        AUC_c   = ROC AUC of (pre-event scores vs null-window scores)
-        p_c     = one-sided permutation p-value
-                  (alternative: pre-event > null)
+    For each crisis c with a valid pre-event window:
+        AUC_c          = ROC AUC of (pre-event scores vs null-window scores)
+        AUC_c (95% CI) = percentile bootstrap, n=10000 stratified resamples
+        p_c            = one-sided permutation p (alternative: pre > null)
 
     Across crises:
-        p_BH    = Benjamini-Hochberg corrected p-values (FDR control)
+        p_BONF = Bonferroni-corrected p-values (k = number of valid crises)
 
-    HARD FAIL  : ∃ c with AUC_c <= ``fail_auc`` (default 0.55)
-                  → archive negative; close the hypothesis.
-    HARD PASS  : at least 2 crises with AUC_c >= ``pass_auc`` AND
-                  p_BH_c <= ``pass_alpha`` (defaults 0.70, 0.01).
-    UNDECIDED  : neither — collect more data, do not promote tier.
+    HARD_FAIL : ∃ c with AUC_c <= ``fail_auc`` (default 0.55)
+                OR ∃ c with auc_ci_low <= 0.5 + ``ci_floor_tol`` (CI crosses 0.5)
+                → archive negative; close the hypothesis.
+    HARD_PASS : >= 2 crises with auc_ci_low >= ``pass_auc_ci_low``
+                AND p_BONF_c <= ``pass_alpha`` (defaults 0.70, 0.01).
+    UNDECIDED : neither — collect more data, do not promote tier.
 
-The verdict is *encoded once* and never edited after seeing data — any
-subsequent change to ``fail_auc``, ``pass_auc`` or ``pass_alpha`` is a
-new pre-registration on a fresh branch.
+Bonferroni replaces the v1 Benjamini-Hochberg FDR control: the user
+prefers strict family-wise error control given the small number of
+crises and the high cost of a false MEASURED promotion.
 
 Pure-function API. No I/O. Determinism via explicit ``seed``.
 """
@@ -48,7 +50,8 @@
     "CrisisOutcome",
     "FalsificationReport",
     "auc_mann_whitney",
-    "benjamini_hochberg",
+    "auc_bootstrap_ci",
+    "bonferroni_correction",
     "run_falsification",
 ]
 
@@ -65,7 +68,7 @@ def auc_mann_whitney(positives: NDArray[np.float64], negatives: NDArray[np.float
     """ROC AUC via the Mann-Whitney U statistic.
 
     AUC = P(X_pos > X_neg) + 0.5 * P(X_pos == X_neg).
-    Returns 0.5 when either array is empty (uninformative, by convention).
+    Returns 0.5 when either array is empty.
     """
     if positives.size == 0 or negatives.size == 0:
         return 0.5
@@ -74,7 +77,6 @@ def auc_mann_whitney(positives: NDArray[np.float64], negatives: NDArray[np.float
     if pos.size == 0 or neg.size == 0:
         return 0.5
     combined = np.concatenate([pos, neg])
-    # Average ranks over ties (rankdata midrank).
     _, inv, counts = np.unique(combined, return_inverse=True, return_counts=True)
     raw_ranks = combined.argsort().argsort().astype(np.float64) + 1.0
     sums = np.bincount(inv, weights=raw_ranks)
@@ -87,6 +89,46 @@ def auc_mann_whitney(positives: NDArray[np.float64], negatives: NDArray[np.float
     return float(u / (n_pos * n_neg))
 
 
+def auc_bootstrap_ci(
+    positives: NDArray[np.float64],
+    negatives: NDArray[np.float64],
+    *,
+    n_bootstrap: int = 10000,
+    seed: int = 42,
+    confidence: float = 0.95,
+) -> tuple[float, float, float]:
+    """Stratified percentile-bootstrap CI on the AUC.
+
+    Resamples positives and negatives independently *with replacement*
+    ``n_bootstrap`` times, computes the AUC on each resample, and
+    returns ``(point_estimate, ci_low, ci_high)`` where the CI is the
+    central ``confidence`` percentile interval. Stratified resampling
+    preserves the marginal sample sizes — an AUC artefact of mixing
+    the two arms is impossible.
+    """
+    if not 0.0 < confidence < 1.0:
+        raise ValueError(f"confidence must be in (0, 1), got {confidence}")
+    if n_bootstrap < 1:
+        raise ValueError(f"n_bootstrap must be >= 1, got {n_bootstrap}")
+    pos = positives[np.isfinite(positives)]
+    neg = negatives[np.isfinite(negatives)]
+    point = auc_mann_whitney(pos, neg)
+    if pos.size < 2 or neg.size < 2:
+        return point, point, point
+    rng = np.random.default_rng(seed)
+    samples = np.empty(n_bootstrap, dtype=np.float64)
+    n_pos = pos.size
+    n_neg = neg.size
+    for b in range(n_bootstrap):
+        idx_p = rng.integers(0, n_pos, size=n_pos)
+        idx_n = rng.integers(0, n_neg, size=n_neg)
+        samples[b] = auc_mann_whitney(pos[idx_p], neg[idx_n])
+    alpha = (1.0 - confidence) / 2.0
+    ci_low = float(np.quantile(samples, alpha))
+    ci_high = float(np.quantile(samples, 1.0 - alpha))
+    return point, ci_low, ci_high
+
+
 def _permutation_p(
     positives: NDArray[np.float64],
     negatives: NDArray[np.float64],
@@ -108,15 +150,16 @@ def _permutation_p(
         a = auc_mann_whitney(perm[:n_pos], perm[n_pos:])
         if a >= observed:
             exceedances += 1
-    # Davison & Hinkley (1997) +1 continuity correction.
     return float((exceedances + 1) / (n_permutations + 1))
 
 
-def benjamini_hochberg(p_values: NDArray[np.float64]) -> NDArray[np.float64]:
-    """Benjamini-Hochberg FDR-adjusted p-values (1995).
+def bonferroni_correction(p_values: NDArray[np.float64]) -> NDArray[np.float64]:
+    """Family-wise error-rate control via Bonferroni: ``p_adj = min(1, m * p)``.
 
-    Adjusted p_(i) = min_{k>=i} (m / k) * p_(k), clipped to [0, 1].
-    Order is preserved relative to the input.
+    Order is preserved relative to the input. More conservative than
+    Benjamini-Hochberg FDR — chosen here per the v2 protocol because
+    promoting C-SYSRISK-PHASE to MEASURED on a false positive is
+    treated as catastrophic.
     """
     p = np.asarray(p_values, dtype=np.float64)
     if p.ndim != 1:
@@ -126,16 +169,7 @@ def benjamini_hochberg(p_values: NDArray[np.float64]) -> NDArray[np.float64]:
     if np.any(p < 0) or np.any(p > 1) or not np.isfinite(p).all():
         raise ValueError("p_values must be finite values in [0, 1]")
     m = p.size
-    order = p.argsort()
-    ranked = p[order]
-    factors = np.arange(1, m + 1, dtype=np.float64)
-    adjusted_sorted = ranked * (m / factors)
-    # Enforce monotone non-decreasing along reverse-sorted indices.
-    adjusted_sorted = np.minimum.accumulate(adjusted_sorted[::-1])[::-1]
-    adjusted_sorted = np.clip(adjusted_sorted, 0.0, 1.0)
-    out = np.empty_like(p)
-    out[order] = adjusted_sorted
-    return out
+    return np.clip(p * m, 0.0, 1.0)
 
 
 # ---------------------------------------------------------------------------
@@ -144,7 +178,6 @@ def benjamini_hochberg(p_values: NDArray[np.float64]) -> NDArray[np.float64]:
 
 
 def _date_to_index(target: date, dates: tuple[date, ...]) -> int | None:
-    """Return the index of the *latest* date <= ``target``, or ``None`` if all later."""
     out: int | None = None
     for i, d in enumerate(dates):
         if d <= target:
@@ -160,7 +193,6 @@ def _pre_event_window(
     event_start: date,
     window_days: int,
 ) -> NDArray[np.float64]:
-    """Extract the score values strictly *before* the event, length ``window_days``."""
     end_idx = _date_to_index(event_start - timedelta(days=1), dates)
     if end_idx is None:
         return np.empty(0, dtype=np.float64)
@@ -179,12 +211,10 @@ def _null_windows(
     n_windows: int,
     country_filter: str | None,
 ) -> NDArray[np.float64]:
-    """Sample non-overlapping null windows at safe distance from any event."""
     if score.size != len(dates):
         raise ValueError(f"score length {score.size} != dates length {len(dates)}")
     if score.size < window_days:
         return np.empty(0, dtype=np.float64)
-
     relevant_events: tuple[BankingCrisisEvent, ...]
     if country_filter is None:
         relevant_events = ledger.events
@@ -208,7 +238,6 @@ def _too_close(window_end_idx: int) -> bool:
             valid_ends.append(end_idx)
     if not valid_ends:
         return np.empty(0, dtype=np.float64)
-
     take = min(n_windows, len(valid_ends))
     chosen = rng.choice(np.asarray(valid_ends, dtype=np.int64), size=take, replace=False)
     flat = np.concatenate([score[int(c) - window_days + 1 : int(c) + 1] for c in chosen])
@@ -222,7 +251,7 @@ def _too_close(window_end_idx: int) -> bool:
 
 @dataclass(frozen=True, slots=True)
 class FalsificationConfig:
-    """Pre-registered falsification protocol.
+    """Pre-registered falsification protocol (v2).
 
     Attributes
     ----------
@@ -232,15 +261,24 @@ class FalsificationConfig:
         Number of null windows to draw per run (default 30).
     min_distance_from_event_days
         Buffer between any null window and any event interval
-        (default 365: a full year of separation).
+        (default 365).
     n_permutations
         Permutations for the AUC p-value (default 5000).
+    n_bootstrap
+        Stratified-bootstrap resamples for the AUC CI (default 10000).
+    confidence
+        Confidence level for the AUC CI (default 0.95).
     fail_auc
-        Hard-fail threshold (default 0.55).
-    pass_auc
-        Hard-pass AUC threshold (default 0.70).
+        Hard-fail threshold on the *point* AUC (default 0.55).
+    ci_floor_tol
+        Tolerance above 0.5 below which the CI lower bound triggers
+        HARD_FAIL (default 0.0 — strict: any CI crossing 0.5 fails).
+    pass_auc_ci_low
+        HARD_PASS threshold on the AUC *CI lower bound* (default 0.70).
+        Stronger than v1's point-estimate threshold: requires the
+        whole CI to clear the bar.
     pass_alpha
-        Hard-pass BH-adjusted p threshold (default 0.01).
+        HARD_PASS Bonferroni-adjusted p threshold (default 0.01).
     seed
         Deterministic RNG seed (default 42).
     """
@@ -249,8 +287,11 @@ class FalsificationConfig:
     null_window_count: int = 30
     min_distance_from_event_days: int = 365
     n_permutations: int = 5000
+    n_bootstrap: int = 10000
+    confidence: float = 0.95
     fail_auc: float = 0.55
-    pass_auc: float = 0.70
+    ci_floor_tol: float = 0.0
+    pass_auc_ci_low: float = 0.70
     pass_alpha: float = 0.01
     seed: int = 42
 
@@ -268,18 +309,24 @@ def __post_init__(self) -> None:
             )
         if self.n_permutations < 100:
             raise ValueError(f"n_permutations must be >= 100, got {self.n_permutations}")
-        if not 0.0 < self.fail_auc < self.pass_auc <= 1.0:
+        if self.n_bootstrap < 100:
+            raise ValueError(f"n_bootstrap must be >= 100, got {self.n_bootstrap}")
+        if not 0.0 < self.confidence < 1.0:
+            raise ValueError(f"confidence must be in (0, 1), got {self.confidence}")
+        if not 0.0 < self.fail_auc < self.pass_auc_ci_low <= 1.0:
             raise ValueError(
-                f"thresholds must satisfy 0 < fail_auc < pass_auc <= 1; "
-                f"got fail={self.fail_auc}, pass={self.pass_auc}"
+                f"thresholds must satisfy 0 < fail_auc < pass_auc_ci_low <= 1; "
+                f"got fail={self.fail_auc}, pass={self.pass_auc_ci_low}"
             )
+        if self.ci_floor_tol < 0:
+            raise ValueError(f"ci_floor_tol must be >= 0, got {self.ci_floor_tol}")
         if not 0.0 < self.pass_alpha <= 0.1:
             raise ValueError(f"pass_alpha must be in (0, 0.1], got {self.pass_alpha}")
 
 
 @dataclass(frozen=True, slots=True)
 class CrisisOutcome:
-    """Per-crisis outcome of the falsification run."""
+    """Per-crisis outcome of the falsification run (v2)."""
 
     label: str
     country: str
@@ -287,8 +334,10 @@ class CrisisOutcome:
     n_pre_event: int
     n_null: int
     auc: float
+    auc_ci_low: float
+    auc_ci_high: float
     p_value: float
-    p_bh: float
+    p_bonferroni: float
 
 
 @dataclass(frozen=True, slots=True)
@@ -308,7 +357,7 @@ def run_falsification(
     config: FalsificationConfig | None = None,
     country_filter: str | None = None,
 ) -> FalsificationReport:
-    """Run the pre-registered falsification battery.
+    """Run the pre-registered v2 falsification battery.
 
     Parameters
     ----------
@@ -319,11 +368,11 @@ def run_falsification(
     ledger
         :class:`BankingCrisisLedger` of crisis events.
     config
-        Optional :class:`FalsificationConfig`; defaults to the
+        Optional :class:`FalsificationConfig`; defaults to the v2
         pre-registered settings.
     country_filter
-        If given (ISO-3 code), restrict events and null-distance
-        masking to that country only.
+        Optional ISO-3 country code to restrict events and null
+        masking to a single jurisdiction.
     """
     cfg = config if config is not None else FalsificationConfig()
     s = np.asarray(score, dtype=np.float64)
@@ -339,7 +388,6 @@ def run_falsification(
             )
 
     rng = np.random.default_rng(cfg.seed)
-
     if country_filter is None:
         candidate_events = ledger.events
     else:
@@ -366,7 +414,13 @@ def run_falsification(
         nulls = nulls[np.isfinite(nulls)]
         if nulls.size < 4:
             continue
-        a = auc_mann_whitney(pre, nulls)
+        point, ci_low, ci_high = auc_bootstrap_ci(
+            pre,
+            nulls,
+            n_bootstrap=cfg.n_bootstrap,
+            seed=cfg.seed,
+            confidence=cfg.confidence,
+        )
         p = _permutation_p(pre, nulls, n_permutations=cfg.n_permutations, rng=rng)
         outcomes_in_order.append(
             CrisisOutcome(
@@ -375,21 +429,19 @@ def run_falsification(
                 event_start=ev.start,
                 n_pre_event=int(pre.size),
                 n_null=int(nulls.size),
-                auc=a,
+                auc=point,
+                auc_ci_low=ci_low,
+                auc_ci_high=ci_high,
                 p_value=p,
-                p_bh=float("nan"),
+                p_bonferroni=float("nan"),
             )
         )
         p_per_crisis.append(p)
 
     if not outcomes_in_order:
-        return FalsificationReport(
-            outcomes=tuple(),
-            verdict="UNDECIDED",
-            config=cfg,
-        )
+        return FalsificationReport(outcomes=tuple(), verdict="UNDECIDED", config=cfg)
 
-    p_bh = benjamini_hochberg(np.asarray(p_per_crisis, dtype=np.float64))
+    p_bonf = bonferroni_correction(np.asarray(p_per_crisis, dtype=np.float64))
     finalised = tuple(
         CrisisOutcome(
             label=o.label,
@@ -398,16 +450,23 @@ def run_falsification(
             n_pre_event=o.n_pre_event,
             n_null=o.n_null,
             auc=o.auc,
+            auc_ci_low=o.auc_ci_low,
+            auc_ci_high=o.auc_ci_high,
             p_value=o.p_value,
-            p_bh=float(p_bh[i]),
+            p_bonferroni=float(p_bonf[i]),
         )
         for i, o in enumerate(outcomes_in_order)
     )
 
-    if any(o.auc <= cfg.fail_auc for o in finalised):
+    ci_floor = 0.5 + cfg.ci_floor_tol
+    if any(o.auc <= cfg.fail_auc or o.auc_ci_low <= ci_floor for o in finalised):
         verdict: Verdict = "HARD_FAIL"
     else:
-        passing = [o for o in finalised if o.auc >= cfg.pass_auc and o.p_bh <= cfg.pass_alpha]
+        passing = [
+            o
+            for o in finalised
+            if o.auc_ci_low >= cfg.pass_auc_ci_low and o.p_bonferroni <= cfg.pass_alpha
+        ]
         verdict = "HARD_PASS" if len(passing) >= 2 else "UNDECIDED"
 
     return FalsificationReport(outcomes=finalised, verdict=verdict, config=cfg)
diff --git a/research/systemic_risk/network_fitting.py b/research/systemic_risk/network_fitting.py
new file mode 100644
index 00000000..a382ebae
--- /dev/null
+++ b/research/systemic_risk/network_fitting.py
@@ -0,0 +1,530 @@
+# Copyright (c) 2023-2026 Yaroslav Vasylenko (neuron7xLab)
+# SPDX-License-Identifier: MIT
+"""MLE fitting of interbank degree distributions to candidate generators.
+
+The Barabási–Albert generator at fixed *m* is the topology-null
+baseline of the systemic-risk falsification battery. v1 hard-coded
+``m=3`` from Boss et al. 2004 / Soramäki et al. 2007; v2 fits *m*
+(equivalently the power-law exponent α) directly to the empirical
+degree sequence by maximum likelihood per Clauset, Shalizi & Newman
+(2009), *SIAM Rev.* **51**: 661.
+
+Two candidate models are compared on every fit:
+
+* **Power law** (BA-like): :math:`P(k) \\propto k^{-\\alpha}` for
+  :math:`k \\ge k_{\\min}`. MLE estimator
+  :math:`\\hat{\\alpha} = 1 + n / \\sum_i \\ln(k_i / k_{\\min})`.
+* **Exponential**: :math:`P(k) \\propto e^{-\\lambda k}` for
+  :math:`k \\ge k_{\\min}`. MLE estimator
+  :math:`\\hat{\\lambda} = 1 / (\\bar{k} - k_{\\min})`.
+
+The Kolmogorov–Smirnov statistic and a parametric-bootstrap p-value
+quantify the goodness-of-fit; the Akaike Information Criterion picks
+between the two candidates without overfitting penalty drift.
+
+Pure-function API. No I/O. Determinism via explicit seeds.
+"""
+
+from __future__ import annotations
+
+import math
+from dataclasses import dataclass
+from typing import TYPE_CHECKING, Literal
+
+import numpy as np
+from numpy.typing import NDArray
+
+if TYPE_CHECKING:
+    from .topology import InterbankTopology
+
+__all__ = [
+    "MIN_TAIL_SIZE_VALIDATION",
+    "MIN_RELATIVE_SE_VALIDATION",
+    "PowerLawFit",
+    "ExponentialFit",
+    "ModelComparison",
+    "fit_power_law",
+    "fit_power_law_validation",
+    "fit_exponential",
+    "compare_power_law_vs_exponential",
+    "fit_barabasi_albert",
+    "fit_barabasi_albert_from_topology",
+]
+
+
+# ---------------------------------------------------------------------------
+# Validation-mode constants — derived, not declared
+# ---------------------------------------------------------------------------
+#
+# MIN_TAIL_SIZE_VALIDATION: at α≈2.5 the Cramér-Rao σ_α/α floor at
+# n_tail=50 is 1.5/(2.5·√50) ≈ 0.085, giving a 95 % CI half-width of
+# 1.96·0.085·α ≈ 0.42 — sufficient to distinguish α=2.0 from α=2.4.
+# Below n_tail=50 the SE explodes and the implied minimum from the
+# CRLB (see fit_power_law `min_relative_se` derivation) becomes
+# brittle to a single-realisation seed.
+#
+# MIN_RELATIVE_SE_VALIDATION: 0.10 (10 % relative SE) is the bound
+# at which Clauset-Shalizi-Newman 2009 fig. 3 reports the discrete
+# power-law fit becoming reliably distinguishable from exponential
+# alternatives at the AIC-Δ > 4 level on synthetic samples.
+
+MIN_TAIL_SIZE_VALIDATION: int = 50
+MIN_RELATIVE_SE_VALIDATION: float = 0.10
+
+
+# ---------------------------------------------------------------------------
+# Result containers
+# ---------------------------------------------------------------------------
+
+
+@dataclass(frozen=True, slots=True)
+class PowerLawFit:
+    """MLE fit of a discrete power-law tail :math:`P(k) \\propto k^{-\\alpha}`.
+
+    Attributes
+    ----------
+    alpha
+        Maximum-likelihood exponent. Standard error
+        :math:`\\sigma_\\alpha = (\\alpha - 1) / \\sqrt{n}`
+        (Clauset et al. 2009, eq. 3.2).
+    alpha_se
+        Asymptotic standard error of ``alpha``.
+    k_min
+        Lower-tail cutoff used by the fit.
+    n_tail
+        Number of degrees in the fit tail (``k >= k_min``).
+    log_likelihood
+        Log-likelihood of the tail under the fitted model.
+    ks_statistic
+        Kolmogorov–Smirnov distance between the empirical tail CDF
+        and the fitted CDF.
+    ks_p_value
+        Parametric-bootstrap p-value: probability that a synthetic
+        sample of size ``n_tail`` drawn from the fitted distribution
+        produces a KS statistic at least as large as the observed one.
+        ``None`` when the bootstrap was not requested.
+    """
+
+    alpha: float
+    alpha_se: float
+    k_min: int
+    n_tail: int
+    log_likelihood: float
+    ks_statistic: float
+    ks_p_value: float | None
+
+
+@dataclass(frozen=True, slots=True)
+class ExponentialFit:
+    """MLE fit of a discrete shifted exponential :math:`P(k) \\propto e^{-\\lambda k}`."""
+
+    lambda_: float
+    k_min: int
+    n_tail: int
+    log_likelihood: float
+    ks_statistic: float
+
+
+@dataclass(frozen=True, slots=True)
+class ModelComparison:
+    """AIC-based comparison of power-law vs exponential.
+
+    ``preferred`` is the model with the lower AIC. ``aic_delta`` is
+    the absolute AIC gap (smaller is more decisive — Burnham &
+    Anderson 2002 conventionally read Δ < 2 as roughly equivalent,
+    Δ ∈ (4, 7) as strong, Δ > 10 as decisive).
+    """
+
+    power_law: PowerLawFit
+    exponential: ExponentialFit
+    aic_power_law: float
+    aic_exponential: float
+    preferred: Literal["power_law", "exponential"]
+    aic_delta: float
+
+
+# ---------------------------------------------------------------------------
+# MLE estimators
+# ---------------------------------------------------------------------------
+
+
+def _validate_degrees(degrees: NDArray[np.int64]) -> NDArray[np.int64]:
+    d = np.asarray(degrees, dtype=np.int64)
+    if d.ndim != 1:
+        raise ValueError(f"degrees must be 1-D, got shape={d.shape}")
+    if d.size < 4:
+        raise ValueError(f"degrees must contain at least 4 entries, got n={d.size}")
+    if np.any(d < 0):
+        raise ValueError("degrees must be non-negative")
+    return d
+
+
+def fit_power_law(
+    degrees: NDArray[np.int64],
+    *,
+    k_min: int | None = None,
+    n_bootstrap: int = 0,
+    seed: int = 42,
+    min_relative_se: float | None = None,
+) -> PowerLawFit:
+    """Fit a discrete power-law tail by maximum likelihood.
+
+    Parameters
+    ----------
+    degrees
+        1-D array of non-negative degree observations.
+    k_min
+        Tail cutoff. ``None`` (default) selects the cutoff that
+        minimises the KS statistic over all admissible cutoffs
+        (Clauset, Shalizi, Newman 2009 §3.3 — discrete grid scan).
+    n_bootstrap
+        Number of parametric-bootstrap resamples for the p-value.
+        ``0`` (default) skips the bootstrap and returns ``ks_p_value=None``.
+    seed
+        RNG seed for the bootstrap.
+    min_relative_se
+        Optional Cramér-Rao precision floor: after fit, if the
+        relative asymptotic standard error
+        :math:`\\sigma_\\alpha / \\hat\\alpha = (\\hat\\alpha - 1) /
+        (\\hat\\alpha \\sqrt{n_\\text{tail}})` exceeds this value, raise
+        :class:`ValueError`. ``None`` (default) skips the check —
+        the caller can read ``alpha_se`` from the result and decide
+        their own tolerance. Derivation (Clauset et al. 2009, eq. 3.2,
+        and the discrete-power-law Fisher information
+        :math:`I(\\alpha) = n_\\text{tail} / (\\alpha-1)^2`):
+
+            σ_α    α − 1
+            ─── = ─────────  must be ≤ ``min_relative_se``.
+             α    α · √n_t
+
+        Solving for the implied minimum tail size at a given α:
+        :math:`n_\\text{tail} \\ge \\bigl[(\\alpha-1)/(\\alpha
+        \\cdot \\text{tol})\\bigr]^2`. e.g. α=2.5, tol=0.10 → n ≥ 36;
+        α=2.0, tol=0.10 → n ≥ 25.
+    """
+    d = _validate_degrees(degrees)
+    if k_min is None:
+        chosen = _select_k_min(d)
+    else:
+        if k_min < 1:
+            raise ValueError(f"k_min must be >= 1, got {k_min}")
+        chosen = int(k_min)
+    tail = d[d >= chosen]
+    if tail.size < 2:
+        raise ValueError(f"only {tail.size} observations >= k_min={chosen}; need >=2 to fit")
+    # Continuous-approximation MLE — bias-stable for k_min >= 6 (Clauset 2009).
+    log_ratio = float(np.log(tail.astype(np.float64) / (chosen - 0.5)).sum())
+    if log_ratio <= 0:
+        raise ValueError("non-positive log-ratio sum — degenerate tail")
+    alpha = 1.0 + tail.size / log_ratio
+    alpha_se = (alpha - 1.0) / math.sqrt(tail.size)
+    if min_relative_se is not None:
+        if min_relative_se <= 0.0:
+            raise ValueError(f"min_relative_se must be > 0, got {min_relative_se}")
+        rel_se = alpha_se / alpha
+        if rel_se > min_relative_se:
+            implied_n = math.ceil(((alpha - 1.0) / (alpha * min_relative_se)) ** 2)
+            raise ValueError(
+                f"power-law fit fails Cramér-Rao precision floor: "
+                f"σ_α/α = {rel_se:.4f} > {min_relative_se:.4f} "
+                f"at α̂={alpha:.4f}, n_tail={tail.size}, k_min={chosen}; "
+                f"need n_tail ≥ {implied_n} for that α to clear the floor."
+            )
+    log_likelihood = (
+        tail.size * math.log(alpha - 1.0)
+        - tail.size * math.log(chosen - 0.5)
+        - alpha * float(np.log(tail.astype(np.float64) / (chosen - 0.5)).sum())
+    )
+    ks = _ks_statistic_power_law(tail, alpha, chosen)
+    p_value: float | None = None
+    if n_bootstrap > 0:
+        p_value = _ks_p_value_power_law(
+            tail.size, alpha, chosen, observed_ks=ks, n_bootstrap=n_bootstrap, seed=seed
+        )
+    return PowerLawFit(
+        alpha=float(alpha),
+        alpha_se=float(alpha_se),
+        k_min=int(chosen),
+        n_tail=int(tail.size),
+        log_likelihood=float(log_likelihood),
+        ks_statistic=float(ks),
+        ks_p_value=p_value,
+    )
+
+
+def fit_power_law_validation(
+    degrees: NDArray[np.int64],
+    *,
+    k_min: int | None = None,
+    n_bootstrap: int = 1000,
+    seed: int = 42,
+) -> PowerLawFit:
+    """Strict, fail-closed validation-mode wrapper around :func:`fit_power_law`.
+
+    Validation mode enforces TWO floors that the exploratory API
+    leaves opt-in:
+
+    * ``n_tail >= MIN_TAIL_SIZE_VALIDATION = 50`` — derived from the
+      Cramér-Rao bound at α≈2.5 (95 % CI half-width ≤ 0.42, sufficient
+      to separate α=2.0 from α=2.4 — see module-level constant
+      derivation block).
+    * ``σ_α / α <= MIN_RELATIVE_SE_VALIDATION = 0.10`` — Clauset-
+      Shalizi-Newman 2009 fig. 3 reports this as the bound where the
+      power-law fit becomes reliably distinguishable from the
+      exponential alternative at AIC-Δ > 4.
+
+    Both floors must hold simultaneously; failure of either raises
+    :class:`ValueError` with the implied minimum sample size at the
+    fitted α. ``n_bootstrap`` defaults to 1000 (KS-p resolves to
+    ±0.001 by Davison-Hinkley) — also tighter than the exploratory
+    default. ``min_relative_se`` is enforced internally; it is *not*
+    a kwarg here so the validation contract is unambiguous.
+    """
+    d = _validate_degrees(degrees)
+    if d.size < MIN_TAIL_SIZE_VALIDATION:
+        raise ValueError(
+            f"validation-mode power-law fit requires "
+            f"n_observations >= {MIN_TAIL_SIZE_VALIDATION}; got n={d.size}. "
+            f"For exploratory use, call fit_power_law directly."
+        )
+    return fit_power_law(
+        d,
+        k_min=k_min,
+        n_bootstrap=n_bootstrap,
+        seed=seed,
+        min_relative_se=MIN_RELATIVE_SE_VALIDATION,
+    )
+
+
+def fit_exponential(
+    degrees: NDArray[np.int64],
+    *,
+    k_min: int | None = None,
+) -> ExponentialFit:
+    """Fit a shifted exponential tail by maximum likelihood."""
+    d = _validate_degrees(degrees)
+    chosen = int(k_min) if k_min is not None else int(d[d > 0].min()) if (d > 0).any() else 1
+    if chosen < 1:
+        raise ValueError(f"k_min must be >= 1, got {chosen}")
+    tail = d[d >= chosen].astype(np.float64)
+    if tail.size < 2:
+        raise ValueError(f"only {tail.size} observations >= k_min={chosen}; need >=2 to fit")
+    mean_excess = float(tail.mean()) - chosen
+    if mean_excess <= 0:
+        raise ValueError(f"mean degree {tail.mean():.3f} <= k_min={chosen}; cannot fit")
+    lam = 1.0 / mean_excess
+    log_likelihood = float(tail.size * math.log(lam) - lam * float((tail - chosen).sum()))
+    ks = _ks_statistic_exponential(tail, lam, chosen)
+    return ExponentialFit(
+        lambda_=float(lam),
+        k_min=int(chosen),
+        n_tail=int(tail.size),
+        log_likelihood=float(log_likelihood),
+        ks_statistic=float(ks),
+    )
+
+
+def compare_power_law_vs_exponential(
+    degrees: NDArray[np.int64],
+    *,
+    k_min: int | None = None,
+    n_bootstrap: int = 0,
+    seed: int = 42,
+) -> ModelComparison:
+    """Fit both candidates and pick by AIC.
+
+    AIC = 2 k − 2 ℓ̂ where *k* is the number of free parameters
+    (1 for both models given a fixed ``k_min``) and ℓ̂ is the maximum
+    log-likelihood. Lower is better.
+    """
+    pl = fit_power_law(degrees, k_min=k_min, n_bootstrap=n_bootstrap, seed=seed)
+    exp_fit = fit_exponential(degrees, k_min=k_min)
+    aic_pl = 2.0 * 1 - 2.0 * pl.log_likelihood
+    aic_exp = 2.0 * 1 - 2.0 * exp_fit.log_likelihood
+    preferred: Literal["power_law", "exponential"] = (
+        "power_law" if aic_pl < aic_exp else "exponential"
+    )
+    return ModelComparison(
+        power_law=pl,
+        exponential=exp_fit,
+        aic_power_law=float(aic_pl),
+        aic_exponential=float(aic_exp),
+        preferred=preferred,
+        aic_delta=float(abs(aic_pl - aic_exp)),
+    )
+
+
+def fit_barabasi_albert(
+    degrees: NDArray[np.int64],
+    *,
+    n_bootstrap: int = 0,
+    seed: int = 42,
+    min_relative_se: float | None = None,
+) -> tuple[int, PowerLawFit]:
+    """Fit a BA-compatible *m* parameter to an empirical degree sequence.
+
+    The Barabási–Albert generator produces a power-law tail with
+    exponent α = 3 in the thermodynamic limit; finite-size and
+    direction-asymmetry effects shift α typically into [2, 3]
+    (Albert & Barabási 2002, *Rev. Mod. Phys.* 74: 47). Once the
+    empirical α is fitted, *m* is recovered from the BA mean-degree
+    identity ``<k> = 2m`` (Albert-Barabási 2002, eq. 4.7):
+    rounding ``mean(k) / 2`` to the nearest positive integer.
+
+    Parameters
+    ----------
+    degrees
+        1-D array of **undirected per-node degree counts** (each
+        undirected edge contributes 1 to each of its two endpoints,
+        and the BA mean-degree identity ``<k> = 2m`` assumes this
+        convention). Direct ``InterbankTopology.degree`` from a
+        symmetric topology counts each undirected edge **twice** —
+        once via ``in_degree`` and once via ``out_degree`` — and so
+        produces ``<k>_directed = 4m`` and a doubled ``m̂``. Use
+        :func:`fit_barabasi_albert_from_topology` to handle the
+        symmetric/asymmetric switch automatically, or pass
+        ``topo.out_degree`` for symmetric inputs.
+    """
+    d = _validate_degrees(degrees)
+    if np.unique(d).size < 2:
+        raise ValueError(
+            f"degenerate input: all observations equal ({int(d[0])}); cannot fit a power-law tail"
+        )
+    mean_k = float(d.mean())
+    if mean_k < 2.0:
+        # BA with m >= 1 generates <k> >= 2 by construction; mean<2
+        # means input is incompatible with the BA generator, not a
+        # finite-size artefact. Fail-closed instead of silently
+        # returning m=1 via the floor.
+        raise ValueError(
+            f"BA-incompatible input: <k>={mean_k:.4f} < 2; "
+            f"BA(m≥1) requires <k> ≥ 2 by Albert-Barabási 2002 eq. 4.7"
+        )
+    pl = fit_power_law(d, n_bootstrap=n_bootstrap, seed=seed, min_relative_se=min_relative_se)
+    m = int(round(mean_k / 2.0))
+    if m < 1:  # unreachable given mean_k>=2 above; fail-closed assertion
+        raise ValueError(f"BA m must satisfy m ≥ 1; got m={m} from <k>={mean_k:.4f}")
+    return m, pl
+
+
+def fit_barabasi_albert_from_topology(
+    topology: "InterbankTopology",
+    *,
+    n_bootstrap: int = 0,
+    seed: int = 42,
+    min_relative_se: float | None = None,
+) -> tuple[int, PowerLawFit]:
+    """Calibrate BA *m* directly from an :class:`InterbankTopology`.
+
+    Resolves the in+out-vs-undirected ambiguity introduced by
+    :attr:`InterbankTopology.degree` (which is the **sum** of in- and
+    out-degree, doubling undirected counts on symmetric graphs):
+
+    * Symmetric graphs: ``out_degree == in_degree`` and equals the
+      undirected per-node degree, so the BA identity ``<k>=2m``
+      applies directly to ``out_degree``.
+    * Asymmetric directed graphs: the natural BA analogue is the
+      out-degree distribution (each new node attaches *m* outgoing
+      edges); the BA identity again applies to ``out_degree``.
+
+    Both cases reduce to ``fit_barabasi_albert(topology.out_degree)``.
+    Reported *m* therefore matches the generator's *m* on
+    :func:`barabasi_albert_null` outputs to within ±1 at finite *N*.
+    """
+    return fit_barabasi_albert(
+        topology.out_degree,
+        n_bootstrap=n_bootstrap,
+        seed=seed,
+        min_relative_se=min_relative_se,
+    )
+
+
+# ---------------------------------------------------------------------------
+# Internals: k_min selection + KS statistic + bootstrap p
+# ---------------------------------------------------------------------------
+
+
+def _select_k_min(degrees: NDArray[np.int64]) -> int:
+    """Clauset-Shalizi-Newman 2009 §3.3 k_min selection by KS minimisation."""
+    candidates = np.unique(degrees[degrees >= 1])
+    # The largest few candidates leave too few tail points to fit; cap.
+    if candidates.size <= 4:
+        return int(candidates[0]) if candidates.size > 0 else 1
+    upper_idx = max(1, candidates.size - 4)
+    candidates = candidates[:upper_idx]
+    best_k_min = int(candidates[0])
+    best_ks = math.inf
+    for k_min in candidates:
+        tail = degrees[degrees >= k_min]
+        if tail.size < 4:
+            continue
+        log_ratio = float(np.log(tail.astype(np.float64) / (int(k_min) - 0.5)).sum())
+        if log_ratio <= 0:
+            continue
+        alpha = 1.0 + tail.size / log_ratio
+        ks = _ks_statistic_power_law(tail, alpha, int(k_min))
+        if ks < best_ks:
+            best_ks = ks
+            best_k_min = int(k_min)
+    return best_k_min
+
+
+def _power_law_cdf(k: NDArray[np.int64], alpha: float, k_min: int) -> NDArray[np.float64]:
+    """Continuous-approximation CDF for a discrete power-law tail."""
+    k_arr = np.asarray(k, dtype=np.float64)
+    return 1.0 - ((k_arr - 0.5) / (k_min - 0.5)) ** (1.0 - alpha)
+
+
+def _ks_statistic_power_law(tail: NDArray[np.int64], alpha: float, k_min: int) -> float:
+    sorted_tail = np.sort(tail)
+    n = sorted_tail.size
+    empirical_cdf = np.arange(1, n + 1, dtype=np.float64) / n
+    fitted_cdf = _power_law_cdf(sorted_tail, alpha, k_min)
+    return float(np.max(np.abs(empirical_cdf - fitted_cdf)))
+
+
+def _exponential_cdf(k: NDArray[np.float64], lam: float, k_min: int) -> NDArray[np.float64]:
+    k_arr = np.asarray(k, dtype=np.float64)
+    return 1.0 - np.exp(-lam * (k_arr - k_min))
+
+
+def _ks_statistic_exponential(tail: NDArray[np.float64], lam: float, k_min: int) -> float:
+    sorted_tail = np.sort(tail)
+    n = sorted_tail.size
+    empirical_cdf = np.arange(1, n + 1, dtype=np.float64) / n
+    fitted_cdf = _exponential_cdf(sorted_tail, lam, k_min)
+    return float(np.max(np.abs(empirical_cdf - fitted_cdf)))
+
+
+def _draw_power_law_sample(
+    n: int, alpha: float, k_min: int, rng: np.random.Generator
+) -> NDArray[np.int64]:
+    """Inverse-CDF sampler for the continuous power-law approximation."""
+    u = rng.random(n)
+    raw = (k_min - 0.5) * (1.0 - u) ** (1.0 / (1.0 - alpha)) + 0.5
+    return np.maximum(np.rint(raw).astype(np.int64), k_min)
+
+
+def _ks_p_value_power_law(
+    n: int,
+    alpha: float,
+    k_min: int,
+    *,
+    observed_ks: float,
+    n_bootstrap: int,
+    seed: int,
+) -> float:
+    rng = np.random.default_rng(seed)
+    exceedances = 0
+    for _ in range(n_bootstrap):
+        synthetic = _draw_power_law_sample(n, alpha, k_min, rng)
+        # Re-fit on the synthetic sample then compute its own KS.
+        log_ratio = float(np.log(synthetic.astype(np.float64) / (k_min - 0.5)).sum())
+        if log_ratio <= 0:
+            continue
+        synth_alpha = 1.0 + n / log_ratio
+        synth_ks = _ks_statistic_power_law(synthetic, synth_alpha, k_min)
+        if synth_ks >= observed_ks:
+            exceedances += 1
+    # Davison & Hinkley (1997) +1 continuity correction.
+    return float((exceedances + 1) / (n_bootstrap + 1))
diff --git a/research/systemic_risk/null_models.py b/research/systemic_risk/null_models.py
new file mode 100644
index 00000000..6c35c4b4
--- /dev/null
+++ b/research/systemic_risk/null_models.py
@@ -0,0 +1,384 @@
+# Copyright (c) 2023-2026 Yaroslav Vasylenko (neuron7xLab)
+# SPDX-License-Identifier: MIT
+"""Null-model baseline generators for the falsification battery.
+
+The official validation protocol (§ 8) requires every claimed
+detection to be compared against at least six orthogonal null
+baselines. A claim that does not survive *all six* is, by
+construction, indistinguishable from chance and may not advance
+beyond ``HYPOTHESIS`` tier.
+
+The six baselines, in order of stringency:
+
+1. **degree-preserving randomization** — rewires edges while
+   preserving each node's in-degree and out-degree (Maslov-Sneppen
+   shuffling on directed graphs). Tests whether the *signal*
+   depends on more than the marginal connectivity.
+2. **shuffled time labels** — the score time series is permuted
+   along the time axis. Destroys temporal ordering. Tests whether
+   any pre-event elevation is real or an artefact of sample size.
+3. **random exposure weights** — the binary adjacency is held
+   fixed, but every non-zero weight is replaced by an independent
+   draw from the empirical weight distribution. Tests whether the
+   *magnitudes* carry signal beyond the support graph.
+4. **static topology baseline** — the time-averaged adjacency is
+   substituted for every snapshot. Tests whether the temporal
+   evolution of the graph carries any predictive signal.
+5. **non-Kuramoto baseline** — replaces the order-parameter score
+   with the equivalent statistic from a linear-correlation
+   surrogate (mean pairwise Pearson correlation). Tests whether
+   the *non-linearity* of phase-coupling matters.
+6. **crisis-date permutation baseline** — the crisis dates
+   themselves are shuffled across the data span. Tests whether the
+   detection coincides with the labelled events or with arbitrary
+   dates.
+
+Each generator is a pure function returning a :class:`NullSurrogate`
+that the caller passes back through the appropriate detector path
+(score-replacing surrogates feed :func:`run_falsification`;
+topology-replacing surrogates feed the score-construction stack).
+A single composed audit entry-point that orchestrates all six is
+deferred until the empirical-data ingest lands — at that point the
+contract for "valid score from a surrogate topology" becomes
+testable end-to-end.
+
+Pure-function API. No I/O. Determinism via explicit ``seed``.
+"""
+
+from __future__ import annotations
+
+from dataclasses import dataclass
+from datetime import date
+from typing import Literal
+
+import numpy as np
+from numpy.typing import NDArray
+
+from .event_ledger import BankingCrisisEvent, BankingCrisisLedger
+from .topology import InterbankTopology
+
+__all__ = [
+    "NullName",
+    "NullSurrogate",
+    "degree_preserving_randomization",
+    "shuffled_time_labels",
+    "random_exposure_weights",
+    "static_topology_baseline",
+    "linear_correlation_surrogate",
+    "permuted_crisis_dates",
+]
+
+
+NullName = Literal[
+    "degree_preserving",
+    "shuffled_time_labels",
+    "random_exposure_weights",
+    "static_topology",
+    "linear_correlation",
+    "permuted_crisis_dates",
+]
+
+
+@dataclass(frozen=True, slots=True)
+class NullSurrogate:
+    """A single null-baseline output paired with its provenance."""
+
+    name: NullName
+    score: NDArray[np.float64] | None
+    topology: InterbankTopology | None
+    ledger: BankingCrisisLedger | None
+    seed: int
+
+
+# ---------------------------------------------------------------------------
+# 1. degree-preserving randomization (Maslov-Sneppen on directed graph)
+# ---------------------------------------------------------------------------
+
+
+def degree_preserving_randomization(
+    topology: InterbankTopology,
+    *,
+    seed: int,
+    n_swaps: int | None = None,
+) -> NullSurrogate:
+    """Maslov-Sneppen edge swap preserving in- and out-degree per node.
+
+    Implementation: pick two directed edges ``(a→b)`` and ``(c→d)``
+    uniformly at random; if ``a≠c``, ``a≠d``, ``b≠c``, ``b≠d`` and
+    neither ``(a→d)`` nor ``(c→b)`` already exists, rewire to
+    ``(a→d)`` and ``(c→b)``. Repeat ``n_swaps`` times. Default
+    ``n_swaps = 10 * E`` (Milo et al. 2003).
+    """
+    rng = np.random.default_rng(seed)
+    a = np.array(topology.adjacency, dtype=np.int8, copy=True)
+    a.flags.writeable = True
+    edges_iv = np.argwhere(a == 1)
+    n_edges = edges_iv.shape[0]
+    if n_edges < 2:
+        # Nothing to swap; return a defensive copy.
+        return NullSurrogate(
+            name="degree_preserving",
+            score=None,
+            topology=InterbankTopology(
+                adjacency=a,
+                node_labels=topology.node_labels,
+                source_label=f"{topology.source_label}::degree_preserving::seed={seed}",
+            ),
+            ledger=None,
+            seed=seed,
+        )
+    if n_swaps is None:
+        n_swaps = 10 * n_edges
+    edges = [tuple(int(x) for x in row) for row in edges_iv]
+    for _ in range(n_swaps):
+        i, j = int(rng.integers(0, n_edges)), int(rng.integers(0, n_edges))
+        if i == j:
+            continue
+        a_i, b_i = edges[i]
+        c_i, d_i = edges[j]
+        if len({a_i, b_i, c_i, d_i}) < 4:
+            continue
+        if a[a_i, d_i] == 1 or a[c_i, b_i] == 1:
+            continue
+        a[a_i, b_i] = 0
+        a[c_i, d_i] = 0
+        a[a_i, d_i] = 1
+        a[c_i, b_i] = 1
+        edges[i] = (a_i, d_i)
+        edges[j] = (c_i, b_i)
+    return NullSurrogate(
+        name="degree_preserving",
+        score=None,
+        topology=InterbankTopology(
+            adjacency=a,
+            node_labels=topology.node_labels,
+            source_label=f"{topology.source_label}::degree_preserving::seed={seed}",
+        ),
+        ledger=None,
+        seed=seed,
+    )
+
+
+# ---------------------------------------------------------------------------
+# 2. shuffled time labels
+# ---------------------------------------------------------------------------
+
+
+def shuffled_time_labels(
+    score: NDArray[np.float64],
+    *,
+    seed: int,
+) -> NullSurrogate:
+    """Permute the score series along the time axis. Destroys ordering."""
+    s = np.asarray(score, dtype=np.float64)
+    if s.ndim != 1:
+        raise ValueError(f"score must be 1-D, got shape={s.shape}")
+    rng = np.random.default_rng(seed)
+    permuted = rng.permutation(s)
+    return NullSurrogate(
+        name="shuffled_time_labels",
+        score=permuted,
+        topology=None,
+        ledger=None,
+        seed=seed,
+    )
+
+
+# ---------------------------------------------------------------------------
+# 3. random exposure weights (preserves binary support)
+# ---------------------------------------------------------------------------
+
+
+def random_exposure_weights(
+    topology: InterbankTopology,
+    *,
+    seed: int,
+) -> NullSurrogate:
+    """Resample weights from the empirical distribution while preserving the
+    binary adjacency.
+
+    Implementation note: only meaningful when ``topology.weights is not None``.
+    For a topology without empirical weights (e.g. BA null), returns a
+    surrogate whose weights are zeroed.
+    """
+    rng = np.random.default_rng(seed)
+    a = np.array(topology.adjacency, dtype=np.int8, copy=True)
+    n = a.shape[0]
+    if topology.weights is None:
+        new_w: NDArray[np.float64] | None = None
+    else:
+        empirical = topology.weights[a == 1]
+        if empirical.size == 0:
+            new_w = np.zeros((n, n), dtype=np.float64)
+        else:
+            sampled = rng.choice(empirical, size=int(a.sum()), replace=True)
+            new_w = np.zeros((n, n), dtype=np.float64)
+            new_w[a == 1] = sampled
+            np.fill_diagonal(new_w, 0.0)
+    return NullSurrogate(
+        name="random_exposure_weights",
+        score=None,
+        topology=InterbankTopology(
+            adjacency=a,
+            weights=new_w,
+            node_labels=topology.node_labels,
+            source_label=f"{topology.source_label}::random_weights::seed={seed}",
+        ),
+        ledger=None,
+        seed=seed,
+    )
+
+
+# ---------------------------------------------------------------------------
+# 4. static topology baseline (time-mean adjacency)
+# ---------------------------------------------------------------------------
+
+
+def static_topology_baseline(
+    snapshots: tuple[InterbankTopology, ...],
+    *,
+    seed: int,
+) -> NullSurrogate:
+    """Substitute the time-mean adjacency for every snapshot.
+
+    Strips temporal evolution of the graph. Returns a single
+    surrogate topology whose binary support is the union of all
+    snapshot supports and whose weights (if present on every
+    snapshot) are the snapshot mean.
+    """
+    if len(snapshots) == 0:
+        raise ValueError("snapshots tuple must be non-empty")
+    n = snapshots[0].n_nodes
+    if any(t.n_nodes != n for t in snapshots):
+        raise ValueError("all snapshots must share the same node count")
+    union = np.zeros((n, n), dtype=np.int8)
+    for t in snapshots:
+        union |= t.adjacency
+    # Mean weights only when every snapshot carries a weights matrix.
+    if all(t.weights is not None for t in snapshots):
+        mean_w = np.mean(
+            np.stack([t.weights for t in snapshots]),  # type: ignore[misc]
+            axis=0,
+        ).astype(np.float64)
+        np.fill_diagonal(mean_w, 0.0)
+    else:
+        mean_w = None
+    return NullSurrogate(
+        name="static_topology",
+        score=None,
+        topology=InterbankTopology(
+            adjacency=union,
+            weights=mean_w,
+            node_labels=snapshots[0].node_labels,
+            source_label=f"static_topology::N_snapshots={len(snapshots)}::seed={seed}",
+        ),
+        ledger=None,
+        seed=seed,
+    )
+
+
+# ---------------------------------------------------------------------------
+# 5. linear-correlation surrogate (non-Kuramoto)
+# ---------------------------------------------------------------------------
+
+
+def linear_correlation_surrogate(
+    spreads: NDArray[np.float64],
+    *,
+    seed: int,
+) -> NullSurrogate:
+    """Replace the Kuramoto order parameter with mean pairwise Pearson
+    correlation over a rolling window — a *linear* coherence statistic.
+
+    Returns a per-bank-pair correlation matrix collapsed to a single
+    series (mean off-diagonal correlation per time-step) for direct
+    A/B comparison with the Kuramoto-based score.
+
+    Parameters
+    ----------
+    spreads
+        Shape ``(T, N_banks)``, finite log-returns or interbank
+        spreads (canonical ``(T, N)`` layout).
+    """
+    s = np.asarray(spreads, dtype=np.float64)
+    if s.ndim != 2:
+        raise ValueError(f"spreads must be 2-D (T, N), got shape={s.shape}")
+    if s.shape[0] < 2:
+        raise ValueError(f"spreads must have at least 2 time samples, got T={s.shape[0]}")
+    if not np.isfinite(s).all():
+        raise ValueError("spreads must be finite")
+    # Mean off-diagonal Pearson correlation per single rolling step
+    # is collapsed here into a single time-resolved series via a
+    # 30-step trailing window. Caller may override via direct
+    # composition if a different window is needed.
+    window = min(30, s.shape[0])
+    out = np.full(s.shape[0], np.nan, dtype=np.float64)
+    for t in range(window - 1, s.shape[0]):
+        seg = s[t - window + 1 : t + 1]
+        # Centre + scale.
+        seg_c = seg - seg.mean(axis=0, keepdims=True)
+        std = seg_c.std(axis=0, ddof=1)
+        # bounds: zero-variance columns ⇒ undefined Pearson;
+        # set their pairwise contribution to NaN so the mean
+        # propagates the signal honestly.
+        std_safe = np.where(std > 0, std, np.nan)
+        norm = seg_c / std_safe
+        corr = (norm.T @ norm) / (window - 1)
+        np.fill_diagonal(corr, np.nan)
+        out[t] = float(np.nanmean(corr))
+    return NullSurrogate(
+        name="linear_correlation",
+        score=out,
+        topology=None,
+        ledger=None,
+        seed=seed,
+    )
+
+
+# ---------------------------------------------------------------------------
+# 6. permuted crisis dates
+# ---------------------------------------------------------------------------
+
+
+def permuted_crisis_dates(
+    ledger: BankingCrisisLedger,
+    *,
+    earliest: date,
+    latest: date,
+    seed: int,
+) -> NullSurrogate:
+    """Shuffle every event start (and matching end) to a uniformly random
+    date in ``[earliest, latest - duration]``.
+
+    Preserves the per-event duration distribution so the null
+    population is comparable to the empirical one.
+    """
+    if latest <= earliest:
+        raise ValueError(f"latest={latest} must exceed earliest={earliest}")
+    span_days = (latest - earliest).days
+    rng = np.random.default_rng(seed)
+    permuted: list[BankingCrisisEvent] = []
+    from datetime import timedelta as _td
+
+    for ev in ledger.events:
+        duration_days = (ev.end - ev.start).days
+        max_offset = max(0, span_days - duration_days)
+        offset = int(rng.integers(0, max_offset + 1))
+        new_start = earliest + _td(days=offset)
+        new_end = new_start + _td(days=duration_days)
+        permuted.append(
+            BankingCrisisEvent(
+                country=ev.country,
+                start=new_start,
+                end=new_end,
+                source=ev.source,
+                label=f"{ev.label}_permuted",
+            )
+        )
+    return NullSurrogate(
+        name="permuted_crisis_dates",
+        score=None,
+        topology=None,
+        ledger=BankingCrisisLedger(events=tuple(permuted)),
+        seed=seed,
+    )
diff --git a/research/systemic_risk/replication.py b/research/systemic_risk/replication.py
new file mode 100644
index 00000000..1d5fc9a2
--- /dev/null
+++ b/research/systemic_risk/replication.py
@@ -0,0 +1,200 @@
+# Copyright (c) 2023-2026 Yaroslav Vasylenko (neuron7xLab)
+# SPDX-License-Identifier: MIT
+"""Replication manifest for every falsification run.
+
+Section 13 of the official validation protocol mandates that every
+run preserves: commit hash, dataset version, config, random seed,
+dependency lockfile, machine environment, timestamp, full logs,
+generated figures, raw metrics, failed tests. This module captures
+the *static* part of that contract — the run-time provenance —
+in a single deterministic dataclass that callers persist alongside
+their numerical artefacts.
+
+The dynamic parts (logs, figures) are the orchestrator's responsibility;
+this module exists so that no caller can invent its own provenance
+schema and silently omit a field.
+
+Pure-function API. Reads the system state once at construction.
+"""
+
+from __future__ import annotations
+
+import hashlib
+import json
+import os
+import platform
+import subprocess
+import sys
+from dataclasses import dataclass, field
+from datetime import datetime, timezone
+from pathlib import Path
+from typing import Any
+
+__all__ = [
+    "RunManifest",
+    "build_run_manifest",
+]
+
+
+@dataclass(frozen=True, slots=True)
+class RunManifest:
+    """Deterministic provenance record for a single falsification run.
+
+    Attributes
+    ----------
+    commit_sha
+        Output of ``git rev-parse HEAD`` at run start. ``"unknown"``
+        when not in a git tree.
+    git_dirty
+        ``True`` when the working tree has uncommitted changes —
+        callers should refuse to claim ``MEASURED`` from a dirty run.
+    timestamp_utc
+        ISO-8601 UTC timestamp at manifest construction.
+    seed
+        The single root RNG seed used for the run. Every downstream
+        sub-process derives its seed deterministically from this one.
+    config_hash
+        SHA-256 of ``json.dumps(config, sort_keys=True)`` so any
+        change to the config produces a different hash.
+    python
+        ``sys.version`` short form (e.g. ``"3.12.5 (...)"``).
+    platform_info
+        ``platform.platform()`` — kernel, distro, machine.
+    package_versions
+        Mapping of every loaded *runtime-relevant* package to its
+        version string (numpy, scipy, pandas, networkx, sklearn,
+        scipy, the GeoSync wheel itself).
+    config
+        Full caller-supplied config dict (echoed verbatim). Together
+        with ``config_hash`` it forms the falsification's frozen
+        pre-registration.
+    extra
+        Free-form metadata for caller-specific provenance fields
+        (e.g. ``{"dataset": "e-MID_2009Q1-2015Q4", "data_sha256": "..."}``).
+    """
+
+    commit_sha: str
+    git_dirty: bool
+    timestamp_utc: str
+    seed: int
+    config_hash: str
+    python: str
+    platform_info: str
+    package_versions: dict[str, str]
+    config: dict[str, Any]
+    extra: dict[str, Any] = field(default_factory=dict)
+
+    def to_json(self) -> str:
+        """Deterministic JSON serialisation (sorted keys + trailing newline)."""
+        payload = {
+            "commit_sha": self.commit_sha,
+            "git_dirty": self.git_dirty,
+            "timestamp_utc": self.timestamp_utc,
+            "seed": self.seed,
+            "config_hash": self.config_hash,
+            "python": self.python,
+            "platform_info": self.platform_info,
+            "package_versions": dict(sorted(self.package_versions.items())),
+            "config": self.config,
+            "extra": dict(sorted(self.extra.items())),
+        }
+        return json.dumps(payload, indent=2, sort_keys=True) + "\n"
+
+
+def _git_head_sha(cwd: Path) -> tuple[str, bool]:
+    try:
+        sha = subprocess.run(  # nosec B603 - explicit argv
+            ["git", "rev-parse", "HEAD"],
+            cwd=str(cwd),
+            check=True,
+            capture_output=True,
+            text=True,
+            timeout=5,
+        ).stdout.strip()
+    except (subprocess.CalledProcessError, FileNotFoundError, subprocess.TimeoutExpired):
+        return "unknown", False
+    try:
+        status = subprocess.run(  # nosec B603 - explicit argv
+            ["git", "status", "--porcelain"],
+            cwd=str(cwd),
+            check=True,
+            capture_output=True,
+            text=True,
+            timeout=5,
+        ).stdout
+    except (subprocess.CalledProcessError, FileNotFoundError, subprocess.TimeoutExpired):
+        return sha, False
+    return sha, bool(status.strip())
+
+
+_RELEVANT_PACKAGES: tuple[str, ...] = (
+    "numpy",
+    "scipy",
+    "pandas",
+    "networkx",
+    "scikit-learn",
+    "geosync",
+)
+
+
+def _package_versions() -> dict[str, str]:
+    out: dict[str, str] = {}
+    for name in _RELEVANT_PACKAGES:
+        try:
+            from importlib.metadata import PackageNotFoundError, version
+
+            out[name] = version(name)
+        except PackageNotFoundError:
+            out[name] = "not-installed"
+        except Exception:  # pragma: no cover - defensive
+            out[name] = "unknown"
+    return out
+
+
+def _config_hash(config: dict[str, Any]) -> str:
+    encoded = json.dumps(config, sort_keys=True, default=str).encode("utf-8")
+    return hashlib.sha256(encoded).hexdigest()
+
+
+def build_run_manifest(
+    *,
+    seed: int,
+    config: dict[str, Any],
+    extra: dict[str, Any] | None = None,
+    cwd: Path | None = None,
+) -> RunManifest:
+    """Capture the system state into a frozen :class:`RunManifest`.
+
+    Parameters
+    ----------
+    seed
+        Root RNG seed for the run.
+    config
+        Full pre-registered config dict — every threshold, window
+        length, bootstrap count, etc. The dict is hashed with
+        ``sort_keys=True`` so any change produces a different
+        ``config_hash``.
+    extra
+        Optional free-form metadata (dataset id, data sha256, ...).
+    cwd
+        Working directory used for ``git`` calls. Defaults to
+        ``Path.cwd()``.
+    """
+    cwd_path = cwd if cwd is not None else Path.cwd()
+    sha, dirty = _git_head_sha(cwd_path)
+    return RunManifest(
+        commit_sha=sha,
+        git_dirty=dirty,
+        timestamp_utc=datetime.now(timezone.utc).isoformat(timespec="seconds"),
+        seed=int(seed),
+        config_hash=_config_hash(config),
+        python=(
+            sys.version.split(" (")[0] + " (" + sys.version.split(" (", 1)[1]
+            if "(" in sys.version
+            else sys.version
+        ),
+        platform_info=platform.platform() + " | " + os.uname().machine,
+        package_versions=_package_versions(),
+        config=dict(config),
+        extra=dict(extra) if extra is not None else {},
+    )
diff --git a/research/systemic_risk/topology.py b/research/systemic_risk/topology.py
index 56801e44..9e99345a 100644
--- a/research/systemic_risk/topology.py
+++ b/research/systemic_risk/topology.py
@@ -1,35 +1,43 @@
 # Copyright (c) 2023-2026 Yaroslav Vasylenko (neuron7xLab)
 # SPDX-License-Identifier: MIT
-"""Interbank network topology — empirical adapter + null baselines.
+"""Interbank network topology — directed empirical adapter + null baselines.
+
+Real interbank exposures are *directed*: bank *i* lending to bank *j* is
+not the same as *j* lending to *i*. Symmetrising the graph, as v1 of this
+module did, throws away the credit-direction signal that determines
+which institution propagates stress to which neighbour. v2 builds a
+directed (asymmetric) adjacency by default and supports an explicit
+symmetric override only for null-model baselines.
 
 Two construction paths:
 
-1. **Empirical**: weighted, possibly directed exposure matrix
-   (``A[i, j]`` = lending from bank *i* to bank *j*) is symmetrised with
-   :math:`A_{sym} = (A + A^T) / 2` and binarised at a documented
-   threshold to give the undirected coupling support used by the
-   Kuramoto model. The binary skeleton is what enters the inverse
-   problem; magnitudes are kept on a parallel ``weights`` matrix for
-   diagnostics.
-
-2. **Barabási–Albert null** (preferential attachment, *m* edges per
-   step). Empirical interbank networks are well documented to be
-   approximately scale-free with γ ≈ 2.0–2.3 (Boss et al. 2004,
-   *Quant. Finance* 4: 677; Soramäki et al. 2007, *Physica A* 379:
-   317). BA at *m* ≈ 2–4 reproduces this regime and is used **only** as
-   the topology-null baseline of the falsification battery, never as a
-   model of the real economy.
-
-Pure-function API. No I/O. No randomness except where ``rng`` is passed.
+1. **Empirical** (:func:`from_exposure_matrix`): a possibly directed
+   exposure matrix :math:`E` where :math:`E_{ij}` = lending from bank
+   *i* to bank *j* is binarised at a documented threshold.
+   ``directed=True`` (default) keeps the asymmetric structure;
+   ``directed=False`` averages :math:`E` with :math:`E^T` first
+   (legacy/null-only).
+
+2. **Barabási–Albert null** (:func:`barabasi_albert_null`,
+   :func:`fit_barabasi_albert`): the BA generator produces a symmetric
+   graph by construction; :func:`fit_barabasi_albert` fits the
+   power-law exponent of an *empirical* degree sequence by MLE
+   (Clauset, Shalizi, Newman 2009, *SIAM Rev.* 51: 661) so the null
+   baseline is calibrated to the data, not hard-coded at *m=2*.
+
+Pure-function API. No I/O. Determinism via explicit seeds.
 """
 
 from __future__ import annotations
 
 from dataclasses import dataclass
+from datetime import date
 
 import numpy as np
 from numpy.typing import NDArray
 
+from .errors import InvalidExposureMatrixError, InvalidNodeLabelsError
+
 __all__ = [
     "InterbankTopology",
     "from_exposure_matrix",
@@ -44,39 +52,46 @@ class InterbankTopology:
     Attributes
     ----------
     adjacency
-        Binary symmetric adjacency, ``int8`` shape ``(N, N)``, zero
-        diagonal. ``adjacency[i, j] == 1`` iff there is a coupling
-        between *i* and *j* in the support graph.
+        Binary adjacency, ``int8`` shape ``(N, N)``, zero diagonal.
+        ``adjacency[i, j] == 1`` iff there is a directed edge *i → j*
+        in the support graph (lending from *i* to *j*). May be
+        symmetric (BA null) or asymmetric (empirical exposures).
     weights
-        Real, non-negative, symmetric exposure magnitudes shape
-        ``(N, N)``, zero diagonal. ``None`` when the topology was
-        generated synthetically (BA null).
+        Real, non-negative magnitudes shape ``(N, N)``, zero diagonal.
+        Symmetric iff ``adjacency`` is symmetric. ``None`` when the
+        topology was generated synthetically.
     node_labels
         Tuple of node identifiers; length ``N``.
     source_label
         Free-form provenance tag, e.g. ``"e-MID_2011-Q3"`` or
         ``"BA_null_m=3_seed=42"``.
+    snapshot_date
+        Calendar date the snapshot pertains to. ``None`` when the
+        topology represents a static null model.
 
     Invariants
     ----------
-    INV-TOP1: ``adjacency`` is symmetric, binary, zero-diagonal.
-    INV-TOP2: ``weights`` (when present) is symmetric, non-negative,
+    INV-TOP1: ``adjacency`` is binary, square 2-D, zero-diagonal.
+    INV-TOP2: ``weights`` (when present) is non-negative, finite,
               zero-diagonal, with the same shape as ``adjacency``.
     INV-TOP3: ``len(node_labels) == adjacency.shape[0]``.
+    INV-TOP4 (asymmetry): for empirical directed inputs, the bound
+              ``mean(adjacency != adjacency.T) > 0`` is reported but
+              not enforced — symmetric empirical graphs are valid
+              edge cases (e.g. fully reciprocated lending).
     """
 
     adjacency: NDArray[np.int8]
     node_labels: tuple[str, ...]
     source_label: str
     weights: NDArray[np.float64] | None = None
+    snapshot_date: date | None = None
 
     def __post_init__(self) -> None:
         a = self.adjacency
         if a.ndim != 2 or a.shape[0] != a.shape[1]:
             raise ValueError(f"INV-TOP1: adjacency must be square 2-D, got shape={a.shape}")
         n = a.shape[0]
-        if not np.array_equal(a, a.T):
-            raise ValueError("INV-TOP1: adjacency must be symmetric")
         if not np.all((a == 0) | (a == 1)):
             raise ValueError("INV-TOP1: adjacency must be binary {0,1}")
         if np.any(np.diag(a) != 0):
@@ -87,10 +102,10 @@ def __post_init__(self) -> None:
         if w is not None:
             if w.shape != a.shape:
                 raise ValueError(f"INV-TOP2: weights shape={w.shape} != adjacency {a.shape}")
-            if not np.allclose(w, w.T, equal_nan=False):
-                raise ValueError("INV-TOP2: weights must be symmetric")
             if np.any(w < 0):
                 raise ValueError("INV-TOP2: weights must be non-negative")
+            if not np.isfinite(w).all():
+                raise ValueError("INV-TOP2: weights must be finite (no NaN/Inf)")
             if np.any(np.diag(w) != 0):
                 raise ValueError("INV-TOP2: weights must have zero diagonal")
         # Freeze arrays to prevent silent mutation downstream.
@@ -107,10 +122,44 @@ def n_nodes(self) -> int:
         return int(self.adjacency.shape[0])
 
     @property
-    def degree(self) -> NDArray[np.int64]:
+    def is_symmetric(self) -> bool:
+        return bool(np.array_equal(self.adjacency, self.adjacency.T))
+
+    @property
+    def asymmetry_fraction(self) -> float:
+        """Fraction of off-diagonal entries that differ between A and A.T.
+
+        ``0.0`` for fully symmetric graphs; bounded above by 1.0. Used
+        by the asymmetry-invariant test on real-data adapters.
+        """
+        a = self.adjacency
+        if a.shape[0] <= 1:
+            return 0.0
+        diff = a != a.T
+        # Off-diagonal entries only; diagonal is zero on both sides.
+        np.fill_diagonal(diff, False)
+        n = a.shape[0]
+        denom = float(n * (n - 1))
+        return float(diff.sum()) / denom if denom > 0 else 0.0
+
+    @property
+    def in_degree(self) -> NDArray[np.int64]:
+        """Number of incoming edges per node (sum over rows)."""
+        out: NDArray[np.int64] = self.adjacency.sum(axis=0, dtype=np.int64)
+        return out
+
+    @property
+    def out_degree(self) -> NDArray[np.int64]:
+        """Number of outgoing edges per node (sum over columns)."""
         out: NDArray[np.int64] = self.adjacency.sum(axis=1, dtype=np.int64)
         return out
 
+    @property
+    def degree(self) -> NDArray[np.int64]:
+        """Total degree per node (in + out). For symmetric graphs equals 2*out_degree."""
+        out: NDArray[np.int64] = self.in_degree + self.out_degree
+        return out
+
 
 def from_exposure_matrix(
     exposures: NDArray[np.float64],
@@ -118,43 +167,80 @@ def from_exposure_matrix(
     *,
     threshold: float = 0.0,
     source_label: str = "empirical_exposure",
+    directed: bool = True,
+    snapshot_date: date | None = None,
 ) -> InterbankTopology:
-    """Build an :class:`InterbankTopology` from a possibly directed exposure matrix.
+    """Build an :class:`InterbankTopology` from a directed exposure matrix.
 
     Parameters
     ----------
     exposures
         Real, non-negative matrix shape ``(N, N)``. ``exposures[i, j]``
         is the magnitude of *i*'s exposure to *j* (e.g. lending volume).
-        May be directed; symmetrisation by averaging is applied.
     node_labels
         Length-``N`` tuple of node identifiers.
     threshold
-        Inclusive lower bound on a symmetrised entry for it to enter
-        the binary support. Default ``0.0`` keeps every non-zero edge.
+        **Strict** lower cutoff: ``A[i, j] = 1`` iff
+        ``weights[i, j] > threshold`` (an entry equal to ``threshold``
+        is *not* an edge). Default ``0.0`` admits every strictly-
+        positive entry — zero-exposure cells never become edges.
     source_label
         Provenance tag stored on the resulting topology.
+    directed
+        If ``True`` (default), preserve the asymmetric exposure
+        structure: ``A[i,j] = 1`` iff ``exposures[i,j] > threshold``.
+        If ``False``, symmetrise via :math:`(E + E^T)/2` before
+        thresholding — used only by the null baseline.
+    snapshot_date
+        Optional calendar date the snapshot pertains to. Required for
+        temporal-snapshot pipelines (e-MID quarterly, BIS LBS).
+
+    HARD_FAIL conditions
+    --------------------
+    * ``exposures`` not 2-D / not square ⇒ :class:`InvalidExposureMatrixError`.
+    * Length of ``node_labels`` ≠ N ⇒ :class:`InvalidNodeLabelsError`.
+    * ``node_labels`` contain duplicates or empty strings ⇒
+      :class:`InvalidNodeLabelsError`.
+    * ``exposures`` contains negatives, NaN, or Inf ⇒
+      :class:`InvalidExposureMatrixError`.
+    * ``threshold`` < 0 ⇒ :class:`InvalidExposureMatrixError`.
     """
     e = np.asarray(exposures, dtype=np.float64)
     if e.ndim != 2 or e.shape[0] != e.shape[1]:
-        raise ValueError(f"exposures must be square 2-D, got shape={e.shape}")
+        raise InvalidExposureMatrixError(f"exposures must be square 2-D, got shape={e.shape}")
     if e.shape[0] != len(node_labels):
-        raise ValueError(f"node_labels length {len(node_labels)} != exposures dim {e.shape[0]}")
-    if np.any(e < 0):
-        raise ValueError("exposures must be non-negative")
+        raise InvalidNodeLabelsError(
+            f"node_labels length {len(node_labels)} != exposures dim {e.shape[0]}"
+        )
+    if any(lbl is None for lbl in node_labels):
+        raise InvalidNodeLabelsError("node_labels must not contain None")
+    if any(not isinstance(lbl, str) for lbl in node_labels):
+        raise InvalidNodeLabelsError("node_labels must contain only str values")
+    if any(lbl.strip() == "" for lbl in node_labels):
+        raise InvalidNodeLabelsError(
+            "node_labels must not contain empty or whitespace-only strings"
+        )
+    if len(set(node_labels)) != len(node_labels):
+        raise InvalidNodeLabelsError("node_labels must be unique")
     if not np.isfinite(e).all():
-        raise ValueError("exposures must be finite (no NaN/Inf)")
+        raise InvalidExposureMatrixError("exposures must be finite (no NaN/Inf)")
+    if np.any(e < 0):
+        raise InvalidExposureMatrixError("exposures must be non-negative")
     if threshold < 0:
-        raise ValueError(f"threshold must be >= 0, got {threshold}")
-    sym = 0.5 * (e + e.T)
-    np.fill_diagonal(sym, 0.0)
-    adj = (sym > threshold).astype(np.int8)
+        raise InvalidExposureMatrixError(f"threshold must be >= 0, got {threshold}")
+    if directed:
+        weights = np.array(e, dtype=np.float64, copy=True)
+    else:
+        weights = 0.5 * (e + e.T)
+    np.fill_diagonal(weights, 0.0)
+    adj = (weights > threshold).astype(np.int8)
     np.fill_diagonal(adj, 0)
     return InterbankTopology(
         adjacency=adj,
-        weights=sym,
+        weights=weights,
         node_labels=tuple(node_labels),
         source_label=source_label,
+        snapshot_date=snapshot_date,
     )
 
 
@@ -167,14 +253,15 @@ def barabasi_albert_null(
 ) -> InterbankTopology:
     """Barabási–Albert preferential attachment, *m* edges per new node.
 
-    Implementation is self-contained (no NetworkX dependency) so the
-    module remains importable in minimal install environments and
-    the seed semantics are unambiguous: ``rng = default_rng(seed)``.
+    Implementation is self-contained (no NetworkX dependency). Produces
+    a *symmetric* graph by construction — used as the null baseline of
+    the falsification battery, never as a model of the real economy.
 
     Empirical anchor: :math:`m \\in \\{2, 3, 4\\}` reproduces interbank
     degree distributions observed in Boss et al. 2004 and Soramäki et
     al. 2007. The mean degree of the resulting graph is ``2m`` for
-    large ``n``.
+    large ``n``. To pick *m* directly from data use
+    :func:`research.systemic_risk.network_fitting.fit_barabasi_albert`.
 
     Parameters
     ----------
@@ -183,8 +270,7 @@ def barabasi_albert_null(
     m
         Edges added per new node (must be >= 1).
     seed
-        Seed for ``np.random.default_rng``. Required — there is no
-        sensible default for a null model.
+        Seed for ``np.random.default_rng``. Required.
     source_label
         Optional override for the resulting ``source_label`` field.
     """
diff --git a/tests/research/systemic_risk/test_coupling.py b/tests/research/systemic_risk/test_coupling.py
new file mode 100644
index 00000000..73f890fc
--- /dev/null
+++ b/tests/research/systemic_risk/test_coupling.py
@@ -0,0 +1,174 @@
+# Copyright (c) 2023-2026 Yaroslav Vasylenko (neuron7xLab)
+# SPDX-License-Identifier: MIT
+"""Tests for :mod:`research.systemic_risk.coupling`."""
+
+from __future__ import annotations
+
+import numpy as np
+import pytest
+
+from research.systemic_risk.coupling import (
+    coupling_from_exposures,
+    omega_from_volatility,
+    sakaguchi_alpha_zero,
+)
+
+
+class TestCouplingFromExposures:
+    def test_row_stochastic_default(self) -> None:
+        e = np.array([[0.0, 1.0, 3.0], [2.0, 0.0, 0.0], [0.0, 0.0, 0.0]], dtype=np.float64)
+        K = coupling_from_exposures(e)
+        # Row 0 sums to (1+3)/4 = 1.0; row 1 → 1.0; row 2 sums stay 0.
+        np.testing.assert_allclose(K.sum(axis=1), [1.0, 1.0, 0.0], atol=1e-12)
+        # Asymmetric: K[0,1]=0.25, K[1,0]=1.0 ⇒ K ≠ K^T.
+        assert not np.allclose(K, K.T)
+
+    def test_zero_diagonal(self) -> None:
+        e = np.eye(4, dtype=np.float64) * 5.0
+        K = coupling_from_exposures(e)
+        assert np.all(np.diag(K) == 0.0)
+
+    def test_capital_weighted(self) -> None:
+        e = np.array([[0.0, 4.0], [2.0, 0.0]], dtype=np.float64)
+        cap = np.array([2.0, 1.0], dtype=np.float64)
+        K = coupling_from_exposures(e, normalisation="capital_weighted", capital=cap)
+        # Row 0: 4 / 2 = 2; row 1: 2 / 1 = 2.
+        assert K[0, 1] == pytest.approx(2.0)
+        assert K[1, 0] == pytest.approx(2.0)
+
+    def test_capital_required_when_weighted(self) -> None:
+        e = np.array([[0.0, 1.0], [1.0, 0.0]], dtype=np.float64)
+        with pytest.raises(ValueError, match="capital"):
+            coupling_from_exposures(e, normalisation="capital_weighted")
+
+    def test_zero_capital_rejected(self) -> None:
+        e = np.array([[0.0, 1.0], [1.0, 0.0]], dtype=np.float64)
+        cap = np.array([0.0, 1.0])
+        with pytest.raises(ValueError):
+            coupling_from_exposures(e, normalisation="capital_weighted", capital=cap)
+
+    def test_floor_zeros_small_entries(self) -> None:
+        e = np.array([[0.0, 1.0, 100.0]] * 3, dtype=np.float64)
+        np.fill_diagonal(e, 0.0)
+        K = coupling_from_exposures(e, floor=0.05)
+        # Row-stochastic puts ~0.0099 on the small entry → below 0.05 floor.
+        assert K[0, 1] == 0.0
+        # Large entry survives.
+        assert K[0, 2] > 0.0
+
+    def test_floor_inclusive_at_exact_boundary(self) -> None:
+        # Documentation guarantees an *inclusive* lower bound on the
+        # kept set: an entry equal to ``floor`` survives.
+        e = np.array([[0.0, 0.5, 0.5], [0.5, 0.0, 0.5], [0.5, 0.5, 0.0]], dtype=np.float64)
+        # Row-stochastic produces equal off-diagonal entries == 0.5.
+        K = coupling_from_exposures(e, floor=0.5)
+        assert K[0, 1] == 0.5, (
+            f"floor inclusivity violated: entry equal to floor=0.5 "
+            f"clamped to {K[0, 1]} (expected 0.5)"
+        )
+
+    def test_all_zero_row_survives_without_crash(self) -> None:
+        # Bank with no outgoing exposures: row sum is zero, must
+        # NOT trigger division-by-zero noise. Coupling row stays 0.
+        e = np.array([[0.0, 0.0, 0.0], [1.0, 0.0, 2.0], [3.0, 4.0, 0.0]], dtype=np.float64)
+        K = coupling_from_exposures(e)
+        assert np.all(K[0, :] == 0.0)
+        assert np.isfinite(K).all()
+        # Other rows must still be row-stochastic.
+        np.testing.assert_allclose(K[1, :].sum(), 1.0, atol=1e-12)
+        np.testing.assert_allclose(K[2, :].sum(), 1.0, atol=1e-12)
+
+    def test_nan_exposure_rejected(self) -> None:
+        e = np.array([[0.0, np.nan], [1.0, 0.0]], dtype=np.float64)
+        with pytest.raises(ValueError, match="finite"):
+            coupling_from_exposures(e)
+
+    def test_negative_exposure_rejected(self) -> None:
+        with pytest.raises(ValueError):
+            coupling_from_exposures(np.array([[0.0, -1.0], [-1.0, 0.0]]))
+
+    def test_orientation_invariant_2x2(self) -> None:
+        # Per the canonical orientation invariant in coupling.py:
+        #   E[i, j] = i lent to j (i's exposure to j)
+        #   K[i, j] = stress felt by i from j ∝ E[i, j]
+        # A 2×2 directed example: bank 0 lends 9 units to bank 1,
+        # bank 1 lends 1 unit to bank 0. K must reflect this
+        # asymmetry without transposing.
+        e = np.array([[0.0, 9.0], [1.0, 0.0]], dtype=np.float64)
+        K = coupling_from_exposures(e, normalisation="raw")
+        # Raw retains the magnitudes; only the diagonal is cleared.
+        assert K[0, 1] == 9.0, (
+            "INV-K-ORIENTATION VIOLATED: K[0,1] should encode bank 0's "
+            "stress from bank 1 ∝ E[0,1]=9 (0's loan to 1); got "
+            f"{K[0, 1]}. A wrong-direction transpose would give 1.0."
+        )
+        assert K[1, 0] == 1.0, (
+            "INV-K-ORIENTATION VIOLATED: K[1,0] should encode bank 1's "
+            "stress from bank 0 ∝ E[1,0]=1 (1's loan to 0); got "
+            f"{K[1, 0]}. A wrong-direction transpose would give 9.0."
+        )
+        # Row-stochastic must also preserve orientation (now 9/9, 1/1).
+        K_rs = coupling_from_exposures(e)  # default row_stochastic
+        assert K_rs[0, 1] == pytest.approx(1.0), (
+            f"row-stochastic orientation drift: K[0,1]={K_rs[0, 1]}, "
+            f"expected 1.0 (only outgoing edge from row 0)"
+        )
+        assert K_rs[1, 0] == pytest.approx(1.0)
+
+
+class TestOmegaFromVolatility:
+    def test_finite_output(self) -> None:
+        rng = np.random.default_rng(0)
+        log_returns = rng.standard_normal((500, 8))
+        omega = omega_from_volatility(log_returns)
+        assert omega.shape == (8,)
+        assert np.all(np.isfinite(omega))
+        assert np.all(omega > 0.0)
+
+    def test_high_vol_higher_omega(self) -> None:
+        rng = np.random.default_rng(0)
+        low = rng.standard_normal((1000, 4)) * 0.1
+        high = rng.standard_normal((1000, 4)) * 1.0
+        ω_low = omega_from_volatility(low)
+        ω_high = omega_from_volatility(high)
+        assert float(ω_high.mean()) > float(ω_low.mean())
+
+    def test_invalid_fs_rejected(self) -> None:
+        with pytest.raises(ValueError):
+            omega_from_volatility(np.zeros((10, 3)), fs=0.0)
+
+    def test_single_observation_rejected(self) -> None:
+        # Regression: Codex flagged that std(ddof=1) on T=1 returns NaN
+        # silently. The validator must fail-closed on T < 2.
+        with pytest.raises(ValueError, match="at least 2 time samples"):
+            omega_from_volatility(np.zeros((1, 4)))
+
+    def test_zero_observations_rejected(self) -> None:
+        with pytest.raises(ValueError, match="at least 2 time samples"):
+            omega_from_volatility(np.zeros((0, 4)))
+
+    def test_inf_input_rejected(self) -> None:
+        bad = np.zeros((10, 3), dtype=np.float64)
+        bad[5, 1] = np.inf
+        with pytest.raises(ValueError, match="finite"):
+            omega_from_volatility(bad)
+
+    def test_zero_variance_returns_zero_omega(self) -> None:
+        # Constant series → σ=0 → ω=0. Caller-detectable, no NaN
+        # leakage. The downstream Kuramoto solver receives explicit
+        # zero (a degenerate but well-defined oscillator) instead of
+        # an undefined value.
+        omega = omega_from_volatility(np.full((10, 3), 0.123, dtype=np.float64))
+        assert np.all(omega == 0.0)
+        assert np.all(np.isfinite(omega))
+
+
+class TestSakaguchiAlphaZero:
+    def test_shape_and_values(self) -> None:
+        a = sakaguchi_alpha_zero(5)
+        assert a.shape == (5, 5)
+        assert np.all(a == 0.0)
+
+    def test_invalid_n_rejected(self) -> None:
+        with pytest.raises(ValueError):
+            sakaguchi_alpha_zero(0)
diff --git a/tests/research/systemic_risk/test_errors.py b/tests/research/systemic_risk/test_errors.py
new file mode 100644
index 00000000..0883f77b
--- /dev/null
+++ b/tests/research/systemic_risk/test_errors.py
@@ -0,0 +1,97 @@
+# Copyright (c) 2023-2026 Yaroslav Vasylenko (neuron7xLab)
+# SPDX-License-Identifier: MIT
+"""Structured-exception contract tests (§ 5 Entry-Point Gate)."""
+
+from __future__ import annotations
+
+import numpy as np
+import pytest
+
+from research.systemic_risk.errors import (
+    InvalidExposureMatrixError,
+    InvalidNodeLabelsError,
+    SystemicRiskInputError,
+)
+from research.systemic_risk.topology import from_exposure_matrix
+
+
+class TestExceptionHierarchy:
+    def test_root_inherits_value_error(self) -> None:
+        # Backward-compat: every existing `except ValueError` site
+        # must still catch the new typed errors.
+        assert issubclass(SystemicRiskInputError, ValueError)
+        assert issubclass(InvalidExposureMatrixError, SystemicRiskInputError)
+        assert issubclass(InvalidNodeLabelsError, SystemicRiskInputError)
+
+    def test_invalid_shape_raises_typed(self) -> None:
+        with pytest.raises(InvalidExposureMatrixError, match="square 2-D"):
+            from_exposure_matrix(np.zeros((3, 4), dtype=np.float64), ("a", "b", "c"))
+
+    def test_label_length_mismatch_raises_typed(self) -> None:
+        with pytest.raises(InvalidNodeLabelsError, match="!="):
+            from_exposure_matrix(np.zeros((3, 3), dtype=np.float64), ("a", "b"))
+
+    def test_duplicate_labels_raises_typed(self) -> None:
+        with pytest.raises(InvalidNodeLabelsError, match="unique"):
+            from_exposure_matrix(np.zeros((3, 3), dtype=np.float64), ("a", "a", "c"))
+
+    def test_empty_label_raises_typed(self) -> None:
+        with pytest.raises(InvalidNodeLabelsError, match="empty"):
+            from_exposure_matrix(np.zeros((3, 3), dtype=np.float64), ("a", "", "c"))
+
+    def test_whitespace_only_label_raises_typed(self) -> None:
+        with pytest.raises(InvalidNodeLabelsError, match="empty or whitespace"):
+            from_exposure_matrix(np.zeros((3, 3), dtype=np.float64), ("a", "  ", "c"))
+
+    def test_none_label_raises_typed(self) -> None:
+        # node_labels is typed `tuple[str, ...]` but runtime callers
+        # may pass through dynamically-built tuples; defend at runtime.
+        with pytest.raises(InvalidNodeLabelsError, match="None"):
+            from_exposure_matrix(
+                np.zeros((3, 3), dtype=np.float64),
+                ("a", None, "c"),  # type: ignore[arg-type]
+            )
+
+    def test_nan_exposure_raises_typed(self) -> None:
+        e = np.array([[0.0, np.nan], [0.0, 0.0]], dtype=np.float64)
+        with pytest.raises(InvalidExposureMatrixError, match="finite"):
+            from_exposure_matrix(e, ("a", "b"))
+
+    def test_negative_exposure_raises_typed(self) -> None:
+        e = np.array([[0.0, -1.0], [-1.0, 0.0]], dtype=np.float64)
+        with pytest.raises(InvalidExposureMatrixError, match="non-negative"):
+            from_exposure_matrix(e, ("a", "b"))
+
+    def test_negative_threshold_raises_typed(self) -> None:
+        e = np.zeros((2, 2), dtype=np.float64)
+        with pytest.raises(InvalidExposureMatrixError, match="threshold"):
+            from_exposure_matrix(e, ("a", "b"), threshold=-0.1)
+
+    def test_typed_error_still_catchable_as_value_error(self) -> None:
+        # New code should pattern-match on the typed class, but old
+        # code must still work via the parent ``ValueError`` catch.
+        e = np.zeros((2, 2), dtype=np.float64)
+        try:
+            from_exposure_matrix(e, ("a", "a"))
+        except ValueError as exc:
+            assert isinstance(exc, InvalidNodeLabelsError)
+        else:
+            raise AssertionError("expected InvalidNodeLabelsError")
+
+
+class TestThresholdContract:
+    def test_threshold_is_strict_cutoff(self) -> None:
+        # Per the (corrected) docstring: threshold is a STRICT lower
+        # cutoff. An entry equal to threshold is NOT an edge.
+        e = np.array([[0.0, 0.5], [0.5, 0.0]], dtype=np.float64)
+        topo = from_exposure_matrix(e, ("a", "b"), threshold=0.5)
+        assert topo.adjacency[0, 1] == 0, (
+            "INV-THRESHOLD-STRICT VIOLATED: entry equal to "
+            "threshold=0.5 became an edge; topology threshold "
+            "is documented as STRICT (>)"
+        )
+
+    def test_threshold_strict_above(self) -> None:
+        e = np.array([[0.0, 0.51], [0.51, 0.0]], dtype=np.float64)
+        topo = from_exposure_matrix(e, ("a", "b"), threshold=0.5)
+        assert topo.adjacency[0, 1] == 1
diff --git a/tests/research/systemic_risk/test_falsification.py b/tests/research/systemic_risk/test_falsification.py
index 2bde380c..f71803ce 100644
--- a/tests/research/systemic_risk/test_falsification.py
+++ b/tests/research/systemic_risk/test_falsification.py
@@ -1,17 +1,16 @@
 # Copyright (c) 2023-2026 Yaroslav Vasylenko (neuron7xLab)
 # SPDX-License-Identifier: MIT
-"""Tests for :mod:`research.systemic_risk.falsification`.
+"""Tests for :mod:`research.systemic_risk.falsification` (v2).
 
 Coverage:
 * :func:`auc_mann_whitney` algebraic identities (perfect / inverted /
-  uniform).
-* :func:`benjamini_hochberg` monotonicity + clipping under standard
-  edge cases (Benjamini & Hochberg 1995).
+  uniform / random).
+* :func:`auc_bootstrap_ci` CI bracket sanity + degeneracy.
+* :func:`bonferroni_correction` clipping + order preservation.
 * End-to-end ``run_falsification`` null-AUC sanity:
-  on i.i.d. random scores the per-crisis AUC distribution should be
-  centred near 0.5 and the BH-corrected verdict should not be
-  ``HARD_PASS``. This is the test that *catches* implementation bugs
-  that systematically inflate AUC.
+  on i.i.d. random scores the per-crisis AUC must not produce
+  ``HARD_PASS``; on injected pre-event signal it must produce
+  ``HARD_PASS`` with both CI bounds clearing the v2 thresholds.
 """
 
 from __future__ import annotations
@@ -27,8 +26,9 @@
 )
 from research.systemic_risk.falsification import (
     FalsificationConfig,
+    auc_bootstrap_ci,
     auc_mann_whitney,
-    benjamini_hochberg,
+    bonferroni_correction,
     run_falsification,
 )
 
@@ -54,7 +54,6 @@ def test_empty_returns_half_by_convention(self) -> None:
         assert auc_mann_whitney(np.array([1.0]), np.array([])) == 0.5
 
     def test_random_iid_centred_at_half(self) -> None:
-        # Statistical: under H0 (same distribution) E[AUC] = 0.5.
         rng = np.random.default_rng(123)
         aucs = []
         for _ in range(100):
@@ -67,36 +66,101 @@ def test_random_iid_centred_at_half(self) -> None:
         )
 
 
-class TestBenjaminiHochberg:
+class TestAucBootstrapCi:
+    def test_ci_brackets_point_estimate(self) -> None:
+        rng = np.random.default_rng(7)
+        pos = rng.normal(0.5, 1.0, size=80)
+        neg = rng.normal(0.0, 1.0, size=80)
+        point, ci_low, ci_high = auc_bootstrap_ci(pos, neg, n_bootstrap=2000)
+        assert ci_low <= point <= ci_high, (
+            f"INV-CI-BRACKET VIOLATED: point={point:.4f} outside "
+            f"[{ci_low:.4f}, {ci_high:.4f}] at n_bootstrap=2000, seed=7"
+        )
+
+    def test_ci_under_h0_contains_half(self) -> None:
+        # Under H0 (positives and negatives drawn from the same
+        # distribution) the indicator I_b = [0.5 ∈ CI_b] is Bernoulli
+        # with success probability equal to the actual coverage of
+        # the percentile bootstrap. A correctly-calibrated 95% CI has
+        # coverage 0.95 in the limit, so the count K = Σ_b I_b over
+        # ``N_REPS`` independent reps is Binomial(N_REPS, 0.95).
+        #
+        # The acceptance threshold is the lower quantile of that
+        # binomial under a chosen test-reliability level
+        # ``alpha_test`` — the target rate at which a *correctly
+        # implemented* bootstrap is allowed to fail this assertion by
+        # sampling noise. Setting ``alpha_test = 1e-3`` keeps spurious
+        # failures below 1 in 1000 CI runs, which is the "frontier-
+        # lab" reliability level expected by feedback_dev_cycle.
+        from scipy.stats import binom
+
+        n_reps = 100
+        nominal_coverage = 0.95
+        alpha_test = 1e-3
+        # binom.ppf is the quantile (smallest k with CDF(k) >= q),
+        # which is the inclusive lower bound of the acceptance set.
+        threshold = int(binom.ppf(alpha_test, n_reps, nominal_coverage))
+
+        rng = np.random.default_rng(11)
+        contains = 0
+        for _ in range(n_reps):
+            pos = rng.standard_normal(40)
+            neg = rng.standard_normal(40)
+            _, lo, hi = auc_bootstrap_ci(
+                pos, neg, n_bootstrap=500, seed=int(rng.integers(0, 10**6))
+            )
+            if lo <= 0.5 <= hi:
+                contains += 1
+        assert contains >= threshold, (
+            f"INV-CI-COVERAGE VIOLATED: 95%-nominal bootstrap CI under "
+            f"H0 contained 0.5 in {contains}/{n_reps} reps; "
+            f"binomial-derived lower bound at α_test={alpha_test} is "
+            f"{threshold}. Under-coverage at this magnitude indicates "
+            f"a calibration bug in auc_bootstrap_ci, not sampling noise."
+        )
+
+    def test_degenerate_inputs_collapse(self) -> None:
+        # Single observation per arm → CI collapses to point estimate.
+        pos = np.array([2.0])
+        neg = np.array([1.0])
+        point, lo, hi = auc_bootstrap_ci(pos, neg, n_bootstrap=100)
+        assert lo == hi == point
+
+    def test_invalid_confidence_rejected(self) -> None:
+        with pytest.raises(ValueError, match="confidence"):
+            auc_bootstrap_ci(np.array([1.0, 2.0]), np.array([0.0, 0.5]), confidence=0.0)
+
+    def test_invalid_n_bootstrap_rejected(self) -> None:
+        with pytest.raises(ValueError, match="n_bootstrap"):
+            auc_bootstrap_ci(np.array([1.0]), np.array([0.0]), n_bootstrap=0)
+
+
+class TestBonferroni:
     def test_all_zero_input(self) -> None:
-        out = benjamini_hochberg(np.zeros(5))
+        out = bonferroni_correction(np.zeros(5))
         assert np.all(out == 0.0)
 
     def test_all_one_input(self) -> None:
-        out = benjamini_hochberg(np.ones(5))
+        out = bonferroni_correction(np.ones(5))
+        # 5*1 clipped to 1.
         assert np.all(out == 1.0)
 
-    def test_classic_example(self) -> None:
-        # B-H (1995) Table 1 mini-case: 4 p-values [0.005, 0.01, 0.04, 0.5].
-        # Adjusted: 4/1*0.005=0.02, 4/2*0.01=0.02, 4/3*0.04≈0.0533, 4/4*0.5=0.5.
-        # After enforcing monotonicity from the largest, expected:
-        # [0.02, 0.02, 0.0533, 0.5].
+    def test_simple_case(self) -> None:
         p = np.array([0.005, 0.01, 0.04, 0.5])
-        out = benjamini_hochberg(p)
-        np.testing.assert_allclose(out, [0.02, 0.02, 0.05333333, 0.5], atol=1e-7)
+        out = bonferroni_correction(p)
+        np.testing.assert_allclose(out, [0.02, 0.04, 0.16, 1.0], atol=1e-12)
 
     def test_order_preserved(self) -> None:
-        # Output order matches input order, even with shuffled input.
         p = np.array([0.5, 0.005, 0.04, 0.01])
-        out = benjamini_hochberg(p)
-        # The smallest input is at index 1; its adjusted value should be 0.02.
+        out = bonferroni_correction(p)
+        # min input at index 1 → 4 * 0.005 = 0.02.
         assert out[1] == pytest.approx(0.02)
 
     def test_invalid_p_rejected(self) -> None:
         with pytest.raises(ValueError):
-            benjamini_hochberg(np.array([-0.1, 0.5]))
+            bonferroni_correction(np.array([-0.1, 0.5]))
         with pytest.raises(ValueError):
-            benjamini_hochberg(np.array([0.5, 1.5]))
+            bonferroni_correction(np.array([0.5, 1.5]))
 
 
 class TestRunFalsificationSanity:
@@ -104,8 +168,6 @@ def _build_synthetic_ledger_and_score(
         self,
         seed: int,
     ) -> tuple[BankingCrisisLedger, tuple[date, ...], np.ndarray]:
-        # 5 crises spread across an 8-year synthetic series; pure noise score.
-        # No physics → expected verdict ≠ HARD_PASS.
         start = date(2010, 1, 1)
         n_days = 365 * 8
         dates = tuple(start + timedelta(days=i) for i in range(n_days))
@@ -144,15 +206,41 @@ def test_random_scores_do_not_pass(self) -> None:
             null_window_count=10,
             min_distance_from_event_days=180,
             n_permutations=200,
+            n_bootstrap=500,
             seed=7,
         )
         report = run_falsification(score, dates, ledger, config=cfg, country_filter="ABC")
-        # Random noise must not produce HARD_PASS — that would mean a leak.
         assert report.verdict != "HARD_PASS"
-        # Either an outcome is below the fail threshold (HARD_FAIL) or none
-        # of the AUCs are convincingly above the pass threshold (UNDECIDED).
         assert report.verdict in {"HARD_FAIL", "UNDECIDED"}
 
+    def test_injected_signal_passes(self) -> None:
+        ledger, dates, score = self._build_synthetic_ledger_and_score(seed=42)
+        # Inject +3σ elevation in the 60-day pre-event window of every crisis.
+        for ev in ledger.events:
+            delta = (ev.start - dates[0]).days
+            if delta - 60 < 0:
+                continue
+            score[delta - 60 : delta] += 3.0
+        cfg = FalsificationConfig(
+            pre_event_window_days=60,
+            null_window_count=15,
+            min_distance_from_event_days=180,
+            n_permutations=2000,
+            n_bootstrap=2000,
+            seed=11,
+        )
+        report = run_falsification(score, dates, ledger, config=cfg, country_filter="ABC")
+        assert report.verdict == "HARD_PASS", (
+            f"INJECTED-SIGNAL VIOLATED: verdict={report.verdict}, "
+            f"expected HARD_PASS at +3σ injection across 3 crises. "
+            f"outcomes: {[(o.label, round(o.auc, 3), round(o.auc_ci_low, 3)) for o in report.outcomes]}"
+        )
+        for o in report.outcomes:
+            assert o.auc_ci_low >= 0.70, (
+                f"PASS-THRESHOLD VIOLATED: {o.label} auc_ci_low={o.auc_ci_low:.4f} "
+                f"< 0.70 at +3σ injection, n_bootstrap=2000, seed=11"
+            )
+
     def test_score_length_mismatch_rejected(self) -> None:
         ledger, dates, _ = self._build_synthetic_ledger_and_score(seed=0)
         with pytest.raises(ValueError, match="score length"):
diff --git a/tests/research/systemic_risk/test_network_fitting.py b/tests/research/systemic_risk/test_network_fitting.py
new file mode 100644
index 00000000..5bd57672
--- /dev/null
+++ b/tests/research/systemic_risk/test_network_fitting.py
@@ -0,0 +1,204 @@
+# Copyright (c) 2023-2026 Yaroslav Vasylenko (neuron7xLab)
+# SPDX-License-Identifier: MIT
+"""Tests for :mod:`research.systemic_risk.network_fitting`."""
+
+from __future__ import annotations
+
+import numpy as np
+import pytest
+
+from research.systemic_risk.network_fitting import (
+    compare_power_law_vs_exponential,
+    fit_barabasi_albert,
+    fit_barabasi_albert_from_topology,
+    fit_exponential,
+    fit_power_law,
+)
+from research.systemic_risk.topology import barabasi_albert_null
+
+
+def _draw_power_law(n: int, alpha: float, k_min: int, seed: int) -> np.ndarray:
+    rng = np.random.default_rng(seed)
+    u = rng.random(n)
+    raw = (k_min - 0.5) * (1.0 - u) ** (1.0 / (1.0 - alpha)) + 0.5
+    return np.maximum(np.rint(raw).astype(np.int64), k_min)
+
+
+class TestFitPowerLaw:
+    def test_recovers_alpha_on_synthetic(self) -> None:
+        # Statistical: ensemble of 30 fits on synthetic α=2.5 samples.
+        # The continuous-approximation MLE has known small-sample bias
+        # of order 1/n for discrete data (Clauset 2009 §B). At n=2000,
+        # k_min=6 the bias is ≤ 0.20 in expectation — used here as the
+        # tolerance bound. Standard error of the ensemble mean is
+        # σ_α/√30 ≈ 0.05.
+        true_alpha = 2.5
+        estimates = []
+        for seed in range(30):
+            sample = _draw_power_law(2000, true_alpha, 6, seed)
+            estimates.append(fit_power_law(sample, k_min=6).alpha)
+        mean_alpha = float(np.mean(estimates))
+        assert abs(mean_alpha - true_alpha) < 0.20, (
+            f"MLE-BIAS VIOLATED: mean(α̂)={mean_alpha:.4f} vs α={true_alpha} "
+            f"over 30 samples of size 2000, k_min=6 (tolerance 0.20)"
+        )
+
+    def test_alpha_se_decreases_with_n(self) -> None:
+        small = _draw_power_law(200, 2.5, 6, 0)
+        large = _draw_power_law(2000, 2.5, 6, 0)
+        small_se = fit_power_law(small, k_min=6).alpha_se
+        large_se = fit_power_law(large, k_min=6).alpha_se
+        assert large_se < small_se, (
+            f"SE-MONOTONE VIOLATED: SE(n=2000)={large_se:.4f} >= "
+            f"SE(n=200)={small_se:.4f}; expected SE ∝ 1/√n at α=2.5"
+        )
+
+    def test_ks_p_value_bracket(self) -> None:
+        sample = _draw_power_law(500, 2.5, 6, 7)
+        fit = fit_power_law(sample, k_min=6, n_bootstrap=200, seed=11)
+        assert fit.ks_p_value is not None
+        assert 0.0 < fit.ks_p_value <= 1.0
+
+    def test_invalid_input_rejected(self) -> None:
+        with pytest.raises(ValueError):
+            fit_power_law(np.array([1, 2], dtype=np.int64))  # n<4
+        with pytest.raises(ValueError):
+            fit_power_law(np.array([-1, 2, 3, 4], dtype=np.int64))
+
+    def test_relative_se_floor_enforced(self) -> None:
+        # Tiny tail → high relative SE — must trigger the Cramér-Rao
+        # floor when min_relative_se is below the floor's empirical
+        # value. Concretely: at α≈2.5, n=4 the SE is 1.5/√4=0.75 and
+        # σ_α/α≈0.30; tol=0.10 must reject.
+        sample = np.array([6, 7, 8, 100], dtype=np.int64)
+        with pytest.raises(ValueError, match="Cramér-Rao precision floor"):
+            fit_power_law(sample, k_min=6, min_relative_se=0.10)
+
+
+class TestFitExponential:
+    def test_recovers_lambda(self) -> None:
+        rng = np.random.default_rng(3)
+        true_lambda = 0.4
+        # Discrete shifted exponential: k = k_min + Geom(p=1-exp(-λ)).
+        p = 1.0 - np.exp(-true_lambda)
+        k_min = 1
+        sample = (k_min + rng.geometric(p, size=2000) - 1).astype(np.int64)
+        fit = fit_exponential(sample, k_min=k_min)
+        assert abs(fit.lambda_ - true_lambda) < 0.1, (
+            f"EXP-BIAS VIOLATED: λ̂={fit.lambda_:.4f} vs λ={true_lambda} "
+            f"on synthetic n=2000, k_min={k_min}"
+        )
+
+
+class TestCompare:
+    def test_power_law_preferred_on_power_law_sample(self) -> None:
+        sample = _draw_power_law(1500, 2.4, 4, 0)
+        cmp = compare_power_law_vs_exponential(sample, k_min=4)
+        assert cmp.preferred == "power_law"
+        assert cmp.aic_power_law < cmp.aic_exponential
+        assert cmp.aic_delta > 0
+
+    def test_exponential_preferred_on_exponential_sample(self) -> None:
+        rng = np.random.default_rng(5)
+        sample = (1 + rng.geometric(0.3, size=1500) - 1).astype(np.int64)
+        cmp = compare_power_law_vs_exponential(sample, k_min=1)
+        assert cmp.preferred == "exponential"
+
+
+class TestFitBarabasiAlbert:
+    def test_returns_positive_m(self) -> None:
+        sample = _draw_power_law(1000, 2.5, 4, 0)
+        m, fit = fit_barabasi_albert(sample)
+        assert m >= 1
+        assert 1.5 < fit.alpha < 4.5
+
+    def test_seed_determinism(self) -> None:
+        # Same input → same fit (no hidden randomness when n_bootstrap=0).
+        sample = _draw_power_law(500, 2.5, 4, 0)
+        a, fit_a = fit_barabasi_albert(sample)
+        b, fit_b = fit_barabasi_albert(sample)
+        assert a == b
+        assert fit_a.alpha == fit_b.alpha
+
+    def test_degenerate_constant_input_rejected(self) -> None:
+        # All nodes share the same degree → no power-law tail, no
+        # MLE solution. Fail-closed instead of returning a meaningless
+        # m≈k/2.
+        constant = np.full(20, 5, dtype=np.int64)
+        with pytest.raises(ValueError, match="degenerate input"):
+            fit_barabasi_albert(constant)
+
+    def test_low_mean_degree_rejected(self) -> None:
+        # <k> < 2 is incompatible with BA(m≥1) by Albert-Barabási
+        # 2002 eq. 4.7. Must fail-closed.
+        sparse = np.array([0, 0, 0, 1, 1, 1, 0, 0], dtype=np.int64)
+        with pytest.raises(ValueError, match="BA-incompatible"):
+            fit_barabasi_albert(sparse)
+
+    def test_min_relative_se_propagates(self) -> None:
+        # The validation-mode precision floor must reach the
+        # underlying fit_power_law via _from_topology too.
+        from research.systemic_risk.topology import barabasi_albert_null
+
+        # n=20 BA(m=2) — n_tail too small for tight precision floor.
+        topo = barabasi_albert_null(n_nodes=20, m=2, seed=0)
+        with pytest.raises(ValueError, match="Cramér-Rao precision floor"):
+            fit_barabasi_albert_from_topology(topo, min_relative_se=0.05)
+
+
+class TestFitPowerLawValidation:
+    def test_rejects_small_n(self) -> None:
+        # n < MIN_TAIL_SIZE_VALIDATION must fail-closed.
+        from research.systemic_risk.network_fitting import (
+            MIN_TAIL_SIZE_VALIDATION,
+            fit_power_law_validation,
+        )
+
+        small = _draw_power_law(MIN_TAIL_SIZE_VALIDATION - 1, 2.5, 4, 0)
+        with pytest.raises(ValueError, match="validation-mode"):
+            fit_power_law_validation(small)
+
+    def test_passes_on_sufficient_sample(self) -> None:
+        # Large enough sample at α=2.5 with k_min=6 clears both the
+        # n=50 floor and the 10 % relative-SE precision bound.
+        from research.systemic_risk.network_fitting import fit_power_law_validation
+
+        sample = _draw_power_law(2000, 2.5, 6, 7)
+        fit = fit_power_law_validation(sample, k_min=6, n_bootstrap=200, seed=11)
+        assert fit.n_tail >= 50
+        assert fit.alpha_se / fit.alpha <= 0.10
+
+
+class TestFitBarabasiAlbertFromTopology:
+    """Regression: catch the v2 in+out double-count drift on `topology.degree`.
+
+    Reported by the Codex code-reviewer on PR #562: feeding
+    ``topology.degree`` (= in + out) directly into
+    :func:`fit_barabasi_albert` doubles the recovered ``m`` on
+    symmetric BA-null graphs because each undirected edge is counted
+    twice. :func:`fit_barabasi_albert_from_topology` resolves this by
+    using ``out_degree`` consistently.
+    """
+
+    @pytest.mark.parametrize("true_m", [2, 3, 4])
+    def test_recovers_generator_m_on_ba_null(self, true_m: int) -> None:
+        topo = barabasi_albert_null(n_nodes=400, m=true_m, seed=true_m * 7)
+        m_hat, _ = fit_barabasi_albert_from_topology(topo)
+        assert abs(m_hat - true_m) <= 1, (
+            f"BA-CALIBRATION VIOLATED: m̂={m_hat} from "
+            f"fit_barabasi_albert_from_topology vs true m={true_m} on "
+            f"barabasi_albert_null(n=400). Tolerance ±1 (finite-N)."
+        )
+
+    def test_total_degree_double_count_is_caught(self) -> None:
+        # Demonstrates the original bug: feeding topology.degree (sum of
+        # in+out) doubles the recovered m on symmetric graphs. The
+        # _from_topology helper avoids this by using out_degree.
+        topo = barabasi_albert_null(n_nodes=400, m=3, seed=11)
+        m_via_total, _ = fit_barabasi_albert(topo.degree)
+        m_via_topology, _ = fit_barabasi_albert_from_topology(topo)
+        assert m_via_total >= 2 * m_via_topology - 1, (
+            f"Expected m_via_total ≈ 2·m_via_topology on a symmetric BA "
+            f"graph (in+out doubles), got m_via_total={m_via_total}, "
+            f"m_via_topology={m_via_topology} at N=400, true_m=3, seed=11"
+        )
diff --git a/tests/research/systemic_risk/test_null_models.py b/tests/research/systemic_risk/test_null_models.py
new file mode 100644
index 00000000..a92a2521
--- /dev/null
+++ b/tests/research/systemic_risk/test_null_models.py
@@ -0,0 +1,223 @@
+# Copyright (c) 2023-2026 Yaroslav Vasylenko (neuron7xLab)
+# SPDX-License-Identifier: MIT
+"""Tests for the six required null-baseline generators (§ 8 of the
+official validation protocol).
+
+Each baseline must:
+* preserve a documented invariant of the empirical input;
+* be deterministic under a fixed seed;
+* leave the *to-be-tested* property destroyed.
+"""
+
+from __future__ import annotations
+
+from datetime import date
+
+import numpy as np
+import pytest
+
+from research.systemic_risk.event_ledger import (
+    BankingCrisisEvent,
+    BankingCrisisLedger,
+)
+from research.systemic_risk.null_models import (
+    degree_preserving_randomization,
+    linear_correlation_surrogate,
+    permuted_crisis_dates,
+    random_exposure_weights,
+    shuffled_time_labels,
+    static_topology_baseline,
+)
+from research.systemic_risk.topology import (
+    InterbankTopology,
+    barabasi_albert_null,
+    from_exposure_matrix,
+)
+
+
+def _empirical_topo(seed: int) -> InterbankTopology:
+    rng = np.random.default_rng(seed)
+    n = 30
+    e = rng.exponential(1.0, size=(n, n)).astype(np.float64)
+    e *= rng.random((n, n)) > 0.5
+    np.fill_diagonal(e, 0.0)
+    return from_exposure_matrix(e, tuple(f"b{i}" for i in range(n)))
+
+
+class TestDegreePreservingRandomization:
+    def test_preserves_in_and_out_degree(self) -> None:
+        topo = _empirical_topo(seed=0)
+        out = degree_preserving_randomization(topo, seed=42)
+        assert out.topology is not None
+        np.testing.assert_array_equal(out.topology.in_degree, topo.in_degree)
+        np.testing.assert_array_equal(out.topology.out_degree, topo.out_degree)
+
+    def test_seed_determinism(self) -> None:
+        topo = _empirical_topo(seed=0)
+        a = degree_preserving_randomization(topo, seed=11)
+        b = degree_preserving_randomization(topo, seed=11)
+        assert a.topology is not None and b.topology is not None
+        np.testing.assert_array_equal(a.topology.adjacency, b.topology.adjacency)
+
+    def test_destroys_specific_edges(self) -> None:
+        # With enough swaps the rewired graph differs from the input
+        # while preserving the marginals.
+        topo = _empirical_topo(seed=0)
+        out = degree_preserving_randomization(topo, seed=7, n_swaps=200)
+        assert out.topology is not None
+        diff = float((out.topology.adjacency != topo.adjacency).mean())
+        assert diff > 0.05, (
+            f"degree-preserving rewire too conservative: "
+            f"{diff:.3f} of entries differ; expected > 0.05 at n_swaps=200"
+        )
+
+
+class TestShuffledTimeLabels:
+    def test_preserves_marginal_distribution(self) -> None:
+        rng = np.random.default_rng(0)
+        score = rng.standard_normal(500)
+        out = shuffled_time_labels(score, seed=1)
+        assert out.score is not None
+        # Marginal moments preserved (it's a permutation).
+        np.testing.assert_allclose(out.score.mean(), score.mean(), atol=1e-12)
+        np.testing.assert_allclose(out.score.std(), score.std(), atol=1e-12)
+
+    def test_destroys_temporal_ordering(self) -> None:
+        # A strongly autocorrelated series loses its lag-1 autocorr.
+        rng = np.random.default_rng(0)
+        n = 1000
+        eps = rng.standard_normal(n)
+        ar = np.zeros(n, dtype=np.float64)
+        for t in range(1, n):
+            ar[t] = 0.95 * ar[t - 1] + eps[t]
+        out = shuffled_time_labels(ar, seed=11)
+        assert out.score is not None
+        rho_before = float(np.corrcoef(ar[:-1], ar[1:])[0, 1])
+        rho_after = float(np.corrcoef(out.score[:-1], out.score[1:])[0, 1])
+        assert abs(rho_after) < abs(rho_before) - 0.5, (
+            f"shuffle did not destroy lag-1 autocorr: "
+            f"|ρ| {abs(rho_before):.3f} → {abs(rho_after):.3f} on AR(0.95) n=1000"
+        )
+
+    def test_rejects_non_1d(self) -> None:
+        with pytest.raises(ValueError, match="1-D"):
+            shuffled_time_labels(np.zeros((10, 3)), seed=0)
+
+
+class TestRandomExposureWeights:
+    def test_preserves_binary_support(self) -> None:
+        topo = _empirical_topo(seed=0)
+        out = random_exposure_weights(topo, seed=3)
+        assert out.topology is not None
+        np.testing.assert_array_equal(out.topology.adjacency, topo.adjacency)
+
+    def test_no_weights_yields_zero_weights(self) -> None:
+        topo = barabasi_albert_null(n_nodes=20, m=2, seed=0)
+        out = random_exposure_weights(topo, seed=0)
+        assert out.topology is not None
+        # BA null has no empirical weights → surrogate has weights=None.
+        assert out.topology.weights is None
+
+    def test_seed_determinism(self) -> None:
+        topo = _empirical_topo(seed=0)
+        a = random_exposure_weights(topo, seed=99)
+        b = random_exposure_weights(topo, seed=99)
+        assert a.topology is not None and b.topology is not None
+        if a.topology.weights is not None:
+            assert b.topology.weights is not None
+            np.testing.assert_array_equal(a.topology.weights, b.topology.weights)
+
+
+class TestStaticTopologyBaseline:
+    def test_union_preserves_every_edge(self) -> None:
+        snapshots = tuple(_empirical_topo(seed=s) for s in (0, 1, 2))
+        out = static_topology_baseline(snapshots, seed=0)
+        assert out.topology is not None
+        # Every edge that ever existed survives.
+        for snap in snapshots:
+            assert np.all(out.topology.adjacency[snap.adjacency == 1] == 1)
+
+    def test_rejects_empty(self) -> None:
+        with pytest.raises(ValueError, match="non-empty"):
+            static_topology_baseline(tuple(), seed=0)
+
+    def test_rejects_size_mismatch(self) -> None:
+        a = _empirical_topo(seed=0)
+        b = barabasi_albert_null(n_nodes=10, m=2, seed=0)  # different N
+        with pytest.raises(ValueError, match="node count"):
+            static_topology_baseline((a, b), seed=0)
+
+
+class TestLinearCorrelationSurrogate:
+    def test_in_unit_interval(self) -> None:
+        rng = np.random.default_rng(0)
+        s = rng.standard_normal((200, 8))
+        out = linear_correlation_surrogate(s, seed=0)
+        assert out.score is not None
+        finite = out.score[np.isfinite(out.score)]
+        assert finite.size > 0
+        # Mean off-diagonal Pearson is bounded by ±1.
+        assert np.all(finite >= -1.0 - 1e-9) and np.all(finite <= 1.0 + 1e-9)
+
+    def test_short_input_rejected(self) -> None:
+        with pytest.raises(ValueError, match="2 time samples"):
+            linear_correlation_surrogate(np.zeros((1, 4)), seed=0)
+
+
+class TestPermutedCrisisDates:
+    def test_preserves_event_count_and_durations(self) -> None:
+        ledger = BankingCrisisLedger(
+            events=(
+                BankingCrisisEvent(
+                    country="USA",
+                    start=date(2008, 9, 15),
+                    end=date(2009, 6, 30),
+                    source="LV2018",
+                    label="GFC_USA",
+                ),
+                BankingCrisisEvent(
+                    country="GRC",
+                    start=date(2010, 5, 1),
+                    end=date(2012, 12, 31),
+                    source="LV2018",
+                    label="EZ_GRC",
+                ),
+            )
+        )
+        out = permuted_crisis_dates(
+            ledger, earliest=date(2005, 1, 1), latest=date(2025, 12, 31), seed=11
+        )
+        assert out.ledger is not None
+        assert len(out.ledger.events) == 2
+        for orig, permuted in zip(ledger.events, out.ledger.events):
+            assert (permuted.end - permuted.start) == (orig.end - orig.start)
+
+    def test_seed_determinism(self) -> None:
+        ledger = BankingCrisisLedger(
+            events=(
+                BankingCrisisEvent(
+                    country="USA",
+                    start=date(2008, 9, 15),
+                    end=date(2009, 6, 30),
+                    source="LV2018",
+                    label="GFC_USA",
+                ),
+            )
+        )
+        a = permuted_crisis_dates(
+            ledger, earliest=date(2005, 1, 1), latest=date(2025, 12, 31), seed=42
+        )
+        b = permuted_crisis_dates(
+            ledger, earliest=date(2005, 1, 1), latest=date(2025, 12, 31), seed=42
+        )
+        assert a.ledger is not None and b.ledger is not None
+        assert a.ledger.events[0].start == b.ledger.events[0].start
+
+    def test_invalid_window_rejected(self) -> None:
+        with pytest.raises(ValueError, match="latest"):
+            permuted_crisis_dates(
+                BankingCrisisLedger(events=tuple()),
+                earliest=date(2010, 1, 1),
+                latest=date(2010, 1, 1),
+                seed=0,
+            )
diff --git a/tests/research/systemic_risk/test_replication.py b/tests/research/systemic_risk/test_replication.py
new file mode 100644
index 00000000..3e31bf35
--- /dev/null
+++ b/tests/research/systemic_risk/test_replication.py
@@ -0,0 +1,58 @@
+# Copyright (c) 2023-2026 Yaroslav Vasylenko (neuron7xLab)
+# SPDX-License-Identifier: MIT
+"""Tests for the replication manifest (§ 13 of the validation protocol)."""
+
+from __future__ import annotations
+
+import json
+
+from research.systemic_risk.replication import build_run_manifest
+
+
+class TestBuildRunManifest:
+    def test_config_hash_is_stable(self) -> None:
+        a = build_run_manifest(seed=42, config={"window": 60, "alpha": 0.01})
+        b = build_run_manifest(seed=42, config={"alpha": 0.01, "window": 60})
+        assert a.config_hash == b.config_hash, (
+            "config_hash must be invariant to dict-key order; "
+            "JSON serialisation uses sort_keys=True"
+        )
+
+    def test_config_hash_changes_with_value(self) -> None:
+        a = build_run_manifest(seed=42, config={"window": 60})
+        b = build_run_manifest(seed=42, config={"window": 90})
+        assert a.config_hash != b.config_hash
+
+    def test_seed_recorded_verbatim(self) -> None:
+        m = build_run_manifest(seed=12345, config={})
+        assert m.seed == 12345
+
+    def test_to_json_round_trip(self) -> None:
+        m = build_run_manifest(
+            seed=7,
+            config={"k": 3, "name": "demo"},
+            extra={"dataset": "synthetic"},
+        )
+        payload = json.loads(m.to_json())
+        assert payload["seed"] == 7
+        assert payload["config"] == {"k": 3, "name": "demo"}
+        assert payload["extra"] == {"dataset": "synthetic"}
+        assert "timestamp_utc" in payload
+        assert "platform_info" in payload
+        assert "package_versions" in payload
+
+    def test_package_versions_contains_numpy(self) -> None:
+        m = build_run_manifest(seed=0, config={})
+        # numpy is a hard dependency of the suite — must be present.
+        assert "numpy" in m.package_versions
+        assert m.package_versions["numpy"] != "not-installed"
+
+    def test_to_json_is_deterministic(self) -> None:
+        # Two manifests built with identical inputs differ only in
+        # timestamp; serialisation order is deterministic so the
+        # bytes diff reduces to that single line.
+        a = build_run_manifest(seed=1, config={"a": 1, "b": 2})
+        b = build_run_manifest(seed=1, config={"a": 1, "b": 2})
+        a_lines = [line for line in a.to_json().splitlines() if "timestamp" not in line]
+        b_lines = [line for line in b.to_json().splitlines() if "timestamp" not in line]
+        assert a_lines == b_lines
diff --git a/tests/research/systemic_risk/test_topology.py b/tests/research/systemic_risk/test_topology.py
index 8bd7e17b..f6f62f01 100644
--- a/tests/research/systemic_risk/test_topology.py
+++ b/tests/research/systemic_risk/test_topology.py
@@ -1,9 +1,11 @@
 # Copyright (c) 2023-2026 Yaroslav Vasylenko (neuron7xLab)
 # SPDX-License-Identifier: MIT
-"""Invariant tests for :mod:`research.systemic_risk.topology`."""
+"""Invariant tests for :mod:`research.systemic_risk.topology` (v2 — directed)."""
 
 from __future__ import annotations
 
+from datetime import date
+
 import numpy as np
 import pytest
 
@@ -15,10 +17,12 @@
 
 
 class TestInterbankTopologyInvariants:
-    def test_inv_top1_asymmetric_adjacency_rejected(self) -> None:
+    def test_inv_top1_directed_adjacency_accepted(self) -> None:
+        # v2: asymmetric adjacency is ALLOWED — represents directed exposure.
         a = np.array([[0, 1, 0], [0, 0, 1], [1, 0, 0]], dtype=np.int8)
-        with pytest.raises(ValueError, match="INV-TOP1"):
-            InterbankTopology(adjacency=a, node_labels=("a", "b", "c"), source_label="t")
+        topo = InterbankTopology(adjacency=a, node_labels=("a", "b", "c"), source_label="t")
+        assert not topo.is_symmetric
+        assert topo.asymmetry_fraction > 0.0
 
     def test_inv_top1_nonbinary_rejected(self) -> None:
         a = np.array([[0, 2], [2, 0]], dtype=np.int8)
@@ -47,16 +51,42 @@ def test_arrays_are_immutable_after_construction(self) -> None:
         with pytest.raises(ValueError):
             topo.adjacency[0, 1] = 0
 
+    def test_in_out_degree(self) -> None:
+        # a→b, b→c, c→a (directed cycle)
+        a = np.array([[0, 1, 0], [0, 0, 1], [1, 0, 0]], dtype=np.int8)
+        topo = InterbankTopology(adjacency=a, node_labels=("a", "b", "c"), source_label="t")
+        assert list(topo.in_degree) == [1, 1, 1]
+        assert list(topo.out_degree) == [1, 1, 1]
+        assert list(topo.degree) == [2, 2, 2]
+
+    def test_snapshot_date_optional(self) -> None:
+        a = np.zeros((2, 2), dtype=np.int8)
+        snap = date(2011, 6, 30)
+        topo = InterbankTopology(
+            adjacency=a, node_labels=("a", "b"), source_label="t", snapshot_date=snap
+        )
+        assert topo.snapshot_date == snap
+
 
 class TestFromExposureMatrix:
-    def test_symmetrises_and_binarises(self) -> None:
+    def test_directed_default_preserves_asymmetry(self) -> None:
+        # Asymmetric exposure: a → b strong, b → a weak.
+        e = np.array([[0.0, 5.0, 0.0], [1.0, 0.0, 0.0], [0.0, 0.0, 0.0]], dtype=np.float64)
+        topo = from_exposure_matrix(e, node_labels=("a", "b", "c"), threshold=2.0)
+        # a → b passes threshold, b → a does NOT (1.0 <= 2.0).
+        assert topo.adjacency[0, 1] == 1, "INV-TOP1d: directed edge a→b should be present"
+        assert topo.adjacency[1, 0] == 0, (
+            "INV-TOP1d: directed edge b→a below threshold should be absent; "
+            "v2 must NOT auto-symmetrise"
+        )
+
+    def test_symmetric_mode_averages(self) -> None:
         e = np.array([[0.0, 1.0, 0.0], [3.0, 0.0, 0.0], [0.0, 0.0, 0.0]], dtype=np.float64)
-        topo = from_exposure_matrix(e, node_labels=("a", "b", "c"))
-        # (1+3)/2 = 2 → adjacency edge a-b; rest zero.
+        topo = from_exposure_matrix(e, node_labels=("a", "b", "c"), directed=False)
+        # (1+3)/2 = 2 → both edges present.
         assert topo.adjacency[0, 1] == 1
         assert topo.adjacency[1, 0] == 1
-        assert topo.adjacency[2, 0] == 0
-        assert topo.adjacency[2, 1] == 0
+        assert topo.is_symmetric
 
     def test_threshold_excludes_small_exposures(self) -> None:
         e = np.array([[0.0, 0.5], [0.5, 0.0]], dtype=np.float64)
@@ -68,6 +98,47 @@ def test_negative_exposure_rejected(self) -> None:
         with pytest.raises(ValueError):
             from_exposure_matrix(e, node_labels=("a", "b"))
 
+    def test_nan_exposure_rejected(self) -> None:
+        e = np.array([[0.0, np.nan], [0.0, 0.0]], dtype=np.float64)
+        with pytest.raises(ValueError, match="finite"):
+            from_exposure_matrix(e, node_labels=("a", "b"))
+
+    def test_snapshot_date_propagates(self) -> None:
+        e = np.array([[0.0, 1.0], [1.0, 0.0]], dtype=np.float64)
+        snap = date(2011, 6, 30)
+        topo = from_exposure_matrix(e, node_labels=("a", "b"), snapshot_date=snap)
+        assert topo.snapshot_date == snap
+
+    def test_single_node_graph_accepted(self) -> None:
+        e = np.zeros((1, 1), dtype=np.float64)
+        topo = from_exposure_matrix(e, ("solo",))
+        assert topo.n_nodes == 1
+        assert topo.adjacency.sum() == 0
+
+    def test_all_zero_matrix_accepted_as_empty_graph(self) -> None:
+        e = np.zeros((5, 5), dtype=np.float64)
+        topo = from_exposure_matrix(e, tuple(f"b{i}" for i in range(5)))
+        assert topo.adjacency.sum() == 0
+        assert np.all(topo.in_degree == 0)
+        assert np.all(topo.out_degree == 0)
+
+    def test_asymmetry_invariant_on_directed_data(self) -> None:
+        # v2 protocol's asymmetry invariant: empirical e-MID, BIS, ECB
+        # interbank exposures are documented at ≥ 60% asymmetry
+        # (Bardoscia et al. 2021 NRP, fig. 2). The test uses a
+        # deterministic upper-triangular construction so the bound
+        # is hit by structure, not by statistical luck.
+        n = 20
+        e = np.zeros((n, n), dtype=np.float64)
+        for i in range(n):
+            for j in range(i + 1, n):
+                e[i, j] = float((i + 1) * (j + 1))
+        topo = from_exposure_matrix(e, node_labels=tuple(f"b{i}" for i in range(n)))
+        assert topo.asymmetry_fraction > 0.5, (
+            f"asymmetry invariant VIOLATED: fraction={topo.asymmetry_fraction:.3f} "
+            f"<= 0.5 on upper-triangular directed input. At N={n} (deterministic)"
+        )
+
 
 class TestBarabasiAlbertNull:
     @pytest.mark.parametrize("m", [2, 3, 4])
@@ -88,18 +159,20 @@ def test_different_seeds_differ(self) -> None:
         b = barabasi_albert_null(n_nodes=50, m=3, seed=2)
         assert not np.array_equal(a.adjacency, b.adjacency)
 
-    def test_mean_degree_close_to_2m(self) -> None:
-        # Statistical: ensemble of 50 BA graphs, mean degree → 2m as N → ∞.
-        # At N=200, m=3 the empirical mean is 2m within ~10% (Albert-Barabási 2002).
+    def test_mean_out_degree_close_to_2m(self) -> None:
+        # Statistical: ensemble of 50 BA graphs, mean OUT-degree → 2m (the
+        # symmetric BA mean degree per Albert-Barabási 2002). The total
+        # `degree` property in v2 sums in+out, so a symmetric graph has
+        # mean(degree) = 2*mean(out_degree) ≈ 4m — guarded separately.
         m = 3
         n = 200
-        means = []
-        for seed in range(50):
-            topo = barabasi_albert_null(n_nodes=n, m=m, seed=seed)
-            means.append(float(topo.degree.mean()))
+        means = [
+            float(barabasi_albert_null(n_nodes=n, m=m, seed=seed).out_degree.mean())
+            for seed in range(50)
+        ]
         ensemble_mean = float(np.mean(means))
         assert abs(ensemble_mean - 2 * m) < 0.5, (
-            f"BA mean-degree drift: ensemble_mean={ensemble_mean:.3f}, "
+            f"BA mean-out-degree drift: ensemble_mean={ensemble_mean:.3f}, "
             f"expected 2m={2 * m} ± 0.5 at N={n}, m={m}, n_seeds=50"
         )