hyperpolymath · hyperpolymath · May 17, 2026 · May 18, 2026 · May 18, 2026 · May 18, 2026
diff --git a/.github/workflows/build-gossamer-gui.yml b/.github/workflows/build-gossamer-gui.yml
@@ -152,7 +152,7 @@ jobs:
       - name: Install just
         uses: taiki-e/install-action@184183c2401be73c3bf42c2e61268aa5855379c1 # v2.78.1
         with:
-          tool: just
+          tool: just@1.34.0
 
       - name: Cache Ephapax build
         id: cache-ephapax

diff --git a/.github/workflows/tests.yml b/.github/workflows/tests.yml
@@ -647,7 +647,9 @@ jobs:
         if: ${{ github.event.inputs.mode != 'regenerate-baseline' }}
         run: |
           set -euo pipefail
-          python3 scripts/check-bench-regression.py \
+          cargo run --quiet --release \
+              --manifest-path scripts/bench-tools/Cargo.toml \
+              --bin check-bench-regression -- \
               bench-output.txt \
               .machine_readable/benchmarks/baselines.json \
               | tee -a "$GITHUB_STEP_SUMMARY"
@@ -656,7 +658,9 @@ jobs:
         if: ${{ github.event.inputs.mode == 'regenerate-baseline' }}
         run: |
           set -euo pipefail
-          python3 scripts/update-bench-baselines.py \
+          cargo run --quiet --release \
+              --manifest-path scripts/bench-tools/Cargo.toml \
+              --bin update-bench-baselines -- \
               bench-output.txt \
               .machine_readable/benchmarks/baselines.json
           echo "## Regenerated baseline" >> "$GITHUB_STEP_SUMMARY"

diff --git a/.hypatia-baseline.json b/.hypatia-baseline.json
@@ -1,18 +1,4 @@
 [
-  {
-    "severity": "critical",
-    "rule_module": "cicd_rules",
-    "type": "banned_language_file",
-    "file": "scripts/check-bench-regression.py",
-    "action": "flag"
-  },
-  {
-    "severity": "critical",
-    "rule_module": "cicd_rules",
-    "type": "banned_language_file",
-    "file": "scripts/update-bench-baselines.py",
-    "action": "flag"
-  },
   {
     "severity": "critical",
     "rule_module": "code_safety",

diff --git a/.hypatia-exemptions.md b/.hypatia-exemptions.md
@@ -19,8 +19,6 @@ already placed at each file's site.
 
 | File | Rule | Inline marker | Rationale | Revisit when |
 |---|---|---|---|---|
-| `scripts/update-bench-baselines.py` | `cicd_rules/banned_language_file` | `# hypatia:ignore cicd_rules/banned_language_file` (line 3) | Parses criterion's bencher-format output; criterion's tooling assumes Python downstream. | A maintained Rust/shell parser exists for criterion bencher format. |
-| `scripts/check-bench-regression.py` | `cicd_rules/banned_language_file` | `# hypatia:ignore cicd_rules/banned_language_file` (line 3) | Pair of the above. | Same. |
 | `src/abi/RuleEngine.idr` | `code_safety/believe_me`, `structural_drift/SD008` | `-- hypatia:ignore code_safety/believe_me structural_drift/SD008` (line 19) | The scanner is counting the literal token `believe_me` inside an Idris2 comment that asserts there are *no* such primitives. There is no actual `believe_me` call site in the module. | The scanner learns to skip comment lines (token vs syntactic match). |
 
 ## Audit-training and remediation-script corpora

diff --git a/.hypatia-ignore b/.hypatia-ignore
@@ -23,13 +23,5 @@
 #
 # This file is for exemptions that span a whole file or directory.
 
-# ─── Python bench helpers ───────────────────────────────────────────────
-#
-# Scoped exemption — RSR org policy bans Python except SaltStack. These two
-# scripts are bench-data helpers used only by .github/workflows/bench.yml;
-# they parse criterion output and update baseline JSON. Rust/Julia port is
-# tracked but not blocking. Until the port lands, suppress the
-# banned_language_file finding on these two specific paths so the gate
-# treats them as a known, documented carve-out rather than baseline noise.
-cicd_rules/banned_language_file:scripts/check-bench-regression.py
-cicd_rules/banned_language_file:scripts/update-bench-baselines.py
+# (The former Python bench-helper carve-out was removed once the helpers
+#  were ported to the zero-dependency Rust crate scripts/bench-tools/.)
@@ -84,7 +84,8 @@ cargo bench --bench hypatia_bench -- \
   | tee /tmp/bench.txt
 
 # Parse the output and update baselines.json:
-python3 scripts/update-bench-baselines.py /tmp/bench.txt \
+cargo run --release --manifest-path scripts/bench-tools/Cargo.toml \
+  --bin update-bench-baselines -- /tmp/bench.txt \
   .machine_readable/benchmarks/baselines.json
 ```
 

diff --git a/CHANGELOG.adoc b/CHANGELOG.adoc
@@ -12,6 +12,26 @@ https://semver.org/[Semantic Versioning].
 
 === Changed
 
+==== Bench tooling: Python → zero-dependency Rust (2026-05-18)
+
+Eliminates the last org-policy Python carve-out. `scripts/check-bench-regression.py`
+and `scripts/update-bench-baselines.py` were ported 1:1 to a standalone,
+zero-dependency Rust crate at `scripts/bench-tools/` (deliberately outside
+the Cargo workspace so it never perturbs the main build / proof gates).
+Behaviour is identical (criterion bencher parsing, Markdown summary +
+`::error::` annotations, exit codes, byte-identical `baselines.json`
+serializer). `tests.yml` now invokes, and `.machine_readable/benchmarks/README.md`
+now documents, `cargo run --manifest-path scripts/bench-tools/Cargo.toml`.
+The now-moot `.hypatia-ignore`, `.hypatia-exemptions.md` and
+`.hypatia-baseline.json` carve-outs were removed so the exemption cannot
+silently become drift.
+
+==== Pin `just@1.34.0` in build-gossamer-gui (2026-05-18)
+
+`taiki-e/install-action` installed `just` unpinned, tripping the
+governance R1 tooling-version-integrity rule. Pinned to the
+estate-canonical `just@1.34.0`.
+
 ==== VQL → VCL + verisimdb → verisim Rename (2026-04-05)
 
 Matches the ecosystem-wide rename landed in Verisim on the same day.

@@ -41,7 +41,14 @@ defmodule Mix.Tasks.Hypatia.Reconcile do
 
         result =
           if opts[:verify] do
-            ScorecardReconciler.verify(owner, repo)
+            # verify/2 returns {:ok, summary} | {:error, reason}; reconcile/3
+            # returns a bare map. Normalise verify to a bare map so the
+            # Jason.encode! below never receives a tuple (it cannot encode
+            # one — `mix hypatia.reconcile --verify` used to crash here).
+            case ScorecardReconciler.verify(owner, repo) do
+              {:ok, summary} -> summary
+              {:error, reason} -> %{repo: "#{owner}/#{repo}", verified: false, error: reason}
+            end
           else
             ScorecardReconciler.reconcile(owner, repo,
               dry_run: !!opts[:dry_run],

diff --git a/scripts/README.adoc b/scripts/README.adoc
@@ -30,3 +30,12 @@ and gitbot-fleet dispatch on the hyperpolymath estate.
 
 Per-pattern fix scripts referenced by dispatch manifests.
 Each script is named after the canonical pattern ID (e.g., `fix-PA009.sh`).
+
+== bench-tools/
+
+Standalone, zero-dependency Rust crate (deliberately outside the Cargo
+workspace) providing the criterion bench-data tooling — `check-bench-regression`
+and `update-bench-baselines`. Replaces the former `scripts/*.py`
+(org policy bans Python outside SaltStack). Invoked by the benchmark
+workflow via `cargo run --manifest-path scripts/bench-tools/Cargo.toml`;
+see `.machine_readable/benchmarks/README.md`.
diff --git a/scripts/bench-tools/.gitignore b/scripts/bench-tools/.gitignore
@@ -0,0 +1,2 @@
+/target
+Cargo.lock
diff --git a/scripts/bench-tools/Cargo.toml b/scripts/bench-tools/Cargo.toml
@@ -0,0 +1,30 @@
+# SPDX-License-Identifier: PMPL-1.0-or-later
+#
+# Standalone bench-data tooling — deliberately NOT a workspace member so it
+# never perturbs the main build / proof gates, and zero-dependency so CI
+# needs no crates.io fetch. Replaces the former scripts/*.py (org policy
+# bans Python outside SaltStack; see standards Explicit-Escape Principle).
+# The empty [workspace] table below makes this crate its own workspace root,
+# so Cargo never attaches it to the repository's main workspace.
+[workspace]
+
+[package]
+name = "bench-tools"
+version = "0.1.0"
+edition = "2021"
+license = "PMPL-1.0-or-later"
+publish = false
+
+[lib]
+path = "src/lib.rs"
+
+[[bin]]
+name = "check-bench-regression"
+path = "src/bin/check-bench-regression.rs"
+
+[[bin]]
+name = "update-bench-baselines"
+path = "src/bin/update-bench-baselines.rs"
+
+[profile.release]
+opt-level = 1
diff --git a/scripts/bench-tools/src/bin/check-bench-regression.rs b/scripts/bench-tools/src/bin/check-bench-regression.rs
@@ -0,0 +1,157 @@
+// SPDX-License-Identifier: PMPL-1.0-or-later
+//
+// check-bench-regression — compare a criterion bencher run against
+// .machine_readable/benchmarks/baselines.json and fail if any benchmark
+// regressed by more than the configured threshold. A faithful Rust port of
+// the former scripts/check-bench-regression.py (org policy bans Python
+// outside SaltStack). Pairs with update-bench-baselines.
+//
+// Usage:
+//     check-bench-regression <bencher-output> <baselines.json>
+//
+// Exit status:  0 = no regression over threshold, no baselines yet, or no bench
+//               lines parsed;  1 = at least one regression;  2 = usage / file error.
+//
+// Markdown summary and `::warning::` annotations -> stdout (for
+// $GITHUB_STEP_SUMMARY); `::error::` annotations -> stderr.
+
+use bench_tools::{fmt_ns, parse_bencher_output, parse_json, Json};
+use std::process::exit;
+
+/// Compares a criterion bencher run with the stored baselines, prints a
+/// Markdown report on stdout and exits 0 (nothing over the threshold, no
+/// baselines, or nothing parsed), 1 (regression) or 2 (usage / read error).
+fn main() {
+    let args: Vec<String> = std::env::args().collect();
+    let (run_path, doc_path) = match args.as_slice() {
+        [_, run, doc] => (run, doc),
+        _ => {
+            eprintln!("usage: check-bench-regression <bencher-output> <baselines.json>");
+            exit(2);
+        }
+    };
+
+    // Any failure to read the current run is reported as a missing file.
+    let run_text = std::fs::read_to_string(run_path).unwrap_or_else(|_| {
+        eprintln!("error: {run_path} missing");
+        exit(2)
+    });
+
+    // Order by benchmark name, as the Python original did with `sorted(...)`.
+    let mut current = parse_bencher_output(&run_text);
+    current.sort_by(|lhs, rhs| lhs.0.cmp(&rhs.0));
+
+    if current.is_empty() {
+        println!(
+            "::warning::no bench lines parsed from current run \u{2014} \
+             did criterion use --output-format bencher?"
+        );
+        exit(0);
+    }
+
+    // Unreadable baselines file: empty document. Malformed JSON: warn as well.
+    let baseline_doc: Json = match std::fs::read_to_string(doc_path) {
+        Err(_) => Json::Obj(vec![]),
+        Ok(raw) => parse_json(&raw).unwrap_or_else(|_| {
+            println!(
+                "::warning::{doc_path} is not valid JSON; \
+                 treating as empty baseline"
+            );
+            Json::Obj(vec![])
+        }),
+    };
+
+    // Keep only the numeric entries of the top-level "baselines" object.
+    let mut baselines: Vec<(String, f64)> = Vec::new();
+    if let Some(Json::Obj(pairs)) = baseline_doc.get("baselines") {
+        for (key, value) in pairs.iter() {
+            if let Some(number) = value.as_f64() {
+                baselines.push((key.clone(), number));
+            }
+        }
+    }
+    let baseline_for = |bench: &str| baselines.iter().find(|e| e.0 == bench).map(|e| e.1);
+
+    // Fall back to 50% when the document carries no numeric threshold.
+    let configured = baseline_doc.get("_regression_threshold_pct");
+    let threshold_pct = configured.and_then(|node| node.as_f64()).unwrap_or(50.0);
+
+    if baselines.is_empty() {
+        // Advisory mode: list the current numbers only and exit successfully.
+        println!("## Benchmark run (advisory mode \u{2014} no baselines yet)");
+        println!();
+        println!("| Benchmark | Current |");
+        println!("|-----------|---------|");
+        for (bench, ns) in current.iter() {
+            println!("| `{bench}` | {} |", fmt_ns(*ns));
+        }
+        println!();
+        println!(
+            "_No entries in `baselines.json` yet \u{2014} see \
+             `.machine_readable/benchmarks/README.md` for how to seed them._"
+        );
+        exit(0);
+    }
+
+    // `table` holds finished Markdown rows; `regressions` keeps
+    // (name, baseline ns, current ns, delta %) for the failure section.
+    let mut regressions: Vec<(String, i64, i64, f64)> = Vec::new();
+    let mut table: Vec<String> = Vec::new();
+
+    for (bench, ns_ref) in current.iter() {
+        let ns_now = *ns_ref;
+        let ns_base = match baseline_for(bench) {
+            Some(value) => value,
+            None => {
+                table.push(format!(
+                    "| `{bench}` | {} | \u{2014} | new | \u{2728} |",
+                    fmt_ns(ns_now)
+                ));
+                continue;
+            }
+        };
+        // A zero baseline is reported as a 0% change.
+        let pct = if ns_base == 0.0 { 0.0 } else { (ns_now as f64 - ns_base) / ns_base * 100.0 };
+        let verdict = if pct > threshold_pct {
+            regressions.push((bench.clone(), ns_base as i64, ns_now, pct));
+            "\u{274c}"
+        } else if pct > threshold_pct / 2.0 {
+            "\u{26a0}\u{fe0f}"
+        } else if pct < -10.0 {
+            "\u{1f680}"
+        } else {
+            "\u{2705}"
+        };
+        table.push(format!(
+            "| `{bench}` | {} | {} | {pct:+.1}% | {verdict} |",
+            fmt_ns(ns_now), fmt_ns(ns_base as i64)
+        ));
+    }
+
+    println!("## Benchmark comparison");
+    println!();
+    println!("Threshold: regression > **{threshold_pct:.0}%** fails CI.");
+    println!();
+    println!("| Benchmark | Current | Baseline | \u{0394} | |");
+    println!("|-----------|---------|----------|---|---|");
+    for row in table.iter() {
+        println!("{row}");
+    }
+    println!();
+
+    if regressions.is_empty() {
+        return;
+    }
+
+    println!("### Regressions exceeding threshold");
+    println!();
+    for (bench, ns_base, ns_now, pct) in regressions.iter() {
+        let msg = format!(
+            "{bench}: {} \u{2192} {} ({pct:+.1}%, threshold {threshold_pct:.0}%)",
+            fmt_ns(*ns_base), fmt_ns(*ns_now),
+        );
+        println!("- {msg}");
+        eprintln!("::error::benchmark regression: {msg}");
+    }
+    exit(1);
+}