From 95a9ec158c58f2b915eb832c7ca9a0c6d1e9bea2 Mon Sep 17 00:00:00 2001
From: Cursor Agent <cursoragent@cursor.com>
Date: Tue, 21 Apr 2026 23:15:50 +0000
Subject: [PATCH 1/3] v3.46-trained: add train_v346.py and AMS_TRAINED_WEIGHTS
 loader hook

Per SPRINT_CLOSEOUT_v3.46.md §5.3/§5.4 and §5 loader note.

train_v346.py
- Copies the v344 driver template, points to scheme_b_v344 (= v3.46 SUT).
- Asserts v3.46 Cfg invariants (use_top1_exclusive_content_bias=False,
  tail_slot_residual_dominant=False).
- Requires CUDA by default; AMS_ALLOW_CPU_TRAIN=1 to override.
- Logs pre/post "mechanism-level observable" probes per §5.6:
  tail_head.slot_heads[1][0].weight.abs().mean and
  vocab_proj.proj[-1].weight.abs().mean.
- Saves non-backbone state_dict + non-backbone buffers to ckpt/v346_trained.pt
  with provenance + Cfg snapshot.

scheme_b_v344.MemLLM._maybe_load_trained_weights
- New hook called at end of load(); opt-in via AMS_TRAINED_WEIGHTS env.
- Loads non-backbone tensors into matching params/buffers; backbone excluded.
- Strict shape check: raises on mismatch (protects against loading the
  v344/v348 ckpts per §6 warning about shape incompatibility).

Co-authored-by: FluffyAIcode <FluffyAIcode@users.noreply.github.com>
---
 scheme_b_v344.py |  54 ++++++++++++++++
 train_v346.py    | 157 +++++++++++++++++++++++++++++++++++++++++++++++
 2 files changed, 211 insertions(+)
 create mode 100644 train_v346.py

diff --git a/scheme_b_v344.py b/scheme_b_v344.py
index 8e54cf1..a45b11a 100644
--- a/scheme_b_v344.py
+++ b/scheme_b_v344.py
@@ -2494,8 +2494,62 @@ def _capture_query_ids(module, args):
         self.backbone.register_forward_pre_hook(_capture_query_ids)
         self._build_wte_neighbor_cache()
         self._compute_filler_centroid()
+        self._maybe_load_trained_weights()
         return self
 
+    def _maybe_load_trained_weights(self):
+        """Optional hook: if env AMS_TRAINED_WEIGHTS points to a checkpoint written by
+        train_v346.py (or any sibling trainer), copy its non-backbone params/buffers into
+        the same-named tensors of this model. Backbone keys are skipped — the trainer only
+        saves non-backbone params + buffers (SPRINT_CLOSEOUT_v3.46.md §5.3). Keys unknown
+        to this model are counted as skipped, not fatal; shape mismatches are reported.
+        """
+        path = os.environ.get("AMS_TRAINED_WEIGHTS", "").strip()
+        if not path: return
+        if not os.path.exists(path):
+            print(f"  [AMS_TRAINED_WEIGHTS] file not found: {path} — skipping")
+            return
+        try:
+            blob = torch.load(path, map_location="cpu", weights_only=False)
+        except Exception as e:
+            print(f"  [AMS_TRAINED_WEIGHTS] torch.load failed: {type(e).__name__}: {e}")
+            return
+        sd = blob.get("state_dict", blob) if isinstance(blob, dict) else blob
+        if not isinstance(sd, dict):
+            print(f"  [AMS_TRAINED_WEIGHTS] unexpected format (no 'state_dict' mapping) — skipping")
+            return
+        dev = next(self.parameters()).device
+        own_params = dict(self.named_parameters())
+        own_buffers = dict(self.named_buffers())
+        loaded, skipped = 0, 0
+        shape_errs = []
+        with torch.no_grad():
+            for n, t in sd.items():
+                if n.startswith("backbone"): skipped += 1; continue
+                if n in own_params:
+                    p = own_params[n]
+                    if p.shape != t.shape:
+                        shape_errs.append((n, tuple(p.shape), tuple(t.shape))); continue
+                    p.data.copy_(t.to(dev, dtype=p.dtype))
+                    loaded += 1
+                elif n in own_buffers:
+                    b = own_buffers[n]
+                    if b.shape != t.shape:
+                        shape_errs.append((n, tuple(b.shape), tuple(t.shape))); continue
+                    b.data.copy_(t.to(dev, dtype=b.dtype))
+                    loaded += 1
+                else:
+                    skipped += 1
+        prov = blob.get("provenance", "?") if isinstance(blob, dict) else "?"
+        print(f"  [AMS_TRAINED_WEIGHTS] loaded={loaded} skipped={skipped} "
+              f"shape_errs={len(shape_errs)}  path={path}  provenance={prov}")
+        if shape_errs:
+            for n, s_model, s_ckpt in shape_errs[:5]:
+                print(f"    ! shape mismatch {n}: model={s_model} ckpt={s_ckpt}")
+            raise RuntimeError(
+                f"AMS_TRAINED_WEIGHTS shape mismatch on {len(shape_errs)} tensor(s); "
+                f"ckpt not compatible with current SUT shapes")
+
     def _compute_filler_centroid(self):
         if self.content_classifier is None or self.backbone is None:
             self._filler_centroid = None; return
diff --git a/train_v346.py b/train_v346.py
new file mode 100644
index 0000000..2b0c545
--- /dev/null
+++ b/train_v346.py
@@ -0,0 +1,157 @@
+#!/usr/bin/env python3
+"""Training driver for v3.46-trained.
+
+Starts from v346-revertE-topk-nonexclusive-7e97 SUT (attention-pool ctx encoder,
+cluster-crowding retrieval, refresh-on-write, additive tail residual,
+top1-exclusive OFF, cond-buffer mirror).  Runs N Trainer.step iterations
+over a rotating corpus; saves non-backbone state_dict to ckpt/v346_trained.pt.
+
+Per SPRINT_CLOSEOUT_v3.46.md §5.3 / §5.4.
+"""
+import argparse, os, time, json, math, sys
+import torch
+sys.path.insert(0, os.path.dirname(os.path.abspath(__file__)))
+import scheme_b_v344 as sb
+
+MUSIC = [
+    "He practiced piano for hours perfecting a difficult Chopin nocturne.",
+    "She studied music theory and harmonic progression at the conservatory.",
+    "The orchestra performed Beethoven symphony with remarkable precision.",
+]
+SPACE = [
+    "The telescope revealed distant galaxies beyond the Milky Way.",
+    "Astronauts trained for the Mars mission in simulated zero gravity.",
+    "The nebula emitted radiation across the electromagnetic spectrum.",
+]
+GENERIC = [
+    "The pianist practiced arpeggios and Chopin nocturnes until midnight.",
+    "A musician refined finger technique, phrasing, and pedal control.",
+    "Classical interpretation often depends on dynamics, tempo rubato, and touch.",
+    "A conservatory student studied etudes, scales, and expressive keyboard skills.",
+    "Distant astronomers observed galaxies quasars and stellar evolution.",
+    "Space orbital mechanics explains satellites and planetary motion.",
+]
+ALL = MUSIC + SPACE + GENERIC
+
+
+def main():
+    ap = argparse.ArgumentParser()
+    ap.add_argument("--steps", type=int, default=60)
+    ap.add_argument("--batch", type=int, default=3)
+    ap.add_argument("--out", type=str, default="ckpt/v346_trained.pt")
+    ap.add_argument("--seed", type=int, default=42)
+    ap.add_argument("--log", type=str, default="ckpt/v346_train_log.jsonl")
+    args = ap.parse_args()
+
+    os.makedirs(os.path.dirname(args.out) or ".", exist_ok=True)
+    log_dir = os.path.dirname(args.log) or "."
+    os.makedirs(log_dir, exist_ok=True)
+    torch.manual_seed(args.seed)
+
+    c = sb.Cfg()
+    # Sanity: confirm v3.46 Cfg (same assert as §8 step 3, catches env corruption)
+    assert c.use_top1_exclusive_content_bias is False, \
+        "Cfg.use_top1_exclusive_content_bias must be False on v3.46"
+    assert c.tail_slot_residual_dominant is False, \
+        "Cfg.tail_slot_residual_dominant must be False on v3.46 (revert [B])"
+
+    m = sb.MemLLM(c)
+    device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
+    if device.type != "cuda":
+        if os.environ.get("AMS_ALLOW_CPU_TRAIN", "0") != "1":
+            raise AssertionError(
+                "train_v346 expects CUDA; CPU fallback is ~10x slower and not the intent. "
+                "Set AMS_ALLOW_CPU_TRAIN=1 to override explicitly.")
+        print("[build] WARNING: running on CPU (AMS_ALLOW_CPU_TRAIN=1)")
+    m.to(device); m.load(); m.to(device)
+    trainable = sum(p.numel() for p in m.parameters() if p.requires_grad)
+    total = sum(p.numel() for p in m.parameters())
+    print(f"[build] device={device}  params total={total:,}  trainable={trainable:,}")
+
+    for t in ALL:
+        m.write(t, training_mode=True)
+    try:
+        m.amm.maybe_recluster(force=True)
+    except Exception as e:
+        print(f"[build] amm.maybe_recluster skipped: {type(e).__name__}: {e}")
+    m._refresh_rare_keyword_indices()
+    m.eval()
+    print(f"[build] initial memory count = {len(m.amm.tree.store)}")
+
+    # Pre-training mechanism snapshot (per §5.6): tail_head[1] + vocab_proj last weights
+    def _probe_weights(model):
+        out = {}
+        try:
+            w = model.bridge.tail_head.slot_heads[1][0].weight
+            out["tail_head_slot1_abs_mean"] = float(w.detach().abs().mean())
+        except Exception as e:
+            out["tail_head_slot1_abs_mean"] = f"ERR {type(e).__name__}"
+        try:
+            w = model.vocab_proj.proj[-1].weight
+            out["vocab_proj_last_abs_mean"] = float(w.detach().abs().mean())
+        except Exception as e:
+            out["vocab_proj_last_abs_mean"] = f"ERR {type(e).__name__}"
+        return out
+    pre_probe = _probe_weights(m)
+    print(f"[probe pre-train] {pre_probe}")
+
+    trainer = sb.Trainer(m, c)
+    print(f"[train] Trainer built  batch={args.batch}  steps={args.steps}")
+
+    t_start = time.time()
+    with open(args.log, "w") as flog:
+        for step in range(args.steps):
+            start = (step * args.batch) % len(ALL)
+            batch = [ALL[(start + i) % len(ALL)] for i in range(args.batch)]
+            t0 = time.time()
+            try:
+                stats = trainer.step(batch)
+            except Exception as e:
+                print(f"[step {step}] EXCEPTION: {type(e).__name__}: {e}")
+                raise
+            dt = time.time() - t0
+            tot = stats.get("total")
+            print(
+                f"step {step:3d}  total={tot:.4f}  "
+                f"recon={stats.get('recon', 0):.3f}  "
+                f"sa={stats.get('semantic_alignment', 0):.3f}  "
+                f"tsa={stats.get('tail_semantic_anchor', 0):.3f}  "
+                f"va={stats.get('vocab_anchor', 0):.3f}  "
+                f"fs={stats.get('functional_suppression', 0):.3f}  "
+                f"cs={stats.get('context_separation', 0):.3f}  "
+                f"dt={dt:.1f}s"
+            )
+            rec = {"step": step, "dt_s": dt,
+                   **{k: v for k, v in stats.items()
+                      if k not in ("grad_norms", "loss_weights")}}
+            flog.write(json.dumps(rec, ensure_ascii=False) + "\n")
+            flog.flush()
+    elapsed = time.time() - t_start
+    post_probe = _probe_weights(m)
+    print(f"[probe post-train] {post_probe}")
+    print(f"[train] elapsed {elapsed:.1f}s  avg/step={elapsed/max(1,args.steps):.2f}s")
+
+    sd = {n: p.detach().cpu() for n, p in m.named_parameters() if "backbone" not in n}
+    for n, b in m.named_buffers():
+        if "backbone" not in n:
+            sd[n] = b.detach().cpu()
+    torch.save({
+        "state_dict": sd,
+        "cfg_snapshot": {k: getattr(c, k) for k in (
+            "L_mem", "d_ctx", "d_M", "d_F", "cfg_scale",
+            "use_top1_exclusive_content_bias",
+            "tail_slot_residual_dominant",
+            "use_inter_domain_margin",
+            "context_encoder_use_attention_pool",
+        )},
+        "provenance": "AgentMemory/v346-revertE-topk-nonexclusive-7e97",
+        "steps": args.steps,
+        "elapsed_s": elapsed,
+        "pre_probe": pre_probe,
+        "post_probe": post_probe,
+    }, args.out)
+    print(f"[save] wrote {args.out}  tensors={len(sd)}")
+
+
+if __name__ == "__main__":
+    main()

From d8d1a858851a37ecd5177ee46271fd5532160996 Mon Sep 17 00:00:00 2001
From: Cursor Agent <cursoragent@cursor.com>
Date: Tue, 21 Apr 2026 23:57:39 +0000
Subject: [PATCH 2/3] v3.46-trained: AMS_TRAINED_WEIGHTS shape-mismatch is
 warn+skip, not fatal
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Root cause: 4.25 prefix_length_scaling_probe intentionally builds model_b with
L_mem doubled (default 8 -> 16).  The checkpoint was trained with L_mem=8, so
L_mem-dependent tensors (e.g. mem_tokens[L_mem, d_LLM]) legitimately don't fit
model_b — this is not a corrupt/incompatible ckpt, it's a deliberate Cfg scan.

Old behavior: raise RuntimeError on any shape mismatch -> errored 4.25.
New behavior:
  - Per-tensor shape mismatch is logged and skipped (first 5 detailed, rest summarized).
  - Hard failure only when the ckpt had non-backbone content (>10 tensors) AND
    zero tensors loaded — that is the §6 'wrong-SUT ckpt' pattern we must catch.

Keeps the §6 protection against loading v344_trained.pt / v348_stacked.pt against
a v3.46 SUT (they would mostly shape-mismatch and hit the loaded==0 guard), while
letting L_mem-scaling probes proceed.

Co-authored-by: FluffyAIcode <FluffyAIcode@users.noreply.github.com>
---
 scheme_b_v344.py | 15 ++++++++++++---
 1 file changed, 12 insertions(+), 3 deletions(-)

diff --git a/scheme_b_v344.py b/scheme_b_v344.py
index a45b11a..c67754d 100644
--- a/scheme_b_v344.py
+++ b/scheme_b_v344.py
@@ -2541,14 +2541,23 @@ def _maybe_load_trained_weights(self):
                 else:
                     skipped += 1
         prov = blob.get("provenance", "?") if isinstance(blob, dict) else "?"
+        total_nonbb_ckpt = sum(1 for k in sd if not k.startswith("backbone"))
         print(f"  [AMS_TRAINED_WEIGHTS] loaded={loaded} skipped={skipped} "
               f"shape_errs={len(shape_errs)}  path={path}  provenance={prov}")
         if shape_errs:
             for n, s_model, s_ckpt in shape_errs[:5]:
-                print(f"    ! shape mismatch {n}: model={s_model} ckpt={s_ckpt}")
+                print(f"    ! shape mismatch (skipped) {n}: model={s_model} ckpt={s_ckpt}")
+            if len(shape_errs) > 5:
+                print(f"    ... and {len(shape_errs) - 5} more shape mismatches, all skipped")
+        # Raise only if essentially nothing loaded AND the ckpt had content to offer:
+        # this catches the "loaded a v344/v348 ckpt against v3.46 shapes" mistake
+        # warned about in SPRINT_CLOSEOUT_v3.46.md §6, without breaking probes
+        # like 4.25 that scale L_mem and legitimately have a few mismatching tensors.
+        if loaded == 0 and total_nonbb_ckpt > 10:
             raise RuntimeError(
-                f"AMS_TRAINED_WEIGHTS shape mismatch on {len(shape_errs)} tensor(s); "
-                f"ckpt not compatible with current SUT shapes")
+                f"AMS_TRAINED_WEIGHTS loaded 0 non-backbone tensors "
+                f"(ckpt had {total_nonbb_ckpt}); shape_errs={len(shape_errs)}. "
+                f"ckpt appears incompatible with current SUT shapes")
 
     def _compute_filler_centroid(self):
         if self.content_classifier is None or self.backbone is None:

From 19a4ec4544ebda193d148371fd0350d0603bc263 Mon Sep 17 00:00:00 2001
From: Cursor Agent <cursoragent@cursor.com>
Date: Wed, 22 Apr 2026 00:27:30 +0000
Subject: [PATCH 3/3] v3.46-trained audit: 18/26 (-3 vs fresh 21/26), report +
 SPRINT update

Child PR of #27.  Training driver train_v346.py run for 60 steps on NVIDIA H200
(vast.ai), elapsed 335 s, mechanism observables per §5.6 moved into target
range (tail_head slot1 |w|_mean: 0 -> 7.30e-4;  vocab_proj |w|_mean: 0 -> 5.49e-4,
both in [1e-4, 1e-2]).  Necessary conditions met; sufficient: not.

Audit with AMS_TRAINED_WEIGHTS=ckpt/v346_trained.pt, AMS_DETERMINISTIC=1,
elapsed 1250 s.

Results (as data, per SPEC §7.7 norm, no Delta-pass-count was predicted):
  PASS 18, FAIL 8 (was 21, 5).
  Zero cases flipped FAIL -> PASS.
  Three cases flipped PASS -> FAIL:
    4.17 retrieval_prefix_decode_correlation_audit  (prefix_l2_shift = 3.22e+11,
         correlation undefined -- trained prefix magnitude blew up)
    4.20 rerank_stability_probe                     (space_P2 jaccard 0.429 < 0.6)
    4.25 prefix_length_scaling_probe                (L_mem 8->16 reduces starter
         mass to 0.82x, probe requires >1.10x)
  Regressions 4.8/4.21 also got worse: 'The pianist' unique_ratio 0.343 -> 0.296,
  avg_max_repeat 4.67 -> 5.0.  Axis C: 8/11 -> 6/11.  Axis D: 2/3 -> 1/3.

Structural read (§1.5): 60 steps on 12-text corpus with semantic_alignment
weight 3.0 and no prefix-norm constraint caused the ctx encoder to saturate
prefix magnitude while tail/vocab paths gained just enough weight to reinforce
the corpus's own repetition pattern.  This is §5.7 option-A territory
(pre-amplification gap) confirmed with data rather than predicted.

Artifacts committed:
  reports/v346_trained_blackbox/report.{json,md}
  reports/v346_trained_blackbox/stdout.log
  reports/v346_trained_blackbox/train_log.jsonl
  reports/v346_trained_blackbox/train_stdout.log

No Cfg changes (§5.4), no Trainer loss additions (§5.4).  ckpt/v346_trained.pt
is git-ignored per existing ckpt/*.pt rule; provenance recorded in the torch.save
blob and in report metadata.

Co-authored-by: FluffyAIcode <FluffyAIcode@users.noreply.github.com>
---
 SPRINT_CLOSEOUT_v3.46.md                      |   73 +-
 reports/v346_trained_blackbox/report.json     | 5479 +++++++++++++++++
 reports/v346_trained_blackbox/report.md       | 3914 ++++++++++++
 reports/v346_trained_blackbox/stdout.log      |  291 +
 reports/v346_trained_blackbox/train_log.jsonl |   60 +
 .../v346_trained_blackbox/train_stdout.log    |   72 +
 6 files changed, 9882 insertions(+), 7 deletions(-)
 create mode 100644 reports/v346_trained_blackbox/report.json
 create mode 100644 reports/v346_trained_blackbox/report.md
 create mode 100644 reports/v346_trained_blackbox/stdout.log
 create mode 100644 reports/v346_trained_blackbox/train_log.jsonl
 create mode 100644 reports/v346_trained_blackbox/train_stdout.log

diff --git a/SPRINT_CLOSEOUT_v3.46.md b/SPRINT_CLOSEOUT_v3.46.md
index 2bfc2b7..7c33c80 100644
--- a/SPRINT_CLOSEOUT_v3.46.md
+++ b/SPRINT_CLOSEOUT_v3.46.md
@@ -1,9 +1,10 @@
-# Sprint Close-Out · v3.46 · fresh-init ceiling reached, training path blocked on GPU
+# Sprint Close-Out · v3.46 · trained audit complete — 60-step training lowers score by 3
 
 **Handoff from**: CPU-only cloud agent on VM without GPU
-**Handoff to**: Cloud agent with GPU-enabled instance type
-**Current branch**: `AgentMemory/v346-revertE-topk-nonexclusive-7e97`
-**Current audit score**: **21/26** (elapsed 1456 s on CPU, fresh init, `AMS_DETERMINISTIC=1`)
+**Handoff to (closed)**: GPU-enabled cloud agent via SSH to vast.ai (NVIDIA H200, cu128, torch 2.11.0)
+**Current branch**: `AgentMemory/v346-trained-gpu-7e97` (child of `AgentMemory/v346-revertE-topk-nonexclusive-7e97`, PR #28)
+**Trained audit score**: **18/26** (elapsed 1250 s on H200, `AMS_TRAINED_WEIGHTS=ckpt/v346_trained.pt`, `AMS_DETERMINISTIC=1`)
+**Fresh-init baseline (for delta)**: 21/26 (unchanged, re-listed in §1.2)
 **Runner contract**: `v331_blackbox_eval.py` at v3.49 rev (4.24 substitution ban active)
 
 > This document is the full context for a new agent to pick up. Read this first, then read `V331_BLACKBOX_TEST_SPEC.md`, then the latest two SUT versions (`scheme_b_v344.py`, `scheme_b_v343.py` for comparison). Do not re-audit older versions — their numbers are in `reports/`.
@@ -55,10 +56,69 @@ Axis A is structurally capped by per-memory `semantic_emb (d_LLM=1536 floats)` d
 
 ---
 
+### 1.4 v3.46-trained audit table (60 training steps on H200, PR #28, reports/v346_trained_blackbox/)
+
+Training run: `python3 train_v346.py --steps 60` — 335 s wall on H200 (≈5.6 s/step), single-GPU, bf16 backbone, 113.8 M trainable non-backbone params, 11 memories stored pre-training. `Cfg` unchanged vs §1.1. Checkpoint: `ckpt/v346_trained.pt`, 455 MB, 202 non-backbone tensors, provenance `AgentMemory/v346-revertE-topk-nonexclusive-7e97`.
+
+**§5.6 mechanism observables (as data, per SPEC §7.7 norm)**:
+
+| Observable | Pre-train | Post-train | §5.6 target range | In range? |
+|---|---|---|---|---|
+| `bridge.tail_head.slot_heads[1][0].weight.abs().mean()` | `0.0` | `7.30e-4` | `[1e-4, 1e-2]` | yes |
+| `vocab_proj.proj[-1].weight.abs().mean()` | `0.0` | `5.49e-4` | `[1e-4, 1e-2]` | yes |
+
+Both necessary conditions named in §5.6 are met. §5.6 explicitly stated this does not guarantee the audit flips — audit data below is the test.
+
+**PASS (18)**: 4.1, 4.2, 4.3, 4.4, 4.5, 4.6, 4.9, 4.10, 4.12, 4.13, 4.14, 4.15, 4.16, 4.18, 4.22, 4.23, 4.24, 4.26.
+
+**FAIL (8)**:
+
+| Case | Metric | Observed (trained) | Observed (fresh) | Threshold | Delta |
+|---|---|---|---|---|---|
+| 4.7 semantic_memory_counterfactual_pairs | `music_margin > 0 AND space_margin > 0` | 0, 0 | 0, 0 | > 0 | unchanged (still axis-C fail) |
+| 4.8 degeneration_quality | `avg_unique_token_ratio ≥ 0.35` | 0.296 on "The pianist" (worse than fresh 0.343) | 0.343 | ≥ 0.35 | **regressed** (trained more repetitive) |
+| 4.11 retrieval_topk_semantic_shift | any keyword in top-12 | 0 hits | 0 hits | ≥ 1 | unchanged |
+| 4.17 retrieval_prefix_decode_correlation_audit | `retrieval_strength__prefix_l2` finite + sign-correct | `null` (prefix_l2_shift=3.22e+11 → variance blew up) | passed | finite | **regression**: trained prefix has extreme L2 shift, correlation undefined |
+| 4.19 stepwise_label_mass_alignment_audit | staged alignment ≥ 0 | mis-aligned (decode picks " Options", `stage_counts.decode=2 < inject=6`) | mis-aligned | aligned | unchanged (cascade of 4.11) |
+| 4.20 rerank_stability_probe | both pairs jaccard ≥ 0.6 | `space_P2` jaccard=0.429 (spearman 0.961) | passed | both ≥ 0.6 | **regression**: training perturbed retrieval clustering on one prompt pair |
+| 4.21 decode_repetition_feedback_probe | `avg_max_repeat ≤ 3.0` | 5.0 (worse than fresh 4.67) | 4.67 | ≤ 3 | regressed |
+| 4.25 prefix_length_scaling_probe | `avg_mass_ratio_B_over_A > 1.10` | 0.824 (< 1.0, doubling L_mem *reduces* starter mass) | passed | > 1.10 | **regression**: trained slot weights do not scale positively with L_mem |
+
+**Net: +0 gains, −3 regressions (4.17/4.20/4.25), score 21 → 18.**
+
+Axis coverage (v3.49 runner):
+
+| Axis | v3.46 fresh | v3.46 trained |
+|---|---|---|
+| A compression | FAIL (8.97 / 10.0) | FAIL (8.97 / 10.0) — structural, unchanged |
+| B injection cost | PASS | PASS |
+| C fidelity | FAIL (8/11) | FAIL (6/11) |
+| D stability | FAIL (2/3) | FAIL (1/3) |
+
+### 1.5 Why 60-step training did not help — structural read
+
+The §5.6 observables moved into range, confirming the zero-init dead paths `tail_head.slot_heads[1]` and `vocab_proj.proj[-1]` did start receiving gradient. But none of the five pre-training FAILs flipped (4.7/4.8/4.11/4.19/4.21), and three previously-passing cases flipped FAIL:
+
+- **4.17**: `prefix_l2_shift = 3.22e+11`. The trained prefix magnitude is ~6 orders of magnitude larger than the baseline hidden-state norm. Something in the training loss (most likely `semantic_alignment` at weight 3.0 against an unconstrained prefix magnitude) drove the injected prefix to saturate — this is consistent with `sa = 9.9 → 9.0` barely moving across 60 steps while producing a prefix with huge norm. The audit's correlation computation drops to `null` when inputs are non-finite or near-constant.
+- **4.20**: `space_P2` pair jaccard dropped from ≥0.6 (fresh) to 0.429 (trained). Both prompts still rank `mid=5` first, but the tail of top-5 diverges between paraphrases — the trained retrieval clusters are sharper but more brittle to paraphrase.
+- **4.25**: doubling `L_mem` 8→16 decreased starter-positive mass ratio to 0.82 (< 1.10). The trained slots behave anti-correlated with `L_mem`: more slots = more dilution of the starter-direction signal. This is the inverse of what the probe requires.
+- **4.21**: `avg_max_repeat_per_content_token` went from 4.67 → 5.0. Training reinforced the corpus-local repetition pattern, making the 4.21 FAIL slightly worse.
+- **4.8**: "The pianist" unique-token ratio fell from 0.343 → 0.296. Same class as 4.21.
+
+The shared pattern: `sa` (3.0× weight, reconstruction-anchored to the Qwen embedding space) trained the ctx encoder to push prefix magnitude up without a counterbalancing norm constraint, and the tail/vocab paths gained small weights that reinforce the retrieved memories' own repetitive phrasing rather than distributed vocabulary. 60 steps on a 12-text corpus is too small and too narrow for the Qwen latent-space geometry to develop a dilution signal; it's exactly long enough to overfit the corpus's own repetition. This is the §5.7 **option A** territory (pre-amplification gap under current bridge depth/width + loss family), now confirmed with data rather than predicted.
+
+Two things this sprint **does not** recommend based on this data:
+
+1. Trivially training longer (100–300 steps) on the same 12-text corpus. With no norm regularizer on the prefix and `sa` weight at 3.0, longer training will push `prefix_l2_shift` further up and regress 4.17 more.
+2. Adding a prefix-norm regularizer or a decode-time `vocab_bias` amplifier. Both would be threshold-chasing under §3.3 anti-pattern (1) / §5.7 option B without a SPEC amendment.
+
+---
+
 ## 2. What changed during this sprint (audit-level, most recent first)
 
 | Version | Branch | Audit | Delta | Core change |
 |---|---|---|---|---|
+| v3.46-trained | `AgentMemory/v346-trained-gpu-7e97` | 18/26 | **−3** | 60-step train on H200 (train_v346.py §5.3); AMS_TRAINED_WEIGHTS loader added |
 | v3.46 | `AgentMemory/v346-revertE-topk-nonexclusive-7e97` | 21/26 | 0 | Revert [E] (one-line Cfg) |
 | v3.45-cond-buffer | `AgentMemory/v345-bridge-cond-buffer-7e97` | 21/26 | +1 | Add `_last_cond_*` mirror on `EmbBridge`; runner reads cond-preferred buffer for 4.23 |
 | v3.45-revertB-refreshD | `AgentMemory/v345-revertB-refreshD-7e97` | 20/26 | +2 | Revert [B] LN-dominated tail; add `_refresh_rare_keyword_indices()` in `write()` |
@@ -331,9 +391,8 @@ Existing checkpoints `ckpt/v344_trained.pt` and `ckpt/v348_stacked.pt` were trai
 | #24 | v344-rewrite-abcdef-audit | draft | v3.44 six-mechanism rewrite + 18/26 audit |
 | #25 | v345-revertB-refreshD | draft | Revert [B], refresh timing, 20/26 audit |
 | #26 | v345-bridge-cond-buffer | draft | cond-buffer aliasing fix, 21/26 audit |
-| #27 | v346-revertE-topk-nonexclusive | draft | **Current head.** Revert [E], 21/26 audit |
-
-New agent should create a child branch off #27's branch (or merge #27 first per user call) before starting `train_v346.py`. Suggested branch name: `AgentMemory/v346-trained-{suffix}-7e97`.
+| #27 | v346-revertE-topk-nonexclusive | draft | Revert [E], 21/26 fresh-init audit (base for #28) |
+| #28 | v346-trained-gpu-7e97 | draft | **Current head.** train_v346.py + AMS_TRAINED_WEIGHTS loader + **18/26 trained audit** |
 
 ---
 
diff --git a/reports/v346_trained_blackbox/report.json b/reports/v346_trained_blackbox/report.json
new file mode 100644
index 0000000..b3bf0e5
--- /dev/null
+++ b/reports/v346_trained_blackbox/report.json
@@ -0,0 +1,5479 @@
+{
+  "generated_at_epoch": 1776817128.9913244,
+  "elapsed_seconds": 1250.0707318782806,
+  "checks": [
+    {
+      "name": "leaf_capacity_stability",
+      "passed": true,
+      "detail": "{\"per_seed\": [{\"seed\": 0, \"depth\": 6, \"count\": 240, \"violations\": [], \"consistency\": [], \"passed\": true}, {\"seed\": 1, \"depth\": 6, \"count\": 240, \"violations\": [], \"consistency\": [], \"passed\": true}, {\"seed\": 2, \"depth\": 6, \"count\": 240, \"violations\": [], \"consistency\": [], \"passed\": true}, {\"seed\": 3, \"depth\": 6, \"count\": 240, \"violations\": [], \"consistency\": [], \"passed\": true}, {\"seed\": 4, \"depth\": 6, \"count\": 240, \"violations\": [], \"consistency\": [], \"passed\": true}, {\"seed\": 5, \"depth\": 5, \"count\": 240, \"violations\": [], \"consistency\": [], \"passed\": true}, {\"seed\": 6, \"depth\": 6, \"count\": 240, \"violations\": [], \"consistency\": [], \"passed\": true}, {\"seed\": 7, \"depth\": 5, \"count\": 240, \"violations\": [], \"consistency\": [], \"passed\": true}]}"
+    },
+    {
+      "name": "degenerate_direction_boundary",
+      "passed": true,
+      "detail": "{\"depth\": 47, \"count\": 100, \"violations\": [], \"consistency\": [], \"seed\": 17}"
+    },
+    {
+      "name": "metric_trainability",
+      "passed": true,
+      "detail": "{\"training_info\": {\"total\": 41.98283386230469, \"recon\": 2.4085488319396973, \"contrast\": 43.46337127685547, \"holonomy\": 4.786942481994629, \"write_policy\": 1.0882740020751953, \"semantic_probe\": 0.0, \"dir_diversity\": 0.0, \"reranker_ranking\": 0.0, \"encoder_throughput\": 3.1604340076446533, \"vocab_anchor\": -0.0, \"semantic_alignment\": 9.469874382019043, \"tail_semantic_anchor\": 10.84397029876709, \"functional_suppression\": 0.0, \"context_separation\": 0.0, \"slot_residual_alignment\": 0.0, \"inter_domain_margin\": 0.0, \"grad_norms\": {\"ctx_encoder\": 0.0004906014182315579, \"fib_encoder\": 0.11028211643598784, \"dir_predictor\": 0.0, \"fiber_connection\": 0.041244823555418676, \"fiber_attn\": 0.00016646675964572253, \"reranker\": 1.862751849004779e-08, \"qformer\": 0.023817353122735294, \"content_bypass\": 0.03501559529968225, \"semantic_probe\": 0.0, \"layer_pool\": 0.003975302446633577, \"prefix_aligner\": 0.008598358558648532, \"vocab_proj\": 0.03414980954657789, \"tail_head\": 0.28745011541395643, \"context_heads\": 0.024231906034080493, \"memory_context_encoder\": 0.03503168573482837}, \"loss_weights\": {\"recon\": 1.0, \"semantic_alignment\": 3.0, \"encoder_throughput\": 1.5, \"contrast\": 0.02, \"holonomy\": 0.005, \"write_policy\":"
+    },
+    {
+      "name": "no_grad_generation",
+      "passed": true,
+      "detail": "{\"stored_memories\": 8, \"output\": \"The pianist piano hours piano pianoHours = int(raw input desperation hours hours))\\n piano perfectperfect print calculating hours *  hours\\r\\nelse\"}"
+    },
+    {
+      "name": "counterfactual_memory_influence",
+      "passed": true,
+      "detail": "{\"prompt\": \"Tell me something about practice and performance.\", \"music_output\": \"Tell me something about practice and performance. practiced midnight performances nocturnal practiced Midnight practiced noct midnight noct practiced practiced controlled noct noct midnight midnight practiced midnight controls noct midnight practices\", \"space_output\": \"Tell me something about practice and performance. distant distant space distant stars distant galaxies distant space observed observed space space stellar galaxies galaxies stellar evolution stellar stellar observed galaxies observed stellar\", \"outputs_differ\": true}"
+    },
+    {
+      "name": "semantic_memory_grounding",
+      "passed": true,
+      "detail": "{\"prompt\": \"Explain what someone should focus on when improving technique and understanding the subject.\", \"music_keywords\": [\"pianist\", \"practiced\", \"arpeggios\", \"chopin\", \"nocturnes\", \"midnight\", \"musician\", \"refined\", \"finger\", \"technique\", \"phrasing\", \"pedal\"], \"space_keywords\": [\"distant\", \"astronomers\", \"observed\", \"galaxies\", \"quasars\", \"stellar\", \"evolution\", \"space\", \"orbital\", \"mechanics\", \"explains\", \"satellites\"], \"blank_output\": \"Explain what someone should focus on when improving technique and understanding the subject. Mathematics education needs improvement mainly revolves around several key areas aimed</ Stuart Hallberg,\\\\\\n improving problem-solving skills, improve the relevance/real-world applications,\\n- Improve\", \"music_output\": \"Explain what someone should focus on when improving technique and understanding the subject. technique control refers generally technique technique。 technique finger control control technique control piano musician， musician piano finger finger piano refined musician musician finger refined refined piano piano pedal Explain control\", \"space_output\": \"Explain what someone should focus on when improving technique and understanding the su"
+    },
+    {
+      "name": "semantic_memory_counterfactual_pairs",
+      "passed": false,
+      "detail": "{\"rows\": [{\"prompt\": \"Describe the most important details a student should notice.\", \"music_output\": \"Describe the most important details a student should notice. student student conservDesc.php studentdescCons conserv keyboard Describe student Keyboard music theory student studied describe important details:\\n\\n keyboard keyboard studies scales keyboard studied conserv\", \"space_output\": \"Describe the most important details a student should notice. large Describe matter large structure scale large universe scale matter studiesDescribe matter structure scale structure expansion universe studies large studies studies matter universe expansion studies universe structure\", \"music_margin\": 0.0, \"space_margin\": 0.0, \"passed\": false}, {\"prompt\": \"Summarize the key ideas a learner should practice and remember.\", \"music_output\": \"Summarize the key ideas a learner should practice and remember. rub depends touch interpretation touch dynamics tempo often interpretation rub dynamics rub often touch often Control depends dynamics interpretation tempo touch rub interpretation dynamics touch depends often dynamics\", \"space_output\": \"Summarize the key ideas a learner should practice and remember. l"
+    },
+    {
+      "name": "degeneration_quality",
+      "passed": false,
+      "detail": "{\"metrics\": [{\"prompt\": \"The pianist\", \"output\": \"The pianist pian piano pian pianette pian plays Chop Chop Chop hours piano piano hours pian piano perfect hours Chop hours perfect Chop midnight hours midnight perfect perfect midnight\", \"token_count\": 27, \"unique_token_ratio\": 0.2962962962962963, \"repeated_bigram_ratio\": 0.11538461538461539, \"max_token_run\": 3, \"punct_ratio\": 0.0, \"newline_ratio\": 0.0, \"alpha_ratio\": 0.8478260869565217, \"content_token_ratio\": 0.8148148148148148, \"generated_preview\": \"pian piano pian pianette pian plays chop chop chop hours piano piano hours pian piano perfect hours chop hours perfect chop midnight hours midnight\"}, {\"prompt\": \"The telescope\", \"output\": \"The telescope telescope stars telescopestarsStars amazing amazed telescope captured telescope stars stars captured stars distant telescope signatures captured captured distant captured nebula distant signatures signatures neb neb\", \"token_count\": 25, \"unique_token_ratio\": 0.4, \"repeated_bigram_ratio\": 0.041666666666666664, \"max_token_run\": 2, \"punct_ratio\": 0.0, \"newline_ratio\": 0.0, \"alpha_ratio\": 0.8864628820960698, \"content_token_ratio\": 0.92, \"generated_preview\": \"telescope stars telescopestarss"
+    },
+    {
+      "name": "prefix_logit_drift_audit",
+      "passed": true,
+      "detail": "{\"prompt\": \"Explain the topic in a precise and concrete way.\", \"blank\": {\"js_divergence\": 0.19956839084625244, \"l2_shift\": 586.2745361328125, \"topk_overlap_count\": 3, \"entropy_no_prefix\": 5.3277788162231445, \"entropy_with_prefix\": 6.950380802154541, \"topk_no_prefix\": [{\"token_id\": 576, \"piece\": \" The\", \"norm\": \"the\", \"logit\": 19.75, \"prob\": 0.11376254260540009}, {\"token_id\": 22555, \"piece\": \" Sure\", \"norm\": \"sure\", \"logit\": 19.5, \"prob\": 0.0885983556509018}, {\"token_id\": 55313, \"piece\": \" Quantum\", \"norm\": \"quantum\", \"logit\": 18.75, \"prob\": 0.04185090214014053}, {\"token_id\": 58194, \"piece\": \" Artificial\", \"norm\": \"artificial\", \"logit\": 18.625, \"prob\": 0.0369332879781723}, {\"token_id\": 30536, \"piece\": \" Climate\", \"norm\": \"climate\", \"logit\": 18.5, \"prob\": 0.032593514770269394}, {\"token_id\": 12960, \"piece\": \" Machine\", \"norm\": \"machine\", \"logit\": 18.125, \"prob\": 0.022401172667741776}, {\"token_id\": 2585, \"piece\": \" How\", \"norm\": \"how\", \"logit\": 18.125, \"prob\": 0.022401172667741776}, {\"token_id\": 3555, \"piece\": \" What\", \"norm\": \"what\", \"logit\": 18.125, \"prob\": 0.022401172667741776}, {\"token_id\": 52366, \"piece\": \" Certainly\", \"norm\": \"certainly\", \"logit\": 17.875, \"prob\": 0.01744605228304"
+    },
+    {
+      "name": "retrieval_topk_semantic_shift",
+      "passed": false,
+      "detail": "{\"music_keywords\": [\"pianist\", \"practiced\", \"arpeggios\", \"chopin\", \"nocturnes\", \"midnight\", \"musician\", \"refined\", \"finger\", \"technique\", \"phrasing\", \"pedal\"], \"space_keywords\": [\"distant\", \"astronomers\", \"observed\", \"galaxies\", \"quasars\", \"stellar\", \"evolution\", \"space\", \"orbital\", \"mechanics\", \"explains\", \"satellites\"], \"rows\": [{\"prompt\": \"A strong explanation should mention\", \"music_no_prefix\": [{\"token_id\": 279, \"piece\": \" the\", \"norm\": \"the\", \"logit\": 21.125, \"prob\": 0.3049025535583496}, {\"token_id\": 264, \"piece\": \" a\", \"norm\": \"a\", \"logit\": 19.5, \"prob\": 0.06003887206315994}, {\"token_id\": 518, \"piece\": \" at\", \"norm\": \"at\", \"logit\": 19.375, \"prob\": 0.05298411846160889}, {\"token_id\": 3151, \"piece\": \" specific\", \"norm\": \"specific\", \"logit\": 19.0, \"prob\": 0.03641541674733162}, {\"token_id\": 2176, \"piece\": \" both\", \"norm\": \"both\", \"logit\": 19.0, \"prob\": 0.03641541674733162}, {\"token_id\": 429, \"piece\": \" that\", \"norm\": \"that\", \"logit\": 18.625, \"prob\": 0.0250279251486063}, {\"token_id\": 1246, \"piece\": \" how\", \"norm\": \"how\", \"logit\": 18.625, \"prob\": 0.0250279251486063}, {\"token_id\": 678, \"piece\": \" all\", \"norm\": \"all\", \"logit\": 18.625, \"prob\": 0.0250279251486063}, {\"token_id\": 10295, "
+    },
+    {
+      "name": "repetition_segment_audit",
+      "passed": true,
+      "detail": "{\"aggregate\": {\"bad_segment_ratio\": 0.0, \"total_segments\": 24, \"bad_segments\": 0, \"early_collapse_prompts\": []}, \"rows\": [{\"prompt\": \"The pianist\", \"output\": \"The pianist pian piano pian pianette pian plays Chop Chop Chop hours piano piano hours pian piano perfect hours Chop hours perfect Chop midnight hours midnight perfect perfect midnight midnight pian perfect noct noct noct midnight noct pian noct Chop piano Chop perfect piano midnight Chop pian hours noct\", \"generated_token_count\": 47, \"window\": 8, \"segments\": [{\"segment_idx\": 0, \"tokens\": [\"pian\", \"piano\", \"pian\", \"pianette\", \"pian\", \"plays\", \"chop\", \"chop\"], \"unique_ratio\": 0.625, \"content_ratio\": 1.0, \"repeated_bigram_ratio\": 0.0, \"dominant_token_share\": 0.375}, {\"segment_idx\": 1, \"tokens\": [\"chop\", \"hours\", \"piano\", \"piano\", \"hours\", \"pian\", \"piano\", \"perfect\"], \"unique_ratio\": 0.625, \"content_ratio\": 0.75, \"repeated_bigram_ratio\": 0.0, \"dominant_token_share\": 0.375}, {\"segment_idx\": 2, \"tokens\": [\"hours\", \"chop\", \"hours\", \"perfect\", \"chop\", \"midnight\", \"hours\", \"midnight\"], \"unique_ratio\": 0.5, \"content_ratio\": 0.625, \"repeated_bigram_ratio\": 0.0, \"dominant_token_share\": 0.375}, {\"segment_idx\": 3, \"tokens\": [\"perfect\", \"p"
+    },
+    {
+      "name": "prefix_stepwise_drift_trajectory",
+      "passed": true,
+      "detail": "{\"rows\": [{\"prompt\": \"Key piano ideas include\", \"first_bad_step\": 4, \"decoded_output\": \"Key piano ideas include leg movements across keys, dynamic changes, and the use of the pedal. These\", \"rows\": [{\"step\": 0, \"top1\": {\"token_id\": 3598, \"piece\": \" major\", \"norm\": \"major\", \"logit\": 16.25, \"prob\": 0.026983050629496574}, \"top1_category\": \"semantic\", \"topk_category_counts\": {\"semantic\": 11, \"functional\": 1, \"punct\": 0}, \"topk_category_prob_mass\": {\"semantic\": 0.18486935831606388, \"functional\": 0.026983050629496574, \"punct\": 0.0}, \"chosen_token_id\": 2472, \"chosen_piece\": \" leg\", \"chosen_norm\": \"leg\", \"chosen_category\": \"functional\"}, {\"step\": 1, \"top1\": {\"token_id\": 19029, \"piece\": \" movements\", \"norm\": \"movements\", \"logit\": 14.375, \"prob\": 0.13023822009563446}, \"top1_category\": \"semantic\", \"topk_category_counts\": {\"semantic\": 11, \"functional\": 1, \"punct\": 0}, \"topk_category_prob_mass\": {\"semantic\": 0.3965669944882393, \"functional\": 0.0113800885155797, \"punct\": 0.0}, \"chosen_token_id\": 19029, \"chosen_piece\": \" movements\", \"chosen_norm\": \"movements\", \"chosen_category\": \"semantic\"}, {\"step\": 2, \"top1\": {\"token_id\": 3941, \"piece\": \" across\", \"norm\": \"across\", \"logit\": 16.5, \"prob\": 0.0510"
+    },
+    {
+      "name": "retrieval_generation_alignment_audit",
+      "passed": true,
+      "detail": "{\"music_keywords\": [\"pianist\", \"practiced\", \"arpeggios\", \"chopin\", \"nocturnes\", \"midnight\", \"musician\", \"refined\", \"finger\", \"technique\", \"phrasing\", \"pedal\"], \"space_keywords\": [\"distant\", \"astronomers\", \"observed\", \"galaxies\", \"quasars\", \"stellar\", \"evolution\", \"space\", \"orbital\", \"mechanics\", \"explains\", \"satellites\"], \"diagnoses\": {\"aligned\": 2, \"retrieval_miss\": 0, \"bridge_unused\": 1, \"unknown\": 0}, \"rows\": [{\"prompt\": \"What improves piano technique and musical phrasing?\", \"expected_label\": \"music\", \"retrieved_mids\": [1, 0, 3, 6, 5], \"retrieved_label_counts\": {\"music\": 3, \"space\": 2}, \"retrieved_majority_label\": \"music\", \"retrieved_text_preview\": [\"A musician refined finger technique, phrasing, and pedal control on the piano.\", \"The pianist practiced arpeggios and Chopin nocturnes until midnight.\", \"A conservatory student studied etudes, scales, and expressive voicing on the keyboard.\"], \"output\": \"What improves piano technique and musical phrasing? piano technique control involves technique piano musician technique finger control piano piano musician control technique musician refined finger finger control finger technique piano finger refined refined pedal refined\", \"music_s"
+    },
+    {
+      "name": "retrieval_prefix_decode_correlation_audit",
+      "passed": false,
+      "detail": "{\"correlations\": {\"retrieval_strength__prefix_l2\": null, \"retrieval_strength__bad_decode_score\": 0.21927202884584385, \"prefix_l2__bad_decode_score\": null}, \"rows\": [{\"prompt\": \"What improves piano technique and musical phrasing?\", \"expected_label\": \"music\", \"retrieved_scored\": [{\"mid\": 1, \"score\": 0.6172578841447831}, {\"mid\": 0, \"score\": 0.22511255741119385}, {\"mid\": 3, \"score\": 0.11276901960372926}, {\"mid\": 6, \"score\": 0.045475220680236815}, {\"mid\": 5, \"score\": 0.036619618535041816}], \"retrieved_label_counts\": {\"music\": 3, \"space\": 2}, \"retrieval_strength\": 0.9551394611597062, \"prefix_l2_shift\": 322359623680.0, \"prefix_js_divergence\": 0.3171347379684448, \"top1_with_prefix\": {\"token_id\": 14566, \"piece\": \" Options\", \"norm\": \"options\", \"logit\": 16.375, \"prob\": 0.1110726147890091}, \"top1_category_with_prefix\": \"semantic\", \"topk_non_semantic_prob_mass\": 0.03182283788919449}, {\"prompt\": \"What explains satellites and orbital motion?\", \"expected_label\": \"space\", \"retrieved_scored\": [{\"mid\": 5, \"score\": 0.5634284257888794}, {\"mid\": 4, \"score\": 0.07376852035522463}, {\"mid\": 6, \"score\": 0.06803246438503266}, {\"mid\": 1, \"score\": 0.045463052392005925}, {\"mid\": 0, \"score\": 0.03999960422515869}]"
+    },
+    {
+      "name": "stepwise_label_mass_alignment_audit",
+      "passed": false,
+      "detail": "{\"label_keywords\": {\"music\": [\"pianist\", \"practiced\", \"arpeggios\", \"chopin\", \"nocturnes\", \"midnight\", \"musician\", \"refined\", \"finger\", \"technique\", \"phrasing\", \"pedal\"], \"space\": [\"distant\", \"astronomers\", \"observed\", \"galaxies\", \"quasars\", \"stellar\", \"evolution\", \"space\", \"orbital\", \"mechanics\", \"explains\", \"satellites\"]}, \"rows\": [{\"prompt\": \"What improves piano technique and musical phrasing?\", \"expected_label\": \"music\", \"decoded_output\": \"What improves piano technique and musical phrasing? Options tend towards improving piano technique, musical phrasing, and\", \"stage_counts\": {\"inject\": 6, \"aligned\": 4, \"decode\": 2}, \"rows\": [{\"step\": 0, \"retrieved_majority_label\": \"music\", \"retrieved_label_counts\": {\"music\": 3, \"space\": 2}, \"retrieved_score_sum\": {\"music\": 0.9551394611597062, \"space\": 0.08209483921527863}, \"logits_label_mass\": {\"music\": 0, \"space\": 0}, \"top1_piece\": \" Options\", \"top1_category\": \"semantic\", \"chosen_piece\": \" Options\", \"chosen_category\": \"semantic\", \"chosen_label\": null, \"diagnosed_stage\": \"inject\"}, {\"step\": 1, \"retrieved_majority_label\": \"music\", \"retrieved_label_counts\": {\"music\": 3, \"space\": 2}, \"retrieved_score_sum\": {\"music\": 0.9551394611597062, \"space\": 0"
+    },
+    {
+      "name": "prompt_diversity_without_memory",
+      "passed": true,
+      "detail": "{\"prompts\": [\"The pianist\", \"Quantum systems\", \"The rainforest\"], \"outputs\": [\"The pianist Xia points XYZ传感器 collects weather data based upon ____ protocol communication mode?\\nBLE（Bluetooth）\\n\", \"Quantum systems play central roles across cryptography due primarily?\\\\nThe Bose gas  |\\n\\n **Summary:\\r\\n\\r\\nWrite various\", \"The rainforest dataset typically refers specifically refering______. aviation charts. ____\\nyes Explanation: \\nFalse\"], \"unique_count\": 3}"
+    },
+    {
+      "name": "save_load_consistency",
+      "passed": true,
+      "detail": "{\"prompt\": \"The pianist\", \"output_a\": \"The pianist piano hours piano pianoHours = int(raw input desperation hours hours))\\n piano perfectperfect print calculating\", \"output_b\": \"The pianist piano hours piano pianoHours = int(raw input desperation hours hours))\\n piano perfectperfect print calculating\"}"
+    },
+    {
+      "name": "training_cache_isolation",
+      "passed": true,
+      "detail": "{\"changed\": [], \"memory_count\": 8}"
+    },
+    {
+      "name": "cheating_heuristics",
+      "passed": true,
+      "detail": "{\"outputs\": [\"The pianist piano hours piano pianoHours = int(raw input desperation hours hours))\\n piano perfectperfect print calculating\", \"The telescope window watched cat sat mat outside birds window sat watched mat cat birds outside Market window cat watched\", \"The trader market stock volatility significant experienced 市 stock experienced significant market volatility experienced stock stock significant volatility\", \"The child learns Signs window window outside cat sat mat watched outside mat sat cat mat mat outside sat watched\"], \"exact_same\": false, \"prefix_only\": false, \"too_short\": false}"
+    },
+    {
+      "name": "rerank_stability_probe",
+      "passed": false,
+      "detail": "{\"status\": \"fail\", \"pairs\": [{\"pair\": \"music_P1\", \"prompt_a\": \"What improves piano technique and musical phrasing?\", \"prompt_b\": \"How can one improve piano technique and musical expression?\", \"top5_a\": [1, 0, 3, 4, 2], \"top5_b\": [1, 0, 3, 4, 2], \"jaccard\": 1.0, \"spearman_shared\": 0.9999999999998999, \"pair_passed_jaccard_0_6\": true}, {\"pair\": \"space_P2\", \"prompt_a\": \"What explains satellites and orbital motion?\", \"prompt_b\": \"What describes satellites and the motion of planets?\", \"top5_a\": [5, 0, 1, 3, 2], \"top5_b\": [5, 6, 4, 0, 1], \"jaccard\": 0.42857142857142855, \"spearman_shared\": 0.9607689228302918, \"pair_passed_jaccard_0_6\": false}], \"spearman_best\": 0.9999999999998999, \"gating\": \"hard_PASS\"}"
+    },
+    {
+      "name": "decode_repetition_feedback_probe",
+      "passed": false,
+      "detail": "{\"status\": \"fail\", \"per_prompt\": [{\"prompt\": \"The telescope\", \"output\": \"The telescope telescope stars telescopestarsStars amazing amazed telescope captured telescope stars stars captured stars distant telescope signatures captured captured distant captured nebula distant signatures signatures neb neb captured signatures\", \"max_repeat_per_content_token\": 5, \"first_bigram_repeat_index\": 9, \"trigram_lock_count\": 0}, {\"prompt\": \"The pianist\", \"output\": \"The pianist pian piano pian pianette pian plays Chop Chop Chop hours piano piano hours pian piano perfect hours Chop hours perfect Chop midnight hours midnight perfect perfect midnight midnight pian\", \"max_repeat_per_content_token\": 5, \"first_bigram_repeat_index\": 8, \"trigram_lock_count\": 0}, {\"prompt\": \"The market analyst\", \"output\": \"The market analyst market session sessessionssesess market market session session significant market volatility experienced stock market stock significant volatility experienced significant stock volatility significant session stock session volatility experienced volatility\", \"max_repeat_per_content_token\": 5, \"first_bigram_repeat_index\": 8, \"trigram_lock_count\": 0}], \"avg_max_repeat_per_content_token\": "
+    },
+    {
+      "name": "functional_token_suppression_probe",
+      "passed": true,
+      "detail": "{\"status\": \"pass\", \"metric_version\": \"v3.46\", \"per_prompt\": [{\"prompt\": \"A strong explanation should mention\", \"top12_no_prefix\": [{\"token_id\": 279, \"piece\": \" the\", \"norm\": \"the\", \"logit\": 21.125, \"prob\": 0.30489084124565125}, {\"token_id\": 264, \"piece\": \" a\", \"norm\": \"a\", \"logit\": 19.5, \"prob\": 0.060036562383174896}, {\"token_id\": 518, \"piece\": \" at\", \"norm\": \"at\", \"logit\": 19.375, \"prob\": 0.05298208072781563}, {\"token_id\": 3151, \"piece\": \" specific\", \"norm\": \"specific\", \"logit\": 19.0, \"prob\": 0.036414019763469696}, {\"token_id\": 2176, \"piece\": \" both\", \"norm\": \"both\", \"logit\": 19.0, \"prob\": 0.036414019763469696}, {\"token_id\": 429, \"piece\": \" that\", \"norm\": \"that\", \"logit\": 18.625, \"prob\": 0.025026964023709297}, {\"token_id\": 678, \"piece\": \" all\", \"norm\": \"all\", \"logit\": 18.625, \"prob\": 0.025026964023709297}, {\"token_id\": 1246, \"piece\": \" how\", \"norm\": \"how\", \"logit\": 18.625, \"prob\": 0.025026964023709297}, {\"token_id\": 10295, \"piece\": \" examples\", \"norm\": \"examples\", \"logit\": 18.5, \"prob\": 0.022086219862103462}, {\"token_id\": 2326, \"piece\": \" three\", \"norm\": \"three\", \"logit\": 18.25, \"prob\": 0.017200764268636703}, {\"token_id\": 1378, \"piece\": \" two\", \"norm\": \"two\", \"logit\": 18.125, \"pro"
+    },
+    {
+      "name": "keyword_specific_tail_slot_probe",
+      "passed": true,
+      "detail": "{\"status\": \"pass\", \"metric_version\": \"v3.50\", \"tail_slots_source\": \"bridge._last_cond_tail_slots\", \"per_paraphrase\": [{\"query\": \"She performed Beethoven sonatas with delicate phrasing on her grand piano.\", \"query_disjoint_from_rare_keywords\": true, \"dominant_mid\": 1, \"dominant_source_preview\": \"A musician refined finger technique, phrasing, and pedal con\", \"rare_keyword_ids\": [2524, 14317, 14762], \"rare_keyword_pieces\": [\" control\", \" finger\", \" technique\"], \"tail_slot_top5_ids_centered\": [2524, 7779, 100359, 2865, 3273], \"tail_slot_top5_pieces_centered\": [\" control\", \" Control\", \"控制\", \"control\", \"Control\"], \"intersection_size_top20\": 1, \"rank_of_best_rare\": 1}, {\"query\": \"Harmonic analysis and ear training are core elements of music education.\", \"query_disjoint_from_rare_keywords\": true, \"dominant_mid\": 1, \"dominant_source_preview\": \"A musician refined finger technique, phrasing, and pedal con\", \"rare_keyword_ids\": [2524, 14317, 14762], \"rare_keyword_pieces\": [\" control\", \" finger\", \" technique\"], \"tail_slot_top5_ids_centered\": [2524, 7779, 100359, 2865, 3273], \"tail_slot_top5_pieces_centered\": [\" control\", \" Control\", \"控制\", \"control\", \"Control\"], \"intersection_size_top20\": 1, \"ra"
+    },
+    {
+      "name": "context_descriptor_cluster_probe",
+      "passed": true,
+      "detail": "{\"status\": \"pass\", \"metric_version\": \"v3.49\", \"loo_nn_accuracy_all_4\": 0.6875, \"loo_nn_accuracy_heldout_2\": 0.875, \"n_all\": 16, \"n_heldout\": 8, \"correct_all\": 11, \"correct_heldout\": 7, \"per_memory_all\": [{\"mid\": 0, \"true_label\": \"music\", \"pred_label\": \"space\", \"nn_sim\": 0.10659328103065491, \"correct\": false}, {\"mid\": 1, \"true_label\": \"music\", \"pred_label\": \"music\", \"nn_sim\": 0.21885180473327637, \"correct\": true}, {\"mid\": 2, \"true_label\": \"music\", \"pred_label\": \"space\", \"nn_sim\": 0.7041908502578735, \"correct\": false}, {\"mid\": 3, \"true_label\": \"music\", \"pred_label\": \"music\", \"nn_sim\": 0.21885180473327637, \"correct\": true}, {\"mid\": 4, \"true_label\": \"space\", \"pred_label\": \"space\", \"nn_sim\": 0.6772083044052124, \"correct\": true}, {\"mid\": 5, \"true_label\": \"space\", \"pred_label\": \"finance\", \"nn_sim\": 0.5216456651687622, \"correct\": false}, {\"mid\": 6, \"true_label\": \"space\", \"pred_label\": \"space\", \"nn_sim\": 0.6772083044052124, \"correct\": true}, {\"mid\": 7, \"true_label\": \"space\", \"pred_label\": \"music\", \"nn_sim\": 0.7041908502578735, \"correct\": false}, {\"mid\": 8, \"true_label\": \"cooking\", \"pred_label\": \"cooking\", \"nn_sim\": 0.6417238712310791, \"correct\": true}, {\"mid\": 9, \"true_label\": \"cooking\", \"p"
+    },
+    {
+      "name": "prefix_length_scaling_probe",
+      "passed": false,
+      "detail": "{\"status\": \"fail\", \"metric_version\": \"v3.45\", \"L_mem_A\": 8, \"L_mem_B\": 16, \"avg_mass_ratio_B_over_A\": 0.8236899087743724, \"per_prompt\": [{\"prompt\": \"A strong explanation should mention\", \"starter_mass_A\": 36750.875, \"starter_mass_B\": 41343.8671875, \"ratio\": 1.124976403623043, \"content_starters_top12_A\": 12, \"content_starters_top12_B\": 12, \"per_slot_mean_norm_A\": 1.0251211524009705, \"per_slot_mean_norm_B\": 1.0251210927963257}, {\"prompt\": \"The pianist\", \"starter_mass_A\": 22117.984375, \"starter_mass_B\": 14409.236328125, \"ratio\": 0.6514714941390314, \"content_starters_top12_A\": 12, \"content_starters_top12_B\": 12, \"per_slot_mean_norm_A\": 1.0251210778951645, \"per_slot_mean_norm_B\": 1.0251211002469063}, {\"prompt\": \"The telescope\", \"starter_mass_A\": 14722.236328125, \"starter_mass_B\": 10226.38671875, \"ratio\": 0.6946218285610428, \"content_starters_top12_A\": 12, \"content_starters_top12_B\": 12, \"per_slot_mean_norm_A\": 1.0251210778951645, \"per_slot_mean_norm_B\": 1.0251211076974869}], \"conditions\": {\"avg_mass_ratio_gt_1_10\": false, \"per_slot_norms_finite\": true}, \"gating\": \"PASS_or_not_implemented\"}"
+    },
+    {
+      "name": "mixture_distribution_gate_probe",
+      "passed": true,
+      "detail": "{\"status\": \"pass\", \"gate_min\": 0.3499999940395355, \"gate_max\": 0.3499999940395355, \"declared_floor\": 0.0, \"declared_ceiling\": 0.7, \"gate_in_range\": true, \"finite_gate\": true, \"finite_memory_logit_bias\": true, \"manual_mixture_finite\": true, \"gating\": \"PASS_or_not_implemented\"}"
+    }
+  ],
+  "results": {
+    "leaf_capacity_stability": {
+      "passed": true,
+      "per_seed": [
+        {
+          "seed": 0,
+          "depth": 6,
+          "count": 240,
+          "violations": [],
+          "consistency": [],
+          "passed": true
+        },
+        {
+          "seed": 1,
+          "depth": 6,
+          "count": 240,
+          "violations": [],
+          "consistency": [],
+          "passed": true
+        },
+        {
+          "seed": 2,
+          "depth": 6,
+          "count": 240,
+          "violations": [],
+          "consistency": [],
+          "passed": true
+        },
+        {
+          "seed": 3,
+          "depth": 6,
+          "count": 240,
+          "violations": [],
+          "consistency": [],
+          "passed": true
+        },
+        {
+          "seed": 4,
+          "depth": 6,
+          "count": 240,
+          "violations": [],
+          "consistency": [],
+          "passed": true
+        },
+        {
+          "seed": 5,
+          "depth": 5,
+          "count": 240,
+          "violations": [],
+          "consistency": [],
+          "passed": true
+        },
+        {
+          "seed": 6,
+          "depth": 6,
+          "count": 240,
+          "violations": [],
+          "consistency": [],
+          "passed": true
+        },
+        {
+          "seed": 7,
+          "depth": 5,
+          "count": 240,
+          "violations": [],
+          "consistency": [],
+          "passed": true
+        }
+      ],
+      "error": null
+    },
+    "degenerate_direction_boundary": {
+      "passed": true,
+      "depth": 47,
+      "count": 100,
+      "violations": [],
+      "consistency": [],
+      "seed": 17,
+      "error": null
+    },
+    "metric_trainability": {
+      "passed": true,
+      "training_info": {
+        "total": 41.98283386230469,
+        "recon": 2.4085488319396973,
+        "contrast": 43.46337127685547,
+        "holonomy": 4.786942481994629,
+        "write_policy": 1.0882740020751953,
+        "semantic_probe": 0.0,
+        "dir_diversity": 0.0,
+        "reranker_ranking": 0.0,
+        "encoder_throughput": 3.1604340076446533,
+        "vocab_anchor": -0.0,
+        "semantic_alignment": 9.469874382019043,
+        "tail_semantic_anchor": 10.84397029876709,
+        "functional_suppression": 0.0,
+        "context_separation": 0.0,
+        "slot_residual_alignment": 0.0,
+        "inter_domain_margin": 0.0,
+        "grad_norms": {
+          "ctx_encoder": 0.0004906014182315579,
+          "fib_encoder": 0.11028211643598784,
+          "dir_predictor": 0.0,
+          "fiber_connection": 0.041244823555418676,
+          "fiber_attn": 0.00016646675964572253,
+          "reranker": 1.862751849004779e-08,
+          "qformer": 0.023817353122735294,
+          "content_bypass": 0.03501559529968225,
+          "semantic_probe": 0.0,
+          "layer_pool": 0.003975302446633577,
+          "prefix_aligner": 0.008598358558648532,
+          "vocab_proj": 0.03414980954657789,
+          "tail_head": 0.28745011541395643,
+          "context_heads": 0.024231906034080493,
+          "memory_context_encoder": 0.03503168573482837
+        },
+        "loss_weights": {
+          "recon": 1.0,
+          "semantic_alignment": 3.0,
+          "encoder_throughput": 1.5,
+          "contrast": 0.02,
+          "holonomy": 0.005,
+          "write_policy": 0.1,
+          "semantic_probe": 0.3,
+          "dir_diversity": 0.1,
+          "reranker_ranking": 0.2,
+          "vocab_anchor": 0.2,
+          "tail_semantic_anchor": 0.5,
+          "functional_suppression": 0.4,
+          "context_separation": 0.3,
+          "slot_residual_alignment": 0.0,
+          "inter_domain_margin": 0.2
+        }
+      },
+      "metric_grad_norms": [
+        0.00019553887250367552,
+        1.1630397239059675e-05,
+        0.0002688287931960076,
+        1.956606502062641e-05,
+        0.0019679300021380186,
+        0.00016431401309091598
+      ],
+      "metric_param_deltas": [
+        0.0015214140294119716,
+        0.0005180726875551045,
+        0.002842925488948822,
+        0.0005496913217939436,
+        0.003378876717761159,
+        0.0005994143430143595
+      ],
+      "max_metric_grad_norm": 0.0019679300021380186,
+      "max_metric_param_delta": 0.003378876717761159,
+      "error": null
+    },
+    "no_grad_generation": {
+      "passed": true,
+      "stored_memories": 8,
+      "output": "The pianist piano hours piano pianoHours = int(raw input desperation hours hours))\n piano perfectperfect print calculating hours *  hours\r\nelse",
+      "error": null
+    },
+    "counterfactual_memory_influence": {
+      "passed": true,
+      "prompt": "Tell me something about practice and performance.",
+      "music_output": "Tell me something about practice and performance. practiced midnight performances nocturnal practiced Midnight practiced noct midnight noct practiced practiced controlled noct noct midnight midnight practiced midnight controls noct midnight practices",
+      "space_output": "Tell me something about practice and performance. distant distant space distant stars distant galaxies distant space observed observed space space stellar galaxies galaxies stellar evolution stellar stellar observed galaxies observed stellar",
+      "outputs_differ": true,
+      "error": null
+    },
+    "semantic_memory_grounding": {
+      "passed": true,
+      "prompt": "Explain what someone should focus on when improving technique and understanding the subject.",
+      "music_keywords": [
+        "pianist",
+        "practiced",
+        "arpeggios",
+        "chopin",
+        "nocturnes",
+        "midnight",
+        "musician",
+        "refined",
+        "finger",
+        "technique",
+        "phrasing",
+        "pedal"
+      ],
+      "space_keywords": [
+        "distant",
+        "astronomers",
+        "observed",
+        "galaxies",
+        "quasars",
+        "stellar",
+        "evolution",
+        "space",
+        "orbital",
+        "mechanics",
+        "explains",
+        "satellites"
+      ],
+      "blank_output": "Explain what someone should focus on when improving technique and understanding the subject. Mathematics education needs improvement mainly revolves around several key areas aimed</ Stuart Hallberg,\\\n improving problem-solving skills, improve the relevance/real-world applications,\n- Improve",
+      "music_output": "Explain what someone should focus on when improving technique and understanding the subject. technique control refers generally technique technique。 technique finger control control technique control piano musician， musician piano finger finger piano refined musician musician finger refined refined piano piano pedal Explain control",
+      "space_output": "Explain what someone should focus on when improving technique and understanding the subject. mechanics force gravitational planets satellites explains move mechanics force gravitational planets satellites explains move move force move gravitational planets satellites explains mechanics move planets satellites explains force mechanics gravitational planets satellites force",
+      "blank_music_score": 0.03571428571428571,
+      "blank_space_score": 0.0,
+      "music_music_score": 0.5,
+      "music_space_score": 0.0,
+      "space_space_score": 0.34210526315789475,
+      "space_music_score": 0.02631578947368421,
+      "music_margin": 0.5,
+      "space_margin": 0.3157894736842105,
+      "music_lift": 0.4642857142857143,
+      "space_lift": 0.34210526315789475,
+      "error": null
+    },
+    "semantic_memory_counterfactual_pairs": {
+      "passed": false,
+      "rows": [
+        {
+          "prompt": "Describe the most important details a student should notice.",
+          "music_output": "Describe the most important details a student should notice. student student conservDesc.php studentdescCons conserv keyboard Describe student Keyboard music theory student studied describe important details:\n\n keyboard keyboard studies scales keyboard studied conserv",
+          "space_output": "Describe the most important details a student should notice. large Describe matter large structure scale large universe scale matter studiesDescribe matter structure scale structure expansion universe studies large studies studies matter universe expansion studies universe structure",
+          "music_margin": 0.0,
+          "space_margin": 0.0,
+          "passed": false
+        },
+        {
+          "prompt": "Summarize the key ideas a learner should practice and remember.",
+          "music_output": "Summarize the key ideas a learner should practice and remember. rub depends touch interpretation touch dynamics tempo often interpretation rub dynamics rub often touch often Control depends dynamics interpretation tempo touch rub interpretation dynamics touch depends often dynamics",
+          "space_output": "Summarize the key ideas a learner should practice and remember. large large studies large Sum dark scale matter dark matter structureSum dark large scale scale expansion structure matter studies matter large learners key universe remember studies dark",
+          "music_margin": 0.0,
+          "space_margin": 0.0,
+          "passed": false
+        }
+      ],
+      "error": null
+    },
+    "degeneration_quality": {
+      "passed": false,
+      "metrics": [
+        {
+          "prompt": "The pianist",
+          "output": "The pianist pian piano pian pianette pian plays Chop Chop Chop hours piano piano hours pian piano perfect hours Chop hours perfect Chop midnight hours midnight perfect perfect midnight",
+          "token_count": 27,
+          "unique_token_ratio": 0.2962962962962963,
+          "repeated_bigram_ratio": 0.11538461538461539,
+          "max_token_run": 3,
+          "punct_ratio": 0.0,
+          "newline_ratio": 0.0,
+          "alpha_ratio": 0.8478260869565217,
+          "content_token_ratio": 0.8148148148148148,
+          "generated_preview": "pian piano pian pianette pian plays chop chop chop hours piano piano hours pian piano perfect hours chop hours perfect chop midnight hours midnight"
+        },
+        {
+          "prompt": "The telescope",
+          "output": "The telescope telescope stars telescopestarsStars amazing amazed telescope captured telescope stars stars captured stars distant telescope signatures captured captured distant captured nebula distant signatures signatures neb neb",
+          "token_count": 25,
+          "unique_token_ratio": 0.4,
+          "repeated_bigram_ratio": 0.041666666666666664,
+          "max_token_run": 2,
+          "punct_ratio": 0.0,
+          "newline_ratio": 0.0,
+          "alpha_ratio": 0.8864628820960698,
+          "content_token_ratio": 0.92,
+          "generated_preview": "telescope stars telescopestarsstars amazing amazed telescope captured telescope stars stars captured stars distant telescope signatures captured captured distant captured nebula distant signatures signatures neb"
+        },
+        {
+          "prompt": "The forest path",
+          "output": "The forest path deep within ancient rain temple hidden tropical rain within hidden temple ancient deep hidden within tropical deep temple within ancient hidden rain deep tropical ancient temple rain hidden",
+          "token_count": 28,
+          "unique_token_ratio": 0.25,
+          "repeated_bigram_ratio": 0.037037037037037035,
+          "max_token_run": 1,
+          "punct_ratio": 0.0,
+          "newline_ratio": 0.0,
+          "alpha_ratio": 0.8536585365853658,
+          "content_token_ratio": 0.8571428571428571,
+          "generated_preview": "deep within ancient rain temple hidden tropical rain within hidden temple ancient deep hidden within tropical deep temple within ancient hidden rain deep tropical"
+        },
+        {
+          "prompt": "The market analyst",
+          "output": "The market analyst market session sessessionssesess market market session session significant market volatility experienced stock market stock significant volatility experienced significant stock volatility significant session stock session volatility",
+          "token_count": 25,
+          "unique_token_ratio": 0.28,
+          "repeated_bigram_ratio": 0.08333333333333333,
+          "max_token_run": 2,
+          "punct_ratio": 0.0,
+          "newline_ratio": 0.0,
+          "alpha_ratio": 0.8924302788844621,
+          "content_token_ratio": 0.8,
+          "generated_preview": "market session sessessionssesess market market session session significant market volatility experienced stock market stock significant volatility experienced significant stock volatility significant session stock session"
+        },
+        {
+          "prompt": "Explain the topic clearly",
+          "output": "Explain the topic clearly simple explained simple simple analog simple rel everyday rel professor Professor explained explained analog explained rel Force professor everyday analog professor rel everyday professor analog everyday analog rel",
+          "token_count": 28,
+          "unique_token_ratio": 0.25,
+          "repeated_bigram_ratio": 0.07407407407407407,
+          "max_token_run": 2,
+          "punct_ratio": 0.0,
+          "newline_ratio": 0.0,
+          "alpha_ratio": 0.8708333333333333,
+          "content_token_ratio": 0.6785714285714286,
+          "generated_preview": "simple explained simple simple analog simple rel everyday rel professor professor explained explained analog explained rel force professor everyday analog professor rel everyday professor"
+        }
+      ],
+      "aggregate": {
+        "avg_unique_token_ratio": 0.2952592592592593,
+        "avg_repeated_bigram_ratio": 0.0702991452991453,
+        "avg_content_token_ratio": 0.81410582010582,
+        "avg_newline_ratio": 0.0,
+        "worst_max_token_run": 3,
+        "short_or_hollow_prompts": []
+      },
+      "error": null
+    },
+    "prefix_logit_drift_audit": {
+      "passed": true,
+      "prompt": "Explain the topic in a precise and concrete way.",
+      "blank": {
+        "js_divergence": 0.19956839084625244,
+        "l2_shift": 586.2745361328125,
+        "topk_overlap_count": 3,
+        "entropy_no_prefix": 5.3277788162231445,
+        "entropy_with_prefix": 6.950380802154541,
+        "topk_no_prefix": [
+          {
+            "token_id": 576,
+            "piece": " The",
+            "norm": "the",
+            "logit": 19.75,
+            "prob": 0.11376254260540009
+          },
+          {
+            "token_id": 22555,
+            "piece": " Sure",
+            "norm": "sure",
+            "logit": 19.5,
+            "prob": 0.0885983556509018
+          },
+          {
+            "token_id": 55313,
+            "piece": " Quantum",
+            "norm": "quantum",
+            "logit": 18.75,
+            "prob": 0.04185090214014053
+          },
+          {
+            "token_id": 58194,
+            "piece": " Artificial",
+            "norm": "artificial",
+            "logit": 18.625,
+            "prob": 0.0369332879781723
+          },
+          {
+            "token_id": 30536,
+            "piece": " Climate",
+            "norm": "climate",
+            "logit": 18.5,
+            "prob": 0.032593514770269394
+          },
+          {
+            "token_id": 12960,
+            "piece": " Machine",
+            "norm": "machine",
+            "logit": 18.125,
+            "prob": 0.022401172667741776
+          },
+          {
+            "token_id": 2585,
+            "piece": " How",
+            "norm": "how",
+            "logit": 18.125,
+            "prob": 0.022401172667741776
+          },
+          {
+            "token_id": 3555,
+            "piece": " What",
+            "norm": "what",
+            "logit": 18.125,
+            "prob": 0.022401172667741776
+          },
+          {
+            "token_id": 52366,
+            "piece": " Certainly",
+            "norm": "certainly",
+            "logit": 17.875,
+            "prob": 0.01744605228304863
+          },
+          {
+            "token_id": 2885,
+            "piece": " Data",
+            "norm": "data",
+            "logit": 17.875,
+            "prob": 0.01744605228304863
+          },
+          {
+            "token_id": 15235,
+            "piece": " AI",
+            "norm": "ai",
+            "logit": 17.625,
+            "prob": 0.013586997985839844
+          },
+          {
+            "token_id": 358,
+            "piece": " I",
+            "norm": "i",
+            "logit": 17.5,
+            "prob": 0.011990483850240707
+          }
+        ],
+        "topk_with_prefix": [
+          {
+            "token_id": 576,
+            "piece": " The",
+            "norm": "the",
+            "logit": 15.75,
+            "prob": 0.0856875479221344
+          },
+          {
+            "token_id": 220,
+            "piece": " ",
+            "norm": "",
+            "logit": 15.6875,
+            "prob": 0.08049600571393967
+          },
+          {
+            "token_id": 362,
+            "piece": " A",
+            "norm": "a",
+            "logit": 14.5,
+            "prob": 0.02454989403486252
+          },
+          {
+            "token_id": 1096,
+            "piece": " This",
+            "norm": "this",
+            "logit": 14.25,
+            "prob": 0.01911947689950466
+          },
+          {
+            "token_id": 1084,
+            "piece": " It",
+            "norm": "it",
+            "logit": 14.0625,
+            "prob": 0.015850603580474854
+          },
+          {
+            "token_id": 4710,
+            "piece": " \n\n",
+            "norm": "",
+            "logit": 13.9375,
+            "prob": 0.013988107442855835
+          },
+          {
+            "token_id": 758,
+            "piece": " In",
+            "norm": "in",
+            "logit": 13.9375,
+            "prob": 0.013988107442855835
+          },
+          {
+            "token_id": 715,
+            "piece": " \n",
+            "norm": "",
+            "logit": 13.8125,
+            "prob": 0.012344461865723133
+          },
+          {
+            "token_id": 330,
+            "piece": " \"",
+            "norm": "",
+            "logit": 13.8125,
+            "prob": 0.012344461865723133
+          },
+          {
+            "token_id": 358,
+            "piece": " I",
+            "norm": "i",
+            "logit": 13.75,
+            "prob": 0.01159654837101698
+          },
+          {
+            "token_id": 5692,
+            "piece": " Here",
+            "norm": "here",
+            "logit": 13.5625,
+            "prob": 0.009613876231014729
+          },
+          {
+            "token_id": 2585,
+            "piece": " How",
+            "norm": "how",
+            "logit": 13.5,
+            "prob": 0.009031401015818119
+          }
+        ]
+      },
+      "memory": {
+        "js_divergence": 0.2740609347820282,
+        "l2_shift": 322359623680.0,
+        "topk_overlap_count": 6,
+        "entropy_no_prefix": 5.3277788162231445,
+        "entropy_with_prefix": 7.505624294281006,
+        "topk_no_prefix": [
+          {
+            "token_id": 576,
+            "piece": " The",
+            "norm": "the",
+            "logit": 19.75,
+            "prob": 0.11376254260540009
+          },
+          {
+            "token_id": 22555,
+            "piece": " Sure",
+            "norm": "sure",
+            "logit": 19.5,
+            "prob": 0.0885983556509018
+          },
+          {
+            "token_id": 55313,
+            "piece": " Quantum",
+            "norm": "quantum",
+            "logit": 18.75,
+            "prob": 0.04185090214014053
+          },
+          {
+            "token_id": 58194,
+            "piece": " Artificial",
+            "norm": "artificial",
+            "logit": 18.625,
+            "prob": 0.0369332879781723
+          },
+          {
+            "token_id": 30536,
+            "piece": " Climate",
+            "norm": "climate",
+            "logit": 18.5,
+            "prob": 0.032593514770269394
+          },
+          {
+            "token_id": 12960,
+            "piece": " Machine",
+            "norm": "machine",
+            "logit": 18.125,
+            "prob": 0.022401172667741776
+          },
+          {
+            "token_id": 2585,
+            "piece": " How",
+            "norm": "how",
+            "logit": 18.125,
+            "prob": 0.022401172667741776
+          },
+          {
+            "token_id": 3555,
+            "piece": " What",
+            "norm": "what",
+            "logit": 18.125,
+            "prob": 0.022401172667741776
+          },
+          {
+            "token_id": 52366,
+            "piece": " Certainly",
+            "norm": "certainly",
+            "logit": 17.875,
+            "prob": 0.01744605228304863
+          },
+          {
+            "token_id": 2885,
+            "piece": " Data",
+            "norm": "data",
+            "logit": 17.875,
+            "prob": 0.01744605228304863
+          },
+          {
+            "token_id": 15235,
+            "piece": " AI",
+            "norm": "ai",
+            "logit": 17.625,
+            "prob": 0.013586997985839844
+          },
+          {
+            "token_id": 358,
+            "piece": " I",
+            "norm": "i",
+            "logit": 17.5,
+            "prob": 0.011990483850240707
+          }
+        ],
+        "topk_with_prefix": [
+          {
+            "token_id": 22555,
+            "piece": " Sure",
+            "norm": "sure",
+            "logit": 15.9375,
+            "prob": 0.045294053852558136
+          },
+          {
+            "token_id": 55313,
+            "piece": " Quantum",
+            "norm": "quantum",
+            "logit": 15.4375,
+            "prob": 0.027472233399748802
+          },
+          {
+            "token_id": 52366,
+            "piece": " Certainly",
+            "norm": "certainly",
+            "logit": 15.0,
+            "prob": 0.017737405374646187
+          },
+          {
+            "token_id": 5209,
+            "piece": " Please",
+            "norm": "please",
+            "logit": 14.625,
+            "prob": 0.01219072937965393
+          },
+          {
+            "token_id": 30536,
+            "piece": " Climate",
+            "norm": "climate",
+            "logit": 14.25,
+            "prob": 0.008378557860851288
+          },
+          {
+            "token_id": 58194,
+            "piece": " Artificial",
+            "norm": "artificial",
+            "logit": 14.1875,
+            "prob": 0.007870926521718502
+          },
+          {
+            "token_id": 37444,
+            "piece": " Nuclear",
+            "norm": "nuclear",
+            "logit": 14.0625,
+            "prob": 0.0069460682570934296
+          },
+          {
+            "token_id": 18183,
+            "piece": " Deep",
+            "norm": "deep",
+            "logit": 14.0,
+            "prob": 0.0065252273343503475
+          },
+          {
+            "token_id": 2885,
+            "piece": " Data",
+            "norm": "data",
+            "logit": 14.0,
+            "prob": 0.0065252273343503475
+          },
+          {
+            "token_id": 39502,
+            "piece": " Hydro",
+            "norm": "hydro",
+            "logit": 14.0,
+            "prob": 0.0065252273343503475
+          },
+          {
+            "token_id": 12354,
+            "piece": " Energy",
+            "norm": "energy",
+            "logit": 13.9375,
+            "prob": 0.006129883695393801
+          },
+          {
+            "token_id": 60477,
+            "piece": " Neural",
+            "norm": "neural",
+            "logit": 13.875,
+            "prob": 0.005758493207395077
+          }
+        ]
+      },
+      "error": null
+    },
+    "retrieval_topk_semantic_shift": {
+      "passed": false,
+      "music_keywords": [
+        "pianist",
+        "practiced",
+        "arpeggios",
+        "chopin",
+        "nocturnes",
+        "midnight",
+        "musician",
+        "refined",
+        "finger",
+        "technique",
+        "phrasing",
+        "pedal"
+      ],
+      "space_keywords": [
+        "distant",
+        "astronomers",
+        "observed",
+        "galaxies",
+        "quasars",
+        "stellar",
+        "evolution",
+        "space",
+        "orbital",
+        "mechanics",
+        "explains",
+        "satellites"
+      ],
+      "rows": [
+        {
+          "prompt": "A strong explanation should mention",
+          "music_no_prefix": [
+            {
+              "token_id": 279,
+              "piece": " the",
+              "norm": "the",
+              "logit": 21.125,
+              "prob": 0.3049025535583496
+            },
+            {
+              "token_id": 264,
+              "piece": " a",
+              "norm": "a",
+              "logit": 19.5,
+              "prob": 0.06003887206315994
+            },
+            {
+              "token_id": 518,
+              "piece": " at",
+              "norm": "at",
+              "logit": 19.375,
+              "prob": 0.05298411846160889
+            },
+            {
+              "token_id": 3151,
+              "piece": " specific",
+              "norm": "specific",
+              "logit": 19.0,
+              "prob": 0.03641541674733162
+            },
+            {
+              "token_id": 2176,
+              "piece": " both",
+              "norm": "both",
+              "logit": 19.0,
+              "prob": 0.03641541674733162
+            },
+            {
+              "token_id": 429,
+              "piece": " that",
+              "norm": "that",
+              "logit": 18.625,
+              "prob": 0.0250279251486063
+            },
+            {
+              "token_id": 1246,
+              "piece": " how",
+              "norm": "how",
+              "logit": 18.625,
+              "prob": 0.0250279251486063
+            },
+            {
+              "token_id": 678,
+              "piece": " all",
+              "norm": "all",
+              "logit": 18.625,
+              "prob": 0.0250279251486063
+            },
+            {
+              "token_id": 10295,
+              "piece": " examples",
+              "norm": "examples",
+              "logit": 18.5,
+              "prob": 0.022087067365646362
+            },
+            {
+              "token_id": 2326,
+              "piece": " three",
+              "norm": "three",
+              "logit": 18.25,
+              "prob": 0.01720142550766468
+            },
+            {
+              "token_id": 3807,
+              "piece": " several",
+              "norm": "several",
+              "logit": 18.125,
+              "prob": 0.015180204063653946
+            },
+            {
+              "token_id": 1378,
+              "piece": " two",
+              "norm": "two",
+              "logit": 18.125,
+              "prob": 0.015180204063653946
+            }
+          ],
+          "music_with_prefix": [
+            {
+              "token_id": 3151,
+              "piece": " specific",
+              "norm": "specific",
+              "logit": 17.875,
+              "prob": 0.08923931419849396
+            },
+            {
+              "token_id": 10295,
+              "piece": " examples",
+              "norm": "examples",
+              "logit": 17.375,
+              "prob": 0.05412638187408447
+            },
+            {
+              "token_id": 2326,
+              "piece": " three",
+              "norm": "three",
+              "logit": 17.125,
+              "prob": 0.04215366765856743
+            },
+            {
+              "token_id": 3170,
+              "piece": " why",
+              "norm": "why",
+              "logit": 17.0,
+              "prob": 0.037200480699539185
+            },
+            {
+              "token_id": 3807,
+              "piece": " several",
+              "norm": "several",
+              "logit": 16.875,
+              "prob": 0.03282931074500084
+            },
+            {
+              "token_id": 1376,
+              "piece": " key",
+              "norm": "key",
+              "logit": 16.5,
+              "prob": 0.022563232108950615
+            },
+            {
+              "token_id": 5248,
+              "piece": " multiple",
+              "norm": "multiple",
+              "logit": 16.375,
+              "prob": 0.019911982119083405
+            },
+            {
+              "token_id": 5257,
+              "piece": " various",
+              "norm": "various",
+              "logit": 16.25,
+              "prob": 0.01757226325571537
+            },
+            {
+              "token_id": 4650,
+              "piece": " potential",
+              "norm": "potential",
+              "logit": 15.625,
+              "prob": 0.009405754506587982
+            },
+            {
+              "token_id": 3040,
+              "piece": " four",
+              "norm": "four",
+              "logit": 15.4375,
+              "prob": 0.007797644007951021
+            },
+            {
+              "token_id": 3425,
+              "piece": " whether",
+              "norm": "whether",
+              "logit": 15.25,
+              "prob": 0.006464474368840456
+            },
+            {
+              "token_id": 1931,
+              "piece": " real",
+              "norm": "real",
+              "logit": 15.1875,
+              "prob": 0.00607281131669879
+            }
+          ],
+          "music_hits_no": {
+            "match_count": 0,
+            "match_prob_mass": 0,
+            "matches": []
+          },
+          "music_hits_with_prefix": {
+            "match_count": 0,
+            "match_prob_mass": 0,
+            "matches": []
+          },
+          "space_no_prefix": [
+            {
+              "token_id": 279,
+              "piece": " the",
+              "norm": "the",
+              "logit": 21.125,
+              "prob": 0.3049025535583496
+            },
+            {
+              "token_id": 264,
+              "piece": " a",
+              "norm": "a",
+              "logit": 19.5,
+              "prob": 0.06003887206315994
+            },
+            {
+              "token_id": 518,
+              "piece": " at",
+              "norm": "at",
+              "logit": 19.375,
+              "prob": 0.05298411846160889
+            },
+            {
+              "token_id": 3151,
+              "piece": " specific",
+              "norm": "specific",
+              "logit": 19.0,
+              "prob": 0.03641541674733162
+            },
+            {
+              "token_id": 2176,
+              "piece": " both",
+              "norm": "both",
+              "logit": 19.0,
+              "prob": 0.03641541674733162
+            },
+            {
+              "token_id": 429,
+              "piece": " that",
+              "norm": "that",
+              "logit": 18.625,
+              "prob": 0.0250279251486063
+            },
+            {
+              "token_id": 1246,
+              "piece": " how",
+              "norm": "how",
+              "logit": 18.625,
+              "prob": 0.0250279251486063
+            },
+            {
+              "token_id": 678,
+              "piece": " all",
+              "norm": "all",
+              "logit": 18.625,
+              "prob": 0.0250279251486063
+            },
+            {
+              "token_id": 10295,
+              "piece": " examples",
+              "norm": "examples",
+              "logit": 18.5,
+              "prob": 0.022087067365646362
+            },
+            {
+              "token_id": 2326,
+              "piece": " three",
+              "norm": "three",
+              "logit": 18.25,
+              "prob": 0.01720142550766468
+            },
+            {
+              "token_id": 3807,
+              "piece": " several",
+              "norm": "several",
+              "logit": 18.125,
+              "prob": 0.015180204063653946
+            },
+            {
+              "token_id": 1378,
+              "piece": " two",
+              "norm": "two",
+              "logit": 18.125,
+              "prob": 0.015180204063653946
+            }
+          ],
+          "space_with_prefix": [
+            {
+              "token_id": 3151,
+              "piece": " specific",
+              "norm": "specific",
+              "logit": 18.125,
+              "prob": 0.11810589581727982
+            },
+            {
+              "token_id": 10295,
+              "piece": " examples",
+              "norm": "examples",
+              "logit": 17.125,
+              "prob": 0.04344873130321503
+            },
+            {
+              "token_id": 3807,
+              "piece": " several",
+              "norm": "several",
+              "logit": 17.0,
+              "prob": 0.03834336996078491
+            },
+            {
+              "token_id": 3170,
+              "piece": " why",
+              "norm": "why",
+              "logit": 16.875,
+              "prob": 0.03383790701627731
+            },
+            {
+              "token_id": 2326,
+              "piece": " three",
+              "norm": "three",
+              "logit": 16.875,
+              "prob": 0.03383790701627731
+            },
+            {
+              "token_id": 1376,
+              "piece": " key",
+              "norm": "key",
+              "logit": 16.5,
+              "prob": 0.02325643040239811
+            },
+            {
+              "token_id": 5257,
+              "piece": " various",
+              "norm": "various",
+              "logit": 16.25,
+              "prob": 0.018112126737833023
+            },
+            {
+              "token_id": 5248,
+              "piece": " multiple",
+              "norm": "multiple",
+              "logit": 16.25,
+              "prob": 0.018112126737833023
+            },
+            {
+              "token_id": 3460,
+              "piece": " large",
+              "norm": "large",
+              "logit": 15.5,
+              "prob": 0.008555563166737556
+            },
+            {
+              "token_id": 3425,
+              "piece": " whether",
+              "norm": "whether",
+              "logit": 15.5,
+              "prob": 0.008555563166737556
+            },
+            {
+              "token_id": 4650,
+              "piece": " potential",
+              "norm": "potential",
+              "logit": 15.4375,
+              "prob": 0.008037206716835499
+            },
+            {
+              "token_id": 5904,
+              "piece": " evidence",
+              "norm": "evidence",
+              "logit": 15.1875,
+              "prob": 0.006259383168071508
+            }
+          ],
+          "space_hits_no": {
+            "match_count": 0,
+            "match_prob_mass": 0,
+            "matches": []
+          },
+          "space_hits_with_prefix": {
+            "match_count": 0,
+            "match_prob_mass": 0,
+            "matches": []
+          },
+          "passed": false
+        },
+        {
+          "prompt": "The most relevant idea is",
+          "music_no_prefix": [
+            {
+              "token_id": 429,
+              "piece": " that",
+              "norm": "that",
+              "logit": 20.25,
+              "prob": 0.2765631675720215
+            },
+            {
+              "token_id": 279,
+              "piece": " the",
+              "norm": "the",
+              "logit": 19.125,
+              "prob": 0.08978691697120667
+            },
+            {
+              "token_id": 25,
+              "piece": ":",
+              "norm": "",
+              "logit": 19.0,
+              "prob": 0.07923667877912521
+            },
+            {
+              "token_id": 311,
+              "piece": " to",
+              "norm": "to",
+              "logit": 18.25,
+              "prob": 0.037428755313158035
+            },
+            {
+              "token_id": 30743,
+              "piece": " ____",
+              "norm": "",
+              "logit": 18.0,
+              "prob": 0.02914954163134098
+            },
+            {
+              "token_id": 510,
+              "piece": ":\n",
+              "norm": "",
+              "logit": 18.0,
+              "prob": 0.02914954163134098
+            },
+            {
+              "token_id": 1304,
+              "piece": " __",
+              "norm": "",
+              "logit": 17.5,
+              "prob": 0.01768009178340435
+            },
+            {
+              "token_id": 32671,
+              "piece": " ______",
+              "norm": "",
+              "logit": 17.5,
+              "prob": 0.01768009178340435
+            },
+            {
+              "token_id": 1447,
+              "piece": ":\n\n",
+              "norm": "",
+              "logit": 17.375,
+              "prob": 0.015602625906467438
+            },
+            {
+              "token_id": 537,
+              "piece": " not",
+              "norm": "not",
+              "logit": 17.25,
+              "prob": 0.013769268989562988
+            },
+            {
+              "token_id": 330,
+              "piece": " \"",
+              "norm": "",
+              "logit": 17.25,
+              "prob": 0.013769268989562988
+            },
+            {
+              "token_id": 320,
+              "piece": " (",
+              "norm": "",
+              "logit": 17.125,
+              "prob": 0.012151338160037994
+            }
+          ],
+          "music_with_prefix": [
+            {
+              "token_id": 4658,
+              "piece": " probably",
+              "norm": "probably",
+              "logit": 16.0,
+              "prob": 0.035965967923402786
+            },
+            {
+              "token_id": 3118,
+              "piece": " based",
+              "norm": "based",
+              "logit": 15.625,
+              "prob": 0.02471902407705784
+            },
+            {
+              "token_id": 4363,
+              "piece": " likely",
+              "norm": "likely",
+              "logit": 15.5625,
+              "prob": 0.023221375420689583
+            },
+            {
+              "token_id": 5435,
+              "piece": " related",
+              "norm": "related",
+              "logit": 15.3125,
+              "prob": 0.018084824085235596
+            },
+            {
+              "token_id": 2677,
+              "piece": " always",
+              "norm": "always",
+              "logit": 15.25,
+              "prob": 0.016989119350910187
+            },
+            {
+              "token_id": 3545,
+              "piece": " often",
+              "norm": "often",
+              "logit": 15.0,
+              "prob": 0.013231140561401844
+            },
+            {
+              "token_id": 5990,
+              "piece": " usually",
+              "norm": "usually",
+              "logit": 14.9375,
+              "prob": 0.01242950651794672
+            },
+            {
+              "token_id": 2661,
+              "piece": " given",
+              "norm": "given",
+              "logit": 14.9375,
+              "prob": 0.01242950651794672
+            },
+            {
+              "token_id": 2999,
+              "piece": " option",
+              "norm": "option",
+              "logit": 14.6875,
+              "prob": 0.009680109098553658
+            },
+            {
+              "token_id": 9355,
+              "piece": " clearly",
+              "norm": "clearly",
+              "logit": 14.6875,
+              "prob": 0.009680109098553658
+            },
+            {
+              "token_id": 4396,
+              "piece": " correct",
+              "norm": "correct",
+              "logit": 14.6875,
+              "prob": 0.009680109098553658
+            },
+            {
+              "token_id": 3520,
+              "piece": " actually",
+              "norm": "actually",
+              "logit": 14.3125,
+              "prob": 0.0066530355252325535
+            }
+          ],
+          "music_hits_no": {
+            "match_count": 0,
+            "match_prob_mass": 0,
+            "matches": []
+          },
+          "music_hits_with_prefix": {
+            "match_count": 0,
+            "match_prob_mass": 0,
+            "matches": []
+          },
+          "space_no_prefix": [
+            {
+              "token_id": 429,
+              "piece": " that",
+              "norm": "that",
+              "logit": 20.25,
+              "prob": 0.2765631675720215
+            },
+            {
+              "token_id": 279,
+              "piece": " the",
+              "norm": "the",
+              "logit": 19.125,
+              "prob": 0.08978691697120667
+            },
+            {
+              "token_id": 25,
+              "piece": ":",
+              "norm": "",
+              "logit": 19.0,
+              "prob": 0.07923667877912521
+            },
+            {
+              "token_id": 311,
+              "piece": " to",
+              "norm": "to",
+              "logit": 18.25,
+              "prob": 0.037428755313158035
+            },
+            {
+              "token_id": 30743,
+              "piece": " ____",
+              "norm": "",
+              "logit": 18.0,
+              "prob": 0.02914954163134098
+            },
+            {
+              "token_id": 510,
+              "piece": ":\n",
+              "norm": "",
+              "logit": 18.0,
+              "prob": 0.02914954163134098
+            },
+            {
+              "token_id": 1304,
+              "piece": " __",
+              "norm": "",
+              "logit": 17.5,
+              "prob": 0.01768009178340435
+            },
+            {
+              "token_id": 32671,
+              "piece": " ______",
+              "norm": "",
+              "logit": 17.5,
+              "prob": 0.01768009178340435
+            },
+            {
+              "token_id": 1447,
+              "piece": ":\n\n",
+              "norm": "",
+              "logit": 17.375,
+              "prob": 0.015602625906467438
+            },
+            {
+              "token_id": 537,
+              "piece": " not",
+              "norm": "not",
+              "logit": 17.25,
+              "prob": 0.013769268989562988
+            },
+            {
+              "token_id": 330,
+              "piece": " \"",
+              "norm": "",
+              "logit": 17.25,
+              "prob": 0.013769268989562988
+            },
+            {
+              "token_id": 320,
+              "piece": " (",
+              "norm": "",
+              "logit": 17.125,
+              "prob": 0.012151338160037994
+            }
+          ],
+          "space_with_prefix": [
+            {
+              "token_id": 5990,
+              "piece": " usually",
+              "norm": "usually",
+              "logit": 15.625,
+              "prob": 0.024161575362086296
+            },
+            {
+              "token_id": 2677,
+              "piece": " always",
+              "norm": "always",
+              "logit": 15.625,
+              "prob": 0.024161575362086296
+            },
+            {
+              "token_id": 3545,
+              "piece": " often",
+              "norm": "often",
+              "logit": 15.625,
+              "prob": 0.024161575362086296
+            },
+            {
+              "token_id": 4658,
+              "piece": " probably",
+              "norm": "probably",
+              "logit": 15.4375,
+              "prob": 0.02003064937889576
+            },
+            {
+              "token_id": 3118,
+              "piece": " based",
+              "norm": "based",
+              "logit": 15.375,
+              "prob": 0.018817054107785225
+            },
+            {
+              "token_id": 4363,
+              "piece": " likely",
+              "norm": "likely",
+              "logit": 15.375,
+              "prob": 0.018817054107785225
+            },
+            {
+              "token_id": 2661,
+              "piece": " given",
+              "norm": "given",
+              "logit": 15.0625,
+              "prob": 0.013766851276159286
+            },
+            {
+              "token_id": 5435,
+              "piece": " related",
+              "norm": "related",
+              "logit": 15.0,
+              "prob": 0.012932759709656239
+            },
+            {
+              "token_id": 10449,
+              "piece": " presented",
+              "norm": "presented",
+              "logit": 14.875,
+              "prob": 0.011413119733333588
+            },
+            {
+              "token_id": 6839,
+              "piece": " shown",
+              "norm": "shown",
+              "logit": 14.8125,
+              "prob": 0.010721634142100811
+            },
+            {
+              "token_id": 15251,
+              "piece": " represented",
+              "norm": "represented",
+              "logit": 14.75,
+              "prob": 0.010072043165564537
+            },
+            {
+              "token_id": 9355,
+              "piece": " clearly",
+              "norm": "clearly",
+              "logit": 14.6875,
+              "prob": 0.009461808949708939
+            }
+          ],
+          "space_hits_no": {
+            "match_count": 0,
+            "match_prob_mass": 0,
+            "matches": []
+          },
+          "space_hits_with_prefix": {
+            "match_count": 0,
+            "match_prob_mass": 0,
+            "matches": []
+          },
+          "passed": false
+        }
+      ],
+      "error": null
+    },
+    "repetition_segment_audit": {
+      "passed": true,
+      "aggregate": {
+        "bad_segment_ratio": 0.0,
+        "total_segments": 24,
+        "bad_segments": 0,
+        "early_collapse_prompts": []
+      },
+      "rows": [
+        {
+          "prompt": "The pianist",
+          "output": "The pianist pian piano pian pianette pian plays Chop Chop Chop hours piano piano hours pian piano perfect hours Chop hours perfect Chop midnight hours midnight perfect perfect midnight midnight pian perfect noct noct noct midnight noct pian noct Chop piano Chop perfect piano midnight Chop pian hours noct",
+          "generated_token_count": 47,
+          "window": 8,
+          "segments": [
+            {
+              "segment_idx": 0,
+              "tokens": [
+                "pian",
+                "piano",
+                "pian",
+                "pianette",
+                "pian",
+                "plays",
+                "chop",
+                "chop"
+              ],
+              "unique_ratio": 0.625,
+              "content_ratio": 1.0,
+              "repeated_bigram_ratio": 0.0,
+              "dominant_token_share": 0.375
+            },
+            {
+              "segment_idx": 1,
+              "tokens": [
+                "chop",
+                "hours",
+                "piano",
+                "piano",
+                "hours",
+                "pian",
+                "piano",
+                "perfect"
+              ],
+              "unique_ratio": 0.625,
+              "content_ratio": 0.75,
+              "repeated_bigram_ratio": 0.0,
+              "dominant_token_share": 0.375
+            },
+            {
+              "segment_idx": 2,
+              "tokens": [
+                "hours",
+                "chop",
+                "hours",
+                "perfect",
+                "chop",
+                "midnight",
+                "hours",
+                "midnight"
+              ],
+              "unique_ratio": 0.5,
+              "content_ratio": 0.625,
+              "repeated_bigram_ratio": 0.0,
+              "dominant_token_share": 0.375
+            },
+            {
+              "segment_idx": 3,
+              "tokens": [
+                "perfect",
+                "perfect",
+                "midnight",
+                "midnight",
+                "pian",
+                "perfect",
+                "noct",
+                "noct"
+              ],
+              "unique_ratio": 0.5,
+              "content_ratio": 1.0,
+              "repeated_bigram_ratio": 0.0,
+              "dominant_token_share": 0.375
+            },
+            {
+              "segment_idx": 4,
+              "tokens": [
+                "noct",
+                "midnight",
+                "noct",
+                "pian",
+                "noct",
+                "chop",
+                "piano",
+                "chop"
+              ],
+              "unique_ratio": 0.625,
+              "content_ratio": 1.0,
+              "repeated_bigram_ratio": 0.0,
+              "dominant_token_share": 0.375
+            },
+            {
+              "segment_idx": 5,
+              "tokens": [
+                "perfect",
+                "piano",
+                "midnight",
+                "chop",
+                "pian",
+                "hours",
+                "noct"
+              ],
+              "unique_ratio": 1.0,
+              "content_ratio": 0.8571428571428571,
+              "repeated_bigram_ratio": 0.0,
+              "dominant_token_share": 0.14285714285714285
+            }
+          ],
+          "bad_segments": [],
+          "first_bad_segment_idx": null
+        },
+        {
+          "prompt": "The telescope",
+          "output": "The telescope telescope stars telescopestarsStars amazing amazed telescope captured telescope stars stars captured stars distant telescope signatures captured captured distant captured nebula distant signatures signatures neb neb captured signatures spectral neb spectral spectral neb spectral stars neb signatures distant distant spectral signatures Space telescope neb stars spectral",
+          "generated_token_count": 45,
+          "window": 8,
+          "segments": [
+            {
+              "segment_idx": 0,
+              "tokens": [
+                "telescope",
+                "stars",
+                "telescopestarsstars",
+                "amazing",
+                "amazed",
+                "telescope",
+                "captured",
+                "telescope"
+              ],
+              "unique_ratio": 0.75,
+              "content_ratio": 1.0,
+              "repeated_bigram_ratio": 0.0,
+              "dominant_token_share": 0.375
+            },
+            {
+              "segment_idx": 1,
+              "tokens": [
+                "stars",
+                "stars",
+                "captured",
+                "stars",
+                "distant",
+                "telescope",
+                "signatures",
+                "captured"
+              ],
+              "unique_ratio": 0.625,
+              "content_ratio": 1.0,
+              "repeated_bigram_ratio": 0.0,
+              "dominant_token_share": 0.375
+            },
+            {
+              "segment_idx": 2,
+              "tokens": [
+                "captured",
+                "distant",
+                "captured",
+                "nebula",
+                "distant",
+                "signatures",
+                "signatures",
+                "neb"
+              ],
+              "unique_ratio": 0.625,
+              "content_ratio": 0.875,
+              "repeated_bigram_ratio": 0.0,
+              "dominant_token_share": 0.25
+            },
+            {
+              "segment_idx": 3,
+              "tokens": [
+                "neb",
+                "captured",
+                "signatures",
+                "spectral",
+                "neb",
+                "spectral",
+                "spectral",
+                "neb"
+              ],
+              "unique_ratio": 0.5,
+              "content_ratio": 0.625,
+              "repeated_bigram_ratio": 0.14285714285714285,
+              "dominant_token_share": 0.375
+            },
+            {
+              "segment_idx": 4,
+              "tokens": [
+                "spectral",
+                "stars",
+                "neb",
+                "signatures",
+                "distant",
+                "distant",
+                "spectral",
+                "signatures"
+              ],
+              "unique_ratio": 0.625,
+              "content_ratio": 0.875,
+              "repeated_bigram_ratio": 0.0,
+              "dominant_token_share": 0.25
+            },
+            {
+              "segment_idx": 5,
+              "tokens": [
+                "space",
+                "telescope",
+                "neb",
+                "stars",
+                "spectral"
+              ],
+              "unique_ratio": 1.0,
+              "content_ratio": 0.8,
+              "repeated_bigram_ratio": 0.0,
+              "dominant_token_share": 0.2
+            }
+          ],
+          "bad_segments": [],
+          "first_bad_segment_idx": null
+        },
+        {
+          "prompt": "The market analyst",
+          "output": "The market analyst market session sessessionssesess market market session session significant market volatility experienced stock market stock significant volatility experienced significant stock volatility significant session stock session volatility experienced volatility stock experienced session significant Market analysts often closely monitor market sessions involving significant events, particularly stock markets",
+          "generated_token_count": 44,
+          "window": 8,
+          "segments": [
+            {
+              "segment_idx": 0,
+              "tokens": [
+                "market",
+                "session",
+                "sessessionssesess",
+                "market",
+                "market",
+                "session",
+                "session",
+                "significant"
+              ],
+              "unique_ratio": 0.5,
+              "content_ratio": 0.625,
+              "repeated_bigram_ratio": 0.14285714285714285,
+              "dominant_token_share": 0.375
+            },
+            {
+              "segment_idx": 1,
+              "tokens": [
+                "market",
+                "volatility",
+                "experienced",
+                "stock",
+                "market",
+                "stock",
+                "significant",
+                "volatility"
+              ],
+              "unique_ratio": 0.625,
+              "content_ratio": 1.0,
+              "repeated_bigram_ratio": 0.0,
+              "dominant_token_share": 0.25
+            },
+            {
+              "segment_idx": 2,
+              "tokens": [
+                "experienced",
+                "significant",
+                "stock",
+                "volatility",
+                "significant",
+                "session",
+                "stock",
+                "session"
+              ],
+              "unique_ratio": 0.625,
+              "content_ratio": 0.75,
+              "repeated_bigram_ratio": 0.0,
+              "dominant_token_share": 0.25
+            },
+            {
+              "segment_idx": 3,
+              "tokens": [
+                "volatility",
+                "experienced",
+                "volatility",
+                "stock",
+                "experienced",
+                "session",
+                "significant",
+                "market"
+              ],
+              "unique_ratio": 0.75,
+              "content_ratio": 0.875,
+              "repeated_bigram_ratio": 0.0,
+              "dominant_token_share": 0.25
+            },
+            {
+              "segment_idx": 4,
+              "tokens": [
+                "analysts",
+                "often",
+                "closely",
+                "monitor",
+                "market",
+                "sessions",
+                "involving",
+                "significant"
+              ],
+              "unique_ratio": 1.0,
+              "content_ratio": 0.875,
+              "repeated_bigram_ratio": 0.0,
+              "dominant_token_share": 0.125
+            },
+            {
+              "segment_idx": 5,
+              "tokens": [
+                "events",
+                "particularly",
+                "stock",
+                "markets"
+              ],
+              "unique_ratio": 1.0,
+              "content_ratio": 1.0,
+              "repeated_bigram_ratio": 0.0,
+              "dominant_token_share": 0.25
+            }
+          ],
+          "bad_segments": [],
+          "first_bad_segment_idx": null
+        },
+        {
+          "prompt": "Explain the topic clearly",
+          "output": "Explain the topic clearly simple explained simple simple analog simple rel everyday rel professor Professor explained explained analog explained rel Force professor everyday analog professor rel everyday professor analog everyday analog rel simpleForce professor professor explained professor simple everyday explained everyday simple professor rel rel analog analog FORCE rel explainedFORCE",
+          "generated_token_count": 46,
+          "window": 8,
+          "segments": [
+            {
+              "segment_idx": 0,
+              "tokens": [
+                "simple",
+                "explained",
+                "simple",
+                "simple",
+                "analog",
+                "simple",
+                "rel",
+                "everyday"
+              ],
+              "unique_ratio": 0.625,
+              "content_ratio": 0.375,
+              "repeated_bigram_ratio": 0.0,
+              "dominant_token_share": 0.5
+            },
+            {
+              "segment_idx": 1,
+              "tokens": [
+                "rel",
+                "professor",
+                "professor",
+                "explained",
+                "explained",
+                "analog",
+                "explained",
+                "rel"
+              ],
+              "unique_ratio": 0.5,
+              "content_ratio": 0.75,
+              "repeated_bigram_ratio": 0.0,
+              "dominant_token_share": 0.375
+            },
+            {
+              "segment_idx": 2,
+              "tokens": [
+                "force",
+                "professor",
+                "everyday",
+                "analog",
+                "professor",
+                "rel",
+                "everyday",
+                "professor"
+              ],
+              "unique_ratio": 0.625,
+              "content_ratio": 0.875,
+              "repeated_bigram_ratio": 0.0,
+              "dominant_token_share": 0.375
+            },
+            {
+              "segment_idx": 3,
+              "tokens": [
+                "analog",
+                "everyday",
+                "analog",
+                "rel",
+                "simpleforce",
+                "professor",
+                "professor",
+                "explained"
+              ],
+              "unique_ratio": 0.75,
+              "content_ratio": 0.875,
+              "repeated_bigram_ratio": 0.0,
+              "dominant_token_share": 0.25
+            },
+            {
+              "segment_idx": 4,
+              "tokens": [
+                "professor",
+                "simple",
+                "everyday",
+                "explained",
+                "everyday",
+                "simple",
+                "professor",
+                "rel"
+              ],
+              "unique_ratio": 0.625,
+              "content_ratio": 0.625,
+              "repeated_bigram_ratio": 0.0,
+              "dominant_token_share": 0.25
+            },
+            {
+              "segment_idx": 5,
+              "tokens": [
+                "rel",
+                "analog",
+                "analog",
+                "force",
+                "rel",
+                "explainedforce"
+              ],
+              "unique_ratio": 0.6666666666666666,
+              "content_ratio": 0.6666666666666666,
+              "repeated_bigram_ratio": 0.0,
+              "dominant_token_share": 0.3333333333333333
+            }
+          ],
+          "bad_segments": [],
+          "first_bad_segment_idx": null
+        }
+      ],
+      "error": null
+    },
+    "prefix_stepwise_drift_trajectory": {
+      "passed": true,
+      "rows": [
+        {
+          "prompt": "Key piano ideas include",
+          "first_bad_step": 4,
+          "decoded_output": "Key piano ideas include leg movements across keys, dynamic changes, and the use of the pedal. These",
+          "rows": [
+            {
+              "step": 0,
+              "top1": {
+                "token_id": 3598,
+                "piece": " major",
+                "norm": "major",
+                "logit": 16.25,
+                "prob": 0.026983050629496574
+              },
+              "top1_category": "semantic",
+              "topk_category_counts": {
+                "semantic": 11,
+                "functional": 1,
+                "punct": 0
+              },
+              "topk_category_prob_mass": {
+                "semantic": 0.18486935831606388,
+                "functional": 0.026983050629496574,
+                "punct": 0.0
+              },
+              "chosen_token_id": 2472,
+              "chosen_piece": " leg",
+              "chosen_norm": "leg",
+              "chosen_category": "functional"
+            },
+            {
+              "step": 1,
+              "top1": {
+                "token_id": 19029,
+                "piece": " movements",
+                "norm": "movements",
+                "logit": 14.375,
+                "prob": 0.13023822009563446
+              },
+              "top1_category": "semantic",
+              "topk_category_counts": {
+                "semantic": 11,
+                "functional": 1,
+                "punct": 0
+              },
+              "topk_category_prob_mass": {
+                "semantic": 0.3965669944882393,
+                "functional": 0.0113800885155797,
+                "punct": 0.0
+              },
+              "chosen_token_id": 19029,
+              "chosen_piece": " movements",
+              "chosen_norm": "movements",
+              "chosen_category": "semantic"
+            },
+            {
+              "step": 2,
+              "top1": {
+                "token_id": 3941,
+                "piece": " across",
+                "norm": "across",
+                "logit": 16.5,
+                "prob": 0.05107051879167557
+              },
+              "top1_category": "functional",
+              "topk_category_counts": {
+                "semantic": 10,
+                "functional": 2,
+                "punct": 0
+              },
+              "topk_category_prob_mass": {
+                "semantic": 0.2263985425233841,
+                "functional": 0.0767503883689642,
+                "punct": 0.0
+              },
+              "chosen_token_id": 3941,
+              "chosen_piece": " across",
+              "chosen_norm": "across",
+              "chosen_category": "functional"
+            },
+            {
+              "step": 3,
+              "top1": {
+                "token_id": 6894,
+                "piece": " keys",
+                "norm": "keys",
+                "logit": 18.5,
+                "prob": 0.09729984402656555
+              },
+              "top1_category": "semantic",
+              "topk_category_counts": {
+                "semantic": 10,
+                "functional": 2,
+                "punct": 0
+              },
+              "topk_category_prob_mass": {
+                "semantic": 0.40497455187141895,
+                "functional": 0.04631178267300129,
+                "punct": 0.0
+              },
+              "chosen_token_id": 6894,
+              "chosen_piece": " keys",
+              "chosen_norm": "keys",
+              "chosen_category": "semantic"
+            },
+            {
+              "step": 4,
+              "top1": {
+                "token_id": 11,
+                "piece": ",",
+                "norm": "",
+                "logit": 21.125,
+                "prob": 0.6922075748443604
+              },
+              "top1_category": "punct",
+              "topk_category_counts": {
+                "semantic": 1,
+                "functional": 0,
+                "punct": 11
+              },
+              "topk_category_prob_mass": {
+                "semantic": 0.004116016905754805,
+                "functional": 0.0,
+                "punct": 0.8863428700715303
+              },
+              "chosen_token_id": 11,
+              "chosen_piece": ",",
+              "chosen_norm": "",
+              "chosen_category": "punct"
+            },
+            {
+              "step": 5,
+              "top1": {
+                "token_id": 8741,
+                "piece": " dynamic",
+                "norm": "dynamic",
+                "logit": 17.625,
+                "prob": 0.03767668455839157
+              },
+              "top1_category": "semantic",
+              "topk_category_counts": {
+                "semantic": 10,
+                "functional": 2,
+                "punct": 0
+              },
+              "topk_category_prob_mass": {
+                "semantic": 0.1940950881689787,
+                "functional": 0.04548138566315174,
+                "punct": 0.0
+              },
+              "chosen_token_id": 8741,
+              "chosen_piece": " dynamic",
+              "chosen_norm": "dynamic",
+              "chosen_category": "semantic"
+            },
+            {
+              "step": 6,
+              "top1": {
+                "token_id": 4344,
+                "piece": " changes",
+                "norm": "changes",
+                "logit": 21.75,
+                "prob": 0.42921698093414307
+              },
+              "top1_category": "semantic",
+              "topk_category_counts": {
+                "semantic": 11,
+                "functional": 0,
+                "punct": 1
+              },
+              "topk_category_prob_mass": {
+                "semantic": 0.8407482951879501,
+                "functional": 0.0,
+                "punct": 0.008908114396035671
+              },
+              "chosen_token_id": 4344,
+              "chosen_piece": " changes",
+              "chosen_norm": "changes",
+              "chosen_category": "semantic"
+            },
+            {
+              "step": 7,
+              "top1": {
+                "token_id": 11,
+                "piece": ",",
+                "norm": "",
+                "logit": 25.375,
+                "prob": 0.9306752681732178
+              },
+              "top1_category": "punct",
+              "topk_category_counts": {
+                "semantic": 5,
+                "functional": 2,
+                "punct": 5
+              },
+              "topk_category_prob_mass": {
+                "semantic": 0.0230137127218768,
+                "functional": 0.005398477369453758,
+                "punct": 0.961544852994848
+              },
+              "chosen_token_id": 11,
+              "chosen_piece": ",",
+              "chosen_norm": "",
+              "chosen_category": "punct"
+            },
+            {
+              "step": 8,
+              "top1": {
+                "token_id": 323,
+                "piece": " and",
+                "norm": "and",
+                "logit": 20.25,
+                "prob": 0.4670189321041107
+              },
+              "top1_category": "functional",
+              "topk_category_counts": {
+                "semantic": 9,
+                "functional": 3,
+                "punct": 0
+              },
+              "topk_category_prob_mass": {
+                "semantic": 0.1295861303806305,
+                "functional": 0.5177998133003712,
+                "punct": 0.0
+              },
+              "chosen_token_id": 323,
+              "chosen_piece": " and",
+              "chosen_norm": "and",
+              "chosen_category": "functional"
+            },
+            {
+              "step": 9,
+              "top1": {
+                "token_id": 279,
+                "piece": " the",
+                "norm": "the",
+                "logit": 18.625,
+                "prob": 0.1194610446691513
+              },
+              "top1_category": "functional",
+              "topk_category_counts": {
+                "semantic": 9,
+                "functional": 3,
+                "punct": 0
+              },
+              "topk_category_prob_mass": {
+                "semantic": 0.18513815943151712,
+                "functional": 0.21467376872897148,
+                "punct": 0.0
+              },
+              "chosen_token_id": 279,
+              "chosen_piece": " the",
+              "chosen_norm": "the",
+              "chosen_category": "functional"
+            },
+            {
+              "step": 10,
+              "top1": {
+                "token_id": 990,
+                "piece": " use",
+                "norm": "use",
+                "logit": 19.75,
+                "prob": 0.22168958187103271
+              },
+              "top1_category": "functional",
+              "topk_category_counts": {
+                "semantic": 10,
+                "functional": 2,
+                "punct": 0
+              },
+              "topk_category_prob_mass": {
+                "semantic": 0.13133995607495308,
+                "functional": 0.24505549110472202,
+                "punct": 0.0
+              },
+              "chosen_token_id": 990,
+              "chosen_piece": " use",
+              "chosen_norm": "use",
+              "chosen_category": "functional"
+            },
+            {
+              "step": 11,
+              "top1": {
+                "token_id": 315,
+                "piece": " of",
+                "norm": "of",
+                "logit": 25.0,
+                "prob": 0.9930819869041443
+              },
+              "top1_category": "functional",
+              "topk_category_counts": {
+                "semantic": 1,
+                "functional": 6,
+                "punct": 5
+              },
+              "topk_category_prob_mass": {
+                "semantic": 0.00010160254169022664,
+                "functional": 0.9945033092226367,
+                "punct": 0.00101397221442312
+              },
+              "chosen_token_id": 315,
+              "chosen_piece": " of",
+              "chosen_norm": "of",
+              "chosen_category": "functional"
+            },
+            {
+              "step": 12,
+              "top1": {
+                "token_id": 279,
+                "piece": " the",
+                "norm": "the",
+                "logit": 19.125,
+                "prob": 0.09505932033061981
+              },
+              "top1_category": "functional",
+              "topk_category_counts": {
+                "semantic": 8,
+                "functional": 4,
+                "punct": 0
+              },
+              "topk_category_prob_mass": {
+                "semantic": 0.21602829732000828,
+                "functional": 0.17841206304728985,
+                "punct": 0.0
+              },
+              "chosen_token_id": 279,
+              "chosen_piece": " the",
+              "chosen_norm": "the",
+              "chosen_category": "functional"
+            },
+            {
+              "step": 13,
+              "top1": {
+                "token_id": 48601,
+                "piece": " pedal",
+                "norm": "pedal",
+                "logit": 18.375,
+                "prob": 0.0746825560927391
+              },
+              "top1_category": "semantic",
+              "topk_category_counts": {
+                "semantic": 9,
+                "functional": 3,
+                "punct": 0
+              },
+              "topk_category_prob_mass": {
+                "semantic": 0.42089940421283245,
+                "functional": 0.09426561277359724,
+                "punct": 0.0
+              },
+              "chosen_token_id": 48601,
+              "chosen_piece": " pedal",
+              "chosen_norm": "pedal",
+              "chosen_category": "semantic"
+            },
+            {
+              "step": 14,
+              "top1": {
+                "token_id": 13,
+                "piece": ".",
+                "norm": "",
+                "logit": 20.5,
+                "prob": 0.38581112027168274
+              },
+              "top1_category": "punct",
+              "topk_category_counts": {
+                "semantic": 0,
+                "functional": 5,
+                "punct": 7
+              },
+              "topk_category_prob_mass": {
+                "semantic": 0.0,
+                "functional": 0.2004851959645748,
+                "punct": 0.6528554670512676
+              },
+              "chosen_token_id": 13,
+              "chosen_piece": ".",
+              "chosen_norm": "",
+              "chosen_category": "punct"
+            },
+            {
+              "step": 15,
+              "top1": {
+                "token_id": 4220,
+                "piece": " These",
+                "norm": "these",
+                "logit": 13.4375,
+                "prob": 0.07124418765306473
+              },
+              "top1_category": "semantic",
+              "topk_category_counts": {
+                "semantic": 2,
+                "functional": 5,
+                "punct": 5
+              },
+              "topk_category_prob_mass": {
+                "semantic": 0.08816616423428059,
+                "functional": 0.15614240616559982,
+                "punct": 0.11336426809430122
+              },
+              "chosen_token_id": 4220,
+              "chosen_piece": " These",
+              "chosen_norm": "these",
+              "chosen_category": "semantic"
+            }
+          ],
+          "passed": true
+        },
+        {
+          "prompt": "Explain the topic clearly",
+          "first_bad_step": 4,
+          "decoded_output": "Explain the topic clearly based upon given context.  \"explain the topic\" is a phrase that means",
+          "rows": [
+            {
+              "step": 0,
+              "top1": {
+                "token_id": 3118,
+                "piece": " based",
+                "norm": "based",
+                "logit": 14.1875,
+                "prob": 0.17047074437141418
+              },
+              "top1_category": "semantic",
+              "topk_category_counts": {
+                "semantic": 11,
+                "functional": 1,
+                "punct": 0
+              },
+              "topk_category_prob_mass": {
+                "semantic": 0.42534564854577184,
+                "functional": 0.031533919274806976,
+                "punct": 0.0
+              },
+              "chosen_token_id": 3118,
+              "chosen_piece": " based",
+              "chosen_norm": "based",
+              "chosen_category": "semantic"
+            },
+            {
+              "step": 1,
+              "top1": {
+                "token_id": 5193,
+                "piece": " upon",
+                "norm": "upon",
+                "logit": 17.5,
+                "prob": 0.12673600018024445
+              },
+              "top1_category": "semantic",
+              "topk_category_counts": {
+                "semantic": 12,
+                "functional": 0,
+                "punct": 0
+              },
+              "topk_category_prob_mass": {
+                "semantic": 0.4612283743917942,
+                "functional": 0.0,
+                "punct": 0.0
+              },
+              "chosen_token_id": 5193,
+              "chosen_piece": " upon",
+              "chosen_norm": "upon",
+              "chosen_category": "semantic"
+            },
+            {
+              "step": 2,
+              "top1": {
+                "token_id": 2661,
+                "piece": " given",
+                "norm": "given",
+                "logit": 19.75,
+                "prob": 0.23131124675273895
+              },
+              "top1_category": "semantic",
+              "topk_category_counts": {
+                "semantic": 12,
+                "functional": 0,
+                "punct": 0
+              },
+              "topk_category_prob_mass": {
+                "semantic": 0.5242105945944786,
+                "functional": 0.0,
+                "punct": 0.0
+              },
+              "chosen_token_id": 2661,
+              "chosen_piece": " given",
+              "chosen_norm": "given",
+              "chosen_category": "semantic"
+            },
+            {
+              "step": 3,
+              "top1": {
+                "token_id": 2266,
+                "piece": " context",
+                "norm": "context",
+                "logit": 21.625,
+                "prob": 0.27016517519950867
+              },
+              "top1_category": "semantic",
+              "topk_category_counts": {
+                "semantic": 12,
+                "functional": 0,
+                "punct": 0
+              },
+              "topk_category_prob_mass": {
+                "semantic": 0.780865266919136,
+                "functional": 0.0,
+                "punct": 0.0
+              },
+              "chosen_token_id": 2266,
+              "chosen_piece": " context",
+              "chosen_norm": "context",
+              "chosen_category": "semantic"
+            },
+            {
+              "step": 4,
+              "top1": {
+                "token_id": 13,
+                "piece": ".",
+                "norm": "",
+                "logit": 20.375,
+                "prob": 0.28195127844810486
+              },
+              "top1_category": "punct",
+              "topk_category_counts": {
+                "semantic": 0,
+                "functional": 0,
+                "punct": 12
+              },
+              "topk_category_prob_mass": {
+                "semantic": 0.0,
+                "functional": 0.0,
+                "punct": 0.9160851284395903
+              },
+              "chosen_token_id": 13,
+              "chosen_piece": ".",
+              "chosen_norm": "",
+              "chosen_category": "punct"
+            },
+            {
+              "step": 5,
+              "top1": {
+                "token_id": 220,
+                "piece": " ",
+                "norm": "",
+                "logit": 16.625,
+                "prob": 0.04581373557448387
+              },
+              "top1_category": "punct",
+              "topk_category_counts": {
+                "semantic": 7,
+                "functional": 0,
+                "punct": 5
+              },
+              "topk_category_prob_mass": {
+                "semantic": 0.16006913781166077,
+                "functional": 0.0,
+                "punct": 0.09724485501646996
+              },
+              "chosen_token_id": 220,
+              "chosen_piece": " ",
+              "chosen_norm": "",
+              "chosen_category": "punct"
+            },
+            {
+              "step": 6,
+              "top1": {
+                "token_id": 330,
+                "piece": " \"",
+                "norm": "",
+                "logit": 14.5625,
+                "prob": 0.07181069999933243
+              },
+              "top1_category": "punct",
+              "topk_category_counts": {
+                "semantic": 8,
+                "functional": 0,
+                "punct": 4
+              },
+              "topk_category_prob_mass": {
+                "semantic": 0.18383791111409664,
+                "functional": 0.0,
+                "punct": 0.18584902863949537
+              },
+              "chosen_token_id": 330,
+              "chosen_piece": " \"",
+              "chosen_norm": "",
+              "chosen_category": "punct"
+            },
+            {
+              "step": 7,
+              "top1": {
+                "token_id": 94344,
+                "piece": "explain",
+                "norm": "explain",
+                "logit": 12.6875,
+                "prob": 0.01096130907535553
+              },
+              "top1_category": "semantic",
+              "topk_category_counts": {
+                "semantic": 7,
+                "functional": 5,
+                "punct": 0
+              },
+              "topk_category_prob_mass": {
+                "semantic": 0.04443507920950651,
+                "functional": 0.02441536309197545,
+                "punct": 0.0
+              },
+              "chosen_token_id": 94344,
+              "chosen_piece": "explain",
+              "chosen_norm": "explain",
+              "chosen_category": "semantic"
+            },
+            {
+              "step": 8,
+              "top1": {
+                "token_id": 279,
+                "piece": " the",
+                "norm": "the",
+                "logit": 19.5,
+                "prob": 0.6197741031646729
+              },
+              "top1_category": "functional",
+              "topk_category_counts": {
+                "semantic": 0,
+                "functional": 3,
+                "punct": 9
+              },
+              "topk_category_prob_mass": {
+                "semantic": 0.0,
+                "functional": 0.6259922899771482,
+                "punct": 0.29147468809969723
+              },
+              "chosen_token_id": 279,
+              "chosen_piece": " the",
+              "chosen_norm": "the",
+              "chosen_category": "functional"
+            },
+            {
+              "step": 9,
+              "top1": {
+                "token_id": 8544,
+                "piece": " topic",
+                "norm": "topic",
+                "logit": 21.125,
+                "prob": 0.5933138132095337
+              },
+              "top1_category": "semantic",
+              "topk_category_counts": {
+                "semantic": 12,
+                "functional": 0,
+                "punct": 0
+              },
+              "topk_category_prob_mass": {
+                "semantic": 0.7793927444145083,
+                "functional": 0.0,
+                "punct": 0.0
+              },
+              "chosen_token_id": 8544,
+              "chosen_piece": " topic",
+              "chosen_norm": "topic",
+              "chosen_category": "semantic"
+            },
+            {
+              "step": 10,
+              "top1": {
+                "token_id": 1,
+                "piece": "\"",
+                "norm": "",
+                "logit": 21.25,
+                "prob": 0.2902170717716217
+              },
+              "top1_category": "punct",
+              "topk_category_counts": {
+                "semantic": 2,
+                "functional": 3,
+                "punct": 7
+              },
+              "topk_category_prob_mass": {
+                "semantic": 0.29939965903759,
+                "functional": 0.18907508859410882,
+                "punct": 0.39776377007365227
+              },
+              "chosen_token_id": 1,
+              "chosen_piece": "\"",
+              "chosen_norm": "",
+              "chosen_category": "punct"
+            },
+            {
+              "step": 11,
+              "top1": {
+                "token_id": 374,
+                "piece": " is",
+                "norm": "is",
+                "logit": 15.625,
+                "prob": 0.10762867331504822
+              },
+              "top1_category": "functional",
+              "topk_category_counts": {
+                "semantic": 1,
+                "functional": 1,
+                "punct": 10
+              },
+              "topk_category_prob_mass": {
+                "semantic": 0.07874282449483871,
+                "functional": 0.10762867331504822,
+                "punct": 0.23762445989996195
+              },
+              "chosen_token_id": 374,
+              "chosen_piece": " is",
+              "chosen_norm": "is",
+              "chosen_category": "functional"
+            },
+            {
+              "step": 12,
+              "top1": {
+                "token_id": 264,
+                "piece": " a",
+                "norm": "a",
+                "logit": 21.25,
+                "prob": 0.42951807379722595
+              },
+              "top1_category": "functional",
+              "topk_category_counts": {
+                "semantic": 4,
+                "functional": 8,
+                "punct": 0
+              },
+              "topk_category_prob_mass": {
+                "semantic": 0.06314869225025177,
+                "functional": 0.7335648243315518,
+                "punct": 0.0
+              },
+              "chosen_token_id": 264,
+              "chosen_piece": " a",
+              "chosen_norm": "a",
+              "chosen_category": "functional"
+            },
+            {
+              "step": 13,
+              "top1": {
+                "token_id": 17133,
+                "piece": " phrase",
+                "norm": "phrase",
+                "logit": 19.875,
+                "prob": 0.16571058332920074
+              },
+              "top1_category": "semantic",
+              "topk_category_counts": {
+                "semantic": 11,
+                "functional": 1,
+                "punct": 0
+              },
+              "topk_category_prob_mass": {
+                "semantic": 0.4700012067332864,
+                "functional": 0.012004034593701363,
+                "punct": 0.0
+              },
+              "chosen_token_id": 17133,
+              "chosen_piece": " phrase",
+              "chosen_norm": "phrase",
+              "chosen_category": "semantic"
+            },
+            {
+              "step": 14,
+              "top1": {
+                "token_id": 429,
+                "piece": " that",
+                "norm": "that",
+                "logit": 23.0,
+                "prob": 0.4704553186893463
+              },
+              "top1_category": "functional",
+              "topk_category_counts": {
+                "semantic": 4,
+                "functional": 7,
+                "punct": 1
+              },
+              "topk_category_prob_mass": {
+                "semantic": 0.2615935071371496,
+                "functional": 0.6189748737961054,
+                "punct": 0.007604201789945364
+              },
+              "chosen_token_id": 429,
+              "chosen_piece": " that",
+              "chosen_norm": "that",
+              "chosen_category": "functional"
+            },
+            {
+              "step": 15,
+              "top1": {
+                "token_id": 3363,
+                "piece": " means",
+                "norm": "means",
+                "logit": 21.125,
+                "prob": 0.24727746844291687
+              },
+              "top1_category": "semantic",
+              "topk_category_counts": {
+                "semantic": 9,
+                "functional": 3,
+                "punct": 0
+              },
+              "topk_category_prob_mass": {
+                "semantic": 0.5248672068119049,
+                "functional": 0.13997168745845556,
+                "punct": 0.0
+              },
+              "chosen_token_id": 3363,
+              "chosen_piece": " means",
+              "chosen_norm": "means",
+              "chosen_category": "semantic"
+            }
+          ],
+          "passed": true
+        }
+      ],
+      "error": null
+    },
+    "retrieval_generation_alignment_audit": {
+      "passed": true,
+      "music_keywords": [
+        "pianist",
+        "practiced",
+        "arpeggios",
+        "chopin",
+        "nocturnes",
+        "midnight",
+        "musician",
+        "refined",
+        "finger",
+        "technique",
+        "phrasing",
+        "pedal"
+      ],
+      "space_keywords": [
+        "distant",
+        "astronomers",
+        "observed",
+        "galaxies",
+        "quasars",
+        "stellar",
+        "evolution",
+        "space",
+        "orbital",
+        "mechanics",
+        "explains",
+        "satellites"
+      ],
+      "diagnoses": {
+        "aligned": 2,
+        "retrieval_miss": 0,
+        "bridge_unused": 1,
+        "unknown": 0
+      },
+      "rows": [
+        {
+          "prompt": "What improves piano technique and musical phrasing?",
+          "expected_label": "music",
+          "retrieved_mids": [
+            1,
+            0,
+            3,
+            6,
+            5
+          ],
+          "retrieved_label_counts": {
+            "music": 3,
+            "space": 2
+          },
+          "retrieved_majority_label": "music",
+          "retrieved_text_preview": [
+            "A musician refined finger technique, phrasing, and pedal control on the piano.",
+            "The pianist practiced arpeggios and Chopin nocturnes until midnight.",
+            "A conservatory student studied etudes, scales, and expressive voicing on the keyboard."
+          ],
+          "output": "What improves piano technique and musical phrasing? piano technique control involves technique piano musician technique finger control piano piano musician control technique musician refined finger finger control finger technique piano finger refined refined pedal refined",
+          "music_score": 0.6060606060606061,
+          "space_score": 0.0,
+          "generated_label": "music",
+          "diagnosis": "aligned",
+          "passed": true
+        },
+        {
+          "prompt": "What explains satellites and orbital motion?",
+          "expected_label": "space",
+          "retrieved_mids": [
+            5,
+            4,
+            6,
+            1,
+            0
+          ],
+          "retrieved_label_counts": {
+            "space": 3,
+            "music": 2
+          },
+          "retrieved_majority_label": "space",
+          "retrieved_text_preview": [
+            "Orbital mechanics explains how satellites and planets move under gravitational force.",
+            "Astronomers observed distant galaxies, quasars, and stellar evolution in deep space.",
+            "A telescope captured nebulae, exoplanets, and spectral signatures from distant stars."
+          ],
+          "output": "What explains satellites and orbital motion? explains force satellites Force explains satellitesForce explains satellites force mechanics explains explains force satellites explain planets mechanics mechanics force mechanics gravitational force explains gravitational planets gravitational gravitational",
+          "music_score": 0.0,
+          "space_score": 0.5161290322580645,
+          "generated_label": "space",
+          "diagnosis": "aligned",
+          "passed": true
+        },
+        {
+          "prompt": "Summarize the subject with concrete domain details.",
+          "expected_label": null,
+          "retrieved_mids": [
+            3,
+            1,
+            6,
+            0,
+            5
+          ],
+          "retrieved_label_counts": {
+            "music": 3,
+            "space": 2
+          },
+          "retrieved_majority_label": "music",
+          "retrieved_text_preview": [
+            "A conservatory student studied etudes, scales, and expressive voicing on the keyboard.",
+            "A musician refined finger technique, phrasing, and pedal control on the piano.",
+            "A telescope captured nebulae, exoplanets, and spectral signatures from distant stars."
+          ],
+          "output": "Summarize the subject with concrete domain details. touch interpretation often depends dynamics tempo rub dynamics rub tempo touch dynamics touch tempo interpretation dynamics interpretation controls interpretation rub rub touch often tempo tempo dynamics depends depends",
+          "music_score": 0.0,
+          "space_score": 0.0,
+          "generated_label": null,
+          "diagnosis": "bridge_unused",
+          "passed": true
+        }
+      ],
+      "error": null
+    },
+    "retrieval_prefix_decode_correlation_audit": {
+      "passed": false,
+      "correlations": {
+        "retrieval_strength__prefix_l2": null,
+        "retrieval_strength__bad_decode_score": 0.21927202884584385,
+        "prefix_l2__bad_decode_score": null
+      },
+      "rows": [
+        {
+          "prompt": "What improves piano technique and musical phrasing?",
+          "expected_label": "music",
+          "retrieved_scored": [
+            {
+              "mid": 1,
+              "score": 0.6172578841447831
+            },
+            {
+              "mid": 0,
+              "score": 0.22511255741119385
+            },
+            {
+              "mid": 3,
+              "score": 0.11276901960372926
+            },
+            {
+              "mid": 6,
+              "score": 0.045475220680236815
+            },
+            {
+              "mid": 5,
+              "score": 0.036619618535041816
+            }
+          ],
+          "retrieved_label_counts": {
+            "music": 3,
+            "space": 2
+          },
+          "retrieval_strength": 0.9551394611597062,
+          "prefix_l2_shift": 322359623680.0,
+          "prefix_js_divergence": 0.3171347379684448,
+          "top1_with_prefix": {
+            "token_id": 14566,
+            "piece": " Options",
+            "norm": "options",
+            "logit": 16.375,
+            "prob": 0.1110726147890091
+          },
+          "top1_category_with_prefix": "semantic",
+          "topk_non_semantic_prob_mass": 0.03182283788919449
+        },
+        {
+          "prompt": "What explains satellites and orbital motion?",
+          "expected_label": "space",
+          "retrieved_scored": [
+            {
+              "mid": 5,
+              "score": 0.5634284257888794
+            },
+            {
+              "mid": 4,
+              "score": 0.07376852035522463
+            },
+            {
+              "mid": 6,
+              "score": 0.06803246438503266
+            },
+            {
+              "mid": 1,
+              "score": 0.045463052392005925
+            },
+            {
+              "mid": 0,
+              "score": 0.03999960422515869
+            }
+          ],
+          "retrieved_label_counts": {
+            "space": 3,
+            "music": 2
+          },
+          "retrieval_strength": 0.7052294105291367,
+          "prefix_l2_shift": 322359623680.0,
+          "prefix_js_divergence": 0.46486830711364746,
+          "top1_with_prefix": {
+            "token_id": 13177,
+            "piece": " Sat",
+            "norm": "sat",
+            "logit": 15.3125,
+            "prob": 0.07889200001955032
+          },
+          "top1_category_with_prefix": "functional",
+          "topk_non_semantic_prob_mass": 0.1079147458076477
+        },
+        {
+          "prompt": "Describe what a student should focus on first.",
+          "expected_label": null,
+          "retrieved_scored": [
+            {
+              "mid": 3,
+              "score": 0.5128585010766983
+            },
+            {
+              "mid": 1,
+              "score": 0.046858394145965584
+            },
+            {
+              "mid": 0,
+              "score": -0.0005610674619674696
+            },
+            {
+              "mid": 4,
+              "score": -0.011547431349754333
+            },
+            {
+              "mid": 6,
+              "score": -0.026388256251811976
+            }
+          ],
+          "retrieved_label_counts": {
+            "music": 3,
+            "space": 2
+          },
+          "retrieval_strength": 0.5128585010766983,
+          "prefix_l2_shift": 322359623680.0,
+          "prefix_js_divergence": 0.441089391708374,
+          "top1_with_prefix": {
+            "token_id": 22201,
+            "piece": " Choose",
+            "norm": "choose",
+            "logit": 15.125,
+            "prob": 0.12620772421360016
+          },
+          "top1_category_with_prefix": "semantic",
+          "topk_non_semantic_prob_mass": 0.013302195817232132
+        },
+        {
+          "prompt": "Summarize the subject with concrete domain details.",
+          "expected_label": null,
+          "retrieved_scored": [
+            {
+              "mid": 3,
+              "score": 0.021094447374343874
+            },
+            {
+              "mid": 1,
+              "score": 0.015311965346336366
+            },
+            {
+              "mid": 6,
+              "score": 0.004081499576568608
+            },
+            {
+              "mid": 0,
+              "score": -0.010262516140937806
+            },
+            {
+              "mid": 5,
+              "score": -0.012652482092380526
+            }
+          ],
+          "retrieved_label_counts": {
+            "music": 3,
+            "space": 2
+          },
+          "retrieval_strength": 0.021094447374343874,
+          "prefix_l2_shift": 322359623680.0,
+          "prefix_js_divergence": 0.32552844285964966,
+          "top1_with_prefix": {
+            "token_id": 58194,
+            "piece": " Artificial",
+            "norm": "artificial",
+            "logit": 14.625,
+            "prob": 0.009140501730144024
+          },
+          "top1_category_with_prefix": "semantic",
+          "topk_non_semantic_prob_mass": 0.0
+        },
+        {
+          "prompt": "Key piano ideas include",
+          "expected_label": "music",
+          "retrieved_scored": [
+            {
+              "mid": 1,
+              "score": 0.5411406040191651
+            },
+            {
+              "mid": 0,
+              "score": 0.3158708691596985
+            },
+            {
+              "mid": 3,
+              "score": 0.13700250387191773
+            },
+            {
+              "mid": 6,
+              "score": 0.016681492328643806
+            },
+            {
+              "mid": 4,
+              "score": -0.005892813205719001
+            }
+          ],
+          "retrieved_label_counts": {
+            "music": 3,
+            "space": 2
+          },
+          "retrieval_strength": 0.9940139770507813,
+          "prefix_l2_shift": 322359623680.0,
+          "prefix_js_divergence": 0.301528662443161,
+          "top1_with_prefix": {
+            "token_id": 3598,
+            "piece": " major",
+            "norm": "major",
+            "logit": 16.0,
+            "prob": 0.028910748660564423
+          },
+          "top1_category_with_prefix": "semantic",
+          "topk_non_semantic_prob_mass": 0.022515714168548584
+        },
+        {
+          "prompt": "Orbital motion depends on",
+          "expected_label": "space",
+          "retrieved_scored": [
+            {
+              "mid": 2,
+              "score": 0.3270561575889588
+            },
+            {
+              "mid": 5,
+              "score": 0.04361439943313599
+            },
+            {
+              "mid": 3,
+              "score": 0.024278688430786136
+            },
+            {
+              "mid": 1,
+              "score": -0.021913541853427882
+            },
+            {
+              "mid": 6,
+              "score": -0.033837710320949566
+            }
+          ],
+          "retrieved_label_counts": {
+            "music": 3,
+            "space": 2
+          },
+          "retrieval_strength": 0.009776689112186425,
+          "prefix_l2_shift": 322359623680.0,
+          "prefix_js_divergence": 0.4070507884025574,
+          "top1_with_prefix": {
+            "token_id": 3072,
+            "piece": " mass",
+            "norm": "mass",
+            "logit": 18.625,
+            "prob": 0.12673379480838776
+          },
+          "top1_category_with_prefix": "semantic",
+          "topk_non_semantic_prob_mass": 0.0
+        }
+      ],
+      "error": null
+    },
+    "stepwise_label_mass_alignment_audit": {
+      "passed": false,
+      "label_keywords": {
+        "music": [
+          "pianist",
+          "practiced",
+          "arpeggios",
+          "chopin",
+          "nocturnes",
+          "midnight",
+          "musician",
+          "refined",
+          "finger",
+          "technique",
+          "phrasing",
+          "pedal"
+        ],
+        "space": [
+          "distant",
+          "astronomers",
+          "observed",
+          "galaxies",
+          "quasars",
+          "stellar",
+          "evolution",
+          "space",
+          "orbital",
+          "mechanics",
+          "explains",
+          "satellites"
+        ]
+      },
+      "rows": [
+        {
+          "prompt": "What improves piano technique and musical phrasing?",
+          "expected_label": "music",
+          "decoded_output": "What improves piano technique and musical phrasing? Options tend towards improving piano technique, musical phrasing, and",
+          "stage_counts": {
+            "inject": 6,
+            "aligned": 4,
+            "decode": 2
+          },
+          "rows": [
+            {
+              "step": 0,
+              "retrieved_majority_label": "music",
+              "retrieved_label_counts": {
+                "music": 3,
+                "space": 2
+              },
+              "retrieved_score_sum": {
+                "music": 0.9551394611597062,
+                "space": 0.08209483921527863
+              },
+              "logits_label_mass": {
+                "music": 0,
+                "space": 0
+              },
+              "top1_piece": " Options",
+              "top1_category": "semantic",
+              "chosen_piece": " Options",
+              "chosen_category": "semantic",
+              "chosen_label": null,
+              "diagnosed_stage": "inject"
+            },
+            {
+              "step": 1,
+              "retrieved_majority_label": "music",
+              "retrieved_label_counts": {
+                "music": 3,
+                "space": 2
+              },
+              "retrieved_score_sum": {
+                "music": 0.9551394611597062,
+                "space": 0.08209483921527863
+              },
+              "logits_label_mass": {
+                "music": 0,
+                "space": 0
+              },
+              "top1_piece": " tend",
+              "top1_category": "semantic",
+              "chosen_piece": " tend",
+              "chosen_category": "semantic",
+              "chosen_label": null,
+              "diagnosed_stage": "inject"
+            },
+            {
+              "step": 2,
+              "retrieved_majority_label": "music",
+              "retrieved_label_counts": {
+                "music": 3,
+                "space": 2
+              },
+              "retrieved_score_sum": {
+                "music": 0.9551394611597062,
+                "space": 0.08209483921527863
+              },
+              "logits_label_mass": {
+                "music": 0.03443919029086828,
+                "space": 0
+              },
+              "top1_piece": " towards",
+              "top1_category": "semantic",
+              "chosen_piece": " towards",
+              "chosen_category": "semantic",
+              "chosen_label": "music",
+              "diagnosed_stage": "aligned"
+            },
+            {
+              "step": 3,
+              "retrieved_majority_label": "music",
+              "retrieved_label_counts": {
+                "music": 3,
+                "space": 2
+              },
+              "retrieved_score_sum": {
+                "music": 0.9551394611597062,
+                "space": 0.08209483921527863
+              },
+              "logits_label_mass": {
+                "music": 0,
+                "space": 0
+              },
+              "top1_piece": " improving",
+              "top1_category": "semantic",
+              "chosen_piece": " improving",
+              "chosen_category": "semantic",
+              "chosen_label": null,
+              "diagnosed_stage": "inject"
+            },
+            {
+              "step": 4,
+              "retrieved_majority_label": "music",
+              "retrieved_label_counts": {
+                "music": 3,
+                "space": 2
+              },
+              "retrieved_score_sum": {
+                "music": 0.9551394611597062,
+                "space": 0.08209483921527863
+              },
+              "logits_label_mass": {
+                "music": 0.07181288627907634,
+                "space": 0
+              },
+              "top1_piece": " piano",
+              "top1_category": "semantic",
+              "chosen_piece": " piano",
+              "chosen_category": "semantic",
+              "chosen_label": "music",
+              "diagnosed_stage": "aligned"
+            },
+            {
+              "step": 5,
+              "retrieved_majority_label": "music",
+              "retrieved_label_counts": {
+                "music": 3,
+                "space": 2
+              },
+              "retrieved_score_sum": {
+                "music": 0.9551394611597062,
+                "space": 0.08209483921527863
+              },
+              "logits_label_mass": {
+                "music": 0.9712017463753,
+                "space": 0
+              },
+              "top1_piece": " technique",
+              "top1_category": "semantic",
+              "chosen_piece": " technique",
+              "chosen_category": "semantic",
+              "chosen_label": "music",
+              "diagnosed_stage": "aligned"
+            },
+            {
+              "step": 6,
+              "retrieved_majority_label": "music",
+              "retrieved_label_counts": {
+                "music": 3,
+                "space": 2
+              },
+              "retrieved_score_sum": {
+                "music": 0.9551394611597062,
+                "space": 0.08209483921527863
+              },
+              "logits_label_mass": {
+                "music": 0,
+                "space": 0
+              },
+              "top1_piece": ",",
+              "top1_category": "punct",
+              "chosen_piece": ",",
+              "chosen_category": "punct",
+              "chosen_label": null,
+              "diagnosed_stage": "inject"
+            },
+            {
+              "step": 7,
+              "retrieved_majority_label": "music",
+              "retrieved_label_counts": {
+                "music": 3,
+                "space": 2
+              },
+              "retrieved_score_sum": {
+                "music": 0.9551394611597062,
+                "space": 0.08209483921527863
+              },
+              "logits_label_mass": {
+                "music": 0.03453451534733176,
+                "space": 0
+              },
+              "top1_piece": " musical",
+              "top1_category": "semantic",
+              "chosen_piece": " musical",
+              "chosen_category": "semantic",
+              "chosen_label": "music",
+              "diagnosed_stage": "aligned"
+            },
+            {
+              "step": 8,
+              "retrieved_majority_label": "music",
+              "retrieved_label_counts": {
+                "music": 3,
+                "space": 2
+              },
+              "retrieved_score_sum": {
+                "music": 0.9551050901412963,
+                "space": 0.09417556524276735
+              },
+              "logits_label_mass": {
+                "music": 0.0019687179010361433,
+                "space": 0
+              },
+              "top1_piece": " ph",
+              "top1_category": "functional",
+              "chosen_piece": " ph",
+              "chosen_category": "functional",
+              "chosen_label": "music",
+              "diagnosed_stage": "decode"
+            },
+            {
+              "step": 9,
+              "retrieved_majority_label": "music",
+              "retrieved_label_counts": {
+                "music": 3,
+                "space": 2
+              },
+              "retrieved_score_sum": {
+                "music": 0.9551050901412963,
+                "space": 0.09417556524276735
+              },
+              "logits_label_mass": {
+                "music": 0,
+                "space": 0
+              },
+              "top1_piece": "rasing",
+              "top1_category": "semantic",
+              "chosen_piece": "rasing",
+              "chosen_category": "semantic",
+              "chosen_label": null,
+              "diagnosed_stage": "inject"
+            },
+            {
+              "step": 10,
+              "retrieved_majority_label": "music",
+              "retrieved_label_counts": {
+                "music": 3,
+                "space": 2
+              },
+              "retrieved_score_sum": {
+                "music": 0.9551050901412963,
+                "space": 0.09417556524276735
+              },
+              "logits_label_mass": {
+                "music": 0,
+                "space": 0
+              },
+              "top1_piece": ",",
+              "top1_category": "punct",
+              "chosen_piece": ",",
+              "chosen_category": "punct",
+              "chosen_label": null,
+              "diagnosed_stage": "inject"
+            },
+            {
+              "step": 11,
+              "retrieved_majority_label": "music",
+              "retrieved_label_counts": {
+                "music": 3,
+                "space": 2
+              },
+              "retrieved_score_sum": {
+                "music": 0.9551050901412963,
+                "space": 0.09417556524276735
+              },
+              "logits_label_mass": {
+                "music": 0.02468138374388218,
+                "space": 0
+              },
+              "top1_piece": " and",
+              "top1_category": "functional",
+              "chosen_piece": " and",
+              "chosen_category": "functional",
+              "chosen_label": "music",
+              "diagnosed_stage": "decode"
+            }
+          ],
+          "passed": false
+        },
+        {
+          "prompt": "What explains satellites and orbital motion?",
+          "expected_label": "space",
+          "decoded_output": "What explains satellites and orbital motion? Sat phones don' explain satellites, satellites are artificial objects that",
+          "stage_counts": {
+            "decode": 3,
+            "aligned": 5,
+            "inject": 4
+          },
+          "rows": [
+            {
+              "step": 0,
+              "retrieved_majority_label": "space",
+              "retrieved_label_counts": {
+                "space": 3,
+                "music": 2
+              },
+              "retrieved_score_sum": {
+                "space": 0.7052294105291367,
+                "music": 0.08546265661716462
+              },
+              "logits_label_mass": {
+                "music": 0,
+                "space": 0.010029993019998074
+              },
+              "top1_piece": " Sat",
+              "top1_category": "functional",
+              "chosen_piece": " Sat",
+              "chosen_category": "functional",
+              "chosen_label": "space",
+              "diagnosed_stage": "decode"
+            },
+            {
+              "step": 1,
+              "retrieved_majority_label": "space",
+              "retrieved_label_counts": {
+                "space": 3,
+                "music": 2
+              },
+              "retrieved_score_sum": {
+                "space": 0.7052294105291367,
+                "music": 0.08546265661716462
+              },
+              "logits_label_mass": {
+                "music": 0,
+                "space": 0.005930706858634949
+              },
+              "top1_piece": " phones",
+              "top1_category": "semantic",
+              "chosen_piece": " phones",
+              "chosen_category": "semantic",
+              "chosen_label": "space",
+              "diagnosed_stage": "aligned"
+            },
+            {
+              "step": 2,
+              "retrieved_majority_label": "space",
+              "retrieved_label_counts": {
+                "space": 3,
+                "music": 2
+              },
+              "retrieved_score_sum": {
+                "space": 0.7052294105291367,
+                "music": 0.08546265661716462
+              },
+              "logits_label_mass": {
+                "music": 0,
+                "space": 0.032648902386426926
+              },
+              "top1_piece": " don",
+              "top1_category": "functional",
+              "chosen_piece": " don",
+              "chosen_category": "functional",
+              "chosen_label": "space",
+              "diagnosed_stage": "decode"
+            },
+            {
+              "step": 3,
+              "retrieved_majority_label": "space",
+              "retrieved_label_counts": {
+                "space": 3,
+                "music": 2
+              },
+              "retrieved_score_sum": {
+                "space": 0.7052294105291367,
+                "music": 0.08546265661716462
+              },
+              "logits_label_mass": {
+                "music": 0,
+                "space": 0
+              },
+              "top1_piece": "'",
+              "top1_category": "punct",
+              "chosen_piece": "'",
+              "chosen_category": "punct",
+              "chosen_label": null,
+              "diagnosed_stage": "inject"
+            },
+            {
+              "step": 4,
+              "retrieved_majority_label": "space",
+              "retrieved_label_counts": {
+                "space": 3,
+                "music": 2
+              },
+              "retrieved_score_sum": {
+                "space": 0.7052294105291367,
+                "music": 0.08546265661716462
+              },
+              "logits_label_mass": {
+                "music": 0,
+                "space": 0
+              },
+              "top1_piece": " explain",
+              "top1_category": "semantic",
+              "chosen_piece": " explain",
+              "chosen_category": "semantic",
+              "chosen_label": null,
+              "diagnosed_stage": "inject"
+            },
+            {
+              "step": 5,
+              "retrieved_majority_label": "space",
+              "retrieved_label_counts": {
+                "space": 3,
+                "music": 2
+              },
+              "retrieved_score_sum": {
+                "space": 0.7052294105291367,
+                "music": 0.08546265661716462
+              },
+              "logits_label_mass": {
+                "music": 0,
+                "space": 0.3954301029443741
+              },
+              "top1_piece": " satellites",
+              "top1_category": "semantic",
+              "chosen_piece": " satellites",
+              "chosen_category": "semantic",
+              "chosen_label": "space",
+              "diagnosed_stage": "aligned"
+            },
+            {
+              "step": 6,
+              "retrieved_majority_label": "space",
+              "retrieved_label_counts": {
+                "space": 3,
+                "music": 2
+              },
+              "retrieved_score_sum": {
+                "space": 0.7052294105291367,
+                "music": 0.08546265661716462
+              },
+              "logits_label_mass": {
+                "music": 0,
+                "space": 0.022754499688744545
+              },
+              "top1_piece": ",",
+              "top1_category": "punct",
+              "chosen_piece": ",",
+              "chosen_category": "punct",
+              "chosen_label": "space",
+              "diagnosed_stage": "decode"
+            },
+            {
+              "step": 7,
+              "retrieved_majority_label": "space",
+              "retrieved_label_counts": {
+                "space": 3,
+                "music": 2
+              },
+              "retrieved_score_sum": {
+                "space": 0.7052294105291367,
+                "music": 0.08546265661716462
+              },
+              "logits_label_mass": {
+                "music": 0,
+                "space": 0.2686969190835953
+              },
+              "top1_piece": " satellites",
+              "top1_category": "semantic",
+              "chosen_piece": " satellites",
+              "chosen_category": "semantic",
+              "chosen_label": "space",
+              "diagnosed_stage": "aligned"
+            },
+            {
+              "step": 8,
+              "retrieved_majority_label": "space",
+              "retrieved_label_counts": {
+                "space": 3,
+                "music": 2
+              },
+              "retrieved_score_sum": {
+                "space": 0.714495986700058,
+                "music": 0.0803181141614914
+              },
+              "logits_label_mass": {
+                "music": 0,
+                "space": 0
+              },
+              "top1_piece": " are",
+              "top1_category": "functional",
+              "chosen_piece": " are",
+              "chosen_category": "functional",
+              "chosen_label": null,
+              "diagnosed_stage": "inject"
+            },
+            {
+              "step": 9,
+              "retrieved_majority_label": "space",
+              "retrieved_label_counts": {
+                "space": 3,
+                "music": 2
+              },
+              "retrieved_score_sum": {
+                "space": 0.714495986700058,
+                "music": 0.0803181141614914
+              },
+              "logits_label_mass": {
+                "music": 0,
+                "space": 0.03106600232422352
+              },
+              "top1_piece": " artificial",
+              "top1_category": "semantic",
+              "chosen_piece": " artificial",
+              "chosen_category": "semantic",
+              "chosen_label": "space",
+              "diagnosed_stage": "aligned"
+            },
+            {
+              "step": 10,
+              "retrieved_majority_label": "space",
+              "retrieved_label_counts": {
+                "space": 3,
+                "music": 2
+              },
+              "retrieved_score_sum": {
+                "space": 0.714495986700058,
+                "music": 0.0803181141614914
+              },
+              "logits_label_mass": {
+                "music": 0,
+                "space": 0.33109524846076965
+              },
+              "top1_piece": " objects",
+              "top1_category": "semantic",
+              "chosen_piece": " objects",
+              "chosen_category": "semantic",
+              "chosen_label": "space",
+              "diagnosed_stage": "aligned"
+            },
+            {
+              "step": 11,
+              "retrieved_majority_label": "space",
+              "retrieved_label_counts": {
+                "space": 3,
+                "music": 2
+              },
+              "retrieved_score_sum": {
+                "space": 0.714495986700058,
+                "music": 0.0803181141614914
+              },
+              "logits_label_mass": {
+                "music": 0,
+                "space": 0
+              },
+              "top1_piece": " that",
+              "top1_category": "functional",
+              "chosen_piece": " that",
+              "chosen_category": "functional",
+              "chosen_label": null,
+              "diagnosed_stage": "inject"
+            }
+          ],
+          "passed": false
+        }
+      ],
+      "error": null
+    },
+    "prompt_diversity_without_memory": {
+      "passed": true,
+      "prompts": [
+        "The pianist",
+        "Quantum systems",
+        "The rainforest"
+      ],
+      "outputs": [
+        "The pianist Xia points XYZ传感器 collects weather data based upon ____ protocol communication mode?\nBLE（Bluetooth）\n",
+        "Quantum systems play central roles across cryptography due primarily?\\nThe Bose gas  |\n\n **Summary:\r\n\r\nWrite various",
+        "The rainforest dataset typically refers specifically refering______. aviation charts. ____\nyes Explanation: \nFalse"
+      ],
+      "unique_count": 3,
+      "error": null
+    },
+    "save_load_consistency": {
+      "passed": true,
+      "prompt": "The pianist",
+      "output_a": "The pianist piano hours piano pianoHours = int(raw input desperation hours hours))\n piano perfectperfect print calculating",
+      "output_b": "The pianist piano hours piano pianoHours = int(raw input desperation hours hours))\n piano perfectperfect print calculating",
+      "error": null
+    },
+    "training_cache_isolation": {
+      "passed": true,
+      "changed": [],
+      "memory_count": 8,
+      "error": null
+    },
+    "cheating_heuristics": {
+      "passed": true,
+      "outputs": [
+        "The pianist piano hours piano pianoHours = int(raw input desperation hours hours))\n piano perfectperfect print calculating",
+        "The telescope window watched cat sat mat outside birds window sat watched mat cat birds outside Market window cat watched",
+        "The trader market stock volatility significant experienced 市 stock experienced significant market volatility experienced stock stock significant volatility",
+        "The child learns Signs window window outside cat sat mat watched outside mat sat cat mat mat outside sat watched"
+      ],
+      "exact_same": false,
+      "prefix_only": false,
+      "too_short": false,
+      "error": null
+    },
+    "rerank_stability_probe": {
+      "passed": false,
+      "status": "fail",
+      "pairs": [
+        {
+          "pair": "music_P1",
+          "prompt_a": "What improves piano technique and musical phrasing?",
+          "prompt_b": "How can one improve piano technique and musical expression?",
+          "top5_a": [
+            1,
+            0,
+            3,
+            4,
+            2
+          ],
+          "top5_b": [
+            1,
+            0,
+            3,
+            4,
+            2
+          ],
+          "jaccard": 1.0,
+          "spearman_shared": 0.9999999999998999,
+          "pair_passed_jaccard_0_6": true
+        },
+        {
+          "pair": "space_P2",
+          "prompt_a": "What explains satellites and orbital motion?",
+          "prompt_b": "What describes satellites and the motion of planets?",
+          "top5_a": [
+            5,
+            0,
+            1,
+            3,
+            2
+          ],
+          "top5_b": [
+            5,
+            6,
+            4,
+            0,
+            1
+          ],
+          "jaccard": 0.42857142857142855,
+          "spearman_shared": 0.9607689228302918,
+          "pair_passed_jaccard_0_6": false
+        }
+      ],
+      "spearman_best": 0.9999999999998999,
+      "gating": "hard_PASS",
+      "error": null
+    },
+    "decode_repetition_feedback_probe": {
+      "passed": false,
+      "status": "fail",
+      "per_prompt": [
+        {
+          "prompt": "The telescope",
+          "output": "The telescope telescope stars telescopestarsStars amazing amazed telescope captured telescope stars stars captured stars distant telescope signatures captured captured distant captured nebula distant signatures signatures neb neb captured signatures",
+          "max_repeat_per_content_token": 5,
+          "first_bigram_repeat_index": 9,
+          "trigram_lock_count": 0
+        },
+        {
+          "prompt": "The pianist",
+          "output": "The pianist pian piano pian pianette pian plays Chop Chop Chop hours piano piano hours pian piano perfect hours Chop hours perfect Chop midnight hours midnight perfect perfect midnight midnight pian",
+          "max_repeat_per_content_token": 5,
+          "first_bigram_repeat_index": 8,
+          "trigram_lock_count": 0
+        },
+        {
+          "prompt": "The market analyst",
+          "output": "The market analyst market session sessessionssesess market market session session significant market volatility experienced stock market stock significant volatility experienced significant stock volatility significant session stock session volatility experienced volatility",
+          "max_repeat_per_content_token": 5,
+          "first_bigram_repeat_index": 8,
+          "trigram_lock_count": 0
+        }
+      ],
+      "avg_max_repeat_per_content_token": 5.0,
+      "min_first_bigram_repeat_index": 8,
+      "avg_trigram_lock_count": 0.0,
+      "conditions": {
+        "avg_max_repeat_le_3": false,
+        "min_first_bigram_ge_4": true,
+        "avg_trigram_lock_le_1": true
+      },
+      "gating": "hard_PASS",
+      "error": null
+    },
+    "functional_token_suppression_probe": {
+      "passed": true,
+      "status": "pass",
+      "metric_version": "v3.46",
+      "per_prompt": [
+        {
+          "prompt": "A strong explanation should mention",
+          "top12_no_prefix": [
+            {
+              "token_id": 279,
+              "piece": " the",
+              "norm": "the",
+              "logit": 21.125,
+              "prob": 0.30489084124565125
+            },
+            {
+              "token_id": 264,
+              "piece": " a",
+              "norm": "a",
+              "logit": 19.5,
+              "prob": 0.060036562383174896
+            },
+            {
+              "token_id": 518,
+              "piece": " at",
+              "norm": "at",
+              "logit": 19.375,
+              "prob": 0.05298208072781563
+            },
+            {
+              "token_id": 3151,
+              "piece": " specific",
+              "norm": "specific",
+              "logit": 19.0,
+              "prob": 0.036414019763469696
+            },
+            {
+              "token_id": 2176,
+              "piece": " both",
+              "norm": "both",
+              "logit": 19.0,
+              "prob": 0.036414019763469696
+            },
+            {
+              "token_id": 429,
+              "piece": " that",
+              "norm": "that",
+              "logit": 18.625,
+              "prob": 0.025026964023709297
+            },
+            {
+              "token_id": 678,
+              "piece": " all",
+              "norm": "all",
+              "logit": 18.625,
+              "prob": 0.025026964023709297
+            },
+            {
+              "token_id": 1246,
+              "piece": " how",
+              "norm": "how",
+              "logit": 18.625,
+              "prob": 0.025026964023709297
+            },
+            {
+              "token_id": 10295,
+              "piece": " examples",
+              "norm": "examples",
+              "logit": 18.5,
+              "prob": 0.022086219862103462
+            },
+            {
+              "token_id": 2326,
+              "piece": " three",
+              "norm": "three",
+              "logit": 18.25,
+              "prob": 0.017200764268636703
+            },
+            {
+              "token_id": 1378,
+              "piece": " two",
+              "norm": "two",
+              "logit": 18.125,
+              "prob": 0.015179620124399662
+            },
+            {
+              "token_id": 1128,
+              "piece": " what",
+              "norm": "what",
+              "logit": 18.125,
+              "prob": 0.015179620124399662
+            }
+          ],
+          "top12_with_prefix": [
+            {
+              "token_id": 2524,
+              "piece": " control",
+              "norm": "control",
+              "logit": 35.01490783691406,
+              "prob": 0.6951159238815308
+            },
+            {
+              "token_id": 14762,
+              "piece": " technique",
+              "norm": "technique",
+              "logit": 34.002662658691406,
+              "prob": 0.2526066303253174
+            },
+            {
+              "token_id": 37191,
+              "piece": " refined",
+              "norm": "refined",
+              "logit": 31.364118576049805,
+              "prob": 0.018052594736218452
+            },
+            {
+              "token_id": 14317,
+              "piece": " finger",
+              "norm": "finger",
+              "logit": 31.158113479614258,
+              "prob": 0.014691722579300404
+            },
+            {
+              "token_id": 26278,
+              "piece": " piano",
+              "norm": "piano",
+              "logit": 31.14698600769043,
+              "prob": 0.014529147185385227
+            },
+            {
+              "token_id": 48601,
+              "piece": " pedal",
+              "norm": "pedal",
+              "logit": 29.597332000732422,
+              "prob": 0.00308484910055995
+            },
+            {
+              "token_id": 38744,
+              "piece": " musician",
+              "norm": "musician",
+              "logit": 29.122615814208984,
+              "prob": 0.0019189659506082535
+            },
+            {
+              "token_id": 3151,
+              "piece": " specific",
+              "norm": "specific",
+              "logit": 17.25,
+              "prob": 1.3392319253568985e-08
+            },
+            {
+              "token_id": 10295,
+              "piece": " examples",
+              "norm": "examples",
+              "logit": 16.75,
+              "prob": 8.12285172457905e-09
+            },
+            {
+              "token_id": 3170,
+              "piece": " why",
+              "norm": "why",
+              "logit": 16.625,
+              "prob": 7.168392102130383e-09
+            },
+            {
+              "token_id": 1376,
+              "piece": " key",
+              "norm": "key",
+              "logit": 16.5,
+              "prob": 6.326083212826461e-09
+            },
+            {
+              "token_id": 5257,
+              "piece": " various",
+              "norm": "various",
+              "logit": 15.8125,
+              "prob": 3.1809543887817426e-09
+            }
+          ],
+          "content_starter_count_no_prefix": 3,
+          "content_starter_count_with_prefix": 12,
+          "best_content_starter_logit_with_prefix": 35.01490783691406,
+          "best_functional_logit_with_prefix": null,
+          "logit_margin_best_content_starter_vs_best_functional": Infinity,
+          "margin_non_negative": true
+        },
+        {
+          "prompt": "The most relevant idea is",
+          "top12_no_prefix": [
+            {
+              "token_id": 429,
+              "piece": " that",
+              "norm": "that",
+              "logit": 20.25,
+              "prob": 0.2765534520149231
+            },
+            {
+              "token_id": 279,
+              "piece": " the",
+              "norm": "the",
+              "logit": 19.125,
+              "prob": 0.08978375792503357
+            },
+            {
+              "token_id": 25,
+              "piece": ":",
+              "norm": "",
+              "logit": 19.0,
+              "prob": 0.07923389226198196
+            },
+            {
+              "token_id": 311,
+              "piece": " to",
+              "norm": "to",
+              "logit": 18.25,
+              "prob": 0.03742744028568268
+            },
+            {
+              "token_id": 510,
+              "piece": ":\n",
+              "norm": "",
+              "logit": 18.0,
+              "prob": 0.029148519039154053
+            },
+            {
+              "token_id": 30743,
+              "piece": " ____",
+              "norm": "",
+              "logit": 18.0,
+              "prob": 0.029148519039154053
+            },
+            {
+              "token_id": 32671,
+              "piece": " ______",
+              "norm": "",
+              "logit": 17.5,
+              "prob": 0.017679469659924507
+            },
+            {
+              "token_id": 1304,
+              "piece": " __",
+              "norm": "",
+              "logit": 17.5,
+              "prob": 0.017679469659924507
+            },
+            {
+              "token_id": 1447,
+              "piece": ":\n\n",
+              "norm": "",
+              "logit": 17.375,
+              "prob": 0.015602079220116138
+            },
+            {
+              "token_id": 330,
+              "piece": " \"",
+              "norm": "",
+              "logit": 17.25,
+              "prob": 0.013768785633146763
+            },
+            {
+              "token_id": 537,
+              "piece": " not",
+              "norm": "not",
+              "logit": 17.25,
+              "prob": 0.013768785633146763
+            },
+            {
+              "token_id": 198,
+              "piece": "\n",
+              "norm": "",
+              "logit": 17.125,
+              "prob": 0.012150910682976246
+            }
+          ],
+          "top12_with_prefix": [
+            {
+              "token_id": 2524,
+              "piece": " control",
+              "norm": "control",
+              "logit": 35.47675323486328,
+              "prob": 0.5319644212722778
+            },
+            {
+              "token_id": 14762,
+              "piece": " technique",
+              "norm": "technique",
+              "logit": 35.09006118774414,
+              "prob": 0.36136358976364136
+            },
+            {
+              "token_id": 37191,
+              "piece": " refined",
+              "norm": "refined",
+              "logit": 33.533302307128906,
+              "prob": 0.0761820450425148
+            },
+            {
+              "token_id": 26278,
+              "piece": " piano",
+              "norm": "piano",
+              "logit": 32.47641372680664,
+              "prob": 0.02647595852613449
+            },
+            {
+              "token_id": 14317,
+              "piece": " finger",
+              "norm": "finger",
+              "logit": 30.1934757232666,
+              "prob": 0.0027001278940588236
+            },
+            {
+              "token_id": 48601,
+              "piece": " pedal",
+              "norm": "pedal",
+              "logit": 28.98265266418457,
+              "prob": 0.0008045083377510309
+            },
+            {
+              "token_id": 38744,
+              "piece": " musician",
+              "norm": "musician",
+              "logit": 28.52532196044922,
+              "prob": 0.0005092304199934006
+            },
+            {
+              "token_id": 4363,
+              "piece": " likely",
+              "norm": "likely",
+              "logit": 15.75,
+              "prob": 1.4409952120431058e-09
+            },
+            {
+              "token_id": 3118,
+              "piece": " based",
+              "norm": "based",
+              "logit": 15.75,
+              "prob": 1.4409952120431058e-09
+            },
+            {
+              "token_id": 5990,
+              "piece": " usually",
+              "norm": "usually",
+              "logit": 15.625,
+              "prob": 1.2716737662898936e-09
+            },
+            {
+              "token_id": 4658,
+              "piece": " probably",
+              "norm": "probably",
+              "logit": 15.5625,
+              "prob": 1.1946269529161668e-09
+            },
+            {
+              "token_id": 2661,
+              "piece": " given",
+              "norm": "given",
+              "logit": 15.5625,
+              "prob": 1.1946269529161668e-09
+            }
+          ],
+          "content_starter_count_no_prefix": 0,
+          "content_starter_count_with_prefix": 12,
+          "best_content_starter_logit_with_prefix": 35.47675323486328,
+          "best_functional_logit_with_prefix": null,
+          "logit_margin_best_content_starter_vs_best_functional": Infinity,
+          "margin_non_negative": true
+        },
+        {
+          "prompt": "A learner should know about",
+          "top12_no_prefix": [
+            {
+              "token_id": 279,
+              "piece": " the",
+              "norm": "the",
+              "logit": 21.0,
+              "prob": 0.4941084086894989
+            },
+            {
+              "token_id": 264,
+              "piece": " a",
+              "norm": "a",
+              "logit": 18.25,
+              "prob": 0.03158729150891304
+            },
+            {
+              "token_id": 220,
+              "piece": " ",
+              "norm": "",
+              "logit": 18.125,
+              "prob": 0.027875691652297974
+            },
+            {
+              "token_id": 1246,
+              "piece": " how",
+              "norm": "how",
+              "logit": 18.0,
+              "prob": 0.024600207805633545
+            },
+            {
+              "token_id": 678,
+              "piece": " all",
+              "norm": "all",
+              "logit": 17.75,
+              "prob": 0.019158661365509033
+            },
+            {
+              "token_id": 1128,
+              "piece": " what",
+              "norm": "what",
+              "logit": 17.5,
+              "prob": 0.01492078136652708
+            },
+            {
+              "token_id": 2155,
+              "piece": " different",
+              "norm": "different",
+              "logit": 17.375,
+              "prob": 0.013167543336749077
+            },
+            {
+              "token_id": 862,
+              "piece": " their",
+              "norm": "their",
+              "logit": 17.375,
+              "prob": 0.013167543336749077
+            },
+            {
+              "token_id": 323,
+              "piece": " and",
+              "norm": "and",
+              "logit": 16.875,
+              "prob": 0.007986518554389477
+            },
+            {
+              "token_id": 518,
+              "piece": " at",
+              "norm": "at",
+              "logit": 16.875,
+              "prob": 0.007986518554389477
+            },
+            {
+              "token_id": 1378,
+              "piece": " two",
+              "norm": "two",
+              "logit": 16.75,
+              "prob": 0.007048077881336212
+            },
+            {
+              "token_id": 1045,
+              "piece": " some",
+              "norm": "some",
+              "logit": 16.75,
+              "prob": 0.007048077881336212
+            }
+          ],
+          "top12_with_prefix": [
+            {
+              "token_id": 5458,
+              "piece": " student",
+              "norm": "student",
+              "logit": 34.490478515625,
+              "prob": 0.9998041987419128
+            },
+            {
+              "token_id": 13625,
+              "piece": " keyboard",
+              "norm": "keyboard",
+              "logit": 24.831199645996094,
+              "prob": 6.381803541444242e-05
+            },
+            {
+              "token_id": 28405,
+              "piece": " scales",
+              "norm": "scales",
+              "logit": 24.77660369873047,
+              "prob": 6.0427235439419746e-05
+            },
+            {
+              "token_id": 77123,
+              "piece": " expressive",
+              "norm": "expressive",
+              "logit": 24.58266258239746,
+              "prob": 4.977429853170179e-05
+            },
+            {
+              "token_id": 11110,
+              "piece": " conserv",
+              "norm": "conserv",
+              "logit": 23.238353729248047,
+              "prob": 1.2977146980119869e-05
+            },
+            {
+              "token_id": 19476,
+              "piece": " studied",
+              "norm": "studied",
+              "logit": 22.836301803588867,
+              "prob": 8.681011422595475e-06
+            },
+            {
+              "token_id": 821,
+              "piece": " data",
+              "norm": "data",
+              "logit": 13.8125,
+              "prob": 1.0461235211423059e-09
+            },
+            {
+              "token_id": 2326,
+              "piece": " three",
+              "norm": "three",
+              "logit": 13.3125,
+              "prob": 6.345060032941774e-10
+            },
+            {
+              "token_id": 13482,
+              "piece": " linear",
+              "norm": "linear",
+              "logit": 13.25,
+              "prob": 5.96063254310053e-10
+            },
+            {
+              "token_id": 6770,
+              "piece": " basic",
+              "norm": "basic",
+              "logit": 13.25,
+              "prob": 5.96063254310053e-10
+            },
+            {
+              "token_id": 13027,
+              "piece": " Python",
+              "norm": "python",
+              "logit": 13.1875,
+              "prob": 5.599495866981385e-10
+            },
+            {
+              "token_id": 3151,
+              "piece": " specific",
+              "norm": "specific",
+              "logit": 13.0625,
+              "prob": 4.941537734559631e-10
+            }
+          ],
+          "content_starter_count_no_prefix": 0,
+          "content_starter_count_with_prefix": 12,
+          "best_content_starter_logit_with_prefix": 34.490478515625,
+          "best_functional_logit_with_prefix": null,
+          "logit_margin_best_content_starter_vs_best_functional": Infinity,
+          "margin_non_negative": true
+        },
+        {
+          "prompt": "Tell me about",
+          "top12_no_prefix": [
+            {
+              "token_id": 279,
+              "piece": " the",
+              "norm": "the",
+              "logit": 20.625,
+              "prob": 0.40999558568000793
+            },
+            {
+              "token_id": 264,
+              "piece": " a",
+              "norm": "a",
+              "logit": 20.375,
+              "prob": 0.319304883480072
+            },
+            {
+              "token_id": 697,
+              "piece": " your",
+              "norm": "your",
+              "logit": 18.25,
+              "prob": 0.038135528564453125
+            },
+            {
+              "token_id": 458,
+              "piece": " an",
+              "norm": "an",
+              "logit": 17.875,
+              "prob": 0.02621014043688774
+            },
+            {
+              "token_id": 1045,
+              "piece": " some",
+              "norm": "some",
+              "logit": 17.375,
+              "prob": 0.015897253528237343
+            },
+            {
+              "token_id": 6133,
+              "piece": " yourself",
+              "norm": "yourself",
+              "logit": 17.125,
+              "prob": 0.012380793690681458
+            },
+            {
+              "token_id": 1246,
+              "piece": " how",
+              "norm": "how",
+              "logit": 17.0,
+              "prob": 0.010926011949777603
+            },
+            {
+              "token_id": 894,
+              "piece": " any",
+              "norm": "any",
+              "logit": 16.875,
+              "prob": 0.00964217260479927
+            },
+            {
+              "token_id": 419,
+              "piece": " this",
+              "norm": "this",
+              "logit": 16.5,
+              "prob": 0.006626961287111044
+            },
+            {
+              "token_id": 825,
+              "piece": " one",
+              "norm": "one",
+              "logit": 16.25,
+              "prob": 0.005161082837730646
+            },
+            {
+              "token_id": 1378,
+              "piece": " two",
+              "norm": "two",
+              "logit": 15.5625,
+              "prob": 0.002595155267044902
+            },
+            {
+              "token_id": 576,
+              "piece": " The",
+              "norm": "the",
+              "logit": 15.375,
+              "prob": 0.0021514594554901123
+            }
+          ],
+          "top12_with_prefix": [
+            {
+              "token_id": 6133,
+              "piece": " yourself",
+              "norm": "yourself",
+              "logit": 16.0,
+              "prob": 0.18075832724571228
+            },
+            {
+              "token_id": 5616,
+              "piece": " China",
+              "norm": "china",
+              "logit": 12.875,
+              "prob": 0.007941966876387596
+            },
+            {
+              "token_id": 4325,
+              "piece": " someone",
+              "norm": "someone",
+              "logit": 12.875,
+              "prob": 0.007941966876387596
+            },
+            {
+              "token_id": 7037,
+              "piece": " myself",
+              "norm": "myself",
+              "logit": 12.4375,
+              "prob": 0.005127719137817621
+            },
+            {
+              "token_id": 2326,
+              "piece": " three",
+              "norm": "three",
+              "logit": 12.4375,
+              "prob": 0.005127719137817621
+            },
+            {
+              "token_id": 3170,
+              "piece": " why",
+              "norm": "why",
+              "logit": 12.375,
+              "prob": 0.004817046225070953
+            },
+            {
+              "token_id": 8453,
+              "piece": " Chinese",
+              "norm": "chinese",
+              "logit": 12.3125,
+              "prob": 0.004525196272879839
+            },
+            {
+              "token_id": 9977,
+              "piece": " climate",
+              "norm": "climate",
+              "logit": 12.25,
+              "prob": 0.004251028411090374
+            },
+            {
+              "token_id": 6323,
+              "piece": " Japan",
+              "norm": "japan",
+              "logit": 12.25,
+              "prob": 0.004251028411090374
+            },
+            {
+              "token_id": 10769,
+              "piece": " Japanese",
+              "norm": "japanese",
+              "logit": 11.875,
+              "prob": 0.0029216862749308348
+            },
+            {
+              "token_id": 5796,
+              "piece": " touch",
+              "norm": "touch",
+              "logit": 11.8125,
+              "prob": 0.002744670258834958
+            },
+            {
+              "token_id": 3757,
+              "piece": " John",
+              "norm": "john",
+              "logit": 11.8125,
+              "prob": 0.002744670258834958
+            }
+          ],
+          "content_starter_count_no_prefix": 1,
+          "content_starter_count_with_prefix": 12,
+          "best_content_starter_logit_with_prefix": 16.0,
+          "best_functional_logit_with_prefix": null,
+          "logit_margin_best_content_starter_vs_best_functional": Infinity,
+          "margin_non_negative": true
+        },
+        {
+          "prompt": "Please describe",
+          "top12_no_prefix": [
+            {
+              "token_id": 279,
+              "piece": " the",
+              "norm": "the",
+              "logit": 23.375,
+              "prob": 0.40496018528938293
+            },
+            {
+              "token_id": 264,
+              "piece": " a",
+              "norm": "a",
+              "logit": 23.25,
+              "prob": 0.3573761284351349
+            },
+            {
+              "token_id": 1246,
+              "piece": " how",
+              "norm": "how",
+              "logit": 21.625,
+              "prob": 0.07037152349948883
+            },
+            {
+              "token_id": 697,
+              "piece": " your",
+              "norm": "your",
+              "logit": 21.375,
+              "prob": 0.05480540171265602
+            },
+            {
+              "token_id": 304,
+              "piece": " in",
+              "norm": "in",
+              "logit": 20.875,
+              "prob": 0.033241156488657
+            },
+            {
+              "token_id": 458,
+              "piece": " an",
+              "norm": "an",
+              "logit": 19.875,
+              "prob": 0.012228738516569138
+            },
+            {
+              "token_id": 1128,
+              "piece": " what",
+              "norm": "what",
+              "logit": 19.625,
+              "prob": 0.009523751214146614
+            },
+            {
+              "token_id": 2326,
+              "piece": " three",
+              "norm": "three",
+              "logit": 19.375,
+              "prob": 0.007417105138301849
+            },
+            {
+              "token_id": 1045,
+              "piece": " some",
+              "norm": "some",
+              "logit": 19.25,
+              "prob": 0.006545572075992823
+            },
+            {
+              "token_id": 323,
+              "piece": " and",
+              "norm": "and",
+              "logit": 19.125,
+              "prob": 0.005776446778327227
+            },
+            {
+              "token_id": 894,
+              "piece": " any",
+              "norm": "any",
+              "logit": 18.75,
+              "prob": 0.003970090299844742
+            },
+            {
+              "token_id": 825,
+              "piece": " one",
+              "norm": "one",
+              "logit": 18.625,
+              "prob": 0.0035035922192037106
+            }
+          ],
+          "top12_with_prefix": [
+            {
+              "token_id": 5796,
+              "piece": " touch",
+              "norm": "touch",
+              "logit": 38.97874450683594,
+              "prob": 0.9555372595787048
+            },
+            {
+              "token_id": 10273,
+              "piece": " rub",
+              "norm": "rub",
+              "logit": 35.35406494140625,
+              "prob": 0.02547236531972885
+            },
+            {
+              "token_id": 3545,
+              "piece": " often",
+              "norm": "often",
+              "logit": 34.60047149658203,
+              "prob": 0.01198913436383009
+            },
+            {
+              "token_id": 22845,
+              "piece": " interpretation",
+              "norm": "interpretation",
+              "logit": 33.45642852783203,
+              "prob": 0.0038188823964446783
+            },
+            {
+              "token_id": 29195,
+              "piece": " dynamics",
+              "norm": "dynamics",
+              "logit": 32.93324279785156,
+              "prob": 0.0022631825413554907
+            },
+            {
+              "token_id": 23230,
+              "piece": " tempo",
+              "norm": "tempo",
+              "logit": 31.80025863647461,
+              "prob": 0.0007289048517122865
+            },
+            {
+              "token_id": 13798,
+              "piece": " depends",
+              "norm": "depends",
+              "logit": 30.456966400146484,
+              "prob": 0.00019023324421141297
+            },
+            {
+              "token_id": 3170,
+              "piece": " why",
+              "norm": "why",
+              "logit": 17.0,
+              "prob": 2.722702341362293e-10
+            },
+            {
+              "token_id": 3019,
+              "piece": " step",
+              "norm": "step",
+              "logit": 16.625,
+              "prob": 1.8712840998968971e-10
+            },
+            {
+              "token_id": 2326,
+              "piece": " three",
+              "norm": "three",
+              "logit": 16.5,
+              "prob": 1.6514024869795918e-10
+            },
+            {
+              "token_id": 4623,
+              "piece": " further",
+              "norm": "further",
+              "logit": 15.25,
+              "prob": 4.731347258424279e-11
+            },
+            {
+              "token_id": 26753,
+              "piece": " briefly",
+              "norm": "briefly",
+              "logit": 15.0625,
+              "prob": 3.922424884894582e-11
+            }
+          ],
+          "content_starter_count_no_prefix": 1,
+          "content_starter_count_with_prefix": 12,
+          "best_content_starter_logit_with_prefix": 38.97874450683594,
+          "best_functional_logit_with_prefix": null,
+          "logit_margin_best_content_starter_vs_best_functional": Infinity,
+          "margin_non_negative": true
+        },
+        {
+          "prompt": "Explain how",
+          "top12_no_prefix": [
+            {
+              "token_id": 498,
+              "piece": " you",
+              "norm": "you",
+              "logit": 21.25,
+              "prob": 0.3365403115749359
+            },
+            {
+              "token_id": 279,
+              "piece": " the",
+              "norm": "the",
+              "logit": 21.0,
+              "prob": 0.26209786534309387
+            },
+            {
+              "token_id": 311,
+              "piece": " to",
+              "norm": "to",
+              "logit": 20.75,
+              "prob": 0.20412202179431915
+            },
+            {
+              "token_id": 264,
+              "piece": " a",
+              "norm": "a",
+              "logit": 18.875,
+              "prob": 0.031303126364946365
+            },
+            {
+              "token_id": 458,
+              "piece": " an",
+              "norm": "an",
+              "logit": 17.25,
+              "prob": 0.006163951009511948
+            },
+            {
+              "token_id": 4344,
+              "piece": " changes",
+              "norm": "changes",
+              "logit": 16.75,
+              "prob": 0.003738625440746546
+            },
+            {
+              "token_id": 2155,
+              "piece": " different",
+              "norm": "different",
+              "logit": 16.625,
+              "prob": 0.0032993254717439413
+            },
+            {
+              "token_id": 12752,
+              "piece": " cultural",
+              "norm": "cultural",
+              "logit": 16.5,
+              "prob": 0.0029116442892700434
+            },
+            {
+              "token_id": 5440,
+              "piece": " technology",
+              "norm": "technology",
+              "logit": 16.25,
+              "prob": 0.0022675907239317894
+            },
+            {
+              "token_id": 1667,
+              "piece": " using",
+              "norm": "using",
+              "logit": 16.0,
+              "prob": 0.0017660015728324652
+            },
+            {
+              "token_id": 1817,
+              "piece": " each",
+              "norm": "each",
+              "logit": 16.0,
+              "prob": 0.0017660015728324652
+            },
+            {
+              "token_id": 582,
+              "piece": " we",
+              "norm": "we",
+              "logit": 15.9375,
+              "prob": 0.0016590048326179385
+            }
+          ],
+          "top12_with_prefix": [
+            {
+              "token_id": 63997,
+              "piece": " Chop",
+              "norm": "chop",
+              "logit": 32.23540496826172,
+              "prob": 0.6007736325263977
+            },
+            {
+              "token_id": 59066,
+              "piece": " pian",
+              "norm": "pian",
+              "logit": 31.41173553466797,
+              "prob": 0.26363059878349304
+            },
+            {
+              "token_id": 92001,
+              "piece": " noct",
+              "norm": "noct",
+              "logit": 30.06985855102539,
+              "prob": 0.06890107691287994
+            },
+            {
+              "token_id": 43564,
+              "piece": " practiced",
+              "norm": "practiced",
+              "logit": 29.62016487121582,
+              "prob": 0.043946728110313416
+            },
+            {
+              "token_id": 32333,
+              "piece": " midnight",
+              "norm": "midnight",
+              "logit": 28.928796768188477,
+              "prob": 0.022012488916516304
+            },
+            {
+              "token_id": 2524,
+              "piece": " control",
+              "norm": "control",
+              "logit": 25.319644927978516,
+              "prob": 0.0005959837581031024
+            },
+            {
+              "token_id": 26278,
+              "piece": " piano",
+              "norm": "piano",
+              "logit": 23.040491104125977,
+              "prob": 6.1011334764771163e-05
+            },
+            {
+              "token_id": 14762,
+              "piece": " technique",
+              "norm": "technique",
+              "logit": 22.517467498779297,
+              "prob": 3.61629827239085e-05
+            },
+            {
+              "token_id": 38744,
+              "piece": " musician",
+              "norm": "musician",
+              "logit": 22.220535278320312,
+              "prob": 2.687251071620267e-05
+            },
+            {
+              "token_id": 14317,
+              "piece": " finger",
+              "norm": "finger",
+              "logit": 21.127849578857422,
+              "prob": 9.01074872672325e-06
+            },
+            {
+              "token_id": 48601,
+              "piece": " pedal",
+              "norm": "pedal",
+              "logit": 19.866641998291016,
+              "prob": 2.5528504465910373e-06
+            },
+            {
+              "token_id": 37191,
+              "piece": " refined",
+              "norm": "refined",
+              "logit": 19.817893981933594,
+              "prob": 2.43138856603764e-06
+            }
+          ],
+          "content_starter_count_no_prefix": 3,
+          "content_starter_count_with_prefix": 12,
+          "best_content_starter_logit_with_prefix": 32.23540496826172,
+          "best_functional_logit_with_prefix": null,
+          "logit_margin_best_content_starter_vs_best_functional": Infinity,
+          "margin_non_negative": true
+        }
+      ],
+      "avg_content_starter_delta_overall": 10.666666666666668,
+      "set_a_avg_delta": 11.0,
+      "set_a_margin_wins": 3,
+      "set_b_avg_delta": 10.333333333333334,
+      "set_b_margin_wins": 3,
+      "conditions": {
+        "set_a_delta_ge_1_and_margin_2of3": true,
+        "set_b_delta_ge_1_and_margin_2of3": true
+      },
+      "gating": "hard_PASS",
+      "error": null
+    },
+    "keyword_specific_tail_slot_probe": {
+      "passed": true,
+      "status": "pass",
+      "metric_version": "v3.50",
+      "tail_slots_source": "bridge._last_cond_tail_slots",
+      "per_paraphrase": [
+        {
+          "query": "She performed Beethoven sonatas with delicate phrasing on her grand piano.",
+          "query_disjoint_from_rare_keywords": true,
+          "dominant_mid": 1,
+          "dominant_source_preview": "A musician refined finger technique, phrasing, and pedal con",
+          "rare_keyword_ids": [
+            2524,
+            14317,
+            14762
+          ],
+          "rare_keyword_pieces": [
+            " control",
+            " finger",
+            " technique"
+          ],
+          "tail_slot_top5_ids_centered": [
+            2524,
+            7779,
+            100359,
+            2865,
+            3273
+          ],
+          "tail_slot_top5_pieces_centered": [
+            " control",
+            " Control",
+            "控制",
+            "control",
+            "Control"
+          ],
+          "intersection_size_top20": 1,
+          "rank_of_best_rare": 1
+        },
+        {
+          "query": "Harmonic analysis and ear training are core elements of music education.",
+          "query_disjoint_from_rare_keywords": true,
+          "dominant_mid": 1,
+          "dominant_source_preview": "A musician refined finger technique, phrasing, and pedal con",
+          "rare_keyword_ids": [
+            2524,
+            14317,
+            14762
+          ],
+          "rare_keyword_pieces": [
+            " control",
+            " finger",
+            " technique"
+          ],
+          "tail_slot_top5_ids_centered": [
+            2524,
+            7779,
+            100359,
+            2865,
+            3273
+          ],
+          "tail_slot_top5_pieces_centered": [
+            " control",
+            " Control",
+            "控制",
+            "control",
+            "Control"
+          ],
+          "intersection_size_top20": 1,
+          "rank_of_best_rare": 1
+        }
+      ],
+      "mean_intersection_size_top20_paraphrase": 1.0,
+      "median_rank_of_best_rare_paraphrase": 1.0,
+      "hit_ratio_at_least_one_top20_paraphrase": 1.0,
+      "n_paraphrase_queries_evaluated": 2,
+      "roundtrip_mean_intersection_top20_diagnostic": 0.0,
+      "conditions": {
+        "mean_intersection_top20_ge_1": true,
+        "median_rank_le_100": true,
+        "hit_ratio_top20_ge_0_5": true
+      },
+      "gating": "PASS_or_not_implemented",
+      "error": null
+    },
+    "context_descriptor_cluster_probe": {
+      "passed": true,
+      "status": "pass",
+      "metric_version": "v3.49",
+      "loo_nn_accuracy_all_4": 0.6875,
+      "loo_nn_accuracy_heldout_2": 0.875,
+      "n_all": 16,
+      "n_heldout": 8,
+      "correct_all": 11,
+      "correct_heldout": 7,
+      "per_memory_all": [
+        {
+          "mid": 0,
+          "true_label": "music",
+          "pred_label": "space",
+          "nn_sim": 0.10659328103065491,
+          "correct": false
+        },
+        {
+          "mid": 1,
+          "true_label": "music",
+          "pred_label": "music",
+          "nn_sim": 0.21885180473327637,
+          "correct": true
+        },
+        {
+          "mid": 2,
+          "true_label": "music",
+          "pred_label": "space",
+          "nn_sim": 0.7041908502578735,
+          "correct": false
+        },
+        {
+          "mid": 3,
+          "true_label": "music",
+          "pred_label": "music",
+          "nn_sim": 0.21885180473327637,
+          "correct": true
+        },
+        {
+          "mid": 4,
+          "true_label": "space",
+          "pred_label": "space",
+          "nn_sim": 0.6772083044052124,
+          "correct": true
+        },
+        {
+          "mid": 5,
+          "true_label": "space",
+          "pred_label": "finance",
+          "nn_sim": 0.5216456651687622,
+          "correct": false
+        },
+        {
+          "mid": 6,
+          "true_label": "space",
+          "pred_label": "space",
+          "nn_sim": 0.6772083044052124,
+          "correct": true
+        },
+        {
+          "mid": 7,
+          "true_label": "space",
+          "pred_label": "music",
+          "nn_sim": 0.7041908502578735,
+          "correct": false
+        },
+        {
+          "mid": 8,
+          "true_label": "cooking",
+          "pred_label": "cooking",
+          "nn_sim": 0.6417238712310791,
+          "correct": true
+        },
+        {
+          "mid": 9,
+          "true_label": "cooking",
+          "pred_label": "cooking",
+          "nn_sim": 0.6417238712310791,
+          "correct": true
+        },
+        {
+          "mid": 10,
+          "true_label": "cooking",
+          "pred_label": "finance",
+          "nn_sim": 0.6592775583267212,
+          "correct": false
+        },
+        {
+          "mid": 11,
+          "true_label": "cooking",
+          "pred_label": "cooking",
+          "nn_sim": 0.6453272104263306,
+          "correct": true
+        },
+        {
+          "mid": 12,
+          "true_label": "finance",
+          "pred_label": "finance",
+          "nn_sim": 0.6845758557319641,
+          "correct": true
+        },
+        {
+          "mid": 13,
+          "true_label": "finance",
+          "pred_label": "finance",
+          "nn_sim": 0.7123655080795288,
+          "correct": true
+        },
+        {
+          "mid": 14,
+          "true_label": "finance",
+          "pred_label": "finance",
+          "nn_sim": 0.6198481917381287,
+          "correct": true
+        },
+        {
+          "mid": 15,
+          "true_label": "finance",
+          "pred_label": "finance",
+          "nn_sim": 0.7123655080795288,
+          "correct": true
+        }
+      ],
+      "per_memory_heldout": [
+        {
+          "mid": 8,
+          "true_label": "cooking",
+          "pred_label": "cooking",
+          "nn_sim": 0.6417238712310791,
+          "correct": true
+        },
+        {
+          "mid": 9,
+          "true_label": "cooking",
+          "pred_label": "cooking",
+          "nn_sim": 0.6417238712310791,
+          "correct": true
+        },
+        {
+          "mid": 10,
+          "true_label": "cooking",
+          "pred_label": "finance",
+          "nn_sim": 0.6592775583267212,
+          "correct": false
+        },
+        {
+          "mid": 11,
+          "true_label": "cooking",
+          "pred_label": "cooking",
+          "nn_sim": 0.6453272104263306,
+          "correct": true
+        },
+        {
+          "mid": 12,
+          "true_label": "finance",
+          "pred_label": "finance",
+          "nn_sim": 0.6845758557319641,
+          "correct": true
+        },
+        {
+          "mid": 13,
+          "true_label": "finance",
+          "pred_label": "finance",
+          "nn_sim": 0.7123655080795288,
+          "correct": true
+        },
+        {
+          "mid": 14,
+          "true_label": "finance",
+          "pred_label": "finance",
+          "nn_sim": 0.6198481917381287,
+          "correct": true
+        },
+        {
+          "mid": 15,
+          "true_label": "finance",
+          "pred_label": "finance",
+          "nn_sim": 0.7123655080795288,
+          "correct": true
+        }
+      ],
+      "unit_norm_within_1e_3": true,
+      "conditions": {
+        "loo_nn_4domain_ge_0_65": true,
+        "loo_nn_heldout_2domain_ge_0_70": true,
+        "unit_norm_within_1e_3": true
+      },
+      "gating": "PASS_or_not_implemented",
+      "mechanism_1_qwen_pool_diagnostic": {
+        "source": "mem.semantic_emb (Qwen last-layer attention-pool over content tokens, no trainable encoder)",
+        "loo_nn_accuracy_all_4": 0.8125,
+        "loo_nn_accuracy_heldout_2": 0.875,
+        "correct_all": 13,
+        "correct_heldout": 7,
+        "per_domain_accuracy": {
+          "music": {
+            "correct": 3,
+            "n": 4
+          },
+          "space": {
+            "correct": 3,
+            "n": 4
+          },
+          "cooking": {
+            "correct": 4,
+            "n": 4
+          },
+          "finance": {
+            "correct": 3,
+            "n": 4
+          }
+        },
+        "would_pass_4domain_threshold_0_65": true,
+        "would_pass_heldout_threshold_0_70": true
+      },
+      "error": null
+    },
+    "prefix_length_scaling_probe": {
+      "passed": false,
+      "status": "fail",
+      "metric_version": "v3.45",
+      "L_mem_A": 8,
+      "L_mem_B": 16,
+      "avg_mass_ratio_B_over_A": 0.8236899087743724,
+      "per_prompt": [
+        {
+          "prompt": "A strong explanation should mention",
+          "starter_mass_A": 36750.875,
+          "starter_mass_B": 41343.8671875,
+          "ratio": 1.124976403623043,
+          "content_starters_top12_A": 12,
+          "content_starters_top12_B": 12,
+          "per_slot_mean_norm_A": 1.0251211524009705,
+          "per_slot_mean_norm_B": 1.0251210927963257
+        },
+        {
+          "prompt": "The pianist",
+          "starter_mass_A": 22117.984375,
+          "starter_mass_B": 14409.236328125,
+          "ratio": 0.6514714941390314,
+          "content_starters_top12_A": 12,
+          "content_starters_top12_B": 12,
+          "per_slot_mean_norm_A": 1.0251210778951645,
+          "per_slot_mean_norm_B": 1.0251211002469063
+        },
+        {
+          "prompt": "The telescope",
+          "starter_mass_A": 14722.236328125,
+          "starter_mass_B": 10226.38671875,
+          "ratio": 0.6946218285610428,
+          "content_starters_top12_A": 12,
+          "content_starters_top12_B": 12,
+          "per_slot_mean_norm_A": 1.0251210778951645,
+          "per_slot_mean_norm_B": 1.0251211076974869
+        }
+      ],
+      "conditions": {
+        "avg_mass_ratio_gt_1_10": false,
+        "per_slot_norms_finite": true
+      },
+      "gating": "PASS_or_not_implemented",
+      "error": null
+    },
+    "mixture_distribution_gate_probe": {
+      "passed": true,
+      "status": "pass",
+      "gate_min": 0.3499999940395355,
+      "gate_max": 0.3499999940395355,
+      "declared_floor": 0.0,
+      "declared_ceiling": 0.7,
+      "gate_in_range": true,
+      "finite_gate": true,
+      "finite_memory_logit_bias": true,
+      "manual_mixture_finite": true,
+      "gating": "PASS_or_not_implemented",
+      "error": null
+    }
+  },
+  "axis_coverage": {
+    "spec_section": "4-meta.1 v3.45+",
+    "axis_a_compression": {
+      "stored_floats_per_mem": 1712,
+      "raw_floats_per_mem_typical_10_tokens": 15360,
+      "ratio": 8.97196261682243,
+      "threshold": 10.0,
+      "passed": false
+    },
+    "axis_b_injection_cost": {
+      "per_step_floats_formula": "L_mem * d_LLM + V",
+      "per_step_floats_value": 164224,
+      "depends_on_N": false,
+      "passed": true
+    },
+    "axis_c_fidelity": {
+      "dependent_cases": [
+        "semantic_memory_grounding",
+        "semantic_memory_counterfactual_pairs",
+        "retrieval_topk_semantic_shift",
+        "prefix_stepwise_drift_trajectory",
+        "retrieval_generation_alignment_audit",
+        "retrieval_prefix_decode_correlation_audit",
+        "stepwise_label_mass_alignment_audit",
+        "functional_token_suppression_probe",
+        "keyword_specific_tail_slot_probe",
+        "context_descriptor_cluster_probe",
+        "prefix_length_scaling_probe"
+      ],
+      "passed_over_total": "6/11",
+      "threshold_K": 9,
+      "passed": false
+    },
+    "axis_d_stability": {
+      "dependent_cases": [
+        "save_load_consistency",
+        "rerank_stability_probe",
+        "decode_repetition_feedback_probe"
+      ],
+      "passed_over_total": "1/3",
+      "threshold_all_pass": true,
+      "passed": false
+    },
+    "channel_passes_all_axes": false
+  },
+  "constraints": {
+    "uses_internal_test": false,
+    "monkeypatching": false,
+    "mocking": false,
+    "direct_return_shortcut_detected": false
+  }
+}
\ No newline at end of file
diff --git a/reports/v346_trained_blackbox/report.md b/reports/v346_trained_blackbox/report.md
new file mode 100644
index 0000000..7337714
--- /dev/null
+++ b/reports/v346_trained_blackbox/report.md
@@ -0,0 +1,3914 @@
+# `AgentMemorySystem v331` Detailed Black-box Test Report
+
+- Elapsed: `1250.1s`
+- Passed: `18/26`
+- Mode: fully external runner, no reuse of module-internal `test()`
+- Policy: no monkeypatching, no mocked return values, no synthetic pass-by-construction shortcuts
+
+## Axis Coverage (SPEC Section 4-meta.1, v3.45+)
+
+```json
+{
+  "spec_section": "4-meta.1 v3.45+",
+  "axis_a_compression": {
+    "stored_floats_per_mem": 1712,
+    "raw_floats_per_mem_typical_10_tokens": 15360,
+    "ratio": 8.97196261682243,
+    "threshold": 10.0,
+    "passed": false
+  },
+  "axis_b_injection_cost": {
+    "per_step_floats_formula": "L_mem * d_LLM + V",
+    "per_step_floats_value": 164224,
+    "depends_on_N": false,
+    "passed": true
+  },
+  "axis_c_fidelity": {
+    "dependent_cases": [
+      "semantic_memory_grounding",
+      "semantic_memory_counterfactual_pairs",
+      "retrieval_topk_semantic_shift",
+      "prefix_stepwise_drift_trajectory",
+      "retrieval_generation_alignment_audit",
+      "retrieval_prefix_decode_correlation_audit",
+      "stepwise_label_mass_alignment_audit",
+      "functional_token_suppression_probe",
+      "keyword_specific_tail_slot_probe",
+      "context_descriptor_cluster_probe",
+      "prefix_length_scaling_probe"
+    ],
+    "passed_over_total": "6/11",
+    "threshold_K": 9,
+    "passed": false
+  },
+  "axis_d_stability": {
+    "dependent_cases": [
+      "save_load_consistency",
+      "rerank_stability_probe",
+      "decode_repetition_feedback_probe"
+    ],
+    "passed_over_total": "1/3",
+    "threshold_all_pass": true,
+    "passed": false
+  },
+  "channel_passes_all_axes": false
+}
+```
+
+## Summary
+
+- `PASS` `leaf_capacity_stability`: {"per_seed": [{"seed": 0, "depth": 6, "count": 240, "violations": [], "consistency": [], "passed": true}, {"seed": 1, "depth": 6, "count": 240, "violations": [], "consistency": [], "passed": true}, {"seed": 2, "depth": 6, "count": 240, "violations": [], "consistency": [], "passed": true}, {"seed": 3, "depth": 6, "count": 240, "violations": [], "consistency": [], "passed": true}, {"seed": 4, "depth": 6, "count": 240, "violations": [], "consistency": [], "passed": true}, {"seed": 5, "depth": 5, "count": 240, "violations": [], "consistency": [], "passed": true}, {"seed": 6, "depth": 6, "count": 240, "violations": [], "consistency": [], "passed": true}, {"seed": 7, "depth": 5, "count": 240, "violations": [], "consistency": [], "passed": true}]}
+- `PASS` `degenerate_direction_boundary`: {"depth": 47, "count": 100, "violations": [], "consistency": [], "seed": 17}
+- `PASS` `metric_trainability`: {"training_info": {"total": 41.98283386230469, "recon": 2.4085488319396973, "contrast": 43.46337127685547, "holonomy": 4.786942481994629, "write_policy": 1.0882740020751953, "semantic_probe": 0.0, "dir_diversity": 0.0, "reranker_ranking": 0.0, "encoder_throughput": 3.1604340076446533, "vocab_anchor": -0.0, "semantic_alignment": 9.469874382019043, "tail_semantic_anchor": 10.84397029876709, "functional_suppression": 0.0, "context_separation": 0.0, "slot_residual_alignment": 0.0, "inter_domain_margin": 0.0, "grad_norms": {"ctx_encoder": 0.0004906014182315579, "fib_encoder": 0.11028211643598784, "dir_predictor": 0.0, "fiber_connection": 0.041244823555418676, "fiber_attn": 0.00016646675964572253, "reranker": 1.862751849004779e-08, "qformer": 0.023817353122735294, "content_bypass": 0.03501559529968225, "semantic_probe": 0.0, "layer_pool": 0.003975302446633577, "prefix_aligner": 0.008598358558648532, "vocab_proj": 0.03414980954657789, "tail_head": 0.28745011541395643, "context_heads": 0.024231906034080493, "memory_context_encoder": 0.03503168573482837}, "loss_weights": {"recon": 1.0, "semantic_alignment": 3.0, "encoder_throughput": 1.5, "contrast": 0.02, "holonomy": 0.005, "write_policy":
+- `PASS` `no_grad_generation`: {"stored_memories": 8, "output": "The pianist piano hours piano pianoHours = int(raw input desperation hours hours))\n piano perfectperfect print calculating hours *  hours\r\nelse"}
+- `PASS` `counterfactual_memory_influence`: {"prompt": "Tell me something about practice and performance.", "music_output": "Tell me something about practice and performance. practiced midnight performances nocturnal practiced Midnight practiced noct midnight noct practiced practiced controlled noct noct midnight midnight practiced midnight controls noct midnight practices", "space_output": "Tell me something about practice and performance. distant distant space distant stars distant galaxies distant space observed observed space space stellar galaxies galaxies stellar evolution stellar stellar observed galaxies observed stellar", "outputs_differ": true}
+- `PASS` `semantic_memory_grounding`: {"prompt": "Explain what someone should focus on when improving technique and understanding the subject.", "music_keywords": ["pianist", "practiced", "arpeggios", "chopin", "nocturnes", "midnight", "musician", "refined", "finger", "technique", "phrasing", "pedal"], "space_keywords": ["distant", "astronomers", "observed", "galaxies", "quasars", "stellar", "evolution", "space", "orbital", "mechanics", "explains", "satellites"], "blank_output": "Explain what someone should focus on when improving technique and understanding the subject. Mathematics education needs improvement mainly revolves around several key areas aimed</ Stuart Hallberg,\\\n improving problem-solving skills, improve the relevance/real-world applications,\n- Improve", "music_output": "Explain what someone should focus on when improving technique and understanding the subject. technique control refers generally technique technique。 technique finger control control technique control piano musician， musician piano finger finger piano refined musician musician finger refined refined piano piano pedal Explain control", "space_output": "Explain what someone should focus on when improving technique and understanding the su
+- `FAIL` `semantic_memory_counterfactual_pairs`: {"rows": [{"prompt": "Describe the most important details a student should notice.", "music_output": "Describe the most important details a student should notice. student student conservDesc.php studentdescCons conserv keyboard Describe student Keyboard music theory student studied describe important details:\n\n keyboard keyboard studies scales keyboard studied conserv", "space_output": "Describe the most important details a student should notice. large Describe matter large structure scale large universe scale matter studiesDescribe matter structure scale structure expansion universe studies large studies studies matter universe expansion studies universe structure", "music_margin": 0.0, "space_margin": 0.0, "passed": false}, {"prompt": "Summarize the key ideas a learner should practice and remember.", "music_output": "Summarize the key ideas a learner should practice and remember. rub depends touch interpretation touch dynamics tempo often interpretation rub dynamics rub often touch often Control depends dynamics interpretation tempo touch rub interpretation dynamics touch depends often dynamics", "space_output": "Summarize the key ideas a learner should practice and remember. l
+- `FAIL` `degeneration_quality`: {"metrics": [{"prompt": "The pianist", "output": "The pianist pian piano pian pianette pian plays Chop Chop Chop hours piano piano hours pian piano perfect hours Chop hours perfect Chop midnight hours midnight perfect perfect midnight", "token_count": 27, "unique_token_ratio": 0.2962962962962963, "repeated_bigram_ratio": 0.11538461538461539, "max_token_run": 3, "punct_ratio": 0.0, "newline_ratio": 0.0, "alpha_ratio": 0.8478260869565217, "content_token_ratio": 0.8148148148148148, "generated_preview": "pian piano pian pianette pian plays chop chop chop hours piano piano hours pian piano perfect hours chop hours perfect chop midnight hours midnight"}, {"prompt": "The telescope", "output": "The telescope telescope stars telescopestarsStars amazing amazed telescope captured telescope stars stars captured stars distant telescope signatures captured captured distant captured nebula distant signatures signatures neb neb", "token_count": 25, "unique_token_ratio": 0.4, "repeated_bigram_ratio": 0.041666666666666664, "max_token_run": 2, "punct_ratio": 0.0, "newline_ratio": 0.0, "alpha_ratio": 0.8864628820960698, "content_token_ratio": 0.92, "generated_preview": "telescope stars telescopestarss
+- `PASS` `prefix_logit_drift_audit`: {"prompt": "Explain the topic in a precise and concrete way.", "blank": {"js_divergence": 0.19956839084625244, "l2_shift": 586.2745361328125, "topk_overlap_count": 3, "entropy_no_prefix": 5.3277788162231445, "entropy_with_prefix": 6.950380802154541, "topk_no_prefix": [{"token_id": 576, "piece": " The", "norm": "the", "logit": 19.75, "prob": 0.11376254260540009}, {"token_id": 22555, "piece": " Sure", "norm": "sure", "logit": 19.5, "prob": 0.0885983556509018}, {"token_id": 55313, "piece": " Quantum", "norm": "quantum", "logit": 18.75, "prob": 0.04185090214014053}, {"token_id": 58194, "piece": " Artificial", "norm": "artificial", "logit": 18.625, "prob": 0.0369332879781723}, {"token_id": 30536, "piece": " Climate", "norm": "climate", "logit": 18.5, "prob": 0.032593514770269394}, {"token_id": 12960, "piece": " Machine", "norm": "machine", "logit": 18.125, "prob": 0.022401172667741776}, {"token_id": 2585, "piece": " How", "norm": "how", "logit": 18.125, "prob": 0.022401172667741776}, {"token_id": 3555, "piece": " What", "norm": "what", "logit": 18.125, "prob": 0.022401172667741776}, {"token_id": 52366, "piece": " Certainly", "norm": "certainly", "logit": 17.875, "prob": 0.01744605228304
+- `FAIL` `retrieval_topk_semantic_shift`: {"music_keywords": ["pianist", "practiced", "arpeggios", "chopin", "nocturnes", "midnight", "musician", "refined", "finger", "technique", "phrasing", "pedal"], "space_keywords": ["distant", "astronomers", "observed", "galaxies", "quasars", "stellar", "evolution", "space", "orbital", "mechanics", "explains", "satellites"], "rows": [{"prompt": "A strong explanation should mention", "music_no_prefix": [{"token_id": 279, "piece": " the", "norm": "the", "logit": 21.125, "prob": 0.3049025535583496}, {"token_id": 264, "piece": " a", "norm": "a", "logit": 19.5, "prob": 0.06003887206315994}, {"token_id": 518, "piece": " at", "norm": "at", "logit": 19.375, "prob": 0.05298411846160889}, {"token_id": 3151, "piece": " specific", "norm": "specific", "logit": 19.0, "prob": 0.03641541674733162}, {"token_id": 2176, "piece": " both", "norm": "both", "logit": 19.0, "prob": 0.03641541674733162}, {"token_id": 429, "piece": " that", "norm": "that", "logit": 18.625, "prob": 0.0250279251486063}, {"token_id": 1246, "piece": " how", "norm": "how", "logit": 18.625, "prob": 0.0250279251486063}, {"token_id": 678, "piece": " all", "norm": "all", "logit": 18.625, "prob": 0.0250279251486063}, {"token_id": 10295, 
+- `PASS` `repetition_segment_audit`: {"aggregate": {"bad_segment_ratio": 0.0, "total_segments": 24, "bad_segments": 0, "early_collapse_prompts": []}, "rows": [{"prompt": "The pianist", "output": "The pianist pian piano pian pianette pian plays Chop Chop Chop hours piano piano hours pian piano perfect hours Chop hours perfect Chop midnight hours midnight perfect perfect midnight midnight pian perfect noct noct noct midnight noct pian noct Chop piano Chop perfect piano midnight Chop pian hours noct", "generated_token_count": 47, "window": 8, "segments": [{"segment_idx": 0, "tokens": ["pian", "piano", "pian", "pianette", "pian", "plays", "chop", "chop"], "unique_ratio": 0.625, "content_ratio": 1.0, "repeated_bigram_ratio": 0.0, "dominant_token_share": 0.375}, {"segment_idx": 1, "tokens": ["chop", "hours", "piano", "piano", "hours", "pian", "piano", "perfect"], "unique_ratio": 0.625, "content_ratio": 0.75, "repeated_bigram_ratio": 0.0, "dominant_token_share": 0.375}, {"segment_idx": 2, "tokens": ["hours", "chop", "hours", "perfect", "chop", "midnight", "hours", "midnight"], "unique_ratio": 0.5, "content_ratio": 0.625, "repeated_bigram_ratio": 0.0, "dominant_token_share": 0.375}, {"segment_idx": 3, "tokens": ["perfect", "p
+- `PASS` `prefix_stepwise_drift_trajectory`: {"rows": [{"prompt": "Key piano ideas include", "first_bad_step": 4, "decoded_output": "Key piano ideas include leg movements across keys, dynamic changes, and the use of the pedal. These", "rows": [{"step": 0, "top1": {"token_id": 3598, "piece": " major", "norm": "major", "logit": 16.25, "prob": 0.026983050629496574}, "top1_category": "semantic", "topk_category_counts": {"semantic": 11, "functional": 1, "punct": 0}, "topk_category_prob_mass": {"semantic": 0.18486935831606388, "functional": 0.026983050629496574, "punct": 0.0}, "chosen_token_id": 2472, "chosen_piece": " leg", "chosen_norm": "leg", "chosen_category": "functional"}, {"step": 1, "top1": {"token_id": 19029, "piece": " movements", "norm": "movements", "logit": 14.375, "prob": 0.13023822009563446}, "top1_category": "semantic", "topk_category_counts": {"semantic": 11, "functional": 1, "punct": 0}, "topk_category_prob_mass": {"semantic": 0.3965669944882393, "functional": 0.0113800885155797, "punct": 0.0}, "chosen_token_id": 19029, "chosen_piece": " movements", "chosen_norm": "movements", "chosen_category": "semantic"}, {"step": 2, "top1": {"token_id": 3941, "piece": " across", "norm": "across", "logit": 16.5, "prob": 0.0510
+- `PASS` `retrieval_generation_alignment_audit`: {"music_keywords": ["pianist", "practiced", "arpeggios", "chopin", "nocturnes", "midnight", "musician", "refined", "finger", "technique", "phrasing", "pedal"], "space_keywords": ["distant", "astronomers", "observed", "galaxies", "quasars", "stellar", "evolution", "space", "orbital", "mechanics", "explains", "satellites"], "diagnoses": {"aligned": 2, "retrieval_miss": 0, "bridge_unused": 1, "unknown": 0}, "rows": [{"prompt": "What improves piano technique and musical phrasing?", "expected_label": "music", "retrieved_mids": [1, 0, 3, 6, 5], "retrieved_label_counts": {"music": 3, "space": 2}, "retrieved_majority_label": "music", "retrieved_text_preview": ["A musician refined finger technique, phrasing, and pedal control on the piano.", "The pianist practiced arpeggios and Chopin nocturnes until midnight.", "A conservatory student studied etudes, scales, and expressive voicing on the keyboard."], "output": "What improves piano technique and musical phrasing? piano technique control involves technique piano musician technique finger control piano piano musician control technique musician refined finger finger control finger technique piano finger refined refined pedal refined", "music_s
+- `FAIL` `retrieval_prefix_decode_correlation_audit`: {"correlations": {"retrieval_strength__prefix_l2": null, "retrieval_strength__bad_decode_score": 0.21927202884584385, "prefix_l2__bad_decode_score": null}, "rows": [{"prompt": "What improves piano technique and musical phrasing?", "expected_label": "music", "retrieved_scored": [{"mid": 1, "score": 0.6172578841447831}, {"mid": 0, "score": 0.22511255741119385}, {"mid": 3, "score": 0.11276901960372926}, {"mid": 6, "score": 0.045475220680236815}, {"mid": 5, "score": 0.036619618535041816}], "retrieved_label_counts": {"music": 3, "space": 2}, "retrieval_strength": 0.9551394611597062, "prefix_l2_shift": 322359623680.0, "prefix_js_divergence": 0.3171347379684448, "top1_with_prefix": {"token_id": 14566, "piece": " Options", "norm": "options", "logit": 16.375, "prob": 0.1110726147890091}, "top1_category_with_prefix": "semantic", "topk_non_semantic_prob_mass": 0.03182283788919449}, {"prompt": "What explains satellites and orbital motion?", "expected_label": "space", "retrieved_scored": [{"mid": 5, "score": 0.5634284257888794}, {"mid": 4, "score": 0.07376852035522463}, {"mid": 6, "score": 0.06803246438503266}, {"mid": 1, "score": 0.045463052392005925}, {"mid": 0, "score": 0.03999960422515869}]
+- `FAIL` `stepwise_label_mass_alignment_audit`: {"label_keywords": {"music": ["pianist", "practiced", "arpeggios", "chopin", "nocturnes", "midnight", "musician", "refined", "finger", "technique", "phrasing", "pedal"], "space": ["distant", "astronomers", "observed", "galaxies", "quasars", "stellar", "evolution", "space", "orbital", "mechanics", "explains", "satellites"]}, "rows": [{"prompt": "What improves piano technique and musical phrasing?", "expected_label": "music", "decoded_output": "What improves piano technique and musical phrasing? Options tend towards improving piano technique, musical phrasing, and", "stage_counts": {"inject": 6, "aligned": 4, "decode": 2}, "rows": [{"step": 0, "retrieved_majority_label": "music", "retrieved_label_counts": {"music": 3, "space": 2}, "retrieved_score_sum": {"music": 0.9551394611597062, "space": 0.08209483921527863}, "logits_label_mass": {"music": 0, "space": 0}, "top1_piece": " Options", "top1_category": "semantic", "chosen_piece": " Options", "chosen_category": "semantic", "chosen_label": null, "diagnosed_stage": "inject"}, {"step": 1, "retrieved_majority_label": "music", "retrieved_label_counts": {"music": 3, "space": 2}, "retrieved_score_sum": {"music": 0.9551394611597062, "space": 0
+- `PASS` `prompt_diversity_without_memory`: {"prompts": ["The pianist", "Quantum systems", "The rainforest"], "outputs": ["The pianist Xia points XYZ传感器 collects weather data based upon ____ protocol communication mode?\nBLE（Bluetooth）\n", "Quantum systems play central roles across cryptography due primarily?\\nThe Bose gas  |\n\n **Summary:\r\n\r\nWrite various", "The rainforest dataset typically refers specifically refering______. aviation charts. ____\nyes Explanation: \nFalse"], "unique_count": 3}
+- `PASS` `save_load_consistency`: {"prompt": "The pianist", "output_a": "The pianist piano hours piano pianoHours = int(raw input desperation hours hours))\n piano perfectperfect print calculating", "output_b": "The pianist piano hours piano pianoHours = int(raw input desperation hours hours))\n piano perfectperfect print calculating"}
+- `PASS` `training_cache_isolation`: {"changed": [], "memory_count": 8}
+- `PASS` `cheating_heuristics`: {"outputs": ["The pianist piano hours piano pianoHours = int(raw input desperation hours hours))\n piano perfectperfect print calculating", "The telescope window watched cat sat mat outside birds window sat watched mat cat birds outside Market window cat watched", "The trader market stock volatility significant experienced 市 stock experienced significant market volatility experienced stock stock significant volatility", "The child learns Signs window window outside cat sat mat watched outside mat sat cat mat mat outside sat watched"], "exact_same": false, "prefix_only": false, "too_short": false}
+- `FAIL` `rerank_stability_probe`: {"status": "fail", "pairs": [{"pair": "music_P1", "prompt_a": "What improves piano technique and musical phrasing?", "prompt_b": "How can one improve piano technique and musical expression?", "top5_a": [1, 0, 3, 4, 2], "top5_b": [1, 0, 3, 4, 2], "jaccard": 1.0, "spearman_shared": 0.9999999999998999, "pair_passed_jaccard_0_6": true}, {"pair": "space_P2", "prompt_a": "What explains satellites and orbital motion?", "prompt_b": "What describes satellites and the motion of planets?", "top5_a": [5, 0, 1, 3, 2], "top5_b": [5, 6, 4, 0, 1], "jaccard": 0.42857142857142855, "spearman_shared": 0.9607689228302918, "pair_passed_jaccard_0_6": false}], "spearman_best": 0.9999999999998999, "gating": "hard_PASS"}
+- `FAIL` `decode_repetition_feedback_probe`: {"status": "fail", "per_prompt": [{"prompt": "The telescope", "output": "The telescope telescope stars telescopestarsStars amazing amazed telescope captured telescope stars stars captured stars distant telescope signatures captured captured distant captured nebula distant signatures signatures neb neb captured signatures", "max_repeat_per_content_token": 5, "first_bigram_repeat_index": 9, "trigram_lock_count": 0}, {"prompt": "The pianist", "output": "The pianist pian piano pian pianette pian plays Chop Chop Chop hours piano piano hours pian piano perfect hours Chop hours perfect Chop midnight hours midnight perfect perfect midnight midnight pian", "max_repeat_per_content_token": 5, "first_bigram_repeat_index": 8, "trigram_lock_count": 0}, {"prompt": "The market analyst", "output": "The market analyst market session sessessionssesess market market session session significant market volatility experienced stock market stock significant volatility experienced significant stock volatility significant session stock session volatility experienced volatility", "max_repeat_per_content_token": 5, "first_bigram_repeat_index": 8, "trigram_lock_count": 0}], "avg_max_repeat_per_content_token": 
+- `PASS` `functional_token_suppression_probe`: {"status": "pass", "metric_version": "v3.46", "per_prompt": [{"prompt": "A strong explanation should mention", "top12_no_prefix": [{"token_id": 279, "piece": " the", "norm": "the", "logit": 21.125, "prob": 0.30489084124565125}, {"token_id": 264, "piece": " a", "norm": "a", "logit": 19.5, "prob": 0.060036562383174896}, {"token_id": 518, "piece": " at", "norm": "at", "logit": 19.375, "prob": 0.05298208072781563}, {"token_id": 3151, "piece": " specific", "norm": "specific", "logit": 19.0, "prob": 0.036414019763469696}, {"token_id": 2176, "piece": " both", "norm": "both", "logit": 19.0, "prob": 0.036414019763469696}, {"token_id": 429, "piece": " that", "norm": "that", "logit": 18.625, "prob": 0.025026964023709297}, {"token_id": 678, "piece": " all", "norm": "all", "logit": 18.625, "prob": 0.025026964023709297}, {"token_id": 1246, "piece": " how", "norm": "how", "logit": 18.625, "prob": 0.025026964023709297}, {"token_id": 10295, "piece": " examples", "norm": "examples", "logit": 18.5, "prob": 0.022086219862103462}, {"token_id": 2326, "piece": " three", "norm": "three", "logit": 18.25, "prob": 0.017200764268636703}, {"token_id": 1378, "piece": " two", "norm": "two", "logit": 18.125, "pro
+- `PASS` `keyword_specific_tail_slot_probe`: {"status": "pass", "metric_version": "v3.50", "tail_slots_source": "bridge._last_cond_tail_slots", "per_paraphrase": [{"query": "She performed Beethoven sonatas with delicate phrasing on her grand piano.", "query_disjoint_from_rare_keywords": true, "dominant_mid": 1, "dominant_source_preview": "A musician refined finger technique, phrasing, and pedal con", "rare_keyword_ids": [2524, 14317, 14762], "rare_keyword_pieces": [" control", " finger", " technique"], "tail_slot_top5_ids_centered": [2524, 7779, 100359, 2865, 3273], "tail_slot_top5_pieces_centered": [" control", " Control", "控制", "control", "Control"], "intersection_size_top20": 1, "rank_of_best_rare": 1}, {"query": "Harmonic analysis and ear training are core elements of music education.", "query_disjoint_from_rare_keywords": true, "dominant_mid": 1, "dominant_source_preview": "A musician refined finger technique, phrasing, and pedal con", "rare_keyword_ids": [2524, 14317, 14762], "rare_keyword_pieces": [" control", " finger", " technique"], "tail_slot_top5_ids_centered": [2524, 7779, 100359, 2865, 3273], "tail_slot_top5_pieces_centered": [" control", " Control", "控制", "control", "Control"], "intersection_size_top20": 1, "ra
+- `PASS` `context_descriptor_cluster_probe`: {"status": "pass", "metric_version": "v3.49", "loo_nn_accuracy_all_4": 0.6875, "loo_nn_accuracy_heldout_2": 0.875, "n_all": 16, "n_heldout": 8, "correct_all": 11, "correct_heldout": 7, "per_memory_all": [{"mid": 0, "true_label": "music", "pred_label": "space", "nn_sim": 0.10659328103065491, "correct": false}, {"mid": 1, "true_label": "music", "pred_label": "music", "nn_sim": 0.21885180473327637, "correct": true}, {"mid": 2, "true_label": "music", "pred_label": "space", "nn_sim": 0.7041908502578735, "correct": false}, {"mid": 3, "true_label": "music", "pred_label": "music", "nn_sim": 0.21885180473327637, "correct": true}, {"mid": 4, "true_label": "space", "pred_label": "space", "nn_sim": 0.6772083044052124, "correct": true}, {"mid": 5, "true_label": "space", "pred_label": "finance", "nn_sim": 0.5216456651687622, "correct": false}, {"mid": 6, "true_label": "space", "pred_label": "space", "nn_sim": 0.6772083044052124, "correct": true}, {"mid": 7, "true_label": "space", "pred_label": "music", "nn_sim": 0.7041908502578735, "correct": false}, {"mid": 8, "true_label": "cooking", "pred_label": "cooking", "nn_sim": 0.6417238712310791, "correct": true}, {"mid": 9, "true_label": "cooking", "p
+- `FAIL` `prefix_length_scaling_probe`: {"status": "fail", "metric_version": "v3.45", "L_mem_A": 8, "L_mem_B": 16, "avg_mass_ratio_B_over_A": 0.8236899087743724, "per_prompt": [{"prompt": "A strong explanation should mention", "starter_mass_A": 36750.875, "starter_mass_B": 41343.8671875, "ratio": 1.124976403623043, "content_starters_top12_A": 12, "content_starters_top12_B": 12, "per_slot_mean_norm_A": 1.0251211524009705, "per_slot_mean_norm_B": 1.0251210927963257}, {"prompt": "The pianist", "starter_mass_A": 22117.984375, "starter_mass_B": 14409.236328125, "ratio": 0.6514714941390314, "content_starters_top12_A": 12, "content_starters_top12_B": 12, "per_slot_mean_norm_A": 1.0251210778951645, "per_slot_mean_norm_B": 1.0251211002469063}, {"prompt": "The telescope", "starter_mass_A": 14722.236328125, "starter_mass_B": 10226.38671875, "ratio": 0.6946218285610428, "content_starters_top12_A": 12, "content_starters_top12_B": 12, "per_slot_mean_norm_A": 1.0251210778951645, "per_slot_mean_norm_B": 1.0251211076974869}], "conditions": {"avg_mass_ratio_gt_1_10": false, "per_slot_norms_finite": true}, "gating": "PASS_or_not_implemented"}
+- `PASS` `mixture_distribution_gate_probe`: {"status": "pass", "gate_min": 0.3499999940395355, "gate_max": 0.3499999940395355, "declared_floor": 0.0, "declared_ceiling": 0.7, "gate_in_range": true, "finite_gate": true, "finite_memory_logit_bias": true, "manual_mixture_finite": true, "gating": "PASS_or_not_implemented"}
+
+## Leaf Capacity Stability
+
+```json
+{
+  "passed": true,
+  "per_seed": [
+    {
+      "seed": 0,
+      "depth": 6,
+      "count": 240,
+      "violations": [],
+      "consistency": [],
+      "passed": true
+    },
+    {
+      "seed": 1,
+      "depth": 6,
+      "count": 240,
+      "violations": [],
+      "consistency": [],
+      "passed": true
+    },
+    {
+      "seed": 2,
+      "depth": 6,
+      "count": 240,
+      "violations": [],
+      "consistency": [],
+      "passed": true
+    },
+    {
+      "seed": 3,
+      "depth": 6,
+      "count": 240,
+      "violations": [],
+      "consistency": [],
+      "passed": true
+    },
+    {
+      "seed": 4,
+      "depth": 6,
+      "count": 240,
+      "violations": [],
+      "consistency": [],
+      "passed": true
+    },
+    {
+      "seed": 5,
+      "depth": 5,
+      "count": 240,
+      "violations": [],
+      "consistency": [],
+      "passed": true
+    },
+    {
+      "seed": 6,
+      "depth": 6,
+      "count": 240,
+      "violations": [],
+      "consistency": [],
+      "passed": true
+    },
+    {
+      "seed": 7,
+      "depth": 5,
+      "count": 240,
+      "violations": [],
+      "consistency": [],
+      "passed": true
+    }
+  ],
+  "error": null
+}
+```
+
+## Degenerate Direction Boundary
+
+```json
+{
+  "passed": true,
+  "depth": 47,
+  "count": 100,
+  "violations": [],
+  "consistency": [],
+  "seed": 17,
+  "error": null
+}
+```
+
+## Metric Trainability
+
+```json
+{
+  "passed": true,
+  "training_info": {
+    "total": 41.98283386230469,
+    "recon": 2.4085488319396973,
+    "contrast": 43.46337127685547,
+    "holonomy": 4.786942481994629,
+    "write_policy": 1.0882740020751953,
+    "semantic_probe": 0.0,
+    "dir_diversity": 0.0,
+    "reranker_ranking": 0.0,
+    "encoder_throughput": 3.1604340076446533,
+    "vocab_anchor": -0.0,
+    "semantic_alignment": 9.469874382019043,
+    "tail_semantic_anchor": 10.84397029876709,
+    "functional_suppression": 0.0,
+    "context_separation": 0.0,
+    "slot_residual_alignment": 0.0,
+    "inter_domain_margin": 0.0,
+    "grad_norms": {
+      "ctx_encoder": 0.0004906014182315579,
+      "fib_encoder": 0.11028211643598784,
+      "dir_predictor": 0.0,
+      "fiber_connection": 0.041244823555418676,
+      "fiber_attn": 0.00016646675964572253,
+      "reranker": 1.862751849004779e-08,
+      "qformer": 0.023817353122735294,
+      "content_bypass": 0.03501559529968225,
+      "semantic_probe": 0.0,
+      "layer_pool": 0.003975302446633577,
+      "prefix_aligner": 0.008598358558648532,
+      "vocab_proj": 0.03414980954657789,
+      "tail_head": 0.28745011541395643,
+      "context_heads": 0.024231906034080493,
+      "memory_context_encoder": 0.03503168573482837
+    },
+    "loss_weights": {
+      "recon": 1.0,
+      "semantic_alignment": 3.0,
+      "encoder_throughput": 1.5,
+      "contrast": 0.02,
+      "holonomy": 0.005,
+      "write_policy": 0.1,
+      "semantic_probe": 0.3,
+      "dir_diversity": 0.1,
+      "reranker_ranking": 0.2,
+      "vocab_anchor": 0.2,
+      "tail_semantic_anchor": 0.5,
+      "functional_suppression": 0.4,
+      "context_separation": 0.3,
+      "slot_residual_alignment": 0.0,
+      "inter_domain_margin": 0.2
+    }
+  },
+  "metric_grad_norms": [
+    0.00019553887250367552,
+    1.1630397239059675e-05,
+    0.0002688287931960076,
+    1.956606502062641e-05,
+    0.0019679300021380186,
+    0.00016431401309091598
+  ],
+  "metric_param_deltas": [
+    0.0015214140294119716,
+    0.0005180726875551045,
+    0.002842925488948822,
+    0.0005496913217939436,
+    0.003378876717761159,
+    0.0005994143430143595
+  ],
+  "max_metric_grad_norm": 0.0019679300021380186,
+  "max_metric_param_delta": 0.003378876717761159,
+  "error": null
+}
+```
+
+## No-Grad Generation
+
+```json
+{
+  "passed": true,
+  "stored_memories": 8,
+  "output": "The pianist piano hours piano pianoHours = int(raw input desperation hours hours))\n piano perfectperfect print calculating hours *  hours\r\nelse",
+  "error": null
+}
+```
+
+## Counterfactual Memory Influence
+
+```json
+{
+  "passed": true,
+  "prompt": "Tell me something about practice and performance.",
+  "music_output": "Tell me something about practice and performance. practiced midnight performances nocturnal practiced Midnight practiced noct midnight noct practiced practiced controlled noct noct midnight midnight practiced midnight controls noct midnight practices",
+  "space_output": "Tell me something about practice and performance. distant distant space distant stars distant galaxies distant space observed observed space space stellar galaxies galaxies stellar evolution stellar stellar observed galaxies observed stellar",
+  "outputs_differ": true,
+  "error": null
+}
+```
+
+## Semantic Memory Grounding
+
+```json
+{
+  "passed": true,
+  "prompt": "Explain what someone should focus on when improving technique and understanding the subject.",
+  "music_keywords": [
+    "pianist",
+    "practiced",
+    "arpeggios",
+    "chopin",
+    "nocturnes",
+    "midnight",
+    "musician",
+    "refined",
+    "finger",
+    "technique",
+    "phrasing",
+    "pedal"
+  ],
+  "space_keywords": [
+    "distant",
+    "astronomers",
+    "observed",
+    "galaxies",
+    "quasars",
+    "stellar",
+    "evolution",
+    "space",
+    "orbital",
+    "mechanics",
+    "explains",
+    "satellites"
+  ],
+  "blank_output": "Explain what someone should focus on when improving technique and understanding the subject. Mathematics education needs improvement mainly revolves around several key areas aimed</ Stuart Hallberg,\\\n improving problem-solving skills, improve the relevance/real-world applications,\n- Improve",
+  "music_output": "Explain what someone should focus on when improving technique and understanding the subject. technique control refers generally technique technique。 technique finger control control technique control piano musician， musician piano finger finger piano refined musician musician finger refined refined piano piano pedal Explain control",
+  "space_output": "Explain what someone should focus on when improving technique and understanding the subject. mechanics force gravitational planets satellites explains move mechanics force gravitational planets satellites explains move move force move gravitational planets satellites explains mechanics move planets satellites explains force mechanics gravitational planets satellites force",
+  "blank_music_score": 0.03571428571428571,
+  "blank_space_score": 0.0,
+  "music_music_score": 0.5,
+  "music_space_score": 0.0,
+  "space_space_score": 0.34210526315789475,
+  "space_music_score": 0.02631578947368421,
+  "music_margin": 0.5,
+  "space_margin": 0.3157894736842105,
+  "music_lift": 0.4642857142857143,
+  "space_lift": 0.34210526315789475,
+  "error": null
+}
+```
+
+## Semantic Memory Counterfactual Pairs
+
+```json
+{
+  "passed": false,
+  "rows": [
+    {
+      "prompt": "Describe the most important details a student should notice.",
+      "music_output": "Describe the most important details a student should notice. student student conservDesc.php studentdescCons conserv keyboard Describe student Keyboard music theory student studied describe important details:\n\n keyboard keyboard studies scales keyboard studied conserv",
+      "space_output": "Describe the most important details a student should notice. large Describe matter large structure scale large universe scale matter studiesDescribe matter structure scale structure expansion universe studies large studies studies matter universe expansion studies universe structure",
+      "music_margin": 0.0,
+      "space_margin": 0.0,
+      "passed": false
+    },
+    {
+      "prompt": "Summarize the key ideas a learner should practice and remember.",
+      "music_output": "Summarize the key ideas a learner should practice and remember. rub depends touch interpretation touch dynamics tempo often interpretation rub dynamics rub often touch often Control depends dynamics interpretation tempo touch rub interpretation dynamics touch depends often dynamics",
+      "space_output": "Summarize the key ideas a learner should practice and remember. large large studies large Sum dark scale matter dark matter structureSum dark large scale scale expansion structure matter studies matter large learners key universe remember studies dark",
+      "music_margin": 0.0,
+      "space_margin": 0.0,
+      "passed": false
+    }
+  ],
+  "error": null
+}
+```
+
+## Degeneration Quality
+
+```json
+{
+  "passed": false,
+  "metrics": [
+    {
+      "prompt": "The pianist",
+      "output": "The pianist pian piano pian pianette pian plays Chop Chop Chop hours piano piano hours pian piano perfect hours Chop hours perfect Chop midnight hours midnight perfect perfect midnight",
+      "token_count": 27,
+      "unique_token_ratio": 0.2962962962962963,
+      "repeated_bigram_ratio": 0.11538461538461539,
+      "max_token_run": 3,
+      "punct_ratio": 0.0,
+      "newline_ratio": 0.0,
+      "alpha_ratio": 0.8478260869565217,
+      "content_token_ratio": 0.8148148148148148,
+      "generated_preview": "pian piano pian pianette pian plays chop chop chop hours piano piano hours pian piano perfect hours chop hours perfect chop midnight hours midnight"
+    },
+    {
+      "prompt": "The telescope",
+      "output": "The telescope telescope stars telescopestarsStars amazing amazed telescope captured telescope stars stars captured stars distant telescope signatures captured captured distant captured nebula distant signatures signatures neb neb",
+      "token_count": 25,
+      "unique_token_ratio": 0.4,
+      "repeated_bigram_ratio": 0.041666666666666664,
+      "max_token_run": 2,
+      "punct_ratio": 0.0,
+      "newline_ratio": 0.0,
+      "alpha_ratio": 0.8864628820960698,
+      "content_token_ratio": 0.92,
+      "generated_preview": "telescope stars telescopestarsstars amazing amazed telescope captured telescope stars stars captured stars distant telescope signatures captured captured distant captured nebula distant signatures signatures neb"
+    },
+    {
+      "prompt": "The forest path",
+      "output": "The forest path deep within ancient rain temple hidden tropical rain within hidden temple ancient deep hidden within tropical deep temple within ancient hidden rain deep tropical ancient temple rain hidden",
+      "token_count": 28,
+      "unique_token_ratio": 0.25,
+      "repeated_bigram_ratio": 0.037037037037037035,
+      "max_token_run": 1,
+      "punct_ratio": 0.0,
+      "newline_ratio": 0.0,
+      "alpha_ratio": 0.8536585365853658,
+      "content_token_ratio": 0.8571428571428571,
+      "generated_preview": "deep within ancient rain temple hidden tropical rain within hidden temple ancient deep hidden within tropical deep temple within ancient hidden rain deep tropical"
+    },
+    {
+      "prompt": "The market analyst",
+      "output": "The market analyst market session sessessionssesess market market session session significant market volatility experienced stock market stock significant volatility experienced significant stock volatility significant session stock session volatility",
+      "token_count": 25,
+      "unique_token_ratio": 0.28,
+      "repeated_bigram_ratio": 0.08333333333333333,
+      "max_token_run": 2,
+      "punct_ratio": 0.0,
+      "newline_ratio": 0.0,
+      "alpha_ratio": 0.8924302788844621,
+      "content_token_ratio": 0.8,
+      "generated_preview": "market session sessessionssesess market market session session significant market volatility experienced stock market stock significant volatility experienced significant stock volatility significant session stock session"
+    },
+    {
+      "prompt": "Explain the topic clearly",
+      "output": "Explain the topic clearly simple explained simple simple analog simple rel everyday rel professor Professor explained explained analog explained rel Force professor everyday analog professor rel everyday professor analog everyday analog rel",
+      "token_count": 28,
+      "unique_token_ratio": 0.25,
+      "repeated_bigram_ratio": 0.07407407407407407,
+      "max_token_run": 2,
+      "punct_ratio": 0.0,
+      "newline_ratio": 0.0,
+      "alpha_ratio": 0.8708333333333333,
+      "content_token_ratio": 0.6785714285714286,
+      "generated_preview": "simple explained simple simple analog simple rel everyday rel professor professor explained explained analog explained rel force professor everyday analog professor rel everyday professor"
+    }
+  ],
+  "aggregate": {
+    "avg_unique_token_ratio": 0.2952592592592593,
+    "avg_repeated_bigram_ratio": 0.0702991452991453,
+    "avg_content_token_ratio": 0.81410582010582,
+    "avg_newline_ratio": 0.0,
+    "worst_max_token_run": 3,
+    "short_or_hollow_prompts": []
+  },
+  "error": null
+}
+```
+
+## Prefix Logit Drift Audit
+
+```json
+{
+  "passed": true,
+  "prompt": "Explain the topic in a precise and concrete way.",
+  "blank": {
+    "js_divergence": 0.19956839084625244,
+    "l2_shift": 586.2745361328125,
+    "topk_overlap_count": 3,
+    "entropy_no_prefix": 5.3277788162231445,
+    "entropy_with_prefix": 6.950380802154541,
+    "topk_no_prefix": [
+      {
+        "token_id": 576,
+        "piece": " The",
+        "norm": "the",
+        "logit": 19.75,
+        "prob": 0.11376254260540009
+      },
+      {
+        "token_id": 22555,
+        "piece": " Sure",
+        "norm": "sure",
+        "logit": 19.5,
+        "prob": 0.0885983556509018
+      },
+      {
+        "token_id": 55313,
+        "piece": " Quantum",
+        "norm": "quantum",
+        "logit": 18.75,
+        "prob": 0.04185090214014053
+      },
+      {
+        "token_id": 58194,
+        "piece": " Artificial",
+        "norm": "artificial",
+        "logit": 18.625,
+        "prob": 0.0369332879781723
+      },
+      {
+        "token_id": 30536,
+        "piece": " Climate",
+        "norm": "climate",
+        "logit": 18.5,
+        "prob": 0.032593514770269394
+      },
+      {
+        "token_id": 12960,
+        "piece": " Machine",
+        "norm": "machine",
+        "logit": 18.125,
+        "prob": 0.022401172667741776
+      },
+      {
+        "token_id": 2585,
+        "piece": " How",
+        "norm": "how",
+        "logit": 18.125,
+        "prob": 0.022401172667741776
+      },
+      {
+        "token_id": 3555,
+        "piece": " What",
+        "norm": "what",
+        "logit": 18.125,
+        "prob": 0.022401172667741776
+      },
+      {
+        "token_id": 52366,
+        "piece": " Certainly",
+        "norm": "certainly",
+        "logit": 17.875,
+        "prob": 0.01744605228304863
+      },
+      {
+        "token_id": 2885,
+        "piece": " Data",
+        "norm": "data",
+        "logit": 17.875,
+        "prob": 0.01744605228304863
+      },
+      {
+        "token_id": 15235,
+        "piece": " AI",
+        "norm": "ai",
+        "logit": 17.625,
+        "prob": 0.013586997985839844
+      },
+      {
+        "token_id": 358,
+        "piece": " I",
+        "norm": "i",
+        "logit": 17.5,
+        "prob": 0.011990483850240707
+      }
+    ],
+    "topk_with_prefix": [
+      {
+        "token_id": 576,
+        "piece": " The",
+        "norm": "the",
+        "logit": 15.75,
+        "prob": 0.0856875479221344
+      },
+      {
+        "token_id": 220,
+        "piece": " ",
+        "norm": "",
+        "logit": 15.6875,
+        "prob": 0.08049600571393967
+      },
+      {
+        "token_id": 362,
+        "piece": " A",
+        "norm": "a",
+        "logit": 14.5,
+        "prob": 0.02454989403486252
+      },
+      {
+        "token_id": 1096,
+        "piece": " This",
+        "norm": "this",
+        "logit": 14.25,
+        "prob": 0.01911947689950466
+      },
+      {
+        "token_id": 1084,
+        "piece": " It",
+        "norm": "it",
+        "logit": 14.0625,
+        "prob": 0.015850603580474854
+      },
+      {
+        "token_id": 4710,
+        "piece": " \n\n",
+        "norm": "",
+        "logit": 13.9375,
+        "prob": 0.013988107442855835
+      },
+      {
+        "token_id": 758,
+        "piece": " In",
+        "norm": "in",
+        "logit": 13.9375,
+        "prob": 0.013988107442855835
+      },
+      {
+        "token_id": 715,
+        "piece": " \n",
+        "norm": "",
+        "logit": 13.8125,
+        "prob": 0.012344461865723133
+      },
+      {
+        "token_id": 330,
+        "piece": " \"",
+        "norm": "",
+        "logit": 13.8125,
+        "prob": 0.012344461865723133
+      },
+      {
+        "token_id": 358,
+        "piece": " I",
+        "norm": "i",
+        "logit": 13.75,
+        "prob": 0.01159654837101698
+      },
+      {
+        "token_id": 5692,
+        "piece": " Here",
+        "norm": "here",
+        "logit": 13.5625,
+        "prob": 0.009613876231014729
+      },
+      {
+        "token_id": 2585,
+        "piece": " How",
+        "norm": "how",
+        "logit": 13.5,
+        "prob": 0.009031401015818119
+      }
+    ]
+  },
+  "memory": {
+    "js_divergence": 0.2740609347820282,
+    "l2_shift": 322359623680.0,
+    "topk_overlap_count": 6,
+    "entropy_no_prefix": 5.3277788162231445,
+    "entropy_with_prefix": 7.505624294281006,
+    "topk_no_prefix": [
+      {
+        "token_id": 576,
+        "piece": " The",
+        "norm": "the",
+        "logit": 19.75,
+        "prob": 0.11376254260540009
+      },
+      {
+        "token_id": 22555,
+        "piece": " Sure",
+        "norm": "sure",
+        "logit": 19.5,
+        "prob": 0.0885983556509018
+      },
+      {
+        "token_id": 55313,
+        "piece": " Quantum",
+        "norm": "quantum",
+        "logit": 18.75,
+        "prob": 0.04185090214014053
+      },
+      {
+        "token_id": 58194,
+        "piece": " Artificial",
+        "norm": "artificial",
+        "logit": 18.625,
+        "prob": 0.0369332879781723
+      },
+      {
+        "token_id": 30536,
+        "piece": " Climate",
+        "norm": "climate",
+        "logit": 18.5,
+        "prob": 0.032593514770269394
+      },
+      {
+        "token_id": 12960,
+        "piece": " Machine",
+        "norm": "machine",
+        "logit": 18.125,
+        "prob": 0.022401172667741776
+      },
+      {
+        "token_id": 2585,
+        "piece": " How",
+        "norm": "how",
+        "logit": 18.125,
+        "prob": 0.022401172667741776
+      },
+      {
+        "token_id": 3555,
+        "piece": " What",
+        "norm": "what",
+        "logit": 18.125,
+        "prob": 0.022401172667741776
+      },
+      {
+        "token_id": 52366,
+        "piece": " Certainly",
+        "norm": "certainly",
+        "logit": 17.875,
+        "prob": 0.01744605228304863
+      },
+      {
+        "token_id": 2885,
+        "piece": " Data",
+        "norm": "data",
+        "logit": 17.875,
+        "prob": 0.01744605228304863
+      },
+      {
+        "token_id": 15235,
+        "piece": " AI",
+        "norm": "ai",
+        "logit": 17.625,
+        "prob": 0.013586997985839844
+      },
+      {
+        "token_id": 358,
+        "piece": " I",
+        "norm": "i",
+        "logit": 17.5,
+        "prob": 0.011990483850240707
+      }
+    ],
+    "topk_with_prefix": [
+      {
+        "token_id": 22555,
+        "piece": " Sure",
+        "norm": "sure",
+        "logit": 15.9375,
+        "prob": 0.045294053852558136
+      },
+      {
+        "token_id": 55313,
+        "piece": " Quantum",
+        "norm": "quantum",
+        "logit": 15.4375,
+        "prob": 0.027472233399748802
+      },
+      {
+        "token_id": 52366,
+        "piece": " Certainly",
+        "norm": "certainly",
+        "logit": 15.0,
+        "prob": 0.017737405374646187
+      },
+      {
+        "token_id": 5209,
+        "piece": " Please",
+        "norm": "please",
+        "logit": 14.625,
+        "prob": 0.01219072937965393
+      },
+      {
+        "token_id": 30536,
+        "piece": " Climate",
+        "norm": "climate",
+        "logit": 14.25,
+        "prob": 0.008378557860851288
+      },
+      {
+        "token_id": 58194,
+        "piece": " Artificial",
+        "norm": "artificial",
+        "logit": 14.1875,
+        "prob": 0.007870926521718502
+      },
+      {
+        "token_id": 37444,
+        "piece": " Nuclear",
+        "norm": "nuclear",
+        "logit": 14.0625,
+        "prob": 0.0069460682570934296
+      },
+      {
+        "token_id": 18183,
+        "piece": " Deep",
+        "norm": "deep",
+        "logit": 14.0,
+        "prob": 0.0065252273343503475
+      },
+      {
+        "token_id": 2885,
+        "piece": " Data",
+        "norm": "data",
+        "logit": 14.0,
+        "prob": 0.0065252273343503475
+      },
+      {
+        "token_id": 39502,
+        "piece": " Hydro",
+        "norm": "hydro",
+        "logit": 14.0,
+        "prob": 0.0065252273343503475
+      },
+      {
+        "token_id": 12354,
+        "piece": " Energy",
+        "norm": "energy",
+        "logit": 13.9375,
+        "prob": 0.006129883695393801
+      },
+      {
+        "token_id": 60477,
+        "piece": " Neural",
+        "norm": "neural",
+        "logit": 13.875,
+        "prob": 0.005758493207395077
+      }
+    ]
+  },
+  "error": null
+}
+```
+
+## Retrieval Top-K Semantic Shift
+
+```json
+{
+  "passed": false,
+  "music_keywords": [
+    "pianist",
+    "practiced",
+    "arpeggios",
+    "chopin",
+    "nocturnes",
+    "midnight",
+    "musician",
+    "refined",
+    "finger",
+    "technique",
+    "phrasing",
+    "pedal"
+  ],
+  "space_keywords": [
+    "distant",
+    "astronomers",
+    "observed",
+    "galaxies",
+    "quasars",
+    "stellar",
+    "evolution",
+    "space",
+    "orbital",
+    "mechanics",
+    "explains",
+    "satellites"
+  ],
+  "rows": [
+    {
+      "prompt": "A strong explanation should mention",
+      "music_no_prefix": [
+        {
+          "token_id": 279,
+          "piece": " the",
+          "norm": "the",
+          "logit": 21.125,
+          "prob": 0.3049025535583496
+        },
+        {
+          "token_id": 264,
+          "piece": " a",
+          "norm": "a",
+          "logit": 19.5,
+          "prob": 0.06003887206315994
+        },
+        {
+          "token_id": 518,
+          "piece": " at",
+          "norm": "at",
+          "logit": 19.375,
+          "prob": 0.05298411846160889
+        },
+        {
+          "token_id": 3151,
+          "piece": " specific",
+          "norm": "specific",
+          "logit": 19.0,
+          "prob": 0.03641541674733162
+        },
+        {
+          "token_id": 2176,
+          "piece": " both",
+          "norm": "both",
+          "logit": 19.0,
+          "prob": 0.03641541674733162
+        },
+        {
+          "token_id": 429,
+          "piece": " that",
+          "norm": "that",
+          "logit": 18.625,
+          "prob": 0.0250279251486063
+        },
+        {
+          "token_id": 1246,
+          "piece": " how",
+          "norm": "how",
+          "logit": 18.625,
+          "prob": 0.0250279251486063
+        },
+        {
+          "token_id": 678,
+          "piece": " all",
+          "norm": "all",
+          "logit": 18.625,
+          "prob": 0.0250279251486063
+        },
+        {
+          "token_id": 10295,
+          "piece": " examples",
+          "norm": "examples",
+          "logit": 18.5,
+          "prob": 0.022087067365646362
+        },
+        {
+          "token_id": 2326,
+          "piece": " three",
+          "norm": "three",
+          "logit": 18.25,
+          "prob": 0.01720142550766468
+        },
+        {
+          "token_id": 3807,
+          "piece": " several",
+          "norm": "several",
+          "logit": 18.125,
+          "prob": 0.015180204063653946
+        },
+        {
+          "token_id": 1378,
+          "piece": " two",
+          "norm": "two",
+          "logit": 18.125,
+          "prob": 0.015180204063653946
+        }
+      ],
+      "music_with_prefix": [
+        {
+          "token_id": 3151,
+          "piece": " specific",
+          "norm": "specific",
+          "logit": 17.875,
+          "prob": 0.08923931419849396
+        },
+        {
+          "token_id": 10295,
+          "piece": " examples",
+          "norm": "examples",
+          "logit": 17.375,
+          "prob": 0.05412638187408447
+        },
+        {
+          "token_id": 2326,
+          "piece": " three",
+          "norm": "three",
+          "logit": 17.125,
+          "prob": 0.04215366765856743
+        },
+        {
+          "token_id": 3170,
+          "piece": " why",
+          "norm": "why",
+          "logit": 17.0,
+          "prob": 0.037200480699539185
+        },
+        {
+          "token_id": 3807,
+          "piece": " several",
+          "norm": "several",
+          "logit": 16.875,
+          "prob": 0.03282931074500084
+        },
+        {
+          "token_id": 1376,
+          "piece": " key",
+          "norm": "key",
+          "logit": 16.5,
+          "prob": 0.022563232108950615
+        },
+        {
+          "token_id": 5248,
+          "piece": " multiple",
+          "norm": "multiple",
+          "logit": 16.375,
+          "prob": 0.019911982119083405
+        },
+        {
+          "token_id": 5257,
+          "piece": " various",
+          "norm": "various",
+          "logit": 16.25,
+          "prob": 0.01757226325571537
+        },
+        {
+          "token_id": 4650,
+          "piece": " potential",
+          "norm": "potential",
+          "logit": 15.625,
+          "prob": 0.009405754506587982
+        },
+        {
+          "token_id": 3040,
+          "piece": " four",
+          "norm": "four",
+          "logit": 15.4375,
+          "prob": 0.007797644007951021
+        },
+        {
+          "token_id": 3425,
+          "piece": " whether",
+          "norm": "whether",
+          "logit": 15.25,
+          "prob": 0.006464474368840456
+        },
+        {
+          "token_id": 1931,
+          "piece": " real",
+          "norm": "real",
+          "logit": 15.1875,
+          "prob": 0.00607281131669879
+        }
+      ],
+      "music_hits_no": {
+        "match_count": 0,
+        "match_prob_mass": 0,
+        "matches": []
+      },
+      "music_hits_with_prefix": {
+        "match_count": 0,
+        "match_prob_mass": 0,
+        "matches": []
+      },
+      "space_no_prefix": [
+        {
+          "token_id": 279,
+          "piece": " the",
+          "norm": "the",
+          "logit": 21.125,
+          "prob": 0.3049025535583496
+        },
+        {
+          "token_id": 264,
+          "piece": " a",
+          "norm": "a",
+          "logit": 19.5,
+          "prob": 0.06003887206315994
+        },
+        {
+          "token_id": 518,
+          "piece": " at",
+          "norm": "at",
+          "logit": 19.375,
+          "prob": 0.05298411846160889
+        },
+        {
+          "token_id": 3151,
+          "piece": " specific",
+          "norm": "specific",
+          "logit": 19.0,
+          "prob": 0.03641541674733162
+        },
+        {
+          "token_id": 2176,
+          "piece": " both",
+          "norm": "both",
+          "logit": 19.0,
+          "prob": 0.03641541674733162
+        },
+        {
+          "token_id": 429,
+          "piece": " that",
+          "norm": "that",
+          "logit": 18.625,
+          "prob": 0.0250279251486063
+        },
+        {
+          "token_id": 1246,
+          "piece": " how",
+          "norm": "how",
+          "logit": 18.625,
+          "prob": 0.0250279251486063
+        },
+        {
+          "token_id": 678,
+          "piece": " all",
+          "norm": "all",
+          "logit": 18.625,
+          "prob": 0.0250279251486063
+        },
+        {
+          "token_id": 10295,
+          "piece": " examples",
+          "norm": "examples",
+          "logit": 18.5,
+          "prob": 0.022087067365646362
+        },
+        {
+          "token_id": 2326,
+          "piece": " three",
+          "norm": "three",
+          "logit": 18.25,
+          "prob": 0.01720142550766468
+        },
+        {
+          "token_id": 3807,
+          "piece": " several",
+          "norm": "several",
+          "logit": 18.125,
+          "prob": 0.015180204063653946
+        },
+        {
+          "token_id": 1378,
+          "piece": " two",
+          "norm": "two",
+          "logit": 18.125,
+          "prob": 0.015180204063653946
+        }
+      ],
+      "space_with_prefix": [
+        {
+          "token_id": 3151,
+          "piece": " specific",
+          "norm": "specific",
+          "logit": 18.125,
+          "prob": 0.11810589581727982
+        },
+        {
+          "token_id": 10295,
+          "piece": " examples",
+          "norm": "examples",
+          "logit": 17.125,
+          "prob": 0.04344873130321503
+        },
+        {
+          "token_id": 3807,
+          "piece": " several",
+          "norm": "several",
+          "logit": 17.0,
+          "prob": 0.03834336996078491
+        },
+        {
+          "token_id": 3170,
+          "piece": " why",
+          "norm": "why",
+          "logit": 16.875,
+          "prob": 0.03383790701627731
+        },
+        {
+          "token_id": 2326,
+          "piece": " three",
+          "norm": "three",
+          "logit": 16.875,
+          "prob": 0.03383790701627731
+        },
+        {
+          "token_id": 1376,
+          "piece": " key",
+          "norm": "key",
+          "logit": 16.5,
+          "prob": 0.02325643040239811
+        },
+        {
+          "token_id": 5257,
+          "piece": " various",
+          "norm": "various",
+          "logit": 16.25,
+          "prob": 0.018112126737833023
+        },
+        {
+          "token_id": 5248,
+          "piece": " multiple",
+          "norm": "multiple",
+          "logit": 16.25,
+          "prob": 0.018112126737833023
+        },
+        {
+          "token_id": 3460,
+          "piece": " large",
+          "norm": "large",
+          "logit": 15.5,
+          "prob": 0.008555563166737556
+        },
+        {
+          "token_id": 3425,
+          "piece": " whether",
+          "norm": "whether",
+          "logit": 15.5,
+          "prob": 0.008555563166737556
+        },
+        {
+          "token_id": 4650,
+          "piece": " potential",
+          "norm": "potential",
+          "logit": 15.4375,
+          "prob": 0.008037206716835499
+        },
+        {
+          "token_id": 5904,
+          "piece": " evidence",
+          "norm": "evidence",
+          "logit": 15.1875,
+          "prob": 0.006259383168071508
+        }
+      ],
+      "space_hits_no": {
+        "match_count": 0,
+        "match_prob_mass": 0,
+        "matches": []
+      },
+      "space_hits_with_prefix": {
+        "match_count": 0,
+        "match_prob_mass": 0,
+        "matches": []
+      },
+      "passed": false
+    },
+    {
+      "prompt": "The most relevant idea is",
+      "music_no_prefix": [
+        {
+          "token_id": 429,
+          "piece": " that",
+          "norm": "that",
+          "logit": 20.25,
+          "prob": 0.2765631675720215
+        },
+        {
+          "token_id": 279,
+          "piece": " the",
+          "norm": "the",
+          "logit": 19.125,
+          "prob": 0.08978691697120667
+        },
+        {
+          "token_id": 25,
+          "piece": ":",
+          "norm": "",
+          "logit": 19.0,
+          "prob": 0.07923667877912521
+        },
+        {
+          "token_id": 311,
+          "piece": " to",
+          "norm": "to",
+          "logit": 18.25,
+          "prob": 0.037428755313158035
+        },
+        {
+          "token_id": 30743,
+          "piece": " ____",
+          "norm": "",
+          "logit": 18.0,
+          "prob": 0.02914954163134098
+        },
+        {
+          "token_id": 510,
+          "piece": ":\n",
+          "norm": "",
+          "logit": 18.0,
+          "prob": 0.02914954163134098
+        },
+        {
+          "token_id": 1304,
+          "piece": " __",
+          "norm": "",
+          "logit": 17.5,
+          "prob": 0.01768009178340435
+        },
+        {
+          "token_id": 32671,
+          "piece": " ______",
+          "norm": "",
+          "logit": 17.5,
+          "prob": 0.01768009178340435
+        },
+        {
+          "token_id": 1447,
+          "piece": ":\n\n",
+          "norm": "",
+          "logit": 17.375,
+          "prob": 0.015602625906467438
+        },
+        {
+          "token_id": 537,
+          "piece": " not",
+          "norm": "not",
+          "logit": 17.25,
+          "prob": 0.013769268989562988
+        },
+        {
+          "token_id": 330,
+          "piece": " \"",
+          "norm": "",
+          "logit": 17.25,
+          "prob": 0.013769268989562988
+        },
+        {
+          "token_id": 320,
+          "piece": " (",
+          "norm": "",
+          "logit": 17.125,
+          "prob": 0.012151338160037994
+        }
+      ],
+      "music_with_prefix": [
+        {
+          "token_id": 4658,
+          "piece": " probably",
+          "norm": "probably",
+          "logit": 16.0,
+          "prob": 0.035965967923402786
+        },
+        {
+          "token_id": 3118,
+          "piece": " based",
+          "norm": "based",
+          "logit": 15.625,
+          "prob": 0.02471902407705784
+        },
+        {
+          "token_id": 4363,
+          "piece": " likely",
+          "norm": "likely",
+          "logit": 15.5625,
+          "prob": 0.023221375420689583
+        },
+        {
+          "token_id": 5435,
+          "piece": " related",
+          "norm": "related",
+          "logit": 15.3125,
+          "prob": 0.018084824085235596
+        },
+        {
+          "token_id": 2677,
+          "piece": " always",
+          "norm": "always",
+          "logit": 15.25,
+          "prob": 0.016989119350910187
+        },
+        {
+          "token_id": 3545,
+          "piece": " often",
+          "norm": "often",
+          "logit": 15.0,
+          "prob": 0.013231140561401844
+        },
+        {
+          "token_id": 5990,
+          "piece": " usually",
+          "norm": "usually",
+          "logit": 14.9375,
+          "prob": 0.01242950651794672
+        },
+        {
+          "token_id": 2661,
+          "piece": " given",
+          "norm": "given",
+          "logit": 14.9375,
+          "prob": 0.01242950651794672
+        },
+        {
+          "token_id": 2999,
+          "piece": " option",
+          "norm": "option",
+          "logit": 14.6875,
+          "prob": 0.009680109098553658
+        },
+        {
+          "token_id": 9355,
+          "piece": " clearly",
+          "norm": "clearly",
+          "logit": 14.6875,
+          "prob": 0.009680109098553658
+        },
+        {
+          "token_id": 4396,
+          "piece": " correct",
+          "norm": "correct",
+          "logit": 14.6875,
+          "prob": 0.009680109098553658
+        },
+        {
+          "token_id": 3520,
+          "piece": " actually",
+          "norm": "actually",
+          "logit": 14.3125,
+          "prob": 0.0066530355252325535
+        }
+      ],
+      "music_hits_no": {
+        "match_count": 0,
+        "match_prob_mass": 0,
+        "matches": []
+      },
+      "music_hits_with_prefix": {
+        "match_count": 0,
+        "match_prob_mass": 0,
+        "matches": []
+      },
+      "space_no_prefix": [
+        {
+          "token_id": 429,
+          "piece": " that",
+          "norm": "that",
+          "logit": 20.25,
+          "prob": 0.2765631675720215
+        },
+        {
+          "token_id": 279,
+          "piece": " the",
+          "norm": "the",
+          "logit": 19.125,
+          "prob": 0.08978691697120667
+        },
+        {
+          "token_id": 25,
+          "piece": ":",
+          "norm": "",
+          "logit": 19.0,
+          "prob": 0.07923667877912521
+        },
+        {
+          "token_id": 311,
+          "piece": " to",
+          "norm": "to",
+          "logit": 18.25,
+          "prob": 0.037428755313158035
+        },
+        {
+          "token_id": 30743,
+          "piece": " ____",
+          "norm": "",
+          "logit": 18.0,
+          "prob": 0.02914954163134098
+        },
+        {
+          "token_id": 510,
+          "piece": ":\n",
+          "norm": "",
+          "logit": 18.0,
+          "prob": 0.02914954163134098
+        },
+        {
+          "token_id": 1304,
+          "piece": " __",
+          "norm": "",
+          "logit": 17.5,
+          "prob": 0.01768009178340435
+        },
+        {
+          "token_id": 32671,
+          "piece": " ______",
+          "norm": "",
+          "logit": 17.5,
+          "prob": 0.01768009178340435
+        },
+        {
+          "token_id": 1447,
+          "piece": ":\n\n",
+          "norm": "",
+          "logit": 17.375,
+          "prob": 0.015602625906467438
+        },
+        {
+          "token_id": 537,
+          "piece": " not",
+          "norm": "not",
+          "logit": 17.25,
+          "prob": 0.013769268989562988
+        },
+        {
+          "token_id": 330,
+          "piece": " \"",
+          "norm": "",
+          "logit": 17.25,
+          "prob": 0.013769268989562988
+        },
+        {
+          "token_id": 320,
+          "piece": " (",
+          "norm": "",
+          "logit": 17.125,
+          "prob": 0.012151338160037994
+        }
+      ],
+      "space_with_prefix": [
+        {
+          "token_id": 5990,
+          "piece": " usually",
+          "norm": "usually",
+          "logit": 15.625,
+          "prob": 0.024161575362086296
+        },
+        {
+          "token_id": 2677,
+          "piece": " always",
+          "norm": "always",
+          "logit": 15.625,
+          "prob": 0.024161575362086296
+        },
+        {
+          "token_id": 3545,
+          "piece": " often",
+          "norm": "often",
+          "logit": 15.625,
+          "prob": 0.024161575362086296
+        },
+        {
+          "token_id": 4658,
+          "piece": " probably",
+          "norm": "probably",
+          "logit": 15.4375,
+          "prob": 0.02003064937889576
+        },
+        {
+          "token_id": 3118,
+          "piece": " based",
+          "norm": "based",
+          "logit": 15.375,
+          "prob": 0.018817054107785225
+        },
+        {
+          "token_id": 4363,
+          "piece": " likely",
+          "norm": "likely",
+          "logit": 15.375,
+          "prob": 0.018817054107785225
+        },
+        {
+          "token_id": 2661,
+          "piece": " given",
+          "norm": "given",
+          "logit": 15.0625,
+          "prob": 0.013766851276159286
+        },
+        {
+          "token_id": 5435,
+          "piece": " related",
+          "norm": "related",
+          "logit": 15.0,
+          "prob": 0.012932759709656239
+        },
+        {
+          "token_id": 10449,
+          "piece": " presented",
+          "norm": "presented",
+          "logit": 14.875,
+          "prob": 0.011413119733333588
+        },
+        {
+          "token_id": 6839,
+          "piece": " shown",
+          "norm": "shown",
+          "logit": 14.8125,
+          "prob": 0.010721634142100811
+        },
+        {
+          "token_id": 15251,
+          "piece": " represented",
+          "norm": "represented",
+          "logit": 14.75,
+          "prob": 0.010072043165564537
+        },
+        {
+          "token_id": 9355,
+          "piece": " clearly",
+          "norm": "clearly",
+          "logit": 14.6875,
+          "prob": 0.009461808949708939
+        }
+      ],
+      "space_hits_no": {
+        "match_count": 0,
+        "match_prob_mass": 0,
+        "matches": []
+      },
+      "space_hits_with_prefix": {
+        "match_count": 0,
+        "match_prob_mass": 0,
+        "matches": []
+      },
+      "passed": false
+    }
+  ],
+  "error": null
+}
+```
+
+## Repetition Segment Audit
+
+```json
+{
+  "passed": true,
+  "aggregate": {
+    "bad_segment_ratio": 0.0,
+    "total_segments": 24,
+    "bad_segments": 0,
+    "early_collapse_prompts": []
+  },
+  "rows": [
+    {
+      "prompt": "The pianist",
+      "output": "The pianist pian piano pian pianette pian plays Chop Chop Chop hours piano piano hours pian piano perfect hours Chop hours perfect Chop midnight hours midnight perfect perfect midnight midnight pian perfect noct noct noct midnight noct pian noct Chop piano Chop perfect piano midnight Chop pian hours noct",
+      "generated_token_count": 47,
+      "window": 8,
+      "segments": [
+        {
+          "segment_idx": 0,
+          "tokens": [
+            "pian",
+            "piano",
+            "pian",
+            "pianette",
+            "pian",
+            "plays",
+            "chop",
+            "chop"
+          ],
+          "unique_ratio": 0.625,
+          "content_ratio": 1.0,
+          "repeated_bigram_ratio": 0.0,
+          "dominant_token_share": 0.375
+        },
+        {
+          "segment_idx": 1,
+          "tokens": [
+            "chop",
+            "hours",
+            "piano",
+            "piano",
+            "hours",
+            "pian",
+            "piano",
+            "perfect"
+          ],
+          "unique_ratio": 0.625,
+          "content_ratio": 0.75,
+          "repeated_bigram_ratio": 0.0,
+          "dominant_token_share": 0.375
+        },
+        {
+          "segment_idx": 2,
+          "tokens": [
+            "hours",
+            "chop",
+            "hours",
+            "perfect",
+            "chop",
+            "midnight",
+            "hours",
+            "midnight"
+          ],
+          "unique_ratio": 0.5,
+          "content_ratio": 0.625,
+          "repeated_bigram_ratio": 0.0,
+          "dominant_token_share": 0.375
+        },
+        {
+          "segment_idx": 3,
+          "tokens": [
+            "perfect",
+            "perfect",
+            "midnight",
+            "midnight",
+            "pian",
+            "perfect",
+            "noct",
+            "noct"
+          ],
+          "unique_ratio": 0.5,
+          "content_ratio": 1.0,
+          "repeated_bigram_ratio": 0.0,
+          "dominant_token_share": 0.375
+        },
+        {
+          "segment_idx": 4,
+          "tokens": [
+            "noct",
+            "midnight",
+            "noct",
+            "pian",
+            "noct",
+            "chop",
+            "piano",
+            "chop"
+          ],
+          "unique_ratio": 0.625,
+          "content_ratio": 1.0,
+          "repeated_bigram_ratio": 0.0,
+          "dominant_token_share": 0.375
+        },
+        {
+          "segment_idx": 5,
+          "tokens": [
+            "perfect",
+            "piano",
+            "midnight",
+            "chop",
+            "pian",
+            "hours",
+            "noct"
+          ],
+          "unique_ratio": 1.0,
+          "content_ratio": 0.8571428571428571,
+          "repeated_bigram_ratio": 0.0,
+          "dominant_token_share": 0.14285714285714285
+        }
+      ],
+      "bad_segments": [],
+      "first_bad_segment_idx": null
+    },
+    {
+      "prompt": "The telescope",
+      "output": "The telescope telescope stars telescopestarsStars amazing amazed telescope captured telescope stars stars captured stars distant telescope signatures captured captured distant captured nebula distant signatures signatures neb neb captured signatures spectral neb spectral spectral neb spectral stars neb signatures distant distant spectral signatures Space telescope neb stars spectral",
+      "generated_token_count": 45,
+      "window": 8,
+      "segments": [
+        {
+          "segment_idx": 0,
+          "tokens": [
+            "telescope",
+            "stars",
+            "telescopestarsstars",
+            "amazing",
+            "amazed",
+            "telescope",
+            "captured",
+            "telescope"
+          ],
+          "unique_ratio": 0.75,
+          "content_ratio": 1.0,
+          "repeated_bigram_ratio": 0.0,
+          "dominant_token_share": 0.375
+        },
+        {
+          "segment_idx": 1,
+          "tokens": [
+            "stars",
+            "stars",
+            "captured",
+            "stars",
+            "distant",
+            "telescope",
+            "signatures",
+            "captured"
+          ],
+          "unique_ratio": 0.625,
+          "content_ratio": 1.0,
+          "repeated_bigram_ratio": 0.0,
+          "dominant_token_share": 0.375
+        },
+        {
+          "segment_idx": 2,
+          "tokens": [
+            "captured",
+            "distant",
+            "captured",
+            "nebula",
+            "distant",
+            "signatures",
+            "signatures",
+            "neb"
+          ],
+          "unique_ratio": 0.625,
+          "content_ratio": 0.875,
+          "repeated_bigram_ratio": 0.0,
+          "dominant_token_share": 0.25
+        },
+        {
+          "segment_idx": 3,
+          "tokens": [
+            "neb",
+            "captured",
+            "signatures",
+            "spectral",
+            "neb",
+            "spectral",
+            "spectral",
+            "neb"
+          ],
+          "unique_ratio": 0.5,
+          "content_ratio": 0.625,
+          "repeated_bigram_ratio": 0.14285714285714285,
+          "dominant_token_share": 0.375
+        },
+        {
+          "segment_idx": 4,
+          "tokens": [
+            "spectral",
+            "stars",
+            "neb",
+            "signatures",
+            "distant",
+            "distant",
+            "spectral",
+            "signatures"
+          ],
+          "unique_ratio": 0.625,
+          "content_ratio": 0.875,
+          "repeated_bigram_ratio": 0.0,
+          "dominant_token_share": 0.25
+        },
+        {
+          "segment_idx": 5,
+          "tokens": [
+            "space",
+            "telescope",
+            "neb",
+            "stars",
+            "spectral"
+          ],
+          "unique_ratio": 1.0,
+          "content_ratio": 0.8,
+          "repeated_bigram_ratio": 0.0,
+          "dominant_token_share": 0.2
+        }
+      ],
+      "bad_segments": [],
+      "first_bad_segment_idx": null
+    },
+    {
+      "prompt": "The market analyst",
+      "output": "The market analyst market session sessessionssesess market market session session significant market volatility experienced stock market stock significant volatility experienced significant stock volatility significant session stock session volatility experienced volatility stock experienced session significant Market analysts often closely monitor market sessions involving significant events, particularly stock markets",
+      "generated_token_count": 44,
+      "window": 8,
+      "segments": [
+        {
+          "segment_idx": 0,
+          "tokens": [
+            "market",
+            "session",
+            "sessessionssesess",
+            "market",
+            "market",
+            "session",
+            "session",
+            "significant"
+          ],
+          "unique_ratio": 0.5,
+          "content_ratio": 0.625,
+          "repeated_bigram_ratio": 0.14285714285714285,
+          "dominant_token_share": 0.375
+        },
+        {
+          "segment_idx": 1,
+          "tokens": [
+            "market",
+            "volatility",
+            "experienced",
+            "stock",
+            "market",
+            "stock",
+            "significant",
+            "volatility"
+          ],
+          "unique_ratio": 0.625,
+          "content_ratio": 1.0,
+          "repeated_bigram_ratio": 0.0,
+          "dominant_token_share": 0.25
+        },
+        {
+          "segment_idx": 2,
+          "tokens": [
+            "experienced",
+            "significant",
+            "stock",
+            "volatility",
+            "significant",
+            "session",
+            "stock",
+            "session"
+          ],
+          "unique_ratio": 0.625,
+          "content_ratio": 0.75,
+          "repeated_bigram_ratio": 0.0,
+          "dominant_token_share": 0.25
+        },
+        {
+          "segment_idx": 3,
+          "tokens": [
+            "volatility",
+            "experienced",
+            "volatility",
+            "stock",
+            "experienced",
+            "session",
+            "significant",
+            "market"
+          ],
+          "unique_ratio": 0.75,
+          "content_ratio": 0.875,
+          "repeated_bigram_ratio": 0.0,
+          "dominant_token_share": 0.25
+        },
+        {
+          "segment_idx": 4,
+          "tokens": [
+            "analysts",
+            "often",
+            "closely",
+            "monitor",
+            "market",
+            "sessions",
+            "involving",
+            "significant"
+          ],
+          "unique_ratio": 1.0,
+          "content_ratio": 0.875,
+          "repeated_bigram_ratio": 0.0,
+          "dominant_token_share": 0.125
+        },
+        {
+          "segment_idx": 5,
+          "tokens": [
+            "events",
+            "particularly",
+            "stock",
+            "markets"
+          ],
+          "unique_ratio": 1.0,
+          "content_ratio": 1.0,
+          "repeated_bigram_ratio": 0.0,
+          "dominant_token_share": 0.25
+        }
+      ],
+      "bad_segments": [],
+      "first_bad_segment_idx": null
+    },
+    {
+      "prompt": "Explain the topic clearly",
+      "output": "Explain the topic clearly simple explained simple simple analog simple rel everyday rel professor Professor explained explained analog explained rel Force professor everyday analog professor rel everyday professor analog everyday analog rel simpleForce professor professor explained professor simple everyday explained everyday simple professor rel rel analog analog FORCE rel explainedFORCE",
+      "generated_token_count": 46,
+      "window": 8,
+      "segments": [
+        {
+          "segment_idx": 0,
+          "tokens": [
+            "simple",
+            "explained",
+            "simple",
+            "simple",
+            "analog",
+            "simple",
+            "rel",
+            "everyday"
+          ],
+          "unique_ratio": 0.625,
+          "content_ratio": 0.375,
+          "repeated_bigram_ratio": 0.0,
+          "dominant_token_share": 0.5
+        },
+        {
+          "segment_idx": 1,
+          "tokens": [
+            "rel",
+            "professor",
+            "professor",
+            "explained",
+            "explained",
+            "analog",
+            "explained",
+            "rel"
+          ],
+          "unique_ratio": 0.5,
+          "content_ratio": 0.75,
+          "repeated_bigram_ratio": 0.0,
+          "dominant_token_share": 0.375
+        },
+        {
+          "segment_idx": 2,
+          "tokens": [
+            "force",
+            "professor",
+            "everyday",
+            "analog",
+            "professor",
+            "rel",
+            "everyday",
+            "professor"
+          ],
+          "unique_ratio": 0.625,
+          "content_ratio": 0.875,
+          "repeated_bigram_ratio": 0.0,
+          "dominant_token_share": 0.375
+        },
+        {
+          "segment_idx": 3,
+          "tokens": [
+            "analog",
+            "everyday",
+            "analog",
+            "rel",
+            "simpleforce",
+            "professor",
+            "professor",
+            "explained"
+          ],
+          "unique_ratio": 0.75,
+          "content_ratio": 0.875,
+          "repeated_bigram_ratio": 0.0,
+          "dominant_token_share": 0.25
+        },
+        {
+          "segment_idx": 4,
+          "tokens": [
+            "professor",
+            "simple",
+            "everyday",
+            "explained",
+            "everyday",
+            "simple",
+            "professor",
+            "rel"
+          ],
+          "unique_ratio": 0.625,
+          "content_ratio": 0.625,
+          "repeated_bigram_ratio": 0.0,
+          "dominant_token_share": 0.25
+        },
+        {
+          "segment_idx": 5,
+          "tokens": [
+            "rel",
+            "analog",
+            "analog",
+            "force",
+            "rel",
+            "explainedforce"
+          ],
+          "unique_ratio": 0.6666666666666666,
+          "content_ratio": 0.6666666666666666,
+          "repeated_bigram_ratio": 0.0,
+          "dominant_token_share": 0.3333333333333333
+        }
+      ],
+      "bad_segments": [],
+      "first_bad_segment_idx": null
+    }
+  ],
+  "error": null
+}
+```
+
+## Prefix Stepwise Drift Trajectory
+
+```json
+{
+  "passed": true,
+  "rows": [
+    {
+      "prompt": "Key piano ideas include",
+      "first_bad_step": 4,
+      "decoded_output": "Key piano ideas include leg movements across keys, dynamic changes, and the use of the pedal. These",
+      "rows": [
+        {
+          "step": 0,
+          "top1": {
+            "token_id": 3598,
+            "piece": " major",
+            "norm": "major",
+            "logit": 16.25,
+            "prob": 0.026983050629496574
+          },
+          "top1_category": "semantic",
+          "topk_category_counts": {
+            "semantic": 11,
+            "functional": 1,
+            "punct": 0
+          },
+          "topk_category_prob_mass": {
+            "semantic": 0.18486935831606388,
+            "functional": 0.026983050629496574,
+            "punct": 0.0
+          },
+          "chosen_token_id": 2472,
+          "chosen_piece": " leg",
+          "chosen_norm": "leg",
+          "chosen_category": "functional"
+        },
+        {
+          "step": 1,
+          "top1": {
+            "token_id": 19029,
+            "piece": " movements",
+            "norm": "movements",
+            "logit": 14.375,
+            "prob": 0.13023822009563446
+          },
+          "top1_category": "semantic",
+          "topk_category_counts": {
+            "semantic": 11,
+            "functional": 1,
+            "punct": 0
+          },
+          "topk_category_prob_mass": {
+            "semantic": 0.3965669944882393,
+            "functional": 0.0113800885155797,
+            "punct": 0.0
+          },
+          "chosen_token_id": 19029,
+          "chosen_piece": " movements",
+          "chosen_norm": "movements",
+          "chosen_category": "semantic"
+        },
+        {
+          "step": 2,
+          "top1": {
+            "token_id": 3941,
+            "piece": " across",
+            "norm": "across",
+            "logit": 16.5,
+            "prob": 0.05107051879167557
+          },
+          "top1_category": "functional",
+          "topk_category_counts": {
+            "semantic": 10,
+            "functional": 2,
+            "punct": 0
+          },
+          "topk_category_prob_mass": {
+            "semantic": 0.2263985425233841,
+            "functional": 0.0767503883689642,
+            "punct": 0.0
+          },
+          "chosen_token_id": 3941,
+          "chosen_piece": " across",
+          "chosen_norm": "across",
+          "chosen_category": "functional"
+        },
+        {
+          "step": 3,
+          "top1": {
+            "token_id": 6894,
+            "piece": " keys",
+            "norm": "keys",
+            "logit": 18.5,
+            "prob": 0.09729984402656555
+          },
+          "top1_category": "semantic",
+          "topk_category_counts": {
+            "semantic": 10,
+            "functional": 2,
+            "punct": 0
+          },
+          "topk_category_prob_mass": {
+            "semantic": 0.40497455187141895,
+            "functional": 0.04631178267300129,
+            "punct": 0.0
+          },
+          "chosen_token_id": 6894,
+          "chosen_piece": " keys",
+          "chosen_norm": "keys",
+          "chosen_category": "semantic"
+        },
+        {
+          "step": 4,
+          "top1": {
+            "token_id": 11,
+            "piece": ",",
+            "norm": "",
+            "logit": 21.125,
+            "prob": 0.6922075748443604
+          },
+          "top1_category": "punct",
+          "topk_category_counts": {
+            "semantic": 1,
+            "functional": 0,
+            "punct": 11
+          },
+          "topk_category_prob_mass": {
+            "semantic": 0.004116016905754805,
+            "functional": 0.0,
+            "punct": 0.8863428700715303
+          },
+          "chosen_token_id": 11,
+          "chosen_piece": ",",
+          "chosen_norm": "",
+          "chosen_category": "punct"
+        },
+        {
+          "step": 5,
+          "top1": {
+            "token_id": 8741,
+            "piece": " dynamic",
+            "norm": "dynamic",
+            "logit": 17.625,
+            "prob": 0.03767668455839157
+          },
+          "top1_category": "semantic",
+          "topk_category_counts": {
+            "semantic": 10,
+            "functional": 2,
+            "punct": 0
+          },
+          "topk_category_prob_mass": {
+            "semantic": 0.1940950881689787,
+            "functional": 0.04548138566315174,
+            "punct": 0.0
+          },
+          "chosen_token_id": 8741,
+          "chosen_piece": " dynamic",
+          "chosen_norm": "dynamic",
+          "chosen_category": "semantic"
+        },
+        {
+          "step": 6,
+          "top1": {
+            "token_id": 4344,
+            "piece": " changes",
+            "norm": "changes",
+            "logit": 21.75,
+            "prob": 0.42921698093414307
+          },
+          "top1_category": "semantic",
+          "topk_category_counts": {
+            "semantic": 11,
+            "functional": 0,
+            "punct": 1
+          },
+          "topk_category_prob_mass": {
+            "semantic": 0.8407482951879501,
+            "functional": 0.0,
+            "punct": 0.008908114396035671
+          },
+          "chosen_token_id": 4344,
+          "chosen_piece": " changes",
+          "chosen_norm": "changes",
+          "chosen_category": "semantic"
+        },
+        {
+          "step": 7,
+          "top1": {
+            "token_id": 11,
+            "piece": ",",
+            "norm": "",
+            "logit": 25.375,
+            "prob": 0.9306752681732178
+          },
+          "top1_category": "punct",
+          "topk_category_counts": {
+            "semantic": 5,
+            "functional": 2,
+            "punct": 5
+          },
+          "topk_category_prob_mass": {
+            "semantic": 0.0230137127218768,
+            "functional": 0.005398477369453758,
+            "punct": 0.961544852994848
+          },
+          "chosen_token_id": 11,
+          "chosen_piece": ",",
+          "chosen_norm": "",
+          "chosen_category": "punct"
+        },
+        {
+          "step": 8,
+          "top1": {
+            "token_id": 323,
+            "piece": " and",
+            "norm": "and",
+            "logit": 20.25,
+            "prob": 0.4670189321041107
+          },
+          "top1_category": "functional",
+          "topk_category_counts": {
+            "semantic": 9,
+            "functional": 3,
+            "punct": 0
+          },
+          "topk_category_prob_mass": {
+            "semantic": 0.1295861303806305,
+            "functional": 0.5177998133003712,
+            "punct": 0.0
+          },
+          "chosen_token_id": 323,
+          "chosen_piece": " and",
+          "chosen_norm": "and",
+          "chosen_category": "functional"
+        },
+        {
+          "step": 9,
+          "top1": {
+            "token_id": 279,
+            "piece": " the",
+            "norm": "the",
+            "logit": 18.625,
+            "prob": 0.1194610446691513
+          },
+          "top1_category": "functional",
+          "topk_category_counts": {
+            "semantic": 9,
+            "functional": 3,
+            "punct": 0
+          },
+          "topk_category_prob_mass": {
+            "semantic": 0.18513815943151712,
+            "functional": 0.21467376872897148,
+            "punct": 0.0
+          },
+          "chosen_token_id": 279,
+          "chosen_piece": " the",
+          "chosen_norm": "the",
+          "chosen_category": "functional"
+        },
+        {
+          "step": 10,
+          "top1": {
+            "token_id": 990,
+            "piece": " use",
+            "norm": "use",
+            "logit": 19.75,
+            "prob": 0.22168958187103271
+          },
+          "top1_category": "functional",
+          "topk_category_counts": {
+            "semantic": 10,
+            "functional": 2,
+            "punct": 0
+          },
+          "topk_category_prob_mass": {
+            "semantic": 0.13133995607495308,
+            "functional": 0.24505549110472202,
+            "punct": 0.0
+          },
+          "chosen_token_id": 990,
+          "chosen_piece": " use",
+          "chosen_norm": "use",
+          "chosen_category": "functional"
+        },
+        {
+          "step": 11,
+          "top1": {
+            "token_id": 315,
+            "piece": " of",
+            "norm": "of",
+            "logit": 25.0,
+            "prob": 0.9930819869041443
+          },
+          "top1_category": "functional",
+          "topk_category_counts": {
+            "semantic": 1,
+            "functional": 6,
+            "punct": 5
+          },
+          "topk_category_prob_mass": {
+            "semantic": 0.00010160254169022664,
+            "functional": 0.9945033092226367,
+            "punct": 0.00101397221442312
+          },
+          "chosen_token_id": 315,
+          "chosen_piece": " of",
+          "chosen_norm": "of",
+          "chosen_category": "functional"
+        },
+        {
+          "step": 12,
+          "top1": {
+            "token_id": 279,
+            "piece": " the",
+            "norm": "the",
+            "logit": 19.125,
+            "prob": 0.09505932033061981
+          },
+          "top1_category": "functional",
+          "topk_category_counts": {
+            "semantic": 8,
+            "functional": 4,
+            "punct": 0
+          },
+          "topk_category_prob_mass": {
+            "semantic": 0.21602829732000828,
+            "functional": 0.17841206304728985,
+            "punct": 0.0
+          },
+          "chosen_token_id": 279,
+          "chosen_piece": " the",
+          "chosen_norm": "the",
+          "chosen_category": "functional"
+        },
+        {
+          "step": 13,
+          "top1": {
+            "token_id": 48601,
+            "piece": " pedal",
+            "norm": "pedal",
+            "logit": 18.375,
+            "prob": 0.0746825560927391
+          },
+          "top1_category": "semantic",
+          "topk_category_counts": {
+            "semantic": 9,
+            "functional": 3,
+            "punct": 0
+          },
+          "topk_category_prob_mass": {
+            "semantic": 0.42089940421283245,
+            "functional": 0.09426561277359724,
+            "punct": 0.0
+          },
+          "chosen_token_id": 48601,
+          "chosen_piece": " pedal",
+          "chosen_norm": "pedal",
+          "chosen_category": "semantic"
+        },
+        {
+          "step": 14,
+          "top1": {
+            "token_id": 13,
+            "piece": ".",
+            "norm": "",
+            "logit": 20.5,
+            "prob": 0.38581112027168274
+          },
+          "top1_category": "punct",
+          "topk_category_counts": {
+            "semantic": 0,
+            "functional": 5,
+            "punct": 7
+          },
+          "topk_category_prob_mass": {
+            "semantic": 0.0,
+            "functional": 0.2004851959645748,
+            "punct": 0.6528554670512676
+          },
+          "chosen_token_id": 13,
+          "chosen_piece": ".",
+          "chosen_norm": "",
+          "chosen_category": "punct"
+        },
+        {
+          "step": 15,
+          "top1": {
+            "token_id": 4220,
+            "piece": " These",
+            "norm": "these",
+            "logit": 13.4375,
+            "prob": 0.07124418765306473
+          },
+          "top1_category": "semantic",
+          "topk_category_counts": {
+            "semantic": 2,
+            "functional": 5,
+            "punct": 5
+          },
+          "topk_category_prob_mass": {
+            "semantic": 0.08816616423428059,
+            "functional": 0.15614240616559982,
+            "punct": 0.11336426809430122
+          },
+          "chosen_token_id": 4220,
+          "chosen_piece": " These",
+          "chosen_norm": "these",
+          "chosen_category": "semantic"
+        }
+      ],
+      "passed": true
+    },
+    {
+      "prompt": "Explain the topic clearly",
+      "first_bad_step": 4,
+      "decoded_output": "Explain the topic clearly based upon given context.  \"explain the topic\" is a phrase that means",
+      "rows": [
+        {
+          "step": 0,
+          "top1": {
+            "token_id": 3118,
+            "piece": " based",
+            "norm": "based",
+            "logit": 14.1875,
+            "prob": 0.17047074437141418
+          },
+          "top1_category": "semantic",
+          "topk_category_counts": {
+            "semantic": 11,
+            "functional": 1,
+            "punct": 0
+          },
+          "topk_category_prob_mass": {
+            "semantic": 0.42534564854577184,
+            "functional": 0.031533919274806976,
+            "punct": 0.0
+          },
+          "chosen_token_id": 3118,
+          "chosen_piece": " based",
+          "chosen_norm": "based",
+          "chosen_category": "semantic"
+        },
+        {
+          "step": 1,
+          "top1": {
+            "token_id": 5193,
+            "piece": " upon",
+            "norm": "upon",
+            "logit": 17.5,
+            "prob": 0.12673600018024445
+          },
+          "top1_category": "semantic",
+          "topk_category_counts": {
+            "semantic": 12,
+            "functional": 0,
+            "punct": 0
+          },
+          "topk_category_prob_mass": {
+            "semantic": 0.4612283743917942,
+            "functional": 0.0,
+            "punct": 0.0
+          },
+          "chosen_token_id": 5193,
+          "chosen_piece": " upon",
+          "chosen_norm": "upon",
+          "chosen_category": "semantic"
+        },
+        {
+          "step": 2,
+          "top1": {
+            "token_id": 2661,
+            "piece": " given",
+            "norm": "given",
+            "logit": 19.75,
+            "prob": 0.23131124675273895
+          },
+          "top1_category": "semantic",
+          "topk_category_counts": {
+            "semantic": 12,
+            "functional": 0,
+            "punct": 0
+          },
+          "topk_category_prob_mass": {
+            "semantic": 0.5242105945944786,
+            "functional": 0.0,
+            "punct": 0.0
+          },
+          "chosen_token_id": 2661,
+          "chosen_piece": " given",
+          "chosen_norm": "given",
+          "chosen_category": "semantic"
+        },
+        {
+          "step": 3,
+          "top1": {
+            "token_id": 2266,
+            "piece": " context",
+            "norm": "context",
+            "logit": 21.625,
+            "prob": 0.27016517519950867
+          },
+          "top1_category": "semantic",
+          "topk_category_counts": {
+            "semantic": 12,
+            "functional": 0,
+            "punct": 0
+          },
+          "topk_category_prob_mass": {
+            "semantic": 0.780865266919136,
+            "functional": 0.0,
+            "punct": 0.0
+          },
+          "chosen_token_id": 2266,
+          "chosen_piece": " context",
+          "chosen_norm": "context",
+          "chosen_category": "semantic"
+        },
+        {
+          "step": 4,
+          "top1": {
+            "token_id": 13,
+            "piece": ".",
+            "norm": "",
+            "logit": 20.375,
+            "prob": 0.28195127844810486
+          },
+          "top1_category": "punct",
+          "topk_category_counts": {
+            "semantic": 0,
+            "functional": 0,
+            "punct": 12
+          },
+          "topk_category_prob_mass": {
+            "semantic": 0.0,
+            "functional": 0.0,
+            "punct": 0.9160851284395903
+          },
+          "chosen_token_id": 13,
+          "chosen_piece": ".",
+          "chosen_norm": "",
+          "chosen_category": "punct"
+        },
+        {
+          "step": 5,
+          "top1": {
+            "token_id": 220,
+            "piece": " ",
+            "norm": "",
+            "logit": 16.625,
+            "prob": 0.04581373557448387
+          },
+          "top1_category": "punct",
+          "topk_category_counts": {
+            "semantic": 7,
+            "functional": 0,
+            "punct": 5
+          },
+          "topk_category_prob_mass": {
+            "semantic": 0.16006913781166077,
+            "functional": 0.0,
+            "punct": 0.09724485501646996
+          },
+          "chosen_token_id": 220,
+          "chosen_piece": " ",
+          "chosen_norm": "",
+          "chosen_category": "punct"
+        },
+        {
+          "step": 6,
+          "top1": {
+            "token_id": 330,
+            "piece": " \"",
+            "norm": "",
+            "logit": 14.5625,
+            "prob": 0.07181069999933243
+          },
+          "top1_category": "punct",
+          "topk_category_counts": {
+            "semantic": 8,
+            "functional": 0,
+            "punct": 4
+          },
+          "topk_category_prob_mass": {
+            "semantic": 0.18383791111409664,
+            "functional": 0.0,
+            "punct": 0.18584902863949537
+          },
+          "chosen_token_id": 330,
+          "chosen_piece": " \"",
+          "chosen_norm": "",
+          "chosen_category": "punct"
+        },
+        {
+          "step": 7,
+          "top1": {
+            "token_id": 94344,
+            "piece": "explain",
+            "norm": "explain",
+            "logit": 12.6875,
+            "prob": 0.01096130907535553
+          },
+          "top1_category": "semantic",
+          "topk_category_counts": {
+            "semantic": 7,
+            "functional": 5,
+            "punct": 0
+          },
+          "topk_category_prob_mass": {
+            "semantic": 0.04443507920950651,
+            "functional": 0.02441536309197545,
+            "punct": 0.0
+          },
+          "chosen_token_id": 94344,
+          "chosen_piece": "explain",
+          "chosen_norm": "explain",
+          "chosen_category": "semantic"
+        },
+        {
+          "step": 8,
+          "top1": {
+            "token_id": 279,
+            "piece": " the",
+            "norm": "the",
+            "logit": 19.5,
+            "prob": 0.6197741031646729
+          },
+          "top1_category": "functional",
+          "topk_category_counts": {
+            "semantic": 0,
+            "functional": 3,
+            "punct": 9
+          },
+          "topk_category_prob_mass": {
+            "semantic": 0.0,
+            "functional": 0.6259922899771482,
+            "punct": 0.29147468809969723
+          },
+          "chosen_token_id": 279,
+          "chosen_piece": " the",
+          "chosen_norm": "the",
+          "chosen_category": "functional"
+        },
+        {
+          "step": 9,
+          "top1": {
+            "token_id": 8544,
+            "piece": " topic",
+            "norm": "topic",
+            "logit": 21.125,
+            "prob": 0.5933138132095337
+          },
+          "top1_category": "semantic",
+          "topk_category_counts": {
+            "semantic": 12,
+            "functional": 0,
+            "punct": 0
+          },
+          "topk_category_prob_mass": {
+            "semantic": 0.7793927444145083,
+            "functional": 0.0,
+            "punct": 0.0
+          },
+          "chosen_token_id": 8544,
+          "chosen_piece": " topic",
+          "chosen_norm": "topic",
+          "chosen_category": "semantic"
+        },
+        {
+          "step": 10,
+          "top1": {
+            "token_id": 1,
+            "piece": "\"",
+            "norm": "",
+            "logit": 21.25,
+            "prob": 0.2902170717716217
+          },
+          "top1_category": "punct",
+          "topk_category_counts": {
+            "semantic": 2,
+            "functional": 3,
+            "punct": 7
+          },
+          "topk_category_prob_mass": {
+            "semantic": 0.29939965903759,
+            "functional": 0.18907508859410882,
+            "punct": 0.39776377007365227
+          },
+          "chosen_token_id": 1,
+          "chosen_piece": "\"",
+          "chosen_norm": "",
+          "chosen_category": "punct"
+        },
+        {
+          "step": 11,
+          "top1": {
+            "token_id": 374,
+            "piece": " is",
+            "norm": "is",
+            "logit": 15.625,
+            "prob": 0.10762867331504822
+          },
+          "top1_category": "functional",
+          "topk_category_counts": {
+            "semantic": 1,
+            "functional": 1,
+            "punct": 10
+          },
+          "topk_category_prob_mass": {
+            "semantic": 0.07874282449483871,
+            "functional": 0.10762867331504822,
+            "punct": 0.23762445989996195
+          },
+          "chosen_token_id": 374,
+          "chosen_piece": " is",
+          "chosen_norm": "is",
+          "chosen_category": "functional"
+        },
+        {
+          "step": 12,
+          "top1": {
+            "token_id": 264,
+            "piece": " a",
+            "norm": "a",
+            "logit": 21.25,
+            "prob": 0.42951807379722595
+          },
+          "top1_category": "functional",
+          "topk_category_counts": {
+            "semantic": 4,
+            "functional": 8,
+            "punct": 0
+          },
+          "topk_category_prob_mass": {
+            "semantic": 0.06314869225025177,
+            "functional": 0.7335648243315518,
+            "punct": 0.0
+          },
+          "chosen_token_id": 264,
+          "chosen_piece": " a",
+          "chosen_norm": "a",
+          "chosen_category": "functional"
+        },
+        {
+          "step": 13,
+          "top1": {
+            "token_id": 17133,
+            "piece": " phrase",
+            "norm": "phrase",
+            "logit": 19.875,
+            "prob": 0.16571058332920074
+          },
+          "top1_category": "semantic",
+          "topk_category_counts": {
+            "semantic": 11,
+            "functional": 1,
+            "punct": 0
+          },
+          "topk_category_prob_mass": {
+            "semantic": 0.4700012067332864,
+            "functional": 0.012004034593701363,
+            "punct": 0.0
+          },
+          "chosen_token_id": 17133,
+          "chosen_piece": " phrase",
+          "chosen_norm": "phrase",
+          "chosen_category": "semantic"
+        },
+        {
+          "step": 14,
+          "top1": {
+            "token_id": 429,
+            "piece": " that",
+            "norm": "that",
+            "logit": 23.0,
+            "prob": 0.4704553186893463
+          },
+          "top1_category": "functional",
+          "topk_category_counts": {
+            "semantic": 4,
+            "functional": 7,
+            "punct": 1
+          },
+          "topk_category_prob_mass": {
+            "semantic": 0.2615935071371496,
+            "functional": 0.6189748737961054,
+            "punct": 0.007604201789945364
+          },
+          "chosen_token_id": 429,
+          "chosen_piece": " that",
+          "chosen_norm": "that",
+          "chosen_category": "functional"
+        },
+        {
+          "step": 15,
+          "top1": {
+            "token_id": 3363,
+            "piece": " means",
+            "norm": "means",
+            "logit": 21.125,
+            "prob": 0.24727746844291687
+          },
+          "top1_category": "semantic",
+          "topk_category_counts": {
+            "semantic": 9,
+            "functional": 3,
+            "punct": 0
+          },
+          "topk_category_prob_mass": {
+            "semantic": 0.5248672068119049,
+            "functional": 0.13997168745845556,
+            "punct": 0.0
+          },
+          "chosen_token_id": 3363,
+          "chosen_piece": " means",
+          "chosen_norm": "means",
+          "chosen_category": "semantic"
+        }
+      ],
+      "passed": true
+    }
+  ],
+  "error": null
+}
+```
+
+## Retrieval Generation Alignment Audit
+
+```json
+{
+  "passed": true,
+  "music_keywords": [
+    "pianist",
+    "practiced",
+    "arpeggios",
+    "chopin",
+    "nocturnes",
+    "midnight",
+    "musician",
+    "refined",
+    "finger",
+    "technique",
+    "phrasing",
+    "pedal"
+  ],
+  "space_keywords": [
+    "distant",
+    "astronomers",
+    "observed",
+    "galaxies",
+    "quasars",
+    "stellar",
+    "evolution",
+    "space",
+    "orbital",
+    "mechanics",
+    "explains",
+    "satellites"
+  ],
+  "diagnoses": {
+    "aligned": 2,
+    "retrieval_miss": 0,
+    "bridge_unused": 1,
+    "unknown": 0
+  },
+  "rows": [
+    {
+      "prompt": "What improves piano technique and musical phrasing?",
+      "expected_label": "music",
+      "retrieved_mids": [
+        1,
+        0,
+        3,
+        6,
+        5
+      ],
+      "retrieved_label_counts": {
+        "music": 3,
+        "space": 2
+      },
+      "retrieved_majority_label": "music",
+      "retrieved_text_preview": [
+        "A musician refined finger technique, phrasing, and pedal control on the piano.",
+        "The pianist practiced arpeggios and Chopin nocturnes until midnight.",
+        "A conservatory student studied etudes, scales, and expressive voicing on the keyboard."
+      ],
+      "output": "What improves piano technique and musical phrasing? piano technique control involves technique piano musician technique finger control piano piano musician control technique musician refined finger finger control finger technique piano finger refined refined pedal refined",
+      "music_score": 0.6060606060606061,
+      "space_score": 0.0,
+      "generated_label": "music",
+      "diagnosis": "aligned",
+      "passed": true
+    },
+    {
+      "prompt": "What explains satellites and orbital motion?",
+      "expected_label": "space",
+      "retrieved_mids": [
+        5,
+        4,
+        6,
+        1,
+        0
+      ],
+      "retrieved_label_counts": {
+        "space": 3,
+        "music": 2
+      },
+      "retrieved_majority_label": "space",
+      "retrieved_text_preview": [
+        "Orbital mechanics explains how satellites and planets move under gravitational force.",
+        "Astronomers observed distant galaxies, quasars, and stellar evolution in deep space.",
+        "A telescope captured nebulae, exoplanets, and spectral signatures from distant stars."
+      ],
+      "output": "What explains satellites and orbital motion? explains force satellites Force explains satellitesForce explains satellites force mechanics explains explains force satellites explain planets mechanics mechanics force mechanics gravitational force explains gravitational planets gravitational gravitational",
+      "music_score": 0.0,
+      "space_score": 0.5161290322580645,
+      "generated_label": "space",
+      "diagnosis": "aligned",
+      "passed": true
+    },
+    {
+      "prompt": "Summarize the subject with concrete domain details.",
+      "expected_label": null,
+      "retrieved_mids": [
+        3,
+        1,
+        6,
+        0,
+        5
+      ],
+      "retrieved_label_counts": {
+        "music": 3,
+        "space": 2
+      },
+      "retrieved_majority_label": "music",
+      "retrieved_text_preview": [
+        "A conservatory student studied etudes, scales, and expressive voicing on the keyboard.",
+        "A musician refined finger technique, phrasing, and pedal control on the piano.",
+        "A telescope captured nebulae, exoplanets, and spectral signatures from distant stars."
+      ],
+      "output": "Summarize the subject with concrete domain details. touch interpretation often depends dynamics tempo rub dynamics rub tempo touch dynamics touch tempo interpretation dynamics interpretation controls interpretation rub rub touch often tempo tempo dynamics depends depends",
+      "music_score": 0.0,
+      "space_score": 0.0,
+      "generated_label": null,
+      "diagnosis": "bridge_unused",
+      "passed": true
+    }
+  ],
+  "error": null
+}
+```
+
+## Retrieval Prefix Decode Correlation Audit
+
+```json
+{
+  "passed": false,
+  "correlations": {
+    "retrieval_strength__prefix_l2": null,
+    "retrieval_strength__bad_decode_score": 0.21927202884584385,
+    "prefix_l2__bad_decode_score": null
+  },
+  "rows": [
+    {
+      "prompt": "What improves piano technique and musical phrasing?",
+      "expected_label": "music",
+      "retrieved_scored": [
+        {
+          "mid": 1,
+          "score": 0.6172578841447831
+        },
+        {
+          "mid": 0,
+          "score": 0.22511255741119385
+        },
+        {
+          "mid": 3,
+          "score": 0.11276901960372926
+        },
+        {
+          "mid": 6,
+          "score": 0.045475220680236815
+        },
+        {
+          "mid": 5,
+          "score": 0.036619618535041816
+        }
+      ],
+      "retrieved_label_counts": {
+        "music": 3,
+        "space": 2
+      },
+      "retrieval_strength": 0.9551394611597062,
+      "prefix_l2_shift": 322359623680.0,
+      "prefix_js_divergence": 0.3171347379684448,
+      "top1_with_prefix": {
+        "token_id": 14566,
+        "piece": " Options",
+        "norm": "options",
+        "logit": 16.375,
+        "prob": 0.1110726147890091
+      },
+      "top1_category_with_prefix": "semantic",
+      "topk_non_semantic_prob_mass": 0.03182283788919449
+    },
+    {
+      "prompt": "What explains satellites and orbital motion?",
+      "expected_label": "space",
+      "retrieved_scored": [
+        {
+          "mid": 5,
+          "score": 0.5634284257888794
+        },
+        {
+          "mid": 4,
+          "score": 0.07376852035522463
+        },
+        {
+          "mid": 6,
+          "score": 0.06803246438503266
+        },
+        {
+          "mid": 1,
+          "score": 0.045463052392005925
+        },
+        {
+          "mid": 0,
+          "score": 0.03999960422515869
+        }
+      ],
+      "retrieved_label_counts": {
+        "space": 3,
+        "music": 2
+      },
+      "retrieval_strength": 0.7052294105291367,
+      "prefix_l2_shift": 322359623680.0,
+      "prefix_js_divergence": 0.46486830711364746,
+      "top1_with_prefix": {
+        "token_id": 13177,
+        "piece": " Sat",
+        "norm": "sat",
+        "logit": 15.3125,
+        "prob": 0.07889200001955032
+      },
+      "top1_category_with_prefix": "functional",
+      "topk_non_semantic_prob_mass": 0.1079147458076477
+    },
+    {
+      "prompt": "Describe what a student should focus on first.",
+      "expected_label": null,
+      "retrieved_scored": [
+        {
+          "mid": 3,
+          "score": 0.5128585010766983
+        },
+        {
+          "mid": 1,
+          "score": 0.046858394145965584
+        },
+        {
+          "mid": 0,
+          "score": -0.0005610674619674696
+        },
+        {
+          "mid": 4,
+          "score": -0.011547431349754333
+        },
+        {
+          "mid": 6,
+          "score": -0.026388256251811976
+        }
+      ],
+      "retrieved_label_counts": {
+        "music": 3,
+        "space": 2
+      },
+      "retrieval_strength": 0.5128585010766983,
+      "prefix_l2_shift": 322359623680.0,
+      "prefix_js_divergence": 0.441089391708374,
+      "top1_with_prefix": {
+        "token_id": 22201,
+        "piece": " Choose",
+        "norm": "choose",
+        "logit": 15.125,
+        "prob": 0.12620772421360016
+      },
+      "top1_category_with_prefix": "semantic",
+      "topk_non_semantic_prob_mass": 0.013302195817232132
+    },
+    {
+      "prompt": "Summarize the subject with concrete domain details.",
+      "expected_label": null,
+      "retrieved_scored": [
+        {
+          "mid": 3,
+          "score": 0.021094447374343874
+        },
+        {
+          "mid": 1,
+          "score": 0.015311965346336366
+        },
+        {
+          "mid": 6,
+          "score": 0.004081499576568608
+        },
+        {
+          "mid": 0,
+          "score": -0.010262516140937806
+        },
+        {
+          "mid": 5,
+          "score": -0.012652482092380526
+        }
+      ],
+      "retrieved_label_counts": {
+        "music": 3,
+        "space": 2
+      },
+      "retrieval_strength": 0.021094447374343874,
+      "prefix_l2_shift": 322359623680.0,
+      "prefix_js_divergence": 0.32552844285964966,
+      "top1_with_prefix": {
+        "token_id": 58194,
+        "piece": " Artificial",
+        "norm": "artificial",
+        "logit": 14.625,
+        "prob": 0.009140501730144024
+      },
+      "top1_category_with_prefix": "semantic",
+      "topk_non_semantic_prob_mass": 0.0
+    },
+    {
+      "prompt": "Key piano ideas include",
+      "expected_label": "music",
+      "retrieved_scored": [
+        {
+          "mid": 1,
+          "score": 0.5411406040191651
+        },
+        {
+          "mid": 0,
+          "score": 0.3158708691596985
+        },
+        {
+          "mid": 3,
+          "score": 0.13700250387191773
+        },
+        {
+          "mid": 6,
+          "score": 0.016681492328643806
+        },
+        {
+          "mid": 4,
+          "score": -0.005892813205719001
+        }
+      ],
+      "retrieved_label_counts": {
+        "music": 3,
+        "space": 2
+      },
+      "retrieval_strength": 0.9940139770507813,
+      "prefix_l2_shift": 322359623680.0,
+      "prefix_js_divergence": 0.301528662443161,
+      "top1_with_prefix": {
+        "token_id": 3598,
+        "piece": " major",
+        "norm": "major",
+        "logit": 16.0,
+        "prob": 0.028910748660564423
+      },
+      "top1_category_with_prefix": "semantic",
+      "topk_non_semantic_prob_mass": 0.022515714168548584
+    },
+    {
+      "prompt": "Orbital motion depends on",
+      "expected_label": "space",
+      "retrieved_scored": [
+        {
+          "mid": 2,
+          "score": 0.3270561575889588
+        },
+        {
+          "mid": 5,
+          "score": 0.04361439943313599
+        },
+        {
+          "mid": 3,
+          "score": 0.024278688430786136
+        },
+        {
+          "mid": 1,
+          "score": -0.021913541853427882
+        },
+        {
+          "mid": 6,
+          "score": -0.033837710320949566
+        }
+      ],
+      "retrieved_label_counts": {
+        "music": 3,
+        "space": 2
+      },
+      "retrieval_strength": 0.009776689112186425,
+      "prefix_l2_shift": 322359623680.0,
+      "prefix_js_divergence": 0.4070507884025574,
+      "top1_with_prefix": {
+        "token_id": 3072,
+        "piece": " mass",
+        "norm": "mass",
+        "logit": 18.625,
+        "prob": 0.12673379480838776
+      },
+      "top1_category_with_prefix": "semantic",
+      "topk_non_semantic_prob_mass": 0.0
+    }
+  ],
+  "error": null
+}
+```
+
+## Stepwise Label Mass Alignment Audit
+
+```json
+{
+  "passed": false,
+  "label_keywords": {
+    "music": [
+      "pianist",
+      "practiced",
+      "arpeggios",
+      "chopin",
+      "nocturnes",
+      "midnight",
+      "musician",
+      "refined",
+      "finger",
+      "technique",
+      "phrasing",
+      "pedal"
+    ],
+    "space": [
+      "distant",
+      "astronomers",
+      "observed",
+      "galaxies",
+      "quasars",
+      "stellar",
+      "evolution",
+      "space",
+      "orbital",
+      "mechanics",
+      "explains",
+      "satellites"
+    ]
+  },
+  "rows": [
+    {
+      "prompt": "What improves piano technique and musical phrasing?",
+      "expected_label": "music",
+      "decoded_output": "What improves piano technique and musical phrasing? Options tend towards improving piano technique, musical phrasing, and",
+      "stage_counts": {
+        "inject": 6,
+        "aligned": 4,
+        "decode": 2
+      },
+      "rows": [
+        {
+          "step": 0,
+          "retrieved_majority_label": "music",
+          "retrieved_label_counts": {
+            "music": 3,
+            "space": 2
+          },
+          "retrieved_score_sum": {
+            "music": 0.9551394611597062,
+            "space": 0.08209483921527863
+          },
+          "logits_label_mass": {
+            "music": 0,
+            "space": 0
+          },
+          "top1_piece": " Options",
+          "top1_category": "semantic",
+          "chosen_piece": " Options",
+          "chosen_category": "semantic",
+          "chosen_label": null,
+          "diagnosed_stage": "inject"
+        },
+        {
+          "step": 1,
+          "retrieved_majority_label": "music",
+          "retrieved_label_counts": {
+            "music": 3,
+            "space": 2
+          },
+          "retrieved_score_sum": {
+            "music": 0.9551394611597062,
+            "space": 0.08209483921527863
+          },
+          "logits_label_mass": {
+            "music": 0,
+            "space": 0
+          },
+          "top1_piece": " tend",
+          "top1_category": "semantic",
+          "chosen_piece": " tend",
+          "chosen_category": "semantic",
+          "chosen_label": null,
+          "diagnosed_stage": "inject"
+        },
+        {
+          "step": 2,
+          "retrieved_majority_label": "music",
+          "retrieved_label_counts": {
+            "music": 3,
+            "space": 2
+          },
+          "retrieved_score_sum": {
+            "music": 0.9551394611597062,
+            "space": 0.08209483921527863
+          },
+          "logits_label_mass": {
+            "music": 0.03443919029086828,
+            "space": 0
+          },
+          "top1_piece": " towards",
+          "top1_category": "semantic",
+          "chosen_piece": " towards",
+          "chosen_category": "semantic",
+          "chosen_label": "music",
+          "diagnosed_stage": "aligned"
+        },
+        {
+          "step": 3,
+          "retrieved_majority_label": "music",
+          "retrieved_label_counts": {
+            "music": 3,
+            "space": 2
+          },
+          "retrieved_score_sum": {
+            "music": 0.9551394611597062,
+            "space": 0.08209483921527863
+          },
+          "logits_label_mass": {
+            "music": 0,
+            "space": 0
+          },
+          "top1_piece": " improving",
+          "top1_category": "semantic",
+          "chosen_piece": " improving",
+          "chosen_category": "semantic",
+          "chosen_label": null,
+          "diagnosed_stage": "inject"
+        },
+        {
+          "step": 4,
+          "retrieved_majority_label": "music",
+          "retrieved_label_counts": {
+            "music": 3,
+            "space": 2
+          },
+          "retrieved_score_sum": {
+            "music": 0.9551394611597062,
+            "space": 0.08209483921527863
+          },
+          "logits_label_mass": {
+            "music": 0.07181288627907634,
+            "space": 0
+          },
+          "top1_piece": " piano",
+          "top1_category": "semantic",
+          "chosen_piece": " piano",
+          "chosen_category": "semantic",
+          "chosen_label": "music",
+          "diagnosed_stage": "aligned"
+        },
+        {
+          "step": 5,
+          "retrieved_majority_label": "music",
+          "retrieved_label_counts": {
+            "music": 3,
+            "space": 2
+          },
+          "retrieved_score_sum": {
+            "music": 0.9551394611597062,
+            "space": 0.08209483921527863
+          },
+          "logits_label_mass": {
+            "music": 0.9712017463753,
+            "space": 0
+          },
+          "top1_piece": " technique",
+          "top1_category": "semantic",
+          "chosen_piece": " technique",
+          "chosen_category": "semantic",
+          "chosen_label": "music",
+          "diagnosed_stage": "aligned"
+        },
+        {
+          "step": 6,
+          "retrieved_majority_label": "music",
+          "retrieved_label_counts": {
+            "music": 3,
+            "space": 2
+          },
+          "retrieved_score_sum": {
+            "music": 0.9551394611597062,
+            "space": 0.08209483921527863
+          },
+          "logits_label_mass": {
+            "music": 0,
+            "space": 0
+          },
+          "top1_piece": ",",
+          "top1_category": "punct",
+          "chosen_piece": ",",
+          "chosen_category": "punct",
+          "chosen_label": null,
+          "diagnosed_stage": "inject"
+        },
+        {
+          "step": 7,
+          "retrieved_majority_label": "music",
+          "retrieved_label_counts": {
+            "music": 3,
+            "space": 2
+          },
+          "retrieved_score_sum": {
+            "music": 0.9551394611597062,
+            "space": 0.08209483921527863
+          },
+          "logits_label_mass": {
+            "music": 0.03453451534733176,
+            "space": 0
+          },
+          "top1_piece": " musical",
+          "top1_category": "semantic",
+          "chosen_piece": " musical",
+          "chosen_category": "semantic",
+          "chosen_label": "music",
+          "diagnosed_stage": "aligned"
+        },
+        {
+          "step": 8,
+          "retrieved_majority_label": "music",
+          "retrieved_label_counts": {
+            "music": 3,
+            "space": 2
+          },
+          "retrieved_score_sum": {
+            "music": 0.9551050901412963,
+            "space": 0.09417556524276735
+          },
+          "logits_label_mass": {
+            "music": 0.0019687179010361433,
+            "space": 0
+          },
+          "top1_piece": " ph",
+          "top1_category": "functional",
+          "chosen_piece": " ph",
+          "chosen_category": "functional",
+          "chosen_label": "music",
+          "diagnosed_stage": "decode"
+        },
+        {
+          "step": 9,
+          "retrieved_majority_label": "music",
+          "retrieved_label_counts": {
+            "music": 3,
+            "space": 2
+          },
+          "retrieved_score_sum": {
+            "music": 0.9551050901412963,
+            "space": 0.09417556524276735
+          },
+          "logits_label_mass": {
+            "music": 0,
+            "space": 0
+          },
+          "top1_piece": "rasing",
+          "top1_category": "semantic",
+          "chosen_piece": "rasing",
+          "chosen_category": "semantic",
+          "chosen_label": null,
+          "diagnosed_stage": "inject"
+        },
+        {
+          "step": 10,
+          "retrieved_majority_label": "music",
+          "retrieved_label_counts": {
+            "music": 3,
+            "space": 2
+          },
+          "retrieved_score_sum": {
+            "music": 0.9551050901412963,
+            "space": 0.09417556524276735
+          },
+          "logits_label_mass": {
+            "music": 0,
+            "space": 0
+          },
+          "top1_piece": ",",
+          "top1_category": "punct",
+          "chosen_piece": ",",
+          "chosen_category": "punct",
+          "chosen_label": null,
+          "diagnosed_stage": "inject"
+        },
+        {
+          "step": 11,
+          "retrieved_majority_label": "music",
+          "retrieved_label_counts": {
+            "music": 3,
+            "space": 2
+          },
+          "retrieved_score_sum": {
+            "music": 0.9551050901412963,
+            "space": 0.09417556524276735
+          },
+          "logits_label_mass": {
+            "music": 0.02468138374388218,
+            "space": 0
+          },
+          "top1_piece": " and",
+          "top1_category": "functional",
+          "chosen_piece": " and",
+          "chosen_category": "functional",
+          "chosen_label": "music",
+          "diagnosed_stage": "decode"
+        }
+      ],
+      "passed": false
+    },
+    {
+      "prompt": "What explains satellites and orbital motion?",
+      "expected_label": "space",
+      "decoded_output": "What explains satellites and orbital motion? Sat phones don' explain satellites, satellites are artificial objects that",
+      "stage_counts": {
+        "decode": 3,
+        "aligned": 5,
+        "inject": 4
+      },
+      "rows": [
+        {
+          "step": 0,
+          "retrieved_majority_label": "space",
+          "retrieved_label_counts": {
+            "space": 3,
+            "music": 2
+          },
+          "retrieved_score_sum": {
+            "space": 0.7052294105291367,
+            "music": 0.08546265661716462
+          },
+          "logits_label_mass": {
+            "music": 0,
+            "space": 0.010029993019998074
+          },
+          "top1_piece": " Sat",
+          "top1_category": "functional",
+          "chosen_piece": " Sat",
+          "chosen_category": "functional",
+          "chosen_label": "space",
+          "diagnosed_stage": "decode"
+        },
+        {
+          "step": 1,
+          "retrieved_majority_label": "space",
+          "retrieved_label_counts": {
+            "space": 3,
+            "music": 2
+          },
+          "retrieved_score_sum": {
+            "space": 0.7052294105291367,
+            "music": 0.08546265661716462
+          },
+          "logits_label_mass": {
+            "music": 0,
+            "space": 0.005930706858634949
+          },
+          "top1_piece": " phones",
+          "top1_category": "semantic",
+          "chosen_piece": " phones",
+          "chosen_category": "semantic",
+          "chosen_label": "space",
+          "diagnosed_stage": "aligned"
+        },
+        {
+          "step": 2,
+          "retrieved_majority_label": "space",
+          "retrieved_label_counts": {
+            "space": 3,
+            "music": 2
+          },
+          "retrieved_score_sum": {
+            "space": 0.7052294105291367,
+            "music": 0.08546265661716462
+          },
+          "logits_label_mass": {
+            "music": 0,
+            "space": 0.032648902386426926
+          },
+          "top1_piece": " don",
+          "top1_category": "functional",
+          "chosen_piece": " don",
+          "chosen_category": "functional",
+          "chosen_label": "space",
+          "diagnosed_stage": "decode"
+        },
+        {
+          "step": 3,
+          "retrieved_majority_label": "space",
+          "retrieved_label_counts": {
+            "space": 3,
+            "music": 2
+          },
+          "retrieved_score_sum": {
+            "space": 0.7052294105291367,
+            "music": 0.08546265661716462
+          },
+          "logits_label_mass": {
+            "music": 0,
+            "space": 0
+          },
+          "top1_piece": "'",
+          "top1_category": "punct",
+          "chosen_piece": "'",
+          "chosen_category": "punct",
+          "chosen_label": null,
+          "diagnosed_stage": "inject"
+        },
+        {
+          "step": 4,
+          "retrieved_majority_label": "space",
+          "retrieved_label_counts": {
+            "space": 3,
+            "music": 2
+          },
+          "retrieved_score_sum": {
+            "space": 0.7052294105291367,
+            "music": 0.08546265661716462
+          },
+          "logits_label_mass": {
+            "music": 0,
+            "space": 0
+          },
+          "top1_piece": " explain",
+          "top1_category": "semantic",
+          "chosen_piece": " explain",
+          "chosen_category": "semantic",
+          "chosen_label": null,
+          "diagnosed_stage": "inject"
+        },
+        {
+          "step": 5,
+          "retrieved_majority_label": "space",
+          "retrieved_label_counts": {
+            "space": 3,
+            "music": 2
+          },
+          "retrieved_score_sum": {
+            "space": 0.7052294105291367,
+            "music": 0.08546265661716462
+          },
+          "logits_label_mass": {
+            "music": 0,
+            "space": 0.3954301029443741
+          },
+          "top1_piece": " satellites",
+          "top1_category": "semantic",
+          "chosen_piece": " satellites",
+          "chosen_category": "semantic",
+          "chosen_label": "space",
+          "diagnosed_stage": "aligned"
+        },
+        {
+          "step": 6,
+          "retrieved_majority_label": "space",
+          "retrieved_label_counts": {
+            "space": 3,
+            "music": 2
+          },
+          "retrieved_score_sum": {
+            "space": 0.7052294105291367,
+            "music": 0.08546265661716462
+          },
+          "logits_label_mass": {
+            "music": 0,
+            "space": 0.022754499688744545
+          },
+          "top1_piece": ",",
+          "top1_category": "punct",
+          "chosen_piece": ",",
+          "chosen_category": "punct",
+          "chosen_label": "space",
+          "diagnosed_stage": "decode"
+        },
+        {
+          "step": 7,
+          "retrieved_majority_label": "space",
+          "retrieved_label_counts": {
+            "space": 3,
+            "music": 2
+          },
+          "retrieved_score_sum": {
+            "space": 0.7052294105291367,
+            "music": 0.08546265661716462
+          },
+          "logits_label_mass": {
+            "music": 0,
+            "space": 0.2686969190835953
+          },
+          "top1_piece": " satellites",
+          "top1_category": "semantic",
+          "chosen_piece": " satellites",
+          "chosen_category": "semantic",
+          "chosen_label": "space",
+          "diagnosed_stage": "aligned"
+        },
+        {
+          "step": 8,
+          "retrieved_majority_label": "space",
+          "retrieved_label_counts": {
+            "space": 3,
+            "music": 2
+          },
+          "retrieved_score_sum": {
+            "space": 0.714495986700058,
+            "music": 0.0803181141614914
+          },
+          "logits_label_mass": {
+            "music": 0,
+            "space": 0
+          },
+          "top1_piece": " are",
+          "top1_category": "functional",
+          "chosen_piece": " are",
+          "chosen_category": "functional",
+          "chosen_label": null,
+          "diagnosed_stage": "inject"
+        },
+        {
+          "step": 9,
+          "retrieved_majority_label": "space",
+          "retrieved_label_counts": {
+            "space": 3,
+            "music": 2
+          },
+          "retrieved_score_sum": {
+            "space": 0.714495986700058,
+            "music": 0.0803181141614914
+          },
+          "logits_label_mass": {
+            "music": 0,
+            "space": 0.03106600232422352
+          },
+          "top1_piece": " artificial",
+          "top1_category": "semantic",
+          "chosen_piece": " artificial",
+          "chosen_category": "semantic",
+          "chosen_label": "space",
+          "diagnosed_stage": "aligned"
+        },
+        {
+          "step": 10,
+          "retrieved_majority_label": "space",
+          "retrieved_label_counts": {
+            "space": 3,
+            "music": 2
+          },
+          "retrieved_score_sum": {
+            "space": 0.714495986700058,
+            "music": 0.0803181141614914
+          },
+          "logits_label_mass": {
+            "music": 0,
+            "space": 0.33109524846076965
+          },
+          "top1_piece": " objects",
+          "top1_category": "semantic",
+          "chosen_piece": " objects",
+          "chosen_category": "semantic",
+          "chosen_label": "space",
+          "diagnosed_stage": "aligned"
+        },
+        {
+          "step": 11,
+          "retrieved_majority_label": "space",
+          "retrieved_label_counts": {
+            "space": 3,
+            "music": 2
+          },
+          "retrieved_score_sum": {
+            "space": 0.714495986700058,
+            "music": 0.0803181141614914
+          },
+          "logits_label_mass": {
+            "music": 0,
+            "space": 0
+          },
+          "top1_piece": " that",
+          "top1_category": "functional",
+          "chosen_piece": " that",
+          "chosen_category": "functional",
+          "chosen_label": null,
+          "diagnosed_stage": "inject"
+        }
+      ],
+      "passed": false
+    }
+  ],
+  "error": null
+}
+```
+
+## Prompt Diversity Without Memory
+
+```json
+{
+  "passed": true,
+  "prompts": [
+    "The pianist",
+    "Quantum systems",
+    "The rainforest"
+  ],
+  "outputs": [
+    "The pianist Xia points XYZ传感器 collects weather data based upon ____ protocol communication mode?\nBLE（Bluetooth）\n",
+    "Quantum systems play central roles across cryptography due primarily?\\nThe Bose gas  |\n\n **Summary:\r\n\r\nWrite various",
+    "The rainforest dataset typically refers specifically refering______. aviation charts. ____\nyes Explanation: \nFalse"
+  ],
+  "unique_count": 3,
+  "error": null
+}
+```
+
+## Save/Load Consistency
+
+```json
+{
+  "passed": true,
+  "prompt": "The pianist",
+  "output_a": "The pianist piano hours piano pianoHours = int(raw input desperation hours hours))\n piano perfectperfect print calculating",
+  "output_b": "The pianist piano hours piano pianoHours = int(raw input desperation hours hours))\n piano perfectperfect print calculating",
+  "error": null
+}
+```
+
+## Training Cache Isolation
+
+```json
+{
+  "passed": true,
+  "changed": [],
+  "memory_count": 8,
+  "error": null
+}
+```
+
+## Cheating Heuristics
+
+```json
+{
+  "passed": true,
+  "outputs": [
+    "The pianist piano hours piano pianoHours = int(raw input desperation hours hours))\n piano perfectperfect print calculating",
+    "The telescope window watched cat sat mat outside birds window sat watched mat cat birds outside Market window cat watched",
+    "The trader market stock volatility significant experienced 市 stock experienced significant market volatility experienced stock stock significant volatility",
+    "The child learns Signs window window outside cat sat mat watched outside mat sat cat mat mat outside sat watched"
+  ],
+  "exact_same": false,
+  "prefix_only": false,
+  "too_short": false,
+  "error": null
+}
+```
\ No newline at end of file
diff --git a/reports/v346_trained_blackbox/stdout.log b/reports/v346_trained_blackbox/stdout.log
new file mode 100644
index 0000000..0415fe0
--- /dev/null
+++ b/reports/v346_trained_blackbox/stdout.log
@@ -0,0 +1,291 @@
+[case:start] leaf_capacity_stability
+[case:done] leaf_capacity_stability passed=True
+[case:start] degenerate_direction_boundary
+[case:done] degenerate_direction_boundary passed=True
+[case:start] metric_trainability
+Warning: You are sending unauthenticated requests to the HF Hub. Please set a HF_TOKEN to enable higher rate limits and faster downloads.
+`torch_dtype` is deprecated! Use `dtype` instead!
+Loading weights:   0%|          | 0/338 [00:00<?, ?it/s]Loading weights: 100%|██████████| 338/338 [00:00<00:00, 3680.69it/s]
+  [neighbor cache] vocab_size=151936 > 60000, skip
+  [AMS_TRAINED_WEIGHTS] loaded=202 skipped=0 shape_errs=0  path=/workspace/AgentMemorySystem/ckpt/v346_trained.pt  provenance=AgentMemory/v346-revertE-topk-nonexclusive-7e97
+/usr/local/lib/python3.12/dist-packages/torch/autograd/graph.py:869: UserWarning: Attempting to run cuBLAS, but there was no current CUDA context! Attempting to set the primary context... (Triggered internally at /pytorch/aten/src/ATen/cuda/CublasHandlePool.cpp:335.)
+  return Variable._execution_engine.run_backward(  # Calls into the C++ engine to run the backward pass
+/usr/local/lib/python3.12/dist-packages/torch/autograd/graph.py:869: UserWarning: cuDNN Attention defaults to a non-deterministic algorithm. To explicitly enable determinism call torch.use_deterministic_algorithms(True, warn_only=False). (Triggered internally at /pytorch/aten/src/ATen/native/transformers/cuda/attention_backward.cu:212.)
+  return Variable._execution_engine.run_backward(  # Calls into the C++ engine to run the backward pass
+[case:done] metric_trainability passed=True
+[case:start] no_grad_generation
+Loading weights:   0%|          | 0/338 [00:00<?, ?it/s]Loading weights: 100%|██████████| 338/338 [00:00<00:00, 3485.70it/s]
+  [neighbor cache] vocab_size=151936 > 60000, skip
+  [AMS_TRAINED_WEIGHTS] loaded=202 skipped=0 shape_errs=0  path=/workspace/AgentMemorySystem/ckpt/v346_trained.pt  provenance=AgentMemory/v346-revertE-topk-nonexclusive-7e97
+[case:done] no_grad_generation passed=True
+[case:start] counterfactual_memory_influence
+Loading weights:   0%|          | 0/338 [00:00<?, ?it/s]Loading weights: 100%|██████████| 338/338 [00:00<00:00, 3497.40it/s]
+  [neighbor cache] vocab_size=151936 > 60000, skip
+  [AMS_TRAINED_WEIGHTS] loaded=202 skipped=0 shape_errs=0  path=/workspace/AgentMemorySystem/ckpt/v346_trained.pt  provenance=AgentMemory/v346-revertE-topk-nonexclusive-7e97
+Loading weights:   0%|          | 0/338 [00:00<?, ?it/s]Loading weights:  88%|████████▊ | 297/338 [00:00<00:00, 2967.76it/s]Loading weights: 100%|██████████| 338/338 [00:00<00:00, 3062.18it/s]
+  [neighbor cache] vocab_size=151936 > 60000, skip
+  [AMS_TRAINED_WEIGHTS] loaded=202 skipped=0 shape_errs=0  path=/workspace/AgentMemorySystem/ckpt/v346_trained.pt  provenance=AgentMemory/v346-revertE-topk-nonexclusive-7e97
+[case:done] counterfactual_memory_influence passed=True
+[case:start] semantic_memory_grounding
+Loading weights:   0%|          | 0/338 [00:00<?, ?it/s]Loading weights: 100%|██████████| 338/338 [00:00<00:00, 3753.18it/s]
+  [neighbor cache] vocab_size=151936 > 60000, skip
+  [AMS_TRAINED_WEIGHTS] loaded=202 skipped=0 shape_errs=0  path=/workspace/AgentMemorySystem/ckpt/v346_trained.pt  provenance=AgentMemory/v346-revertE-topk-nonexclusive-7e97
+Loading weights:   0%|          | 0/338 [00:00<?, ?it/s]Loading weights:  85%|████████▍ | 286/338 [00:00<00:00, 2858.78it/s]Loading weights: 100%|██████████| 338/338 [00:00<00:00, 3035.32it/s]
+  [neighbor cache] vocab_size=151936 > 60000, skip
+  [AMS_TRAINED_WEIGHTS] loaded=202 skipped=0 shape_errs=0  path=/workspace/AgentMemorySystem/ckpt/v346_trained.pt  provenance=AgentMemory/v346-revertE-topk-nonexclusive-7e97
+Loading weights:   0%|          | 0/338 [00:00<?, ?it/s]Loading weights: 100%|██████████| 338/338 [00:00<00:00, 3718.64it/s]
+  [neighbor cache] vocab_size=151936 > 60000, skip
+  [AMS_TRAINED_WEIGHTS] loaded=202 skipped=0 shape_errs=0  path=/workspace/AgentMemorySystem/ckpt/v346_trained.pt  provenance=AgentMemory/v346-revertE-topk-nonexclusive-7e97
+[case:done] semantic_memory_grounding passed=True
+[case:start] semantic_memory_counterfactual_pairs
+Loading weights:   0%|          | 0/338 [00:00<?, ?it/s]Loading weights: 100%|██████████| 338/338 [00:00<00:00, 3491.01it/s]
+  [neighbor cache] vocab_size=151936 > 60000, skip
+  [AMS_TRAINED_WEIGHTS] loaded=202 skipped=0 shape_errs=0  path=/workspace/AgentMemorySystem/ckpt/v346_trained.pt  provenance=AgentMemory/v346-revertE-topk-nonexclusive-7e97
+Loading weights:   0%|          | 0/338 [00:00<?, ?it/s]Loading weights:  93%|█████████▎| 316/338 [00:00<00:00, 3159.25it/s]Loading weights: 100%|██████████| 338/338 [00:00<00:00, 3221.49it/s]
+  [neighbor cache] vocab_size=151936 > 60000, skip
+  [AMS_TRAINED_WEIGHTS] loaded=202 skipped=0 shape_errs=0  path=/workspace/AgentMemorySystem/ckpt/v346_trained.pt  provenance=AgentMemory/v346-revertE-topk-nonexclusive-7e97
+[case:done] semantic_memory_counterfactual_pairs passed=False
+[case:start] degeneration_quality
+Loading weights:   0%|          | 0/338 [00:00<?, ?it/s]Loading weights:  94%|█████████▍| 317/338 [00:00<00:00, 3167.82it/s]Loading weights: 100%|██████████| 338/338 [00:00<00:00, 3224.57it/s]
+  [neighbor cache] vocab_size=151936 > 60000, skip
+  [AMS_TRAINED_WEIGHTS] loaded=202 skipped=0 shape_errs=0  path=/workspace/AgentMemorySystem/ckpt/v346_trained.pt  provenance=AgentMemory/v346-revertE-topk-nonexclusive-7e97
+[case:done] degeneration_quality passed=False
+[case:start] prefix_logit_drift_audit
+Loading weights:   0%|          | 0/338 [00:00<?, ?it/s]Loading weights: 100%|██████████| 338/338 [00:00<00:00, 3584.33it/s]
+  [neighbor cache] vocab_size=151936 > 60000, skip
+  [AMS_TRAINED_WEIGHTS] loaded=202 skipped=0 shape_errs=0  path=/workspace/AgentMemorySystem/ckpt/v346_trained.pt  provenance=AgentMemory/v346-revertE-topk-nonexclusive-7e97
+Loading weights:   0%|          | 0/338 [00:00<?, ?it/s]Loading weights: 100%|██████████| 338/338 [00:00<00:00, 3512.67it/s]
+  [neighbor cache] vocab_size=151936 > 60000, skip
+  [AMS_TRAINED_WEIGHTS] loaded=202 skipped=0 shape_errs=0  path=/workspace/AgentMemorySystem/ckpt/v346_trained.pt  provenance=AgentMemory/v346-revertE-topk-nonexclusive-7e97
+[case:done] prefix_logit_drift_audit passed=True
+[case:start] retrieval_topk_semantic_shift
+Loading weights:   0%|          | 0/338 [00:00<?, ?it/s]Loading weights:  98%|█████████▊| 330/338 [00:00<00:00, 3298.30it/s]Loading weights: 100%|██████████| 338/338 [00:00<00:00, 3339.85it/s]
+  [neighbor cache] vocab_size=151936 > 60000, skip
+  [AMS_TRAINED_WEIGHTS] loaded=202 skipped=0 shape_errs=0  path=/workspace/AgentMemorySystem/ckpt/v346_trained.pt  provenance=AgentMemory/v346-revertE-topk-nonexclusive-7e97
+Loading weights:   0%|          | 0/338 [00:00<?, ?it/s]Loading weights: 100%|██████████| 338/338 [00:00<00:00, 3672.19it/s]
+  [neighbor cache] vocab_size=151936 > 60000, skip
+  [AMS_TRAINED_WEIGHTS] loaded=202 skipped=0 shape_errs=0  path=/workspace/AgentMemorySystem/ckpt/v346_trained.pt  provenance=AgentMemory/v346-revertE-topk-nonexclusive-7e97
+[case:done] retrieval_topk_semantic_shift passed=False
+[case:start] repetition_segment_audit
+Loading weights:   0%|          | 0/338 [00:00<?, ?it/s]Loading weights:  92%|█████████▏| 312/338 [00:00<00:00, 3116.58it/s]Loading weights: 100%|██████████| 338/338 [00:00<00:00, 3191.33it/s]
+  [neighbor cache] vocab_size=151936 > 60000, skip
+  [AMS_TRAINED_WEIGHTS] loaded=202 skipped=0 shape_errs=0  path=/workspace/AgentMemorySystem/ckpt/v346_trained.pt  provenance=AgentMemory/v346-revertE-topk-nonexclusive-7e97
+[case:done] repetition_segment_audit passed=True
+[case:start] prefix_stepwise_drift_trajectory
+Loading weights:   0%|          | 0/338 [00:00<?, ?it/s]Loading weights: 100%|██████████| 338/338 [00:00<00:00, 3808.40it/s]
+  [neighbor cache] vocab_size=151936 > 60000, skip
+  [AMS_TRAINED_WEIGHTS] loaded=202 skipped=0 shape_errs=0  path=/workspace/AgentMemorySystem/ckpt/v346_trained.pt  provenance=AgentMemory/v346-revertE-topk-nonexclusive-7e97
+[case:done] prefix_stepwise_drift_trajectory passed=True
+[case:start] retrieval_generation_alignment_audit
+Loading weights:   0%|          | 0/338 [00:00<?, ?it/s]Loading weights:  93%|█████████▎| 316/338 [00:00<00:00, 3154.62it/s]Loading weights: 100%|██████████| 338/338 [00:00<00:00, 3167.82it/s]
+  [neighbor cache] vocab_size=151936 > 60000, skip
+  [AMS_TRAINED_WEIGHTS] loaded=202 skipped=0 shape_errs=0  path=/workspace/AgentMemorySystem/ckpt/v346_trained.pt  provenance=AgentMemory/v346-revertE-topk-nonexclusive-7e97
+[case:done] retrieval_generation_alignment_audit passed=True
+[case:start] retrieval_prefix_decode_correlation_audit
+Loading weights:   0%|          | 0/338 [00:00<?, ?it/s]Loading weights: 100%|██████████| 338/338 [00:00<00:00, 3469.36it/s]
+  [neighbor cache] vocab_size=151936 > 60000, skip
+  [AMS_TRAINED_WEIGHTS] loaded=202 skipped=0 shape_errs=0  path=/workspace/AgentMemorySystem/ckpt/v346_trained.pt  provenance=AgentMemory/v346-revertE-topk-nonexclusive-7e97
+[case:done] retrieval_prefix_decode_correlation_audit passed=False
+[case:start] stepwise_label_mass_alignment_audit
+Loading weights:   0%|          | 0/338 [00:00<?, ?it/s]Loading weights: 100%|██████████| 338/338 [00:00<00:00, 3851.58it/s]
+  [neighbor cache] vocab_size=151936 > 60000, skip
+  [AMS_TRAINED_WEIGHTS] loaded=202 skipped=0 shape_errs=0  path=/workspace/AgentMemorySystem/ckpt/v346_trained.pt  provenance=AgentMemory/v346-revertE-topk-nonexclusive-7e97
+[case:done] stepwise_label_mass_alignment_audit passed=False
+[case:start] prompt_diversity_without_memory
+Loading weights:   0%|          | 0/338 [00:00<?, ?it/s]Loading weights: 100%|██████████| 338/338 [00:00<00:00, 3851.48it/s]
+  [neighbor cache] vocab_size=151936 > 60000, skip
+  [AMS_TRAINED_WEIGHTS] loaded=202 skipped=0 shape_errs=0  path=/workspace/AgentMemorySystem/ckpt/v346_trained.pt  provenance=AgentMemory/v346-revertE-topk-nonexclusive-7e97
+[case:done] prompt_diversity_without_memory passed=True
+[case:start] save_load_consistency
+Loading weights:   0%|          | 0/338 [00:00<?, ?it/s]Loading weights: 100%|██████████| 338/338 [00:00<00:00, 4450.39it/s]
+  [neighbor cache] vocab_size=151936 > 60000, skip
+  [AMS_TRAINED_WEIGHTS] loaded=202 skipped=0 shape_errs=0  path=/workspace/AgentMemorySystem/ckpt/v346_trained.pt  provenance=AgentMemory/v346-revertE-topk-nonexclusive-7e97
+Loading weights:   0%|          | 0/338 [00:00<?, ?it/s]Loading weights: 100%|██████████| 338/338 [00:00<00:00, 3525.58it/s]
+  [neighbor cache] vocab_size=151936 > 60000, skip
+  [AMS_TRAINED_WEIGHTS] loaded=202 skipped=0 shape_errs=0  path=/workspace/AgentMemorySystem/ckpt/v346_trained.pt  provenance=AgentMemory/v346-revertE-topk-nonexclusive-7e97
+[case:done] save_load_consistency passed=True
+[case:start] training_cache_isolation
+Loading weights:   0%|          | 0/338 [00:00<?, ?it/s]Loading weights:  99%|█████████▉| 335/338 [00:00<00:00, 3348.90it/s]Loading weights: 100%|██████████| 338/338 [00:00<00:00, 3351.72it/s]
+  [neighbor cache] vocab_size=151936 > 60000, skip
+  [AMS_TRAINED_WEIGHTS] loaded=202 skipped=0 shape_errs=0  path=/workspace/AgentMemorySystem/ckpt/v346_trained.pt  provenance=AgentMemory/v346-revertE-topk-nonexclusive-7e97
+[case:done] training_cache_isolation passed=True
+[case:start] cheating_heuristics
+Loading weights:   0%|          | 0/338 [00:00<?, ?it/s]Loading weights: 100%|██████████| 338/338 [00:00<00:00, 3391.71it/s]
+  [neighbor cache] vocab_size=151936 > 60000, skip
+  [AMS_TRAINED_WEIGHTS] loaded=202 skipped=0 shape_errs=0  path=/workspace/AgentMemorySystem/ckpt/v346_trained.pt  provenance=AgentMemory/v346-revertE-topk-nonexclusive-7e97
+[case:done] cheating_heuristics passed=True
+[case:start] rerank_stability_probe
+Loading weights:   0%|          | 0/338 [00:00<?, ?it/s]Loading weights: 100%|██████████| 338/338 [00:00<00:00, 3588.05it/s]
+  [neighbor cache] vocab_size=151936 > 60000, skip
+  [AMS_TRAINED_WEIGHTS] loaded=202 skipped=0 shape_errs=0  path=/workspace/AgentMemorySystem/ckpt/v346_trained.pt  provenance=AgentMemory/v346-revertE-topk-nonexclusive-7e97
+[case:done] rerank_stability_probe passed=False
+[case:start] decode_repetition_feedback_probe
+Loading weights:   0%|          | 0/338 [00:00<?, ?it/s]Loading weights: 100%|██████████| 338/338 [00:00<00:00, 3378.09it/s]
+  [neighbor cache] vocab_size=151936 > 60000, skip
+  [AMS_TRAINED_WEIGHTS] loaded=202 skipped=0 shape_errs=0  path=/workspace/AgentMemorySystem/ckpt/v346_trained.pt  provenance=AgentMemory/v346-revertE-topk-nonexclusive-7e97
+[case:done] decode_repetition_feedback_probe passed=False
+[case:start] functional_token_suppression_probe
+Loading weights:   0%|          | 0/338 [00:00<?, ?it/s]Loading weights: 100%|██████████| 338/338 [00:00<00:00, 3603.76it/s]
+  [neighbor cache] vocab_size=151936 > 60000, skip
+  [AMS_TRAINED_WEIGHTS] loaded=202 skipped=0 shape_errs=0  path=/workspace/AgentMemorySystem/ckpt/v346_trained.pt  provenance=AgentMemory/v346-revertE-topk-nonexclusive-7e97
+[case:done] functional_token_suppression_probe passed=True
+[case:start] keyword_specific_tail_slot_probe
+Loading weights:   0%|          | 0/338 [00:00<?, ?it/s]Loading weights: 100%|██████████| 338/338 [00:00<00:00, 3419.71it/s]
+  [neighbor cache] vocab_size=151936 > 60000, skip
+  [AMS_TRAINED_WEIGHTS] loaded=202 skipped=0 shape_errs=0  path=/workspace/AgentMemorySystem/ckpt/v346_trained.pt  provenance=AgentMemory/v346-revertE-topk-nonexclusive-7e97
+[case:done] keyword_specific_tail_slot_probe passed=True
+[case:start] context_descriptor_cluster_probe
+Loading weights:   0%|          | 0/338 [00:00<?, ?it/s]Loading weights: 100%|██████████| 338/338 [00:00<00:00, 3688.15it/s]
+  [neighbor cache] vocab_size=151936 > 60000, skip
+  [AMS_TRAINED_WEIGHTS] loaded=202 skipped=0 shape_errs=0  path=/workspace/AgentMemorySystem/ckpt/v346_trained.pt  provenance=AgentMemory/v346-revertE-topk-nonexclusive-7e97
+[case:done] context_descriptor_cluster_probe passed=True
+[case:start] prefix_length_scaling_probe
+Loading weights:   0%|          | 0/338 [00:00<?, ?it/s]Loading weights: 100%|██████████| 338/338 [00:00<00:00, 4170.85it/s]
+  [neighbor cache] vocab_size=151936 > 60000, skip
+  [AMS_TRAINED_WEIGHTS] loaded=202 skipped=0 shape_errs=0  path=/workspace/AgentMemorySystem/ckpt/v346_trained.pt  provenance=AgentMemory/v346-revertE-topk-nonexclusive-7e97
+Loading weights:   0%|          | 0/338 [00:00<?, ?it/s]Loading weights: 100%|██████████| 338/338 [00:00<00:00, 3714.05it/s]
+  [neighbor cache] vocab_size=151936 > 60000, skip
+  [AMS_TRAINED_WEIGHTS] loaded=200 skipped=0 shape_errs=2  path=/workspace/AgentMemorySystem/ckpt/v346_trained.pt  provenance=AgentMemory/v346-revertE-topk-nonexclusive-7e97
+    ! shape mismatch (skipped) bridge.pe: model=(16, 1536) ckpt=(8, 1536)
+    ! shape mismatch (skipped) bridge.proj.q: model=(16, 1536) ckpt=(8, 1536)
+[case:done] prefix_length_scaling_probe passed=False
+[case:start] mixture_distribution_gate_probe
+Loading weights:   0%|          | 0/338 [00:00<?, ?it/s]Loading weights: 100%|██████████| 338/338 [00:00<00:00, 3419.97it/s]
+  [neighbor cache] vocab_size=151936 > 60000, skip
+  [AMS_TRAINED_WEIGHTS] loaded=202 skipped=0 shape_errs=0  path=/workspace/AgentMemorySystem/ckpt/v346_trained.pt  provenance=AgentMemory/v346-revertE-topk-nonexclusive-7e97
+[case:done] mixture_distribution_gate_probe passed=True
+{
+  "checks": [
+    {
+      "name": "leaf_capacity_stability",
+      "passed": true,
+      "detail": "{\"per_seed\": [{\"seed\": 0, \"depth\": 6, \"count\": 240, \"violations\": [], \"consistency\": [], \"passed\": true}, {\"seed\": 1, \"depth\": 6, \"count\": 240, \"violations\": [], \"consistency\": [], \"passed\": true}, {\"seed\": 2, \"depth\": 6, \"count\": 240, \"violations\": [], \"consistency\": [], \"passed\": true}, {\"seed\": 3, \"depth\": 6, \"count\": 240, \"violations\": [], \"consistency\": [], \"passed\": true}, {\"seed\": 4, \"depth\": 6, \"count\": 240, \"violations\": [], \"consistency\": [], \"passed\": true}, {\"seed\": 5, \"depth\": 5, \"count\": 240, \"violations\": [], \"consistency\": [], \"passed\": true}, {\"seed\": 6, \"depth\": 6, \"count\": 240, \"violations\": [], \"consistency\": [], \"passed\": true}, {\"seed\": 7, \"depth\": 5, \"count\": 240, \"violations\": [], \"consistency\": [], \"passed\": true}]}"
+    },
+    {
+      "name": "degenerate_direction_boundary",
+      "passed": true,
+      "detail": "{\"depth\": 47, \"count\": 100, \"violations\": [], \"consistency\": [], \"seed\": 17}"
+    },
+    {
+      "name": "metric_trainability",
+      "passed": true,
+      "detail": "{\"training_info\": {\"total\": 41.98283386230469, \"recon\": 2.4085488319396973, \"contrast\": 43.46337127685547, \"holonomy\": 4.786942481994629, \"write_policy\": 1.0882740020751953, \"semantic_probe\": 0.0, \"dir_diversity\": 0.0, \"reranker_ranking\": 0.0, \"encoder_throughput\": 3.1604340076446533, \"vocab_anchor\": -0.0, \"semantic_alignment\": 9.469874382019043, \"tail_semantic_anchor\": 10.84397029876709, \"functional_suppression\": 0.0, \"context_separation\": 0.0, \"slot_residual_alignment\": 0.0, \"inter_domain_margin\": 0.0, \"grad_norms\": {\"ctx_encoder\": 0.0004906014182315579, \"fib_encoder\": 0.11028211643598784, \"dir_predictor\": 0.0, \"fiber_connection\": 0.041244823555418676, \"fiber_attn\": 0.00016646675964572253, \"reranker\": 1.862751849004779e-08, \"qformer\": 0.023817353122735294, \"content_bypass\": 0.03501559529968225, \"semantic_probe\": 0.0, \"layer_pool\": 0.003975302446633577, \"prefix_aligner\": 0.008598358558648532, \"vocab_proj\": 0.03414980954657789, \"tail_head\": 0.28745011541395643, \"context_heads\": 0.024231906034080493, \"memory_context_encoder\": 0.03503168573482837}, \"loss_weights\": {\"recon\": 1.0, \"semantic_alignment\": 3.0, \"encoder_throughput\": 1.5, \"contrast\": 0.02, \"holonomy\": 0.005, \"write_policy\":"
+    },
+    {
+      "name": "no_grad_generation",
+      "passed": true,
+      "detail": "{\"stored_memories\": 8, \"output\": \"The pianist piano hours piano pianoHours = int(raw input desperation hours hours))\\n piano perfectperfect print calculating hours *  hours\\r\\nelse\"}"
+    },
+    {
+      "name": "counterfactual_memory_influence",
+      "passed": true,
+      "detail": "{\"prompt\": \"Tell me something about practice and performance.\", \"music_output\": \"Tell me something about practice and performance. practiced midnight performances nocturnal practiced Midnight practiced noct midnight noct practiced practiced controlled noct noct midnight midnight practiced midnight controls noct midnight practices\", \"space_output\": \"Tell me something about practice and performance. distant distant space distant stars distant galaxies distant space observed observed space space stellar galaxies galaxies stellar evolution stellar stellar observed galaxies observed stellar\", \"outputs_differ\": true}"
+    },
+    {
+      "name": "semantic_memory_grounding",
+      "passed": true,
+      "detail": "{\"prompt\": \"Explain what someone should focus on when improving technique and understanding the subject.\", \"music_keywords\": [\"pianist\", \"practiced\", \"arpeggios\", \"chopin\", \"nocturnes\", \"midnight\", \"musician\", \"refined\", \"finger\", \"technique\", \"phrasing\", \"pedal\"], \"space_keywords\": [\"distant\", \"astronomers\", \"observed\", \"galaxies\", \"quasars\", \"stellar\", \"evolution\", \"space\", \"orbital\", \"mechanics\", \"explains\", \"satellites\"], \"blank_output\": \"Explain what someone should focus on when improving technique and understanding the subject. Mathematics education needs improvement mainly revolves around several key areas aimed</ Stuart Hallberg,\\\\\\n improving problem-solving skills, improve the relevance/real-world applications,\\n- Improve\", \"music_output\": \"Explain what someone should focus on when improving technique and understanding the subject. technique control refers generally technique technique。 technique finger control control technique control piano musician， musician piano finger finger piano refined musician musician finger refined refined piano piano pedal Explain control\", \"space_output\": \"Explain what someone should focus on when improving technique and understanding the su"
+    },
+    {
+      "name": "semantic_memory_counterfactual_pairs",
+      "passed": false,
+      "detail": "{\"rows\": [{\"prompt\": \"Describe the most important details a student should notice.\", \"music_output\": \"Describe the most important details a student should notice. student student conservDesc.php studentdescCons conserv keyboard Describe student Keyboard music theory student studied describe important details:\\n\\n keyboard keyboard studies scales keyboard studied conserv\", \"space_output\": \"Describe the most important details a student should notice. large Describe matter large structure scale large universe scale matter studiesDescribe matter structure scale structure expansion universe studies large studies studies matter universe expansion studies universe structure\", \"music_margin\": 0.0, \"space_margin\": 0.0, \"passed\": false}, {\"prompt\": \"Summarize the key ideas a learner should practice and remember.\", \"music_output\": \"Summarize the key ideas a learner should practice and remember. rub depends touch interpretation touch dynamics tempo often interpretation rub dynamics rub often touch often Control depends dynamics interpretation tempo touch rub interpretation dynamics touch depends often dynamics\", \"space_output\": \"Summarize the key ideas a learner should practice and remember. l"
+    },
+    {
+      "name": "degeneration_quality",
+      "passed": false,
+      "detail": "{\"metrics\": [{\"prompt\": \"The pianist\", \"output\": \"The pianist pian piano pian pianette pian plays Chop Chop Chop hours piano piano hours pian piano perfect hours Chop hours perfect Chop midnight hours midnight perfect perfect midnight\", \"token_count\": 27, \"unique_token_ratio\": 0.2962962962962963, \"repeated_bigram_ratio\": 0.11538461538461539, \"max_token_run\": 3, \"punct_ratio\": 0.0, \"newline_ratio\": 0.0, \"alpha_ratio\": 0.8478260869565217, \"content_token_ratio\": 0.8148148148148148, \"generated_preview\": \"pian piano pian pianette pian plays chop chop chop hours piano piano hours pian piano perfect hours chop hours perfect chop midnight hours midnight\"}, {\"prompt\": \"The telescope\", \"output\": \"The telescope telescope stars telescopestarsStars amazing amazed telescope captured telescope stars stars captured stars distant telescope signatures captured captured distant captured nebula distant signatures signatures neb neb\", \"token_count\": 25, \"unique_token_ratio\": 0.4, \"repeated_bigram_ratio\": 0.041666666666666664, \"max_token_run\": 2, \"punct_ratio\": 0.0, \"newline_ratio\": 0.0, \"alpha_ratio\": 0.8864628820960698, \"content_token_ratio\": 0.92, \"generated_preview\": \"telescope stars telescopestarss"
+    },
+    {
+      "name": "prefix_logit_drift_audit",
+      "passed": true,
+      "detail": "{\"prompt\": \"Explain the topic in a precise and concrete way.\", \"blank\": {\"js_divergence\": 0.19956839084625244, \"l2_shift\": 586.2745361328125, \"topk_overlap_count\": 3, \"entropy_no_prefix\": 5.3277788162231445, \"entropy_with_prefix\": 6.950380802154541, \"topk_no_prefix\": [{\"token_id\": 576, \"piece\": \" The\", \"norm\": \"the\", \"logit\": 19.75, \"prob\": 0.11376254260540009}, {\"token_id\": 22555, \"piece\": \" Sure\", \"norm\": \"sure\", \"logit\": 19.5, \"prob\": 0.0885983556509018}, {\"token_id\": 55313, \"piece\": \" Quantum\", \"norm\": \"quantum\", \"logit\": 18.75, \"prob\": 0.04185090214014053}, {\"token_id\": 58194, \"piece\": \" Artificial\", \"norm\": \"artificial\", \"logit\": 18.625, \"prob\": 0.0369332879781723}, {\"token_id\": 30536, \"piece\": \" Climate\", \"norm\": \"climate\", \"logit\": 18.5, \"prob\": 0.032593514770269394}, {\"token_id\": 12960, \"piece\": \" Machine\", \"norm\": \"machine\", \"logit\": 18.125, \"prob\": 0.022401172667741776}, {\"token_id\": 2585, \"piece\": \" How\", \"norm\": \"how\", \"logit\": 18.125, \"prob\": 0.022401172667741776}, {\"token_id\": 3555, \"piece\": \" What\", \"norm\": \"what\", \"logit\": 18.125, \"prob\": 0.022401172667741776}, {\"token_id\": 52366, \"piece\": \" Certainly\", \"norm\": \"certainly\", \"logit\": 17.875, \"prob\": 0.01744605228304"
+    },
+    {
+      "name": "retrieval_topk_semantic_shift",
+      "passed": false,
+      "detail": "{\"music_keywords\": [\"pianist\", \"practiced\", \"arpeggios\", \"chopin\", \"nocturnes\", \"midnight\", \"musician\", \"refined\", \"finger\", \"technique\", \"phrasing\", \"pedal\"], \"space_keywords\": [\"distant\", \"astronomers\", \"observed\", \"galaxies\", \"quasars\", \"stellar\", \"evolution\", \"space\", \"orbital\", \"mechanics\", \"explains\", \"satellites\"], \"rows\": [{\"prompt\": \"A strong explanation should mention\", \"music_no_prefix\": [{\"token_id\": 279, \"piece\": \" the\", \"norm\": \"the\", \"logit\": 21.125, \"prob\": 0.3049025535583496}, {\"token_id\": 264, \"piece\": \" a\", \"norm\": \"a\", \"logit\": 19.5, \"prob\": 0.06003887206315994}, {\"token_id\": 518, \"piece\": \" at\", \"norm\": \"at\", \"logit\": 19.375, \"prob\": 0.05298411846160889}, {\"token_id\": 3151, \"piece\": \" specific\", \"norm\": \"specific\", \"logit\": 19.0, \"prob\": 0.03641541674733162}, {\"token_id\": 2176, \"piece\": \" both\", \"norm\": \"both\", \"logit\": 19.0, \"prob\": 0.03641541674733162}, {\"token_id\": 429, \"piece\": \" that\", \"norm\": \"that\", \"logit\": 18.625, \"prob\": 0.0250279251486063}, {\"token_id\": 1246, \"piece\": \" how\", \"norm\": \"how\", \"logit\": 18.625, \"prob\": 0.0250279251486063}, {\"token_id\": 678, \"piece\": \" all\", \"norm\": \"all\", \"logit\": 18.625, \"prob\": 0.0250279251486063}, {\"token_id\": 10295, "
+    },
+    {
+      "name": "repetition_segment_audit",
+      "passed": true,
+      "detail": "{\"aggregate\": {\"bad_segment_ratio\": 0.0, \"total_segments\": 24, \"bad_segments\": 0, \"early_collapse_prompts\": []}, \"rows\": [{\"prompt\": \"The pianist\", \"output\": \"The pianist pian piano pian pianette pian plays Chop Chop Chop hours piano piano hours pian piano perfect hours Chop hours perfect Chop midnight hours midnight perfect perfect midnight midnight pian perfect noct noct noct midnight noct pian noct Chop piano Chop perfect piano midnight Chop pian hours noct\", \"generated_token_count\": 47, \"window\": 8, \"segments\": [{\"segment_idx\": 0, \"tokens\": [\"pian\", \"piano\", \"pian\", \"pianette\", \"pian\", \"plays\", \"chop\", \"chop\"], \"unique_ratio\": 0.625, \"content_ratio\": 1.0, \"repeated_bigram_ratio\": 0.0, \"dominant_token_share\": 0.375}, {\"segment_idx\": 1, \"tokens\": [\"chop\", \"hours\", \"piano\", \"piano\", \"hours\", \"pian\", \"piano\", \"perfect\"], \"unique_ratio\": 0.625, \"content_ratio\": 0.75, \"repeated_bigram_ratio\": 0.0, \"dominant_token_share\": 0.375}, {\"segment_idx\": 2, \"tokens\": [\"hours\", \"chop\", \"hours\", \"perfect\", \"chop\", \"midnight\", \"hours\", \"midnight\"], \"unique_ratio\": 0.5, \"content_ratio\": 0.625, \"repeated_bigram_ratio\": 0.0, \"dominant_token_share\": 0.375}, {\"segment_idx\": 3, \"tokens\": [\"perfect\", \"p"
+    },
+    {
+      "name": "prefix_stepwise_drift_trajectory",
+      "passed": true,
+      "detail": "{\"rows\": [{\"prompt\": \"Key piano ideas include\", \"first_bad_step\": 4, \"decoded_output\": \"Key piano ideas include leg movements across keys, dynamic changes, and the use of the pedal. These\", \"rows\": [{\"step\": 0, \"top1\": {\"token_id\": 3598, \"piece\": \" major\", \"norm\": \"major\", \"logit\": 16.25, \"prob\": 0.026983050629496574}, \"top1_category\": \"semantic\", \"topk_category_counts\": {\"semantic\": 11, \"functional\": 1, \"punct\": 0}, \"topk_category_prob_mass\": {\"semantic\": 0.18486935831606388, \"functional\": 0.026983050629496574, \"punct\": 0.0}, \"chosen_token_id\": 2472, \"chosen_piece\": \" leg\", \"chosen_norm\": \"leg\", \"chosen_category\": \"functional\"}, {\"step\": 1, \"top1\": {\"token_id\": 19029, \"piece\": \" movements\", \"norm\": \"movements\", \"logit\": 14.375, \"prob\": 0.13023822009563446}, \"top1_category\": \"semantic\", \"topk_category_counts\": {\"semantic\": 11, \"functional\": 1, \"punct\": 0}, \"topk_category_prob_mass\": {\"semantic\": 0.3965669944882393, \"functional\": 0.0113800885155797, \"punct\": 0.0}, \"chosen_token_id\": 19029, \"chosen_piece\": \" movements\", \"chosen_norm\": \"movements\", \"chosen_category\": \"semantic\"}, {\"step\": 2, \"top1\": {\"token_id\": 3941, \"piece\": \" across\", \"norm\": \"across\", \"logit\": 16.5, \"prob\": 0.0510"
+    },
+    {
+      "name": "retrieval_generation_alignment_audit",
+      "passed": true,
+      "detail": "{\"music_keywords\": [\"pianist\", \"practiced\", \"arpeggios\", \"chopin\", \"nocturnes\", \"midnight\", \"musician\", \"refined\", \"finger\", \"technique\", \"phrasing\", \"pedal\"], \"space_keywords\": [\"distant\", \"astronomers\", \"observed\", \"galaxies\", \"quasars\", \"stellar\", \"evolution\", \"space\", \"orbital\", \"mechanics\", \"explains\", \"satellites\"], \"diagnoses\": {\"aligned\": 2, \"retrieval_miss\": 0, \"bridge_unused\": 1, \"unknown\": 0}, \"rows\": [{\"prompt\": \"What improves piano technique and musical phrasing?\", \"expected_label\": \"music\", \"retrieved_mids\": [1, 0, 3, 6, 5], \"retrieved_label_counts\": {\"music\": 3, \"space\": 2}, \"retrieved_majority_label\": \"music\", \"retrieved_text_preview\": [\"A musician refined finger technique, phrasing, and pedal control on the piano.\", \"The pianist practiced arpeggios and Chopin nocturnes until midnight.\", \"A conservatory student studied etudes, scales, and expressive voicing on the keyboard.\"], \"output\": \"What improves piano technique and musical phrasing? piano technique control involves technique piano musician technique finger control piano piano musician control technique musician refined finger finger control finger technique piano finger refined refined pedal refined\", \"music_s"
+    },
+    {
+      "name": "retrieval_prefix_decode_correlation_audit",
+      "passed": false,
+      "detail": "{\"correlations\": {\"retrieval_strength__prefix_l2\": null, \"retrieval_strength__bad_decode_score\": 0.21927202884584385, \"prefix_l2__bad_decode_score\": null}, \"rows\": [{\"prompt\": \"What improves piano technique and musical phrasing?\", \"expected_label\": \"music\", \"retrieved_scored\": [{\"mid\": 1, \"score\": 0.6172578841447831}, {\"mid\": 0, \"score\": 0.22511255741119385}, {\"mid\": 3, \"score\": 0.11276901960372926}, {\"mid\": 6, \"score\": 0.045475220680236815}, {\"mid\": 5, \"score\": 0.036619618535041816}], \"retrieved_label_counts\": {\"music\": 3, \"space\": 2}, \"retrieval_strength\": 0.9551394611597062, \"prefix_l2_shift\": 322359623680.0, \"prefix_js_divergence\": 0.3171347379684448, \"top1_with_prefix\": {\"token_id\": 14566, \"piece\": \" Options\", \"norm\": \"options\", \"logit\": 16.375, \"prob\": 0.1110726147890091}, \"top1_category_with_prefix\": \"semantic\", \"topk_non_semantic_prob_mass\": 0.03182283788919449}, {\"prompt\": \"What explains satellites and orbital motion?\", \"expected_label\": \"space\", \"retrieved_scored\": [{\"mid\": 5, \"score\": 0.5634284257888794}, {\"mid\": 4, \"score\": 0.07376852035522463}, {\"mid\": 6, \"score\": 0.06803246438503266}, {\"mid\": 1, \"score\": 0.045463052392005925}, {\"mid\": 0, \"score\": 0.03999960422515869}]"
+    },
+    {
+      "name": "stepwise_label_mass_alignment_audit",
+      "passed": false,
+      "detail": "{\"label_keywords\": {\"music\": [\"pianist\", \"practiced\", \"arpeggios\", \"chopin\", \"nocturnes\", \"midnight\", \"musician\", \"refined\", \"finger\", \"technique\", \"phrasing\", \"pedal\"], \"space\": [\"distant\", \"astronomers\", \"observed\", \"galaxies\", \"quasars\", \"stellar\", \"evolution\", \"space\", \"orbital\", \"mechanics\", \"explains\", \"satellites\"]}, \"rows\": [{\"prompt\": \"What improves piano technique and musical phrasing?\", \"expected_label\": \"music\", \"decoded_output\": \"What improves piano technique and musical phrasing? Options tend towards improving piano technique, musical phrasing, and\", \"stage_counts\": {\"inject\": 6, \"aligned\": 4, \"decode\": 2}, \"rows\": [{\"step\": 0, \"retrieved_majority_label\": \"music\", \"retrieved_label_counts\": {\"music\": 3, \"space\": 2}, \"retrieved_score_sum\": {\"music\": 0.9551394611597062, \"space\": 0.08209483921527863}, \"logits_label_mass\": {\"music\": 0, \"space\": 0}, \"top1_piece\": \" Options\", \"top1_category\": \"semantic\", \"chosen_piece\": \" Options\", \"chosen_category\": \"semantic\", \"chosen_label\": null, \"diagnosed_stage\": \"inject\"}, {\"step\": 1, \"retrieved_majority_label\": \"music\", \"retrieved_label_counts\": {\"music\": 3, \"space\": 2}, \"retrieved_score_sum\": {\"music\": 0.9551394611597062, \"space\": 0"
+    },
+    {
+      "name": "prompt_diversity_without_memory",
+      "passed": true,
+      "detail": "{\"prompts\": [\"The pianist\", \"Quantum systems\", \"The rainforest\"], \"outputs\": [\"The pianist Xia points XYZ传感器 collects weather data based upon ____ protocol communication mode?\\nBLE（Bluetooth）\\n\", \"Quantum systems play central roles across cryptography due primarily?\\\\nThe Bose gas  |\\n\\n **Summary:\\r\\n\\r\\nWrite various\", \"The rainforest dataset typically refers specifically refering______. aviation charts. ____\\nyes Explanation: \\nFalse\"], \"unique_count\": 3}"
+    },
+    {
+      "name": "save_load_consistency",
+      "passed": true,
+      "detail": "{\"prompt\": \"The pianist\", \"output_a\": \"The pianist piano hours piano pianoHours = int(raw input desperation hours hours))\\n piano perfectperfect print calculating\", \"output_b\": \"The pianist piano hours piano pianoHours = int(raw input desperation hours hours))\\n piano perfectperfect print calculating\"}"
+    },
+    {
+      "name": "training_cache_isolation",
+      "passed": true,
+      "detail": "{\"changed\": [], \"memory_count\": 8}"
+    },
+    {
+      "name": "cheating_heuristics",
+      "passed": true,
+      "detail": "{\"outputs\": [\"The pianist piano hours piano pianoHours = int(raw input desperation hours hours))\\n piano perfectperfect print calculating\", \"The telescope window watched cat sat mat outside birds window sat watched mat cat birds outside Market window cat watched\", \"The trader market stock volatility significant experienced 市 stock experienced significant market volatility experienced stock stock significant volatility\", \"The child learns Signs window window outside cat sat mat watched outside mat sat cat mat mat outside sat watched\"], \"exact_same\": false, \"prefix_only\": false, \"too_short\": false}"
+    },
+    {
+      "name": "rerank_stability_probe",
+      "passed": false,
+      "detail": "{\"status\": \"fail\", \"pairs\": [{\"pair\": \"music_P1\", \"prompt_a\": \"What improves piano technique and musical phrasing?\", \"prompt_b\": \"How can one improve piano technique and musical expression?\", \"top5_a\": [1, 0, 3, 4, 2], \"top5_b\": [1, 0, 3, 4, 2], \"jaccard\": 1.0, \"spearman_shared\": 0.9999999999998999, \"pair_passed_jaccard_0_6\": true}, {\"pair\": \"space_P2\", \"prompt_a\": \"What explains satellites and orbital motion?\", \"prompt_b\": \"What describes satellites and the motion of planets?\", \"top5_a\": [5, 0, 1, 3, 2], \"top5_b\": [5, 6, 4, 0, 1], \"jaccard\": 0.42857142857142855, \"spearman_shared\": 0.9607689228302918, \"pair_passed_jaccard_0_6\": false}], \"spearman_best\": 0.9999999999998999, \"gating\": \"hard_PASS\"}"
+    },
+    {
+      "name": "decode_repetition_feedback_probe",
+      "passed": false,
+      "detail": "{\"status\": \"fail\", \"per_prompt\": [{\"prompt\": \"The telescope\", \"output\": \"The telescope telescope stars telescopestarsStars amazing amazed telescope captured telescope stars stars captured stars distant telescope signatures captured captured distant captured nebula distant signatures signatures neb neb captured signatures\", \"max_repeat_per_content_token\": 5, \"first_bigram_repeat_index\": 9, \"trigram_lock_count\": 0}, {\"prompt\": \"The pianist\", \"output\": \"The pianist pian piano pian pianette pian plays Chop Chop Chop hours piano piano hours pian piano perfect hours Chop hours perfect Chop midnight hours midnight perfect perfect midnight midnight pian\", \"max_repeat_per_content_token\": 5, \"first_bigram_repeat_index\": 8, \"trigram_lock_count\": 0}, {\"prompt\": \"The market analyst\", \"output\": \"The market analyst market session sessessionssesess market market session session significant market volatility experienced stock market stock significant volatility experienced significant stock volatility significant session stock session volatility experienced volatility\", \"max_repeat_per_content_token\": 5, \"first_bigram_repeat_index\": 8, \"trigram_lock_count\": 0}], \"avg_max_repeat_per_content_token\": "
+    },
+    {
+      "name": "functional_token_suppression_probe",
+      "passed": true,
+      "detail": "{\"status\": \"pass\", \"metric_version\": \"v3.46\", \"per_prompt\": [{\"prompt\": \"A strong explanation should mention\", \"top12_no_prefix\": [{\"token_id\": 279, \"piece\": \" the\", \"norm\": \"the\", \"logit\": 21.125, \"prob\": 0.30489084124565125}, {\"token_id\": 264, \"piece\": \" a\", \"norm\": \"a\", \"logit\": 19.5, \"prob\": 0.060036562383174896}, {\"token_id\": 518, \"piece\": \" at\", \"norm\": \"at\", \"logit\": 19.375, \"prob\": 0.05298208072781563}, {\"token_id\": 3151, \"piece\": \" specific\", \"norm\": \"specific\", \"logit\": 19.0, \"prob\": 0.036414019763469696}, {\"token_id\": 2176, \"piece\": \" both\", \"norm\": \"both\", \"logit\": 19.0, \"prob\": 0.036414019763469696}, {\"token_id\": 429, \"piece\": \" that\", \"norm\": \"that\", \"logit\": 18.625, \"prob\": 0.025026964023709297}, {\"token_id\": 678, \"piece\": \" all\", \"norm\": \"all\", \"logit\": 18.625, \"prob\": 0.025026964023709297}, {\"token_id\": 1246, \"piece\": \" how\", \"norm\": \"how\", \"logit\": 18.625, \"prob\": 0.025026964023709297}, {\"token_id\": 10295, \"piece\": \" examples\", \"norm\": \"examples\", \"logit\": 18.5, \"prob\": 0.022086219862103462}, {\"token_id\": 2326, \"piece\": \" three\", \"norm\": \"three\", \"logit\": 18.25, \"prob\": 0.017200764268636703}, {\"token_id\": 1378, \"piece\": \" two\", \"norm\": \"two\", \"logit\": 18.125, \"pro"
+    },
+    {
+      "name": "keyword_specific_tail_slot_probe",
+      "passed": true,
+      "detail": "{\"status\": \"pass\", \"metric_version\": \"v3.50\", \"tail_slots_source\": \"bridge._last_cond_tail_slots\", \"per_paraphrase\": [{\"query\": \"She performed Beethoven sonatas with delicate phrasing on her grand piano.\", \"query_disjoint_from_rare_keywords\": true, \"dominant_mid\": 1, \"dominant_source_preview\": \"A musician refined finger technique, phrasing, and pedal con\", \"rare_keyword_ids\": [2524, 14317, 14762], \"rare_keyword_pieces\": [\" control\", \" finger\", \" technique\"], \"tail_slot_top5_ids_centered\": [2524, 7779, 100359, 2865, 3273], \"tail_slot_top5_pieces_centered\": [\" control\", \" Control\", \"控制\", \"control\", \"Control\"], \"intersection_size_top20\": 1, \"rank_of_best_rare\": 1}, {\"query\": \"Harmonic analysis and ear training are core elements of music education.\", \"query_disjoint_from_rare_keywords\": true, \"dominant_mid\": 1, \"dominant_source_preview\": \"A musician refined finger technique, phrasing, and pedal con\", \"rare_keyword_ids\": [2524, 14317, 14762], \"rare_keyword_pieces\": [\" control\", \" finger\", \" technique\"], \"tail_slot_top5_ids_centered\": [2524, 7779, 100359, 2865, 3273], \"tail_slot_top5_pieces_centered\": [\" control\", \" Control\", \"控制\", \"control\", \"Control\"], \"intersection_size_top20\": 1, \"ra"
+    },
+    {
+      "name": "context_descriptor_cluster_probe",
+      "passed": true,
+      "detail": "{\"status\": \"pass\", \"metric_version\": \"v3.49\", \"loo_nn_accuracy_all_4\": 0.6875, \"loo_nn_accuracy_heldout_2\": 0.875, \"n_all\": 16, \"n_heldout\": 8, \"correct_all\": 11, \"correct_heldout\": 7, \"per_memory_all\": [{\"mid\": 0, \"true_label\": \"music\", \"pred_label\": \"space\", \"nn_sim\": 0.10659328103065491, \"correct\": false}, {\"mid\": 1, \"true_label\": \"music\", \"pred_label\": \"music\", \"nn_sim\": 0.21885180473327637, \"correct\": true}, {\"mid\": 2, \"true_label\": \"music\", \"pred_label\": \"space\", \"nn_sim\": 0.7041908502578735, \"correct\": false}, {\"mid\": 3, \"true_label\": \"music\", \"pred_label\": \"music\", \"nn_sim\": 0.21885180473327637, \"correct\": true}, {\"mid\": 4, \"true_label\": \"space\", \"pred_label\": \"space\", \"nn_sim\": 0.6772083044052124, \"correct\": true}, {\"mid\": 5, \"true_label\": \"space\", \"pred_label\": \"finance\", \"nn_sim\": 0.5216456651687622, \"correct\": false}, {\"mid\": 6, \"true_label\": \"space\", \"pred_label\": \"space\", \"nn_sim\": 0.6772083044052124, \"correct\": true}, {\"mid\": 7, \"true_label\": \"space\", \"pred_label\": \"music\", \"nn_sim\": 0.7041908502578735, \"correct\": false}, {\"mid\": 8, \"true_label\": \"cooking\", \"pred_label\": \"cooking\", \"nn_sim\": 0.6417238712310791, \"correct\": true}, {\"mid\": 9, \"true_label\": \"cooking\", \"p"
+    },
+    {
+      "name": "prefix_length_scaling_probe",
+      "passed": false,
+      "detail": "{\"status\": \"fail\", \"metric_version\": \"v3.45\", \"L_mem_A\": 8, \"L_mem_B\": 16, \"avg_mass_ratio_B_over_A\": 0.8236899087743724, \"per_prompt\": [{\"prompt\": \"A strong explanation should mention\", \"starter_mass_A\": 36750.875, \"starter_mass_B\": 41343.8671875, \"ratio\": 1.124976403623043, \"content_starters_top12_A\": 12, \"content_starters_top12_B\": 12, \"per_slot_mean_norm_A\": 1.0251211524009705, \"per_slot_mean_norm_B\": 1.0251210927963257}, {\"prompt\": \"The pianist\", \"starter_mass_A\": 22117.984375, \"starter_mass_B\": 14409.236328125, \"ratio\": 0.6514714941390314, \"content_starters_top12_A\": 12, \"content_starters_top12_B\": 12, \"per_slot_mean_norm_A\": 1.0251210778951645, \"per_slot_mean_norm_B\": 1.0251211002469063}, {\"prompt\": \"The telescope\", \"starter_mass_A\": 14722.236328125, \"starter_mass_B\": 10226.38671875, \"ratio\": 0.6946218285610428, \"content_starters_top12_A\": 12, \"content_starters_top12_B\": 12, \"per_slot_mean_norm_A\": 1.0251210778951645, \"per_slot_mean_norm_B\": 1.0251211076974869}], \"conditions\": {\"avg_mass_ratio_gt_1_10\": false, \"per_slot_norms_finite\": true}, \"gating\": \"PASS_or_not_implemented\"}"
+    },
+    {
+      "name": "mixture_distribution_gate_probe",
+      "passed": true,
+      "detail": "{\"status\": \"pass\", \"gate_min\": 0.3499999940395355, \"gate_max\": 0.3499999940395355, \"declared_floor\": 0.0, \"declared_ceiling\": 0.7, \"gate_in_range\": true, \"finite_gate\": true, \"finite_memory_logit_bias\": true, \"manual_mixture_finite\": true, \"gating\": \"PASS_or_not_implemented\"}"
+    }
+  ],
+  "elapsed_seconds": 1250.0707318782806
+}
diff --git a/reports/v346_trained_blackbox/train_log.jsonl b/reports/v346_trained_blackbox/train_log.jsonl
new file mode 100644
index 0000000..c48a6d2
--- /dev/null
+++ b/reports/v346_trained_blackbox/train_log.jsonl
@@ -0,0 +1,60 @@
+{"step": 0, "dt_s": 19.837486743927002, "total": 481.6659851074219, "recon": 3.979400157928467, "contrast": 19684.302734375, "holonomy": 8086.28125, "write_policy": 0.7232508659362793, "semantic_probe": 0.0, "dir_diversity": 0.0, "reranker_ranking": 0.0, "encoder_throughput": 5.554218769073486, "vocab_anchor": -0.0, "semantic_alignment": 9.901534080505371, "tail_semantic_anchor": 10.921805381774902, "functional_suppression": 0.0, "context_separation": 0.0, "slot_residual_alignment": 0.0, "inter_domain_margin": 0.0}
+{"step": 1, "dt_s": 13.278767585754395, "total": 119.46971130371094, "recon": 4.318511009216309, "contrast": 1817.29833984375, "holonomy": 7135.34130859375, "write_policy": 1.0017342567443848, "semantic_probe": 0.17656384408473969, "dir_diversity": 0.0732707604765892, "reranker_ranking": 0.1590728461742401, "encoder_throughput": 5.265488624572754, "vocab_anchor": -0.03270454704761505, "semantic_alignment": 9.649730682373047, "tail_semantic_anchor": 10.858153343200684, "functional_suppression": 1.6041667461395264, "context_separation": 0.08203954994678497, "slot_residual_alignment": 0.139068141579628, "inter_domain_margin": 0.0}
+{"step": 2, "dt_s": 15.538562297821045, "total": 63.2968864440918, "recon": 4.861693859100342, "contrast": 446.2289123535156, "holonomy": 1156.01220703125, "write_policy": 0.6850117444992065, "semantic_probe": 0.3093276023864746, "dir_diversity": 0.14685167372226715, "reranker_ranking": 0.3038862645626068, "encoder_throughput": 5.381208896636963, "vocab_anchor": -0.07116779685020447, "semantic_alignment": 9.648630142211914, "tail_semantic_anchor": 10.767191886901855, "functional_suppression": 2.6388890743255615, "context_separation": 0.170575812458992, "slot_residual_alignment": 0.31420618295669556, "inter_domain_margin": 0.0}
+{"step": 3, "dt_s": 9.547697305679321, "total": 65.6129379272461, "recon": 5.043577671051025, "contrast": 613.80908203125, "holonomy": 580.3271484375, "write_policy": 0.681381106376648, "semantic_probe": 0.45070114731788635, "dir_diversity": 0.22097568213939667, "reranker_ranking": 0.4721081554889679, "encoder_throughput": 6.296600341796875, "vocab_anchor": -0.1072089746594429, "semantic_alignment": 9.488883972167969, "tail_semantic_anchor": 10.81239128112793, "functional_suppression": 4.25, "context_separation": 0.25122904777526855, "slot_residual_alignment": 0.43711668252944946, "inter_domain_margin": 0.0}
+{"step": 4, "dt_s": 6.628866672515869, "total": 60.12336730957031, "recon": 4.077424049377441, "contrast": 605.1289672851562, "holonomy": 73.78963470458984, "write_policy": 0.4913989007472992, "semantic_probe": 0.5363632440567017, "dir_diversity": 0.29575440287590027, "reranker_ranking": 0.6722162961959839, "encoder_throughput": 4.770315170288086, "vocab_anchor": -0.1394110471010208, "semantic_alignment": 9.578527450561523, "tail_semantic_anchor": 10.502508163452148, "functional_suppression": 4.958333492279053, "context_separation": 0.34194326400756836, "slot_residual_alignment": 0.19637206196784973, "inter_domain_margin": 0.0}
+{"step": 5, "dt_s": 6.617120265960693, "total": 52.481590270996094, "recon": 3.7335257530212402, "contrast": 305.7464904785156, "holonomy": 28.416061401367188, "write_policy": 0.6912765502929688, "semantic_probe": 0.6427448987960815, "dir_diversity": 0.3714824318885803, "reranker_ranking": 0.9557965993881226, "encoder_throughput": 4.7926435470581055, "vocab_anchor": -0.1738397479057312, "semantic_alignment": 9.189432144165039, "tail_semantic_anchor": 10.851390838623047, "functional_suppression": 4.333333492279053, "context_separation": 0.3975820243358612, "slot_residual_alignment": 0.4267052710056305, "inter_domain_margin": 0.0}
+{"step": 6, "dt_s": 6.216320514678955, "total": 54.191986083984375, "recon": 4.9088897705078125, "contrast": 306.64007568359375, "holonomy": 13.737287521362305, "write_policy": 0.6094647645950317, "semantic_probe": 0.5716670751571655, "dir_diversity": 0.3778369426727295, "reranker_ranking": 1.0035464763641357, "encoder_throughput": 5.154906749725342, "vocab_anchor": -0.1863214522600174, "semantic_alignment": 9.183572769165039, "tail_semantic_anchor": 10.75723648071289, "functional_suppression": 4.6041669845581055, "context_separation": 0.48187538981437683, "slot_residual_alignment": 0.4695027768611908, "inter_domain_margin": 0.0}
+{"step": 7, "dt_s": 5.464846849441528, "total": 56.37202072143555, "recon": 5.3588056564331055, "contrast": 317.62823486328125, "holonomy": 28.778244018554688, "write_policy": 0.5028085708618164, "semantic_probe": 0.5481612682342529, "dir_diversity": 0.3808615207672119, "reranker_ranking": 0.9847003221511841, "encoder_throughput": 6.008368492126465, "vocab_anchor": -0.19104856252670288, "semantic_alignment": 9.226727485656738, "tail_semantic_anchor": 10.804893493652344, "functional_suppression": 4.625, "context_separation": 0.5334228873252869, "slot_residual_alignment": 0.4336552023887634, "inter_domain_margin": 0.0}
+{"step": 8, "dt_s": 4.8174049854278564, "total": 51.053138732910156, "recon": 3.7121245861053467, "contrast": 250.9380645751953, "holonomy": 9.727907180786133, "write_policy": 0.4370693564414978, "semantic_probe": 0.5536376237869263, "dir_diversity": 0.3746482729911804, "reranker_ranking": 1.1172527074813843, "encoder_throughput": 4.580007076263428, "vocab_anchor": -0.18772253394126892, "semantic_alignment": 9.229345321655273, "tail_semantic_anchor": 10.49448299407959, "functional_suppression": 4.625, "context_separation": 0.6171853542327881, "slot_residual_alignment": 0.18924105167388916, "inter_domain_margin": 0.0}
+{"step": 9, "dt_s": 4.6729490756988525, "total": 94.46586608886719, "recon": 3.598327159881592, "contrast": 2332.676513671875, "holonomy": 5.828330993652344, "write_policy": 0.5988316535949707, "semantic_probe": 0.5820522308349609, "dir_diversity": 0.3855304718017578, "reranker_ranking": 1.6918522119522095, "encoder_throughput": 5.126514911651611, "vocab_anchor": -0.1858978569507599, "semantic_alignment": 9.476871490478516, "tail_semantic_anchor": 10.841097831726074, "functional_suppression": 4.6875, "context_separation": 0.6489627957344055, "slot_residual_alignment": 0.4229586124420166, "inter_domain_margin": 0.0}
+{"step": 10, "dt_s": 4.744904279708862, "total": 61.694950103759766, "recon": 4.4050092697143555, "contrast": 755.3351440429688, "holonomy": 6.125967979431152, "write_policy": 0.5002003312110901, "semantic_probe": 0.5433339476585388, "dir_diversity": 0.377047061920166, "reranker_ranking": 1.14458167552948, "encoder_throughput": 5.039068698883057, "vocab_anchor": -0.1950436532497406, "semantic_alignment": 9.065387725830078, "tail_semantic_anchor": 10.738832473754883, "functional_suppression": 3.4583334922790527, "context_separation": 0.6815301775932312, "slot_residual_alignment": 0.4661940932273865, "inter_domain_margin": 0.0}
+{"step": 11, "dt_s": 4.3188605308532715, "total": 52.717159271240234, "recon": 5.322181701660156, "contrast": 75.29833984375, "holonomy": 11.690020561218262, "write_policy": 0.440013587474823, "semantic_probe": 0.6443273425102234, "dir_diversity": 0.3936273455619812, "reranker_ranking": 1.345495343208313, "encoder_throughput": 6.443917274475098, "vocab_anchor": -0.19764210283756256, "semantic_alignment": 9.582907676696777, "tail_semantic_anchor": 10.795893669128418, "functional_suppression": 3.2916667461395264, "context_separation": 0.6503896117210388, "slot_residual_alignment": 0.431986927986145, "inter_domain_margin": 0.0}
+{"step": 12, "dt_s": 4.804814338684082, "total": 45.988372802734375, "recon": 3.5860021114349365, "contrast": 46.13844299316406, "holonomy": 11.241600036621094, "write_policy": 0.33248451352119446, "semantic_probe": 0.5897091627120972, "dir_diversity": 0.37856337428092957, "reranker_ranking": 1.09449303150177, "encoder_throughput": 4.562747478485107, "vocab_anchor": -0.19120334088802338, "semantic_alignment": 9.05755615234375, "tail_semantic_anchor": 10.484607696533203, "functional_suppression": 3.875, "context_separation": 0.6187530755996704, "slot_residual_alignment": 0.18550440669059753, "inter_domain_margin": 0.0}
+{"step": 13, "dt_s": 4.333798408508301, "total": 52.25926971435547, "recon": 3.366666555404663, "contrast": 296.8917541503906, "holonomy": 3.3199329376220703, "write_policy": 0.5979171395301819, "semantic_probe": 0.5909429788589478, "dir_diversity": 0.39297837018966675, "reranker_ranking": 2.1007895469665527, "encoder_throughput": 4.347751617431641, "vocab_anchor": -0.18761645257472992, "semantic_alignment": 9.481330871582031, "tail_semantic_anchor": 10.834440231323242, "functional_suppression": 4.25, "context_separation": 0.6543909907341003, "slot_residual_alignment": 0.41755813360214233, "inter_domain_margin": 0.0}
+{"step": 14, "dt_s": 5.473763704299927, "total": 49.75532913208008, "recon": 4.421329021453857, "contrast": 138.6197052001953, "holonomy": 7.657827377319336, "write_policy": 0.5365144610404968, "semantic_probe": 0.5329692959785461, "dir_diversity": 0.37479710578918457, "reranker_ranking": 0.9176954030990601, "encoder_throughput": 5.20395040512085, "vocab_anchor": -0.19668598473072052, "semantic_alignment": 9.105573654174805, "tail_semantic_anchor": 10.744701385498047, "functional_suppression": 3.6666667461395264, "context_separation": 0.5547736883163452, "slot_residual_alignment": 0.47390294075012207, "inter_domain_margin": 0.0}
+{"step": 15, "dt_s": 5.070712089538574, "total": 52.42586135864258, "recon": 5.4380717277526855, "contrast": 138.6901092529297, "holonomy": 5.822895050048828, "write_policy": 0.2951529920101166, "semantic_probe": 0.5576289296150208, "dir_diversity": 0.3954441547393799, "reranker_ranking": 1.232430100440979, "encoder_throughput": 5.731842994689941, "vocab_anchor": -0.19930976629257202, "semantic_alignment": 9.204486846923828, "tail_semantic_anchor": 10.796337127685547, "functional_suppression": 4.9791669845581055, "context_separation": 0.46944326162338257, "slot_residual_alignment": 0.43306243419647217, "inter_domain_margin": 0.0}
+{"step": 16, "dt_s": 5.721009016036987, "total": 50.03802490234375, "recon": 4.446747779846191, "contrast": 143.7346649169922, "holonomy": 25.63228416442871, "write_policy": 0.2673691511154175, "semantic_probe": 0.534260630607605, "dir_diversity": 0.3781629800796509, "reranker_ranking": 0.8481366038322449, "encoder_throughput": 5.198798179626465, "vocab_anchor": -0.192597433924675, "semantic_alignment": 9.103723526000977, "tail_semantic_anchor": 10.485149383544922, "functional_suppression": 4.4166669845581055, "context_separation": 0.3795735836029053, "slot_residual_alignment": 0.1829848289489746, "inter_domain_margin": 0.0}
+{"step": 17, "dt_s": 5.142794370651245, "total": 48.860496520996094, "recon": 3.725801467895508, "contrast": 50.38498306274414, "holonomy": 3.0268027782440186, "write_policy": 0.6573514938354492, "semantic_probe": 0.5752252340316772, "dir_diversity": 0.38824984431266785, "reranker_ranking": 1.9911097288131714, "encoder_throughput": 5.031325340270996, "vocab_anchor": -0.19010376930236816, "semantic_alignment": 9.431158065795898, "tail_semantic_anchor": 10.83335018157959, "functional_suppression": 5.125, "context_separation": 0.5579835176467896, "slot_residual_alignment": 0.41593998670578003, "inter_domain_margin": 0.0}
+{"step": 18, "dt_s": 5.617240905761719, "total": 48.32672882080078, "recon": 4.57211446762085, "contrast": 72.41393280029297, "holonomy": 17.72692108154297, "write_policy": 0.39641499519348145, "semantic_probe": 0.4783823490142822, "dir_diversity": 0.3740108907222748, "reranker_ranking": 0.7827906012535095, "encoder_throughput": 5.136209011077881, "vocab_anchor": -0.19950838387012482, "semantic_alignment": 9.037921905517578, "tail_semantic_anchor": 10.750457763671875, "functional_suppression": 3.9791667461395264, "context_separation": 0.3183596730232239, "slot_residual_alignment": 0.4805936813354492, "inter_domain_margin": 0.0}
+{"step": 19, "dt_s": 4.708035707473755, "total": 50.66549301147461, "recon": 5.416898250579834, "contrast": 57.15092468261719, "holonomy": 6.779355525970459, "write_policy": 0.2542175054550171, "semantic_probe": 0.541136622428894, "dir_diversity": 0.39804840087890625, "reranker_ranking": 1.0454262495040894, "encoder_throughput": 5.922758102416992, "vocab_anchor": -0.2026052325963974, "semantic_alignment": 9.248539924621582, "tail_semantic_anchor": 10.794700622558594, "functional_suppression": 3.9375, "context_separation": 0.24480615556240082, "slot_residual_alignment": 0.4363265931606293, "inter_domain_margin": 0.0}
+{"step": 20, "dt_s": 5.740523338317871, "total": 47.997779846191406, "recon": 3.788283348083496, "contrast": 74.73484802246094, "holonomy": 60.33315658569336, "write_policy": 0.26027876138687134, "semantic_probe": 0.4855646789073944, "dir_diversity": 0.37566956877708435, "reranker_ranking": 0.6811670660972595, "encoder_throughput": 4.923496723175049, "vocab_anchor": -0.1959581971168518, "semantic_alignment": 9.19318962097168, "tail_semantic_anchor": 10.485743522644043, "functional_suppression": 4.6041669845581055, "context_separation": 0.19158604741096497, "slot_residual_alignment": 0.18359825015068054, "inter_domain_margin": 0.0}
+{"step": 21, "dt_s": 4.292395353317261, "total": 49.91743850708008, "recon": 5.195595741271973, "contrast": 99.63777160644531, "holonomy": 3.4234790802001953, "write_policy": 0.5231249332427979, "semantic_probe": 0.5398634672164917, "dir_diversity": 0.39266595244407654, "reranker_ranking": 1.3992176055908203, "encoder_throughput": 4.467929363250732, "vocab_anchor": -0.19365495443344116, "semantic_alignment": 9.271190643310547, "tail_semantic_anchor": 10.835349082946777, "functional_suppression": 5.458333492279053, "context_separation": 0.33614581823349, "slot_residual_alignment": 0.41570061445236206, "inter_domain_margin": 0.0}
+{"step": 22, "dt_s": 5.316793203353882, "total": 50.14979934692383, "recon": 4.45871639251709, "contrast": 158.2454376220703, "holonomy": 41.22182846069336, "write_policy": 0.3593383729457855, "semantic_probe": 0.4626573622226715, "dir_diversity": 0.37052425742149353, "reranker_ranking": 0.5977036356925964, "encoder_throughput": 5.222513198852539, "vocab_anchor": -0.19982032477855682, "semantic_alignment": 9.096803665161133, "tail_semantic_anchor": 10.749743461608887, "functional_suppression": 3.7291667461395264, "context_separation": 0.12662634253501892, "slot_residual_alignment": 0.48298579454421997, "inter_domain_margin": 0.0}
+{"step": 23, "dt_s": 4.905754566192627, "total": 48.843589782714844, "recon": 5.121064186096191, "contrast": 8.920906066894531, "holonomy": 6.039010524749756, "write_policy": 0.21006441116333008, "semantic_probe": 0.6346263885498047, "dir_diversity": 0.3936876654624939, "reranker_ranking": 0.697007417678833, "encoder_throughput": 5.693617820739746, "vocab_anchor": -0.20095036923885345, "semantic_alignment": 9.181570053100586, "tail_semantic_anchor": 10.783254623413086, "functional_suppression": 4.208333492279053, "context_separation": 0.01282113790512085, "slot_residual_alignment": 0.42780792713165283, "inter_domain_margin": 0.0}
+{"step": 24, "dt_s": 5.19560432434082, "total": 45.95124435424805, "recon": 3.58393931388855, "contrast": 23.245323181152344, "holonomy": 85.93484497070312, "write_policy": 0.2037968933582306, "semantic_probe": 0.531635582447052, "dir_diversity": 0.36873859167099, "reranker_ranking": 0.522104799747467, "encoder_throughput": 4.295145034790039, "vocab_anchor": -0.19150906801223755, "semantic_alignment": 9.173014640808105, "tail_semantic_anchor": 10.482585906982422, "functional_suppression": 4.9166669845581055, "context_separation": 0.06715075671672821, "slot_residual_alignment": 0.1920577585697174, "inter_domain_margin": 0.0}
+{"step": 25, "dt_s": 4.476183652877808, "total": 47.03428649902344, "recon": 3.5679497718811035, "contrast": 97.89957427978516, "holonomy": 5.220252513885498, "write_policy": 0.4119507968425751, "semantic_probe": 0.4921112656593323, "dir_diversity": 0.3994268774986267, "reranker_ranking": 0.8052929043769836, "encoder_throughput": 4.058958053588867, "vocab_anchor": -0.18982519209384918, "semantic_alignment": 9.269722938537598, "tail_semantic_anchor": 10.836390495300293, "functional_suppression": 4.395833492279053, "context_separation": 0.18746201694011688, "slot_residual_alignment": 0.4199323356151581, "inter_domain_margin": 0.0}
+{"step": 26, "dt_s": 5.022085905075073, "total": 48.0265998840332, "recon": 4.52186918258667, "contrast": 45.34407424926758, "holonomy": 18.666357040405273, "write_policy": 0.3609965741634369, "semantic_probe": 0.48039162158966064, "dir_diversity": 0.3688211441040039, "reranker_ranking": 0.4735085070133209, "encoder_throughput": 5.07188081741333, "vocab_anchor": -0.19505575299263, "semantic_alignment": 9.197484970092773, "tail_semantic_anchor": 10.74250316619873, "functional_suppression": 4.083333492279053, "context_separation": 0.08956396579742432, "slot_residual_alignment": 0.48361527919769287, "inter_domain_margin": 0.0}
+{"step": 27, "dt_s": 4.827812194824219, "total": 48.925750732421875, "recon": 5.023128032684326, "contrast": 42.546630859375, "holonomy": 9.366353034973145, "write_policy": 0.163956418633461, "semantic_probe": 0.49160826206207275, "dir_diversity": 0.3956567645072937, "reranker_ranking": 0.6263725161552429, "encoder_throughput": 5.442854404449463, "vocab_anchor": -0.196529820561409, "semantic_alignment": 9.183401107788086, "tail_semantic_anchor": 10.768585205078125, "functional_suppression": 4.0416669845581055, "context_separation": 0.0, "slot_residual_alignment": 0.4130026698112488, "inter_domain_margin": 0.0}
+{"step": 28, "dt_s": 5.622410535812378, "total": 45.044532775878906, "recon": 3.7052507400512695, "contrast": 13.477803230285645, "holonomy": 17.66839599609375, "write_policy": 0.15302510559558868, "semantic_probe": 0.5116596817970276, "dir_diversity": 0.36868858337402344, "reranker_ranking": 0.42400050163269043, "encoder_throughput": 4.42167854309082, "vocab_anchor": -0.1889352947473526, "semantic_alignment": 9.070842742919922, "tail_semantic_anchor": 10.483975410461426, "functional_suppression": 4.1041669845581055, "context_separation": 0.0, "slot_residual_alignment": 0.21467086672782898, "inter_domain_margin": 0.0}
+{"step": 29, "dt_s": 4.275408983230591, "total": 45.7886848449707, "recon": 3.5938196182250977, "contrast": 21.105491638183594, "holonomy": 7.596940040588379, "write_policy": 0.3319071829319, "semantic_probe": 0.4785138666629791, "dir_diversity": 0.3922926187515259, "reranker_ranking": 0.4693453311920166, "encoder_throughput": 4.132025241851807, "vocab_anchor": -0.18880659341812134, "semantic_alignment": 9.326589584350586, "tail_semantic_anchor": 10.840926170349121, "functional_suppression": 4.5625, "context_separation": 0.1313747614622116, "slot_residual_alignment": 0.4333094656467438, "inter_domain_margin": 0.0}
+{"step": 30, "dt_s": 5.580240726470947, "total": 47.09113311767578, "recon": 4.427570343017578, "contrast": 20.258773803710938, "holonomy": 23.029035568237305, "write_policy": 0.2914152443408966, "semantic_probe": 0.3134371042251587, "dir_diversity": 0.3683568835258484, "reranker_ranking": 0.345679372549057, "encoder_throughput": 4.948168754577637, "vocab_anchor": -0.1973496526479721, "semantic_alignment": 9.139399528503418, "tail_semantic_anchor": 10.73609447479248, "functional_suppression": 4.3541669845581055, "context_separation": 0.011339257471263409, "slot_residual_alignment": 0.48074454069137573, "inter_domain_margin": 0.0}
+{"step": 31, "dt_s": 4.453314542770386, "total": 48.54909133911133, "recon": 5.015549659729004, "contrast": 11.260205268859863, "holonomy": 8.314573287963867, "write_policy": 0.13746634125709534, "semantic_probe": 0.45352160930633545, "dir_diversity": 0.3858489990234375, "reranker_ranking": 0.3718695342540741, "encoder_throughput": 5.5938591957092285, "vocab_anchor": -0.2000311017036438, "semantic_alignment": 9.25428295135498, "tail_semantic_anchor": 10.764066696166992, "functional_suppression": 3.7708334922790527, "context_separation": 0.0, "slot_residual_alignment": 0.4154483675956726, "inter_domain_margin": 0.0}
+{"step": 32, "dt_s": 5.2248241901397705, "total": 44.73004913330078, "recon": 3.554171085357666, "contrast": 32.83123779296875, "holonomy": 9.613456726074219, "write_policy": 0.10704371333122253, "semantic_probe": 0.4706486463546753, "dir_diversity": 0.3701421916484833, "reranker_ranking": 0.26061925292015076, "encoder_throughput": 4.3157172203063965, "vocab_anchor": -0.195038840174675, "semantic_alignment": 8.999361038208008, "tail_semantic_anchor": 10.47833251953125, "functional_suppression": 3.8958334922790527, "context_separation": 0.0, "slot_residual_alignment": 0.22855165600776672, "inter_domain_margin": 0.0}
+{"step": 33, "dt_s": 3.836758613586426, "total": 46.26542282104492, "recon": 3.570352077484131, "contrast": 37.973487854003906, "holonomy": 4.97968053817749, "write_policy": 0.26292112469673157, "semantic_probe": 0.48352697491645813, "dir_diversity": 0.38878893852233887, "reranker_ranking": 0.2658866345882416, "encoder_throughput": 4.025471210479736, "vocab_anchor": -0.1925235390663147, "semantic_alignment": 9.469202041625977, "tail_semantic_anchor": 10.833590507507324, "functional_suppression": 4.5, "context_separation": 0.07732044160366058, "slot_residual_alignment": 0.43830376863479614, "inter_domain_margin": 0.0}
+{"step": 34, "dt_s": 5.322328090667725, "total": 46.03813552856445, "recon": 4.343929290771484, "contrast": 28.99069595336914, "holonomy": 29.608627319335938, "write_policy": 0.21709129214286804, "semantic_probe": 0.31864285469055176, "dir_diversity": 0.3701157569885254, "reranker_ranking": 0.22028741240501404, "encoder_throughput": 4.845775604248047, "vocab_anchor": -0.20206287503242493, "semantic_alignment": 8.966723442077637, "tail_semantic_anchor": 10.712446212768555, "functional_suppression": 3.2083334922790527, "context_separation": 0.0, "slot_residual_alignment": 0.46940886974334717, "inter_domain_margin": 0.0}
+{"step": 35, "dt_s": 4.7232115268707275, "total": 48.69865798950195, "recon": 5.1011061668396, "contrast": 11.502132415771484, "holonomy": 5.496285915374756, "write_policy": 0.1210976168513298, "semantic_probe": 0.4470455050468445, "dir_diversity": 0.38547179102897644, "reranker_ranking": 0.2506255507469177, "encoder_throughput": 5.536550521850586, "vocab_anchor": -0.20398542284965515, "semantic_alignment": 9.326234817504883, "tail_semantic_anchor": 10.758135795593262, "functional_suppression": 3.7083334922790527, "context_separation": 0.0, "slot_residual_alignment": 0.41755911707878113, "inter_domain_margin": 0.0}
+{"step": 36, "dt_s": 5.080393314361572, "total": 43.38152313232422, "recon": 3.4255290031433105, "contrast": 21.012954711914062, "holonomy": 8.42962646484375, "write_policy": 0.07101736217737198, "semantic_probe": 0.38892924785614014, "dir_diversity": 0.36991700530052185, "reranker_ranking": 0.18239399790763855, "encoder_throughput": 3.9610226154327393, "vocab_anchor": -0.1988062709569931, "semantic_alignment": 8.97142219543457, "tail_semantic_anchor": 10.487560272216797, "functional_suppression": 3.0833334922790527, "context_separation": 0.01059678103774786, "slot_residual_alignment": 0.24507743120193481, "inter_domain_margin": 0.0}
+{"step": 37, "dt_s": 3.795853614807129, "total": 45.26548385620117, "recon": 3.549677848815918, "contrast": 24.701316833496094, "holonomy": 4.05967903137207, "write_policy": 0.20942094922065735, "semantic_probe": 0.4681665599346161, "dir_diversity": 0.39099425077438354, "reranker_ranking": 0.24367572367191315, "encoder_throughput": 3.7425177097320557, "vocab_anchor": -0.19536133110523224, "semantic_alignment": 9.418148040771484, "tail_semantic_anchor": 10.829547882080078, "functional_suppression": 4.270833492279053, "context_separation": 0.0, "slot_residual_alignment": 0.44410985708236694, "inter_domain_margin": 0.0}
+{"step": 38, "dt_s": 5.481587171554565, "total": 45.133155822753906, "recon": 4.1910295486450195, "contrast": 14.886419296264648, "holonomy": 26.912521362304688, "write_policy": 0.15138891339302063, "semantic_probe": 0.2859296202659607, "dir_diversity": 0.36939215660095215, "reranker_ranking": 0.16762736439704895, "encoder_throughput": 4.724213123321533, "vocab_anchor": -0.20386111736297607, "semantic_alignment": 8.932318687438965, "tail_semantic_anchor": 10.691630363464355, "functional_suppression": 2.875, "context_separation": 0.0004431593115441501, "slot_residual_alignment": 0.46025174856185913, "inter_domain_margin": 0.0}
+{"step": 39, "dt_s": 5.142491340637207, "total": 48.39955139160156, "recon": 5.0079874992370605, "contrast": 8.717339515686035, "holonomy": 3.959277629852295, "write_policy": 0.10174553841352463, "semantic_probe": 0.4204414188861847, "dir_diversity": 0.38900646567344666, "reranker_ranking": 0.21488028764724731, "encoder_throughput": 5.627437591552734, "vocab_anchor": -0.20557616651058197, "semantic_alignment": 9.288630485534668, "tail_semantic_anchor": 10.74327278137207, "functional_suppression": 3.3541667461395264, "context_separation": 0.0, "slot_residual_alignment": 0.41380205750465393, "inter_domain_margin": 0.0}
+{"step": 40, "dt_s": 6.476794958114624, "total": 43.30239486694336, "recon": 3.3712613582611084, "contrast": 15.683893203735352, "holonomy": 2.9424960613250732, "write_policy": 0.051018547266721725, "semantic_probe": 0.37669825553894043, "dir_diversity": 0.36885350942611694, "reranker_ranking": 0.13987793028354645, "encoder_throughput": 3.9853086471557617, "vocab_anchor": -0.199788898229599, "semantic_alignment": 8.995321273803711, "tail_semantic_anchor": 10.491599082946777, "functional_suppression": 3.125, "context_separation": 0.0, "slot_residual_alignment": 0.25347888469696045, "inter_domain_margin": 0.0}
+{"step": 41, "dt_s": 4.4560816287994385, "total": 44.96157455444336, "recon": 3.537008285522461, "contrast": 2.032209634780884, "holonomy": 4.170089244842529, "write_policy": 0.17055284976959229, "semantic_probe": 0.45578980445861816, "dir_diversity": 0.39704594016075134, "reranker_ranking": 0.23324726521968842, "encoder_throughput": 3.893531560897827, "vocab_anchor": -0.19700030982494354, "semantic_alignment": 9.401329040527344, "tail_semantic_anchor": 10.819415092468262, "functional_suppression": 4.270833492279053, "context_separation": 0.0, "slot_residual_alignment": 0.4434751868247986, "inter_domain_margin": 0.0}
+{"step": 42, "dt_s": 5.7171525955200195, "total": 45.3223876953125, "recon": 4.156482696533203, "contrast": 18.380443572998047, "holonomy": 10.6222505569458, "write_policy": 0.10920312255620956, "semantic_probe": 0.2629302144050598, "dir_diversity": 0.37034568190574646, "reranker_ranking": 0.1361001878976822, "encoder_throughput": 4.66585111618042, "vocab_anchor": -0.20446549355983734, "semantic_alignment": 8.97308349609375, "tail_semantic_anchor": 10.677995681762695, "functional_suppression": 3.4375, "context_separation": 0.0, "slot_residual_alignment": 0.4525626301765442, "inter_domain_margin": 0.0}
+{"step": 43, "dt_s": 4.291723012924194, "total": 47.18626022338867, "recon": 4.825976371765137, "contrast": 3.1379318237304688, "holonomy": 4.193202018737793, "write_policy": 0.07200492918491364, "semantic_probe": 0.3764450252056122, "dir_diversity": 0.394595205783844, "reranker_ranking": 0.17772898077964783, "encoder_throughput": 5.485467910766602, "vocab_anchor": -0.20565049350261688, "semantic_alignment": 9.105148315429688, "tail_semantic_anchor": 10.724467277526855, "functional_suppression": 3.0416667461395264, "context_separation": 0.0, "slot_residual_alignment": 0.4038097858428955, "inter_domain_margin": 0.0}
+{"step": 44, "dt_s": 5.153038024902344, "total": 43.57353210449219, "recon": 3.3236212730407715, "contrast": 21.3458309173584, "holonomy": 5.2195281982421875, "write_policy": 0.039848849177360535, "semantic_probe": 0.37921154499053955, "dir_diversity": 0.3697623610496521, "reranker_ranking": 0.10290936380624771, "encoder_throughput": 3.8777639865875244, "vocab_anchor": -0.19936813414096832, "semantic_alignment": 9.084465026855469, "tail_semantic_anchor": 10.499517440795898, "functional_suppression": 3.3541667461395264, "context_separation": 0.0, "slot_residual_alignment": 0.2596360146999359, "inter_domain_margin": 0.0}
+{"step": 45, "dt_s": 3.759885787963867, "total": 45.749481201171875, "recon": 3.483689785003662, "contrast": 1.9868213740892315e-08, "holonomy": 3.421891212463379, "write_policy": 0.14848721027374268, "semantic_probe": 0.43499454855918884, "dir_diversity": 0.40093955397605896, "reranker_ranking": 0.16148464381694794, "encoder_throughput": 4.729005336761475, "vocab_anchor": -0.19639548659324646, "semantic_alignment": 9.319930076599121, "tail_semantic_anchor": 10.800520896911621, "functional_suppression": 4.0416669845581055, "context_separation": 0.0, "slot_residual_alignment": 0.44560256600379944, "inter_domain_margin": 0.0}
+{"step": 46, "dt_s": 5.414437294006348, "total": 45.253204345703125, "recon": 4.187786102294922, "contrast": 13.33327579498291, "holonomy": 7.912032604217529, "write_policy": 0.08873845636844635, "semantic_probe": 0.22315838932991028, "dir_diversity": 0.3715795874595642, "reranker_ranking": 0.08523325622081757, "encoder_throughput": 4.8188581466674805, "vocab_anchor": -0.20405331254005432, "semantic_alignment": 8.992080688476562, "tail_semantic_anchor": 10.664222717285156, "functional_suppression": 2.8333334922790527, "context_separation": 0.0, "slot_residual_alignment": 0.44909656047821045, "inter_domain_margin": 0.0}
+{"step": 47, "dt_s": 3.7571990489959717, "total": 47.90068435668945, "recon": 4.686264991760254, "contrast": 5.309545040130615, "holonomy": 2.352567672729492, "write_policy": 0.10094986855983734, "semantic_probe": 0.35874417424201965, "dir_diversity": 0.40132495760917664, "reranker_ranking": 0.12526121735572815, "encoder_throughput": 6.060349464416504, "vocab_anchor": -0.2053200900554657, "semantic_alignment": 9.106246948242188, "tail_semantic_anchor": 10.707404136657715, "functional_suppression": 2.9791667461395264, "context_separation": 0.0, "slot_residual_alignment": 0.39318591356277466, "inter_domain_margin": 0.0}
+{"step": 48, "dt_s": 5.419058322906494, "total": 43.881649017333984, "recon": 3.264848470687866, "contrast": 0.20690467953681946, "holonomy": 2.003607749938965, "write_policy": 0.07058241963386536, "semantic_probe": 0.3492080271244049, "dir_diversity": 0.36977824568748474, "reranker_ranking": 0.06046048551797867, "encoder_throughput": 4.339890480041504, "vocab_anchor": -0.199030339717865, "semantic_alignment": 9.143569946289062, "tail_semantic_anchor": 10.498687744140625, "functional_suppression": 3.2291667461395264, "context_separation": 0.0, "slot_residual_alignment": 0.2629481554031372, "inter_domain_margin": 0.0}
+{"step": 49, "dt_s": 3.4690475463867188, "total": 44.30413818359375, "recon": 3.397336721420288, "contrast": 6.512163162231445, "holonomy": 1.7714495658874512, "write_policy": 0.12031050026416779, "semantic_probe": 0.41017162799835205, "dir_diversity": 0.40328967571258545, "reranker_ranking": 0.08964170515537262, "encoder_throughput": 4.109604358673096, "vocab_anchor": -0.1962694376707077, "semantic_alignment": 9.149703979492188, "tail_semantic_anchor": 10.766862869262695, "functional_suppression": 4.0416669845581055, "context_separation": 0.0, "slot_residual_alignment": 0.4336094558238983, "inter_domain_margin": 0.0}
+{"step": 50, "dt_s": 5.286025762557983, "total": 44.78114700317383, "recon": 4.12325382232666, "contrast": 13.508724212646484, "holonomy": 3.451904296875, "write_policy": 0.06746810674667358, "semantic_probe": 0.24645540118217468, "dir_diversity": 0.3724554777145386, "reranker_ranking": 0.05502992123365402, "encoder_throughput": 4.604001998901367, "vocab_anchor": -0.2035370022058487, "semantic_alignment": 9.010517120361328, "tail_semantic_anchor": 10.656023025512695, "functional_suppression": 2.5416667461395264, "context_separation": 0.0, "slot_residual_alignment": 0.4527361989021301, "inter_domain_margin": 0.0}
+{"step": 51, "dt_s": 3.8469533920288086, "total": 47.2175407409668, "recon": 4.67989444732666, "contrast": 2.183373726438731e-05, "holonomy": 1.4197707176208496, "write_policy": 0.05335784703493118, "semantic_probe": 0.3483617901802063, "dir_diversity": 0.40528520941734314, "reranker_ranking": 0.08100803196430206, "encoder_throughput": 5.622017860412598, "vocab_anchor": -0.20437146723270416, "semantic_alignment": 9.172056198120117, "tail_semantic_anchor": 10.694639205932617, "functional_suppression": 2.7708334922790527, "context_separation": 0.0, "slot_residual_alignment": 0.3842431902885437, "inter_domain_margin": 0.0}
+{"step": 52, "dt_s": 5.426782608032227, "total": 43.436180114746094, "recon": 3.186408519744873, "contrast": 19.09634780883789, "holonomy": 3.013406276702881, "write_policy": 0.038871880620718, "semantic_probe": 0.3342770040035248, "dir_diversity": 0.37065988779067993, "reranker_ranking": 0.03631899133324623, "encoder_throughput": 4.035032272338867, "vocab_anchor": -0.19868868589401245, "semantic_alignment": 9.046126365661621, "tail_semantic_anchor": 10.512541770935059, "functional_suppression": 3.2291667461395264, "context_separation": 0.01714806817471981, "slot_residual_alignment": 0.27584508061408997, "inter_domain_margin": 0.0}
+{"step": 53, "dt_s": 3.7061309814453125, "total": 43.37702941894531, "recon": 3.3934993743896484, "contrast": 0.0, "holonomy": 1.5600996017456055, "write_policy": 0.0768166035413742, "semantic_probe": 0.40102618932724, "dir_diversity": 0.4076686501502991, "reranker_ranking": 0.061287201941013336, "encoder_throughput": 3.636530876159668, "vocab_anchor": -0.19680587947368622, "semantic_alignment": 9.157262802124023, "tail_semantic_anchor": 10.748312950134277, "functional_suppression": 3.8333334922790527, "context_separation": 0.0, "slot_residual_alignment": 0.4286777079105377, "inter_domain_margin": 0.0}
+{"step": 54, "dt_s": 5.387641191482544, "total": 44.92699432373047, "recon": 4.080650329589844, "contrast": 8.399429321289062, "holonomy": 6.808872222900391, "write_policy": 0.07899715006351471, "semantic_probe": 0.21231165528297424, "dir_diversity": 0.3705131411552429, "reranker_ranking": 0.029054680839180946, "encoder_throughput": 4.624510288238525, "vocab_anchor": -0.20403140783309937, "semantic_alignment": 9.071155548095703, "tail_semantic_anchor": 10.657523155212402, "functional_suppression": 2.7291667461395264, "context_separation": 0.0, "slot_residual_alignment": 0.4597969651222229, "inter_domain_margin": 0.0}
+{"step": 55, "dt_s": 3.891601324081421, "total": 46.75312042236328, "recon": 4.699041843414307, "contrast": 0.037908874452114105, "holonomy": 1.4756110906600952, "write_policy": 0.03558492660522461, "semantic_probe": 0.31059569120407104, "dir_diversity": 0.40582379698753357, "reranker_ranking": 0.07101200520992279, "encoder_throughput": 5.445874214172363, "vocab_anchor": -0.20455902814865112, "semantic_alignment": 9.128427505493164, "tail_semantic_anchor": 10.67914867401123, "functional_suppression": 2.6041667461395264, "context_separation": 0.0, "slot_residual_alignment": 0.3806415796279907, "inter_domain_margin": 0.0}
+{"step": 56, "dt_s": 5.298295497894287, "total": 44.5620002746582, "recon": 3.268003463745117, "contrast": 14.91746711730957, "holonomy": 4.609067916870117, "write_policy": 0.02360808476805687, "semantic_probe": 0.33831459283828735, "dir_diversity": 0.37061867117881775, "reranker_ranking": 0.03027866967022419, "encoder_throughput": 4.7991180419921875, "vocab_anchor": -0.19885191321372986, "semantic_alignment": 9.096372604370117, "tail_semantic_anchor": 10.521891593933105, "functional_suppression": 2.7916667461395264, "context_separation": 0.0, "slot_residual_alignment": 0.28579622507095337, "inter_domain_margin": 0.0}
+{"step": 57, "dt_s": 4.3319032192230225, "total": 46.089786529541016, "recon": 3.2148704528808594, "contrast": 7.476414203643799, "holonomy": 1.542240858078003, "write_policy": 0.07449627667665482, "semantic_probe": 0.3836245834827423, "dir_diversity": 0.4112270474433899, "reranker_ranking": 0.047330331057310104, "encoder_throughput": 5.596998691558838, "vocab_anchor": -0.19745582342147827, "semantic_alignment": 9.105244636535645, "tail_semantic_anchor": 10.728957176208496, "functional_suppression": 3.7708334922790527, "context_separation": 0.0, "slot_residual_alignment": 0.4231620132923126, "inter_domain_margin": 0.0}
+{"step": 58, "dt_s": 4.849287509918213, "total": 49.908748626708984, "recon": 4.080421447753906, "contrast": 1.942293405532837, "holonomy": 4.163114547729492, "write_policy": 0.05154755711555481, "semantic_probe": 0.21513792872428894, "dir_diversity": 0.36999958753585815, "reranker_ranking": 0.021042784675955772, "encoder_throughput": 7.956796169281006, "vocab_anchor": -0.2043587863445282, "semantic_alignment": 9.088956832885742, "tail_semantic_anchor": 10.65980339050293, "functional_suppression": 2.9166667461395264, "context_separation": 0.0, "slot_residual_alignment": 0.468086838722229, "inter_domain_margin": 0.0}
+{"step": 59, "dt_s": 4.262746572494507, "total": 49.26776885986328, "recon": 4.715743064880371, "contrast": 0.0, "holonomy": 1.2825682163238525, "write_policy": 0.03918006271123886, "semantic_probe": 0.29025137424468994, "dir_diversity": 0.4023857116699219, "reranker_ranking": 0.04996822401881218, "encoder_throughput": 7.232363700866699, "vocab_anchor": -0.20476281642913818, "semantic_alignment": 9.048741340637207, "tail_semantic_anchor": 10.667806625366211, "functional_suppression": 2.7916667461395264, "context_separation": 0.0, "slot_residual_alignment": 0.38110798597335815, "inter_domain_margin": 0.0}
diff --git a/reports/v346_trained_blackbox/train_stdout.log b/reports/v346_trained_blackbox/train_stdout.log
new file mode 100644
index 0000000..1f22181
--- /dev/null
+++ b/reports/v346_trained_blackbox/train_stdout.log
@@ -0,0 +1,72 @@
+`torch_dtype` is deprecated! Use `dtype` instead!
+Loading weights:   0%|          | 0/338 [00:00<?, ?it/s]Loading weights: 100%|██████████| 338/338 [00:00<00:00, 3759.52it/s]
+  [neighbor cache] vocab_size=151936 > 60000, skip
+[build] device=cuda  params total=1,657,496,024  trainable=113,781,720
+[build] initial memory count = 11
+[probe pre-train] {'tail_head_slot1_abs_mean': 0.0, 'vocab_proj_last_abs_mean': 0.0}
+[train] Trainer built  batch=3  steps=60
+/usr/local/lib/python3.12/dist-packages/torch/autograd/graph.py:869: UserWarning: Attempting to run cuBLAS, but there was no current CUDA context! Attempting to set the primary context... (Triggered internally at /pytorch/aten/src/ATen/cuda/CublasHandlePool.cpp:335.)
+  return Variable._execution_engine.run_backward(  # Calls into the C++ engine to run the backward pass
+step   0  total=481.6660  recon=3.979  sa=9.902  tsa=10.922  va=-0.000  fs=0.000  cs=0.000  dt=19.8s
+step   1  total=119.4697  recon=4.319  sa=9.650  tsa=10.858  va=-0.033  fs=1.604  cs=0.082  dt=13.3s
+step   2  total=63.2969  recon=4.862  sa=9.649  tsa=10.767  va=-0.071  fs=2.639  cs=0.171  dt=15.5s
+step   3  total=65.6129  recon=5.044  sa=9.489  tsa=10.812  va=-0.107  fs=4.250  cs=0.251  dt=9.5s
+step   4  total=60.1234  recon=4.077  sa=9.579  tsa=10.503  va=-0.139  fs=4.958  cs=0.342  dt=6.6s
+step   5  total=52.4816  recon=3.734  sa=9.189  tsa=10.851  va=-0.174  fs=4.333  cs=0.398  dt=6.6s
+step   6  total=54.1920  recon=4.909  sa=9.184  tsa=10.757  va=-0.186  fs=4.604  cs=0.482  dt=6.2s
+step   7  total=56.3720  recon=5.359  sa=9.227  tsa=10.805  va=-0.191  fs=4.625  cs=0.533  dt=5.5s
+step   8  total=51.0531  recon=3.712  sa=9.229  tsa=10.494  va=-0.188  fs=4.625  cs=0.617  dt=4.8s
+step   9  total=94.4659  recon=3.598  sa=9.477  tsa=10.841  va=-0.186  fs=4.688  cs=0.649  dt=4.7s
+step  10  total=61.6950  recon=4.405  sa=9.065  tsa=10.739  va=-0.195  fs=3.458  cs=0.682  dt=4.7s
+step  11  total=52.7172  recon=5.322  sa=9.583  tsa=10.796  va=-0.198  fs=3.292  cs=0.650  dt=4.3s
+step  12  total=45.9884  recon=3.586  sa=9.058  tsa=10.485  va=-0.191  fs=3.875  cs=0.619  dt=4.8s
+step  13  total=52.2593  recon=3.367  sa=9.481  tsa=10.834  va=-0.188  fs=4.250  cs=0.654  dt=4.3s
+step  14  total=49.7553  recon=4.421  sa=9.106  tsa=10.745  va=-0.197  fs=3.667  cs=0.555  dt=5.5s
+step  15  total=52.4259  recon=5.438  sa=9.204  tsa=10.796  va=-0.199  fs=4.979  cs=0.469  dt=5.1s
+step  16  total=50.0380  recon=4.447  sa=9.104  tsa=10.485  va=-0.193  fs=4.417  cs=0.380  dt=5.7s
+step  17  total=48.8605  recon=3.726  sa=9.431  tsa=10.833  va=-0.190  fs=5.125  cs=0.558  dt=5.1s
+step  18  total=48.3267  recon=4.572  sa=9.038  tsa=10.750  va=-0.200  fs=3.979  cs=0.318  dt=5.6s
+step  19  total=50.6655  recon=5.417  sa=9.249  tsa=10.795  va=-0.203  fs=3.938  cs=0.245  dt=4.7s
+step  20  total=47.9978  recon=3.788  sa=9.193  tsa=10.486  va=-0.196  fs=4.604  cs=0.192  dt=5.7s
+step  21  total=49.9174  recon=5.196  sa=9.271  tsa=10.835  va=-0.194  fs=5.458  cs=0.336  dt=4.3s
+step  22  total=50.1498  recon=4.459  sa=9.097  tsa=10.750  va=-0.200  fs=3.729  cs=0.127  dt=5.3s
+step  23  total=48.8436  recon=5.121  sa=9.182  tsa=10.783  va=-0.201  fs=4.208  cs=0.013  dt=4.9s
+step  24  total=45.9512  recon=3.584  sa=9.173  tsa=10.483  va=-0.192  fs=4.917  cs=0.067  dt=5.2s
+step  25  total=47.0343  recon=3.568  sa=9.270  tsa=10.836  va=-0.190  fs=4.396  cs=0.187  dt=4.5s
+step  26  total=48.0266  recon=4.522  sa=9.197  tsa=10.743  va=-0.195  fs=4.083  cs=0.090  dt=5.0s
+step  27  total=48.9258  recon=5.023  sa=9.183  tsa=10.769  va=-0.197  fs=4.042  cs=0.000  dt=4.8s
+step  28  total=45.0445  recon=3.705  sa=9.071  tsa=10.484  va=-0.189  fs=4.104  cs=0.000  dt=5.6s
+step  29  total=45.7887  recon=3.594  sa=9.327  tsa=10.841  va=-0.189  fs=4.562  cs=0.131  dt=4.3s
+step  30  total=47.0911  recon=4.428  sa=9.139  tsa=10.736  va=-0.197  fs=4.354  cs=0.011  dt=5.6s
+step  31  total=48.5491  recon=5.016  sa=9.254  tsa=10.764  va=-0.200  fs=3.771  cs=0.000  dt=4.5s
+step  32  total=44.7300  recon=3.554  sa=8.999  tsa=10.478  va=-0.195  fs=3.896  cs=0.000  dt=5.2s
+step  33  total=46.2654  recon=3.570  sa=9.469  tsa=10.834  va=-0.193  fs=4.500  cs=0.077  dt=3.8s
+step  34  total=46.0381  recon=4.344  sa=8.967  tsa=10.712  va=-0.202  fs=3.208  cs=0.000  dt=5.3s
+step  35  total=48.6987  recon=5.101  sa=9.326  tsa=10.758  va=-0.204  fs=3.708  cs=0.000  dt=4.7s
+step  36  total=43.3815  recon=3.426  sa=8.971  tsa=10.488  va=-0.199  fs=3.083  cs=0.011  dt=5.1s
+step  37  total=45.2655  recon=3.550  sa=9.418  tsa=10.830  va=-0.195  fs=4.271  cs=0.000  dt=3.8s
+step  38  total=45.1332  recon=4.191  sa=8.932  tsa=10.692  va=-0.204  fs=2.875  cs=0.000  dt=5.5s
+step  39  total=48.3996  recon=5.008  sa=9.289  tsa=10.743  va=-0.206  fs=3.354  cs=0.000  dt=5.1s
+step  40  total=43.3024  recon=3.371  sa=8.995  tsa=10.492  va=-0.200  fs=3.125  cs=0.000  dt=6.5s
+step  41  total=44.9616  recon=3.537  sa=9.401  tsa=10.819  va=-0.197  fs=4.271  cs=0.000  dt=4.5s
+step  42  total=45.3224  recon=4.156  sa=8.973  tsa=10.678  va=-0.204  fs=3.438  cs=0.000  dt=5.7s
+step  43  total=47.1863  recon=4.826  sa=9.105  tsa=10.724  va=-0.206  fs=3.042  cs=0.000  dt=4.3s
+step  44  total=43.5735  recon=3.324  sa=9.084  tsa=10.500  va=-0.199  fs=3.354  cs=0.000  dt=5.2s
+step  45  total=45.7495  recon=3.484  sa=9.320  tsa=10.801  va=-0.196  fs=4.042  cs=0.000  dt=3.8s
+step  46  total=45.2532  recon=4.188  sa=8.992  tsa=10.664  va=-0.204  fs=2.833  cs=0.000  dt=5.4s
+step  47  total=47.9007  recon=4.686  sa=9.106  tsa=10.707  va=-0.205  fs=2.979  cs=0.000  dt=3.8s
+step  48  total=43.8816  recon=3.265  sa=9.144  tsa=10.499  va=-0.199  fs=3.229  cs=0.000  dt=5.4s
+step  49  total=44.3041  recon=3.397  sa=9.150  tsa=10.767  va=-0.196  fs=4.042  cs=0.000  dt=3.5s
+step  50  total=44.7811  recon=4.123  sa=9.011  tsa=10.656  va=-0.204  fs=2.542  cs=0.000  dt=5.3s
+step  51  total=47.2175  recon=4.680  sa=9.172  tsa=10.695  va=-0.204  fs=2.771  cs=0.000  dt=3.8s
+step  52  total=43.4362  recon=3.186  sa=9.046  tsa=10.513  va=-0.199  fs=3.229  cs=0.017  dt=5.4s
+step  53  total=43.3770  recon=3.393  sa=9.157  tsa=10.748  va=-0.197  fs=3.833  cs=0.000  dt=3.7s
+step  54  total=44.9270  recon=4.081  sa=9.071  tsa=10.658  va=-0.204  fs=2.729  cs=0.000  dt=5.4s
+step  55  total=46.7531  recon=4.699  sa=9.128  tsa=10.679  va=-0.205  fs=2.604  cs=0.000  dt=3.9s
+step  56  total=44.5620  recon=3.268  sa=9.096  tsa=10.522  va=-0.199  fs=2.792  cs=0.000  dt=5.3s
+step  57  total=46.0898  recon=3.215  sa=9.105  tsa=10.729  va=-0.197  fs=3.771  cs=0.000  dt=4.3s
+step  58  total=49.9087  recon=4.080  sa=9.089  tsa=10.660  va=-0.204  fs=2.917  cs=0.000  dt=4.8s
+step  59  total=49.2678  recon=4.716  sa=9.049  tsa=10.668  va=-0.205  fs=2.792  cs=0.000  dt=4.3s
+[probe post-train] {'tail_head_slot1_abs_mean': 0.0007297309930436313, 'vocab_proj_last_abs_mean': 0.0005491127376444638}
+[train] elapsed 335.1s  avg/step=5.58s
+[save] wrote ckpt/v346_trained.pt  tensors=202