"""Score every legal (inp, out) Block pairing using data-driven activation response.

Attempts
--------
v1 — Mean residual magnitude (SUPERSEDED, see commented block below)
    score = mean_i ||W_out · relu(W_inp · x_i + b_inp) + b_out||_2
    Result: std=0.33, gap-to-2nd=0.02 — the bias term dominates ||R||_2 regardless
    of H, giving poor within-row discrimination (only 6/48 assignments at row min).

v2 — Pearson correlation between mean activation pattern and column attention (CURRENT)
    For a trained (inp, out) pair:
    - inp uses a specific subset of the 96 hidden neurons on real data
      → measured by mean_act[inp][k] = E[relu(W_inp[k,:] · x + b_inp[k])]
    - out has been trained to attend to exactly those neurons
      → measured by col_norm[out][k] = ||W_out[:, k]||_2

    Pearson correlation(mean_act[inp], col_norm[out]) should be strongly positive
    for trained pairs and near-zero for random ones.

    score = 1 - pearson_r (lower = better, consistent with Hungarian minimization)
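
    Illustrative example (hypothetical numbers; 4 neurons instead of 96)::

        a = np.array([0.9, 0.1, 0.8, 0.0])   # mean_act: neurons 0 and 2 fire
        b = np.array([1.1, 0.2, 0.9, 0.1])   # col_norm: out attends to 0 and 2
        # np.corrcoef(a, b)[0, 1] ≈ 0.997 → score = 1 - r ≈ 0.003 (likely pair)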

    Bias terms are irrelevant: mean_act uses only the inp bias inside ReLU (shifts the
    active set, which is part of the signal), and col_norm ignores b_out entirely.
"""
import io
import logging

import numpy as np
import pandas as pd
import torch

from flowthru import step

logger = logging.getLogger(__name__)


@step(
    inputs=["PieceMetadata", "PieceBlob", "BlockCandidate", "MeasurementSchema"],
    outputs=["PairingScore"],
)
def compute_activation_scores(
    piece_metadata: pd.DataFrame,
    pieces: pd.DataFrame,
    legal_pairings: pd.DataFrame,
    historical_data: pd.DataFrame,
) -> pd.DataFrame:
    """Score each legal (inp, out) pairing by activation-pattern / attention alignment.

    Uses Pearson correlation between:
    - mean_act[inp]: which of the 96 hidden neurons inp activates most strongly on data
    - col_norm[out]: which of the 96 hidden neurons out pays most attention to

    A trained pair has high positive correlation; mismatched pairs are near zero.
    score = 1 - pearson_r (lower = better for Hungarian minimization).

    Args:
        piece_metadata: Structural metadata for all pieces (LayerType, dims).
        pieces: Raw byte blobs indexed by PieceIndex.
        legal_pairings: Dimension-valid (InpPieceIndex, OutPieceIndex) candidates.
        historical_data: Sensor measurements used to probe inp activation patterns.

    Returns:
        DataFrame with [InpPieceIndex, OutPieceIndex, CoherenceScore].
        Lower CoherenceScore indicates a more likely trained pair.
    """
    blob_by_index: dict[int, bytes] = {
        int(r["PieceIndex"]): r["Data"] for _, r in pieces.iterrows()
    }

    legal_set: set[tuple[int, int]] = set(
        zip(
            legal_pairings["InpPieceIndex"].astype(int),
            legal_pairings["OutPieceIndex"].astype(int),
        )
    )
    inp_indices = (
        piece_metadata[piece_metadata["LayerType"] == "BlockInp"]["PieceIndex"]
        .astype(int)
        .tolist()
    )
    out_indices = (
        piece_metadata[piece_metadata["LayerType"] == "BlockOut"]["PieceIndex"]
        .astype(int)
        .tolist()
    )

    logger.info(
        f"[compute_activation_scores] {len(inp_indices)} inp × {len(out_indices)} out "
        f"candidates, {len(legal_set)} legal pairs"
    )

    feature_cols = [f"measurement_{i}" for i in range(48)]
    X_t = torch.tensor(
        historical_data[feature_cols].values, dtype=torch.float32
    ).T  # (48, N)

    def load_state(piece_idx: int) -> dict[str, torch.Tensor]:
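        # weights_only=True restricts unpickling to tensors and primitive
        # containers, so a corrupted or untrusted blob cannot run arbitrary
        # code on load (parameter available since torch 1.13).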
        return torch.load(
            io.BytesIO(blob_by_index[piece_idx]),
            weights_only=True,
            map_location=torch.device("cpu"),
        )

    # ------------------------------------------------------------------
    # mean_act[inp]: (96,) — average activation of each hidden neuron over the dataset
    # ------------------------------------------------------------------
    mean_act: dict[int, np.ndarray] = {}
    with torch.no_grad():
        for inp_idx in inp_indices:
            sd = load_state(inp_idx)
            H = torch.relu(sd["weight"] @ X_t + sd["bias"].unsqueeze(1))  # (96, N)
            mean_act[inp_idx] = H.mean(dim=1).numpy()  # (96,)

    # ------------------------------------------------------------------
    # col_norm[out]: (96,) — L2 norm of each column of W_out
    # column k corresponds to how much out "attends to" hidden neuron k
    # ------------------------------------------------------------------
    col_norm: dict[int, np.ndarray] = {}
    for out_idx in out_indices:
        sd = load_state(out_idx)
        col_norm[out_idx] = np.linalg.norm(sd["weight"].numpy(), axis=0)  # (96,)

    # ------------------------------------------------------------------
    # Pearson correlation → score = 1 - r (lower = better)
    # ------------------------------------------------------------------
    def pearson_r(a: np.ndarray, b: np.ndarray) -> float:
        a_c = a - a.mean()
        b_c = b - b.mean()
        denom = np.linalg.norm(a_c) * np.linalg.norm(b_c)
        return float(np.dot(a_c, b_c) / denom) if denom > 1e-8 else 0.0
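
    # Note: pearson_r matches np.corrcoef(a, b)[0, 1] apart from the guard for
    # near-constant vectors. A vectorized alternative (sketch): z-score mean_act
    # and col_norm row-wise into A (n_inp, 96) and B (n_out, 96); A @ B.T / 96
    # then yields all pairwise correlations in one matmul. Kept per-pair for clarity.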

    rows = []
    for inp_idx in inp_indices:
        for out_idx in out_indices:
            if (inp_idx, out_idx) not in legal_set:
                continue
            r = pearson_r(mean_act[inp_idx], col_norm[out_idx])
            rows.append({
                "InpPieceIndex": inp_idx,
                "OutPieceIndex": out_idx,
                "CoherenceScore": 1.0 - r,  # lower = better alignment
            })

    logger.info(f"[compute_activation_scores] Computed {len(rows)} scores")
    return pd.DataFrame(rows, columns=["InpPieceIndex", "OutPieceIndex", "CoherenceScore"])

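
# ---------------------------------------------------------------------------
# Downstream usage sketch (illustrative only): the scores feed a Hungarian
# assignment, as the docstring notes. `scores` stands for this step's output;
# padding illegal pairs with a large cost is an assumption, not pipeline code.
# ---------------------------------------------------------------------------
# from scipy.optimize import linear_sum_assignment
# cost = scores.pivot(index="InpPieceIndex", columns="OutPieceIndex",
#                     values="CoherenceScore").fillna(1e6).to_numpy()
# inp_rows, out_cols = linear_sum_assignment(cost)  # minimizes total score
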

# =============================================================================
# v1 — SUPERSEDED: mean residual magnitude
# Bias dominates ||W_out @ H + b_out||_2 regardless of H; poor within-row gaps.
# =============================================================================
# def compute_activation_scores_v1(...):
#     ...
#     for inp_idx in inp_indices:
#         H = inp_activations[inp_idx]
#         for out_idx in out_indices:
#             W_out, b_out = out_params[out_idx]
#             R = W_out @ H + b_out.unsqueeze(1)
#             score = float(torch.norm(R, dim=0).mean())
#             rows.append({"InpPieceIndex": inp_idx, "OutPieceIndex": out_idx,
#                          "CoherenceScore": score})