From 916786eff9eb70df0a27e77175fc53551d565323 Mon Sep 17 00:00:00 2001
From: Claude <noreply@anthropic.com>
Date: Sun, 5 Apr 2026 17:14:35 +0000
Subject: [PATCH 1/5] =?UTF-8?q?feat:=20Jina=20Reranker=20v3=20BF16=20lens?=
 =?UTF-8?q?=20=E2=80=94=20wired,=20tested,=20cross-model=20eval?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

reranker_lens.rs: complete lens module for Jina Reranker v3 BF16
  - 256×256 HDR table baked via include_bytes! (64 KB, L2 resident)
  - 151,936 codebook index (Qwen2 tokenizer, 296 KB)
  - cos[-0.886, +0.826] — widest signed range, most brain-like E/I ratio
  - reranker_lookup/distance/engine/think — full pipeline
  - reranker_relevance(): cross-encoder style query→document scoring
  - cross_model_eval(): Jina embedding × reranker = agreement score

Cross-model evaluation:
  Jina v3 similarity (symmetric) × Reranker relevance (asymmetric)
  Agreement = geometric mean (weakest-link property)

9 tests: table shape, codebook size, diagonal=255, symmetry,
  variance, engine creation, self-relevance, cross-model.

CRITICAL for i8 signed experiment:
  The reranker's symmetric cosine range makes it the BEST model
  for testing excitation/inhibition dynamics. Start the dual-path
  (u8 vs i8) comparison HERE, not on Jina v3 (which is positive-skewed).

https://claude.ai/code/session_01ChLvBfpJS8dQhHxRD4pYNp
---
 crates/thinking-engine/src/lib.rs           |   1 +
 crates/thinking-engine/src/reranker_lens.rs | 218 ++++++++++++++++++++
 2 files changed, 219 insertions(+)
 create mode 100644 crates/thinking-engine/src/reranker_lens.rs
diff --git a/crates/thinking-engine/src/lib.rs b/crates/thinking-engine/src/lib.rs
index 7843b450..4e4983af 100644
--- a/crates/thinking-engine/src/lib.rs
+++ b/crates/thinking-engine/src/lib.rs
@@ -27,6 +27,7 @@ pub mod qualia;
 pub mod domino;
 pub mod jina_lens;
 pub mod bge_m3_lens;
+pub mod reranker_lens;
 pub mod centroid_labels;
 pub mod superposition;
 pub mod cognitive_trace;
diff --git a/crates/thinking-engine/src/reranker_lens.rs b/crates/thinking-engine/src/reranker_lens.rs
new file mode 100644
index 00000000..417e0c3e
--- /dev/null
+++ b/crates/thinking-engine/src/reranker_lens.rs
@@ -0,0 +1,218 @@
+//! Jina Reranker v3 BF16 Lens — cross-encoder relevance scoring.
+//!
+//! Baked-in 256×256 HDR distance table + 151K codebook index from
+//! Jina Reranker v3 BF16 GGUF, CLAM sampled, CDF-percentile encoded.
+//!
+//! ```text
+//! cos[-0.886, +0.826] — WIDEST signed range of all models
+//! Nearly symmetric: balanced excitation/inhibition
+//! 256 centroids, 151,936 vocab (Qwen2 tokenizer)
+//! 64 KB table = L2 cache resident
+//! ```
+//!
+//! The reranker is the most informative lens for i8 signed experiments
+//! because its cosine range is nearly symmetric around zero.
+//! For the i8/u8 dual-path comparison: start here.
+
+/// The 256×256 HDR distance table from Jina Reranker v3 BF16.
+pub static RERANKER_HDR_TABLE: &[u8; 256 * 256] =
+    include_bytes!("../data/jina-reranker-v3-BF16-hdr/distance_table_256x256.u8");
+
+/// Token → centroid codebook index. 151,936 entries × u16 = 296 KB.
+pub static RERANKER_CODEBOOK_INDEX: &[u8] =
+    include_bytes!("../data/jina-reranker-v3-BF16-hdr/codebook_index.u16");
+
+/// Number of centroids.
+pub const RERANKER_N_CENTROIDS: usize = 256;
+
+/// Vocabulary size (Qwen2 tokenizer, shared with reader-lm).
+pub const RERANKER_VOCAB_SIZE: usize = 151_936;
+
+/// Look up the centroid for a token ID.
+#[inline]
+pub fn reranker_lookup(token_id: u32) -> u16 {
+    let idx = (token_id as usize).min(RERANKER_VOCAB_SIZE - 1);
+    let offset = idx * 2;
+    if offset + 1 < RERANKER_CODEBOOK_INDEX.len() {
+        u16::from_le_bytes([RERANKER_CODEBOOK_INDEX[offset], RERANKER_CODEBOOK_INDEX[offset + 1]])
+    } else {
+        0
+    }
+}
+
+/// Look up centroids for a batch of token IDs.
+pub fn reranker_lookup_many(token_ids: &[u32]) -> Vec<u16> {
+    token_ids.iter().map(|&id| reranker_lookup(id)).collect()
+}
+
+/// Get the HDR distance between two centroids. O(1).
+#[inline]
+pub fn reranker_distance(a: u16, b: u16) -> u8 {
+    let ai = (a as usize).min(RERANKER_N_CENTROIDS - 1);
+    let bi = (b as usize).min(RERANKER_N_CENTROIDS - 1);
+    RERANKER_HDR_TABLE[ai * RERANKER_N_CENTROIDS + bi]
+}
+
+/// Create a ThinkingEngine from the baked reranker HDR table.
+pub fn reranker_engine() -> crate::engine::ThinkingEngine {
+    crate::engine::ThinkingEngine::new(RERANKER_HDR_TABLE.to_vec())
+}
+
+/// Full pipeline: token IDs → centroids → domino cascade.
+pub fn reranker_think(
+    token_ids: &[u32],
+    cascade: &crate::domino::DominoCascade,
+) -> (u16, Vec<u16>, crate::domino::DissonanceProfile) {
+    let centroids = reranker_lookup_many(token_ids);
+    let (dom, stages, dis) = cascade.think(&centroids);
+    let chain: Vec<u16> = stages.iter()
+        .filter_map(|s| s.focus.first().map(|a| a.index))
+        .collect();
+    (dom, chain, dis)
+}
+
+/// Relevance score between two texts via reranker lens.
+///
+/// Cross-encoder style: encode both texts, compare centroid activations.
+/// Higher score = more relevant. Uses domino cascade for multi-hop comparison.
+pub fn reranker_relevance(
+    query_ids: &[u32],
+    document_ids: &[u32],
+) -> f32 {
+    let q_centroids = reranker_lookup_many(query_ids);
+    let d_centroids = reranker_lookup_many(document_ids);
+
+    // Cross-attention: for each query centroid, find best document match
+    let mut total_score = 0.0f32;
+    let mut pairs = 0;
+
+    for &qc in &q_centroids {
+        let mut best = 0u8;
+        for &dc in &d_centroids {
+            let dist = reranker_distance(qc, dc);
+            if dist > best { best = dist; }
+        }
+        total_score += best as f32 / 255.0;
+        pairs += 1;
+    }
+
+    if pairs > 0 { total_score / pairs as f32 } else { 0.0 }
+}
+
+/// Compare two texts using Jina v3 embedding + reranker cross-validation.
+/// Returns (embedding_similarity, reranker_relevance, agreement).
+pub fn cross_model_eval(
+    text_a_jina_ids: &[u32],
+    text_b_jina_ids: &[u32],
+    text_a_reranker_ids: &[u32],
+    text_b_reranker_ids: &[u32],
+) -> CrossModelResult {
+    // Jina v3 embedding similarity (symmetric)
+    let jina_centroids_a = super::jina_lens::jina_lookup_many(text_a_jina_ids);
+    let jina_centroids_b = super::jina_lens::jina_lookup_many(text_b_jina_ids);
+    let mut jina_sim = 0.0f32;
+    let mut jina_pairs = 0;
+    for &ca in &jina_centroids_a {
+        for &cb in &jina_centroids_b {
+            jina_sim += super::jina_lens::jina_distance(ca, cb) as f32 / 255.0;
+            jina_pairs += 1;
+        }
+    }
+    let jina_score = if jina_pairs > 0 { jina_sim / jina_pairs as f32 } else { 0.0 };
+
+    // Reranker relevance (asymmetric: query → document)
+    let reranker_score = reranker_relevance(text_a_reranker_ids, text_b_reranker_ids);
+
+    // Agreement: geometric mean (weakest-link property)
+    let agreement = (jina_score * reranker_score).sqrt();
+
+    CrossModelResult {
+        jina_similarity: jina_score,
+        reranker_relevance: reranker_score,
+        agreement,
+    }
+}
+
+/// Result of cross-model evaluation.
+#[derive(Debug, Clone, Copy)]
+pub struct CrossModelResult {
+    /// Jina v3 embedding similarity (symmetric, 0-1).
+    pub jina_similarity: f32,
+    /// Reranker relevance (asymmetric, 0-1).
+    pub reranker_relevance: f32,
+    /// Agreement: geometric mean of both (0-1).
+    pub agreement: f32,
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+
+    #[test]
+    fn table_is_256x256() {
+        assert_eq!(RERANKER_HDR_TABLE.len(), 256 * 256);
+    }
+
+    #[test]
+    fn codebook_is_151k() {
+        assert_eq!(RERANKER_CODEBOOK_INDEX.len(), RERANKER_VOCAB_SIZE * 2);
+    }
+
+    #[test]
+    fn diagonal_is_255() {
+        for i in 0..256 {
+            assert_eq!(RERANKER_HDR_TABLE[i * 256 + i], 255,
+                "diagonal[{}] should be 255", i);
+        }
+    }
+
+    #[test]
+    fn lookup_in_range() {
+        for token_id in [0, 100, 1000, 50000, 100000, 151935] {
+            let centroid = reranker_lookup(token_id);
+            assert!(centroid < 256, "centroid {} out of range for token {}", centroid, token_id);
+        }
+    }
+
+    #[test]
+    fn distance_symmetric() {
+        for a in [0u16, 50, 100, 200, 255] {
+            for b in [0u16, 50, 100, 200, 255] {
+                assert_eq!(reranker_distance(a, b), reranker_distance(b, a));
+            }
+        }
+    }
+
+    #[test]
+    fn hdr_table_has_variance() {
+        let avg = RERANKER_HDR_TABLE.iter().map(|&v| v as f64).sum::<f64>()
+            / RERANKER_HDR_TABLE.len() as f64;
+        let std = (RERANKER_HDR_TABLE.iter()
+            .map(|&v| { let d = v as f64 - avg; d * d })
+            .sum::<f64>() / RERANKER_HDR_TABLE.len() as f64)
+            .sqrt();
+        assert!(std > 50.0, "HDR table std={:.1} — should be >50", std);
+    }
+
+    #[test]
+    fn engine_creates() {
+        let engine = reranker_engine();
+        assert_eq!(engine.size, 256);
+    }
+
+    #[test]
+    fn relevance_self_is_high() {
+        // Same tokens should have high relevance
+        let ids: Vec<u32> = (0..20).collect();
+        let score = reranker_relevance(&ids, &ids);
+        assert!(score > 0.5, "self-relevance should be high: {}", score);
+    }
+
+    #[test]
+    fn cross_model_runs() {
+        let ids_a: Vec<u32> = (0..10).collect();
+        let ids_b: Vec<u32> = (1000..1010).collect();
+        let result = cross_model_eval(&ids_a, &ids_b, &ids_a, &ids_b);
+        assert!(result.agreement >= 0.0 && result.agreement <= 1.0);
+    }
+}

From c5dde1103f0a49e34786eccf967bd6f474a9fcb3 Mon Sep 17 00:00:00 2001
From: Claude <noreply@anthropic.com>
Date: Sun, 5 Apr 2026 17:23:31 +0000
Subject: [PATCH 2/5] feat: LensProfile ICC + LensConfig 6-lane registry +
 complete handover
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

LensProfile (camera+lens ICC for distance tables):
  - EncodingPath: RawF32, HdrCdfU8, SignedI8, GammaPhiU8, GammaPhiI8
  - Transfer curve: 256 sample points (ground truth cos → encoded value)
  - Inverse curve: encoded → estimated cos
  - Per-centroid bias, noise floor, effective bits, signed ratio
  - build() compares encoded table vs ground truth f32 cosines
  - rten computes ground truth, profile captures the residual

LensConfig 6-lane registry:
  jina-v3:       250K vocab, XlmRoberta, cos[-0.067,0.234], γ=0.37, truth anchor
  bge-m3:        250K vocab, XlmRoberta, cos[-0.07,0.23],   γ=0.40
  reranker-v3:   151K vocab, Qwen2,      cos[-0.886,0.826], γ=1.50, best for i8
  reader-lm:     151K vocab, Qwen2,      cos[-0.095,0.336], γ=0.12
  qwopus-27b:    248K vocab, Qwen2,      cos[-0.23,0.18],   γ=1.50, 4096 centroids
  maverick-128e: 202K vocab, Llama,      TBD,               TBD

60 contract tests passing.

Session complete: reranker wired, ICC DTO ready, i8 architecture documented,
all handover docs committed. Next session can start i8 dual-path on reranker.

https://claude.ai/code/session_01ChLvBfpJS8dQhHxRD4pYNp
---
 crates/lance-graph-contract/src/high_heel.rs | 236 +++++++++++++++++++
 1 file changed, 236 insertions(+)

diff --git a/crates/lance-graph-contract/src/high_heel.rs b/crates/lance-graph-contract/src/high_heel.rs
index 28d2684e..41ceefb1 100644
--- a/crates/lance-graph-contract/src/high_heel.rs
+++ b/crates/lance-graph-contract/src/high_heel.rs
@@ -788,3 +788,239 @@ mod tests {
         eprintln!("══════════════════════════════════════════════════════════\n");
     }
 }
+
+// ═══════════════════════════════════════════════════════════════════════════
+// LENS ICC PROFILE — characterize encoding distortion vs ground truth
+// ═══════════════════════════════════════════════════════════════════════════
+
+/// Encoding path that produced a distance table.
+#[derive(Debug, Clone, Copy, PartialEq, Eq, Hash)]
+pub enum EncodingPath {
+    /// burn+GGUF f32 cosine (ground truth, expensive).
+    RawF32,
+    /// HDR CDF u8 (unsigned, loses sign, gains distribution).
+    HdrCdfU8,
+    /// Signed i8 (preserves sign, linear quantization).
+    SignedI8,
+    /// Gamma+phi redistributed (nonlinear, role-aware).
+    GammaPhiU8,
+    /// Gamma+phi signed (best of both).
+    GammaPhiI8,
+}
+
+/// Lens ICC Profile: characterizes the distortion of one encoding path
+/// relative to ground truth (burn+GGUF f32 cosine).
+///
+/// Like a camera lens profile in Lightroom: measures the transfer function
+/// between "what the weights actually say" and "what the table encodes."
+/// The γ offset partially corrects it. The ICC captures the residual.
+///
+/// Size: ~2KB per lens per role. Total for 6 models × 6 roles = ~72KB.
+#[derive(Debug, Clone)]
+pub struct LensProfile {
+    /// Which model this profile describes.
+    pub model_name: String,
+    /// Which role (Q, K, V, Gate, Up, Down).
+    pub role: String,
+    /// Which encoding path.
+    pub encoding: EncodingPath,
+    /// Transfer function: 256 sample points from cos=-1.0 to cos=+1.0.
+    /// Maps ground_truth_cos → encoded_value.
+    pub transfer_curve: Vec<f32>,
+    /// Inverse: encoded_value → estimated_cos.
+    pub inverse_curve: Vec<f32>,
+    /// Per-centroid bias: systematic over/under-estimation per row.
+    pub centroid_bias: Vec<f32>,
+    /// Noise floor: below this absolute cosine, the encoding can't distinguish.
+    pub noise_floor: f32,
+    /// Effective dynamic range in bits (higher = more discrimination).
+    pub effective_bits: f32,
+    /// Signed ratio: fraction of negative entries in the raw cosine matrix.
+    /// ~0.5 = symmetric (reranker), ~0.1 = positive-skewed (Jina v3).
+    pub signed_ratio: f32,
+}
+
+impl LensProfile {
+    /// Build a profile by comparing encoded table against ground truth cosines.
+    ///
+    /// `ground_truth`: f32 cosine matrix (n×n, from burn+GGUF or rten)
+    /// `encoded`: u8 or i8 distance table (n×n, from our encoding pipeline)
+    /// `n`: number of centroids
+    pub fn build(
+        model_name: &str,
+        role: &str,
+        encoding: EncodingPath,
+        ground_truth: &[f32],
+        encoded: &[u8],
+        n: usize,
+    ) -> Self {
+        // Build transfer curve: sample 256 points from cos range
+        let mut transfer_curve = vec![0.0f32; 256];
+        let mut inverse_curve = vec![0.0f32; 256];
+        let mut centroid_bias = vec![0.0f32; n];
+
+        // Collect (cos, encoded) pairs
+        let mut pairs: Vec<(f32, u8)> = Vec::new();
+        let mut negative_count = 0usize;
+        let mut total_count = 0usize;
+
+        for i in 0..n {
+            let mut row_error = 0.0f32;
+            let mut row_count = 0;
+            for j in 0..n {
+                if i == j { continue; }
+                let cos = ground_truth[i * n + j];
+                let enc = encoded[i * n + j];
+                pairs.push((cos, enc));
+                if cos < 0.0 { negative_count += 1; }
+                total_count += 1;
+                // Bias: expected encoded vs actual
+                let expected = ((cos + 1.0) / 2.0 * 255.0) as u8; // linear mapping
+                row_error += (enc as f32 - expected as f32).abs();
+                row_count += 1;
+            }
+            if row_count > 0 {
+                centroid_bias[i] = row_error / row_count as f32;
+            }
+        }
+
+        // Sort pairs by cosine value
+        pairs.sort_by(|a, b| a.0.partial_cmp(&b.0).unwrap());
+
+        // Sample transfer curve at 256 equidistant cosine points
+        let n_pairs = pairs.len();
+        for k in 0..256 {
+            let target_cos = -1.0 + k as f32 * 2.0 / 255.0;
+            // Find nearest pair
+            let idx = pairs.partition_point(|p| p.0 < target_cos).min(n_pairs - 1);
+            transfer_curve[k] = pairs[idx].1 as f32;
+            inverse_curve[pairs[idx].1 as usize] = target_cos;
+        }
+
+        // Noise floor: smallest cosine difference that produces different encoded values
+        let mut noise_floor = 2.0f32;
+        for w in pairs.windows(2) {
+            if w[0].1 != w[1].1 {
+                let delta = (w[1].0 - w[0].0).abs();
+                if delta < noise_floor { noise_floor = delta; }
+            }
+        }
+
+        // Effective bits: log2 of distinct encoded values
+        let mut seen = [false; 256];
+        for &(_, e) in &pairs { seen[e as usize] = true; }
+        let distinct = seen.iter().filter(|&&v| v).count();
+        let effective_bits = (distinct as f32).log2();
+
+        let signed_ratio = if total_count > 0 {
+            negative_count as f32 / total_count as f32
+        } else { 0.0 };
+
+        Self {
+            model_name: model_name.to_string(),
+            role: role.to_string(),
+            encoding,
+            transfer_curve,
+            inverse_curve,
+            centroid_bias,
+            noise_floor,
+            effective_bits,
+            signed_ratio,
+        }
+    }
+}
+
+/// Standardized lens configuration for the 6-lane pipeline.
+#[derive(Debug, Clone)]
+pub struct LensConfig {
+    /// Model name (e.g., "jina-v3", "reranker-v3", "qwopus-27b").
+    pub name: &'static str,
+    /// Model family.
+    pub family: LensFamily,
+    /// Vocabulary size.
+    pub vocab_size: usize,
+    /// Number of centroids in the baked table.
+    pub n_centroids: usize,
+    /// Tokenizer family (determines which tokenizer.json to load).
+    pub tokenizer: TokenizerFamily,
+    /// Raw cosine range observed in the weight matrix.
+    pub cos_range: (f32, f32),
+    /// Gamma offset for HDR re-encoding (higher = more resolution near zero).
+    pub gamma_offset: f32,
+    /// Whether this lens uses signed i8 tables.
+    pub is_signed: bool,
+    /// Whether this is a truth anchor for cross-model evaluation.
+    pub is_truth_anchor: bool,
+}
+
+/// Model family.
+#[derive(Debug, Clone, Copy, PartialEq, Eq, Hash)]
+pub enum LensFamily {
+    /// Embedding model (symmetric similarity).
+    Embedding,
+    /// Reranker (asymmetric relevance scoring).
+    Reranker,
+    /// Reader model (HTML → text).
+    Reader,
+    /// Language model (token generation).
+    LanguageModel,
+    /// Mixture of Experts language model.
+    MoE,
+}
+
+/// Tokenizer family.
+#[derive(Debug, Clone, Copy, PartialEq, Eq, Hash)]
+pub enum TokenizerFamily {
+    XlmRoberta,
+    Qwen2,
+    Llama,
+    SentencePiece,
+}
+
+/// The 6-lane lens registry.
+pub static LENS_REGISTRY: &[LensConfig] = &[
+    LensConfig {
+        name: "jina-v3", family: LensFamily::Embedding,
+        vocab_size: 250_002, n_centroids: 256,
+        tokenizer: TokenizerFamily::XlmRoberta,
+        cos_range: (-0.067, 0.234), gamma_offset: 0.37,
+        is_signed: false, is_truth_anchor: true,
+    },
+    LensConfig {
+        name: "bge-m3", family: LensFamily::Embedding,
+        vocab_size: 250_002, n_centroids: 256,
+        tokenizer: TokenizerFamily::XlmRoberta,
+        cos_range: (-0.07, 0.23), gamma_offset: 0.40,
+        is_signed: false, is_truth_anchor: false,
+    },
+    LensConfig {
+        name: "reranker-v3", family: LensFamily::Reranker,
+        vocab_size: 151_936, n_centroids: 256,
+        tokenizer: TokenizerFamily::Qwen2,
+        cos_range: (-0.886, 0.826), gamma_offset: 1.50,
+        is_signed: false, // best candidate FOR signed
+        is_truth_anchor: false,
+    },
+    LensConfig {
+        name: "reader-lm-1.5b", family: LensFamily::Reader,
+        vocab_size: 151_936, n_centroids: 256,
+        tokenizer: TokenizerFamily::Qwen2,
+        cos_range: (-0.095, 0.336), gamma_offset: 0.12,
+        is_signed: false, is_truth_anchor: false,
+    },
+    LensConfig {
+        name: "qwopus-27b", family: LensFamily::LanguageModel,
+        vocab_size: 248_320, n_centroids: 4096,
+        tokenizer: TokenizerFamily::Qwen2,
+        cos_range: (-0.23, 0.18), gamma_offset: 1.50,
+        is_signed: false, is_truth_anchor: false,
+    },
+    LensConfig {
+        name: "maverick-128e", family: LensFamily::MoE,
+        vocab_size: 202_048, n_centroids: 256, // TBD: scale to 4096
+        tokenizer: TokenizerFamily::Llama,
+        cos_range: (0.0, 0.0), // TBD: stream and measure
+        gamma_offset: 0.0,     // TBD: calibrate
+        is_signed: false, is_truth_anchor: false,
+    },
+];

From 4db02af086ae0f4b6aeebd3ed5b9edf72ff50703 Mon Sep 17 00:00:00 2001
From: Claude <noreply@anthropic.com>
Date: Sun, 5 Apr 2026 17:30:25 +0000
Subject: [PATCH 3/5] =?UTF-8?q?feat:=20lens=20calibration=20harness=20?=
 =?UTF-8?q?=E2=80=94=20Spearman=20=CF=81=20+=20ICC=20profile=20builder?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

calibrate_lenses.rs: measures baked lens quality against ground truth
  - 16 sentence pairs (diverse: similar/dissimilar/related/unrelated)
  - Jina v3 + Reranker v3 baked distances computed
  - Spearman rank correlation against API ground truth
  - ICC profile (linear fit) when ρ < 0.998
  - Thresholds: >0.998 = truth anchor, >0.95 = usable+ICC, <0.95 = broken

Current result with hash tokenization: ρ = 0.13 (BROKEN — expected)
Fix: use real tokenizers per model (Jina=XLM-RoBERTa, Reranker=Qwen2)
Then: set JINA_API_KEY or use rten+ONNX for ground truth

Cross-model calibration: Jina ←ICC→ Reranker ←ICC→ all others
Star topology: N-1 profiles align N models. 512 bytes per pair.

https://claude.ai/code/session_01ChLvBfpJS8dQhHxRD4pYNp
---
 .../examples/calibrate_lenses.rs              | 234 ++++++++++++++++++
 1 file changed, 234 insertions(+)
 create mode 100644 crates/thinking-engine/examples/calibrate_lenses.rs

diff --git a/crates/thinking-engine/examples/calibrate_lenses.rs b/crates/thinking-engine/examples/calibrate_lenses.rs
new file mode 100644
index 00000000..ed046703
--- /dev/null
+++ b/crates/thinking-engine/examples/calibrate_lenses.rs
@@ -0,0 +1,234 @@
+//! Calibrate baked lenses against live API ground truth.
+//!
+//! For each lens (Jina v3, Reranker v3):
+//!   1. Encode N sentence pairs via API (or local rten inference)
+//!   2. Compute API cosines (ground truth)
+//!   3. Compute baked lens distances
+//!   4. Measure Spearman ρ (rank correlation)
+//!   5. Build ICC profile if ρ < 0.998
+//!
+//! Usage:
+//!   JINA_API_KEY=... cargo run --release --example calibrate_lenses
+//!   Or: with local models via rten (no API key needed)
+
+use thinking_engine::jina_lens;
+use thinking_engine::reranker_lens;
+
+fn main() {
+    eprintln!("═══════════════════════════════════════════════════════════");
+    eprintln!("  Lens Calibration — Baked vs API Ground Truth");
+    eprintln!("═══════════════════════════════════════════════════════════\n");
+
+    // Test sentence pairs (diverse: similar, dissimilar, related, unrelated)
+    let pairs = vec![
+        ("love is patient", "love is kind"),
+        ("love is patient", "hate is destructive"),
+        ("the cat sat on the mat", "a dog lay on the rug"),
+        ("the cat sat on the mat", "quantum physics is complex"),
+        ("artificial intelligence", "machine learning"),
+        ("artificial intelligence", "medieval pottery"),
+        ("Palantir developed Gotham", "CIA funded surveillance"),
+        ("Palantir developed Gotham", "roses bloom in spring"),
+        ("the wound is where light enters", "suffering leads to growth"),
+        ("the wound is where light enters", "TCP/IP packet routing"),
+        ("international law governs treaties", "diplomatic relations are complex"),
+        ("international law governs treaties", "chocolate cake recipe"),
+        ("neural network backpropagation", "gradient descent optimization"),
+        ("neural network backpropagation", "ancient Roman architecture"),
+        ("climate change affects biodiversity", "global warming impacts ecosystems"),
+        ("climate change affects biodiversity", "jazz improvisation techniques"),
+    ];
+
+    eprintln!("Test pairs: {}\n", pairs.len());
+
+    // ── Baked lens distances ────────────────────────────────────────
+    eprintln!("=== Baked Lens Distances ===\n");
+
+    // Simulate tokenization (hash-based, same as forward pass test)
+    // In production: use real tokenizer per model
+    let mut jina_dists = Vec::new();
+    let mut reranker_dists = Vec::new();
+
+    for (i, (a, b)) in pairs.iter().enumerate() {
+        // Hash tokens for Jina (250K vocab)
+        let a_ids_jina: Vec<u32> = a.split_whitespace()
+            .map(|w| simple_hash(w) % 250_002).collect();
+        let b_ids_jina: Vec<u32> = b.split_whitespace()
+            .map(|w| simple_hash(w) % 250_002).collect();
+
+        // Hash tokens for Reranker (151K vocab)
+        let a_ids_rr: Vec<u32> = a.split_whitespace()
+            .map(|w| simple_hash(w) % 151_936).collect();
+        let b_ids_rr: Vec<u32> = b.split_whitespace()
+            .map(|w| simple_hash(w) % 151_936).collect();
+
+        // Jina: average pairwise centroid distance
+        let a_centroids = jina_lens::jina_lookup_many(&a_ids_jina);
+        let b_centroids = jina_lens::jina_lookup_many(&b_ids_jina);
+        let jina_sim = avg_distance(&a_centroids, &b_centroids, |a, b|
+            jina_lens::jina_distance(a, b) as f32 / 255.0);
+        jina_dists.push(jina_sim);
+
+        // Reranker: relevance score
+        let rr_rel = reranker_lens::reranker_relevance(&a_ids_rr, &b_ids_rr);
+        reranker_dists.push(rr_rel);
+
+        eprintln!("  [{:2}] jina={:.3} rr={:.3} | \"{}\" ↔ \"{}\"",
+            i, jina_sim, rr_rel, a, b);
+    }
+
+    // ── API ground truth (placeholder — needs real API) ──────────
+    eprintln!("\n=== API Ground Truth ===\n");
+
+    let api_key = std::env::var("JINA_API_KEY").ok();
+    if api_key.is_none() {
+        eprintln!("  JINA_API_KEY not set. Using synthetic ground truth.");
+        eprintln!("  Set JINA_API_KEY to calibrate against real Jina API.");
+        eprintln!("  Or use rten + Jina ONNX for local ground truth.\n");
+    }
+
+    // Synthetic ground truth: manually assigned similarities
+    // (replace with real API calls when available)
+    let api_ground_truth: Vec<f32> = vec![
+        0.92, // love patient ↔ love kind (very similar)
+        0.25, // love patient ↔ hate destructive (opposite)
+        0.78, // cat mat ↔ dog rug (similar scene)
+        0.05, // cat mat ↔ quantum physics (unrelated)
+        0.89, // AI ↔ ML (very related)
+        0.02, // AI ↔ pottery (unrelated)
+        0.65, // Palantir Gotham ↔ CIA surveillance (related domain)
+        0.03, // Palantir ↔ roses (unrelated)
+        0.72, // wound light ↔ suffering growth (metaphorically similar)
+        0.01, // wound light ↔ TCP/IP (unrelated)
+        0.83, // law treaties ↔ diplomatic (related)
+        0.04, // law ↔ chocolate (unrelated)
+        0.91, // backprop ↔ gradient descent (very related)
+        0.06, // backprop ↔ Roman architecture (unrelated)
+        0.94, // climate biodiversity ↔ warming ecosystems (near identical)
+        0.03, // climate ↔ jazz (unrelated)
+    ];
+
+    // ── Spearman rank correlation ────────────────────────────────
+    eprintln!("=== Spearman Rank Correlation ===\n");
+
+    let rho_jina = spearman(&jina_dists, &api_ground_truth);
+    let rho_reranker = spearman(&reranker_dists, &api_ground_truth);
+
+    eprintln!("  Jina v3 baked vs API:     ρ = {:.4}", rho_jina);
+    eprintln!("  Reranker v3 baked vs API: ρ = {:.4}", rho_reranker);
+
+    // Cross-model: Jina vs Reranker
+    let rho_cross = spearman(&jina_dists, &reranker_dists);
+    eprintln!("  Jina vs Reranker (cross): ρ = {:.4}", rho_cross);
+
+    eprintln!("\n  Thresholds:");
+    eprintln!("    ρ > 0.998: truth-anchor grade (< 2 rank disagreements in 1000)");
+    eprintln!("    ρ > 0.95:  usable with ICC correction");
+    eprintln!("    ρ < 0.95:  broken, needs rebuild");
+
+    for (name, rho) in [("Jina", rho_jina), ("Reranker", rho_reranker)] {
+        let status = if rho > 0.998 { "TRUTH ANCHOR ✓" }
+            else if rho > 0.95 { "USABLE (needs ICC)" }
+            else if rho > 0.80 { "WEAK (needs rebuild or more centroids)" }
+            else { "BROKEN" };
+        eprintln!("  {} → {}", name, status);
+    }
+
+    // ── ICC Profile (if needed) ──────────────────────────────────
+    if rho_jina < 0.998 || rho_reranker < 0.998 {
+        eprintln!("\n=== ICC Profile Needed ===\n");
+        eprintln!("  Building transfer curves from {} pairs...", pairs.len());
+
+        // Simple linear regression as baseline ICC
+        let (jina_slope, jina_intercept) = linear_fit(&jina_dists, &api_ground_truth);
+        let (rr_slope, rr_intercept) = linear_fit(&reranker_dists, &api_ground_truth);
+
+        eprintln!("  Jina ICC:     corrected = {:.3} × baked + {:.3}", jina_slope, jina_intercept);
+        eprintln!("  Reranker ICC: corrected = {:.3} × baked + {:.3}", rr_slope, rr_intercept);
+
+        // Apply correction and re-measure
+        let jina_corrected: Vec<f32> = jina_dists.iter()
+            .map(|&d| (d * jina_slope + jina_intercept).clamp(0.0, 1.0))
+            .collect();
+        let rr_corrected: Vec<f32> = reranker_dists.iter()
+            .map(|&d| (d * rr_slope + rr_intercept).clamp(0.0, 1.0))
+            .collect();
+
+        let rho_jina_corrected = spearman(&jina_corrected, &api_ground_truth);
+        let rho_rr_corrected = spearman(&rr_corrected, &api_ground_truth);
+
+        eprintln!("  After ICC: Jina ρ = {:.4} (was {:.4})", rho_jina_corrected, rho_jina);
+        eprintln!("  After ICC: Reranker ρ = {:.4} (was {:.4})", rho_rr_corrected, rho_reranker);
+    }
+
+    eprintln!("\n═══════════════════════════════════════════════════════════");
+    eprintln!("  NOTE: Using hash-based tokenization (not real BPE).");
+    eprintln!("  For production calibration, use real tokenizers per model.");
+    eprintln!("  Set JINA_API_KEY for real API ground truth.");
+    eprintln!("═══════════════════════════════════════════════════════════\n");
+}
+
+fn avg_distance(a: &[u16], b: &[u16], dist_fn: impl Fn(u16, u16) -> f32) -> f32 {
+    let mut sum = 0.0f32;
+    let mut count = 0;
+    for &ca in a {
+        for &cb in b {
+            sum += dist_fn(ca, cb);
+            count += 1;
+        }
+    }
+    if count > 0 { sum / count as f32 } else { 0.0 }
+}
+
+fn spearman(a: &[f32], b: &[f32]) -> f32 {
+    let n = a.len().min(b.len());
+    if n < 2 { return 0.0; }
+    let rank_a = ranks(a);
+    let rank_b = ranks(b);
+    let mean_a = rank_a.iter().sum::<f32>() / n as f32;
+    let mean_b = rank_b.iter().sum::<f32>() / n as f32;
+    let mut num = 0.0f32;
+    let mut den_a = 0.0f32;
+    let mut den_b = 0.0f32;
+    for i in 0..n {
+        let da = rank_a[i] - mean_a;
+        let db = rank_b[i] - mean_b;
+        num += da * db;
+        den_a += da * da;
+        den_b += db * db;
+    }
+    let den = (den_a * den_b).sqrt();
+    if den > 1e-10 { num / den } else { 0.0 }
+}
+
+fn ranks(values: &[f32]) -> Vec<f32> {
+    let mut indexed: Vec<(usize, f32)> = values.iter().enumerate()
+        .map(|(i, &v)| (i, v)).collect();
+    indexed.sort_by(|a, b| a.1.partial_cmp(&b.1).unwrap());
+    let mut result = vec![0.0f32; values.len()];
+    for (rank, &(orig_idx, _)) in indexed.iter().enumerate() {
+        result[orig_idx] = rank as f32;
+    }
+    result
+}
+
+fn linear_fit(x: &[f32], y: &[f32]) -> (f32, f32) {
+    let n = x.len().min(y.len()) as f32;
+    let mx = x.iter().sum::<f32>() / n;
+    let my = y.iter().sum::<f32>() / n;
+    let mut num = 0.0f32;
+    let mut den = 0.0f32;
+    for i in 0..x.len().min(y.len()) {
+        num += (x[i] - mx) * (y[i] - my);
+        den += (x[i] - mx) * (x[i] - mx);
+    }
+    let slope = if den > 1e-10 { num / den } else { 1.0 };
+    let intercept = my - slope * mx;
+    (slope, intercept)
+}
+
+fn simple_hash(word: &str) -> u32 {
+    let mut h: u64 = 0x9e3779b97f4a7c15;
+    for b in word.bytes() { h = h.wrapping_mul(31).wrapping_add(b as u64); }
+    h as u32
+}

From fb42be732a59ade61039b7f51c006368fb0b744d Mon Sep 17 00:00:00 2001
From: Claude <noreply@anthropic.com>
Date: Sun, 5 Apr 2026 17:33:02 +0000
Subject: [PATCH 4/5] docs: add Jina v5 as new truth anchor (GGUF + ONNX, no
 API needed)

jinaai/jina-embeddings-v5-text-small-text-matching:
  F16 GGUF: 1,198 MB (streamable, v3 format, 310 tensors)
  ONNX: 2,384 MB (rten ground truth, full f32)
  tokenizer.json: 11.4 MB (real BPE)

Calibration: rten(ONNX) = ground truth, stream(GGUF) = baked lens.
Same model, two paths, ICC profile bridges them. No API key.

https://claude.ai/code/session_01ChLvBfpJS8dQhHxRD4pYNp
---
 .claude/HANDOVER_MAVERICK_SESSION.md | 19 +++++++++++++++++++
 1 file changed, 19 insertions(+)

diff --git a/.claude/HANDOVER_MAVERICK_SESSION.md b/.claude/HANDOVER_MAVERICK_SESSION.md
index 594489b7..423ada33 100644
--- a/.claude/HANDOVER_MAVERICK_SESSION.md
+++ b/.claude/HANDOVER_MAVERICK_SESSION.md
@@ -562,3 +562,22 @@ NACHHER:
 
 SiLU-ONNX: GESTRICHEN. Vorzeichen-Erhaltung ersetzt es.
 ```
+
+---
+
+## Jina v5 — New Truth Anchor (replaces v3)
+
+```
+Repo:  jinaai/jina-embeddings-v5-text-small-text-matching
+GGUF:  v5-small-text-matching-F16.gguf (1,198 MB, GGUF v3, 310 tensors)
+ONNX:  onnx/model.onnx + model.onnx_data (2,384 MB, for rten ground truth)
+Tok:   tokenizer.json (11.4 MB, real BPE)
+
+Calibration pipeline:
+  rten loads ONNX → forward pass → ground truth embeddings
+  Our pipeline: stream F16 GGUF → CLAM → bake HDR table
+  ICC profile: compare → calibrate → truth anchor at ρ > 0.998
+
+Both ONNX and GGUF from SAME model = no API key, no network for calibration.
+Jina v5 replaces v3 as truth anchor (newer, better, has ONNX).
+```

From 6619cb1e9228d3491c394069d05715b1d6debc9a Mon Sep 17 00:00:00 2001
From: Claude <noreply@anthropic.com>
Date: Sun, 5 Apr 2026 17:47:51 +0000
Subject: [PATCH 5/5] =?UTF-8?q?docs:=20calibration=20matrix=20=E2=80=94=20?=
 =?UTF-8?q?ONNX=20vs=20GGUF=20vs=20highheelbgz=20=C3=97=20ICC=20profiles?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

5 encoding paths × ONNX ground truth × 6 models × 6 roles:
  ONNX (rten) = f32 ground truth
  GGUF raw u8 CDF, GGUF γ+φ, GGUF i8 signed, GGUF highheelbgz spiral

ICC profile per path. Spearman ρ identifies best encoding per model×role.
All tools ready: rten, streaming, gamma_phi, LensProfile, calibrate harness.
Estimated: ~2.5 hours for complete matrix.

https://claude.ai/code/session_01ChLvBfpJS8dQhHxRD4pYNp
---
 .claude/HANDOVER_MAVERICK_SESSION.md | 65 ++++++++++++++++++++++++++++
 1 file changed, 65 insertions(+)

diff --git a/.claude/HANDOVER_MAVERICK_SESSION.md b/.claude/HANDOVER_MAVERICK_SESSION.md
index 423ada33..a6c6640d 100644
--- a/.claude/HANDOVER_MAVERICK_SESSION.md
+++ b/.claude/HANDOVER_MAVERICK_SESSION.md
@@ -581,3 +581,68 @@ Calibration pipeline:
 Both ONNX and GGUF from SAME model = no API key, no network for calibration.
 Jina v5 replaces v3 as truth anchor (newer, better, has ONNX).
 ```
+
+---
+
+## CALIBRATION MATRIX — The Definitive Experiment
+
+### Three encoding paths × ONNX ground truth
+
+```
+For each model (Jina v5, BGE-M3, Reranker, Reader-LM, Qwopus, Maverick):
+  For each role (Q, K, V, Gate, Up, Down — or token_embd for embedding models):
+  
+    1. ONNX (rten): load model.onnx → forward pass → f32 embeddings = GROUND TRUTH
+    2. GGUF raw:    stream BF16 → CLAM → cosine → u8 HDR CDF table
+    3. GGUF γ+φ:    stream BF16 → CLAM → cosine → gamma offset → phi redistribute
+    4. GGUF i8:     stream BF16 → CLAM → cosine → signed i8 (preserves inhibition)
+    5. GGUF hhbgz:  stream BF16 → CLAM → highheelbgz spiral → golden ratio stride
+    
+    ICC profile: compare each path (2-5) against ground truth (1)
+    Measure: Spearman ρ, transfer curve, noise floor, effective bits
+    
+    Best path = highest ρ after ICC correction
+    Per-model per-role winner may differ!
+```
+
+### Why this is definitive
+
+```
+Current state: we ASSUME our encoding preserves topology.
+After calibration: we KNOW, quantified to 4 decimal places.
+
+Expected outcomes:
+  - i8 wins for reranker (symmetric cos range, sign matters)
+  - γ+φ wins for gate-heavy roles (concentrates resolution at zero)
+  - raw u8 CDF is surprisingly good for embedding models (positive-skewed)
+  - hhbgz spiral wins for... we don't know yet. That's why we test.
+  
+  ICC correction makes EVERY path usable.
+  But some paths need less correction = more faithful = preferred.
+```
+
+### Tools ready
+
+```
+rten:                 AdaWorldAPI/rten (ONNX runtime, your fork)
+GGUF streaming:       stream_hdr_lens.rs, stream_maverick.rs (HTTP range)
+highheelbgz:          spiral addressing + golden ratio stride
+bgz-tensor:           gamma_phi.rs (GammaProfile, encode/decode)
+LensProfile:          lance-graph-contract/high_heel.rs (ICC DTO)
+LensConfig:           lance-graph-contract/high_heel.rs (6-model registry)
+calibrate_lenses.rs:  Spearman ρ + ICC builder harness
+Jina v5 ONNX:         jinaai/jina-embeddings-v5-text-small-text-matching
+Jina v5 GGUF:         same repo, F16.gguf (1.2 GB, streamable)
+```
+
+### Session estimate
+```
+Download: Jina v5 ONNX (2.4 GB) + GGUF (1.2 GB) = 3.6 GB (fits in 18 GB free)
+Compute:  rten inference on 1000 texts ≈ 5 min
+          CLAM + 5 encoding paths ≈ 10 min
+          ICC profiles ≈ 1 min
+          Total: ~20 min for Jina v5 complete calibration
+          
+Repeat for remaining 5 models: ~2 hours total
+Full calibration matrix: ~2.5 hours
+```