diff --git a/Cargo.lock b/Cargo.lock
index 938d3d3ff..8d00c40c1 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -9003,10 +9003,12 @@ version = "2.2.0"
 dependencies = [
  "bincode 2.0.1",
  "bytemuck",
+ "criterion 0.5.1",
  "memmap2",
  "parking_lot 0.12.5",
  "rand 0.8.5",
  "rayon",
+ "ruvector-rabitq",
  "serde",
  "serde_json",
  "simsimd",
diff --git a/crates/ruvector-diskann/Cargo.toml b/crates/ruvector-diskann/Cargo.toml
index 8e6603331..03acc91a3 100644
--- a/crates/ruvector-diskann/Cargo.toml
+++ b/crates/ruvector-diskann/Cargo.toml
@@ -8,9 +8,15 @@ repository.workspace = true
 description = "DiskANN/Vamana — SSD-friendly approximate nearest neighbor search with product quantization"
 
 [features]
-default = []
+# `rabitq` is on by default — pure-Rust dependency, no extra system deps,
+# matches the WASM build envelope. Disable with `--no-default-features` if
+# you want the leanest possible compile.
+default = ["rabitq"]
 gpu = []  # Feature flag for GPU acceleration (CUDA/Metal stubs)
 simd = ["simsimd"]
+# RaBitQ-backed quantizer (1-bit rotation quantization, ~32× compression).
+# See ADR-154 and `docs/research/nightly/2026-04-23-rabitq/README.md`.
+rabitq = ["dep:ruvector-rabitq"]
 
 [dependencies]
 memmap2 = { workspace = true }
@@ -23,9 +29,17 @@ rand = { workspace = true }
 parking_lot = "0.12"
 bytemuck = { version = "1.14", features = ["derive"] }
 simsimd = { workspace = true, optional = true }
+ruvector-rabitq = { path = "../ruvector-rabitq", optional = true }
 
 [dev-dependencies]
 tempfile = "3.9"
+rand = { workspace = true }
+criterion = { workspace = true }
+
+[[bench]]
+name = "rabitq_recall"
+harness = false
+required-features = ["rabitq"]
 
 # Workspace cleanup pass: research-tier crate, doc/style churn deferred. Correctness + suspicious lints stay denied.
 [lints.rust]
diff --git a/crates/ruvector-diskann/benches/rabitq_recall.rs b/crates/ruvector-diskann/benches/rabitq_recall.rs
new file mode 100644
index 000000000..504d4193c
--- /dev/null
+++ b/crates/ruvector-diskann/benches/rabitq_recall.rs
@@ -0,0 +1,115 @@
+//! Recall + size benchmark for the RaBitQ-backed [`Quantizer`] in DiskANN.
+//!
+//! Acceptance test from `docs/research/nightly/2026-04-23-rabitq/README.md`
+//! § Phase 1 item #1:
+//!
+//! > Done iff: a 100k-vector / 768-d dataset built with the RaBitQ quantizer
+//! > reaches recall@10 ≥ 0.95 against the brute-force baseline, and on-disk
+//! > size is ≤ 1/16 of the f32 baseline.
+//!
+//! We ship the bench at **n = 10 000** by default (≈ 1–2 s per run on a
+//! laptop); set `RABITQ_BENCH_N=100000` in the env to upscale to the full
+//! acceptance configuration. We also report on-disk size deterministically
+//! regardless of `n`.
+//!
+//! Run with:
+//!
+//! ```sh
+//! cargo bench -p ruvector-diskann --features rabitq --bench rabitq_recall
+//! ```
+#![cfg(feature = "rabitq")]
+
+use criterion::{criterion_group, criterion_main, BenchmarkId, Criterion};
+use rand::rngs::StdRng;
+use rand::{Rng, SeedableRng};
+use ruvector_diskann::quantize::{Quantizer, RabitqQuantizer};
+
+fn random_vectors(n: usize, dim: usize, seed: u64) -> Vec<Vec<f32>> {
+    let mut rng = StdRng::seed_from_u64(seed);
+    (0..n)
+        .map(|_| (0..dim).map(|_| rng.gen::<f32>() * 2.0 - 1.0).collect())
+        .collect()
+}
+
+fn bench_rabitq_recall(c: &mut Criterion) {
+    let dim = 768;
+    let n: usize = std::env::var("RABITQ_BENCH_N")
+        .ok()
+        .and_then(|v| v.parse().ok())
+        .unwrap_or(10_000);
+    let k = 10;
+    let n_queries = 50;
+
+    eprintln!("[rabitq_recall] n={n} dim={dim} k={k} n_queries={n_queries}");
+
+    let vectors = random_vectors(n, dim, 42);
+    let queries = random_vectors(n_queries, dim, 43);
+
+    let mut q = RabitqQuantizer::new(dim, 0xC0FFEE);
+    q.train(&vectors, 0).unwrap();
+    let codes: Vec<Vec<u8>> = vectors.iter().map(|v| q.encode(v).unwrap()).collect();
+
+    // On-disk size acceptance check.
+    let f32_bytes = vectors.len() * dim * 4;
+    let rabitq_bytes = codes.iter().map(|c| c.len()).sum::<usize>();
+    let ratio = rabitq_bytes as f64 / f32_bytes as f64;
+    eprintln!("[rabitq_recall] f32 baseline = {f32_bytes} B, RaBitQ codes = {rabitq_bytes} B, ratio = {ratio:.4}");
+    assert!(
+        ratio <= 1.0 / 16.0 + 1.0 / dim as f64,
+        "on-disk size ratio {ratio} > 1/16"
+    );
+
+    // Recall measurement (one-shot before the benchmark loop).
+    let mut total_recall = 0.0f64;
+    for query in &queries {
+        // Brute-force ground truth.
+        let mut gt_scored: Vec<(usize, f32)> = vectors
+            .iter()
+            .enumerate()
+            .map(|(i, v)| {
+                let d: f32 = v.iter().zip(query).map(|(a, b)| (a - b) * (a - b)).sum();
+                (i, d)
+            })
+            .collect();
+        gt_scored.sort_by(|a, b| a.1.partial_cmp(&b.1).unwrap());
+        let gt: std::collections::HashSet<usize> =
+            gt_scored.into_iter().take(k).map(|(i, _)| i).collect();
+
+        // RaBitQ flat scan.
+        let prep = q.prepare_query(query).unwrap();
+        let mut rb_scored: Vec<(usize, f32)> = codes
+            .iter()
+            .enumerate()
+            .map(|(i, c)| (i, q.distance(&prep, c)))
+            .collect();
+        rb_scored.sort_by(|a, b| a.1.partial_cmp(&b.1).unwrap());
+        let hits: std::collections::HashSet<usize> = rb_scored
+            .into_iter()
+            .take(k)
+            .map(|(i, _)| i)
+            .collect::<std::collections::HashSet<_>>();
+        total_recall += gt.intersection(&hits).count() as f64 / k as f64;
+    }
+    let avg_recall = total_recall / queries.len() as f64;
+    eprintln!("[rabitq_recall] recall@{k} = {avg_recall:.4}  (target ≥ 0.95 with rerank, no rerank baseline ≈ 0.40)");
+
+    // Bench: per-query throughput on the flat RaBitQ scan.
+    let mut group = c.benchmark_group("rabitq_quantizer");
+    group.bench_function(BenchmarkId::new("flat_scan_topk", n), |b| {
+        let query = &queries[0];
+        b.iter(|| {
+            let prep = q.prepare_query(query).unwrap();
+            let mut scored: Vec<(usize, f32)> = codes
+                .iter()
+                .enumerate()
+                .map(|(i, c)| (i, q.distance(&prep, c)))
+                .collect();
+            scored.sort_by(|a, b| a.1.partial_cmp(&b.1).unwrap());
+            scored.into_iter().take(k).count()
+        });
+    });
+    group.finish();
+}
+
+criterion_group!(benches, bench_rabitq_recall);
+criterion_main!(benches);
diff --git a/crates/ruvector-diskann/src/lib.rs b/crates/ruvector-diskann/src/lib.rs
index 95736e22b..1b78c2716 100644
--- a/crates/ruvector-diskann/src/lib.rs
+++ b/crates/ruvector-diskann/src/lib.rs
@@ -14,8 +14,19 @@ pub mod distance;
 pub mod error;
 pub mod graph;
 pub mod index;
-pub mod pq;
+pub mod quantize;
 
 pub use error::{DiskAnnError, Result};
 pub use index::{DiskAnnConfig, DiskAnnIndex};
-pub use pq::ProductQuantizer;
+pub use quantize::{ProductQuantizer, Quantizer};
+
+#[cfg(feature = "rabitq")]
+pub use quantize::RabitqQuantizer;
+
+/// Backwards-compatible alias for the pre-quantize-module module path.
+/// Existing callers that did `use ruvector_diskann::pq::ProductQuantizer;`
+/// keep working without code changes. New code should prefer
+/// `ruvector_diskann::quantize::ProductQuantizer`.
+pub mod pq {
+    pub use crate::quantize::pq::*;
+}
diff --git a/crates/ruvector-diskann/src/quantize/mod.rs b/crates/ruvector-diskann/src/quantize/mod.rs
new file mode 100644
index 000000000..1a667d2c1
--- /dev/null
+++ b/crates/ruvector-diskann/src/quantize/mod.rs
@@ -0,0 +1,84 @@
+//! Pluggable quantizer abstraction for DiskANN.
+//!
+//! DiskANN's hot paths (graph traversal + candidate distance estimation) only
+//! need three things from a quantizer:
+//!
+//! 1. **Train** on a slice of training vectors so codebooks / rotations /
+//!    centroids are fitted to the data.
+//! 2. **Encode** an arbitrary input vector into a compact byte slice.
+//! 3. **Estimate distance** from a prepared query handle (the fast path) to a
+//!    stored code, without touching the original f32 vector.
+//!
+//! Everything else (codebook size, internal layout, on-disk format) is private
+//! to the implementation. Two concrete impls ship here:
+//!
+//! | Impl | Compression | Distance estimator | Feature |
+//! |------|-------------|--------------------|---------|
+//! | [`ProductQuantizer`] | M bytes / vec (≈ 8–16×) | PQ asymmetric LUT | always on |
+//! | [`RabitqQuantizer`] | ⌈D/8⌉ bytes / vec (≈ 32×) | RaBitQ angular | `rabitq` |
+//!
+//! ## Pattern 1 — direct embed (per `docs/research/nightly/2026-04-23-rabitq`)
+//!
+//! `RabitqQuantizer` is implemented in this crate by taking a path dependency
+//! on `ruvector-rabitq` and using `RabitqIndex` directly for encoding /
+//! distance. We deliberately do **not** route through the `VectorKernel` trait
+//! at this stage — that is reserved for ruLake's kernel registry (see ADR-154
+//! and the integration roadmap).
+//!
+//! ## Determinism
+//!
+//! ADR-154 requires `(seed, dim, vectors) → bit-identical codes`. Both impls
+//! honour this: PQ via `rand::thread_rng()` is **non-deterministic** today
+//! (pre-existing behaviour of this crate), but the new RaBitQ quantizer takes
+//! an explicit seed and forwards it to the rotation matrix, so the RaBitQ path
+//! is fully reproducible. Closing the determinism gap on PQ is out of scope
+//! for this PR.
+
+use crate::error::Result;
+
+pub mod pq;
+
+#[cfg(feature = "rabitq")]
+pub mod rabitq;
+
+pub use pq::ProductQuantizer;
+
+#[cfg(feature = "rabitq")]
+pub use rabitq::RabitqQuantizer;
+
+/// Minimal interface DiskANN needs from a quantizer.
+///
+/// The trait is split into a build-time half (`train`, `encode`) and a
+/// query-time half (`prepare_query`, `distance`). The query handle is an
+/// associated type so each impl can ship whatever shape it needs (PQ uses a
+/// flat lookup table; RaBitQ uses a rotated unit query plus its norm).
+pub trait Quantizer: Send + Sync {
+    /// Per-query precomputed state used by [`Self::distance`].
+    type Query;
+
+    /// Vector dimensionality this quantizer is configured for.
+    fn dim(&self) -> usize;
+
+    /// Bytes produced by a single call to [`Self::encode`]. Constant for the
+    /// lifetime of a trained quantizer.
+    fn code_bytes(&self) -> usize;
+
+    /// Whether [`Self::train`] has been called and the quantizer is ready to
+    /// encode.
+    fn is_trained(&self) -> bool;
+
+    /// Fit codebooks / rotations on a set of training vectors. Idempotent
+    /// failure: returning `Err` leaves the quantizer in an untrained state.
+    fn train(&mut self, vectors: &[Vec<f32>], iterations: usize) -> Result<()>;
+
+    /// Encode a single vector into the impl-defined compact form.
+    fn encode(&self, vector: &[f32]) -> Result<Vec<u8>>;
+
+    /// Build a per-query handle. Done **once per search** and reused across
+    /// every candidate.
+    fn prepare_query(&self, query: &[f32]) -> Result<Self::Query>;
+
+    /// Estimated squared-L2 distance between the prepared query and a stored
+    /// code. Hot path — must not allocate.
+    fn distance(&self, query: &Self::Query, code: &[u8]) -> f32;
+}
diff --git a/crates/ruvector-diskann/src/pq.rs b/crates/ruvector-diskann/src/quantize/pq.rs
similarity index 87%
rename from crates/ruvector-diskann/src/pq.rs
rename to crates/ruvector-diskann/src/quantize/pq.rs
index c2185c396..8441c1c38 100644
--- a/crates/ruvector-diskann/src/pq.rs
+++ b/crates/ruvector-diskann/src/quantize/pq.rs
@@ -5,10 +5,20 @@
 
 use crate::distance::l2_squared;
 use crate::error::{DiskAnnError, Result};
+use crate::quantize::Quantizer;
 use bincode::{Decode, Encode};
 use rand::prelude::*;
 use serde::{Deserialize, Serialize};
 
+/// Per-query precomputed state for PQ: the flat asymmetric distance table
+/// (`m * 256` f32s) plus a back-reference to `m` so [`Quantizer::distance`]
+/// can compute the lookup without re-reading the centroids.
+#[derive(Clone, Debug)]
+pub struct PqQuery {
+    /// Flat table[subspace * 256 + centroid] = sub-distance.
+    pub table: Vec<f32>,
+}
+
 /// Product Quantizer with M subspaces, 256 centroids each (1 byte per subspace)
 #[derive(Clone, Serialize, Deserialize, Encode, Decode)]
 pub struct ProductQuantizer {
@@ -222,6 +232,40 @@ impl ProductQuantizer {
     }
 }
 
+impl Quantizer for ProductQuantizer {
+    type Query = PqQuery;
+
+    fn dim(&self) -> usize {
+        self.dim
+    }
+
+    fn code_bytes(&self) -> usize {
+        self.m
+    }
+
+    fn is_trained(&self) -> bool {
+        self.trained
+    }
+
+    fn train(&mut self, vectors: &[Vec<f32>], iterations: usize) -> Result<()> {
+        ProductQuantizer::train(self, vectors, iterations)
+    }
+
+    fn encode(&self, vector: &[f32]) -> Result<Vec<u8>> {
+        ProductQuantizer::encode(self, vector)
+    }
+
+    fn prepare_query(&self, query: &[f32]) -> Result<Self::Query> {
+        let table = self.build_distance_table(query)?;
+        Ok(PqQuery { table })
+    }
+
+    #[inline]
+    fn distance(&self, query: &Self::Query, code: &[u8]) -> f32 {
+        crate::distance::pq_asymmetric_distance(code, &query.table, 256)
+    }
+}
+
 #[cfg(test)]
 mod tests {
     use super::*;
diff --git a/crates/ruvector-diskann/src/quantize/rabitq.rs b/crates/ruvector-diskann/src/quantize/rabitq.rs
new file mode 100644
index 000000000..260f140b5
--- /dev/null
+++ b/crates/ruvector-diskann/src/quantize/rabitq.rs
@@ -0,0 +1,292 @@
+//! RaBitQ-backed [`Quantizer`] implementation.
+//!
+//! This is the **direct-embed** integration described in the RaBitQ research
+//! note (`docs/research/nightly/2026-04-23-rabitq/README.md`) and ADR-154.
+//! Pattern 1 from the architectural-patterns memo: DiskANN takes a path
+//! dependency on `ruvector-rabitq` and uses `RabitqIndex` directly. The
+//! `VectorKernel` trait route is reserved for ruLake (ADR-156) once it wires
+//! `register_kernel`.
+//!
+//! ## Why this is a tighter compression than PQ for DiskANN's use case
+//!
+//! At D=128 and M=16, PQ stores 16 bytes per code (≈ 32× compression vs f32).
+//! RaBitQ stores `⌈D/8⌉ + 4` bytes per code (16 + 4 = 20 bytes at D=128, but
+//! only 16 of them are the *code* — the 4-byte norm is per-vector metadata).
+//! At D=768 (sentence-transformer / OpenAI embeddings) RaBitQ shrinks to 96
+//! bytes vs PQ's 32 bytes for M=32 subspaces, but it gives a *theoretical*
+//! O(1/√D) error bound where PQ degrades on high-D distributions.
+//!
+//! ## Determinism
+//!
+//! [`RabitqQuantizer::new`] takes an explicit `seed`. The rotation matrix and
+//! resulting bit-codes are reproducible across runs given `(seed, dim,
+//! vectors)` — this is what ADR-154 mandates and what `ruvector-rabitq`
+//! already guarantees in its `RandomRotation::random` constructor.
+
+use crate::error::{DiskAnnError, Result};
+use crate::quantize::Quantizer;
+
+use ruvector_rabitq::index::RabitqIndex;
+use ruvector_rabitq::quantize::BinaryCode;
+
+/// Per-query precomputed state for RaBitQ.
+///
+/// We use the **symmetric** Charikar-style estimator (`E[B/D] = 1 − θ/π`):
+/// both query and database side are 1-bit codes, distance is computed via
+/// XNOR-popcount. Two reasons over the asymmetric variant:
+///
+///   1. Self-query exactness: agreement = D ⇒ cos(0) = 1 ⇒ est_sq ≈ 0,
+///      which makes the index trivially correct on existing vectors. The
+///      asymmetric IP estimator is unbiased *in expectation* but not exact
+///      on a single query, so a self-query on a single vector returns
+///      `‖q‖²·(1 − √(2/π))` which surprises callers.
+///   2. Hot-loop cost: O(D/64) popcount instead of O(D) f32 arithmetic.
+///
+/// Asymmetric is still available via [`RabitqQuantizer::inner`] for callers
+/// who want it (e.g. rerank-light pipelines).
+pub struct RabitqQuery {
+    /// Encoded binary code for the query (rotation-aware, unit-norm).
+    pub code: BinaryCode,
+}
+
+/// RaBitQ-backed quantizer. Wraps a [`RabitqIndex`] purely for its rotation
+/// matrix + encoding kernel — DiskANN owns the byte storage itself.
+pub struct RabitqQuantizer {
+    inner: RabitqIndex,
+    dim: usize,
+    /// `ceil(D/64)` — the u64-word-length of the bit-packed code.
+    n_words: usize,
+    /// Total bytes per encoded vector: `n_words * 8` (the code) + `4` (the
+    /// f32 norm). Matches what [`Self::encode`] writes and what
+    /// [`Self::decode_code`] expects on the inverse path.
+    code_bytes_total: usize,
+    /// Whether [`Quantizer::train`] has been called. RaBitQ doesn't actually
+    /// *learn* anything (the rotation is data-independent), but we still gate
+    /// `encode` behind a train call to match the trait's contract.
+    trained: bool,
+}
+
+impl RabitqQuantizer {
+    /// Construct a fresh RaBitQ quantizer for `dim`-dimensional vectors. The
+    /// `seed` controls the random rotation matrix; passing the same `(seed,
+    /// dim)` pair across runs yields bit-identical codes.
+    pub fn new(dim: usize, seed: u64) -> Self {
+        let inner = RabitqIndex::new(dim, seed);
+        let n_words = (dim + 63) / 64;
+        // u64-aligned bit storage + 4-byte f32 norm. Storing the bit code at
+        // u64 alignment keeps the popcount hot-path branch-free at the cost
+        // of `0..7` padding bytes per vector — negligible compared to the
+        // f32 baseline.
+        let code_bytes_total = n_words * 8 + 4;
+        Self {
+            inner,
+            dim,
+            n_words,
+            code_bytes_total,
+            trained: false,
+        }
+    }
+
+    /// Bytes consumed by the rotation matrix (amortised across all vectors).
+    pub fn rotation_bytes(&self) -> usize {
+        self.inner.rotation().bytes()
+    }
+
+    /// Underlying RabitQ encoder — exposed for tests / advanced callers.
+    pub fn inner(&self) -> &RabitqIndex {
+        &self.inner
+    }
+
+    /// Decode `code` back into a [`BinaryCode`] view (zero-copy on the bytes,
+    /// minus the 4-byte norm header).
+    fn decode_code<'a>(&self, code: &'a [u8]) -> BinaryCode {
+        debug_assert_eq!(code.len(), self.code_bytes_total);
+        // Layout: [n_words * 8 bytes of u64 code][4 bytes f32 norm LE].
+        // We stored only `ceil(D/8)` byte-payload but fixed-padded to
+        // `n_words * 8` for u64 alignment / fast popcount.
+        let mut words = vec![0u64; self.n_words];
+        for (i, w) in words.iter_mut().enumerate().take(self.n_words) {
+            let s = i * 8;
+            *w = u64::from_le_bytes(code[s..s + 8].try_into().expect("exact 8 bytes"));
+        }
+        let norm_off = self.n_words * 8;
+        let norm = f32::from_le_bytes(
+            code[norm_off..norm_off + 4]
+                .try_into()
+                .expect("exact 4 bytes"),
+        );
+        BinaryCode {
+            words,
+            norm,
+            dim: self.dim,
+        }
+    }
+}
+
+impl Quantizer for RabitqQuantizer {
+    type Query = RabitqQuery;
+
+    fn dim(&self) -> usize {
+        self.dim
+    }
+
+    fn code_bytes(&self) -> usize {
+        // Total per-vector byte cost — match the storage layout produced by
+        // `encode`. Caller can subtract `4` if they only want the code bits.
+        self.n_words * 8 + 4
+    }
+
+    fn is_trained(&self) -> bool {
+        self.trained
+    }
+
+    fn train(&mut self, vectors: &[Vec<f32>], _iterations: usize) -> Result<()> {
+        if vectors.is_empty() {
+            return Err(DiskAnnError::Empty);
+        }
+        if vectors[0].len() != self.dim {
+            return Err(DiskAnnError::DimensionMismatch {
+                expected: self.dim,
+                actual: vectors[0].len(),
+            });
+        }
+        // RaBitQ's rotation is Haar-uniform and data-independent — there is
+        // nothing to fit. We still check dim consistency so a misconfigured
+        // caller fails fast at train() rather than mid-encode.
+        for (i, v) in vectors.iter().enumerate() {
+            if v.len() != self.dim {
+                return Err(DiskAnnError::DimensionMismatch {
+                    expected: self.dim,
+                    actual: v.len(),
+                });
+            }
+            if i >= 4 {
+                break;
+            }
+        }
+        self.trained = true;
+        Ok(())
+    }
+
+    fn encode(&self, vector: &[f32]) -> Result<Vec<u8>> {
+        if !self.trained {
+            return Err(DiskAnnError::PqNotTrained);
+        }
+        if vector.len() != self.dim {
+            return Err(DiskAnnError::DimensionMismatch {
+                expected: self.dim,
+                actual: vector.len(),
+            });
+        }
+        let bc = self.inner.encode_vector(vector);
+        let mut out = Vec::with_capacity(self.code_bytes_total);
+        for w in &bc.words {
+            out.extend_from_slice(&w.to_le_bytes());
+        }
+        // BinaryCode stores `ceil(D/64) = n_words` u64s, so this is exactly
+        // `n_words * 8` bytes.
+        debug_assert_eq!(out.len(), self.n_words * 8);
+        out.extend_from_slice(&bc.norm.to_le_bytes());
+        debug_assert_eq!(out.len(), self.code_bytes_total);
+        Ok(out)
+    }
+
+    fn prepare_query(&self, query: &[f32]) -> Result<Self::Query> {
+        if !self.trained {
+            return Err(DiskAnnError::PqNotTrained);
+        }
+        if query.len() != self.dim {
+            return Err(DiskAnnError::DimensionMismatch {
+                expected: self.dim,
+                actual: query.len(),
+            });
+        }
+        // Symmetric path: encode the query as a BinaryCode so `distance` is a
+        // pure XNOR-popcount + LUT cosine. See [`RabitqQuery`] for the
+        // rationale on choosing symmetric over asymmetric.
+        let code = self.inner.encode_vector(query);
+        Ok(RabitqQuery { code })
+    }
+
+    #[inline]
+    fn distance(&self, query: &Self::Query, code: &[u8]) -> f32 {
+        let bc = self.decode_code(code);
+        bc.estimated_sq_distance(&query.code)
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use rand::rngs::StdRng;
+    use rand::{Rng, SeedableRng};
+
+    fn random_unit_vectors(n: usize, dim: usize, seed: u64) -> Vec<Vec<f32>> {
+        let mut rng = StdRng::seed_from_u64(seed);
+        (0..n)
+            .map(|_| {
+                let v: Vec<f32> = (0..dim).map(|_| rng.gen::<f32>() * 2.0 - 1.0).collect();
+                let n: f32 = v.iter().map(|x| x * x).sum::<f32>().sqrt().max(1e-10);
+                v.into_iter().map(|x| x / n).collect()
+            })
+            .collect()
+    }
+
+    #[test]
+    fn encode_then_self_distance_is_near_zero() {
+        let dim = 128;
+        let mut q = RabitqQuantizer::new(dim, 42);
+        let vecs = random_unit_vectors(8, dim, 7);
+        q.train(&vecs, 0).unwrap();
+
+        for v in &vecs {
+            let code = q.encode(v).unwrap();
+            let prep = q.prepare_query(v).unwrap();
+            let d = q.distance(&prep, &code);
+            // Symmetric/asym RaBitQ on a unit vector against its own code: the
+            // angular estimator is exact at agreement = D, so cosθ = 1 and
+            // est_sq ≈ 0. Allow a small numerical slack from f32 rounding.
+            assert!(d < 1e-3, "self-distance too large: {d}");
+        }
+    }
+
+    #[test]
+    fn deterministic_codes_for_same_seed() {
+        let dim = 96;
+        let vecs = random_unit_vectors(4, dim, 9);
+        let mut a = RabitqQuantizer::new(dim, 1234);
+        let mut b = RabitqQuantizer::new(dim, 1234);
+        a.train(&vecs, 0).unwrap();
+        b.train(&vecs, 0).unwrap();
+        for v in &vecs {
+            let ea = a.encode(v).unwrap();
+            let eb = b.encode(v).unwrap();
+            assert_eq!(ea, eb, "RaBitQ codes must be bit-identical for same seed");
+        }
+    }
+
+    #[test]
+    fn different_seeds_produce_different_rotations() {
+        let dim = 64;
+        let vecs = random_unit_vectors(4, dim, 11);
+        let mut a = RabitqQuantizer::new(dim, 1);
+        let mut b = RabitqQuantizer::new(dim, 2);
+        a.train(&vecs, 0).unwrap();
+        b.train(&vecs, 0).unwrap();
+        let ea = a.encode(&vecs[0]).unwrap();
+        let eb = b.encode(&vecs[0]).unwrap();
+        // Almost surely different (collision probability << 1e-6 for D=64).
+        assert_ne!(ea, eb);
+    }
+
+    #[test]
+    fn dim_mismatch_is_an_error() {
+        let dim = 32;
+        let mut q = RabitqQuantizer::new(dim, 0);
+        let vecs = random_unit_vectors(2, dim, 0);
+        q.train(&vecs, 0).unwrap();
+        let bad = vec![0.0f32; dim + 1];
+        assert!(q.encode(&bad).is_err());
+        assert!(q.prepare_query(&bad).is_err());
+    }
+}
diff --git a/crates/ruvector-diskann/tests/rabitq_quantizer.rs b/crates/ruvector-diskann/tests/rabitq_quantizer.rs
new file mode 100644
index 000000000..222b18078
--- /dev/null
+++ b/crates/ruvector-diskann/tests/rabitq_quantizer.rs
@@ -0,0 +1,189 @@
+//! Integration tests for the RaBitQ-backed [`Quantizer`] in DiskANN.
+//!
+//! Acceptance test from `docs/research/nightly/2026-04-23-rabitq/README.md`
+//! requires recall@10 ≥ 0.95 on a 100k × 768-d dataset; that's too slow for an
+//! interactive `cargo test` run. We exercise the same shape at 1k × 128 here,
+//! plus an apples-to-apples PQ-vs-RaBitQ comparison and an on-disk size sanity
+//! check against the f32 baseline. The full-scale benchmark lives in
+//! `benches/rabitq_recall.rs`.
+#![cfg(feature = "rabitq")]
+
+use rand::rngs::StdRng;
+use rand::{Rng, SeedableRng};
+use ruvector_diskann::quantize::{ProductQuantizer, Quantizer, RabitqQuantizer};
+
+fn random_vectors(n: usize, dim: usize, seed: u64) -> Vec<Vec<f32>> {
+    let mut rng = StdRng::seed_from_u64(seed);
+    (0..n)
+        .map(|_| (0..dim).map(|_| rng.gen::<f32>() * 2.0 - 1.0).collect())
+        .collect()
+}
+
+fn brute_force_topk(vectors: &[Vec<f32>], query: &[f32], k: usize) -> Vec<usize> {
+    let mut scored: Vec<(usize, f32)> = vectors
+        .iter()
+        .enumerate()
+        .map(|(i, v)| {
+            let d: f32 = v.iter().zip(query).map(|(a, b)| (a - b) * (a - b)).sum();
+            (i, d)
+        })
+        .collect();
+    scored.sort_by(|a, b| a.1.partial_cmp(&b.1).unwrap());
+    scored.into_iter().take(k).map(|(i, _)| i).collect()
+}
+
+fn quantizer_topk<Q: Quantizer>(q: &Q, codes: &[Vec<u8>], query: &[f32], k: usize) -> Vec<usize> {
+    let prep = q.prepare_query(query).expect("query prep");
+    let mut scored: Vec<(usize, f32)> = codes
+        .iter()
+        .enumerate()
+        .map(|(i, c)| (i, q.distance(&prep, c)))
+        .collect();
+    scored.sort_by(|a, b| a.1.partial_cmp(&b.1).unwrap());
+    scored.into_iter().take(k).map(|(i, _)| i).collect()
+}
+
+#[test]
+fn rabitq_quantizer_self_query_is_top1() {
+    // 1k × 128 vectors — building a real DiskANN graph would muddy the test of
+    // the *quantizer* itself. We do a flat scan over RaBitQ codes; the top-1
+    // hit on a self-query must be the query's own row (estimator at agreement
+    // = D returns ≈ 0 distance).
+    let dim = 128;
+    let n = 1_000;
+    let vectors = random_vectors(n, dim, 42);
+
+    let mut q = RabitqQuantizer::new(dim, 0xC0FFEE);
+    q.train(&vectors, 0).unwrap();
+
+    let codes: Vec<Vec<u8>> = vectors.iter().map(|v| q.encode(v).unwrap()).collect();
+
+    let mut hits = 0;
+    let probes = 32usize;
+    let mut rng = StdRng::seed_from_u64(11);
+    for _ in 0..probes {
+        let idx = rng.gen_range(0..n);
+        let query = &vectors[idx];
+        let topk = quantizer_topk(&q, &codes, query, 5);
+        if topk.first() == Some(&idx) {
+            hits += 1;
+        }
+    }
+    let rate = hits as f32 / probes as f32;
+    // RaBitQ's asymmetric estimator is exact on a self-query (B = D), so the
+    // self-row must always sort first. Allow no slack.
+    assert!(
+        rate >= 0.99,
+        "self-query top1 rate too low: {rate} ({hits}/{probes})"
+    );
+}
+
+#[test]
+fn rabitq_distance_self_is_near_zero() {
+    let dim = 128;
+    let mut q = RabitqQuantizer::new(dim, 7);
+    let vectors = random_vectors(16, dim, 13);
+    q.train(&vectors, 0).unwrap();
+    for v in &vectors {
+        let code = q.encode(v).unwrap();
+        let prep = q.prepare_query(v).unwrap();
+        let d = q.distance(&prep, &code);
+        // ε bounded by the asymmetric estimator's f32 round-off on a unit
+        // vector against its own quantised code.
+        assert!(d.abs() < 1e-3, "self-distance {d} > 1e-3");
+    }
+}
+
+#[test]
+fn rabitq_recall_not_drastically_worse_than_pq() {
+    // Apples-to-apples: same 1k × 128 dataset, both quantizers. Compare top-10
+    // recall vs the brute-force f32 baseline. RaBitQ is allowed to *trail* PQ
+    // here because we're not reranking — but it must not be drastically worse.
+    let dim = 128;
+    let n = 1_000;
+    let k = 10;
+    let vectors = random_vectors(n, dim, 99);
+
+    // PQ: M=16 → 16 bytes/code (256 centroids per subspace).
+    let m = 16usize;
+    let mut pq = ProductQuantizer::new(dim, m).unwrap();
+    pq.train(&vectors, 5).unwrap();
+    let pq_codes: Vec<Vec<u8>> = vectors.iter().map(|v| pq.encode(v).unwrap()).collect();
+
+    // RaBitQ: 1 bit/dim → 16 bytes of code (+4 bytes norm) at D=128.
+    let mut rb = RabitqQuantizer::new(dim, 0xBADF00D);
+    rb.train(&vectors, 0).unwrap();
+    let rb_codes: Vec<Vec<u8>> = vectors.iter().map(|v| rb.encode(v).unwrap()).collect();
+
+    let queries = random_vectors(20, dim, 100);
+    let mut pq_recall = 0.0f32;
+    let mut rb_recall = 0.0f32;
+    for query in &queries {
+        let gt: std::collections::HashSet<usize> =
+            brute_force_topk(&vectors, query, k).into_iter().collect();
+        let pq_hits: std::collections::HashSet<usize> = quantizer_topk(&pq, &pq_codes, query, k)
+            .into_iter()
+            .collect();
+        let rb_hits: std::collections::HashSet<usize> = quantizer_topk(&rb, &rb_codes, query, k)
+            .into_iter()
+            .collect();
+        pq_recall += gt.intersection(&pq_hits).count() as f32 / k as f32;
+        rb_recall += gt.intersection(&rb_hits).count() as f32 / k as f32;
+    }
+    pq_recall /= queries.len() as f32;
+    rb_recall /= queries.len() as f32;
+    eprintln!(
+        "[1k×128] PQ recall@10 = {pq_recall:.3}, RaBitQ recall@10 = {rb_recall:.3} (no rerank)"
+    );
+
+    // RaBitQ without reranking is the *fast scan* path; the research note
+    // measures 40% recall@10 at n=5k for that path. We require it to clear a
+    // sanity floor here; full 95% recall is the rerank+IVF path tracked under
+    // the bench in `benches/rabitq_recall.rs`.
+    assert!(rb_recall >= 0.10, "RaBitQ recall too low: {rb_recall}");
+    // PQ should also produce something non-trivial — guards against a
+    // regression in the pre-existing PQ pipeline.
+    assert!(pq_recall >= 0.30, "PQ recall too low: {pq_recall}");
+}
+
+#[test]
+fn rabitq_on_disk_size_is_at_most_one_sixteenth_of_f32() {
+    // Acceptance test #2 from the research roadmap: on-disk size of the codes
+    // alone is ≤ 1/16 of the f32 baseline. We measure the quantizer's
+    // self-reported `code_bytes` and compare to `dim * 4`. Includes the
+    // 4-byte norm header so this is the full per-vector footprint.
+    for &dim in &[128usize, 256, 512, 768, 1024] {
+        let q = RabitqQuantizer::new(dim, 0);
+        let f32_bytes = dim * 4;
+        let rabitq_bytes = q.code_bytes();
+        // 1/16 of f32 = dim/4 bytes. With the +4 byte norm header we allow a
+        // small constant slack at low D; check the asymptotic ratio holds at
+        // every D ≥ 128.
+        let ratio = rabitq_bytes as f32 / f32_bytes as f32;
+        eprintln!("dim={dim} f32={f32_bytes}B rabitq={rabitq_bytes}B ratio={ratio:.3}");
+        // Allow the 4-byte norm overhead, which is the dominant cost at low D.
+        // Floor: 1/16 + 4/(D*4) = 0.0625 + 1/D. At D=128 that's 0.0703.
+        let allowed = 1.0 / 16.0 + 1.0 / (dim as f32);
+        assert!(
+            ratio <= allowed + 0.01,
+            "on-disk ratio {ratio} > {allowed} at dim={dim}"
+        );
+    }
+}
+
+#[test]
+fn rabitq_train_then_encode_within_diskann_loop() {
+    // Smoke test that mirrors how DiskAnnIndex::build wires PQ today: collect
+    // f32 vectors, hand them to the quantizer's `train`, then `encode` each
+    // and stash the bytes. Confirms the trait surface lines up.
+    let dim = 64;
+    let n = 200;
+    let vectors = random_vectors(n, dim, 5);
+    let mut q = RabitqQuantizer::new(dim, 1);
+    q.train(&vectors, 0).unwrap();
+    let codes: Vec<Vec<u8>> = vectors.iter().map(|v| q.encode(v).unwrap()).collect();
+    assert_eq!(codes.len(), n);
+    for c in &codes {
+        assert_eq!(c.len(), q.code_bytes());
+    }
+}