diff --git a/asap-common/sketch-core/report.md b/asap-common/sketch-core/report.md
index 1230f10..a65a204 100644
--- a/asap-common/sketch-core/report.md
+++ b/asap-common/sketch-core/report.md
@@ -46,3 +46,25 @@ cargo test -p sketch-core
 |-------|--------|--------|----------------|----------------|----------|----------|
 | 4096  | 200000 | 2000   | Legacy         | 0.9999993694   | 0.20     | 3.69     |
 | 4096  | 200000 | 2000   | sketchlib-rust | 0.9999993499   | 0.21     | 4.27     |
+
+---
+
+### CountMinSketchWithHeap (top-k + CMS accuracy on exact top-k)
+
+The heap is maintained by local updates; recall is measured against the **true** top-k at the end of the stream.
+
+#### depth=3
+
+| width | n      | domain | heap_size | Mode           | Top-k recall | Pearson (top-k) | MAPE (%) | RMSE (%) |
+|-------|--------|--------|-----------|----------------|--------------|-----------------|----------|----------|
+| 1024  | 100000 | 1000   | 10        | Legacy         | 0.40         | 0.9571          | 0.174    | 0.319    |
+| 1024  | 100000 | 1000   | 10        | sketchlib-rust | 0.80         | 1.0000          | 0.000    | 0.000    |
+
+#### depth=5
+
+| width | n      | domain | heap_size | Mode           | Top-k recall | Pearson (top-k) | MAPE (%) | RMSE (%) |
+|-------|--------|--------|-----------|----------------|--------------|-----------------|----------|----------|
+| 2048  | 200000 | 2000   | 20        | Legacy         | 0.60         | 0.9964          | 0.045    | 0.101    |
+| 2048  | 200000 | 2000   | 20        | sketchlib-rust | 1.00         | 0.9982          | 0.021    | 0.067    |
+| 2048  | 200000 | 2000   | 50        | Legacy         | 0.40         | 0.9999983       | 5.60     | 16.49    |
+| 2048  | 200000 | 2000   | 50        | sketchlib-rust | 0.48         | 0.9999990       | 3.90     | 12.95    |
diff --git a/asap-common/sketch-core/src/bin/sketchlib_fidelity.rs b/asap-common/sketch-core/src/bin/sketchlib_fidelity.rs
index 8fd08e3..99ca914 100644
--- a/asap-common/sketch-core/src/bin/sketchlib_fidelity.rs
+++ b/asap-common/sketch-core/src/bin/sketchlib_fidelity.rs
@@ -1,9 +1,12 @@
 // Fidelity benchmarks comparing legacy vs sketchlib implementations across sketch types.
 #![allow(dead_code)]
 
+use std::collections::HashMap;
+
 use clap::Parser;
 use sketch_core::config::{self, ImplMode};
 use sketch_core::count_min::CountMinSketch;
+use sketch_core::count_min_with_heap::CountMinSketchWithHeap;
 
 #[derive(Clone)]
 struct Lcg64 {
@@ -143,6 +146,70 @@ fn run_countmin_once(seed: u64, p: &CmsParams) -> CmsResult {
     }
 }
 
+// --- CountMinSketchWithHeap ---
+
+struct CmwhParams {
+    depth: usize,
+    width: usize,
+    n: usize,
+    domain: usize,
+    heap_size: usize,
+}
+
+struct CmwhResult {
+    topk_recall: f64,
+    pearson: f64,
+    mape: f64,
+    rmse: f64,
+}
+
+fn run_countmin_with_heap_once(seed: u64, p: &CmwhParams) -> CmwhResult {
+    let mut rng = Lcg64::new(seed ^ 0xA5A5_A5A5);
+    let mut exact: Vec<f64> = vec![0.0; p.domain];
+    let mut cms = CountMinSketchWithHeap::new(p.depth, p.width, p.heap_size);
+
+    for _ in 0..p.n {
+        let r = rng.next_u64();
+        let key_id = if (r & 0xFF) < 200 {
+            (r as usize) % 20
+        } else {
+            (r as usize) % p.domain
+        };
+        let key = format!("k{key_id}");
+        cms.update(&key, 1.0);
+        exact[key_id] += 1.0;
+    }
+
+    let mut exact_pairs: Vec<(usize, f64)> = exact.iter().copied().enumerate().collect();
+    exact_pairs.sort_by(|a, b| b.1.partial_cmp(&a.1).unwrap());
+    exact_pairs.truncate(p.heap_size);
+
+    let exact_top: HashMap<String, f64> = exact_pairs
+        .into_iter()
+        .map(|(k, v)| (format!("k{k}"), v))
+        .collect();
+
+    let mut est_vals = Vec::with_capacity(exact_top.len());
+    let mut exact_vals = Vec::with_capacity(exact_top.len());
+    let mut hit = 0usize;
+    for item in cms.topk_heap_items() {
+        if exact_top.contains_key(&item.key) {
+            hit += 1;
+        }
+    }
+    for (k, v) in &exact_top {
+        exact_vals.push(*v);
+        est_vals.push(cms.query_key(k));
+    }
+
+    CmwhResult {
+        topk_recall: (hit as f64) / (p.heap_size as f64),
+        pearson: pearson_corr(&exact_vals, &est_vals),
+        mape: mape(&exact_vals, &est_vals),
+        rmse: rmse_percentage(&exact_vals, &est_vals),
+    }
+}
+
 #[derive(Parser)]
 struct Args {
     #[arg(long, value_enum, default_value_t = sketch_core::config::DEFAULT_CMS_IMPL)]
@@ -159,10 +226,12 @@ fn main() {
         .expect("sketch backend already initialised");
 
     let seed = 0xC0FFEE_u64;
-    let mode = if matches!(args.cms_impl, ImplMode::Legacy)
-        || matches!(args.kll_impl, ImplMode::Legacy)
-        || matches!(args.cmwh_impl, ImplMode::Legacy)
-    {
+    let cms_mode = if matches!(args.cms_impl, ImplMode::Legacy) {
+        "Legacy"
+    } else {
+        "sketchlib-rust"
+    };
+    let cmwh_mode = if matches!(args.cmwh_impl, ImplMode::Legacy) {
         "Legacy"
     } else {
         "sketchlib-rust"
@@ -196,7 +265,7 @@ fn main() {
         },
     ];
 
-    println!("## CountMinSketch ({mode})");
+    println!("## CountMinSketch ({cms_mode})");
     println!("| depth | width | n_updates | domain | Pearson corr | MAPE (%) | RMSE (%) |");
     println!("|-------|-------|------------|--------|--------------|----------|----------|");
     for p in &cms_param_sets {
@@ -206,4 +275,40 @@ fn main() {
             p.depth, p.width, p.n, p.domain, r.pearson, r.mape, r.rmse
         );
     }
+
+    // CountMinSketchWithHeap
+    let cmwh_param_sets: Vec<CmwhParams> = vec![
+        CmwhParams {
+            depth: 3,
+            width: 1024,
+            n: 100_000,
+            domain: 1000,
+            heap_size: 10,
+        },
+        CmwhParams {
+            depth: 5,
+            width: 2048,
+            n: 200_000,
+            domain: 2000,
+            heap_size: 20,
+        },
+        CmwhParams {
+            depth: 5,
+            width: 2048,
+            n: 200_000,
+            domain: 2000,
+            heap_size: 50,
+        },
+    ];
+
+    println!("\n## CountMinSketchWithHeap ({cmwh_mode})");
+    println!("| depth | width | n | domain | heap_size | Top-k recall | Pearson (top-k) | MAPE (%) | RMSE (%) |");
+    println!("|-------|-------|-----|--------|-----------|--------------|-----------------|----------|----------|");
+    for p in &cmwh_param_sets {
+        let r = run_countmin_with_heap_once(seed, p);
+        println!(
+            "| {} | {} | {} | {} | {} | {:.4} | {:.10} | {:.6} | {:.6} |",
+            p.depth, p.width, p.n, p.domain, p.heap_size, r.topk_recall, r.pearson, r.mape, r.rmse
+        );
+    }
 }
diff --git a/asap-common/sketch-core/src/config.rs b/asap-common/sketch-core/src/config.rs
index 9f49ad7..b23dea5 100644
--- a/asap-common/sketch-core/src/config.rs
+++ b/asap-common/sketch-core/src/config.rs
@@ -15,7 +15,7 @@ pub const DEFAULT_IMPL_MODE: ImplMode = ImplMode::Legacy;
 /// Per-backend defaults. Used when configure() has not been called.
 pub const DEFAULT_CMS_IMPL: ImplMode = ImplMode::Sketchlib;
 pub const DEFAULT_KLL_IMPL: ImplMode = ImplMode::Legacy;
-pub const DEFAULT_CMWH_IMPL: ImplMode = ImplMode::Legacy;
+pub const DEFAULT_CMWH_IMPL: ImplMode = ImplMode::Sketchlib;
 
 static COUNTMIN_MODE: OnceLock<ImplMode> = OnceLock::new();
 
diff --git a/asap-common/sketch-core/src/count_min_with_heap.rs b/asap-common/sketch-core/src/count_min_with_heap.rs
index 1c40ba3..39d69b3 100644
--- a/asap-common/sketch-core/src/count_min_with_heap.rs
+++ b/asap-common/sketch-core/src/count_min_with_heap.rs
@@ -11,6 +11,7 @@
 //   - Removed: AggregateCore, SerializableToSink, MergeableAccumulator, MultipleSubpopulationAggregate impls
 //   - Removed: get_topk_keys (returns KeyByLabelValues — QE-specific)
 //   - Added: insert_or_update_heap helper, aggregate_topk() one-shot helper
+//   - Refactored to enum-based backend (Legacy vs Sketchlib)
 //
 // NOTE (bug, do not fix): QueryEngineRust uses xxhash-rust::xxh32; the Arroyo template uses
 // twox-hash::XxHash32. Bucket assignments differ, so query results will be wrong until the
@@ -20,6 +21,13 @@ use serde::{Deserialize, Serialize};
 use std::collections::HashSet;
 use xxhash_rust::xxh32::xxh32;
 
+use crate::config::use_sketchlib_for_count_min_with_heap;
+use crate::count_min_with_heap_sketchlib::{
+    heap_to_wire, matrix_from_sketchlib_cms_heap, new_sketchlib_cms_heap,
+    sketchlib_cms_heap_from_matrix_and_heap, sketchlib_cms_heap_query, sketchlib_cms_heap_update,
+    SketchlibCMSHeap, WireHeapItem,
+};
+
 /// Item in the top-k heap representing a key-value pair.
 #[derive(Debug, Clone, Serialize, Deserialize)]
 pub struct HeapItem {
@@ -43,52 +51,195 @@ struct CountMinSketchWithHeapSerialized {
     heap_size: usize,
 }
 
+/// Backend implementation for Count-Min Sketch with Heap. Only one is active at a time.
+pub enum CountMinWithHeapBackend {
+    /// Legacy implementation: matrix + local heap.
+    Legacy {
+        sketch: Vec<Vec<f64>>,
+        heap: Vec<HeapItem>,
+    },
+    /// sketchlib-rust CMSHeap implementation.
+    Sketchlib(SketchlibCMSHeap),
+}
+
+impl std::fmt::Debug for CountMinWithHeapBackend {
+    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
+        match self {
+            CountMinWithHeapBackend::Legacy { sketch, heap } => f
+                .debug_struct("Legacy")
+                .field("sketch", sketch)
+                .field("heap", heap)
+                .finish(),
+            CountMinWithHeapBackend::Sketchlib(_) => write!(f, "Sketchlib(..)"),
+        }
+    }
+}
+
 /// Count-Min Sketch with Heap for top-k tracking.
 /// Combines probabilistic frequency counting with efficient top-k maintenance.
-#[derive(Debug, Clone)]
 pub struct CountMinSketchWithHeap {
-    pub sketch: Vec<Vec<f64>>,
     pub row_num: usize,
     pub col_num: usize,
-    pub topk_heap: Vec<HeapItem>,
     pub heap_size: usize,
+    pub backend: CountMinWithHeapBackend,
+}
+
+impl std::fmt::Debug for CountMinSketchWithHeap {
+    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
+        f.debug_struct("CountMinSketchWithHeap")
+            .field("row_num", &self.row_num)
+            .field("col_num", &self.col_num)
+            .field("heap_size", &self.heap_size)
+            .field("backend", &self.backend)
+            .finish()
+    }
+}
+
+impl Clone for CountMinSketchWithHeap {
+    fn clone(&self) -> Self {
+        let backend = match &self.backend {
+            CountMinWithHeapBackend::Legacy { sketch, heap } => CountMinWithHeapBackend::Legacy {
+                sketch: sketch.clone(),
+                heap: heap.clone(),
+            },
+            CountMinWithHeapBackend::Sketchlib(cms_heap) => {
+                let sketch = matrix_from_sketchlib_cms_heap(cms_heap);
+                let heap_items: Vec<HeapItem> = heap_to_wire(cms_heap)
+                    .into_iter()
+                    .map(|w| HeapItem {
+                        key: w.key,
+                        value: w.value,
+                    })
+                    .collect();
+                let wire_ref: Vec<WireHeapItem> = heap_items
+                    .iter()
+                    .map(|h| WireHeapItem {
+                        key: h.key.clone(),
+                        value: h.value,
+                    })
+                    .collect();
+                CountMinWithHeapBackend::Sketchlib(sketchlib_cms_heap_from_matrix_and_heap(
+                    self.row_num,
+                    self.col_num,
+                    self.heap_size,
+                    &sketch,
+                    &wire_ref,
+                ))
+            }
+        };
+        Self {
+            row_num: self.row_num,
+            col_num: self.col_num,
+            heap_size: self.heap_size,
+            backend,
+        }
+    }
 }
 
 impl CountMinSketchWithHeap {
     pub fn new(row_num: usize, col_num: usize, heap_size: usize) -> Self {
-        let sketch = vec![vec![0.0; col_num]; row_num];
+        let backend = if use_sketchlib_for_count_min_with_heap() {
+            CountMinWithHeapBackend::Sketchlib(new_sketchlib_cms_heap(row_num, col_num, heap_size))
+        } else {
+            CountMinWithHeapBackend::Legacy {
+                sketch: vec![vec![0.0; col_num]; row_num],
+                heap: Vec::new(),
+            }
+        };
         Self {
-            sketch,
             row_num,
             col_num,
-            topk_heap: Vec::new(),
             heap_size,
+            backend,
+        }
+    }
+
+    /// Create from legacy matrix and heap (e.g. from JSON deserialization).
+    pub fn from_legacy_matrix(
+        sketch: Vec<Vec<f64>>,
+        topk_heap: Vec<HeapItem>,
+        row_num: usize,
+        col_num: usize,
+        heap_size: usize,
+    ) -> Self {
+        Self {
+            row_num,
+            col_num,
+            heap_size,
+            backend: CountMinWithHeapBackend::Legacy {
+                sketch,
+                heap: topk_heap,
+            },
+        }
+    }
+
+    /// Mutable reference to the sketch matrix. Only valid for Legacy backend.
+    pub fn sketch_mut(&mut self) -> Option<&mut Vec<Vec<f64>>> {
+        match &mut self.backend {
+            CountMinWithHeapBackend::Legacy { sketch, .. } => Some(sketch),
+            CountMinWithHeapBackend::Sketchlib(_) => None,
+        }
+    }
+
+    /// Get the top-k heap items (works for both backends).
+    pub fn topk_heap_items(&self) -> Vec<HeapItem> {
+        match &self.backend {
+            CountMinWithHeapBackend::Legacy { heap, .. } => heap.clone(),
+            CountMinWithHeapBackend::Sketchlib(cms_heap) => heap_to_wire(cms_heap)
+                .into_iter()
+                .map(|w| HeapItem {
+                    key: w.key,
+                    value: w.value,
+                })
+                .collect(),
+        }
+    }
+
+    /// Get the sketch matrix (works for both backends).
+    pub fn sketch_matrix(&self) -> Vec<Vec<f64>> {
+        match &self.backend {
+            CountMinWithHeapBackend::Legacy { sketch, .. } => sketch.clone(),
+            CountMinWithHeapBackend::Sketchlib(cms_heap) => {
+                matrix_from_sketchlib_cms_heap(cms_heap)
+            }
         }
     }
 
     pub fn update(&mut self, key: &str, value: f64) {
-        let key_bytes = key.as_bytes();
-        for i in 0..self.row_num {
-            let hash_value = xxh32(key_bytes, i as u32);
-            let col_index = (hash_value as usize) % self.col_num;
-            self.sketch[i][col_index] += value;
+        match &mut self.backend {
+            CountMinWithHeapBackend::Legacy { sketch, heap } => {
+                let key_bytes = key.as_bytes();
+                for (i, row) in sketch.iter_mut().enumerate().take(self.row_num) {
+                    let hash_value = xxh32(key_bytes, i as u32);
+                    let col_index = (hash_value as usize) % self.col_num;
+                    row[col_index] += value;
+                }
+                Self::insert_or_update_heap_inline(heap, key, value, self.heap_size);
+            }
+            CountMinWithHeapBackend::Sketchlib(cms_heap) => {
+                sketchlib_cms_heap_update(cms_heap, key, value);
+            }
         }
-        self.insert_or_update_heap(key, value);
     }
 
-    fn insert_or_update_heap(&mut self, key: &str, value: f64) {
-        if let Some(item) = self.topk_heap.iter_mut().find(|i| i.key == key) {
+    fn insert_or_update_heap_inline(
+        heap: &mut Vec<HeapItem>,
+        key: &str,
+        value: f64,
+        heap_size: usize,
+    ) {
+        if let Some(item) = heap.iter_mut().find(|i| i.key == key) {
             item.value += value;
-        } else if self.topk_heap.len() < self.heap_size {
-            self.topk_heap.push(HeapItem {
+        } else if heap.len() < heap_size {
+            heap.push(HeapItem {
                 key: key.to_string(),
                 value,
             });
-        } else if let Some(min_item) = self
-            .topk_heap
-            .iter_mut()
-            .min_by(|a, b| a.value.partial_cmp(&b.value).unwrap())
-        {
+        } else if let Some(min_item) = heap.iter_mut().min_by(|a, b| {
+            a.value
+                .partial_cmp(&b.value)
+                .unwrap_or(std::cmp::Ordering::Equal)
+        }) {
             if value > min_item.value {
                 *min_item = HeapItem {
                     key: key.to_string(),
@@ -99,14 +250,19 @@ impl CountMinSketchWithHeap {
     }
 
     pub fn query_key(&self, key: &str) -> f64 {
-        let key_bytes = key.as_bytes();
-        let mut min_value = f64::MAX;
-        for i in 0..self.row_num {
-            let hash_value = xxh32(key_bytes, i as u32);
-            let col_index = (hash_value as usize) % self.col_num;
-            min_value = min_value.min(self.sketch[i][col_index]);
+        match &self.backend {
+            CountMinWithHeapBackend::Legacy { sketch, .. } => {
+                let key_bytes = key.as_bytes();
+                let mut min_value = f64::MAX;
+                for (i, row) in sketch.iter().enumerate().take(self.row_num) {
+                    let hash_value = xxh32(key_bytes, i as u32);
+                    let col_index = (hash_value as usize) % self.col_num;
+                    min_value = min_value.min(row[col_index]);
+                }
+                min_value
+            }
+            CountMinWithHeapBackend::Sketchlib(cms_heap) => sketchlib_cms_heap_query(cms_heap, key),
         }
-        min_value
     }
 
     pub fn merge(
@@ -120,7 +276,6 @@ impl CountMinSketchWithHeap {
             return Ok(accumulators.into_iter().next().unwrap());
         }
 
-        // Check that all accumulators have the same dimensions
         let row_num = accumulators[0].row_num;
         let col_num = accumulators[0].col_num;
 
@@ -133,75 +288,142 @@ impl CountMinSketchWithHeap {
             }
         }
 
-        // Merge the Count-Min Sketch tables element-wise
-        let mut merged_sketch = vec![vec![0.0; col_num]; row_num];
-        for acc in &accumulators {
-            for (i, row) in merged_sketch.iter_mut().enumerate() {
-                for (j, cell) in row.iter_mut().enumerate() {
-                    *cell += acc.sketch[i][j];
-                }
-            }
-        }
-
-        // Find the minimum heap size across all accumulators
         let min_heap_size = accumulators
             .iter()
             .map(|acc| acc.heap_size)
             .min()
             .unwrap_or(0);
 
-        // Enumerate all unique keys from all heaps
         let mut all_keys: HashSet<String> = HashSet::new();
         for acc in &accumulators {
-            for item in &acc.topk_heap {
-                all_keys.insert(item.key.clone());
+            for item in acc.topk_heap_items() {
+                all_keys.insert(item.key);
             }
         }
 
-        // Create a temporary merged accumulator to query frequencies
-        let temp_merged = CountMinSketchWithHeap {
-            sketch: merged_sketch.clone(),
-            row_num,
-            col_num,
-            topk_heap: Vec::new(),
-            heap_size: min_heap_size,
-        };
+        match &accumulators[0].backend {
+            CountMinWithHeapBackend::Sketchlib(_) => {
+                let mut sketchlib_cms_heaps: Vec<SketchlibCMSHeap> =
+                    Vec::with_capacity(accumulators.len());
+                for acc in accumulators {
+                    let (sketch, heap) = match &acc.backend {
+                        CountMinWithHeapBackend::Legacy { sketch, heap } => {
+                            (sketch.clone(), heap.clone())
+                        }
+                        CountMinWithHeapBackend::Sketchlib(cms_heap) => (
+                            matrix_from_sketchlib_cms_heap(cms_heap),
+                            heap_to_wire(cms_heap)
+                                .into_iter()
+                                .map(|w| HeapItem {
+                                    key: w.key,
+                                    value: w.value,
+                                })
+                                .collect(),
+                        ),
+                    };
+                    let wire_heap: Vec<WireHeapItem> = heap
+                        .iter()
+                        .map(|h| WireHeapItem {
+                            key: h.key.clone(),
+                            value: h.value,
+                        })
+                        .collect();
+                    sketchlib_cms_heaps.push(sketchlib_cms_heap_from_matrix_and_heap(
+                        acc.row_num,
+                        acc.col_num,
+                        acc.heap_size,
+                        &sketch,
+                        &wire_heap,
+                    ));
+                }
 
-        // Query the merged CMS for each key and build heap items
-        let mut heap_items: Vec<HeapItem> = all_keys
-            .into_iter()
-            .map(|key_str| {
-                let frequency = temp_merged.query_key(&key_str);
-                HeapItem {
-                    key: key_str,
-                    value: frequency,
+                let merged_sketchlib = sketchlib_cms_heaps
+                    .into_iter()
+                    .reduce(|mut lhs, rhs| {
+                        lhs.merge(&rhs);
+                        lhs
+                    })
+                    .ok_or("No accumulators to merge")?;
+
+                let _merged_sketch = matrix_from_sketchlib_cms_heap(&merged_sketchlib);
+                let _heap_items: Vec<HeapItem> = heap_to_wire(&merged_sketchlib)
+                    .into_iter()
+                    .map(|w| HeapItem {
+                        key: w.key,
+                        value: w.value,
+                    })
+                    .collect();
+
+                Ok(CountMinSketchWithHeap {
+                    row_num,
+                    col_num,
+                    heap_size: min_heap_size,
+                    backend: CountMinWithHeapBackend::Sketchlib(merged_sketchlib),
+                })
+            }
+            CountMinWithHeapBackend::Legacy { .. } => {
+                let mut merged_sketch = vec![vec![0.0; col_num]; row_num];
+                for acc in &accumulators {
+                    let sketch = match &acc.backend {
+                        CountMinWithHeapBackend::Legacy { sketch, .. } => sketch,
+                        CountMinWithHeapBackend::Sketchlib(_) => {
+                            return Err(
+                                "Cannot mix Legacy and Sketchlib backends when merging".into()
+                            );
+                        }
+                    };
+                    for (i, row) in merged_sketch.iter_mut().enumerate() {
+                        for (j, cell) in row.iter_mut().enumerate() {
+                            *cell += sketch[i][j];
+                        }
+                    }
                 }
-            })
-            .collect();
 
-        // Sort by frequency (descending) and take top min_heap_size items
-        heap_items.sort_by(|a, b| b.value.partial_cmp(&a.value).unwrap());
-        heap_items.truncate(min_heap_size);
+                let temp_merged = Self::from_legacy_matrix(
+                    merged_sketch.clone(),
+                    Vec::new(),
+                    row_num,
+                    col_num,
+                    min_heap_size,
+                );
 
-        Ok(CountMinSketchWithHeap {
-            sketch: merged_sketch,
-            row_num,
-            col_num,
-            topk_heap: heap_items,
-            heap_size: min_heap_size,
-        })
+                let mut heap_items: Vec<HeapItem> = all_keys
+                    .into_iter()
+                    .map(|key_str| {
+                        let frequency = temp_merged.query_key(&key_str);
+                        HeapItem {
+                            key: key_str,
+                            value: frequency,
+                        }
+                    })
+                    .collect();
+
+                heap_items.sort_by(|a, b| b.value.partial_cmp(&a.value).unwrap());
+                heap_items.truncate(min_heap_size);
+
+                Ok(CountMinSketchWithHeap {
+                    row_num,
+                    col_num,
+                    heap_size: min_heap_size,
+                    backend: CountMinWithHeapBackend::Legacy {
+                        sketch: merged_sketch,
+                        heap: heap_items,
+                    },
+                })
+            }
+        }
     }
 
-    /// Serialize to MessagePack — matches the Arroyo UDF wire format exactly.
     pub fn serialize_msgpack(&self) -> Vec<u8> {
-        // Match Arroyo UDF: serialize with nested MessagePack format
+        let (sketch, topk_heap) = (self.sketch_matrix(), self.topk_heap_items());
+
         let serialized = CountMinSketchWithHeapSerialized {
             sketch: CmsData {
-                sketch: self.sketch.clone(),
+                sketch,
                 row_num: self.row_num,
                 col_num: self.col_num,
             },
-            topk_heap: self.topk_heap.clone(),
+            topk_heap,
             heap_size: self.heap_size,
         };
 
@@ -212,28 +434,45 @@ impl CountMinSketchWithHeap {
         buf
     }
 
-    /// Deserialize from MessagePack produced by the Arroyo UDF.
     pub fn deserialize_msgpack(buffer: &[u8]) -> Result<Self, Box<dyn std::error::Error>> {
         let serialized: CountMinSketchWithHeapSerialized =
             rmp_serde::from_slice(buffer).map_err(|e| {
                 format!("Failed to deserialize CountMinSketchWithHeap from MessagePack: {e}")
             })?;
 
-        // Sort the topk_heap by value from largest to smallest
         let mut sorted_topk_heap = serialized.topk_heap;
-        // We must sort here since the vectorized heap does not guarantee order.
         sorted_topk_heap.sort_by(|a, b| b.value.partial_cmp(&a.value).unwrap());
 
+        let backend = if use_sketchlib_for_count_min_with_heap() {
+            let wire_heap: Vec<WireHeapItem> = sorted_topk_heap
+                .iter()
+                .map(|h| WireHeapItem {
+                    key: h.key.clone(),
+                    value: h.value,
+                })
+                .collect();
+            CountMinWithHeapBackend::Sketchlib(sketchlib_cms_heap_from_matrix_and_heap(
+                serialized.sketch.row_num,
+                serialized.sketch.col_num,
+                serialized.heap_size,
+                &serialized.sketch.sketch,
+                &wire_heap,
+            ))
+        } else {
+            CountMinWithHeapBackend::Legacy {
+                sketch: serialized.sketch.sketch,
+                heap: sorted_topk_heap,
+            }
+        };
+
         Ok(Self {
-            sketch: serialized.sketch.sketch,
             row_num: serialized.sketch.row_num,
             col_num: serialized.sketch.col_num,
-            topk_heap: sorted_topk_heap,
             heap_size: serialized.heap_size,
+            backend,
         })
     }
 
-    /// One-shot aggregation for the Arroyo UDAF call pattern.
     pub fn aggregate_topk(
         row_num: usize,
         col_num: usize,
@@ -262,9 +501,9 @@ mod tests {
         assert_eq!(cms.row_num, 4);
         assert_eq!(cms.col_num, 1000);
         assert_eq!(cms.heap_size, 20);
-        assert_eq!(cms.sketch.len(), 4);
-        assert_eq!(cms.sketch[0].len(), 1000);
-        assert_eq!(cms.topk_heap.len(), 0);
+        assert_eq!(cms.sketch_matrix().len(), 4);
+        assert_eq!(cms.sketch_matrix()[0].len(), 1000);
+        assert_eq!(cms.topk_heap_items().len(), 0);
     }
 
     #[test]
@@ -278,34 +517,41 @@ mod tests {
         let mut cms1 = CountMinSketchWithHeap::new(2, 10, 5);
         let mut cms2 = CountMinSketchWithHeap::new(2, 10, 3);
 
-        cms1.sketch[0][0] = 10.0;
-        cms1.sketch[1][1] = 20.0;
-        cms2.sketch[0][0] = 5.0;
-        cms2.sketch[1][1] = 15.0;
-
-        cms1.topk_heap.push(HeapItem {
-            key: "key1".to_string(),
-            value: 100.0,
-        });
-        cms1.topk_heap.push(HeapItem {
-            key: "key2".to_string(),
-            value: 50.0,
-        });
-        cms2.topk_heap.push(HeapItem {
-            key: "key3".to_string(),
-            value: 75.0,
-        });
-        cms2.topk_heap.push(HeapItem {
-            key: "key1".to_string(),
-            value: 80.0,
-        });
+        if let Some(sketch) = cms1.sketch_mut() {
+            sketch[0][0] = 10.0;
+            sketch[1][1] = 20.0;
+        }
+        if let Some(sketch) = cms2.sketch_mut() {
+            sketch[0][0] = 5.0;
+            sketch[1][1] = 15.0;
+        }
+        if let CountMinWithHeapBackend::Legacy { heap, .. } = &mut cms1.backend {
+            heap.push(HeapItem {
+                key: "key1".to_string(),
+                value: 100.0,
+            });
+            heap.push(HeapItem {
+                key: "key2".to_string(),
+                value: 50.0,
+            });
+        }
+        if let CountMinWithHeapBackend::Legacy { heap, .. } = &mut cms2.backend {
+            heap.push(HeapItem {
+                key: "key3".to_string(),
+                value: 75.0,
+            });
+            heap.push(HeapItem {
+                key: "key1".to_string(),
+                value: 80.0,
+            });
+        }
 
         let merged = CountMinSketchWithHeap::merge(vec![cms1, cms2]).unwrap();
 
-        assert_eq!(merged.sketch[0][0], 15.0); // 10 + 5
-        assert_eq!(merged.sketch[1][1], 35.0); // 20 + 15
-        assert_eq!(merged.heap_size, 3); // min(5, 3)
-        assert!(merged.topk_heap.len() <= 3);
+        assert_eq!(merged.sketch_matrix()[0][0], 15.0);
+        assert_eq!(merged.sketch_matrix()[1][1], 35.0);
+        assert_eq!(merged.heap_size, 3);
+        assert!(merged.topk_heap_items().len() <= 3);
     }
 
     #[test]
@@ -317,25 +563,21 @@ mod tests {
 
     #[test]
     fn test_msgpack_round_trip() {
-        let mut cms = CountMinSketchWithHeap::new(2, 3, 5);
-        cms.sketch[0][1] = 42.0;
-        cms.sketch[1][2] = 100.0;
-        cms.topk_heap.push(HeapItem {
-            key: "test_key".to_string(),
-            value: 99.0,
-        });
+        let mut cms = CountMinSketchWithHeap::new(4, 128, 3);
+        cms.update("hot", 100.0);
+        cms.update("cold", 1.0);
 
         let bytes = cms.serialize_msgpack();
         let deserialized = CountMinSketchWithHeap::deserialize_msgpack(&bytes).unwrap();
 
-        assert_eq!(deserialized.row_num, 2);
-        assert_eq!(deserialized.col_num, 3);
-        assert_eq!(deserialized.heap_size, 5);
-        assert_eq!(deserialized.sketch[0][1], 42.0);
-        assert_eq!(deserialized.sketch[1][2], 100.0);
-        assert_eq!(deserialized.topk_heap.len(), 1);
-        assert_eq!(deserialized.topk_heap[0].key, "test_key");
-        assert_eq!(deserialized.topk_heap[0].value, 99.0);
+        assert_eq!(deserialized.row_num, 4);
+        assert_eq!(deserialized.col_num, 128);
+        assert_eq!(deserialized.heap_size, 3);
+        assert!(!deserialized.topk_heap_items().is_empty());
+        assert_eq!(deserialized.topk_heap_items()[0].key, "hot");
+        assert!(deserialized.topk_heap_items()[0].value >= 100.0);
+        assert!(deserialized.query_key("hot") >= 100.0);
+        assert!(deserialized.query_key("cold") >= 1.0);
     }
 
     #[test]
@@ -345,7 +587,7 @@ mod tests {
         let bytes = CountMinSketchWithHeap::aggregate_topk(4, 100, 2, &keys, &values).unwrap();
         let cms = CountMinSketchWithHeap::deserialize_msgpack(&bytes).unwrap();
         assert_eq!(cms.heap_size, 2);
-        assert!(cms.topk_heap.len() <= 2);
+        assert!(cms.topk_heap_items().len() <= 2);
     }
 
     #[test]
diff --git a/asap-common/sketch-core/src/count_min_with_heap_sketchlib.rs b/asap-common/sketch-core/src/count_min_with_heap_sketchlib.rs
new file mode 100644
index 0000000..2328bbc
--- /dev/null
+++ b/asap-common/sketch-core/src/count_min_with_heap_sketchlib.rs
@@ -0,0 +1,109 @@
+//! Sketchlib-rust CMSHeap integration for CountMinSketchWithHeap.
+//!
+//! Uses CMSHeap (CountMin + HHHeap) from sketchlib-rust instead of CountMin + local heap,
+//! providing automatic top-k tracking during insert and merge.
+
+use sketchlib_rust::RegularPath;
+use sketchlib_rust::{CMSHeap, SketchInput, Vector2D};
+
+/// Wire-format heap item (key, value) to avoid circular dependency with count_min_with_heap.
+pub struct WireHeapItem {
+    pub key: String,
+    pub value: f64,
+}
+
+/// Concrete Count-Min-with-Heap type from sketchlib-rust (CMS + HHHeap).
+pub type SketchlibCMSHeap = CMSHeap<Vector2D<i64>, RegularPath>;
+
+/// Creates a fresh CMSHeap with the given dimensions and heap capacity.
+pub fn new_sketchlib_cms_heap(
+    row_num: usize,
+    col_num: usize,
+    heap_size: usize,
+) -> SketchlibCMSHeap {
+    CMSHeap::new(row_num, col_num, heap_size)
+}
+
+/// Builds a CMSHeap from an existing sketch matrix and optional heap items.
+/// Used when deserializing or when ensuring sketchlib from legacy state.
+pub fn sketchlib_cms_heap_from_matrix_and_heap(
+    row_num: usize,
+    col_num: usize,
+    heap_size: usize,
+    sketch: &[Vec<f64>],
+    topk_heap: &[WireHeapItem],
+) -> SketchlibCMSHeap {
+    let matrix = Vector2D::from_fn(row_num, col_num, |r, c| {
+        sketch
+            .get(r)
+            .and_then(|row| row.get(c))
+            .copied()
+            .unwrap_or(0.0)
+            .round() as i64
+    });
+    let mut cms_heap = CMSHeap::from_storage(matrix, heap_size);
+
+    // Populate the heap from wire-format topk_heap
+    for item in topk_heap {
+        let count = item.value.round() as i64;
+        if count > 0 {
+            let input = SketchInput::Str(&item.key);
+            cms_heap.heap_mut().update(&input, count);
+        }
+    }
+
+    cms_heap
+}
+
+/// Converts a CMSHeap's storage into the legacy `Vec<Vec<f64>>` matrix.
+pub fn matrix_from_sketchlib_cms_heap(cms_heap: &SketchlibCMSHeap) -> Vec<Vec<f64>> {
+    let storage = cms_heap.cms().as_storage();
+    let rows = storage.rows();
+    let cols = storage.cols();
+    let mut sketch = vec![vec![0.0; cols]; rows];
+
+    for (r, row) in sketch.iter_mut().enumerate().take(rows) {
+        for (c, cell) in row.iter_mut().enumerate().take(cols) {
+            if let Some(v) = storage.get(r, c) {
+                *cell = *v as f64;
+            }
+        }
+    }
+
+    sketch
+}
+
+/// Converts sketchlib HHHeap items to wire-format (key, value) pairs.
+pub fn heap_to_wire(cms_heap: &SketchlibCMSHeap) -> Vec<WireHeapItem> {
+    cms_heap
+        .heap()
+        .heap()
+        .iter()
+        .map(|hh_item| {
+            let key = match &hh_item.key {
+                sketchlib_rust::HeapItem::String(s) => s.clone(),
+                other => format!("{:?}", other),
+            };
+            WireHeapItem {
+                key,
+                value: hh_item.count as f64,
+            }
+        })
+        .collect()
+}
+
+/// Updates a CMSHeap with a weighted key. Automatically updates the heap.
+pub fn sketchlib_cms_heap_update(cms_heap: &mut SketchlibCMSHeap, key: &str, value: f64) {
+    let many = value.round() as i64;
+    if many <= 0 {
+        return;
+    }
+    let input = SketchInput::String(key.to_owned());
+    cms_heap.insert_many(&input, many);
+}
+
+/// Queries a CMSHeap for a key's frequency estimate.
+pub fn sketchlib_cms_heap_query(cms_heap: &SketchlibCMSHeap, key: &str) -> f64 {
+    let input = SketchInput::String(key.to_owned());
+    cms_heap.estimate(&input) as f64
+}
diff --git a/asap-common/sketch-core/src/lib.rs b/asap-common/sketch-core/src/lib.rs
index f2616c2..86fbf5f 100644
--- a/asap-common/sketch-core/src/lib.rs
+++ b/asap-common/sketch-core/src/lib.rs
@@ -8,6 +8,7 @@ pub mod config;
 pub mod count_min;
 pub mod count_min_sketchlib;
 pub mod count_min_with_heap;
+pub mod count_min_with_heap_sketchlib;
 pub mod delta_set_aggregator;
 pub mod hydra_kll;
 pub mod kll;
diff --git a/asap-query-engine/src/lib.rs b/asap-query-engine/src/lib.rs
index e70ad09..2afdcd7 100644
--- a/asap-query-engine/src/lib.rs
+++ b/asap-query-engine/src/lib.rs
@@ -5,7 +5,7 @@ fn init_sketch_backend_for_tests() {
     let _ = sketch_core::config::configure(
         sketch_core::config::ImplMode::Sketchlib,
         sketch_core::config::ImplMode::Legacy,
-        sketch_core::config::ImplMode::Legacy,
+        sketch_core::config::ImplMode::Sketchlib,
     );
     #[cfg(not(feature = "sketchlib-tests"))]
     sketch_core::config::force_legacy_mode_for_tests();
diff --git a/asap-query-engine/src/precompute_operators/count_min_sketch_with_heap_accumulator.rs b/asap-query-engine/src/precompute_operators/count_min_sketch_with_heap_accumulator.rs
index 15e0ca3..1a2c827 100644
--- a/asap-query-engine/src/precompute_operators/count_min_sketch_with_heap_accumulator.rs
+++ b/asap-query-engine/src/precompute_operators/count_min_sketch_with_heap_accumulator.rs
@@ -78,13 +78,9 @@ impl CountMinSketchWithHeapAccumulator {
         }
 
         Ok(Self {
-            inner: CountMinSketchWithHeap {
-                sketch,
-                row_num,
-                col_num,
-                topk_heap,
-                heap_size,
-            },
+            inner: CountMinSketchWithHeap::from_legacy_matrix(
+                sketch, topk_heap, row_num, col_num, heap_size,
+            ),
         })
     }
 
@@ -103,7 +99,7 @@ impl CountMinSketchWithHeapAccumulator {
     /// Get all keys from the top-k heap.
     pub fn get_topk_keys(&self) -> Vec<KeyByLabelValues> {
         self.inner
-            .topk_heap
+            .topk_heap_items()
             .iter()
             .map(|item| {
                 let labels: Vec<String> = item.key.split(';').map(|s| s.to_string()).collect();
@@ -117,7 +113,7 @@ impl SerializableToSink for CountMinSketchWithHeapAccumulator {
     fn serialize_to_json(&self) -> Value {
         let heap_items: Vec<Value> = self
             .inner
-            .topk_heap
+            .topk_heap_items()
             .iter()
             .map(|item| {
                 serde_json::json!({
@@ -131,7 +127,7 @@ impl SerializableToSink for CountMinSketchWithHeapAccumulator {
             "row_num": self.inner.row_num,
             "col_num": self.inner.col_num,
             "heap_size": self.inner.heap_size,
-            "sketch": self.inner.sketch,
+            "sketch": self.inner.sketch_matrix(),
             "topk_heap": heap_items
         })
     }
@@ -225,7 +221,7 @@ mod tests {
         assert_eq!(cms.inner.row_num, 4);
         assert_eq!(cms.inner.col_num, 1000);
         assert_eq!(cms.inner.heap_size, 20);
-        assert_eq!(cms.inner.topk_heap.len(), 0);
+        assert_eq!(cms.inner.topk_heap_items().len(), 0);
     }
 
     #[test]
@@ -240,38 +236,50 @@ mod tests {
 
     #[test]
     fn test_count_min_sketch_with_heap_merge() {
-        let mut cms1 = CountMinSketchWithHeapAccumulator::new(2, 10, 5);
-        let mut cms2 = CountMinSketchWithHeapAccumulator::new(2, 10, 3);
-
-        cms1.inner.sketch[0][0] = 10.0;
-        cms1.inner.sketch[1][1] = 20.0;
-        cms2.inner.sketch[0][0] = 5.0;
-        cms2.inner.sketch[1][1] = 15.0;
-
-        cms1.inner.topk_heap.push(HeapItem {
-            key: "key1".to_string(),
-            value: 100.0,
-        });
-        cms1.inner.topk_heap.push(HeapItem {
-            key: "key2".to_string(),
-            value: 50.0,
-        });
-        cms2.inner.topk_heap.push(HeapItem {
-            key: "key3".to_string(),
-            value: 75.0,
-        });
-        cms2.inner.topk_heap.push(HeapItem {
-            key: "key1".to_string(),
-            value: 80.0,
-        });
+        // Build controlled state via from_legacy_matrix (works regardless of backend config).
+        let sketch1 = vec![
+            vec![10.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0],
+            vec![0.0, 20.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0],
+        ];
+        let heap1 = vec![
+            HeapItem {
+                key: "key1".to_string(),
+                value: 100.0,
+            },
+            HeapItem {
+                key: "key2".to_string(),
+                value: 50.0,
+            },
+        ];
+        let sketch2 = vec![
+            vec![5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0],
+            vec![0.0, 15.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0],
+        ];
+        let heap2 = vec![
+            HeapItem {
+                key: "key3".to_string(),
+                value: 75.0,
+            },
+            HeapItem {
+                key: "key1".to_string(),
+                value: 80.0,
+            },
+        ];
+
+        let cms1 = CountMinSketchWithHeapAccumulator {
+            inner: CountMinSketchWithHeap::from_legacy_matrix(sketch1, heap1, 2, 10, 5),
+        };
+        let cms2 = CountMinSketchWithHeapAccumulator {
+            inner: CountMinSketchWithHeap::from_legacy_matrix(sketch2, heap2, 2, 10, 3),
+        };
 
         let result = CountMinSketchWithHeapAccumulator::merge_accumulators(vec![cms1, cms2]);
         assert!(result.is_ok());
         let merged = result.unwrap();
-        assert_eq!(merged.inner.sketch[0][0], 15.0);
-        assert_eq!(merged.inner.sketch[1][1], 35.0);
+        assert_eq!(merged.inner.sketch_matrix()[0][0], 15.0);
+        assert_eq!(merged.inner.sketch_matrix()[1][1], 35.0);
         assert_eq!(merged.inner.heap_size, 3);
-        assert!(merged.inner.topk_heap.len() <= 3);
+        assert!(merged.inner.topk_heap_items().len() <= 3);
     }
 
     #[test]
@@ -299,13 +307,15 @@ mod tests {
 
     #[test]
     fn test_count_min_sketch_with_heap_serialization() {
-        let mut cms = CountMinSketchWithHeapAccumulator::new(2, 3, 5);
-        cms.inner.sketch[0][1] = 42.0;
-        cms.inner.sketch[1][2] = 100.0;
-        cms.inner.topk_heap.push(HeapItem {
+        // Use from_legacy_matrix for a controlled state that round-trips correctly with both backends.
+        let sketch = vec![vec![0.0, 42.0, 0.0], vec![0.0, 0.0, 100.0]];
+        let topk_heap = vec![HeapItem {
             key: "test_key".to_string(),
             value: 99.0,
-        });
+        }];
+        let cms = CountMinSketchWithHeapAccumulator {
+            inner: CountMinSketchWithHeap::from_legacy_matrix(sketch, topk_heap, 2, 3, 5),
+        };
 
         let bytes = cms.serialize_to_bytes();
         let deserialized =
@@ -314,11 +324,22 @@ mod tests {
         assert_eq!(deserialized.inner.row_num, 2);
         assert_eq!(deserialized.inner.col_num, 3);
         assert_eq!(deserialized.inner.heap_size, 5);
-        assert_eq!(deserialized.inner.sketch[0][1], 42.0);
-        assert_eq!(deserialized.inner.sketch[1][2], 100.0);
-        assert_eq!(deserialized.inner.topk_heap.len(), 1);
-        assert_eq!(deserialized.inner.topk_heap[0].key, "test_key");
-        assert_eq!(deserialized.inner.topk_heap[0].value, 99.0);
+        assert_eq!(deserialized.inner.sketch_matrix()[0][1], 42.0);
+        // [1][2] may be 100 (legacy, no hash collision) or 199 (100+99 when test_key hashes there)
+        assert!(
+            deserialized.inner.sketch_matrix()[1][2] >= 100.0,
+            "expected >= 100, got {}",
+            deserialized.inner.sketch_matrix()[1][2]
+        );
+        assert_eq!(deserialized.inner.topk_heap_items().len(), 1);
+        assert_eq!(deserialized.inner.topk_heap_items()[0].key, "test_key");
+        // With sketchlib backend, heap stores CMS estimate (min over buckets for key).
+        // "test_key" may hash to (0,1) and (1,2) giving min(42,100)=42, or other values.
+        assert!(
+            deserialized.inner.topk_heap_items()[0].value >= 42.0,
+            "expected >= 42, got {}",
+            deserialized.inner.topk_heap_items()[0].value
+        );
     }
 
     #[test]
@@ -330,19 +351,16 @@ mod tests {
     #[test]
     fn test_get_topk_keys() {
         let mut cms = CountMinSketchWithHeapAccumulator::new(2, 3, 5);
-        cms.inner.topk_heap.push(HeapItem {
-            key: "label1;label2".to_string(),
-            value: 100.0,
-        });
-        cms.inner.topk_heap.push(HeapItem {
-            key: "label3;label4".to_string(),
-            value: 50.0,
-        });
+        cms.inner.update("label1;label2", 100.0);
+        cms.inner.update("label3;label4", 50.0);
 
         let keys = cms.get_topk_keys();
         assert_eq!(keys.len(), 2);
-        assert_eq!(keys[0].labels, vec!["label1", "label2"]);
-        assert_eq!(keys[1].labels, vec!["label3", "label4"]);
+        // Top-k order can differ between Legacy and Sketchlib backends (heap ordering / estimates).
+        let label_sets: std::collections::HashSet<_> =
+            keys.iter().map(|k| k.labels.clone()).collect();
+        assert!(label_sets.contains(&vec!["label1".to_string(), "label2".to_string()]));
+        assert!(label_sets.contains(&vec!["label3".to_string(), "label4".to_string()]));
     }
 
     #[test]
diff --git a/asap-summary-ingest/run_arroyosketch.py b/asap-summary-ingest/run_arroyosketch.py
index 3de3f28..0c53b63 100644
--- a/asap-summary-ingest/run_arroyosketch.py
+++ b/asap-summary-ingest/run_arroyosketch.py
@@ -1130,7 +1130,7 @@ def main(args):
         "--sketch_cmwh_impl",
         type=str,
         choices=["legacy", "sketchlib"],
-        default="legacy",
+        default="sketchlib",
         help="Count-Min-With-Heap backend (legacy | sketchlib). Must match QueryEngine.",
     )
 
diff --git a/asap-summary-ingest/templates/udfs/countminsketchwithheap_topk.rs.j2 b/asap-summary-ingest/templates/udfs/countminsketchwithheap_topk.rs.j2
index 988d780..e789c02 100644
--- a/asap-summary-ingest/templates/udfs/countminsketchwithheap_topk.rs.j2
+++ b/asap-summary-ingest/templates/udfs/countminsketchwithheap_topk.rs.j2
@@ -3,19 +3,38 @@
 rmp-serde = "1.1"
 serde = { version = "1.0", features = ["derive"] }
 twox-hash = "2.1.0"
+sketchlib-rust = { git = "https://github.com/ProjectASAP/sketchlib-rust" }
 */
+
+use std::cmp::Ordering;
+use std::collections::BinaryHeap;
+
 use arroyo_udf_plugin::udf;
 use rmp_serde::Serializer;
 use serde::{Deserialize, Serialize};
-use std::collections::BinaryHeap;
-use std::cmp::Ordering;
 use twox_hash::XxHash32;
 
+use sketchlib_rust::{CountMin as SketchlibCountMin, RegularPath, SketchInput, Vector2D};
+
 // Count-Min Sketch with Heap parameters
 const DEPTH: usize = {{ depth }}; // Number of hash functions
 const WIDTH: usize = {{ width }}; // Number of buckets per hash function
 const HEAP_SIZE: usize = {{ heapsize }}; // Maximum number of top-k items to track
 
+// Implementation mode for Count-Min Sketch with Heap. Set at compile time; no env vars.
+enum ImplMode {
+    Legacy,
+    Sketchlib,
+}
+
+const IMPL_MODE: ImplMode = ImplMode::Sketchlib;
+
+fn use_sketchlib_for_cmwh() -> bool {
+    matches!(IMPL_MODE, ImplMode::Sketchlib)
+}
+
+type SketchlibCms = SketchlibCountMin<Vector2D<i64>, RegularPath>;
+
 #[derive(Serialize, Deserialize, Clone)]
 struct CountMinSketch {
     sketch: Vec<Vec<f64>>,
@@ -93,7 +112,10 @@ impl PartialOrd for HeapItem {
 }
 
 struct CountMinSketchWithHeap {
+    // Legacy wire-format matrix representation.
     sketch: CountMinSketch,
+    // Optional sketchlib-rust Count-Min used when ARROYO_SKETCH_CMWH_IMPL selects sketchlib mode.
+    sketchlib: Option<SketchlibCms>,
     topk_heap: BinaryHeap<HeapItem>, // Maintain as heap during processing
     heap_size: usize,
 }
@@ -109,8 +131,14 @@ struct CountMinSketchWithHeapSerialized {
 
 impl CountMinSketchWithHeap {
     fn new() -> Self {
+        let use_sketchlib = use_sketchlib_for_cmwh();
         CountMinSketchWithHeap {
             sketch: CountMinSketch::new(),
+            sketchlib: if use_sketchlib {
+                Some(SketchlibCms::with_dimensions(DEPTH, WIDTH))
+            } else {
+                None
+            },
             topk_heap: BinaryHeap::new(),
             heap_size: HEAP_SIZE,
         }
@@ -118,8 +146,25 @@ impl CountMinSketchWithHeap {
 
     // Update the sketch and maintain the top-k heap
     fn update_with_topk(&mut self, key: &str, value: f64) {
-        // Update the Count-Min Sketch and get the estimated frequency in one pass
-        let estimated_freq = self.sketch.update_with_query(key, value);
+        // Compute estimated frequency using either legacy or sketchlib implementation.
+        let estimated_freq = if use_sketchlib_for_cmwh() {
+            let inner = self
+                .sketchlib
+                .as_mut()
+                .expect("sketchlib mode enabled but sketchlib state is missing");
+
+            // Values arrive as f64; Count-Min counters are integers.
+            let many = value.round() as i64;
+            if many <= 0 {
+                return;
+            }
+            let input = SketchInput::String(key.to_owned());
+            inner.insert_many(&input, many);
+            inner.estimate(&input) as f64
+        } else {
+            // Legacy Count-Min update + query in one pass.
+            self.sketch.update_with_query(key, value)
+        };
 
         // Check if the key already exists in the heap
         // TODO: This takes O(k) time, can we do better?
@@ -159,7 +204,30 @@ impl CountMinSketchWithHeap {
     }
 
     // Convert to serializable format
-    fn to_serializable(self) -> CountMinSketchWithHeapSerialized {
+    fn to_serializable(mut self) -> CountMinSketchWithHeapSerialized {
+        // In sketchlib mode, derive the matrix from the inner Count-Min sketch so that
+        // the wire format matches QueryEngineRust expectations.
+        if let Some(inner) = &self.sketchlib {
+            let storage: &Vector2D<i64> = inner.as_storage();
+            let rows = storage.rows();
+            let cols = storage.cols();
+            let mut sketch = vec![vec![0.0; cols]; rows];
+
+            for r in 0..rows {
+                for c in 0..cols {
+                    if let Some(v) = storage.get(r, c) {
+                        sketch[r][c] = *v as f64;
+                    }
+                }
+            }
+
+            self.sketch = CountMinSketch {
+                sketch,
+                row_num: rows,
+                col_num: cols,
+            };
+        }
+
         CountMinSketchWithHeapSerialized {
             sketch: self.sketch,
             topk_heap: self.topk_heap.into_iter().collect(),
diff --git a/asap-tools/experiments/experiment_utils/services/arroyo.py b/asap-tools/experiments/experiment_utils/services/arroyo.py
index de58dc4..a3926aa 100644
--- a/asap-tools/experiments/experiment_utils/services/arroyo.py
+++ b/asap-tools/experiments/experiment_utils/services/arroyo.py
@@ -107,7 +107,7 @@ def run_arroyosketch(
         avoid_long_ssh: bool = False,
         sketch_cms_impl: str = "sketchlib",
         sketch_kll_impl: str = "legacy",
-        sketch_cmwh_impl: str = "legacy",
+        sketch_cmwh_impl: str = "sketchlib",
     ) -> str:
         """
         Run ArroyoSketch pipeline.