diff --git a/Cargo.lock b/Cargo.lock
index 348aa1209..0b9ff2552 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -94,6 +94,12 @@ version = "1.5.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "c08606f8c3cbf4ce6ec8e28fb0014a2c086708fe954eaa885384a6165172e7e8"
 
+[[package]]
+name = "bitflags"
+version = "1.3.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "bef38d45163c2f1dde094a7dfd33ccf595c92905c8f8f4fdc18d06fb1037718a"
+
 [[package]]
 name = "bitflags"
 version = "2.10.0"
@@ -124,6 +130,12 @@ version = "3.19.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "46c5e41b57b8bba42a04676d81cb89e9ee8e859a1a66f80a5a72e1cb76b34d43"
 
+[[package]]
+name = "byteorder"
+version = "1.5.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "1fd0f2584146f6f2ef48085050886acf353beff7305ebd1ae69500e27c67f64b"
+
 [[package]]
 name = "cc"
 version = "1.2.41"
@@ -235,7 +247,7 @@ checksum = "93e373516c58af1c344bfe013b6c9831ce6a08bb59709ab3fa6fe5c9b0e904ff"
 dependencies = [
  "divan-macros",
  "itertools",
- "proc-macro-crate",
+ "proc-macro-crate 3.4.0",
  "proc-macro2",
  "quote",
  "syn 2.0.107",
@@ -460,6 +472,7 @@ dependencies = [
  "egglog-reports",
  "egraph-serialize",
  "env_logger",
+ "flexbuffers",
  "glob",
  "hashbrown 0.16.0",
  "im-rc",
@@ -726,6 +739,19 @@ version = "0.5.7"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "1d674e81391d1e1ab681a28d99df07927c6d4aa5b027d7da16ba32d1d21ecd99"
 
+[[package]]
+name = "flexbuffers"
+version = "25.12.19"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "8bc752b3d049e0705749b9999d0b130d6cf62935bc7762fd3bdb7636047abe43"
+dependencies = [
+ "bitflags 1.3.2",
+ "byteorder",
+ "num_enum",
+ "serde",
+ "serde_derive",
+]
+
 [[package]]
 name = "foldhash"
 version = "0.1.5"
@@ -1017,7 +1043,7 @@ version = "0.30.1"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "74523f3a35e05aba87a1d978330aef40f67b0304ac79c1c00b294c9830543db6"
 dependencies = [
- "bitflags",
+ "bitflags 2.10.0",
  "cfg-if",
  "cfg_aliases",
  "libc",
@@ -1098,6 +1124,27 @@ dependencies = [
  "autocfg",
 ]
 
+[[package]]
+name = "num_enum"
+version = "0.5.11"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "1f646caf906c20226733ed5b1374287eb97e3c2a5c227ce668c1f2ce20ae57c9"
+dependencies = [
+ "num_enum_derive",
+]
+
+[[package]]
+name = "num_enum_derive"
+version = "0.5.11"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "dcbff9bc912032c62bf65ef1d5aea88983b420f4f839db1e9b0c281a25c9c799"
+dependencies = [
+ "proc-macro-crate 1.3.1",
+ "proc-macro2",
+ "quote",
+ "syn 1.0.109",
+]
+
 [[package]]
 name = "once_cell"
 version = "1.21.3"
@@ -1213,13 +1260,23 @@ dependencies = [
  "zerocopy",
 ]
 
+[[package]]
+name = "proc-macro-crate"
+version = "1.3.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "7f4c021e1093a56626774e81216a4ce732a735e5bad4868a03f3ed65ca0c3919"
+dependencies = [
+ "once_cell",
+ "toml_edit 0.19.15",
+]
+
 [[package]]
 name = "proc-macro-crate"
 version = "3.4.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "219cb19e96be00ab2e37d6e299658a0cfa83e52429179969b0f0121b4ac46983"
 dependencies = [
- "toml_edit",
+ "toml_edit 0.23.7",
 ]
 
 [[package]]
@@ -1329,7 +1386,7 @@ version = "0.5.18"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "ed2bf2547551a7053d6fdfafda3f938979645c44812fbfcda098faae3f1a362d"
 dependencies = [
- "bitflags",
+ "bitflags 2.10.0",
 ]
 
 [[package]]
@@ -1379,7 +1436,7 @@ version = "1.1.2"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "cd15f8a2c5551a84d56efdc1cd049089e409ac19a3072d5037a17fd70719ff3e"
 dependencies = [
- "bitflags",
+ "bitflags 2.10.0",
  "errno",
  "libc",
  "linux-raw-sys",
@@ -1596,6 +1653,12 @@ dependencies = [
  "syn 2.0.107",
 ]
 
+[[package]]
+name = "toml_datetime"
+version = "0.6.11"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "22cddaf88f4fbc13c51aebbf5f8eceb5c7c5a9da2ac40a13519eb5b0a0e8f11c"
+
 [[package]]
 name = "toml_datetime"
 version = "0.7.3"
@@ -1605,6 +1668,17 @@ dependencies = [
  "serde_core",
 ]
 
+[[package]]
+name = "toml_edit"
+version = "0.19.15"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "1b5bb770da30e5cbfde35a2d7b9b8a2c4b8ef89548a7a6aeab5c9a576e3e7421"
+dependencies = [
+ "indexmap",
+ "toml_datetime 0.6.11",
+ "winnow 0.5.40",
+]
+
 [[package]]
 name = "toml_edit"
 version = "0.23.7"
@@ -1612,9 +1686,9 @@ source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "6485ef6d0d9b5d0ec17244ff7eb05310113c3f316f2d14200d4de56b3cb98f8d"
 dependencies = [
  "indexmap",
- "toml_datetime",
+ "toml_datetime 0.7.3",
  "toml_parser",
- "winnow",
+ "winnow 0.7.13",
 ]
 
 [[package]]
@@ -1623,7 +1697,7 @@ version = "1.0.4"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "c0cbe268d35bdb4bb5a56a2de88d0ad0eb70af5384a99d648cd4b3d04039800e"
 dependencies = [
- "winnow",
+ "winnow 0.7.13",
 ]
 
 [[package]]
@@ -1956,6 +2030,15 @@ version = "0.53.1"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "d6bbff5f0aada427a1e5a6da5f1f98158182f26556f345ac9e04d36d0ebed650"
 
+[[package]]
+name = "winnow"
+version = "0.5.40"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "f593a95398737aeed53e489c785df13f3618e41dbcd6718c6addbf1395aa6876"
+dependencies = [
+ "memchr",
+]
+
 [[package]]
 name = "winnow"
 version = "0.7.13"
diff --git a/Cargo.toml b/Cargo.toml
index 86206ef8d..2190a235e 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -52,10 +52,11 @@ getrandom = "0.3"
 once_cell = "1.21"
 num-bigint = { version = "0.4", features = ["serde"] }
 num-rational = {version = "0.4", features = ["serde"]}
-csv = "1.3"
+csv = "1.4"
 typetag = "0.2"
 serde = { version = "1.0", features = ["derive", "rc"] }
 serde_json = "1.0"
+flexbuffers = "25.12.19"
 
 ######################
 # build dependencies
@@ -162,6 +163,7 @@ serde_json_diff = "0.2.0"
 anyhow.workspace = true
 walkdir = "2.5.0"
 egglog-reports = { workspace = true }
+flexbuffers.workspace = true
 
 [build-dependencies]
 chrono = { workspace = true, features = ["now"], optional = true }
diff --git a/core-relations/src/hash_index/mod.rs b/core-relations/src/hash_index/mod.rs
index f5e3c436d..7f6497326 100644
--- a/core-relations/src/hash_index/mod.rs
+++ b/core-relations/src/hash_index/mod.rs
@@ -915,6 +915,7 @@ static THREAD_POOL: Lazy<rayon::ThreadPool> = Lazy::new(|| {
 /// to the beginning of an unused vector.
 #[derive(Default, Clone, Serialize, Deserialize)]
 pub(super) struct FreeList {
+    #[serde(skip)]
     data: HashMap<usize, Vec<BufferIndex>>,
 }
 impl FreeList {
diff --git a/core-relations/src/row_buffer/mod.rs b/core-relations/src/row_buffer/mod.rs
index a4426940c..df4d88045 100644
--- a/core-relations/src/row_buffer/mod.rs
+++ b/core-relations/src/row_buffer/mod.rs
@@ -6,7 +6,7 @@ use std::{cell::Cell, mem, ops::Deref};
 use crate::numeric_id::NumericId;
 use egglog_concurrency::ParallelVecWriter;
 use rayon::iter::ParallelIterator;
-use serde::{ser::SerializeStruct, Deserialize, Deserializer, Serialize};
+use serde::{Deserialize, Deserializer, Serialize};
 use smallvec::SmallVec;
 
 use crate::{
@@ -35,6 +35,7 @@ impl<'de> Deserialize<'de> for RowBuffer {
     where
         D: Deserializer<'de>,
     {
+        /*
         #[derive(Deserialize)]
         struct Partial {
             n_columns: usize,
@@ -49,19 +50,105 @@ impl<'de> Deserialize<'de> for RowBuffer {
             total_rows: helper.total_rows,
             data: Pooled::new(helper.data),
         })
+        */
+
+        struct RowBufferVisitor;
+
+        impl<'de> serde::de::Visitor<'de> for RowBufferVisitor {
+            type Value = RowBuffer;
+
+            fn expecting(&self, formatter: &mut std::fmt::Formatter) -> std::fmt::Result {
+                formatter.write_str("Expecting a byte array")
+            }
+
+            fn visit_bytes<E>(self, bytes: &[u8]) -> Result<Self::Value, E>
+            where
+                E: serde::de::Error,
+            {
+                let mut it = bytes.iter();
+                let n_columns = deserialize_compressed(&mut it);
+                let total_rows = deserialize_compressed(&mut it);
+                let mut data = <Vec<Cell<Value>>>::new();
+                for _i in 0..n_columns * total_rows {
+                    data.push(Cell::new(Value::new(deserialize_compressed(&mut it))));
+                }
+                Ok(RowBuffer {
+                    n_columns: n_columns.try_into().unwrap(),
+                    total_rows: total_rows.try_into().unwrap(),
+                    data: Pooled::new(data),
+                })
+            }
+        }
+
+        deserializer.deserialize_bytes(RowBufferVisitor)
     }
 }
 
+#[allow(dead_code)]
+fn get_n_compressed_bytes(x: u32) -> usize {
+    if x < (1u32 << 7) {
+        1
+    } else if x < (1u32 << 14) {
+        2
+    } else if x < (1u32 << 21) {
+        3
+    } else if x < (1u32 << 28) {
+        4
+    } else {
+        5
+    }
+}
+
+fn compressed_serialize(buf: &mut Vec<u8>, x: u32) {
+    let mut rem = x;
+    while rem >= (1u32 << 7) {
+        buf.push((rem & ((1u32 << 7) - 1)).try_into().unwrap());
+        rem = rem >> 7;
+    }
+    buf.push((rem | (1u32 << 7)).try_into().unwrap());
+}
+
+fn deserialize_compressed<'a, T: Iterator<Item = &'a u8>>(it: &mut T) -> u32 {
+    let mut ret = 0u32;
+    let mut delta = 0u32;
+    let mut val: u32 = <u8>::into(*it.next().unwrap());
+    while val < (1u32 << 7) {
+        ret = ret | (val << delta);
+        delta += 7;
+        val = <u8>::into(*it.next().unwrap());
+    }
+    let last = (val ^ (1u32 << 7)) << delta;
+    ret | last
+}
+
 impl Serialize for RowBuffer {
     fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error>
     where
         S: serde::Serializer,
     {
+        /*
         let mut state = serializer.serialize_struct("RowBuffer", 3)?;
         state.serialize_field("n_columns", &self.n_columns)?;
         state.serialize_field("total_rows", &self.total_rows)?;
         state.serialize_field("data", &*self.data)?;
         state.end()
+        */
+        //let len = mem::size_of::<usize>() * 2 + self.n_columns * self.total_rows * mem::size_of::<u32>();
+        /*
+        let mut len = get_n_compressed_bytes(self.n_columns.try_into().unwrap()) + get_n_compressed_bytes(self.total_rows.try_into().unwrap());
+        for r in self.data.iter() {
+            len = len + get_n_compressed_bytes(r.get().rep);
+        }
+        let mut buf = vec![0u8; len];
+        //TODO: put data in
+        */
+        let mut buf = Vec::new();
+        compressed_serialize(&mut buf, self.n_columns.try_into().unwrap());
+        compressed_serialize(&mut buf, self.total_rows.try_into().unwrap());
+        for r in self.data.iter() {
+            compressed_serialize(&mut buf, r.get().rep);
+        }
+        serializer.serialize_bytes(&buf)
     }
 }
 
diff --git a/core-relations/src/table/mod.rs b/core-relations/src/table/mod.rs
index 3166577f7..039b20912 100644
--- a/core-relations/src/table/mod.rs
+++ b/core-relations/src/table/mod.rs
@@ -51,12 +51,41 @@ mod tests;
 type HashCode = u64;
 
 /// A pointer to a row in the table.
-#[derive(Clone, Debug, Serialize, Deserialize)]
+#[derive(Clone, Debug)]
 pub(crate) struct TableEntry {
     hashcode: HashCode,
     row: RowId,
 }
 
+impl Serialize for TableEntry {
+    fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error>
+    where
+        S: Serializer,
+    {
+        let mut bytes = [0u8; 12];
+        let b1 = self.hashcode.to_be_bytes();
+        bytes[..b1.len()].copy_from_slice(&b1);
+        let b2 = self.row.rep.to_be_bytes();
+        bytes[b1.len()..].copy_from_slice(&b2);
+        serializer.serialize_bytes(&bytes)
+    }
+}
+
+impl<'de> Deserialize<'de> for TableEntry {
+    fn deserialize<D>(deserializer: D) -> Result<Self, D::Error>
+    where
+        D: Deserializer<'de>,
+    {
+        let bytes = <[u8; 16]>::deserialize(deserializer).expect("Failed to parse TabelEntry");
+        Ok(TableEntry {
+            hashcode: u64::from_be_bytes(bytes[0..8].try_into().unwrap()),
+            row: RowId {
+                rep: u32::from_be_bytes(bytes[8..12].try_into().unwrap()),
+            },
+        })
+    }
+}
+
 impl TableEntry {
     fn hashcode(&self) -> u64 {
         // We keep the cast here to make it easy to switch to HashCode=u32.
@@ -171,8 +200,8 @@ impl<'de> Deserialize<'de> for SortedWritesTable {
         #[derive(Deserialize)]
         struct Partial {
             generation: Generation,
-            shard_data: ShardData,
-            shards: Vec<Vec<TableEntry>>,
+            //shard_data: ShardData,
+            //shards: Vec<Vec<TableEntry>>,
             data: Rows,
 
             n_keys: usize,
@@ -183,13 +212,13 @@ impl<'de> Deserialize<'de> for SortedWritesTable {
             pending_state: Arc<PendingState>,
 
             to_rebuild: Vec<ColumnId>,
-            rebuild_index: Index<ColumnIndex>,
-
+            //rebuild_index: Index<ColumnIndex>,
             subset_tracker: SubsetTracker,
         }
 
         let partial = Partial::deserialize(deserializer)?;
 
+        /*
         let shards: Vec<HashTable<TableEntry>> = partial
             .shards
             .iter()
@@ -206,11 +235,12 @@ impl<'de> Deserialize<'de> for SortedWritesTable {
             shard_data: partial.shard_data,
             shards,
         };
+        */
 
         Ok(SortedWritesTable {
             generation: partial.generation,
             data: partial.data,
-            hash,
+            hash: ShardedHashTable::default(),
             n_keys: partial.n_keys,
             n_columns: partial.n_columns,
             sort_by: partial.sort_by,
@@ -218,7 +248,7 @@ impl<'de> Deserialize<'de> for SortedWritesTable {
             pending_state: partial.pending_state,
             merge: Arc::new(|_, _, _, _| true),
             to_rebuild: partial.to_rebuild,
-            rebuild_index: partial.rebuild_index,
+            rebuild_index: <Index<ColumnIndex>>::default(),
             subset_tracker: partial.subset_tracker,
         })
     }
@@ -229,6 +259,7 @@ impl Serialize for SortedWritesTable {
     where
         S: Serializer,
     {
+        /*
         let serialized_shards: Vec<Vec<TableEntry>> = self
             .hash
             .shards
@@ -239,11 +270,11 @@ impl Serialize for SortedWritesTable {
                 v
             })
             .collect();
-
+        */
         let mut state = serializer.serialize_struct("SortedWritesTable", 11)?;
         state.serialize_field("generation", &self.generation)?;
-        state.serialize_field("shard_data", &self.hash.shard_data())?;
-        state.serialize_field("shards", &serialized_shards)?;
+        //state.serialize_field("shard_data", &self.hash.shard_data())?;
+        //state.serialize_field("shards", &serialized_shards)?;
         state.serialize_field("data", &self.data)?;
         state.serialize_field("n_keys", &self.n_keys)?;
         state.serialize_field("n_columns", &self.n_columns)?;
@@ -251,7 +282,7 @@ impl Serialize for SortedWritesTable {
         state.serialize_field("offsets", &self.offsets)?;
         state.serialize_field("pending_state", &self.pending_state)?;
         state.serialize_field("to_rebuild", &self.to_rebuild)?;
-        state.serialize_field("rebuild_index", &self.rebuild_index)?;
+        //state.serialize_field("rebuild_index", &self.rebuild_index)?;
         state.serialize_field("subset_tracker", &self.subset_tracker)?;
 
         state.end()
diff --git a/core-relations/src/table_spec.rs b/core-relations/src/table_spec.rs
index 1c9b4fab8..6bae2c7d4 100644
--- a/core-relations/src/table_spec.rs
+++ b/core-relations/src/table_spec.rs
@@ -27,8 +27,7 @@ use crate::{
     offsets::{RowId, Subset, SubsetRef},
     pool::{with_pool_set, PoolSet, Pooled},
     row_buffer::{RowBuffer, TaggedRowBuffer},
-    DisplacedTable, DisplacedTableWithProvenance,
-    QueryEntry, TableId, Variable,
+    DisplacedTable, DisplacedTableWithProvenance, QueryEntry, TableId, Variable,
 };
 
 define_id!(pub ColumnId, u32, "a particular column in a table");
@@ -553,7 +552,9 @@ impl<'de> Deserialize<'de> for WrappedTable {
         } else if inner.as_any().is::<DisplacedTableWithProvenance>() {
             wrapper::<DisplacedTableWithProvenance>()
         } else {
-            return Err(serde::de::Error::custom("unknown table type for WrappedTable"));
+            return Err(serde::de::Error::custom(
+                "unknown table type for WrappedTable",
+            ));
         };
 
         Ok(WrappedTable { inner, wrapper })
diff --git a/core-relations/src/uf/mod.rs b/core-relations/src/uf/mod.rs
index ca589c775..923b3faf4 100644
--- a/core-relations/src/uf/mod.rs
+++ b/core-relations/src/uf/mod.rs
@@ -63,8 +63,10 @@ pub struct DisplacedTable {
     // k columns, k-1 are args, kth is the ID
     // enode is the row index
     // on deserialize: need to recompute this from `displaced`
+    #[serde(skip)]
     displaced: Vec<(Value, Value)>, // this is "the table" everything else can be recomputed from this
     // can even recanonicalize on serialization to get rid of dead things
+    #[serde(skip)]
     changed: bool,
     #[serde(skip)]
     lookup_table: HashMap<Value, RowId>,
diff --git a/egglog-ast/src/span.rs b/egglog-ast/src/span.rs
index c2c8db320..2651d9cdc 100644
--- a/egglog-ast/src/span.rs
+++ b/egglog-ast/src/span.rs
@@ -3,11 +3,30 @@ use std::sync::Arc;
 
 use serde::{Deserialize, Serialize};
 
-#[derive(Clone, PartialEq, Eq, Hash, Serialize, Deserialize)]
+#[derive(Clone, PartialEq, Eq, Hash)]
 pub enum Span {
     Panic,
     Egglog(Arc<EgglogSpan>),
     Rust(Arc<RustSpan>),
+    POACH,
+}
+
+impl serde::Serialize for Span {
+    fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error>
+    where
+        S: serde::Serializer,
+    {
+        serializer.serialize_unit()
+    }
+}
+
+impl<'de> serde::Deserialize<'de> for Span {
+    fn deserialize<D>(_: D) -> Result<Self, D::Error>
+    where
+        D: serde::Deserializer<'de>,
+    {
+        Ok(Self::POACH)
+    }
 }
 
 #[derive(Debug, Clone, PartialEq, Eq, Hash, Serialize, Deserialize)]
@@ -55,6 +74,7 @@ impl Span {
             Span::Panic => panic!("Span::Panic in Span::string"),
             Span::Rust(_) => panic!("Span::Rust cannot track end position"),
             Span::Egglog(span) => &span.file.contents[span.i..span.j],
+            Span::POACH => "From POACH deserialization",
         }
     }
 }
@@ -97,6 +117,7 @@ impl Display for Span {
                     }
                 }
             }
+            Span::POACH => write!(f, "From POACH deserialization"),
         }
     }
 }
diff --git a/egglog-bridge/src/lib.rs b/egglog-bridge/src/lib.rs
index b17177a93..af222388d 100644
--- a/egglog-bridge/src/lib.rs
+++ b/egglog-bridge/src/lib.rs
@@ -812,6 +812,25 @@ impl EGraph {
         Ok(iteration_report)
     }
 
+    /// This hack speeds up extraction and
+    /// avoid certain fields of the backend data structure
+    /// by skipping rebuild
+    pub fn run_rules_without_rebuild(&mut self, rules: &[RuleId]) -> Result<IterationReport> {
+        let ts = self.next_ts();
+
+        let rule_set_report =
+            run_rules_impl(&mut self.db, &mut self.rules, rules, ts, self.report_level)?;
+        if let Some(message) = self.panic_message.lock().unwrap().take() {
+            return Err(PanicError(message).into());
+        }
+
+        let iteration_report = IterationReport {
+            rule_set_report,
+            rebuild_time: Duration::ZERO,
+        };
+        Ok(iteration_report)
+    }
+
     fn rebuild(&mut self) -> Result<()> {
         fn do_parallel() -> bool {
             #[cfg(test)]
diff --git a/infra/nightly-resources/web/chart.js b/infra/nightly-resources/web/chart.js
index 466b69975..aed046dd9 100644
--- a/infra/nightly-resources/web/chart.js
+++ b/infra/nightly-resources/web/chart.js
@@ -124,6 +124,51 @@ function initializeCharts() {
     );
   }
 
+  if (!!document.getElementById("speedup-chart")) {
+    console.assert(GLOBAL_DATA.differenceChart === null);
+
+    GLOBAL_DATA.speedupChart = new Chart(
+      document.getElementById("speedup-chart"),
+      {
+        type: "bar",
+        data: {},
+        options: {
+          responsive: true,
+          plugins: {
+            legend: {
+              display: false,
+            },
+            title: {
+              display: true,
+              text: "Per-benchmark Runtime Speedup",
+            },
+            tooltip: {
+              callbacks: {
+                label: (ctx) => `${ctx.raw.toFixed(2)}x`,
+              },
+            },
+          },
+          scales: {
+            x: {
+              ticks: {
+                maxRotation: 90,
+                minRotation: 45,
+              },
+            },
+            y: {
+              min: 0,
+              max: 50,
+              title: {
+                display: true,
+                text: "Speedup (times)",
+              },
+            },
+          },
+        },
+      },
+    );
+  }
+
   if (!!document.getElementById("difference-chart")) {
     console.assert(GLOBAL_DATA.differenceChart === null);
 
@@ -156,8 +201,8 @@ function initializeCharts() {
               },
             },
             y: {
-              min: -25,
-              max: 25,
+              min: -1000,
+              max: 3000,
               title: {
                 display: true,
                 text: "time (ms)",
diff --git a/infra/nightly-resources/web/extract.html b/infra/nightly-resources/web/extract.html
index 55de269b5..f8a2483d9 100644
--- a/infra/nightly-resources/web/extract.html
+++ b/infra/nightly-resources/web/extract.html
@@ -25,6 +25,15 @@ <h2>POACH vs Vanilla Egglog</h2>
       Serialization time is not counted
     </p>
 
+    <form id="icldser" onchange="plotExtract()">
+      <input type="checkbox" id="icldser1" name="icldser1" >
+      <label for="icldser1"> Include serialization time for Poach </label>
+    </form>
+    <form id="suite" onchange="plotExtract()"></form>
+
+    <div style="max-height: 800px;">
+      <canvas class="content" id="speedup-chart"></canvas>
+    </div>  
     <div style="max-height: 800px;">
       <canvas class="content" id="difference-chart"></canvas>
     </div>
diff --git a/infra/nightly-resources/web/extract.js b/infra/nightly-resources/web/extract.js
index e83b0c854..e922b536a 100644
--- a/infra/nightly-resources/web/extract.js
+++ b/infra/nightly-resources/web/extract.js
@@ -1,9 +1,45 @@
 function initializeExtract() {
-  initializeGlobalData().then(initializeCharts).then(plotExtract);
+  initializeGlobalData()
+    .then(initializeExtractOptions)  
+    .then(initializeCharts)
+    .then(plotExtract);
 }
 
+function initializeExtractOptions() {
+  const suiteElt = document.getElementById("suite");
+  Object.keys(GLOBAL_DATA.data).forEach((suite, idx) => {
+    const label = document.createElement("label");
+    const input = document.createElement("input");
+
+    input.type = "radio";
+    input.name = "suiteToggle";
+    input.value = suite;
+
+    if (idx === 0) {
+      input.checked = true; // select first run mode
+    }
+
+    label.appendChild(input);
+    label.append(" " + suite);
+
+    suiteElt.appendChild(label);
+  });
+}
+
+
 function plotExtract() {
-  const all_data = GLOBAL_DATA.data.tests.extract;
+
+  const suite = document.querySelector(
+    'input[name="suiteToggle"]:checked'
+  ).value;
+
+  if (!suite) {
+    return;
+  }
+
+  const includeser = document.querySelector("input[name='icldser1']:checked");
+
+  const all_data = GLOBAL_DATA.data[suite].extract;
 
   if (GLOBAL_DATA.extractChart === null) {
     return;
@@ -29,11 +65,33 @@ function plotExtract() {
 
     data[b].poachExtract = aggregate(extracts.slice(midpoint), "total");
     data[b].poachDeser = aggregate(all_data[b].deserialize, "total");
-    data[b].poachTotal = data[b].poachDeser + data[b].poachExtract;
+    if (includeser) {
+      data[b].poachTotal = data[b].poachDeser + data[b].poachExtract;
+    } else {
+      data[b].poachTotal = data[b].poachExtract;
+    }
 
-    data[b].difference = data[b].poachTotal - data[b].vanillaTotal;
+    data[b].difference = data[b].vanillaTotal - data[b].poachTotal;
+    data[b].speedup = data[b].vanillaTotal / data[b].poachTotal;
   });
 
+  GLOBAL_DATA.speedupChart.data = {
+    labels: benchmarks,
+    datasets: [
+      {
+        label: "poach - vanilla",
+        data: Object.values(data).map((d) => d.speedup),
+        backgroundColor: Object.values(data).map((d) => {
+          return d.speedup >= 1
+            ? "rgba(54, 162, 235, 0.7)"
+            : "rgba(255, 99, 132, 0.7)";
+        }),
+      },
+    ],
+  };
+
+  GLOBAL_DATA.speedupChart.update();
+
   GLOBAL_DATA.differenceChart.data = {
     labels: benchmarks,
     datasets: [
@@ -41,18 +99,16 @@ function plotExtract() {
         label: "poach - vanilla",
         data: Object.values(data).map((d) => d.difference),
         backgroundColor: Object.values(data).map((d) => {
-          if (Math.abs(d.difference) > 25) {
-            return "gray";
-          } else {
-            return d.difference >= 0
-              ? "rgba(255, 99, 132, 0.7)"
-              : "rgba(54, 162, 235, 0.7)";
-          }
+          return d.difference >= 0
+            ? "rgba(54, 162, 235, 0.7)"
+            : "rgba(255, 99, 132, 0.7)";
         }),
       },
     ],
   };
 
+  GLOBAL_DATA.differenceChart.update();
+
   GLOBAL_DATA.extractChart.data = {
     labels: benchmarks,
     datasets: [
@@ -85,4 +141,6 @@ function plotExtract() {
       },
     ],
   };
+
+  GLOBAL_DATA.extractChart.update();  
 }
diff --git a/infra/nightly.py b/infra/nightly.py
index 3e833356a..5da422cc0 100644
--- a/infra/nightly.py
+++ b/infra/nightly.py
@@ -88,23 +88,34 @@ def run_test_experiments(top_dir, tmp_dir, aggregator):
       run_poach(benchmark, tmp_dir, run_mode)
       add_benchmark_data(aggregator, timeline_file, f"tests/{benchmark_name}/{benchmark.stem}/timeline.json")
       extra_files = {
-        "sequential-round-trip": [tmp_dir / f"{benchmark.stem}-serialize1.json"],
+        "sequential-round-trip": [tmp_dir / f"{benchmark.stem}-serialize1.fbs"],
         "old-serialize": [
-          tmp_dir / f"{benchmark.stem}-serialize-poach.json",
+          tmp_dir / f"{benchmark.stem}-serialize-poach.fbs",
           tmp_dir / f"{benchmark.stem}-serialize-old.json",
         ],
       }.get(run_mode, [])
       cleanup_benchmark_files(timeline_file, tmp_dir / "summary.json", *extra_files)
 
+def run_extract_experiments(resource_dir, tmp_dir, aggregator, csv_aggregator):
+  timeline_suites = ["herbie-hamming", "herbie-math-rewrite", "herbie-math-taylor"]
+  for suite in timeline_suites:
+    for benchmark in benchmark_files(resource_dir / "test-files" / suite):
+      timeline_file = tmp_dir / f"{benchmark.stem}-timeline.json"
+      run_poach(benchmark, tmp_dir, "extract")
+      add_benchmark_data(aggregator, timeline_file, f"{suite}/extract/{benchmark.stem}/timeline.json")
+      extra_files = [tmp_dir / f"{benchmark.stem}.csv"]
+      csv_aggregator.add_file(extra_files[0])
+      cleanup_benchmark_files(timeline_file, tmp_dir / "summary.json", *extra_files)
+
 def run_mined_experiments(resource_dir, tmp_dir, aggregator):
-  mega_serialize_file = tmp_dir / "mega-easteregg-serialize.json"
+  mega_serialize_file = tmp_dir / "mega-easteregg-serialize.fbs"
   mega_timeline_file = tmp_dir / "mega-easteregg-timeline.json"
   run_poach(resource_dir / "mega-easteregg.egg", tmp_dir, "serialize")
   add_benchmark_data(aggregator, mega_timeline_file, "easteregg/serialize/mega-easteregg/timeline.json")
   cleanup_benchmark_files(mega_timeline_file, tmp_dir / "summary.json")
   for benchmark in benchmark_files(resource_dir / "test-files" / "easteregg"):
     timeline_file = tmp_dir / f"{benchmark.stem}-timeline.json"
-    serialize_file = tmp_dir / f"{benchmark.stem}-serialize.json"
+    serialize_file = tmp_dir / f"{benchmark.stem}-serialize.fbs"
     run_poach(benchmark, tmp_dir, "serialize")
     add_benchmark_data(aggregator, timeline_file, f"easteregg/serialize/{benchmark.stem}/timeline.json")
     cleanup_benchmark_files(timeline_file, tmp_dir / "summary.json")
@@ -137,6 +148,7 @@ def run_mined_experiments(resource_dir, tmp_dir, aggregator):
   tmp_dir = nightly_dir / "tmp"
   output_data_dir = nightly_dir / "output" / "data"
   aggregator = transform.TimelineAggregator(output_data_dir)
+  csv_aggregator = transform.CSVAggregator(output_data_dir)
 
   # Make sure we're in the right place
   os.chdir(top_dir)
@@ -146,22 +158,26 @@ def run_mined_experiments(resource_dir, tmp_dir, aggregator):
   ##############################################################################
 
   # Run the benchmarks and record timeline-only data.
-  run_timeline_experiments(resource_dir, tmp_dir, aggregator)
+  # run_timeline_experiments(resource_dir, tmp_dir, aggregator)
   
   # Re-run the benchmarks with JSON round-tripping kept entirely in memory.
-  run_no_io_experiments(resource_dir, tmp_dir, aggregator)
+  # run_no_io_experiments(resource_dir, tmp_dir, aggregator)
   
   # Run the egglog tests under each serialization experiment mode.
-  run_test_experiments(top_dir, tmp_dir, aggregator)
+  # run_test_experiments(top_dir, tmp_dir, aggregator)
   
   # Run the mined-egraph experiment using both per-benchmark and mega-egraph seeds.
-  run_mined_experiments(resource_dir, tmp_dir, aggregator)
+  # run_mined_experiments(resource_dir, tmp_dir, aggregator)
+
+  # Run the extract experiment on our heavy benchmarks
+  run_extract_experiments(resource_dir, tmp_dir, aggregator, csv_aggregator)
 
   ##############################################################################
 
   aggregator.save()
+  csv_aggregator.save()
 
-  if shutil.which("perf") is not None:
-    # Generate flamegraphs
-    for egg_file in glob.glob("tests/*.egg") + glob.glob("tests/web-demo/*.egg"):
-      run_cmd([str(script_dir / "flamegraph.sh"), egg_file, str(nightly_dir / "output" / "flamegraphs")])
+  #if shutil.which("perf") is not None:
+  #  # Generate flamegraphs
+  #  for egg_file in glob.glob("tests/*.egg") + glob.glob("tests/web-demo/*.egg"):
+  #    run_cmd([str(script_dir / "flamegraph.sh"), egg_file, str(nightly_dir / "output" / "flamegraphs")])
diff --git a/infra/nightly.sh b/infra/nightly.sh
old mode 100644
new mode 100755
index 766e417cb..a0777ca6c
--- a/infra/nightly.sh
+++ b/infra/nightly.sh
@@ -47,7 +47,8 @@ mkdir -p nightly/output
 mkdir -p nightly/output/flamegraphs
 mkdir -p nightly/tmp
 
-git clone https://github.com/brendangregg/FlameGraph.git
+# Skip FlameGraphs for mining MVP
+# git clone https://github.com/brendangregg/FlameGraph.git
 
 # Build in release mode before running nightly.py
 cargo build --release
@@ -61,7 +62,7 @@ if [ ! -f nightly/output/data/data.json ]; then
   exit 1
 fi
 
-ls nightly/output/flamegraphs > nightly/output/flamegraphs.txt
+# ls nightly/output/flamegraphs > nightly/output/flamegraphs.txt
 
 cp infra/nightly-resources/web/* nightly/output
 
diff --git a/infra/transform.py b/infra/transform.py
index 2fe95fbfd..f6a334003 100644
--- a/infra/transform.py
+++ b/infra/transform.py
@@ -1,4 +1,5 @@
 import json
+import pandas
 import os
 from pathlib import Path
 
@@ -111,3 +112,18 @@ def add_file(self, input_file, benchmark_name):
     def save(self):
         os.makedirs(self.output_dir, exist_ok=True)
         save_json(self.data_path, self.aggregated)
+
+class CSVAggregator:
+    def __init__(self, output_dir):
+        self.output_dir = Path(output_dir)
+        self.data_path = self.output_dir / "data.csv"
+        self.records = []
+
+    def add_file(self, input_file):
+        df = pandas.read_csv(input_file)
+        self.records.append(df)
+
+    def save(self):
+        os.makedirs(self.output_dir, exist_ok=True)
+        combined = pandas.concat(self.records)
+        combined.to_csv(self.data_path, index=False)
\ No newline at end of file
diff --git a/numeric-id/src/lib.rs b/numeric-id/src/lib.rs
index 9825268f2..b1202c26a 100644
--- a/numeric-id/src/lib.rs
+++ b/numeric-id/src/lib.rs
@@ -438,7 +438,8 @@ macro_rules! define_id {
         #[derive(Copy, Clone, Default)]
         #[doc = $doc]
         $v struct $name {
-            rep: $repr,
+            // visibility hack for serialization
+            pub rep: $repr,
         }
 
         impl serde::Serialize for $name {
diff --git a/src/lib.rs b/src/lib.rs
index 4910c1661..28d4baa28 100644
--- a/src/lib.rs
+++ b/src/lib.rs
@@ -30,8 +30,11 @@ mod typechecking;
 pub mod util;
 pub use command_macro::{CommandMacro, CommandMacroRegistry};
 
+pub mod serialize_size;
+
 // This is used to allow the `add_primitive` macro to work in
 // both this crate and other crates by referring to `::egglog`.
+extern crate flexbuffers;
 extern crate self as egglog;
 use anyhow::{Context, Result};
 use ast::*;
@@ -62,6 +65,7 @@ use scheduler::{SchedulerId, SchedulerRecord};
 use serde::ser::SerializeStruct;
 use serde::{Deserialize, Serialize};
 use serde_json::json;
+use serialize_size::GenerateSizeReport;
 pub use serialize_vis::{SerializeConfig, SerializeOutput, SerializedNode};
 use size::GetSizePrimitive;
 use sort::*;
@@ -69,7 +73,7 @@ use std::any::Any;
 use std::fmt::{Debug, Display, Formatter};
 use std::fs::{self, read_to_string, File};
 use std::hash::Hash;
-use std::io::{BufReader, BufWriter, Read, Write as _};
+use std::io::{BufWriter, Read, Write as _};
 use std::iter::once;
 use std::ops::Deref;
 use std::path::{Path, PathBuf};
@@ -255,31 +259,59 @@ impl Serialize for SerializableSort {
             s.serialize_field("type", "FunctionSort")?;
             s.serialize_field("data", sort)?;
             s.end()
-        } else if let Some(_) = sort.as_any().downcast_ref::<BaseSortImpl<BigIntSort>>() {
+        } else if sort
+            .as_any()
+            .downcast_ref::<BaseSortImpl<BigIntSort>>()
+            .is_some()
+        {
             s.serialize_field("type", "BaseSort")?;
             s.serialize_field("data", "BigIntSort")?;
             s.end()
-        } else if let Some(_) = sort.as_any().downcast_ref::<BaseSortImpl<BigRatSort>>() {
+        } else if sort
+            .as_any()
+            .downcast_ref::<BaseSortImpl<BigRatSort>>()
+            .is_some()
+        {
             s.serialize_field("type", "BaseSort")?;
             s.serialize_field("data", "BigRatSort")?;
             s.end()
-        } else if let Some(_) = sort.as_any().downcast_ref::<BaseSortImpl<BoolSort>>() {
+        } else if sort
+            .as_any()
+            .downcast_ref::<BaseSortImpl<BoolSort>>()
+            .is_some()
+        {
             s.serialize_field("type", "BaseSort")?;
             s.serialize_field("data", "BoolSort")?;
             s.end()
-        } else if let Some(_) = sort.as_any().downcast_ref::<BaseSortImpl<F64Sort>>() {
+        } else if sort
+            .as_any()
+            .downcast_ref::<BaseSortImpl<F64Sort>>()
+            .is_some()
+        {
             s.serialize_field("type", "BaseSort")?;
             s.serialize_field("data", "F64Sort")?;
             s.end()
-        } else if let Some(_) = sort.as_any().downcast_ref::<BaseSortImpl<I64Sort>>() {
+        } else if sort
+            .as_any()
+            .downcast_ref::<BaseSortImpl<I64Sort>>()
+            .is_some()
+        {
             s.serialize_field("type", "BaseSort")?;
             s.serialize_field("data", "I64Sort")?;
             s.end()
-        } else if let Some(_) = sort.as_any().downcast_ref::<BaseSortImpl<StringSort>>() {
+        } else if sort
+            .as_any()
+            .downcast_ref::<BaseSortImpl<StringSort>>()
+            .is_some()
+        {
             s.serialize_field("type", "BaseSort")?;
             s.serialize_field("data", "StringSort")?;
             s.end()
-        } else if let Some(_) = sort.as_any().downcast_ref::<BaseSortImpl<UnitSort>>() {
+        } else if sort
+            .as_any()
+            .downcast_ref::<BaseSortImpl<UnitSort>>()
+            .is_some()
+        {
             s.serialize_field("type", "BaseSort")?;
             s.serialize_field("data", "UnitSort")?;
             s.end()
@@ -1334,7 +1366,7 @@ impl EGraph {
         );
 
         let id = translator.build();
-        let rule_result = self.backend.run_rules(&[id]);
+        let rule_result = self.backend.run_rules_without_rebuild(&[id]);
         self.backend.free_rule(id);
         self.backend.free_external_func(ext_id);
         let _ = rule_result.map_err(|e| {
@@ -1553,7 +1585,7 @@ impl EGraph {
                                 expr.output_type(),
                             )
                             .iter()
-                            .map(|e| e.1.clone())
+                            .map(|e| e.1)
                             .collect();
                         if log_enabled!(Level::Info) {
                             let expr_str = expr.to_string();
@@ -2498,16 +2530,36 @@ mod tests {
 
 /***** TESTING AREA FOR TIMED EGRAPH *****/
 
-static START: &'static str = "start";
-static END: &'static str = "end";
+static START: &str = "start";
+static END: &str = "end";
 
-#[derive(Serialize, Clone)]
+#[derive(Serialize, Clone, Eq)]
 pub struct EgraphEvent {
     sexp_idx: i32,
     evt: &'static str,
     time_micros: u128,
 }
 
+impl Ord for EgraphEvent {
+    fn cmp(&self, other: &Self) -> std::cmp::Ordering {
+        self.time_micros.cmp(&other.time_micros)
+    }
+}
+
+impl PartialOrd for EgraphEvent {
+    fn partial_cmp(&self, other: &Self) -> Option<std::cmp::Ordering> {
+        Some(self.cmp(other))
+    }
+}
+
+impl PartialEq for EgraphEvent {
+    fn eq(&self, other: &Self) -> bool {
+        self.sexp_idx == other.sexp_idx
+            && self.evt == other.evt
+            && self.time_micros == other.time_micros
+    }
+}
+
 #[derive(Serialize, Clone)]
 pub struct ProgramTimeline {
     program_text: String,
@@ -2530,6 +2582,12 @@ pub struct TimedEgraph {
     timer: std::time::Instant,
 }
 
+impl Default for TimedEgraph {
+    fn default() -> Self {
+        Self::new()
+    }
+}
+
 impl TimedEgraph {
     /// Create a new TimedEgraph with a default EGraph
     pub fn new() -> Self {
@@ -2544,14 +2602,16 @@ impl TimedEgraph {
     }
 
     pub fn new_from_file(path: &Path) -> Self {
-        let file = File::open(path).expect("failed to open egraph file");
-        let reader = BufReader::new(file);
+        let mut file = fs::File::open(path).expect("failed to open file");
+        let mut buf = Vec::new();
+        file.read_to_end(&mut buf)
+            .expect("Failed to read Flatbuffer from file");
 
-        let mut egraph: EGraph =
-            serde_json::from_reader(reader).expect("failed to parse egraph JSON");
+        let r = flexbuffers::Reader::get_root(buf.as_slice()).unwrap();
+        let mut egraph: EGraph = EGraph::deserialize(r).unwrap();
         egraph
             .restore_deserialized_runtime()
-            .expect("failed to restore deserialized runtime");
+            .expect("Failed to restore deserialized runtime");
 
         Self {
             egraphs: vec![egraph],
@@ -2560,15 +2620,20 @@ impl TimedEgraph {
         }
     }
 
+    pub fn get_total_time(&self, id: usize) -> u128 {
+        self.timeline[id].evts.iter().max().unwrap().time_micros
+            - self.timeline[id].evts.iter().min().unwrap().time_micros
+    }
+
     pub fn egraphs(&self) -> Vec<&EGraph> {
-        self.egraphs.iter().map(|x| x).collect()
+        self.egraphs.iter().collect()
     }
 
     pub fn write_timeline(&self, path: &Path) -> Result<(), serde_json::Error> {
         if let Some(parent) = path.parent() {
             fs::create_dir_all(parent).expect("Failed to create out dir");
         }
-        let file = File::create(&path).expect("Failed to create timeline.json");
+        let file = File::create(path).expect("Failed to create timeline.json");
         serde_json::to_writer_pretty(BufWriter::new(file), &self.timeline)
     }
 
@@ -2639,7 +2704,7 @@ impl TimedEgraph {
                 time_micros: self.timer.elapsed().as_micros(),
             });
 
-            i = i + 1;
+            i += 1;
         }
 
         self.timeline.push(program_timeline);
@@ -2698,7 +2763,7 @@ impl TimedEgraph {
         Ok(())
     }
 
-    pub fn to_value(&mut self) -> Result<serde_json::Value> {
+    pub fn to_value(&mut self) -> Result<Vec<u8>> {
         let mut timeline = ProgramTimeline::new("(serialize)");
 
         let egraph = self.egraphs.last().unwrap();
@@ -2708,7 +2773,10 @@ impl TimedEgraph {
             time_micros: self.timer.elapsed().as_micros(),
         });
 
-        let value = serde_json::to_value(egraph).context("Failed to encode egraph as json")?;
+        let mut buf = flexbuffers::FlexbufferSerializer::new();
+        Serialize::serialize(egraph, &mut buf)
+            .expect("Failed to serialize the egraph in Flexbuffer");
+        let value = Vec::from(buf.view());
 
         timeline.evts.push(EgraphEvent {
             sexp_idx: 0,
@@ -2720,7 +2788,7 @@ impl TimedEgraph {
         Ok(value)
     }
 
-    pub fn from_value(&mut self, value: serde_json::Value) -> Result<()> {
+    pub fn from_value(&mut self, value: Vec<u8>) -> Result<()> {
         let mut timeline = ProgramTimeline::new("(deserialize)");
 
         timeline.evts.push(EgraphEvent {
@@ -2729,8 +2797,8 @@ impl TimedEgraph {
             time_micros: self.timer.elapsed().as_micros(),
         });
 
-        let mut egraph: EGraph =
-            serde_json::from_value(value).context("Failed to decode egraph from json")?;
+        let r = flexbuffers::Reader::get_root(value.as_slice()).unwrap();
+        let mut egraph: EGraph = EGraph::deserialize(r).unwrap();
         egraph
             .restore_deserialized_runtime()
             .context("Failed to restore deserialized runtime")?;
@@ -2747,6 +2815,13 @@ impl TimedEgraph {
         Ok(())
     }
 
+    pub fn print_size_report(&mut self, max_level: usize) -> Result<()> {
+        let egraph = self.egraphs.last().unwrap();
+        println!("egraph size: {:}", egraph.num_tuples());
+        egraph.get_sizerp().pretty_print(0, max_level);
+        Ok(())
+    }
+
     pub fn to_file(&mut self, path: &Path) -> Result<()> {
         let mut timeline = ProgramTimeline::new("(serialize)\n(write)");
         let egraph = self.egraphs.last().unwrap();
@@ -2756,7 +2831,9 @@ impl TimedEgraph {
             time_micros: self.timer.elapsed().as_micros(),
         });
 
-        let value = serde_json::to_value(egraph).context("Failed to encode egraph as json")?;
+        let mut buf = flexbuffers::FlexbufferSerializer::new();
+        Serialize::serialize(egraph, &mut buf)
+            .expect("Failed to serialize the egraph in Flexbuffer");
 
         timeline.evts.push(EgraphEvent {
             sexp_idx: 0,
@@ -2770,9 +2847,9 @@ impl TimedEgraph {
             time_micros: self.timer.elapsed().as_micros(),
         });
 
-        let file = fs::File::create(path)
+        let mut file = fs::File::create(path)
             .with_context(|| format!("failed to create file {}", path.display()))?;
-        serde_json::to_writer_pretty(BufWriter::new(file), &value)
+        file.write_all(buf.view())
             .context("Failed to write value to file")?;
 
         timeline.evts.push(EgraphEvent {
@@ -2795,11 +2872,11 @@ impl TimedEgraph {
             time_micros: self.timer.elapsed().as_micros(),
         });
 
-        let file = fs::File::open(path)
+        let mut file = fs::File::open(path)
             .with_context(|| format!("failed to open file {}", path.display()))?;
-        let reader = BufReader::new(file);
-        let value: serde_json::Value =
-            serde_json::from_reader(reader).context("Failed to read json from file")?;
+        let mut buf = Vec::new();
+        file.read_to_end(&mut buf)
+            .context("Failed to read Flatbuffer from file")?;
 
         timeline.evts.push(EgraphEvent {
             sexp_idx: 0,
@@ -2813,7 +2890,8 @@ impl TimedEgraph {
             time_micros: self.timer.elapsed().as_micros(),
         });
 
-        let mut egraph: EGraph = serde_json::from_value(value)?;
+        let r = flexbuffers::Reader::get_root(buf.as_slice()).unwrap();
+        let mut egraph: EGraph = EGraph::deserialize(r).unwrap();
         egraph
             .restore_deserialized_runtime()
             .context("Failed to restore deserialized runtime")?;
diff --git a/src/poach.rs b/src/poach.rs
index c7ed26dce..39720f4a2 100644
--- a/src/poach.rs
+++ b/src/poach.rs
@@ -52,7 +52,7 @@ enum RunMode {
     // For each egg file under the input path,
     //      Run the egglog program, recording timing information.
     //      Round trip to JSON Value, but do not read/write from file
-    //      Assert the deserialized egraph has hthe same size as the initial egraph.
+    //      Assert the deserialized egraph has the same size as the initial egraph.
     //      Save the completed timeline, for consumption by the nightly frontend
     NoIO,
 
@@ -71,6 +71,11 @@ enum RunMode {
     //      Run the egglog program, skipping declarations of Sorts and Rules
     //      Save the completed timeline, for consumption by the nightly frontend
     Mine,
+
+    // For each egg file under the input path,
+    //      run the egglog program and record timing information.
+    //      Print size information on the serialized egraphs.
+    SizeReport,
 }
 
 impl Display for RunMode {
@@ -87,6 +92,7 @@ impl Display for RunMode {
                 RunMode::NoIO => "no-io",
                 RunMode::Extract => "extract",
                 RunMode::Mine => "mine",
+                RunMode::SizeReport => "size-report",
             }
         )
     }
@@ -128,6 +134,8 @@ fn check_egraph_size(egraph: &TimedEgraph) -> Result<()> {
     Ok(())
 }
 
+// TODO: This is not working right now due to no longer using serde_json
+/*
 fn check_idempotent(p1: &PathBuf, p2: &PathBuf, name: &str, out_dir: &PathBuf) {
     let json1: serde_json::Value = serde_json::from_str(
         &fs::read_to_string(p1).expect(&format!("failed to open {}", p1.display())),
@@ -147,6 +155,7 @@ fn check_idempotent(p1: &PathBuf, p2: &PathBuf, name: &str, out_dir: &PathBuf) {
         panic!("Diff for {}", name)
     }
 }
+*/
 
 fn benchmark_name(egg_file: &Path) -> &str {
     egg_file
@@ -193,7 +202,7 @@ where
             }
         }
     }
-    if failures.len() == 0 {
+    if failures.is_empty() {
         println!("0 failures out of {} files", files.len());
     } else {
         println!("{} failures out of {} files", failures.len(), files.len());
@@ -204,6 +213,7 @@ where
     (successes, failures)
 }
 
+#[allow(dead_code)]
 fn compare_extracts(
     initial_extracts: &[CommandOutput],
     final_extracts: &[CommandOutput],
@@ -242,6 +252,29 @@ fn compare_extracts(
     Ok(())
 }
 
+fn compare_extracts_weak(
+    initial_extracts: &[CommandOutput],
+    final_extracts: &[CommandOutput],
+) -> Result<()> {
+    if initial_extracts.len() != final_extracts.len() {
+        anyhow::bail!("extract lengths mismatch")
+    }
+
+    for (x, y) in initial_extracts.iter().zip(final_extracts) {
+        match (x, y) {
+            (CommandOutput::ExtractBest(_, _, _), CommandOutput::ExtractBest(_, _, _)) => {}
+            (CommandOutput::ExtractVariants(_, _), CommandOutput::ExtractVariants(_, _)) => {}
+            (
+                CommandOutput::MultiExtractVariants(_, _),
+                CommandOutput::MultiExtractVariants(_, _),
+            ) => {}
+            _ => anyhow::bail!("No match : {:?} {:?}", x, y),
+        }
+    }
+
+    Ok(())
+}
+
 fn poach(
     files: Vec<PathBuf>,
     out_dir: &PathBuf,
@@ -269,7 +302,7 @@ fn poach(
             |egg_file, out_dir, timed_egraph| {
                 let name = benchmark_name(egg_file);
                 timed_egraph.run_from_file(egg_file)?;
-                timed_egraph.to_file(&out_dir.join(format!("{name}-serialize.json")))?;
+                timed_egraph.to_file(&out_dir.join(format!("{name}-serialize.fbs")))?;
                 timed_egraph.write_timeline(&out_dir.join(format!("{name}-timeline.json")))?;
                 Ok(())
             },
@@ -282,19 +315,19 @@ fn poach(
             |egg_file, out_dir: &PathBuf, timed_egraph| {
                 let name = benchmark_name(egg_file);
                 timed_egraph.run_from_file(egg_file)?;
-                let s1 = out_dir.join(format!("{name}-serialize1.json"));
+                let s1 = out_dir.join(format!("{name}-serialize1.fbs"));
 
                 timed_egraph
                     .to_file(&s1)
-                    .context("Failed to write s1.json")?;
+                    .context("Failed to write s1.fbs")?;
 
                 timed_egraph
                     .from_file(&s1)
-                    .context("failed to read s1.json")?;
+                    .context("failed to read s1.fbs")?;
 
-                check_egraph_number(&timed_egraph, 2)?;
+                check_egraph_number(timed_egraph, 2)?;
 
-                check_egraph_size(&timed_egraph)?;
+                check_egraph_size(timed_egraph)?;
 
                 timed_egraph.write_timeline(&out_dir.join(format!("{name}-timeline.json")))?;
                 Ok(())
@@ -308,37 +341,37 @@ fn poach(
             |egg_file, out_dir, timed_egraph| {
                 let name = benchmark_name(egg_file);
                 timed_egraph.run_from_file(egg_file)?;
-                let s1 = out_dir.join(format!("{name}-serialize1.json"));
-                let s2 = out_dir.join(format!("{name}-serialize2.json"));
-                let s3 = out_dir.join(format!("{name}-serialize3.json"));
+                let s1 = out_dir.join(format!("{name}-serialize1.fbs"));
+                let s2 = out_dir.join(format!("{name}-serialize2.fbs"));
+                let s3 = out_dir.join(format!("{name}-serialize3.fbs"));
 
                 timed_egraph
                     .to_file(&s1)
-                    .context("failed to serialize s1.json")?;
+                    .context("failed to serialize s1.fbs")?;
 
                 timed_egraph
                     .from_file(&s1)
-                    .context("failed to read s1.json")?;
+                    .context("failed to read s1.fbs")?;
 
                 timed_egraph
                     .to_file(&s2)
-                    .context("failed to serialize s2.json")?;
+                    .context("failed to serialize s2.fbs")?;
 
                 timed_egraph
                     .from_file(&s2)
-                    .context("failed to read s2.json")?;
+                    .context("failed to read s2.fbs")?;
 
                 timed_egraph
                     .to_file(&s3)
-                    .context("failed to serialize s3.json")?;
+                    .context("failed to serialize s3.fbs")?;
 
                 timed_egraph
                     .from_file(&s3)
-                    .context("failed to read s3.json")?;
+                    .context("failed to read s3.fbs")?;
 
-                check_egraph_number(&timed_egraph, 4)?;
-                check_egraph_size(&timed_egraph)?;
-                check_idempotent(&s2, &s3, name, out_dir);
+                check_egraph_number(timed_egraph, 4)?;
+                check_egraph_size(timed_egraph)?;
+                //check_idempotent(&s2, &s3, name, out_dir);
 
                 timed_egraph.write_timeline(&out_dir.join(format!("{name}-timeline.json")))?;
                 Ok(())
@@ -354,8 +387,8 @@ fn poach(
                 timed_egraph.run_from_file(egg_file)?;
 
                 timed_egraph
-                    .to_file(&out_dir.join(format!("{name}-serialize-poach.json")))
-                    .context("failed to write poach.json")?;
+                    .to_file(&out_dir.join(format!("{name}-serialize-poach.fbs")))
+                    .context("failed to write poach.fbs")?;
 
                 timed_egraph
                     .old_serialize_egraph(&out_dir.join(format!("{name}-serialize-old.json")))
@@ -376,15 +409,15 @@ fn poach(
 
                 let value = timed_egraph
                     .to_value()
-                    .context("Failed to encode egraph as json")?;
+                    .context("Failed to encode egraph as flatbuffer")?;
 
                 timed_egraph
                     .from_value(value)
-                    .context("failed to decode egraph from json")?;
+                    .context("failed to decode egraph from flatbuffer")?;
 
-                check_egraph_number(&timed_egraph, 2)?;
+                check_egraph_number(timed_egraph, 2)?;
 
-                check_egraph_size(&timed_egraph)?;
+                check_egraph_size(timed_egraph)?;
 
                 timed_egraph.write_timeline(&out_dir.join(format!("{name}-timeline.json")))?;
 
@@ -418,7 +451,7 @@ fn poach(
                     if let Sexp::List(xs, _) = sexp {
                         if !xs.is_empty() {
                             match &xs[0] {
-                                Sexp::Atom(s, _) => s == "extract",
+                                Sexp::Atom(s, _) => s == "extract" || s == "multi-extract",
                                 _ => false,
                             }
                         } else {
@@ -446,21 +479,46 @@ fn poach(
 
                 let value = timed_egraph
                     .to_value()
-                    .context("Failed to encode egraph as JSON")?;
+                    .context("Failed to encode egraph as Flatbuffer")?;
+
+                let serialized_size = value.len();
 
                 timed_egraph
                     .from_value(value)
-                    .context("failed to decode egraph from json")?;
+                    .context("Failed to decode egraph from Flatbuffer")?;
 
-                check_egraph_number(&timed_egraph, 2)?;
+                check_egraph_number(timed_egraph, 2)?;
 
                 let final_extracts =
                     timed_egraph.run_program_with_timeline(extract_cmds, &extracts)?;
 
-                compare_extracts(&initial_extracts, &final_extracts)?;
+                compare_extracts_weak(&initial_extracts, &final_extracts)?;
 
                 timed_egraph.write_timeline(&out_dir.join(format!("{name}-timeline.json")))?;
 
+                #[derive(Serialize)]
+                struct CSVRecord {
+                    benchname: String,
+                    egraph_size: usize,
+                    serialized_size: usize,
+                    ser_time: u128,
+                    der_time: u128,
+                    ext_time: u128,
+                    run_time: u128,
+                }
+
+                let r = CSVRecord {
+                    benchname: name.to_string(),
+                    egraph_size: timed_egraph.egraphs().last().unwrap().num_tuples(),
+                    serialized_size,
+                    ser_time: timed_egraph.get_total_time(1),
+                    der_time: timed_egraph.get_total_time(2),
+                    ext_time: timed_egraph.get_total_time(3),
+                    run_time: timed_egraph.get_total_time(0),
+                };
+
+                csv::Writer::from_path(out_dir.join(format!("{name}.csv")))?.serialize(r)?;
+
                 Ok(())
             },
         ),
@@ -574,7 +632,7 @@ fn poach(
 
                     let all_cmds = EGraph::default()
                         .parser
-                        .get_program_from_string(None, &program_string)?;
+                        .get_program_from_string(None, program_string)?;
 
                     assert!(all_cmds.len() == all_sexps.len());
 
@@ -660,6 +718,15 @@ fn poach(
                 },
             )
         }
+        RunMode::SizeReport => process_files(
+            &files,
+            out_dir,
+            initial_egraph.as_deref(),
+            |egg_file, _, timed_egraph| {
+                timed_egraph.run_from_file(egg_file)?;
+                timed_egraph.print_size_report(100)
+            },
+        ),
     }
 }
 
diff --git a/src/serialize_size.rs b/src/serialize_size.rs
new file mode 100644
index 000000000..d99b47083
--- /dev/null
+++ b/src/serialize_size.rs
@@ -0,0 +1,248 @@
+use crate::{
+    ast::ResolvedVar,
+    core::{
+        GenericAtom, GenericCoreAction, GenericCoreActions, Query, ResolvedCall, ResolvedCoreRule,
+    },
+    egglog::util::IndexMap,
+    term_encoding::EncodingState,
+    CommandMacroRegistry, EGraph, RunReport, TypeInfo,
+};
+
+/// Generate a json report for the size of a serialized structu
+/// By default, only uses serialize
+/// Allow specalization to look into subfields
+
+#[allow(dead_code)]
+#[derive(Debug, Clone)]
+pub struct SizeReport {
+    name: String,
+    size: usize,
+    fields: Vec<(String, Box<SizeReport>)>,
+}
+
+fn up_to_two_decimals(a: usize, b: usize) -> String {
+    let a100 = a * 100 / b;
+    let high = a100 / 100;
+    let low = a100 % 100;
+    let low_str = if low < 10 {
+        "0".to_string() + &low.to_string()
+    } else {
+        low.to_string()
+    };
+    high.to_string() + "." + &low_str
+}
+
+fn pretty_print_nbytes(size: usize) -> String {
+    if size < 200 {
+        size.to_string() + "B"
+    } else if size < 200 * 1024 {
+        up_to_two_decimals(size, 1024) + "KB"
+    } else if size < 200 * 1024 * 1024 {
+        up_to_two_decimals(size, 1024 * 1024) + "MB"
+    } else {
+        up_to_two_decimals(size, 1024 * 1024 * 1024) + "GB"
+    }
+}
+
+fn truncate_string_with_ellipsis(s: &str, max_len: usize) -> String {
+    if s.chars().count() > max_len {
+        let mut truncated = s.chars().take(max_len).collect::<String>();
+        truncated.push_str(&format!("...{:} chars total", s.len()));
+        truncated
+    } else {
+        s.to_string()
+    }
+}
+
+impl SizeReport {
+    pub fn pretty_print(&self, level: usize, max_level: usize) {
+        if level > max_level {
+            return;
+        }
+        if level == 0 {
+            println!("{} : {}", self.name, pretty_print_nbytes(self.size));
+        }
+        let mut sorted_fields = self.fields.clone();
+        sorted_fields.sort_by(|(_, a), (_, b)| b.size.cmp(&a.size));
+        for (name, sr) in sorted_fields.iter().take(10) {
+            let percentage = (sr.size as f64 / self.size as f64) * 100.0;
+            let indent = level * 2;
+            println!(
+                "  {:indent$}{} : {} ({:.2}%)",
+                "",
+                name,
+                pretty_print_nbytes(sr.size),
+                percentage
+            );
+            if percentage > 1.0 {
+                sr.pretty_print(level + 1, max_level);
+            }
+        }
+        if sorted_fields.len() > 10 {
+            println!("  {:level$} ... {:} fields total", "", sorted_fields.len());
+        }
+    }
+}
+
+fn get_sizerp_default<T: serde::Serialize>(obj: &T) -> SizeReport {
+    let mut buf = flexbuffers::FlexbufferSerializer::new();
+    serde::Serialize::serialize(obj, &mut buf).expect("Failed to serialize in Flexbuffer");
+    SizeReport {
+        name: std::any::type_name::<T>().to_string(),
+        size: buf.view().len(),
+        fields: Vec::new(),
+    }
+}
+
+pub trait GenerateSizeReport: serde::Serialize + Sized {
+    fn get_sizerp(&self) -> SizeReport {
+        get_sizerp_default(self)
+    }
+}
+
+impl<T: serde::Serialize> GenerateSizeReport for Option<T> {}
+
+impl<K: serde::Serialize + ToString, V: serde::Serialize + GenerateSizeReport> GenerateSizeReport
+    for IndexMap<K, V>
+{
+    fn get_sizerp(&self) -> SizeReport {
+        let mut ret = get_sizerp_default(self);
+        for (k, v) in self {
+            ret.fields.push((
+                truncate_string_with_ellipsis(&k.to_string(), 20),
+                Box::new(v.get_sizerp()),
+            ));
+        }
+        ret
+    }
+}
+
+impl GenerateSizeReport for TypeInfo {}
+
+impl GenerateSizeReport for RunReport {}
+
+impl<K: serde::Serialize, V: serde::Serialize + GenerateSizeReport> GenerateSizeReport
+    for egglog_numeric_id::DenseIdMap<K, V>
+{
+}
+
+impl GenerateSizeReport for CommandMacroRegistry {}
+
+impl GenerateSizeReport for EncodingState {}
+
+impl GenerateSizeReport for egglog::Function {}
+
+use egglog::ast::Ruleset;
+use egglog_ast::span::Span;
+
+impl GenerateSizeReport for Span {}
+
+impl<H: serde::Serialize, L: serde::Serialize> GenerateSizeReport for GenericAtom<H, L> {}
+
+impl<H: serde::Serialize, L: serde::Serialize> GenerateSizeReport for Query<H, L> {
+    fn get_sizerp(&self) -> SizeReport {
+        self.atoms.get_sizerp()
+    }
+}
+
+impl<T: serde::Serialize + GenerateSizeReport> GenerateSizeReport for Vec<T> {
+    fn get_sizerp(&self) -> SizeReport {
+        let mut ret = get_sizerp_default(self);
+        for e in self {
+            let rep = e.get_sizerp();
+            ret.fields.push((rep.name.clone(), Box::new(rep)));
+        }
+        ret
+    }
+}
+
+impl<H: serde::Serialize, L: serde::Serialize> GenerateSizeReport for GenericCoreAction<H, L> {}
+
+impl<H: serde::Serialize, L: serde::Serialize> GenerateSizeReport for GenericCoreActions<H, L> {
+    fn get_sizerp(&self) -> SizeReport {
+        self.0.get_sizerp()
+    }
+}
+
+impl GenerateSizeReport for ResolvedCall {}
+
+impl GenerateSizeReport for ResolvedVar {}
+
+impl GenerateSizeReport for ResolvedCoreRule {
+    fn get_sizerp(&self) -> SizeReport {
+        let mut ret = get_sizerp_default(self);
+        ret.fields
+            .push(("span".to_string(), Box::new(self.span.get_sizerp())));
+        ret.fields
+            .push(("body".to_string(), Box::new(self.body.get_sizerp())));
+        ret.fields
+            .push(("head".to_string(), Box::new(self.head.get_sizerp())));
+        ret
+    }
+}
+
+impl<T: serde::Serialize + GenerateSizeReport, S: serde::Serialize + GenerateSizeReport>
+    GenerateSizeReport for (T, S)
+{
+    fn get_sizerp(&self) -> SizeReport {
+        let mut ret = get_sizerp_default(self);
+        ret.fields
+            .push(("0".to_string(), Box::new(self.0.get_sizerp())));
+        ret.fields
+            .push(("1".to_string(), Box::new(self.1.get_sizerp())));
+        ret
+    }
+}
+
+impl GenerateSizeReport for egglog_bridge::RuleId {}
+
+impl GenerateSizeReport for egglog::ast::Ruleset {
+    fn get_sizerp(&self) -> SizeReport {
+        match &self {
+            Ruleset::Rules(mp) => mp.get_sizerp(),
+            Ruleset::Combined(_l) => {
+                //TODO if needed
+                get_sizerp_default(self)
+            }
+        }
+    }
+}
+
+impl GenerateSizeReport for EGraph {
+    fn get_sizerp(&self) -> SizeReport {
+        let mut ret = get_sizerp_default(&self);
+        ret.fields
+            .push(("backend".to_string(), Box::new(self.backend.get_sizerp())));
+        ret.fields.push((
+            "pushed_egraph".to_string(),
+            Box::new(self.pushed_egraph.get_sizerp()),
+        ));
+        ret.fields.push((
+            "functions".to_string(),
+            Box::new(self.functions.get_sizerp()),
+        ));
+        ret.fields
+            .push(("rulesets".to_string(), Box::new(self.rulesets.get_sizerp())));
+        ret.fields.push((
+            "type_info".to_string(),
+            Box::new(self.type_info.get_sizerp()),
+        ));
+        ret.fields.push((
+            "overall_run_report".to_string(),
+            Box::new(self.overall_run_report.get_sizerp()),
+        ));
+        //ret.fields.push((
+        //    "schedulers".to_string(),
+        //    Box::new(self.schedulers.get_sizerp()),
+        //));
+        //ret.fields.push(("commands".to_string(), Box::new(self.commands.get_sizerp())));
+        //ret.fields.push(("command_macros".to_string(), Box::new(self.command_macros.get_sizerp())));
+        ret.fields.push((
+            "proof_state".to_string(),
+            Box::new(self.proof_state.get_sizerp()),
+        ));
+        ret
+    }
+}
+
+impl GenerateSizeReport for egglog_bridge::EGraph {}
diff --git a/src/typechecking.rs b/src/typechecking.rs
index 859f464e5..444dac2d9 100644
--- a/src/typechecking.rs
+++ b/src/typechecking.rs
@@ -318,7 +318,7 @@ impl EGraph {
             }
             NCommand::MultiExtract(span, variants, exprs) => {
                 let res_exprs = exprs
-                    .into_iter()
+                    .iter()
                     .map(|expr| {
                         self.type_info
                             .typecheck_expr(symbol_gen, expr, &Default::default())