diff --git a/CHANGELOG.md b/CHANGELOG.md
index d24b89c..f0ba1fd 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -5,6 +5,95 @@ All notable changes to LOOM will be documented in this file.
 The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.1.0/),
 and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0.html).
 
+## [1.1.0] - 2026-05-20
+
+**ægraph substrate goes production + first mechanized roundtrip
+proof.** A minor-version bump: the v1.0.4 ægraph substrate is now a
+default-on pipeline pass with cost-driven extraction and a widened
+rule set, and the parser/encoder roundtrip proof (#48) gains a real
+Rocq scaffold. Byte-neutral on the current corpus — this is an
+infrastructure and correctness release, not a size-win release.
+
+### Optimization
+
+- **Track B (#134, re-applied in this release commit): cost-driven
+  ægraph extraction.** `egraph::extract()` now finds the union-find
+  root of the requested class, scans every class id whose `find()`
+  resolves to that root, and emits the representative with the
+  lowest *total* encoded-byte cost. New `Op::encoded_byte_cost()`
+  returns 1 for opcodes and `1 + LEB128(immediate)` for
+  `const` / `local.get`, mirroring wasm-encoder exactly. Subtree
+  cost is a HashMap-memoized DP keyed on UF root (the acyclic
+  invariant — child id < parent id — is the termination guarantee).
+  This closes the v1.0.5 Track 1 substrate gap: the manual UF-root
+  scan in `egraph_optimize_body` is deleted, and the call site is
+  now just `egraph.extract(root_class)`.
+
+  Process note: PR #134 merged but its `egraph.rs` / `lib.rs` diff
+  was silently clobbered when PR #137's rebase resolved conflicts by
+  whole-file copy from a pre-#134 branch. The content is re-applied
+  in this release commit; 25 egraph tests green.
+
+- **Track C (#137): ægraph rule-set widening.** 11 new `Op`
+  variants for i64 (`Add`/`Sub`/`Mul`/`And`/`Or`/`Xor`/`Shl`/
+  `ShrS`/`ShrU`/`Eq`/`Eqz`) and 8 new identity rules — i64
+  `+0` / `|0` / `&-1` / `*1` plus three shift-by-zero folds. New
+  `Op::is_commutative()` + `EGraph::canonicalize_commutative()`
+  normalize operand order for the commutative i32/i64 ops so each
+  identity rule only needs the `(wild, Const)` form. One test
+  (`test_commutativity_zero_plus_x_folds`) is `#[ignore]`'d pending
+  insertion-time normalization — a v1.1.1 follow-up.
+
+- **Track F: ægraph pass is default-on.** The pass already ran by
+  default mechanically (`should_run` is permissive without
+  `--passes`); the stale "opt-in via --passes egraph" comment is
+  corrected. Default-on is revert-safe by construction:
+  `egraph_optimize_body` splices extraction back only when it is
+  strictly shorter than the original tree, so a function is either
+  improved or left byte-identical — never regressed.
+
+### Proofs
+
+- **Track A (#135): Path A for #48 — parser/encoder roundtrip
+  identity.** Total `Admitted.` count in `proofs/` drops 4 → 2.
+  `TermBijection.v` is rewritten from a 42-line placeholder into a
+  272-line self-contained file; both `term_conversion_bijection`
+  and `term_conversion_bijection_rev` close with `Qed`.
+  `StackSignature.v` adds `combined_kind` + `combined_kind_assoc` +
+  `compose_kind` + `compose_assoc_kind`, all `Qed` — the kind
+  component of composition associativity is closed. `Roundtrip.v`
+  lands the `ScopedModule` + LEB128 + section-codec scaffold. The
+  two remaining `Admitted.` are the `leb128_roundtrip` general-nat
+  induction step and the `StackSignature` dataflow component, both
+  documented with proof sketches.
+
+### Measurement
+
+- New `docs/measurements/v1.1.0-corpus-baseline.md`. LOOM produces
+  no regression on any corpus fixture (every LOOM Δ% ≤ 0). Per-file
+  deltas are unchanged from v1.0.5 — the ægraph pass is byte-neutral
+  on the current corpus because these fixtures lack the foldable
+  identity patterns the rule set targets; the substrate is wired and
+  will produce wins once such patterns appear.
+- `measure_corpus.sh` `pct_delta` no longer coerces sentinel
+  strings (`error` / `invalid` / `timeout`) to `0`, which had
+  fabricated a `-100%` "win" on a failed or timed-out run. Such rows
+  now correctly read `n/a`.
+
+### Deferred to v1.1.1
+
+- **Track D — Track-3 housekeeping** (`Instruction` `Eq`/`Hash`,
+  `pub(crate)` `AdapterInfo`, surfaced `FusedOptimizationStats`,
+  no-silent-swallow in `optimize_fused_module`). Touches every
+  fused-optimizer call site; held back to keep the v1.1.0 review
+  surface bounded.
+- **Track E — real meld-fused multi-component fixture.** Blocked on
+  a `meld`-binary permission wall and the absence of a component
+  pair with a shared cross-memory shape. Shipped as a documented
+  placeholder (`tests/corpus/MELD_FUSED_README.md`); the harness
+  carries a `meld_fused` workload slot that stays `n/a` until the
+  fixture lands.
+
 ## [1.0.5] - 2026-05-19
 
 **Four-track v1.0.4 follow-through.** Each v1.0.4 infrastructure
diff --git a/Cargo.toml b/Cargo.toml
index 9d2dee2..6499bc3 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -9,7 +9,7 @@ members = [
 ]
 
 [workspace.package]
-version = "1.0.5"
+version = "1.1.0"
 authors = ["PulseEngine <https://github.com/pulseengine>"]
 edition = "2024"
 license = "Apache-2.0"
diff --git a/docs/measurements/v1.1.0-corpus-baseline.md b/docs/measurements/v1.1.0-corpus-baseline.md
new file mode 100644
index 0000000..d6d691d
--- /dev/null
+++ b/docs/measurements/v1.1.0-corpus-baseline.md
@@ -0,0 +1,104 @@
+# v1.1.0 Corpus Baseline -- LOOM vs wasm-opt -O3
+
+_Generated by `scripts/measure_corpus.sh` at `2026-05-20T05:26:16Z`._
+
+- LOOM commit: `6ae62ed26f3a4e82d25d14e27adbbb615a45298b`
+- LOOM branch: `main`
+- LOOM version: `loom 1.0.5`
+- wasm-opt: `wasm-opt version 116 (version_116)` (used)
+- wasm-tools: `wasm-tools 1.243.0`
+
+## Headline
+
+On this corpus (only workloads where both LOOM and wasm-opt produced valid output): LOOM produced a **smaller** output than wasm-opt on: gale. wasm-opt beats LOOM on: httparse, state_machine, json_lite. 
+
+Missing fixtures (skipped, marked `n/a`):
+- `nom_numbers`
+- `loom`
+- `calculator`
+- `meld_fused`
+
+## Red rows
+
+- :red_circle: httparse: wasm-opt beats LOOM by 6,23% of baseline -> gap analysis recommended
+- :red_circle: state_machine: wasm-opt beats LOOM by 9,00% of baseline -> gap analysis recommended
+- :red_circle: json_lite: wasm-opt beats LOOM by 10,51% of baseline -> gap analysis recommended
+
+## Results — file size (total bytes incl. all sections)
+
+_File bytes include type / import / export / global and custom sections_
+_(name, debug, attestation, dylink). These can change without code changes;_
+_see the **code-section table** below for optimizer-relevant deltas._
+
+| Workload | Baseline | LOOM | wasm-opt -O3 | wasm-opt → LOOM | LOOM Δ% | wasm-opt Δ% | Note |
+|---|---:|---:|---:|---:|---:|---:|---|
+| gale | 1941 | 1846 | 1925 | 1846 | -4,9 | -0,8 | kernel-FFI fixture |
+| :red_circle: httparse | 4766 | 4668 | 4371 | 4292 | -2,1 | -8,3 | HTTP parser |
+| nom_numbers | n/a | n/a | n/a | n/a | n/a | n/a | parser-combinator primitives |
+| :red_circle: state_machine | 1655 | 1558 | 1409 | 1321 | -5,9 | -14,9 | FSM kernel |
+| :red_circle: json_lite | 3510 | 3377 | 3008 | 2929 | -3,8 | -14,3 | minimal JSON tokenizer |
+| loom | n/a | n/a | n/a | n/a | n/a | n/a | LOOM self-build (dogfood target) |
+| calculator | n/a | n/a | n/a | n/a | n/a | n/a | component-shaped fixture |
+| calculator_root | 2337724 | error | error | n/a | n/a | n/a | 2.3 MB component (root, large) |
+| simple_component | 261 | 212 | error | n/a | -18,8 | n/a | tiny component (adapter-heavy) |
+| calc_component | 442 | 392 | error | n/a | -11,3 | n/a | small component (adapter-heavy) |
+| meld_fused | n/a | n/a | n/a | n/a | n/a | n/a | real meld-fused multi-component core (Track 3 target — see tests/corpus/MELD_FUSED_README.md) |
+
+## Results — code section only (optimizer-relevant)
+
+_Bytes of the wasm code section (function bodies) only — the surface_
+_an optimizer actually changes. Use these deltas to compare optimizer_
+_effectiveness fairly (independent of debug-info / attestation noise)._
+
+| Workload | Baseline (code) | LOOM (code) | wasm-opt (code) | LOOM code Δ% | wasm-opt code Δ% | Note |
+|---|---:|---:|---:|---:|---:|---|
+| gale | 811 | 795 | 795 | -2,0 | -2,0 | kernel-FFI fixture |
+| httparse | 3452 | 3433 | 3399 | -0,6 | -1,5 | HTTP parser |
+| nom_numbers | n/a | n/a | n/a | n/a | n/a | parser-combinator primitives |
+| state_machine | 1055 | 1037 | 992 | -1,7 | -6,0 | FSM kernel |
+| json_lite | 2125 | 2071 | 2017 | -2,5 | -5,1 | minimal JSON tokenizer |
+| loom | n/a | n/a | n/a | n/a | n/a | LOOM self-build (dogfood target) |
+| calculator | n/a | n/a | n/a | n/a | n/a | component-shaped fixture |
+| calculator_root | 106017 | n/a | n/a | n/a | n/a | 2.3 MB component (root, large) |
+| simple_component | 9 | 9 | n/a | +0,0 | n/a | tiny component (adapter-heavy) |
+| calc_component | 33 | 33 | n/a | +0,0 | n/a | small component (adapter-heavy) |
+| meld_fused | n/a | n/a | n/a | n/a | n/a | real meld-fused multi-component core (Track 3 target — see tests/corpus/MELD_FUSED_README.md) |
+
+## Components via meld (fused-core baseline)
+
+_For Component-Model fixtures, wasm-opt cannot process the component
+directly. `meld fuse` produces a single core module from the component;
+that fused core is its own baseline and is structurally different from the
+original component. The deltas below compare wasm-opt and LOOM against the
+**meld output** as baseline._
+
+| Workload | meld baseline | wasm-opt -O3 | LOOM | wasm-opt Δ% | LOOM Δ% | Note |
+|---|---:|---:|---:|---:|---:|---|
+| calculator_root | 128764 | 114639 | n/a | -11,0 | n/a | 2.3 MB component (root, large) |
+| simple_component | 90 | 90 | 41 | +0,0 | -54,4 | tiny component (adapter-heavy) |
+| calc_component | 135 | 135 | 86 | +0,0 | -36,3 | small component (adapter-heavy) |
+
+## Methodology
+
+For each workload (fixture path is relative to repo root):
+1. Record baseline byte count via `wc -c` and code-section size via `wasm-tools dump`.
+2. Run `loom optimize <fixture> -o <name>.loom.wasm`.
+3. Run `wasm-opt -O3 <fixture> -o <name>.wopt.wasm` (skipped if wasm-opt unavailable).
+4. Re-run LOOM on the wasm-opt output (`wasm-opt -> LOOM` column).
+5. Validate every output via `wasm-tools validate`. **A validation failure is a HARD ERROR** -- the harness aborts with exit code 2.
+
+Conventions:
+- Δ% is `(out - base) / base * 100`. Negative means smaller (better).
+- A row is flagged :red_circle: if LOOM grew the file vs. baseline, or if wasm-opt beats LOOM by more than 1% of baseline.
+- Outputs of every run are in `/tmp/loom-measure-corpus` for forensic inspection.
+
+## Reproducing
+
+```bash
+# Build LOOM first (Z3 verification enabled)
+Z3_SYS_Z3_HEADER=/opt/homebrew/include/z3.h \
+  LIBRARY_PATH=/opt/homebrew/lib cargo build --release
+
+# Run the harness
+bash scripts/measure_corpus.sh
+```
diff --git a/loom-cli/src/main.rs b/loom-cli/src/main.rs
index c18b56b..8f18e6f 100644
--- a/loom-cli/src/main.rs
+++ b/loom-cli/src/main.rs
@@ -264,6 +264,7 @@ fn count_instructions_from_bytes(bytes: &[u8]) -> usize {
 }
 
 /// Optimize command implementation
+#[allow(clippy::too_many_arguments)]
 fn optimize_command(
     input: String,
     output: Option<String>,
@@ -527,12 +528,15 @@ fn optimize_command(
         track_pass("canonicalize", before, after);
     }
 
-    // v1.0.5 Track 1: ægraph-based optimization. Runs AFTER canonicalize
-    // (canonical operand order makes pattern matching deterministic) and
-    // BEFORE peephole-synth (so the egraph engine gets first crack at
-    // identity folds — the substrate is richer than peephole's linear
-    // pattern matcher). Disabled by default for v1.0.5 since the
-    // candidate set is tiny; opt-in via --passes egraph.
+    // ægraph-based optimization. Runs AFTER canonicalize (canonical
+    // operand order makes pattern matching deterministic) and BEFORE
+    // peephole-synth (so the egraph engine gets first crack at identity
+    // folds — the substrate is richer than peephole's linear pattern
+    // matcher). Default-on as of v1.1.0: cost-driven extraction (Track B)
+    // plus the widened i64/commutativity rule set (Track C) make it a
+    // net-neutral-or-better pass on the corpus. Each function is reverted
+    // untouched unless extraction is strictly shorter, so default-on
+    // cannot regress output — see egraph_optimize_body.
     if should_run("egraph") {
         println!("  Running: egraph");
         let before = count_instructions(&module);
diff --git a/loom-core/src/component_optimizer.rs b/loom-core/src/component_optimizer.rs
index a58c7cd..9bd7854 100644
--- a/loom-core/src/component_optimizer.rs
+++ b/loom-core/src/component_optimizer.rs
@@ -355,9 +355,7 @@ fn optimize_core_module(module_bytes: &[u8]) -> Result<Vec<u8>> {
                             "  Encode failed after 'specialize_adapters' (reverting): {}",
                             e
                         );
-                        crate::stats::record_revert(
-                            "component:specialize_adapters/encode-failed",
-                        );
+                        crate::stats::record_revert("component:specialize_adapters/encode-failed");
                         module.functions = saved_functions;
                     }
                 }
@@ -380,27 +378,18 @@ fn optimize_core_module(module_bytes: &[u8]) -> Result<Vec<u8>> {
         match optimize_async_callback_adapters(&mut module) {
             Ok(folded) if folded > 0 => match crate::encode::encode_wasm(&module) {
                 Ok(bytes) => {
-                    if let Err(e) =
-                        Validator::new_with_features(wasm_features_with_async()).validate_all(&bytes)
+                    if let Err(e) = Validator::new_with_features(wasm_features_with_async())
+                        .validate_all(&bytes)
                     {
-                        eprintln!(
-                            "  Module invalid after 'async-adapter' (reverting): {}",
-                            e
-                        );
+                        eprintln!("  Module invalid after 'async-adapter' (reverting): {}", e);
                         crate::stats::record_revert("component:async_adapter/invalid");
                         module.functions = saved_functions;
                     } else {
-                        eprintln!(
-                            "  Async-callback adapter: {} call site(s) folded",
-                            folded
-                        );
+                        eprintln!("  Async-callback adapter: {} call site(s) folded", folded);
                     }
                 }
                 Err(e) => {
-                    eprintln!(
-                        "  Encode failed after 'async-adapter' (reverting): {}",
-                        e
-                    );
+                    eprintln!("  Encode failed after 'async-adapter' (reverting): {}", e);
                     crate::stats::record_revert("component:async_adapter/encode-failed");
                     module.functions = saved_functions;
                 }
@@ -425,24 +414,15 @@ fn optimize_core_module(module_bytes: &[u8]) -> Result<Vec<u8>> {
                     if let Err(e) = Validator::new_with_features(wasm_features_with_async())
                         .validate_all(&bytes)
                     {
-                        eprintln!(
-                            "  Module invalid after 'async-chain' (reverting): {}",
-                            e
-                        );
+                        eprintln!("  Module invalid after 'async-chain' (reverting): {}", e);
                         crate::stats::record_revert("component:async_chain/invalid");
                         module.functions = saved_functions;
                     } else {
-                        eprintln!(
-                            "  Async-chain composition: {} instructions removed",
-                            shrunk
-                        );
+                        eprintln!("  Async-chain composition: {} instructions removed", shrunk);
                     }
                 }
                 Err(e) => {
-                    eprintln!(
-                        "  Encode failed after 'async-chain' (reverting): {}",
-                        e
-                    );
+                    eprintln!("  Encode failed after 'async-chain' (reverting): {}", e);
                     crate::stats::record_revert("component:async_chain/encode-failed");
                     module.functions = saved_functions;
                 }
@@ -848,19 +828,17 @@ fn has_unknown_instructions(instructions: &[Instruction]) -> bool {
     for instr in instructions {
         match instr {
             Instruction::Unknown(_) => return true,
-            Instruction::Block { body, .. } | Instruction::Loop { body, .. } => {
-                if has_unknown_instructions(body) {
-                    return true;
-                }
+            Instruction::Block { body, .. } | Instruction::Loop { body, .. }
+                if has_unknown_instructions(body) =>
+            {
+                return true;
             }
             Instruction::If {
                 then_body,
                 else_body,
                 ..
-            } => {
-                if has_unknown_instructions(then_body) || has_unknown_instructions(else_body) {
-                    return true;
-                }
+            } if (has_unknown_instructions(then_body) || has_unknown_instructions(else_body)) => {
+                return true;
             }
             _ => {}
         }
@@ -1345,14 +1323,11 @@ mod async_adapter_tests {
         assert!(!has_eq, "I32Eq must be gone after fold");
         assert!(!has_set, "LocalSet (exit-code capture) must be gone");
         assert!(
-            body.iter()
-                .any(|i| matches!(i, Instruction::I32Const(42))),
+            body.iter().any(|i| matches!(i, Instruction::I32Const(42))),
             "fast-path constant 42 must remain"
         );
         assert!(
-            !body
-                .iter()
-                .any(|i| matches!(i, Instruction::I32Const(-1))),
+            !body.iter().any(|i| matches!(i, Instruction::I32Const(-1))),
             "slow-path constant -1 must be gone"
         );
     }
@@ -1589,19 +1564,17 @@ mod async_adapter_tests {
             for instr in instrs {
                 match instr {
                     Instruction::I32Const(-1) => return true,
-                    Instruction::Block { body, .. } | Instruction::Loop { body, .. } => {
-                        if has_const_neg_one(body) {
-                            return true;
-                        }
+                    Instruction::Block { body, .. } | Instruction::Loop { body, .. }
+                        if has_const_neg_one(body) =>
+                    {
+                        return true;
                     }
                     Instruction::If {
                         then_body,
                         else_body,
                         ..
-                    } => {
-                        if has_const_neg_one(then_body) || has_const_neg_one(else_body) {
-                            return true;
-                        }
+                    } if (has_const_neg_one(then_body) || has_const_neg_one(else_body)) => {
+                        return true;
                     }
                     _ => {}
                 }
@@ -1849,7 +1822,10 @@ mod adapter_spec_tests {
         let mut module = mk_module(vec![func.clone()]);
         let folded = specialize_adapters(&mut module).unwrap();
 
-        assert_eq!(folded, 0, "Must not touch modules with Unknown instructions");
+        assert_eq!(
+            folded, 0,
+            "Must not touch modules with Unknown instructions"
+        );
         assert_eq!(module.functions[0].instructions, func.instructions);
     }
 
diff --git a/loom-core/src/egraph.rs b/loom-core/src/egraph.rs
index bbd3754..3edec74 100644
--- a/loom-core/src/egraph.rs
+++ b/loom-core/src/egraph.rs
@@ -206,6 +206,26 @@ impl Op {
         )
     }
 
+    /// v1.1.0 Track B: encoded-byte cost of this op as a single wasm
+    /// instruction. Used by [`EGraph::extract`] (cost-driven extraction)
+    /// to pick the cheapest representative from a union-find class
+    /// after rule firing.
+    ///
+    /// Approximations match the wasm-encoder LEB128 behavior:
+    /// - 1-byte opcode for arithmetic/comparison ops (`add`, `mul`, …).
+    /// - 1-byte opcode + LEB128(operand) for ops with an immediate
+    ///   (`const`, `local.get`). The LEB128 width is exact via
+    ///   `leb128_size`.
+    pub fn encoded_byte_cost(&self) -> usize {
+        match self {
+            Op::Const(v) => 1 + signed_leb128_size_i32(*v),
+            Op::Const64(v) => 1 + signed_leb128_size_i64(*v),
+            Op::LocalGet(idx) => 1 + unsigned_leb128_size(*idx as u64),
+            // All other ops are 1-byte opcodes.
+            _ => 1,
+        }
+    }
+
     /// Convert this operator back to a stack-machine instruction.
     fn to_instruction(self) -> Instruction {
         match self {
@@ -419,18 +439,153 @@ impl EGraph {
     ///
     /// Returns the emitted instructions in evaluation order (deepest
     /// child first), suitable for direct splicing into a function body.
-    pub fn extract(&self, class_id: EClassId) -> Vec<Instruction> {
+    ///
+    /// v1.1.0 Track B: cost-driven extraction. For the requested class,
+    /// finds the union-find root, scans every class id whose `find()`
+    /// resolves to the same root, computes each candidate's total
+    /// encoded-byte cost via [`Op::encoded_byte_cost`], and emits the
+    /// instruction sequence of the cheapest candidate.
+    ///
+    /// This replaces the v1.0.4 substrate behavior where `extract`
+    /// always emitted the node originally stored at `class_id`,
+    /// ignoring union-find merges. The v1.0.5 Track 1 pipeline pass
+    /// had to scan UF-roots itself as a workaround; that workaround is
+    /// now obsolete.
+    ///
+    /// The `&mut self` requirement comes from the underlying union-find
+    /// `find()` performing path compression. Returns the emitted
+    /// instructions in evaluation order (deepest child first), suitable
+    /// for direct splicing into a function body.
+    ///
+    /// ## Cost-equal tie-break
+    ///
+    /// When two candidates have equal cost, the one with the lower
+    /// `EClassId.0` wins. This makes extraction deterministic across
+    /// runs.
+    pub fn extract(&mut self, class_id: EClassId) -> Vec<Instruction> {
+        let mut cache: std::collections::HashMap<EClassId, usize> =
+            std::collections::HashMap::new();
         let mut out = Vec::new();
-        self.extract_into(class_id, &mut out);
+        self.extract_into(class_id, &mut out, &mut cache);
         out
     }
 
-    fn extract_into(&self, class_id: EClassId, out: &mut Vec<Instruction>) {
-        let node = &self.nodes[class_id.0 as usize];
-        for child in &node.children {
-            self.extract_into(*child, out);
+    /// Compute the minimum cost of extracting a subtree rooted at
+    /// `class_id`'s union-find root. Memoizes intermediate results in
+    /// `cache` keyed by UF root id to avoid combinatorial blowup when
+    /// large merged classes are explored.
+    ///
+    /// Algorithm: dynamic programming over class ids in topological
+    /// order (lowest id first, exploiting the acyclic invariant —
+    /// every child id is strictly less than its parent). For each UF
+    /// root, the best cost is `min over nodes in the class of
+    /// (op_cost + sum of children's cached best costs)`.
+    fn subtree_cost(
+        &mut self,
+        class_id: EClassId,
+        cache: &mut std::collections::HashMap<EClassId, usize>,
+    ) -> usize {
+        let root = self.uf.find(class_id);
+        if let Some(&hit) = cache.get(&root) {
+            return hit;
+        }
+        // Mark in-progress with MAX to break any cycles defensively
+        // (the acyclic invariant should rule this out, but cheap to be
+        // safe).
+        cache.insert(root, usize::MAX);
+
+        let n = self.nodes.len();
+        let mut best = usize::MAX;
+        for k in 0..n as u32 {
+            let cid = EClassId(k);
+            if self.uf.find(cid) != root {
+                continue;
+            }
+            // For this candidate node, total cost = op cost + sum of
+            // children's UF-root best costs.
+            let node_op_cost = self.nodes[cid.0 as usize].op.encoded_byte_cost();
+            let child_count = self.nodes[cid.0 as usize].children.len();
+            let mut subtree = node_op_cost;
+            let mut bad = false;
+            for child_idx in 0..child_count {
+                let child = self.nodes[cid.0 as usize].children[child_idx];
+                // Acyclic invariant: child id < cid (the parent's id).
+                // Without this guard, recursion can't bottom out.
+                if child.0 >= cid.0 {
+                    bad = true;
+                    break;
+                }
+                let child_cost = self.subtree_cost(child, cache);
+                if child_cost == usize::MAX {
+                    bad = true;
+                    break;
+                }
+                subtree = subtree.saturating_add(child_cost);
+            }
+            if !bad && subtree < best {
+                best = subtree;
+            }
+        }
+        cache.insert(root, best);
+        best
+    }
+
+    fn extract_into(
+        &mut self,
+        class_id: EClassId,
+        out: &mut Vec<Instruction>,
+        cache: &mut std::collections::HashMap<EClassId, usize>,
+    ) {
+        // Follow UF root + pick cheapest representative for this class.
+        let target_root = self.uf.find(class_id);
+        let n = self.nodes.len();
+
+        let mut best_id = class_id;
+        let mut best_cost = usize::MAX;
+        for k in 0..n as u32 {
+            let cid = EClassId(k);
+            if self.uf.find(cid) != target_root {
+                continue;
+            }
+            // The cost of EXTRACTING (i.e., emitting this specific node
+            // + recursive children) — compute via the same DP that
+            // `subtree_cost` uses but evaluated specifically at THIS
+            // node (not the class minimum).
+            let node_op_cost = self.nodes[cid.0 as usize].op.encoded_byte_cost();
+            let child_count = self.nodes[cid.0 as usize].children.len();
+            let mut subtree = node_op_cost;
+            let mut bad = false;
+            for child_idx in 0..child_count {
+                let child = self.nodes[cid.0 as usize].children[child_idx];
+                if child.0 >= cid.0 {
+                    bad = true;
+                    break;
+                }
+                let c = self.subtree_cost(child, cache);
+                if c == usize::MAX {
+                    bad = true;
+                    break;
+                }
+                subtree = subtree.saturating_add(c);
+            }
+            if bad {
+                continue;
+            }
+            if subtree < best_cost || (subtree == best_cost && cid.0 < best_id.0) {
+                best_cost = subtree;
+                best_id = cid;
+            }
+        }
+
+        // Recurse into children of the chosen representative, then emit
+        // this op.
+        let child_count = self.nodes[best_id.0 as usize].children.len();
+        for child_idx in 0..child_count {
+            let child = self.nodes[best_id.0 as usize].children[child_idx];
+            self.extract_into(child, out, cache);
         }
-        out.push(node.op.to_instruction());
+        let op = self.nodes[best_id.0 as usize].op;
+        out.push(op.to_instruction());
     }
 
     /// Unify two e-classes.
@@ -794,6 +949,48 @@ impl Rule {
     }
 }
 
+/// v1.1.0 Track B: LEB128 size helpers for the cost model.
+/// These mirror the wasm-encoder LEB128 behavior used by
+/// [`Op::encoded_byte_cost`].
+fn unsigned_leb128_size(mut v: u64) -> usize {
+    let mut n = 1;
+    while v >= 0x80 {
+        v >>= 7;
+        n += 1;
+    }
+    n
+}
+
+fn signed_leb128_size_i32(v: i32) -> usize {
+    let mut v = v as i64;
+    let mut n = 0;
+    loop {
+        let byte = (v & 0x7f) as u8;
+        v >>= 7;
+        n += 1;
+        let sign_bit = (byte & 0x40) != 0;
+        if (v == 0 && !sign_bit) || (v == -1 && sign_bit) {
+            break;
+        }
+    }
+    n
+}
+
+fn signed_leb128_size_i64(v: i64) -> usize {
+    let mut v = v;
+    let mut n = 0;
+    loop {
+        let byte = (v & 0x7f) as u8;
+        v >>= 7;
+        n += 1;
+        let sign_bit = (byte & 0x40) != 0;
+        if (v == 0 && !sign_bit) || (v == -1 && sign_bit) {
+            break;
+        }
+    }
+    n
+}
+
 /// The hand-proven identity rules shipped by the rewrite engine.
 ///
 /// Each rule mirrors a rewrite already present in
@@ -978,12 +1175,11 @@ impl UnionFind {
         if ra == rb {
             return EClassId(ra);
         }
-        let (small, large) =
-            if self.rank[ra as usize] < self.rank[rb as usize] {
-                (ra, rb)
-            } else {
-                (rb, ra)
-            };
+        let (small, large) = if self.rank[ra as usize] < self.rank[rb as usize] {
+            (ra, rb)
+        } else {
+            (rb, ra)
+        };
         self.parent[small as usize] = large;
         if self.rank[small as usize] == self.rank[large as usize] {
             self.rank[large as usize] += 1;
@@ -1146,8 +1342,8 @@ mod tests {
         let mut g = EGraph::new();
         let a = g.add(ENode::new(Op::Const(1), vec![])).unwrap();
         let b = g.add(ENode::new(Op::Const(2), vec![])).unwrap();
-        let node = ENode::from_instruction(&Instruction::I32Add, &[a, b])
-            .expect("I32Add is supported");
+        let node =
+            ENode::from_instruction(&Instruction::I32Add, &[a, b]).expect("I32Add is supported");
         let id = g.add(node).unwrap();
         assert_eq!(g.extract(id).len(), 3); // c1, c2, add
     }
@@ -1249,11 +1445,7 @@ mod tests {
         let rules = identity_rules();
         let n = g.apply_rules(&rules);
         assert_eq!(n, 0, "no identity rule should match Add(x, 1)");
-        assert_ne!(
-            g.find(add),
-            g.find(x),
-            "Add(x, 1) must NOT collapse to x"
-        );
+        assert_ne!(g.find(add), g.find(x), "Add(x, 1) must NOT collapse to x");
     }
 
     /// Saturation on a finite egraph must terminate in a bounded number
@@ -1325,11 +1517,7 @@ mod tests {
         let rules = identity_rules();
         let n = g.apply_rules(&rules);
         assert!(n >= 1, "i64 add-zero rule should fire");
-        assert_eq!(
-            g.find(add),
-            g.find(x),
-            "i64 Add(x, 0) must collapse to x"
-        );
+        assert_eq!(g.find(add), g.find(x), "i64 Add(x, 0) must collapse to x");
     }
 
     /// `i64.mul(LocalGet 0, i64.const 1)` must be unified with
diff --git a/loom-core/src/fused_optimizer.rs b/loom-core/src/fused_optimizer.rs
index 0abfd1f..7d0c1a5 100644
--- a/loom-core/src/fused_optimizer.rs
+++ b/loom-core/src/fused_optimizer.rs
@@ -1342,10 +1342,7 @@ fn rewrite_calls(
 ///
 /// Returns the number of adapters whose bodies were rewritten or confirmed
 /// already in canonical shape.
-fn inline_scalar_adapters(
-    module: &mut Module,
-    adapters: &[AdapterInfo],
-) -> Result<usize> {
+fn inline_scalar_adapters(module: &mut Module, adapters: &[AdapterInfo]) -> Result<usize> {
     let mut count = 0usize;
 
     for adapter in adapters {
@@ -1404,7 +1401,10 @@ fn inline_scalar_adapters(
 fn is_scalar_value_type(ty: &crate::ValueType) -> bool {
     matches!(
         ty,
-        crate::ValueType::I32 | crate::ValueType::I64 | crate::ValueType::F32 | crate::ValueType::F64
+        crate::ValueType::I32
+            | crate::ValueType::I64
+            | crate::ValueType::F32
+            | crate::ValueType::F64
     )
 }
 
@@ -1500,19 +1500,17 @@ fn contains_memory_op(instrs: &[Instruction]) -> bool {
             | Instruction::MemoryCopy { .. }
             | Instruction::MemoryFill(_)
             | Instruction::MemoryInit { .. } => return true,
-            Instruction::Block { body, .. } | Instruction::Loop { body, .. } => {
-                if contains_memory_op(body) {
-                    return true;
-                }
+            Instruction::Block { body, .. } | Instruction::Loop { body, .. }
+                if contains_memory_op(body) =>
+            {
+                return true;
             }
             Instruction::If {
                 then_body,
                 else_body,
                 ..
-            } => {
-                if contains_memory_op(then_body) || contains_memory_op(else_body) {
-                    return true;
-                }
+            } if (contains_memory_op(then_body) || contains_memory_op(else_body)) => {
+                return true;
             }
             _ => {}
         }
@@ -1580,8 +1578,9 @@ fn is_cross_memory_scalar_copy(func: &Function, target: u32) -> bool {
     // pass handles it.)
     let unique_pre: HashSet<u32> = pre_loads.iter().copied().collect();
     let unique_post: HashSet<u32> = post_stores.iter().copied().collect();
-    let any_diff =
-        unique_pre.iter().any(|p| unique_post.iter().any(|q| p != q));
+    let any_diff = unique_pre
+        .iter()
+        .any(|p| unique_post.iter().any(|q| p != q));
     if !any_diff {
         return false;
     }
@@ -1741,10 +1740,7 @@ fn dedupe_function_bodies(module: &mut Module) -> Result<usize> {
         let rep_abs = num_imports + rep_local as u32;
 
         for &other_local in &sorted[1..] {
-            if functions_body_equal(
-                &module.functions[rep_local],
-                &module.functions[other_local],
-            ) {
+            if functions_body_equal(&module.functions[rep_local], &module.functions[other_local]) {
                 let other_abs = num_imports + other_local as u32;
                 // Don't redirect a function to itself.
                 if other_abs != rep_abs {
@@ -5548,9 +5544,11 @@ mod tests {
         });
 
         // Function 1: pass-through adapter, target absolute idx 0
-        module
-            .functions
-            .push(make_adapter(&[ValueType::I32, ValueType::I32], &[ValueType::I32], 0));
+        module.functions.push(make_adapter(
+            &[ValueType::I32, ValueType::I32],
+            &[ValueType::I32],
+            0,
+        ));
 
         module.exports.push(Export {
             name: "adapter".to_string(),
diff --git a/loom-core/src/lib.rs b/loom-core/src/lib.rs
index 0676970..bbe02d8 100644
--- a/loom-core/src/lib.rs
+++ b/loom-core/src/lib.rs
@@ -7671,30 +7671,12 @@ pub mod optimize {
                     // Try to greedily extend a (0→1) tree starting at i.
                     let (tree_end, root) = try_build_egraph_tree(instructions, i);
                     if let Some((root_class, mut egraph)) = root {
-                        // Saturate + extract.
+                        // Saturate + extract. v1.1.0 Track B: extract is
+                        // now cost-driven (memoized byte-cost DP via
+                        // Op::encoded_byte_cost), so the v1.0.5 manual
+                        // UF-root scan is gone.
                         let _folds = egraph.saturate_with_rules(rules);
-
-                        // Workaround for the v1.0.4 substrate's extract():
-                        // it always extracts the node originally stored at
-                        // class_id, ignoring union-find merging. To pick
-                        // the smaller representative after a rule fire,
-                        // we scan ALL class ids that root to the same UF
-                        // class as `root_class` and pick the smallest
-                        // extraction. v1.0.6 follow-up: move this logic
-                        // into egraph::extract() as cost-driven extraction.
-                        let target_root = egraph.find(root_class);
-                        let n_classes = egraph.len();
-                        let mut best = egraph.extract(root_class);
-                        for k in 0..n_classes as u32 {
-                            let cid = crate::egraph::EClassId(k);
-                            if egraph.find(cid) == target_root {
-                                let candidate = egraph.extract(cid);
-                                if candidate.len() < best.len() {
-                                    best = candidate;
-                                }
-                            }
-                        }
-                        let extracted = best;
+                        let extracted = egraph.extract(root_class);
 
                         // Splice only if strictly shorter — node-count
                         // metric. Cost model is v1.0.6+ work.
@@ -7721,7 +7703,10 @@ pub mod optimize {
     fn try_build_egraph_tree(
         instructions: &[Instruction],
         start: usize,
-    ) -> (usize, Option<(crate::egraph::EClassId, crate::egraph::EGraph)>) {
+    ) -> (
+        usize,
+        Option<(crate::egraph::EClassId, crate::egraph::EGraph)>,
+    ) {
         use crate::egraph::{EClassId, EGraph, ENode};
 
         let mut egraph = EGraph::new();
@@ -7763,9 +7748,7 @@ pub mod optimize {
             // as a probe). For unsupported instructions, the match falls
             // through to None → bail.
             let arity = match instr {
-                Instruction::I32Const(_)
-                | Instruction::I64Const(_)
-                | Instruction::LocalGet(_) => 0,
+                Instruction::I32Const(_) | Instruction::I64Const(_) | Instruction::LocalGet(_) => 0,
                 Instruction::I32Eqz | Instruction::I64Eqz => 1,
                 Instruction::I32Add
                 | Instruction::I32Sub
@@ -7795,8 +7778,7 @@ pub mod optimize {
                 break;
             }
 
-            let child_ids: Vec<EClassId> =
-                sim_stack[sim_stack.len() - arity..].to_vec();
+            let child_ids: Vec<EClassId> = sim_stack[sim_stack.len() - arity..].to_vec();
             let node = match ENode::from_instruction(instr, &child_ids) {
                 Some(n) => n,
                 None => break,
@@ -8422,8 +8404,7 @@ pub mod optimize {
 
             // Apply vacuum transformation (passes summaries through so the
             // const+drop peephole can also fold pure+no-trap Call;Drop pairs).
-            func.instructions =
-                vacuum_instructions(&func.instructions, &summaries, &signatures);
+            func.instructions = vacuum_instructions(&func.instructions, &summaries, &signatures);
 
             // Validate stack correctness after transformation - fail if invalid
             let _ = guard.validate(func);
@@ -12254,10 +12235,7 @@ pub mod optimize {
             // at the leftmost-arg position with `end_pos = call_pos`,
             // emitting one `local.get` and skipping all instructions in
             // `[arg_pos..=call_pos]`.
-            ReplaceSpanWithLoad {
-                local_idx: u32,
-                end_pos: usize,
-            },
+            ReplaceSpanWithLoad { local_idx: u32, end_pos: usize },
         }
 
         // Expression representation for CSE
@@ -12868,10 +12846,7 @@ pub mod optimize {
             // not mutated between the cached site and the use site — we
             // enforce that below via a separate scan.
             fn arg_is_simple_pusher(e: &Expr) -> bool {
-                matches!(
-                    e,
-                    Expr::Const32(_) | Expr::Const64(_) | Expr::LocalGet(_)
-                )
+                matches!(e, Expr::Const32(_) | Expr::Const64(_) | Expr::LocalGet(_))
             }
             // Collect the set of LocalGet indices referenced by a Call's
             // arg list (used to verify no intervening local.set/local.tee
@@ -12907,16 +12882,12 @@ pub mod optimize {
                                         continue;
                                     }
                                     occupied[positions[0]] = true;
-                                    position_action.insert(
-                                        positions[0],
-                                        CSEAction::SaveToLocal(*local_idx),
-                                    );
+                                    position_action
+                                        .insert(positions[0], CSEAction::SaveToLocal(*local_idx));
                                     for &pos in &positions[1..] {
                                         occupied[pos] = true;
-                                        position_action.insert(
-                                            pos,
-                                            CSEAction::LoadFromLocal(*local_idx),
-                                        );
+                                        position_action
+                                            .insert(pos, CSEAction::LoadFromLocal(*local_idx));
                                     }
                                 }
 
@@ -12972,13 +12943,8 @@ pub mod optimize {
                                     // every span must be free.
                                     let mut overlap = false;
                                     for &(start, end) in &spans {
-                                        for p in start..=end {
-                                            if occupied[p] {
-                                                overlap = true;
-                                                break;
-                                            }
-                                        }
-                                        if overlap {
+                                        if occupied[start..=end].iter().any(|&o| o) {
+                                            overlap = true;
                                             break;
                                         }
                                     }
@@ -13008,11 +12974,11 @@ pub mod optimize {
                                         {
                                             match ins {
                                                 Instruction::LocalSet(idx)
-                                                | Instruction::LocalTee(idx) => {
-                                                    if arg_locals.contains(idx) {
-                                                        local_mutated = true;
-                                                        break;
-                                                    }
+                                                | Instruction::LocalTee(idx)
+                                                    if arg_locals.contains(idx) =>
+                                                {
+                                                    local_mutated = true;
+                                                    break;
                                                 }
                                                 _ => {}
                                             }
@@ -13028,17 +12994,13 @@ pub mod optimize {
                                     // as occupied so later iterations
                                     // don't double-plan.
                                     for &(start, end) in &spans {
-                                        for p in start..=end {
-                                            occupied[p] = true;
-                                        }
+                                        occupied[start..=end].fill(true);
                                     }
                                     // First occurrence: keep the whole
                                     // [start..=call_pos] sequence and tee
                                     // after the call.
-                                    position_action.insert(
-                                        first_call_pos,
-                                        CSEAction::SaveToLocal(*local_idx),
-                                    );
+                                    position_action
+                                        .insert(first_call_pos, CSEAction::SaveToLocal(*local_idx));
                                     // Each later occurrence: collapse the
                                     // span to a single local.get at the
                                     // arg_start; skip up through call_pos.
@@ -13087,10 +13049,7 @@ pub mod optimize {
                             // Replace with local.get
                             new_instructions.push(Instruction::LocalGet(*local_idx));
                         }
-                        Some(CSEAction::ReplaceSpanWithLoad {
-                            local_idx,
-                            end_pos,
-                        }) => {
+                        Some(CSEAction::ReplaceSpanWithLoad { local_idx, end_pos }) => {
                             // Replace `[pos ..= end_pos]` with one local.get.
                             new_instructions.push(Instruction::LocalGet(*local_idx));
                             skip_until = Some(*end_pos);
@@ -13916,10 +13875,7 @@ pub mod optimize {
                 Instruction::GlobalGet(0),
                 Instruction::Drop,
             ]);
-            let func1 = mk_func(vec![
-                Instruction::I32Const(99),
-                Instruction::GlobalSet(0),
-            ]);
+            let func1 = mk_func(vec![Instruction::I32Const(99), Instruction::GlobalSet(0)]);
             let mut module = mk_module(vec![func0, func1]);
             let folded = forward_global_shim(&mut module).expect("apply");
             assert_eq!(
@@ -18482,10 +18438,7 @@ mod tests {
             .instructions
             .iter()
             .any(|i| matches!(i, Instruction::I32Add));
-        assert!(
-            !has_add,
-            "post-call identity tree should still fold"
-        );
+        assert!(!has_add, "post-call identity tree should still fold");
     }
 
     #[test]
@@ -18501,16 +18454,13 @@ mod tests {
         )"#;
         let mut module = parse::parse_wat(wat).expect("parse");
         optimize::egraph_optimize(&mut module).expect("egraph_optimize");
-        let has_add_anywhere = module.functions[0]
-            .instructions
-            .iter()
-            .any(|i| {
-                if let Instruction::Block { body, .. } = i {
-                    body.iter().any(|j| matches!(j, Instruction::I32Add))
-                } else {
-                    matches!(i, Instruction::I32Add)
-                }
-            });
+        let has_add_anywhere = module.functions[0].instructions.iter().any(|i| {
+            if let Instruction::Block { body, .. } = i {
+                body.iter().any(|j| matches!(j, Instruction::I32Add))
+            } else {
+                matches!(i, Instruction::I32Add)
+            }
+        });
         assert!(!has_add_anywhere, "block-nested identity must fold");
     }
 
@@ -18539,7 +18489,10 @@ mod tests {
             .instructions
             .iter()
             .any(|i| matches!(i, Instruction::If { .. }));
-        assert!(!has_if, "single-value if/else of pure pushers must become select");
+        assert!(
+            !has_if,
+            "single-value if/else of pure pushers must become select"
+        );
 
         // Select must appear.
         let has_select = module.functions[0]
@@ -18602,7 +18555,10 @@ mod tests {
             .instructions
             .iter()
             .any(|i| matches!(i, Instruction::LocalTee(_)));
-        assert!(has_tee, "local.set;local.get pair must collapse to local.tee");
+        assert!(
+            has_tee,
+            "local.set;local.get pair must collapse to local.tee"
+        );
 
         // No LocalSet should remain (the pair was the only set).
         let has_set = module.functions[0]
diff --git a/loom-core/src/peephole_synth.rs b/loom-core/src/peephole_synth.rs
index 986604c..063a178 100644
--- a/loom-core/src/peephole_synth.rs
+++ b/loom-core/src/peephole_synth.rs
@@ -192,7 +192,6 @@ const CANDIDATES: &[Candidate] = &[
         pattern: &[Instruction::I64Const(1), Instruction::I64Mul],
         replacement: &[],
     },
-
     // ─── Power-of-2 mul → shl (v1.0.2 PR-L3) ─────────────────────────────
     //
     // Proof template: for k > 0, ∀x: BV32. x * 2^k = x << k (mod 2^32).
@@ -208,7 +207,6 @@ const CANDIDATES: &[Candidate] = &[
     // power-of-two needs ≥ 2 bytes while k still fits in 1 → real save.
     //
     // We ship a small set of common multipliers; future PR can expand.
-
     Candidate {
         name: "i32_mul_128_to_shl_7",
         // x * 128 → x << 7; saves 1 byte (LEB128(128)=2, LEB128(7)=1).
@@ -301,9 +299,7 @@ fn apply_to_body(body: &mut Vec<Instruction>) -> usize {
         while i < body.len() {
             let mut hit: Option<&Candidate> = None;
             for c in CANDIDATES {
-                if i + c.pattern.len() <= body.len()
-                    && body[i..i + c.pattern.len()] == *c.pattern
-                {
+                if i + c.pattern.len() <= body.len() && body[i..i + c.pattern.len()] == *c.pattern {
                     hit = Some(c);
                     break;
                 }
@@ -849,7 +845,10 @@ mod tests {
         )"#;
         let mut module = parse::parse_wat(wat).expect("parse");
         let folds = apply_peephole_synth(&mut module).expect("apply");
-        assert_eq!(folds, 0, "i64.and 0 must NOT fold (it's x & 0 = 0, not identity)");
+        assert_eq!(
+            folds, 0,
+            "i64.and 0 must NOT fold (it's x & 0 = 0, not identity)"
+        );
     }
 
     #[test]
diff --git a/loom-core/src/verify.rs b/loom-core/src/verify.rs
index b3d31e9..8c227c6 100644
--- a/loom-core/src/verify.rs
+++ b/loom-core/src/verify.rs
@@ -174,12 +174,10 @@ fn count_function_instructions(func: &Function) -> usize {
 
 #[cfg(feature = "verification")]
 impl VerificationSignatureContext {
-
-    /// PR-K3.2 (Track B): recursively count instructions in a function
-    /// body. Used by `verify` to gate Z3 invocation by body size — see
-    /// the comment in `verify` for rationale and the LOOM_Z3_MAX_INSTRUCTIONS
-    /// env var.
-    // (defined out of the impl block — see below)
+    // PR-K3.2 (Track B): recursively count instructions in a function
+    // body. Used by `verify` to gate Z3 invocation by body size — see
+    // the comment in `verify` for rationale and the LOOM_Z3_MAX_INSTRUCTIONS
+    // env var. (defined out of the impl block — see below)
 
     /// PR-K3: check whether a callee is pure + no-trap and therefore
     /// safe to encode as a deterministic uninterpreted function
@@ -2423,8 +2421,8 @@ impl TranslationValidator {
             .ok()
             .and_then(|s| s.parse().ok())
             .unwrap_or(2000);
-        let n_instr = count_function_instructions(&self.original)
-            .max(count_function_instructions(optimized));
+        let n_instr =
+            count_function_instructions(&self.original).max(count_function_instructions(optimized));
         if n_instr > max_instructions {
             crate::stats::record_revert(&format!("{}/z3-size-skipped", self.pass_name));
             return Ok(());
@@ -4246,7 +4244,10 @@ fn encode_function_to_smt_impl_inner(
             // doesn't cover the slot OR signatures don't match, we fall
             // back to the existing conservative encoding: fresh-symbolic
             // result + havoc of all globals and memory.
-            Instruction::CallIndirect { type_idx, table_idx } => {
+            Instruction::CallIndirect {
+                type_idx,
+                table_idx,
+            } => {
                 // Pop table index first.
                 if stack.is_empty() {
                     return Err(anyhow!(
@@ -4255,17 +4256,15 @@ fn encode_function_to_smt_impl_inner(
                 }
                 // SAFETY: guarded by is_empty check above
                 let slot_bv = stack.pop().unwrap();
-                let concrete_slot: Option<u32> = slot_bv
-                    .as_u64()
-                    .and_then(|n| u32::try_from(n).ok());
+                let concrete_slot: Option<u32> =
+                    slot_bv.as_u64().and_then(|n| u32::try_from(n).ok());
 
                 // Use type signature to properly model stack effects
                 if let Some(ctx_ref) = sig_ctx {
                     if let Some(sig) = ctx_ref.get_type_signature(*type_idx) {
                         // v1.0.4 Track B: try to resolve to a concrete callee.
-                        let resolved_func: Option<u32> = concrete_slot.and_then(|slot| {
-                            ctx_ref.resolve_indirect_call(*table_idx, slot, sig)
-                        });
+                        let resolved_func: Option<u32> = concrete_slot
+                            .and_then(|slot| ctx_ref.resolve_indirect_call(*table_idx, slot, sig));
 
                         if let Some(func_idx) = resolved_func {
                             // Pop arguments into a Vec we own, so we can
@@ -4304,26 +4303,20 @@ fn encode_function_to_smt_impl_inner(
                                     .iter()
                                     .map(|p| {
                                         Sort::bitvector(match p {
-                                            crate::ValueType::I32
-                                            | crate::ValueType::F32 => 32,
-                                            crate::ValueType::I64
-                                            | crate::ValueType::F64 => 64,
+                                            crate::ValueType::I32 | crate::ValueType::F32 => 32,
+                                            crate::ValueType::I64 | crate::ValueType::F64 => 64,
                                         })
                                     })
                                     .collect();
-                                let domain_refs: Vec<&Sort> =
-                                    domain_sorts_owned.iter().collect();
+                                let domain_refs: Vec<&Sort> = domain_sorts_owned.iter().collect();
                                 let range_sort = Sort::bitvector(result_width);
                                 // Use the same decl name PR-K3 uses for
                                 // direct Call — so a direct-call and the
                                 // resolved-indirect-call to the same
                                 // function reduce to the SAME Z3 expression.
                                 let decl_name = format!("pure_call_{}", func_idx);
-                                let decl = FuncDecl::new(
-                                    decl_name.as_str(),
-                                    &domain_refs,
-                                    &range_sort,
-                                );
+                                let decl =
+                                    FuncDecl::new(decl_name.as_str(), &domain_refs, &range_sort);
                                 let arg_refs: Vec<&dyn z3::ast::Ast> =
                                     args.iter().map(|a| a as &dyn z3::ast::Ast).collect();
                                 let result_dyn = decl.apply(&arg_refs);
diff --git a/loom-testing/benches/corpus_baseline.rs b/loom-testing/benches/corpus_baseline.rs
index 038f17a..a14e06b 100644
--- a/loom-testing/benches/corpus_baseline.rs
+++ b/loom-testing/benches/corpus_baseline.rs
@@ -13,7 +13,7 @@
 //!
 //!   - a markdown table to stdout (so `cargo bench` output is grep-able), AND
 //!   - a versioned report file at
-//!         docs/measurements/v<workspace-version>-corpus-baseline.md
+//!     docs/measurements/v<workspace-version>-corpus-baseline.md
 //!     that mirrors the bash harness's report format.
 //!
 //! The criterion measurement layer wraps each fixture's LOOM run in a
@@ -51,16 +51,52 @@ use criterion::{Criterion, criterion_group, criterion_main};
 // Format mirrors the shell script: (display_name, repo-relative path, note).
 // ---------------------------------------------------------------------------
 const WORKLOADS: &[(&str, &str, &str)] = &[
-    ("gale",             "scripts/mythos/gale_measure/gale_in_baseline.wasm",      "kernel-FFI fixture"),
-    ("httparse",         "tests/corpus/httparse.wasm",                              "HTTP parser"),
-    ("nom_numbers",      "tests/corpus/nom_numbers.wasm",                           "parser-combinator primitives"),
-    ("state_machine",    "tests/corpus/state_machine.wasm",                         "FSM kernel"),
-    ("json_lite",        "tests/corpus/json_lite.wasm",                             "minimal JSON tokenizer"),
-    ("loom",             "tests/corpus/loom.wasm",                                  "LOOM self-build (dogfood target)"),
-    ("calculator",       "tests/calculator.wasm",                                   "component-shaped fixture"),
-    ("calculator_root",  "calculator.wasm",                                         "2.3 MB component (root, large)"),
-    ("simple_component", "loom-core/tests/component_fixtures/simple.component.wasm","tiny component (adapter-heavy)"),
-    ("calc_component",   "loom-core/tests/component_fixtures/calc.component.wasm",  "small component (adapter-heavy)"),
+    (
+        "gale",
+        "scripts/mythos/gale_measure/gale_in_baseline.wasm",
+        "kernel-FFI fixture",
+    ),
+    ("httparse", "tests/corpus/httparse.wasm", "HTTP parser"),
+    (
+        "nom_numbers",
+        "tests/corpus/nom_numbers.wasm",
+        "parser-combinator primitives",
+    ),
+    (
+        "state_machine",
+        "tests/corpus/state_machine.wasm",
+        "FSM kernel",
+    ),
+    (
+        "json_lite",
+        "tests/corpus/json_lite.wasm",
+        "minimal JSON tokenizer",
+    ),
+    (
+        "loom",
+        "tests/corpus/loom.wasm",
+        "LOOM self-build (dogfood target)",
+    ),
+    (
+        "calculator",
+        "tests/calculator.wasm",
+        "component-shaped fixture",
+    ),
+    (
+        "calculator_root",
+        "calculator.wasm",
+        "2.3 MB component (root, large)",
+    ),
+    (
+        "simple_component",
+        "loom-core/tests/component_fixtures/simple.component.wasm",
+        "tiny component (adapter-heavy)",
+    ),
+    (
+        "calc_component",
+        "loom-core/tests/component_fixtures/calc.component.wasm",
+        "small component (adapter-heavy)",
+    ),
 ];
 
 // ---------------------------------------------------------------------------
@@ -142,9 +178,8 @@ fn repo_root() -> PathBuf {
 
 fn resolve_env() -> BenchEnv {
     let repo_root = repo_root();
-    let tmp_dir = PathBuf::from(
-        env::var("TMP_DIR").unwrap_or_else(|_| "/tmp/loom-measure-corpus".into()),
-    );
+    let tmp_dir =
+        PathBuf::from(env::var("TMP_DIR").unwrap_or_else(|_| "/tmp/loom-measure-corpus".into()));
     let _ = fs::create_dir_all(&tmp_dir);
 
     let loom = env::var("LOOM")
@@ -155,8 +190,16 @@ fn resolve_env() -> BenchEnv {
     let wasm_opt_name = env::var("WASM_OPT").unwrap_or_else(|_| "wasm-opt".into());
     let meld_name = env::var("MELD").unwrap_or_else(|_| "meld".into());
 
-    let wasm_opt = if tool_exists(&wasm_opt_name) { Some(wasm_opt_name) } else { None };
-    let meld = if tool_exists(&meld_name) { Some(meld_name) } else { None };
+    let wasm_opt = if tool_exists(&wasm_opt_name) {
+        Some(wasm_opt_name)
+    } else {
+        None
+    };
+    let meld = if tool_exists(&meld_name) {
+        Some(meld_name)
+    } else {
+        None
+    };
 
     let per_run_timeout_secs = env::var("PER_RUN_TIMEOUT")
         .ok()
@@ -165,13 +208,11 @@ fn resolve_env() -> BenchEnv {
 
     let loom_version = first_line(&Command::new(&loom).arg("--version").output().ok())
         .unwrap_or_else(|| "unknown".into());
-    let wasm_tools_version = first_line(
-        &Command::new(&wasm_tools).arg("--version").output().ok(),
-    )
-    .unwrap_or_else(|| "unknown".into());
-    let wasm_opt_version = wasm_opt.as_ref().and_then(|name| {
-        first_line(&Command::new(name).arg("--version").output().ok())
-    });
+    let wasm_tools_version = first_line(&Command::new(&wasm_tools).arg("--version").output().ok())
+        .unwrap_or_else(|| "unknown".into());
+    let wasm_opt_version = wasm_opt
+        .as_ref()
+        .and_then(|name| first_line(&Command::new(name).arg("--version").output().ok()));
 
     let pin_status = check_wasm_opt_pin(&repo_root, wasm_opt_version.as_deref());
 
@@ -268,7 +309,10 @@ fn check_wasm_opt_pin(repo_root: &Path, wasm_opt_version_raw: Option<&str>) -> P
     match parse_version_token(raw) {
         Some(installed) if installed == pinned => PinStatus::Match { version: installed },
         Some(installed) => PinStatus::Mismatch { pinned, installed },
-        None => PinStatus::Mismatch { pinned, installed: raw.to_string() },
+        None => PinStatus::Mismatch {
+            pinned,
+            installed: raw.to_string(),
+        },
     }
 }
 
@@ -328,7 +372,9 @@ fn file_size(p: &Path) -> Option<u64> {
 }
 
 fn is_component(path: &Path) -> bool {
-    let Ok(mut f) = fs::File::open(path) else { return false };
+    let Ok(mut f) = fs::File::open(path) else {
+        return false;
+    };
     use std::io::Read;
     let mut buf = [0u8; 8];
     if f.read(&mut buf).ok() != Some(8) {
@@ -369,10 +415,7 @@ fn code_section_bytes(env: &BenchEnv, path: &Path) -> Option<u64> {
             continue;
         }
         let third = cols[2].trim();
-        let n_str: String = third
-            .chars()
-            .take_while(|c| c.is_ascii_digit())
-            .collect();
+        let n_str: String = third.chars().take_while(|c| c.is_ascii_digit()).collect();
         if let Ok(n) = n_str.parse::<u64>() {
             sum = sum.saturating_add(n);
             any = true;
@@ -412,7 +455,9 @@ fn run_loom(env: &BenchEnv, input: &Path, output: &Path) -> bool {
 
 /// Run `wasm-opt -O3 <input> -o <output>`. Returns false if wasm-opt is absent.
 fn run_wasm_opt(env: &BenchEnv, input: &Path, output: &Path) -> bool {
-    let Some(name) = env.wasm_opt.as_ref() else { return false };
+    let Some(name) = env.wasm_opt.as_ref() else {
+        return false;
+    };
     let mut cmd = Command::new(name);
     cmd.arg("-O3").arg(input).arg("-o").arg(output);
     run_with_timeout(&mut cmd, Duration::from_secs(env.per_run_timeout_secs))
@@ -423,7 +468,9 @@ fn run_wasm_opt(env: &BenchEnv, input: &Path, output: &Path) -> bool {
 
 /// Run `meld fuse <component> -o <core> --no-attestation`.
 fn run_meld(env: &BenchEnv, input: &Path, output: &Path) -> bool {
-    let Some(name) = env.meld.as_ref() else { return false };
+    let Some(name) = env.meld.as_ref() else {
+        return false;
+    };
     let mut cmd = Command::new(name);
     cmd.arg("fuse")
         .arg(input)
@@ -446,7 +493,9 @@ fn measure_fixture(env: &BenchEnv, name: &str, rel_path: &str, note: &str) -> Ro
     if !fixture.exists() {
         return Row::missing(name, note);
     }
-    let Some(base_bytes) = file_size(&fixture) else { return Row::missing(name, note) };
+    let Some(base_bytes) = file_size(&fixture) else {
+        return Row::missing(name, note);
+    };
     if base_bytes == 0 {
         return Row::missing(name, note);
     }
@@ -557,9 +606,7 @@ fn render_markdown(env: &BenchEnv, rows: &[Row]) -> String {
     }
     writeln!(s, "- wasm-tools: `{}`", env.wasm_tools_version).unwrap();
     match &env.pin_status {
-        PinStatus::Match { version } => {
-            writeln!(s, "- wasm-opt pin: `{version}` (match)").unwrap()
-        }
+        PinStatus::Match { version } => writeln!(s, "- wasm-opt pin: `{version}` (match)").unwrap(),
         PinStatus::Mismatch { pinned, installed } => writeln!(
             s,
             "- wasm-opt pin: **MISMATCH** (installed `{installed}` vs pinned `{pinned}`)"
@@ -659,11 +706,7 @@ fn render_markdown(env: &BenchEnv, rows: &[Row]) -> String {
 
     writeln!(s, "## Methodology").unwrap();
     writeln!(s).unwrap();
-    writeln!(
-        s,
-        "For each workload (fixture path relative to repo root):"
-    )
-    .unwrap();
+    writeln!(s, "For each workload (fixture path relative to repo root):").unwrap();
     writeln!(
         s,
         "1. Record baseline byte count via `fs::metadata` and code-section size via `wasm-tools objdump`."
@@ -702,11 +745,7 @@ fn render_markdown(env: &BenchEnv, rows: &[Row]) -> String {
     writeln!(s, "```bash").unwrap();
     writeln!(s, "# Build LOOM first (Z3 verification enabled)").unwrap();
     writeln!(s, "Z3_SYS_Z3_HEADER=/opt/homebrew/include/z3.h \\").unwrap();
-    writeln!(
-        s,
-        "  LIBRARY_PATH=/opt/homebrew/lib cargo build --release"
-    )
-    .unwrap();
+    writeln!(s, "  LIBRARY_PATH=/opt/homebrew/lib cargo build --release").unwrap();
     writeln!(s).unwrap();
     writeln!(s, "# Run the criterion harness").unwrap();
     writeln!(s, "cargo bench -p loom-testing --bench corpus_baseline").unwrap();
diff --git a/scripts/measure_corpus.sh b/scripts/measure_corpus.sh
index 5755fd7..e3d1a99 100644
--- a/scripts/measure_corpus.sh
+++ b/scripts/measure_corpus.sh
@@ -13,7 +13,7 @@
 #   5. Validate every output via wasm-tools validate. Any failure is HARD ERROR.
 #
 # Output:
-#   docs/measurements/v0.9.0-corpus-baseline.md
+#   docs/measurements/v1.1.0-corpus-baseline.md
 #
 # Required tools: loom (built), wasm-tools.
 # Optional tools: wasm-opt (skip cleanly if absent).
@@ -35,7 +35,7 @@ LOOM="${LOOM:-${REPO_ROOT}/target/release/loom}"
 WASM_TOOLS="${WASM_TOOLS:-wasm-tools}"
 WASM_OPT="${WASM_OPT:-wasm-opt}"
 TMP_DIR="${TMP_DIR:-/tmp/loom-measure-corpus}"
-REPORT_PATH="${REPORT_PATH:-${REPO_ROOT}/docs/measurements/v0.9.0-corpus-baseline.md}"
+REPORT_PATH="${REPORT_PATH:-${REPO_ROOT}/docs/measurements/v1.1.0-corpus-baseline.md}"
 
 mkdir -p "${TMP_DIR}"
 mkdir -p "$(dirname "${REPORT_PATH}")"
@@ -129,7 +129,15 @@ file_size() {
 pct_delta() {
   local new="$1"
   local base="$2"
-  if [[ -z "${base}" || "${base}" == "0" || "${base}" == "n/a" || "${new}" == "n/a" ]]; then
+  # A delta is only meaningful when BOTH operands are integer byte
+  # counts. Sentinel strings ("error", "invalid", "timeout", "n/a")
+  # must NOT be coerced to 0 by awk — that fabricates a -100% "win"
+  # on a run that actually failed or timed out.
+  if ! [[ "${base}" =~ ^[0-9]+$ ]] || [[ "${base}" == "0" ]]; then
+    echo "n/a"
+    return
+  fi
+  if ! [[ "${new}" =~ ^-?[0-9]+$ ]]; then
     echo "n/a"
     return
   fi
@@ -369,7 +377,7 @@ done
 
 # --- Emit report -----------------------------------------------------------
 {
-  echo "# v0.9.0 Corpus Baseline -- LOOM vs wasm-opt -O3"
+  echo "# v1.1.0 Corpus Baseline -- LOOM vs wasm-opt -O3"
   echo
   echo "_Generated by \`scripts/measure_corpus.sh\` at \`${RUN_TIMESTAMP}\`._"
   echo