AztecProtocol · iakovenkos · Mar 20, 2026 · Mar 20, 2026 · Mar 20, 2026 · Mar 23, 2026
diff --git a/...etenberg/cpp/src/barretenberg/boomerang_value_detection/graph_description_goblin.test.cpp b/...etenberg/cpp/src/barretenberg/boomerang_value_detection/graph_description_goblin.test.cpp
@@ -109,6 +109,15 @@ TEST_F(BoomerangGoblinRecursiveVerifierTests, graph_description_basic)
     // rather than relying solely on them being public outputs.
     translator_pairing_points.fix_witness();
 
+    // Run static analysis before ProverInstance construction, which frees circuit block data.
+    // finalize_circuit() is normally called inside ProverInstance; since we need to run the StaticAnalyzer
+    // first, we call it explicitly here (ProverInstance will skip it when called again due to the guard).
+    builder.finalize_circuit(/*ensure_nonzero_polynomials=*/false);
+    info("Recursive Verifier: num gates = ", builder.num_gates());
+    auto graph = cdg::StaticAnalyzer(builder, false);
+    auto variables_in_one_gate = graph.get_variables_in_one_gate();
+    EXPECT_EQ(variables_in_one_gate.size(), 0);
+
     // Construct and verify a proof for the Goblin Recursive Verifier circuit
     {
         auto prover_instance = std::make_shared<OuterProverInstance>(builder);
@@ -118,15 +127,11 @@ TEST_F(BoomerangGoblinRecursiveVerifierTests, graph_description_basic)
         OuterProver prover(prover_instance, verification_key);
         OuterVerifier verifier(vk_and_hash);
         auto proof = prover.construct_proof();
+        info("Proof constructed");
         bool verified = verifier.verify_proof(proof).result;
 
         ASSERT_TRUE(verified);
     }
-
-    info("Recursive Verifier: num gates = ", builder.num_gates());
-    auto graph = cdg::StaticAnalyzer(builder, false);
-    auto variables_in_one_gate = graph.get_variables_in_one_gate();
-    EXPECT_EQ(variables_in_one_gate.size(), 0);
 }
 
 } // namespace bb::stdlib::recursion::honk
diff --git a/...berg/cpp/src/barretenberg/boomerang_value_detection/graph_description_goblin_avm.test.cpp b/...berg/cpp/src/barretenberg/boomerang_value_detection/graph_description_goblin_avm.test.cpp
@@ -110,6 +110,17 @@ TEST_F(BoomerangGoblinAvmRecursiveVerifierTests, graph_description_basic)
     // rather than relying solely on them being public outputs.
     translator_pairing_points.fix_witness();
 
+    // Run static analysis before ProverInstance construction, which frees circuit block data.
+    // finalize_circuit() is normally called inside ProverInstance; since we need to run the StaticAnalyzer
+    // first, we call it explicitly here (ProverInstance will skip it when called again due to the guard).
+    builder.finalize_circuit(/*ensure_nonzero_polynomials=*/false);
+    info("Recursive Verifier: num gates = ", builder.num_gates());
+    auto graph = cdg::StaticAnalyzer(builder, false);
+    auto variables_in_one_gate = graph.get_variables_in_one_gate();
+    // All pairing point coordinate limbs are now properly constrained. The self_reduce() call in bigfield::set_public()
+    // ensures limbs are in canonical form, adding constraints that use each limb in multiple gates.
+    EXPECT_EQ(variables_in_one_gate.size(), 0);
+
     // Construct and verify a proof for the Goblin Recursive Verifier circuit
     {
         auto prover_instance = std::make_shared<OuterProverInstance>(builder);
@@ -123,13 +134,6 @@ TEST_F(BoomerangGoblinAvmRecursiveVerifierTests, graph_description_basic)
 
         ASSERT_TRUE(verified);
     }
-
-    info("Recursive Verifier: num gates = ", builder.num_gates());
-    auto graph = cdg::StaticAnalyzer(builder, false);
-    auto variables_in_one_gate = graph.get_variables_in_one_gate();
-    // All pairing point coordinate limbs are now properly constrained. The self_reduce() call in bigfield::set_public()
-    // ensures limbs are in canonical form, adding constraints that use each limb in multiple gates.
-    EXPECT_EQ(variables_in_one_gate.size(), 0);
 }
 
 } // namespace bb::stdlib::recursion::honk
diff --git a/barretenberg/cpp/src/barretenberg/chonk/GOBLIN_FLUSH_DESIGN.md b/barretenberg/cpp/src/barretenberg/chonk/GOBLIN_FLUSH_DESIGN.md
@@ -0,0 +1,159 @@
+# Goblin Reset Design
+
+## Problem
+
+Chonk's accumulation capacity is bounded by the ECCVM circuit size (`2^CONST_ECCVM_LOG_N = 2^15 = 32,768` rows). Each folding step generates ~62 short scalar multiplications that are deferred to the ECCVM via Goblin's op queue. Currently, the maximum is ~17 app circuits before the ECCVM overflows.
+
+## Design
+
+### Goblin App
+
+This is an app $A_G$ that does only one thing: it recursively verifies an Ultra Honk proof of the circuit $C$ which contains a Goblin recursive verifier.
+
+A valid witness for $A_G$ attests to the knowledge of a valid proof for the circuit $C$, which in turn attests to the knowledge of a valid proof of Goblin (merge + ECCVM + Translator).
+
+In addition to the recursive verification, $A_G$ exposes in its PublicIO:
+- The **IPA opening claim** extracted from the ECCVM recursive verification inside $C$.
+- The **`T_pre_flush` commitment** — the merged op queue table that was proven, read from the merge proof's public inputs inside $C$. This is needed by the Goblin kernel for the merge chain consistency check (see below).
+
+### Goblin Kernel
+
+This is a kernel $K_G$ that behaves almost like an inner kernel with the difference that it recursively verifies the folding of a kernel into a running accumulator and of the Goblin app into the accumulator.
+
+So:
+- It verifies two foldings.
+- For the second folding, the VK is equal to the VK of $A_G$ (in contrast with inner kernels, where the VK is one of the allowed VKs in `ALLOWED_VK_TREE`).
+- It extracts the IPA claim from the Goblin app's PublicIO and accumulates it into the running IPA claim, which is part of the public inputs of every kernel (see IPA Claim Accumulation below).
+
+#### Merge Chain Reset (T_prev subtlety)
+
+$K_G$ must also reset the Goblin merge chain. This is the subtlest part of the design.
+
+The Chonk verification loop threads a `T_prev` commitment through every kernel: each kernel reads `T_prev` from the previous kernel's `ecc_op_tables`, merges the new subtable onto it, and outputs the updated commitment. At a flush, this chain must be broken and restarted cleanly, because the final ECCVM at `prove()` time only covers post-flush ops — it never proves `T_pre_flush`.
+
+$K_G$'s `complete_kernel_circuit_logic` therefore does the following, in place of the standard T_prev inheritance:
+
+1. Reads `T_pre_flush` from the **previous kernel's** `ecc_op_tables`.
+2. Reads `T_pre_flush` from **$A_G$'s PublicIO** — the commitment to the table that $A_G$ verified was correctly processed by the intermediate ECCVM inside $C$.
+3. **Asserts equality**: `A_G.verified_T_pre_flush == prev_kernel.ecc_op_tables`. This ties the two chains together: the flush proof covered exactly the ops committed to by the previous kernel, no more, no less. Without this check a malicious prover could supply an $A_G$ that verifies a flush proof for a different (smaller) batch of ops, leaving some pre-flush operations unaccounted for.
+4. Uses **T_0 (empty tables)** as `T_prev` for the merge verification of $A_G$'s subtable — discarding `T_pre_flush` from the forward chain.
+5. Outputs `ecc_op_tables = T_0 ∥ A_G ops`, the fresh starting point for all subsequent kernels.
+
+The native `prove_merge()` call for $A_G$ uses `MergeSettings::RESET`, setting `T_prev = T_0`, so prover and verifier agree on the fresh start.
+
+#### IPA Claim Accumulation
+
+Every kernel carries a running IPA accumulator in `KernelIO` / `HidingKernelIO` (~8 field elements: a commitment point + opening pair):
+
+- **Init kernel**: outputs a trivial/default accumulator.
+- **Inner / Reset kernels**: pass-through — copy the accumulator from the previous kernel's public inputs. Not free: adds copy constraints in the permutation argument.
+- **$K_G$**: folds the flush's IPA claim from $A_G$'s PublicIO into the running accumulator via the `IpaAccumulate` opcode.
+- **Tail / Hiding kernels**: pass-through. Hiding kernel outputs the accumulated claim in `HidingKernelIO`.
+- **`prove()`**: the final ECCVM IPA claim only exists after `prove()` runs the ECCVM prover. A dedicated IPA accumulation circuit folds this final claim into the kernel-chain accumulator. Its Oink is a separate sub-proof; sumcheck/PCS are batched into the joint proof.
+
+For zero-flush flows, the trivial accumulator passes through untouched. The `prove()` accumulation circuit folds the single final IPA claim into the trivial accumulator, equivalent to today's behaviour.
+
+### How to Drop Them In
+
+Write $A_1, \dots, A_N$ for the execution stack. Each app has a number $N_i$ of ECC ops that can be estimated from ACIR by counting the number of recursive verifications happening in the app.
+
+In `proveWithKernels` we proceed as follows:
+
+1. Run a loop over `executionStack` and add Reset kernels as we do now, producing `executionStackWithKernels`.
+2. Run a loop over `executionStackWithKernels` and estimate the running ECC op count at each step. If app $A_i$ (plus the following kernel or kernels) would push the total above the ECCVM fixed size, insert the Goblin pair before it so the stack becomes $A_1, \dots, A_{i-1}, A_G, K_G, A_i, \dots$
+
+This works because $A_G$ and $K_G$ do not read or write any Aztec state, so inserting them at any position in the kernel chain after Reset kernels have been placed is valid.
+
+An app whose EC ops alone (plus one kernel pair) exceed ECCVM capacity is **rejected** at this point — it can never fit regardless of flushing.
+
+A **hard bound** (insert a flush every $N$ circuits regardless of row count) is enforced as a safety net in the same loop.
+
+## Implementation
+
+### New ACIR Opcodes
+
+Both cryptographic primitives introduced by this design are exposed as ACIR blackbox functions, following the existing pattern of `EmbeddedCurveAdd`, `EmbeddedCurveScalarMul`, and `RecursiveAggregation`. This keeps all cryptographic implementation in BB and makes the Noir circuits trivially thin.
+
+#### `ULTRA_GOBLIN` (new proof type for `std::verify_with_type`)
+
+A new variant in the ACIR proof type enum. It performs an Ultra Honk recursive verification with the VK hash of circuit $C$ (the GoblinRecursiveVerifier) hard-coded in BB. No VK is passed from Noir — BB rejects any attempt to override it.
+
+**BB side** (`dsl/acir_format/`, `stdlib/`): implement the recursive verifier gadget for $C$, hard-coding $C$'s VK hash. Extracts IPA claim and `T_pre_flush` from the proof's public inputs and places them in the circuit's return data.
+
+**Noir side**: `$A_G$` calls `std::verify_with_type(goblin_flush_proof, ULTRA_GOBLIN)` — one line.
+
+#### `IpaAccumulate` (new blackbox function)
+
+Folds a new IPA opening claim into a running IPA accumulator using the IPA accumulation protocol already used at the rollup level (`IPA::accumulate()`, `OpeningClaim<Grumpkin>`).
+
+- **Inputs**: running accumulator (~8 field elements: Grumpkin commitment + opening pair) + new IPA claim (~8 field elements)
+- **Output**: updated accumulator (~8 field elements)
+- **BB side** (`commitment_schemes/ipa/`): ~54K gate circuit, same gadget used by both $K_G$ and `prove()`. One implementation, two call sites.
+- **Noir side**: $K_G$ calls `IpaAccumulate(running_claim, app_ipa_claim)` — one line.
+
+Because `IpaAccumulate` is a blackbox opcode, $K_G$ contains no cryptographic implementation — it simply calls the builtin. The `prove()`-time IPA accumulation circuit is built directly in BB using the same gadget.
+
+### Goblin App
+
+Noir circuit (`private-kernel-goblin-app`). Calls `std::verify_with_type(goblin_flush_proof, ULTRA_GOBLIN)`. The PublicIO of $A_G$ includes the IPA claim and `T_pre_flush` commitment, both extracted by the `ULTRA_GOBLIN` opcode implementation in BB.
+
+**Scope**: new Noir crate, ~20–30 lines. The circuit itself is trivial; the substance is in the `ULTRA_GOBLIN` BB implementation.
+
+### Goblin Kernel
+
+Noir kernel (`private-kernel-goblin-kernel`) similar to `private-kernel-inner`. Differences:
+
+- **Noir**: the second VK being folded is hard-coded to the VK of $A_G$ instead of being checked against `ALLOWED_VK_TREE`. IPA accumulation is a single call to `IpaAccumulate(prev_ipa_accum, A_G.ipa_claim)`.
+- **BB** (`complete_kernel_circuit_logic`): new `is_goblin_kernel` path that performs the `T_pre_flush` consistency check and resets `T_prev` to T_0 before processing $A_G$'s merge subtable (steps 3–5 of the Merge Chain Reset section above).
+
+**Scope**: new Noir crate (~50–80 lines, mostly copied from inner kernel), ~30–50 lines of new BB logic in `chonk.cpp`.
+
+### Scope Summary
+
+| Component | Kind | Complexity | Notes |
+|---|---|---|---|
+| `ULTRA_GOBLIN` ACIR opcode | New (BB + Noir enum) | Medium | Composing existing ECCVM/Translator recursive verifiers |
+| `IpaAccumulate` ACIR opcode | New (BB) | Medium | Reuses existing `IPA::accumulate()` protocol |
+| `GoblinRecursiveVerifier` circuit $C$ | New (BB) | Medium-high | Wraps merge + ECCVM + Translator into one Ultra Honk proof |
+| `$A_G$` Noir circuit | New (Noir) | Low | ~20–30 lines; substance is in `ULTRA_GOBLIN` |
+| `$K_G$` Noir circuit | New (Noir + BB) | Medium | ~50–80 lines Noir, ~30–50 lines BB |
+| `KernelIO` / `HidingKernelIO` IPA field | Modified | Medium | Mechanical but wide blast radius across 3 packages |
+| Existing kernel IPA pass-through | Modified (Noir) | Low-medium | All kernels gain one pass-through field |
+| `complete_kernel_circuit_logic` | Modified (BB) | Medium | New `is_goblin_kernel` branch |
+| `prove()` IPA accumulation phase | Modified (BB) | Medium | Extends existing multi-phase proving; reuses `IpaAccumulate` |
+| `MergeSettings::RESET` | Modified (BB) | Trivial | New enum variant + a few lines |
+| `proveWithKernels` TS loop | Modified (TS) | Medium | Two-pass loop; ECC op count estimation from ACIR |
+| Constants propagation | Modified (multi) | Low-medium | Mechanical; `yarn remake-constants` handles TS side |
+
+The **critical path** items are the two new ACIR opcodes and the GoblinRecursiveVerifier circuit $C$, as these contain the only genuinely novel cryptographic work. Everything else is either mechanical propagation of a new field or a thin Noir wrapper over the opcodes.
+
+### TS Land
+
+Modifications to `proveWithKernels` as per the *How to Drop Them In* section. The one additional detail: witness generation for $A_G$ requires producing the Goblin flush proof (merge + ECCVM + Translator), proving it through $C$ (the GoblinRecursiveVerifier), and packaging the resulting Ultra Honk proof as $A_G$'s witness input.
+
+## Proof Structure
+
+The final proof is **constant size** (6 sub-proofs), identical whether zero or $N$ flushes occurred. The verifier cannot distinguish a zero-flush proof from an $N$-flush proof.
+
+1. **MegaZK Oink proof** — hiding kernel pre-sumcheck
+2. **Merge proof** — final op queue subtable (post-last-flush ops only)
+3. **ECCVM proof** — final EC operations on Grumpkin (post-last-flush)
+4. **IPA proof** — opening proof for the final ECCVM's polynomial commitment
+5. **IPA accumulation Oink proof** — pre-sumcheck for the `prove()`-time accumulation circuit
+6. **Joint proof** — Translator Oink + batched sumcheck + batched PCS (MegaZK, Translator, IPA accumulation)
+
+## Impact on Non-Flush Flows
+
+All non-flush flows are affected by the following structural changes:
+
+- **`KernelIO` / `HidingKernelIO`**: gain IPA accumulator fields. All kernel VKs change.
+- **`complete_kernel_circuit_logic()`**: every kernel passes through the IPA accumulator (copy constraints only for non-Goblin kernels).
+- **`prove()`**: new IPA accumulation circuit + Oink sub-proof. Joint proof batches 3 circuits instead of 2.
+- **Verifier**: batches three circuit reductions (MegaZK, Translator, IPA accumulation) instead of two.
+- **Constants**: `HIDING_KERNEL_PUBLIC_INPUTS_SIZE`, `CHONK_PROOF_LENGTH`, Noir constants, TypeScript constants all update.
+
+## Open Questions
+
+1. **GoblinRecursiveVerifier gate count**: what is the total gate count and ECCVM row cost of circuit $C$? This determines the overhead of each flush and informs the hard bound value.
+2. **Hard bound value**: should be derived from ECCVM capacity and known per-circuit costs rather than hardcoded.
+3. **Testing strategy**: flush triggering in TS, T_pre_flush consistency check correctness, proof validity across multiple flushes.
diff --git a/barretenberg/cpp/src/barretenberg/chonk/chonk.cpp b/barretenberg/cpp/src/barretenberg/chonk/chonk.cpp
@@ -489,6 +489,11 @@ void Chonk::accumulate_and_fold(ClientCircuit& circuit,
         block.free_data();
     }
 
+#ifndef NDEBUG
+    // VK comparison runs after ProverInstance construction (circuit blocks already freed, but not needed here).
+    debug_vk_check(prover_instance, precomputed_vk);
+#endif
+
     // We're accumulating a kernel if the verification queue is empty (because the kernel circuit contains recursive
     // verifiers for all the entries previously present in the verification queue) and if it's not the first accumulate
     // call (which will always be for an app circuit).
@@ -738,24 +743,24 @@ void Chonk::update_native_verifier_accumulator(const VerifierInputs& queue_entry
     info("======= END OF DEBUGGING INFO FOR NATIVE FOLDING STEP =======");
 }
 
-void Chonk::debug_incoming_circuit(ClientCircuit& circuit,
-                                   const std::shared_ptr<ProverInstance>& prover_instance,
-                                   const std::shared_ptr<MegaVerificationKey>& precomputed_vk)
+void Chonk::debug_circuit_check(ClientCircuit& circuit)
 {
     info("======= DEBUGGING INFO FOR INCOMING CIRCUIT =======");
-
     info("Accumulating circuit ", num_circuits_accumulated + 1, " of ", num_circuits);
     info("Is the circuit valid? ", CircuitChecker::check(circuit) ? "true" : "false");
     info("Did we find a failure? ", circuit.failed() ? "true" : "false");
     if (circuit.failed()) {
         info("\t\t\tError message? ", circuit.err());
     }
+}
 
+void Chonk::debug_vk_check(const std::shared_ptr<ProverInstance>& prover_instance,
+                           const std::shared_ptr<MegaVerificationKey>& precomputed_vk)
+{
     // Compare precomputed VK with the one generated during accumulation
     auto vk = std::make_shared<MegaVerificationKey>(prover_instance->get_precomputed());
     info("Does the precomputed vk match with the one generated during accumulation? ",
          vk->compare(*precomputed_vk, MegaFlavor::CommitmentLabels().get_precomputed()) ? "true" : "false");
-
     info("======= END OF DEBUGGING INFO FOR INCOMING CIRCUIT =======");
 }
 #endif

diff --git a/barretenberg/cpp/src/barretenberg/chonk/chonk.hpp b/barretenberg/cpp/src/barretenberg/chonk/chonk.hpp
@@ -240,9 +240,9 @@ class Chonk : public IVCBase {
     void update_native_verifier_accumulator(const VerifierInputs& queue_entry,
                                             const std::shared_ptr<Transcript>& verifier_transcript);
 
-    void debug_incoming_circuit(ClientCircuit& circuit,
-                                const std::shared_ptr<ProverInstance>& prover_instance,
-                                const std::shared_ptr<MegaVerificationKey>& precomputed_vk);
+    void debug_circuit_check(ClientCircuit& circuit);
+    void debug_vk_check(const std::shared_ptr<ProverInstance>& prover_instance,
+                        const std::shared_ptr<MegaVerificationKey>& precomputed_vk);
 #endif
 
     FoldingResult verify_folding(ClientCircuit& circuit,

diff --git a/barretenberg/cpp/src/barretenberg/chonk/mock_circuit_producer.hpp b/barretenberg/cpp/src/barretenberg/chonk/mock_circuit_producer.hpp
@@ -197,7 +197,11 @@ class PrivateFunctionExecutionMockCircuitProducer {
         }
 
         if (check_circuit_sizes) {
-            auto prover_instance = std::make_shared<Chonk::ProverInstance>(circuit);
+            // Use a copy so that ProverInstance construction (which frees circuit block data) doesn't
+            // affect the original circuit, which is still needed by get_verification_key and accumulate.
+            MegaCircuitBuilder_<bb::fr> circuit_copy{ circuit };
+            circuit_copy.op_queue = std::make_shared<ECCOpQueue>(*circuit_copy.op_queue);
+            auto prover_instance = std::make_shared<Chonk::ProverInstance>(circuit_copy);
             size_t log2_dyadic_size = prover_instance->log_dyadic_size();
             if (log2_num_gates != 0) {
                 if (is_kernel) {

diff --git a/barretenberg/cpp/src/barretenberg/commitment_schemes_recursion/ipa_recursive.test.cpp b/barretenberg/cpp/src/barretenberg/commitment_schemes_recursion/ipa_recursive.test.cpp
@@ -328,7 +328,7 @@ TEST_F(IPARecursiveTests, AccumulateSmallRandom)
  */
 TEST_F(IPARecursiveTests, AccumulateMediumRandom)
 {
-    static constexpr size_t log_poly_length = 10;
+    static constexpr size_t log_poly_length = 15;
     auto [poly1, x1] = generate_poly_and_challenge<log_poly_length>();
     auto [poly2, x2] = generate_poly_and_challenge<log_poly_length>();
     test_accumulation<log_poly_length>(poly1, poly2, x1, x2);