From 4f1a904da24324227ca5238bcfa3fce4a5a5392b Mon Sep 17 00:00:00 2001 From: Danny Willems Date: Wed, 30 Aug 2023 19:04:23 +0200 Subject: [PATCH 01/32] Add link to GitHub --- kimchi/src/circuits/gate.rs | 2 ++ kimchi/src/prover.rs | 2 +- 2 files changed, 3 insertions(+), 1 deletion(-) diff --git a/kimchi/src/circuits/gate.rs b/kimchi/src/circuits/gate.rs index fadac16ba2..6b53847dfb 100644 --- a/kimchi/src/circuits/gate.rs +++ b/kimchi/src/circuits/gate.rs @@ -210,6 +210,7 @@ impl CircuitGate { EndoMul => self.verify_endomul::(row, witness, &index.cs), EndoMulScalar => self.verify_endomul_scalar::(row, witness, &index.cs), // TODO: implement the verification for the lookup gate + // See https://github.com/MinaProtocol/mina/issues/14011 Lookup => Ok(()), CairoClaim | CairoInstruction | CairoFlags | CairoTransition => { self.verify_cairo_gate::(row, witness, &index.cs) @@ -297,6 +298,7 @@ impl CircuitGate { } GateType::Lookup => { // TODO: implement the verification for the lookup gate + // See https://github.com/MinaProtocol/mina/issues/14011 vec![] } GateType::CairoClaim => turshi::Claim::constraint_checks(&env, &mut cache), diff --git a/kimchi/src/prover.rs b/kimchi/src/prover.rs index adf55f2a36..f55f0019ac 100644 --- a/kimchi/src/prover.rs +++ b/kimchi/src/prover.rs @@ -921,7 +921,7 @@ where //~~ * $s_i$ //~~ * $w_i$ //~~ * $z$ - //~~ * lookup (TODO) + //~~ * lookup (TODO https://github.com/MinaProtocol/mina/issues/13886) //~~ * generic selector //~~ * poseidon selector //~ From 5e91825e0b248d7fa3fc508de46876388a74a4f8 Mon Sep 17 00:00:00 2001 From: Danny Willems Date: Wed, 30 Aug 2023 18:39:48 +0200 Subject: [PATCH 02/32] This TODO is done --- kimchi/src/circuits/lookup/lookups.rs | 1 - 1 file changed, 1 deletion(-) diff --git a/kimchi/src/circuits/lookup/lookups.rs b/kimchi/src/circuits/lookup/lookups.rs index 6b6de6a517..7a2fc5f386 100644 --- a/kimchi/src/circuits/lookup/lookups.rs +++ b/kimchi/src/circuits/lookup/lookups.rs @@ -323,7 +323,6 @@ pub type 
JointLookupSpec = JointLookup, LookupTableID>; pub type JointLookupValue = JointLookup; impl + From> JointLookupValue { - // TODO: Support multiple tables /// Evaluate the combined value of a joint-lookup. pub fn evaluate(&self, joint_combiner: &F, table_id_combiner: &F) -> F { combine_table_entry( From 99b35be1af23f841ac433203148996463c59ebd3 Mon Sep 17 00:00:00 2001 From: mrmr1993 Date: Mon, 9 Oct 2023 10:41:13 +0100 Subject: [PATCH 03/32] Add helpers for inferring feature flags --- kimchi/src/circuits/constraints.rs | 67 +++++++++++++++++++----------- 1 file changed, 43 insertions(+), 24 deletions(-) diff --git a/kimchi/src/circuits/constraints.rs b/kimchi/src/circuits/constraints.rs index 48c88cc0cc..02988d6473 100644 --- a/kimchi/src/circuits/constraints.rs +++ b/kimchi/src/circuits/constraints.rs @@ -614,6 +614,47 @@ pub fn zk_rows_strict_lower_bound(num_chunks: usize) -> usize { (2 * (PERMUTS + 1) * num_chunks - 2) / PERMUTS } +impl FeatureFlags { + pub fn from_gates_and_lookup_features( + gates: &[CircuitGate], + lookup_features: LookupFeatures, + ) -> FeatureFlags { + let mut feature_flags = FeatureFlags { + range_check0: false, + range_check1: false, + lookup_features, + foreign_field_add: false, + foreign_field_mul: false, + xor: false, + rot: false, + }; + + for gate in gates { + match gate.typ { + GateType::RangeCheck0 => feature_flags.range_check0 = true, + GateType::RangeCheck1 => feature_flags.range_check1 = true, + GateType::ForeignFieldAdd => feature_flags.foreign_field_add = true, + GateType::ForeignFieldMul => feature_flags.foreign_field_mul = true, + GateType::Xor16 => feature_flags.xor = true, + GateType::Rot64 => feature_flags.rot = true, + _ => (), + } + } + + feature_flags + } + + pub fn from_gates( + gates: &[CircuitGate], + uses_runtime_tables: bool, + ) -> FeatureFlags { + FeatureFlags::from_gates_and_lookup_features( + gates, + LookupFeatures::from_gates(gates, uses_runtime_tables), + ) + } +} + impl Builder { /// Set up the number of 
public inputs. /// If not invoked, it equals `0` by default. @@ -682,7 +723,7 @@ impl Builder { // for some reason we need more than 1 gate for the circuit to work, see TODO below assert!(gates.len() > 1); - let lookup_features = LookupFeatures::from_gates(&gates, runtime_tables.is_some()); + let feature_flags = FeatureFlags::from_gates(&gates, runtime_tables.is_some()); let lookup_domain_size = { // First we sum over the lookup table size @@ -705,7 +746,7 @@ impl Builder { } } // And we add the built-in tables, depending on the features. - let LookupFeatures { patterns, .. } = &lookup_features; + let LookupFeatures { patterns, .. } = &feature_flags.lookup_features; for pattern in patterns.into_iter() { if let Some(gate_table) = pattern.table() { lookup_domain_size += gate_table.table_size(); @@ -782,28 +823,6 @@ impl Builder { .collect(); gates.append(&mut padding); - let mut feature_flags = FeatureFlags { - range_check0: false, - range_check1: false, - lookup_features, - foreign_field_add: false, - foreign_field_mul: false, - xor: false, - rot: false, - }; - - for gate in &gates { - match gate.typ { - GateType::RangeCheck0 => feature_flags.range_check0 = true, - GateType::RangeCheck1 => feature_flags.range_check1 = true, - GateType::ForeignFieldAdd => feature_flags.foreign_field_add = true, - GateType::ForeignFieldMul => feature_flags.foreign_field_mul = true, - GateType::Xor16 => feature_flags.xor = true, - GateType::Rot64 => feature_flags.rot = true, - _ => (), - } - } - //~ 1. sample the `PERMUTS` shifts. 
let shifts = Shifts::new(&domain.d1); From 33252de376e3df5785773b7f687ffb3894b1eba2 Mon Sep 17 00:00:00 2001 From: mrmr1993 Date: Mon, 9 Oct 2023 10:51:26 +0100 Subject: [PATCH 04/32] Derive binding types for FeatureFlags --- kimchi/src/circuits/constraints.rs | 5 +++++ 1 file changed, 5 insertions(+) diff --git a/kimchi/src/circuits/constraints.rs b/kimchi/src/circuits/constraints.rs index 02988d6473..c76ef48e02 100644 --- a/kimchi/src/circuits/constraints.rs +++ b/kimchi/src/circuits/constraints.rs @@ -32,6 +32,11 @@ use std::sync::Arc; // /// Flags for optional features in the constraint system +#[cfg_attr( + feature = "ocaml_types", + derive(ocaml::IntoValue, ocaml::FromValue, ocaml_gen::Struct) +)] +#[cfg_attr(feature = "wasm_types", wasm_bindgen::prelude::wasm_bindgen)] #[derive(Copy, Clone, Serialize, Deserialize, Debug)] pub struct FeatureFlags { /// RangeCheck0 gate From 488ad1882f4ee4a36fc4f1408aebec1ca41da8c2 Mon Sep 17 00:00:00 2001 From: Mikhail Volkhov Date: Mon, 2 Oct 2023 21:17:07 +0100 Subject: [PATCH 05/32] [#14070] Add a unit check for the table id zero value condition --- kimchi/src/circuits/lookup/index.rs | 37 +++++++++++++++++++++++++++++ 1 file changed, 37 insertions(+) diff --git a/kimchi/src/circuits/lookup/index.rs b/kimchi/src/circuits/lookup/index.rs index ab3e4545ab..c414e32d14 100644 --- a/kimchi/src/circuits/lookup/index.rs +++ b/kimchi/src/circuits/lookup/index.rs @@ -443,3 +443,40 @@ impl LookupConstraintSystem { } } } + +#[cfg(test)] +mod tests { + + use super::*; + use crate::circuits::{ + gate::{CircuitGate, GateType}, + wires::Wire, + }; + use mina_curves::pasta::Fp; + + #[test] + fn test_zero_table_zero_row() { + let lookup_r: u64 = 32; + let num_lookups: usize = 16; + if let Ok(domain) = EvaluationDomains::::create(2 * lookup_r as usize) { + // Table column that does not contain zeros + let lookup_table_values: Vec<_> = (1..lookup_r + 1).map(From::from).collect(); + + let lookup_tables: Vec> = vec![LookupTable { + id: 0, + 
data: vec![lookup_table_values], + }]; + + let gates: Vec> = (0..num_lookups) + .map(|i| CircuitGate::new(GateType::Lookup, Wire::for_row(i), vec![])) + .collect(); + + let res = + LookupConstraintSystem::create(gates.as_slice(), lookup_tables, None, &domain); + assert!( + matches!(res, Err(LookupError::TableIDZeroMustHaveZeroEntry)), + "LookupConstraintSystem::create(...) returns OK when zero table has no zero rows" + ); + } + } +} From 74b5b0ce2c65a0e6e9a22227e00731a2dc499959 Mon Sep 17 00:00:00 2001 From: Mikhail Volkhov Date: Thu, 12 Oct 2023 12:22:23 +0100 Subject: [PATCH 06/32] [#14070] Fix the table dummy rows bug --- kimchi/src/circuits/lookup/index.rs | 11 +++++++---- kimchi/src/circuits/lookup/tables/mod.rs | 8 ++++++-- 2 files changed, 13 insertions(+), 6 deletions(-) diff --git a/kimchi/src/circuits/lookup/index.rs b/kimchi/src/circuits/lookup/index.rs index c414e32d14..d1f24d3dbf 100644 --- a/kimchi/src/circuits/lookup/index.rs +++ b/kimchi/src/circuits/lookup/index.rs @@ -459,12 +459,15 @@ mod tests { let lookup_r: u64 = 32; let num_lookups: usize = 16; if let Ok(domain) = EvaluationDomains::::create(2 * lookup_r as usize) { - // Table column that does not contain zeros - let lookup_table_values: Vec<_> = (1..lookup_r + 1).map(From::from).collect(); + // Table column that /does not/ contain zeros + let lookup_table_values_1: Vec<_> = (1..lookup_r+1).map(From::from).collect(); + // Another table column that /does/ contain zeros. + // Jointly two tables /do not/ have a full zero now. 
+ let lookup_table_values_2: Vec<_> = (0..lookup_r).map(From::from).collect(); let lookup_tables: Vec> = vec![LookupTable { id: 0, - data: vec![lookup_table_values], + data: vec![lookup_table_values_1, lookup_table_values_2], }]; let gates: Vec> = (0..num_lookups) @@ -475,7 +478,7 @@ mod tests { LookupConstraintSystem::create(gates.as_slice(), lookup_tables, None, &domain); assert!( matches!(res, Err(LookupError::TableIDZeroMustHaveZeroEntry)), - "LookupConstraintSystem::create(...) returns OK when zero table has no zero rows" + "LookupConstraintSystem::create(...) must fail when zero table has no zero rows" ); } } diff --git a/kimchi/src/circuits/lookup/tables/mod.rs b/kimchi/src/circuits/lookup/tables/mod.rs index d6be11f9bd..d57d36a828 100644 --- a/kimchi/src/circuits/lookup/tables/mod.rs +++ b/kimchi/src/circuits/lookup/tables/mod.rs @@ -31,15 +31,19 @@ impl LookupTable where F: FftField, { - /// Return true if the table has an entry containing all zeros. + /// Return true if the table has an entry (row) containing all zeros. pub fn has_zero_entry(&self) -> bool { // reminder: a table is written as a list of columns, // not as a list of row entries. 
for row in 0..self.len() { + let mut row_zero = true; for col in &self.data { if !col[row].is_zero() { - continue; + row_zero = false; + break; } + } + if row_zero { return true; } } From eaf31842ccaba6e16c02fcf0dc74c52b9beba341 Mon Sep 17 00:00:00 2001 From: Mikhail Volkhov Date: Thu, 12 Oct 2023 12:56:28 +0100 Subject: [PATCH 07/32] [#14097,#14070] Move lookup table consistency checks into LookupTable#create() --- kimchi/src/circuits/lookup/index.rs | 71 +-------------------- kimchi/src/circuits/lookup/tables/mod.rs | 78 +++++++++++++++++++++++- 2 files changed, 79 insertions(+), 70 deletions(-) diff --git a/kimchi/src/circuits/lookup/index.rs b/kimchi/src/circuits/lookup/index.rs index d1f24d3dbf..592fd0db48 100644 --- a/kimchi/src/circuits/lookup/index.rs +++ b/kimchi/src/circuits/lookup/index.rs @@ -23,15 +23,11 @@ use thiserror::Error; /// Represents an error found when computing the lookup constraint system #[derive(Debug, Error)] pub enum LookupError { - #[error("One of the lookup tables has columns of different lengths")] - InconsistentTableLength, #[error("The combined lookup table is larger than allowed by the domain size. 
Observed: {length}, expected: {maximum_allowed}")] LookupTableTooLong { length: usize, maximum_allowed: usize, }, - #[error("The table with id 0 must have an entry of all zeros")] - TableIDZeroMustHaveZeroEntry, } /// Lookup selectors @@ -227,8 +223,6 @@ impl LookupConstraintSystem { .chain(lookup_tables) .collect(); - let mut has_table_id_0 = false; - // if we are using runtime tables let (runtime_table_offset, runtime_selector) = if let Some(runtime_tables) = &runtime_tables { @@ -272,11 +266,8 @@ impl LookupConstraintSystem { let (id, first_column) = (runtime_table.id, runtime_table.first_column.clone()); - // record if table ID 0 is used in one of the runtime tables - // note: the check later will still force you to have a fixed table with ID 0 - if id == 0 { - has_table_id_0 = true; - } + // @volhovm: Do we need to enforce that there is at least one table + // with id 0? // important: we still need a placeholder column to make sure that // if all other tables have a single column @@ -345,17 +336,11 @@ impl LookupConstraintSystem { let mut table_ids: Vec = Vec::with_capacity(d1_size); let mut non_zero_table_id = false; - let mut has_table_id_0_with_zero_entry = false; for table in &lookup_tables { let table_len = table.len(); - if table.id == 0 { - has_table_id_0 = true; - if table.has_zero_entry() { - has_table_id_0_with_zero_entry = true; - } - } else { + if table.id != 0 { non_zero_table_id = true; } @@ -366,10 +351,6 @@ impl LookupConstraintSystem { //~~ * Copy the entries from the table to new rows in the corresponding columns of the concatenated table. for (i, col) in table.data.iter().enumerate() { - // See GH issue: https://github.com/MinaProtocol/mina/issues/14097 - if col.len() != table_len { - return Err(LookupError::InconsistentTableLength); - } lookup_table[i].extend(col); } @@ -379,12 +360,6 @@ impl LookupConstraintSystem { } } - // If a table has ID 0, then it must have a zero entry. - // This is for the dummy lookups to work. 
- if has_table_id_0 && !has_table_id_0_with_zero_entry { - return Err(LookupError::TableIDZeroMustHaveZeroEntry); - } - // Note: we use `>=` here to leave space for the dummy value. if lookup_table[0].len() >= max_num_entries { return Err(LookupError::LookupTableTooLong { @@ -443,43 +418,3 @@ impl LookupConstraintSystem { } } } - -#[cfg(test)] -mod tests { - - use super::*; - use crate::circuits::{ - gate::{CircuitGate, GateType}, - wires::Wire, - }; - use mina_curves::pasta::Fp; - - #[test] - fn test_zero_table_zero_row() { - let lookup_r: u64 = 32; - let num_lookups: usize = 16; - if let Ok(domain) = EvaluationDomains::::create(2 * lookup_r as usize) { - // Table column that /does not/ contain zeros - let lookup_table_values_1: Vec<_> = (1..lookup_r+1).map(From::from).collect(); - // Another table column that /does/ contain zeros. - // Jointly two tables /do not/ have a full zero now. - let lookup_table_values_2: Vec<_> = (0..lookup_r).map(From::from).collect(); - - let lookup_tables: Vec> = vec![LookupTable { - id: 0, - data: vec![lookup_table_values_1, lookup_table_values_2], - }]; - - let gates: Vec> = (0..num_lookups) - .map(|i| CircuitGate::new(GateType::Lookup, Wire::for_row(i), vec![])) - .collect(); - - let res = - LookupConstraintSystem::create(gates.as_slice(), lookup_tables, None, &domain); - assert!( - matches!(res, Err(LookupError::TableIDZeroMustHaveZeroEntry)), - "LookupConstraintSystem::create(...) 
must fail when zero table has no zero rows" - ); - } - } -} diff --git a/kimchi/src/circuits/lookup/tables/mod.rs b/kimchi/src/circuits/lookup/tables/mod.rs index d57d36a828..063e3cf78f 100644 --- a/kimchi/src/circuits/lookup/tables/mod.rs +++ b/kimchi/src/circuits/lookup/tables/mod.rs @@ -1,6 +1,7 @@ use ark_ff::{FftField, One, Zero}; use poly_commitment::PolyComm; use serde::{Deserialize, Serialize}; +use thiserror::Error; pub mod range_check; pub mod xor; @@ -27,12 +28,41 @@ pub struct LookupTable { pub data: Vec>, } +/// Represents inconsistency errors during table construction and composition. +#[derive(Debug, Error)] +pub enum LookupTableError { + #[error("One of the lookup tables has columns of different lengths")] + InconsistentTableLength, + #[error("The table with id 0 must have an entry of all zeros")] + TableIDZeroMustHaveZeroEntry, +} + impl LookupTable where F: FftField, { + pub fn create(id: i32, data: Vec>) -> Result { + let res = LookupTable { id, data }; + let table_len = res.len(); + + // All columns in the table must have same length + for col in res.data.iter() { + if col.len() != table_len { + return Err(LookupTableError::InconsistentTableLength); + } + } + + // If a table has ID 0, then it must have a zero entry. + // This is for the dummy lookups to work. + if id == 0 && !res.has_zero_entry() { + return Err(LookupTableError::TableIDZeroMustHaveZeroEntry); + } + + Ok(res) + } + /// Return true if the table has an entry (row) containing all zeros. - pub fn has_zero_entry(&self) -> bool { + fn has_zero_entry(&self) -> bool { // reminder: a table is written as a list of columns, // not as a list of row entries. for row in 0..self.len() { @@ -58,8 +88,11 @@ where self.data.len() } - /// Returns the length of the table. + /// Returns the length (height) of the table. 
pub fn len(&self) -> usize { + if self.is_empty() { + panic!("LookupTable#len() is called on an empty table") + } self.data[0].len() } @@ -212,3 +245,44 @@ pub mod caml { } } } + +#[cfg(test)] +mod tests { + + use super::*; + use mina_curves::pasta::Fp; + + #[test] + fn test_zero_table_zero_row() { + let lookup_r: u64 = 32; + // Table column that /does not/ contain zeros + let lookup_table_values_1: Vec<_> = (1..lookup_r + 1).map(From::from).collect(); + // Another table column that /does/ contain zeros. + let lookup_table_values_2: Vec<_> = (0..lookup_r).map(From::from).collect(); + + // Jointly two columns /do not/ have a full zero now. + let table: Result, _> = + LookupTable::create(0, vec![lookup_table_values_1, lookup_table_values_2]); + + assert!( + matches!(table, Err(LookupTableError::TableIDZeroMustHaveZeroEntry)), + "LookupTable::create(...) must fail when zero table has no zero rows" + ); + } + + #[test] + fn test_inconsistent_lengths() { + let lookup_r: u64 = 32; + // Two columns of different lengths + let lookup_table_values_1: Vec<_> = (0..2 * lookup_r).map(From::from).collect(); + let lookup_table_values_2: Vec<_> = (0..lookup_r).map(From::from).collect(); + + let table: Result, _> = + LookupTable::create(0, vec![lookup_table_values_1, lookup_table_values_2]); + + assert!( + matches!(table, Err(LookupTableError::InconsistentTableLength)), + "LookupTable::create(...) 
must fail when columns are not of the same length" + ); + } +} From 2cf2ea49c97c38dd68b4792bfb78ddf3e6010008 Mon Sep 17 00:00:00 2001 From: Mikhail Volkhov Date: Sat, 21 Oct 2023 13:00:21 +0100 Subject: [PATCH 08/32] Cosmetics on the lookup RFC --- book/src/rfcs/3-lookup.md | 132 ++++++++++++++++++++------------------ 1 file changed, 69 insertions(+), 63 deletions(-) diff --git a/book/src/rfcs/3-lookup.md b/book/src/rfcs/3-lookup.md index 6f256e6a6f..b7e0e7979f 100644 --- a/book/src/rfcs/3-lookup.md +++ b/book/src/rfcs/3-lookup.md @@ -1,4 +1,4 @@ -# RFC: Plookup in kimchi +# RFC: Plookup in Kimchi In 2020, [plookup](https://eprint.iacr.org/2020/315.pdf) showed how to create lookup proofs. Proofs that some witness values are part of a [lookup table](https://en.wikipedia.org/wiki/Lookup_table). Two years later, an independent team published [plonkup](https://eprint.iacr.org/2022/086) showing how to integrate Plookup into Plonk. @@ -40,17 +40,17 @@ where $\text{diff}$ is a new set derived by applying a "randomized difference" b The equality between the multisets can be proved with the permutation argument of plonk, which would look like enforcing constraints on the following accumulator: -* init: $acc_0 = 1$ -* final: $acc_n = 1$ +* init: $\mathsf{acc}_0 = 1$ +* final: $\mathsf{acc}_n = 1$ * for every $0 < i \leq n$: $$ - acc_i = acc_{i-1} \cdot \frac{(\gamma + (1+\beta) f_{i-1})(\gamma + t_{i-1} + \beta t_i)}{(\gamma + s_{i-1} + \beta s_{i})} + \mathsf{acc}_i = \mathsf{acc}_{i-1} \cdot \frac{(\gamma + (1+\beta) f_{i-1})(\gamma + t_{i-1} + \beta t_i)}{(\gamma + s_{i-1} + \beta s_{i})} $$ - + Note that the plookup paper uses a slightly different equation to make the proof work. 
I believe the proof would work with the above equation, but for simplicity let's just use the equation published in plookup: $$ -acc_i = acc_{i-1} \cdot \frac{(1+\beta)(\gamma + f_{i-1})(\gamma(1 + \beta) + t_{i-1} + \beta t_i)}{(\gamma(1+\beta) + s_{i-1} + \beta s_{i})} +\mathsf{acc}_i = \mathsf{acc}_{i-1} \cdot \frac{(1+\beta)(\gamma + f_{i-1})(\gamma(1 + \beta) + t_{i-1} + \beta t_i)}{(\gamma(1+\beta) + s_{i-1} + \beta s_{i})} $$ > Note: in plookup $s$ is too large, and so needs to be split into multiple vectors to enforce the constraint at every $i \in [[0;n]]$. We ignore this for now. @@ -67,9 +67,9 @@ Kimchi uses a single **lookup table** at the moment of this writing; the XOR tab | 1 | 1 | 0 | | 0 | 0 | 0 | -Whereas kimchi uses the XOR table for values of 4 bits, which has $2^{8}$ entries. +Whereas kimchi uses the XOR table for values of $4$ bits, which has $2^{8}$ entries. -Note: the (0, 0, 0) **entry** is at the very end on purpose (as it will be used as dummy entry for rows of the witness that don't care about lookups). +Note: the $(0, 0, 0)$ **entry** is at the very end on purpose (as it will be used as dummy entry for rows of the witness that don't care about lookups). ### Querying the table @@ -80,16 +80,16 @@ The plookup paper handles a vector of lookups $f$ which we do not have. So the f Let's go over the first item in this section. 
-For example, the following **query** tells us that we want to check if $r_0 \oplus r_2 = 2r_1$ +For example, the following **query** tells us that we want to check if $r_0 \oplus r_2 = 2\cdot r_1$ -| l | r | o | -| :---: | :---: | :---: | -| 1, r0 | 1, r2 | 2, r1 | +| l | r | o | +| :---: | :---: | :---: | +| 1, $r_0$ | 1, $r_2$ | 2, $r_1$ | The grand product argument for the lookup consraint will look like this at this point: $$ -acc_i = acc_{i-1} \cdot \frac{\color{green}{(1+\beta)(\gamma + w_0(g^i) + j \cdot w_2(g^i) + j^2 \cdot 2 \cdot w_1(g^i))}(\gamma(1 + \beta) + t_{i-1} + \beta t_i)}{(\gamma(1+\beta) + s_{i-1} + \beta s_{i})} +\mathsf{acc}_i = \mathsf{acc}_{i-1} \cdot \frac{(1+\beta){\color{green}(\gamma + w_0(g^i) + j \cdot w_2(g^i) + j^2 \cdot 2 \cdot w_1(g^i))}(\gamma(1 + \beta) + t_{i-1} + \beta t_i)}{(\gamma(1+\beta) + s_{i-1} + \beta s_{i})} $$ Not all rows need to perform queries into a lookup table. We will use a query selector in the next section to make the constraints work with this in mind. @@ -109,63 +109,67 @@ Both the (XOR) lookup table and the query are built-ins in kimchi. The query sel The grand product argument for the lookup constraint looks like this now: $$ -acc_i = acc_{i-1} \cdot \frac{\color{green}{(1+\beta) \cdot query} \cdot (\gamma(1 + \beta) + t_{i-1} + \beta t_i)}{(\gamma(1+\beta) + s_{i-1} + \beta s_{i})} +\mathsf{acc}_i = \mathsf{acc}_{i-1} \cdot \frac{(1+\beta) \cdot {\color{green}\mathsf{query}} \cdot (\gamma(1 + \beta) + t_{i-1} + \beta t_i)}{(\gamma(1+\beta) + s_{i-1} + \beta s_{i})} $$ -where $\color{green}{query}$ is constructed so that a dummy query ($0 \oplus 0 = 0$) is used on rows that don't have a query. +where $\color{green}{\mathsf{query}}$ is constructed so that a dummy query ($0 \oplus 0 = 0$) is used on rows that don't have a query. 
$$ \begin{align} -query = &\ selector \cdot (\gamma + w_0(g^i) + j \cdot w_2(g^i) + j^2 \cdot 2 \cdot w_1(g^i)) + \\ -&\ (1- selector) \cdot (\gamma + 0 + j \cdot 0 + j^2 \cdot 0) +\mathsf{query} := &\ \mathsf{selector} \cdot (\gamma + w_0(g^i) + j \cdot w_2(g^i) + j^2 \cdot 2 \cdot w_1(g^i)) + \\ +&\ (1- \mathsf{selector}) \cdot (\gamma + 0 + j \cdot 0 + j^2 \cdot 0) \end{align} $$ ### Queries, not query -Since we allow multiple queries per row, we define multiple **queries**, where each query is associated with a **lookup selector**. +Since we allow multiple queries per row, we define multiple **queries**, where each query is associated with a **lookup selector**. At the moment of this writing, the `ChaCha` gates all perform $4$ queries in a row. Thus, $4$ is trivially the largest number of queries that happen in a row. -**Important**: to make constraints work, this means that each row must make 4 queries. (Potentially some or all of them are dummy queries.) +**Important**: to make constraints work, this means that each row must make $4$ queries. (Potentially some or all of them are dummy queries.) 
-For example, the `ChaCha0`, `ChaCha1`, and `ChaCha2` gates will apply the following 4 XOR queries on the current and following rows: +For example, the `ChaCha0`, `ChaCha1`, and `ChaCha2` gates will jointly apply the following 4 XOR queries on the current and following rows: -| l | r | o | - | l | r | o | - | l | r | o | - | l | r | o | -| :---: | :---: | :----: | --- | :---: | :---: | :----: | --- | :---: | :---: | :----: | --- | :---: | :----: | :----: | -| 1, r3 | 1, r7 | 1, r11 | - | 1, r4 | 1, r8 | 1, r12 | - | 1, r5 | 1, r9 | 1, r13 | - | 1, r6 | 1, r10 | 1, r14 | +| l | r | o | - | l | r | o | - | l | r | o | - | l | r | o | +| :---: | :---: | :----: | --- | :---: | :---: | :----: | --- | :---: | :---: | :----: | --- | :---: | :----: | :----: | +| 1, $r_3$ | 1, $r_7$ | 1, $r_{11}$ | - | 1, $r_4$ | 1, $r_8$ | 1, $r_{12}$ | - | 1, $r_5$ | 1, $r_9$ | 1, $r_{13}$ | - | 1, $r_6$ | 1, $r_{10}$ | 1, $r_{14}$ | which you can understand as checking for the current and following row that -* $r_3 \oplus r7 = r_{11}$ -* $r_4 \oplus r8 = r_{12}$ -* $r_5 \oplus r9 = r_{13}$ -* $r_6 \oplus r10 = r_{14}$ +$$ +\begin{align} +r_3 \oplus r_7 &= r_{11}\\ +r_4 \oplus r_8 &= r_{12}\\ +r_5 \oplus r_9 &= r_{13}\\ +r_6 \oplus r_{10} &= r_{14} +\end{align} +$$ -The `ChaChaFinal` also performs $4$ (somewhat similar) queries in the XOR lookup table. In total this is 8 different queries that could be associated to 8 selector polynomials. +The `ChaChaFinal` also performs $4$ (somewhat similar) queries in the XOR lookup table. In total this is $8$ different queries that could be associated to $8$ selector polynomials. ### Grouping queries by queries pattern Associating each query with a selector polynomial is not necessarily efficient. 
To summarize: -* the `ChaCha0`, `ChaCha1`, and `ChaCha2` gates that make $4$ queries into the XOR table -* the `ChaChaFinal` gate makes $4$ different queries into the XOR table +* the `ChaCha0`, `ChaCha1`, and `ChaCha2` gates that in total make $4$ queries into the XOR table +* the `ChaChaFinal` gate makes another $4$ different queries into the XOR table Using the previous section's method, we'd have to use $8$ different lookup selector polynomials for each of the different $8$ queries. Since there's only $2$ use-cases, we can simply group them by **queries patterns** to reduce the number of lookup selector polynomials to $2$. The grand product argument for the lookup constraint looks like this now: $$ -acc_i = acc_{i-1} \cdot \frac{\color{green}{(1+\beta)^4 \cdot query} \cdot (\gamma(1 + \beta) + t_{i-1} + \beta t_i)}{(\gamma(1+\beta) + s_{i-1} + \beta s_{i})} +\mathsf{acc}_i = \mathsf{acc}_{i-1} \cdot \frac{{\color{green}(1+\beta)^4 \cdot \mathsf{query}} \cdot (\gamma(1 + \beta) + t_{i-1} + \beta t_i)}{(\gamma(1+\beta) + s_{i-1} + \beta s_{i})} $$ -where $\color{green}{query}$ is constructed as: +where $\color{green}{\mathsf{query}}$ is constructed as: $$ \begin{align} -query = &\ selector_1 \cdot pattern_1 + \\ -&\ selector_2 \cdot pattern_2 + \\ -&\ (1 - selector_1 - selector_2) \cdot (\gamma + 0 + j \cdot 0 + j^2 \cdot 0)^4 +\mathsf{query} = &\ \mathsf{selector}_1 \cdot \mathsf{pattern}_1 + \\ +&\ \mathsf{selector}_2 \cdot \mathsf{pattern}_2 + \\ +&\ (1 - \mathsf{selector}_1 - \mathsf{selector}_2) \cdot (\gamma + 0 + j \cdot 0 + j^2 \cdot 0)^4 \end{align} $$ @@ -173,17 +177,17 @@ where, for example the first pattern for the `ChaCha0`, `ChaCha1`, and `ChaCha2` $$ \begin{align} -pattern_1 = &\ (\gamma + w_3(g^i) + j \cdot w_7(g^i) + j^2 \cdot w_{11}(g^i)) \cdot \\ +\mathsf{pattern}_1 = &\ (\gamma + w_3(g^i) + j \cdot w_7(g^i) + j^2 \cdot w_{11}(g^i)) \cdot \\ &\ (\gamma + w_4(g^i) + j \cdot w_8(g^i) + j^2 \cdot w_{12}(g^i)) \cdot \\ &\ (\gamma + w_5(g^i) + j 
\cdot w_9(g^i) + j^2 \cdot w_{13}(g^i)) \cdot \\ &\ (\gamma + w_6(g^i) + j \cdot w_{10}(g^i) + j^2 \cdot w_{14}(g^i)) \cdot \\ \end{align} $$ -Note: +Note that: -* there's now 4 dummy queries, and they only appear when none of the lookup selectors are active -* if a pattern uses less than 4 queries, they'd have to pad their queries with dummy queries as well +* There's now $4$ dummy queries, and they only appear when none of the lookup selectors are active +* If a pattern uses less than $4$ queries, they'd have to pad their queries with dummy queries as well ## Back to the grand product argument @@ -192,58 +196,60 @@ There are two things that we haven't touched on: * The vector $t$ representing the **combined lookup table** (after its columns have been combined with a joint combiner $j$). The **non-combined loookup table** is fixed at setup time and derived based on the lookup tables used in the circuit (for now only one, the XOR lookup table, can be used in the circuit). * The vector $s$ representing the sorted multiset of both the queries and the lookup table. This is created by the prover and sent as commitment to the verifier. -The first vector $t$ is quite straightforward to think about: +The first vector $t$ is quite straightforward to think about: * if it is smaller than the domain (of size $n$), then we can repeat the last entry enough times to make the table of size $n$. * if it is larger than the domain, then we can either increase the domain or split the vector in two (or more) vectors. This is most likely what we will have to do to support multiple lookup tables later. -What about the second vector? +What about the second vector $s$? 
## The sorted vector $s$ -The second vector $s$ is of size +The second vector $s$ is of size $$n \cdot |\text{queries}| + |\text{lookup\_table}|$$ That is, it contains the $n$ elements of each **query vectors** (the actual values being looked up, after being combined with the joint combinator, that's $4$ per row), as well as the elements of our lookup table (after being combined as well). -Because the vector $s$ is larger than the domain size $n$, it is split into several vectors of size $n$. Specifically, in the plonkup paper, the two halves of $s$ (which are then interpolated as $h_1$ and $h_2$). +Because the vector $s$ is larger than the domain size $n$, it is split into several vectors of size $n$. Specifically, in the plonkup paper, the two halves of $s$, which are then interpolated as $h_1$ and $h_2$. $$ -acc_i = acc_{i-1} \cdot \frac{\color{green}{(1+\beta)^4 \cdot query} \cdot (\gamma(1 + \beta) + t_{i-1} + \beta t_i)}{(\gamma(1+\beta) + s_{i-1} + \beta s_{i})(\gamma(1+\beta)+s_{n+i-1} + \beta s_{n+i})} +\mathsf{acc}_i = \mathsf{acc}_{i-1} \cdot \frac{{\color{green}(1+\beta)^4 \cdot \mathsf{query}} \cdot (\gamma(1 + \beta) + t_{i-1} + \beta t_i)}{(\gamma(1+\beta) + s_{i-1} + \beta s_{i})(\gamma(1+\beta)+s_{n+i-1} + \beta s_{n+i})} $$ -Since you must compute the difference of every contiguous pairs, the last element of the first half is the replicated as the first element of the second half ($s_{n-1} = s_{n}$), and a separate constraint enforces that continuity on the interpolated polynomials $h_1$ and $h_2$: +Since one has to compute the difference of every contiguous pairs, the last element of the first half is the replicated as the first element of the second half ($s_{n-1} = s_{n}$), and a separate constraint enforces that continuity on the interpolated polynomials $h_1$ and $h_2$: $$L_{n-1}(h_1(x) - h_2(g \cdot x)) = 0$$ -which is equivalent with checking that +which is equivalent to checking that $$h_1(g^{n-1}) = h_2(1)$$ ## The sorted vector $s$ in 
kimchi -Since this vector is known only by the prover, and is evaluated as part of the protocol, zero-knowledge must be added to the polynomial. To do this in kimchi, we use the same technique as with the other prover polynomials: we randomize the last evaluations (or rows, on the domain) of the polynomial. +Since this vector is known only by the prover, and is evaluated as part of the protocol, zero-knowledge must be added to the corresponding polynomial (in case of plookup approach, to $h_1(X),h_2(X)$). To do this in kimchi, we use the same technique as with the other prover polynomials: we randomize the last evaluations (or rows, on the domain) of the polynomial. This means two things for the lookup grand product argument: -1. we cannot use the wrap around trick to make sure that the list is split in two correctly (enforced by $L_{n-1}(h_1(x) - h_2(g \cdot x)) = 0$ which is equivalent to $h_1(g^{n-1}) = h_2(1)$ in the plookup paper) -2. we have even less space to store an entire query vector. Which is actually super correct, as the witness also has some zero-knowledge rows at the end that should not be part of the queries anyway. +1. We cannot use the wrap around trick to make sure that the list is split in two correctly (enforced by $L_{n-1}(h_1(x) - h_2(g \cdot x)) = 0$ which is equivalent to $h_1(g^{n-1}) = h_2(1)$ in the plookup paper) +2. We have even less space to store an entire query vector. Which is actually super correct, as the witness also has some zero-knowledge rows at the end that should not be part of the queries anyway. The first problem can be solved in two ways: -* **Zig-zag technique**. By reorganizing $s$ to alternate its values between the columns. For example, $h_1 = (s_0, s_2, s_4, \cdots)$ and $h_2 = (s_1, s_3, s_5, \cdots)$ so that you can simply write the denominator of the grand product argument as +* **Zig-zag technique**. By reorganizing $s$ to alternate its values between the columns. 
For example, $h_1 = (s_0, s_2, s_4, \cdots)$ and $h_2 = (s_1, s_3, s_5, \cdots)$ so that you can simply write the denominator of the grand product argument as $$(\gamma(1+\beta) + h_1(x) + \beta h_2(x))(\gamma(1+\beta)+ h_2(x) + \beta h_1(x \cdot g))$$ - this is what the [plonkup](https://eprint.iacr.org/2022/086) paper does. -* **Snake technique**. by reorganizing $s$ as a snake. This is what is done in kimchi currently. + Whis approach is taken by the [plonkup](https://eprint.iacr.org/2022/086) paper. +* **Snake technique**. By reorganizing $s$ as a snake. This is what is currently implemented in kimchi. The snake technique rearranges $s$ into the following shape: ``` - _ _ - | | | | | - | | | | | - |_| |_| | + __ _ + s_0 | s_{2n-1} | | | | + ... | ... | | | | + s_{n-1} | s_n | | | | + ‾‾‾‾‾‾‾‾‾‾‾ ‾‾ ‾ + h1 h2 h3 ... ``` so that the denominator becomes the following equation: @@ -264,19 +270,19 @@ $$L_{0} \cdot (h_2(x) - h_3(x)) = 0$$ ## Unsorted $t$ in $s$ -Note that at setup time, $t$ cannot be sorted as it is not combined yet. Since $s$ needs to be sorted by $t$ (in other words, not sorted, but sorted following the elements of $t$), there are two solutions: +Note that at setup time, $t$ cannot be sorted lexicographically as it is not combined yet. Since $s$ must be sorted by $t$ (in other words sorting of $s$ must follow the elements of $t$), there are two solutions: -1. both the prover and the verifier can sort the combined $t$, so that $s$ can be sorted via the typical sorting algorithms -2. the prover can sort $s$ by $t$, so that the verifier doesn't have to do any sorting and can just rely on the commitment of the columns of $t$ (which the prover can evaluate in the protocol). +1. Both the prover and the verifier can sort the combined $t$ lexicographically, so that $s$ can be sorted lexicographically too using typical sorting algorithms +2. 
The prover can directly sort $s$ by $t$, so that the verifier doesn't have to do any pre-sorting and can just rely on the commitment of the columns of $t$ (which the prover can evaluate in the protocol). -We do the second one, but there is an edge-case: the combined $t$ entries can repeat. -For some $i, l$ such that $i \neq l$, we might have +We take the second approach. +However, this must be done carefully since the combined $t$ entries can repeat. For some $i, l$ such that $i \neq l$, we might have $$ -t_0[i] + j t_1[i] + j^2 t_2[i] = t_0[l] + j t_1[l] + j^2 t_2[l] +t_0[i] + j \cdot t_1[i] + j^2 \cdot t_2[i] = t_0[l] + j \cdot t_1[l] + j^2 \cdot t_2[l] $$ -For example, if $f = \{1, 2, 2, 3\}$ and $t = \{2, 1, 2, 3\}$, then $\text{sorted}(f, t) = \{2, 2, 2, 1, 1, 2, 3, 3\}$ would be one way of sorting things out. But $\text{sorted}(f, t) = \{ 2, 2, 2, 2, 1, 1, 3, 3 \}$ would be incorrect. +For example, if $f = \{1, 2, 2, 3\}$ and $t = \{2, 1, 2, 3\}$, then $\text{sorted}(f, t) = \{2, 2, 2, 1, 1, 2, 3, 3\}$ would be a way of correctly sorting the combined vector $s$. At the same time $\text{sorted}(f, t) = \{ 2, 2, 2, 2, 1, 1, 3, 3 \}$ is incorrect since it does not have a second block of $2$s, and thus such an $s$ is not sorted by $t$. 
## Recap From c5d1459550be4a8d1a6b84fc85fbecbcbe327487 Mon Sep 17 00:00:00 2001 From: Mikhail Volkhov Date: Mon, 23 Oct 2023 09:51:14 +0100 Subject: [PATCH 09/32] Capitalize book summary titles --- book/src/SUMMARY.md | 34 +++++++++++++++++----------------- 1 file changed, 17 insertions(+), 17 deletions(-) diff --git a/book/src/SUMMARY.md b/book/src/SUMMARY.md index f39f655421..1ae5454019 100644 --- a/book/src/SUMMARY.md +++ b/book/src/SUMMARY.md @@ -9,15 +9,15 @@ - [Rings](./fundamentals/zkbook_rings.md) - [Fields](./fundamentals/zkbook.md) - [Polynomials](./fundamentals/zkbook_polynomials.md) - - [Multiplying polynomials](./fundamentals/zkbook_multiplying_polynomials.md) - - [Fast Fourier transform](./fundamentals/zkbook_fft.md) + - [Multiplying Polynomials](./fundamentals/zkbook_multiplying_polynomials.md) + - [Fast Fourier Transform](./fundamentals/zkbook_fft.md) # Cryptographic tools - [Commitments](./fundamentals/zkbook_commitment.md) -- [Polynomial commitments](./plonk/polynomial_commitments.md) - - [Inner product argument](./plonk/inner_product.md) - - [Different functionnalities](./plonk/inner_product_api.md) +- [Polynomial Commitments](./plonk/polynomial_commitments.md) + - [Inner Product Argument](./plonk/inner_product.md) + - [Different Functionnalities](./plonk/inner_product_api.md) - [Two Party Computation](./fundamentals/zkbook_2pc/overview.md) - [Garbled Circuits](./fundamentals/zkbook_2pc/gc.md) - [Basics](./fundamentals/zkbook_2pc/basics.md) @@ -45,16 +45,16 @@ - [Overview](./plonk/overview.md) - [Glossary](./plonk/glossary.md) - [Domain](./plonk/domain.md) -- [Lagrange basis in multiplicative subgroups](./plonk/lagrange.md) -- [Non-interaction with fiat-shamir](./plonk/fiat_shamir.md) +- [Lagrange Basis in Multiplicative Subgroups](./plonk/lagrange.md) +- [Non-interaction with Fiat-Shamir](./plonk/fiat_shamir.md) - [Plookup](./plonk/plookup.md) -- [Maller's optimization](./plonk/maller.md) +- [Maller's Optimization](./plonk/maller.md) # Kimchi - 
[Overview](./kimchi/overview.md) - [Arguments](./kimchi/arguments.md) - - [Custom gates](./kimchi/gates.md) + - [Custom Gates](./kimchi/gates.md) - [Permutation](./kimchi/permut.md) - [Lookup](./kimchi/lookup.md) @@ -67,20 +67,20 @@ # RFCs -- [RFC 0: Alternative zero-knowledge](./plonk/zkpm.md) -- [RFC 1: Final check](./plonk/final_check.md) -- [RFC 2: Maller's optimization for kimchi](./plonk/maller_15.md) -- [RFC 3: Plookup integration in kimchi](./rfcs/3-lookup.md) -- [RFC 4: Extended lookup tables](./rfcs/extended-lookup-tables.md) +- [RFC 0: Alternative Zero-Knowledge](./plonk/zkpm.md) +- [RFC 1: Final Check](./plonk/final_check.md) +- [RFC 2: Maller's Optimization for Kimchi](./plonk/maller_15.md) +- [RFC 3: Plookup Integration in Kimchi](./rfcs/3-lookup.md) +- [RFC 4: Extended Lookup Tables](./rfcs/extended-lookup-tables.md) - [RFC 5: Foreign Field Addition](./rfcs/foreign_field_add.md) - [RFC 6: Foreign Field Multiplication](./rfcs/foreign_field_mul.md) - [RFC 7: Keccak](./rfcs/keccak.md) - + # Specifications - [Poseidon hash](./specs/poseidon.md) -- [Polynomial commitment](./specs/poly-commitment.md) -- [Pasta curves](./specs/pasta.md) +- [Polynomial Commitment](./specs/poly-commitment.md) +- [Pasta Curves](./specs/pasta.md) - [Kimchi](./specs/kimchi.md) - [Universal Reference String (URS)](./specs/urs.md) - [Pickles](./specs/pickles.md) From d71b06bb309966bf8cb0ef0b7c641f2bae677e19 Mon Sep 17 00:00:00 2001 From: Mikhail Volkhov Date: Mon, 23 Oct 2023 09:52:31 +0100 Subject: [PATCH 10/32] Add .ignore file to .gitignore --- .gitignore | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/.gitignore b/.gitignore index 3a29d80589..fb03a39692 100644 --- a/.gitignore +++ b/.gitignore @@ -25,4 +25,6 @@ _build *.html # If symlink created for kimchi-visu -tools/srs \ No newline at end of file +tools/srs + +.ignore From 51e267287f031eb6e93b138e9ca24c28d9b4d3ab Mon Sep 17 00:00:00 2001 From: Mikhail Volkhov Date: Mon, 23 Oct 2023 13:45:00 +0100 
Subject: [PATCH 11/32] Improve RFC3, fix rendering in kimchi/overview.md --- book/src/kimchi/overview.md | 22 +++--- book/src/rfcs/3-lookup.md | 81 ++++++++++++++--------- kimchi/src/circuits/lookup/constraints.rs | 2 + 3 files changed, 64 insertions(+), 41 deletions(-) diff --git a/book/src/kimchi/overview.md b/book/src/kimchi/overview.md index b8ad73a78e..6ecf0f95e4 100644 --- a/book/src/kimchi/overview.md +++ b/book/src/kimchi/overview.md @@ -1,11 +1,11 @@ # Overview -Here we explain how the Kimchi protocol design is translated into the `proof-systems` repository, from a high level perspective, touching briefly on all the involved aspects of cryptography. The concepts that we will be introducing can be studied more thoroughly by accessing the specific sections in the book. +Here we explain how the Kimchi protocol design is translated into the `proof-systems` repository, from a high level perspective, touching briefly on all the involved aspects of cryptography. The concepts that we will be introducing can be studied more thoroughly by accessing the specific sections in the book. -In brief, the Kimchi protocol requires three different types of arguments `Argument`: -- **Custom gates:** they correspond to each of the specific functions performed by the circuit, which are represented by gate constraints. +In brief, the Kimchi protocol requires three different types of arguments `Argument`: +- **Custom gates:** they correspond to each of the specific functions performed by the circuit, which are represented by gate constraints. - **Permutation:** the equality between different cells is constrained by copy constraints, which are represented by a permutation argument. It represents the wiring between gates, the connections from/to inputs and outputs. -- **Lookup tables:** for efficiency reasons, some public information can be stored by both parties (prover and verifier) instead of wired in the circuit. Examples of these are boolean functions. 
+- **Lookup tables:** for efficiency reasons, some public information can be stored by both parties (prover and verifier) instead of wired in the circuit. Examples of these are boolean functions. All of these arguments are translated into equations that must hold for a correct witness for the full relation. Equivalently, this is to say that a number of expressions need to evaluate to zero on a certain set of numbers. So there are two problems to tackle here: @@ -24,31 +24,31 @@ $$q(X) := \frac{p(X)}{v_S(X)}$$ And still, where's the hype? If you can provide such a quotient polynomial, one could easily check that if $q(a) = p(a) / v_S(a)$ for a random number $a\in\mathbb{F}$ \ $S$ (recall you will check in a point out of the set, otherwise you would get a $0/0$), then with very high probability that would mean that actually $p(X) = q(X) \cdot v_S(X)$, meaning that $p(X)$ vanishes on the whole set $S$, with **just one point**! -Let's take a deeper look into the _"magic"_ going on here. First, what do we mean by _high probability_? Is this even good enough? And the answer to this question is: as good as you want it to be. +Let's take a deeper look into the _"magic"_ going on here. First, what do we mean by _high probability_? Is this even good enough? And the answer to this question is: as good as you want it to be. **First** we analyse the math in this check. If the polynomial form of $p(X) = q(X) \cdot v_S(X)$ actually holds, then of course for any possible $a\in\mathbb{F}$ \ $S$ the check $p(a) =_? q(a) \cdot v_S(a)$ will hold. But is there any unlucky instantiation of the point $a$ such that $p(a) = q(a) \cdot v_S(a)$ but $p(X) \neq q(X) \cdot v_S(X)$? And the answer is, yes, there are, BUT not many. But how many? How unlikely this is? You already know the answer to this: **Schwartz-Zippel**. Recalling this lemma: -> Given two different polynomials $f(X)$ and $g(X)$ of degree $d$, they can at most intersect (i.e. _coincide_) in $d$ points. 
Or what's equivalent, let $h(X) := f(X) - g(X)$, the polynomial $h(X)$ can only evaluate to $0$ in at most $d$ points (its roots). +> Given two different polynomials $f(X)$ and $g(X)$ of degree $d$, they can at most intersect (i.e. _coincide_) in $d$ points. Or what's equivalent, let $h(X) := f(X) - g(X)$, the polynomial $h(X)$ can only evaluate to $0$ in at most $d$ points (its roots). Thus, if we interchange $p(X) \rightarrow f(X)$ and $q(X)\cdot v_S(X) \rightarrow g(X)$, both of degree $d$, there are at most $\frac{d}{|\mathbb{F}- S|}$ unlucky points of $a$ that could trick you into thinking that $p(X)$ was a multiple of the vanishing polynomial (and thus being equal to zero on all of $S$). So, how can you make this error probability negligible? By having a field size that is big enough (the formal definition says that the inverse of its size should decrease faster than any polynomial expression). Since we are working with fields of size $2^{255}$, we are safe on this side! **Second**, is this really faster than checking that $p(x)=0$ for all $x\in S$ ? At the end of the day, it seems like we need to evaluate $v_S(a)$, and since this is a degree $|S|$ polynomial it looks like we are still performing about the same order of computations. But here comes math again. _In practice_, we want to define this set $S$ to have a _nice structure_ that allows us to perform some computations more efficiently than with arbitrary sets of numbers. Indeed, this set will normally be a **multiplicative group** (normally represented as $\mathbb{G}$ or $\mathbb{H}$), because in such groups the vanishing polynomial $v_\mathbb{G}(X):=\prod_{\omega\in\mathbb{G}}(X-\omega)$ has an efficient representation $v_\mathbb{G}(X)=X^{|\mathbb{G}|}-1$, which is much faster to evaluate than the above product. -**Third**, we may want to understand what happens with the evaluation of $p(a)$ instead. Since this is a degree $d ≥ |\mathbb{G}|$, it may look like this will as well take a lot of effort. 
But here's where cryptography comes into play, since the verifier will _never_ get to evaluate the actual polynomial by themselves. Various reasons why. One, if the verifier had access to the full polynomial $p(X)$, then the prover should have sent it along with the proof, which would require $d+1$ coefficients to be represented (and this is no longer succinct for a SNARK). Two, this polynomial could carry some secret information, and if the verifier could recompute evaluations of it, they could learn some private data by evaluating on specific points. So instead, these evaluations will be a "mental game" thanks to **polynomial commitments** and **proofs of evaluation** sent by the prover (for whom a computation in the order of $d$ is not only acceptable, but necessary). The actual proof length will depend heavily on the type of polynomial commitments we are using. For example, in Kate-like commitments, committing to a polynomial takes a constant number of group elements (normally one), whereas in Bootleproof it is logarithmic. But in any case this will be shorter than sending $O(d)$ elements. +**Third**, we may want to understand what happens with the evaluation of $p(a)$ instead. Since this is a degree $d ≥ |\mathbb{G}|$, it may look like this will as well take a lot of effort. But here's where cryptography comes into play, since the verifier will _never_ get to evaluate the actual polynomial by themselves. Various reasons why. One, if the verifier had access to the full polynomial $p(X)$, then the prover should have sent it along with the proof, which would require $d+1$ coefficients to be represented (and this is no longer succinct for a SNARK). Two, this polynomial could carry some secret information, and if the verifier could recompute evaluations of it, they could learn some private data by evaluating on specific points. 
So instead, these evaluations will be a "mental game" thanks to **polynomial commitments** and **proofs of evaluation** sent by the prover (for whom a computation in the order of $d$ is not only acceptable, but necessary). The actual proof length will depend heavily on the type of polynomial commitments we are using. For example, in Kate-like commitments, committing to a polynomial takes a constant number of group elements (normally one), whereas in Bootleproof it is logarithmic. But in any case this will be shorter than sending $O(d)$ elements.
 
 ### Aggregation
 
-So far we have seen how to check that a polynomial equals zero on all of $\mathbb{G}$, with just a single point. This is somehow an aggregation _per se_. But we are left to analyse how we can prove such a thing, for many polynomials. Altogether, if they hold, this will mean that the polynomials encode a correct witness and the relation would be satisfied. These checks can be performed one by one (checking that each of the quotients are indeed correct), or using an efficient aggregation mechanism and checking only **one longer equation at once**.
+So far we have seen how to check that a polynomial equals zero on all of $\mathbb{G}$, with just a single point. This is somehow an aggregation _per se_. But we are left to analyse how we can prove such a thing, for many polynomials. Altogether, if they hold, this will mean that the polynomials encode a correct witness and the relation would be satisfied. These checks can be performed one by one (checking that each of the quotients are indeed correct), or using an efficient aggregation mechanism and checking only **one longer equation at once**.
 
 So what is the simplest way one could think of to perform this one-time check? Perhaps one could come up with the idea of adding up all of the equations $p_0(X),...,p_n(X)$ into a longer one $\sum_{i=0}^{n} p_i(X)$. But by doing this, we may be cancelling out terms and we could get an incorrect statement. 
So instead, we can multiply each term in the sum by a random number. The reason why this trick works is the independence between random numbers. That is, if two different polynomials $f(X)$ and $g(X)$ are both equal to zero on a given $X=x$, then with very high probability the same $x$ will be a root of the random combination $\alpha\cdot f(x) + \beta\cdot g(x) = 0$. If applied to the whole statement, we could transform the $n$ equations into a single equation, -$$\bigwedge_{i_n} p_i(X) =_? 0 \iff_{w.h.p.} \sum_{i=0}^{n} \rho_i \cdot p_i(X) =_? 0 $$ +$$\bigwedge_{i_n} p_i(X) \stackrel{?}{=} 0 \text{\quad iff w.h.p. \quad} \sum_{i=0}^{n} \rho_i \cdot p_i(X) \stackrel{?}{=} 0$$ -This sounds great so far. But we are forgetting about an important part of proof systems which is proof length. For the above claim to be sound, the random values used for aggregation should be verifier-chosen, or at least prover-independent. So if the verifier had to communicate with the prover to inform about the random values being used, we would get an overhead of $n$ field elements. +This sounds great so far. But we are forgetting about an important part of proof systems which is proof length. For the above claim to be sound, the random values used for aggregation should be verifier-chosen, or at least prover-independent. So if the verifier had to communicate with the prover to inform about the random values being used, we would get an overhead of $n$ field elements. Instead, we take advantage of another technique that is called **powers-of-alpha**. Here, we make the assumption that powers of a random value $\alpha^i$ are indistinguishable from actual random values $\rho_i$. Then, we can twist the above claim to use only one random element $\alpha$ to be agreed with the prover as: -$$\bigwedge_{i_n} p_i(X) =_? 0 \iff_{w.h.p.} \sum_{i=0}^{n} \alpha^i \cdot p_i(X) =_? 0 $$ +$$\bigwedge_{i_n} p_i(X) \stackrel{?}{=} 0 \text{\quad iff w.h.p. 
\quad} \sum_{i=0}^{n} \alpha^i \cdot p_i(X) \stackrel{?}{=} 0$$ diff --git a/book/src/rfcs/3-lookup.md b/book/src/rfcs/3-lookup.md index b7e0e7979f..32dc9d39b8 100644 --- a/book/src/rfcs/3-lookup.md +++ b/book/src/rfcs/3-lookup.md @@ -44,16 +44,16 @@ The equality between the multisets can be proved with the permutation argument o * final: $\mathsf{acc}_n = 1$ * for every $0 < i \leq n$: $$ - \mathsf{acc}_i = \mathsf{acc}_{i-1} \cdot \frac{(\gamma + (1+\beta) f_{i-1})(\gamma + t_{i-1} + \beta t_i)}{(\gamma + s_{i-1} + \beta s_{i})} + \mathsf{acc}_i = \mathsf{acc}_{i-1} \cdot \frac{(\gamma + (1+\beta) f_{i-1}) \cdot (\gamma + t_{i-1} + \beta t_i)}{(\gamma + s_{i-1} + \beta s_{i})(\gamma + s_{n+i-1} + \beta s_{n+i})} $$ -Note that the plookup paper uses a slightly different equation to make the proof work. I believe the proof would work with the above equation, but for simplicity let's just use the equation published in plookup: +Note that the plookup paper uses a slightly different equation to make the proof work. It is possible that the proof would work with the above equation, but for simplicity let's just use the equation published in plookup: $$ -\mathsf{acc}_i = \mathsf{acc}_{i-1} \cdot \frac{(1+\beta)(\gamma + f_{i-1})(\gamma(1 + \beta) + t_{i-1} + \beta t_i)}{(\gamma(1+\beta) + s_{i-1} + \beta s_{i})} +\mathsf{acc}_i = \mathsf{acc}_{i-1} \cdot \frac{(1+\beta) \cdot (\gamma + f_{i-1}) \cdot (\gamma(1 + \beta) + t_{i-1} + \beta t_i)}{(\gamma(1+\beta) + s_{i-1} + \beta s_{i})(\gamma(1+\beta) + s_{n+i-1} + \beta s_{n+i})} $$ -> Note: in plookup $s$ is too large, and so needs to be split into multiple vectors to enforce the constraint at every $i \in [[0;n]]$. We ignore this for now. +> Note: in plookup $s$ is longer than $n$ ($|s| = |f| + |t|$), and thus it needs to be split into multiple vectors to enforce the constraint at every $i \in [[0;n]]$. 
This leads to the two terms in the denominator as shown above, so that the degree of $\gamma (1 + \beta)$ is equal in the numerator and denominator.
 
 ### Lookup tables
 
@@ -89,7 +89,7 @@ For example, the following **query** tells us that we want to check if $r_0 \oplus
 
 The grand product argument for the lookup constraint will look like this at this point:
 
 $$
-\mathsf{acc}_i = \mathsf{acc}_{i-1} \cdot \frac{(1+\beta){\color{green}(\gamma + w_0(g^i) + j \cdot w_2(g^i) + j^2 \cdot 2 \cdot w_1(g^i))}(\gamma(1 + \beta) + t_{i-1} + \beta t_i)}{(\gamma(1+\beta) + s_{i-1} + \beta s_{i})}
+\mathsf{acc}_i = \mathsf{acc}_{i-1} \cdot \frac{(1+\beta) \cdot {\color{green}(\gamma + w_0(g^i) + j \cdot w_2(g^i) + j^2 \cdot 2 \cdot w_1(g^i))} \cdot (\gamma(1 + \beta) + t_{i-1} + \beta t_i)}{(\gamma(1+\beta) + s_{i-1} + \beta s_{i})(\gamma(1+\beta) + s_{n+i-1} + \beta s_{n+i})}
 $$
 
 Not all rows need to perform queries into a lookup table. We will use a query selector in the next section to make the constraints work with this in mind.
 
@@ -106,7 +106,7 @@ The associated **query selector** tells us on which rows the query into the XOR
 
 Both the (XOR) lookup table and the query are built-ins in kimchi. The query selector is derived from the circuit at setup time. Currently only the ChaCha gates make use of the lookups.
 
-The grand product argument for the lookup constraint looks like this now:
+With the selectors, the grand product argument for the lookup constraint has the following form:
 
 $$
 \mathsf{acc}_i = \mathsf{acc}_{i-1} \cdot \frac{(1+\beta) \cdot {\color{green}\mathsf{query}} \cdot (\gamma(1 + \beta) + t_{i-1} + \beta t_i)}{(\gamma(1+\beta) + s_{i-1} + \beta s_{i})}
@@ -121,13 +121,13 @@ $$
 \end{align}
 $$
 
-### Queries, not query
+### Supporting multiple queries
 
-Since we allow multiple queries per row, we define multiple **queries**, where each query is associated with a **lookup selector**. 
+Since we would like to allow multiple table lookups per row, we define multiple **queries**, where each query is associated with a **lookup selector**. At the moment of this writing, the `ChaCha` gates all perform $4$ queries in a row. Thus, $4$ is trivially the largest number of queries that happen in a row. -**Important**: to make constraints work, this means that each row must make $4$ queries. (Potentially some or all of them are dummy queries.) +**Important**: to make constraints work, this means that each row must make $4$ queries. Potentially some or all of them are dummy queries. For example, the `ChaCha0`, `ChaCha1`, and `ChaCha2` gates will jointly apply the following 4 XOR queries on the current and following rows: @@ -160,7 +160,7 @@ Using the previous section's method, we'd have to use $8$ different lookup selec The grand product argument for the lookup constraint looks like this now: $$ -\mathsf{acc}_i = \mathsf{acc}_{i-1} \cdot \frac{{\color{green}(1+\beta)^4 \cdot \mathsf{query}} \cdot (\gamma(1 + \beta) + t_{i-1} + \beta t_i)}{(\gamma(1+\beta) + s_{i-1} + \beta s_{i})} +\mathsf{acc}_i = \mathsf{acc}_{i-1} \cdot \frac{{\color{green}(1+\beta)^4 \cdot \mathsf{query}} \cdot (\gamma(1 + \beta) + t_{i-1} + \beta t_i)}{(\gamma(1+\beta) + s_{i-1} + \beta s_{i})\times \ldots} $$ where $\color{green}{\mathsf{query}}$ is constructed as: @@ -184,10 +184,13 @@ $$ \end{align} $$ -Note that: +Note that there's now $4$ dummy queries, and they only appear when none of the lookup selectors are active. +If a pattern uses less than $4$ queries, it has to be padded with dummy queries as well. -* There's now $4$ dummy queries, and they only appear when none of the lookup selectors are active -* If a pattern uses less than $4$ queries, they'd have to pad their queries with dummy queries as well +Finally, note that the denominator of the grand product argument is incomplete in the formula above. 
+Since the numerator has degree $5$ in $\gamma (1 + \beta)$, the denominator must match too.
+This is achieved by having a longer $s$, and referring to it $5$ times.
+The denominator thus becomes $\prod_{k=1}^{5} (\gamma (1+\beta) + s_{kn+i-1} + \beta s_{kn+i})$.
 
 ## Back to the grand product argument
 
@@ -205,25 +208,29 @@ What about the second vector $s$?
 
 ## The sorted vector $s$
 
-The second vector $s$ is of size
+We said earlier that in the original plookup the size of $s$ is equal to $|s| = |f|+|t|$, where $f$ encodes queries, and $t$ encodes the lookup table.
+With our multi-query approach, the second vector $s$ is of the size
 
-$$n \cdot |\text{queries}| + |\text{lookup\_table}|$$
+$$n \cdot |\#\text{queries}| + |\text{lookup\_table}|$$
 
 That is, it contains the $n$ elements of each **query vectors** (the actual values being looked up, after being combined with the joint combinator, that's $4$ per row), as well as the elements of our lookup table (after being combined as well).
 
 Because the vector $s$ is larger than the domain size $n$, it is split into several vectors of size $n$. Specifically, in the plonkup paper, the two halves of $s$, which are then interpolated as $h_1$ and $h_2$.
- +The denominator in plonk in the vector form is $$ -\mathsf{acc}_i = \mathsf{acc}_{i-1} \cdot \frac{{\color{green}(1+\beta)^4 \cdot \mathsf{query}} \cdot (\gamma(1 + \beta) + t_{i-1} + \beta t_i)}{(\gamma(1+\beta) + s_{i-1} + \beta s_{i})(\gamma(1+\beta)+s_{n+i-1} + \beta s_{n+i})} +\big(\gamma(1+\beta) + s_{i-1} + \beta s_{i}\big)\big(\gamma(1+\beta)+s_{n+i-1} + \beta s_{n+i}\big) +$$ +which, when interpolated into $h_1$ and $h_2$, becomes +$$ +\big(\gamma(1+\beta) + h_1(x) + \beta h_1(g \cdot x)\big)\big(\gamma(1+\beta) + h_2(x) + \beta h_2(g \cdot x)\big) $$ -Since one has to compute the difference of every contiguous pairs, the last element of the first half is the replicated as the first element of the second half ($s_{n-1} = s_{n}$), and a separate constraint enforces that continuity on the interpolated polynomials $h_1$ and $h_2$: - -$$L_{n-1}(h_1(x) - h_2(g \cdot x)) = 0$$ +Since one has to compute the difference of every contiguous pairs, the last element of the first half is the replicated as the first element of the second half ($s_{n-1} = s_{n}$). +Hence, a separate constraint must be added to enforce that continuity on the interpolated polynomials $h_1$ and $h_2$: -which is equivalent to checking that +$$L_{n-1}(X)\cdot\big(h_1(X) - h_2(g \cdot X)\big) \equiv 0$$ -$$h_1(g^{n-1}) = h_2(1)$$ +which is equivalent to checking that $h_1(g^{n-1}) = h_2(1)$. ## The sorted vector $s$ in kimchi @@ -244,7 +251,7 @@ The first problem can be solved in two ways: The snake technique rearranges $s$ into the following shape: ``` - __ _ + __ _ s_0 | s_{2n-1} | | | | ... | ... | | | | s_{n-1} | s_n | | | | @@ -252,21 +259,35 @@ The snake technique rearranges $s$ into the following shape: h1 h2 h3 ... 
``` -so that the denominator becomes the following equation: +Assuming that for now we have only one bend and two polynomials $h_1(X),h_2(X)$, the denominator has the following form: -$$(\gamma(1+\beta) + h_1(x) + \beta h_1(x \cdot g))(\gamma(1+\beta)+ h_2(x \cdot g) + \beta h_2(x))$$ +$$\big(\gamma(1+\beta) + h_1(x) + \beta h_1(x \cdot g)\big)\big(\gamma(1+\beta)+ h_2(x \cdot g) + \beta h_2(x)\big)$$ -and the snake doing a U-turn is constrained via something like +and the snake doing a U-turn is constrained via $s_{n-1} = s_n$, enforced by the following equation: $$L_{n-1} \cdot (h_1(x) - h_2(x)) = 0$$ -If there's an $h_3$ (because the table is very large, for example), then you'd have something like: +In practice, $s$ will have more sections than just two. +Assume that we have $k$ sections in total, then the denominator generalizes to -$$(\gamma(1+\beta) + h_1(x) + \beta h_1(x \cdot g))(\gamma(1+\beta)+ h_2(x \cdot g) + \beta h_2(x))\color{green}{(\gamma(1+\beta)+ h_3(x) + \beta h_3(x \cdot g))}$$ +$$ +\prod_{i=1}^k \gamma(1+\beta) + h_i(x \cdot g^{\delta_{0,\ i \text{ mod } 2}}) + \beta h_i(x \cdot g^{\delta_{1,\ i \text{ mod } 2}}) +$$ + +where $\delta_{i,j}$ is Kronecker delta, equal to $1$ when $i$ is even (for the first term) or odd (for the second one), and equal to $0$ otherwise. + +Similarly, the U-turn constraints now become -with the added U-turn constraint: +$$ +\begin{align*} +L_{n-1}(X) \cdot (h_2(X) - h_1(X)) &\equiv 0\\ +\color{green}L_{0}(X) \cdot (h_3(X) - h_2(X)) &\color{green}\equiv 0\\ +\color{green}L_{n-1}(X) \cdot (h_4(X) - h_3(X)) &\color{green}\equiv 0\\ +\ldots +\end{align*} +$$ -$$L_{0} \cdot (h_2(x) - h_3(x)) = 0$$ +In our concrete case with $4$ simultaneous lookups the vector $s$ has to be split into $k= 5$ sections --- each denominator term in the accumulator accounts for $4$ queries ($f$) and $1$ table consistency check ($t$). 
## Unsorted $t$ in $s$ diff --git a/kimchi/src/circuits/lookup/constraints.rs b/kimchi/src/circuits/lookup/constraints.rs index 2ba98b08c4..3b5c38b4d4 100644 --- a/kimchi/src/circuits/lookup/constraints.rs +++ b/kimchi/src/circuits/lookup/constraints.rs @@ -255,6 +255,8 @@ where .iter() .enumerate() .map(|(i, s)| { + // Snake pattern: even chunks of s are direct + // while the odd ones are reversed let (i1, i2) = if i % 2 == 0 { (row, row + 1) } else { From f38a2c3b6a9a303998f3c242b35975e687762da9 Mon Sep 17 00:00:00 2001 From: Richard Bonichon Date: Thu, 26 Oct 2023 16:00:30 +0200 Subject: [PATCH 12/32] Cargo: use wasm-bindgen 0.2.87 --- kimchi/Cargo.toml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/kimchi/Cargo.toml b/kimchi/Cargo.toml index d9415dce18..f1c3042598 100644 --- a/kimchi/Cargo.toml +++ b/kimchi/Cargo.toml @@ -50,7 +50,7 @@ mina-poseidon = { path = "../poseidon", version = "0.1.0" } ocaml = { version = "0.22.2", optional = true } ocaml-gen = { version = "0.1.5", optional = true } -wasm-bindgen = { version = "0.2.81", optional = true } +wasm-bindgen = { version = "=0.2.87", optional = true } internal-tracing = { path = "../internal-tracing", version = "0.1.0" } From 81f129634f4730af3dd8d317789ce054e90cf13a Mon Sep 17 00:00:00 2001 From: Mikhail Volkhov Date: Tue, 31 Oct 2023 14:32:26 +0000 Subject: [PATCH 13/32] Initially move sections around [MinaProtocol/mina#14442] --- book/src/SUMMARY.md | 29 +- .../extended-lookup-tables.md | 4 +- book/src/{plonk => kimchi}/final_check.md | 0 .../src/{rfcs => kimchi}/foreign_field_add.md | 0 .../src/{rfcs => kimchi}/foreign_field_mul.md | 0 book/src/kimchi/keccak.md | 166 +++++++++ book/src/kimchi/lookup.md | 319 +++++++++++++++++- book/src/{plonk => kimchi}/maller_15.md | 0 book/src/{plonk => kimchi}/zkpm.md | 0 book/src/rfcs/3-lookup.md | 318 ----------------- book/src/rfcs/keccak.md | 167 +-------- 11 files changed, 499 insertions(+), 504 deletions(-) rename book/src/{rfcs => 
kimchi}/extended-lookup-tables.md (99%) rename book/src/{plonk => kimchi}/final_check.md (100%) rename book/src/{rfcs => kimchi}/foreign_field_add.md (100%) rename book/src/{rfcs => kimchi}/foreign_field_mul.md (100%) create mode 100644 book/src/kimchi/keccak.md rename book/src/{plonk => kimchi}/maller_15.md (100%) rename book/src/{plonk => kimchi}/zkpm.md (100%) delete mode 100644 book/src/rfcs/3-lookup.md diff --git a/book/src/SUMMARY.md b/book/src/SUMMARY.md index 1ae5454019..35b2d36267 100644 --- a/book/src/SUMMARY.md +++ b/book/src/SUMMARY.md @@ -53,10 +53,18 @@ # Kimchi - [Overview](./kimchi/overview.md) - - [Arguments](./kimchi/arguments.md) - - [Custom Gates](./kimchi/gates.md) - - [Permutation](./kimchi/permut.md) - - [Lookup](./kimchi/lookup.md) +- [Arguments](./kimchi/arguments.md) +- [Zero-Column Approach to Zero-Knowledge](./kimchi/zkpm.md) +- [Final Check](./kimchi/final_check.md) +- [Maller's Optimization for Kimchi](./kimchi/maller_15.md) +- [Permutation](./kimchi/permut.md) +- [Lookup Tables](./kimchi/lookup.md) + - [Extended Lookup Tables](./kimchi/extended-lookup-tables.md) +- [Custom Gates](./kimchi/gates.md) + - [Foreign Field Addition](./kimchi/foreign_field_add.md) + - [Foreign Field Multiplication](./kimchi/foreign_field_mul.md) + - [Keccak](./rfcs/keccak.md) + # Pickles & Inductive Proof Systems @@ -65,18 +73,7 @@ - [Deferred Computation](./pickles/deferred.md) - [Passthough & Me-Only](./pickles/passthrough.md) -# RFCs - -- [RFC 0: Alternative Zero-Knowledge](./plonk/zkpm.md) -- [RFC 1: Final Check](./plonk/final_check.md) -- [RFC 2: Maller's Optimization for Kimchi](./plonk/maller_15.md) -- [RFC 3: Plookup Integration in Kimchi](./rfcs/3-lookup.md) -- [RFC 4: Extended Lookup Tables](./rfcs/extended-lookup-tables.md) -- [RFC 5: Foreign Field Addition](./rfcs/foreign_field_add.md) -- [RFC 6: Foreign Field Multiplication](./rfcs/foreign_field_mul.md) -- [RFC 7: Keccak](./rfcs/keccak.md) - -# Specifications +# Technical Specifications - 
[Poseidon hash](./specs/poseidon.md) - [Polynomial Commitment](./specs/poly-commitment.md) diff --git a/book/src/rfcs/extended-lookup-tables.md b/book/src/kimchi/extended-lookup-tables.md similarity index 99% rename from book/src/rfcs/extended-lookup-tables.md rename to book/src/kimchi/extended-lookup-tables.md index ed8d29bf7c..a2205ddebd 100644 --- a/book/src/rfcs/extended-lookup-tables.md +++ b/book/src/kimchi/extended-lookup-tables.md @@ -1,6 +1,6 @@ -# RFC: Extended lookup tables +# Extended lookup tables -This RFC proposes an extension to our use of lookup tables using the PLOOKUP +This (old) RFC proposes an extension to our use of lookup tables using the PLOOKUP multiset inclusion argument, so that values within lookup tables can be chosen after the constraint system for a circuit has been fixed. diff --git a/book/src/plonk/final_check.md b/book/src/kimchi/final_check.md similarity index 100% rename from book/src/plonk/final_check.md rename to book/src/kimchi/final_check.md diff --git a/book/src/rfcs/foreign_field_add.md b/book/src/kimchi/foreign_field_add.md similarity index 100% rename from book/src/rfcs/foreign_field_add.md rename to book/src/kimchi/foreign_field_add.md diff --git a/book/src/rfcs/foreign_field_mul.md b/book/src/kimchi/foreign_field_mul.md similarity index 100% rename from book/src/rfcs/foreign_field_mul.md rename to book/src/kimchi/foreign_field_mul.md diff --git a/book/src/kimchi/keccak.md b/book/src/kimchi/keccak.md new file mode 100644 index 0000000000..457c247b97 --- /dev/null +++ b/book/src/kimchi/keccak.md @@ -0,0 +1,166 @@ +# RFC: Keccak + +The Keccak gadget is comprised of 3 circuit gates (`Xor16`, `Rot64`, and `Zero`) + +Keccak works with 64-bit words. The state is represented using $5\times 5$ matrix +of 64 bit words. Each compression step of Keccak consists of 24 rounds. Let us +denote the state matrix with $A$ (indexing elements as $A[x,y]$), from which we derive +further states as follows in each round. 
Each round then consists of the following 5 steps: + +$$ +\begin{align} +C[x] &= A[x,0] \oplus A[x,1] \oplus A[x,2] \oplus A[x,3] \oplus A[x,4] \\ +D[x] &= C[x-1] \oplus ROT(C[x+1],1) \\ +E[x,y] &= A[x,y] \oplus D[x] \\ +B[y,2x+3y] &= ROT(E[x,y],\rho[x,y]) \\ +F[x,y] &= B[x,y] \oplus ((NOT\ B[x+1,y]) AND\ B[x+2,y]) \\ +Fp[0,0] &= F[0,0] \oplus RC +\end{align} +$$ + +for $0\leq x, y \leq 4$ and $\rho[x,y]$ is the rotation offset defined for Keccak. +The values are in the table below extracted from the Keccak reference + + +| | x = 3 | x = 4 | x = 0 | x = 1 | x = 2 | +| ----- | ----- | ----- | ----- | ----- | ----- | +| y = 2 | 155 | 231 | 3 | 10 | 171 | +| y = 1 | 55 | 276 | 36 | 300 | 6 | +| y = 0 | 28 | 91 | 0 | 1 | 190 | +| y = 4 | 120 | 78 | 210 | 66 | 253 | +| y = 3 | 21 | 136 | 105 | 45 | 15 | + +## Design Approach: + +The atomic operations are XOR, ROT, NOT, AND. In the sections below, we will describe +the gates for these operations. Below are some common approaches followed in their design. + +To fit within 15 wires, we first decompose each word into its lower and upper 32-bit +components. A gate for an atomic operation works with those 32-bit components at a time. + +Before we describe the specific gate design approaches, below are some constraints in the +Kimchi framework that dictated those approaches. +* only 4 lookups per row +* only first 7 columns are available to the permutation polynomial + +## Rot64 + +It is clear from the definition of the rotation gate that its constraints are complete +(meaning that honest instances always satisfy the constraints). It is left to be proven +that the proposal is sound. In this section, we will give a proof that as soon as we +perform the range checks on the excess and shifted parts of the input, only one possible +assignment satisfies the constraints. This means that there is no dishonest instance that +can make the constraints pass. 
We will also give an example where one could find wrong +rotation witnesses that would satisfy the constraints if we did not check the range. + +### Necessity of range checks + +First of all, we will illustrate the necessity of range-checks with a simple example. +For the sake of readability, we will use some toy field lengths. In particular, let us +assume that our words have 4 bits, meaning all of the elements between `0x0` and `0xF`. +Next, we will be using the native field $\mathbb{F}_{32}$. + +As we will later see, this choice of field lengths is not enough to perform any 4-bit +rotation, since the operations in the constraints would overflow the native field. +Nonetheless, it will be sufficient for our example where we will only rotate by 1 bit. + +Assume we want to rotate the word `0b1101` (meaning 13) by 1 bit to the left. This gives +us the rotated word `0b1011` (meaning 11). The excess part of the word is `0b1`, whereas +the shifted part corresponds to `0b1010`. We recall the constraints for the rotation gate: + +$$ +\begin{align*} +word \cdot 2^{rot} &= excess \cdot 2^{len} + shifted \\ +rotated &= excess + shifted +\end{align*} +$$ + +Applied to our example, this results in the following equations: + +$$ +\begin{align*} +13 \cdot 2 &= excess \cdot 16 + shifted \\ +11 &= excess + shifted +\end{align*} +$$ + +We can easily check that the proposed values of the shifted `0b1010=10` and the excess +`0b1=1` values satisfy the above constraint because $26 = 1 \cdot 16 + 10$ and $11 = 1 + 10$. +Now, the question is: _can we find another value for excess and shifted, such that their addition results in an incorrect rotated word?_ + +The answer to this question is yes, due to __diophantine equations__. We basically want to find $x,y$ such that $26 = x \cdot 16 + y (\text{ mod } 32)$. 
The solution to this equation is: + +$$ +\begin{align*} +\forall k \in [0..31]: & \\ +x &= k \\ +y &= 26 - 16 \cdot k +\end{align*} +$$ + +We chose these word and field lengths to better understand the behaviour of the solution. Here, we can see two "classes" of evaluations. + +- If we choose an even $k$, then $y$ will have the following shape: + - $$26 - 16 \cdot (2 \cdot n) \iff 26 - 32n \equiv_{32} 26 $$ + - Meaning, if $x = 2n$ then $y = 26$. + +- If on the other hand, we chose an odd $k$, then $y$ will have the following shape instead: + - $$26 - 16 \cdot (2 \cdot n + 1) \iff 26 - 32n - 16 \equiv_{32} 26 - 16 = 10$$ + - Meaning, if $x = 2n+1$ then $y = 10$. + +Thus, possible solutions to the diophantine equation are: + +$$ +\begin{align*} +x &= 0, 1, 2, 3, 4, 5... \\ +y &= 26, 10, 26, 10, 26, 10... +\end{align*} +$$ + +Note that our valid witness is part of that set of solutions, meaning $x=1$ and $y=10$. Of course, we can also find another dishonest instantiation such as $x=0$ and $y=26$. Perhaps one could think that we do not need to worry about this case, because the resulting rotation word would be $0+26=26$, and if we later use that result as an input to a subsequent gate such as XOR, the value $26$ would not fit and at some point the constraint system would complain. Nonetheless, we still have other solutions to worry about, such as $(x=3, y=10)$ or $(x=5, y=10)$, since they would result in a rotated word that would fit in the word length of 4 bits, yet would be incorrect (not equal to $11$). + +All of the above incorrect solutions differ in one thing: they have different bit lengths. This means that we need to range check the values for the excess and shifted witnesses to make sure they have the correct length. + +### Sufficiency of range checks + +In the following, we will give a proof that performing range checks for these values is not only necessary but also sufficient to prove that the rotation gate is sound. 
In other words, we will prove there are no two possible solutions of the decomposition constraint that have the correct bit lengths. Now, for the sake of robustness, we will consider 64-bit words and fields with at least twice the bit length of the words (as is our case). + +We will proceed by __contradiction__. Suppose there are two different solutions to the following diophantic equation: + +$$ +\begin{align*} +\forall k \in \mathbb{F}_n: & \\ +x &= k \\ +y &= w \cdot 2^r - 2^{64} \cdot k +\end{align*} +$$ + +where $k$ is a parameter to instantiate the solutions, $w$ is the word to be rotated, $r$ is the rotation amount, and $n$ is the field length. + +Then, that means that there are two different solutions, $(0\leq x=a<2^r, 0\leq y=b<2^{64})$ and $(0\leq x=a'<2^r, 0\leq y=b'<2^{64})$ with at least $a \neq a'$ or $b \neq b'$. We will show that this is impossible. + +If both are solutions to the same equation, then: +$$ +\begin{align*} +w \cdot 2^r &= a \cdot 2^{64} + b \\ +w \cdot 2^r &= a'\cdot 2^{64} + b' +\end{align*} +$$ +means that $a \cdot 2^{64} + b = a'\cdot 2^{64} + b'$. Moving terms to the left side, we have an equivalent equality: $2^{64}(a-a') + (b-b')=0 \mod{n}$. There are three cases to consider: + +- $a = a'$ and $b \neq b'$: then $(b - b') \equiv_n 0$ and this can only happen if $b' = b + kn$. But since $n > 2^{64}$, then $b'$ cannot be smaller than $2^{64}$ as it was assumed. CONTRADICTION. + +- $b = b'$ and $a \neq a'$: then $2^{64}(a - a') \equiv_n 0$ and this can only happen if $a' = a + kn$. But since $n > 2^r$, then $a'$ cannot be smaller than $2^r$ as it was assumed. CONTRADICTION. + +- $a\neq a'$ and $b \neq b'$: then we have something like $2^{64} \alpha + \beta \equiv_n 0$. + - This means $\beta \equiv_n -2^{64} \alpha = k \cdot n - 2^{64} \alpha$ for any $k$. + - According to the assumption, both $0\leq a<2^r$ and $0\leq a'<2^r$. 
This means, the difference $\alpha:=(a - a')$ lies anywhere in between the following interval: + - $$1 - 2^r \leq \alpha \leq 2^r - 1$$ + - We plug in this interval to the above equation to obtain the following interval for $\beta$: + - $$k\cdot n - 2^{64}(1-2^r)\leq \beta \leq k\cdot n - 2^{64}(2^r - 1) $$ + - We look at this interval from both sides of the inequality: $\beta \geq kn - 2^{64} + 2^{64+r}$ and $\beta \leq kn + 2^{64} - 2^{64+r}$ and we wonder if $kn - 2^{64} + 2^{64+r} \leq kn + 2^{64} - 2^{64+r}$ is at all possible. We rewrite as follows: + - $$2^{64+r} - 2^{64} \leq 2^{64} - 2^{64+r}$$ + - $$2\cdot2^{64+r} \leq 2\cdot2^{64} $$ + - $$2^{64+r} \leq 2^{64} $$ + - But this can only happen if $r\leq 0$, which is impossible since we assume $0 < r < 64$.CONTRADICTION. +- EOP. diff --git a/book/src/kimchi/lookup.md b/book/src/kimchi/lookup.md index 9989ac5557..a261672716 100644 --- a/book/src/kimchi/lookup.md +++ b/book/src/kimchi/lookup.md @@ -1,3 +1,318 @@ -## Lookup +# Plookup in Kimchi -TO-DO \ No newline at end of file +In 2020, [plookup](https://eprint.iacr.org/2020/315.pdf) showed how to create lookup proofs. Proofs that some witness values are part of a [lookup table](https://en.wikipedia.org/wiki/Lookup_table). Two years later, an independent team published [plonkup](https://eprint.iacr.org/2022/086) showing how to integrate Plookup into Plonk. + +This document specifies how we integrate plookup in kimchi. It assumes that the reader understands the basics behind plookup. 
+ +## Overview + +We integrate plookup in kimchi with the following differences: + +* we snake-ify the sorted table instead of wrapping it around (see later) +* we allow fixed-ahead-of-time linear combinations of columns of the queries we make +* we only use a single table (XOR) at the moment of this writing +* we allow several lookups (or queries) to be performed within the same row +* zero-knowledgeness is added in a specific way (see later) + +The following document explains the protocol in more detail + +### Recap on the grand product argument of plookup + +As per the Plookup paper, the prover will have to compute three vectors: + +* $f$, the (secret) **query vector**, containing the witness values that the prover wants to prove are part of the lookup table. +* $t$, the (public) **lookup table**. +* $s$, the (secret) concatenation of $f$ and $t$, sorted by $t$ (where elements are listed in the order they are listed in $t$). + +Essentially, plookup proves that all the elements in $f$ are indeed in the lookup table $t$ if and only if the following multisets are equal: + +* $\{(1+\beta)f, \text{diff}(t)\}$ +* $\text{diff}(\text{sorted}(f, t))$ + +where $\text{diff}$ is a new set derived by applying a "randomized difference" between every successive pairs of a vector. For example: + +* $f = \{5, 4, 1, 5\}$ +* $t = \{1, 4, 5\}$ +* $\{\color{blue}{(1+\beta)f}, \color{green}{\text{diff}(t)}\} = \{\color{blue}{(1+\beta)5, (1+\beta)4, (1+\beta)1, (1+\beta)5}, \color{green}{1+\beta 4, 4+\beta 5}\}$ +* $\text{diff}(\text{sorted}(f, t)) = \{1+\beta 1, 1+\beta 4, 4+\beta 4, 4+\beta 5, 5+\beta 5, 5+\beta 5\}$ + +> Note: This assumes that the lookup table is a single column. You will see in the next section how to address lookup tables with more than one column. 
+ +The equality between the multisets can be proved with the permutation argument of plonk, which would look like enforcing constraints on the following accumulator: + +* init: $\mathsf{acc}_0 = 1$ +* final: $\mathsf{acc}_n = 1$ +* for every $0 < i \leq n$: + $$ + \mathsf{acc}_i = \mathsf{acc}_{i-1} \cdot \frac{(\gamma + (1+\beta) f_{i-1}) \cdot (\gamma + t_{i-1} + \beta t_i)}{(\gamma + s_{i-1} + \beta s_{i})(\gamma + s_{n+i-1} + \beta s_{n+i})} + $$ + +Note that the plookup paper uses a slightly different equation to make the proof work. It is possible that the proof would work with the above equation, but for simplicity let's just use the equation published in plookup: + +$$ +\mathsf{acc}_i = \mathsf{acc}_{i-1} \cdot \frac{(1+\beta) \cdot (\gamma + f_{i-1}) \cdot (\gamma(1 + \beta) + t_{i-1} + \beta t_i)}{(\gamma(1+\beta) + s_{i-1} + \beta s_{i})(\gamma(1+\beta) + s_{n+i-1} + \beta s_{n+i})} +$$ + +> Note: in plookup $s$ is longer than $n$ ($|s| = |f| + |t|$), and thus it needs to be split into multiple vectors to enforce the constraint at every $i \in [[0;n]]$. This leads to the two terms in the denominator as shown above, so that the degree of $\gamma (1 + \beta)$ is equal in the nominator and denominator. + +### Lookup tables + +Kimchi uses a single **lookup table** at the moment of this writing; the XOR table. The XOR table for values of 1 bit is the following: + + +| l | r | o | +| --- | --- | --- | +| 1 | 0 | 1 | +| 0 | 1 | 1 | +| 1 | 1 | 0 | +| 0 | 0 | 0 | + +Whereas kimchi uses the XOR table for values of $4$ bits, which has $2^{8}$ entries. + +Note: the $(0, 0, 0)$ **entry** is at the very end on purpose (as it will be used as dummy entry for rows of the witness that don't care about lookups). + +### Querying the table + +The plookup paper handles a vector of lookups $f$ which we do not have. So the first step is to create such a table from the witness columns (or registers). 
To do this, we define the following objects: + +* a **query** tells us what registers, in what order, and scaled by how much, are part of a query +* a **query selector** tells us which rows are using the query. It is pretty much the same as a [gate selector](). + +Let's go over the first item in this section. + +For example, the following **query** tells us that we want to check if $r_0 \oplus r_2 = 2\cdot r_1$ + +| l | r | o | +| :---: | :---: | :---: | +| 1, $r_0$ | 1, $r_2$ | 2, $r_1$ | + +The grand product argument for the lookup consraint will look like this at this point: + +$$ +\mathsf{acc}_i = \mathsf{acc}_{i-1} \cdot \frac{(1+\beta) \cdot {\color{green}(\gamma + w_0(g^i) + j \cdot w_2(g^i) + j^2 \cdot 2 \cdot w_1(g^i))} \cdot (\gamma(1 + \beta) + t_{i-1} + \beta t_i)}{(\gamma(1+\beta) + s_{i-1} + \beta s_{i})(\gamma(1+\beta) + s_{n+i-1} + \beta s_{n+i})} +$$ + +Not all rows need to perform queries into a lookup table. We will use a query selector in the next section to make the constraints work with this in mind. + +### Query selector + +The associated **query selector** tells us on which rows the query into the XOR lookup table occurs. + +| row | query selector | +| :---: | :------------: | +| 0 | 1 | +| 1 | 0 | + + +Both the (XOR) lookup table and the query are built-ins in kimchi. The query selector is derived from the circuit at setup time. Currently only the ChaCha gates make use of the lookups. + +With the selectors, the grand product argument for the lookup constraint has the following form: + +$$ +\mathsf{acc}_i = \mathsf{acc}_{i-1} \cdot \frac{(1+\beta) \cdot {\color{green}\mathsf{query}} \cdot (\gamma(1 + \beta) + t_{i-1} + \beta t_i)}{(\gamma(1+\beta) + s_{i-1} + \beta s_{i})} +$$ + +where $\color{green}{\mathsf{query}}$ is constructed so that a dummy query ($0 \oplus 0 = 0$) is used on rows that don't have a query. 
+ +$$ +\begin{align} +\mathsf{query} := &\ \mathsf{selector} \cdot (\gamma + w_0(g^i) + j \cdot w_2(g^i) + j^2 \cdot 2 \cdot w_1(g^i)) + \\ +&\ (1- \mathsf{selector}) \cdot (\gamma + 0 + j \cdot 0 + j^2 \cdot 0) +\end{align} +$$ + +### Supporting multiple queries + +Since we would like to allow multiple table lookups per row, we define multiple **queries**, where each query is associated with a **lookup selector**. + +At the moment of this writing, the `ChaCha` gates all perform $4$ queries in a row. Thus, $4$ is trivially the largest number of queries that happen in a row. + +**Important**: to make constraints work, this means that each row must make $4$ queries. Potentially some or all of them are dummy queries. + +For example, the `ChaCha0`, `ChaCha1`, and `ChaCha2` gates will jointly apply the following 4 XOR queries on the current and following rows: + +| l | r | o | - | l | r | o | - | l | r | o | - | l | r | o | +| :---: | :---: | :----: | --- | :---: | :---: | :----: | --- | :---: | :---: | :----: | --- | :---: | :----: | :----: | +| 1, $r_3$ | 1, $r_7$ | 1, $r_{11}$ | - | 1, $r_4$ | 1, $r_8$ | 1, $r_{12}$ | - | 1, $r_5$ | 1, $r_9$ | 1, $r_{13}$ | - | 1, $r_6$ | 1, $r_{10}$ | 1, $r_{14}$ | + +which you can understand as checking for the current and following row that + +$$ +\begin{align} +r_3 \oplus r_7 &= r_{11}\\ +r_4 \oplus r_8 &= r_{12}\\ +r_5 \oplus r_9 &= r_{13}\\ +r_6 \oplus r_{10} &= r_{14} +\end{align} +$$ + +The `ChaChaFinal` also performs $4$ (somewhat similar) queries in the XOR lookup table. In total this is $8$ different queries that could be associated to $8$ selector polynomials. + +### Grouping queries by queries pattern + +Associating each query with a selector polynomial is not necessarily efficient. 
To summarize: + +* the `ChaCha0`, `ChaCha1`, and `ChaCha2` gates that in total make $4$ queries into the XOR table +* the `ChaChaFinal` gate makes another $4$ different queries into the XOR table + +Using the previous section's method, we'd have to use $8$ different lookup selector polynomials for each of the different $8$ queries. Since there's only $2$ use-cases, we can simply group them by **queries patterns** to reduce the number of lookup selector polynomials to $2$. + +The grand product argument for the lookup constraint looks like this now: + +$$ +\mathsf{acc}_i = \mathsf{acc}_{i-1} \cdot \frac{{\color{green}(1+\beta)^4 \cdot \mathsf{query}} \cdot (\gamma(1 + \beta) + t_{i-1} + \beta t_i)}{(\gamma(1+\beta) + s_{i-1} + \beta s_{i})\times \ldots} +$$ + +where $\color{green}{\mathsf{query}}$ is constructed as: + +$$ +\begin{align} +\mathsf{query} = &\ \mathsf{selector}_1 \cdot \mathsf{pattern}_1 + \\ +&\ \mathsf{selector}_2 \cdot \mathsf{pattern}_2 + \\ +&\ (1 - \mathsf{selector}_1 - \mathsf{selector}_2) \cdot (\gamma + 0 + j \cdot 0 + j^2 \cdot 0)^4 +\end{align} +$$ + +where, for example the first pattern for the `ChaCha0`, `ChaCha1`, and `ChaCha2` gates looks like this: + +$$ +\begin{align} +\mathsf{pattern}_1 = &\ (\gamma + w_3(g^i) + j \cdot w_7(g^i) + j^2 \cdot w_{11}(g^i)) \cdot \\ +&\ (\gamma + w_4(g^i) + j \cdot w_8(g^i) + j^2 \cdot w_{12}(g^i)) \cdot \\ +&\ (\gamma + w_5(g^i) + j \cdot w_9(g^i) + j^2 \cdot w_{13}(g^i)) \cdot \\ +&\ (\gamma + w_6(g^i) + j \cdot w_{10}(g^i) + j^2 \cdot w_{14}(g^i)) \cdot \\ +\end{align} +$$ + +Note that there's now $4$ dummy queries, and they only appear when none of the lookup selectors are active. +If a pattern uses less than $4$ queries, it has to be padded with dummy queries as well. + +Finally, note that the denominator of the grand product argument is incomplete in the formula above. +Since the nominator has degree $5$ in $\gamma (1 + \beta)$, the denominator must match too. 
+This is achieved by having a longer $s$, and referring to it $5$ times. +The denominator thus becomes $\prod_{k=1}^{5} (\gamma (1+\beta) + s_{kn+i-1} + \beta s_{kn+i})$. + +## Back to the grand product argument + +There are two things that we haven't touched on: + +* The vector $t$ representing the **combined lookup table** (after its columns have been combined with a joint combiner $j$). The **non-combined loookup table** is fixed at setup time and derived based on the lookup tables used in the circuit (for now only one, the XOR lookup table, can be used in the circuit). +* The vector $s$ representing the sorted multiset of both the queries and the lookup table. This is created by the prover and sent as commitment to the verifier. + +The first vector $t$ is quite straightforward to think about: + +* if it is smaller than the domain (of size $n$), then we can repeat the last entry enough times to make the table of size $n$. +* if it is larger than the domain, then we can either increase the domain or split the vector in two (or more) vectors. This is most likely what we will have to do to support multiple lookup tables later. + +What about the second vector $s$? + +## The sorted vector $s$ + +We said earlier that in original plonk the size of $s$ is equal to $|s| = |f|+|t|$, where $f$ encodes queries, and $t$ encodes the lookup table. +With our multi-query approach, the second vector $s$ is of the size + +$$n \cdot |\#\text{queries}| + |\text{lookup\_table}|$$ + +That is, it contains the $n$ elements of each **query vectors** (the actual values being looked up, after being combined with the joint combinator, that's $4$ per row), as well as the elements of our lookup table (after being combined as well). + +Because the vector $s$ is larger than the domain size $n$, it is split into several vectors of size $n$. Specifically, in the plonkup paper, the two halves of $s$, which are then interpolated as $h_1$ and $h_2$. 
+The denominator in plonk in the vector form is +$$ +\big(\gamma(1+\beta) + s_{i-1} + \beta s_{i}\big)\big(\gamma(1+\beta)+s_{n+i-1} + \beta s_{n+i}\big) +$$ +which, when interpolated into $h_1$ and $h_2$, becomes +$$ +\big(\gamma(1+\beta) + h_1(x) + \beta h_1(g \cdot x)\big)\big(\gamma(1+\beta) + h_2(x) + \beta h_2(g \cdot x)\big) +$$ + +Since one has to compute the difference of every contiguous pairs, the last element of the first half is the replicated as the first element of the second half ($s_{n-1} = s_{n}$). +Hence, a separate constraint must be added to enforce that continuity on the interpolated polynomials $h_1$ and $h_2$: + +$$L_{n-1}(X)\cdot\big(h_1(X) - h_2(g \cdot X)\big) \equiv 0$$ + +which is equivalent to checking that $h_1(g^{n-1}) = h_2(1)$. + +## The sorted vector $s$ in kimchi + +Since this vector is known only by the prover, and is evaluated as part of the protocol, zero-knowledge must be added to the corresponding polynomial (in case of plookup approach, to $h_1(X),h_2(X)$). To do this in kimchi, we use the same technique as with the other prover polynomials: we randomize the last evaluations (or rows, on the domain) of the polynomial. + +This means two things for the lookup grand product argument: + +1. We cannot use the wrap around trick to make sure that the list is split in two correctly (enforced by $L_{n-1}(h_1(x) - h_2(g \cdot x)) = 0$ which is equivalent to $h_1(g^{n-1}) = h_2(1)$ in the plookup paper) +2. We have even less space to store an entire query vector. Which is actually super correct, as the witness also has some zero-knowledge rows at the end that should not be part of the queries anyway. + +The first problem can be solved in two ways: + +* **Zig-zag technique**. By reorganizing $s$ to alternate its values between the columns. 
For example, $h_1 = (s_0, s_2, s_4, \cdots)$ and $h_2 = (s_1, s_3, s_5, \cdots)$ so that you can simply write the denominator of the grand product argument as + $$(\gamma(1+\beta) + h_1(x) + \beta h_2(x))(\gamma(1+\beta)+ h_2(x) + \beta h_1(x \cdot g))$$ + Whis approach is taken by the [plonkup](https://eprint.iacr.org/2022/086) paper. +* **Snake technique**. By reorganizing $s$ as a snake. This is what is currently implemented in kimchi. + +The snake technique rearranges $s$ into the following shape: + +``` + __ _ + s_0 | s_{2n-1} | | | | + ... | ... | | | | + s_{n-1} | s_n | | | | + ‾‾‾‾‾‾‾‾‾‾‾ ‾‾ ‾ + h1 h2 h3 ... +``` + +Assuming that for now we have only one bend and two polynomials $h_1(X),h_2(X)$, the denominator has the following form: + +$$\big(\gamma(1+\beta) + h_1(x) + \beta h_1(x \cdot g)\big)\big(\gamma(1+\beta)+ h_2(x \cdot g) + \beta h_2(x)\big)$$ + +and the snake doing a U-turn is constrained via $s_{n-1} = s_n$, enforced by the following equation: + +$$L_{n-1} \cdot (h_1(x) - h_2(x)) = 0$$ + +In practice, $s$ will have more sections than just two. +Assume that we have $k$ sections in total, then the denominator generalizes to + +$$ +\prod_{i=1}^k \gamma(1+\beta) + h_i(x \cdot g^{\delta_{0,\ i \text{ mod } 2}}) + \beta h_i(x \cdot g^{\delta_{1,\ i \text{ mod } 2}}) +$$ + +where $\delta_{i,j}$ is Kronecker delta, equal to $1$ when $i$ is even (for the first term) or odd (for the second one), and equal to $0$ otherwise. + +Similarly, the U-turn constraints now become + +$$ +\begin{align*} +L_{n-1}(X) \cdot (h_2(X) - h_1(X)) &\equiv 0\\ +\color{green}L_{0}(X) \cdot (h_3(X) - h_2(X)) &\color{green}\equiv 0\\ +\color{green}L_{n-1}(X) \cdot (h_4(X) - h_3(X)) &\color{green}\equiv 0\\ +\ldots +\end{align*} +$$ + +In our concrete case with $4$ simultaneous lookups the vector $s$ has to be split into $k= 5$ sections --- each denominator term in the accumulator accounts for $4$ queries ($f$) and $1$ table consistency check ($t$). 
+ +## Unsorted $t$ in $s$ + +Note that at setup time, $t$ cannot be sorted lexicographically as it is not combined yet. Since $s$ must be sorted by $t$ (in other words sorting of $s$ must follow the elements of $t$), there are two solutions: + +1. Both the prover and the verifier can sort the combined $t$ lexicographically, so that $s$ can be sorted lexicographically too using typical sorting algorithms +2. The prover can directly sort $s$ by $t$, so that the verifier doesn't have to do any pre-sorting and can just rely on the commitment of the columns of $t$ (which the prover can evaluate in the protocol). + +We take the second approach. +However, this must be done carefully since the combined $t$ entries can repeat. For some $i, l$ such that $i \neq l$, we might have + +$$ +t_0[i] + j \cdot t_1[i] + j^2 \cdot t_2[i] = t_0[l] + j \cdot t_1[l] + j^2 \cdot t_2[l] +$$ + +For example, if $f = \{1, 2, 2, 3\}$ and $t = \{2, 1, 2, 3\}$, then $\text{sorted}(f, t) = \{2, 2, 2, 1, 1, 2, 3, 3\}$ would be a way of correctly sorting the combined vector $s$. At the same time $\text{sorted}(f, t) = \{ 2, 2, 2, 2, 1, 1, 3, 3 \}$ is incorrect since it does not have a second block of $2$s, and thus such an $s$ is not sorted by $t$. + + +## Recap + +So to recap, to create the sorted polynomials $h_i$, the prover: + +1. creates a large query vector which contains the concatenation of the $4$ per-row (combined with the joint combinator) queries (that might contain dummy queries) for all rows +2. creates the (combined with the joint combinator) table vector +3. sorts all of that into a big vector $s$ +4. divides that vector $s$ into as many $h_i$ vectors as a necessary following the snake method +5. interpolate these $h_i$ vectors into $h_i$ polynomials +6. commit to them, and evaluate them as part of the protocol. 
diff --git a/book/src/plonk/maller_15.md b/book/src/kimchi/maller_15.md similarity index 100% rename from book/src/plonk/maller_15.md rename to book/src/kimchi/maller_15.md diff --git a/book/src/plonk/zkpm.md b/book/src/kimchi/zkpm.md similarity index 100% rename from book/src/plonk/zkpm.md rename to book/src/kimchi/zkpm.md diff --git a/book/src/rfcs/3-lookup.md b/book/src/rfcs/3-lookup.md deleted file mode 100644 index 32dc9d39b8..0000000000 --- a/book/src/rfcs/3-lookup.md +++ /dev/null @@ -1,318 +0,0 @@ -# RFC: Plookup in Kimchi - -In 2020, [plookup](https://eprint.iacr.org/2020/315.pdf) showed how to create lookup proofs. Proofs that some witness values are part of a [lookup table](https://en.wikipedia.org/wiki/Lookup_table). Two years later, an independent team published [plonkup](https://eprint.iacr.org/2022/086) showing how to integrate Plookup into Plonk. - -This document specifies how we integrate plookup in kimchi. It assumes that the reader understands the basics behind plookup. - -## Overview - -We integrate plookup in kimchi with the following differences: - -* we snake-ify the sorted table instead of wrapping it around (see later) -* we allow fixed-ahead-of-time linear combinations of columns of the queries we make -* we only use a single table (XOR) at the moment of this writing -* we allow several lookups (or queries) to be performed within the same row -* zero-knowledgeness is added in a specific way (see later) - -The following document explains the protocol in more detail - -### Recap on the grand product argument of plookup - -As per the Plookup paper, the prover will have to compute three vectors: - -* $f$, the (secret) **query vector**, containing the witness values that the prover wants to prove are part of the lookup table. -* $t$, the (public) **lookup table**. -* $s$, the (secret) concatenation of $f$ and $t$, sorted by $t$ (where elements are listed in the order they are listed in $t$). 
- -Essentially, plookup proves that all the elements in $f$ are indeed in the lookup table $t$ if and only if the following multisets are equal: - -* $\{(1+\beta)f, \text{diff}(t)\}$ -* $\text{diff}(\text{sorted}(f, t))$ - -where $\text{diff}$ is a new set derived by applying a "randomized difference" between every successive pairs of a vector. For example: - -* $f = \{5, 4, 1, 5\}$ -* $t = \{1, 4, 5\}$ -* $\{\color{blue}{(1+\beta)f}, \color{green}{\text{diff}(t)}\} = \{\color{blue}{(1+\beta)5, (1+\beta)4, (1+\beta)1, (1+\beta)5}, \color{green}{1+\beta 4, 4+\beta 5}\}$ -* $\text{diff}(\text{sorted}(f, t)) = \{1+\beta 1, 1+\beta 4, 4+\beta 4, 4+\beta 5, 5+\beta 5, 5+\beta 5\}$ - -> Note: This assumes that the lookup table is a single column. You will see in the next section how to address lookup tables with more than one column. - -The equality between the multisets can be proved with the permutation argument of plonk, which would look like enforcing constraints on the following accumulator: - -* init: $\mathsf{acc}_0 = 1$ -* final: $\mathsf{acc}_n = 1$ -* for every $0 < i \leq n$: - $$ - \mathsf{acc}_i = \mathsf{acc}_{i-1} \cdot \frac{(\gamma + (1+\beta) f_{i-1}) \cdot (\gamma + t_{i-1} + \beta t_i)}{(\gamma + s_{i-1} + \beta s_{i})(\gamma + s_{n+i-1} + \beta s_{n+i})} - $$ - -Note that the plookup paper uses a slightly different equation to make the proof work. It is possible that the proof would work with the above equation, but for simplicity let's just use the equation published in plookup: - -$$ -\mathsf{acc}_i = \mathsf{acc}_{i-1} \cdot \frac{(1+\beta) \cdot (\gamma + f_{i-1}) \cdot (\gamma(1 + \beta) + t_{i-1} + \beta t_i)}{(\gamma(1+\beta) + s_{i-1} + \beta s_{i})(\gamma(1+\beta) + s_{n+i-1} + \beta s_{n+i})} -$$ - -> Note: in plookup $s$ is longer than $n$ ($|s| = |f| + |t|$), and thus it needs to be split into multiple vectors to enforce the constraint at every $i \in [[0;n]]$. 
This leads to the two terms in the denominator as shown above, so that the degree of $\gamma (1 + \beta)$ is equal in the nominator and denominator. - -### Lookup tables - -Kimchi uses a single **lookup table** at the moment of this writing; the XOR table. The XOR table for values of 1 bit is the following: - - -| l | r | o | -| --- | --- | --- | -| 1 | 0 | 1 | -| 0 | 1 | 1 | -| 1 | 1 | 0 | -| 0 | 0 | 0 | - -Whereas kimchi uses the XOR table for values of $4$ bits, which has $2^{8}$ entries. - -Note: the $(0, 0, 0)$ **entry** is at the very end on purpose (as it will be used as dummy entry for rows of the witness that don't care about lookups). - -### Querying the table - -The plookup paper handles a vector of lookups $f$ which we do not have. So the first step is to create such a table from the witness columns (or registers). To do this, we define the following objects: - -* a **query** tells us what registers, in what order, and scaled by how much, are part of a query -* a **query selector** tells us which rows are using the query. It is pretty much the same as a [gate selector](). - -Let's go over the first item in this section. - -For example, the following **query** tells us that we want to check if $r_0 \oplus r_2 = 2\cdot r_1$ - -| l | r | o | -| :---: | :---: | :---: | -| 1, $r_0$ | 1, $r_2$ | 2, $r_1$ | - -The grand product argument for the lookup consraint will look like this at this point: - -$$ -\mathsf{acc}_i = \mathsf{acc}_{i-1} \cdot \frac{(1+\beta) \cdot {\color{green}(\gamma + w_0(g^i) + j \cdot w_2(g^i) + j^2 \cdot 2 \cdot w_1(g^i))} \cdot (\gamma(1 + \beta) + t_{i-1} + \beta t_i)}{(\gamma(1+\beta) + s_{i-1} + \beta s_{i})(\gamma(1+\beta) + s_{n+i-1} + \beta s_{n+i})} -$$ - -Not all rows need to perform queries into a lookup table. We will use a query selector in the next section to make the constraints work with this in mind. 
- -### Query selector - -The associated **query selector** tells us on which rows the query into the XOR lookup table occurs. - -| row | query selector | -| :---: | :------------: | -| 0 | 1 | -| 1 | 0 | - - -Both the (XOR) lookup table and the query are built-ins in kimchi. The query selector is derived from the circuit at setup time. Currently only the ChaCha gates make use of the lookups. - -With the selectors, the grand product argument for the lookup constraint has the following form: - -$$ -\mathsf{acc}_i = \mathsf{acc}_{i-1} \cdot \frac{(1+\beta) \cdot {\color{green}\mathsf{query}} \cdot (\gamma(1 + \beta) + t_{i-1} + \beta t_i)}{(\gamma(1+\beta) + s_{i-1} + \beta s_{i})} -$$ - -where $\color{green}{\mathsf{query}}$ is constructed so that a dummy query ($0 \oplus 0 = 0$) is used on rows that don't have a query. - -$$ -\begin{align} -\mathsf{query} := &\ \mathsf{selector} \cdot (\gamma + w_0(g^i) + j \cdot w_2(g^i) + j^2 \cdot 2 \cdot w_1(g^i)) + \\ -&\ (1- \mathsf{selector}) \cdot (\gamma + 0 + j \cdot 0 + j^2 \cdot 0) -\end{align} -$$ - -### Supporting multiple queries - -Since we would like to allow multiple table lookups per row, we define multiple **queries**, where each query is associated with a **lookup selector**. - -At the moment of this writing, the `ChaCha` gates all perform $4$ queries in a row. Thus, $4$ is trivially the largest number of queries that happen in a row. - -**Important**: to make constraints work, this means that each row must make $4$ queries. Potentially some or all of them are dummy queries. 
- -For example, the `ChaCha0`, `ChaCha1`, and `ChaCha2` gates will jointly apply the following 4 XOR queries on the current and following rows: - -| l | r | o | - | l | r | o | - | l | r | o | - | l | r | o | -| :---: | :---: | :----: | --- | :---: | :---: | :----: | --- | :---: | :---: | :----: | --- | :---: | :----: | :----: | -| 1, $r_3$ | 1, $r_7$ | 1, $r_{11}$ | - | 1, $r_4$ | 1, $r_8$ | 1, $r_{12}$ | - | 1, $r_5$ | 1, $r_9$ | 1, $r_{13}$ | - | 1, $r_6$ | 1, $r_{10}$ | 1, $r_{14}$ | - -which you can understand as checking for the current and following row that - -$$ -\begin{align} -r_3 \oplus r_7 &= r_{11}\\ -r_4 \oplus r_8 &= r_{12}\\ -r_5 \oplus r_9 &= r_{13}\\ -r_6 \oplus r_{10} &= r_{14} -\end{align} -$$ - -The `ChaChaFinal` also performs $4$ (somewhat similar) queries in the XOR lookup table. In total this is $8$ different queries that could be associated to $8$ selector polynomials. - -### Grouping queries by queries pattern - -Associating each query with a selector polynomial is not necessarily efficient. To summarize: - -* the `ChaCha0`, `ChaCha1`, and `ChaCha2` gates that in total make $4$ queries into the XOR table -* the `ChaChaFinal` gate makes another $4$ different queries into the XOR table - -Using the previous section's method, we'd have to use $8$ different lookup selector polynomials for each of the different $8$ queries. Since there's only $2$ use-cases, we can simply group them by **queries patterns** to reduce the number of lookup selector polynomials to $2$. 
- -The grand product argument for the lookup constraint looks like this now: - -$$ -\mathsf{acc}_i = \mathsf{acc}_{i-1} \cdot \frac{{\color{green}(1+\beta)^4 \cdot \mathsf{query}} \cdot (\gamma(1 + \beta) + t_{i-1} + \beta t_i)}{(\gamma(1+\beta) + s_{i-1} + \beta s_{i})\times \ldots} -$$ - -where $\color{green}{\mathsf{query}}$ is constructed as: - -$$ -\begin{align} -\mathsf{query} = &\ \mathsf{selector}_1 \cdot \mathsf{pattern}_1 + \\ -&\ \mathsf{selector}_2 \cdot \mathsf{pattern}_2 + \\ -&\ (1 - \mathsf{selector}_1 - \mathsf{selector}_2) \cdot (\gamma + 0 + j \cdot 0 + j^2 \cdot 0)^4 -\end{align} -$$ - -where, for example the first pattern for the `ChaCha0`, `ChaCha1`, and `ChaCha2` gates looks like this: - -$$ -\begin{align} -\mathsf{pattern}_1 = &\ (\gamma + w_3(g^i) + j \cdot w_7(g^i) + j^2 \cdot w_{11}(g^i)) \cdot \\ -&\ (\gamma + w_4(g^i) + j \cdot w_8(g^i) + j^2 \cdot w_{12}(g^i)) \cdot \\ -&\ (\gamma + w_5(g^i) + j \cdot w_9(g^i) + j^2 \cdot w_{13}(g^i)) \cdot \\ -&\ (\gamma + w_6(g^i) + j \cdot w_{10}(g^i) + j^2 \cdot w_{14}(g^i)) \cdot \\ -\end{align} -$$ - -Note that there's now $4$ dummy queries, and they only appear when none of the lookup selectors are active. -If a pattern uses less than $4$ queries, it has to be padded with dummy queries as well. - -Finally, note that the denominator of the grand product argument is incomplete in the formula above. -Since the nominator has degree $5$ in $\gamma (1 + \beta)$, the denominator must match too. -This is achieved by having a longer $s$, and referring to it $5$ times. -The denominator thus becomes $\prod_{k=1}^{5} (\gamma (1+\beta) + s_{kn+i-1} + \beta s_{kn+i})$. - -## Back to the grand product argument - -There are two things that we haven't touched on: - -* The vector $t$ representing the **combined lookup table** (after its columns have been combined with a joint combiner $j$). 
The **non-combined loookup table** is fixed at setup time and derived based on the lookup tables used in the circuit (for now only one, the XOR lookup table, can be used in the circuit). -* The vector $s$ representing the sorted multiset of both the queries and the lookup table. This is created by the prover and sent as commitment to the verifier. - -The first vector $t$ is quite straightforward to think about: - -* if it is smaller than the domain (of size $n$), then we can repeat the last entry enough times to make the table of size $n$. -* if it is larger than the domain, then we can either increase the domain or split the vector in two (or more) vectors. This is most likely what we will have to do to support multiple lookup tables later. - -What about the second vector $s$? - -## The sorted vector $s$ - -We said earlier that in original plonk the size of $s$ is equal to $|s| = |f|+|t|$, where $f$ encodes queries, and $t$ encodes the lookup table. -With our multi-query approach, the second vector $s$ is of the size - -$$n \cdot |\#\text{queries}| + |\text{lookup\_table}|$$ - -That is, it contains the $n$ elements of each **query vectors** (the actual values being looked up, after being combined with the joint combinator, that's $4$ per row), as well as the elements of our lookup table (after being combined as well). - -Because the vector $s$ is larger than the domain size $n$, it is split into several vectors of size $n$. Specifically, in the plonkup paper, the two halves of $s$, which are then interpolated as $h_1$ and $h_2$. 
-The denominator in plonk in the vector form is -$$ -\big(\gamma(1+\beta) + s_{i-1} + \beta s_{i}\big)\big(\gamma(1+\beta)+s_{n+i-1} + \beta s_{n+i}\big) -$$ -which, when interpolated into $h_1$ and $h_2$, becomes -$$ -\big(\gamma(1+\beta) + h_1(x) + \beta h_1(g \cdot x)\big)\big(\gamma(1+\beta) + h_2(x) + \beta h_2(g \cdot x)\big) -$$ - -Since one has to compute the difference of every contiguous pairs, the last element of the first half is the replicated as the first element of the second half ($s_{n-1} = s_{n}$). -Hence, a separate constraint must be added to enforce that continuity on the interpolated polynomials $h_1$ and $h_2$: - -$$L_{n-1}(X)\cdot\big(h_1(X) - h_2(g \cdot X)\big) \equiv 0$$ - -which is equivalent to checking that $h_1(g^{n-1}) = h_2(1)$. - -## The sorted vector $s$ in kimchi - -Since this vector is known only by the prover, and is evaluated as part of the protocol, zero-knowledge must be added to the corresponding polynomial (in case of plookup approach, to $h_1(X),h_2(X)$). To do this in kimchi, we use the same technique as with the other prover polynomials: we randomize the last evaluations (or rows, on the domain) of the polynomial. - -This means two things for the lookup grand product argument: - -1. We cannot use the wrap around trick to make sure that the list is split in two correctly (enforced by $L_{n-1}(h_1(x) - h_2(g \cdot x)) = 0$ which is equivalent to $h_1(g^{n-1}) = h_2(1)$ in the plookup paper) -2. We have even less space to store an entire query vector. Which is actually super correct, as the witness also has some zero-knowledge rows at the end that should not be part of the queries anyway. - -The first problem can be solved in two ways: - -* **Zig-zag technique**. By reorganizing $s$ to alternate its values between the columns. 
For example, $h_1 = (s_0, s_2, s_4, \cdots)$ and $h_2 = (s_1, s_3, s_5, \cdots)$ so that you can simply write the denominator of the grand product argument as - $$(\gamma(1+\beta) + h_1(x) + \beta h_2(x))(\gamma(1+\beta)+ h_2(x) + \beta h_1(x \cdot g))$$ - Whis approach is taken by the [plonkup](https://eprint.iacr.org/2022/086) paper. -* **Snake technique**. By reorganizing $s$ as a snake. This is what is currently implemented in kimchi. - -The snake technique rearranges $s$ into the following shape: - -``` - __ _ - s_0 | s_{2n-1} | | | | - ... | ... | | | | - s_{n-1} | s_n | | | | - ‾‾‾‾‾‾‾‾‾‾‾ ‾‾ ‾ - h1 h2 h3 ... -``` - -Assuming that for now we have only one bend and two polynomials $h_1(X),h_2(X)$, the denominator has the following form: - -$$\big(\gamma(1+\beta) + h_1(x) + \beta h_1(x \cdot g)\big)\big(\gamma(1+\beta)+ h_2(x \cdot g) + \beta h_2(x)\big)$$ - -and the snake doing a U-turn is constrained via $s_{n-1} = s_n$, enforced by the following equation: - -$$L_{n-1} \cdot (h_1(x) - h_2(x)) = 0$$ - -In practice, $s$ will have more sections than just two. -Assume that we have $k$ sections in total, then the denominator generalizes to - -$$ -\prod_{i=1}^k \gamma(1+\beta) + h_i(x \cdot g^{\delta_{0,\ i \text{ mod } 2}}) + \beta h_i(x \cdot g^{\delta_{1,\ i \text{ mod } 2}}) -$$ - -where $\delta_{i,j}$ is Kronecker delta, equal to $1$ when $i$ is even (for the first term) or odd (for the second one), and equal to $0$ otherwise. - -Similarly, the U-turn constraints now become - -$$ -\begin{align*} -L_{n-1}(X) \cdot (h_2(X) - h_1(X)) &\equiv 0\\ -\color{green}L_{0}(X) \cdot (h_3(X) - h_2(X)) &\color{green}\equiv 0\\ -\color{green}L_{n-1}(X) \cdot (h_4(X) - h_3(X)) &\color{green}\equiv 0\\ -\ldots -\end{align*} -$$ - -In our concrete case with $4$ simultaneous lookups the vector $s$ has to be split into $k= 5$ sections --- each denominator term in the accumulator accounts for $4$ queries ($f$) and $1$ table consistency check ($t$). 
- -## Unsorted $t$ in $s$ - -Note that at setup time, $t$ cannot be sorted lexicographically as it is not combined yet. Since $s$ must be sorted by $t$ (in other words sorting of $s$ must follow the elements of $t$), there are two solutions: - -1. Both the prover and the verifier can sort the combined $t$ lexicographically, so that $s$ can be sorted lexicographically too using typical sorting algorithms -2. The prover can directly sort $s$ by $t$, so that the verifier doesn't have to do any pre-sorting and can just rely on the commitment of the columns of $t$ (which the prover can evaluate in the protocol). - -We take the second approach. -However, this must be done carefully since the combined $t$ entries can repeat. For some $i, l$ such that $i \neq l$, we might have - -$$ -t_0[i] + j \cdot t_1[i] + j^2 \cdot t_2[i] = t_0[l] + j \cdot t_1[l] + j^2 \cdot t_2[l] -$$ - -For example, if $f = \{1, 2, 2, 3\}$ and $t = \{2, 1, 2, 3\}$, then $\text{sorted}(f, t) = \{2, 2, 2, 1, 1, 2, 3, 3\}$ would be a way of correctly sorting the combined vector $s$. At the same time $\text{sorted}(f, t) = \{ 2, 2, 2, 2, 1, 1, 3, 3 \}$ is incorrect since it does not have a second block of $2$s, and thus such an $s$ is not sorted by $t$. - - -## Recap - -So to recap, to create the sorted polynomials $h_i$, the prover: - -1. creates a large query vector which contains the concatenation of the $4$ per-row (combined with the joint combinator) queries (that might contain dummy queries) for all rows -2. creates the (combined with the joint combinator) table vector -3. sorts all of that into a big vector $s$ -4. divides that vector $s$ into as many $h_i$ vectors as a necessary following the snake method -5. interpolate these $h_i$ vectors into $h_i$ polynomials -6. commit to them, and evaluate them as part of the protocol. 
diff --git a/book/src/rfcs/keccak.md b/book/src/rfcs/keccak.md index 457c247b97..03174df193 100644 --- a/book/src/rfcs/keccak.md +++ b/book/src/rfcs/keccak.md @@ -1,166 +1 @@ -# RFC: Keccak - -The Keccak gadget is comprised of 3 circuit gates (`Xor16`, `Rot64`, and `Zero`) - -Keccak works with 64-bit words. The state is represented using $5\times 5$ matrix -of 64 bit words. Each compression step of Keccak consists of 24 rounds. Let us -denote the state matrix with $A$ (indexing elements as $A[x,y]$), from which we derive -further states as follows in each round. Each round then consists of the following 5 steps: - -$$ -\begin{align} -C[x] &= A[x,0] \oplus A[x,1] \oplus A[x,2] \oplus A[x,3] \oplus A[x,4] \\ -D[x] &= C[x-1] \oplus ROT(C[x+1],1) \\ -E[x,y] &= A[x,y] \oplus D[x] \\ -B[y,2x+3y] &= ROT(E[x,y],\rho[x,y]) \\ -F[x,y] &= B[x,y] \oplus ((NOT\ B[x+1,y]) AND\ B[x+2,y]) \\ -Fp[0,0] &= F[0,0] \oplus RC -\end{align} -$$ - -for $0\leq x, y \leq 4$ and $\rho[x,y]$ is the rotation offset defined for Keccak. -The values are in the table below extracted from the Keccak reference - - -| | x = 3 | x = 4 | x = 0 | x = 1 | x = 2 | -| ----- | ----- | ----- | ----- | ----- | ----- | -| y = 2 | 155 | 231 | 3 | 10 | 171 | -| y = 1 | 55 | 276 | 36 | 300 | 6 | -| y = 0 | 28 | 91 | 0 | 1 | 190 | -| y = 4 | 120 | 78 | 210 | 66 | 253 | -| y = 3 | 21 | 136 | 105 | 45 | 15 | - -## Design Approach: - -The atomic operations are XOR, ROT, NOT, AND. In the sections below, we will describe -the gates for these operations. Below are some common approaches followed in their design. - -To fit within 15 wires, we first decompose each word into its lower and upper 32-bit -components. A gate for an atomic operation works with those 32-bit components at a time. - -Before we describe the specific gate design approaches, below are some constraints in the -Kimchi framework that dictated those approaches. 
-* only 4 lookups per row -* only first 7 columns are available to the permutation polynomial - -## Rot64 - -It is clear from the definition of the rotation gate that its constraints are complete -(meaning that honest instances always satisfy the constraints). It is left to be proven -that the proposal is sound. In this section, we will give a proof that as soon as we -perform the range checks on the excess and shifted parts of the input, only one possible -assignment satisfies the constraints. This means that there is no dishonest instance that -can make the constraints pass. We will also give an example where one could find wrong -rotation witnesses that would satisfy the constraints if we did not check the range. - -### Necessity of range checks - -First of all, we will illustrate the necessity of range-checks with a simple example. -For the sake of readability, we will use some toy field lengths. In particular, let us -assume that our words have 4 bits, meaning all of the elements between `0x0` and `0xF`. -Next, we will be using the native field $\mathbb{F}_{32}$. - -As we will later see, this choice of field lengths is not enough to perform any 4-bit -rotation, since the operations in the constraints would overflow the native field. -Nonetheless, it will be sufficient for our example where we will only rotate by 1 bit. - -Assume we want to rotate the word `0b1101` (meaning 13) by 1 bit to the left. This gives -us the rotated word `0b1011` (meaning 11). The excess part of the word is `0b1`, whereas -the shifted part corresponds to `0b1010`. 
We recall the constraints for the rotation gate: - -$$ -\begin{align*} -word \cdot 2^{rot} &= excess \cdot 2^{len} + shifted \\ -rotated &= excess + shifted -\end{align*} -$$ - -Applied to our example, this results in the following equations: - -$$ -\begin{align*} -13 \cdot 2 &= excess \cdot 16 + shifted \\ -11 &= excess + shifted -\end{align*} -$$ - -We can easily check that the proposed values of the shifted `0b1010=10` and the excess -`0b1=1` values satisfy the above constraint because $26 = 1 \cdot 16 + 10$ and $11 = 1 + 10$. -Now, the question is: _can we find another value for excess and shifted, such that their addition results in an incorrect rotated word?_ - -The answer to this question is yes, due to __diophantine equations__. We basically want to find $x,y$ such that $26 = x \cdot 16 + y (\text{ mod } 32)$. The solution to this equation is: - -$$ -\begin{align*} -\forall k \in [0..31]: & \\ -x &= k \\ -y &= 26 - 16 \cdot k -\end{align*} -$$ - -We chose these word and field lengths to better understand the behaviour of the solution. Here, we can see two "classes" of evaluations. - -- If we choose an even $k$, then $y$ will have the following shape: - - $$26 - 16 \cdot (2 \cdot n) \iff 26 - 32n \equiv_{32} 26 $$ - - Meaning, if $x = 2n$ then $y = 26$. - -- If on the other hand, we chose an odd $k$, then $y$ will have the following shape instead: - - $$26 - 16 \cdot (2 \cdot n + 1) \iff 26 - 32n - 16 \equiv_{32} 26 - 16 = 10$$ - - Meaning, if $x = 2n+1$ then $y = 10$. - -Thus, possible solutions to the diophantine equation are: - -$$ -\begin{align*} -x &= 0, 1, 2, 3, 4, 5... \\ -y &= 26, 10, 26, 10, 26, 10... -\end{align*} -$$ - -Note that our valid witness is part of that set of solutions, meaning $x=1$ and $y=10$. Of course, we can also find another dishonest instantiation such as $x=0$ and $y=26$. 
Perhaps one could think that we do not need to worry about this case, because the resulting rotation word would be $0+26=26$, and if we later use that result as an input to a subsequent gate such as XOR, the value $26$ would not fit and at some point the constraint system would complain. Nonetheless, we still have other solutions to worry about, such as $(x=3, y=10)$ or $(x=5, y=10)$, since they would result in a rotated word that would fit in the word length of 4 bits, yet would be incorrect (not equal to $11$). - -All of the above incorrect solutions differ in one thing: they have different bit lengths. This means that we need to range check the values for the excess and shifted witnesses to make sure they have the correct length. - -### Sufficiency of range checks - -In the following, we will give a proof that performing range checks for these values is not only necessary but also sufficient to prove that the rotation gate is sound. In other words, we will prove there are no two possible solutions of the decomposition constraint that have the correct bit lengths. Now, for the sake of robustness, we will consider 64-bit words and fields with at least twice the bit length of the words (as is our case). - -We will proceed by __contradiction__. Suppose there are two different solutions to the following diophantic equation: - -$$ -\begin{align*} -\forall k \in \mathbb{F}_n: & \\ -x &= k \\ -y &= w \cdot 2^r - 2^{64} \cdot k -\end{align*} -$$ - -where $k$ is a parameter to instantiate the solutions, $w$ is the word to be rotated, $r$ is the rotation amount, and $n$ is the field length. - -Then, that means that there are two different solutions, $(0\leq x=a<2^r, 0\leq y=b<2^{64})$ and $(0\leq x=a'<2^r, 0\leq y=b'<2^{64})$ with at least $a \neq a'$ or $b \neq b'$. We will show that this is impossible. 
- -If both are solutions to the same equation, then: -$$ -\begin{align*} -w \cdot 2^r &= a \cdot 2^{64} + b \\ -w \cdot 2^r &= a'\cdot 2^{64} + b' -\end{align*} -$$ -means that $a \cdot 2^{64} + b = a'\cdot 2^{64} + b'$. Moving terms to the left side, we have an equivalent equality: $2^{64}(a-a') + (b-b')=0 \mod{n}$. There are three cases to consider: - -- $a = a'$ and $b \neq b'$: then $(b - b') \equiv_n 0$ and this can only happen if $b' = b + kn$. But since $n > 2^{64}$, then $b'$ cannot be smaller than $2^{64}$ as it was assumed. CONTRADICTION. - -- $b = b'$ and $a \neq a'$: then $2^{64}(a - a') \equiv_n 0$ and this can only happen if $a' = a + kn$. But since $n > 2^r$, then $a'$ cannot be smaller than $2^r$ as it was assumed. CONTRADICTION. - -- $a\neq a'$ and $b \neq b'$: then we have something like $2^{64} \alpha + \beta \equiv_n 0$. - - This means $\beta \equiv_n -2^{64} \alpha = k \cdot n - 2^{64} \alpha$ for any $k$. - - According to the assumption, both $0\leq a<2^r$ and $0\leq a'<2^r$. This means, the difference $\alpha:=(a - a')$ lies anywhere in between the following interval: - - $$1 - 2^r \leq \alpha \leq 2^r - 1$$ - - We plug in this interval to the above equation to obtain the following interval for $\beta$: - - $$k\cdot n - 2^{64}(1-2^r)\leq \beta \leq k\cdot n - 2^{64}(2^r - 1) $$ - - We look at this interval from both sides of the inequality: $\beta \geq kn - 2^{64} + 2^{64+r}$ and $\beta \leq kn + 2^{64} - 2^{64+r}$ and we wonder if $kn - 2^{64} + 2^{64+r} \leq kn + 2^{64} - 2^{64+r}$ is at all possible. We rewrite as follows: - - $$2^{64+r} - 2^{64} \leq 2^{64} - 2^{64+r}$$ - - $$2\cdot2^{64+r} \leq 2\cdot2^{64} $$ - - $$2^{64+r} \leq 2^{64} $$ - - But this can only happen if $r\leq 0$, which is impossible since we assume $0 < r < 64$.CONTRADICTION. -- EOP. 
+# RFC 7: Keccak From 992448ec58cfb177cb3658008dfe3aa5c64bebd1 Mon Sep 17 00:00:00 2001 From: Danny Willems Date: Wed, 1 Nov 2023 17:20:29 +0100 Subject: [PATCH 14/32] Bump up actions/@checkout to 4.1.1 --- .github/workflows/benches.yml | 2 +- .github/workflows/coverage.yml.disabled | 2 +- .github/workflows/gh-page.yml | 2 +- .github/workflows/rust.yml | 2 +- 4 files changed, 4 insertions(+), 4 deletions(-) diff --git a/.github/workflows/benches.yml b/.github/workflows/benches.yml index e8ac86e6b9..7fd1fe8e2e 100644 --- a/.github/workflows/benches.yml +++ b/.github/workflows/benches.yml @@ -17,7 +17,7 @@ jobs: if: github.event.label.name == 'benchmark' steps: - name: Checkout PR - uses: actions/checkout@v2 + uses: actions/checkout@v4.1.1 # as action-rs does not seem to be maintained anymore, building from # scratch the environment using rustup diff --git a/.github/workflows/coverage.yml.disabled b/.github/workflows/coverage.yml.disabled index f9f00e3503..837124ea24 100644 --- a/.github/workflows/coverage.yml.disabled +++ b/.github/workflows/coverage.yml.disabled @@ -17,7 +17,7 @@ jobs: timeout-minutes: 60 runs-on: ubuntu-latest steps: - - uses: actions/checkout@v2.3.4 + - uses: actions/checkout@v4.1.1 with: persist-credentials: false diff --git a/.github/workflows/gh-page.yml b/.github/workflows/gh-page.yml index edbccf8ca3..7077069ded 100644 --- a/.github/workflows/gh-page.yml +++ b/.github/workflows/gh-page.yml @@ -16,7 +16,7 @@ jobs: steps: - name: Checkout Repository - uses: actions/checkout@v2 + uses: actions/checkout@v4.1.1 # as action-rs does not seem to be maintained anymore, building from # scratch the environment using rustup diff --git a/.github/workflows/rust.yml b/.github/workflows/rust.yml index 3490171728..422940b2b8 100644 --- a/.github/workflows/rust.yml +++ b/.github/workflows/rust.yml @@ -26,7 +26,7 @@ jobs: name: Run some basic checks and tests steps: - name: Checkout PR - uses: actions/checkout@v3 + uses: actions/checkout@v4.1.1 # as action-rs 
does not seem to be maintained anymore, building from # scratch the environment using rustup From 251ab0c2017408bc933bce05684c0d80af668b4c Mon Sep 17 00:00:00 2001 From: Mikhail Volkhov Date: Mon, 16 Oct 2023 13:41:21 +0100 Subject: [PATCH 15/32] [#14097,#14070] Enforce using constructor through private fields --- kimchi/src/circuits/constraints.rs | 6 +++--- kimchi/src/circuits/lookup/index.rs | 10 ++++++---- kimchi/src/circuits/lookup/tables/mod.rs | 14 ++++++++++++-- kimchi/src/tests/lookup.rs | 8 ++++---- 4 files changed, 25 insertions(+), 13 deletions(-) diff --git a/kimchi/src/circuits/constraints.rs b/kimchi/src/circuits/constraints.rs index 115a696965..43425e7b50 100644 --- a/kimchi/src/circuits/constraints.rs +++ b/kimchi/src/circuits/constraints.rs @@ -689,11 +689,11 @@ impl Builder { let mut lookup_domain_size: usize = lookup_tables .iter() .map( - |LookupTable { data, id: _ }| { - if data.is_empty() { + |lt| { + if lt.data().is_empty() { 0 } else { - data[0].len() + lt.data()[0].len() } }, ) diff --git a/kimchi/src/circuits/lookup/index.rs b/kimchi/src/circuits/lookup/index.rs index 592fd0db48..96971aaf40 100644 --- a/kimchi/src/circuits/lookup/index.rs +++ b/kimchi/src/circuits/lookup/index.rs @@ -274,7 +274,9 @@ impl LookupConstraintSystem { // we don't use the second table as table ID column. let placeholders = vec![F::zero(); first_column.len()]; let data = vec![first_column, placeholders]; - let table = LookupTable { id, data }; + // TODO Check it does not fail actually. Maybe this should throw a different error. + let table = LookupTable::create(id, data).expect("Runtime table creation must succeed"); + lookup_tables.push(table); } @@ -340,17 +342,17 @@ impl LookupConstraintSystem { for table in &lookup_tables { let table_len = table.len(); - if table.id != 0 { + if table.id() != 0 { non_zero_table_id = true; } //~~ * Update the corresponding entries in a table id vector (of size the domain as well) //~ with the table ID of the table. 
- let table_id: F = i32_to_field(table.id); + let table_id: F = i32_to_field(table.id()); table_ids.extend(repeat_n(table_id, table_len)); //~~ * Copy the entries from the table to new rows in the corresponding columns of the concatenated table. - for (i, col) in table.data.iter().enumerate() { + for (i, col) in table.data().iter().enumerate() { lookup_table[i].extend(col); } diff --git a/kimchi/src/circuits/lookup/tables/mod.rs b/kimchi/src/circuits/lookup/tables/mod.rs index 063e3cf78f..716b58ecb9 100644 --- a/kimchi/src/circuits/lookup/tables/mod.rs +++ b/kimchi/src/circuits/lookup/tables/mod.rs @@ -24,8 +24,8 @@ pub enum GateLookupTable { /// A table of values that can be used for a lookup, along with the ID for the table. #[derive(Debug, Clone)] pub struct LookupTable { - pub id: i32, - pub data: Vec>, + id: i32, + data: Vec>, } /// Represents inconsistency errors during table construction and composition. @@ -100,6 +100,16 @@ where pub fn is_empty(&self) -> bool { self.data.is_empty() } + + /// Returns table id. + pub fn id(&self) -> i32 { + self.id + } + + /// Returns table data. + pub fn data(&self) -> &Vec> { + &self.data + } } /// Returns the lookup table associated to a [`GateLookupTable`]. 
diff --git a/kimchi/src/tests/lookup.rs b/kimchi/src/tests/lookup.rs index a674eba78f..7deea89a1f 100644 --- a/kimchi/src/tests/lookup.rs +++ b/kimchi/src/tests/lookup.rs @@ -33,10 +33,10 @@ fn setup_lookup_proof(use_values_from_table: bool, num_lookups: usize, table_siz let index_column = (0..lookup_table_values.len() as u64) .map(Into::into) .collect(); - LookupTable { - id: id as i32, - data: vec![index_column, lookup_table_values.clone()], - } + LookupTable::create( + id as i32, + vec![index_column, lookup_table_values.clone()] + ).expect("setup_lookup_proof: Table creation must succeed") }) .collect(); From cb460628bb7d97cd60edb47884150e6682327cc3 Mon Sep 17 00:00:00 2001 From: Mikhail Volkhov Date: Mon, 16 Oct 2023 14:08:43 +0100 Subject: [PATCH 16/32] Formatting --- kimchi/src/circuits/constraints.rs | 16 +++++++--------- kimchi/src/circuits/lookup/index.rs | 3 ++- kimchi/src/tests/lookup.rs | 6 ++---- 3 files changed, 11 insertions(+), 14 deletions(-) diff --git a/kimchi/src/circuits/constraints.rs b/kimchi/src/circuits/constraints.rs index 43425e7b50..ea9cbadf74 100644 --- a/kimchi/src/circuits/constraints.rs +++ b/kimchi/src/circuits/constraints.rs @@ -688,15 +688,13 @@ impl Builder { // First we sum over the lookup table size let mut lookup_domain_size: usize = lookup_tables .iter() - .map( - |lt| { - if lt.data().is_empty() { - 0 - } else { - lt.data()[0].len() - } - }, - ) + .map(|lt| { + if lt.data().is_empty() { + 0 + } else { + lt.data()[0].len() + } + }) .sum(); // After that on the runtime tables if let Some(runtime_tables) = runtime_tables.as_ref() { diff --git a/kimchi/src/circuits/lookup/index.rs b/kimchi/src/circuits/lookup/index.rs index 96971aaf40..3b2b856ba6 100644 --- a/kimchi/src/circuits/lookup/index.rs +++ b/kimchi/src/circuits/lookup/index.rs @@ -275,7 +275,8 @@ impl LookupConstraintSystem { let placeholders = vec![F::zero(); first_column.len()]; let data = vec![first_column, placeholders]; // TODO Check it does not fail actually. 
Maybe this should throw a different error. - let table = LookupTable::create(id, data).expect("Runtime table creation must succeed"); + let table = LookupTable::create(id, data) + .expect("Runtime table creation must succeed"); lookup_tables.push(table); } diff --git a/kimchi/src/tests/lookup.rs b/kimchi/src/tests/lookup.rs index 7deea89a1f..010dd07a4f 100644 --- a/kimchi/src/tests/lookup.rs +++ b/kimchi/src/tests/lookup.rs @@ -33,10 +33,8 @@ fn setup_lookup_proof(use_values_from_table: bool, num_lookups: usize, table_siz let index_column = (0..lookup_table_values.len() as u64) .map(Into::into) .collect(); - LookupTable::create( - id as i32, - vec![index_column, lookup_table_values.clone()] - ).expect("setup_lookup_proof: Table creation must succeed") + LookupTable::create(id as i32, vec![index_column, lookup_table_values.clone()]) + .expect("setup_lookup_proof: Table creation must succeed") }) .collect(); From e3aceafedb10f46d5daf1609793b82c3a96920ce Mon Sep 17 00:00:00 2001 From: Mikhail Volkhov Date: Mon, 16 Oct 2023 15:01:07 +0100 Subject: [PATCH 17/32] [#14097,#14070] Fix lookup test creating invalid id=0 zero table --- kimchi/src/circuits/lookup/index.rs | 2 +- kimchi/src/circuits/lookup/tables/mod.rs | 37 ++++++++++--------- .../src/circuits/lookup/tables/range_check.rs | 8 ++-- kimchi/src/circuits/lookup/tables/xor.rs | 6 +-- kimchi/src/tests/lookup.rs | 4 +- 5 files changed, 28 insertions(+), 29 deletions(-) diff --git a/kimchi/src/circuits/lookup/index.rs b/kimchi/src/circuits/lookup/index.rs index 3b2b856ba6..758db1b6c6 100644 --- a/kimchi/src/circuits/lookup/index.rs +++ b/kimchi/src/circuits/lookup/index.rs @@ -1,4 +1,3 @@ -use super::runtime_tables::{RuntimeTableCfg, RuntimeTableSpec}; use crate::circuits::{ domains::EvaluationDomains, gate::CircuitGate, @@ -6,6 +5,7 @@ use crate::circuits::{ constraints::LookupConfiguration, lookups::{LookupInfo, LookupPattern}, tables::LookupTable, + runtime_tables::{RuntimeTableCfg, RuntimeTableSpec}, }, }; use 
ark_ff::{FftField, PrimeField, SquareRootField}; diff --git a/kimchi/src/circuits/lookup/tables/mod.rs b/kimchi/src/circuits/lookup/tables/mod.rs index 716b58ecb9..c5f68c341d 100644 --- a/kimchi/src/circuits/lookup/tables/mod.rs +++ b/kimchi/src/circuits/lookup/tables/mod.rs @@ -1,4 +1,4 @@ -use ark_ff::{FftField, One, Zero}; +use ark_ff::{Field, One, Zero}; use poly_commitment::PolyComm; use serde::{Deserialize, Serialize}; use thiserror::Error; @@ -6,21 +6,6 @@ use thiserror::Error; pub mod range_check; pub mod xor; -//~ spec:startcode -/// The table ID associated with the XOR lookup table. -pub const XOR_TABLE_ID: i32 = 0; - -/// The range check table ID. -pub const RANGE_CHECK_TABLE_ID: i32 = 1; -//~ spec:endcode - -/// Enumerates the different 'fixed' lookup tables used by individual gates -#[derive(Copy, Clone, Debug, PartialEq, Eq, Hash, Serialize, Deserialize)] -pub enum GateLookupTable { - Xor, - RangeCheck, -} - /// A table of values that can be used for a lookup, along with the ID for the table. #[derive(Debug, Clone)] pub struct LookupTable { @@ -39,7 +24,7 @@ pub enum LookupTableError { impl LookupTable where - F: FftField, + F: Field, { pub fn create(id: i32, data: Vec>) -> Result { let res = LookupTable { id, data }; @@ -112,8 +97,23 @@ where } } +//~ spec:startcode +/// The table ID associated with the XOR lookup table. +pub const XOR_TABLE_ID: i32 = 0; + +/// The range check table ID. +pub const RANGE_CHECK_TABLE_ID: i32 = 1; +//~ spec:endcode + +/// Enumerates the different 'fixed' lookup tables used by individual gates +#[derive(Copy, Clone, Debug, PartialEq, Eq, Hash, Serialize, Deserialize)] +pub enum GateLookupTable { + Xor, + RangeCheck, +} + /// Returns the lookup table associated to a [`GateLookupTable`]. 
-pub fn get_table(table_name: GateLookupTable) -> LookupTable { +pub fn get_table(table_name: GateLookupTable) -> LookupTable { match table_name { GateLookupTable::Xor => xor::xor_table(), GateLookupTable::RangeCheck => range_check::range_check_table(), @@ -155,6 +155,7 @@ where F: Zero + One + Clone, I: DoubleEndedIterator, { + // TODO: unnecessary cloning if binops between F and &F are supported v.rev() .fold(F::zero(), |acc, x| joint_combiner.clone() * acc + x.clone()) + table_id_combiner.clone() * table_id.clone() diff --git a/kimchi/src/circuits/lookup/tables/range_check.rs b/kimchi/src/circuits/lookup/tables/range_check.rs index 001ffedd52..2bf00e64f7 100644 --- a/kimchi/src/circuits/lookup/tables/range_check.rs +++ b/kimchi/src/circuits/lookup/tables/range_check.rs @@ -14,11 +14,9 @@ pub fn range_check_table() -> LookupTable where F: Field, { - let table = vec![(0..RANGE_CHECK_UPPERBOUND).map(F::from).collect()]; - LookupTable { - id: RANGE_CHECK_TABLE_ID, - data: table, - } + let data = vec![(0..RANGE_CHECK_UPPERBOUND).map(F::from).collect()]; + LookupTable::create(RANGE_CHECK_TABLE_ID, data) + .expect("range_check_table creation must succeed") } pub const TABLE_SIZE: usize = RANGE_CHECK_UPPERBOUND as usize; diff --git a/kimchi/src/circuits/lookup/tables/xor.rs b/kimchi/src/circuits/lookup/tables/xor.rs index d846942a31..6f87377d96 100644 --- a/kimchi/src/circuits/lookup/tables/xor.rs +++ b/kimchi/src/circuits/lookup/tables/xor.rs @@ -37,10 +37,8 @@ pub fn xor_table() -> LookupTable { // Just to be safe. 
assert!(r[r.len() - 1].is_zero()); } - LookupTable { - id: XOR_TABLE_ID, - data, - } + + LookupTable::create(XOR_TABLE_ID, data).expect("xor_table creation must succeed") } pub const TABLE_SIZE: usize = 256; diff --git a/kimchi/src/tests/lookup.rs b/kimchi/src/tests/lookup.rs index 010dd07a4f..6363c69063 100644 --- a/kimchi/src/tests/lookup.rs +++ b/kimchi/src/tests/lookup.rs @@ -22,10 +22,12 @@ type BaseSponge = DefaultFqSponge; type ScalarSponge = DefaultFrSponge; fn setup_lookup_proof(use_values_from_table: bool, num_lookups: usize, table_sizes: Vec) { - let lookup_table_values: Vec> = table_sizes + let mut lookup_table_values: Vec> = table_sizes .iter() .map(|size| (0..*size).map(|_| rand::random()).collect()) .collect(); + // Zero table must have a zero row + lookup_table_values[0][0] = From::from(0); let lookup_tables = lookup_table_values .iter() .enumerate() From 1fac311cd2a8054d7fc07a56d493595dd4f7cbe1 Mon Sep 17 00:00:00 2001 From: Mikhail Volkhov Date: Tue, 24 Oct 2023 18:28:18 +0100 Subject: [PATCH 18/32] Add table id collision assertions to LookupConstraintSystem#create --- kimchi/src/circuits/lookup/index.rs | 34 ++++++++++++++++++++++++++--- 1 file changed, 31 insertions(+), 3 deletions(-) diff --git a/kimchi/src/circuits/lookup/index.rs b/kimchi/src/circuits/lookup/index.rs index 758db1b6c6..c645cb77eb 100644 --- a/kimchi/src/circuits/lookup/index.rs +++ b/kimchi/src/circuits/lookup/index.rs @@ -4,8 +4,8 @@ use crate::circuits::{ lookup::{ constraints::LookupConfiguration, lookups::{LookupInfo, LookupPattern}, - tables::LookupTable, runtime_tables::{RuntimeTableCfg, RuntimeTableSpec}, + tables::LookupTable, }, }; use ark_ff::{FftField, PrimeField, SquareRootField}; @@ -28,6 +28,10 @@ pub enum LookupError { length: usize, maximum_allowed: usize, }, + #[error("Cannot create a combined table since ids for sub-tables are colliding. 
The collision type is: {collision_type}")] + LookupTableIdCollision { + collision_type: String, + }, } /// Lookup selectors @@ -223,9 +227,32 @@ impl LookupConstraintSystem { .chain(lookup_tables) .collect(); + // Checks whether iterator collects any duplicates, and if yes, raises + // a corresponding LookupTableIdCollision error. + fn check_id_duplicates<'a, I:Iterator>(iter: I, msg: &str) -> Result<(),LookupError> { + use itertools::Itertools; + match iter.duplicates().collect::>() { + dups if !dups.is_empty() => { + Err(LookupError::LookupTableIdCollision { + collision_type: format!("{}: {:?}", msg, dups).to_string() + }) + }, + _ => {Ok(())} + } + } + + let fixed_lookup_tables_ids: Vec = lookup_tables.iter().map(|lt| lt.id()).collect(); + check_id_duplicates(fixed_lookup_tables_ids.iter(),"fixed lookup table duplicates")?; + // if we are using runtime tables let (runtime_table_offset, runtime_selector) = if let Some(runtime_tables) = &runtime_tables { + let runtime_tables_ids: Vec = runtime_tables.iter().map(|rt| rt.id).collect(); + check_id_duplicates(runtime_tables_ids.iter(), "runtime table duplicates")?; + check_id_duplicates(runtime_tables_ids.iter().chain(fixed_lookup_tables_ids.iter()), + "duplicates between runtime and fixed tables")?; + + // save the offset of the end of the table let mut runtime_table_offset = 0; for table in &lookup_tables { @@ -266,8 +293,6 @@ impl LookupConstraintSystem { let (id, first_column) = (runtime_table.id, runtime_table.first_column.clone()); - // @volhovm: Do we need to enforce that there is at least one table - // with id 0? // important: we still need a placeholder column to make sure that // if all other tables have a single column @@ -389,6 +414,9 @@ impl LookupConstraintSystem { lookup_table8.push(eval); } + + // @volhovm: Do we need to enforce that there is at least one table + // with id 0? //~ 9. 
pre-compute polynomial and evaluation form for the table IDs, //~ only if a table with an ID different from zero was used. let (table_ids, table_ids8) = if non_zero_table_id { From d0e5de6076b472723d748834548ed5dc2f137c7c Mon Sep 17 00:00:00 2001 From: Mikhail Volkhov Date: Mon, 30 Oct 2023 09:26:33 +0000 Subject: [PATCH 19/32] Improve lookup collision checks, fixed broken tests --- book/src/specs/kimchi.md | 4 +- kimchi/src/circuits/lookup/index.rs | 72 ++++++++++++-------- kimchi/src/circuits/lookup/lookups.rs | 6 +- kimchi/src/circuits/lookup/runtime_tables.rs | 10 ++- kimchi/src/circuits/lookup/tables/mod.rs | 2 +- kimchi/src/prover_index.rs | 2 + kimchi/src/tests/and.rs | 1 + kimchi/src/tests/foreign_field_add.rs | 1 - kimchi/src/tests/lookup.rs | 4 +- kimchi/src/tests/range_check.rs | 5 +- kimchi/src/tests/rot.rs | 1 - kimchi/src/tests/xor.rs | 1 - 12 files changed, 67 insertions(+), 42 deletions(-) diff --git a/book/src/specs/kimchi.md b/book/src/specs/kimchi.md index 13a51330d9..d84af63172 100644 --- a/book/src/specs/kimchi.md +++ b/book/src/specs/kimchi.md @@ -1641,8 +1641,8 @@ If lookup is used, the following values are added to the common index: To create the index, follow these steps: 1. If no lookup is used in the circuit, do not create a lookup index -2. Get the lookup selectors and lookup tables (TODO: how?) -3. Concatenate runtime lookup tables with the ones used by gates +2. Get the lookup selectors and lookup tables that are specified implicitly +3. Concatenate explicit runtime lookup tables with the ones (implicitly) used by gates. 4. Get the highest number of columns `max_table_width` that a lookup table can have. 5. Create the concatenated table of all the fixed lookup tables. 
diff --git a/kimchi/src/circuits/lookup/index.rs b/kimchi/src/circuits/lookup/index.rs index c645cb77eb..861e3693c4 100644 --- a/kimchi/src/circuits/lookup/index.rs +++ b/kimchi/src/circuits/lookup/index.rs @@ -29,9 +29,7 @@ pub enum LookupError { maximum_allowed: usize, }, #[error("Cannot create a combined table since ids for sub-tables are colliding. The collision type is: {collision_type}")] - LookupTableIdCollision { - collision_type: String, - }, + LookupTableIdCollision { collision_type: String }, } /// Lookup selectors @@ -200,7 +198,7 @@ impl LookupConstraintSystem { /// Will give error if inputs validation do not match. pub fn create( gates: &[CircuitGate], - lookup_tables: Vec>, + fixed_lookup_tables: Vec>, runtime_tables: Option>>, domain: &EvaluationDomains, zk_rows: usize, @@ -217,41 +215,63 @@ impl LookupConstraintSystem { // product is 1, we cannot use those rows to store any values. let max_num_entries = d1_size - zk_rows - 1; - //~ 2. Get the lookup selectors and lookup tables (TODO: how?) + //~ 2. Get the lookup selectors and lookup tables that are specified implicitly + // by the lookup gates (TODO: how?) let (lookup_selectors, gate_lookup_tables) = lookup_info.selector_polynomials_and_tables(domain, gates); - //~ 3. Concatenate runtime lookup tables with the ones used by gates - let mut lookup_tables: Vec<_> = gate_lookup_tables - .into_iter() - .chain(lookup_tables) - .collect(); - - // Checks whether iterator collects any duplicates, and if yes, raises + // Checks whether an iterator contains any duplicates, and if yes, raises // a corresponding LookupTableIdCollision error. 
- fn check_id_duplicates<'a, I:Iterator>(iter: I, msg: &str) -> Result<(),LookupError> { + fn check_id_duplicates<'a, I: Iterator>( + iter: I, + msg: &str, + ) -> Result<(), LookupError> { use itertools::Itertools; match iter.duplicates().collect::>() { - dups if !dups.is_empty() => { - Err(LookupError::LookupTableIdCollision { - collision_type: format!("{}: {:?}", msg, dups).to_string() - }) - }, - _ => {Ok(())} + dups if !dups.is_empty() => Err(LookupError::LookupTableIdCollision { + collision_type: format!("{}: {:?}", msg, dups).to_string(), + }), + _ => Ok(()), } } - let fixed_lookup_tables_ids: Vec = lookup_tables.iter().map(|lt| lt.id()).collect(); - check_id_duplicates(fixed_lookup_tables_ids.iter(),"fixed lookup table duplicates")?; + // If there is a gate using a lookup table, this table must not be added + // explicitly to the constraint system. + let fixed_gate_joint_ids: Vec = fixed_lookup_tables + .iter() + .map(|lt| lt.id()) + .chain(gate_lookup_tables.iter().map(|lt| lt.id())) + .collect(); + check_id_duplicates( + fixed_gate_joint_ids.iter(), + "duplicates between fixed given and fixed from-gate tables", + )?; + + //~ 3. Concatenate explicit runtime lookup tables with the ones (implicitly) used by gates. 
+ let mut lookup_tables: Vec> = fixed_lookup_tables + .into_iter() + .chain(gate_lookup_tables) + .collect(); + + let fixed_lookup_tables_ids: Vec = + lookup_tables.iter().map(|lt| lt.id()).collect(); + check_id_duplicates( + fixed_lookup_tables_ids.iter(), + "fixed lookup table duplicates", + )?; // if we are using runtime tables let (runtime_table_offset, runtime_selector) = if let Some(runtime_tables) = &runtime_tables { - let runtime_tables_ids: Vec = runtime_tables.iter().map(|rt| rt.id).collect(); + let runtime_tables_ids: Vec = + runtime_tables.iter().map(|rt| rt.id).collect(); check_id_duplicates(runtime_tables_ids.iter(), "runtime table duplicates")?; - check_id_duplicates(runtime_tables_ids.iter().chain(fixed_lookup_tables_ids.iter()), - "duplicates between runtime and fixed tables")?; - + check_id_duplicates( + runtime_tables_ids + .iter() + .chain(fixed_lookup_tables_ids.iter()), + "duplicates between runtime and fixed tables", + )?; // save the offset of the end of the table let mut runtime_table_offset = 0; @@ -293,7 +313,6 @@ impl LookupConstraintSystem { let (id, first_column) = (runtime_table.id, runtime_table.first_column.clone()); - // important: we still need a placeholder column to make sure that // if all other tables have a single column // we don't use the second table as table ID column. @@ -414,7 +433,6 @@ impl LookupConstraintSystem { lookup_table8.push(eval); } - // @volhovm: Do we need to enforce that there is at least one table // with id 0? //~ 9. 
pre-compute polynomial and evaluation form for the table IDs, diff --git a/kimchi/src/circuits/lookup/lookups.rs b/kimchi/src/circuits/lookup/lookups.rs index b126e1be00..5796fcb814 100644 --- a/kimchi/src/circuits/lookup/lookups.rs +++ b/kimchi/src/circuits/lookup/lookups.rs @@ -204,7 +204,7 @@ impl LookupInfo { &self, domain: &EvaluationDomains, gates: &[CircuitGate], - ) -> (LookupSelectors>, Vec>) { + ) -> (LookupSelectors>, HashSet>) { let n = domain.d1.size(); let mut selector_values = LookupSelectors::default(); @@ -222,7 +222,7 @@ impl LookupInfo { }; // TODO: is take(n) useful here? I don't see why we need this - for (i, gate) in gates.iter().enumerate().take(n) { + for (i, gate) in gates.iter().take(n).enumerate() { let typ = gate.typ; if let Some(lookup_pattern) = LookupPattern::from_gate(typ, CurrOrNext::Curr) { @@ -246,7 +246,7 @@ impl LookupInfo { .interpolate() .evaluate_over_domain(domain.d8) }); - let res_tables: Vec<_> = gate_tables.into_iter().map(get_table).collect(); + let res_tables: HashSet<_> = gate_tables.into_iter().map(get_table).collect(); (selector_values8, res_tables) } diff --git a/kimchi/src/circuits/lookup/runtime_tables.rs b/kimchi/src/circuits/lookup/runtime_tables.rs index 98b018ed8a..d05a0a5a72 100644 --- a/kimchi/src/circuits/lookup/runtime_tables.rs +++ b/kimchi/src/circuits/lookup/runtime_tables.rs @@ -18,6 +18,8 @@ pub struct RuntimeTableSpec { pub len: usize, } +/// A configuration of the runtime table as known at setup time. +/// /// Use this type at setup time, to list all the runtime tables. /// /// Note: care must be taken as table IDs can collide with IDs of other types of lookup tables. @@ -25,7 +27,8 @@ pub struct RuntimeTableSpec { pub struct RuntimeTableCfg { /// The table ID. pub id: i32, - /// The content of the first column of the runtime table. + /// The content of the first column of the runtime table, i.e. + /// keys when a table is viewed as a (k,v) array. 
pub first_column: Vec,
 }
 
@@ -56,12 +59,13 @@ impl From> for RuntimeTableSpec {
 }
 
 /// A runtime table. Runtime tables must match the configuration
-/// that was specified in [`RuntimeTableCfg`].
+/// specified in [`RuntimeTableCfg`].
 #[derive(Debug, Clone)]
 pub struct RuntimeTable {
     /// The table id.
     pub id: i32,
-    /// A single column.
+    /// A single column. Represents runtime table values, where
+    /// [`RuntimeTableCfg`] defines compile-time keys.
     pub data: Vec,
 }
 
diff --git a/kimchi/src/circuits/lookup/tables/mod.rs b/kimchi/src/circuits/lookup/tables/mod.rs
index c5f68c341d..7a9397115f 100644
--- a/kimchi/src/circuits/lookup/tables/mod.rs
+++ b/kimchi/src/circuits/lookup/tables/mod.rs
@@ -7,7 +7,7 @@ pub mod range_check;
 pub mod xor;
 
 /// A table of values that can be used for a lookup, along with the ID for the table.
-#[derive(Debug, Clone)]
+#[derive(Debug, Clone, PartialEq, Eq, Hash)]
 pub struct LookupTable {
     id: i32,
     data: Vec>,
diff --git a/kimchi/src/prover_index.rs b/kimchi/src/prover_index.rs
index 44ee0f6266..b28442fb53 100644
--- a/kimchi/src/prover_index.rs
+++ b/kimchi/src/prover_index.rs
@@ -211,7 +211,9 @@ pub mod testing {
         override_srs_size,
         |d1: D, size: usize| {
             let log2_size = size.ilog2();
+            // Run test_srs_serialization test to generate test SRS & enable this
             let mut srs = if log2_size <= precomputed_srs::SERIALIZED_SRS_SIZE {
+                // @volhovm: on my machine for d=16 (2.2Mb SRS file) this takes 110s. Why???
// TODO: we should trim it if it's smaller precomputed_srs::get_srs() } else { diff --git a/kimchi/src/tests/and.rs b/kimchi/src/tests/and.rs index e344af6da4..9c1a86fbcd 100644 --- a/kimchi/src/tests/and.rs +++ b/kimchi/src/tests/and.rs @@ -255,6 +255,7 @@ fn verify_bad_and_decomposition( ); witness[col][and_row] += G::ScalarField::one(); } + if col == 2 { assert_eq!( cs.gates[0].verify_witness::(0, witness, &cs, &witness[0][0..cs.public]), diff --git a/kimchi/src/tests/foreign_field_add.rs b/kimchi/src/tests/foreign_field_add.rs index 24c1d5a8c1..760c7fa2d5 100644 --- a/kimchi/src/tests/foreign_field_add.rs +++ b/kimchi/src/tests/foreign_field_add.rs @@ -1490,7 +1490,6 @@ fn test_ffadd_finalization() { let index = { let cs = ConstraintSystem::create(gates.clone()) - .lookup(vec![range_check::gadget::lookup_table()]) .public(num_public_inputs) .build() .unwrap(); diff --git a/kimchi/src/tests/lookup.rs b/kimchi/src/tests/lookup.rs index 6363c69063..269235d35e 100644 --- a/kimchi/src/tests/lookup.rs +++ b/kimchi/src/tests/lookup.rs @@ -200,7 +200,7 @@ fn test_runtime_table() { let len = first_column.len(); let mut runtime_tables_setup = vec![]; - for table_id in 0..num { + for table_id in 1..num + 1 { let cfg = RuntimeTableCfg { id: table_id, first_column: first_column.into_iter().map(Into::into).collect(), @@ -236,7 +236,7 @@ fn test_runtime_table() { for row in 0..20 { // the first register is the table id. We pick one random table. - lookup_cols[0][row] = (rng.gen_range(0..num) as u32).into(); + lookup_cols[0][row] = (rng.gen_range(1..num + 1) as u32).into(); // create queries into our runtime lookup table. 
// We will set [w1, w2], [w3, w4] and [w5, w6] to randon indexes and diff --git a/kimchi/src/tests/range_check.rs b/kimchi/src/tests/range_check.rs index 27240db942..577e2aa4f7 100644 --- a/kimchi/src/tests/range_check.rs +++ b/kimchi/src/tests/range_check.rs @@ -68,7 +68,10 @@ fn create_test_prover_index( gates, public_size, 0, - vec![range_check::gadget::lookup_table()], + // specifying lookup table is not necessary, + // since it's already passed through patterns implicitly + //vec![range_check::gadget::lookup_table()], + vec![], None, false, None, diff --git a/kimchi/src/tests/rot.rs b/kimchi/src/tests/rot.rs index f88125cf9b..f9a1308b86 100644 --- a/kimchi/src/tests/rot.rs +++ b/kimchi/src/tests/rot.rs @@ -328,7 +328,6 @@ fn test_rot_finalization() { let index = { let cs = ConstraintSystem::create(gates.clone()) .public(num_public_inputs) - .lookup(vec![rot::lookup_table()]) .build() .unwrap(); let mut srs = SRS::::create(cs.domain.d1.size()); diff --git a/kimchi/src/tests/xor.rs b/kimchi/src/tests/xor.rs index 0344e0aea3..7ab28b4008 100644 --- a/kimchi/src/tests/xor.rs +++ b/kimchi/src/tests/xor.rs @@ -392,7 +392,6 @@ fn test_xor_finalization() { let index = { let cs = ConstraintSystem::create(gates.clone()) - .lookup(vec![xor::lookup_table()]) .public(num_inputs) .build() .unwrap(); From 64e915537b7b560c77a8f6d87f68def267a37dba Mon Sep 17 00:00:00 2001 From: Mikhail Volkhov Date: Mon, 30 Oct 2023 18:50:18 +0000 Subject: [PATCH 20/32] Add a test for lookup table id collisions --- kimchi/src/circuits/constraints.rs | 2 +- kimchi/src/circuits/lookup/index.rs | 104 +++++++++++++++++++++++++++- kimchi/src/error.rs | 4 ++ 3 files changed, 108 insertions(+), 2 deletions(-) diff --git a/kimchi/src/circuits/constraints.rs b/kimchi/src/circuits/constraints.rs index ea9cbadf74..ae8e63ba91 100644 --- a/kimchi/src/circuits/constraints.rs +++ b/kimchi/src/circuits/constraints.rs @@ -820,7 +820,7 @@ impl Builder { &domain, zk_rows as usize, ) - .map_err(|e| 
SetupError::ConstraintSystem(e.to_string()))?; + .map_err(SetupError::LookupCreation)?; let sid = shifts.map[0].clone(); diff --git a/kimchi/src/circuits/lookup/index.rs b/kimchi/src/circuits/lookup/index.rs index 861e3693c4..50b0879242 100644 --- a/kimchi/src/circuits/lookup/index.rs +++ b/kimchi/src/circuits/lookup/index.rs @@ -21,7 +21,7 @@ use std::iter; use thiserror::Error; /// Represents an error found when computing the lookup constraint system -#[derive(Debug, Error)] +#[derive(Debug, Error, Clone)] pub enum LookupError { #[error("The combined lookup table is larger than allowed by the domain size. Observed: {length}, expected: {maximum_allowed}")] LookupTableTooLong { @@ -467,3 +467,105 @@ impl LookupConstraintSystem { } } } + +#[cfg(test)] +mod tests { + + use super::{LookupError, LookupTable, RuntimeTableCfg}; + use crate::{ + circuits::constraints::ConstraintSystem, circuits::gate::CircuitGate, + circuits::lookup::tables::xor, circuits::polynomials::range_check, error::SetupError, + }; + use mina_curves::pasta::Fp; + + #[test] + fn colliding_table_ids() { + let (_, gates) = CircuitGate::::create_multi_range_check(0); + let collision_id: i32 = 5; + + let cs = ConstraintSystem::::create(gates.clone()) + .lookup(vec![range_check::gadget::lookup_table()]) + .build(); + + assert!( + matches!( + cs, + Err(SetupError::LookupCreation( + LookupError::LookupTableIdCollision { .. } + )) + ), + "LookupConstraintSystem::create(...) must fail due to range table passed twice" + ); + + let cs = ConstraintSystem::::create(gates.clone()) + .lookup(vec![xor::xor_table()]) + .build(); + + assert!( + cs.is_ok(), + "LookupConstraintSystem::create(...) 
must succeed, no duplicates exist" + ); + + let cs = ConstraintSystem::::create(gates.clone()) + .lookup(vec![ + LookupTable::create(collision_id, vec![vec![From::from(0); 16]]).unwrap(), + LookupTable::create(collision_id, vec![vec![From::from(1); 16]]).unwrap(), + ]) + .build(); + + assert!( + matches!( + cs, + Err(SetupError::LookupCreation( + LookupError::LookupTableIdCollision { .. } + )) + ), + "LookupConstraintSystem::create(...) must fail, collision in fixed ids" + ); + + let cs = ConstraintSystem::::create(gates.clone()) + .runtime(Some(vec![ + RuntimeTableCfg { + id: collision_id, + first_column: vec![From::from(0); 16], + }, + RuntimeTableCfg { + id: collision_id, + first_column: vec![From::from(1); 16], + }, + ])) + .build(); + + assert!( + matches!( + cs, + Err(SetupError::LookupCreation( + LookupError::LookupTableIdCollision { .. } + )) + ), + "LookupConstraintSystem::create(...) must fail, collision in runtime ids" + ); + + let cs = ConstraintSystem::::create(gates.clone()) + .lookup(vec![LookupTable::create( + collision_id, + vec![vec![From::from(0); 16]], + ) + .unwrap()]) + .runtime(Some(vec![RuntimeTableCfg { + id: collision_id, + first_column: vec![From::from(1); 16], + }])) + .build(); + + assert!( + matches!( + cs, + Err(SetupError::LookupCreation( + LookupError::LookupTableIdCollision { .. } + )) + ), + "LookupConstraintSystem::create(...) must fail, collision between runtime and lookup ids" + ); + } +} diff --git a/kimchi/src/error.rs b/kimchi/src/error.rs index 8c801fd38f..8f2e8406a1 100644 --- a/kimchi/src/error.rs +++ b/kimchi/src/error.rs @@ -1,5 +1,6 @@ //! This module implements the [`ProverError`] type. 
+use crate::circuits::lookup::index::LookupError; // not sure about hierarchy
 use poly_commitment::error::CommitmentError;
 use thiserror::Error;
 
@@ -100,6 +101,9 @@ pub enum SetupError {
 
     #[error("the domain could not be constructed: {0}")]
     DomainCreation(DomainCreationError),
+
+    #[error("the lookup constraint system cannot be constructed: {0}")]
+    LookupCreation(LookupError),
 }
 
 /// Errors that can arise when creating a verifier index

From 2121c7faf31ac0037ea0024af87fbc3da6f768dc Mon Sep 17 00:00:00 2001
From: Mikhail Volkhov
Date: Thu, 2 Nov 2023 11:54:29 +0000
Subject: [PATCH 21/32] Address PR comments [MinaProtocol/mina#14070]

---
 kimchi/src/circuits/constraints.rs | 11 +----------
 kimchi/src/circuits/lookup/index.rs | 2 +-
 kimchi/src/circuits/lookup/tables/mod.rs | 17 +++++++++++++++--
 kimchi/src/precomputed_srs.rs | 3 +++
 kimchi/src/prover_index.rs | 1 -
 5 files changed, 20 insertions(+), 14 deletions(-)

diff --git a/kimchi/src/circuits/constraints.rs b/kimchi/src/circuits/constraints.rs
index ae8e63ba91..8af6df4280 100644
--- a/kimchi/src/circuits/constraints.rs
+++ b/kimchi/src/circuits/constraints.rs
@@ -686,16 +686,7 @@ impl Builder {
 
         let lookup_domain_size = {
             // First we sum over the lookup table size
-            let mut lookup_domain_size: usize = lookup_tables
-                .iter()
-                .map(|lt| {
-                    if lt.data().is_empty() {
-                        0
-                    } else {
-                        lt.data()[0].len()
-                    }
-                })
-                .sum();
+            let mut lookup_domain_size: usize = lookup_tables.iter().map(|lt| lt.len()).sum();
             // After that on the runtime tables
             if let Some(runtime_tables) = runtime_tables.as_ref() {
                 for runtime_table in runtime_tables.iter() {
diff --git a/kimchi/src/circuits/lookup/index.rs b/kimchi/src/circuits/lookup/index.rs
index 50b0879242..41a9709737 100644
--- a/kimchi/src/circuits/lookup/index.rs
+++ b/kimchi/src/circuits/lookup/index.rs
@@ -216,7 +216,7 @@ impl LookupConstraintSystem {
         let max_num_entries = d1_size - zk_rows - 1;
 
         //~ 2.
Get the lookup selectors and lookup tables that are specified implicitly - // by the lookup gates (TODO: how?) + // by the lookup gates. let (lookup_selectors, gate_lookup_tables) = lookup_info.selector_polynomials_and_tables(domain, gates); diff --git a/kimchi/src/circuits/lookup/tables/mod.rs b/kimchi/src/circuits/lookup/tables/mod.rs index 7a9397115f..3672d47ec2 100644 --- a/kimchi/src/circuits/lookup/tables/mod.rs +++ b/kimchi/src/circuits/lookup/tables/mod.rs @@ -16,6 +16,8 @@ pub struct LookupTable { /// Represents inconsistency errors during table construction and composition. #[derive(Debug, Error)] pub enum LookupTableError { + #[error("Table must be nonempty")] + InputTableDataEmpty, #[error("One of the lookup tables has columns of different lengths")] InconsistentTableLength, #[error("The table with id 0 must have an entry of all zeros")] @@ -28,9 +30,14 @@ where { pub fn create(id: i32, data: Vec>) -> Result { let res = LookupTable { id, data }; - let table_len = res.len(); + + // Empty tables are not allowed + if res.data.is_empty() { + return Err(LookupTableError::InputTableDataEmpty); + } // All columns in the table must have same length + let table_len = res.len(); for col in res.data.iter() { if col.len() != table_len { return Err(LookupTableError::InconsistentTableLength); @@ -282,7 +289,13 @@ mod tests { } #[test] - fn test_inconsistent_lengths() { + fn test_invalid_data_inputs() { + let table: Result, _> = LookupTable::create(0, vec![]); + assert!( + matches!(table, Err(LookupTableError::InputTableDataEmpty)), + "LookupTable::create(...) 
must fail when empty table creation is attempted" + ); + let lookup_r: u64 = 32; // Two columns of different lengths let lookup_table_values_1: Vec<_> = (0..2 * lookup_r).map(From::from).collect(); diff --git a/kimchi/src/precomputed_srs.rs b/kimchi/src/precomputed_srs.rs index 116554e262..11f60edec3 100644 --- a/kimchi/src/precomputed_srs.rs +++ b/kimchi/src/precomputed_srs.rs @@ -33,6 +33,9 @@ where let file = File::open(srs_path.clone()).unwrap_or_else(|_| panic!("missing SRS file: {srs_path:?}")); let reader = BufReader::new(file); + // Note: In tests, this read takes significant amount of time (2 min) due + // to -O0 optimisation level. Compile tests with -O1 or --release flag. + // See: https://github.com/o1-labs/proof-systems/blob/develop/CONTRIBUTING.md#development rmp_serde::from_read(reader).unwrap() } diff --git a/kimchi/src/prover_index.rs b/kimchi/src/prover_index.rs index b28442fb53..8348baa289 100644 --- a/kimchi/src/prover_index.rs +++ b/kimchi/src/prover_index.rs @@ -213,7 +213,6 @@ pub mod testing { let log2_size = size.ilog2(); // Run test_srs_serialization test to generate test SRS & enable this let mut srs = if log2_size <= precomputed_srs::SERIALIZED_SRS_SIZE { - // @volhovm: on my machine for d=16 (2.2Mb SRS file) this takes 110s. Why??? 
// TODO: we should trim it if it's smaller precomputed_srs::get_srs() } else { From d79015d4287949bf7eed51640c22de610b9390c5 Mon Sep 17 00:00:00 2001 From: Mikhail Volkhov Date: Thu, 2 Nov 2023 13:03:17 +0000 Subject: [PATCH 22/32] Revert HashSet> changes --- kimchi/src/circuits/lookup/lookups.rs | 4 ++-- kimchi/src/circuits/lookup/tables/mod.rs | 2 +- 2 files changed, 3 insertions(+), 3 deletions(-) diff --git a/kimchi/src/circuits/lookup/lookups.rs b/kimchi/src/circuits/lookup/lookups.rs index 5796fcb814..12e4bd058d 100644 --- a/kimchi/src/circuits/lookup/lookups.rs +++ b/kimchi/src/circuits/lookup/lookups.rs @@ -204,7 +204,7 @@ impl LookupInfo { &self, domain: &EvaluationDomains, gates: &[CircuitGate], - ) -> (LookupSelectors>, HashSet>) { + ) -> (LookupSelectors>, Vec>) { let n = domain.d1.size(); let mut selector_values = LookupSelectors::default(); @@ -246,7 +246,7 @@ impl LookupInfo { .interpolate() .evaluate_over_domain(domain.d8) }); - let res_tables: HashSet<_> = gate_tables.into_iter().map(get_table).collect(); + let res_tables: Vec<_> = gate_tables.into_iter().map(get_table).collect(); (selector_values8, res_tables) } diff --git a/kimchi/src/circuits/lookup/tables/mod.rs b/kimchi/src/circuits/lookup/tables/mod.rs index 3672d47ec2..929d77ade5 100644 --- a/kimchi/src/circuits/lookup/tables/mod.rs +++ b/kimchi/src/circuits/lookup/tables/mod.rs @@ -7,7 +7,7 @@ pub mod range_check; pub mod xor; /// A table of values that can be used for a lookup, along with the ID for the table. 
-#[derive(Debug, Clone, PartialEq, Eq, Hash)] +#[derive(Debug, Clone)] pub struct LookupTable { id: i32, data: Vec>, From 2bcd3db1f190bd8026af93f9ef2a5f550cc30ef2 Mon Sep 17 00:00:00 2001 From: Mikhail Volkhov Date: Thu, 2 Nov 2023 11:18:04 +0000 Subject: [PATCH 23/32] Consistency pass on book chapters / styling --- book/src/SUMMARY.md | 6 +-- book/src/kimchi/keccak.md | 60 ++++++++++++++-------------- book/src/kimchi/permut.md | 5 +-- book/src/kimchi/zkpm.md | 64 +----------------------------- book/src/pickles/passthrough.md | 1 - book/src/plonk/zkpm.md | 70 +++++++++++++++++++++++++++++++++ 6 files changed, 105 insertions(+), 101 deletions(-) delete mode 100644 book/src/pickles/passthrough.md create mode 100644 book/src/plonk/zkpm.md diff --git a/book/src/SUMMARY.md b/book/src/SUMMARY.md index 35b2d36267..106368db6b 100644 --- a/book/src/SUMMARY.md +++ b/book/src/SUMMARY.md @@ -49,21 +49,20 @@ - [Non-interaction with Fiat-Shamir](./plonk/fiat_shamir.md) - [Plookup](./plonk/plookup.md) - [Maller's Optimization](./plonk/maller.md) +- [Zero-Column Approach to Zero-Knowledge](./plonk/zkpm.md) # Kimchi - [Overview](./kimchi/overview.md) - [Arguments](./kimchi/arguments.md) -- [Zero-Column Approach to Zero-Knowledge](./kimchi/zkpm.md) - [Final Check](./kimchi/final_check.md) - [Maller's Optimization for Kimchi](./kimchi/maller_15.md) -- [Permutation](./kimchi/permut.md) - [Lookup Tables](./kimchi/lookup.md) - [Extended Lookup Tables](./kimchi/extended-lookup-tables.md) - [Custom Gates](./kimchi/gates.md) - [Foreign Field Addition](./kimchi/foreign_field_add.md) - [Foreign Field Multiplication](./kimchi/foreign_field_mul.md) - - [Keccak](./rfcs/keccak.md) + - [Keccak](./kimchi/keccak.md) # Pickles & Inductive Proof Systems @@ -71,7 +70,6 @@ - [Overview](./fundamentals/zkbook_ips.md) - [Accumulation](./pickles/accumulation.md) - [Deferred Computation](./pickles/deferred.md) -- [Passthough & Me-Only](./pickles/passthrough.md) # Technical Specifications diff --git 
a/book/src/kimchi/keccak.md b/book/src/kimchi/keccak.md index 457c247b97..9c00ad6d7c 100644 --- a/book/src/kimchi/keccak.md +++ b/book/src/kimchi/keccak.md @@ -1,4 +1,4 @@ -# RFC: Keccak +# Keccak Gate The Keccak gadget is comprised of 3 circuit gates (`Xor16`, `Rot64`, and `Zero`) @@ -45,9 +45,9 @@ Kimchi framework that dictated those approaches. ## Rot64 -It is clear from the definition of the rotation gate that its constraints are complete +It is clear from the definition of the rotation gate that its constraints are complete (meaning that honest instances always satisfy the constraints). It is left to be proven -that the proposal is sound. In this section, we will give a proof that as soon as we +that the proposal is sound. In this section, we will give a proof that as soon as we perform the range checks on the excess and shifted parts of the input, only one possible assignment satisfies the constraints. This means that there is no dishonest instance that can make the constraints pass. We will also give an example where one could find wrong @@ -55,10 +55,10 @@ rotation witnesses that would satisfy the constraints if we did not check the ra ### Necessity of range checks -First of all, we will illustrate the necessity of range-checks with a simple example. -For the sake of readability, we will use some toy field lengths. In particular, let us -assume that our words have 4 bits, meaning all of the elements between `0x0` and `0xF`. -Next, we will be using the native field $\mathbb{F}_{32}$. +First of all, we will illustrate the necessity of range-checks with a simple example. +For the sake of readability, we will use some toy field lengths. In particular, let us +assume that our words have 4 bits, meaning all of the elements between `0x0` and `0xF`. +Next, we will be using the native field $\mathbb{F}_{32}$. 
As we will later see, this choice of field lengths is not enough to perform any 4-bit rotation, since the operations in the constraints would overflow the native field. @@ -85,52 +85,50 @@ $$ $$ We can easily check that the proposed values of the shifted `0b1010=10` and the excess -`0b1=1` values satisfy the above constraint because $26 = 1 \cdot 16 + 10$ and $11 = 1 + 10$. +`0b1=1` values satisfy the above constraint because $26 = 1 \cdot 16 + 10$ and $11 = 1 + 10$. Now, the question is: _can we find another value for excess and shifted, such that their addition results in an incorrect rotated word?_ The answer to this question is yes, due to __diophantine equations__. We basically want to find $x,y$ such that $26 = x \cdot 16 + y (\text{ mod } 32)$. The solution to this equation is: $$ \begin{align*} -\forall k \in [0..31]: & \\ -x &= k \\ +\forall k \in [0 \ldots 31]: x &= k \ \land \\ y &= 26 - 16 \cdot k \end{align*} $$ We chose these word and field lengths to better understand the behaviour of the solution. Here, we can see two "classes" of evaluations. -- If we choose an even $k$, then $y$ will have the following shape: +- If we choose an even $k$, then $y$ will have the following shape: - $$26 - 16 \cdot (2 \cdot n) \iff 26 - 32n \equiv_{32} 26 $$ - Meaning, if $x = 2n$ then $y = 26$. - If on the other hand, we chose an odd $k$, then $y$ will have the following shape instead: - $$26 - 16 \cdot (2 \cdot n + 1) \iff 26 - 32n - 16 \equiv_{32} 26 - 16 = 10$$ - - Meaning, if $x = 2n+1$ then $y = 10$. + - Meaning, if $x = 2n+1$ then $y = 10$. Thus, possible solutions to the diophantine equation are: $$ \begin{align*} -x &= 0, 1, 2, 3, 4, 5... \\ -y &= 26, 10, 26, 10, 26, 10... +x &= 0, 1, 2, 3, 4, 5 \ldots \\ +y &= 26, 10, 26, 10, 26, 10 \ldots \end{align*} $$ -Note that our valid witness is part of that set of solutions, meaning $x=1$ and $y=10$. Of course, we can also find another dishonest instantiation such as $x=0$ and $y=26$. 
Perhaps one could think that we do not need to worry about this case, because the resulting rotation word would be $0+26=26$, and if we later use that result as an input to a subsequent gate such as XOR, the value $26$ would not fit and at some point the constraint system would complain. Nonetheless, we still have other solutions to worry about, such as $(x=3, y=10)$ or $(x=5, y=10)$, since they would result in a rotated word that would fit in the word length of 4 bits, yet would be incorrect (not equal to $11$). +Note that our valid witness is part of that set of solutions, meaning $x=1$ and $y=10$. Of course, we can also find another dishonest instantiation such as $x=0$ and $y=26$. Perhaps one could think that we do not need to worry about this case, because the resulting rotation word would be $0+26=26$, and if we later use that result as an input to a subsequent gate such as XOR, the value $26$ would not fit and at some point the constraint system would complain. Nonetheless, we still have other solutions to worry about, such as $(x=3, y=10)$ or $(x=5, y=10)$, since they would result in a rotated word that would fit in the word length of 4 bits, yet would be incorrect (not equal to $11$). -All of the above incorrect solutions differ in one thing: they have different bit lengths. This means that we need to range check the values for the excess and shifted witnesses to make sure they have the correct length. +All of the above incorrect solutions differ in one thing: they have different bit lengths. This means that we need to range check the values for the excess and shifted witnesses to make sure they have the correct length. ### Sufficiency of range checks -In the following, we will give a proof that performing range checks for these values is not only necessary but also sufficient to prove that the rotation gate is sound. In other words, we will prove there are no two possible solutions of the decomposition constraint that have the correct bit lengths. 
Now, for the sake of robustness, we will consider 64-bit words and fields with at least twice the bit length of the words (as is our case). +In the following, we will give a proof that performing range checks for these values is not only necessary but also sufficient to prove that the rotation gate is sound. In other words, we will prove there are no two possible solutions of the decomposition constraint that have the correct bit lengths. Now, for the sake of robustness, we will consider 64-bit words and fields with at least twice the bit length of the words (as is our case). We will proceed by __contradiction__. Suppose there are two different solutions to the following diophantic equation: $$ \begin{align*} -\forall k \in \mathbb{F}_n: & \\ -x &= k \\ +\forall k \in \mathbb{F}_n: x &= k \ \land \\ y &= w \cdot 2^r - 2^{64} \cdot k \end{align*} $$ @@ -139,7 +137,7 @@ where $k$ is a parameter to instantiate the solutions, $w$ is the word to be rot Then, that means that there are two different solutions, $(0\leq x=a<2^r, 0\leq y=b<2^{64})$ and $(0\leq x=a'<2^r, 0\leq y=b'<2^{64})$ with at least $a \neq a'$ or $b \neq b'$. We will show that this is impossible. -If both are solutions to the same equation, then: +If both are solutions to the same equation, then: $$ \begin{align*} w \cdot 2^r &= a \cdot 2^{64} + b \\ @@ -149,18 +147,22 @@ $$ means that $a \cdot 2^{64} + b = a'\cdot 2^{64} + b'$. Moving terms to the left side, we have an equivalent equality: $2^{64}(a-a') + (b-b')=0 \mod{n}$. There are three cases to consider: - $a = a'$ and $b \neq b'$: then $(b - b') \equiv_n 0$ and this can only happen if $b' = b + kn$. But since $n > 2^{64}$, then $b'$ cannot be smaller than $2^{64}$ as it was assumed. CONTRADICTION. - + - $b = b'$ and $a \neq a'$: then $2^{64}(a - a') \equiv_n 0$ and this can only happen if $a' = a + kn$. But since $n > 2^r$, then $a'$ cannot be smaller than $2^r$ as it was assumed. CONTRADICTION. 
-- $a\neq a'$ and $b \neq b'$: then we have something like $2^{64} \alpha + \beta \equiv_n 0$. +- $a\neq a'$ and $b \neq b'$: then we have something like $2^{64} \alpha + \beta \equiv_n 0$. - This means $\beta \equiv_n -2^{64} \alpha = k \cdot n - 2^{64} \alpha$ for any $k$. - - According to the assumption, both $0\leq a<2^r$ and $0\leq a'<2^r$. This means, the difference $\alpha:=(a - a')$ lies anywhere in between the following interval: - - $$1 - 2^r \leq \alpha \leq 2^r - 1$$ + - According to the assumption, both $0\leq a<2^r$ and $0\leq a'<2^r$. This means, the difference $\alpha:=(a - a')$ lies anywhere in between the following interval: + $$1 - 2^r \leq \alpha \leq 2^r - 1$$ - We plug in this interval to the above equation to obtain the following interval for $\beta$: - - $$k\cdot n - 2^{64}(1-2^r)\leq \beta \leq k\cdot n - 2^{64}(2^r - 1) $$ + $$k\cdot n - 2^{64}(1-2^r)\leq \beta \leq k\cdot n - 2^{64}(2^r - 1) $$ - We look at this interval from both sides of the inequality: $\beta \geq kn - 2^{64} + 2^{64+r}$ and $\beta \leq kn + 2^{64} - 2^{64+r}$ and we wonder if $kn - 2^{64} + 2^{64+r} \leq kn + 2^{64} - 2^{64+r}$ is at all possible. We rewrite as follows: - - $$2^{64+r} - 2^{64} \leq 2^{64} - 2^{64+r}$$ - - $$2\cdot2^{64+r} \leq 2\cdot2^{64} $$ - - $$2^{64+r} \leq 2^{64} $$ - - But this can only happen if $r\leq 0$, which is impossible since we assume $0 < r < 64$.CONTRADICTION. + $$ + \begin{align*} + 2^{64+r} - 2^{64} &\leq 2^{64} - 2^{64+r}\\ + 2\cdot2^{64+r} &\leq 2\cdot2^{64} \\ + 2^{64+r} &\leq 2^{64} + \end{align*} + $$ + - But this can only happen if $r\leq 0$, which is impossible since we assume $0 < r < 64$. CONTRADICTION. - EOP. 
diff --git a/book/src/kimchi/permut.md b/book/src/kimchi/permut.md index 3d62293eae..cc82360ef6 100644 --- a/book/src/kimchi/permut.md +++ b/book/src/kimchi/permut.md @@ -1,4 +1 @@ -## Permutation - -TO-DO - +# Permutation diff --git a/book/src/kimchi/zkpm.md b/book/src/kimchi/zkpm.md index a4a1ba291c..947a334538 100644 --- a/book/src/kimchi/zkpm.md +++ b/book/src/kimchi/zkpm.md @@ -1,63 +1 @@ -# A More Efficient Approach to Zero Knowledge for PLONK - -In PLONK (considered as an interactive oracle proof), the prover sends the verifier several polynomials. They are evaluated at some $k$ points during the course of the protocol. Of course, if we want zero-knowledge, we would require that those evaluations do not reveal anything about the proof's underlying witness. - -PLONK as described here achieves zero knowledge by multiplying the polynomials with a small degree polynomial of random coefficients. When PLONK is instantiated with a discrete-log base Bootle et al type polynomial commitment scheme, the polynomial degrees must be padded to the nearest power of two. As a result, since several of the polynomials in PLONK already have degree equal to a power of two before the zero-knowledge masking, the multiplication with a random polynomial pushes the degree to the next power of two, which hurts efficiency. In order to avoid it, we propose an alternative method of achieving zero knowledge. - -## Zero Knowledge for the Column Polynomials - -Let $w$ be the number of rows in a PLONK constraint system. For a typical real-world circuit, $w$ will not be equal to a power of two. - -Let the witness elements from one column be $s_1, s_2, \ldots, s_w$. Let $n$ be the closest power of two to $w$ such that $n \geq w$. Let $\mathbb{F}$ be the field that witness elements belong to. - -Now, in vanilla PLONK, we pad the $s_i$ with $n - w$ elements, interpolate the polynomial over a domain of size $n$, scale it by a low degree random polynomial, and commit to the resulting polynomial. 
We want to avoid increasing the degree with the scaling by a low degree polynomial, so consider the following procedure. - -**Procedure.** Sample $k$ elements uniformly from $\mathbb{F}$: $r_{w+1}, \ldots, r_{w+k}$. Append them to the tuple of witness elements and then pad the remaining $n - (w+k)$ places as zeroes. The resulting tuple is interpolated as the witness polynomial. This approach ensures zero knowledge for the witness polynomials as established by Lemma 1. - -**Lemma 1.** Let $H \subset \mathbb{F}$ be a domain of size $n$. Let $s_1, s_2, \ldots, s_w\in \mathbb{F}$. Let $r_{w+1}, \ldots, r_{w+k}$ be $k$ uniformly and independently random elements in $\mathbb{F}.$ Let $\mathbf{v}$ be the $n$-tuple $\mathbf{v} = (s_1, s_2, \ldots, s_w, r_{w+1}, \ldots, r_{w+k}, 0,\ldots_{\text{n - (w+k) times}})$. -Let $f(X)$ be an interpolation polynomial of degree $n-1$ such that $f(h_i) = v_i$, where $h_i \in H$. Let $c_1, \ldots, c_k$ be any elements in $\mathbb{F}$ such that $c_i \neq v_j$ for every $i,j$. Then, $(f(c_1), \ldots, f(c_k))$ is distributed uniformly at random in $\mathbb{F}^k$. - -**Proof sketch.** Recall that the interpolation polynomial is - -$f(X) = \sum_{j = 1}^n \prod_{k \neq j} \frac{(X-h_k)}{(h_j-h_k)} v_j$ - -With $V_{w+1}, \ldots, V_{w+k}$ as random variables, we have, -$f(X) = a_{w+1} V_{w+1} + a_{w+2} V_{w+2} + \ldots + a_{w+k} V_{w+k} + a$ -for some constant field elements $a, a_{w+1}, \ldots, a_{w+k}$. Therefore, assigning random values to $V_{w+1}, \ldots, V_{w+k}$ will give $k$ degrees of freedom that will let $(f(c_1), \ldots, f(c_k))$ to be distributed uniformly at random in $\mathbb{F}^k$. - -## Zero Knowledge for the Permutation Polynomial - -The other polynomial in PLONK for which we need zero-knowledge is the "permutation polynomial" $z$. -The idea here is to set the last $k$ evaluations to be uniformly random elements $t_1, \ldots, t_k$ in $\mathbb{F}$. 
Then, we'll modify the verification equation to not check for those values to satisfy the permutation property. - -**Modified permutation polynomial.** Specifically, set $z(X)$ as follows. - -$z(X) = L_1(X) + \sum_{i = 1}^{\blue{n-k-2}} \left(L_{i+1} \prod_{j=1}^i \mathsf{frac}_{i,j} \right) + \blue{t_1 L_{n-k}(X) + \ldots + t_k L_{n}(X) }$ - -From Lemma 1, the above $z(X)$ has the desired zero knowledge property when $k$ evaluations are revealed. However, we need to modify the other parts of the protocol so that the last $k$ elements are not subject to the permutation evaluation, since they will no longer satisfy the permutation check. Specifically, we will need to modify the permutation polynomial to disregard those random elements, as follows. - -$ \begin{aligned} & t(X) = \\ - & (a(X)b(X)q_M(X) + a(X)q_L(X) + b(X)q_R(X) + c(X)q_O(X) + PI(X) + q_C(X)) \frac{1}{z_H(X)} \\ - &+ ((a(X) + \beta X + \gamma)(b(X) + \beta k_1 X + \gamma)(c(X) + \beta k_2X + \gamma)z(X) \blue{(X-h_{n-k}) \ldots (X-h_{n-1})(X-h_n)} ) \frac{\alpha}{z_{H}(X)} \\ - & - ((a(X) + \beta S_{\sigma1}(X) + \gamma)(b(X) + \beta S_{\sigma2}(X) + \gamma)(c(X) + \beta S_{\sigma3}(X) + \gamma)z(X\omega) \blue{(X-h_{n-k}) \ldots (X-h_{n-1})(X-h_n)}) \frac{\alpha}{z_{H}(X)} \\ - & + (z(X)-1)L_1(X) \frac{\alpha^2}{z_H(X)} \\ - & + \blue{(z(X)-1)L_{n-k}(X) \frac{\alpha^3}{z_H(X)} } \end{aligned} $ - -**Modified permutation checks.** To recall, the permutation check was originally as follows. For all $h \in H$, - -* $L_1(h)(Z(h) - 1) = 0$ -* $Z(h)[(a(h) + \beta h + \gamma)(b(h) + \beta k_1 h + \gamma)(c(h) + \beta k_2 h + \gamma)] \\ - = Z(\omega h)[(a(h) + \beta S_{\sigma1}(h) + \gamma)(b(h) + \beta S_{\sigma2}(h) + \gamma)(c(h) + \beta S_{\sigma3}(h) + \gamma)]$ - - - -The modified permuation checks that ensures that the check is performed only on all the values except the last $k$ elements in the witness polynomials are as follows. 
- -* For all $h \in H$, $L_1(h)(Z(h) - 1) = 0$ -* For all $h \in \blue{H\setminus \{h_{n-k}, \ldots, h_n\}}$, $\begin{aligned} & Z(h)[(a(h) + \beta h + \gamma)(b(h) + \beta k_1 h + \gamma)(c(h) + \beta k_2 h + \gamma)] \\ - &= Z(\omega h)[(a(h) + \beta S_{\sigma1}(h) + \gamma)(b(h) + \beta S_{\sigma2}(h) + \gamma)(c(h) + \beta S_{\sigma3}(h) + \gamma)] \end{aligned}$ - -* For all $h \in H$, $L_{n-k}(h)(Z(h) - 1) = 0$ - - -In the modified permutation polynomial above, the multiple $(X-h_{n-k}) \ldots (X-h_{n-1})(X-h_n)$ ensures that the permutation check is performed only on all the values except the last $k$ elements in the witness polynomials. +# Zero-Column Approach to Zero-Knowledge diff --git a/book/src/pickles/passthrough.md b/book/src/pickles/passthrough.md deleted file mode 100644 index cc182c4e51..0000000000 --- a/book/src/pickles/passthrough.md +++ /dev/null @@ -1 +0,0 @@ -# Passthrough and Me-Only diff --git a/book/src/plonk/zkpm.md b/book/src/plonk/zkpm.md new file mode 100644 index 0000000000..84f46f3ec0 --- /dev/null +++ b/book/src/plonk/zkpm.md @@ -0,0 +1,70 @@ +# A More Efficient Approach to Zero Knowledge for PLONK + +In PLONK (considered as an interactive oracle proof), the prover sends the verifier several polynomials. They are evaluated at some $k$ points during the course of the protocol. Of course, if we want zero-knowledge, we would require that those evaluations do not reveal anything about the proof's underlying witness. + +PLONK as described here achieves zero knowledge by multiplying the polynomials with a small degree polynomial of random coefficients. When PLONK is instantiated with a discrete-log base Bootle et al type polynomial commitment scheme, the polynomial degrees must be padded to the nearest power of two. 
As a result, since several of the polynomials in PLONK already have degree equal to a power of two before the zero-knowledge masking, the multiplication with a random polynomial pushes the degree to the next power of two, which hurts efficiency. In order to avoid it, we propose an alternative method of achieving zero knowledge. + +## Zero Knowledge for the Column Polynomials + +Let $w$ be the number of rows in a PLONK constraint system. For a typical real-world circuit, $w$ will not be equal to a power of two. + +Let the witness elements from one column be $s_1, s_2, \ldots, s_w$. Let $n$ be the closest power of two to $w$ such that $n \geq w$. Let $\mathbb{F}$ be the field that witness elements belong to. + +Now, in vanilla PLONK, we pad the $s_i$ with $n - w$ elements, interpolate the polynomial over a domain of size $n$, scale it by a low degree random polynomial, and commit to the resulting polynomial. We want to avoid increasing the degree with the scaling by a low degree polynomial, so consider the following procedure. + +**Procedure.** Sample $k$ elements uniformly from $\mathbb{F}$: $r_{w+1}, \ldots, r_{w+k}$. Append them to the tuple of witness elements and then pad the remaining $n - (w+k)$ places as zeroes. The resulting tuple is interpolated as the witness polynomial. This approach ensures zero knowledge for the witness polynomials as established by Lemma 1. + +**Lemma 1.** Let $H \subset \mathbb{F}$ be a domain of size $n$. Let $s_1, s_2, \ldots, s_w\in \mathbb{F}$. Let $r_{w+1}, \ldots, r_{w+k}$ be $k$ uniformly and independently random elements in $\mathbb{F}.$ Let $\mathbf{v}$ be the $n$-tuple $\mathbf{v} = (s_1, s_2, \ldots, s_w, r_{w+1}, \ldots, r_{w+k}, 0,\ldots_{\text{n - (w+k) times}})$. +Let $f(X)$ be an interpolation polynomial of degree $n-1$ such that $f(h_i) = v_i$, where $h_i \in H$. Let $c_1, \ldots, c_k$ be any elements in $\mathbb{F}$ such that $c_i \neq v_j$ for every $i,j$. 
Then, $(f(c_1), \ldots, f(c_k))$ is distributed uniformly at random in $\mathbb{F}^k$. + +**Proof sketch.** Recall that the interpolation polynomial is + +$$ +f(X) = \sum_{j = 1}^n \prod_{k \neq j} \frac{(X-h_k)}{(h_j-h_k)} v_j +$$ + +With $V_{w+1}, \ldots, V_{w+k}$ as random variables, we have, +$f(X) = a_{w+1} V_{w+1} + a_{w+2} V_{w+2} + \ldots + a_{w+k} V_{w+k} + a$ +for some constant field elements $a, a_{w+1}, \ldots, a_{w+k}$. Therefore, assigning random values to $V_{w+1}, \ldots, V_{w+k}$ will give $k$ degrees of freedom that will let $(f(c_1), \ldots, f(c_k))$ to be distributed uniformly at random in $\mathbb{F}^k$. + +## Zero Knowledge for the Permutation Polynomial + +The other polynomial in PLONK for which we need zero-knowledge is the "permutation polynomial" $z$. +The idea here is to set the last $k$ evaluations to be uniformly random elements $t_1, \ldots, t_k$ in $\mathbb{F}$. Then, we'll modify the verification equation to not check for those values to satisfy the permutation property. + +**Modified permutation polynomial.** Specifically, set $z(X)$ as follows. + +$$ +z(X) = L_1(X) + \sum_{i = 1}^{\blue{n-k-2}} \left(L_{i+1} \prod_{j=1}^i \mathsf{frac}_{i,j} \right) + \blue{t_1 L_{n-k}(X) + \ldots + t_k L_{n}(X) } +$$ + +From Lemma 1, the above $z(X)$ has the desired zero knowledge property when $k$ evaluations are revealed. However, we need to modify the other parts of the protocol so that the last $k$ elements are not subject to the permutation evaluation, since they will no longer satisfy the permutation check. Specifically, we will need to modify the permutation polynomial to disregard those random elements, as follows. 
+
+$$
+\begin{aligned} & t(X) = \\
+ & \Big(a(X)b(X)q_M(X) + a(X)q_L(X) + b(X)q_R(X) + c(X)q_O(X) + PI(X) + q_C(X)\Big) \frac{1}{z_H(X)} \\
+ &+ \Big((a(X) + \beta X + \gamma)(b(X) + \beta k_1 X + \gamma)(c(X) + \beta k_2X + \gamma)z(X)\\
+ &\qquad\qquad\qquad\times{\blue{(X-h_{n-k}) \ldots (X-h_{n-1})(X-h_n)}} \Big) \frac{\alpha}{z_{H}(X)} \\
+ & - \Big((a(X) + \beta S_{\sigma1}(X) + \gamma)(b(X) + \beta S_{\sigma2}(X) + \gamma)(c(X) + \beta S_{\sigma3}(X) + \gamma)z(X\omega)\\
+ &\qquad\qquad\qquad\times{\blue{(X-h_{n-k}) \ldots (X-h_{n-1})(X-h_n)}}\Big) \frac{\alpha}{z_{H}(X)} \\
+ & + \Big(z(X)-1\Big)\cdot L_1(X) \frac{\alpha^2}{z_H(X)} \\
+ & + \blue{\Big(z(X)-1\Big)\cdot L_{n-k}(X) \frac{\alpha^3}{z_H(X)} } \end{aligned}
+$$
+
+**Modified permutation checks.** To recall, the permutation check was originally as follows. For all $h \in H$,
+
+* $L_1(h)(Z(h) - 1) = 0$
+* $Z(h)[(a(h) + \beta h + \gamma)(b(h) + \beta k_1 h + \gamma)(c(h) + \beta k_2 h + \gamma)] \\
+ = Z(\omega h)[(a(h) + \beta S_{\sigma1}(h) + \gamma)(b(h) + \beta S_{\sigma2}(h) + \gamma)(c(h) + \beta S_{\sigma3}(h) + \gamma)]$
+
+
+The modified permutation checks that ensure that the check is performed only on all the values except the last $k$ elements in the witness polynomials are as follows.
+
+* For all $h \in H$, $L_1(h)(Z(h) - 1) = 0$
+* For all $h \in \blue{H\setminus \{h_{n-k}, \ldots, h_n\}}$, $\begin{aligned} & Z(h)[(a(h) + \beta h + \gamma)(b(h) + \beta k_1 h + \gamma)(c(h) + \beta k_2 h + \gamma)] \\
+ &= Z(\omega h)[(a(h) + \beta S_{\sigma1}(h) + \gamma)(b(h) + \beta S_{\sigma2}(h) + \gamma)(c(h) + \beta S_{\sigma3}(h) + \gamma)] \end{aligned}$
+
+* For all $h \in H$, $L_{n-k}(h)(Z(h) - 1) = 0$
+
+
+In the modified permutation polynomial above, the multiple $(X-h_{n-k}) \ldots (X-h_{n-1})(X-h_n)$ ensures that the permutation check is performed only on all the values except the last $k$ elements in the witness polynomials.
From 73ae00a5bfe56295c7eb862d08b3d6ba5fb8cfcd Mon Sep 17 00:00:00 2001 From: Mikhail Volkhov Date: Tue, 7 Nov 2023 21:06:43 +0000 Subject: [PATCH 24/32] Prettify sections more --- book/src/SUMMARY.md | 17 +++--- book/src/fundamentals/custom_constraints.md | 59 +-------------------- book/src/fundamentals/proof_systems.md | 24 ++++----- book/src/kimchi/custom_constraints.md | 58 ++++++++++++++++++++ book/src/plonk/fiat_shamir.md | 8 +-- book/src/plonk/glossary.md | 14 ++--- 6 files changed, 87 insertions(+), 93 deletions(-) create mode 100644 book/src/kimchi/custom_constraints.md diff --git a/book/src/SUMMARY.md b/book/src/SUMMARY.md index 106368db6b..f30839da67 100644 --- a/book/src/SUMMARY.md +++ b/book/src/SUMMARY.md @@ -12,7 +12,7 @@ - [Multiplying Polynomials](./fundamentals/zkbook_multiplying_polynomials.md) - [Fast Fourier Transform](./fundamentals/zkbook_fft.md) -# Cryptographic tools +# Cryptographic Tools - [Commitments](./fundamentals/zkbook_commitment.md) - [Polynomial Commitments](./plonk/polynomial_commitments.md) @@ -27,26 +27,20 @@ - [Half Gate](./fundamentals/zkbook_2pc/halfgate.md) - [Full Description](./fundamentals/zkbook_2pc/fulldesc.md) - [Fixed-Key-AES Hashes](./fundamentals/zkbook_2pc/fkaes.md) - - [Oblivious Transfer](./fundamentals/zkbook_2pc/ot.md) - [Base OT](./fundamentals/zkbook_2pc/baseot.md) - [OT Extension](./fundamentals/zkbook_2pc/ote.md) - - [Full Protocol](./fundamentals/zkbook_2pc/2pc.md) - -# Proof systems - -- [Overview](./fundamentals/proof_systems.md) -- [zk-SNARKs](./fundamentals/zkbook_plonk.md) -- [Custom constraints](./fundamentals/custom_constraints.md) +- [Proof Systems](./fundamentals/proof_systems.md) + - [zk-SNARKs](./fundamentals/zkbook_plonk.md) # Background on PLONK - [Overview](./plonk/overview.md) -- [Glossary](./plonk/glossary.md) + - [Glossary](./plonk/glossary.md) - [Domain](./plonk/domain.md) - [Lagrange Basis in Multiplicative Subgroups](./plonk/lagrange.md) -- [Non-interaction with 
Fiat-Shamir](./plonk/fiat_shamir.md) +- [Non-Interactivity via Fiat-Shamir](./plonk/fiat_shamir.md) - [Plookup](./plonk/plookup.md) - [Maller's Optimization](./plonk/maller.md) - [Zero-Column Approach to Zero-Knowledge](./plonk/zkpm.md) @@ -59,6 +53,7 @@ - [Maller's Optimization for Kimchi](./kimchi/maller_15.md) - [Lookup Tables](./kimchi/lookup.md) - [Extended Lookup Tables](./kimchi/extended-lookup-tables.md) +- [Custom Constraints](./kimchi/custom_constraints.md) - [Custom Gates](./kimchi/gates.md) - [Foreign Field Addition](./kimchi/foreign_field_add.md) - [Foreign Field Multiplication](./kimchi/foreign_field_mul.md) diff --git a/book/src/fundamentals/custom_constraints.md b/book/src/fundamentals/custom_constraints.md index e2c7256d68..8773465d1c 100644 --- a/book/src/fundamentals/custom_constraints.md +++ b/book/src/fundamentals/custom_constraints.md @@ -1,58 +1 @@ -This section explains how to design and add a custom constraint to our `proof-systems` library. - -PLONK is an AIOP. That is, it is a protocol in which the prover sends polynomials as messages and the verifier sends random challenges, and then evaluates the prover's polynomials and performs some final checks on the outputs. - -PLONK is very flexible. It can be customized with constraints specific to computations of interest. For example, in Mina, we use a PLONK configuration called kimchi that has custom constraints for poseidon hashing, doing elliptic curve operations, and more. - -A "PLONK configuration" specifies -- The set of types of constraints that you would like to be able to enforce. We will describe below how these types of constraints are specified. -- A number of "eq-able" columns `W` -- A number of "advice" columns `A` - -Under such configuration, a circuit is specified by -- A number of rows `n` -- A vector `cs` of constraint-types of length `n`. I.e., a vector that specifies, for each row, which types of constraints should be enforced on that row. 
-- A vector `eqs : Vec<(Position, Position)>` of equalities to enforce, where `struct Position { row: usize, column: usize }`. E.g., if the pair `(Position { row: 0, col: 8 }, Position { row: 10, col: 2 })` is in `eqs`, then the circuit is saying the entries in those two positions should be equal, or in other words that they refer to the same value. This is where the distinction between "eq-able" and "advice" columns comes in. The `column` field of a position in the `eqs` array can only refer to one of the first `W` columns. Equalities cannot be enforced on entries in the `A` columns after that. - -Then, given such a circuit, PLONK lets you produce proofs for the statement - -> I know `W + A` "column vectors" of field elements `vs: [Vec; W + A]` such that for each row index `i < n`, the constraint of type `cs[i]` holds on the values `[vs[0][i], ..., vs[W+A - 1][i], vs[0][i+1], ..., vs[W+A - 1][i+1]` and all the equalities in `eqs` hold. I.e., for `(p1, p2)` in `eqs` we have `vs[p1.col][p1.row] == vs[p2.col][p2.row]`. So, a constraint can check the values in two adjacent rows. - -## Specifying a constraint - -Mathematically speaking, a constraint is a multivariate polynomial over the variables $c_{\mathsf{Curr},i}, \dots, v_{\mathsf{Curr}, W+A-1}, v_{\mathsf{Next}, 0}, \dots, v_{\mathsf{Next}, W+A-1}$. In other words, there is one variable corresponding to the value of each column in the "current row" and one variable correspond to the value of each column in the "next row". - -In Rust, $v_{r, i}$ is written `E::cell(Column::Witness(i), r)`. So, for example, the variable $v_{\mathsf{Next}, 3}$ is written -`E::cell(Column::Witness(3), CurrOrNext::Next)`. - - - - let w = |i| v(Column::Witness(i)); -Let's - -## Defining a PLONK configuration - -The art in proof systems comes from knowing how to design a PLONK configuration to ensure maximal efficiency for the sorts of computations you are trying to prove. 
That is, how to choose the numbers of columns `W` and `A`, and how to define the set of constraint types. - -Let's describe the trade-offs involved here. - -The majority of the proving time for the PLONK prover is in -- committing to the `W + A` column polynomials, which have length equal to the number of rows `n` -- committing to the "permutation accumulator polynomial, which has length `n`. -- committing to the quotient polynomial, which reduces to computing `max(k, W)` MSMs of size `n`, where `k` is the max degree of a constraint. -- performing the commitment opening proof, which is mostly dependent on the number of rows `n`. - -So all in all, the proving time is approximately equal to the time to perform `W + A + 1 + max(k - 1, W)` MSMs of size `n`, plus the cost of an opening proof for polynomials of degree `n - 1`. - -and maybe -- computing the combined constraint polynomial, which has degree `k * n` where `k` is the maximum degree of a constraint - -- Increasing `W` and `A` increase proof size, and they potentially impact the prover-time as the prover must compute polynomial commitments to each column, and computing a polynomial commitment corresponds to doing one MSM (multi-scalar multiplication, also called a multi-exponentiation.) - - However, often increasing the number of columns allows you to decrease the number of rows required for a given computation. For example, if you can perform one Poseidon hash in 36 rows with 5 total columns, then you can also perform it in 12 (= 36 / 3) rows with 15 (= 5 * 3) total columns. - - **Decreasing the number of rows (even while keeping the total number of table entries the same) is desirable because it reduces the cost of the polynomial commitment opening proof, which is dominated by a factor linear in the number of rows, and barely depends on the number of columns.** - - Increasing the number of columns also increases verifier time, as the verifier must perform one scalar-multiplication and one hash per column. 
Proof length is also affected by a larger number of columns, as more polynomials need to be committed and sent along to the verifier. - -There is typically some interplay between these +# Custom constraints diff --git a/book/src/fundamentals/proof_systems.md b/book/src/fundamentals/proof_systems.md index 84b5f8fe97..d281048974 100644 --- a/book/src/fundamentals/proof_systems.md +++ b/book/src/fundamentals/proof_systems.md @@ -1,31 +1,29 @@ -# Overview +# Proof Systems Design Overview Many modern proof systems (and I think all that are in use) are constructed according to the following recipe. 1. You start out with a class of computations. 2. You devise a way to *arithmetize* those computations. That is, to express your computation as a statement about polynomials. - + More specifically, you describe what is often called an "algebraic interactive oracle proof" (AIOP) that encodes your computation. An AIOP is a protocol describing an interaction between a prover and a verifier, in which the prover sends the verifier some "polynomial oracles" (basically a black box function that given a point evaluates a polynomial at that point), the verifier sends the prover random challenges, and at the end, the verifier queries the prover's polynomials at points of its choosing and makes a decision as to whether it has been satisfied by the proof. 3. An AIOP is an imagined interaction between parties. It is an abstract description of the protocol that will be "compiled" into a SNARK. There are several "non-realistic" aspects about it. One is that the prover sends the verifier black-box polynomials that the verifier can evaluate. These polynomials have degree comparable to the size of the computation being verified. 
If we implemented these "polynomial oracles" by having the prover really send the $O(n)$ size polynomials (say by sending all their coefficients), then we would not have a zk-SNARK at all, since the verifier would have to read this linearly sized polynomial so we would lose succinctness, and the polynomials would not be black-box functions, so we may lose zero-knowledge. - + Instead, when we concretely instantiate the AIOP, we have the prover send constant-sized, hiding *polynomial commitments*. Then, in the phase of the AIOP where the verifier queries the polynomials, the prover sends an *opening proof* for the polynomial commitments which the verifier can check, thus simulating the activity of evaluating the prover's polynomials on your own. - + So this is the next step of making a SNARK: instantiating the AIOP with a polynomial commitment scheme of one's choosing. There are several choices here and these affect the properties of the SNARK you are constructing, as the SNARK will inherit efficiency and setup properties of the polynomial commitment scheme used. -4. An AIOP describes an interactive protocol between the verifier and the prover. In reality, typically, we also want our proofs to be non-interactive. - +4. An AIOP describes an interactive protocol between the verifier and the prover. In reality, typically, we also want our proofs to be non-interactive. + This is accomplished by what is called the [Fiat--Shamir transformation](). The basic idea is this: all that the verifier is doing is sampling random values to send to the prover. Instead, to generate a "random" value, the prover simulates the verifier by hashing its messages. The resulting hash is used as the "random" challenge. - + At this point we have a fully non-interactive proof. Let's review our steps. - + 1. Start with a computation. - + 2. Translate the computation into a statement about polynomials and design a corresponding AIOP. - - 3. 
Compile the AIOP into an interactive protocol by having the prover send hiding polynomial commitments instead of polynomial oracles. - - 4. Get rid of the verifier-interaction by replacing it with a hash function. I.e., apply the Fiat--Shamir transform. + 3. Compile the AIOP into an interactive protocol by having the prover send hiding polynomial commitments instead of polynomial oracles. + 4. Get rid of the verifier-interaction by replacing it with a hash function. I.e., apply the Fiat--Shamir transform. diff --git a/book/src/kimchi/custom_constraints.md b/book/src/kimchi/custom_constraints.md new file mode 100644 index 0000000000..e2c7256d68 --- /dev/null +++ b/book/src/kimchi/custom_constraints.md @@ -0,0 +1,58 @@ +This section explains how to design and add a custom constraint to our `proof-systems` library. + +PLONK is an AIOP. That is, it is a protocol in which the prover sends polynomials as messages and the verifier sends random challenges, and then evaluates the prover's polynomials and performs some final checks on the outputs. + +PLONK is very flexible. It can be customized with constraints specific to computations of interest. For example, in Mina, we use a PLONK configuration called kimchi that has custom constraints for poseidon hashing, doing elliptic curve operations, and more. + +A "PLONK configuration" specifies +- The set of types of constraints that you would like to be able to enforce. We will describe below how these types of constraints are specified. +- A number of "eq-able" columns `W` +- A number of "advice" columns `A` + +Under such configuration, a circuit is specified by +- A number of rows `n` +- A vector `cs` of constraint-types of length `n`. I.e., a vector that specifies, for each row, which types of constraints should be enforced on that row. +- A vector `eqs : Vec<(Position, Position)>` of equalities to enforce, where `struct Position { row: usize, column: usize }`. 
E.g., if the pair `(Position { row: 0, col: 8 }, Position { row: 10, col: 2 })` is in `eqs`, then the circuit is saying the entries in those two positions should be equal, or in other words that they refer to the same value. This is where the distinction between "eq-able" and "advice" columns comes in. The `column` field of a position in the `eqs` array can only refer to one of the first `W` columns. Equalities cannot be enforced on entries in the `A` columns after that. + +Then, given such a circuit, PLONK lets you produce proofs for the statement + +> I know `W + A` "column vectors" of field elements `vs: [Vec; W + A]` such that for each row index `i < n`, the constraint of type `cs[i]` holds on the values `[vs[0][i], ..., vs[W+A - 1][i], vs[0][i+1], ..., vs[W+A - 1][i+1]` and all the equalities in `eqs` hold. I.e., for `(p1, p2)` in `eqs` we have `vs[p1.col][p1.row] == vs[p2.col][p2.row]`. So, a constraint can check the values in two adjacent rows. + +## Specifying a constraint + +Mathematically speaking, a constraint is a multivariate polynomial over the variables $c_{\mathsf{Curr},i}, \dots, v_{\mathsf{Curr}, W+A-1}, v_{\mathsf{Next}, 0}, \dots, v_{\mathsf{Next}, W+A-1}$. In other words, there is one variable corresponding to the value of each column in the "current row" and one variable correspond to the value of each column in the "next row". + +In Rust, $v_{r, i}$ is written `E::cell(Column::Witness(i), r)`. So, for example, the variable $v_{\mathsf{Next}, 3}$ is written +`E::cell(Column::Witness(3), CurrOrNext::Next)`. + + + + let w = |i| v(Column::Witness(i)); +Let's + +## Defining a PLONK configuration + +The art in proof systems comes from knowing how to design a PLONK configuration to ensure maximal efficiency for the sorts of computations you are trying to prove. That is, how to choose the numbers of columns `W` and `A`, and how to define the set of constraint types. + +Let's describe the trade-offs involved here. 
+ +The majority of the proving time for the PLONK prover is in +- committing to the `W + A` column polynomials, which have length equal to the number of rows `n` +- committing to the "permutation accumulator polynomial, which has length `n`. +- committing to the quotient polynomial, which reduces to computing `max(k, W)` MSMs of size `n`, where `k` is the max degree of a constraint. +- performing the commitment opening proof, which is mostly dependent on the number of rows `n`. + +So all in all, the proving time is approximately equal to the time to perform `W + A + 1 + max(k - 1, W)` MSMs of size `n`, plus the cost of an opening proof for polynomials of degree `n - 1`. + +and maybe +- computing the combined constraint polynomial, which has degree `k * n` where `k` is the maximum degree of a constraint + +- Increasing `W` and `A` increase proof size, and they potentially impact the prover-time as the prover must compute polynomial commitments to each column, and computing a polynomial commitment corresponds to doing one MSM (multi-scalar multiplication, also called a multi-exponentiation.) + + However, often increasing the number of columns allows you to decrease the number of rows required for a given computation. For example, if you can perform one Poseidon hash in 36 rows with 5 total columns, then you can also perform it in 12 (= 36 / 3) rows with 15 (= 5 * 3) total columns. + + **Decreasing the number of rows (even while keeping the total number of table entries the same) is desirable because it reduces the cost of the polynomial commitment opening proof, which is dominated by a factor linear in the number of rows, and barely depends on the number of columns.** + + Increasing the number of columns also increases verifier time, as the verifier must perform one scalar-multiplication and one hash per column. Proof length is also affected by a larger number of columns, as more polynomials need to be committed and sent along to the verifier. 
+ +There is typically some interplay between these diff --git a/book/src/plonk/fiat_shamir.md b/book/src/plonk/fiat_shamir.md index fd486f6aba..f1e2b264ef 100644 --- a/book/src/plonk/fiat_shamir.md +++ b/book/src/plonk/fiat_shamir.md @@ -1,4 +1,4 @@ -# non-interaction with fiat-shamir +# Non-Interactivity via Fiat-Shamir So far we've talked about an interactive protocol between a prover and a verifier. The zero-knowledge proof was also in the honest verifier zero-knowedlge (HVZK) model, which is problematic. @@ -15,7 +15,7 @@ This is important as our technique to transform an interactive protocol to a non The whole idea is to replace the verifier by a random oracle, which in practice is a hash function. Note that by doing this, we remove potential leaks that can happen when the verifier acts dishonestly. -Initially the Fiat-Shamir transformation was only applied to sigma protocols, named after the greek letter $\Sigma$ due to its shape resembling the direction of messages (prover sends a commit to a verifier, verifier sends a challenge to a prover, prover sends the final proof to a verifier). +Initially the Fiat-Shamir transformation was only applied to sigma protocols, named after the greek letter $\Sigma$ due to its shape resembling the direction of messages (prover sends a commit to a verifier, verifier sends a challenge to a prover, prover sends the final proof to a verifier). A $Z$ would have made more sense but here we are. ## Generalization of Fiat-Shamir @@ -27,6 +27,6 @@ This is simple: every verifier move can be replaced by a hash of the transcript While we use a hash function for that, a different construction called the [duplex construction](https://keccak.team/sponge_duplex.html) is particularly useful in such situations as they allow to continuously absorb the transcript and produce challenges, while automatically authenticating the fact that they produced a challenge. 
-[Merlin](https://merlin.cool/) is a standardization of such a construction using the [Strobe protocol framework](https://strobe.sourceforge.io/) (a framework to make use of a duplex construction). -Note that the more recent [Xoodyak](https://keccak.team/xoodyak.html) (part of NIST's lightweight competition) could have been used for this as well. +[Merlin](https://merlin.cool/) is a standardization of such a construction using the [Strobe protocol framework](https://strobe.sourceforge.io/) (a framework to make use of a duplex construction). +Note that the more recent [Xoodyak](https://keccak.team/xoodyak.html) (part of NIST's lightweight competition) could have been used for this as well. Note also that Mina uses none of these standards, instead it simply uses Poseidon (see section on poseidon). diff --git a/book/src/plonk/glossary.md b/book/src/plonk/glossary.md index 4880894fb4..6769ac5f83 100644 --- a/book/src/plonk/glossary.md +++ b/book/src/plonk/glossary.md @@ -1,9 +1,9 @@ # Glossary -* size = number of rows -* columns = number of variables per rows -* cell = a pair (row, column) -* witness = the values assigned in all the cells -* gate = polynomials that act on the variables in a row -* selector vector = a vector of values 1 or 0 (not true for constant vector I think) that toggles gates and variables in a row -* gadget = a series of contiguous rows with some specific gates set (via selector vectors) +* Size: number of rows +* Columns: number of variables per rows +* Cell: a pair (row, column) +* Witness: the values assigned in all the cells +* Gate: polynomials that act on the variables in a row +* Selector vector: a vector of values 1 or 0 (not true for constant vector I think) that toggles gates and variables in a row +* Gadget: a series of contiguous rows with some specific gates set (via selector vectors) From a285216b622c711166b538dee38050937c399cc1 Mon Sep 17 00:00:00 2001 From: Danny Willems Date: Tue, 14 Nov 2023 14:32:46 +0100 Subject: [PATCH 25/32] 
Add TODO link --- book/src/specs/kimchi.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/book/src/specs/kimchi.md b/book/src/specs/kimchi.md index 13a51330d9..9259ffa2d6 100644 --- a/book/src/specs/kimchi.md +++ b/book/src/specs/kimchi.md @@ -2202,7 +2202,7 @@ The prover then follows the following steps to create the proof: * $s_i$ * $w_i$ * $z$ - * lookup (TODO) + * lookup (TODO https://github.com/MinaProtocol/mina/issues/13886) * generic selector * poseidon selector From da65a25aa5f4205d456ae557059188a872486476 Mon Sep 17 00:00:00 2001 From: mrmr1993 Date: Thu, 16 Nov 2023 13:36:25 +0000 Subject: [PATCH 26/32] Deduplicate lookup tables --- kimchi/src/circuits/constraints.rs | 15 +++++++- kimchi/src/circuits/lookup/tables/mod.rs | 47 ++++++++++++++++++++++++ 2 files changed, 60 insertions(+), 2 deletions(-) diff --git a/kimchi/src/circuits/constraints.rs b/kimchi/src/circuits/constraints.rs index ceeacca60f..930060a293 100644 --- a/kimchi/src/circuits/constraints.rs +++ b/kimchi/src/circuits/constraints.rs @@ -5,7 +5,11 @@ use crate::{ domain_constant_evaluation::DomainConstantEvaluations, domains::EvaluationDomains, gate::{CircuitGate, GateType}, - lookup::{index::LookupConstraintSystem, lookups::LookupFeatures, tables::LookupTable}, + lookup::{ + index::LookupConstraintSystem, + lookups::LookupFeatures, + tables::{GateLookupTables, LookupTable}, + }, polynomial::{WitnessEvals, WitnessOverDomains, WitnessShifts}, polynomials::permutation::Shifts, wires::*, @@ -752,11 +756,18 @@ impl Builder { } // And we add the built-in tables, depending on the features. let LookupFeatures { patterns, .. 
} = &feature_flags.lookup_features; + let mut gate_lookup_tables = GateLookupTables { + xor: false, + range_check: false, + }; for pattern in patterns.into_iter() { if let Some(gate_table) = pattern.table() { - lookup_domain_size += gate_table.table_size(); + gate_lookup_tables[gate_table] = true } } + for gate_table in gate_lookup_tables.into_iter() { + lookup_domain_size += gate_table.table_size(); + } lookup_domain_size }; diff --git a/kimchi/src/circuits/lookup/tables/mod.rs b/kimchi/src/circuits/lookup/tables/mod.rs index d6be11f9bd..0c049f3e59 100644 --- a/kimchi/src/circuits/lookup/tables/mod.rs +++ b/kimchi/src/circuits/lookup/tables/mod.rs @@ -20,6 +20,53 @@ pub enum GateLookupTable { RangeCheck, } +/// Enumerates the different 'fixed' lookup tables used by individual gates +#[derive(Copy, Clone, Debug, PartialEq, Eq, Hash, Serialize, Deserialize)] +pub struct GateLookupTables { + pub xor: bool, + pub range_check: bool, +} + +impl std::ops::Index for GateLookupTables { + type Output = bool; + + fn index(&self, index: GateLookupTable) -> &Self::Output { + match index { + GateLookupTable::Xor => &self.xor, + GateLookupTable::RangeCheck => &self.range_check, + } + } +} + +impl std::ops::IndexMut for GateLookupTables { + fn index_mut(&mut self, index: GateLookupTable) -> &mut Self::Output { + match index { + GateLookupTable::Xor => &mut self.xor, + GateLookupTable::RangeCheck => &mut self.range_check, + } + } +} + +impl IntoIterator for GateLookupTables { + type Item = GateLookupTable; + type IntoIter = std::vec::IntoIter; + + fn into_iter(self) -> Self::IntoIter { + // Destructor pattern to make sure we add new lookup patterns. 
+ let GateLookupTables { xor, range_check } = self; + + let mut patterns = Vec::with_capacity(2); + + if xor { + patterns.push(GateLookupTable::Xor) + } + if range_check { + patterns.push(GateLookupTable::RangeCheck) + } + patterns.into_iter() + } +} + /// A table of values that can be used for a lookup, along with the ID for the table. #[derive(Debug, Clone)] pub struct LookupTable { From 8920a012f4d5eeb87123755e359792c502f25e63 Mon Sep 17 00:00:00 2001 From: Danny Willems Date: Mon, 27 Nov 2023 17:08:19 +0100 Subject: [PATCH 27/32] Bare URL's are not supported and must be wrapped. --- kimchi/src/prover.rs | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/kimchi/src/prover.rs b/kimchi/src/prover.rs index 7fac5dd2b8..0f92745d7f 100644 --- a/kimchi/src/prover.rs +++ b/kimchi/src/prover.rs @@ -936,7 +936,7 @@ where //~~ * $s_i$ //~~ * $w_i$ //~~ * $z$ - //~~ * lookup (TODO https://github.com/MinaProtocol/mina/issues/13886) + //~~ * lookup (TODO, see [this issue](https://github.com/MinaProtocol/mina/issues/13886)) //~~ * generic selector //~~ * poseidon selector //~ From 25156a2b6a64dc2e931440f885c30906b1270f17 Mon Sep 17 00:00:00 2001 From: Danny Willems Date: Mon, 27 Nov 2023 17:10:23 +0100 Subject: [PATCH 28/32] Update specifications Run make build --- book/src/specs/kimchi.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/book/src/specs/kimchi.md b/book/src/specs/kimchi.md index 9259ffa2d6..20399a02b3 100644 --- a/book/src/specs/kimchi.md +++ b/book/src/specs/kimchi.md @@ -2202,7 +2202,7 @@ The prover then follows the following steps to create the proof: * $s_i$ * $w_i$ * $z$ - * lookup (TODO https://github.com/MinaProtocol/mina/issues/13886) + * lookup (TODO, see [this issue](https://github.com/MinaProtocol/mina/issues/13886)) * generic selector * poseidon selector From 6c6adcaf62805143d590cd8bcb200b164bd5ffe1 Mon Sep 17 00:00:00 2001 From: Danny Willems Date: Wed, 29 Nov 2023 19:58:36 +0100 Subject: [PATCH 29/32] Fix resolver 
warnings https://doc.rust-lang.org/edition-guide/rust-2021/default-cargo-resolver.html --- Cargo.toml | 1 + 1 file changed, 1 insertion(+) diff --git a/Cargo.toml b/Cargo.toml index c50da37068..3d0d91c9cb 100644 --- a/Cargo.toml +++ b/Cargo.toml @@ -14,6 +14,7 @@ members = [ "utils", "internal-tracing", ] +resolver = "2" [profile.release] lto = true From 1c3063567e69951ce441d37ad852df6ef440c3c1 Mon Sep 17 00:00:00 2001 From: Danny Willems Date: Wed, 29 Nov 2023 23:56:57 +0100 Subject: [PATCH 30/32] Additional comment on the table_id_combiner --- kimchi/src/verifier.rs | 3 +++ 1 file changed, 3 insertions(+) diff --git a/kimchi/src/verifier.rs b/kimchi/src/verifier.rs index 0c9cd4aef3..dd2ac7b434 100644 --- a/kimchi/src/verifier.rs +++ b/kimchi/src/verifier.rs @@ -1038,6 +1038,9 @@ where let joint_combiner = oracles .joint_combiner .expect("joint_combiner should be present if lookups are used"); + // The table ID is added as the last column of the vector. + // Therefore, the exponent for the combiner for the table ID is the + // width of the concatenated table, i.e. max_joint_size. let table_id_combiner = joint_combiner .1 .pow([u64::from(li.lookup_info.max_joint_size)]); From 267105a0bec35076eb8e2fbf9ec5b1f6502cd14c Mon Sep 17 00:00:00 2001 From: mrmr1993 Date: Mon, 4 Dec 2023 20:08:48 +0000 Subject: [PATCH 31/32] Revert "Merge pull request #1263 from o1-labs/volhovm/mina14070-table-id-zero-row" This reverts commit 7f6eba0653fd47aa73725b1815c741c8f7c18015, reversing changes made to 88c17767f19ff9651afefc37c4436bb14e3536a5. 
--- book/src/specs/kimchi.md | 4 +- kimchi/src/circuits/constraints.rs | 15 +- kimchi/src/circuits/lookup/index.rs | 202 ++++-------------- kimchi/src/circuits/lookup/lookups.rs | 2 +- kimchi/src/circuits/lookup/runtime_tables.rs | 10 +- kimchi/src/circuits/lookup/tables/mod.rs | 196 ++++------------- .../src/circuits/lookup/tables/range_check.rs | 8 +- kimchi/src/circuits/lookup/tables/xor.rs | 6 +- kimchi/src/error.rs | 4 - kimchi/src/precomputed_srs.rs | 3 - kimchi/src/prover_index.rs | 1 - kimchi/src/tests/and.rs | 1 - kimchi/src/tests/foreign_field_add.rs | 1 + kimchi/src/tests/lookup.rs | 14 +- kimchi/src/tests/range_check.rs | 5 +- kimchi/src/tests/rot.rs | 1 + kimchi/src/tests/xor.rs | 1 + 17 files changed, 124 insertions(+), 350 deletions(-) diff --git a/book/src/specs/kimchi.md b/book/src/specs/kimchi.md index 7559baa739..20399a02b3 100644 --- a/book/src/specs/kimchi.md +++ b/book/src/specs/kimchi.md @@ -1641,8 +1641,8 @@ If lookup is used, the following values are added to the common index: To create the index, follow these steps: 1. If no lookup is used in the circuit, do not create a lookup index -2. Get the lookup selectors and lookup tables that are specified implicitly -3. Concatenate explicit runtime lookup tables with the ones (implicitly) used by gates. +2. Get the lookup selectors and lookup tables (TODO: how?) +3. Concatenate runtime lookup tables with the ones used by gates 4. Get the highest number of columns `max_table_width` that a lookup table can have. 5. Create the concatenated table of all the fixed lookup tables. 
diff --git a/kimchi/src/circuits/constraints.rs b/kimchi/src/circuits/constraints.rs index 31fdf5c4e0..930060a293 100644 --- a/kimchi/src/circuits/constraints.rs +++ b/kimchi/src/circuits/constraints.rs @@ -736,7 +736,18 @@ impl Builder { let lookup_domain_size = { // First we sum over the lookup table size - let mut lookup_domain_size: usize = lookup_tables.iter().map(|lt| lt.len()).sum(); + let mut lookup_domain_size: usize = lookup_tables + .iter() + .map( + |LookupTable { data, id: _ }| { + if data.is_empty() { + 0 + } else { + data[0].len() + } + }, + ) + .sum(); // After that on the runtime tables if let Some(runtime_tables) = runtime_tables.as_ref() { for runtime_table in runtime_tables.iter() { @@ -846,7 +857,7 @@ impl Builder { &domain, zk_rows as usize, ) - .map_err(SetupError::LookupCreation)?; + .map_err(|e| SetupError::ConstraintSystem(e.to_string()))?; let sid = shifts.map[0].clone(); diff --git a/kimchi/src/circuits/lookup/index.rs b/kimchi/src/circuits/lookup/index.rs index 41a9709737..ab3e4545ab 100644 --- a/kimchi/src/circuits/lookup/index.rs +++ b/kimchi/src/circuits/lookup/index.rs @@ -1,10 +1,10 @@ +use super::runtime_tables::{RuntimeTableCfg, RuntimeTableSpec}; use crate::circuits::{ domains::EvaluationDomains, gate::CircuitGate, lookup::{ constraints::LookupConfiguration, lookups::{LookupInfo, LookupPattern}, - runtime_tables::{RuntimeTableCfg, RuntimeTableSpec}, tables::LookupTable, }, }; @@ -21,15 +21,17 @@ use std::iter; use thiserror::Error; /// Represents an error found when computing the lookup constraint system -#[derive(Debug, Error, Clone)] +#[derive(Debug, Error)] pub enum LookupError { + #[error("One of the lookup tables has columns of different lengths")] + InconsistentTableLength, #[error("The combined lookup table is larger than allowed by the domain size. 
Observed: {length}, expected: {maximum_allowed}")] LookupTableTooLong { length: usize, maximum_allowed: usize, }, - #[error("Cannot create a combined table since ids for sub-tables are colliding. The collision type is: {collision_type}")] - LookupTableIdCollision { collision_type: String }, + #[error("The table with id 0 must have an entry of all zeros")] + TableIDZeroMustHaveZeroEntry, } /// Lookup selectors @@ -198,7 +200,7 @@ impl LookupConstraintSystem { /// Will give error if inputs validation do not match. pub fn create( gates: &[CircuitGate], - fixed_lookup_tables: Vec>, + lookup_tables: Vec>, runtime_tables: Option>>, domain: &EvaluationDomains, zk_rows: usize, @@ -215,64 +217,21 @@ impl LookupConstraintSystem { // product is 1, we cannot use those rows to store any values. let max_num_entries = d1_size - zk_rows - 1; - //~ 2. Get the lookup selectors and lookup tables that are specified implicitly - // by the lookup gates. + //~ 2. Get the lookup selectors and lookup tables (TODO: how?) let (lookup_selectors, gate_lookup_tables) = lookup_info.selector_polynomials_and_tables(domain, gates); - // Checks whether an iterator contains any duplicates, and if yes, raises - // a corresponding LookupTableIdCollision error. - fn check_id_duplicates<'a, I: Iterator>( - iter: I, - msg: &str, - ) -> Result<(), LookupError> { - use itertools::Itertools; - match iter.duplicates().collect::>() { - dups if !dups.is_empty() => Err(LookupError::LookupTableIdCollision { - collision_type: format!("{}: {:?}", msg, dups).to_string(), - }), - _ => Ok(()), - } - } - - // If there is a gate using a lookup table, this table must not be added - // explicitly to the constraint system. - let fixed_gate_joint_ids: Vec = fixed_lookup_tables - .iter() - .map(|lt| lt.id()) - .chain(gate_lookup_tables.iter().map(|lt| lt.id())) - .collect(); - check_id_duplicates( - fixed_gate_joint_ids.iter(), - "duplicates between fixed given and fixed from-gate tables", - )?; - - //~ 3. 
Concatenate explicit runtime lookup tables with the ones (implicitly) used by gates. - let mut lookup_tables: Vec> = fixed_lookup_tables + //~ 3. Concatenate runtime lookup tables with the ones used by gates + let mut lookup_tables: Vec<_> = gate_lookup_tables .into_iter() - .chain(gate_lookup_tables) + .chain(lookup_tables) .collect(); - let fixed_lookup_tables_ids: Vec = - lookup_tables.iter().map(|lt| lt.id()).collect(); - check_id_duplicates( - fixed_lookup_tables_ids.iter(), - "fixed lookup table duplicates", - )?; + let mut has_table_id_0 = false; // if we are using runtime tables let (runtime_table_offset, runtime_selector) = if let Some(runtime_tables) = &runtime_tables { - let runtime_tables_ids: Vec = - runtime_tables.iter().map(|rt| rt.id).collect(); - check_id_duplicates(runtime_tables_ids.iter(), "runtime table duplicates")?; - check_id_duplicates( - runtime_tables_ids - .iter() - .chain(fixed_lookup_tables_ids.iter()), - "duplicates between runtime and fixed tables", - )?; - // save the offset of the end of the table let mut runtime_table_offset = 0; for table in &lookup_tables { @@ -313,15 +272,18 @@ impl LookupConstraintSystem { let (id, first_column) = (runtime_table.id, runtime_table.first_column.clone()); + // record if table ID 0 is used in one of the runtime tables + // note: the check later will still force you to have a fixed table with ID 0 + if id == 0 { + has_table_id_0 = true; + } + // important: we still need a placeholder column to make sure that // if all other tables have a single column // we don't use the second table as table ID column. let placeholders = vec![F::zero(); first_column.len()]; let data = vec![first_column, placeholders]; - // TODO Check it does not fail actually. Maybe this should throw a different error. 
- let table = LookupTable::create(id, data) - .expect("Runtime table creation must succeed"); - + let table = LookupTable { id, data }; lookup_tables.push(table); } @@ -383,21 +345,31 @@ impl LookupConstraintSystem { let mut table_ids: Vec = Vec::with_capacity(d1_size); let mut non_zero_table_id = false; + let mut has_table_id_0_with_zero_entry = false; for table in &lookup_tables { let table_len = table.len(); - if table.id() != 0 { + if table.id == 0 { + has_table_id_0 = true; + if table.has_zero_entry() { + has_table_id_0_with_zero_entry = true; + } + } else { non_zero_table_id = true; } //~~ * Update the corresponding entries in a table id vector (of size the domain as well) //~ with the table ID of the table. - let table_id: F = i32_to_field(table.id()); + let table_id: F = i32_to_field(table.id); table_ids.extend(repeat_n(table_id, table_len)); //~~ * Copy the entries from the table to new rows in the corresponding columns of the concatenated table. - for (i, col) in table.data().iter().enumerate() { + for (i, col) in table.data.iter().enumerate() { + // See GH issue: https://github.com/MinaProtocol/mina/issues/14097 + if col.len() != table_len { + return Err(LookupError::InconsistentTableLength); + } lookup_table[i].extend(col); } @@ -407,6 +379,12 @@ impl LookupConstraintSystem { } } + // If a table has ID 0, then it must have a zero entry. + // This is for the dummy lookups to work. + if has_table_id_0 && !has_table_id_0_with_zero_entry { + return Err(LookupError::TableIDZeroMustHaveZeroEntry); + } + // Note: we use `>=` here to leave space for the dummy value. if lookup_table[0].len() >= max_num_entries { return Err(LookupError::LookupTableTooLong { @@ -433,8 +411,6 @@ impl LookupConstraintSystem { lookup_table8.push(eval); } - // @volhovm: Do we need to enforce that there is at least one table - // with id 0? //~ 9. pre-compute polynomial and evaluation form for the table IDs, //~ only if a table with an ID different from zero was used. 
let (table_ids, table_ids8) = if non_zero_table_id { @@ -467,105 +443,3 @@ impl LookupConstraintSystem { } } } - -#[cfg(test)] -mod tests { - - use super::{LookupError, LookupTable, RuntimeTableCfg}; - use crate::{ - circuits::constraints::ConstraintSystem, circuits::gate::CircuitGate, - circuits::lookup::tables::xor, circuits::polynomials::range_check, error::SetupError, - }; - use mina_curves::pasta::Fp; - - #[test] - fn colliding_table_ids() { - let (_, gates) = CircuitGate::::create_multi_range_check(0); - let collision_id: i32 = 5; - - let cs = ConstraintSystem::::create(gates.clone()) - .lookup(vec![range_check::gadget::lookup_table()]) - .build(); - - assert!( - matches!( - cs, - Err(SetupError::LookupCreation( - LookupError::LookupTableIdCollision { .. } - )) - ), - "LookupConstraintSystem::create(...) must fail due to range table passed twice" - ); - - let cs = ConstraintSystem::::create(gates.clone()) - .lookup(vec![xor::xor_table()]) - .build(); - - assert!( - cs.is_ok(), - "LookupConstraintSystem::create(...) must succeed, no duplicates exist" - ); - - let cs = ConstraintSystem::::create(gates.clone()) - .lookup(vec![ - LookupTable::create(collision_id, vec![vec![From::from(0); 16]]).unwrap(), - LookupTable::create(collision_id, vec![vec![From::from(1); 16]]).unwrap(), - ]) - .build(); - - assert!( - matches!( - cs, - Err(SetupError::LookupCreation( - LookupError::LookupTableIdCollision { .. } - )) - ), - "LookupConstraintSystem::create(...) must fail, collision in fixed ids" - ); - - let cs = ConstraintSystem::::create(gates.clone()) - .runtime(Some(vec![ - RuntimeTableCfg { - id: collision_id, - first_column: vec![From::from(0); 16], - }, - RuntimeTableCfg { - id: collision_id, - first_column: vec![From::from(1); 16], - }, - ])) - .build(); - - assert!( - matches!( - cs, - Err(SetupError::LookupCreation( - LookupError::LookupTableIdCollision { .. } - )) - ), - "LookupConstraintSystem::create(...) 
must fail, collision in runtime ids" - ); - - let cs = ConstraintSystem::::create(gates.clone()) - .lookup(vec![LookupTable::create( - collision_id, - vec![vec![From::from(0); 16]], - ) - .unwrap()]) - .runtime(Some(vec![RuntimeTableCfg { - id: collision_id, - first_column: vec![From::from(1); 16], - }])) - .build(); - - assert!( - matches!( - cs, - Err(SetupError::LookupCreation( - LookupError::LookupTableIdCollision { .. } - )) - ), - "LookupConstraintSystem::create(...) must fail, collision between runtime and lookup ids" - ); - } -} diff --git a/kimchi/src/circuits/lookup/lookups.rs b/kimchi/src/circuits/lookup/lookups.rs index 63266b3abf..002b040828 100644 --- a/kimchi/src/circuits/lookup/lookups.rs +++ b/kimchi/src/circuits/lookup/lookups.rs @@ -222,7 +222,7 @@ impl LookupInfo { }; // TODO: is take(n) useful here? I don't see why we need this - for (i, gate) in gates.iter().take(n).enumerate() { + for (i, gate) in gates.iter().enumerate().take(n) { let typ = gate.typ; if let Some(lookup_pattern) = LookupPattern::from_gate(typ, CurrOrNext::Curr) { diff --git a/kimchi/src/circuits/lookup/runtime_tables.rs b/kimchi/src/circuits/lookup/runtime_tables.rs index d05a0a5a72..98b018ed8a 100644 --- a/kimchi/src/circuits/lookup/runtime_tables.rs +++ b/kimchi/src/circuits/lookup/runtime_tables.rs @@ -18,8 +18,6 @@ pub struct RuntimeTableSpec { pub len: usize, } -/// A configuration of the runtime table as known at setup time. -/// /// Use this type at setup time, to list all the runtime tables. /// /// Note: care must be taken as table IDs can collide with IDs of other types of lookup tables. @@ -27,8 +25,7 @@ pub struct RuntimeTableSpec { pub struct RuntimeTableCfg { /// The table ID. pub id: i32, - /// The content of the first column of the runtime table, i.e. - /// keys when a table is viewed as a (k,v) array. + /// The content of the first column of the runtime table. 
pub first_column: Vec, } @@ -59,13 +56,12 @@ impl From> for RuntimeTableSpec { } /// A runtime table. Runtime tables must match the configuration -/// specified in [`RuntimeTableCfg`]. +/// that was specified in [`RuntimeTableCfg`]. #[derive(Debug, Clone)] pub struct RuntimeTable { /// The table id. pub id: i32, - /// A single column. Represents runtime table values, where - /// ['RuntimeTableCfg'] defines compile-time keys. + /// A single column. pub data: Vec, } diff --git a/kimchi/src/circuits/lookup/tables/mod.rs b/kimchi/src/circuits/lookup/tables/mod.rs index 7760086512..0c049f3e59 100644 --- a/kimchi/src/circuits/lookup/tables/mod.rs +++ b/kimchi/src/circuits/lookup/tables/mod.rs @@ -1,109 +1,10 @@ -use ark_ff::{Field, One, Zero}; +use ark_ff::{FftField, One, Zero}; use poly_commitment::PolyComm; use serde::{Deserialize, Serialize}; -use thiserror::Error; pub mod range_check; pub mod xor; -/// A table of values that can be used for a lookup, along with the ID for the table. -#[derive(Debug, Clone)] -pub struct LookupTable { - id: i32, - data: Vec>, -} - -/// Represents inconsistency errors during table construction and composition. -#[derive(Debug, Error)] -pub enum LookupTableError { - #[error("Table must be nonempty")] - InputTableDataEmpty, - #[error("One of the lookup tables has columns of different lengths")] - InconsistentTableLength, - #[error("The table with id 0 must have an entry of all zeros")] - TableIDZeroMustHaveZeroEntry, -} - -impl LookupTable -where - F: Field, -{ - pub fn create(id: i32, data: Vec>) -> Result { - let res = LookupTable { id, data }; - - // Empty tables are not allowed - if res.data.is_empty() { - return Err(LookupTableError::InputTableDataEmpty); - } - - // All columns in the table must have same length - let table_len = res.len(); - for col in res.data.iter() { - if col.len() != table_len { - return Err(LookupTableError::InconsistentTableLength); - } - } - - // If a table has ID 0, then it must have a zero entry. 
- // This is for the dummy lookups to work. - if id == 0 && !res.has_zero_entry() { - return Err(LookupTableError::TableIDZeroMustHaveZeroEntry); - } - - Ok(res) - } - - /// Return true if the table has an entry (row) containing all zeros. - fn has_zero_entry(&self) -> bool { - // reminder: a table is written as a list of columns, - // not as a list of row entries. - for row in 0..self.len() { - let mut row_zero = true; - for col in &self.data { - if !col[row].is_zero() { - row_zero = false; - break; - } - } - if row_zero { - return true; - } - } - - false - } - - /// Returns the number of columns, i.e. the width of the table. - /// It is less error prone to introduce this method than using the public - /// field data. - pub fn width(&self) -> usize { - self.data.len() - } - - /// Returns the length (height) of the table. - pub fn len(&self) -> usize { - if self.is_empty() { - panic!("LookupTable#len() is called on an empty table") - } - self.data[0].len() - } - - /// Returns `true` if the lookup table is empty, `false` otherwise. - pub fn is_empty(&self) -> bool { - self.data.is_empty() - } - - /// Returns table id. - pub fn id(&self) -> i32 { - self.id - } - - /// Returns table data. - pub fn data(&self) -> &Vec> { - &self.data - } -} - //~ spec:startcode /// The table ID associated with the XOR lookup table. pub const XOR_TABLE_ID: i32 = 0; @@ -166,8 +67,53 @@ impl IntoIterator for GateLookupTables { } } +/// A table of values that can be used for a lookup, along with the ID for the table. +#[derive(Debug, Clone)] +pub struct LookupTable { + pub id: i32, + pub data: Vec>, +} + +impl LookupTable +where + F: FftField, +{ + /// Return true if the table has an entry containing all zeros. + pub fn has_zero_entry(&self) -> bool { + // reminder: a table is written as a list of columns, + // not as a list of row entries. 
+ for row in 0..self.len() { + for col in &self.data { + if !col[row].is_zero() { + continue; + } + return true; + } + } + + false + } + + /// Returns the number of columns, i.e. the width of the table. + /// It is less error prone to introduce this method than using the public + /// field data. + pub fn width(&self) -> usize { + self.data.len() + } + + /// Returns the length of the table. + pub fn len(&self) -> usize { + self.data[0].len() + } + + /// Returns `true` if the lookup table is empty, `false` otherwise. + pub fn is_empty(&self) -> bool { + self.data.is_empty() + } +} + /// Returns the lookup table associated to a [`GateLookupTable`]. -pub fn get_table(table_name: GateLookupTable) -> LookupTable { +pub fn get_table(table_name: GateLookupTable) -> LookupTable { match table_name { GateLookupTable::Xor => xor::xor_table(), GateLookupTable::RangeCheck => range_check::range_check_table(), @@ -209,7 +155,6 @@ where F: Zero + One + Clone, I: DoubleEndedIterator, { - // TODO: unnecessary cloning if binops between F and &F are supported v.rev() .fold(F::zero(), |acc, x| joint_combiner.clone() * acc + x.clone()) + table_id_combiner.clone() * table_id.clone() @@ -310,50 +255,3 @@ pub mod caml { } } } - -#[cfg(test)] -mod tests { - - use super::*; - use mina_curves::pasta::Fp; - - #[test] - fn test_zero_table_zero_row() { - let lookup_r: u64 = 32; - // Table column that /does not/ contain zeros - let lookup_table_values_1: Vec<_> = (1..lookup_r + 1).map(From::from).collect(); - // Another table column that /does/ contain zeros. - let lookup_table_values_2: Vec<_> = (0..lookup_r).map(From::from).collect(); - - // Jointly two columns /do not/ have a full zero now. - let table: Result, _> = - LookupTable::create(0, vec![lookup_table_values_1, lookup_table_values_2]); - - assert!( - matches!(table, Err(LookupTableError::TableIDZeroMustHaveZeroEntry)), - "LookupTable::create(...) 
must fail when zero table has no zero rows" - ); - } - - #[test] - fn test_invalid_data_inputs() { - let table: Result, _> = LookupTable::create(0, vec![]); - assert!( - matches!(table, Err(LookupTableError::InputTableDataEmpty)), - "LookupTable::create(...) must fail when empty table creation is attempted" - ); - - let lookup_r: u64 = 32; - // Two columns of different lengths - let lookup_table_values_1: Vec<_> = (0..2 * lookup_r).map(From::from).collect(); - let lookup_table_values_2: Vec<_> = (0..lookup_r).map(From::from).collect(); - - let table: Result, _> = - LookupTable::create(0, vec![lookup_table_values_1, lookup_table_values_2]); - - assert!( - matches!(table, Err(LookupTableError::InconsistentTableLength)), - "LookupTable::create(...) must fail when columns are not of the same length" - ); - } -} diff --git a/kimchi/src/circuits/lookup/tables/range_check.rs b/kimchi/src/circuits/lookup/tables/range_check.rs index 2bf00e64f7..001ffedd52 100644 --- a/kimchi/src/circuits/lookup/tables/range_check.rs +++ b/kimchi/src/circuits/lookup/tables/range_check.rs @@ -14,9 +14,11 @@ pub fn range_check_table() -> LookupTable where F: Field, { - let data = vec![(0..RANGE_CHECK_UPPERBOUND).map(F::from).collect()]; - LookupTable::create(RANGE_CHECK_TABLE_ID, data) - .expect("range_check_table creation must succeed") + let table = vec![(0..RANGE_CHECK_UPPERBOUND).map(F::from).collect()]; + LookupTable { + id: RANGE_CHECK_TABLE_ID, + data: table, + } } pub const TABLE_SIZE: usize = RANGE_CHECK_UPPERBOUND as usize; diff --git a/kimchi/src/circuits/lookup/tables/xor.rs b/kimchi/src/circuits/lookup/tables/xor.rs index 6f87377d96..d846942a31 100644 --- a/kimchi/src/circuits/lookup/tables/xor.rs +++ b/kimchi/src/circuits/lookup/tables/xor.rs @@ -37,8 +37,10 @@ pub fn xor_table() -> LookupTable { // Just to be safe. 
assert!(r[r.len() - 1].is_zero()); } - - LookupTable::create(XOR_TABLE_ID, data).expect("xor_table creation must succeed") + LookupTable { + id: XOR_TABLE_ID, + data, + } } pub const TABLE_SIZE: usize = 256; diff --git a/kimchi/src/error.rs b/kimchi/src/error.rs index 8f2e8406a1..8c801fd38f 100644 --- a/kimchi/src/error.rs +++ b/kimchi/src/error.rs @@ -1,6 +1,5 @@ //! This module implements the [`ProverError`] type. -use crate::circuits::lookup::index::LookupError; // not sure about hierarchy use poly_commitment::error::CommitmentError; use thiserror::Error; @@ -101,9 +100,6 @@ pub enum SetupError { #[error("the domain could not be constructed: {0}")] DomainCreation(DomainCreationError), - - #[error("the lookup constraint system cannot not be constructed: {0}")] - LookupCreation(LookupError), } /// Errors that can arise when creating a verifier index diff --git a/kimchi/src/precomputed_srs.rs b/kimchi/src/precomputed_srs.rs index 11f60edec3..116554e262 100644 --- a/kimchi/src/precomputed_srs.rs +++ b/kimchi/src/precomputed_srs.rs @@ -33,9 +33,6 @@ where let file = File::open(srs_path.clone()).unwrap_or_else(|_| panic!("missing SRS file: {srs_path:?}")); let reader = BufReader::new(file); - // Note: In tests, this read takes significant amount of time (2 min) due - // to -O0 optimisation level. Compile tests with -O1 or --release flag. 
- // See: https://github.com/o1-labs/proof-systems/blob/develop/CONTRIBUTING.md#development rmp_serde::from_read(reader).unwrap() } diff --git a/kimchi/src/prover_index.rs b/kimchi/src/prover_index.rs index b3fa552669..523d583e18 100644 --- a/kimchi/src/prover_index.rs +++ b/kimchi/src/prover_index.rs @@ -210,7 +210,6 @@ pub mod testing { override_srs_size, |d1: D, size: usize| { let log2_size = size.ilog2(); - // Run test_srs_serialization test to generate test SRS & enable this let mut srs = if log2_size <= precomputed_srs::SERIALIZED_SRS_SIZE { // TODO: we should trim it if it's smaller precomputed_srs::get_srs() diff --git a/kimchi/src/tests/and.rs b/kimchi/src/tests/and.rs index 9c1a86fbcd..e344af6da4 100644 --- a/kimchi/src/tests/and.rs +++ b/kimchi/src/tests/and.rs @@ -255,7 +255,6 @@ fn verify_bad_and_decomposition( ); witness[col][and_row] += G::ScalarField::one(); } - if col == 2 { assert_eq!( cs.gates[0].verify_witness::(0, witness, &cs, &witness[0][0..cs.public]), diff --git a/kimchi/src/tests/foreign_field_add.rs b/kimchi/src/tests/foreign_field_add.rs index 760c7fa2d5..24c1d5a8c1 100644 --- a/kimchi/src/tests/foreign_field_add.rs +++ b/kimchi/src/tests/foreign_field_add.rs @@ -1490,6 +1490,7 @@ fn test_ffadd_finalization() { let index = { let cs = ConstraintSystem::create(gates.clone()) + .lookup(vec![range_check::gadget::lookup_table()]) .public(num_public_inputs) .build() .unwrap(); diff --git a/kimchi/src/tests/lookup.rs b/kimchi/src/tests/lookup.rs index 269235d35e..a674eba78f 100644 --- a/kimchi/src/tests/lookup.rs +++ b/kimchi/src/tests/lookup.rs @@ -22,12 +22,10 @@ type BaseSponge = DefaultFqSponge; type ScalarSponge = DefaultFrSponge; fn setup_lookup_proof(use_values_from_table: bool, num_lookups: usize, table_sizes: Vec) { - let mut lookup_table_values: Vec> = table_sizes + let lookup_table_values: Vec> = table_sizes .iter() .map(|size| (0..*size).map(|_| rand::random()).collect()) .collect(); - // Zero table must have a zero row - 
lookup_table_values[0][0] = From::from(0); let lookup_tables = lookup_table_values .iter() .enumerate() @@ -35,8 +33,10 @@ fn setup_lookup_proof(use_values_from_table: bool, num_lookups: usize, table_siz let index_column = (0..lookup_table_values.len() as u64) .map(Into::into) .collect(); - LookupTable::create(id as i32, vec![index_column, lookup_table_values.clone()]) - .expect("setup_lookup_proof: Table creation must succeed") + LookupTable { + id: id as i32, + data: vec![index_column, lookup_table_values.clone()], + } }) .collect(); @@ -200,7 +200,7 @@ fn test_runtime_table() { let len = first_column.len(); let mut runtime_tables_setup = vec![]; - for table_id in 1..num + 1 { + for table_id in 0..num { let cfg = RuntimeTableCfg { id: table_id, first_column: first_column.into_iter().map(Into::into).collect(), @@ -236,7 +236,7 @@ fn test_runtime_table() { for row in 0..20 { // the first register is the table id. We pick one random table. - lookup_cols[0][row] = (rng.gen_range(1..num + 1) as u32).into(); + lookup_cols[0][row] = (rng.gen_range(0..num) as u32).into(); // create queries into our runtime lookup table. 
// We will set [w1, w2], [w3, w4] and [w5, w6] to randon indexes and diff --git a/kimchi/src/tests/range_check.rs b/kimchi/src/tests/range_check.rs index 577e2aa4f7..27240db942 100644 --- a/kimchi/src/tests/range_check.rs +++ b/kimchi/src/tests/range_check.rs @@ -68,10 +68,7 @@ fn create_test_prover_index( gates, public_size, 0, - // specifying lookup table is not necessary, - // since it's already passed through patterns implicitly - //vec![range_check::gadget::lookup_table()], - vec![], + vec![range_check::gadget::lookup_table()], None, false, None, diff --git a/kimchi/src/tests/rot.rs b/kimchi/src/tests/rot.rs index f9a1308b86..f88125cf9b 100644 --- a/kimchi/src/tests/rot.rs +++ b/kimchi/src/tests/rot.rs @@ -328,6 +328,7 @@ fn test_rot_finalization() { let index = { let cs = ConstraintSystem::create(gates.clone()) .public(num_public_inputs) + .lookup(vec![rot::lookup_table()]) .build() .unwrap(); let mut srs = SRS::::create(cs.domain.d1.size()); diff --git a/kimchi/src/tests/xor.rs b/kimchi/src/tests/xor.rs index 7ab28b4008..0344e0aea3 100644 --- a/kimchi/src/tests/xor.rs +++ b/kimchi/src/tests/xor.rs @@ -392,6 +392,7 @@ fn test_xor_finalization() { let index = { let cs = ConstraintSystem::create(gates.clone()) + .lookup(vec![xor::lookup_table()]) .public(num_inputs) .build() .unwrap(); From b88e61c85930aa5d07e1e41fdd4cf1e2545d3b4e Mon Sep 17 00:00:00 2001 From: mrmr1993 Date: Mon, 4 Dec 2023 21:40:36 +0000 Subject: [PATCH 32/32] Reintroduce comment --- kimchi/src/circuits/lookup/tables/mod.rs | 3 +++ 1 file changed, 3 insertions(+) diff --git a/kimchi/src/circuits/lookup/tables/mod.rs b/kimchi/src/circuits/lookup/tables/mod.rs index 0c049f3e59..dc5bf3febd 100644 --- a/kimchi/src/circuits/lookup/tables/mod.rs +++ b/kimchi/src/circuits/lookup/tables/mod.rs @@ -5,6 +5,9 @@ use serde::{Deserialize, Serialize}; pub mod range_check; pub mod xor; +// If you add new tables, update ../../../../../book/src/kimchi/lookup.md +// accordingly + //~ spec:startcode /// The 
table ID associated with the XOR lookup table. pub const XOR_TABLE_ID: i32 = 0;