reference/cpp/compiler_8h_source.html

// Copyright 2025 Google LLC.

//

// Licensed under the Apache License, Version 2.0 (the "License");

// you may not use this file except in compliance with the License.

// You may obtain a copy of the License at

//

//     http://www.apache.org/licenses/LICENSE-2.0

//

// Unless required by applicable law or agreed to in writing, software

// distributed under the License is distributed on an "AS IS" BASIS,

// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

// See the License for the specific language governing permissions and

// limitations under the License.


#ifndef PRIVACY_PROOFS_ZK_LIB_CIRCUITS_COMPILER_COMPILER_H_

#define PRIVACY_PROOFS_ZK_LIB_CIRCUITS_COMPILER_COMPILER_H_


#include <stddef.h>

#include <stdint.h>


#include <algorithm>

#include <memory>

#include <vector>


#include "algebra/hash.h"

#include "circuits/compiler/circuit_id.h"

#include "circuits/compiler/node.h"

#include "circuits/compiler/pdqhash.h"

#include "circuits/compiler/schedule.h"

#include "sumcheck/circuit.h"

#include "sumcheck/quad.h"

#include "util/panic.h"


namespace proofs {

/*

QuadCircuit contains methods that facilitate defining circuits used to

express predicates that are to be proven or verified. This class allows one

to use basic arithmetic circuit operations (add, mul, input, assert0, ...)

to define the circuit on a set of abstract wire labels.


The "mkcircuit" compiler method than optimizes the circuit by applying all of

the basic tricks of constant propagation, common sub-expression elimination,

squashing layers into as few as possible, and grouping terms into quads.


Quads are a new form of gate (in contrast to the add and mul gates in most

sumcheck proof systems). Quads represent a "sum of quadratic terms" where

each term is w_l * w_r * v for two wire labels and a constant v.

*/

template <class Field>


class QuadCircuit {

 public:

  using Elt = typename Field::Elt;

  using nodeinfo = NodeInfoF<Field>;

  using node = NodeF<Field>;

  using size_t_for_storage = term::size_t_for_storage;

  using quad_corner_t = typename Quad<Field>::quad_corner_t;


  const Field& f_;


 public:

  // Variables for informational purposes:

  size_t ninput_;

  size_t npub_input_;         // number of public inputs, index of 1st private

  size_t subfield_boundary_;  // least wire not known to be in the subfield

  size_t noutput_;


  // set by the algebraic simplifiers in this file

  size_t depth_;

  size_t nwires_cse_eliminated_;

  size_t nwires_not_needed_;


  // set by the scheduler

  size_t nwires_;

  size_t nquad_terms_;

  size_t nwires_overhead_;


  explicit QuadCircuit(const Field& f)

      : f_(f),

        ninput_(0),

        npub_input_(0),

        subfield_boundary_(0),

        noutput_(0),

        depth_(0),

        nwires_cse_eliminated_(0),

        nwires_not_needed_(0),

        nwires_(-1),  // undefined until set in mkcircuit()

        nquad_terms_(-1),

        nwires_overhead_(-1) {

    // make sure that Elt(0) is represented as index 0 in the constant

    // table.

    size_t ki0 = kstore(f.zero());

    proofs::check(ki0 == 0, "ki0 == 0");

    size_t ki1 = kstore(f.one());

    proofs::check(ki1 == 1, "ki1 == 1");


    // make sure node 0 exists, carrying input[0] = F.one()

    input();

  }


  // Produce a linear term 1 * op0 that the compiler will not

  // attempt to optimize to op0.  The reason for this function

  // is to implement linear terms such as a*x in the quadratic form

  // a*x+b*x*y.  Left to its own devices, the compiler peeks into x,

  // and if x=k*z*w, it produces a term (a*k)*z*w in the previous

  // layer, possibly destroying common subexpressions.  linear(op)

  // introduces an explicit multiplication by wire 0, which the

  // compiler does not attempt to optimize away.

  size_t linear(size_t op0) { return mul(0, op0); }

  size_t linear(const Elt& k, size_t op0) { return mul(k, 0, op0); }


  size_t mul(const Elt& k, size_t op) {

    if (k == f_.zero()) {

      return konst(k);

    } else if (k == f_.one() || nodes_[op].zero()) {

      return op;

    } else {

      return push_node(scale(k, op));

    }

  }


  size_t mul(size_t op0, size_t op1) { return mul(f_.one(), op0, op1); }


  size_t mul(const Elt& k, size_t op0, size_t op1) {

    const auto& n0 = nodes_[op0];

    const auto& n1 = nodes_[op1];


    if (n0.zero()) {

      return op0;

    } else if (n0.constant()) {

      // k * (k1 * op1) -> (k * k1) * op1

      return mul(f_.mulf(k, kload(n0.terms[0].ki)), op1);

    } else if (n0.linearp()) {

      // k * ((k1 * op0) * op1) -> (k * k1) * op0 * op1

      return mul(f_.mulf(k, kload(n0.terms[0].ki)), n0.terms[0].op1, op1);

    } else if (n1.zero() || n1.constant() || n1.linearp()) {

      return mul(k, op1, op0);

    } else {

      // general term k * op0 * op1

      return push_node(node(kstore(k), op0, op1));

    }

  }


  size_t add(size_t op0, size_t op1) {

    const auto& n0 = nodes_[op0];

    const auto& n1 = nodes_[op1];


    if (n0.zero()) {

      return op1;

    } else if (n1.zero()) {

      return op0;

    } else {

      // If the two addends are of different depth, do not merge

      // them, which is accomplished by multiplying the shallower

      // node by 1 and treating it as a single term of the final

      // sum.

      //

      // Like many other "optimizations", this is a heuristic

      // that may or may not work, but it seems to be uniformly

      // beneficial or at least not harmful for all our circuits

      // as of 2023-11-15.

      if (n0.info.depth < n1.info.depth) {

        op0 = linear(op0);

      } else if (n1.info.depth < n0.info.depth) {

        op1 = linear(op1);

      }

      return push_node(merge(op0, op1));

    }

  }

  size_t sub(size_t op0, size_t op1) { return add(op0, mul(f_.mone(), op1)); }


  size_t konst(const Elt& k) { return push_node(node(kstore(k), 0, 0)); }


  // Generate a special node that asserts that op == 0.

  // The node has the form 0*(1*op), which does not normally

  // appear in circuits.

  size_t assert0(size_t op) {

    const node* n = &nodes_[op];

    if (n->zero()) {

      // Identically zero, so nothing to generate.

      // More importantly, we cannot multiply OP by 1,

      // since OP doesn't really exist.

      return op;

    } else if (n->linearp()) {

      // n = k * (1 * op1).

      //

      // Reduce to assert0(op1), but handle the screw case k==0,

      // which shouldn't happen but just in case...

      if (n->terms[0].ki == 0) {

        return op;

      } else {

        return assert0(n->terms[0].op1);

      }

    } else {

      typename term::assert0_type_hack hack;

      std::vector<term> terms;

      terms.push_back(term(op, hack));

      size_t n1 = push_node(node(terms));

      nodes_[n1].info.is_assert0 = true;

      return n1;

    }

  }


  // Wrappers to avoid creating unnecessary wires.  The

  // compiler will discard them anyway, but they still take

  // time and space.

  size_t axpy(size_t y, const Elt& a, size_t x) {

    if (a == f_.zero()) {

      return y;

    }

    return add(y, linear(a, x));

  }

  size_t apy(size_t y, const Elt& a) {

    if (a == f_.zero()) {

      return y;

    }

    return add(y, konst(a));

  }


  size_t input() { return push_node(node(quad_corner_t(ninput_++))); }


  // This function demarcates the end of the public inputs and beginning of

  // private inputs. It can only be called once.

  void private_input() {

    proofs::check(

        npub_input_ == 0,

        "private_input can only be called once after setting public inputs");

    npub_input_ = ninput_;

  }


  // This function demarcates the end of the private inputs in the

  // subfield and beginning of the full-field private inputs. It can

  // only be called once.

  void begin_full_field() {

    proofs::check(subfield_boundary_ == 0,

                  "begin_full_field() can only be called once");

    subfield_boundary_ = ninput_;

  }


  size_t ninput() const { return ninput_; }


  void output(size_t n, size_t wire_id) {

    output_internal(n, quad_corner_t(wire_id));

  }


  std::unique_ptr<Circuit<Field>> mkcircuit(size_t nc) {

    size_t depth_ub = compute_depth_ub();

    fixup_last_layer_assertions(depth_ub);

    compute_needed(depth_ub);


    Scheduler<Field> sched(nodes_, f_);

    std::unique_ptr<Circuit<Field>> c =

        sched.mkcircuit(constants_, depth_ub, nc);


    // re-export the scheduler telemetry

    nwires_ = sched.nwires_;

    nquad_terms_ = sched.nquad_terms_;

    nwires_overhead_ = sched.nwires_overhead_;


    c->ninputs = ninput();

    c->npub_in = npub_input_;

    c->subfield_boundary = subfield_boundary_;


    circuit_id(c->id, *c, f_);

    return c;

  }


 private:

  void output_internal(size_t n, quad_corner_t wire_id) {

    nodes_[n].info.is_output = true;

    nodes_[n].info.desired_wire_id_for_output = wire_id;

    noutput_++;

  }


  size_t push_node(node n) {

    // common-subexpression elimination: if we have already seen a

    // node equal to n, return that node.

    uint64_t d = n.hash();


    auto pred = [&](PdqHash::value_t op) { return n == nodes_[op]; };

    if (size_t op = cse_.find(d, pred); op != PdqHash::kNil) {

      // do not linear terms as eliminated by the CSE, since they are

      // likely placeholder nodes absorbed by the next layer.

      if (!n.linearp()) {

        ++nwires_cse_eliminated_;

      }

      return op;

    }


    // compute the node depth, which has been so far uninitialized

    n.info.depth = 0;

    for (const auto& t : n.terms) {

      n.info.depth = std::max<size_t>(

          n.info.depth, 1 + std::max<size_t>(nodes_[t.op0].info.depth,

                                             nodes_[t.op1].info.depth));

    }


    size_t nid = nodes_.size();

    nodes_.push_back(n);


    // record NID into the common-subexpression elimination table

    cse_.insert(d, nid);


    return nid;

  }


  node materialize_input(size_t op) {

    if (nodes_[op].info.is_input) {

      return node(/*kstore(f.one())=*/1, 0, op);

    } else {

      return /*a copy of*/ nodes_[op];

    }

  }


  node scale(const Elt& k, size_t op) {

    node n = materialize_input(op);

    for (auto& t : n.terms) {

      t.ki = kstore(f_.mulf(kload(t.ki), k));

    }

    return n;

  }


  void push_back_unless_zero(std::vector<term>& terms, const term& t) const {

    if (t.ki != 0) {

      terms.push_back(t);

    }

  }


  node merge(size_t op0, size_t op1) {

    const node n0 = materialize_input(op0);

    const node n1 = materialize_input(op1);

    const std::vector<term>& t0 = n0.terms;

    const std::vector<term>& t1 = n1.terms;

    std::vector<term> terms;

    size_t i0 = 0, i1 = 0;

    while (i0 < t0.size() && i1 < t1.size()) {

      term t;

      if (t0[i0].eqndx(t1[i1])) {

        t = t0[i0];

        t.ki = kstore(f_.addf(kload(t.ki), kload(t1[i1].ki)));

        i0++;

        i1++;

      } else if (t0[i0].ltndx(t1[i1])) {

        t = t0[i0++];

      } else {

        t = t1[i1++];

      }

      push_back_unless_zero(terms, t);

    }


    while (i0 < t0.size()) {

      push_back_unless_zero(terms, t0[i0++]);

    }


    while (i1 < t1.size()) {

      push_back_unless_zero(terms, t1[i1++]);

    }


    return node(terms);

  }


  // constants_[n] stores the n-th constant, once.

  // Modulo collisions, constants_[constttab_[hash(k)]] == k

  // for k \in Elt.

  std::vector<Elt> constants_;

  PdqHash consttab_;


  std::vector<node> nodes_;

  PdqHash cse_;


  size_t kstore(const Elt& k) {

    uint64_t d = elt_hash(k, f_);

    auto pred = [&](PdqHash::value_t ki) { return k == constants_[ki]; };

    size_t ki = consttab_.find(d, pred);


    if (ki == PdqHash::kNil) {

      ki = constants_.size();

      constants_.push_back(k);

      consttab_.insert(d, ki);

    }

    return ki;

  }

  Elt& kload(size_t ki) { return constants_[ki]; }


  void mark_needed(size_t op, size_t depth_at_which_needed) {

    nodeinfo* nfo = &nodes_[op].info;

    nfo->is_needed = true;

    nfo->max_needed_depth =

        std::max<size_t>(depth_at_which_needed, nfo->max_needed_depth);


    // If DEPTH_AT_WHICH_NEEDED > DEPTH + 1, we need a constant 1 at

    // depth DEPTH_AT_WHICH_NEEDED-1 (and implicily any lower depths) in

    // order to copy the node across levels.

    if (depth_at_which_needed > nfo->depth + 1) {

      nodeinfo* nfo0 = &nodes_[0].info;

      nfo0->is_needed = true;

      nfo0->max_needed_depth =

          std::max<size_t>(depth_at_which_needed - 1, nfo0->max_needed_depth);

    }

  }


  size_t compute_depth_ub() {

    size_t r = 0;

    for (auto& n : nodes_) {

      if (n.info.is_output) {

        r = std::max<size_t>(r, 1 + n.info.depth);

      } else if (n.info.is_assert0) {

        // Assertions of the form 0*(1*OP) contibute n.info.depth and

        // not 1 + n.info.depth.  If the assertion is in the last

        // layer, it will be transformed in an output of OP at

        // n.info.depth.  If the assertion is not in the last layer,

        // then it doesn't matter whether we use DEPTH or 1 + DEPTH.

        if (n.linearp()) {

          r = std::max<size_t>(r, n.info.depth);

        } else {

          r = std::max<size_t>(r, 1 + n.info.depth);

        }

      }

    }

    depth_ = r;

    return r;

  }


  void fixup_last_layer_assertions(size_t depth_ub) {

    // convert assertions in the last layer into outputs

    for (auto& n : nodes_) {

      if (!n.info.is_output && n.info.is_assert0 && n.info.depth == depth_ub &&

          n.linearp()) {

        n.info.is_assert0 = false;

        output_internal(n.terms[0].op1, nodeinfo::kWireIdUndefined);

      }

    }

  }


  void compute_needed(size_t depth_ub) {

    nwires_not_needed_ = 0;

    for (size_t i = nodes_.size(); i-- > 0;) {

      nodeinfo* nfo = &nodes_[i].info;


      // mark all inputs as needed, to prevent ambiguity

      // in the layout of the W[] vector.

      if (nfo->is_input) {

        mark_needed(i, 1);

      }

      // outputs are needed at depth_ub_

      if (nfo->is_output) {

        mark_needed(i, depth_ub);

      }

      // assertions are needed in the next layer

      if (nfo->is_assert0) {

        mark_needed(i, nfo->depth + 1);

      }


      if (nfo->is_needed) {

        for (const auto& t : nodes_[i].terms) {

          mark_needed(t.op0, nfo->depth);

          mark_needed(t.op1, nfo->depth);

        }

      } else {

        ++nwires_not_needed_;

      }

    }

  }

};


}  // namespace proofs


#endif  // PRIVACY_PROOFS_ZK_LIB_CIRCUITS_COMPILER_COMPILER_H_

proofs::PdqHash
Definition pdqhash.h:37

proofs::Quad
Definition quad.h:37

proofs::Scheduler
Definition schedule.h:35

proofs::GF2_128::Elt
Definition gf2_128.h:63

proofs::NodeF
Definition node.h:115

proofs::NodeInfoF
Definition node.h:76

proofs::term::assert0_type_hack
Definition node.h:52

proofs::term
Definition node.h:30