src/zal.rs

//! This module provides "ZK Acceleration Layer" traits
//! to abstract away the execution engine for performance-critical primitives.
//!
//! The ZAL Engine is voluntarily left unconstrained
//! so that accelerator libraries are not prematurely limited.
//!
//! Terminology
//! -----------
//!
//! We use the name Backend+Engine for concrete implementations of ZalEngine.
//! For exaple H2cEngine for pure Halo2curves implementation.
//!
//! Alternative names considered were Executor or Driver however
//! - executor is already used in Rust (and the name is long)
//! - driver will be confusing as we work quite low-level with GPUs and FPGAs.
//!
//! Unfortunately Engine is used in bn256 for pairings.
//! Fortunately ZalEngine is only used in the prover
//! while "pairing engine" is only used in the verifier
//!
//! Initialization design space
//! ---------------------------
//!
//! It is recommended that ZAL backends provide:
//! - an initialization function:
//!   - either "fn new() -> ZalEngine" for simple libraries
//!   - or a builder pattern for complex initializations
//! - a shutdown function.
//!
//! The ZalEngine can be a stub type
//! and the shutdown function might be unnecessary
//! if the ZalEngine uses a global threadpool like Rayon.
//!
//! Backends might want to add as an option:
//! - The number of threads (CPU)
//! - The device(s) to run on (multi-sockets machines, multi-GPUs machines, ...)
//! - The curve (JIT-compiled backend)

#[allow(deprecated)]
use core::fmt::Debug;
use crate::msm::best_multiexp;
use pasta_curves::arithmetic::CurveAffine;

// The ZK Accel Layer API
// ---------------------------------------------------

pub trait ZalEngine: Debug {}

pub trait MsmAccel<C: CurveAffine>: ZalEngine {
    fn msm(&self, coeffs: &[C::Scalar], base: &[C]) -> C::Curve;

    // // Caching API
    // // -------------------------------------------------
    // // From here we propose an extended API
    // // that allows reusing coeffs and/or the base points
    // //
    // // This is inspired by CuDNN API (Nvidia GPU)
    // // and oneDNN API (CPU, OpenCL) https://docs.nvidia.com/deeplearning/cudnn/api/index.html#cudnn-ops-infer-so-opaque
    // // usage of descriptors
    // //
    // // https://github.com/oneapi-src/oneDNN/blob/master/doc/programming_model/basic_concepts.md
    // //
    // // Descriptors are opaque pointers that hold the input in a format suitable for the accelerator engine.
    // // They may be:
    // // - Input moved on accelerator device (only once for repeated calls)
    // // - Endianess conversion
    // // - Converting from Montgomery to Canonical form
    // // - Input changed from Projective to Jacobian coordinates or even to a Twisted Edwards curve.
    // // - other form of expensive preprocessing
    // type CoeffsDescriptor<'c>;
    // type BaseDescriptor<'b>;

    // fn get_coeffs_descriptor<'c>(&self, coeffs: &'c [C::Scalar]) -> Self::CoeffsDescriptor<'c>;
    // fn get_base_descriptor<'b>(&self, base: &'b [C]) -> Self::BaseDescriptor<'b>;

    // fn msm_with_cached_scalars(&self, coeffs: &Self::CoeffsDescriptor<'_>, base: &[C]) -> C::Curve;

    // fn msm_with_cached_base(&self, coeffs: &[C::Scalar], base: &Self::BaseDescriptor<'_>) -> C::Curve;

    // fn msm_with_cached_inputs(&self, coeffs: &Self::CoeffsDescriptor<'_>, base: &Self::BaseDescriptor<'_>) -> C::Curve;
    //   // Execute MSM according to descriptors
    //   // Unsure of naming, msm_with_cached_inputs, msm_apply, msm_cached, msm_with_descriptors, ...
}

// ZAL using Halo2curves as a backend
// ---------------------------------------------------

#[derive(Debug)]
pub struct H2cEngine;
pub struct H2cMsmCoeffsDesc<'c, C: CurveAffine> { raw: &'c [C::Scalar]}
pub struct H2cMsmBaseDesc<'b, C: CurveAffine> { raw: &'b [C]}

impl H2cEngine {
    pub fn new() -> Self {
        Self {}
    }
}

impl ZalEngine for H2cEngine {}

impl<C: CurveAffine> MsmAccel<C> for H2cEngine {
    fn msm(&self, coeffs: &[C::Scalar], bases: &[C]) -> C::Curve {
        #[allow(deprecated)]
        best_multiexp(coeffs, bases)
    }

    // // Caching API
    // // -------------------------------------------------

    // type CoeffsDescriptor<'c> = H2cMsmCoeffsDesc<'c, C>;
    // type BaseDescriptor<'b> = H2cMsmBaseDesc<'b, C>;

    // fn get_coeffs_descriptor<'c>(&self, coeffs: &'c [C::Scalar]) -> Self::CoeffsDescriptor<'c>{
    //     // Do expensive device/library specific preprocessing here
    //     Self::CoeffsDescriptor { raw: coeffs }
    // }
    // fn get_base_descriptor<'b>(&self, base: &'b [C]) -> Self::BaseDescriptor<'b> {
    //     Self::BaseDescriptor { raw: base }
    // }

    // fn msm_with_cached_scalars(&self, coeffs: &Self::CoeffsDescriptor<'_>, base: &[C]) -> C::Curve {
    //     best_multiexp(coeffs.raw, base)
    // }

    // fn msm_with_cached_base(&self, coeffs: &[C::Scalar], base: &Self::BaseDescriptor<'_>) -> C::Curve {
    //     best_multiexp(coeffs, base.raw)
    // }

    // fn msm_with_cached_inputs(&self, coeffs: &Self::CoeffsDescriptor<'_>, base: &Self::BaseDescriptor<'_>) -> C::Curve {
    //     best_multiexp(coeffs.raw, base.raw)
    // }
}

impl Default for H2cEngine {
    fn default() -> Self {
        Self::new()
    }
}

// Testing
// ---------------------------------------------------

#[cfg(test)]
mod test {
    use super::{H2cEngine, MsmAccel};
    use crate::bn256::G1Affine;
    use ark_std::{end_timer, start_timer};
    use ff::Field;
    use group::{Curve, Group};
    use pasta_curves::arithmetic::CurveAffine;
    use rand_core::OsRng;

    fn run_msm_zal<C: CurveAffine>(min_k: usize, max_k: usize) {
        let points = (0..1 << max_k)
            .map(|_| C::Curve::random(OsRng))
            .collect::<Vec<_>>();
        let mut affine_points = vec![C::identity(); 1 << max_k];
        C::Curve::batch_normalize(&points[..], &mut affine_points[..]);
        let points = affine_points;

        let scalars = (0..1 << max_k)
            .map(|_| C::Scalar::random(OsRng))
            .collect::<Vec<_>>();

        for k in min_k..=max_k {
            let points = &points[..1 << k];
            let scalars = &scalars[..1 << k];

            let t0 = start_timer!(|| format!("freestanding msm k={}", k));
            #[allow(deprecated)]
            let e0 = super::best_multiexp(scalars, points);
            end_timer!(t0);

            let engine = H2cEngine::new();
            let t1 = start_timer!(|| format!("H2cEngine msm k={}", k));
            let e1 = engine.msm(scalars, points);
            end_timer!(t1);

            assert_eq!(e0, e1);

            // // Caching API
            // // -----------
            // let t2 = start_timer!(|| format!("H2cEngine msm cached base k={}", k));
            // let base_descriptor = engine.get_base_descriptor(points);
            // let e2 = engine.msm_with_cached_base(scalars, &base_descriptor);
            // end_timer!(t2);

            // assert_eq!(e0, e2)
        }
    }

    #[test]
    fn test_msm_zal() {
        run_msm_zal::<G1Affine>(3, 14);
    }
}