FK20-CUDAdocs/fk20__msm_8cu_source.html

 // bls12_381: Arithmetic for BLS12-381

 // Copyright 2022-2023 Dag Arne Osvik

 // Copyright 2022-2023 Luan Cardoso dos Santos


 #include "fr.cuh"

 #include "g1.cuh"

 #include "fk20.cuh"


 // fk20_msm: toeplitz_coefficients_fft + xext_fft -> hext_fft
 //
 // Launch shape: 1-D grid of blocks with exactly 256 threads in x (y = z = 1).
 // With any other shape every thread returns before touching memory.
 //
 // Data layout as used below:
 //   he_fft  output; block b writes the 512 points starting at he_fft[512*b]
 //   tc_fft  scalars; block b reads the 16*512 scalars starting at tc_fft[16*512*b]
 //   xe_fft  points; not offset per block, so every block reads the same 16*512 points
 //
 // Each thread produces two output points, at indices tid and tid+256 of its
 // block's output. Each one is the sum over 16 rows of
 // tc_fft[512*row + index] * xe_fft[512*row + index].
 __global__ void fk20_msm(g1p_t *he_fft, const fr_t *tc_fft, const g1p_t *xe_fft) {

     // Accept only a 1-D grid of 256x1x1 blocks
     if (gridDim.y != 1 || gridDim.z != 1 ||
         blockDim.x != 256 || blockDim.y != 1 || blockDim.z != 1)
         return;

     const unsigned lane = threadIdx.x; // Thread number within the block
     const unsigned blk  = blockIdx.x;  // Block number within the grid

     // Per-block views of the output points and of the scalars
     g1p_t      *out     = he_fft + 512*blk;
     const fr_t *scalars = tc_fft + 16*512*blk;

     // Two running sums (lower and upper half of the output) and one scratch point
     g1p_t sum_lo, sum_hi, prod;

     // Both sums start at the point at infinity
     g1p_inf(sum_lo);
     g1p_inf(sum_hi);

     // MSM loop: 16 rows of 512 entries, two entries per thread and row
     for (int row = 0; row != 16; ++row) {
         const unsigned lo = 512*row + lane; // entry in the lower 256 of this row
         const unsigned hi = lo + 256;       // matching entry in the upper 256

         // sum_lo += scalars[lo] * xe_fft[lo]
         g1p_cpy(prod, xe_fft[lo]);
         g1p_mul(prod, scalars[lo]);
         g1p_add(sum_lo, prod);

         // sum_hi += scalars[hi] * xe_fft[hi]
         g1p_cpy(prod, xe_fft[hi]);
         g1p_mul(prod, scalars[hi]);
         g1p_add(sum_hi, prod);
     }

     // hext_fft = sum_lo || sum_hi
     g1p_cpy(out[lane], sum_lo);
     g1p_cpy(out[lane + 256], sum_hi);
 }


 // vim: ts=4 et sw=4 si

fk20.cuh

fk20_msm
__global__ void fk20_msm(g1p_t *he_fft, const fr_t *tc_fft, const g1p_t *xe_fft)
toeplitz_coefficients_fft + xext_fft -> hext_fft
Definition: fk20_msm.cu:20

fr.cuh

fr_t
uint64_t fr_t[4]
Subgroup element stored as a 256-bit array (a 4-element little-endian array of uint64_t)....
Definition: fr.cuh:24

g1.cuh

g1p_inf
__device__ __host__ void g1p_inf(g1p_t &p)
Set p to the point-at-infinity (0,1,0)
Definition: g1p.cu:93

g1p_add
__device__ void g1p_add(g1p_t &p, const g1p_t &q)
Computes the sum of the two points p and q, using projective coordinates, and stores the result in p.
Definition: g1p_add.cu:29

g1p_mul
__device__ void g1p_mul(g1p_t &p, const fr_t &x)
p ← x·p. Point multiplication by a scalar, in projective coordinates. The result is stored back into p.
Definition: g1p_mul.cu:19

g1p_cpy
__device__ __host__ void g1p_cpy(g1p_t &p, const g1p_t &q)
Copy from q into p.
Definition: g1p.cu:67

g1p_t
G1 point in projective coordinates.
Definition: g1.cuh:27