FK20-CUDAdocs/fptest__mulconst_8cu_source.html

 // bls12_381: Arithmetic for BLS12-381

 // Copyright 2022-2023 Dag Arne Osvik

 // Copyright 2022-2023 Luan Cardoso dos Santos


 #include "fp.cuh"

 #include "fptest.cuh"


 // Number of times each identity is re-applied per test value; every
 // iteration feeds the previous result back in as the next input.
 #define ITER 100


 /**
  * Self-consistency test for the multiply-by-constant routines
  * fp_x2, fp_x3, fp_x4, fp_x8 and fp_x12.
  *
  * For each of the first TESTVALS entries of testval, each identity below is
  * applied ITER times in a row, with every result fed back in as the next
  * input:
  *
  *   1. 2*4         == 8
  *   2. 2^6         == 4^3 == 8^2
  *   3. 3*4         == 12
  *   4. 12+8        == 4(3+2)
  *   5. 3*3*3*2*4*8 == 12*12*12
  *
  * The first mismatch clears the pass flag, which stops all remaining loops.
  * On a mismatch the inner iteration number, the input of that iteration and
  * the disagreeing results are printed. The number of executed comparisons
  * and the overall verdict (via PRINTPASS) are printed at the end.
  *
  * NOTE(review): the kernel does no thread indexing, so every launched thread
  * runs the complete test; presumably it is launched with a single thread.
  *
  * @param testval array holding at least TESTVALS test inputs
  */
 __global__ void FpTestMulConst(testval_t *testval) {

     printf("=== RUN   %s\n", __func__);

     bool    pass    = true;
     size_t  count   = 0;

     // 2*4 == 8

     for (int i=0; pass && i<TESTVALS; i++) {
         fp_t x2x4, x8;

         fp_cpy(x2x4, testval[i]);
         fp_cpy(x8,   testval[i]);

         for (int j=0; pass && j<ITER; j++) {
             // Keep this iteration's input for the failure report
             fp_t x1;
             fp_cpy(x1, x2x4);

             fp_x2(x2x4, x2x4);
             fp_x4(x2x4, x2x4);

             fp_x8(x8, x8);

             if (fp_neq(x2x4, x8)) {
                 pass = false;

                 printf("%d: FAILED: inconsistent result\n", j);
                 fp_print("1   : ",  x1);
                 fp_print("2*4 : ",  x2x4);
                 fp_print("8   : ",  x8);
             }
             ++count;
         }
     }

     // 2*2*2*2*2*2 == 4*4*4 == 8*8

     for (int i=0; pass && i<TESTVALS; i++) {
         fp_t x2, x4, x8;

         fp_cpy(x2, testval[i]);
         fp_cpy(x4, testval[i]);
         fp_cpy(x8, testval[i]);

         for (int j=0; pass && j<ITER; j++) {
             // Keep this iteration's input for the failure report
             fp_t x1;
             fp_cpy(x1, x2);

             fp_x2(x2, x2);
             fp_x2(x2, x2);
             fp_x2(x2, x2);
             fp_x2(x2, x2);
             fp_x2(x2, x2);
             fp_x2(x2, x2);

             fp_x4(x4, x4);
             fp_x4(x4, x4);
             fp_x4(x4, x4);

             fp_x8(x8, x8);
             fp_x8(x8, x8);

             if (fp_neq(x2, x4) || fp_neq(x2, x8)) {
                 pass = false;

                 printf("%d: FAILED: inconsistent result\n", j);
                 fp_print("1   : ",  x1);
                 fp_print("2^6 : ",  x2);
                 fp_print("4^3 : ",  x4);
                 fp_print("8^2 : ",  x8);
             }
             ++count;
         }
     }

     // 3*4 == 12

     for (int i=0; pass && i<TESTVALS; i++) {
         fp_t x3x4, x12;

         fp_cpy(x3x4, testval[i]);
         fp_cpy(x12,  testval[i]);

         for (int j=0; pass && j<ITER; j++) {
             // Keep this iteration's input for the failure report
             fp_t x1;
             fp_cpy(x1, x3x4);

             fp_x3(x3x4, x3x4);
             fp_x4(x3x4, x3x4);

             fp_x12(x12, x12);

             if (fp_neq(x3x4, x12)) {
                 pass = false;

                 printf("%d: FAILED: inconsistent result\n", j);
                 fp_print("1   : ",  x1);
                 fp_print("3*4 : ",  x3x4);
                 fp_print("12  : ",  x12);
             }
             ++count;
         }
     }

     // 12+8 == 4(3+2)

     for (int i=0; pass && i<TESTVALS; i++) {
         fp_t x1, x2, x3, x8, x12, l, r;

         fp_cpy(l, testval[i]);
         fp_cpy(r, testval[i]);

         for (int j=0; pass && j<ITER; j++) {

             // Keep this iteration's input for the failure report
             fp_cpy(x1, l);

             // All four multiples are taken from the same input l
             fp_x2(x2, l);
             fp_x3(x3, l);
             fp_x8(x8, l);
             fp_x12(x12, l);

             // Left side: 12*l + 8*l (becomes the next iteration's input)
             fp_add(l, x12, x8);

             // Right side: 4*(3*l + 2*l)
             fp_add(r, x3, x2);
             fp_x4(r, r);

             if (fp_neq(l, r)) {
                 pass = false;

                 // Report the inner iteration, as the other sections do
                 printf("%d: FAILED: inconsistent result\n", j);
                 fp_print("1      : ",  x1);
                 fp_print("12+8   : ",  l);
                 fp_print("4(3+2) : ",  r);
             }
             ++count;
         }
     }

     // 3*3*3*2*4*8 == 12*12*12

     for (int i=0; pass && i<TESTVALS; i++) {
         fp_t x1, l, r;

         fp_cpy(l, testval[i]);
         fp_cpy(r, testval[i]);

         for (int j=0; pass && j<ITER; j++) {

             // Keep this iteration's input for the failure report
             fp_cpy(x1, l);

             fp_x3(l, l);
             fp_x3(l, l);
             fp_x3(l, l);
             fp_x2(l, l);
             fp_x4(l, l);
             fp_x8(l, l);

             fp_x12(r, r);
             fp_x12(r, r);
             fp_x12(r, r);

             if (fp_neq(l, r)) {
                 pass = false;

                 // Report the inner iteration, as the other sections do
                 printf("%d: FAILED: inconsistent result\n", j);
                 fp_print("1           : ",  x1);
                 fp_print("3*3*3*2*4*8 : ",  l);
                 fp_print("12*12*12    : ",  r);
             }
             ++count;
         }
     }

     // count is an unsigned size_t: print it through an explicit cast with a
     // matching unsigned conversion instead of the signed %ld.
     printf("%llu tests\n", (unsigned long long)count);

     PRINTPASS(pass);
 }


 // vim: ts=4 et sw=4 si

fp_print
__device__ void fp_print(const char *s, const fp_t &x)
Prints the canonical representation of x to STDOUT.
Definition: fp.cu:39

fp.cuh

fp_neq
__device__ bool fp_neq(const fp_t &x, const fp_t &y)
Compares two fp_t residues.
Definition: fp_neq.cu:14

fp_add
__device__ void fp_add(fp_t &z, const fp_t &x, const fp_t &y)
Computes the sum of two residues x and y modulo p and stores it in z. Device only function.
Definition: fp_add.cu:17

fp_x8
__device__ void fp_x8(fp_t &z, const fp_t &x)
Multiplies x by 8 and stores the result into z.
Definition: fp_x8.cu:15

fp_x2
__device__ void fp_x2(fp_t &z, const fp_t &x)
Multiplies x by 2 and stores the result into z.
Definition: fp_x2.cu:15

fp_x12
__device__ void fp_x12(fp_t &z, const fp_t &x)
Multiplies the residue x (mod p) by 12 and stores the result into z.
Definition: fp_x12.cu:15

fp_x4
__device__ void fp_x4(fp_t &z, const fp_t &x)
Multiplies x by 4 and stores the result into z.
Definition: fp_x4.cu:15

fp_t
uint64_t fp_t[6]
Residue modulo p. Any 384-bit representative of each residue is allowed, and stored as a 6-element li...
Definition: fp.cuh:14

fp_cpy
__device__ __host__ void fp_cpy(fp_t &z, const fp_t &x)
Copy from x into z.
Definition: fp_cpy.cu:14

fp_x3
__device__ void fp_x3(fp_t &z, const fp_t &x)
Multiplies x by 3 and stores the result into z.
Definition: fp_x3.cu:15

testval
__managed__ testval_t testval[TESTVALS]
Definition: fptest.cu:8

fptest.cuh

TESTVALS
#define TESTVALS
Definition: fptest.cuh:13

FpTestMulConst
__global__ void FpTestMulConst(testval_t *testval)
Tests the self-consistency of the multiply-by-constant functions.
Definition: fptest_mulconst.cu:21

ITER
#define ITER
Definition: fptest_mulconst.cu:8

testval_t
Definition: g1test.cuh:13

PRINTPASS
#define PRINTPASS(pass)
Definition: test.h:25