26     "\n\t.reg .u64 x<6>, z<6>;" 
   34     "\n\tmov.u64 x4, %10;" 
   35     "\n\tmov.u64 x5, %11;" 
   48     "=l"(z0), 
"=l"(z1), 
"=l"(z2), 
"=l"(z3), 
"=l"(z4), 
"=l"(z5)
 
   50     "l"(x0), 
"l"(x1), 
"l"(x2), 
"l"(x3), 
"l"(x4), 
"l"(x5)
 
   53     z[0] = z0, z[1] = z1, z[2] = z2, z[3] = z3, z[4] = z4, z[5] = z5;
 
uint64_t fp_t[6]
Residue modulo p. Any 384-bit representative of each residue is allowed, and stored as a 6-element li...
__device__ void fp_x4(fp_t &z, const fp_t &x)
Multiplies x by 4 and stores the result into z.
#define FP_X4(Z, X)
PTX macro that multiplies X by 4 and stores the result in Z.