-rw-r--r-- 1805 libmceliece-20230612/crypto_kem/348864/vec/vec.c raw
// 20221230 djb: add linker line
// linker define vec_mul vec_sq vec_inv
#include "vec.h"
#include "params.h"
void vec_mul(vec * h, const vec * f, const vec * g)
{
	int i, j;
	vec buf[ 2*GFBITS-1 ];
	for (i = 0; i < 2*GFBITS-1; i++)
		buf[i] = 0;
	for (i = 0; i < GFBITS; i++)
	for (j = 0; j < GFBITS; j++)
		buf[i+j] ^= f[i] & g[j];
		
	for (i = 2*GFBITS-2; i >= GFBITS; i--)
	{
		buf[i-GFBITS+3] ^= buf[i]; 
		buf[i-GFBITS+0] ^= buf[i]; 
	}
	for (i = 0; i < GFBITS; i++)
		h[i] = buf[i];
}
/* bitsliced field squarings */
void vec_sq(vec *out, vec *in)
{
        int i;
        uint64_t result[GFBITS];
        //
        result[0] = in[0]^in[6];
        result[1] = in[11];
        result[2] = in[1]^in[7];
        result[3] = in[6];
        result[4] = in[2] ^ in[11] ^ in[8];
        result[5] = in[7];
        result[6] = in[3]^in[9];
        result[7] = in[8];
        result[8] = in[4]^in[10];
        result[9] = in[9];
        result[10] = in[5] ^ in[11];
        result[11] = in[10];
        //
        for (i = 0; i < GFBITS; i++)
                out[i] = result[i];
}
/* bitsliced field inverses */
void vec_inv(vec *out, vec *in)
{
        uint64_t tmp_11[GFBITS];
        uint64_t tmp_1111[GFBITS];
        vec_copy(out, in);
        vec_sq(out, out);
        vec_mul(tmp_11, out, in); // 11
        vec_sq(out, tmp_11);
        vec_sq(out, out);
        vec_mul(tmp_1111, out, tmp_11); // 1111
        vec_sq(out, tmp_1111);
        vec_sq(out, out);
        vec_sq(out, out);
        vec_sq(out, out);
        vec_mul(out, out, tmp_1111); // 11111111
        vec_sq(out, out);
        vec_sq(out, out);
        vec_mul(out, out, tmp_11); // 1111111111
        vec_sq(out, out);
        vec_mul(out, out, in); // 11111111111
        vec_sq(out, out); // 111111111110
}