-rw-r--r-- 8083 libmceliece-20241009/crypto_kem/460896/avx/vec256_mul_asm.q raw
# ---------------------------------------------------------------------------
# vec256_mul_asm
#
# Bitsliced product of two 13-word operands, reduced on the fly.
#
#   input_0 : destination; 13 x 256-bit words stored at byte offsets 0..384
#   input_1 : operand a;   13 x 256-bit words loaded from byte offsets 0..384
#   input_2 : operand b;   13 x 256-bit words loaded from byte offsets 0..384
#
# Word k of an operand acts as the coefficient of x^k: every partial
# product  a_i & b_j  is XORed into accumulator r(i+j).  Each of the 256 bit
# positions is processed independently by the AND/XOR operations.
#
# Rows are processed from a12 down to a0.  As soon as a row is finished, the
# highest accumulator r(i+12) can receive no further contributions, so it is
# folded immediately:
#
#     r(k+13)  ->  r(k+4), r(k+3), r(k+1), r(k)
#
# which is reduction modulo x^13 + x^4 + x^3 + x + 1.  The lowest target
# r(k) has not been written before, so the fold initialises it with a plain
# assignment instead of an XOR.
#
# All stores to input_0 happen after the last load from input_1 / input_2.
#
# NOTE(review): the file path suggests this is the GF(2^13) multiplication
# for the 460896 parameter set -- confirm against the caller.
# ---------------------------------------------------------------------------

# Operand-a words (one is live at a time).
reg256 a0
reg256 a1
reg256 a2
reg256 a3
reg256 a4
reg256 a5
reg256 a6
reg256 a7
reg256 a8
reg256 a9
reg256 a10
reg256 a11
reg256 a12

# b0 caches word 0 of operand b; every other b word is used straight from
# memory.  b1 is declared but never referenced in this routine.
reg256 b0
reg256 b1

# Accumulators r0..r24 (r13..r24 are folded away before the final store).
reg256 r0
reg256 r1
reg256 r2
reg256 r3
reg256 r4
reg256 r5
reg256 r6
reg256 r7
reg256 r8
reg256 r9
reg256 r10
reg256 r11
reg256 r12
reg256 r13
reg256 r14
reg256 r15
reg256 r16
reg256 r17
reg256 r18
reg256 r19
reg256 r20
reg256 r21
reg256 r22
reg256 r23
reg256 r24

# Scratch register for a single partial product.
reg256 t

enter vec256_mul_asm

b0 = mem256[ input_2 + 0 ]

# ---- row a12: initialises r12..r24 ----------------------------------------
a12 = mem256[ input_1 + 384 ]

r12 = a12 & b0
r13 = a12 & mem256[input_2 + 32]
r14 = a12 & mem256[input_2 + 64]
r15 = a12 & mem256[input_2 + 96]
r16 = a12 & mem256[input_2 + 128]
r17 = a12 & mem256[input_2 + 160]
r18 = a12 & mem256[input_2 + 192]
r19 = a12 & mem256[input_2 + 224]
r20 = a12 & mem256[input_2 + 256]
r21 = a12 & mem256[input_2 + 288]
r22 = a12 & mem256[input_2 + 320]
r23 = a12 & mem256[input_2 + 352]
r24 = a12 & mem256[input_2 + 384]

# fold r24 (x^24) into x^15, x^14, x^12, x^11
r15 ^= r24
r14 ^= r24
r12 ^= r24
r11 = r24

# ---- row a11: accumulates into r11..r23 -----------------------------------
a11 = mem256[ input_1 + 352 ]

t = a11 & b0
r11 ^= t
t = a11 & mem256[input_2 + 32]
r12 ^= t
t = a11 & mem256[input_2 + 64]
r13 ^= t
t = a11 & mem256[input_2 + 96]
r14 ^= t
t = a11 & mem256[input_2 + 128]
r15 ^= t
t = a11 & mem256[input_2 + 160]
r16 ^= t
t = a11 & mem256[input_2 + 192]
r17 ^= t
t = a11 & mem256[input_2 + 224]
r18 ^= t
t = a11 & mem256[input_2 + 256]
r19 ^= t
t = a11 & mem256[input_2 + 288]
r20 ^= t
t = a11 & mem256[input_2 + 320]
r21 ^= t
t = a11 & mem256[input_2 + 352]
r22 ^= t
t = a11 & mem256[input_2 + 384]
r23 ^= t

# fold r23 (x^23) into x^14, x^13, x^11, x^10
r14 ^= r23
r13 ^= r23
r11 ^= r23
r10 = r23

# ---- row a10: accumulates into r10..r22 -----------------------------------
a10 = mem256[ input_1 + 320 ]

t = a10 & b0
r10 ^= t
t = a10 & mem256[input_2 + 32]
r11 ^= t
t = a10 & mem256[input_2 + 64]
r12 ^= t
t = a10 & mem256[input_2 + 96]
r13 ^= t
t = a10 & mem256[input_2 + 128]
r14 ^= t
t = a10 & mem256[input_2 + 160]
r15 ^= t
t = a10 & mem256[input_2 + 192]
r16 ^= t
t = a10 & mem256[input_2 + 224]
r17 ^= t
t = a10 & mem256[input_2 + 256]
r18 ^= t
t = a10 & mem256[input_2 + 288]
r19 ^= t
t = a10 & mem256[input_2 + 320]
r20 ^= t
t = a10 & mem256[input_2 + 352]
r21 ^= t
t = a10 & mem256[input_2 + 384]
r22 ^= t

# fold r22 (x^22) into x^13, x^12, x^10, x^9
r13 ^= r22
r12 ^= r22
r10 ^= r22
r9 = r22

# ---- row a9: accumulates into r9..r21 -------------------------------------
a9 = mem256[ input_1 + 288 ]

t = a9 & b0
r9 ^= t
t = a9 & mem256[input_2 + 32]
r10 ^= t
t = a9 & mem256[input_2 + 64]
r11 ^= t
t = a9 & mem256[input_2 + 96]
r12 ^= t
t = a9 & mem256[input_2 + 128]
r13 ^= t
t = a9 & mem256[input_2 + 160]
r14 ^= t
t = a9 & mem256[input_2 + 192]
r15 ^= t
t = a9 & mem256[input_2 + 224]
r16 ^= t
t = a9 & mem256[input_2 + 256]
r17 ^= t
t = a9 & mem256[input_2 + 288]
r18 ^= t
t = a9 & mem256[input_2 + 320]
r19 ^= t
t = a9 & mem256[input_2 + 352]
r20 ^= t
t = a9 & mem256[input_2 + 384]
r21 ^= t

# fold r21 (x^21) into x^12, x^11, x^9, x^8
r12 ^= r21
r11 ^= r21
r9 ^= r21
r8 = r21

# ---- row a8: accumulates into r8..r20 -------------------------------------
a8 = mem256[ input_1 + 256 ]

t = a8 & b0
r8 ^= t
t = a8 & mem256[input_2 + 32]
r9 ^= t
t = a8 & mem256[input_2 + 64]
r10 ^= t
t = a8 & mem256[input_2 + 96]
r11 ^= t
t = a8 & mem256[input_2 + 128]
r12 ^= t
t = a8 & mem256[input_2 + 160]
r13 ^= t
t = a8 & mem256[input_2 + 192]
r14 ^= t
t = a8 & mem256[input_2 + 224]
r15 ^= t
t = a8 & mem256[input_2 + 256]
r16 ^= t
t = a8 & mem256[input_2 + 288]
r17 ^= t
t = a8 & mem256[input_2 + 320]
r18 ^= t
t = a8 & mem256[input_2 + 352]
r19 ^= t
t = a8 & mem256[input_2 + 384]
r20 ^= t

# fold r20 (x^20) into x^11, x^10, x^8, x^7
r11 ^= r20
r10 ^= r20
r8 ^= r20
r7 = r20

# ---- row a7: accumulates into r7..r19 -------------------------------------
a7 = mem256[ input_1 + 224 ]

t = a7 & b0
r7 ^= t
t = a7 & mem256[input_2 + 32]
r8 ^= t
t = a7 & mem256[input_2 + 64]
r9 ^= t
t = a7 & mem256[input_2 + 96]
r10 ^= t
t = a7 & mem256[input_2 + 128]
r11 ^= t
t = a7 & mem256[input_2 + 160]
r12 ^= t
t = a7 & mem256[input_2 + 192]
r13 ^= t
t = a7 & mem256[input_2 + 224]
r14 ^= t
t = a7 & mem256[input_2 + 256]
r15 ^= t
t = a7 & mem256[input_2 + 288]
r16 ^= t
t = a7 & mem256[input_2 + 320]
r17 ^= t
t = a7 & mem256[input_2 + 352]
r18 ^= t
t = a7 & mem256[input_2 + 384]
r19 ^= t

# fold r19 (x^19) into x^10, x^9, x^7, x^6
r10 ^= r19
r9 ^= r19
r7 ^= r19
r6 = r19

# ---- row a6: accumulates into r6..r18 -------------------------------------
a6 = mem256[ input_1 + 192 ]

t = a6 & b0
r6 ^= t
t = a6 & mem256[input_2 + 32]
r7 ^= t
t = a6 & mem256[input_2 + 64]
r8 ^= t
t = a6 & mem256[input_2 + 96]
r9 ^= t
t = a6 & mem256[input_2 + 128]
r10 ^= t
t = a6 & mem256[input_2 + 160]
r11 ^= t
t = a6 & mem256[input_2 + 192]
r12 ^= t
t = a6 & mem256[input_2 + 224]
r13 ^= t
t = a6 & mem256[input_2 + 256]
r14 ^= t
t = a6 & mem256[input_2 + 288]
r15 ^= t
t = a6 & mem256[input_2 + 320]
r16 ^= t
t = a6 & mem256[input_2 + 352]
r17 ^= t
t = a6 & mem256[input_2 + 384]
r18 ^= t

# fold r18 (x^18) into x^9, x^8, x^6, x^5
r9 ^= r18
r8 ^= r18
r6 ^= r18
r5 = r18

# ---- row a5: accumulates into r5..r17 -------------------------------------
a5 = mem256[ input_1 + 160 ]

t = a5 & b0
r5 ^= t
t = a5 & mem256[input_2 + 32]
r6 ^= t
t = a5 & mem256[input_2 + 64]
r7 ^= t
t = a5 & mem256[input_2 + 96]
r8 ^= t
t = a5 & mem256[input_2 + 128]
r9 ^= t
t = a5 & mem256[input_2 + 160]
r10 ^= t
t = a5 & mem256[input_2 + 192]
r11 ^= t
t = a5 & mem256[input_2 + 224]
r12 ^= t
t = a5 & mem256[input_2 + 256]
r13 ^= t
t = a5 & mem256[input_2 + 288]
r14 ^= t
t = a5 & mem256[input_2 + 320]
r15 ^= t
t = a5 & mem256[input_2 + 352]
r16 ^= t
t = a5 & mem256[input_2 + 384]
r17 ^= t

# fold r17 (x^17) into x^8, x^7, x^5, x^4
r8 ^= r17
r7 ^= r17
r5 ^= r17
r4 = r17

# ---- row a4: accumulates into r4..r16 -------------------------------------
a4 = mem256[ input_1 + 128 ]

t = a4 & b0
r4 ^= t
t = a4 & mem256[input_2 + 32]
r5 ^= t
t = a4 & mem256[input_2 + 64]
r6 ^= t
t = a4 & mem256[input_2 + 96]
r7 ^= t
t = a4 & mem256[input_2 + 128]
r8 ^= t
t = a4 & mem256[input_2 + 160]
r9 ^= t
t = a4 & mem256[input_2 + 192]
r10 ^= t
t = a4 & mem256[input_2 + 224]
r11 ^= t
t = a4 & mem256[input_2 + 256]
r12 ^= t
t = a4 & mem256[input_2 + 288]
r13 ^= t
t = a4 & mem256[input_2 + 320]
r14 ^= t
t = a4 & mem256[input_2 + 352]
r15 ^= t
t = a4 & mem256[input_2 + 384]
r16 ^= t

# fold r16 (x^16) into x^7, x^6, x^4, x^3
r7 ^= r16
r6 ^= r16
r4 ^= r16
r3 = r16

# ---- row a3: accumulates into r3..r15 -------------------------------------
a3 = mem256[ input_1 + 96 ]

t = a3 & b0
r3 ^= t
t = a3 & mem256[input_2 + 32]
r4 ^= t
t = a3 & mem256[input_2 + 64]
r5 ^= t
t = a3 & mem256[input_2 + 96]
r6 ^= t
t = a3 & mem256[input_2 + 128]
r7 ^= t
t = a3 & mem256[input_2 + 160]
r8 ^= t
t = a3 & mem256[input_2 + 192]
r9 ^= t
t = a3 & mem256[input_2 + 224]
r10 ^= t
t = a3 & mem256[input_2 + 256]
r11 ^= t
t = a3 & mem256[input_2 + 288]
r12 ^= t
t = a3 & mem256[input_2 + 320]
r13 ^= t
t = a3 & mem256[input_2 + 352]
r14 ^= t
t = a3 & mem256[input_2 + 384]
r15 ^= t

# fold r15 (x^15) into x^6, x^5, x^3, x^2
r6 ^= r15
r5 ^= r15
r3 ^= r15
r2 = r15

# ---- row a2: accumulates into r2..r14 -------------------------------------
a2 = mem256[ input_1 + 64 ]

t = a2 & b0
r2 ^= t
t = a2 & mem256[input_2 + 32]
r3 ^= t
t = a2 & mem256[input_2 + 64]
r4 ^= t
t = a2 & mem256[input_2 + 96]
r5 ^= t
t = a2 & mem256[input_2 + 128]
r6 ^= t
t = a2 & mem256[input_2 + 160]
r7 ^= t
t = a2 & mem256[input_2 + 192]
r8 ^= t
t = a2 & mem256[input_2 + 224]
r9 ^= t
t = a2 & mem256[input_2 + 256]
r10 ^= t
t = a2 & mem256[input_2 + 288]
r11 ^= t
t = a2 & mem256[input_2 + 320]
r12 ^= t
t = a2 & mem256[input_2 + 352]
r13 ^= t
t = a2 & mem256[input_2 + 384]
r14 ^= t

# fold r14 (x^14) into x^5, x^4, x^2, x^1
r5 ^= r14
r4 ^= r14
r2 ^= r14
r1 = r14

# ---- row a1: accumulates into r1..r13 -------------------------------------
a1 = mem256[ input_1 + 32 ]

t = a1 & b0
r1 ^= t
t = a1 & mem256[input_2 + 32]
r2 ^= t
t = a1 & mem256[input_2 + 64]
r3 ^= t
t = a1 & mem256[input_2 + 96]
r4 ^= t
t = a1 & mem256[input_2 + 128]
r5 ^= t
t = a1 & mem256[input_2 + 160]
r6 ^= t
t = a1 & mem256[input_2 + 192]
r7 ^= t
t = a1 & mem256[input_2 + 224]
r8 ^= t
t = a1 & mem256[input_2 + 256]
r9 ^= t
t = a1 & mem256[input_2 + 288]
r10 ^= t
t = a1 & mem256[input_2 + 320]
r11 ^= t
t = a1 & mem256[input_2 + 352]
r12 ^= t
t = a1 & mem256[input_2 + 384]
r13 ^= t

# fold r13 (x^13) into x^4, x^3, x^1, x^0
r4 ^= r13
r3 ^= r13
r1 ^= r13
r0 = r13

# ---- row a0: accumulates into r0..r12; nothing left to fold ---------------
a0 = mem256[ input_1 + 0 ]

t = a0 & b0
r0 ^= t
t = a0 & mem256[input_2 + 32]
r1 ^= t
t = a0 & mem256[input_2 + 64]
r2 ^= t
t = a0 & mem256[input_2 + 96]
r3 ^= t
t = a0 & mem256[input_2 + 128]
r4 ^= t
t = a0 & mem256[input_2 + 160]
r5 ^= t
t = a0 & mem256[input_2 + 192]
r6 ^= t
t = a0 & mem256[input_2 + 224]
r7 ^= t
t = a0 & mem256[input_2 + 256]
r8 ^= t
t = a0 & mem256[input_2 + 288]
r9 ^= t
t = a0 & mem256[input_2 + 320]
r10 ^= t
t = a0 & mem256[input_2 + 352]
r11 ^= t
t = a0 & mem256[input_2 + 384]
r12 ^= t

# ---- write the 13 reduced words to the destination ------------------------
mem256[ input_0 + 384 ] = r12
mem256[ input_0 + 352 ] = r11
mem256[ input_0 + 320 ] = r10
mem256[ input_0 + 288 ] = r9
mem256[ input_0 + 256 ] = r8
mem256[ input_0 + 224 ] = r7
mem256[ input_0 + 192 ] = r6
mem256[ input_0 + 160 ] = r5
mem256[ input_0 + 128 ] = r4
mem256[ input_0 + 96 ] = r3
mem256[ input_0 + 64 ] = r2
mem256[ input_0 + 32 ] = r1
mem256[ input_0 + 0 ] = r0

return