-rw-r--r-- 9344 libmceliece-20240513/crypto_kem/460896/avx/vec256_maa_asm.q raw
reg256 a0
reg256 a1
reg256 a2
reg256 a3
reg256 a4
reg256 a5
reg256 a6
reg256 a7
reg256 a8
reg256 a9
reg256 a10
reg256 a11
reg256 a12
reg256 b0
reg256 b1
reg256 r0
reg256 r1
reg256 r2
reg256 r3
reg256 r4
reg256 r5
reg256 r6
reg256 r7
reg256 r8
reg256 r9
reg256 r10
reg256 r11
reg256 r12
reg256 r13
reg256 r14
reg256 r15
reg256 r16
reg256 r17
reg256 r18
reg256 r19
reg256 r20
reg256 r21
reg256 r22
reg256 r23
reg256 r24
reg256 r
enter vec256_maa_asm
b0 = mem256[ input_2 + 0 ]
a12 = mem256[ input_1 + 384 ]
r12 = a12 & b0
r13 = a12 & mem256[input_2 + 32]
r14 = a12 & mem256[input_2 + 64]
r15 = a12 & mem256[input_2 + 96]
r16 = a12 & mem256[input_2 + 128]
r17 = a12 & mem256[input_2 + 160]
r18 = a12 & mem256[input_2 + 192]
r19 = a12 & mem256[input_2 + 224]
r20 = a12 & mem256[input_2 + 256]
r21 = a12 & mem256[input_2 + 288]
r22 = a12 & mem256[input_2 + 320]
r23 = a12 & mem256[input_2 + 352]
r24 = a12 & mem256[input_2 + 384]
r15 ^= r24
r14 ^= r24
r12 ^= r24
r11 = r24
a11 = mem256[ input_1 + 352 ]
r = a11 & b0
r11 ^= r
r = a11 & mem256[input_2 + 32]
r12 ^= r
r = a11 & mem256[input_2 + 64]
r13 ^= r
r = a11 & mem256[input_2 + 96]
r14 ^= r
r = a11 & mem256[input_2 + 128]
r15 ^= r
r = a11 & mem256[input_2 + 160]
r16 ^= r
r = a11 & mem256[input_2 + 192]
r17 ^= r
r = a11 & mem256[input_2 + 224]
r18 ^= r
r = a11 & mem256[input_2 + 256]
r19 ^= r
r = a11 & mem256[input_2 + 288]
r20 ^= r
r = a11 & mem256[input_2 + 320]
r21 ^= r
r = a11 & mem256[input_2 + 352]
r22 ^= r
r = a11 & mem256[input_2 + 384]
r23 ^= r
r14 ^= r23
r13 ^= r23
r11 ^= r23
r10 = r23
a10 = mem256[ input_1 + 320 ]
r = a10 & b0
r10 ^= r
r = a10 & mem256[input_2 + 32]
r11 ^= r
r = a10 & mem256[input_2 + 64]
r12 ^= r
r = a10 & mem256[input_2 + 96]
r13 ^= r
r = a10 & mem256[input_2 + 128]
r14 ^= r
r = a10 & mem256[input_2 + 160]
r15 ^= r
r = a10 & mem256[input_2 + 192]
r16 ^= r
r = a10 & mem256[input_2 + 224]
r17 ^= r
r = a10 & mem256[input_2 + 256]
r18 ^= r
r = a10 & mem256[input_2 + 288]
r19 ^= r
r = a10 & mem256[input_2 + 320]
r20 ^= r
r = a10 & mem256[input_2 + 352]
r21 ^= r
r = a10 & mem256[input_2 + 384]
r22 ^= r
r13 ^= r22
r12 ^= r22
r10 ^= r22
r9 = r22
a9 = mem256[ input_1 + 288 ]
r = a9 & b0
r9 ^= r
r = a9 & mem256[input_2 + 32]
r10 ^= r
r = a9 & mem256[input_2 + 64]
r11 ^= r
r = a9 & mem256[input_2 + 96]
r12 ^= r
r = a9 & mem256[input_2 + 128]
r13 ^= r
r = a9 & mem256[input_2 + 160]
r14 ^= r
r = a9 & mem256[input_2 + 192]
r15 ^= r
r = a9 & mem256[input_2 + 224]
r16 ^= r
r = a9 & mem256[input_2 + 256]
r17 ^= r
r = a9 & mem256[input_2 + 288]
r18 ^= r
r = a9 & mem256[input_2 + 320]
r19 ^= r
r = a9 & mem256[input_2 + 352]
r20 ^= r
r = a9 & mem256[input_2 + 384]
r21 ^= r
r12 ^= r21
r11 ^= r21
r9 ^= r21
r8 = r21
a8 = mem256[ input_1 + 256 ]
r = a8 & b0
r8 ^= r
r = a8 & mem256[input_2 + 32]
r9 ^= r
r = a8 & mem256[input_2 + 64]
r10 ^= r
r = a8 & mem256[input_2 + 96]
r11 ^= r
r = a8 & mem256[input_2 + 128]
r12 ^= r
r = a8 & mem256[input_2 + 160]
r13 ^= r
r = a8 & mem256[input_2 + 192]
r14 ^= r
r = a8 & mem256[input_2 + 224]
r15 ^= r
r = a8 & mem256[input_2 + 256]
r16 ^= r
r = a8 & mem256[input_2 + 288]
r17 ^= r
r = a8 & mem256[input_2 + 320]
r18 ^= r
r = a8 & mem256[input_2 + 352]
r19 ^= r
r = a8 & mem256[input_2 + 384]
r20 ^= r
r11 ^= r20
r10 ^= r20
r8 ^= r20
r7 = r20
a7 = mem256[ input_1 + 224 ]
r = a7 & b0
r7 ^= r
r = a7 & mem256[input_2 + 32]
r8 ^= r
r = a7 & mem256[input_2 + 64]
r9 ^= r
r = a7 & mem256[input_2 + 96]
r10 ^= r
r = a7 & mem256[input_2 + 128]
r11 ^= r
r = a7 & mem256[input_2 + 160]
r12 ^= r
r = a7 & mem256[input_2 + 192]
r13 ^= r
r = a7 & mem256[input_2 + 224]
r14 ^= r
r = a7 & mem256[input_2 + 256]
r15 ^= r
r = a7 & mem256[input_2 + 288]
r16 ^= r
r = a7 & mem256[input_2 + 320]
r17 ^= r
r = a7 & mem256[input_2 + 352]
r18 ^= r
r = a7 & mem256[input_2 + 384]
r19 ^= r
r10 ^= r19
r9 ^= r19
r7 ^= r19
r6 = r19
a6 = mem256[ input_1 + 192 ]
r = a6 & b0
r6 ^= r
r = a6 & mem256[input_2 + 32]
r7 ^= r
r = a6 & mem256[input_2 + 64]
r8 ^= r
r = a6 & mem256[input_2 + 96]
r9 ^= r
r = a6 & mem256[input_2 + 128]
r10 ^= r
r = a6 & mem256[input_2 + 160]
r11 ^= r
r = a6 & mem256[input_2 + 192]
r12 ^= r
r = a6 & mem256[input_2 + 224]
r13 ^= r
r = a6 & mem256[input_2 + 256]
r14 ^= r
r = a6 & mem256[input_2 + 288]
r15 ^= r
r = a6 & mem256[input_2 + 320]
r16 ^= r
r = a6 & mem256[input_2 + 352]
r17 ^= r
r = a6 & mem256[input_2 + 384]
r18 ^= r
r9 ^= r18
r8 ^= r18
r6 ^= r18
r5 = r18
a5 = mem256[ input_1 + 160 ]
r = a5 & b0
r5 ^= r
r = a5 & mem256[input_2 + 32]
r6 ^= r
r = a5 & mem256[input_2 + 64]
r7 ^= r
r = a5 & mem256[input_2 + 96]
r8 ^= r
r = a5 & mem256[input_2 + 128]
r9 ^= r
r = a5 & mem256[input_2 + 160]
r10 ^= r
r = a5 & mem256[input_2 + 192]
r11 ^= r
r = a5 & mem256[input_2 + 224]
r12 ^= r
r = a5 & mem256[input_2 + 256]
r13 ^= r
r = a5 & mem256[input_2 + 288]
r14 ^= r
r = a5 & mem256[input_2 + 320]
r15 ^= r
r = a5 & mem256[input_2 + 352]
r16 ^= r
r = a5 & mem256[input_2 + 384]
r17 ^= r
r8 ^= r17
r7 ^= r17
r5 ^= r17
r4 = r17
a4 = mem256[ input_1 + 128 ]
r = a4 & b0
r4 ^= r
r = a4 & mem256[input_2 + 32]
r5 ^= r
r = a4 & mem256[input_2 + 64]
r6 ^= r
r = a4 & mem256[input_2 + 96]
r7 ^= r
r = a4 & mem256[input_2 + 128]
r8 ^= r
r = a4 & mem256[input_2 + 160]
r9 ^= r
r = a4 & mem256[input_2 + 192]
r10 ^= r
r = a4 & mem256[input_2 + 224]
r11 ^= r
r = a4 & mem256[input_2 + 256]
r12 ^= r
r = a4 & mem256[input_2 + 288]
r13 ^= r
r = a4 & mem256[input_2 + 320]
r14 ^= r
r = a4 & mem256[input_2 + 352]
r15 ^= r
r = a4 & mem256[input_2 + 384]
r16 ^= r
r7 ^= r16
r6 ^= r16
r4 ^= r16
r3 = r16
a3 = mem256[ input_1 + 96 ]
r = a3 & b0
r3 ^= r
r = a3 & mem256[input_2 + 32]
r4 ^= r
r = a3 & mem256[input_2 + 64]
r5 ^= r
r = a3 & mem256[input_2 + 96]
r6 ^= r
r = a3 & mem256[input_2 + 128]
r7 ^= r
r = a3 & mem256[input_2 + 160]
r8 ^= r
r = a3 & mem256[input_2 + 192]
r9 ^= r
r = a3 & mem256[input_2 + 224]
r10 ^= r
r = a3 & mem256[input_2 + 256]
r11 ^= r
r = a3 & mem256[input_2 + 288]
r12 ^= r
r = a3 & mem256[input_2 + 320]
r13 ^= r
r = a3 & mem256[input_2 + 352]
r14 ^= r
r = a3 & mem256[input_2 + 384]
r15 ^= r
r6 ^= r15
r5 ^= r15
r3 ^= r15
r2 = r15
a2 = mem256[ input_1 + 64 ]
r = a2 & b0
r2 ^= r
r = a2 & mem256[input_2 + 32]
r3 ^= r
r = a2 & mem256[input_2 + 64]
r4 ^= r
r = a2 & mem256[input_2 + 96]
r5 ^= r
r = a2 & mem256[input_2 + 128]
r6 ^= r
r = a2 & mem256[input_2 + 160]
r7 ^= r
r = a2 & mem256[input_2 + 192]
r8 ^= r
r = a2 & mem256[input_2 + 224]
r9 ^= r
r = a2 & mem256[input_2 + 256]
r10 ^= r
r = a2 & mem256[input_2 + 288]
r11 ^= r
r = a2 & mem256[input_2 + 320]
r12 ^= r
r = a2 & mem256[input_2 + 352]
r13 ^= r
r = a2 & mem256[input_2 + 384]
r14 ^= r
r5 ^= r14
r4 ^= r14
r2 ^= r14
r1 = r14
a1 = mem256[ input_1 + 32 ]
r = a1 & b0
r1 ^= r
r = a1 & mem256[input_2 + 32]
r2 ^= r
r = a1 & mem256[input_2 + 64]
r3 ^= r
r = a1 & mem256[input_2 + 96]
r4 ^= r
r = a1 & mem256[input_2 + 128]
r5 ^= r
r = a1 & mem256[input_2 + 160]
r6 ^= r
r = a1 & mem256[input_2 + 192]
r7 ^= r
r = a1 & mem256[input_2 + 224]
r8 ^= r
r = a1 & mem256[input_2 + 256]
r9 ^= r
r = a1 & mem256[input_2 + 288]
r10 ^= r
r = a1 & mem256[input_2 + 320]
r11 ^= r
r = a1 & mem256[input_2 + 352]
r12 ^= r
r = a1 & mem256[input_2 + 384]
r13 ^= r
r4 ^= r13
r3 ^= r13
r1 ^= r13
r0 = r13
a0 = mem256[ input_1 + 0 ]
r = a0 & b0
r0 ^= r
r = a0 & mem256[input_2 + 32]
r1 ^= r
r = a0 & mem256[input_2 + 64]
r2 ^= r
r = a0 & mem256[input_2 + 96]
r3 ^= r
r = a0 & mem256[input_2 + 128]
r4 ^= r
r = a0 & mem256[input_2 + 160]
r5 ^= r
r = a0 & mem256[input_2 + 192]
r6 ^= r
r = a0 & mem256[input_2 + 224]
r7 ^= r
r = a0 & mem256[input_2 + 256]
r8 ^= r
r = a0 & mem256[input_2 + 288]
r9 ^= r
r = a0 & mem256[input_2 + 320]
r10 ^= r
r = a0 & mem256[input_2 + 352]
r11 ^= r
r = a0 & mem256[input_2 + 384]
r12 ^= r
r12 = r12 ^ mem256[ input_0 + 384 ]
mem256[ input_0 + 384 ] = r12
r12 = r12 ^ mem256[ input_1 + 384 ]
mem256[ input_1 + 384 ] = r12
r11 = r11 ^ mem256[ input_0 + 352 ]
mem256[ input_0 + 352 ] = r11
r11 = r11 ^ mem256[ input_1 + 352 ]
mem256[ input_1 + 352 ] = r11
r10 = r10 ^ mem256[ input_0 + 320 ]
mem256[ input_0 + 320 ] = r10
r10 = r10 ^ mem256[ input_1 + 320 ]
mem256[ input_1 + 320 ] = r10
r9 = r9 ^ mem256[ input_0 + 288 ]
mem256[ input_0 + 288 ] = r9
r9 = r9 ^ mem256[ input_1 + 288 ]
mem256[ input_1 + 288 ] = r9
r8 = r8 ^ mem256[ input_0 + 256 ]
mem256[ input_0 + 256 ] = r8
r8 = r8 ^ mem256[ input_1 + 256 ]
mem256[ input_1 + 256 ] = r8
r7 = r7 ^ mem256[ input_0 + 224 ]
mem256[ input_0 + 224 ] = r7
r7 = r7 ^ mem256[ input_1 + 224 ]
mem256[ input_1 + 224 ] = r7
r6 = r6 ^ mem256[ input_0 + 192 ]
mem256[ input_0 + 192 ] = r6
r6 = r6 ^ mem256[ input_1 + 192 ]
mem256[ input_1 + 192 ] = r6
r5 = r5 ^ mem256[ input_0 + 160 ]
mem256[ input_0 + 160 ] = r5
r5 = r5 ^ mem256[ input_1 + 160 ]
mem256[ input_1 + 160 ] = r5
r4 = r4 ^ mem256[ input_0 + 128 ]
mem256[ input_0 + 128 ] = r4
r4 = r4 ^ mem256[ input_1 + 128 ]
mem256[ input_1 + 128 ] = r4
r3 = r3 ^ mem256[ input_0 + 96 ]
mem256[ input_0 + 96 ] = r3
r3 = r3 ^ mem256[ input_1 + 96 ]
mem256[ input_1 + 96 ] = r3
r2 = r2 ^ mem256[ input_0 + 64 ]
mem256[ input_0 + 64 ] = r2
r2 = r2 ^ mem256[ input_1 + 64 ]
mem256[ input_1 + 64 ] = r2
r1 = r1 ^ mem256[ input_0 + 32 ]
mem256[ input_0 + 32 ] = r1
r1 = r1 ^ mem256[ input_1 + 32 ]
mem256[ input_1 + 32 ] = r1
r0 = r0 ^ mem256[ input_0 + 0 ]
mem256[ input_0 + 0 ] = r0
r0 = r0 ^ mem256[ input_1 + 0 ]
mem256[ input_1 + 0 ] = r0
return