// 20240504 djb: add note.GNU-stack // 20221231 djb: port hidden to macos; tnx thom wiggers // 20221230 djb: add linker line // linker define vec128_mul_asm #include "crypto_asm_hidden.h" #define vec128_mul_asm CRYPTO_SHARED_NAMESPACE(vec128_mul_asm) #define _vec128_mul_asm _CRYPTO_SHARED_NAMESPACE(vec128_mul_asm) # qhasm: int64 input_0 # qhasm: int64 input_1 # qhasm: int64 input_2 # qhasm: int64 input_3 # qhasm: int64 input_4 # qhasm: int64 input_5 # qhasm: stack64 input_6 # qhasm: stack64 input_7 # qhasm: int64 caller_r11 # qhasm: int64 caller_r12 # qhasm: int64 caller_r13 # qhasm: int64 caller_r14 # qhasm: int64 caller_r15 # qhasm: int64 caller_rbx # qhasm: int64 caller_rbp # qhasm: reg256 b0 # qhasm: reg256 b1 # qhasm: reg256 b2 # qhasm: reg256 b3 # qhasm: reg256 b4 # qhasm: reg256 b5 # qhasm: reg256 b6 # qhasm: reg256 b7 # qhasm: reg256 b8 # qhasm: reg256 b9 # qhasm: reg256 b10 # qhasm: reg256 b11 # qhasm: reg256 b12 # qhasm: reg256 a0 # qhasm: reg256 a1 # qhasm: reg256 a2 # qhasm: reg256 a3 # qhasm: reg256 a4 # qhasm: reg256 a5 # qhasm: reg256 a6 # qhasm: reg256 r0 # qhasm: reg256 r1 # qhasm: reg256 r2 # qhasm: reg256 r3 # qhasm: reg256 r4 # qhasm: reg256 r5 # qhasm: reg256 r6 # qhasm: reg256 r7 # qhasm: reg256 r8 # qhasm: reg256 r9 # qhasm: reg256 r10 # qhasm: reg256 r11 # qhasm: reg256 r12 # qhasm: reg256 r13 # qhasm: reg256 r14 # qhasm: reg256 r15 # qhasm: reg256 r16 # qhasm: reg256 r17 # qhasm: reg256 r18 # qhasm: reg256 r19 # qhasm: reg256 r20 # qhasm: reg256 r21 # qhasm: reg256 r22 # qhasm: reg256 r23 # qhasm: reg256 r24 # qhasm: reg256 r # qhasm: reg128 h0 # qhasm: reg128 h1 # qhasm: reg128 h2 # qhasm: reg128 h3 # qhasm: reg128 h4 # qhasm: reg128 h5 # qhasm: reg128 h6 # qhasm: reg128 h7 # qhasm: reg128 h8 # qhasm: reg128 h9 # qhasm: reg128 h10 # qhasm: reg128 h11 # qhasm: reg128 h12 # qhasm: reg128 h13 # qhasm: reg128 h14 # qhasm: reg128 h15 # qhasm: reg128 h16 # qhasm: reg128 h17 # qhasm: reg128 h18 # qhasm: reg128 h19 # qhasm: reg128 h20 # qhasm: reg128 h21 # qhasm: reg128 h22 # qhasm: reg128 h23 # qhasm: reg128 h24 # qhasm: stack4864 buf # qhasm: int64 ptr # qhasm: int64 tmp # qhasm: enter vec128_mul_asm .p2align 5 ASM_HIDDEN _vec128_mul_asm ASM_HIDDEN vec128_mul_asm .global _vec128_mul_asm .global vec128_mul_asm _vec128_mul_asm: vec128_mul_asm: mov %rsp,%r11 and $31,%r11 add $608,%r11 sub %r11,%rsp # qhasm: ptr = &buf # asm 1: leaq ptr=int64#5 # asm 2: leaq ptr=%r8 leaq 0(%rsp),%r8 # qhasm: tmp = input_3 # asm 1: mov tmp=int64#6 # asm 2: mov tmp=%r9 mov %rcx,%r9 # qhasm: tmp *= 12 # asm 1: imulq $12,tmp=int64#6 # asm 2: imulq $12,tmp=%r9 imulq $12,%r9,%r9 # qhasm: input_2 += tmp # asm 1: add b12=reg256#1 # asm 2: vbroadcasti128 0(b12=%ymm0 vbroadcasti128 0(%rdx), %ymm0 # qhasm: input_2 -= input_3 # asm 1: sub a6=reg256#2 # asm 2: vpxor a6=%ymm1 vpxor %ymm1,%ymm1,%ymm1 # qhasm: a6[0] = mem128[ input_1 + 96 ] # asm 1: vinsertf128 $0x0,96(r18=reg256#3 # asm 2: vpand r18=%ymm2 vpand %ymm0,%ymm1,%ymm2 # qhasm: mem256[ ptr + 576 ] = r18 # asm 1: vmovupd r17=reg256#4 # asm 2: vpand r17=%ymm3 vpand %ymm0,%ymm2,%ymm3 # qhasm: a4[0] = mem128[ input_1 + 64 ] # asm 1: vinsertf128 $0x0,64(r16=reg256#6 # asm 2: vpand r16=%ymm5 vpand %ymm0,%ymm4,%ymm5 # qhasm: a3[0] = mem128[ input_1 + 48 ] # asm 1: vinsertf128 $0x0,48(r15=reg256#8 # asm 2: vpand r15=%ymm7 vpand %ymm0,%ymm6,%ymm7 # qhasm: a2[0] = mem128[ input_1 + 32 ] # asm 1: vinsertf128 $0x0,32(r14=reg256#10 # asm 2: vpand r14=%ymm9 vpand %ymm0,%ymm8,%ymm9 # qhasm: a1[0] = mem128[ input_1 + 16 ] # asm 1: vinsertf128 $0x0,16(r13=reg256#12 # asm 2: vpand r13=%ymm11 vpand %ymm0,%ymm10,%ymm11 # qhasm: a0[0] = mem128[ input_1 + 0 ] # asm 1: vinsertf128 $0x0,0(r12=reg256#1 # asm 2: vpand r12=%ymm0 vpand %ymm0,%ymm12,%ymm0 # qhasm: b11 = mem128[ input_2 + 0 ] x2 # asm 1: vbroadcasti128 0(b11=reg256#14 # asm 2: vbroadcasti128 0(b11=%ymm13 vbroadcasti128 0(%rdx), %ymm13 # qhasm: input_2 -= input_3 # asm 1: sub r=reg256#15 # asm 2: vpand r=%ymm14 vpand %ymm13,%ymm1,%ymm14 # qhasm: r17 ^= r # asm 1: vpxor r=reg256#4 # asm 2: vpand r=%ymm3 vpand %ymm13,%ymm2,%ymm3 # qhasm: r16 ^= r # asm 1: vpxor r=reg256#4 # asm 2: vpand r=%ymm3 vpand %ymm13,%ymm4,%ymm3 # qhasm: r15 ^= r # asm 1: vpxor r=reg256#4 # asm 2: vpand r=%ymm3 vpand %ymm13,%ymm6,%ymm3 # qhasm: r14 ^= r # asm 1: vpxor r=reg256#4 # asm 2: vpand r=%ymm3 vpand %ymm13,%ymm8,%ymm3 # qhasm: r13 ^= r # asm 1: vpxor r=reg256#4 # asm 2: vpand r=%ymm3 vpand %ymm13,%ymm10,%ymm3 # qhasm: r12 ^= r # asm 1: vpxor r11=reg256#4 # asm 2: vpand r11=%ymm3 vpand %ymm13,%ymm12,%ymm3 # qhasm: b10 = mem128[ input_2 + 0 ] x2 # asm 1: vbroadcasti128 0(b10=reg256#14 # asm 2: vbroadcasti128 0(b10=%ymm13 vbroadcasti128 0(%rdx), %ymm13 # qhasm: input_2 -= input_3 # asm 1: sub r=reg256#15 # asm 2: vpand r=%ymm14 vpand %ymm13,%ymm1,%ymm14 # qhasm: r16 ^= r # asm 1: vpxor r=reg256#6 # asm 2: vpand r=%ymm5 vpand %ymm13,%ymm2,%ymm5 # qhasm: r15 ^= r # asm 1: vpxor r=reg256#6 # asm 2: vpand r=%ymm5 vpand %ymm13,%ymm4,%ymm5 # qhasm: r14 ^= r # asm 1: vpxor r=reg256#6 # asm 2: vpand r=%ymm5 vpand %ymm13,%ymm6,%ymm5 # qhasm: r13 ^= r # asm 1: vpxor r=reg256#6 # asm 2: vpand r=%ymm5 vpand %ymm13,%ymm8,%ymm5 # qhasm: r12 ^= r # asm 1: vpxor r=reg256#6 # asm 2: vpand r=%ymm5 vpand %ymm13,%ymm10,%ymm5 # qhasm: r11 ^= r # asm 1: vpxor r10=reg256#6 # asm 2: vpand r10=%ymm5 vpand %ymm13,%ymm12,%ymm5 # qhasm: b9 = mem128[ input_2 + 0 ] x2 # asm 1: vbroadcasti128 0(b9=reg256#14 # asm 2: vbroadcasti128 0(b9=%ymm13 vbroadcasti128 0(%rdx), %ymm13 # qhasm: input_2 -= input_3 # asm 1: sub r=reg256#15 # asm 2: vpand r=%ymm14 vpand %ymm13,%ymm1,%ymm14 # qhasm: r15 ^= r # asm 1: vpxor r=reg256#8 # asm 2: vpand r=%ymm7 vpand %ymm13,%ymm2,%ymm7 # qhasm: r14 ^= r # asm 1: vpxor r=reg256#8 # asm 2: vpand r=%ymm7 vpand %ymm13,%ymm4,%ymm7 # qhasm: r13 ^= r # asm 1: vpxor r=reg256#8 # asm 2: vpand r=%ymm7 vpand %ymm13,%ymm6,%ymm7 # qhasm: r12 ^= r # asm 1: vpxor r=reg256#8 # asm 2: vpand r=%ymm7 vpand %ymm13,%ymm8,%ymm7 # qhasm: r11 ^= r # asm 1: vpxor r=reg256#8 # asm 2: vpand r=%ymm7 vpand %ymm13,%ymm10,%ymm7 # qhasm: r10 ^= r # asm 1: vpxor r9=reg256#8 # asm 2: vpand r9=%ymm7 vpand %ymm13,%ymm12,%ymm7 # qhasm: b8 = mem128[ input_2 + 0 ] x2 # asm 1: vbroadcasti128 0(b8=reg256#14 # asm 2: vbroadcasti128 0(b8=%ymm13 vbroadcasti128 0(%rdx), %ymm13 # qhasm: input_2 -= input_3 # asm 1: sub r=reg256#15 # asm 2: vpand r=%ymm14 vpand %ymm13,%ymm1,%ymm14 # qhasm: r14 ^= r # asm 1: vpxor r=reg256#10 # asm 2: vpand r=%ymm9 vpand %ymm13,%ymm2,%ymm9 # qhasm: r13 ^= r # asm 1: vpxor r=reg256#10 # asm 2: vpand r=%ymm9 vpand %ymm13,%ymm4,%ymm9 # qhasm: r12 ^= r # asm 1: vpxor r=reg256#10 # asm 2: vpand r=%ymm9 vpand %ymm13,%ymm6,%ymm9 # qhasm: r11 ^= r # asm 1: vpxor r=reg256#10 # asm 2: vpand r=%ymm9 vpand %ymm13,%ymm8,%ymm9 # qhasm: r10 ^= r # asm 1: vpxor r=reg256#10 # asm 2: vpand r=%ymm9 vpand %ymm13,%ymm10,%ymm9 # qhasm: r9 ^= r # asm 1: vpxor r8=reg256#10 # asm 2: vpand r8=%ymm9 vpand %ymm13,%ymm12,%ymm9 # qhasm: b7 = mem128[ input_2 + 0 ] x2 # asm 1: vbroadcasti128 0(b7=reg256#14 # asm 2: vbroadcasti128 0(b7=%ymm13 vbroadcasti128 0(%rdx), %ymm13 # qhasm: input_2 -= input_3 # asm 1: sub r=reg256#15 # asm 2: vpand r=%ymm14 vpand %ymm13,%ymm1,%ymm14 # qhasm: r13 ^= r # asm 1: vpxor r=reg256#12 # asm 2: vpand r=%ymm11 vpand %ymm13,%ymm2,%ymm11 # qhasm: r12 ^= r # asm 1: vpxor r=reg256#12 # asm 2: vpand r=%ymm11 vpand %ymm13,%ymm4,%ymm11 # qhasm: r11 ^= r # asm 1: vpxor r=reg256#12 # asm 2: vpand r=%ymm11 vpand %ymm13,%ymm6,%ymm11 # qhasm: r10 ^= r # asm 1: vpxor r=reg256#12 # asm 2: vpand r=%ymm11 vpand %ymm13,%ymm8,%ymm11 # qhasm: r9 ^= r # asm 1: vpxor r=reg256#12 # asm 2: vpand r=%ymm11 vpand %ymm13,%ymm10,%ymm11 # qhasm: r8 ^= r # asm 1: vpxor r7=reg256#12 # asm 2: vpand r7=%ymm11 vpand %ymm13,%ymm12,%ymm11 # qhasm: b6 = mem128[ input_2 + 0 ] x2 # asm 1: vbroadcasti128 0(b6=reg256#14 # asm 2: vbroadcasti128 0(b6=%ymm13 vbroadcasti128 0(%rdx), %ymm13 # qhasm: input_2 -= input_3 # asm 1: sub r=reg256#15 # asm 2: vpand r=%ymm14 vpand %ymm13,%ymm1,%ymm14 # qhasm: r12 ^= r # asm 1: vpxor r=reg256#1 # asm 2: vpand r=%ymm0 vpand %ymm13,%ymm2,%ymm0 # qhasm: r11 ^= r # asm 1: vpxor r=reg256#1 # asm 2: vpand r=%ymm0 vpand %ymm13,%ymm4,%ymm0 # qhasm: r10 ^= r # asm 1: vpxor r=reg256#1 # asm 2: vpand r=%ymm0 vpand %ymm13,%ymm6,%ymm0 # qhasm: r9 ^= r # asm 1: vpxor r=reg256#1 # asm 2: vpand r=%ymm0 vpand %ymm13,%ymm8,%ymm0 # qhasm: r8 ^= r # asm 1: vpxor r=reg256#1 # asm 2: vpand r=%ymm0 vpand %ymm13,%ymm10,%ymm0 # qhasm: r7 ^= r # asm 1: vpxor r6=reg256#1 # asm 2: vpand r6=%ymm0 vpand %ymm13,%ymm12,%ymm0 # qhasm: b5 = mem128[ input_2 + 0 ] x2 # asm 1: vbroadcasti128 0(b5=reg256#14 # asm 2: vbroadcasti128 0(b5=%ymm13 vbroadcasti128 0(%rdx), %ymm13 # qhasm: input_2 -= input_3 # asm 1: sub r=reg256#15 # asm 2: vpand r=%ymm14 vpand %ymm13,%ymm1,%ymm14 # qhasm: r11 ^= r # asm 1: vpxor r=reg256#4 # asm 2: vpand r=%ymm3 vpand %ymm13,%ymm2,%ymm3 # qhasm: r10 ^= r # asm 1: vpxor r=reg256#4 # asm 2: vpand r=%ymm3 vpand %ymm13,%ymm4,%ymm3 # qhasm: r9 ^= r # asm 1: vpxor r=reg256#4 # asm 2: vpand r=%ymm3 vpand %ymm13,%ymm6,%ymm3 # qhasm: r8 ^= r # asm 1: vpxor r=reg256#4 # asm 2: vpand r=%ymm3 vpand %ymm13,%ymm8,%ymm3 # qhasm: r7 ^= r # asm 1: vpxor r=reg256#4 # asm 2: vpand r=%ymm3 vpand %ymm13,%ymm10,%ymm3 # qhasm: r6 ^= r # asm 1: vpxor r5=reg256#4 # asm 2: vpand r5=%ymm3 vpand %ymm13,%ymm12,%ymm3 # qhasm: b4 = mem128[ input_2 + 0 ] x2 # asm 1: vbroadcasti128 0(b4=reg256#14 # asm 2: vbroadcasti128 0(b4=%ymm13 vbroadcasti128 0(%rdx), %ymm13 # qhasm: input_2 -= input_3 # asm 1: sub r=reg256#15 # asm 2: vpand r=%ymm14 vpand %ymm13,%ymm1,%ymm14 # qhasm: r10 ^= r # asm 1: vpxor r=reg256#6 # asm 2: vpand r=%ymm5 vpand %ymm13,%ymm2,%ymm5 # qhasm: r9 ^= r # asm 1: vpxor r=reg256#6 # asm 2: vpand r=%ymm5 vpand %ymm13,%ymm4,%ymm5 # qhasm: r8 ^= r # asm 1: vpxor r=reg256#6 # asm 2: vpand r=%ymm5 vpand %ymm13,%ymm6,%ymm5 # qhasm: r7 ^= r # asm 1: vpxor r=reg256#6 # asm 2: vpand r=%ymm5 vpand %ymm13,%ymm8,%ymm5 # qhasm: r6 ^= r # asm 1: vpxor r=reg256#6 # asm 2: vpand r=%ymm5 vpand %ymm13,%ymm10,%ymm5 # qhasm: r5 ^= r # asm 1: vpxor r4=reg256#6 # asm 2: vpand r4=%ymm5 vpand %ymm13,%ymm12,%ymm5 # qhasm: b3 = mem128[ input_2 + 0 ] x2 # asm 1: vbroadcasti128 0(b3=reg256#14 # asm 2: vbroadcasti128 0(b3=%ymm13 vbroadcasti128 0(%rdx), %ymm13 # qhasm: input_2 -= input_3 # asm 1: sub r=reg256#15 # asm 2: vpand r=%ymm14 vpand %ymm13,%ymm1,%ymm14 # qhasm: r9 ^= r # asm 1: vpxor r=reg256#8 # asm 2: vpand r=%ymm7 vpand %ymm13,%ymm2,%ymm7 # qhasm: r8 ^= r # asm 1: vpxor r=reg256#8 # asm 2: vpand r=%ymm7 vpand %ymm13,%ymm4,%ymm7 # qhasm: r7 ^= r # asm 1: vpxor r=reg256#8 # asm 2: vpand r=%ymm7 vpand %ymm13,%ymm6,%ymm7 # qhasm: r6 ^= r # asm 1: vpxor r=reg256#8 # asm 2: vpand r=%ymm7 vpand %ymm13,%ymm8,%ymm7 # qhasm: r5 ^= r # asm 1: vpxor r=reg256#8 # asm 2: vpand r=%ymm7 vpand %ymm13,%ymm10,%ymm7 # qhasm: r4 ^= r # asm 1: vpxor r3=reg256#8 # asm 2: vpand r3=%ymm7 vpand %ymm13,%ymm12,%ymm7 # qhasm: b2 = mem128[ input_2 + 0 ] x2 # asm 1: vbroadcasti128 0(b2=reg256#14 # asm 2: vbroadcasti128 0(b2=%ymm13 vbroadcasti128 0(%rdx), %ymm13 # qhasm: input_2 -= input_3 # asm 1: sub r=reg256#15 # asm 2: vpand r=%ymm14 vpand %ymm13,%ymm1,%ymm14 # qhasm: r8 ^= r # asm 1: vpxor r=reg256#10 # asm 2: vpand r=%ymm9 vpand %ymm13,%ymm2,%ymm9 # qhasm: r7 ^= r # asm 1: vpxor r=reg256#10 # asm 2: vpand r=%ymm9 vpand %ymm13,%ymm4,%ymm9 # qhasm: r6 ^= r # asm 1: vpxor r=reg256#10 # asm 2: vpand r=%ymm9 vpand %ymm13,%ymm6,%ymm9 # qhasm: r5 ^= r # asm 1: vpxor r=reg256#10 # asm 2: vpand r=%ymm9 vpand %ymm13,%ymm8,%ymm9 # qhasm: r4 ^= r # asm 1: vpxor r=reg256#10 # asm 2: vpand r=%ymm9 vpand %ymm13,%ymm10,%ymm9 # qhasm: r3 ^= r # asm 1: vpxor r2=reg256#10 # asm 2: vpand r2=%ymm9 vpand %ymm13,%ymm12,%ymm9 # qhasm: b1 = mem128[ input_2 + 0 ] x2 # asm 1: vbroadcasti128 0(b1=reg256#14 # asm 2: vbroadcasti128 0(b1=%ymm13 vbroadcasti128 0(%rdx), %ymm13 # qhasm: input_2 -= input_3 # asm 1: sub r=reg256#15 # asm 2: vpand r=%ymm14 vpand %ymm13,%ymm1,%ymm14 # qhasm: r7 ^= r # asm 1: vpxor r=reg256#12 # asm 2: vpand r=%ymm11 vpand %ymm13,%ymm2,%ymm11 # qhasm: r6 ^= r # asm 1: vpxor r=reg256#12 # asm 2: vpand r=%ymm11 vpand %ymm13,%ymm4,%ymm11 # qhasm: r5 ^= r # asm 1: vpxor r=reg256#12 # asm 2: vpand r=%ymm11 vpand %ymm13,%ymm6,%ymm11 # qhasm: r4 ^= r # asm 1: vpxor r=reg256#12 # asm 2: vpand r=%ymm11 vpand %ymm13,%ymm8,%ymm11 # qhasm: r3 ^= r # asm 1: vpxor r=reg256#12 # asm 2: vpand r=%ymm11 vpand %ymm13,%ymm10,%ymm11 # qhasm: r2 ^= r # asm 1: vpxor r1=reg256#12 # asm 2: vpand r1=%ymm11 vpand %ymm13,%ymm12,%ymm11 # qhasm: b0 = mem128[ input_2 + 0 ] x2 # asm 1: vbroadcasti128 0(b0=reg256#14 # asm 2: vbroadcasti128 0(b0=%ymm13 vbroadcasti128 0(%rdx), %ymm13 # qhasm: input_2 -= input_3 # asm 1: sub r=reg256#2 # asm 2: vpand r=%ymm1 vpand %ymm13,%ymm1,%ymm1 # qhasm: r6 ^= r # asm 1: vpxor r=reg256#1 # asm 2: vpand r=%ymm0 vpand %ymm13,%ymm2,%ymm0 # qhasm: r5 ^= r # asm 1: vpxor r=reg256#1 # asm 2: vpand r=%ymm0 vpand %ymm13,%ymm4,%ymm0 # qhasm: r4 ^= r # asm 1: vpxor r=reg256#1 # asm 2: vpand r=%ymm0 vpand %ymm13,%ymm6,%ymm0 # qhasm: r3 ^= r # asm 1: vpxor r=reg256#1 # asm 2: vpand r=%ymm0 vpand %ymm13,%ymm8,%ymm0 # qhasm: r2 ^= r # asm 1: vpxor r=reg256#1 # asm 2: vpand r=%ymm0 vpand %ymm13,%ymm10,%ymm0 # qhasm: r1 ^= r # asm 1: vpxor r0=reg256#1 # asm 2: vpand r0=%ymm0 vpand %ymm13,%ymm12,%ymm0 # qhasm: mem256[ ptr + 160 ] = r5 # asm 1: vmovupd h24=reg128#1 # asm 2: movdqu 560(h24=%xmm0 movdqu 560(%r8),%xmm0 # qhasm: h11 = h24 # asm 1: movdqa h11=reg128#2 # asm 2: movdqa h11=%xmm1 movdqa %xmm0,%xmm1 # qhasm: h12 = h24 # asm 1: movdqa h12=reg128#3 # asm 2: movdqa h12=%xmm2 movdqa %xmm0,%xmm2 # qhasm: h14 = h24 # asm 1: movdqa h14=reg128#4 # asm 2: movdqa h14=%xmm3 movdqa %xmm0,%xmm3 # qhasm: h15 = h24 # asm 1: movdqa h15=reg128#1 # asm 2: movdqa h15=%xmm0 movdqa %xmm0,%xmm0 # qhasm: h23 = mem128[ ptr + 528 ] # asm 1: movdqu 528(h23=reg128#5 # asm 2: movdqu 528(h23=%xmm4 movdqu 528(%r8),%xmm4 # qhasm: h10 = h23 # asm 1: movdqa h10=reg128#6 # asm 2: movdqa h10=%xmm5 movdqa %xmm4,%xmm5 # qhasm: h11 = h11 ^ h23 # asm 1: vpxor h11=reg128#2 # asm 2: vpxor h11=%xmm1 vpxor %xmm4,%xmm1,%xmm1 # qhasm: h13 = h23 # asm 1: movdqa h13=reg128#7 # asm 2: movdqa h13=%xmm6 movdqa %xmm4,%xmm6 # qhasm: h14 = h14 ^ h23 # asm 1: vpxor h14=reg128#4 # asm 2: vpxor h14=%xmm3 vpxor %xmm4,%xmm3,%xmm3 # qhasm: h22 = mem128[ ptr + 496 ] # asm 1: movdqu 496(h22=reg128#5 # asm 2: movdqu 496(h22=%xmm4 movdqu 496(%r8),%xmm4 # qhasm: h9 = h22 # asm 1: movdqa h9=reg128#8 # asm 2: movdqa h9=%xmm7 movdqa %xmm4,%xmm7 # qhasm: h10 = h10 ^ h22 # asm 1: vpxor h10=reg128#6 # asm 2: vpxor h10=%xmm5 vpxor %xmm4,%xmm5,%xmm5 # qhasm: h12 = h12 ^ h22 # asm 1: vpxor h12=reg128#3 # asm 2: vpxor h12=%xmm2 vpxor %xmm4,%xmm2,%xmm2 # qhasm: h13 = h13 ^ h22 # asm 1: vpxor h13=reg128#5 # asm 2: vpxor h13=%xmm4 vpxor %xmm4,%xmm6,%xmm4 # qhasm: h21 = mem128[ ptr + 464 ] # asm 1: movdqu 464(h21=reg128#7 # asm 2: movdqu 464(h21=%xmm6 movdqu 464(%r8),%xmm6 # qhasm: h8 = h21 # asm 1: movdqa h8=reg128#9 # asm 2: movdqa h8=%xmm8 movdqa %xmm6,%xmm8 # qhasm: h9 = h9 ^ h21 # asm 1: vpxor h9=reg128#8 # asm 2: vpxor h9=%xmm7 vpxor %xmm6,%xmm7,%xmm7 # qhasm: h11 = h11 ^ h21 # asm 1: vpxor h11=reg128#2 # asm 2: vpxor h11=%xmm1 vpxor %xmm6,%xmm1,%xmm1 # qhasm: h12 = h12 ^ h21 # asm 1: vpxor h12=reg128#3 # asm 2: vpxor h12=%xmm2 vpxor %xmm6,%xmm2,%xmm2 # qhasm: h20 = mem128[ ptr + 432 ] # asm 1: movdqu 432(h20=reg128#7 # asm 2: movdqu 432(h20=%xmm6 movdqu 432(%r8),%xmm6 # qhasm: h7 = h20 # asm 1: movdqa h7=reg128#10 # asm 2: movdqa h7=%xmm9 movdqa %xmm6,%xmm9 # qhasm: h8 = h8 ^ h20 # asm 1: vpxor h8=reg128#9 # asm 2: vpxor h8=%xmm8 vpxor %xmm6,%xmm8,%xmm8 # qhasm: h10 = h10 ^ h20 # asm 1: vpxor h10=reg128#6 # asm 2: vpxor h10=%xmm5 vpxor %xmm6,%xmm5,%xmm5 # qhasm: h11 = h11 ^ h20 # asm 1: vpxor h11=reg128#2 # asm 2: vpxor h11=%xmm1 vpxor %xmm6,%xmm1,%xmm1 # qhasm: h19 = mem128[ ptr + 400 ] # asm 1: movdqu 400(h19=reg128#7 # asm 2: movdqu 400(h19=%xmm6 movdqu 400(%r8),%xmm6 # qhasm: h6 = h19 # asm 1: movdqa h6=reg128#11 # asm 2: movdqa h6=%xmm10 movdqa %xmm6,%xmm10 # qhasm: h7 = h7 ^ h19 # asm 1: vpxor h7=reg128#10 # asm 2: vpxor h7=%xmm9 vpxor %xmm6,%xmm9,%xmm9 # qhasm: h9 = h9 ^ h19 # asm 1: vpxor h9=reg128#8 # asm 2: vpxor h9=%xmm7 vpxor %xmm6,%xmm7,%xmm7 # qhasm: h10 = h10 ^ h19 # asm 1: vpxor h10=reg128#6 # asm 2: vpxor h10=%xmm5 vpxor %xmm6,%xmm5,%xmm5 # qhasm: h18 = mem128[ ptr + 368 ] # asm 1: movdqu 368(h18=reg128#7 # asm 2: movdqu 368(h18=%xmm6 movdqu 368(%r8),%xmm6 # qhasm: h18 = h18 ^ mem128[ ptr + 576 ] # asm 1: vpxor 576(h18=reg128#7 # asm 2: vpxor 576(h18=%xmm6 vpxor 576(%r8),%xmm6,%xmm6 # qhasm: h5 = h18 # asm 1: movdqa h5=reg128#12 # asm 2: movdqa h5=%xmm11 movdqa %xmm6,%xmm11 # qhasm: h6 = h6 ^ h18 # asm 1: vpxor h6=reg128#11 # asm 2: vpxor h6=%xmm10 vpxor %xmm6,%xmm10,%xmm10 # qhasm: h8 = h8 ^ h18 # asm 1: vpxor h8=reg128#9 # asm 2: vpxor h8=%xmm8 vpxor %xmm6,%xmm8,%xmm8 # qhasm: h9 = h9 ^ h18 # asm 1: vpxor h9=reg128#7 # asm 2: vpxor h9=%xmm6 vpxor %xmm6,%xmm7,%xmm6 # qhasm: h17 = mem128[ ptr + 336 ] # asm 1: movdqu 336(h17=reg128#8 # asm 2: movdqu 336(h17=%xmm7 movdqu 336(%r8),%xmm7 # qhasm: h17 = h17 ^ mem128[ ptr + 544 ] # asm 1: vpxor 544(h17=reg128#8 # asm 2: vpxor 544(h17=%xmm7 vpxor 544(%r8),%xmm7,%xmm7 # qhasm: h4 = h17 # asm 1: movdqa h4=reg128#13 # asm 2: movdqa h4=%xmm12 movdqa %xmm7,%xmm12 # qhasm: h5 = h5 ^ h17 # asm 1: vpxor h5=reg128#12 # asm 2: vpxor h5=%xmm11 vpxor %xmm7,%xmm11,%xmm11 # qhasm: h7 = h7 ^ h17 # asm 1: vpxor h7=reg128#10 # asm 2: vpxor h7=%xmm9 vpxor %xmm7,%xmm9,%xmm9 # qhasm: h8 = h8 ^ h17 # asm 1: vpxor h8=reg128#8 # asm 2: vpxor h8=%xmm7 vpxor %xmm7,%xmm8,%xmm7 # qhasm: h16 = mem128[ ptr + 304 ] # asm 1: movdqu 304(h16=reg128#9 # asm 2: movdqu 304(h16=%xmm8 movdqu 304(%r8),%xmm8 # qhasm: h16 = h16 ^ mem128[ ptr + 512 ] # asm 1: vpxor 512(h16=reg128#9 # asm 2: vpxor 512(h16=%xmm8 vpxor 512(%r8),%xmm8,%xmm8 # qhasm: h3 = h16 # asm 1: movdqa h3=reg128#14 # asm 2: movdqa h3=%xmm13 movdqa %xmm8,%xmm13 # qhasm: h4 = h4 ^ h16 # asm 1: vpxor h4=reg128#13 # asm 2: vpxor h4=%xmm12 vpxor %xmm8,%xmm12,%xmm12 # qhasm: h6 = h6 ^ h16 # asm 1: vpxor h6=reg128#11 # asm 2: vpxor h6=%xmm10 vpxor %xmm8,%xmm10,%xmm10 # qhasm: h7 = h7 ^ h16 # asm 1: vpxor h7=reg128#9 # asm 2: vpxor h7=%xmm8 vpxor %xmm8,%xmm9,%xmm8 # qhasm: h15 = h15 ^ mem128[ ptr + 272 ] # asm 1: vpxor 272(h15=reg128#1 # asm 2: vpxor 272(h15=%xmm0 vpxor 272(%r8),%xmm0,%xmm0 # qhasm: h15 = h15 ^ mem128[ ptr + 480 ] # asm 1: vpxor 480(h15=reg128#1 # asm 2: vpxor 480(h15=%xmm0 vpxor 480(%r8),%xmm0,%xmm0 # qhasm: h2 = h15 # asm 1: movdqa h2=reg128#10 # asm 2: movdqa h2=%xmm9 movdqa %xmm0,%xmm9 # qhasm: h3 = h3 ^ h15 # asm 1: vpxor h3=reg128#14 # asm 2: vpxor h3=%xmm13 vpxor %xmm0,%xmm13,%xmm13 # qhasm: h5 = h5 ^ h15 # asm 1: vpxor h5=reg128#12 # asm 2: vpxor h5=%xmm11 vpxor %xmm0,%xmm11,%xmm11 # qhasm: h6 = h6 ^ h15 # asm 1: vpxor h6=reg128#1 # asm 2: vpxor h6=%xmm0 vpxor %xmm0,%xmm10,%xmm0 # qhasm: h14 = h14 ^ mem128[ ptr + 240 ] # asm 1: vpxor 240(h14=reg128#4 # asm 2: vpxor 240(h14=%xmm3 vpxor 240(%r8),%xmm3,%xmm3 # qhasm: h14 = h14 ^ mem128[ ptr + 448 ] # asm 1: vpxor 448(h14=reg128#4 # asm 2: vpxor 448(h14=%xmm3 vpxor 448(%r8),%xmm3,%xmm3 # qhasm: h1 = h14 # asm 1: movdqa h1=reg128#11 # asm 2: movdqa h1=%xmm10 movdqa %xmm3,%xmm10 # qhasm: h2 = h2 ^ h14 # asm 1: vpxor h2=reg128#10 # asm 2: vpxor h2=%xmm9 vpxor %xmm3,%xmm9,%xmm9 # qhasm: h4 = h4 ^ h14 # asm 1: vpxor h4=reg128#13 # asm 2: vpxor h4=%xmm12 vpxor %xmm3,%xmm12,%xmm12 # qhasm: h5 = h5 ^ h14 # asm 1: vpxor h5=reg128#4 # asm 2: vpxor h5=%xmm3 vpxor %xmm3,%xmm11,%xmm3 # qhasm: h13 = h13 ^ mem128[ ptr + 208 ] # asm 1: vpxor 208(h13=reg128#5 # asm 2: vpxor 208(h13=%xmm4 vpxor 208(%r8),%xmm4,%xmm4 # qhasm: h13 = h13 ^ mem128[ ptr + 416 ] # asm 1: vpxor 416(h13=reg128#5 # asm 2: vpxor 416(h13=%xmm4 vpxor 416(%r8),%xmm4,%xmm4 # qhasm: h0 = h13 # asm 1: movdqa h0=reg128#12 # asm 2: movdqa h0=%xmm11 movdqa %xmm4,%xmm11 # qhasm: h1 = h1 ^ h13 # asm 1: vpxor h1=reg128#11 # asm 2: vpxor h1=%xmm10 vpxor %xmm4,%xmm10,%xmm10 # qhasm: h3 = h3 ^ h13 # asm 1: vpxor h3=reg128#14 # asm 2: vpxor h3=%xmm13 vpxor %xmm4,%xmm13,%xmm13 # qhasm: h4 = h4 ^ h13 # asm 1: vpxor h4=reg128#5 # asm 2: vpxor h4=%xmm4 vpxor %xmm4,%xmm12,%xmm4 # qhasm: h12 = h12 ^ mem128[ ptr + 384 ] # asm 1: vpxor 384(h12=reg128#3 # asm 2: vpxor 384(h12=%xmm2 vpxor 384(%r8),%xmm2,%xmm2 # qhasm: h12 = h12 ^ mem128[ ptr + 176 ] # asm 1: vpxor 176(h12=reg128#3 # asm 2: vpxor 176(h12=%xmm2 vpxor 176(%r8),%xmm2,%xmm2 # qhasm: mem128[ input_0 + 192 ] = h12 # asm 1: movdqu h11=reg128#2 # asm 2: vpxor 352(h11=%xmm1 vpxor 352(%r8),%xmm1,%xmm1 # qhasm: h11 = h11 ^ mem128[ ptr + 144 ] # asm 1: vpxor 144(h11=reg128#2 # asm 2: vpxor 144(h11=%xmm1 vpxor 144(%r8),%xmm1,%xmm1 # qhasm: mem128[ input_0 + 176 ] = h11 # asm 1: movdqu h10=reg128#2 # asm 2: vpxor 320(h10=%xmm1 vpxor 320(%r8),%xmm5,%xmm1 # qhasm: h10 = h10 ^ mem128[ ptr + 112 ] # asm 1: vpxor 112(h10=reg128#2 # asm 2: vpxor 112(h10=%xmm1 vpxor 112(%r8),%xmm1,%xmm1 # qhasm: mem128[ input_0 + 160 ] = h10 # asm 1: movdqu h9=reg128#2 # asm 2: vpxor 288(h9=%xmm1 vpxor 288(%r8),%xmm6,%xmm1 # qhasm: h9 = h9 ^ mem128[ ptr + 80 ] # asm 1: vpxor 80(h9=reg128#2 # asm 2: vpxor 80(h9=%xmm1 vpxor 80(%r8),%xmm1,%xmm1 # qhasm: mem128[ input_0 + 144 ] = h9 # asm 1: movdqu h8=reg128#2 # asm 2: vpxor 256(h8=%xmm1 vpxor 256(%r8),%xmm7,%xmm1 # qhasm: h8 = h8 ^ mem128[ ptr + 48 ] # asm 1: vpxor 48(h8=reg128#2 # asm 2: vpxor 48(h8=%xmm1 vpxor 48(%r8),%xmm1,%xmm1 # qhasm: mem128[ input_0 + 128 ] = h8 # asm 1: movdqu h7=reg128#2 # asm 2: vpxor 224(h7=%xmm1 vpxor 224(%r8),%xmm8,%xmm1 # qhasm: h7 = h7 ^ mem128[ ptr + 16 ] # asm 1: vpxor 16(h7=reg128#2 # asm 2: vpxor 16(h7=%xmm1 vpxor 16(%r8),%xmm1,%xmm1 # qhasm: mem128[ input_0 + 112 ] = h7 # asm 1: movdqu h6=reg128#1 # asm 2: vpxor 192(h6=%xmm0 vpxor 192(%r8),%xmm0,%xmm0 # qhasm: mem128[ input_0 + 96 ] = h6 # asm 1: movdqu h5=reg128#1 # asm 2: vpxor 160(h5=%xmm0 vpxor 160(%r8),%xmm3,%xmm0 # qhasm: mem128[ input_0 + 80 ] = h5 # asm 1: movdqu h4=reg128#1 # asm 2: vpxor 128(h4=%xmm0 vpxor 128(%r8),%xmm4,%xmm0 # qhasm: mem128[ input_0 + 64 ] = h4 # asm 1: movdqu h3=reg128#1 # asm 2: vpxor 96(h3=%xmm0 vpxor 96(%r8),%xmm13,%xmm0 # qhasm: mem128[ input_0 + 48 ] = h3 # asm 1: movdqu h2=reg128#1 # asm 2: vpxor 64(h2=%xmm0 vpxor 64(%r8),%xmm9,%xmm0 # qhasm: mem128[ input_0 + 32 ] = h2 # asm 1: movdqu h1=reg128#1 # asm 2: vpxor 32(h1=%xmm0 vpxor 32(%r8),%xmm10,%xmm0 # qhasm: mem128[ input_0 + 16 ] = h1 # asm 1: movdqu h0=reg128#1 # asm 2: vpxor 0(h0=%xmm0 vpxor 0(%r8),%xmm11,%xmm0 # qhasm: mem128[ input_0 + 0 ] = h0 # asm 1: movdqu