// 20240504 djb: add note.GNU-stack // 20221231 djb: port hidden to macos; tnx thom wiggers // 20221230 djb: add linker line // linker define vec128_mul_asm #include "crypto_asm_hidden.h" #define vec128_mul_asm CRYPTO_SHARED_NAMESPACE(vec128_mul_asm) #define _vec128_mul_asm _CRYPTO_SHARED_NAMESPACE(vec128_mul_asm) # qhasm: int64 input_0 # qhasm: int64 input_1 # qhasm: int64 input_2 # qhasm: int64 input_3 # qhasm: int64 input_4 # qhasm: int64 input_5 # qhasm: stack64 input_6 # qhasm: stack64 input_7 # qhasm: int64 caller_r11 # qhasm: int64 caller_r12 # qhasm: int64 caller_r13 # qhasm: int64 caller_r14 # qhasm: int64 caller_r15 # qhasm: int64 caller_rbx # qhasm: int64 caller_rbp # qhasm: reg256 b0 # qhasm: reg256 b1 # qhasm: reg256 b2 # qhasm: reg256 b3 # qhasm: reg256 b4 # qhasm: reg256 b5 # qhasm: reg256 b6 # qhasm: reg256 b7 # qhasm: reg256 b8 # qhasm: reg256 b9 # qhasm: reg256 b10 # qhasm: reg256 b11 # qhasm: reg256 a0 # qhasm: reg256 a1 # qhasm: reg256 a2 # qhasm: reg256 a3 # qhasm: reg256 a4 # qhasm: reg256 a5 # qhasm: reg256 r0 # qhasm: reg256 r1 # qhasm: reg256 r2 # qhasm: reg256 r3 # qhasm: reg256 r4 # qhasm: reg256 r5 # qhasm: reg256 r6 # qhasm: reg256 r7 # qhasm: reg256 r8 # qhasm: reg256 r9 # qhasm: reg256 r10 # qhasm: reg256 r11 # qhasm: reg256 r12 # qhasm: reg256 r13 # qhasm: reg256 r14 # qhasm: reg256 r15 # qhasm: reg256 r16 # qhasm: reg256 r17 # qhasm: reg256 r18 # qhasm: reg256 r19 # qhasm: reg256 r20 # qhasm: reg256 r21 # qhasm: reg256 r22 # qhasm: reg256 r # qhasm: reg128 h0 # qhasm: reg128 h1 # qhasm: reg128 h2 # qhasm: reg128 h3 # qhasm: reg128 h4 # qhasm: reg128 h5 # qhasm: reg128 h6 # qhasm: reg128 h7 # qhasm: reg128 h8 # qhasm: reg128 h9 # qhasm: reg128 h10 # qhasm: reg128 h11 # qhasm: reg128 h12 # qhasm: reg128 h13 # qhasm: reg128 h14 # qhasm: reg128 h15 # qhasm: reg128 h16 # qhasm: reg128 h17 # qhasm: reg128 h18 # qhasm: reg128 h19 # qhasm: reg128 h20 # qhasm: reg128 h21 # qhasm: reg128 h22 # qhasm: stack4864 buf # qhasm: int64 ptr # qhasm: int64 tmp # qhasm: enter vec128_mul_asm .p2align 5 ASM_HIDDEN _vec128_mul_asm ASM_HIDDEN vec128_mul_asm .global _vec128_mul_asm .global vec128_mul_asm _vec128_mul_asm: vec128_mul_asm: mov %rsp,%r11 and $31,%r11 add $608,%r11 sub %r11,%rsp # qhasm: ptr = &buf # asm 1: leaq ptr=int64#4 # asm 2: leaq ptr=%rcx leaq 0(%rsp),%rcx # qhasm: b11 = mem128[ input_2 + 176 ] x2 # asm 1: vbroadcasti128 176(b11=reg256#1 # asm 2: vbroadcasti128 176(b11=%ymm0 vbroadcasti128 176(%rdx), %ymm0 # qhasm: a5[0] = mem128[ input_1 + 80 ] # asm 1: vinsertf128 $0x0,80(r16=reg256#3 # asm 2: vpand r16=%ymm2 vpand %ymm0,%ymm1,%ymm2 # qhasm: mem256[ ptr + 512 ] = r16 # asm 1: vmovupd r15=reg256#4 # asm 2: vpand r15=%ymm3 vpand %ymm0,%ymm2,%ymm3 # qhasm: a3[0] = mem128[ input_1 + 48 ] # asm 1: vinsertf128 $0x0,48(r14=reg256#6 # asm 2: vpand r14=%ymm5 vpand %ymm0,%ymm4,%ymm5 # qhasm: a2[0] = mem128[ input_1 + 32 ] # asm 1: vinsertf128 $0x0,32(r13=reg256#8 # asm 2: vpand r13=%ymm7 vpand %ymm0,%ymm6,%ymm7 # qhasm: a1[0] = mem128[ input_1 + 16 ] # asm 1: vinsertf128 $0x0,16(r12=reg256#10 # asm 2: vpand r12=%ymm9 vpand %ymm0,%ymm8,%ymm9 # qhasm: a0[0] = mem128[ input_1 + 0 ] # asm 1: vinsertf128 $0x0,0(r11=reg256#1 # asm 2: vpand r11=%ymm0 vpand %ymm0,%ymm10,%ymm0 # qhasm: b10 = mem128[ input_2 + 160 ] x2 # asm 1: vbroadcasti128 160(b10=reg256#12 # asm 2: vbroadcasti128 160(b10=%ymm11 vbroadcasti128 160(%rdx), %ymm11 # qhasm: r = b10 & a5 # asm 1: vpand r=reg256#13 # asm 2: vpand r=%ymm12 vpand %ymm11,%ymm1,%ymm12 # qhasm: r15 ^= r # asm 1: vpxor r=reg256#4 # asm 2: vpand r=%ymm3 vpand %ymm11,%ymm2,%ymm3 # qhasm: r14 ^= r # asm 1: vpxor r=reg256#4 # asm 2: vpand r=%ymm3 vpand %ymm11,%ymm4,%ymm3 # qhasm: r13 ^= r # asm 1: vpxor r=reg256#4 # asm 2: vpand r=%ymm3 vpand %ymm11,%ymm6,%ymm3 # qhasm: r12 ^= r # asm 1: vpxor r=reg256#4 # asm 2: vpand r=%ymm3 vpand %ymm11,%ymm8,%ymm3 # qhasm: r11 ^= r # asm 1: vpxor r10=reg256#4 # asm 2: vpand r10=%ymm3 vpand %ymm11,%ymm10,%ymm3 # qhasm: b9 = mem128[ input_2 + 144 ] x2 # asm 1: vbroadcasti128 144(b9=reg256#12 # asm 2: vbroadcasti128 144(b9=%ymm11 vbroadcasti128 144(%rdx), %ymm11 # qhasm: r = b9 & a5 # asm 1: vpand r=reg256#13 # asm 2: vpand r=%ymm12 vpand %ymm11,%ymm1,%ymm12 # qhasm: r14 ^= r # asm 1: vpxor r=reg256#6 # asm 2: vpand r=%ymm5 vpand %ymm11,%ymm2,%ymm5 # qhasm: r13 ^= r # asm 1: vpxor r=reg256#6 # asm 2: vpand r=%ymm5 vpand %ymm11,%ymm4,%ymm5 # qhasm: r12 ^= r # asm 1: vpxor r=reg256#6 # asm 2: vpand r=%ymm5 vpand %ymm11,%ymm6,%ymm5 # qhasm: r11 ^= r # asm 1: vpxor r=reg256#6 # asm 2: vpand r=%ymm5 vpand %ymm11,%ymm8,%ymm5 # qhasm: r10 ^= r # asm 1: vpxor r9=reg256#6 # asm 2: vpand r9=%ymm5 vpand %ymm11,%ymm10,%ymm5 # qhasm: b8 = mem128[ input_2 + 128 ] x2 # asm 1: vbroadcasti128 128(b8=reg256#12 # asm 2: vbroadcasti128 128(b8=%ymm11 vbroadcasti128 128(%rdx), %ymm11 # qhasm: r = b8 & a5 # asm 1: vpand r=reg256#13 # asm 2: vpand r=%ymm12 vpand %ymm11,%ymm1,%ymm12 # qhasm: r13 ^= r # asm 1: vpxor r=reg256#8 # asm 2: vpand r=%ymm7 vpand %ymm11,%ymm2,%ymm7 # qhasm: r12 ^= r # asm 1: vpxor r=reg256#8 # asm 2: vpand r=%ymm7 vpand %ymm11,%ymm4,%ymm7 # qhasm: r11 ^= r # asm 1: vpxor r=reg256#8 # asm 2: vpand r=%ymm7 vpand %ymm11,%ymm6,%ymm7 # qhasm: r10 ^= r # asm 1: vpxor r=reg256#8 # asm 2: vpand r=%ymm7 vpand %ymm11,%ymm8,%ymm7 # qhasm: r9 ^= r # asm 1: vpxor r8=reg256#8 # asm 2: vpand r8=%ymm7 vpand %ymm11,%ymm10,%ymm7 # qhasm: b7 = mem128[ input_2 + 112 ] x2 # asm 1: vbroadcasti128 112(b7=reg256#12 # asm 2: vbroadcasti128 112(b7=%ymm11 vbroadcasti128 112(%rdx), %ymm11 # qhasm: r = b7 & a5 # asm 1: vpand r=reg256#13 # asm 2: vpand r=%ymm12 vpand %ymm11,%ymm1,%ymm12 # qhasm: r12 ^= r # asm 1: vpxor r=reg256#10 # asm 2: vpand r=%ymm9 vpand %ymm11,%ymm2,%ymm9 # qhasm: r11 ^= r # asm 1: vpxor r=reg256#10 # asm 2: vpand r=%ymm9 vpand %ymm11,%ymm4,%ymm9 # qhasm: r10 ^= r # asm 1: vpxor r=reg256#10 # asm 2: vpand r=%ymm9 vpand %ymm11,%ymm6,%ymm9 # qhasm: r9 ^= r # asm 1: vpxor r=reg256#10 # asm 2: vpand r=%ymm9 vpand %ymm11,%ymm8,%ymm9 # qhasm: r8 ^= r # asm 1: vpxor r7=reg256#10 # asm 2: vpand r7=%ymm9 vpand %ymm11,%ymm10,%ymm9 # qhasm: b6 = mem128[ input_2 + 96 ] x2 # asm 1: vbroadcasti128 96(b6=reg256#12 # asm 2: vbroadcasti128 96(b6=%ymm11 vbroadcasti128 96(%rdx), %ymm11 # qhasm: r = b6 & a5 # asm 1: vpand r=reg256#13 # asm 2: vpand r=%ymm12 vpand %ymm11,%ymm1,%ymm12 # qhasm: r11 ^= r # asm 1: vpxor r=reg256#1 # asm 2: vpand r=%ymm0 vpand %ymm11,%ymm2,%ymm0 # qhasm: r10 ^= r # asm 1: vpxor r=reg256#1 # asm 2: vpand r=%ymm0 vpand %ymm11,%ymm4,%ymm0 # qhasm: r9 ^= r # asm 1: vpxor r=reg256#1 # asm 2: vpand r=%ymm0 vpand %ymm11,%ymm6,%ymm0 # qhasm: r8 ^= r # asm 1: vpxor r=reg256#1 # asm 2: vpand r=%ymm0 vpand %ymm11,%ymm8,%ymm0 # qhasm: r7 ^= r # asm 1: vpxor r6=reg256#1 # asm 2: vpand r6=%ymm0 vpand %ymm11,%ymm10,%ymm0 # qhasm: b5 = mem128[ input_2 + 80 ] x2 # asm 1: vbroadcasti128 80(b5=reg256#12 # asm 2: vbroadcasti128 80(b5=%ymm11 vbroadcasti128 80(%rdx), %ymm11 # qhasm: r = b5 & a5 # asm 1: vpand r=reg256#13 # asm 2: vpand r=%ymm12 vpand %ymm11,%ymm1,%ymm12 # qhasm: r10 ^= r # asm 1: vpxor r=reg256#4 # asm 2: vpand r=%ymm3 vpand %ymm11,%ymm2,%ymm3 # qhasm: r9 ^= r # asm 1: vpxor r=reg256#4 # asm 2: vpand r=%ymm3 vpand %ymm11,%ymm4,%ymm3 # qhasm: r8 ^= r # asm 1: vpxor r=reg256#4 # asm 2: vpand r=%ymm3 vpand %ymm11,%ymm6,%ymm3 # qhasm: r7 ^= r # asm 1: vpxor r=reg256#4 # asm 2: vpand r=%ymm3 vpand %ymm11,%ymm8,%ymm3 # qhasm: r6 ^= r # asm 1: vpxor r5=reg256#4 # asm 2: vpand r5=%ymm3 vpand %ymm11,%ymm10,%ymm3 # qhasm: b4 = mem128[ input_2 + 64 ] x2 # asm 1: vbroadcasti128 64(b4=reg256#12 # asm 2: vbroadcasti128 64(b4=%ymm11 vbroadcasti128 64(%rdx), %ymm11 # qhasm: r = b4 & a5 # asm 1: vpand r=reg256#13 # asm 2: vpand r=%ymm12 vpand %ymm11,%ymm1,%ymm12 # qhasm: r9 ^= r # asm 1: vpxor r=reg256#6 # asm 2: vpand r=%ymm5 vpand %ymm11,%ymm2,%ymm5 # qhasm: r8 ^= r # asm 1: vpxor r=reg256#6 # asm 2: vpand r=%ymm5 vpand %ymm11,%ymm4,%ymm5 # qhasm: r7 ^= r # asm 1: vpxor r=reg256#6 # asm 2: vpand r=%ymm5 vpand %ymm11,%ymm6,%ymm5 # qhasm: r6 ^= r # asm 1: vpxor r=reg256#6 # asm 2: vpand r=%ymm5 vpand %ymm11,%ymm8,%ymm5 # qhasm: r5 ^= r # asm 1: vpxor r4=reg256#6 # asm 2: vpand r4=%ymm5 vpand %ymm11,%ymm10,%ymm5 # qhasm: b3 = mem128[ input_2 + 48 ] x2 # asm 1: vbroadcasti128 48(b3=reg256#12 # asm 2: vbroadcasti128 48(b3=%ymm11 vbroadcasti128 48(%rdx), %ymm11 # qhasm: r = b3 & a5 # asm 1: vpand r=reg256#13 # asm 2: vpand r=%ymm12 vpand %ymm11,%ymm1,%ymm12 # qhasm: r8 ^= r # asm 1: vpxor r=reg256#8 # asm 2: vpand r=%ymm7 vpand %ymm11,%ymm2,%ymm7 # qhasm: r7 ^= r # asm 1: vpxor r=reg256#8 # asm 2: vpand r=%ymm7 vpand %ymm11,%ymm4,%ymm7 # qhasm: r6 ^= r # asm 1: vpxor r=reg256#8 # asm 2: vpand r=%ymm7 vpand %ymm11,%ymm6,%ymm7 # qhasm: r5 ^= r # asm 1: vpxor r=reg256#8 # asm 2: vpand r=%ymm7 vpand %ymm11,%ymm8,%ymm7 # qhasm: r4 ^= r # asm 1: vpxor r3=reg256#8 # asm 2: vpand r3=%ymm7 vpand %ymm11,%ymm10,%ymm7 # qhasm: b2 = mem128[ input_2 + 32 ] x2 # asm 1: vbroadcasti128 32(b2=reg256#12 # asm 2: vbroadcasti128 32(b2=%ymm11 vbroadcasti128 32(%rdx), %ymm11 # qhasm: r = b2 & a5 # asm 1: vpand r=reg256#13 # asm 2: vpand r=%ymm12 vpand %ymm11,%ymm1,%ymm12 # qhasm: r7 ^= r # asm 1: vpxor r=reg256#10 # asm 2: vpand r=%ymm9 vpand %ymm11,%ymm2,%ymm9 # qhasm: r6 ^= r # asm 1: vpxor r=reg256#10 # asm 2: vpand r=%ymm9 vpand %ymm11,%ymm4,%ymm9 # qhasm: r5 ^= r # asm 1: vpxor r=reg256#10 # asm 2: vpand r=%ymm9 vpand %ymm11,%ymm6,%ymm9 # qhasm: r4 ^= r # asm 1: vpxor r=reg256#10 # asm 2: vpand r=%ymm9 vpand %ymm11,%ymm8,%ymm9 # qhasm: r3 ^= r # asm 1: vpxor r2=reg256#10 # asm 2: vpand r2=%ymm9 vpand %ymm11,%ymm10,%ymm9 # qhasm: b1 = mem128[ input_2 + 16 ] x2 # asm 1: vbroadcasti128 16(b1=reg256#12 # asm 2: vbroadcasti128 16(b1=%ymm11 vbroadcasti128 16(%rdx), %ymm11 # qhasm: r = b1 & a5 # asm 1: vpand r=reg256#13 # asm 2: vpand r=%ymm12 vpand %ymm11,%ymm1,%ymm12 # qhasm: r6 ^= r # asm 1: vpxor r=reg256#1 # asm 2: vpand r=%ymm0 vpand %ymm11,%ymm2,%ymm0 # qhasm: r5 ^= r # asm 1: vpxor r=reg256#1 # asm 2: vpand r=%ymm0 vpand %ymm11,%ymm4,%ymm0 # qhasm: r4 ^= r # asm 1: vpxor r=reg256#1 # asm 2: vpand r=%ymm0 vpand %ymm11,%ymm6,%ymm0 # qhasm: r3 ^= r # asm 1: vpxor r=reg256#1 # asm 2: vpand r=%ymm0 vpand %ymm11,%ymm8,%ymm0 # qhasm: r2 ^= r # asm 1: vpxor r1=reg256#1 # asm 2: vpand r1=%ymm0 vpand %ymm11,%ymm10,%ymm0 # qhasm: b0 = mem128[ input_2 + 0 ] x2 # asm 1: vbroadcasti128 0(b0=reg256#12 # asm 2: vbroadcasti128 0(b0=%ymm11 vbroadcasti128 0(%rdx), %ymm11 # qhasm: r = b0 & a5 # asm 1: vpand r=reg256#2 # asm 2: vpand r=%ymm1 vpand %ymm11,%ymm1,%ymm1 # qhasm: r5 ^= r # asm 1: vpxor r=reg256#2 # asm 2: vpand r=%ymm1 vpand %ymm11,%ymm2,%ymm1 # qhasm: r4 ^= r # asm 1: vpxor r=reg256#2 # asm 2: vpand r=%ymm1 vpand %ymm11,%ymm4,%ymm1 # qhasm: r3 ^= r # asm 1: vpxor r=reg256#2 # asm 2: vpand r=%ymm1 vpand %ymm11,%ymm6,%ymm1 # qhasm: r2 ^= r # asm 1: vpxor r=reg256#2 # asm 2: vpand r=%ymm1 vpand %ymm11,%ymm8,%ymm1 # qhasm: r1 ^= r # asm 1: vpxor r0=reg256#2 # asm 2: vpand r0=%ymm1 vpand %ymm11,%ymm10,%ymm1 # qhasm: mem256[ ptr + 128 ] = r4 # asm 1: vmovupd h22=reg128#1 # asm 2: movdqu 528(h22=%xmm0 movdqu 528(%rcx),%xmm0 # qhasm: h13 = h22 # asm 1: movdqa h13=reg128#2 # asm 2: movdqa h13=%xmm1 movdqa %xmm0,%xmm1 # qhasm: h10 = h22 # asm 1: movdqa h10=reg128#1 # asm 2: movdqa h10=%xmm0 movdqa %xmm0,%xmm0 # qhasm: h21 = mem128[ ptr + 496 ] # asm 1: movdqu 496(h21=reg128#3 # asm 2: movdqu 496(h21=%xmm2 movdqu 496(%rcx),%xmm2 # qhasm: h12 = h21 # asm 1: movdqa h12=reg128#4 # asm 2: movdqa h12=%xmm3 movdqa %xmm2,%xmm3 # qhasm: h9 = h21 # asm 1: movdqa h9=reg128#3 # asm 2: movdqa h9=%xmm2 movdqa %xmm2,%xmm2 # qhasm: h20 = mem128[ ptr + 464 ] # asm 1: movdqu 464(h20=reg128#5 # asm 2: movdqu 464(h20=%xmm4 movdqu 464(%rcx),%xmm4 # qhasm: h11 = h20 # asm 1: movdqa h11=reg128#6 # asm 2: movdqa h11=%xmm5 movdqa %xmm4,%xmm5 # qhasm: h8 = h20 # asm 1: movdqa h8=reg128#5 # asm 2: movdqa h8=%xmm4 movdqa %xmm4,%xmm4 # qhasm: h19 = mem128[ ptr + 432 ] # asm 1: movdqu 432(h19=reg128#7 # asm 2: movdqu 432(h19=%xmm6 movdqu 432(%rcx),%xmm6 # qhasm: h10 = h10 ^ h19 # asm 1: vpxor h10=reg128#1 # asm 2: vpxor h10=%xmm0 vpxor %xmm6,%xmm0,%xmm0 # qhasm: h7 = h19 # asm 1: movdqa h7=reg128#7 # asm 2: movdqa h7=%xmm6 movdqa %xmm6,%xmm6 # qhasm: h18 = mem128[ ptr + 400 ] # asm 1: movdqu 400(h18=reg128#8 # asm 2: movdqu 400(h18=%xmm7 movdqu 400(%rcx),%xmm7 # qhasm: h9 = h9 ^ h18 # asm 1: vpxor h9=reg128#3 # asm 2: vpxor h9=%xmm2 vpxor %xmm7,%xmm2,%xmm2 # qhasm: h6 = h18 # asm 1: movdqa h6=reg128#8 # asm 2: movdqa h6=%xmm7 movdqa %xmm7,%xmm7 # qhasm: h17 = mem128[ ptr + 368 ] # asm 1: movdqu 368(h17=reg128#9 # asm 2: movdqu 368(h17=%xmm8 movdqu 368(%rcx),%xmm8 # qhasm: h8 = h8 ^ h17 # asm 1: vpxor h8=reg128#5 # asm 2: vpxor h8=%xmm4 vpxor %xmm8,%xmm4,%xmm4 # qhasm: h5 = h17 # asm 1: movdqa h5=reg128#9 # asm 2: movdqa h5=%xmm8 movdqa %xmm8,%xmm8 # qhasm: h16 = mem128[ ptr + 336 ] # asm 1: movdqu 336(h16=reg128#10 # asm 2: movdqu 336(h16=%xmm9 movdqu 336(%rcx),%xmm9 # qhasm: h16 = h16 ^ mem128[ ptr + 512 ] # asm 1: vpxor 512(h16=reg128#10 # asm 2: vpxor 512(h16=%xmm9 vpxor 512(%rcx),%xmm9,%xmm9 # qhasm: h7 = h7 ^ h16 # asm 1: vpxor h7=reg128#7 # asm 2: vpxor h7=%xmm6 vpxor %xmm9,%xmm6,%xmm6 # qhasm: h4 = h16 # asm 1: movdqa h4=reg128#10 # asm 2: movdqa h4=%xmm9 movdqa %xmm9,%xmm9 # qhasm: h15 = mem128[ ptr + 304 ] # asm 1: movdqu 304(h15=reg128#11 # asm 2: movdqu 304(h15=%xmm10 movdqu 304(%rcx),%xmm10 # qhasm: h15 = h15 ^ mem128[ ptr + 480 ] # asm 1: vpxor 480(h15=reg128#11 # asm 2: vpxor 480(h15=%xmm10 vpxor 480(%rcx),%xmm10,%xmm10 # qhasm: h6 = h6 ^ h15 # asm 1: vpxor h6=reg128#8 # asm 2: vpxor h6=%xmm7 vpxor %xmm10,%xmm7,%xmm7 # qhasm: h3 = h15 # asm 1: movdqa h3=reg128#11 # asm 2: movdqa h3=%xmm10 movdqa %xmm10,%xmm10 # qhasm: h14 = mem128[ ptr + 272 ] # asm 1: movdqu 272(h14=reg128#12 # asm 2: movdqu 272(h14=%xmm11 movdqu 272(%rcx),%xmm11 # qhasm: h14 = h14 ^ mem128[ ptr + 448 ] # asm 1: vpxor 448(h14=reg128#12 # asm 2: vpxor 448(h14=%xmm11 vpxor 448(%rcx),%xmm11,%xmm11 # qhasm: h5 = h5 ^ h14 # asm 1: vpxor h5=reg128#9 # asm 2: vpxor h5=%xmm8 vpxor %xmm11,%xmm8,%xmm8 # qhasm: h2 = h14 # asm 1: movdqa h2=reg128#12 # asm 2: movdqa h2=%xmm11 movdqa %xmm11,%xmm11 # qhasm: h13 = h13 ^ mem128[ ptr + 240 ] # asm 1: vpxor 240(h13=reg128#2 # asm 2: vpxor 240(h13=%xmm1 vpxor 240(%rcx),%xmm1,%xmm1 # qhasm: h13 = h13 ^ mem128[ ptr + 416 ] # asm 1: vpxor 416(h13=reg128#2 # asm 2: vpxor 416(h13=%xmm1 vpxor 416(%rcx),%xmm1,%xmm1 # qhasm: h4 = h4 ^ h13 # asm 1: vpxor h4=reg128#10 # asm 2: vpxor h4=%xmm9 vpxor %xmm1,%xmm9,%xmm9 # qhasm: h1 = h13 # asm 1: movdqa h1=reg128#2 # asm 2: movdqa h1=%xmm1 movdqa %xmm1,%xmm1 # qhasm: h12 = h12 ^ mem128[ ptr + 208 ] # asm 1: vpxor 208(h12=reg128#4 # asm 2: vpxor 208(h12=%xmm3 vpxor 208(%rcx),%xmm3,%xmm3 # qhasm: h12 = h12 ^ mem128[ ptr + 384 ] # asm 1: vpxor 384(h12=reg128#4 # asm 2: vpxor 384(h12=%xmm3 vpxor 384(%rcx),%xmm3,%xmm3 # qhasm: h3 = h3 ^ h12 # asm 1: vpxor h3=reg128#11 # asm 2: vpxor h3=%xmm10 vpxor %xmm3,%xmm10,%xmm10 # qhasm: h0 = h12 # asm 1: movdqa h0=reg128#4 # asm 2: movdqa h0=%xmm3 movdqa %xmm3,%xmm3 # qhasm: h11 = h11 ^ mem128[ ptr + 352 ] # asm 1: vpxor 352(h11=reg128#6 # asm 2: vpxor 352(h11=%xmm5 vpxor 352(%rcx),%xmm5,%xmm5 # qhasm: h11 = h11 ^ mem128[ ptr + 176 ] # asm 1: vpxor 176(h11=reg128#6 # asm 2: vpxor 176(h11=%xmm5 vpxor 176(%rcx),%xmm5,%xmm5 # qhasm: mem128[ input_0 + 176 ] = h11 # asm 1: movdqu h10=reg128#1 # asm 2: vpxor 320(h10=%xmm0 vpxor 320(%rcx),%xmm0,%xmm0 # qhasm: h10 = h10 ^ mem128[ ptr + 144 ] # asm 1: vpxor 144(h10=reg128#1 # asm 2: vpxor 144(h10=%xmm0 vpxor 144(%rcx),%xmm0,%xmm0 # qhasm: mem128[ input_0 + 160 ] = h10 # asm 1: movdqu h9=reg128#1 # asm 2: vpxor 288(h9=%xmm0 vpxor 288(%rcx),%xmm2,%xmm0 # qhasm: h9 = h9 ^ mem128[ ptr + 112 ] # asm 1: vpxor 112(h9=reg128#1 # asm 2: vpxor 112(h9=%xmm0 vpxor 112(%rcx),%xmm0,%xmm0 # qhasm: mem128[ input_0 + 144 ] = h9 # asm 1: movdqu h8=reg128#1 # asm 2: vpxor 256(h8=%xmm0 vpxor 256(%rcx),%xmm4,%xmm0 # qhasm: h8 = h8 ^ mem128[ ptr + 80 ] # asm 1: vpxor 80(h8=reg128#1 # asm 2: vpxor 80(h8=%xmm0 vpxor 80(%rcx),%xmm0,%xmm0 # qhasm: mem128[ input_0 + 128 ] = h8 # asm 1: movdqu h7=reg128#1 # asm 2: vpxor 224(h7=%xmm0 vpxor 224(%rcx),%xmm6,%xmm0 # qhasm: h7 = h7 ^ mem128[ ptr + 48 ] # asm 1: vpxor 48(h7=reg128#1 # asm 2: vpxor 48(h7=%xmm0 vpxor 48(%rcx),%xmm0,%xmm0 # qhasm: mem128[ input_0 + 112 ] = h7 # asm 1: movdqu h6=reg128#1 # asm 2: vpxor 192(h6=%xmm0 vpxor 192(%rcx),%xmm7,%xmm0 # qhasm: h6 = h6 ^ mem128[ ptr + 16 ] # asm 1: vpxor 16(h6=reg128#1 # asm 2: vpxor 16(h6=%xmm0 vpxor 16(%rcx),%xmm0,%xmm0 # qhasm: mem128[ input_0 + 96 ] = h6 # asm 1: movdqu h5=reg128#1 # asm 2: vpxor 160(h5=%xmm0 vpxor 160(%rcx),%xmm8,%xmm0 # qhasm: mem128[ input_0 + 80 ] = h5 # asm 1: movdqu h4=reg128#1 # asm 2: vpxor 128(h4=%xmm0 vpxor 128(%rcx),%xmm9,%xmm0 # qhasm: mem128[ input_0 + 64 ] = h4 # asm 1: movdqu h3=reg128#1 # asm 2: vpxor 96(h3=%xmm0 vpxor 96(%rcx),%xmm10,%xmm0 # qhasm: mem128[ input_0 + 48 ] = h3 # asm 1: movdqu h2=reg128#1 # asm 2: vpxor 64(h2=%xmm0 vpxor 64(%rcx),%xmm11,%xmm0 # qhasm: mem128[ input_0 + 32 ] = h2 # asm 1: movdqu h1=reg128#1 # asm 2: vpxor 32(h1=%xmm0 vpxor 32(%rcx),%xmm1,%xmm0 # qhasm: mem128[ input_0 + 16 ] = h1 # asm 1: movdqu h0=reg128#1 # asm 2: vpxor 0(h0=%xmm0 vpxor 0(%rcx),%xmm3,%xmm0 # qhasm: mem128[ input_0 + 0 ] = h0 # asm 1: movdqu