OPTION DOTNAME .text$ SEGMENT ALIGN(256) 'CODE' EXTERN OPENSSL_ia32cap_P:NEAR PUBLIC sha1_multi_block ALIGN 32 sha1_multi_block PROC PUBLIC mov QWORD PTR[8+rsp],rdi ;WIN64 prologue mov QWORD PTR[16+rsp],rsi mov rax,rsp $L$SEH_begin_sha1_multi_block:: mov rdi,rcx mov rsi,rdx mov rdx,r8 mov rcx,QWORD PTR[((OPENSSL_ia32cap_P+4))] bt rcx,61 jc _shaext_shortcut test ecx,268435456 jnz _avx_shortcut mov rax,rsp push rbx push rbp lea rsp,QWORD PTR[((-168))+rsp] movaps XMMWORD PTR[rsp],xmm6 movaps XMMWORD PTR[16+rsp],xmm7 movaps XMMWORD PTR[32+rsp],xmm8 movaps XMMWORD PTR[48+rsp],xmm9 movaps XMMWORD PTR[(-120)+rax],xmm10 movaps XMMWORD PTR[(-104)+rax],xmm11 movaps XMMWORD PTR[(-88)+rax],xmm12 movaps XMMWORD PTR[(-72)+rax],xmm13 movaps XMMWORD PTR[(-56)+rax],xmm14 movaps XMMWORD PTR[(-40)+rax],xmm15 sub rsp,288 and rsp,-256 mov QWORD PTR[272+rsp],rax $L$body:: lea rbp,QWORD PTR[K_XX_XX] lea rbx,QWORD PTR[256+rsp] $L$oop_grande:: mov DWORD PTR[280+rsp],edx xor edx,edx mov r8,QWORD PTR[rsi] mov ecx,DWORD PTR[8+rsi] cmp ecx,edx cmovg edx,ecx test ecx,ecx mov DWORD PTR[rbx],ecx cmovle r8,rbp mov r9,QWORD PTR[16+rsi] mov ecx,DWORD PTR[24+rsi] cmp ecx,edx cmovg edx,ecx test ecx,ecx mov DWORD PTR[4+rbx],ecx cmovle r9,rbp mov r10,QWORD PTR[32+rsi] mov ecx,DWORD PTR[40+rsi] cmp ecx,edx cmovg edx,ecx test ecx,ecx mov DWORD PTR[8+rbx],ecx cmovle r10,rbp mov r11,QWORD PTR[48+rsi] mov ecx,DWORD PTR[56+rsi] cmp ecx,edx cmovg edx,ecx test ecx,ecx mov DWORD PTR[12+rbx],ecx cmovle r11,rbp test edx,edx jz $L$done movdqu xmm10,XMMWORD PTR[rdi] lea rax,QWORD PTR[128+rsp] movdqu xmm11,XMMWORD PTR[32+rdi] movdqu xmm12,XMMWORD PTR[64+rdi] movdqu xmm13,XMMWORD PTR[96+rdi] movdqu xmm14,XMMWORD PTR[128+rdi] movdqa xmm5,XMMWORD PTR[96+rbp] movdqa xmm15,XMMWORD PTR[((-32))+rbp] jmp $L$oop ALIGN 32 $L$oop:: movd xmm0,DWORD PTR[r8] lea r8,QWORD PTR[64+r8] movd xmm2,DWORD PTR[r9] lea r9,QWORD PTR[64+r9] movd xmm3,DWORD PTR[r10] lea r10,QWORD PTR[64+r10] movd xmm4,DWORD PTR[r11] lea r11,QWORD PTR[64+r11] punpckldq xmm0,xmm3 movd xmm1,DWORD PTR[((-60))+r8] punpckldq xmm2,xmm4 movd xmm9,DWORD PTR[((-60))+r9] punpckldq xmm0,xmm2 movd xmm8,DWORD PTR[((-60))+r10] DB 102,15,56,0,197 movd xmm7,DWORD PTR[((-60))+r11] punpckldq xmm1,xmm8 movdqa xmm8,xmm10 paddd xmm14,xmm15 punpckldq xmm9,xmm7 movdqa xmm7,xmm11 movdqa xmm6,xmm11 pslld xmm8,5 pandn xmm7,xmm13 pand xmm6,xmm12 punpckldq xmm1,xmm9 movdqa xmm9,xmm10 movdqa XMMWORD PTR[(0-128)+rax],xmm0 paddd xmm14,xmm0 movd xmm2,DWORD PTR[((-56))+r8] psrld xmm9,27 pxor xmm6,xmm7 movdqa xmm7,xmm11 por xmm8,xmm9 movd xmm9,DWORD PTR[((-56))+r9] pslld xmm7,30 paddd xmm14,xmm6 psrld xmm11,2 paddd xmm14,xmm8 DB 102,15,56,0,205 movd xmm8,DWORD PTR[((-56))+r10] por xmm11,xmm7 movd xmm7,DWORD PTR[((-56))+r11] punpckldq xmm2,xmm8 movdqa xmm8,xmm14 paddd xmm13,xmm15 punpckldq xmm9,xmm7 movdqa xmm7,xmm10 movdqa xmm6,xmm10 pslld xmm8,5 pandn xmm7,xmm12 pand xmm6,xmm11 punpckldq xmm2,xmm9 movdqa xmm9,xmm14 movdqa XMMWORD PTR[(16-128)+rax],xmm1 paddd xmm13,xmm1 movd xmm3,DWORD PTR[((-52))+r8] psrld xmm9,27 pxor xmm6,xmm7 movdqa xmm7,xmm10 por xmm8,xmm9 movd xmm9,DWORD PTR[((-52))+r9] pslld xmm7,30 paddd xmm13,xmm6 psrld xmm10,2 paddd xmm13,xmm8 DB 102,15,56,0,213 movd xmm8,DWORD PTR[((-52))+r10] por xmm10,xmm7 movd xmm7,DWORD PTR[((-52))+r11] punpckldq xmm3,xmm8 movdqa xmm8,xmm13 paddd xmm12,xmm15 punpckldq xmm9,xmm7 movdqa xmm7,xmm14 movdqa xmm6,xmm14 pslld xmm8,5 pandn xmm7,xmm11 pand xmm6,xmm10 punpckldq xmm3,xmm9 movdqa xmm9,xmm13 movdqa XMMWORD PTR[(32-128)+rax],xmm2 paddd xmm12,xmm2 movd xmm4,DWORD PTR[((-48))+r8] psrld xmm9,27 pxor xmm6,xmm7 movdqa xmm7,xmm14 por xmm8,xmm9 movd xmm9,DWORD PTR[((-48))+r9] pslld xmm7,30 paddd xmm12,xmm6 psrld xmm14,2 paddd xmm12,xmm8 DB 102,15,56,0,221 movd xmm8,DWORD PTR[((-48))+r10] por xmm14,xmm7 movd xmm7,DWORD PTR[((-48))+r11] punpckldq xmm4,xmm8 movdqa xmm8,xmm12 paddd xmm11,xmm15 punpckldq xmm9,xmm7 movdqa xmm7,xmm13 movdqa xmm6,xmm13 pslld xmm8,5 pandn xmm7,xmm10 pand xmm6,xmm14 punpckldq xmm4,xmm9 movdqa xmm9,xmm12 movdqa XMMWORD PTR[(48-128)+rax],xmm3 paddd xmm11,xmm3 movd xmm0,DWORD PTR[((-44))+r8] psrld xmm9,27 pxor xmm6,xmm7 movdqa xmm7,xmm13 por xmm8,xmm9 movd xmm9,DWORD PTR[((-44))+r9] pslld xmm7,30 paddd xmm11,xmm6 psrld xmm13,2 paddd xmm11,xmm8 DB 102,15,56,0,229 movd xmm8,DWORD PTR[((-44))+r10] por xmm13,xmm7 movd xmm7,DWORD PTR[((-44))+r11] punpckldq xmm0,xmm8 movdqa xmm8,xmm11 paddd xmm10,xmm15 punpckldq xmm9,xmm7 movdqa xmm7,xmm12 movdqa xmm6,xmm12 pslld xmm8,5 pandn xmm7,xmm14 pand xmm6,xmm13 punpckldq xmm0,xmm9 movdqa xmm9,xmm11 movdqa XMMWORD PTR[(64-128)+rax],xmm4 paddd xmm10,xmm4 movd xmm1,DWORD PTR[((-40))+r8] psrld xmm9,27 pxor xmm6,xmm7 movdqa xmm7,xmm12 por xmm8,xmm9 movd xmm9,DWORD PTR[((-40))+r9] pslld xmm7,30 paddd xmm10,xmm6 psrld xmm12,2 paddd xmm10,xmm8 DB 102,15,56,0,197 movd xmm8,DWORD PTR[((-40))+r10] por xmm12,xmm7 movd xmm7,DWORD PTR[((-40))+r11] punpckldq xmm1,xmm8 movdqa xmm8,xmm10 paddd xmm14,xmm15 punpckldq xmm9,xmm7 movdqa xmm7,xmm11 movdqa xmm6,xmm11 pslld xmm8,5 pandn xmm7,xmm13 pand xmm6,xmm12 punpckldq xmm1,xmm9 movdqa xmm9,xmm10 movdqa XMMWORD PTR[(80-128)+rax],xmm0 paddd xmm14,xmm0 movd xmm2,DWORD PTR[((-36))+r8] psrld xmm9,27 pxor xmm6,xmm7 movdqa xmm7,xmm11 por xmm8,xmm9 movd xmm9,DWORD PTR[((-36))+r9] pslld xmm7,30 paddd xmm14,xmm6 psrld xmm11,2 paddd xmm14,xmm8 DB 102,15,56,0,205 movd xmm8,DWORD PTR[((-36))+r10] por xmm11,xmm7 movd xmm7,DWORD PTR[((-36))+r11] punpckldq xmm2,xmm8 movdqa xmm8,xmm14 paddd xmm13,xmm15 punpckldq xmm9,xmm7 movdqa xmm7,xmm10 movdqa xmm6,xmm10 pslld xmm8,5 pandn xmm7,xmm12 pand xmm6,xmm11 punpckldq xmm2,xmm9 movdqa xmm9,xmm14 movdqa XMMWORD PTR[(96-128)+rax],xmm1 paddd xmm13,xmm1 movd xmm3,DWORD PTR[((-32))+r8] psrld xmm9,27 pxor xmm6,xmm7 movdqa xmm7,xmm10 por xmm8,xmm9 movd xmm9,DWORD PTR[((-32))+r9] pslld xmm7,30 paddd xmm13,xmm6 psrld xmm10,2 paddd xmm13,xmm8 DB 102,15,56,0,213 movd xmm8,DWORD PTR[((-32))+r10] por xmm10,xmm7 movd xmm7,DWORD PTR[((-32))+r11] punpckldq xmm3,xmm8 movdqa xmm8,xmm13 paddd xmm12,xmm15 punpckldq xmm9,xmm7 movdqa xmm7,xmm14 movdqa xmm6,xmm14 pslld xmm8,5 pandn xmm7,xmm11 pand xmm6,xmm10 punpckldq xmm3,xmm9 movdqa xmm9,xmm13 movdqa XMMWORD PTR[(112-128)+rax],xmm2 paddd xmm12,xmm2 movd xmm4,DWORD PTR[((-28))+r8] psrld xmm9,27 pxor xmm6,xmm7 movdqa xmm7,xmm14 por xmm8,xmm9 movd xmm9,DWORD PTR[((-28))+r9] pslld xmm7,30 paddd xmm12,xmm6 psrld xmm14,2 paddd xmm12,xmm8 DB 102,15,56,0,221 movd xmm8,DWORD PTR[((-28))+r10] por xmm14,xmm7 movd xmm7,DWORD PTR[((-28))+r11] punpckldq xmm4,xmm8 movdqa xmm8,xmm12 paddd xmm11,xmm15 punpckldq xmm9,xmm7 movdqa xmm7,xmm13 movdqa xmm6,xmm13 pslld xmm8,5 pandn xmm7,xmm10 pand xmm6,xmm14 punpckldq xmm4,xmm9 movdqa xmm9,xmm12 movdqa XMMWORD PTR[(128-128)+rax],xmm3 paddd xmm11,xmm3 movd xmm0,DWORD PTR[((-24))+r8] psrld xmm9,27 pxor xmm6,xmm7 movdqa xmm7,xmm13 por xmm8,xmm9 movd xmm9,DWORD PTR[((-24))+r9] pslld xmm7,30 paddd xmm11,xmm6 psrld xmm13,2 paddd xmm11,xmm8 DB 102,15,56,0,229 movd xmm8,DWORD PTR[((-24))+r10] por xmm13,xmm7 movd xmm7,DWORD PTR[((-24))+r11] punpckldq xmm0,xmm8 movdqa xmm8,xmm11 paddd xmm10,xmm15 punpckldq xmm9,xmm7 movdqa xmm7,xmm12 movdqa xmm6,xmm12 pslld xmm8,5 pandn xmm7,xmm14 pand xmm6,xmm13 punpckldq xmm0,xmm9 movdqa xmm9,xmm11 movdqa XMMWORD PTR[(144-128)+rax],xmm4 paddd xmm10,xmm4 movd xmm1,DWORD PTR[((-20))+r8] psrld xmm9,27 pxor xmm6,xmm7 movdqa xmm7,xmm12 por xmm8,xmm9 movd xmm9,DWORD PTR[((-20))+r9] pslld xmm7,30 paddd xmm10,xmm6 psrld xmm12,2 paddd xmm10,xmm8 DB 102,15,56,0,197 movd xmm8,DWORD PTR[((-20))+r10] por xmm12,xmm7 movd xmm7,DWORD PTR[((-20))+r11] punpckldq xmm1,xmm8 movdqa xmm8,xmm10 paddd xmm14,xmm15 punpckldq xmm9,xmm7 movdqa xmm7,xmm11 movdqa xmm6,xmm11 pslld xmm8,5 pandn xmm7,xmm13 pand xmm6,xmm12 punpckldq xmm1,xmm9 movdqa xmm9,xmm10 movdqa XMMWORD PTR[(160-128)+rax],xmm0 paddd xmm14,xmm0 movd xmm2,DWORD PTR[((-16))+r8] psrld xmm9,27 pxor xmm6,xmm7 movdqa xmm7,xmm11 por xmm8,xmm9 movd xmm9,DWORD PTR[((-16))+r9] pslld xmm7,30 paddd xmm14,xmm6 psrld xmm11,2 paddd xmm14,xmm8 DB 102,15,56,0,205 movd xmm8,DWORD PTR[((-16))+r10] por xmm11,xmm7 movd xmm7,DWORD PTR[((-16))+r11] punpckldq xmm2,xmm8 movdqa xmm8,xmm14 paddd xmm13,xmm15 punpckldq xmm9,xmm7 movdqa xmm7,xmm10 movdqa xmm6,xmm10 pslld xmm8,5 pandn xmm7,xmm12 pand xmm6,xmm11 punpckldq xmm2,xmm9 movdqa xmm9,xmm14 movdqa XMMWORD PTR[(176-128)+rax],xmm1 paddd xmm13,xmm1 movd xmm3,DWORD PTR[((-12))+r8] psrld xmm9,27 pxor xmm6,xmm7 movdqa xmm7,xmm10 por xmm8,xmm9 movd xmm9,DWORD PTR[((-12))+r9] pslld xmm7,30 paddd xmm13,xmm6 psrld xmm10,2 paddd xmm13,xmm8 DB 102,15,56,0,213 movd xmm8,DWORD PTR[((-12))+r10] por xmm10,xmm7 movd xmm7,DWORD PTR[((-12))+r11] punpckldq xmm3,xmm8 movdqa xmm8,xmm13 paddd xmm12,xmm15 punpckldq xmm9,xmm7 movdqa xmm7,xmm14 movdqa xmm6,xmm14 pslld xmm8,5 pandn xmm7,xmm11 pand xmm6,xmm10 punpckldq xmm3,xmm9 movdqa xmm9,xmm13 movdqa XMMWORD PTR[(192-128)+rax],xmm2 paddd xmm12,xmm2 movd xmm4,DWORD PTR[((-8))+r8] psrld xmm9,27 pxor xmm6,xmm7 movdqa xmm7,xmm14 por xmm8,xmm9 movd xmm9,DWORD PTR[((-8))+r9] pslld xmm7,30 paddd xmm12,xmm6 psrld xmm14,2 paddd xmm12,xmm8 DB 102,15,56,0,221 movd xmm8,DWORD PTR[((-8))+r10] por xmm14,xmm7 movd xmm7,DWORD PTR[((-8))+r11] punpckldq xmm4,xmm8 movdqa xmm8,xmm12 paddd xmm11,xmm15 punpckldq xmm9,xmm7 movdqa xmm7,xmm13 movdqa xmm6,xmm13 pslld xmm8,5 pandn xmm7,xmm10 pand xmm6,xmm14 punpckldq xmm4,xmm9 movdqa xmm9,xmm12 movdqa XMMWORD PTR[(208-128)+rax],xmm3 paddd xmm11,xmm3 movd xmm0,DWORD PTR[((-4))+r8] psrld xmm9,27 pxor xmm6,xmm7 movdqa xmm7,xmm13 por xmm8,xmm9 movd xmm9,DWORD PTR[((-4))+r9] pslld xmm7,30 paddd xmm11,xmm6 psrld xmm13,2 paddd xmm11,xmm8 DB 102,15,56,0,229 movd xmm8,DWORD PTR[((-4))+r10] por xmm13,xmm7 movdqa xmm1,XMMWORD PTR[((0-128))+rax] movd xmm7,DWORD PTR[((-4))+r11] punpckldq xmm0,xmm8 movdqa xmm8,xmm11 paddd xmm10,xmm15 punpckldq xmm9,xmm7 movdqa xmm7,xmm12 movdqa xmm6,xmm12 pslld xmm8,5 prefetcht0 [63+r8] pandn xmm7,xmm14 pand xmm6,xmm13 punpckldq xmm0,xmm9 movdqa xmm9,xmm11 movdqa XMMWORD PTR[(224-128)+rax],xmm4 paddd xmm10,xmm4 psrld xmm9,27 pxor xmm6,xmm7 movdqa xmm7,xmm12 prefetcht0 [63+r9] por xmm8,xmm9 pslld xmm7,30 paddd xmm10,xmm6 prefetcht0 [63+r10] psrld xmm12,2 paddd xmm10,xmm8 DB 102,15,56,0,197 prefetcht0 [63+r11] por xmm12,xmm7 movdqa xmm2,XMMWORD PTR[((16-128))+rax] pxor xmm1,xmm3 movdqa xmm3,XMMWORD PTR[((32-128))+rax] movdqa xmm8,xmm10 pxor xmm1,XMMWORD PTR[((128-128))+rax] paddd xmm14,xmm15 movdqa xmm7,xmm11 pslld xmm8,5 pxor xmm1,xmm3 movdqa xmm6,xmm11 pandn xmm7,xmm13 movdqa xmm5,xmm1 pand xmm6,xmm12 movdqa xmm9,xmm10 psrld xmm5,31 paddd xmm1,xmm1 movdqa XMMWORD PTR[(240-128)+rax],xmm0 paddd xmm14,xmm0 psrld xmm9,27 pxor xmm6,xmm7 movdqa xmm7,xmm11 por xmm8,xmm9 pslld xmm7,30 paddd xmm14,xmm6 psrld xmm11,2 paddd xmm14,xmm8 por xmm1,xmm5 por xmm11,xmm7 pxor xmm2,xmm4 movdqa xmm4,XMMWORD PTR[((48-128))+rax] movdqa xmm8,xmm14 pxor xmm2,XMMWORD PTR[((144-128))+rax] paddd xmm13,xmm15 movdqa xmm7,xmm10 pslld xmm8,5 pxor xmm2,xmm4 movdqa xmm6,xmm10 pandn xmm7,xmm12 movdqa xmm5,xmm2 pand xmm6,xmm11 movdqa xmm9,xmm14 psrld xmm5,31 paddd xmm2,xmm2 movdqa XMMWORD PTR[(0-128)+rax],xmm1 paddd xmm13,xmm1 psrld xmm9,27 pxor xmm6,xmm7 movdqa xmm7,xmm10 por xmm8,xmm9 pslld xmm7,30 paddd xmm13,xmm6 psrld xmm10,2 paddd xmm13,xmm8 por xmm2,xmm5 por xmm10,xmm7 pxor xmm3,xmm0 movdqa xmm0,XMMWORD PTR[((64-128))+rax] movdqa xmm8,xmm13 pxor xmm3,XMMWORD PTR[((160-128))+rax] paddd xmm12,xmm15 movdqa xmm7,xmm14 pslld xmm8,5 pxor xmm3,xmm0 movdqa xmm6,xmm14 pandn xmm7,xmm11 movdqa xmm5,xmm3 pand xmm6,xmm10 movdqa xmm9,xmm13 psrld xmm5,31 paddd xmm3,xmm3 movdqa XMMWORD PTR[(16-128)+rax],xmm2 paddd xmm12,xmm2 psrld xmm9,27 pxor xmm6,xmm7 movdqa xmm7,xmm14 por xmm8,xmm9 pslld xmm7,30 paddd xmm12,xmm6 psrld xmm14,2 paddd xmm12,xmm8 por xmm3,xmm5 por xmm14,xmm7 pxor xmm4,xmm1 movdqa xmm1,XMMWORD PTR[((80-128))+rax] movdqa xmm8,xmm12 pxor xmm4,XMMWORD PTR[((176-128))+rax] paddd xmm11,xmm15 movdqa xmm7,xmm13 pslld xmm8,5 pxor xmm4,xmm1 movdqa xmm6,xmm13 pandn xmm7,xmm10 movdqa xmm5,xmm4 pand xmm6,xmm14 movdqa xmm9,xmm12 psrld xmm5,31 paddd xmm4,xmm4 movdqa XMMWORD PTR[(32-128)+rax],xmm3 paddd xmm11,xmm3 psrld xmm9,27 pxor xmm6,xmm7 movdqa xmm7,xmm13 por xmm8,xmm9 pslld xmm7,30 paddd xmm11,xmm6 psrld xmm13,2 paddd xmm11,xmm8 por xmm4,xmm5 por xmm13,xmm7 pxor xmm0,xmm2 movdqa xmm2,XMMWORD PTR[((96-128))+rax] movdqa xmm8,xmm11 pxor xmm0,XMMWORD PTR[((192-128))+rax] paddd xmm10,xmm15 movdqa xmm7,xmm12 pslld xmm8,5 pxor xmm0,xmm2 movdqa xmm6,xmm12 pandn xmm7,xmm14 movdqa xmm5,xmm0 pand xmm6,xmm13 movdqa xmm9,xmm11 psrld xmm5,31 paddd xmm0,xmm0 movdqa XMMWORD PTR[(48-128)+rax],xmm4 paddd xmm10,xmm4 psrld xmm9,27 pxor xmm6,xmm7 movdqa xmm7,xmm12 por xmm8,xmm9 pslld xmm7,30 paddd xmm10,xmm6 psrld xmm12,2 paddd xmm10,xmm8 por xmm0,xmm5 por xmm12,xmm7 movdqa xmm15,XMMWORD PTR[rbp] pxor xmm1,xmm3 movdqa xmm3,XMMWORD PTR[((112-128))+rax] movdqa xmm8,xmm10 movdqa xmm6,xmm13 pxor xmm1,XMMWORD PTR[((208-128))+rax] paddd xmm14,xmm15 pslld xmm8,5 pxor xmm6,xmm11 movdqa xmm9,xmm10 movdqa XMMWORD PTR[(64-128)+rax],xmm0 paddd xmm14,xmm0 pxor xmm1,xmm3 psrld xmm9,27 pxor xmm6,xmm12 movdqa xmm7,xmm11 pslld xmm7,30 movdqa xmm5,xmm1 por xmm8,xmm9 psrld xmm5,31 paddd xmm14,xmm6 paddd xmm1,xmm1 psrld xmm11,2 paddd xmm14,xmm8 por xmm1,xmm5 por xmm11,xmm7 pxor xmm2,xmm4 movdqa xmm4,XMMWORD PTR[((128-128))+rax] movdqa xmm8,xmm14 movdqa xmm6,xmm12 pxor xmm2,XMMWORD PTR[((224-128))+rax] paddd xmm13,xmm15 pslld xmm8,5 pxor xmm6,xmm10 movdqa xmm9,xmm14 movdqa XMMWORD PTR[(80-128)+rax],xmm1 paddd xmm13,xmm1 pxor xmm2,xmm4 psrld xmm9,27 pxor xmm6,xmm11 movdqa xmm7,xmm10 pslld xmm7,30 movdqa xmm5,xmm2 por xmm8,xmm9 psrld xmm5,31 paddd xmm13,xmm6 paddd xmm2,xmm2 psrld xmm10,2 paddd xmm13,xmm8 por xmm2,xmm5 por xmm10,xmm7 pxor xmm3,xmm0 movdqa xmm0,XMMWORD PTR[((144-128))+rax] movdqa xmm8,xmm13 movdqa xmm6,xmm11 pxor xmm3,XMMWORD PTR[((240-128))+rax] paddd xmm12,xmm15 pslld xmm8,5 pxor xmm6,xmm14 movdqa xmm9,xmm13 movdqa XMMWORD PTR[(96-128)+rax],xmm2 paddd xmm12,xmm2 pxor xmm3,xmm0 psrld xmm9,27 pxor xmm6,xmm10 movdqa xmm7,xmm14 pslld xmm7,30 movdqa xmm5,xmm3 por xmm8,xmm9 psrld xmm5,31 paddd xmm12,xmm6 paddd xmm3,xmm3 psrld xmm14,2 paddd xmm12,xmm8 por xmm3,xmm5 por xmm14,xmm7 pxor xmm4,xmm1 movdqa xmm1,XMMWORD PTR[((160-128))+rax] movdqa xmm8,xmm12 movdqa xmm6,xmm10 pxor xmm4,XMMWORD PTR[((0-128))+rax] paddd xmm11,xmm15 pslld xmm8,5 pxor xmm6,xmm13 movdqa xmm9,xmm12 movdqa XMMWORD PTR[(112-128)+rax],xmm3 paddd xmm11,xmm3 pxor xmm4,xmm1 psrld xmm9,27 pxor xmm6,xmm14 movdqa xmm7,xmm13 pslld xmm7,30 movdqa xmm5,xmm4 por xmm8,xmm9 psrld xmm5,31 paddd xmm11,xmm6 paddd xmm4,xmm4 psrld xmm13,2 paddd xmm11,xmm8 por xmm4,xmm5 por xmm13,xmm7 pxor xmm0,xmm2 movdqa xmm2,XMMWORD PTR[((176-128))+rax] movdqa xmm8,xmm11 movdqa xmm6,xmm14 pxor xmm0,XMMWORD PTR[((16-128))+rax] paddd xmm10,xmm15 pslld xmm8,5 pxor xmm6,xmm12 movdqa xmm9,xmm11 movdqa XMMWORD PTR[(128-128)+rax],xmm4 paddd xmm10,xmm4 pxor xmm0,xmm2 psrld xmm9,27 pxor xmm6,xmm13 movdqa xmm7,xmm12 pslld xmm7,30 movdqa xmm5,xmm0 por xmm8,xmm9 psrld xmm5,31 paddd xmm10,xmm6 paddd xmm0,xmm0 psrld xmm12,2 paddd xmm10,xmm8 por xmm0,xmm5 por xmm12,xmm7 pxor xmm1,xmm3 movdqa xmm3,XMMWORD PTR[((192-128))+rax] movdqa xmm8,xmm10 movdqa xmm6,xmm13 pxor xmm1,XMMWORD PTR[((32-128))+rax] paddd xmm14,xmm15 pslld xmm8,5 pxor xmm6,xmm11 movdqa xmm9,xmm10 movdqa XMMWORD PTR[(144-128)+rax],xmm0 paddd xmm14,xmm0 pxor xmm1,xmm3 psrld xmm9,27 pxor xmm6,xmm12 movdqa xmm7,xmm11 pslld xmm7,30 movdqa xmm5,xmm1 por xmm8,xmm9 psrld xmm5,31 paddd xmm14,xmm6 paddd xmm1,xmm1 psrld xmm11,2 paddd xmm14,xmm8 por xmm1,xmm5 por xmm11,xmm7 pxor xmm2,xmm4 movdqa xmm4,XMMWORD PTR[((208-128))+rax] movdqa xmm8,xmm14 movdqa xmm6,xmm12 pxor xmm2,XMMWORD PTR[((48-128))+rax] paddd xmm13,xmm15 pslld xmm8,5 pxor xmm6,xmm10 movdqa xmm9,xmm14 movdqa XMMWORD PTR[(160-128)+rax],xmm1 paddd xmm13,xmm1 pxor xmm2,xmm4 psrld xmm9,27 pxor xmm6,xmm11 movdqa xmm7,xmm10 pslld xmm7,30 movdqa xmm5,xmm2 por xmm8,xmm9 psrld xmm5,31 paddd xmm13,xmm6 paddd xmm2,xmm2 psrld xmm10,2 paddd xmm13,xmm8 por xmm2,xmm5 por xmm10,xmm7 pxor xmm3,xmm0 movdqa xmm0,XMMWORD PTR[((224-128))+rax] movdqa xmm8,xmm13 movdqa xmm6,xmm11 pxor xmm3,XMMWORD PTR[((64-128))+rax] paddd xmm12,xmm15 pslld xmm8,5 pxor xmm6,xmm14 movdqa xmm9,xmm13 movdqa XMMWORD PTR[(176-128)+rax],xmm2 paddd xmm12,xmm2 pxor xmm3,xmm0 psrld xmm9,27 pxor xmm6,xmm10 movdqa xmm7,xmm14 pslld xmm7,30 movdqa xmm5,xmm3 por xmm8,xmm9 psrld xmm5,31 paddd xmm12,xmm6 paddd xmm3,xmm3 psrld xmm14,2 paddd xmm12,xmm8 por xmm3,xmm5 por xmm14,xmm7 pxor xmm4,xmm1 movdqa xmm1,XMMWORD PTR[((240-128))+rax] movdqa xmm8,xmm12 movdqa xmm6,xmm10 pxor xmm4,XMMWORD PTR[((80-128))+rax] paddd xmm11,xmm15 pslld xmm8,5 pxor xmm6,xmm13 movdqa xmm9,xmm12 movdqa XMMWORD PTR[(192-128)+rax],xmm3 paddd xmm11,xmm3 pxor xmm4,xmm1 psrld xmm9,27 pxor xmm6,xmm14 movdqa xmm7,xmm13 pslld xmm7,30 movdqa xmm5,xmm4 por xmm8,xmm9 psrld xmm5,31 paddd xmm11,xmm6 paddd xmm4,xmm4 psrld xmm13,2 paddd xmm11,xmm8 por xmm4,xmm5 por xmm13,xmm7 pxor xmm0,xmm2 movdqa xmm2,XMMWORD PTR[((0-128))+rax] movdqa xmm8,xmm11 movdqa xmm6,xmm14 pxor xmm0,XMMWORD PTR[((96-128))+rax] paddd xmm10,xmm15 pslld xmm8,5 pxor xmm6,xmm12 movdqa xmm9,xmm11 movdqa XMMWORD PTR[(208-128)+rax],xmm4 paddd xmm10,xmm4 pxor xmm0,xmm2 psrld xmm9,27 pxor xmm6,xmm13 movdqa xmm7,xmm12 pslld xmm7,30 movdqa xmm5,xmm0 por xmm8,xmm9 psrld xmm5,31 paddd xmm10,xmm6 paddd xmm0,xmm0 psrld xmm12,2 paddd xmm10,xmm8 por xmm0,xmm5 por xmm12,xmm7 pxor xmm1,xmm3 movdqa xmm3,XMMWORD PTR[((16-128))+rax] movdqa xmm8,xmm10 movdqa xmm6,xmm13 pxor xmm1,XMMWORD PTR[((112-128))+rax] paddd xmm14,xmm15 pslld xmm8,5 pxor xmm6,xmm11 movdqa xmm9,xmm10 movdqa XMMWORD PTR[(224-128)+rax],xmm0 paddd xmm14,xmm0 pxor xmm1,xmm3 psrld xmm9,27 pxor xmm6,xmm12 movdqa xmm7,xmm11 pslld xmm7,30 movdqa xmm5,xmm1 por xmm8,xmm9 psrld xmm5,31 paddd xmm14,xmm6 paddd xmm1,xmm1 psrld xmm11,2 paddd xmm14,xmm8 por xmm1,xmm5 por xmm11,xmm7 pxor xmm2,xmm4 movdqa xmm4,XMMWORD PTR[((32-128))+rax] movdqa xmm8,xmm14 movdqa xmm6,xmm12 pxor xmm2,XMMWORD PTR[((128-128))+rax] paddd xmm13,xmm15 pslld xmm8,5 pxor xmm6,xmm10 movdqa xmm9,xmm14 movdqa XMMWORD PTR[(240-128)+rax],xmm1 paddd xmm13,xmm1 pxor xmm2,xmm4 psrld xmm9,27 pxor xmm6,xmm11 movdqa xmm7,xmm10 pslld xmm7,30 movdqa xmm5,xmm2 por xmm8,xmm9 psrld xmm5,31 paddd xmm13,xmm6 paddd xmm2,xmm2 psrld xmm10,2 paddd xmm13,xmm8 por xmm2,xmm5 por xmm10,xmm7 pxor xmm3,xmm0 movdqa xmm0,XMMWORD PTR[((48-128))+rax] movdqa xmm8,xmm13 movdqa xmm6,xmm11 pxor xmm3,XMMWORD PTR[((144-128))+rax] paddd xmm12,xmm15 pslld xmm8,5 pxor xmm6,xmm14 movdqa xmm9,xmm13 movdqa XMMWORD PTR[(0-128)+rax],xmm2 paddd xmm12,xmm2 pxor xmm3,xmm0 psrld xmm9,27 pxor xmm6,xmm10 movdqa xmm7,xmm14 pslld xmm7,30 movdqa xmm5,xmm3 por xmm8,xmm9 psrld xmm5,31 paddd xmm12,xmm6 paddd xmm3,xmm3 psrld xmm14,2 paddd xmm12,xmm8 por xmm3,xmm5 por xmm14,xmm7 pxor xmm4,xmm1 movdqa xmm1,XMMWORD PTR[((64-128))+rax] movdqa xmm8,xmm12 movdqa xmm6,xmm10 pxor xmm4,XMMWORD PTR[((160-128))+rax] paddd xmm11,xmm15 pslld xmm8,5 pxor xmm6,xmm13 movdqa xmm9,xmm12 movdqa XMMWORD PTR[(16-128)+rax],xmm3 paddd xmm11,xmm3 pxor xmm4,xmm1 psrld xmm9,27 pxor xmm6,xmm14 movdqa xmm7,xmm13 pslld xmm7,30 movdqa xmm5,xmm4 por xmm8,xmm9 psrld xmm5,31 paddd xmm11,xmm6 paddd xmm4,xmm4 psrld xmm13,2 paddd xmm11,xmm8 por xmm4,xmm5 por xmm13,xmm7 pxor xmm0,xmm2 movdqa xmm2,XMMWORD PTR[((80-128))+rax] movdqa xmm8,xmm11 movdqa xmm6,xmm14 pxor xmm0,XMMWORD PTR[((176-128))+rax] paddd xmm10,xmm15 pslld xmm8,5 pxor xmm6,xmm12 movdqa xmm9,xmm11 movdqa XMMWORD PTR[(32-128)+rax],xmm4 paddd xmm10,xmm4 pxor xmm0,xmm2 psrld xmm9,27 pxor xmm6,xmm13 movdqa xmm7,xmm12 pslld xmm7,30 movdqa xmm5,xmm0 por xmm8,xmm9 psrld xmm5,31 paddd xmm10,xmm6 paddd xmm0,xmm0 psrld xmm12,2 paddd xmm10,xmm8 por xmm0,xmm5 por xmm12,xmm7 pxor xmm1,xmm3 movdqa xmm3,XMMWORD PTR[((96-128))+rax] movdqa xmm8,xmm10 movdqa xmm6,xmm13 pxor xmm1,XMMWORD PTR[((192-128))+rax] paddd xmm14,xmm15 pslld xmm8,5 pxor xmm6,xmm11 movdqa xmm9,xmm10 movdqa XMMWORD PTR[(48-128)+rax],xmm0 paddd xmm14,xmm0 pxor xmm1,xmm3 psrld xmm9,27 pxor xmm6,xmm12 movdqa xmm7,xmm11 pslld xmm7,30 movdqa xmm5,xmm1 por xmm8,xmm9 psrld xmm5,31 paddd xmm14,xmm6 paddd xmm1,xmm1 psrld xmm11,2 paddd xmm14,xmm8 por xmm1,xmm5 por xmm11,xmm7 pxor xmm2,xmm4 movdqa xmm4,XMMWORD PTR[((112-128))+rax] movdqa xmm8,xmm14 movdqa xmm6,xmm12 pxor xmm2,XMMWORD PTR[((208-128))+rax] paddd xmm13,xmm15 pslld xmm8,5 pxor xmm6,xmm10 movdqa xmm9,xmm14 movdqa XMMWORD PTR[(64-128)+rax],xmm1 paddd xmm13,xmm1 pxor xmm2,xmm4 psrld xmm9,27 pxor xmm6,xmm11 movdqa xmm7,xmm10 pslld xmm7,30 movdqa xmm5,xmm2 por xmm8,xmm9 psrld xmm5,31 paddd xmm13,xmm6 paddd xmm2,xmm2 psrld xmm10,2 paddd xmm13,xmm8 por xmm2,xmm5 por xmm10,xmm7 pxor xmm3,xmm0 movdqa xmm0,XMMWORD PTR[((128-128))+rax] movdqa xmm8,xmm13 movdqa xmm6,xmm11 pxor xmm3,XMMWORD PTR[((224-128))+rax] paddd xmm12,xmm15 pslld xmm8,5 pxor xmm6,xmm14 movdqa xmm9,xmm13 movdqa XMMWORD PTR[(80-128)+rax],xmm2 paddd xmm12,xmm2 pxor xmm3,xmm0 psrld xmm9,27 pxor xmm6,xmm10 movdqa xmm7,xmm14 pslld xmm7,30 movdqa xmm5,xmm3 por xmm8,xmm9 psrld xmm5,31 paddd xmm12,xmm6 paddd xmm3,xmm3 psrld xmm14,2 paddd xmm12,xmm8 por xmm3,xmm5 por xmm14,xmm7 pxor xmm4,xmm1 movdqa xmm1,XMMWORD PTR[((144-128))+rax] movdqa xmm8,xmm12 movdqa xmm6,xmm10 pxor xmm4,XMMWORD PTR[((240-128))+rax] paddd xmm11,xmm15 pslld xmm8,5 pxor xmm6,xmm13 movdqa xmm9,xmm12 movdqa XMMWORD PTR[(96-128)+rax],xmm3 paddd xmm11,xmm3 pxor xmm4,xmm1 psrld xmm9,27 pxor xmm6,xmm14 movdqa xmm7,xmm13 pslld xmm7,30 movdqa xmm5,xmm4 por xmm8,xmm9 psrld xmm5,31 paddd xmm11,xmm6 paddd xmm4,xmm4 psrld xmm13,2 paddd xmm11,xmm8 por xmm4,xmm5 por xmm13,xmm7 pxor xmm0,xmm2 movdqa xmm2,XMMWORD PTR[((160-128))+rax] movdqa xmm8,xmm11 movdqa xmm6,xmm14 pxor xmm0,XMMWORD PTR[((0-128))+rax] paddd xmm10,xmm15 pslld xmm8,5 pxor xmm6,xmm12 movdqa xmm9,xmm11 movdqa XMMWORD PTR[(112-128)+rax],xmm4 paddd xmm10,xmm4 pxor xmm0,xmm2 psrld xmm9,27 pxor xmm6,xmm13 movdqa xmm7,xmm12 pslld xmm7,30 movdqa xmm5,xmm0 por xmm8,xmm9 psrld xmm5,31 paddd xmm10,xmm6 paddd xmm0,xmm0 psrld xmm12,2 paddd xmm10,xmm8 por xmm0,xmm5 por xmm12,xmm7 movdqa xmm15,XMMWORD PTR[32+rbp] pxor xmm1,xmm3 movdqa xmm3,XMMWORD PTR[((176-128))+rax] movdqa xmm8,xmm10 movdqa xmm7,xmm13 pxor xmm1,XMMWORD PTR[((16-128))+rax] pxor xmm1,xmm3 paddd xmm14,xmm15 pslld xmm8,5 movdqa xmm9,xmm10 pand xmm7,xmm12 movdqa xmm6,xmm13 movdqa xmm5,xmm1 psrld xmm9,27 paddd xmm14,xmm7 pxor xmm6,xmm12 movdqa XMMWORD PTR[(128-128)+rax],xmm0 paddd xmm14,xmm0 por xmm8,xmm9 psrld xmm5,31 pand xmm6,xmm11 movdqa xmm7,xmm11 pslld xmm7,30 paddd xmm1,xmm1 paddd xmm14,xmm6 psrld xmm11,2 paddd xmm14,xmm8 por xmm1,xmm5 por xmm11,xmm7 pxor xmm2,xmm4 movdqa xmm4,XMMWORD PTR[((192-128))+rax] movdqa xmm8,xmm14 movdqa xmm7,xmm12 pxor xmm2,XMMWORD PTR[((32-128))+rax] pxor xmm2,xmm4 paddd xmm13,xmm15 pslld xmm8,5 movdqa xmm9,xmm14 pand xmm7,xmm11 movdqa xmm6,xmm12 movdqa xmm5,xmm2 psrld xmm9,27 paddd xmm13,xmm7 pxor xmm6,xmm11 movdqa XMMWORD PTR[(144-128)+rax],xmm1 paddd xmm13,xmm1 por xmm8,xmm9 psrld xmm5,31 pand xmm6,xmm10 movdqa xmm7,xmm10 pslld xmm7,30 paddd xmm2,xmm2 paddd xmm13,xmm6 psrld xmm10,2 paddd xmm13,xmm8 por xmm2,xmm5 por xmm10,xmm7 pxor xmm3,xmm0 movdqa xmm0,XMMWORD PTR[((208-128))+rax] movdqa xmm8,xmm13 movdqa xmm7,xmm11 pxor xmm3,XMMWORD PTR[((48-128))+rax] pxor xmm3,xmm0 paddd xmm12,xmm15 pslld xmm8,5 movdqa xmm9,xmm13 pand xmm7,xmm10 movdqa xmm6,xmm11 movdqa xmm5,xmm3 psrld xmm9,27 paddd xmm12,xmm7 pxor xmm6,xmm10 movdqa XMMWORD PTR[(160-128)+rax],xmm2 paddd xmm12,xmm2 por xmm8,xmm9 psrld xmm5,31 pand xmm6,xmm14 movdqa xmm7,xmm14 pslld xmm7,30 paddd xmm3,xmm3 paddd xmm12,xmm6 psrld xmm14,2 paddd xmm12,xmm8 por xmm3,xmm5 por xmm14,xmm7 pxor xmm4,xmm1 movdqa xmm1,XMMWORD PTR[((224-128))+rax] movdqa xmm8,xmm12 movdqa xmm7,xmm10 pxor xmm4,XMMWORD PTR[((64-128))+rax] pxor xmm4,xmm1 paddd xmm11,xmm15 pslld xmm8,5 movdqa xmm9,xmm12 pand xmm7,xmm14 movdqa xmm6,xmm10 movdqa xmm5,xmm4 psrld xmm9,27 paddd xmm11,xmm7 pxor xmm6,xmm14 movdqa XMMWORD PTR[(176-128)+rax],xmm3 paddd xmm11,xmm3 por xmm8,xmm9 psrld xmm5,31 pand xmm6,xmm13 movdqa xmm7,xmm13 pslld xmm7,30 paddd xmm4,xmm4 paddd xmm11,xmm6 psrld xmm13,2 paddd xmm11,xmm8 por xmm4,xmm5 por xmm13,xmm7 pxor xmm0,xmm2 movdqa xmm2,XMMWORD PTR[((240-128))+rax] movdqa xmm8,xmm11 movdqa xmm7,xmm14 pxor xmm0,XMMWORD PTR[((80-128))+rax] pxor xmm0,xmm2 paddd xmm10,xmm15 pslld xmm8,5 movdqa xmm9,xmm11 pand xmm7,xmm13 movdqa xmm6,xmm14 movdqa xmm5,xmm0 psrld xmm9,27 paddd xmm10,xmm7 pxor xmm6,xmm13 movdqa XMMWORD PTR[(192-128)+rax],xmm4 paddd xmm10,xmm4 por xmm8,xmm9 psrld xmm5,31 pand xmm6,xmm12 movdqa xmm7,xmm12 pslld xmm7,30 paddd xmm0,xmm0 paddd xmm10,xmm6 psrld xmm12,2 paddd xmm10,xmm8 por xmm0,xmm5 por xmm12,xmm7 pxor xmm1,xmm3 movdqa xmm3,XMMWORD PTR[((0-128))+rax] movdqa xmm8,xmm10 movdqa xmm7,xmm13 pxor xmm1,XMMWORD PTR[((96-128))+rax] pxor xmm1,xmm3 paddd xmm14,xmm15 pslld xmm8,5 movdqa xmm9,xmm10 pand xmm7,xmm12 movdqa xmm6,xmm13 movdqa xmm5,xmm1 psrld xmm9,27 paddd xmm14,xmm7 pxor xmm6,xmm12 movdqa XMMWORD PTR[(208-128)+rax],xmm0 paddd xmm14,xmm0 por xmm8,xmm9 psrld xmm5,31 pand xmm6,xmm11 movdqa xmm7,xmm11 pslld xmm7,30 paddd xmm1,xmm1 paddd xmm14,xmm6 psrld xmm11,2 paddd xmm14,xmm8 por xmm1,xmm5 por xmm11,xmm7 pxor xmm2,xmm4 movdqa xmm4,XMMWORD PTR[((16-128))+rax] movdqa xmm8,xmm14 movdqa xmm7,xmm12 pxor xmm2,XMMWORD PTR[((112-128))+rax] pxor xmm2,xmm4 paddd xmm13,xmm15 pslld xmm8,5 movdqa xmm9,xmm14 pand xmm7,xmm11 movdqa xmm6,xmm12 movdqa xmm5,xmm2 psrld xmm9,27 paddd xmm13,xmm7 pxor xmm6,xmm11 movdqa XMMWORD PTR[(224-128)+rax],xmm1 paddd xmm13,xmm1 por xmm8,xmm9 psrld xmm5,31 pand xmm6,xmm10 movdqa xmm7,xmm10 pslld xmm7,30 paddd xmm2,xmm2 paddd xmm13,xmm6 psrld xmm10,2 paddd xmm13,xmm8 por xmm2,xmm5 por xmm10,xmm7 pxor xmm3,xmm0 movdqa xmm0,XMMWORD PTR[((32-128))+rax] movdqa xmm8,xmm13 movdqa xmm7,xmm11 pxor xmm3,XMMWORD PTR[((128-128))+rax] pxor xmm3,xmm0 paddd xmm12,xmm15 pslld xmm8,5 movdqa xmm9,xmm13 pand xmm7,xmm10 movdqa xmm6,xmm11 movdqa xmm5,xmm3 psrld xmm9,27 paddd xmm12,xmm7 pxor xmm6,xmm10 movdqa XMMWORD PTR[(240-128)+rax],xmm2 paddd xmm12,xmm2 por xmm8,xmm9 psrld xmm5,31 pand xmm6,xmm14 movdqa xmm7,xmm14 pslld xmm7,30 paddd xmm3,xmm3 paddd xmm12,xmm6 psrld xmm14,2 paddd xmm12,xmm8 por xmm3,xmm5 por xmm14,xmm7 pxor xmm4,xmm1 movdqa xmm1,XMMWORD PTR[((48-128))+rax] movdqa xmm8,xmm12 movdqa xmm7,xmm10 pxor xmm4,XMMWORD PTR[((144-128))+rax] pxor xmm4,xmm1 paddd xmm11,xmm15 pslld xmm8,5 movdqa xmm9,xmm12 pand xmm7,xmm14 movdqa xmm6,xmm10 movdqa xmm5,xmm4 psrld xmm9,27 paddd xmm11,xmm7 pxor xmm6,xmm14 movdqa XMMWORD PTR[(0-128)+rax],xmm3 paddd xmm11,xmm3 por xmm8,xmm9 psrld xmm5,31 pand xmm6,xmm13 movdqa xmm7,xmm13 pslld xmm7,30 paddd xmm4,xmm4 paddd xmm11,xmm6 psrld xmm13,2 paddd xmm11,xmm8 por xmm4,xmm5 por xmm13,xmm7 pxor xmm0,xmm2 movdqa xmm2,XMMWORD PTR[((64-128))+rax] movdqa xmm8,xmm11 movdqa xmm7,xmm14 pxor xmm0,XMMWORD PTR[((160-128))+rax] pxor xmm0,xmm2 paddd xmm10,xmm15 pslld xmm8,5 movdqa xmm9,xmm11 pand xmm7,xmm13 movdqa xmm6,xmm14 movdqa xmm5,xmm0 psrld xmm9,27 paddd xmm10,xmm7 pxor xmm6,xmm13 movdqa XMMWORD PTR[(16-128)+rax],xmm4 paddd xmm10,xmm4 por xmm8,xmm9 psrld xmm5,31 pand xmm6,xmm12 movdqa xmm7,xmm12 pslld xmm7,30 paddd xmm0,xmm0 paddd xmm10,xmm6 psrld xmm12,2 paddd xmm10,xmm8 por xmm0,xmm5 por xmm12,xmm7 pxor xmm1,xmm3 movdqa xmm3,XMMWORD PTR[((80-128))+rax] movdqa xmm8,xmm10 movdqa xmm7,xmm13 pxor xmm1,XMMWORD PTR[((176-128))+rax] pxor xmm1,xmm3 paddd xmm14,xmm15 pslld xmm8,5 movdqa xmm9,xmm10 pand xmm7,xmm12 movdqa xmm6,xmm13 movdqa xmm5,xmm1 psrld xmm9,27 paddd xmm14,xmm7 pxor xmm6,xmm12 movdqa XMMWORD PTR[(32-128)+rax],xmm0 paddd xmm14,xmm0 por xmm8,xmm9 psrld xmm5,31 pand xmm6,xmm11 movdqa xmm7,xmm11 pslld xmm7,30 paddd xmm1,xmm1 paddd xmm14,xmm6 psrld xmm11,2 paddd xmm14,xmm8 por xmm1,xmm5 por xmm11,xmm7 pxor xmm2,xmm4 movdqa xmm4,XMMWORD PTR[((96-128))+rax] movdqa xmm8,xmm14 movdqa xmm7,xmm12 pxor xmm2,XMMWORD PTR[((192-128))+rax] pxor xmm2,xmm4 paddd xmm13,xmm15 pslld xmm8,5 movdqa xmm9,xmm14 pand xmm7,xmm11 movdqa xmm6,xmm12 movdqa xmm5,xmm2 psrld xmm9,27 paddd xmm13,xmm7 pxor xmm6,xmm11 movdqa XMMWORD PTR[(48-128)+rax],xmm1 paddd xmm13,xmm1 por xmm8,xmm9 psrld xmm5,31 pand xmm6,xmm10 movdqa xmm7,xmm10 pslld xmm7,30 paddd xmm2,xmm2 paddd xmm13,xmm6 psrld xmm10,2 paddd xmm13,xmm8 por xmm2,xmm5 por xmm10,xmm7 pxor xmm3,xmm0 movdqa xmm0,XMMWORD PTR[((112-128))+rax] movdqa xmm8,xmm13 movdqa xmm7,xmm11 pxor xmm3,XMMWORD PTR[((208-128))+rax] pxor xmm3,xmm0 paddd xmm12,xmm15 pslld xmm8,5 movdqa xmm9,xmm13 pand xmm7,xmm10 movdqa xmm6,xmm11 movdqa xmm5,xmm3 psrld xmm9,27 paddd xmm12,xmm7 pxor xmm6,xmm10 movdqa XMMWORD PTR[(64-128)+rax],xmm2 paddd xmm12,xmm2 por xmm8,xmm9 psrld xmm5,31 pand xmm6,xmm14 movdqa xmm7,xmm14 pslld xmm7,30 paddd xmm3,xmm3 paddd xmm12,xmm6 psrld xmm14,2 paddd xmm12,xmm8 por xmm3,xmm5 por xmm14,xmm7 pxor xmm4,xmm1 movdqa xmm1,XMMWORD PTR[((128-128))+rax] movdqa xmm8,xmm12 movdqa xmm7,xmm10 pxor xmm4,XMMWORD PTR[((224-128))+rax] pxor xmm4,xmm1 paddd xmm11,xmm15 pslld xmm8,5 movdqa xmm9,xmm12 pand xmm7,xmm14 movdqa xmm6,xmm10 movdqa xmm5,xmm4 psrld xmm9,27 paddd xmm11,xmm7 pxor xmm6,xmm14 movdqa XMMWORD PTR[(80-128)+rax],xmm3 paddd xmm11,xmm3 por xmm8,xmm9 psrld xmm5,31 pand xmm6,xmm13 movdqa xmm7,xmm13 pslld xmm7,30 paddd xmm4,xmm4 paddd xmm11,xmm6 psrld xmm13,2 paddd xmm11,xmm8 por xmm4,xmm5 por xmm13,xmm7 pxor xmm0,xmm2 movdqa xmm2,XMMWORD PTR[((144-128))+rax] movdqa xmm8,xmm11 movdqa xmm7,xmm14 pxor xmm0,XMMWORD PTR[((240-128))+rax] pxor xmm0,xmm2 paddd xmm10,xmm15 pslld xmm8,5 movdqa xmm9,xmm11 pand xmm7,xmm13 movdqa xmm6,xmm14 movdqa xmm5,xmm0 psrld xmm9,27 paddd xmm10,xmm7 pxor xmm6,xmm13 movdqa XMMWORD PTR[(96-128)+rax],xmm4 paddd xmm10,xmm4 por xmm8,xmm9 psrld xmm5,31 pand xmm6,xmm12 movdqa xmm7,xmm12 pslld xmm7,30 paddd xmm0,xmm0 paddd xmm10,xmm6 psrld xmm12,2 paddd xmm10,xmm8 por xmm0,xmm5 por xmm12,xmm7 pxor xmm1,xmm3 movdqa xmm3,XMMWORD PTR[((160-128))+rax] movdqa xmm8,xmm10 movdqa xmm7,xmm13 pxor xmm1,XMMWORD PTR[((0-128))+rax] pxor xmm1,xmm3 paddd xmm14,xmm15 pslld xmm8,5 movdqa xmm9,xmm10 pand xmm7,xmm12 movdqa xmm6,xmm13 movdqa xmm5,xmm1 psrld xmm9,27 paddd xmm14,xmm7 pxor xmm6,xmm12 movdqa XMMWORD PTR[(112-128)+rax],xmm0 paddd xmm14,xmm0 por xmm8,xmm9 psrld xmm5,31 pand xmm6,xmm11 movdqa xmm7,xmm11 pslld xmm7,30 paddd xmm1,xmm1 paddd xmm14,xmm6 psrld xmm11,2 paddd xmm14,xmm8 por xmm1,xmm5 por xmm11,xmm7 pxor xmm2,xmm4 movdqa xmm4,XMMWORD PTR[((176-128))+rax] movdqa xmm8,xmm14 movdqa xmm7,xmm12 pxor xmm2,XMMWORD PTR[((16-128))+rax] pxor xmm2,xmm4 paddd xmm13,xmm15 pslld xmm8,5 movdqa xmm9,xmm14 pand xmm7,xmm11 movdqa xmm6,xmm12 movdqa xmm5,xmm2 psrld xmm9,27 paddd xmm13,xmm7 pxor xmm6,xmm11 movdqa XMMWORD PTR[(128-128)+rax],xmm1 paddd xmm13,xmm1 por xmm8,xmm9 psrld xmm5,31 pand xmm6,xmm10 movdqa xmm7,xmm10 pslld xmm7,30 paddd xmm2,xmm2 paddd xmm13,xmm6 psrld xmm10,2 paddd xmm13,xmm8 por xmm2,xmm5 por xmm10,xmm7 pxor xmm3,xmm0 movdqa xmm0,XMMWORD PTR[((192-128))+rax] movdqa xmm8,xmm13 movdqa xmm7,xmm11 pxor xmm3,XMMWORD PTR[((32-128))+rax] pxor xmm3,xmm0 paddd xmm12,xmm15 pslld xmm8,5 movdqa xmm9,xmm13 pand xmm7,xmm10 movdqa xmm6,xmm11 movdqa xmm5,xmm3 psrld xmm9,27 paddd xmm12,xmm7 pxor xmm6,xmm10 movdqa XMMWORD PTR[(144-128)+rax],xmm2 paddd xmm12,xmm2 por xmm8,xmm9 psrld xmm5,31 pand xmm6,xmm14 movdqa xmm7,xmm14 pslld xmm7,30 paddd xmm3,xmm3 paddd xmm12,xmm6 psrld xmm14,2 paddd xmm12,xmm8 por xmm3,xmm5 por xmm14,xmm7 pxor xmm4,xmm1 movdqa xmm1,XMMWORD PTR[((208-128))+rax] movdqa xmm8,xmm12 movdqa xmm7,xmm10 pxor xmm4,XMMWORD PTR[((48-128))+rax] pxor xmm4,xmm1 paddd xmm11,xmm15 pslld xmm8,5 movdqa xmm9,xmm12 pand xmm7,xmm14 movdqa xmm6,xmm10 movdqa xmm5,xmm4 psrld xmm9,27 paddd xmm11,xmm7 pxor xmm6,xmm14 movdqa XMMWORD PTR[(160-128)+rax],xmm3 paddd xmm11,xmm3 por xmm8,xmm9 psrld xmm5,31 pand xmm6,xmm13 movdqa xmm7,xmm13 pslld xmm7,30 paddd xmm4,xmm4 paddd xmm11,xmm6 psrld xmm13,2 paddd xmm11,xmm8 por xmm4,xmm5 por xmm13,xmm7 pxor xmm0,xmm2 movdqa xmm2,XMMWORD PTR[((224-128))+rax] movdqa xmm8,xmm11 movdqa xmm7,xmm14 pxor xmm0,XMMWORD PTR[((64-128))+rax] pxor xmm0,xmm2 paddd xmm10,xmm15 pslld xmm8,5 movdqa xmm9,xmm11 pand xmm7,xmm13 movdqa xmm6,xmm14 movdqa xmm5,xmm0 psrld xmm9,27 paddd xmm10,xmm7 pxor xmm6,xmm13 movdqa XMMWORD PTR[(176-128)+rax],xmm4 paddd xmm10,xmm4 por xmm8,xmm9 psrld xmm5,31 pand xmm6,xmm12 movdqa xmm7,xmm12 pslld xmm7,30 paddd xmm0,xmm0 paddd xmm10,xmm6 psrld xmm12,2 paddd xmm10,xmm8 por xmm0,xmm5 por xmm12,xmm7 movdqa xmm15,XMMWORD PTR[64+rbp] pxor xmm1,xmm3 movdqa xmm3,XMMWORD PTR[((240-128))+rax] movdqa xmm8,xmm10 movdqa xmm6,xmm13 pxor xmm1,XMMWORD PTR[((80-128))+rax] paddd xmm14,xmm15 pslld xmm8,5 pxor xmm6,xmm11 movdqa xmm9,xmm10 movdqa XMMWORD PTR[(192-128)+rax],xmm0 paddd xmm14,xmm0 pxor xmm1,xmm3 psrld xmm9,27 pxor xmm6,xmm12 movdqa xmm7,xmm11 pslld xmm7,30 movdqa xmm5,xmm1 por xmm8,xmm9 psrld xmm5,31 paddd xmm14,xmm6 paddd xmm1,xmm1 psrld xmm11,2 paddd xmm14,xmm8 por xmm1,xmm5 por xmm11,xmm7 pxor xmm2,xmm4 movdqa xmm4,XMMWORD PTR[((0-128))+rax] movdqa xmm8,xmm14 movdqa xmm6,xmm12 pxor xmm2,XMMWORD PTR[((96-128))+rax] paddd xmm13,xmm15 pslld xmm8,5 pxor xmm6,xmm10 movdqa xmm9,xmm14 movdqa XMMWORD PTR[(208-128)+rax],xmm1 paddd xmm13,xmm1 pxor xmm2,xmm4 psrld xmm9,27 pxor xmm6,xmm11 movdqa xmm7,xmm10 pslld xmm7,30 movdqa xmm5,xmm2 por xmm8,xmm9 psrld xmm5,31 paddd xmm13,xmm6 paddd xmm2,xmm2 psrld xmm10,2 paddd xmm13,xmm8 por xmm2,xmm5 por xmm10,xmm7 pxor xmm3,xmm0 movdqa xmm0,XMMWORD PTR[((16-128))+rax] movdqa xmm8,xmm13 movdqa xmm6,xmm11 pxor xmm3,XMMWORD PTR[((112-128))+rax] paddd xmm12,xmm15 pslld xmm8,5 pxor xmm6,xmm14 movdqa xmm9,xmm13 movdqa XMMWORD PTR[(224-128)+rax],xmm2 paddd xmm12,xmm2 pxor xmm3,xmm0 psrld xmm9,27 pxor xmm6,xmm10 movdqa xmm7,xmm14 pslld xmm7,30 movdqa xmm5,xmm3 por xmm8,xmm9 psrld xmm5,31 paddd xmm12,xmm6 paddd xmm3,xmm3 psrld xmm14,2 paddd xmm12,xmm8 por xmm3,xmm5 por xmm14,xmm7 pxor xmm4,xmm1 movdqa xmm1,XMMWORD PTR[((32-128))+rax] movdqa xmm8,xmm12 movdqa xmm6,xmm10 pxor xmm4,XMMWORD PTR[((128-128))+rax] paddd xmm11,xmm15 pslld xmm8,5 pxor xmm6,xmm13 movdqa xmm9,xmm12 movdqa XMMWORD PTR[(240-128)+rax],xmm3 paddd xmm11,xmm3 pxor xmm4,xmm1 psrld xmm9,27 pxor xmm6,xmm14 movdqa xmm7,xmm13 pslld xmm7,30 movdqa xmm5,xmm4 por xmm8,xmm9 psrld xmm5,31 paddd xmm11,xmm6 paddd xmm4,xmm4 psrld xmm13,2 paddd xmm11,xmm8 por xmm4,xmm5 por xmm13,xmm7 pxor xmm0,xmm2 movdqa xmm2,XMMWORD PTR[((48-128))+rax] movdqa xmm8,xmm11 movdqa xmm6,xmm14 pxor xmm0,XMMWORD PTR[((144-128))+rax] paddd xmm10,xmm15 pslld xmm8,5 pxor xmm6,xmm12 movdqa xmm9,xmm11 movdqa XMMWORD PTR[(0-128)+rax],xmm4 paddd xmm10,xmm4 pxor xmm0,xmm2 psrld xmm9,27 pxor xmm6,xmm13 movdqa xmm7,xmm12 pslld xmm7,30 movdqa xmm5,xmm0 por xmm8,xmm9 psrld xmm5,31 paddd xmm10,xmm6 paddd xmm0,xmm0 psrld xmm12,2 paddd xmm10,xmm8 por xmm0,xmm5 por xmm12,xmm7 pxor xmm1,xmm3 movdqa xmm3,XMMWORD PTR[((64-128))+rax] movdqa xmm8,xmm10 movdqa xmm6,xmm13 pxor xmm1,XMMWORD PTR[((160-128))+rax] paddd xmm14,xmm15 pslld xmm8,5 pxor xmm6,xmm11 movdqa xmm9,xmm10 movdqa XMMWORD PTR[(16-128)+rax],xmm0 paddd xmm14,xmm0 pxor xmm1,xmm3 psrld xmm9,27 pxor xmm6,xmm12 movdqa xmm7,xmm11 pslld xmm7,30 movdqa xmm5,xmm1 por xmm8,xmm9 psrld xmm5,31 paddd xmm14,xmm6 paddd xmm1,xmm1 psrld xmm11,2 paddd xmm14,xmm8 por xmm1,xmm5 por xmm11,xmm7 pxor xmm2,xmm4 movdqa xmm4,XMMWORD PTR[((80-128))+rax] movdqa xmm8,xmm14 movdqa xmm6,xmm12 pxor xmm2,XMMWORD PTR[((176-128))+rax] paddd xmm13,xmm15 pslld xmm8,5 pxor xmm6,xmm10 movdqa xmm9,xmm14 movdqa XMMWORD PTR[(32-128)+rax],xmm1 paddd xmm13,xmm1 pxor xmm2,xmm4 psrld xmm9,27 pxor xmm6,xmm11 movdqa xmm7,xmm10 pslld xmm7,30 movdqa xmm5,xmm2 por xmm8,xmm9 psrld xmm5,31 paddd xmm13,xmm6 paddd xmm2,xmm2 psrld xmm10,2 paddd xmm13,xmm8 por xmm2,xmm5 por xmm10,xmm7 pxor xmm3,xmm0 movdqa xmm0,XMMWORD PTR[((96-128))+rax] movdqa xmm8,xmm13 movdqa xmm6,xmm11 pxor xmm3,XMMWORD PTR[((192-128))+rax] paddd xmm12,xmm15 pslld xmm8,5 pxor xmm6,xmm14 movdqa xmm9,xmm13 movdqa XMMWORD PTR[(48-128)+rax],xmm2 paddd xmm12,xmm2 pxor xmm3,xmm0 psrld xmm9,27 pxor xmm6,xmm10 movdqa xmm7,xmm14 pslld xmm7,30 movdqa xmm5,xmm3 por xmm8,xmm9 psrld xmm5,31 paddd xmm12,xmm6 paddd xmm3,xmm3 psrld xmm14,2 paddd xmm12,xmm8 por xmm3,xmm5 por xmm14,xmm7 pxor xmm4,xmm1 movdqa xmm1,XMMWORD PTR[((112-128))+rax] movdqa xmm8,xmm12 movdqa xmm6,xmm10 pxor xmm4,XMMWORD PTR[((208-128))+rax] paddd xmm11,xmm15 pslld xmm8,5 pxor xmm6,xmm13 movdqa xmm9,xmm12 movdqa XMMWORD PTR[(64-128)+rax],xmm3 paddd xmm11,xmm3 pxor xmm4,xmm1 psrld xmm9,27 pxor xmm6,xmm14 movdqa xmm7,xmm13 pslld xmm7,30 movdqa xmm5,xmm4 por xmm8,xmm9 psrld xmm5,31 paddd xmm11,xmm6 paddd xmm4,xmm4 psrld xmm13,2 paddd xmm11,xmm8 por xmm4,xmm5 por xmm13,xmm7 pxor xmm0,xmm2 movdqa xmm2,XMMWORD PTR[((128-128))+rax] movdqa xmm8,xmm11 movdqa xmm6,xmm14 pxor xmm0,XMMWORD PTR[((224-128))+rax] paddd xmm10,xmm15 pslld xmm8,5 pxor xmm6,xmm12 movdqa xmm9,xmm11 movdqa XMMWORD PTR[(80-128)+rax],xmm4 paddd xmm10,xmm4 pxor xmm0,xmm2 psrld xmm9,27 pxor xmm6,xmm13 movdqa xmm7,xmm12 pslld xmm7,30 movdqa xmm5,xmm0 por xmm8,xmm9 psrld xmm5,31 paddd xmm10,xmm6 paddd xmm0,xmm0 psrld xmm12,2 paddd xmm10,xmm8 por xmm0,xmm5 por xmm12,xmm7 pxor xmm1,xmm3 movdqa xmm3,XMMWORD PTR[((144-128))+rax] movdqa xmm8,xmm10 movdqa xmm6,xmm13 pxor xmm1,XMMWORD PTR[((240-128))+rax] paddd xmm14,xmm15 pslld xmm8,5 pxor xmm6,xmm11 movdqa xmm9,xmm10 movdqa XMMWORD PTR[(96-128)+rax],xmm0 paddd xmm14,xmm0 pxor xmm1,xmm3 psrld xmm9,27 pxor xmm6,xmm12 movdqa xmm7,xmm11 pslld xmm7,30 movdqa xmm5,xmm1 por xmm8,xmm9 psrld xmm5,31 paddd xmm14,xmm6 paddd xmm1,xmm1 psrld xmm11,2 paddd xmm14,xmm8 por xmm1,xmm5 por xmm11,xmm7 pxor xmm2,xmm4 movdqa xmm4,XMMWORD PTR[((160-128))+rax] movdqa xmm8,xmm14 movdqa xmm6,xmm12 pxor xmm2,XMMWORD PTR[((0-128))+rax] paddd xmm13,xmm15 pslld xmm8,5 pxor xmm6,xmm10 movdqa xmm9,xmm14 movdqa XMMWORD PTR[(112-128)+rax],xmm1 paddd xmm13,xmm1 pxor xmm2,xmm4 psrld xmm9,27 pxor xmm6,xmm11 movdqa xmm7,xmm10 pslld xmm7,30 movdqa xmm5,xmm2 por xmm8,xmm9 psrld xmm5,31 paddd xmm13,xmm6 paddd xmm2,xmm2 psrld xmm10,2 paddd xmm13,xmm8 por xmm2,xmm5 por xmm10,xmm7 pxor xmm3,xmm0 movdqa xmm0,XMMWORD PTR[((176-128))+rax] movdqa xmm8,xmm13 movdqa xmm6,xmm11 pxor xmm3,XMMWORD PTR[((16-128))+rax] paddd xmm12,xmm15 pslld xmm8,5 pxor xmm6,xmm14 movdqa xmm9,xmm13 paddd xmm12,xmm2 pxor xmm3,xmm0 psrld xmm9,27 pxor xmm6,xmm10 movdqa xmm7,xmm14 pslld xmm7,30 movdqa xmm5,xmm3 por xmm8,xmm9 psrld xmm5,31 paddd xmm12,xmm6 paddd xmm3,xmm3 psrld xmm14,2 paddd xmm12,xmm8 por xmm3,xmm5 por xmm14,xmm7 pxor xmm4,xmm1 movdqa xmm1,XMMWORD PTR[((192-128))+rax] movdqa xmm8,xmm12 movdqa xmm6,xmm10 pxor xmm4,XMMWORD PTR[((32-128))+rax] paddd xmm11,xmm15 pslld xmm8,5 pxor xmm6,xmm13 movdqa xmm9,xmm12 paddd xmm11,xmm3 pxor xmm4,xmm1 psrld xmm9,27 pxor xmm6,xmm14 movdqa xmm7,xmm13 pslld xmm7,30 movdqa xmm5,xmm4 por xmm8,xmm9 psrld xmm5,31 paddd xmm11,xmm6 paddd xmm4,xmm4 psrld xmm13,2 paddd xmm11,xmm8 por xmm4,xmm5 por xmm13,xmm7 pxor xmm0,xmm2 movdqa xmm2,XMMWORD PTR[((208-128))+rax] movdqa xmm8,xmm11 movdqa xmm6,xmm14 pxor xmm0,XMMWORD PTR[((48-128))+rax] paddd xmm10,xmm15 pslld xmm8,5 pxor xmm6,xmm12 movdqa xmm9,xmm11 paddd xmm10,xmm4 pxor xmm0,xmm2 psrld xmm9,27 pxor xmm6,xmm13 movdqa xmm7,xmm12 pslld xmm7,30 movdqa xmm5,xmm0 por xmm8,xmm9 psrld xmm5,31 paddd xmm10,xmm6 paddd xmm0,xmm0 psrld xmm12,2 paddd xmm10,xmm8 por xmm0,xmm5 por xmm12,xmm7 pxor xmm1,xmm3 movdqa xmm3,XMMWORD PTR[((224-128))+rax] movdqa xmm8,xmm10 movdqa xmm6,xmm13 pxor xmm1,XMMWORD PTR[((64-128))+rax] paddd xmm14,xmm15 pslld xmm8,5 pxor xmm6,xmm11 movdqa xmm9,xmm10 paddd xmm14,xmm0 pxor xmm1,xmm3 psrld xmm9,27 pxor xmm6,xmm12 movdqa xmm7,xmm11 pslld xmm7,30 movdqa xmm5,xmm1 por xmm8,xmm9 psrld xmm5,31 paddd xmm14,xmm6 paddd xmm1,xmm1 psrld xmm11,2 paddd xmm14,xmm8 por xmm1,xmm5 por xmm11,xmm7 pxor xmm2,xmm4 movdqa xmm4,XMMWORD PTR[((240-128))+rax] movdqa xmm8,xmm14 movdqa xmm6,xmm12 pxor xmm2,XMMWORD PTR[((80-128))+rax] paddd xmm13,xmm15 pslld xmm8,5 pxor xmm6,xmm10 movdqa xmm9,xmm14 paddd xmm13,xmm1 pxor xmm2,xmm4 psrld xmm9,27 pxor xmm6,xmm11 movdqa xmm7,xmm10 pslld xmm7,30 movdqa xmm5,xmm2 por xmm8,xmm9 psrld xmm5,31 paddd xmm13,xmm6 paddd xmm2,xmm2 psrld xmm10,2 paddd xmm13,xmm8 por xmm2,xmm5 por xmm10,xmm7 pxor xmm3,xmm0 movdqa xmm0,XMMWORD PTR[((0-128))+rax] movdqa xmm8,xmm13 movdqa xmm6,xmm11 pxor xmm3,XMMWORD PTR[((96-128))+rax] paddd xmm12,xmm15 pslld xmm8,5 pxor xmm6,xmm14 movdqa xmm9,xmm13 paddd xmm12,xmm2 pxor xmm3,xmm0 psrld xmm9,27 pxor xmm6,xmm10 movdqa xmm7,xmm14 pslld xmm7,30 movdqa xmm5,xmm3 por xmm8,xmm9 psrld xmm5,31 paddd xmm12,xmm6 paddd xmm3,xmm3 psrld xmm14,2 paddd xmm12,xmm8 por xmm3,xmm5 por xmm14,xmm7 pxor xmm4,xmm1 movdqa xmm1,XMMWORD PTR[((16-128))+rax] movdqa xmm8,xmm12 movdqa xmm6,xmm10 pxor xmm4,XMMWORD PTR[((112-128))+rax] paddd xmm11,xmm15 pslld xmm8,5 pxor xmm6,xmm13 movdqa xmm9,xmm12 paddd xmm11,xmm3 pxor xmm4,xmm1 psrld xmm9,27 pxor xmm6,xmm14 movdqa xmm7,xmm13 pslld xmm7,30 movdqa xmm5,xmm4 por xmm8,xmm9 psrld xmm5,31 paddd xmm11,xmm6 paddd xmm4,xmm4 psrld xmm13,2 paddd xmm11,xmm8 por xmm4,xmm5 por xmm13,xmm7 movdqa xmm8,xmm11 paddd xmm10,xmm15 movdqa xmm6,xmm14 pslld xmm8,5 pxor xmm6,xmm12 movdqa xmm9,xmm11 paddd xmm10,xmm4 psrld xmm9,27 movdqa xmm7,xmm12 pxor xmm6,xmm13 pslld xmm7,30 por xmm8,xmm9 paddd xmm10,xmm6 psrld xmm12,2 paddd xmm10,xmm8 por xmm12,xmm7 movdqa xmm0,XMMWORD PTR[rbx] mov ecx,1 cmp ecx,DWORD PTR[rbx] pxor xmm8,xmm8 cmovge r8,rbp cmp ecx,DWORD PTR[4+rbx] movdqa xmm1,xmm0 cmovge r9,rbp cmp ecx,DWORD PTR[8+rbx] pcmpgtd xmm1,xmm8 cmovge r10,rbp cmp ecx,DWORD PTR[12+rbx] paddd xmm0,xmm1 cmovge r11,rbp movdqu xmm6,XMMWORD PTR[rdi] pand xmm10,xmm1 movdqu xmm7,XMMWORD PTR[32+rdi] pand xmm11,xmm1 paddd xmm10,xmm6 movdqu xmm8,XMMWORD PTR[64+rdi] pand xmm12,xmm1 paddd xmm11,xmm7 movdqu xmm9,XMMWORD PTR[96+rdi] pand xmm13,xmm1 paddd xmm12,xmm8 movdqu xmm5,XMMWORD PTR[128+rdi] pand xmm14,xmm1 movdqu XMMWORD PTR[rdi],xmm10 paddd xmm13,xmm9 movdqu XMMWORD PTR[32+rdi],xmm11 paddd xmm14,xmm5 movdqu XMMWORD PTR[64+rdi],xmm12 movdqu XMMWORD PTR[96+rdi],xmm13 movdqu XMMWORD PTR[128+rdi],xmm14 movdqa XMMWORD PTR[rbx],xmm0 movdqa xmm5,XMMWORD PTR[96+rbp] movdqa xmm15,XMMWORD PTR[((-32))+rbp] dec edx jnz $L$oop mov edx,DWORD PTR[280+rsp] lea rdi,QWORD PTR[16+rdi] lea rsi,QWORD PTR[64+rsi] dec edx jnz $L$oop_grande $L$done:: mov rax,QWORD PTR[272+rsp] movaps xmm6,XMMWORD PTR[((-184))+rax] movaps xmm7,XMMWORD PTR[((-168))+rax] movaps xmm8,XMMWORD PTR[((-152))+rax] movaps xmm9,XMMWORD PTR[((-136))+rax] movaps xmm10,XMMWORD PTR[((-120))+rax] movaps xmm11,XMMWORD PTR[((-104))+rax] movaps xmm12,XMMWORD PTR[((-88))+rax] movaps xmm13,XMMWORD PTR[((-72))+rax] movaps xmm14,XMMWORD PTR[((-56))+rax] movaps xmm15,XMMWORD PTR[((-40))+rax] mov rbp,QWORD PTR[((-16))+rax] mov rbx,QWORD PTR[((-8))+rax] lea rsp,QWORD PTR[rax] $L$epilogue:: mov rdi,QWORD PTR[8+rsp] ;WIN64 epilogue mov rsi,QWORD PTR[16+rsp] DB 0F3h,0C3h ;repret $L$SEH_end_sha1_multi_block:: sha1_multi_block ENDP ALIGN 32 sha1_multi_block_shaext PROC PRIVATE mov QWORD PTR[8+rsp],rdi ;WIN64 prologue mov QWORD PTR[16+rsp],rsi mov rax,rsp $L$SEH_begin_sha1_multi_block_shaext:: mov rdi,rcx mov rsi,rdx mov rdx,r8 _shaext_shortcut:: mov rax,rsp push rbx push rbp lea rsp,QWORD PTR[((-168))+rsp] movaps XMMWORD PTR[rsp],xmm6 movaps XMMWORD PTR[16+rsp],xmm7 movaps XMMWORD PTR[32+rsp],xmm8 movaps XMMWORD PTR[48+rsp],xmm9 movaps XMMWORD PTR[(-120)+rax],xmm10 movaps XMMWORD PTR[(-104)+rax],xmm11 movaps XMMWORD PTR[(-88)+rax],xmm12 movaps XMMWORD PTR[(-72)+rax],xmm13 movaps XMMWORD PTR[(-56)+rax],xmm14 movaps XMMWORD PTR[(-40)+rax],xmm15 sub rsp,288 shl edx,1 and rsp,-256 lea rdi,QWORD PTR[64+rdi] mov QWORD PTR[272+rsp],rax $L$body_shaext:: lea rbx,QWORD PTR[256+rsp] movdqa xmm3,XMMWORD PTR[((K_XX_XX+128))] $L$oop_grande_shaext:: mov DWORD PTR[280+rsp],edx xor edx,edx mov r8,QWORD PTR[rsi] mov ecx,DWORD PTR[8+rsi] cmp ecx,edx cmovg edx,ecx test ecx,ecx mov DWORD PTR[rbx],ecx cmovle r8,rsp mov r9,QWORD PTR[16+rsi] mov ecx,DWORD PTR[24+rsi] cmp ecx,edx cmovg edx,ecx test ecx,ecx mov DWORD PTR[4+rbx],ecx cmovle r9,rsp test edx,edx jz $L$done_shaext movq xmm0,QWORD PTR[((0-64))+rdi] movq xmm4,QWORD PTR[((32-64))+rdi] movq xmm5,QWORD PTR[((64-64))+rdi] movq xmm6,QWORD PTR[((96-64))+rdi] movq xmm7,QWORD PTR[((128-64))+rdi] punpckldq xmm0,xmm4 punpckldq xmm5,xmm6 movdqa xmm8,xmm0 punpcklqdq xmm0,xmm5 punpckhqdq xmm8,xmm5 pshufd xmm1,xmm7,63 pshufd xmm9,xmm7,127 pshufd xmm0,xmm0,27 pshufd xmm8,xmm8,27 jmp $L$oop_shaext ALIGN 32 $L$oop_shaext:: movdqu xmm4,XMMWORD PTR[r8] movdqu xmm11,XMMWORD PTR[r9] movdqu xmm5,XMMWORD PTR[16+r8] movdqu xmm12,XMMWORD PTR[16+r9] movdqu xmm6,XMMWORD PTR[32+r8] DB 102,15,56,0,227 movdqu xmm13,XMMWORD PTR[32+r9] DB 102,68,15,56,0,219 movdqu xmm7,XMMWORD PTR[48+r8] lea r8,QWORD PTR[64+r8] DB 102,15,56,0,235 movdqu xmm14,XMMWORD PTR[48+r9] lea r9,QWORD PTR[64+r9] DB 102,68,15,56,0,227 movdqa XMMWORD PTR[80+rsp],xmm1 paddd xmm1,xmm4 movdqa XMMWORD PTR[112+rsp],xmm9 paddd xmm9,xmm11 movdqa XMMWORD PTR[64+rsp],xmm0 movdqa xmm2,xmm0 movdqa XMMWORD PTR[96+rsp],xmm8 movdqa xmm10,xmm8 DB 15,58,204,193,0 DB 15,56,200,213 DB 69,15,58,204,193,0 DB 69,15,56,200,212 DB 102,15,56,0,243 prefetcht0 [127+r8] DB 15,56,201,229 DB 102,68,15,56,0,235 prefetcht0 [127+r9] DB 69,15,56,201,220 DB 102,15,56,0,251 movdqa xmm1,xmm0 DB 102,68,15,56,0,243 movdqa xmm9,xmm8 DB 15,58,204,194,0 DB 15,56,200,206 DB 69,15,58,204,194,0 DB 69,15,56,200,205 pxor xmm4,xmm6 DB 15,56,201,238 pxor xmm11,xmm13 DB 69,15,56,201,229 movdqa xmm2,xmm0 movdqa xmm10,xmm8 DB 15,58,204,193,0 DB 15,56,200,215 DB 69,15,58,204,193,0 DB 69,15,56,200,214 DB 15,56,202,231 DB 69,15,56,202,222 pxor xmm5,xmm7 DB 15,56,201,247 pxor xmm12,xmm14 DB 69,15,56,201,238 movdqa xmm1,xmm0 movdqa xmm9,xmm8 DB 15,58,204,194,0 DB 15,56,200,204 DB 69,15,58,204,194,0 DB 69,15,56,200,203 DB 15,56,202,236 DB 69,15,56,202,227 pxor xmm6,xmm4 DB 15,56,201,252 pxor xmm13,xmm11 DB 69,15,56,201,243 movdqa xmm2,xmm0 movdqa xmm10,xmm8 DB 15,58,204,193,0 DB 15,56,200,213 DB 69,15,58,204,193,0 DB 69,15,56,200,212 DB 15,56,202,245 DB 69,15,56,202,236 pxor xmm7,xmm5 DB 15,56,201,229 pxor xmm14,xmm12 DB 69,15,56,201,220 movdqa xmm1,xmm0 movdqa xmm9,xmm8 DB 15,58,204,194,1 DB 15,56,200,206 DB 69,15,58,204,194,1 DB 69,15,56,200,205 DB 15,56,202,254 DB 69,15,56,202,245 pxor xmm4,xmm6 DB 15,56,201,238 pxor xmm11,xmm13 DB 69,15,56,201,229 movdqa xmm2,xmm0 movdqa xmm10,xmm8 DB 15,58,204,193,1 DB 15,56,200,215 DB 69,15,58,204,193,1 DB 69,15,56,200,214 DB 15,56,202,231 DB 69,15,56,202,222 pxor xmm5,xmm7 DB 15,56,201,247 pxor xmm12,xmm14 DB 69,15,56,201,238 movdqa xmm1,xmm0 movdqa xmm9,xmm8 DB 15,58,204,194,1 DB 15,56,200,204 DB 69,15,58,204,194,1 DB 69,15,56,200,203 DB 15,56,202,236 DB 69,15,56,202,227 pxor xmm6,xmm4 DB 15,56,201,252 pxor xmm13,xmm11 DB 69,15,56,201,243 movdqa xmm2,xmm0 movdqa xmm10,xmm8 DB 15,58,204,193,1 DB 15,56,200,213 DB 69,15,58,204,193,1 DB 69,15,56,200,212 DB 15,56,202,245 DB 69,15,56,202,236 pxor xmm7,xmm5 DB 15,56,201,229 pxor xmm14,xmm12 DB 69,15,56,201,220 movdqa xmm1,xmm0 movdqa xmm9,xmm8 DB 15,58,204,194,1 DB 15,56,200,206 DB 69,15,58,204,194,1 DB 69,15,56,200,205 DB 15,56,202,254 DB 69,15,56,202,245 pxor xmm4,xmm6 DB 15,56,201,238 pxor xmm11,xmm13 DB 69,15,56,201,229 movdqa xmm2,xmm0 movdqa xmm10,xmm8 DB 15,58,204,193,2 DB 15,56,200,215 DB 69,15,58,204,193,2 DB 69,15,56,200,214 DB 15,56,202,231 DB 69,15,56,202,222 pxor xmm5,xmm7 DB 15,56,201,247 pxor xmm12,xmm14 DB 69,15,56,201,238 movdqa xmm1,xmm0 movdqa xmm9,xmm8 DB 15,58,204,194,2 DB 15,56,200,204 DB 69,15,58,204,194,2 DB 69,15,56,200,203 DB 15,56,202,236 DB 69,15,56,202,227 pxor xmm6,xmm4 DB 15,56,201,252 pxor xmm13,xmm11 DB 69,15,56,201,243 movdqa xmm2,xmm0 movdqa xmm10,xmm8 DB 15,58,204,193,2 DB 15,56,200,213 DB 69,15,58,204,193,2 DB 69,15,56,200,212 DB 15,56,202,245 DB 69,15,56,202,236 pxor xmm7,xmm5 DB 15,56,201,229 pxor xmm14,xmm12 DB 69,15,56,201,220 movdqa xmm1,xmm0 movdqa xmm9,xmm8 DB 15,58,204,194,2 DB 15,56,200,206 DB 69,15,58,204,194,2 DB 69,15,56,200,205 DB 15,56,202,254 DB 69,15,56,202,245 pxor xmm4,xmm6 DB 15,56,201,238 pxor xmm11,xmm13 DB 69,15,56,201,229 movdqa xmm2,xmm0 movdqa xmm10,xmm8 DB 15,58,204,193,2 DB 15,56,200,215 DB 69,15,58,204,193,2 DB 69,15,56,200,214 DB 15,56,202,231 DB 69,15,56,202,222 pxor xmm5,xmm7 DB 15,56,201,247 pxor xmm12,xmm14 DB 69,15,56,201,238 movdqa xmm1,xmm0 movdqa xmm9,xmm8 DB 15,58,204,194,3 DB 15,56,200,204 DB 69,15,58,204,194,3 DB 69,15,56,200,203 DB 15,56,202,236 DB 69,15,56,202,227 pxor xmm6,xmm4 DB 15,56,201,252 pxor xmm13,xmm11 DB 69,15,56,201,243 movdqa xmm2,xmm0 movdqa xmm10,xmm8 DB 15,58,204,193,3 DB 15,56,200,213 DB 69,15,58,204,193,3 DB 69,15,56,200,212 DB 15,56,202,245 DB 69,15,56,202,236 pxor xmm7,xmm5 pxor xmm14,xmm12 mov ecx,1 pxor xmm4,xmm4 cmp ecx,DWORD PTR[rbx] cmovge r8,rsp movdqa xmm1,xmm0 movdqa xmm9,xmm8 DB 15,58,204,194,3 DB 15,56,200,206 DB 69,15,58,204,194,3 DB 69,15,56,200,205 DB 15,56,202,254 DB 69,15,56,202,245 cmp ecx,DWORD PTR[4+rbx] cmovge r9,rsp movq xmm6,QWORD PTR[rbx] movdqa xmm2,xmm0 movdqa xmm10,xmm8 DB 15,58,204,193,3 DB 15,56,200,215 DB 69,15,58,204,193,3 DB 69,15,56,200,214 pshufd xmm11,xmm6,000h pshufd xmm12,xmm6,055h movdqa xmm7,xmm6 pcmpgtd xmm11,xmm4 pcmpgtd xmm12,xmm4 movdqa xmm1,xmm0 movdqa xmm9,xmm8 DB 15,58,204,194,3 DB 15,56,200,204 DB 69,15,58,204,194,3 DB 68,15,56,200,204 pcmpgtd xmm7,xmm4 pand xmm0,xmm11 pand xmm1,xmm11 pand xmm8,xmm12 pand xmm9,xmm12 paddd xmm6,xmm7 paddd xmm0,XMMWORD PTR[64+rsp] paddd xmm1,XMMWORD PTR[80+rsp] paddd xmm8,XMMWORD PTR[96+rsp] paddd xmm9,XMMWORD PTR[112+rsp] movq QWORD PTR[rbx],xmm6 dec edx jnz $L$oop_shaext mov edx,DWORD PTR[280+rsp] pshufd xmm0,xmm0,27 pshufd xmm8,xmm8,27 movdqa xmm6,xmm0 punpckldq xmm0,xmm8 punpckhdq xmm6,xmm8 punpckhdq xmm1,xmm9 movq QWORD PTR[(0-64)+rdi],xmm0 psrldq xmm0,8 movq QWORD PTR[(64-64)+rdi],xmm6 psrldq xmm6,8 movq QWORD PTR[(32-64)+rdi],xmm0 psrldq xmm1,8 movq QWORD PTR[(96-64)+rdi],xmm6 movq QWORD PTR[(128-64)+rdi],xmm1 lea rdi,QWORD PTR[8+rdi] lea rsi,QWORD PTR[32+rsi] dec edx jnz $L$oop_grande_shaext $L$done_shaext:: movaps xmm6,XMMWORD PTR[((-184))+rax] movaps xmm7,XMMWORD PTR[((-168))+rax] movaps xmm8,XMMWORD PTR[((-152))+rax] movaps xmm9,XMMWORD PTR[((-136))+rax] movaps xmm10,XMMWORD PTR[((-120))+rax] movaps xmm11,XMMWORD PTR[((-104))+rax] movaps xmm12,XMMWORD PTR[((-88))+rax] movaps xmm13,XMMWORD PTR[((-72))+rax] movaps xmm14,XMMWORD PTR[((-56))+rax] movaps xmm15,XMMWORD PTR[((-40))+rax] mov rbp,QWORD PTR[((-16))+rax] mov rbx,QWORD PTR[((-8))+rax] lea rsp,QWORD PTR[rax] $L$epilogue_shaext:: mov rdi,QWORD PTR[8+rsp] ;WIN64 epilogue mov rsi,QWORD PTR[16+rsp] DB 0F3h,0C3h ;repret $L$SEH_end_sha1_multi_block_shaext:: sha1_multi_block_shaext ENDP ALIGN 32 sha1_multi_block_avx PROC PRIVATE mov QWORD PTR[8+rsp],rdi ;WIN64 prologue mov QWORD PTR[16+rsp],rsi mov rax,rsp $L$SEH_begin_sha1_multi_block_avx:: mov rdi,rcx mov rsi,rdx mov rdx,r8 _avx_shortcut:: shr rcx,32 cmp edx,2 jb $L$avx test ecx,32 jnz _avx2_shortcut jmp $L$avx ALIGN 32 $L$avx:: mov rax,rsp push rbx push rbp lea rsp,QWORD PTR[((-168))+rsp] movaps XMMWORD PTR[rsp],xmm6 movaps XMMWORD PTR[16+rsp],xmm7 movaps XMMWORD PTR[32+rsp],xmm8 movaps XMMWORD PTR[48+rsp],xmm9 movaps XMMWORD PTR[(-120)+rax],xmm10 movaps XMMWORD PTR[(-104)+rax],xmm11 movaps XMMWORD PTR[(-88)+rax],xmm12 movaps XMMWORD PTR[(-72)+rax],xmm13 movaps XMMWORD PTR[(-56)+rax],xmm14 movaps XMMWORD PTR[(-40)+rax],xmm15 sub rsp,288 and rsp,-256 mov QWORD PTR[272+rsp],rax $L$body_avx:: lea rbp,QWORD PTR[K_XX_XX] lea rbx,QWORD PTR[256+rsp] vzeroupper $L$oop_grande_avx:: mov DWORD PTR[280+rsp],edx xor edx,edx mov r8,QWORD PTR[rsi] mov ecx,DWORD PTR[8+rsi] cmp ecx,edx cmovg edx,ecx test ecx,ecx mov DWORD PTR[rbx],ecx cmovle r8,rbp mov r9,QWORD PTR[16+rsi] mov ecx,DWORD PTR[24+rsi] cmp ecx,edx cmovg edx,ecx test ecx,ecx mov DWORD PTR[4+rbx],ecx cmovle r9,rbp mov r10,QWORD PTR[32+rsi] mov ecx,DWORD PTR[40+rsi] cmp ecx,edx cmovg edx,ecx test ecx,ecx mov DWORD PTR[8+rbx],ecx cmovle r10,rbp mov r11,QWORD PTR[48+rsi] mov ecx,DWORD PTR[56+rsi] cmp ecx,edx cmovg edx,ecx test ecx,ecx mov DWORD PTR[12+rbx],ecx cmovle r11,rbp test edx,edx jz $L$done_avx vmovdqu xmm10,XMMWORD PTR[rdi] lea rax,QWORD PTR[128+rsp] vmovdqu xmm11,XMMWORD PTR[32+rdi] vmovdqu xmm12,XMMWORD PTR[64+rdi] vmovdqu xmm13,XMMWORD PTR[96+rdi] vmovdqu xmm14,XMMWORD PTR[128+rdi] vmovdqu xmm5,XMMWORD PTR[96+rbp] jmp $L$oop_avx ALIGN 32 $L$oop_avx:: vmovdqa xmm15,XMMWORD PTR[((-32))+rbp] vmovd xmm0,DWORD PTR[r8] lea r8,QWORD PTR[64+r8] vmovd xmm2,DWORD PTR[r9] lea r9,QWORD PTR[64+r9] vpinsrd xmm0,xmm0,DWORD PTR[r10],1 lea r10,QWORD PTR[64+r10] vpinsrd xmm2,xmm2,DWORD PTR[r11],1 lea r11,QWORD PTR[64+r11] vmovd xmm1,DWORD PTR[((-60))+r8] vpunpckldq xmm0,xmm0,xmm2 vmovd xmm9,DWORD PTR[((-60))+r9] vpshufb xmm0,xmm0,xmm5 vpinsrd xmm1,xmm1,DWORD PTR[((-60))+r10],1 vpinsrd xmm9,xmm9,DWORD PTR[((-60))+r11],1 vpaddd xmm14,xmm14,xmm15 vpslld xmm8,xmm10,5 vpandn xmm7,xmm11,xmm13 vpand xmm6,xmm11,xmm12 vmovdqa XMMWORD PTR[(0-128)+rax],xmm0 vpaddd xmm14,xmm14,xmm0 vpunpckldq xmm1,xmm1,xmm9 vpsrld xmm9,xmm10,27 vpxor xmm6,xmm6,xmm7 vmovd xmm2,DWORD PTR[((-56))+r8] vpslld xmm7,xmm11,30 vpor xmm8,xmm8,xmm9 vmovd xmm9,DWORD PTR[((-56))+r9] vpaddd xmm14,xmm14,xmm6 vpsrld xmm11,xmm11,2 vpaddd xmm14,xmm14,xmm8 vpshufb xmm1,xmm1,xmm5 vpor xmm11,xmm11,xmm7 vpinsrd xmm2,xmm2,DWORD PTR[((-56))+r10],1 vpinsrd xmm9,xmm9,DWORD PTR[((-56))+r11],1 vpaddd xmm13,xmm13,xmm15 vpslld xmm8,xmm14,5 vpandn xmm7,xmm10,xmm12 vpand xmm6,xmm10,xmm11 vmovdqa XMMWORD PTR[(16-128)+rax],xmm1 vpaddd xmm13,xmm13,xmm1 vpunpckldq xmm2,xmm2,xmm9 vpsrld xmm9,xmm14,27 vpxor xmm6,xmm6,xmm7 vmovd xmm3,DWORD PTR[((-52))+r8] vpslld xmm7,xmm10,30 vpor xmm8,xmm8,xmm9 vmovd xmm9,DWORD PTR[((-52))+r9] vpaddd xmm13,xmm13,xmm6 vpsrld xmm10,xmm10,2 vpaddd xmm13,xmm13,xmm8 vpshufb xmm2,xmm2,xmm5 vpor xmm10,xmm10,xmm7 vpinsrd xmm3,xmm3,DWORD PTR[((-52))+r10],1 vpinsrd xmm9,xmm9,DWORD PTR[((-52))+r11],1 vpaddd xmm12,xmm12,xmm15 vpslld xmm8,xmm13,5 vpandn xmm7,xmm14,xmm11 vpand xmm6,xmm14,xmm10 vmovdqa XMMWORD PTR[(32-128)+rax],xmm2 vpaddd xmm12,xmm12,xmm2 vpunpckldq xmm3,xmm3,xmm9 vpsrld xmm9,xmm13,27 vpxor xmm6,xmm6,xmm7 vmovd xmm4,DWORD PTR[((-48))+r8] vpslld xmm7,xmm14,30 vpor xmm8,xmm8,xmm9 vmovd xmm9,DWORD PTR[((-48))+r9] vpaddd xmm12,xmm12,xmm6 vpsrld xmm14,xmm14,2 vpaddd xmm12,xmm12,xmm8 vpshufb xmm3,xmm3,xmm5 vpor xmm14,xmm14,xmm7 vpinsrd xmm4,xmm4,DWORD PTR[((-48))+r10],1 vpinsrd xmm9,xmm9,DWORD PTR[((-48))+r11],1 vpaddd xmm11,xmm11,xmm15 vpslld xmm8,xmm12,5 vpandn xmm7,xmm13,xmm10 vpand xmm6,xmm13,xmm14 vmovdqa XMMWORD PTR[(48-128)+rax],xmm3 vpaddd xmm11,xmm11,xmm3 vpunpckldq xmm4,xmm4,xmm9 vpsrld xmm9,xmm12,27 vpxor xmm6,xmm6,xmm7 vmovd xmm0,DWORD PTR[((-44))+r8] vpslld xmm7,xmm13,30 vpor xmm8,xmm8,xmm9 vmovd xmm9,DWORD PTR[((-44))+r9] vpaddd xmm11,xmm11,xmm6 vpsrld xmm13,xmm13,2 vpaddd xmm11,xmm11,xmm8 vpshufb xmm4,xmm4,xmm5 vpor xmm13,xmm13,xmm7 vpinsrd xmm0,xmm0,DWORD PTR[((-44))+r10],1 vpinsrd xmm9,xmm9,DWORD PTR[((-44))+r11],1 vpaddd xmm10,xmm10,xmm15 vpslld xmm8,xmm11,5 vpandn xmm7,xmm12,xmm14 vpand xmm6,xmm12,xmm13 vmovdqa XMMWORD PTR[(64-128)+rax],xmm4 vpaddd xmm10,xmm10,xmm4 vpunpckldq xmm0,xmm0,xmm9 vpsrld xmm9,xmm11,27 vpxor xmm6,xmm6,xmm7 vmovd xmm1,DWORD PTR[((-40))+r8] vpslld xmm7,xmm12,30 vpor xmm8,xmm8,xmm9 vmovd xmm9,DWORD PTR[((-40))+r9] vpaddd xmm10,xmm10,xmm6 vpsrld xmm12,xmm12,2 vpaddd xmm10,xmm10,xmm8 vpshufb xmm0,xmm0,xmm5 vpor xmm12,xmm12,xmm7 vpinsrd xmm1,xmm1,DWORD PTR[((-40))+r10],1 vpinsrd xmm9,xmm9,DWORD PTR[((-40))+r11],1 vpaddd xmm14,xmm14,xmm15 vpslld xmm8,xmm10,5 vpandn xmm7,xmm11,xmm13 vpand xmm6,xmm11,xmm12 vmovdqa XMMWORD PTR[(80-128)+rax],xmm0 vpaddd xmm14,xmm14,xmm0 vpunpckldq xmm1,xmm1,xmm9 vpsrld xmm9,xmm10,27 vpxor xmm6,xmm6,xmm7 vmovd xmm2,DWORD PTR[((-36))+r8] vpslld xmm7,xmm11,30 vpor xmm8,xmm8,xmm9 vmovd xmm9,DWORD PTR[((-36))+r9] vpaddd xmm14,xmm14,xmm6 vpsrld xmm11,xmm11,2 vpaddd xmm14,xmm14,xmm8 vpshufb xmm1,xmm1,xmm5 vpor xmm11,xmm11,xmm7 vpinsrd xmm2,xmm2,DWORD PTR[((-36))+r10],1 vpinsrd xmm9,xmm9,DWORD PTR[((-36))+r11],1 vpaddd xmm13,xmm13,xmm15 vpslld xmm8,xmm14,5 vpandn xmm7,xmm10,xmm12 vpand xmm6,xmm10,xmm11 vmovdqa XMMWORD PTR[(96-128)+rax],xmm1 vpaddd xmm13,xmm13,xmm1 vpunpckldq xmm2,xmm2,xmm9 vpsrld xmm9,xmm14,27 vpxor xmm6,xmm6,xmm7 vmovd xmm3,DWORD PTR[((-32))+r8] vpslld xmm7,xmm10,30 vpor xmm8,xmm8,xmm9 vmovd xmm9,DWORD PTR[((-32))+r9] vpaddd xmm13,xmm13,xmm6 vpsrld xmm10,xmm10,2 vpaddd xmm13,xmm13,xmm8 vpshufb xmm2,xmm2,xmm5 vpor xmm10,xmm10,xmm7 vpinsrd xmm3,xmm3,DWORD PTR[((-32))+r10],1 vpinsrd xmm9,xmm9,DWORD PTR[((-32))+r11],1 vpaddd xmm12,xmm12,xmm15 vpslld xmm8,xmm13,5 vpandn xmm7,xmm14,xmm11 vpand xmm6,xmm14,xmm10 vmovdqa XMMWORD PTR[(112-128)+rax],xmm2 vpaddd xmm12,xmm12,xmm2 vpunpckldq xmm3,xmm3,xmm9 vpsrld xmm9,xmm13,27 vpxor xmm6,xmm6,xmm7 vmovd xmm4,DWORD PTR[((-28))+r8] vpslld xmm7,xmm14,30 vpor xmm8,xmm8,xmm9 vmovd xmm9,DWORD PTR[((-28))+r9] vpaddd xmm12,xmm12,xmm6 vpsrld xmm14,xmm14,2 vpaddd xmm12,xmm12,xmm8 vpshufb xmm3,xmm3,xmm5 vpor xmm14,xmm14,xmm7 vpinsrd xmm4,xmm4,DWORD PTR[((-28))+r10],1 vpinsrd xmm9,xmm9,DWORD PTR[((-28))+r11],1 vpaddd xmm11,xmm11,xmm15 vpslld xmm8,xmm12,5 vpandn xmm7,xmm13,xmm10 vpand xmm6,xmm13,xmm14 vmovdqa XMMWORD PTR[(128-128)+rax],xmm3 vpaddd xmm11,xmm11,xmm3 vpunpckldq xmm4,xmm4,xmm9 vpsrld xmm9,xmm12,27 vpxor xmm6,xmm6,xmm7 vmovd xmm0,DWORD PTR[((-24))+r8] vpslld xmm7,xmm13,30 vpor xmm8,xmm8,xmm9 vmovd xmm9,DWORD PTR[((-24))+r9] vpaddd xmm11,xmm11,xmm6 vpsrld xmm13,xmm13,2 vpaddd xmm11,xmm11,xmm8 vpshufb xmm4,xmm4,xmm5 vpor xmm13,xmm13,xmm7 vpinsrd xmm0,xmm0,DWORD PTR[((-24))+r10],1 vpinsrd xmm9,xmm9,DWORD PTR[((-24))+r11],1 vpaddd xmm10,xmm10,xmm15 vpslld xmm8,xmm11,5 vpandn xmm7,xmm12,xmm14 vpand xmm6,xmm12,xmm13 vmovdqa XMMWORD PTR[(144-128)+rax],xmm4 vpaddd xmm10,xmm10,xmm4 vpunpckldq xmm0,xmm0,xmm9 vpsrld xmm9,xmm11,27 vpxor xmm6,xmm6,xmm7 vmovd xmm1,DWORD PTR[((-20))+r8] vpslld xmm7,xmm12,30 vpor xmm8,xmm8,xmm9 vmovd xmm9,DWORD PTR[((-20))+r9] vpaddd xmm10,xmm10,xmm6 vpsrld xmm12,xmm12,2 vpaddd xmm10,xmm10,xmm8 vpshufb xmm0,xmm0,xmm5 vpor xmm12,xmm12,xmm7 vpinsrd xmm1,xmm1,DWORD PTR[((-20))+r10],1 vpinsrd xmm9,xmm9,DWORD PTR[((-20))+r11],1 vpaddd xmm14,xmm14,xmm15 vpslld xmm8,xmm10,5 vpandn xmm7,xmm11,xmm13 vpand xmm6,xmm11,xmm12 vmovdqa XMMWORD PTR[(160-128)+rax],xmm0 vpaddd xmm14,xmm14,xmm0 vpunpckldq xmm1,xmm1,xmm9 vpsrld xmm9,xmm10,27 vpxor xmm6,xmm6,xmm7 vmovd xmm2,DWORD PTR[((-16))+r8] vpslld xmm7,xmm11,30 vpor xmm8,xmm8,xmm9 vmovd xmm9,DWORD PTR[((-16))+r9] vpaddd xmm14,xmm14,xmm6 vpsrld xmm11,xmm11,2 vpaddd xmm14,xmm14,xmm8 vpshufb xmm1,xmm1,xmm5 vpor xmm11,xmm11,xmm7 vpinsrd xmm2,xmm2,DWORD PTR[((-16))+r10],1 vpinsrd xmm9,xmm9,DWORD PTR[((-16))+r11],1 vpaddd xmm13,xmm13,xmm15 vpslld xmm8,xmm14,5 vpandn xmm7,xmm10,xmm12 vpand xmm6,xmm10,xmm11 vmovdqa XMMWORD PTR[(176-128)+rax],xmm1 vpaddd xmm13,xmm13,xmm1 vpunpckldq xmm2,xmm2,xmm9 vpsrld xmm9,xmm14,27 vpxor xmm6,xmm6,xmm7 vmovd xmm3,DWORD PTR[((-12))+r8] vpslld xmm7,xmm10,30 vpor xmm8,xmm8,xmm9 vmovd xmm9,DWORD PTR[((-12))+r9] vpaddd xmm13,xmm13,xmm6 vpsrld xmm10,xmm10,2 vpaddd xmm13,xmm13,xmm8 vpshufb xmm2,xmm2,xmm5 vpor xmm10,xmm10,xmm7 vpinsrd xmm3,xmm3,DWORD PTR[((-12))+r10],1 vpinsrd xmm9,xmm9,DWORD PTR[((-12))+r11],1 vpaddd xmm12,xmm12,xmm15 vpslld xmm8,xmm13,5 vpandn xmm7,xmm14,xmm11 vpand xmm6,xmm14,xmm10 vmovdqa XMMWORD PTR[(192-128)+rax],xmm2 vpaddd xmm12,xmm12,xmm2 vpunpckldq xmm3,xmm3,xmm9 vpsrld xmm9,xmm13,27 vpxor xmm6,xmm6,xmm7 vmovd xmm4,DWORD PTR[((-8))+r8] vpslld xmm7,xmm14,30 vpor xmm8,xmm8,xmm9 vmovd xmm9,DWORD PTR[((-8))+r9] vpaddd xmm12,xmm12,xmm6 vpsrld xmm14,xmm14,2 vpaddd xmm12,xmm12,xmm8 vpshufb xmm3,xmm3,xmm5 vpor xmm14,xmm14,xmm7 vpinsrd xmm4,xmm4,DWORD PTR[((-8))+r10],1 vpinsrd xmm9,xmm9,DWORD PTR[((-8))+r11],1 vpaddd xmm11,xmm11,xmm15 vpslld xmm8,xmm12,5 vpandn xmm7,xmm13,xmm10 vpand xmm6,xmm13,xmm14 vmovdqa XMMWORD PTR[(208-128)+rax],xmm3 vpaddd xmm11,xmm11,xmm3 vpunpckldq xmm4,xmm4,xmm9 vpsrld xmm9,xmm12,27 vpxor xmm6,xmm6,xmm7 vmovd xmm0,DWORD PTR[((-4))+r8] vpslld xmm7,xmm13,30 vpor xmm8,xmm8,xmm9 vmovd xmm9,DWORD PTR[((-4))+r9] vpaddd xmm11,xmm11,xmm6 vpsrld xmm13,xmm13,2 vpaddd xmm11,xmm11,xmm8 vpshufb xmm4,xmm4,xmm5 vpor xmm13,xmm13,xmm7 vmovdqa xmm1,XMMWORD PTR[((0-128))+rax] vpinsrd xmm0,xmm0,DWORD PTR[((-4))+r10],1 vpinsrd xmm9,xmm9,DWORD PTR[((-4))+r11],1 vpaddd xmm10,xmm10,xmm15 prefetcht0 [63+r8] vpslld xmm8,xmm11,5 vpandn xmm7,xmm12,xmm14 vpand xmm6,xmm12,xmm13 vmovdqa XMMWORD PTR[(224-128)+rax],xmm4 vpaddd xmm10,xmm10,xmm4 vpunpckldq xmm0,xmm0,xmm9 vpsrld xmm9,xmm11,27 prefetcht0 [63+r9] vpxor xmm6,xmm6,xmm7 vpslld xmm7,xmm12,30 vpor xmm8,xmm8,xmm9 prefetcht0 [63+r10] vpaddd xmm10,xmm10,xmm6 vpsrld xmm12,xmm12,2 vpaddd xmm10,xmm10,xmm8 prefetcht0 [63+r11] vpshufb xmm0,xmm0,xmm5 vpor xmm12,xmm12,xmm7 vmovdqa xmm2,XMMWORD PTR[((16-128))+rax] vpxor xmm1,xmm1,xmm3 vmovdqa xmm3,XMMWORD PTR[((32-128))+rax] vpaddd xmm14,xmm14,xmm15 vpslld xmm8,xmm10,5 vpandn xmm7,xmm11,xmm13 vpand xmm6,xmm11,xmm12 vmovdqa XMMWORD PTR[(240-128)+rax],xmm0 vpaddd xmm14,xmm14,xmm0 vpxor xmm1,xmm1,XMMWORD PTR[((128-128))+rax] vpsrld xmm9,xmm10,27 vpxor xmm6,xmm6,xmm7 vpxor xmm1,xmm1,xmm3 vpslld xmm7,xmm11,30 vpor xmm8,xmm8,xmm9 vpaddd xmm14,xmm14,xmm6 vpsrld xmm5,xmm1,31 vpaddd xmm1,xmm1,xmm1 vpsrld xmm11,xmm11,2 vpaddd xmm14,xmm14,xmm8 vpor xmm1,xmm1,xmm5 vpor xmm11,xmm11,xmm7 vpxor xmm2,xmm2,xmm4 vmovdqa xmm4,XMMWORD PTR[((48-128))+rax] vpaddd xmm13,xmm13,xmm15 vpslld xmm8,xmm14,5 vpandn xmm7,xmm10,xmm12 vpand xmm6,xmm10,xmm11 vmovdqa XMMWORD PTR[(0-128)+rax],xmm1 vpaddd xmm13,xmm13,xmm1 vpxor xmm2,xmm2,XMMWORD PTR[((144-128))+rax] vpsrld xmm9,xmm14,27 vpxor xmm6,xmm6,xmm7 vpxor xmm2,xmm2,xmm4 vpslld xmm7,xmm10,30 vpor xmm8,xmm8,xmm9 vpaddd xmm13,xmm13,xmm6 vpsrld xmm5,xmm2,31 vpaddd xmm2,xmm2,xmm2 vpsrld xmm10,xmm10,2 vpaddd xmm13,xmm13,xmm8 vpor xmm2,xmm2,xmm5 vpor xmm10,xmm10,xmm7 vpxor xmm3,xmm3,xmm0 vmovdqa xmm0,XMMWORD PTR[((64-128))+rax] vpaddd xmm12,xmm12,xmm15 vpslld xmm8,xmm13,5 vpandn xmm7,xmm14,xmm11 vpand xmm6,xmm14,xmm10 vmovdqa XMMWORD PTR[(16-128)+rax],xmm2 vpaddd xmm12,xmm12,xmm2 vpxor xmm3,xmm3,XMMWORD PTR[((160-128))+rax] vpsrld xmm9,xmm13,27 vpxor xmm6,xmm6,xmm7 vpxor xmm3,xmm3,xmm0 vpslld xmm7,xmm14,30 vpor xmm8,xmm8,xmm9 vpaddd xmm12,xmm12,xmm6 vpsrld xmm5,xmm3,31 vpaddd xmm3,xmm3,xmm3 vpsrld xmm14,xmm14,2 vpaddd xmm12,xmm12,xmm8 vpor xmm3,xmm3,xmm5 vpor xmm14,xmm14,xmm7 vpxor xmm4,xmm4,xmm1 vmovdqa xmm1,XMMWORD PTR[((80-128))+rax] vpaddd xmm11,xmm11,xmm15 vpslld xmm8,xmm12,5 vpandn xmm7,xmm13,xmm10 vpand xmm6,xmm13,xmm14 vmovdqa XMMWORD PTR[(32-128)+rax],xmm3 vpaddd xmm11,xmm11,xmm3 vpxor xmm4,xmm4,XMMWORD PTR[((176-128))+rax] vpsrld xmm9,xmm12,27 vpxor xmm6,xmm6,xmm7 vpxor xmm4,xmm4,xmm1 vpslld xmm7,xmm13,30 vpor xmm8,xmm8,xmm9 vpaddd xmm11,xmm11,xmm6 vpsrld xmm5,xmm4,31 vpaddd xmm4,xmm4,xmm4 vpsrld xmm13,xmm13,2 vpaddd xmm11,xmm11,xmm8 vpor xmm4,xmm4,xmm5 vpor xmm13,xmm13,xmm7 vpxor xmm0,xmm0,xmm2 vmovdqa xmm2,XMMWORD PTR[((96-128))+rax] vpaddd xmm10,xmm10,xmm15 vpslld xmm8,xmm11,5 vpandn xmm7,xmm12,xmm14 vpand xmm6,xmm12,xmm13 vmovdqa XMMWORD PTR[(48-128)+rax],xmm4 vpaddd xmm10,xmm10,xmm4 vpxor xmm0,xmm0,XMMWORD PTR[((192-128))+rax] vpsrld xmm9,xmm11,27 vpxor xmm6,xmm6,xmm7 vpxor xmm0,xmm0,xmm2 vpslld xmm7,xmm12,30 vpor xmm8,xmm8,xmm9 vpaddd xmm10,xmm10,xmm6 vpsrld xmm5,xmm0,31 vpaddd xmm0,xmm0,xmm0 vpsrld xmm12,xmm12,2 vpaddd xmm10,xmm10,xmm8 vpor xmm0,xmm0,xmm5 vpor xmm12,xmm12,xmm7 vmovdqa xmm15,XMMWORD PTR[rbp] vpxor xmm1,xmm1,xmm3 vmovdqa xmm3,XMMWORD PTR[((112-128))+rax] vpslld xmm8,xmm10,5 vpaddd xmm14,xmm14,xmm15 vpxor xmm6,xmm13,xmm11 vmovdqa XMMWORD PTR[(64-128)+rax],xmm0 vpaddd xmm14,xmm14,xmm0 vpxor xmm1,xmm1,XMMWORD PTR[((208-128))+rax] vpsrld xmm9,xmm10,27 vpxor xmm6,xmm6,xmm12 vpxor xmm1,xmm1,xmm3 vpslld xmm7,xmm11,30 vpor xmm8,xmm8,xmm9 vpaddd xmm14,xmm14,xmm6 vpsrld xmm5,xmm1,31 vpaddd xmm1,xmm1,xmm1 vpsrld xmm11,xmm11,2 vpaddd xmm14,xmm14,xmm8 vpor xmm1,xmm1,xmm5 vpor xmm11,xmm11,xmm7 vpxor xmm2,xmm2,xmm4 vmovdqa xmm4,XMMWORD PTR[((128-128))+rax] vpslld xmm8,xmm14,5 vpaddd xmm13,xmm13,xmm15 vpxor xmm6,xmm12,xmm10 vmovdqa XMMWORD PTR[(80-128)+rax],xmm1 vpaddd xmm13,xmm13,xmm1 vpxor xmm2,xmm2,XMMWORD PTR[((224-128))+rax] vpsrld xmm9,xmm14,27 vpxor xmm6,xmm6,xmm11 vpxor xmm2,xmm2,xmm4 vpslld xmm7,xmm10,30 vpor xmm8,xmm8,xmm9 vpaddd xmm13,xmm13,xmm6 vpsrld xmm5,xmm2,31 vpaddd xmm2,xmm2,xmm2 vpsrld xmm10,xmm10,2 vpaddd xmm13,xmm13,xmm8 vpor xmm2,xmm2,xmm5 vpor xmm10,xmm10,xmm7 vpxor xmm3,xmm3,xmm0 vmovdqa xmm0,XMMWORD PTR[((144-128))+rax] vpslld xmm8,xmm13,5 vpaddd xmm12,xmm12,xmm15 vpxor xmm6,xmm11,xmm14 vmovdqa XMMWORD PTR[(96-128)+rax],xmm2 vpaddd xmm12,xmm12,xmm2 vpxor xmm3,xmm3,XMMWORD PTR[((240-128))+rax] vpsrld xmm9,xmm13,27 vpxor xmm6,xmm6,xmm10 vpxor xmm3,xmm3,xmm0 vpslld xmm7,xmm14,30 vpor xmm8,xmm8,xmm9 vpaddd xmm12,xmm12,xmm6 vpsrld xmm5,xmm3,31 vpaddd xmm3,xmm3,xmm3 vpsrld xmm14,xmm14,2 vpaddd xmm12,xmm12,xmm8 vpor xmm3,xmm3,xmm5 vpor xmm14,xmm14,xmm7 vpxor xmm4,xmm4,xmm1 vmovdqa xmm1,XMMWORD PTR[((160-128))+rax] vpslld xmm8,xmm12,5 vpaddd xmm11,xmm11,xmm15 vpxor xmm6,xmm10,xmm13 vmovdqa XMMWORD PTR[(112-128)+rax],xmm3 vpaddd xmm11,xmm11,xmm3 vpxor xmm4,xmm4,XMMWORD PTR[((0-128))+rax] vpsrld xmm9,xmm12,27 vpxor xmm6,xmm6,xmm14 vpxor xmm4,xmm4,xmm1 vpslld xmm7,xmm13,30 vpor xmm8,xmm8,xmm9 vpaddd xmm11,xmm11,xmm6 vpsrld xmm5,xmm4,31 vpaddd xmm4,xmm4,xmm4 vpsrld xmm13,xmm13,2 vpaddd xmm11,xmm11,xmm8 vpor xmm4,xmm4,xmm5 vpor xmm13,xmm13,xmm7 vpxor xmm0,xmm0,xmm2 vmovdqa xmm2,XMMWORD PTR[((176-128))+rax] vpslld xmm8,xmm11,5 vpaddd xmm10,xmm10,xmm15 vpxor xmm6,xmm14,xmm12 vmovdqa XMMWORD PTR[(128-128)+rax],xmm4 vpaddd xmm10,xmm10,xmm4 vpxor xmm0,xmm0,XMMWORD PTR[((16-128))+rax] vpsrld xmm9,xmm11,27 vpxor xmm6,xmm6,xmm13 vpxor xmm0,xmm0,xmm2 vpslld xmm7,xmm12,30 vpor xmm8,xmm8,xmm9 vpaddd xmm10,xmm10,xmm6 vpsrld xmm5,xmm0,31 vpaddd xmm0,xmm0,xmm0 vpsrld xmm12,xmm12,2 vpaddd xmm10,xmm10,xmm8 vpor xmm0,xmm0,xmm5 vpor xmm12,xmm12,xmm7 vpxor xmm1,xmm1,xmm3 vmovdqa xmm3,XMMWORD PTR[((192-128))+rax] vpslld xmm8,xmm10,5 vpaddd xmm14,xmm14,xmm15 vpxor xmm6,xmm13,xmm11 vmovdqa XMMWORD PTR[(144-128)+rax],xmm0 vpaddd xmm14,xmm14,xmm0 vpxor xmm1,xmm1,XMMWORD PTR[((32-128))+rax] vpsrld xmm9,xmm10,27 vpxor xmm6,xmm6,xmm12 vpxor xmm1,xmm1,xmm3 vpslld xmm7,xmm11,30 vpor xmm8,xmm8,xmm9 vpaddd xmm14,xmm14,xmm6 vpsrld xmm5,xmm1,31 vpaddd xmm1,xmm1,xmm1 vpsrld xmm11,xmm11,2 vpaddd xmm14,xmm14,xmm8 vpor xmm1,xmm1,xmm5 vpor xmm11,xmm11,xmm7 vpxor xmm2,xmm2,xmm4 vmovdqa xmm4,XMMWORD PTR[((208-128))+rax] vpslld xmm8,xmm14,5 vpaddd xmm13,xmm13,xmm15 vpxor xmm6,xmm12,xmm10 vmovdqa XMMWORD PTR[(160-128)+rax],xmm1 vpaddd xmm13,xmm13,xmm1 vpxor xmm2,xmm2,XMMWORD PTR[((48-128))+rax] vpsrld xmm9,xmm14,27 vpxor xmm6,xmm6,xmm11 vpxor xmm2,xmm2,xmm4 vpslld xmm7,xmm10,30 vpor xmm8,xmm8,xmm9 vpaddd xmm13,xmm13,xmm6 vpsrld xmm5,xmm2,31 vpaddd xmm2,xmm2,xmm2 vpsrld xmm10,xmm10,2 vpaddd xmm13,xmm13,xmm8 vpor xmm2,xmm2,xmm5 vpor xmm10,xmm10,xmm7 vpxor xmm3,xmm3,xmm0 vmovdqa xmm0,XMMWORD PTR[((224-128))+rax] vpslld xmm8,xmm13,5 vpaddd xmm12,xmm12,xmm15 vpxor xmm6,xmm11,xmm14 vmovdqa XMMWORD PTR[(176-128)+rax],xmm2 vpaddd xmm12,xmm12,xmm2 vpxor xmm3,xmm3,XMMWORD PTR[((64-128))+rax] vpsrld xmm9,xmm13,27 vpxor xmm6,xmm6,xmm10 vpxor xmm3,xmm3,xmm0 vpslld xmm7,xmm14,30 vpor xmm8,xmm8,xmm9 vpaddd xmm12,xmm12,xmm6 vpsrld xmm5,xmm3,31 vpaddd xmm3,xmm3,xmm3 vpsrld xmm14,xmm14,2 vpaddd xmm12,xmm12,xmm8 vpor xmm3,xmm3,xmm5 vpor xmm14,xmm14,xmm7 vpxor xmm4,xmm4,xmm1 vmovdqa xmm1,XMMWORD PTR[((240-128))+rax] vpslld xmm8,xmm12,5 vpaddd xmm11,xmm11,xmm15 vpxor xmm6,xmm10,xmm13 vmovdqa XMMWORD PTR[(192-128)+rax],xmm3 vpaddd xmm11,xmm11,xmm3 vpxor xmm4,xmm4,XMMWORD PTR[((80-128))+rax] vpsrld xmm9,xmm12,27 vpxor xmm6,xmm6,xmm14 vpxor xmm4,xmm4,xmm1 vpslld xmm7,xmm13,30 vpor xmm8,xmm8,xmm9 vpaddd xmm11,xmm11,xmm6 vpsrld xmm5,xmm4,31 vpaddd xmm4,xmm4,xmm4 vpsrld xmm13,xmm13,2 vpaddd xmm11,xmm11,xmm8 vpor xmm4,xmm4,xmm5 vpor xmm13,xmm13,xmm7 vpxor xmm0,xmm0,xmm2 vmovdqa xmm2,XMMWORD PTR[((0-128))+rax] vpslld xmm8,xmm11,5 vpaddd xmm10,xmm10,xmm15 vpxor xmm6,xmm14,xmm12 vmovdqa XMMWORD PTR[(208-128)+rax],xmm4 vpaddd xmm10,xmm10,xmm4 vpxor xmm0,xmm0,XMMWORD PTR[((96-128))+rax] vpsrld xmm9,xmm11,27 vpxor xmm6,xmm6,xmm13 vpxor xmm0,xmm0,xmm2 vpslld xmm7,xmm12,30 vpor xmm8,xmm8,xmm9 vpaddd xmm10,xmm10,xmm6 vpsrld xmm5,xmm0,31 vpaddd xmm0,xmm0,xmm0 vpsrld xmm12,xmm12,2 vpaddd xmm10,xmm10,xmm8 vpor xmm0,xmm0,xmm5 vpor xmm12,xmm12,xmm7 vpxor xmm1,xmm1,xmm3 vmovdqa xmm3,XMMWORD PTR[((16-128))+rax] vpslld xmm8,xmm10,5 vpaddd xmm14,xmm14,xmm15 vpxor xmm6,xmm13,xmm11 vmovdqa XMMWORD PTR[(224-128)+rax],xmm0 vpaddd xmm14,xmm14,xmm0 vpxor xmm1,xmm1,XMMWORD PTR[((112-128))+rax] vpsrld xmm9,xmm10,27 vpxor xmm6,xmm6,xmm12 vpxor xmm1,xmm1,xmm3 vpslld xmm7,xmm11,30 vpor xmm8,xmm8,xmm9 vpaddd xmm14,xmm14,xmm6 vpsrld xmm5,xmm1,31 vpaddd xmm1,xmm1,xmm1 vpsrld xmm11,xmm11,2 vpaddd xmm14,xmm14,xmm8 vpor xmm1,xmm1,xmm5 vpor xmm11,xmm11,xmm7 vpxor xmm2,xmm2,xmm4 vmovdqa xmm4,XMMWORD PTR[((32-128))+rax] vpslld xmm8,xmm14,5 vpaddd xmm13,xmm13,xmm15 vpxor xmm6,xmm12,xmm10 vmovdqa XMMWORD PTR[(240-128)+rax],xmm1 vpaddd xmm13,xmm13,xmm1 vpxor xmm2,xmm2,XMMWORD PTR[((128-128))+rax] vpsrld xmm9,xmm14,27 vpxor xmm6,xmm6,xmm11 vpxor xmm2,xmm2,xmm4 vpslld xmm7,xmm10,30 vpor xmm8,xmm8,xmm9 vpaddd xmm13,xmm13,xmm6 vpsrld xmm5,xmm2,31 vpaddd xmm2,xmm2,xmm2 vpsrld xmm10,xmm10,2 vpaddd xmm13,xmm13,xmm8 vpor xmm2,xmm2,xmm5 vpor xmm10,xmm10,xmm7 vpxor xmm3,xmm3,xmm0 vmovdqa xmm0,XMMWORD PTR[((48-128))+rax] vpslld xmm8,xmm13,5 vpaddd xmm12,xmm12,xmm15 vpxor xmm6,xmm11,xmm14 vmovdqa XMMWORD PTR[(0-128)+rax],xmm2 vpaddd xmm12,xmm12,xmm2 vpxor xmm3,xmm3,XMMWORD PTR[((144-128))+rax] vpsrld xmm9,xmm13,27 vpxor xmm6,xmm6,xmm10 vpxor xmm3,xmm3,xmm0 vpslld xmm7,xmm14,30 vpor xmm8,xmm8,xmm9 vpaddd xmm12,xmm12,xmm6 vpsrld xmm5,xmm3,31 vpaddd xmm3,xmm3,xmm3 vpsrld xmm14,xmm14,2 vpaddd xmm12,xmm12,xmm8 vpor xmm3,xmm3,xmm5 vpor xmm14,xmm14,xmm7 vpxor xmm4,xmm4,xmm1 vmovdqa xmm1,XMMWORD PTR[((64-128))+rax] vpslld xmm8,xmm12,5 vpaddd xmm11,xmm11,xmm15 vpxor xmm6,xmm10,xmm13 vmovdqa XMMWORD PTR[(16-128)+rax],xmm3 vpaddd xmm11,xmm11,xmm3 vpxor xmm4,xmm4,XMMWORD PTR[((160-128))+rax] vpsrld xmm9,xmm12,27 vpxor xmm6,xmm6,xmm14 vpxor xmm4,xmm4,xmm1 vpslld xmm7,xmm13,30 vpor xmm8,xmm8,xmm9 vpaddd xmm11,xmm11,xmm6 vpsrld xmm5,xmm4,31 vpaddd xmm4,xmm4,xmm4 vpsrld xmm13,xmm13,2 vpaddd xmm11,xmm11,xmm8 vpor xmm4,xmm4,xmm5 vpor xmm13,xmm13,xmm7 vpxor xmm0,xmm0,xmm2 vmovdqa xmm2,XMMWORD PTR[((80-128))+rax] vpslld xmm8,xmm11,5 vpaddd xmm10,xmm10,xmm15 vpxor xmm6,xmm14,xmm12 vmovdqa XMMWORD PTR[(32-128)+rax],xmm4 vpaddd xmm10,xmm10,xmm4 vpxor xmm0,xmm0,XMMWORD PTR[((176-128))+rax] vpsrld xmm9,xmm11,27 vpxor xmm6,xmm6,xmm13 vpxor xmm0,xmm0,xmm2 vpslld xmm7,xmm12,30 vpor xmm8,xmm8,xmm9 vpaddd xmm10,xmm10,xmm6 vpsrld xmm5,xmm0,31 vpaddd xmm0,xmm0,xmm0 vpsrld xmm12,xmm12,2 vpaddd xmm10,xmm10,xmm8 vpor xmm0,xmm0,xmm5 vpor xmm12,xmm12,xmm7 vpxor xmm1,xmm1,xmm3 vmovdqa xmm3,XMMWORD PTR[((96-128))+rax] vpslld xmm8,xmm10,5 vpaddd xmm14,xmm14,xmm15 vpxor xmm6,xmm13,xmm11 vmovdqa XMMWORD PTR[(48-128)+rax],xmm0 vpaddd xmm14,xmm14,xmm0 vpxor xmm1,xmm1,XMMWORD PTR[((192-128))+rax] vpsrld xmm9,xmm10,27 vpxor xmm6,xmm6,xmm12 vpxor xmm1,xmm1,xmm3 vpslld xmm7,xmm11,30 vpor xmm8,xmm8,xmm9 vpaddd xmm14,xmm14,xmm6 vpsrld xmm5,xmm1,31 vpaddd xmm1,xmm1,xmm1 vpsrld xmm11,xmm11,2 vpaddd xmm14,xmm14,xmm8 vpor xmm1,xmm1,xmm5 vpor xmm11,xmm11,xmm7 vpxor xmm2,xmm2,xmm4 vmovdqa xmm4,XMMWORD PTR[((112-128))+rax] vpslld xmm8,xmm14,5 vpaddd xmm13,xmm13,xmm15 vpxor xmm6,xmm12,xmm10 vmovdqa XMMWORD PTR[(64-128)+rax],xmm1 vpaddd xmm13,xmm13,xmm1 vpxor xmm2,xmm2,XMMWORD PTR[((208-128))+rax] vpsrld xmm9,xmm14,27 vpxor xmm6,xmm6,xmm11 vpxor xmm2,xmm2,xmm4 vpslld xmm7,xmm10,30 vpor xmm8,xmm8,xmm9 vpaddd xmm13,xmm13,xmm6 vpsrld xmm5,xmm2,31 vpaddd xmm2,xmm2,xmm2 vpsrld xmm10,xmm10,2 vpaddd xmm13,xmm13,xmm8 vpor xmm2,xmm2,xmm5 vpor xmm10,xmm10,xmm7 vpxor xmm3,xmm3,xmm0 vmovdqa xmm0,XMMWORD PTR[((128-128))+rax] vpslld xmm8,xmm13,5 vpaddd xmm12,xmm12,xmm15 vpxor xmm6,xmm11,xmm14 vmovdqa XMMWORD PTR[(80-128)+rax],xmm2 vpaddd xmm12,xmm12,xmm2 vpxor xmm3,xmm3,XMMWORD PTR[((224-128))+rax] vpsrld xmm9,xmm13,27 vpxor xmm6,xmm6,xmm10 vpxor xmm3,xmm3,xmm0 vpslld xmm7,xmm14,30 vpor xmm8,xmm8,xmm9 vpaddd xmm12,xmm12,xmm6 vpsrld xmm5,xmm3,31 vpaddd xmm3,xmm3,xmm3 vpsrld xmm14,xmm14,2 vpaddd xmm12,xmm12,xmm8 vpor xmm3,xmm3,xmm5 vpor xmm14,xmm14,xmm7 vpxor xmm4,xmm4,xmm1 vmovdqa xmm1,XMMWORD PTR[((144-128))+rax] vpslld xmm8,xmm12,5 vpaddd xmm11,xmm11,xmm15 vpxor xmm6,xmm10,xmm13 vmovdqa XMMWORD PTR[(96-128)+rax],xmm3 vpaddd xmm11,xmm11,xmm3 vpxor xmm4,xmm4,XMMWORD PTR[((240-128))+rax] vpsrld xmm9,xmm12,27 vpxor xmm6,xmm6,xmm14 vpxor xmm4,xmm4,xmm1 vpslld xmm7,xmm13,30 vpor xmm8,xmm8,xmm9 vpaddd xmm11,xmm11,xmm6 vpsrld xmm5,xmm4,31 vpaddd xmm4,xmm4,xmm4 vpsrld xmm13,xmm13,2 vpaddd xmm11,xmm11,xmm8 vpor xmm4,xmm4,xmm5 vpor xmm13,xmm13,xmm7 vpxor xmm0,xmm0,xmm2 vmovdqa xmm2,XMMWORD PTR[((160-128))+rax] vpslld xmm8,xmm11,5 vpaddd xmm10,xmm10,xmm15 vpxor xmm6,xmm14,xmm12 vmovdqa XMMWORD PTR[(112-128)+rax],xmm4 vpaddd xmm10,xmm10,xmm4 vpxor xmm0,xmm0,XMMWORD PTR[((0-128))+rax] vpsrld xmm9,xmm11,27 vpxor xmm6,xmm6,xmm13 vpxor xmm0,xmm0,xmm2 vpslld xmm7,xmm12,30 vpor xmm8,xmm8,xmm9 vpaddd xmm10,xmm10,xmm6 vpsrld xmm5,xmm0,31 vpaddd xmm0,xmm0,xmm0 vpsrld xmm12,xmm12,2 vpaddd xmm10,xmm10,xmm8 vpor xmm0,xmm0,xmm5 vpor xmm12,xmm12,xmm7 vmovdqa xmm15,XMMWORD PTR[32+rbp] vpxor xmm1,xmm1,xmm3 vmovdqa xmm3,XMMWORD PTR[((176-128))+rax] vpaddd xmm14,xmm14,xmm15 vpslld xmm8,xmm10,5 vpand xmm7,xmm13,xmm12 vpxor xmm1,xmm1,XMMWORD PTR[((16-128))+rax] vpaddd xmm14,xmm14,xmm7 vpsrld xmm9,xmm10,27 vpxor xmm6,xmm13,xmm12 vpxor xmm1,xmm1,xmm3 vmovdqu XMMWORD PTR[(128-128)+rax],xmm0 vpaddd xmm14,xmm14,xmm0 vpor xmm8,xmm8,xmm9 vpsrld xmm5,xmm1,31 vpand xmm6,xmm6,xmm11 vpaddd xmm1,xmm1,xmm1 vpslld xmm7,xmm11,30 vpaddd xmm14,xmm14,xmm6 vpsrld xmm11,xmm11,2 vpaddd xmm14,xmm14,xmm8 vpor xmm1,xmm1,xmm5 vpor xmm11,xmm11,xmm7 vpxor xmm2,xmm2,xmm4 vmovdqa xmm4,XMMWORD PTR[((192-128))+rax] vpaddd xmm13,xmm13,xmm15 vpslld xmm8,xmm14,5 vpand xmm7,xmm12,xmm11 vpxor xmm2,xmm2,XMMWORD PTR[((32-128))+rax] vpaddd xmm13,xmm13,xmm7 vpsrld xmm9,xmm14,27 vpxor xmm6,xmm12,xmm11 vpxor xmm2,xmm2,xmm4 vmovdqu XMMWORD PTR[(144-128)+rax],xmm1 vpaddd xmm13,xmm13,xmm1 vpor xmm8,xmm8,xmm9 vpsrld xmm5,xmm2,31 vpand xmm6,xmm6,xmm10 vpaddd xmm2,xmm2,xmm2 vpslld xmm7,xmm10,30 vpaddd xmm13,xmm13,xmm6 vpsrld xmm10,xmm10,2 vpaddd xmm13,xmm13,xmm8 vpor xmm2,xmm2,xmm5 vpor xmm10,xmm10,xmm7 vpxor xmm3,xmm3,xmm0 vmovdqa xmm0,XMMWORD PTR[((208-128))+rax] vpaddd xmm12,xmm12,xmm15 vpslld xmm8,xmm13,5 vpand xmm7,xmm11,xmm10 vpxor xmm3,xmm3,XMMWORD PTR[((48-128))+rax] vpaddd xmm12,xmm12,xmm7 vpsrld xmm9,xmm13,27 vpxor xmm6,xmm11,xmm10 vpxor xmm3,xmm3,xmm0 vmovdqu XMMWORD PTR[(160-128)+rax],xmm2 vpaddd xmm12,xmm12,xmm2 vpor xmm8,xmm8,xmm9 vpsrld xmm5,xmm3,31 vpand xmm6,xmm6,xmm14 vpaddd xmm3,xmm3,xmm3 vpslld xmm7,xmm14,30 vpaddd xmm12,xmm12,xmm6 vpsrld xmm14,xmm14,2 vpaddd xmm12,xmm12,xmm8 vpor xmm3,xmm3,xmm5 vpor xmm14,xmm14,xmm7 vpxor xmm4,xmm4,xmm1 vmovdqa xmm1,XMMWORD PTR[((224-128))+rax] vpaddd xmm11,xmm11,xmm15 vpslld xmm8,xmm12,5 vpand xmm7,xmm10,xmm14 vpxor xmm4,xmm4,XMMWORD PTR[((64-128))+rax] vpaddd xmm11,xmm11,xmm7 vpsrld xmm9,xmm12,27 vpxor xmm6,xmm10,xmm14 vpxor xmm4,xmm4,xmm1 vmovdqu XMMWORD PTR[(176-128)+rax],xmm3 vpaddd xmm11,xmm11,xmm3 vpor xmm8,xmm8,xmm9 vpsrld xmm5,xmm4,31 vpand xmm6,xmm6,xmm13 vpaddd xmm4,xmm4,xmm4 vpslld xmm7,xmm13,30 vpaddd xmm11,xmm11,xmm6 vpsrld xmm13,xmm13,2 vpaddd xmm11,xmm11,xmm8 vpor xmm4,xmm4,xmm5 vpor xmm13,xmm13,xmm7 vpxor xmm0,xmm0,xmm2 vmovdqa xmm2,XMMWORD PTR[((240-128))+rax] vpaddd xmm10,xmm10,xmm15 vpslld xmm8,xmm11,5 vpand xmm7,xmm14,xmm13 vpxor xmm0,xmm0,XMMWORD PTR[((80-128))+rax] vpaddd xmm10,xmm10,xmm7 vpsrld xmm9,xmm11,27 vpxor xmm6,xmm14,xmm13 vpxor xmm0,xmm0,xmm2 vmovdqu XMMWORD PTR[(192-128)+rax],xmm4 vpaddd xmm10,xmm10,xmm4 vpor xmm8,xmm8,xmm9 vpsrld xmm5,xmm0,31 vpand xmm6,xmm6,xmm12 vpaddd xmm0,xmm0,xmm0 vpslld xmm7,xmm12,30 vpaddd xmm10,xmm10,xmm6 vpsrld xmm12,xmm12,2 vpaddd xmm10,xmm10,xmm8 vpor xmm0,xmm0,xmm5 vpor xmm12,xmm12,xmm7 vpxor xmm1,xmm1,xmm3 vmovdqa xmm3,XMMWORD PTR[((0-128))+rax] vpaddd xmm14,xmm14,xmm15 vpslld xmm8,xmm10,5 vpand xmm7,xmm13,xmm12 vpxor xmm1,xmm1,XMMWORD PTR[((96-128))+rax] vpaddd xmm14,xmm14,xmm7 vpsrld xmm9,xmm10,27 vpxor xmm6,xmm13,xmm12 vpxor xmm1,xmm1,xmm3 vmovdqu XMMWORD PTR[(208-128)+rax],xmm0 vpaddd xmm14,xmm14,xmm0 vpor xmm8,xmm8,xmm9 vpsrld xmm5,xmm1,31 vpand xmm6,xmm6,xmm11 vpaddd xmm1,xmm1,xmm1 vpslld xmm7,xmm11,30 vpaddd xmm14,xmm14,xmm6 vpsrld xmm11,xmm11,2 vpaddd xmm14,xmm14,xmm8 vpor xmm1,xmm1,xmm5 vpor xmm11,xmm11,xmm7 vpxor xmm2,xmm2,xmm4 vmovdqa xmm4,XMMWORD PTR[((16-128))+rax] vpaddd xmm13,xmm13,xmm15 vpslld xmm8,xmm14,5 vpand xmm7,xmm12,xmm11 vpxor xmm2,xmm2,XMMWORD PTR[((112-128))+rax] vpaddd xmm13,xmm13,xmm7 vpsrld xmm9,xmm14,27 vpxor xmm6,xmm12,xmm11 vpxor xmm2,xmm2,xmm4 vmovdqu XMMWORD PTR[(224-128)+rax],xmm1 vpaddd xmm13,xmm13,xmm1 vpor xmm8,xmm8,xmm9 vpsrld xmm5,xmm2,31 vpand xmm6,xmm6,xmm10 vpaddd xmm2,xmm2,xmm2 vpslld xmm7,xmm10,30 vpaddd xmm13,xmm13,xmm6 vpsrld xmm10,xmm10,2 vpaddd xmm13,xmm13,xmm8 vpor xmm2,xmm2,xmm5 vpor xmm10,xmm10,xmm7 vpxor xmm3,xmm3,xmm0 vmovdqa xmm0,XMMWORD PTR[((32-128))+rax] vpaddd xmm12,xmm12,xmm15 vpslld xmm8,xmm13,5 vpand xmm7,xmm11,xmm10 vpxor xmm3,xmm3,XMMWORD PTR[((128-128))+rax] vpaddd xmm12,xmm12,xmm7 vpsrld xmm9,xmm13,27 vpxor xmm6,xmm11,xmm10 vpxor xmm3,xmm3,xmm0 vmovdqu XMMWORD PTR[(240-128)+rax],xmm2 vpaddd xmm12,xmm12,xmm2 vpor xmm8,xmm8,xmm9 vpsrld xmm5,xmm3,31 vpand xmm6,xmm6,xmm14 vpaddd xmm3,xmm3,xmm3 vpslld xmm7,xmm14,30 vpaddd xmm12,xmm12,xmm6 vpsrld xmm14,xmm14,2 vpaddd xmm12,xmm12,xmm8 vpor xmm3,xmm3,xmm5 vpor xmm14,xmm14,xmm7 vpxor xmm4,xmm4,xmm1 vmovdqa xmm1,XMMWORD PTR[((48-128))+rax] vpaddd xmm11,xmm11,xmm15 vpslld xmm8,xmm12,5 vpand xmm7,xmm10,xmm14 vpxor xmm4,xmm4,XMMWORD PTR[((144-128))+rax] vpaddd xmm11,xmm11,xmm7 vpsrld xmm9,xmm12,27 vpxor xmm6,xmm10,xmm14 vpxor xmm4,xmm4,xmm1 vmovdqu XMMWORD PTR[(0-128)+rax],xmm3 vpaddd xmm11,xmm11,xmm3 vpor xmm8,xmm8,xmm9 vpsrld xmm5,xmm4,31 vpand xmm6,xmm6,xmm13 vpaddd xmm4,xmm4,xmm4 vpslld xmm7,xmm13,30 vpaddd xmm11,xmm11,xmm6 vpsrld xmm13,xmm13,2 vpaddd xmm11,xmm11,xmm8 vpor xmm4,xmm4,xmm5 vpor xmm13,xmm13,xmm7 vpxor xmm0,xmm0,xmm2 vmovdqa xmm2,XMMWORD PTR[((64-128))+rax] vpaddd xmm10,xmm10,xmm15 vpslld xmm8,xmm11,5 vpand xmm7,xmm14,xmm13 vpxor xmm0,xmm0,XMMWORD PTR[((160-128))+rax] vpaddd xmm10,xmm10,xmm7 vpsrld xmm9,xmm11,27 vpxor xmm6,xmm14,xmm13 vpxor xmm0,xmm0,xmm2 vmovdqu XMMWORD PTR[(16-128)+rax],xmm4 vpaddd xmm10,xmm10,xmm4 vpor xmm8,xmm8,xmm9 vpsrld xmm5,xmm0,31 vpand xmm6,xmm6,xmm12 vpaddd xmm0,xmm0,xmm0 vpslld xmm7,xmm12,30 vpaddd xmm10,xmm10,xmm6 vpsrld xmm12,xmm12,2 vpaddd xmm10,xmm10,xmm8 vpor xmm0,xmm0,xmm5 vpor xmm12,xmm12,xmm7 vpxor xmm1,xmm1,xmm3 vmovdqa xmm3,XMMWORD PTR[((80-128))+rax] vpaddd xmm14,xmm14,xmm15 vpslld xmm8,xmm10,5 vpand xmm7,xmm13,xmm12 vpxor xmm1,xmm1,XMMWORD PTR[((176-128))+rax] vpaddd xmm14,xmm14,xmm7 vpsrld xmm9,xmm10,27 vpxor xmm6,xmm13,xmm12 vpxor xmm1,xmm1,xmm3 vmovdqu XMMWORD PTR[(32-128)+rax],xmm0 vpaddd xmm14,xmm14,xmm0 vpor xmm8,xmm8,xmm9 vpsrld xmm5,xmm1,31 vpand xmm6,xmm6,xmm11 vpaddd xmm1,xmm1,xmm1 vpslld xmm7,xmm11,30 vpaddd xmm14,xmm14,xmm6 vpsrld xmm11,xmm11,2 vpaddd xmm14,xmm14,xmm8 vpor xmm1,xmm1,xmm5 vpor xmm11,xmm11,xmm7 vpxor xmm2,xmm2,xmm4 vmovdqa xmm4,XMMWORD PTR[((96-128))+rax] vpaddd xmm13,xmm13,xmm15 vpslld xmm8,xmm14,5 vpand xmm7,xmm12,xmm11 vpxor xmm2,xmm2,XMMWORD PTR[((192-128))+rax] vpaddd xmm13,xmm13,xmm7 vpsrld xmm9,xmm14,27 vpxor xmm6,xmm12,xmm11 vpxor xmm2,xmm2,xmm4 vmovdqu XMMWORD PTR[(48-128)+rax],xmm1 vpaddd xmm13,xmm13,xmm1 vpor xmm8,xmm8,xmm9 vpsrld xmm5,xmm2,31 vpand xmm6,xmm6,xmm10 vpaddd xmm2,xmm2,xmm2 vpslld xmm7,xmm10,30 vpaddd xmm13,xmm13,xmm6 vpsrld xmm10,xmm10,2 vpaddd xmm13,xmm13,xmm8 vpor xmm2,xmm2,xmm5 vpor xmm10,xmm10,xmm7 vpxor xmm3,xmm3,xmm0 vmovdqa xmm0,XMMWORD PTR[((112-128))+rax] vpaddd xmm12,xmm12,xmm15 vpslld xmm8,xmm13,5 vpand xmm7,xmm11,xmm10 vpxor xmm3,xmm3,XMMWORD PTR[((208-128))+rax] vpaddd xmm12,xmm12,xmm7 vpsrld xmm9,xmm13,27 vpxor xmm6,xmm11,xmm10 vpxor xmm3,xmm3,xmm0 vmovdqu XMMWORD PTR[(64-128)+rax],xmm2 vpaddd xmm12,xmm12,xmm2 vpor xmm8,xmm8,xmm9 vpsrld xmm5,xmm3,31 vpand xmm6,xmm6,xmm14 vpaddd xmm3,xmm3,xmm3 vpslld xmm7,xmm14,30 vpaddd xmm12,xmm12,xmm6 vpsrld xmm14,xmm14,2 vpaddd xmm12,xmm12,xmm8 vpor xmm3,xmm3,xmm5 vpor xmm14,xmm14,xmm7 vpxor xmm4,xmm4,xmm1 vmovdqa xmm1,XMMWORD PTR[((128-128))+rax] vpaddd xmm11,xmm11,xmm15 vpslld xmm8,xmm12,5 vpand xmm7,xmm10,xmm14 vpxor xmm4,xmm4,XMMWORD PTR[((224-128))+rax] vpaddd xmm11,xmm11,xmm7 vpsrld xmm9,xmm12,27 vpxor xmm6,xmm10,xmm14 vpxor xmm4,xmm4,xmm1 vmovdqu XMMWORD PTR[(80-128)+rax],xmm3 vpaddd xmm11,xmm11,xmm3 vpor xmm8,xmm8,xmm9 vpsrld xmm5,xmm4,31 vpand xmm6,xmm6,xmm13 vpaddd xmm4,xmm4,xmm4 vpslld xmm7,xmm13,30 vpaddd xmm11,xmm11,xmm6 vpsrld xmm13,xmm13,2 vpaddd xmm11,xmm11,xmm8 vpor xmm4,xmm4,xmm5 vpor xmm13,xmm13,xmm7 vpxor xmm0,xmm0,xmm2 vmovdqa xmm2,XMMWORD PTR[((144-128))+rax] vpaddd xmm10,xmm10,xmm15 vpslld xmm8,xmm11,5 vpand xmm7,xmm14,xmm13 vpxor xmm0,xmm0,XMMWORD PTR[((240-128))+rax] vpaddd xmm10,xmm10,xmm7 vpsrld xmm9,xmm11,27 vpxor xmm6,xmm14,xmm13 vpxor xmm0,xmm0,xmm2 vmovdqu XMMWORD PTR[(96-128)+rax],xmm4 vpaddd xmm10,xmm10,xmm4 vpor xmm8,xmm8,xmm9 vpsrld xmm5,xmm0,31 vpand xmm6,xmm6,xmm12 vpaddd xmm0,xmm0,xmm0 vpslld xmm7,xmm12,30 vpaddd xmm10,xmm10,xmm6 vpsrld xmm12,xmm12,2 vpaddd xmm10,xmm10,xmm8 vpor xmm0,xmm0,xmm5 vpor xmm12,xmm12,xmm7 vpxor xmm1,xmm1,xmm3 vmovdqa xmm3,XMMWORD PTR[((160-128))+rax] vpaddd xmm14,xmm14,xmm15 vpslld xmm8,xmm10,5 vpand xmm7,xmm13,xmm12 vpxor xmm1,xmm1,XMMWORD PTR[((0-128))+rax] vpaddd xmm14,xmm14,xmm7 vpsrld xmm9,xmm10,27 vpxor xmm6,xmm13,xmm12 vpxor xmm1,xmm1,xmm3 vmovdqu XMMWORD PTR[(112-128)+rax],xmm0 vpaddd xmm14,xmm14,xmm0 vpor xmm8,xmm8,xmm9 vpsrld xmm5,xmm1,31 vpand xmm6,xmm6,xmm11 vpaddd xmm1,xmm1,xmm1 vpslld xmm7,xmm11,30 vpaddd xmm14,xmm14,xmm6 vpsrld xmm11,xmm11,2 vpaddd xmm14,xmm14,xmm8 vpor xmm1,xmm1,xmm5 vpor xmm11,xmm11,xmm7 vpxor xmm2,xmm2,xmm4 vmovdqa xmm4,XMMWORD PTR[((176-128))+rax] vpaddd xmm13,xmm13,xmm15 vpslld xmm8,xmm14,5 vpand xmm7,xmm12,xmm11 vpxor xmm2,xmm2,XMMWORD PTR[((16-128))+rax] vpaddd xmm13,xmm13,xmm7 vpsrld xmm9,xmm14,27 vpxor xmm6,xmm12,xmm11 vpxor xmm2,xmm2,xmm4 vmovdqu XMMWORD PTR[(128-128)+rax],xmm1 vpaddd xmm13,xmm13,xmm1 vpor xmm8,xmm8,xmm9 vpsrld xmm5,xmm2,31 vpand xmm6,xmm6,xmm10 vpaddd xmm2,xmm2,xmm2 vpslld xmm7,xmm10,30 vpaddd xmm13,xmm13,xmm6 vpsrld xmm10,xmm10,2 vpaddd xmm13,xmm13,xmm8 vpor xmm2,xmm2,xmm5 vpor xmm10,xmm10,xmm7 vpxor xmm3,xmm3,xmm0 vmovdqa xmm0,XMMWORD PTR[((192-128))+rax] vpaddd xmm12,xmm12,xmm15 vpslld xmm8,xmm13,5 vpand xmm7,xmm11,xmm10 vpxor xmm3,xmm3,XMMWORD PTR[((32-128))+rax] vpaddd xmm12,xmm12,xmm7 vpsrld xmm9,xmm13,27 vpxor xmm6,xmm11,xmm10 vpxor xmm3,xmm3,xmm0 vmovdqu XMMWORD PTR[(144-128)+rax],xmm2 vpaddd xmm12,xmm12,xmm2 vpor xmm8,xmm8,xmm9 vpsrld xmm5,xmm3,31 vpand xmm6,xmm6,xmm14 vpaddd xmm3,xmm3,xmm3 vpslld xmm7,xmm14,30 vpaddd xmm12,xmm12,xmm6 vpsrld xmm14,xmm14,2 vpaddd xmm12,xmm12,xmm8 vpor xmm3,xmm3,xmm5 vpor xmm14,xmm14,xmm7 vpxor xmm4,xmm4,xmm1 vmovdqa xmm1,XMMWORD PTR[((208-128))+rax] vpaddd xmm11,xmm11,xmm15 vpslld xmm8,xmm12,5 vpand xmm7,xmm10,xmm14 vpxor xmm4,xmm4,XMMWORD PTR[((48-128))+rax] vpaddd xmm11,xmm11,xmm7 vpsrld xmm9,xmm12,27 vpxor xmm6,xmm10,xmm14 vpxor xmm4,xmm4,xmm1 vmovdqu XMMWORD PTR[(160-128)+rax],xmm3 vpaddd xmm11,xmm11,xmm3 vpor xmm8,xmm8,xmm9 vpsrld xmm5,xmm4,31 vpand xmm6,xmm6,xmm13 vpaddd xmm4,xmm4,xmm4 vpslld xmm7,xmm13,30 vpaddd xmm11,xmm11,xmm6 vpsrld xmm13,xmm13,2 vpaddd xmm11,xmm11,xmm8 vpor xmm4,xmm4,xmm5 vpor xmm13,xmm13,xmm7 vpxor xmm0,xmm0,xmm2 vmovdqa xmm2,XMMWORD PTR[((224-128))+rax] vpaddd xmm10,xmm10,xmm15 vpslld xmm8,xmm11,5 vpand xmm7,xmm14,xmm13 vpxor xmm0,xmm0,XMMWORD PTR[((64-128))+rax] vpaddd xmm10,xmm10,xmm7 vpsrld xmm9,xmm11,27 vpxor xmm6,xmm14,xmm13 vpxor xmm0,xmm0,xmm2 vmovdqu XMMWORD PTR[(176-128)+rax],xmm4 vpaddd xmm10,xmm10,xmm4 vpor xmm8,xmm8,xmm9 vpsrld xmm5,xmm0,31 vpand xmm6,xmm6,xmm12 vpaddd xmm0,xmm0,xmm0 vpslld xmm7,xmm12,30 vpaddd xmm10,xmm10,xmm6 vpsrld xmm12,xmm12,2 vpaddd xmm10,xmm10,xmm8 vpor xmm0,xmm0,xmm5 vpor xmm12,xmm12,xmm7 vmovdqa xmm15,XMMWORD PTR[64+rbp] vpxor xmm1,xmm1,xmm3 vmovdqa xmm3,XMMWORD PTR[((240-128))+rax] vpslld xmm8,xmm10,5 vpaddd xmm14,xmm14,xmm15 vpxor xmm6,xmm13,xmm11 vmovdqa XMMWORD PTR[(192-128)+rax],xmm0 vpaddd xmm14,xmm14,xmm0 vpxor xmm1,xmm1,XMMWORD PTR[((80-128))+rax] vpsrld xmm9,xmm10,27 vpxor xmm6,xmm6,xmm12 vpxor xmm1,xmm1,xmm3 vpslld xmm7,xmm11,30 vpor xmm8,xmm8,xmm9 vpaddd xmm14,xmm14,xmm6 vpsrld xmm5,xmm1,31 vpaddd xmm1,xmm1,xmm1 vpsrld xmm11,xmm11,2 vpaddd xmm14,xmm14,xmm8 vpor xmm1,xmm1,xmm5 vpor xmm11,xmm11,xmm7 vpxor xmm2,xmm2,xmm4 vmovdqa xmm4,XMMWORD PTR[((0-128))+rax] vpslld xmm8,xmm14,5 vpaddd xmm13,xmm13,xmm15 vpxor xmm6,xmm12,xmm10 vmovdqa XMMWORD PTR[(208-128)+rax],xmm1 vpaddd xmm13,xmm13,xmm1 vpxor xmm2,xmm2,XMMWORD PTR[((96-128))+rax] vpsrld xmm9,xmm14,27 vpxor xmm6,xmm6,xmm11 vpxor xmm2,xmm2,xmm4 vpslld xmm7,xmm10,30 vpor xmm8,xmm8,xmm9 vpaddd xmm13,xmm13,xmm6 vpsrld xmm5,xmm2,31 vpaddd xmm2,xmm2,xmm2 vpsrld xmm10,xmm10,2 vpaddd xmm13,xmm13,xmm8 vpor xmm2,xmm2,xmm5 vpor xmm10,xmm10,xmm7 vpxor xmm3,xmm3,xmm0 vmovdqa xmm0,XMMWORD PTR[((16-128))+rax] vpslld xmm8,xmm13,5 vpaddd xmm12,xmm12,xmm15 vpxor xmm6,xmm11,xmm14 vmovdqa XMMWORD PTR[(224-128)+rax],xmm2 vpaddd xmm12,xmm12,xmm2 vpxor xmm3,xmm3,XMMWORD PTR[((112-128))+rax] vpsrld xmm9,xmm13,27 vpxor xmm6,xmm6,xmm10 vpxor xmm3,xmm3,xmm0 vpslld xmm7,xmm14,30 vpor xmm8,xmm8,xmm9 vpaddd xmm12,xmm12,xmm6 vpsrld xmm5,xmm3,31 vpaddd xmm3,xmm3,xmm3 vpsrld xmm14,xmm14,2 vpaddd xmm12,xmm12,xmm8 vpor xmm3,xmm3,xmm5 vpor xmm14,xmm14,xmm7 vpxor xmm4,xmm4,xmm1 vmovdqa xmm1,XMMWORD PTR[((32-128))+rax] vpslld xmm8,xmm12,5 vpaddd xmm11,xmm11,xmm15 vpxor xmm6,xmm10,xmm13 vmovdqa XMMWORD PTR[(240-128)+rax],xmm3 vpaddd xmm11,xmm11,xmm3 vpxor xmm4,xmm4,XMMWORD PTR[((128-128))+rax] vpsrld xmm9,xmm12,27 vpxor xmm6,xmm6,xmm14 vpxor xmm4,xmm4,xmm1 vpslld xmm7,xmm13,30 vpor xmm8,xmm8,xmm9 vpaddd xmm11,xmm11,xmm6 vpsrld xmm5,xmm4,31 vpaddd xmm4,xmm4,xmm4 vpsrld xmm13,xmm13,2 vpaddd xmm11,xmm11,xmm8 vpor xmm4,xmm4,xmm5 vpor xmm13,xmm13,xmm7 vpxor xmm0,xmm0,xmm2 vmovdqa xmm2,XMMWORD PTR[((48-128))+rax] vpslld xmm8,xmm11,5 vpaddd xmm10,xmm10,xmm15 vpxor xmm6,xmm14,xmm12 vmovdqa XMMWORD PTR[(0-128)+rax],xmm4 vpaddd xmm10,xmm10,xmm4 vpxor xmm0,xmm0,XMMWORD PTR[((144-128))+rax] vpsrld xmm9,xmm11,27 vpxor xmm6,xmm6,xmm13 vpxor xmm0,xmm0,xmm2 vpslld xmm7,xmm12,30 vpor xmm8,xmm8,xmm9 vpaddd xmm10,xmm10,xmm6 vpsrld xmm5,xmm0,31 vpaddd xmm0,xmm0,xmm0 vpsrld xmm12,xmm12,2 vpaddd xmm10,xmm10,xmm8 vpor xmm0,xmm0,xmm5 vpor xmm12,xmm12,xmm7 vpxor xmm1,xmm1,xmm3 vmovdqa xmm3,XMMWORD PTR[((64-128))+rax] vpslld xmm8,xmm10,5 vpaddd xmm14,xmm14,xmm15 vpxor xmm6,xmm13,xmm11 vmovdqa XMMWORD PTR[(16-128)+rax],xmm0 vpaddd xmm14,xmm14,xmm0 vpxor xmm1,xmm1,XMMWORD PTR[((160-128))+rax] vpsrld xmm9,xmm10,27 vpxor xmm6,xmm6,xmm12 vpxor xmm1,xmm1,xmm3 vpslld xmm7,xmm11,30 vpor xmm8,xmm8,xmm9 vpaddd xmm14,xmm14,xmm6 vpsrld xmm5,xmm1,31 vpaddd xmm1,xmm1,xmm1 vpsrld xmm11,xmm11,2 vpaddd xmm14,xmm14,xmm8 vpor xmm1,xmm1,xmm5 vpor xmm11,xmm11,xmm7 vpxor xmm2,xmm2,xmm4 vmovdqa xmm4,XMMWORD PTR[((80-128))+rax] vpslld xmm8,xmm14,5 vpaddd xmm13,xmm13,xmm15 vpxor xmm6,xmm12,xmm10 vmovdqa XMMWORD PTR[(32-128)+rax],xmm1 vpaddd xmm13,xmm13,xmm1 vpxor xmm2,xmm2,XMMWORD PTR[((176-128))+rax] vpsrld xmm9,xmm14,27 vpxor xmm6,xmm6,xmm11 vpxor xmm2,xmm2,xmm4 vpslld xmm7,xmm10,30 vpor xmm8,xmm8,xmm9 vpaddd xmm13,xmm13,xmm6 vpsrld xmm5,xmm2,31 vpaddd xmm2,xmm2,xmm2 vpsrld xmm10,xmm10,2 vpaddd xmm13,xmm13,xmm8 vpor xmm2,xmm2,xmm5 vpor xmm10,xmm10,xmm7 vpxor xmm3,xmm3,xmm0 vmovdqa xmm0,XMMWORD PTR[((96-128))+rax] vpslld xmm8,xmm13,5 vpaddd xmm12,xmm12,xmm15 vpxor xmm6,xmm11,xmm14 vmovdqa XMMWORD PTR[(48-128)+rax],xmm2 vpaddd xmm12,xmm12,xmm2 vpxor xmm3,xmm3,XMMWORD PTR[((192-128))+rax] vpsrld xmm9,xmm13,27 vpxor xmm6,xmm6,xmm10 vpxor xmm3,xmm3,xmm0 vpslld xmm7,xmm14,30 vpor xmm8,xmm8,xmm9 vpaddd xmm12,xmm12,xmm6 vpsrld xmm5,xmm3,31 vpaddd xmm3,xmm3,xmm3 vpsrld xmm14,xmm14,2 vpaddd xmm12,xmm12,xmm8 vpor xmm3,xmm3,xmm5 vpor xmm14,xmm14,xmm7 vpxor xmm4,xmm4,xmm1 vmovdqa xmm1,XMMWORD PTR[((112-128))+rax] vpslld xmm8,xmm12,5 vpaddd xmm11,xmm11,xmm15 vpxor xmm6,xmm10,xmm13 vmovdqa XMMWORD PTR[(64-128)+rax],xmm3 vpaddd xmm11,xmm11,xmm3 vpxor xmm4,xmm4,XMMWORD PTR[((208-128))+rax] vpsrld xmm9,xmm12,27 vpxor xmm6,xmm6,xmm14 vpxor xmm4,xmm4,xmm1 vpslld xmm7,xmm13,30 vpor xmm8,xmm8,xmm9 vpaddd xmm11,xmm11,xmm6 vpsrld xmm5,xmm4,31 vpaddd xmm4,xmm4,xmm4 vpsrld xmm13,xmm13,2 vpaddd xmm11,xmm11,xmm8 vpor xmm4,xmm4,xmm5 vpor xmm13,xmm13,xmm7 vpxor xmm0,xmm0,xmm2 vmovdqa xmm2,XMMWORD PTR[((128-128))+rax] vpslld xmm8,xmm11,5 vpaddd xmm10,xmm10,xmm15 vpxor xmm6,xmm14,xmm12 vmovdqa XMMWORD PTR[(80-128)+rax],xmm4 vpaddd xmm10,xmm10,xmm4 vpxor xmm0,xmm0,XMMWORD PTR[((224-128))+rax] vpsrld xmm9,xmm11,27 vpxor xmm6,xmm6,xmm13 vpxor xmm0,xmm0,xmm2 vpslld xmm7,xmm12,30 vpor xmm8,xmm8,xmm9 vpaddd xmm10,xmm10,xmm6 vpsrld xmm5,xmm0,31 vpaddd xmm0,xmm0,xmm0 vpsrld xmm12,xmm12,2 vpaddd xmm10,xmm10,xmm8 vpor xmm0,xmm0,xmm5 vpor xmm12,xmm12,xmm7 vpxor xmm1,xmm1,xmm3 vmovdqa xmm3,XMMWORD PTR[((144-128))+rax] vpslld xmm8,xmm10,5 vpaddd xmm14,xmm14,xmm15 vpxor xmm6,xmm13,xmm11 vmovdqa XMMWORD PTR[(96-128)+rax],xmm0 vpaddd xmm14,xmm14,xmm0 vpxor xmm1,xmm1,XMMWORD PTR[((240-128))+rax] vpsrld xmm9,xmm10,27 vpxor xmm6,xmm6,xmm12 vpxor xmm1,xmm1,xmm3 vpslld xmm7,xmm11,30 vpor xmm8,xmm8,xmm9 vpaddd xmm14,xmm14,xmm6 vpsrld xmm5,xmm1,31 vpaddd xmm1,xmm1,xmm1 vpsrld xmm11,xmm11,2 vpaddd xmm14,xmm14,xmm8 vpor xmm1,xmm1,xmm5 vpor xmm11,xmm11,xmm7 vpxor xmm2,xmm2,xmm4 vmovdqa xmm4,XMMWORD PTR[((160-128))+rax] vpslld xmm8,xmm14,5 vpaddd xmm13,xmm13,xmm15 vpxor xmm6,xmm12,xmm10 vmovdqa XMMWORD PTR[(112-128)+rax],xmm1 vpaddd xmm13,xmm13,xmm1 vpxor xmm2,xmm2,XMMWORD PTR[((0-128))+rax] vpsrld xmm9,xmm14,27 vpxor xmm6,xmm6,xmm11 vpxor xmm2,xmm2,xmm4 vpslld xmm7,xmm10,30 vpor xmm8,xmm8,xmm9 vpaddd xmm13,xmm13,xmm6 vpsrld xmm5,xmm2,31 vpaddd xmm2,xmm2,xmm2 vpsrld xmm10,xmm10,2 vpaddd xmm13,xmm13,xmm8 vpor xmm2,xmm2,xmm5 vpor xmm10,xmm10,xmm7 vpxor xmm3,xmm3,xmm0 vmovdqa xmm0,XMMWORD PTR[((176-128))+rax] vpslld xmm8,xmm13,5 vpaddd xmm12,xmm12,xmm15 vpxor xmm6,xmm11,xmm14 vpaddd xmm12,xmm12,xmm2 vpxor xmm3,xmm3,XMMWORD PTR[((16-128))+rax] vpsrld xmm9,xmm13,27 vpxor xmm6,xmm6,xmm10 vpxor xmm3,xmm3,xmm0 vpslld xmm7,xmm14,30 vpor xmm8,xmm8,xmm9 vpaddd xmm12,xmm12,xmm6 vpsrld xmm5,xmm3,31 vpaddd xmm3,xmm3,xmm3 vpsrld xmm14,xmm14,2 vpaddd xmm12,xmm12,xmm8 vpor xmm3,xmm3,xmm5 vpor xmm14,xmm14,xmm7 vpxor xmm4,xmm4,xmm1 vmovdqa xmm1,XMMWORD PTR[((192-128))+rax] vpslld xmm8,xmm12,5 vpaddd xmm11,xmm11,xmm15 vpxor xmm6,xmm10,xmm13 vpaddd xmm11,xmm11,xmm3 vpxor xmm4,xmm4,XMMWORD PTR[((32-128))+rax] vpsrld xmm9,xmm12,27 vpxor xmm6,xmm6,xmm14 vpxor xmm4,xmm4,xmm1 vpslld xmm7,xmm13,30 vpor xmm8,xmm8,xmm9 vpaddd xmm11,xmm11,xmm6 vpsrld xmm5,xmm4,31 vpaddd xmm4,xmm4,xmm4 vpsrld xmm13,xmm13,2 vpaddd xmm11,xmm11,xmm8 vpor xmm4,xmm4,xmm5 vpor xmm13,xmm13,xmm7 vpxor xmm0,xmm0,xmm2 vmovdqa xmm2,XMMWORD PTR[((208-128))+rax] vpslld xmm8,xmm11,5 vpaddd xmm10,xmm10,xmm15 vpxor xmm6,xmm14,xmm12 vpaddd xmm10,xmm10,xmm4 vpxor xmm0,xmm0,XMMWORD PTR[((48-128))+rax] vpsrld xmm9,xmm11,27 vpxor xmm6,xmm6,xmm13 vpxor xmm0,xmm0,xmm2 vpslld xmm7,xmm12,30 vpor xmm8,xmm8,xmm9 vpaddd xmm10,xmm10,xmm6 vpsrld xmm5,xmm0,31 vpaddd xmm0,xmm0,xmm0 vpsrld xmm12,xmm12,2 vpaddd xmm10,xmm10,xmm8 vpor xmm0,xmm0,xmm5 vpor xmm12,xmm12,xmm7 vpxor xmm1,xmm1,xmm3 vmovdqa xmm3,XMMWORD PTR[((224-128))+rax] vpslld xmm8,xmm10,5 vpaddd xmm14,xmm14,xmm15 vpxor xmm6,xmm13,xmm11 vpaddd xmm14,xmm14,xmm0 vpxor xmm1,xmm1,XMMWORD PTR[((64-128))+rax] vpsrld xmm9,xmm10,27 vpxor xmm6,xmm6,xmm12 vpxor xmm1,xmm1,xmm3 vpslld xmm7,xmm11,30 vpor xmm8,xmm8,xmm9 vpaddd xmm14,xmm14,xmm6 vpsrld xmm5,xmm1,31 vpaddd xmm1,xmm1,xmm1 vpsrld xmm11,xmm11,2 vpaddd xmm14,xmm14,xmm8 vpor xmm1,xmm1,xmm5 vpor xmm11,xmm11,xmm7 vpxor xmm2,xmm2,xmm4 vmovdqa xmm4,XMMWORD PTR[((240-128))+rax] vpslld xmm8,xmm14,5 vpaddd xmm13,xmm13,xmm15 vpxor xmm6,xmm12,xmm10 vpaddd xmm13,xmm13,xmm1 vpxor xmm2,xmm2,XMMWORD PTR[((80-128))+rax] vpsrld xmm9,xmm14,27 vpxor xmm6,xmm6,xmm11 vpxor xmm2,xmm2,xmm4 vpslld xmm7,xmm10,30 vpor xmm8,xmm8,xmm9 vpaddd xmm13,xmm13,xmm6 vpsrld xmm5,xmm2,31 vpaddd xmm2,xmm2,xmm2 vpsrld xmm10,xmm10,2 vpaddd xmm13,xmm13,xmm8 vpor xmm2,xmm2,xmm5 vpor xmm10,xmm10,xmm7 vpxor xmm3,xmm3,xmm0 vmovdqa xmm0,XMMWORD PTR[((0-128))+rax] vpslld xmm8,xmm13,5 vpaddd xmm12,xmm12,xmm15 vpxor xmm6,xmm11,xmm14 vpaddd xmm12,xmm12,xmm2 vpxor xmm3,xmm3,XMMWORD PTR[((96-128))+rax] vpsrld xmm9,xmm13,27 vpxor xmm6,xmm6,xmm10 vpxor xmm3,xmm3,xmm0 vpslld xmm7,xmm14,30 vpor xmm8,xmm8,xmm9 vpaddd xmm12,xmm12,xmm6 vpsrld xmm5,xmm3,31 vpaddd xmm3,xmm3,xmm3 vpsrld xmm14,xmm14,2 vpaddd xmm12,xmm12,xmm8 vpor xmm3,xmm3,xmm5 vpor xmm14,xmm14,xmm7 vpxor xmm4,xmm4,xmm1 vmovdqa xmm1,XMMWORD PTR[((16-128))+rax] vpslld xmm8,xmm12,5 vpaddd xmm11,xmm11,xmm15 vpxor xmm6,xmm10,xmm13 vpaddd xmm11,xmm11,xmm3 vpxor xmm4,xmm4,XMMWORD PTR[((112-128))+rax] vpsrld xmm9,xmm12,27 vpxor xmm6,xmm6,xmm14 vpxor xmm4,xmm4,xmm1 vpslld xmm7,xmm13,30 vpor xmm8,xmm8,xmm9 vpaddd xmm11,xmm11,xmm6 vpsrld xmm5,xmm4,31 vpaddd xmm4,xmm4,xmm4 vpsrld xmm13,xmm13,2 vpaddd xmm11,xmm11,xmm8 vpor xmm4,xmm4,xmm5 vpor xmm13,xmm13,xmm7 vpslld xmm8,xmm11,5 vpaddd xmm10,xmm10,xmm15 vpxor xmm6,xmm14,xmm12 vpsrld xmm9,xmm11,27 vpaddd xmm10,xmm10,xmm4 vpxor xmm6,xmm6,xmm13 vpslld xmm7,xmm12,30 vpor xmm8,xmm8,xmm9 vpaddd xmm10,xmm10,xmm6 vpsrld xmm12,xmm12,2 vpaddd xmm10,xmm10,xmm8 vpor xmm12,xmm12,xmm7 mov ecx,1 cmp ecx,DWORD PTR[rbx] cmovge r8,rbp cmp ecx,DWORD PTR[4+rbx] cmovge r9,rbp cmp ecx,DWORD PTR[8+rbx] cmovge r10,rbp cmp ecx,DWORD PTR[12+rbx] cmovge r11,rbp vmovdqu xmm6,XMMWORD PTR[rbx] vpxor xmm8,xmm8,xmm8 vmovdqa xmm7,xmm6 vpcmpgtd xmm7,xmm7,xmm8 vpaddd xmm6,xmm6,xmm7 vpand xmm10,xmm10,xmm7 vpand xmm11,xmm11,xmm7 vpaddd xmm10,xmm10,XMMWORD PTR[rdi] vpand xmm12,xmm12,xmm7 vpaddd xmm11,xmm11,XMMWORD PTR[32+rdi] vpand xmm13,xmm13,xmm7 vpaddd xmm12,xmm12,XMMWORD PTR[64+rdi] vpand xmm14,xmm14,xmm7 vpaddd xmm13,xmm13,XMMWORD PTR[96+rdi] vpaddd xmm14,xmm14,XMMWORD PTR[128+rdi] vmovdqu XMMWORD PTR[rdi],xmm10 vmovdqu XMMWORD PTR[32+rdi],xmm11 vmovdqu XMMWORD PTR[64+rdi],xmm12 vmovdqu XMMWORD PTR[96+rdi],xmm13 vmovdqu XMMWORD PTR[128+rdi],xmm14 vmovdqu XMMWORD PTR[rbx],xmm6 vmovdqu xmm5,XMMWORD PTR[96+rbp] dec edx jnz $L$oop_avx mov edx,DWORD PTR[280+rsp] lea rdi,QWORD PTR[16+rdi] lea rsi,QWORD PTR[64+rsi] dec edx jnz $L$oop_grande_avx $L$done_avx:: mov rax,QWORD PTR[272+rsp] vzeroupper movaps xmm6,XMMWORD PTR[((-184))+rax] movaps xmm7,XMMWORD PTR[((-168))+rax] movaps xmm8,XMMWORD PTR[((-152))+rax] movaps xmm9,XMMWORD PTR[((-136))+rax] movaps xmm10,XMMWORD PTR[((-120))+rax] movaps xmm11,XMMWORD PTR[((-104))+rax] movaps xmm12,XMMWORD PTR[((-88))+rax] movaps xmm13,XMMWORD PTR[((-72))+rax] movaps xmm14,XMMWORD PTR[((-56))+rax] movaps xmm15,XMMWORD PTR[((-40))+rax] mov rbp,QWORD PTR[((-16))+rax] mov rbx,QWORD PTR[((-8))+rax] lea rsp,QWORD PTR[rax] $L$epilogue_avx:: mov rdi,QWORD PTR[8+rsp] ;WIN64 epilogue mov rsi,QWORD PTR[16+rsp] DB 0F3h,0C3h ;repret $L$SEH_end_sha1_multi_block_avx:: sha1_multi_block_avx ENDP ALIGN 32 sha1_multi_block_avx2 PROC PRIVATE mov QWORD PTR[8+rsp],rdi ;WIN64 prologue mov QWORD PTR[16+rsp],rsi mov rax,rsp $L$SEH_begin_sha1_multi_block_avx2:: mov rdi,rcx mov rsi,rdx mov rdx,r8 _avx2_shortcut:: mov rax,rsp push rbx push rbp push r12 push r13 push r14 push r15 lea rsp,QWORD PTR[((-168))+rsp] movaps XMMWORD PTR[rsp],xmm6 movaps XMMWORD PTR[16+rsp],xmm7 movaps XMMWORD PTR[32+rsp],xmm8 movaps XMMWORD PTR[48+rsp],xmm9 movaps XMMWORD PTR[64+rsp],xmm10 movaps XMMWORD PTR[80+rsp],xmm11 movaps XMMWORD PTR[(-120)+rax],xmm12 movaps XMMWORD PTR[(-104)+rax],xmm13 movaps XMMWORD PTR[(-88)+rax],xmm14 movaps XMMWORD PTR[(-72)+rax],xmm15 sub rsp,576 and rsp,-256 mov QWORD PTR[544+rsp],rax $L$body_avx2:: lea rbp,QWORD PTR[K_XX_XX] shr edx,1 vzeroupper $L$oop_grande_avx2:: mov DWORD PTR[552+rsp],edx xor edx,edx lea rbx,QWORD PTR[512+rsp] mov r12,QWORD PTR[rsi] mov ecx,DWORD PTR[8+rsi] cmp ecx,edx cmovg edx,ecx test ecx,ecx mov DWORD PTR[rbx],ecx cmovle r12,rbp mov r13,QWORD PTR[16+rsi] mov ecx,DWORD PTR[24+rsi] cmp ecx,edx cmovg edx,ecx test ecx,ecx mov DWORD PTR[4+rbx],ecx cmovle r13,rbp mov r14,QWORD PTR[32+rsi] mov ecx,DWORD PTR[40+rsi] cmp ecx,edx cmovg edx,ecx test ecx,ecx mov DWORD PTR[8+rbx],ecx cmovle r14,rbp mov r15,QWORD PTR[48+rsi] mov ecx,DWORD PTR[56+rsi] cmp ecx,edx cmovg edx,ecx test ecx,ecx mov DWORD PTR[12+rbx],ecx cmovle r15,rbp mov r8,QWORD PTR[64+rsi] mov ecx,DWORD PTR[72+rsi] cmp ecx,edx cmovg edx,ecx test ecx,ecx mov DWORD PTR[16+rbx],ecx cmovle r8,rbp mov r9,QWORD PTR[80+rsi] mov ecx,DWORD PTR[88+rsi] cmp ecx,edx cmovg edx,ecx test ecx,ecx mov DWORD PTR[20+rbx],ecx cmovle r9,rbp mov r10,QWORD PTR[96+rsi] mov ecx,DWORD PTR[104+rsi] cmp ecx,edx cmovg edx,ecx test ecx,ecx mov DWORD PTR[24+rbx],ecx cmovle r10,rbp mov r11,QWORD PTR[112+rsi] mov ecx,DWORD PTR[120+rsi] cmp ecx,edx cmovg edx,ecx test ecx,ecx mov DWORD PTR[28+rbx],ecx cmovle r11,rbp vmovdqu ymm0,YMMWORD PTR[rdi] lea rax,QWORD PTR[128+rsp] vmovdqu ymm1,YMMWORD PTR[32+rdi] lea rbx,QWORD PTR[((256+128))+rsp] vmovdqu ymm2,YMMWORD PTR[64+rdi] vmovdqu ymm3,YMMWORD PTR[96+rdi] vmovdqu ymm4,YMMWORD PTR[128+rdi] vmovdqu ymm9,YMMWORD PTR[96+rbp] jmp $L$oop_avx2 ALIGN 32 $L$oop_avx2:: vmovdqa ymm15,YMMWORD PTR[((-32))+rbp] vmovd xmm10,DWORD PTR[r12] lea r12,QWORD PTR[64+r12] vmovd xmm12,DWORD PTR[r8] lea r8,QWORD PTR[64+r8] vmovd xmm7,DWORD PTR[r13] lea r13,QWORD PTR[64+r13] vmovd xmm6,DWORD PTR[r9] lea r9,QWORD PTR[64+r9] vpinsrd xmm10,xmm10,DWORD PTR[r14],1 lea r14,QWORD PTR[64+r14] vpinsrd xmm12,xmm12,DWORD PTR[r10],1 lea r10,QWORD PTR[64+r10] vpinsrd xmm7,xmm7,DWORD PTR[r15],1 lea r15,QWORD PTR[64+r15] vpunpckldq ymm10,ymm10,ymm7 vpinsrd xmm6,xmm6,DWORD PTR[r11],1 lea r11,QWORD PTR[64+r11] vpunpckldq ymm12,ymm12,ymm6 vmovd xmm11,DWORD PTR[((-60))+r12] vinserti128 ymm10,ymm10,xmm12,1 vmovd xmm8,DWORD PTR[((-60))+r8] vpshufb ymm10,ymm10,ymm9 vmovd xmm7,DWORD PTR[((-60))+r13] vmovd xmm6,DWORD PTR[((-60))+r9] vpinsrd xmm11,xmm11,DWORD PTR[((-60))+r14],1 vpinsrd xmm8,xmm8,DWORD PTR[((-60))+r10],1 vpinsrd xmm7,xmm7,DWORD PTR[((-60))+r15],1 vpunpckldq ymm11,ymm11,ymm7 vpinsrd xmm6,xmm6,DWORD PTR[((-60))+r11],1 vpunpckldq ymm8,ymm8,ymm6 vpaddd ymm4,ymm4,ymm15 vpslld ymm7,ymm0,5 vpandn ymm6,ymm1,ymm3 vpand ymm5,ymm1,ymm2 vmovdqa YMMWORD PTR[(0-128)+rax],ymm10 vpaddd ymm4,ymm4,ymm10 vinserti128 ymm11,ymm11,xmm8,1 vpsrld ymm8,ymm0,27 vpxor ymm5,ymm5,ymm6 vmovd xmm12,DWORD PTR[((-56))+r12] vpslld ymm6,ymm1,30 vpor ymm7,ymm7,ymm8 vmovd xmm8,DWORD PTR[((-56))+r8] vpaddd ymm4,ymm4,ymm5 vpsrld ymm1,ymm1,2 vpaddd ymm4,ymm4,ymm7 vpshufb ymm11,ymm11,ymm9 vpor ymm1,ymm1,ymm6 vmovd xmm7,DWORD PTR[((-56))+r13] vmovd xmm6,DWORD PTR[((-56))+r9] vpinsrd xmm12,xmm12,DWORD PTR[((-56))+r14],1 vpinsrd xmm8,xmm8,DWORD PTR[((-56))+r10],1 vpinsrd xmm7,xmm7,DWORD PTR[((-56))+r15],1 vpunpckldq ymm12,ymm12,ymm7 vpinsrd xmm6,xmm6,DWORD PTR[((-56))+r11],1 vpunpckldq ymm8,ymm8,ymm6 vpaddd ymm3,ymm3,ymm15 vpslld ymm7,ymm4,5 vpandn ymm6,ymm0,ymm2 vpand ymm5,ymm0,ymm1 vmovdqa YMMWORD PTR[(32-128)+rax],ymm11 vpaddd ymm3,ymm3,ymm11 vinserti128 ymm12,ymm12,xmm8,1 vpsrld ymm8,ymm4,27 vpxor ymm5,ymm5,ymm6 vmovd xmm13,DWORD PTR[((-52))+r12] vpslld ymm6,ymm0,30 vpor ymm7,ymm7,ymm8 vmovd xmm8,DWORD PTR[((-52))+r8] vpaddd ymm3,ymm3,ymm5 vpsrld ymm0,ymm0,2 vpaddd ymm3,ymm3,ymm7 vpshufb ymm12,ymm12,ymm9 vpor ymm0,ymm0,ymm6 vmovd xmm7,DWORD PTR[((-52))+r13] vmovd xmm6,DWORD PTR[((-52))+r9] vpinsrd xmm13,xmm13,DWORD PTR[((-52))+r14],1 vpinsrd xmm8,xmm8,DWORD PTR[((-52))+r10],1 vpinsrd xmm7,xmm7,DWORD PTR[((-52))+r15],1 vpunpckldq ymm13,ymm13,ymm7 vpinsrd xmm6,xmm6,DWORD PTR[((-52))+r11],1 vpunpckldq ymm8,ymm8,ymm6 vpaddd ymm2,ymm2,ymm15 vpslld ymm7,ymm3,5 vpandn ymm6,ymm4,ymm1 vpand ymm5,ymm4,ymm0 vmovdqa YMMWORD PTR[(64-128)+rax],ymm12 vpaddd ymm2,ymm2,ymm12 vinserti128 ymm13,ymm13,xmm8,1 vpsrld ymm8,ymm3,27 vpxor ymm5,ymm5,ymm6 vmovd xmm14,DWORD PTR[((-48))+r12] vpslld ymm6,ymm4,30 vpor ymm7,ymm7,ymm8 vmovd xmm8,DWORD PTR[((-48))+r8] vpaddd ymm2,ymm2,ymm5 vpsrld ymm4,ymm4,2 vpaddd ymm2,ymm2,ymm7 vpshufb ymm13,ymm13,ymm9 vpor ymm4,ymm4,ymm6 vmovd xmm7,DWORD PTR[((-48))+r13] vmovd xmm6,DWORD PTR[((-48))+r9] vpinsrd xmm14,xmm14,DWORD PTR[((-48))+r14],1 vpinsrd xmm8,xmm8,DWORD PTR[((-48))+r10],1 vpinsrd xmm7,xmm7,DWORD PTR[((-48))+r15],1 vpunpckldq ymm14,ymm14,ymm7 vpinsrd xmm6,xmm6,DWORD PTR[((-48))+r11],1 vpunpckldq ymm8,ymm8,ymm6 vpaddd ymm1,ymm1,ymm15 vpslld ymm7,ymm2,5 vpandn ymm6,ymm3,ymm0 vpand ymm5,ymm3,ymm4 vmovdqa YMMWORD PTR[(96-128)+rax],ymm13 vpaddd ymm1,ymm1,ymm13 vinserti128 ymm14,ymm14,xmm8,1 vpsrld ymm8,ymm2,27 vpxor ymm5,ymm5,ymm6 vmovd xmm10,DWORD PTR[((-44))+r12] vpslld ymm6,ymm3,30 vpor ymm7,ymm7,ymm8 vmovd xmm8,DWORD PTR[((-44))+r8] vpaddd ymm1,ymm1,ymm5 vpsrld ymm3,ymm3,2 vpaddd ymm1,ymm1,ymm7 vpshufb ymm14,ymm14,ymm9 vpor ymm3,ymm3,ymm6 vmovd xmm7,DWORD PTR[((-44))+r13] vmovd xmm6,DWORD PTR[((-44))+r9] vpinsrd xmm10,xmm10,DWORD PTR[((-44))+r14],1 vpinsrd xmm8,xmm8,DWORD PTR[((-44))+r10],1 vpinsrd xmm7,xmm7,DWORD PTR[((-44))+r15],1 vpunpckldq ymm10,ymm10,ymm7 vpinsrd xmm6,xmm6,DWORD PTR[((-44))+r11],1 vpunpckldq ymm8,ymm8,ymm6 vpaddd ymm0,ymm0,ymm15 vpslld ymm7,ymm1,5 vpandn ymm6,ymm2,ymm4 vpand ymm5,ymm2,ymm3 vmovdqa YMMWORD PTR[(128-128)+rax],ymm14 vpaddd ymm0,ymm0,ymm14 vinserti128 ymm10,ymm10,xmm8,1 vpsrld ymm8,ymm1,27 vpxor ymm5,ymm5,ymm6 vmovd xmm11,DWORD PTR[((-40))+r12] vpslld ymm6,ymm2,30 vpor ymm7,ymm7,ymm8 vmovd xmm8,DWORD PTR[((-40))+r8] vpaddd ymm0,ymm0,ymm5 vpsrld ymm2,ymm2,2 vpaddd ymm0,ymm0,ymm7 vpshufb ymm10,ymm10,ymm9 vpor ymm2,ymm2,ymm6 vmovd xmm7,DWORD PTR[((-40))+r13] vmovd xmm6,DWORD PTR[((-40))+r9] vpinsrd xmm11,xmm11,DWORD PTR[((-40))+r14],1 vpinsrd xmm8,xmm8,DWORD PTR[((-40))+r10],1 vpinsrd xmm7,xmm7,DWORD PTR[((-40))+r15],1 vpunpckldq ymm11,ymm11,ymm7 vpinsrd xmm6,xmm6,DWORD PTR[((-40))+r11],1 vpunpckldq ymm8,ymm8,ymm6 vpaddd ymm4,ymm4,ymm15 vpslld ymm7,ymm0,5 vpandn ymm6,ymm1,ymm3 vpand ymm5,ymm1,ymm2 vmovdqa YMMWORD PTR[(160-128)+rax],ymm10 vpaddd ymm4,ymm4,ymm10 vinserti128 ymm11,ymm11,xmm8,1 vpsrld ymm8,ymm0,27 vpxor ymm5,ymm5,ymm6 vmovd xmm12,DWORD PTR[((-36))+r12] vpslld ymm6,ymm1,30 vpor ymm7,ymm7,ymm8 vmovd xmm8,DWORD PTR[((-36))+r8] vpaddd ymm4,ymm4,ymm5 vpsrld ymm1,ymm1,2 vpaddd ymm4,ymm4,ymm7 vpshufb ymm11,ymm11,ymm9 vpor ymm1,ymm1,ymm6 vmovd xmm7,DWORD PTR[((-36))+r13] vmovd xmm6,DWORD PTR[((-36))+r9] vpinsrd xmm12,xmm12,DWORD PTR[((-36))+r14],1 vpinsrd xmm8,xmm8,DWORD PTR[((-36))+r10],1 vpinsrd xmm7,xmm7,DWORD PTR[((-36))+r15],1 vpunpckldq ymm12,ymm12,ymm7 vpinsrd xmm6,xmm6,DWORD PTR[((-36))+r11],1 vpunpckldq ymm8,ymm8,ymm6 vpaddd ymm3,ymm3,ymm15 vpslld ymm7,ymm4,5 vpandn ymm6,ymm0,ymm2 vpand ymm5,ymm0,ymm1 vmovdqa YMMWORD PTR[(192-128)+rax],ymm11 vpaddd ymm3,ymm3,ymm11 vinserti128 ymm12,ymm12,xmm8,1 vpsrld ymm8,ymm4,27 vpxor ymm5,ymm5,ymm6 vmovd xmm13,DWORD PTR[((-32))+r12] vpslld ymm6,ymm0,30 vpor ymm7,ymm7,ymm8 vmovd xmm8,DWORD PTR[((-32))+r8] vpaddd ymm3,ymm3,ymm5 vpsrld ymm0,ymm0,2 vpaddd ymm3,ymm3,ymm7 vpshufb ymm12,ymm12,ymm9 vpor ymm0,ymm0,ymm6 vmovd xmm7,DWORD PTR[((-32))+r13] vmovd xmm6,DWORD PTR[((-32))+r9] vpinsrd xmm13,xmm13,DWORD PTR[((-32))+r14],1 vpinsrd xmm8,xmm8,DWORD PTR[((-32))+r10],1 vpinsrd xmm7,xmm7,DWORD PTR[((-32))+r15],1 vpunpckldq ymm13,ymm13,ymm7 vpinsrd xmm6,xmm6,DWORD PTR[((-32))+r11],1 vpunpckldq ymm8,ymm8,ymm6 vpaddd ymm2,ymm2,ymm15 vpslld ymm7,ymm3,5 vpandn ymm6,ymm4,ymm1 vpand ymm5,ymm4,ymm0 vmovdqa YMMWORD PTR[(224-128)+rax],ymm12 vpaddd ymm2,ymm2,ymm12 vinserti128 ymm13,ymm13,xmm8,1 vpsrld ymm8,ymm3,27 vpxor ymm5,ymm5,ymm6 vmovd xmm14,DWORD PTR[((-28))+r12] vpslld ymm6,ymm4,30 vpor ymm7,ymm7,ymm8 vmovd xmm8,DWORD PTR[((-28))+r8] vpaddd ymm2,ymm2,ymm5 vpsrld ymm4,ymm4,2 vpaddd ymm2,ymm2,ymm7 vpshufb ymm13,ymm13,ymm9 vpor ymm4,ymm4,ymm6 vmovd xmm7,DWORD PTR[((-28))+r13] vmovd xmm6,DWORD PTR[((-28))+r9] vpinsrd xmm14,xmm14,DWORD PTR[((-28))+r14],1 vpinsrd xmm8,xmm8,DWORD PTR[((-28))+r10],1 vpinsrd xmm7,xmm7,DWORD PTR[((-28))+r15],1 vpunpckldq ymm14,ymm14,ymm7 vpinsrd xmm6,xmm6,DWORD PTR[((-28))+r11],1 vpunpckldq ymm8,ymm8,ymm6 vpaddd ymm1,ymm1,ymm15 vpslld ymm7,ymm2,5 vpandn ymm6,ymm3,ymm0 vpand ymm5,ymm3,ymm4 vmovdqa YMMWORD PTR[(256-256-128)+rbx],ymm13 vpaddd ymm1,ymm1,ymm13 vinserti128 ymm14,ymm14,xmm8,1 vpsrld ymm8,ymm2,27 vpxor ymm5,ymm5,ymm6 vmovd xmm10,DWORD PTR[((-24))+r12] vpslld ymm6,ymm3,30 vpor ymm7,ymm7,ymm8 vmovd xmm8,DWORD PTR[((-24))+r8] vpaddd ymm1,ymm1,ymm5 vpsrld ymm3,ymm3,2 vpaddd ymm1,ymm1,ymm7 vpshufb ymm14,ymm14,ymm9 vpor ymm3,ymm3,ymm6 vmovd xmm7,DWORD PTR[((-24))+r13] vmovd xmm6,DWORD PTR[((-24))+r9] vpinsrd xmm10,xmm10,DWORD PTR[((-24))+r14],1 vpinsrd xmm8,xmm8,DWORD PTR[((-24))+r10],1 vpinsrd xmm7,xmm7,DWORD PTR[((-24))+r15],1 vpunpckldq ymm10,ymm10,ymm7 vpinsrd xmm6,xmm6,DWORD PTR[((-24))+r11],1 vpunpckldq ymm8,ymm8,ymm6 vpaddd ymm0,ymm0,ymm15 vpslld ymm7,ymm1,5 vpandn ymm6,ymm2,ymm4 vpand ymm5,ymm2,ymm3 vmovdqa YMMWORD PTR[(288-256-128)+rbx],ymm14 vpaddd ymm0,ymm0,ymm14 vinserti128 ymm10,ymm10,xmm8,1 vpsrld ymm8,ymm1,27 vpxor ymm5,ymm5,ymm6 vmovd xmm11,DWORD PTR[((-20))+r12] vpslld ymm6,ymm2,30 vpor ymm7,ymm7,ymm8 vmovd xmm8,DWORD PTR[((-20))+r8] vpaddd ymm0,ymm0,ymm5 vpsrld ymm2,ymm2,2 vpaddd ymm0,ymm0,ymm7 vpshufb ymm10,ymm10,ymm9 vpor ymm2,ymm2,ymm6 vmovd xmm7,DWORD PTR[((-20))+r13] vmovd xmm6,DWORD PTR[((-20))+r9] vpinsrd xmm11,xmm11,DWORD PTR[((-20))+r14],1 vpinsrd xmm8,xmm8,DWORD PTR[((-20))+r10],1 vpinsrd xmm7,xmm7,DWORD PTR[((-20))+r15],1 vpunpckldq ymm11,ymm11,ymm7 vpinsrd xmm6,xmm6,DWORD PTR[((-20))+r11],1 vpunpckldq ymm8,ymm8,ymm6 vpaddd ymm4,ymm4,ymm15 vpslld ymm7,ymm0,5 vpandn ymm6,ymm1,ymm3 vpand ymm5,ymm1,ymm2 vmovdqa YMMWORD PTR[(320-256-128)+rbx],ymm10 vpaddd ymm4,ymm4,ymm10 vinserti128 ymm11,ymm11,xmm8,1 vpsrld ymm8,ymm0,27 vpxor ymm5,ymm5,ymm6 vmovd xmm12,DWORD PTR[((-16))+r12] vpslld ymm6,ymm1,30 vpor ymm7,ymm7,ymm8 vmovd xmm8,DWORD PTR[((-16))+r8] vpaddd ymm4,ymm4,ymm5 vpsrld ymm1,ymm1,2 vpaddd ymm4,ymm4,ymm7 vpshufb ymm11,ymm11,ymm9 vpor ymm1,ymm1,ymm6 vmovd xmm7,DWORD PTR[((-16))+r13] vmovd xmm6,DWORD PTR[((-16))+r9] vpinsrd xmm12,xmm12,DWORD PTR[((-16))+r14],1 vpinsrd xmm8,xmm8,DWORD PTR[((-16))+r10],1 vpinsrd xmm7,xmm7,DWORD PTR[((-16))+r15],1 vpunpckldq ymm12,ymm12,ymm7 vpinsrd xmm6,xmm6,DWORD PTR[((-16))+r11],1 vpunpckldq ymm8,ymm8,ymm6 vpaddd ymm3,ymm3,ymm15 vpslld ymm7,ymm4,5 vpandn ymm6,ymm0,ymm2 vpand ymm5,ymm0,ymm1 vmovdqa YMMWORD PTR[(352-256-128)+rbx],ymm11 vpaddd ymm3,ymm3,ymm11 vinserti128 ymm12,ymm12,xmm8,1 vpsrld ymm8,ymm4,27 vpxor ymm5,ymm5,ymm6 vmovd xmm13,DWORD PTR[((-12))+r12] vpslld ymm6,ymm0,30 vpor ymm7,ymm7,ymm8 vmovd xmm8,DWORD PTR[((-12))+r8] vpaddd ymm3,ymm3,ymm5 vpsrld ymm0,ymm0,2 vpaddd ymm3,ymm3,ymm7 vpshufb ymm12,ymm12,ymm9 vpor ymm0,ymm0,ymm6 vmovd xmm7,DWORD PTR[((-12))+r13] vmovd xmm6,DWORD PTR[((-12))+r9] vpinsrd xmm13,xmm13,DWORD PTR[((-12))+r14],1 vpinsrd xmm8,xmm8,DWORD PTR[((-12))+r10],1 vpinsrd xmm7,xmm7,DWORD PTR[((-12))+r15],1 vpunpckldq ymm13,ymm13,ymm7 vpinsrd xmm6,xmm6,DWORD PTR[((-12))+r11],1 vpunpckldq ymm8,ymm8,ymm6 vpaddd ymm2,ymm2,ymm15 vpslld ymm7,ymm3,5 vpandn ymm6,ymm4,ymm1 vpand ymm5,ymm4,ymm0 vmovdqa YMMWORD PTR[(384-256-128)+rbx],ymm12 vpaddd ymm2,ymm2,ymm12 vinserti128 ymm13,ymm13,xmm8,1 vpsrld ymm8,ymm3,27 vpxor ymm5,ymm5,ymm6 vmovd xmm14,DWORD PTR[((-8))+r12] vpslld ymm6,ymm4,30 vpor ymm7,ymm7,ymm8 vmovd xmm8,DWORD PTR[((-8))+r8] vpaddd ymm2,ymm2,ymm5 vpsrld ymm4,ymm4,2 vpaddd ymm2,ymm2,ymm7 vpshufb ymm13,ymm13,ymm9 vpor ymm4,ymm4,ymm6 vmovd xmm7,DWORD PTR[((-8))+r13] vmovd xmm6,DWORD PTR[((-8))+r9] vpinsrd xmm14,xmm14,DWORD PTR[((-8))+r14],1 vpinsrd xmm8,xmm8,DWORD PTR[((-8))+r10],1 vpinsrd xmm7,xmm7,DWORD PTR[((-8))+r15],1 vpunpckldq ymm14,ymm14,ymm7 vpinsrd xmm6,xmm6,DWORD PTR[((-8))+r11],1 vpunpckldq ymm8,ymm8,ymm6 vpaddd ymm1,ymm1,ymm15 vpslld ymm7,ymm2,5 vpandn ymm6,ymm3,ymm0 vpand ymm5,ymm3,ymm4 vmovdqa YMMWORD PTR[(416-256-128)+rbx],ymm13 vpaddd ymm1,ymm1,ymm13 vinserti128 ymm14,ymm14,xmm8,1 vpsrld ymm8,ymm2,27 vpxor ymm5,ymm5,ymm6 vmovd xmm10,DWORD PTR[((-4))+r12] vpslld ymm6,ymm3,30 vpor ymm7,ymm7,ymm8 vmovd xmm8,DWORD PTR[((-4))+r8] vpaddd ymm1,ymm1,ymm5 vpsrld ymm3,ymm3,2 vpaddd ymm1,ymm1,ymm7 vpshufb ymm14,ymm14,ymm9 vpor ymm3,ymm3,ymm6 vmovdqa ymm11,YMMWORD PTR[((0-128))+rax] vmovd xmm7,DWORD PTR[((-4))+r13] vmovd xmm6,DWORD PTR[((-4))+r9] vpinsrd xmm10,xmm10,DWORD PTR[((-4))+r14],1 vpinsrd xmm8,xmm8,DWORD PTR[((-4))+r10],1 vpinsrd xmm7,xmm7,DWORD PTR[((-4))+r15],1 vpunpckldq ymm10,ymm10,ymm7 vpinsrd xmm6,xmm6,DWORD PTR[((-4))+r11],1 vpunpckldq ymm8,ymm8,ymm6 vpaddd ymm0,ymm0,ymm15 prefetcht0 [63+r12] vpslld ymm7,ymm1,5 vpandn ymm6,ymm2,ymm4 vpand ymm5,ymm2,ymm3 vmovdqa YMMWORD PTR[(448-256-128)+rbx],ymm14 vpaddd ymm0,ymm0,ymm14 vinserti128 ymm10,ymm10,xmm8,1 vpsrld ymm8,ymm1,27 prefetcht0 [63+r13] vpxor ymm5,ymm5,ymm6 vpslld ymm6,ymm2,30 vpor ymm7,ymm7,ymm8 prefetcht0 [63+r14] vpaddd ymm0,ymm0,ymm5 vpsrld ymm2,ymm2,2 vpaddd ymm0,ymm0,ymm7 prefetcht0 [63+r15] vpshufb ymm10,ymm10,ymm9 vpor ymm2,ymm2,ymm6 vmovdqa ymm12,YMMWORD PTR[((32-128))+rax] vpxor ymm11,ymm11,ymm13 vmovdqa ymm13,YMMWORD PTR[((64-128))+rax] vpaddd ymm4,ymm4,ymm15 vpslld ymm7,ymm0,5 vpandn ymm6,ymm1,ymm3 prefetcht0 [63+r8] vpand ymm5,ymm1,ymm2 vmovdqa YMMWORD PTR[(480-256-128)+rbx],ymm10 vpaddd ymm4,ymm4,ymm10 vpxor ymm11,ymm11,YMMWORD PTR[((256-256-128))+rbx] vpsrld ymm8,ymm0,27 vpxor ymm5,ymm5,ymm6 vpxor ymm11,ymm11,ymm13 prefetcht0 [63+r9] vpslld ymm6,ymm1,30 vpor ymm7,ymm7,ymm8 vpaddd ymm4,ymm4,ymm5 prefetcht0 [63+r10] vpsrld ymm9,ymm11,31 vpaddd ymm11,ymm11,ymm11 vpsrld ymm1,ymm1,2 prefetcht0 [63+r11] vpaddd ymm4,ymm4,ymm7 vpor ymm11,ymm11,ymm9 vpor ymm1,ymm1,ymm6 vpxor ymm12,ymm12,ymm14 vmovdqa ymm14,YMMWORD PTR[((96-128))+rax] vpaddd ymm3,ymm3,ymm15 vpslld ymm7,ymm4,5 vpandn ymm6,ymm0,ymm2 vpand ymm5,ymm0,ymm1 vmovdqa YMMWORD PTR[(0-128)+rax],ymm11 vpaddd ymm3,ymm3,ymm11 vpxor ymm12,ymm12,YMMWORD PTR[((288-256-128))+rbx] vpsrld ymm8,ymm4,27 vpxor ymm5,ymm5,ymm6 vpxor ymm12,ymm12,ymm14 vpslld ymm6,ymm0,30 vpor ymm7,ymm7,ymm8 vpaddd ymm3,ymm3,ymm5 vpsrld ymm9,ymm12,31 vpaddd ymm12,ymm12,ymm12 vpsrld ymm0,ymm0,2 vpaddd ymm3,ymm3,ymm7 vpor ymm12,ymm12,ymm9 vpor ymm0,ymm0,ymm6 vpxor ymm13,ymm13,ymm10 vmovdqa ymm10,YMMWORD PTR[((128-128))+rax] vpaddd ymm2,ymm2,ymm15 vpslld ymm7,ymm3,5 vpandn ymm6,ymm4,ymm1 vpand ymm5,ymm4,ymm0 vmovdqa YMMWORD PTR[(32-128)+rax],ymm12 vpaddd ymm2,ymm2,ymm12 vpxor ymm13,ymm13,YMMWORD PTR[((320-256-128))+rbx] vpsrld ymm8,ymm3,27 vpxor ymm5,ymm5,ymm6 vpxor ymm13,ymm13,ymm10 vpslld ymm6,ymm4,30 vpor ymm7,ymm7,ymm8 vpaddd ymm2,ymm2,ymm5 vpsrld ymm9,ymm13,31 vpaddd ymm13,ymm13,ymm13 vpsrld ymm4,ymm4,2 vpaddd ymm2,ymm2,ymm7 vpor ymm13,ymm13,ymm9 vpor ymm4,ymm4,ymm6 vpxor ymm14,ymm14,ymm11 vmovdqa ymm11,YMMWORD PTR[((160-128))+rax] vpaddd ymm1,ymm1,ymm15 vpslld ymm7,ymm2,5 vpandn ymm6,ymm3,ymm0 vpand ymm5,ymm3,ymm4 vmovdqa YMMWORD PTR[(64-128)+rax],ymm13 vpaddd ymm1,ymm1,ymm13 vpxor ymm14,ymm14,YMMWORD PTR[((352-256-128))+rbx] vpsrld ymm8,ymm2,27 vpxor ymm5,ymm5,ymm6 vpxor ymm14,ymm14,ymm11 vpslld ymm6,ymm3,30 vpor ymm7,ymm7,ymm8 vpaddd ymm1,ymm1,ymm5 vpsrld ymm9,ymm14,31 vpaddd ymm14,ymm14,ymm14 vpsrld ymm3,ymm3,2 vpaddd ymm1,ymm1,ymm7 vpor ymm14,ymm14,ymm9 vpor ymm3,ymm3,ymm6 vpxor ymm10,ymm10,ymm12 vmovdqa ymm12,YMMWORD PTR[((192-128))+rax] vpaddd ymm0,ymm0,ymm15 vpslld ymm7,ymm1,5 vpandn ymm6,ymm2,ymm4 vpand ymm5,ymm2,ymm3 vmovdqa YMMWORD PTR[(96-128)+rax],ymm14 vpaddd ymm0,ymm0,ymm14 vpxor ymm10,ymm10,YMMWORD PTR[((384-256-128))+rbx] vpsrld ymm8,ymm1,27 vpxor ymm5,ymm5,ymm6 vpxor ymm10,ymm10,ymm12 vpslld ymm6,ymm2,30 vpor ymm7,ymm7,ymm8 vpaddd ymm0,ymm0,ymm5 vpsrld ymm9,ymm10,31 vpaddd ymm10,ymm10,ymm10 vpsrld ymm2,ymm2,2 vpaddd ymm0,ymm0,ymm7 vpor ymm10,ymm10,ymm9 vpor ymm2,ymm2,ymm6 vmovdqa ymm15,YMMWORD PTR[rbp] vpxor ymm11,ymm11,ymm13 vmovdqa ymm13,YMMWORD PTR[((224-128))+rax] vpslld ymm7,ymm0,5 vpaddd ymm4,ymm4,ymm15 vpxor ymm5,ymm3,ymm1 vmovdqa YMMWORD PTR[(128-128)+rax],ymm10 vpaddd ymm4,ymm4,ymm10 vpxor ymm11,ymm11,YMMWORD PTR[((416-256-128))+rbx] vpsrld ymm8,ymm0,27 vpxor ymm5,ymm5,ymm2 vpxor ymm11,ymm11,ymm13 vpslld ymm6,ymm1,30 vpor ymm7,ymm7,ymm8 vpaddd ymm4,ymm4,ymm5 vpsrld ymm9,ymm11,31 vpaddd ymm11,ymm11,ymm11 vpsrld ymm1,ymm1,2 vpaddd ymm4,ymm4,ymm7 vpor ymm11,ymm11,ymm9 vpor ymm1,ymm1,ymm6 vpxor ymm12,ymm12,ymm14 vmovdqa ymm14,YMMWORD PTR[((256-256-128))+rbx] vpslld ymm7,ymm4,5 vpaddd ymm3,ymm3,ymm15 vpxor ymm5,ymm2,ymm0 vmovdqa YMMWORD PTR[(160-128)+rax],ymm11 vpaddd ymm3,ymm3,ymm11 vpxor ymm12,ymm12,YMMWORD PTR[((448-256-128))+rbx] vpsrld ymm8,ymm4,27 vpxor ymm5,ymm5,ymm1 vpxor ymm12,ymm12,ymm14 vpslld ymm6,ymm0,30 vpor ymm7,ymm7,ymm8 vpaddd ymm3,ymm3,ymm5 vpsrld ymm9,ymm12,31 vpaddd ymm12,ymm12,ymm12 vpsrld ymm0,ymm0,2 vpaddd ymm3,ymm3,ymm7 vpor ymm12,ymm12,ymm9 vpor ymm0,ymm0,ymm6 vpxor ymm13,ymm13,ymm10 vmovdqa ymm10,YMMWORD PTR[((288-256-128))+rbx] vpslld ymm7,ymm3,5 vpaddd ymm2,ymm2,ymm15 vpxor ymm5,ymm1,ymm4 vmovdqa YMMWORD PTR[(192-128)+rax],ymm12 vpaddd ymm2,ymm2,ymm12 vpxor ymm13,ymm13,YMMWORD PTR[((480-256-128))+rbx] vpsrld ymm8,ymm3,27 vpxor ymm5,ymm5,ymm0 vpxor ymm13,ymm13,ymm10 vpslld ymm6,ymm4,30 vpor ymm7,ymm7,ymm8 vpaddd ymm2,ymm2,ymm5 vpsrld ymm9,ymm13,31 vpaddd ymm13,ymm13,ymm13 vpsrld ymm4,ymm4,2 vpaddd ymm2,ymm2,ymm7 vpor ymm13,ymm13,ymm9 vpor ymm4,ymm4,ymm6 vpxor ymm14,ymm14,ymm11 vmovdqa ymm11,YMMWORD PTR[((320-256-128))+rbx] vpslld ymm7,ymm2,5 vpaddd ymm1,ymm1,ymm15 vpxor ymm5,ymm0,ymm3 vmovdqa YMMWORD PTR[(224-128)+rax],ymm13 vpaddd ymm1,ymm1,ymm13 vpxor ymm14,ymm14,YMMWORD PTR[((0-128))+rax] vpsrld ymm8,ymm2,27 vpxor ymm5,ymm5,ymm4 vpxor ymm14,ymm14,ymm11 vpslld ymm6,ymm3,30 vpor ymm7,ymm7,ymm8 vpaddd ymm1,ymm1,ymm5 vpsrld ymm9,ymm14,31 vpaddd ymm14,ymm14,ymm14 vpsrld ymm3,ymm3,2 vpaddd ymm1,ymm1,ymm7 vpor ymm14,ymm14,ymm9 vpor ymm3,ymm3,ymm6 vpxor ymm10,ymm10,ymm12 vmovdqa ymm12,YMMWORD PTR[((352-256-128))+rbx] vpslld ymm7,ymm1,5 vpaddd ymm0,ymm0,ymm15 vpxor ymm5,ymm4,ymm2 vmovdqa YMMWORD PTR[(256-256-128)+rbx],ymm14 vpaddd ymm0,ymm0,ymm14 vpxor ymm10,ymm10,YMMWORD PTR[((32-128))+rax] vpsrld ymm8,ymm1,27 vpxor ymm5,ymm5,ymm3 vpxor ymm10,ymm10,ymm12 vpslld ymm6,ymm2,30 vpor ymm7,ymm7,ymm8 vpaddd ymm0,ymm0,ymm5 vpsrld ymm9,ymm10,31 vpaddd ymm10,ymm10,ymm10 vpsrld ymm2,ymm2,2 vpaddd ymm0,ymm0,ymm7 vpor ymm10,ymm10,ymm9 vpor ymm2,ymm2,ymm6 vpxor ymm11,ymm11,ymm13 vmovdqa ymm13,YMMWORD PTR[((384-256-128))+rbx] vpslld ymm7,ymm0,5 vpaddd ymm4,ymm4,ymm15 vpxor ymm5,ymm3,ymm1 vmovdqa YMMWORD PTR[(288-256-128)+rbx],ymm10 vpaddd ymm4,ymm4,ymm10 vpxor ymm11,ymm11,YMMWORD PTR[((64-128))+rax] vpsrld ymm8,ymm0,27 vpxor ymm5,ymm5,ymm2 vpxor ymm11,ymm11,ymm13 vpslld ymm6,ymm1,30 vpor ymm7,ymm7,ymm8 vpaddd ymm4,ymm4,ymm5 vpsrld ymm9,ymm11,31 vpaddd ymm11,ymm11,ymm11 vpsrld ymm1,ymm1,2 vpaddd ymm4,ymm4,ymm7 vpor ymm11,ymm11,ymm9 vpor ymm1,ymm1,ymm6 vpxor ymm12,ymm12,ymm14 vmovdqa ymm14,YMMWORD PTR[((416-256-128))+rbx] vpslld ymm7,ymm4,5 vpaddd ymm3,ymm3,ymm15 vpxor ymm5,ymm2,ymm0 vmovdqa YMMWORD PTR[(320-256-128)+rbx],ymm11 vpaddd ymm3,ymm3,ymm11 vpxor ymm12,ymm12,YMMWORD PTR[((96-128))+rax] vpsrld ymm8,ymm4,27 vpxor ymm5,ymm5,ymm1 vpxor ymm12,ymm12,ymm14 vpslld ymm6,ymm0,30 vpor ymm7,ymm7,ymm8 vpaddd ymm3,ymm3,ymm5 vpsrld ymm9,ymm12,31 vpaddd ymm12,ymm12,ymm12 vpsrld ymm0,ymm0,2 vpaddd ymm3,ymm3,ymm7 vpor ymm12,ymm12,ymm9 vpor ymm0,ymm0,ymm6 vpxor ymm13,ymm13,ymm10 vmovdqa ymm10,YMMWORD PTR[((448-256-128))+rbx] vpslld ymm7,ymm3,5 vpaddd ymm2,ymm2,ymm15 vpxor ymm5,ymm1,ymm4 vmovdqa YMMWORD PTR[(352-256-128)+rbx],ymm12 vpaddd ymm2,ymm2,ymm12 vpxor ymm13,ymm13,YMMWORD PTR[((128-128))+rax] vpsrld ymm8,ymm3,27 vpxor ymm5,ymm5,ymm0 vpxor ymm13,ymm13,ymm10 vpslld ymm6,ymm4,30 vpor ymm7,ymm7,ymm8 vpaddd ymm2,ymm2,ymm5 vpsrld ymm9,ymm13,31 vpaddd ymm13,ymm13,ymm13 vpsrld ymm4,ymm4,2 vpaddd ymm2,ymm2,ymm7 vpor ymm13,ymm13,ymm9 vpor ymm4,ymm4,ymm6 vpxor ymm14,ymm14,ymm11 vmovdqa ymm11,YMMWORD PTR[((480-256-128))+rbx] vpslld ymm7,ymm2,5 vpaddd ymm1,ymm1,ymm15 vpxor ymm5,ymm0,ymm3 vmovdqa YMMWORD PTR[(384-256-128)+rbx],ymm13 vpaddd ymm1,ymm1,ymm13 vpxor ymm14,ymm14,YMMWORD PTR[((160-128))+rax] vpsrld ymm8,ymm2,27 vpxor ymm5,ymm5,ymm4 vpxor ymm14,ymm14,ymm11 vpslld ymm6,ymm3,30 vpor ymm7,ymm7,ymm8 vpaddd ymm1,ymm1,ymm5 vpsrld ymm9,ymm14,31 vpaddd ymm14,ymm14,ymm14 vpsrld ymm3,ymm3,2 vpaddd ymm1,ymm1,ymm7 vpor ymm14,ymm14,ymm9 vpor ymm3,ymm3,ymm6 vpxor ymm10,ymm10,ymm12 vmovdqa ymm12,YMMWORD PTR[((0-128))+rax] vpslld ymm7,ymm1,5 vpaddd ymm0,ymm0,ymm15 vpxor ymm5,ymm4,ymm2 vmovdqa YMMWORD PTR[(416-256-128)+rbx],ymm14 vpaddd ymm0,ymm0,ymm14 vpxor ymm10,ymm10,YMMWORD PTR[((192-128))+rax] vpsrld ymm8,ymm1,27 vpxor ymm5,ymm5,ymm3 vpxor ymm10,ymm10,ymm12 vpslld ymm6,ymm2,30 vpor ymm7,ymm7,ymm8 vpaddd ymm0,ymm0,ymm5 vpsrld ymm9,ymm10,31 vpaddd ymm10,ymm10,ymm10 vpsrld ymm2,ymm2,2 vpaddd ymm0,ymm0,ymm7 vpor ymm10,ymm10,ymm9 vpor ymm2,ymm2,ymm6 vpxor ymm11,ymm11,ymm13 vmovdqa ymm13,YMMWORD PTR[((32-128))+rax] vpslld ymm7,ymm0,5 vpaddd ymm4,ymm4,ymm15 vpxor ymm5,ymm3,ymm1 vmovdqa YMMWORD PTR[(448-256-128)+rbx],ymm10 vpaddd ymm4,ymm4,ymm10 vpxor ymm11,ymm11,YMMWORD PTR[((224-128))+rax] vpsrld ymm8,ymm0,27 vpxor ymm5,ymm5,ymm2 vpxor ymm11,ymm11,ymm13 vpslld ymm6,ymm1,30 vpor ymm7,ymm7,ymm8 vpaddd ymm4,ymm4,ymm5 vpsrld ymm9,ymm11,31 vpaddd ymm11,ymm11,ymm11 vpsrld ymm1,ymm1,2 vpaddd ymm4,ymm4,ymm7 vpor ymm11,ymm11,ymm9 vpor ymm1,ymm1,ymm6 vpxor ymm12,ymm12,ymm14 vmovdqa ymm14,YMMWORD PTR[((64-128))+rax] vpslld ymm7,ymm4,5 vpaddd ymm3,ymm3,ymm15 vpxor ymm5,ymm2,ymm0 vmovdqa YMMWORD PTR[(480-256-128)+rbx],ymm11 vpaddd ymm3,ymm3,ymm11 vpxor ymm12,ymm12,YMMWORD PTR[((256-256-128))+rbx] vpsrld ymm8,ymm4,27 vpxor ymm5,ymm5,ymm1 vpxor ymm12,ymm12,ymm14 vpslld ymm6,ymm0,30 vpor ymm7,ymm7,ymm8 vpaddd ymm3,ymm3,ymm5 vpsrld ymm9,ymm12,31 vpaddd ymm12,ymm12,ymm12 vpsrld ymm0,ymm0,2 vpaddd ymm3,ymm3,ymm7 vpor ymm12,ymm12,ymm9 vpor ymm0,ymm0,ymm6 vpxor ymm13,ymm13,ymm10 vmovdqa ymm10,YMMWORD PTR[((96-128))+rax] vpslld ymm7,ymm3,5 vpaddd ymm2,ymm2,ymm15 vpxor ymm5,ymm1,ymm4 vmovdqa YMMWORD PTR[(0-128)+rax],ymm12 vpaddd ymm2,ymm2,ymm12 vpxor ymm13,ymm13,YMMWORD PTR[((288-256-128))+rbx] vpsrld ymm8,ymm3,27 vpxor ymm5,ymm5,ymm0 vpxor ymm13,ymm13,ymm10 vpslld ymm6,ymm4,30 vpor ymm7,ymm7,ymm8 vpaddd ymm2,ymm2,ymm5 vpsrld ymm9,ymm13,31 vpaddd ymm13,ymm13,ymm13 vpsrld ymm4,ymm4,2 vpaddd ymm2,ymm2,ymm7 vpor ymm13,ymm13,ymm9 vpor ymm4,ymm4,ymm6 vpxor ymm14,ymm14,ymm11 vmovdqa ymm11,YMMWORD PTR[((128-128))+rax] vpslld ymm7,ymm2,5 vpaddd ymm1,ymm1,ymm15 vpxor ymm5,ymm0,ymm3 vmovdqa YMMWORD PTR[(32-128)+rax],ymm13 vpaddd ymm1,ymm1,ymm13 vpxor ymm14,ymm14,YMMWORD PTR[((320-256-128))+rbx] vpsrld ymm8,ymm2,27 vpxor ymm5,ymm5,ymm4 vpxor ymm14,ymm14,ymm11 vpslld ymm6,ymm3,30 vpor ymm7,ymm7,ymm8 vpaddd ymm1,ymm1,ymm5 vpsrld ymm9,ymm14,31 vpaddd ymm14,ymm14,ymm14 vpsrld ymm3,ymm3,2 vpaddd ymm1,ymm1,ymm7 vpor ymm14,ymm14,ymm9 vpor ymm3,ymm3,ymm6 vpxor ymm10,ymm10,ymm12 vmovdqa ymm12,YMMWORD PTR[((160-128))+rax] vpslld ymm7,ymm1,5 vpaddd ymm0,ymm0,ymm15 vpxor ymm5,ymm4,ymm2 vmovdqa YMMWORD PTR[(64-128)+rax],ymm14 vpaddd ymm0,ymm0,ymm14 vpxor ymm10,ymm10,YMMWORD PTR[((352-256-128))+rbx] vpsrld ymm8,ymm1,27 vpxor ymm5,ymm5,ymm3 vpxor ymm10,ymm10,ymm12 vpslld ymm6,ymm2,30 vpor ymm7,ymm7,ymm8 vpaddd ymm0,ymm0,ymm5 vpsrld ymm9,ymm10,31 vpaddd ymm10,ymm10,ymm10 vpsrld ymm2,ymm2,2 vpaddd ymm0,ymm0,ymm7 vpor ymm10,ymm10,ymm9 vpor ymm2,ymm2,ymm6 vpxor ymm11,ymm11,ymm13 vmovdqa ymm13,YMMWORD PTR[((192-128))+rax] vpslld ymm7,ymm0,5 vpaddd ymm4,ymm4,ymm15 vpxor ymm5,ymm3,ymm1 vmovdqa YMMWORD PTR[(96-128)+rax],ymm10 vpaddd ymm4,ymm4,ymm10 vpxor ymm11,ymm11,YMMWORD PTR[((384-256-128))+rbx] vpsrld ymm8,ymm0,27 vpxor ymm5,ymm5,ymm2 vpxor ymm11,ymm11,ymm13 vpslld ymm6,ymm1,30 vpor ymm7,ymm7,ymm8 vpaddd ymm4,ymm4,ymm5 vpsrld ymm9,ymm11,31 vpaddd ymm11,ymm11,ymm11 vpsrld ymm1,ymm1,2 vpaddd ymm4,ymm4,ymm7 vpor ymm11,ymm11,ymm9 vpor ymm1,ymm1,ymm6 vpxor ymm12,ymm12,ymm14 vmovdqa ymm14,YMMWORD PTR[((224-128))+rax] vpslld ymm7,ymm4,5 vpaddd ymm3,ymm3,ymm15 vpxor ymm5,ymm2,ymm0 vmovdqa YMMWORD PTR[(128-128)+rax],ymm11 vpaddd ymm3,ymm3,ymm11 vpxor ymm12,ymm12,YMMWORD PTR[((416-256-128))+rbx] vpsrld ymm8,ymm4,27 vpxor ymm5,ymm5,ymm1 vpxor ymm12,ymm12,ymm14 vpslld ymm6,ymm0,30 vpor ymm7,ymm7,ymm8 vpaddd ymm3,ymm3,ymm5 vpsrld ymm9,ymm12,31 vpaddd ymm12,ymm12,ymm12 vpsrld ymm0,ymm0,2 vpaddd ymm3,ymm3,ymm7 vpor ymm12,ymm12,ymm9 vpor ymm0,ymm0,ymm6 vpxor ymm13,ymm13,ymm10 vmovdqa ymm10,YMMWORD PTR[((256-256-128))+rbx] vpslld ymm7,ymm3,5 vpaddd ymm2,ymm2,ymm15 vpxor ymm5,ymm1,ymm4 vmovdqa YMMWORD PTR[(160-128)+rax],ymm12 vpaddd ymm2,ymm2,ymm12 vpxor ymm13,ymm13,YMMWORD PTR[((448-256-128))+rbx] vpsrld ymm8,ymm3,27 vpxor ymm5,ymm5,ymm0 vpxor ymm13,ymm13,ymm10 vpslld ymm6,ymm4,30 vpor ymm7,ymm7,ymm8 vpaddd ymm2,ymm2,ymm5 vpsrld ymm9,ymm13,31 vpaddd ymm13,ymm13,ymm13 vpsrld ymm4,ymm4,2 vpaddd ymm2,ymm2,ymm7 vpor ymm13,ymm13,ymm9 vpor ymm4,ymm4,ymm6 vpxor ymm14,ymm14,ymm11 vmovdqa ymm11,YMMWORD PTR[((288-256-128))+rbx] vpslld ymm7,ymm2,5 vpaddd ymm1,ymm1,ymm15 vpxor ymm5,ymm0,ymm3 vmovdqa YMMWORD PTR[(192-128)+rax],ymm13 vpaddd ymm1,ymm1,ymm13 vpxor ymm14,ymm14,YMMWORD PTR[((480-256-128))+rbx] vpsrld ymm8,ymm2,27 vpxor ymm5,ymm5,ymm4 vpxor ymm14,ymm14,ymm11 vpslld ymm6,ymm3,30 vpor ymm7,ymm7,ymm8 vpaddd ymm1,ymm1,ymm5 vpsrld ymm9,ymm14,31 vpaddd ymm14,ymm14,ymm14 vpsrld ymm3,ymm3,2 vpaddd ymm1,ymm1,ymm7 vpor ymm14,ymm14,ymm9 vpor ymm3,ymm3,ymm6 vpxor ymm10,ymm10,ymm12 vmovdqa ymm12,YMMWORD PTR[((320-256-128))+rbx] vpslld ymm7,ymm1,5 vpaddd ymm0,ymm0,ymm15 vpxor ymm5,ymm4,ymm2 vmovdqa YMMWORD PTR[(224-128)+rax],ymm14 vpaddd ymm0,ymm0,ymm14 vpxor ymm10,ymm10,YMMWORD PTR[((0-128))+rax] vpsrld ymm8,ymm1,27 vpxor ymm5,ymm5,ymm3 vpxor ymm10,ymm10,ymm12 vpslld ymm6,ymm2,30 vpor ymm7,ymm7,ymm8 vpaddd ymm0,ymm0,ymm5 vpsrld ymm9,ymm10,31 vpaddd ymm10,ymm10,ymm10 vpsrld ymm2,ymm2,2 vpaddd ymm0,ymm0,ymm7 vpor ymm10,ymm10,ymm9 vpor ymm2,ymm2,ymm6 vmovdqa ymm15,YMMWORD PTR[32+rbp] vpxor ymm11,ymm11,ymm13 vmovdqa ymm13,YMMWORD PTR[((352-256-128))+rbx] vpaddd ymm4,ymm4,ymm15 vpslld ymm7,ymm0,5 vpand ymm6,ymm3,ymm2 vpxor ymm11,ymm11,YMMWORD PTR[((32-128))+rax] vpaddd ymm4,ymm4,ymm6 vpsrld ymm8,ymm0,27 vpxor ymm5,ymm3,ymm2 vpxor ymm11,ymm11,ymm13 vmovdqu YMMWORD PTR[(256-256-128)+rbx],ymm10 vpaddd ymm4,ymm4,ymm10 vpor ymm7,ymm7,ymm8 vpsrld ymm9,ymm11,31 vpand ymm5,ymm5,ymm1 vpaddd ymm11,ymm11,ymm11 vpslld ymm6,ymm1,30 vpaddd ymm4,ymm4,ymm5 vpsrld ymm1,ymm1,2 vpaddd ymm4,ymm4,ymm7 vpor ymm11,ymm11,ymm9 vpor ymm1,ymm1,ymm6 vpxor ymm12,ymm12,ymm14 vmovdqa ymm14,YMMWORD PTR[((384-256-128))+rbx] vpaddd ymm3,ymm3,ymm15 vpslld ymm7,ymm4,5 vpand ymm6,ymm2,ymm1 vpxor ymm12,ymm12,YMMWORD PTR[((64-128))+rax] vpaddd ymm3,ymm3,ymm6 vpsrld ymm8,ymm4,27 vpxor ymm5,ymm2,ymm1 vpxor ymm12,ymm12,ymm14 vmovdqu YMMWORD PTR[(288-256-128)+rbx],ymm11 vpaddd ymm3,ymm3,ymm11 vpor ymm7,ymm7,ymm8 vpsrld ymm9,ymm12,31 vpand ymm5,ymm5,ymm0 vpaddd ymm12,ymm12,ymm12 vpslld ymm6,ymm0,30 vpaddd ymm3,ymm3,ymm5 vpsrld ymm0,ymm0,2 vpaddd ymm3,ymm3,ymm7 vpor ymm12,ymm12,ymm9 vpor ymm0,ymm0,ymm6 vpxor ymm13,ymm13,ymm10 vmovdqa ymm10,YMMWORD PTR[((416-256-128))+rbx] vpaddd ymm2,ymm2,ymm15 vpslld ymm7,ymm3,5 vpand ymm6,ymm1,ymm0 vpxor ymm13,ymm13,YMMWORD PTR[((96-128))+rax] vpaddd ymm2,ymm2,ymm6 vpsrld ymm8,ymm3,27 vpxor ymm5,ymm1,ymm0 vpxor ymm13,ymm13,ymm10 vmovdqu YMMWORD PTR[(320-256-128)+rbx],ymm12 vpaddd ymm2,ymm2,ymm12 vpor ymm7,ymm7,ymm8 vpsrld ymm9,ymm13,31 vpand ymm5,ymm5,ymm4 vpaddd ymm13,ymm13,ymm13 vpslld ymm6,ymm4,30 vpaddd ymm2,ymm2,ymm5 vpsrld ymm4,ymm4,2 vpaddd ymm2,ymm2,ymm7 vpor ymm13,ymm13,ymm9 vpor ymm4,ymm4,ymm6 vpxor ymm14,ymm14,ymm11 vmovdqa ymm11,YMMWORD PTR[((448-256-128))+rbx] vpaddd ymm1,ymm1,ymm15 vpslld ymm7,ymm2,5 vpand ymm6,ymm0,ymm4 vpxor ymm14,ymm14,YMMWORD PTR[((128-128))+rax] vpaddd ymm1,ymm1,ymm6 vpsrld ymm8,ymm2,27 vpxor ymm5,ymm0,ymm4 vpxor ymm14,ymm14,ymm11 vmovdqu YMMWORD PTR[(352-256-128)+rbx],ymm13 vpaddd ymm1,ymm1,ymm13 vpor ymm7,ymm7,ymm8 vpsrld ymm9,ymm14,31 vpand ymm5,ymm5,ymm3 vpaddd ymm14,ymm14,ymm14 vpslld ymm6,ymm3,30 vpaddd ymm1,ymm1,ymm5 vpsrld ymm3,ymm3,2 vpaddd ymm1,ymm1,ymm7 vpor ymm14,ymm14,ymm9 vpor ymm3,ymm3,ymm6 vpxor ymm10,ymm10,ymm12 vmovdqa ymm12,YMMWORD PTR[((480-256-128))+rbx] vpaddd ymm0,ymm0,ymm15 vpslld ymm7,ymm1,5 vpand ymm6,ymm4,ymm3 vpxor ymm10,ymm10,YMMWORD PTR[((160-128))+rax] vpaddd ymm0,ymm0,ymm6 vpsrld ymm8,ymm1,27 vpxor ymm5,ymm4,ymm3 vpxor ymm10,ymm10,ymm12 vmovdqu YMMWORD PTR[(384-256-128)+rbx],ymm14 vpaddd ymm0,ymm0,ymm14 vpor ymm7,ymm7,ymm8 vpsrld ymm9,ymm10,31 vpand ymm5,ymm5,ymm2 vpaddd ymm10,ymm10,ymm10 vpslld ymm6,ymm2,30 vpaddd ymm0,ymm0,ymm5 vpsrld ymm2,ymm2,2 vpaddd ymm0,ymm0,ymm7 vpor ymm10,ymm10,ymm9 vpor ymm2,ymm2,ymm6 vpxor ymm11,ymm11,ymm13 vmovdqa ymm13,YMMWORD PTR[((0-128))+rax] vpaddd ymm4,ymm4,ymm15 vpslld ymm7,ymm0,5 vpand ymm6,ymm3,ymm2 vpxor ymm11,ymm11,YMMWORD PTR[((192-128))+rax] vpaddd ymm4,ymm4,ymm6 vpsrld ymm8,ymm0,27 vpxor ymm5,ymm3,ymm2 vpxor ymm11,ymm11,ymm13 vmovdqu YMMWORD PTR[(416-256-128)+rbx],ymm10 vpaddd ymm4,ymm4,ymm10 vpor ymm7,ymm7,ymm8 vpsrld ymm9,ymm11,31 vpand ymm5,ymm5,ymm1 vpaddd ymm11,ymm11,ymm11 vpslld ymm6,ymm1,30 vpaddd ymm4,ymm4,ymm5 vpsrld ymm1,ymm1,2 vpaddd ymm4,ymm4,ymm7 vpor ymm11,ymm11,ymm9 vpor ymm1,ymm1,ymm6 vpxor ymm12,ymm12,ymm14 vmovdqa ymm14,YMMWORD PTR[((32-128))+rax] vpaddd ymm3,ymm3,ymm15 vpslld ymm7,ymm4,5 vpand ymm6,ymm2,ymm1 vpxor ymm12,ymm12,YMMWORD PTR[((224-128))+rax] vpaddd ymm3,ymm3,ymm6 vpsrld ymm8,ymm4,27 vpxor ymm5,ymm2,ymm1 vpxor ymm12,ymm12,ymm14 vmovdqu YMMWORD PTR[(448-256-128)+rbx],ymm11 vpaddd ymm3,ymm3,ymm11 vpor ymm7,ymm7,ymm8 vpsrld ymm9,ymm12,31 vpand ymm5,ymm5,ymm0 vpaddd ymm12,ymm12,ymm12 vpslld ymm6,ymm0,30 vpaddd ymm3,ymm3,ymm5 vpsrld ymm0,ymm0,2 vpaddd ymm3,ymm3,ymm7 vpor ymm12,ymm12,ymm9 vpor ymm0,ymm0,ymm6 vpxor ymm13,ymm13,ymm10 vmovdqa ymm10,YMMWORD PTR[((64-128))+rax] vpaddd ymm2,ymm2,ymm15 vpslld ymm7,ymm3,5 vpand ymm6,ymm1,ymm0 vpxor ymm13,ymm13,YMMWORD PTR[((256-256-128))+rbx] vpaddd ymm2,ymm2,ymm6 vpsrld ymm8,ymm3,27 vpxor ymm5,ymm1,ymm0 vpxor ymm13,ymm13,ymm10 vmovdqu YMMWORD PTR[(480-256-128)+rbx],ymm12 vpaddd ymm2,ymm2,ymm12 vpor ymm7,ymm7,ymm8 vpsrld ymm9,ymm13,31 vpand ymm5,ymm5,ymm4 vpaddd ymm13,ymm13,ymm13 vpslld ymm6,ymm4,30 vpaddd ymm2,ymm2,ymm5 vpsrld ymm4,ymm4,2 vpaddd ymm2,ymm2,ymm7 vpor ymm13,ymm13,ymm9 vpor ymm4,ymm4,ymm6 vpxor ymm14,ymm14,ymm11 vmovdqa ymm11,YMMWORD PTR[((96-128))+rax] vpaddd ymm1,ymm1,ymm15 vpslld ymm7,ymm2,5 vpand ymm6,ymm0,ymm4 vpxor ymm14,ymm14,YMMWORD PTR[((288-256-128))+rbx] vpaddd ymm1,ymm1,ymm6 vpsrld ymm8,ymm2,27 vpxor ymm5,ymm0,ymm4 vpxor ymm14,ymm14,ymm11 vmovdqu YMMWORD PTR[(0-128)+rax],ymm13 vpaddd ymm1,ymm1,ymm13 vpor ymm7,ymm7,ymm8 vpsrld ymm9,ymm14,31 vpand ymm5,ymm5,ymm3 vpaddd ymm14,ymm14,ymm14 vpslld ymm6,ymm3,30 vpaddd ymm1,ymm1,ymm5 vpsrld ymm3,ymm3,2 vpaddd ymm1,ymm1,ymm7 vpor ymm14,ymm14,ymm9 vpor ymm3,ymm3,ymm6 vpxor ymm10,ymm10,ymm12 vmovdqa ymm12,YMMWORD PTR[((128-128))+rax] vpaddd ymm0,ymm0,ymm15 vpslld ymm7,ymm1,5 vpand ymm6,ymm4,ymm3 vpxor ymm10,ymm10,YMMWORD PTR[((320-256-128))+rbx] vpaddd ymm0,ymm0,ymm6 vpsrld ymm8,ymm1,27 vpxor ymm5,ymm4,ymm3 vpxor ymm10,ymm10,ymm12 vmovdqu YMMWORD PTR[(32-128)+rax],ymm14 vpaddd ymm0,ymm0,ymm14 vpor ymm7,ymm7,ymm8 vpsrld ymm9,ymm10,31 vpand ymm5,ymm5,ymm2 vpaddd ymm10,ymm10,ymm10 vpslld ymm6,ymm2,30 vpaddd ymm0,ymm0,ymm5 vpsrld ymm2,ymm2,2 vpaddd ymm0,ymm0,ymm7 vpor ymm10,ymm10,ymm9 vpor ymm2,ymm2,ymm6 vpxor ymm11,ymm11,ymm13 vmovdqa ymm13,YMMWORD PTR[((160-128))+rax] vpaddd ymm4,ymm4,ymm15 vpslld ymm7,ymm0,5 vpand ymm6,ymm3,ymm2 vpxor ymm11,ymm11,YMMWORD PTR[((352-256-128))+rbx] vpaddd ymm4,ymm4,ymm6 vpsrld ymm8,ymm0,27 vpxor ymm5,ymm3,ymm2 vpxor ymm11,ymm11,ymm13 vmovdqu YMMWORD PTR[(64-128)+rax],ymm10 vpaddd ymm4,ymm4,ymm10 vpor ymm7,ymm7,ymm8 vpsrld ymm9,ymm11,31 vpand ymm5,ymm5,ymm1 vpaddd ymm11,ymm11,ymm11 vpslld ymm6,ymm1,30 vpaddd ymm4,ymm4,ymm5 vpsrld ymm1,ymm1,2 vpaddd ymm4,ymm4,ymm7 vpor ymm11,ymm11,ymm9 vpor ymm1,ymm1,ymm6 vpxor ymm12,ymm12,ymm14 vmovdqa ymm14,YMMWORD PTR[((192-128))+rax] vpaddd ymm3,ymm3,ymm15 vpslld ymm7,ymm4,5 vpand ymm6,ymm2,ymm1 vpxor ymm12,ymm12,YMMWORD PTR[((384-256-128))+rbx] vpaddd ymm3,ymm3,ymm6 vpsrld ymm8,ymm4,27 vpxor ymm5,ymm2,ymm1 vpxor ymm12,ymm12,ymm14 vmovdqu YMMWORD PTR[(96-128)+rax],ymm11 vpaddd ymm3,ymm3,ymm11 vpor ymm7,ymm7,ymm8 vpsrld ymm9,ymm12,31 vpand ymm5,ymm5,ymm0 vpaddd ymm12,ymm12,ymm12 vpslld ymm6,ymm0,30 vpaddd ymm3,ymm3,ymm5 vpsrld ymm0,ymm0,2 vpaddd ymm3,ymm3,ymm7 vpor ymm12,ymm12,ymm9 vpor ymm0,ymm0,ymm6 vpxor ymm13,ymm13,ymm10 vmovdqa ymm10,YMMWORD PTR[((224-128))+rax] vpaddd ymm2,ymm2,ymm15 vpslld ymm7,ymm3,5 vpand ymm6,ymm1,ymm0 vpxor ymm13,ymm13,YMMWORD PTR[((416-256-128))+rbx] vpaddd ymm2,ymm2,ymm6 vpsrld ymm8,ymm3,27 vpxor ymm5,ymm1,ymm0 vpxor ymm13,ymm13,ymm10 vmovdqu YMMWORD PTR[(128-128)+rax],ymm12 vpaddd ymm2,ymm2,ymm12 vpor ymm7,ymm7,ymm8 vpsrld ymm9,ymm13,31 vpand ymm5,ymm5,ymm4 vpaddd ymm13,ymm13,ymm13 vpslld ymm6,ymm4,30 vpaddd ymm2,ymm2,ymm5 vpsrld ymm4,ymm4,2 vpaddd ymm2,ymm2,ymm7 vpor ymm13,ymm13,ymm9 vpor ymm4,ymm4,ymm6 vpxor ymm14,ymm14,ymm11 vmovdqa ymm11,YMMWORD PTR[((256-256-128))+rbx] vpaddd ymm1,ymm1,ymm15 vpslld ymm7,ymm2,5 vpand ymm6,ymm0,ymm4 vpxor ymm14,ymm14,YMMWORD PTR[((448-256-128))+rbx] vpaddd ymm1,ymm1,ymm6 vpsrld ymm8,ymm2,27 vpxor ymm5,ymm0,ymm4 vpxor ymm14,ymm14,ymm11 vmovdqu YMMWORD PTR[(160-128)+rax],ymm13 vpaddd ymm1,ymm1,ymm13 vpor ymm7,ymm7,ymm8 vpsrld ymm9,ymm14,31 vpand ymm5,ymm5,ymm3 vpaddd ymm14,ymm14,ymm14 vpslld ymm6,ymm3,30 vpaddd ymm1,ymm1,ymm5 vpsrld ymm3,ymm3,2 vpaddd ymm1,ymm1,ymm7 vpor ymm14,ymm14,ymm9 vpor ymm3,ymm3,ymm6 vpxor ymm10,ymm10,ymm12 vmovdqa ymm12,YMMWORD PTR[((288-256-128))+rbx] vpaddd ymm0,ymm0,ymm15 vpslld ymm7,ymm1,5 vpand ymm6,ymm4,ymm3 vpxor ymm10,ymm10,YMMWORD PTR[((480-256-128))+rbx] vpaddd ymm0,ymm0,ymm6 vpsrld ymm8,ymm1,27 vpxor ymm5,ymm4,ymm3 vpxor ymm10,ymm10,ymm12 vmovdqu YMMWORD PTR[(192-128)+rax],ymm14 vpaddd ymm0,ymm0,ymm14 vpor ymm7,ymm7,ymm8 vpsrld ymm9,ymm10,31 vpand ymm5,ymm5,ymm2 vpaddd ymm10,ymm10,ymm10 vpslld ymm6,ymm2,30 vpaddd ymm0,ymm0,ymm5 vpsrld ymm2,ymm2,2 vpaddd ymm0,ymm0,ymm7 vpor ymm10,ymm10,ymm9 vpor ymm2,ymm2,ymm6 vpxor ymm11,ymm11,ymm13 vmovdqa ymm13,YMMWORD PTR[((320-256-128))+rbx] vpaddd ymm4,ymm4,ymm15 vpslld ymm7,ymm0,5 vpand ymm6,ymm3,ymm2 vpxor ymm11,ymm11,YMMWORD PTR[((0-128))+rax] vpaddd ymm4,ymm4,ymm6 vpsrld ymm8,ymm0,27 vpxor ymm5,ymm3,ymm2 vpxor ymm11,ymm11,ymm13 vmovdqu YMMWORD PTR[(224-128)+rax],ymm10 vpaddd ymm4,ymm4,ymm10 vpor ymm7,ymm7,ymm8 vpsrld ymm9,ymm11,31 vpand ymm5,ymm5,ymm1 vpaddd ymm11,ymm11,ymm11 vpslld ymm6,ymm1,30 vpaddd ymm4,ymm4,ymm5 vpsrld ymm1,ymm1,2 vpaddd ymm4,ymm4,ymm7 vpor ymm11,ymm11,ymm9 vpor ymm1,ymm1,ymm6 vpxor ymm12,ymm12,ymm14 vmovdqa ymm14,YMMWORD PTR[((352-256-128))+rbx] vpaddd ymm3,ymm3,ymm15 vpslld ymm7,ymm4,5 vpand ymm6,ymm2,ymm1 vpxor ymm12,ymm12,YMMWORD PTR[((32-128))+rax] vpaddd ymm3,ymm3,ymm6 vpsrld ymm8,ymm4,27 vpxor ymm5,ymm2,ymm1 vpxor ymm12,ymm12,ymm14 vmovdqu YMMWORD PTR[(256-256-128)+rbx],ymm11 vpaddd ymm3,ymm3,ymm11 vpor ymm7,ymm7,ymm8 vpsrld ymm9,ymm12,31 vpand ymm5,ymm5,ymm0 vpaddd ymm12,ymm12,ymm12 vpslld ymm6,ymm0,30 vpaddd ymm3,ymm3,ymm5 vpsrld ymm0,ymm0,2 vpaddd ymm3,ymm3,ymm7 vpor ymm12,ymm12,ymm9 vpor ymm0,ymm0,ymm6 vpxor ymm13,ymm13,ymm10 vmovdqa ymm10,YMMWORD PTR[((384-256-128))+rbx] vpaddd ymm2,ymm2,ymm15 vpslld ymm7,ymm3,5 vpand ymm6,ymm1,ymm0 vpxor ymm13,ymm13,YMMWORD PTR[((64-128))+rax] vpaddd ymm2,ymm2,ymm6 vpsrld ymm8,ymm3,27 vpxor ymm5,ymm1,ymm0 vpxor ymm13,ymm13,ymm10 vmovdqu YMMWORD PTR[(288-256-128)+rbx],ymm12 vpaddd ymm2,ymm2,ymm12 vpor ymm7,ymm7,ymm8 vpsrld ymm9,ymm13,31 vpand ymm5,ymm5,ymm4 vpaddd ymm13,ymm13,ymm13 vpslld ymm6,ymm4,30 vpaddd ymm2,ymm2,ymm5 vpsrld ymm4,ymm4,2 vpaddd ymm2,ymm2,ymm7 vpor ymm13,ymm13,ymm9 vpor ymm4,ymm4,ymm6 vpxor ymm14,ymm14,ymm11 vmovdqa ymm11,YMMWORD PTR[((416-256-128))+rbx] vpaddd ymm1,ymm1,ymm15 vpslld ymm7,ymm2,5 vpand ymm6,ymm0,ymm4 vpxor ymm14,ymm14,YMMWORD PTR[((96-128))+rax] vpaddd ymm1,ymm1,ymm6 vpsrld ymm8,ymm2,27 vpxor ymm5,ymm0,ymm4 vpxor ymm14,ymm14,ymm11 vmovdqu YMMWORD PTR[(320-256-128)+rbx],ymm13 vpaddd ymm1,ymm1,ymm13 vpor ymm7,ymm7,ymm8 vpsrld ymm9,ymm14,31 vpand ymm5,ymm5,ymm3 vpaddd ymm14,ymm14,ymm14 vpslld ymm6,ymm3,30 vpaddd ymm1,ymm1,ymm5 vpsrld ymm3,ymm3,2 vpaddd ymm1,ymm1,ymm7 vpor ymm14,ymm14,ymm9 vpor ymm3,ymm3,ymm6 vpxor ymm10,ymm10,ymm12 vmovdqa ymm12,YMMWORD PTR[((448-256-128))+rbx] vpaddd ymm0,ymm0,ymm15 vpslld ymm7,ymm1,5 vpand ymm6,ymm4,ymm3 vpxor ymm10,ymm10,YMMWORD PTR[((128-128))+rax] vpaddd ymm0,ymm0,ymm6 vpsrld ymm8,ymm1,27 vpxor ymm5,ymm4,ymm3 vpxor ymm10,ymm10,ymm12 vmovdqu YMMWORD PTR[(352-256-128)+rbx],ymm14 vpaddd ymm0,ymm0,ymm14 vpor ymm7,ymm7,ymm8 vpsrld ymm9,ymm10,31 vpand ymm5,ymm5,ymm2 vpaddd ymm10,ymm10,ymm10 vpslld ymm6,ymm2,30 vpaddd ymm0,ymm0,ymm5 vpsrld ymm2,ymm2,2 vpaddd ymm0,ymm0,ymm7 vpor ymm10,ymm10,ymm9 vpor ymm2,ymm2,ymm6 vmovdqa ymm15,YMMWORD PTR[64+rbp] vpxor ymm11,ymm11,ymm13 vmovdqa ymm13,YMMWORD PTR[((480-256-128))+rbx] vpslld ymm7,ymm0,5 vpaddd ymm4,ymm4,ymm15 vpxor ymm5,ymm3,ymm1 vmovdqa YMMWORD PTR[(384-256-128)+rbx],ymm10 vpaddd ymm4,ymm4,ymm10 vpxor ymm11,ymm11,YMMWORD PTR[((160-128))+rax] vpsrld ymm8,ymm0,27 vpxor ymm5,ymm5,ymm2 vpxor ymm11,ymm11,ymm13 vpslld ymm6,ymm1,30 vpor ymm7,ymm7,ymm8 vpaddd ymm4,ymm4,ymm5 vpsrld ymm9,ymm11,31 vpaddd ymm11,ymm11,ymm11 vpsrld ymm1,ymm1,2 vpaddd ymm4,ymm4,ymm7 vpor ymm11,ymm11,ymm9 vpor ymm1,ymm1,ymm6 vpxor ymm12,ymm12,ymm14 vmovdqa ymm14,YMMWORD PTR[((0-128))+rax] vpslld ymm7,ymm4,5 vpaddd ymm3,ymm3,ymm15 vpxor ymm5,ymm2,ymm0 vmovdqa YMMWORD PTR[(416-256-128)+rbx],ymm11 vpaddd ymm3,ymm3,ymm11 vpxor ymm12,ymm12,YMMWORD PTR[((192-128))+rax] vpsrld ymm8,ymm4,27 vpxor ymm5,ymm5,ymm1 vpxor ymm12,ymm12,ymm14 vpslld ymm6,ymm0,30 vpor ymm7,ymm7,ymm8 vpaddd ymm3,ymm3,ymm5 vpsrld ymm9,ymm12,31 vpaddd ymm12,ymm12,ymm12 vpsrld ymm0,ymm0,2 vpaddd ymm3,ymm3,ymm7 vpor ymm12,ymm12,ymm9 vpor ymm0,ymm0,ymm6 vpxor ymm13,ymm13,ymm10 vmovdqa ymm10,YMMWORD PTR[((32-128))+rax] vpslld ymm7,ymm3,5 vpaddd ymm2,ymm2,ymm15 vpxor ymm5,ymm1,ymm4 vmovdqa YMMWORD PTR[(448-256-128)+rbx],ymm12 vpaddd ymm2,ymm2,ymm12 vpxor ymm13,ymm13,YMMWORD PTR[((224-128))+rax] vpsrld ymm8,ymm3,27 vpxor ymm5,ymm5,ymm0 vpxor ymm13,ymm13,ymm10 vpslld ymm6,ymm4,30 vpor ymm7,ymm7,ymm8 vpaddd ymm2,ymm2,ymm5 vpsrld ymm9,ymm13,31 vpaddd ymm13,ymm13,ymm13 vpsrld ymm4,ymm4,2 vpaddd ymm2,ymm2,ymm7 vpor ymm13,ymm13,ymm9 vpor ymm4,ymm4,ymm6 vpxor ymm14,ymm14,ymm11 vmovdqa ymm11,YMMWORD PTR[((64-128))+rax] vpslld ymm7,ymm2,5 vpaddd ymm1,ymm1,ymm15 vpxor ymm5,ymm0,ymm3 vmovdqa YMMWORD PTR[(480-256-128)+rbx],ymm13 vpaddd ymm1,ymm1,ymm13 vpxor ymm14,ymm14,YMMWORD PTR[((256-256-128))+rbx] vpsrld ymm8,ymm2,27 vpxor ymm5,ymm5,ymm4 vpxor ymm14,ymm14,ymm11 vpslld ymm6,ymm3,30 vpor ymm7,ymm7,ymm8 vpaddd ymm1,ymm1,ymm5 vpsrld ymm9,ymm14,31 vpaddd ymm14,ymm14,ymm14 vpsrld ymm3,ymm3,2 vpaddd ymm1,ymm1,ymm7 vpor ymm14,ymm14,ymm9 vpor ymm3,ymm3,ymm6 vpxor ymm10,ymm10,ymm12 vmovdqa ymm12,YMMWORD PTR[((96-128))+rax] vpslld ymm7,ymm1,5 vpaddd ymm0,ymm0,ymm15 vpxor ymm5,ymm4,ymm2 vmovdqa YMMWORD PTR[(0-128)+rax],ymm14 vpaddd ymm0,ymm0,ymm14 vpxor ymm10,ymm10,YMMWORD PTR[((288-256-128))+rbx] vpsrld ymm8,ymm1,27 vpxor ymm5,ymm5,ymm3 vpxor ymm10,ymm10,ymm12 vpslld ymm6,ymm2,30 vpor ymm7,ymm7,ymm8 vpaddd ymm0,ymm0,ymm5 vpsrld ymm9,ymm10,31 vpaddd ymm10,ymm10,ymm10 vpsrld ymm2,ymm2,2 vpaddd ymm0,ymm0,ymm7 vpor ymm10,ymm10,ymm9 vpor ymm2,ymm2,ymm6 vpxor ymm11,ymm11,ymm13 vmovdqa ymm13,YMMWORD PTR[((128-128))+rax] vpslld ymm7,ymm0,5 vpaddd ymm4,ymm4,ymm15 vpxor ymm5,ymm3,ymm1 vmovdqa YMMWORD PTR[(32-128)+rax],ymm10 vpaddd ymm4,ymm4,ymm10 vpxor ymm11,ymm11,YMMWORD PTR[((320-256-128))+rbx] vpsrld ymm8,ymm0,27 vpxor ymm5,ymm5,ymm2 vpxor ymm11,ymm11,ymm13 vpslld ymm6,ymm1,30 vpor ymm7,ymm7,ymm8 vpaddd ymm4,ymm4,ymm5 vpsrld ymm9,ymm11,31 vpaddd ymm11,ymm11,ymm11 vpsrld ymm1,ymm1,2 vpaddd ymm4,ymm4,ymm7 vpor ymm11,ymm11,ymm9 vpor ymm1,ymm1,ymm6 vpxor ymm12,ymm12,ymm14 vmovdqa ymm14,YMMWORD PTR[((160-128))+rax] vpslld ymm7,ymm4,5 vpaddd ymm3,ymm3,ymm15 vpxor ymm5,ymm2,ymm0 vmovdqa YMMWORD PTR[(64-128)+rax],ymm11 vpaddd ymm3,ymm3,ymm11 vpxor ymm12,ymm12,YMMWORD PTR[((352-256-128))+rbx] vpsrld ymm8,ymm4,27 vpxor ymm5,ymm5,ymm1 vpxor ymm12,ymm12,ymm14 vpslld ymm6,ymm0,30 vpor ymm7,ymm7,ymm8 vpaddd ymm3,ymm3,ymm5 vpsrld ymm9,ymm12,31 vpaddd ymm12,ymm12,ymm12 vpsrld ymm0,ymm0,2 vpaddd ymm3,ymm3,ymm7 vpor ymm12,ymm12,ymm9 vpor ymm0,ymm0,ymm6 vpxor ymm13,ymm13,ymm10 vmovdqa ymm10,YMMWORD PTR[((192-128))+rax] vpslld ymm7,ymm3,5 vpaddd ymm2,ymm2,ymm15 vpxor ymm5,ymm1,ymm4 vmovdqa YMMWORD PTR[(96-128)+rax],ymm12 vpaddd ymm2,ymm2,ymm12 vpxor ymm13,ymm13,YMMWORD PTR[((384-256-128))+rbx] vpsrld ymm8,ymm3,27 vpxor ymm5,ymm5,ymm0 vpxor ymm13,ymm13,ymm10 vpslld ymm6,ymm4,30 vpor ymm7,ymm7,ymm8 vpaddd ymm2,ymm2,ymm5 vpsrld ymm9,ymm13,31 vpaddd ymm13,ymm13,ymm13 vpsrld ymm4,ymm4,2 vpaddd ymm2,ymm2,ymm7 vpor ymm13,ymm13,ymm9 vpor ymm4,ymm4,ymm6 vpxor ymm14,ymm14,ymm11 vmovdqa ymm11,YMMWORD PTR[((224-128))+rax] vpslld ymm7,ymm2,5 vpaddd ymm1,ymm1,ymm15 vpxor ymm5,ymm0,ymm3 vmovdqa YMMWORD PTR[(128-128)+rax],ymm13 vpaddd ymm1,ymm1,ymm13 vpxor ymm14,ymm14,YMMWORD PTR[((416-256-128))+rbx] vpsrld ymm8,ymm2,27 vpxor ymm5,ymm5,ymm4 vpxor ymm14,ymm14,ymm11 vpslld ymm6,ymm3,30 vpor ymm7,ymm7,ymm8 vpaddd ymm1,ymm1,ymm5 vpsrld ymm9,ymm14,31 vpaddd ymm14,ymm14,ymm14 vpsrld ymm3,ymm3,2 vpaddd ymm1,ymm1,ymm7 vpor ymm14,ymm14,ymm9 vpor ymm3,ymm3,ymm6 vpxor ymm10,ymm10,ymm12 vmovdqa ymm12,YMMWORD PTR[((256-256-128))+rbx] vpslld ymm7,ymm1,5 vpaddd ymm0,ymm0,ymm15 vpxor ymm5,ymm4,ymm2 vmovdqa YMMWORD PTR[(160-128)+rax],ymm14 vpaddd ymm0,ymm0,ymm14 vpxor ymm10,ymm10,YMMWORD PTR[((448-256-128))+rbx] vpsrld ymm8,ymm1,27 vpxor ymm5,ymm5,ymm3 vpxor ymm10,ymm10,ymm12 vpslld ymm6,ymm2,30 vpor ymm7,ymm7,ymm8 vpaddd ymm0,ymm0,ymm5 vpsrld ymm9,ymm10,31 vpaddd ymm10,ymm10,ymm10 vpsrld ymm2,ymm2,2 vpaddd ymm0,ymm0,ymm7 vpor ymm10,ymm10,ymm9 vpor ymm2,ymm2,ymm6 vpxor ymm11,ymm11,ymm13 vmovdqa ymm13,YMMWORD PTR[((288-256-128))+rbx] vpslld ymm7,ymm0,5 vpaddd ymm4,ymm4,ymm15 vpxor ymm5,ymm3,ymm1 vmovdqa YMMWORD PTR[(192-128)+rax],ymm10 vpaddd ymm4,ymm4,ymm10 vpxor ymm11,ymm11,YMMWORD PTR[((480-256-128))+rbx] vpsrld ymm8,ymm0,27 vpxor ymm5,ymm5,ymm2 vpxor ymm11,ymm11,ymm13 vpslld ymm6,ymm1,30 vpor ymm7,ymm7,ymm8 vpaddd ymm4,ymm4,ymm5 vpsrld ymm9,ymm11,31 vpaddd ymm11,ymm11,ymm11 vpsrld ymm1,ymm1,2 vpaddd ymm4,ymm4,ymm7 vpor ymm11,ymm11,ymm9 vpor ymm1,ymm1,ymm6 vpxor ymm12,ymm12,ymm14 vmovdqa ymm14,YMMWORD PTR[((320-256-128))+rbx] vpslld ymm7,ymm4,5 vpaddd ymm3,ymm3,ymm15 vpxor ymm5,ymm2,ymm0 vmovdqa YMMWORD PTR[(224-128)+rax],ymm11 vpaddd ymm3,ymm3,ymm11 vpxor ymm12,ymm12,YMMWORD PTR[((0-128))+rax] vpsrld ymm8,ymm4,27 vpxor ymm5,ymm5,ymm1 vpxor ymm12,ymm12,ymm14 vpslld ymm6,ymm0,30 vpor ymm7,ymm7,ymm8 vpaddd ymm3,ymm3,ymm5 vpsrld ymm9,ymm12,31 vpaddd ymm12,ymm12,ymm12 vpsrld ymm0,ymm0,2 vpaddd ymm3,ymm3,ymm7 vpor ymm12,ymm12,ymm9 vpor ymm0,ymm0,ymm6 vpxor ymm13,ymm13,ymm10 vmovdqa ymm10,YMMWORD PTR[((352-256-128))+rbx] vpslld ymm7,ymm3,5 vpaddd ymm2,ymm2,ymm15 vpxor ymm5,ymm1,ymm4 vpaddd ymm2,ymm2,ymm12 vpxor ymm13,ymm13,YMMWORD PTR[((32-128))+rax] vpsrld ymm8,ymm3,27 vpxor ymm5,ymm5,ymm0 vpxor ymm13,ymm13,ymm10 vpslld ymm6,ymm4,30 vpor ymm7,ymm7,ymm8 vpaddd ymm2,ymm2,ymm5 vpsrld ymm9,ymm13,31 vpaddd ymm13,ymm13,ymm13 vpsrld ymm4,ymm4,2 vpaddd ymm2,ymm2,ymm7 vpor ymm13,ymm13,ymm9 vpor ymm4,ymm4,ymm6 vpxor ymm14,ymm14,ymm11 vmovdqa ymm11,YMMWORD PTR[((384-256-128))+rbx] vpslld ymm7,ymm2,5 vpaddd ymm1,ymm1,ymm15 vpxor ymm5,ymm0,ymm3 vpaddd ymm1,ymm1,ymm13 vpxor ymm14,ymm14,YMMWORD PTR[((64-128))+rax] vpsrld ymm8,ymm2,27 vpxor ymm5,ymm5,ymm4 vpxor ymm14,ymm14,ymm11 vpslld ymm6,ymm3,30 vpor ymm7,ymm7,ymm8 vpaddd ymm1,ymm1,ymm5 vpsrld ymm9,ymm14,31 vpaddd ymm14,ymm14,ymm14 vpsrld ymm3,ymm3,2 vpaddd ymm1,ymm1,ymm7 vpor ymm14,ymm14,ymm9 vpor ymm3,ymm3,ymm6 vpxor ymm10,ymm10,ymm12 vmovdqa ymm12,YMMWORD PTR[((416-256-128))+rbx] vpslld ymm7,ymm1,5 vpaddd ymm0,ymm0,ymm15 vpxor ymm5,ymm4,ymm2 vpaddd ymm0,ymm0,ymm14 vpxor ymm10,ymm10,YMMWORD PTR[((96-128))+rax] vpsrld ymm8,ymm1,27 vpxor ymm5,ymm5,ymm3 vpxor ymm10,ymm10,ymm12 vpslld ymm6,ymm2,30 vpor ymm7,ymm7,ymm8 vpaddd ymm0,ymm0,ymm5 vpsrld ymm9,ymm10,31 vpaddd ymm10,ymm10,ymm10 vpsrld ymm2,ymm2,2 vpaddd ymm0,ymm0,ymm7 vpor ymm10,ymm10,ymm9 vpor ymm2,ymm2,ymm6 vpxor ymm11,ymm11,ymm13 vmovdqa ymm13,YMMWORD PTR[((448-256-128))+rbx] vpslld ymm7,ymm0,5 vpaddd ymm4,ymm4,ymm15 vpxor ymm5,ymm3,ymm1 vpaddd ymm4,ymm4,ymm10 vpxor ymm11,ymm11,YMMWORD PTR[((128-128))+rax] vpsrld ymm8,ymm0,27 vpxor ymm5,ymm5,ymm2 vpxor ymm11,ymm11,ymm13 vpslld ymm6,ymm1,30 vpor ymm7,ymm7,ymm8 vpaddd ymm4,ymm4,ymm5 vpsrld ymm9,ymm11,31 vpaddd ymm11,ymm11,ymm11 vpsrld ymm1,ymm1,2 vpaddd ymm4,ymm4,ymm7 vpor ymm11,ymm11,ymm9 vpor ymm1,ymm1,ymm6 vpxor ymm12,ymm12,ymm14 vmovdqa ymm14,YMMWORD PTR[((480-256-128))+rbx] vpslld ymm7,ymm4,5 vpaddd ymm3,ymm3,ymm15 vpxor ymm5,ymm2,ymm0 vpaddd ymm3,ymm3,ymm11 vpxor ymm12,ymm12,YMMWORD PTR[((160-128))+rax] vpsrld ymm8,ymm4,27 vpxor ymm5,ymm5,ymm1 vpxor ymm12,ymm12,ymm14 vpslld ymm6,ymm0,30 vpor ymm7,ymm7,ymm8 vpaddd ymm3,ymm3,ymm5 vpsrld ymm9,ymm12,31 vpaddd ymm12,ymm12,ymm12 vpsrld ymm0,ymm0,2 vpaddd ymm3,ymm3,ymm7 vpor ymm12,ymm12,ymm9 vpor ymm0,ymm0,ymm6 vpxor ymm13,ymm13,ymm10 vmovdqa ymm10,YMMWORD PTR[((0-128))+rax] vpslld ymm7,ymm3,5 vpaddd ymm2,ymm2,ymm15 vpxor ymm5,ymm1,ymm4 vpaddd ymm2,ymm2,ymm12 vpxor ymm13,ymm13,YMMWORD PTR[((192-128))+rax] vpsrld ymm8,ymm3,27 vpxor ymm5,ymm5,ymm0 vpxor ymm13,ymm13,ymm10 vpslld ymm6,ymm4,30 vpor ymm7,ymm7,ymm8 vpaddd ymm2,ymm2,ymm5 vpsrld ymm9,ymm13,31 vpaddd ymm13,ymm13,ymm13 vpsrld ymm4,ymm4,2 vpaddd ymm2,ymm2,ymm7 vpor ymm13,ymm13,ymm9 vpor ymm4,ymm4,ymm6 vpxor ymm14,ymm14,ymm11 vmovdqa ymm11,YMMWORD PTR[((32-128))+rax] vpslld ymm7,ymm2,5 vpaddd ymm1,ymm1,ymm15 vpxor ymm5,ymm0,ymm3 vpaddd ymm1,ymm1,ymm13 vpxor ymm14,ymm14,YMMWORD PTR[((224-128))+rax] vpsrld ymm8,ymm2,27 vpxor ymm5,ymm5,ymm4 vpxor ymm14,ymm14,ymm11 vpslld ymm6,ymm3,30 vpor ymm7,ymm7,ymm8 vpaddd ymm1,ymm1,ymm5 vpsrld ymm9,ymm14,31 vpaddd ymm14,ymm14,ymm14 vpsrld ymm3,ymm3,2 vpaddd ymm1,ymm1,ymm7 vpor ymm14,ymm14,ymm9 vpor ymm3,ymm3,ymm6 vpslld ymm7,ymm1,5 vpaddd ymm0,ymm0,ymm15 vpxor ymm5,ymm4,ymm2 vpsrld ymm8,ymm1,27 vpaddd ymm0,ymm0,ymm14 vpxor ymm5,ymm5,ymm3 vpslld ymm6,ymm2,30 vpor ymm7,ymm7,ymm8 vpaddd ymm0,ymm0,ymm5 vpsrld ymm2,ymm2,2 vpaddd ymm0,ymm0,ymm7 vpor ymm2,ymm2,ymm6 mov ecx,1 lea rbx,QWORD PTR[512+rsp] cmp ecx,DWORD PTR[rbx] cmovge r12,rbp cmp ecx,DWORD PTR[4+rbx] cmovge r13,rbp cmp ecx,DWORD PTR[8+rbx] cmovge r14,rbp cmp ecx,DWORD PTR[12+rbx] cmovge r15,rbp cmp ecx,DWORD PTR[16+rbx] cmovge r8,rbp cmp ecx,DWORD PTR[20+rbx] cmovge r9,rbp cmp ecx,DWORD PTR[24+rbx] cmovge r10,rbp cmp ecx,DWORD PTR[28+rbx] cmovge r11,rbp vmovdqu ymm5,YMMWORD PTR[rbx] vpxor ymm7,ymm7,ymm7 vmovdqa ymm6,ymm5 vpcmpgtd ymm6,ymm6,ymm7 vpaddd ymm5,ymm5,ymm6 vpand ymm0,ymm0,ymm6 vpand ymm1,ymm1,ymm6 vpaddd ymm0,ymm0,YMMWORD PTR[rdi] vpand ymm2,ymm2,ymm6 vpaddd ymm1,ymm1,YMMWORD PTR[32+rdi] vpand ymm3,ymm3,ymm6 vpaddd ymm2,ymm2,YMMWORD PTR[64+rdi] vpand ymm4,ymm4,ymm6 vpaddd ymm3,ymm3,YMMWORD PTR[96+rdi] vpaddd ymm4,ymm4,YMMWORD PTR[128+rdi] vmovdqu YMMWORD PTR[rdi],ymm0 vmovdqu YMMWORD PTR[32+rdi],ymm1 vmovdqu YMMWORD PTR[64+rdi],ymm2 vmovdqu YMMWORD PTR[96+rdi],ymm3 vmovdqu YMMWORD PTR[128+rdi],ymm4 vmovdqu YMMWORD PTR[rbx],ymm5 lea rbx,QWORD PTR[((256+128))+rsp] vmovdqu ymm9,YMMWORD PTR[96+rbp] dec edx jnz $L$oop_avx2 $L$done_avx2:: mov rax,QWORD PTR[544+rsp] vzeroupper movaps xmm6,XMMWORD PTR[((-216))+rax] movaps xmm7,XMMWORD PTR[((-200))+rax] movaps xmm8,XMMWORD PTR[((-184))+rax] movaps xmm9,XMMWORD PTR[((-168))+rax] movaps xmm10,XMMWORD PTR[((-152))+rax] movaps xmm11,XMMWORD PTR[((-136))+rax] movaps xmm12,XMMWORD PTR[((-120))+rax] movaps xmm13,XMMWORD PTR[((-104))+rax] movaps xmm14,XMMWORD PTR[((-88))+rax] movaps xmm15,XMMWORD PTR[((-72))+rax] mov r15,QWORD PTR[((-48))+rax] mov r14,QWORD PTR[((-40))+rax] mov r13,QWORD PTR[((-32))+rax] mov r12,QWORD PTR[((-24))+rax] mov rbp,QWORD PTR[((-16))+rax] mov rbx,QWORD PTR[((-8))+rax] lea rsp,QWORD PTR[rax] $L$epilogue_avx2:: mov rdi,QWORD PTR[8+rsp] ;WIN64 epilogue mov rsi,QWORD PTR[16+rsp] DB 0F3h,0C3h ;repret $L$SEH_end_sha1_multi_block_avx2:: sha1_multi_block_avx2 ENDP ALIGN 256 DD 05a827999h,05a827999h,05a827999h,05a827999h DD 05a827999h,05a827999h,05a827999h,05a827999h K_XX_XX:: DD 06ed9eba1h,06ed9eba1h,06ed9eba1h,06ed9eba1h DD 06ed9eba1h,06ed9eba1h,06ed9eba1h,06ed9eba1h DD 08f1bbcdch,08f1bbcdch,08f1bbcdch,08f1bbcdch DD 08f1bbcdch,08f1bbcdch,08f1bbcdch,08f1bbcdch DD 0ca62c1d6h,0ca62c1d6h,0ca62c1d6h,0ca62c1d6h DD 0ca62c1d6h,0ca62c1d6h,0ca62c1d6h,0ca62c1d6h DD 000010203h,004050607h,008090a0bh,00c0d0e0fh DD 000010203h,004050607h,008090a0bh,00c0d0e0fh DB 0fh,0eh,0dh,0ch,0bh,0ah,09h,08h,07h,06h,05h,04h,03h,02h,01h,00h DB 83,72,65,49,32,109,117,108,116,105,45,98,108,111,99,107 DB 32,116,114,97,110,115,102,111,114,109,32,102,111,114,32,120 DB 56,54,95,54,52,44,32,67,82,89,80,84,79,71,65,77 DB 83,32,98,121,32,60,97,112,112,114,111,64,111,112,101,110 DB 115,115,108,46,111,114,103,62,0 EXTERN __imp_RtlVirtualUnwind:NEAR ALIGN 16 se_handler PROC PRIVATE push rsi push rdi push rbx push rbp push r12 push r13 push r14 push r15 pushfq sub rsp,64 mov rax,QWORD PTR[120+r8] mov rbx,QWORD PTR[248+r8] mov rsi,QWORD PTR[8+r9] mov r11,QWORD PTR[56+r9] mov r10d,DWORD PTR[r11] lea r10,QWORD PTR[r10*1+rsi] cmp rbx,r10 jb $L$in_prologue mov rax,QWORD PTR[152+r8] mov r10d,DWORD PTR[4+r11] lea r10,QWORD PTR[r10*1+rsi] cmp rbx,r10 jae $L$in_prologue mov rax,QWORD PTR[272+rax] mov rbx,QWORD PTR[((-8))+rax] mov rbp,QWORD PTR[((-16))+rax] mov QWORD PTR[144+r8],rbx mov QWORD PTR[160+r8],rbp lea rsi,QWORD PTR[((-24-160))+rax] lea rdi,QWORD PTR[512+r8] mov ecx,20 DD 0a548f3fch $L$in_prologue:: mov rdi,QWORD PTR[8+rax] mov rsi,QWORD PTR[16+rax] mov QWORD PTR[152+r8],rax mov QWORD PTR[168+r8],rsi mov QWORD PTR[176+r8],rdi mov rdi,QWORD PTR[40+r9] mov rsi,r8 mov ecx,154 DD 0a548f3fch mov rsi,r9 xor rcx,rcx mov rdx,QWORD PTR[8+rsi] mov r8,QWORD PTR[rsi] mov r9,QWORD PTR[16+rsi] mov r10,QWORD PTR[40+rsi] lea r11,QWORD PTR[56+rsi] lea r12,QWORD PTR[24+rsi] mov QWORD PTR[32+rsp],r10 mov QWORD PTR[40+rsp],r11 mov QWORD PTR[48+rsp],r12 mov QWORD PTR[56+rsp],rcx call QWORD PTR[__imp_RtlVirtualUnwind] mov eax,1 add rsp,64 popfq pop r15 pop r14 pop r13 pop r12 pop rbp pop rbx pop rdi pop rsi DB 0F3h,0C3h ;repret se_handler ENDP ALIGN 16 avx2_handler PROC PRIVATE push rsi push rdi push rbx push rbp push r12 push r13 push r14 push r15 pushfq sub rsp,64 mov rax,QWORD PTR[120+r8] mov rbx,QWORD PTR[248+r8] mov rsi,QWORD PTR[8+r9] mov r11,QWORD PTR[56+r9] mov r10d,DWORD PTR[r11] lea r10,QWORD PTR[r10*1+rsi] cmp rbx,r10 jb $L$in_prologue mov rax,QWORD PTR[152+r8] mov r10d,DWORD PTR[4+r11] lea r10,QWORD PTR[r10*1+rsi] cmp rbx,r10 jae $L$in_prologue mov rax,QWORD PTR[544+r8] mov rbx,QWORD PTR[((-8))+rax] mov rbp,QWORD PTR[((-16))+rax] mov r12,QWORD PTR[((-24))+rax] mov r13,QWORD PTR[((-32))+rax] mov r14,QWORD PTR[((-40))+rax] mov r15,QWORD PTR[((-48))+rax] mov QWORD PTR[144+r8],rbx mov QWORD PTR[160+r8],rbp mov QWORD PTR[216+r8],r12 mov QWORD PTR[224+r8],r13 mov QWORD PTR[232+r8],r14 mov QWORD PTR[240+r8],r15 lea rsi,QWORD PTR[((-56-160))+rax] lea rdi,QWORD PTR[512+r8] mov ecx,20 DD 0a548f3fch jmp $L$in_prologue avx2_handler ENDP .text$ ENDS .pdata SEGMENT READONLY ALIGN(4) ALIGN 4 DD imagerel $L$SEH_begin_sha1_multi_block DD imagerel $L$SEH_end_sha1_multi_block DD imagerel $L$SEH_info_sha1_multi_block DD imagerel $L$SEH_begin_sha1_multi_block_shaext DD imagerel $L$SEH_end_sha1_multi_block_shaext DD imagerel $L$SEH_info_sha1_multi_block_shaext DD imagerel $L$SEH_begin_sha1_multi_block_avx DD imagerel $L$SEH_end_sha1_multi_block_avx DD imagerel $L$SEH_info_sha1_multi_block_avx DD imagerel $L$SEH_begin_sha1_multi_block_avx2 DD imagerel $L$SEH_end_sha1_multi_block_avx2 DD imagerel $L$SEH_info_sha1_multi_block_avx2 .pdata ENDS .xdata SEGMENT READONLY ALIGN(8) ALIGN 8 $L$SEH_info_sha1_multi_block:: DB 9,0,0,0 DD imagerel se_handler DD imagerel $L$body,imagerel $L$epilogue $L$SEH_info_sha1_multi_block_shaext:: DB 9,0,0,0 DD imagerel se_handler DD imagerel $L$body_shaext,imagerel $L$epilogue_shaext $L$SEH_info_sha1_multi_block_avx:: DB 9,0,0,0 DD imagerel se_handler DD imagerel $L$body_avx,imagerel $L$epilogue_avx $L$SEH_info_sha1_multi_block_avx2:: DB 9,0,0,0 DD imagerel avx2_handler DD imagerel $L$body_avx2,imagerel $L$epilogue_avx2 .xdata ENDS END