OPTION DOTNAME .text$ SEGMENT ALIGN(256) 'CODE' EXTERN OPENSSL_ia32cap_P:NEAR PUBLIC rsaz_512_sqr ALIGN 32 rsaz_512_sqr PROC PUBLIC mov QWORD PTR[8+rsp],rdi ;WIN64 prologue mov QWORD PTR[16+rsp],rsi mov rax,rsp $L$SEH_begin_rsaz_512_sqr:: mov rdi,rcx mov rsi,rdx mov rdx,r8 mov rcx,r9 mov r8,QWORD PTR[40+rsp] push rbx push rbp push r12 push r13 push r14 push r15 sub rsp,128+24 $L$sqr_body:: mov rbp,rdx mov rdx,QWORD PTR[rsi] mov rax,QWORD PTR[8+rsi] mov QWORD PTR[128+rsp],rcx mov r11d,080100h and r11d,DWORD PTR[((OPENSSL_ia32cap_P+8))] cmp r11d,080100h je $L$oop_sqrx jmp $L$oop_sqr ALIGN 32 $L$oop_sqr:: mov DWORD PTR[((128+8))+rsp],r8d mov rbx,rdx mul rdx mov r8,rax mov rax,QWORD PTR[16+rsi] mov r9,rdx mul rbx add r9,rax mov rax,QWORD PTR[24+rsi] mov r10,rdx adc r10,0 mul rbx add r10,rax mov rax,QWORD PTR[32+rsi] mov r11,rdx adc r11,0 mul rbx add r11,rax mov rax,QWORD PTR[40+rsi] mov r12,rdx adc r12,0 mul rbx add r12,rax mov rax,QWORD PTR[48+rsi] mov r13,rdx adc r13,0 mul rbx add r13,rax mov rax,QWORD PTR[56+rsi] mov r14,rdx adc r14,0 mul rbx add r14,rax mov rax,rbx mov r15,rdx adc r15,0 add r8,r8 mov rcx,r9 adc r9,r9 mul rax mov QWORD PTR[rsp],rax add r8,rdx adc r9,0 mov QWORD PTR[8+rsp],r8 shr rcx,63 mov r8,QWORD PTR[8+rsi] mov rax,QWORD PTR[16+rsi] mul r8 add r10,rax mov rax,QWORD PTR[24+rsi] mov rbx,rdx adc rbx,0 mul r8 add r11,rax mov rax,QWORD PTR[32+rsi] adc rdx,0 add r11,rbx mov rbx,rdx adc rbx,0 mul r8 add r12,rax mov rax,QWORD PTR[40+rsi] adc rdx,0 add r12,rbx mov rbx,rdx adc rbx,0 mul r8 add r13,rax mov rax,QWORD PTR[48+rsi] adc rdx,0 add r13,rbx mov rbx,rdx adc rbx,0 mul r8 add r14,rax mov rax,QWORD PTR[56+rsi] adc rdx,0 add r14,rbx mov rbx,rdx adc rbx,0 mul r8 add r15,rax mov rax,r8 adc rdx,0 add r15,rbx mov r8,rdx mov rdx,r10 adc r8,0 add rdx,rdx lea r10,QWORD PTR[r10*2+rcx] mov rbx,r11 adc r11,r11 mul rax add r9,rax adc r10,rdx adc r11,0 mov QWORD PTR[16+rsp],r9 mov QWORD PTR[24+rsp],r10 shr rbx,63 mov r9,QWORD PTR[16+rsi] mov rax,QWORD PTR[24+rsi] mul r9 add r12,rax mov rax,QWORD PTR[32+rsi] mov rcx,rdx adc rcx,0 mul r9 add r13,rax mov rax,QWORD PTR[40+rsi] adc rdx,0 add r13,rcx mov rcx,rdx adc rcx,0 mul r9 add r14,rax mov rax,QWORD PTR[48+rsi] adc rdx,0 add r14,rcx mov rcx,rdx adc rcx,0 mul r9 mov r10,r12 lea r12,QWORD PTR[r12*2+rbx] add r15,rax mov rax,QWORD PTR[56+rsi] adc rdx,0 add r15,rcx mov rcx,rdx adc rcx,0 mul r9 shr r10,63 add r8,rax mov rax,r9 adc rdx,0 add r8,rcx mov r9,rdx adc r9,0 mov rcx,r13 lea r13,QWORD PTR[r13*2+r10] mul rax add r11,rax adc r12,rdx adc r13,0 mov QWORD PTR[32+rsp],r11 mov QWORD PTR[40+rsp],r12 shr rcx,63 mov r10,QWORD PTR[24+rsi] mov rax,QWORD PTR[32+rsi] mul r10 add r14,rax mov rax,QWORD PTR[40+rsi] mov rbx,rdx adc rbx,0 mul r10 add r15,rax mov rax,QWORD PTR[48+rsi] adc rdx,0 add r15,rbx mov rbx,rdx adc rbx,0 mul r10 mov r12,r14 lea r14,QWORD PTR[r14*2+rcx] add r8,rax mov rax,QWORD PTR[56+rsi] adc rdx,0 add r8,rbx mov rbx,rdx adc rbx,0 mul r10 shr r12,63 add r9,rax mov rax,r10 adc rdx,0 add r9,rbx mov r10,rdx adc r10,0 mov rbx,r15 lea r15,QWORD PTR[r15*2+r12] mul rax add r13,rax adc r14,rdx adc r15,0 mov QWORD PTR[48+rsp],r13 mov QWORD PTR[56+rsp],r14 shr rbx,63 mov r11,QWORD PTR[32+rsi] mov rax,QWORD PTR[40+rsi] mul r11 add r8,rax mov rax,QWORD PTR[48+rsi] mov rcx,rdx adc rcx,0 mul r11 add r9,rax mov rax,QWORD PTR[56+rsi] adc rdx,0 mov r12,r8 lea r8,QWORD PTR[r8*2+rbx] add r9,rcx mov rcx,rdx adc rcx,0 mul r11 shr r12,63 add r10,rax mov rax,r11 adc rdx,0 add r10,rcx mov r11,rdx adc r11,0 mov rcx,r9 lea r9,QWORD PTR[r9*2+r12] mul rax add r15,rax adc r8,rdx adc r9,0 mov QWORD PTR[64+rsp],r15 mov QWORD PTR[72+rsp],r8 shr rcx,63 mov r12,QWORD PTR[40+rsi] mov rax,QWORD PTR[48+rsi] mul r12 add r10,rax mov rax,QWORD PTR[56+rsi] mov rbx,rdx adc rbx,0 mul r12 add r11,rax mov rax,r12 mov r15,r10 lea r10,QWORD PTR[r10*2+rcx] adc rdx,0 shr r15,63 add r11,rbx mov r12,rdx adc r12,0 mov rbx,r11 lea r11,QWORD PTR[r11*2+r15] mul rax add r9,rax adc r10,rdx adc r11,0 mov QWORD PTR[80+rsp],r9 mov QWORD PTR[88+rsp],r10 mov r13,QWORD PTR[48+rsi] mov rax,QWORD PTR[56+rsi] mul r13 add r12,rax mov rax,r13 mov r13,rdx adc r13,0 xor r14,r14 shl rbx,1 adc r12,r12 adc r13,r13 adc r14,r14 mul rax add r11,rax adc r12,rdx adc r13,0 mov QWORD PTR[96+rsp],r11 mov QWORD PTR[104+rsp],r12 mov rax,QWORD PTR[56+rsi] mul rax add r13,rax adc rdx,0 add r14,rdx mov QWORD PTR[112+rsp],r13 mov QWORD PTR[120+rsp],r14 mov r8,QWORD PTR[rsp] mov r9,QWORD PTR[8+rsp] mov r10,QWORD PTR[16+rsp] mov r11,QWORD PTR[24+rsp] mov r12,QWORD PTR[32+rsp] mov r13,QWORD PTR[40+rsp] mov r14,QWORD PTR[48+rsp] mov r15,QWORD PTR[56+rsp] call __rsaz_512_reduce add r8,QWORD PTR[64+rsp] adc r9,QWORD PTR[72+rsp] adc r10,QWORD PTR[80+rsp] adc r11,QWORD PTR[88+rsp] adc r12,QWORD PTR[96+rsp] adc r13,QWORD PTR[104+rsp] adc r14,QWORD PTR[112+rsp] adc r15,QWORD PTR[120+rsp] sbb rcx,rcx call __rsaz_512_subtract mov rdx,r8 mov rax,r9 mov r8d,DWORD PTR[((128+8))+rsp] mov rsi,rdi dec r8d jnz $L$oop_sqr jmp $L$sqr_tail ALIGN 32 $L$oop_sqrx:: mov DWORD PTR[((128+8))+rsp],r8d DB 102,72,15,110,199 DB 102,72,15,110,205 mulx r9,r8,rax mulx r10,rcx,QWORD PTR[16+rsi] xor rbp,rbp mulx r11,rax,QWORD PTR[24+rsi] adcx r9,rcx mulx r12,rcx,QWORD PTR[32+rsi] adcx r10,rax mulx r13,rax,QWORD PTR[40+rsi] adcx r11,rcx DB 0c4h,062h,0f3h,0f6h,0b6h,030h,000h,000h,000h adcx r12,rax adcx r13,rcx DB 0c4h,062h,0fbh,0f6h,0beh,038h,000h,000h,000h adcx r14,rax adcx r15,rbp mov rcx,r9 shld r9,r8,1 shl r8,1 xor ebp,ebp mulx rdx,rax,rdx adcx r8,rdx mov rdx,QWORD PTR[8+rsi] adcx r9,rbp mov QWORD PTR[rsp],rax mov QWORD PTR[8+rsp],r8 mulx rbx,rax,QWORD PTR[16+rsi] adox r10,rax adcx r11,rbx DB 0c4h,062h,0c3h,0f6h,086h,018h,000h,000h,000h adox r11,rdi adcx r12,r8 mulx rbx,rax,QWORD PTR[32+rsi] adox r12,rax adcx r13,rbx mulx r8,rdi,QWORD PTR[40+rsi] adox r13,rdi adcx r14,r8 DB 0c4h,0e2h,0fbh,0f6h,09eh,030h,000h,000h,000h adox r14,rax adcx r15,rbx DB 0c4h,062h,0c3h,0f6h,086h,038h,000h,000h,000h adox r15,rdi adcx r8,rbp adox r8,rbp mov rbx,r11 shld r11,r10,1 shld r10,rcx,1 xor ebp,ebp mulx rcx,rax,rdx mov rdx,QWORD PTR[16+rsi] adcx r9,rax adcx r10,rcx adcx r11,rbp mov QWORD PTR[16+rsp],r9 DB 04ch,089h,094h,024h,018h,000h,000h,000h DB 0c4h,062h,0c3h,0f6h,08eh,018h,000h,000h,000h adox r12,rdi adcx r13,r9 mulx rcx,rax,QWORD PTR[32+rsi] adox r13,rax adcx r14,rcx mulx r9,rdi,QWORD PTR[40+rsi] adox r14,rdi adcx r15,r9 DB 0c4h,0e2h,0fbh,0f6h,08eh,030h,000h,000h,000h adox r15,rax adcx r8,rcx DB 0c4h,062h,0c3h,0f6h,08eh,038h,000h,000h,000h adox r8,rdi adcx r9,rbp adox r9,rbp mov rcx,r13 shld r13,r12,1 shld r12,rbx,1 xor ebp,ebp mulx rdx,rax,rdx adcx r11,rax adcx r12,rdx mov rdx,QWORD PTR[24+rsi] adcx r13,rbp mov QWORD PTR[32+rsp],r11 DB 04ch,089h,0a4h,024h,028h,000h,000h,000h DB 0c4h,0e2h,0fbh,0f6h,09eh,020h,000h,000h,000h adox r14,rax adcx r15,rbx mulx r10,rdi,QWORD PTR[40+rsi] adox r15,rdi adcx r8,r10 mulx rbx,rax,QWORD PTR[48+rsi] adox r8,rax adcx r9,rbx mulx r10,rdi,QWORD PTR[56+rsi] adox r9,rdi adcx r10,rbp adox r10,rbp DB 066h mov rbx,r15 shld r15,r14,1 shld r14,rcx,1 xor ebp,ebp mulx rdx,rax,rdx adcx r13,rax adcx r14,rdx mov rdx,QWORD PTR[32+rsi] adcx r15,rbp mov QWORD PTR[48+rsp],r13 mov QWORD PTR[56+rsp],r14 DB 0c4h,062h,0c3h,0f6h,09eh,028h,000h,000h,000h adox r8,rdi adcx r9,r11 mulx rcx,rax,QWORD PTR[48+rsi] adox r9,rax adcx r10,rcx mulx r11,rdi,QWORD PTR[56+rsi] adox r10,rdi adcx r11,rbp adox r11,rbp mov rcx,r9 shld r9,r8,1 shld r8,rbx,1 xor ebp,ebp mulx rdx,rax,rdx adcx r15,rax adcx r8,rdx mov rdx,QWORD PTR[40+rsi] adcx r9,rbp mov QWORD PTR[64+rsp],r15 mov QWORD PTR[72+rsp],r8 DB 0c4h,0e2h,0fbh,0f6h,09eh,030h,000h,000h,000h adox r10,rax adcx r11,rbx DB 0c4h,062h,0c3h,0f6h,0a6h,038h,000h,000h,000h adox r11,rdi adcx r12,rbp adox r12,rbp mov rbx,r11 shld r11,r10,1 shld r10,rcx,1 xor ebp,ebp mulx rdx,rax,rdx adcx r9,rax adcx r10,rdx mov rdx,QWORD PTR[48+rsi] adcx r11,rbp mov QWORD PTR[80+rsp],r9 mov QWORD PTR[88+rsp],r10 DB 0c4h,062h,0fbh,0f6h,0aeh,038h,000h,000h,000h adox r12,rax adox r13,rbp xor r14,r14 shld r14,r13,1 shld r13,r12,1 shld r12,rbx,1 xor ebp,ebp mulx rdx,rax,rdx adcx r11,rax adcx r12,rdx mov rdx,QWORD PTR[56+rsi] adcx r13,rbp DB 04ch,089h,09ch,024h,060h,000h,000h,000h DB 04ch,089h,0a4h,024h,068h,000h,000h,000h mulx rdx,rax,rdx adox r13,rax adox rdx,rbp DB 066h add r14,rdx mov QWORD PTR[112+rsp],r13 mov QWORD PTR[120+rsp],r14 DB 102,72,15,126,199 DB 102,72,15,126,205 mov rdx,QWORD PTR[128+rsp] mov r8,QWORD PTR[rsp] mov r9,QWORD PTR[8+rsp] mov r10,QWORD PTR[16+rsp] mov r11,QWORD PTR[24+rsp] mov r12,QWORD PTR[32+rsp] mov r13,QWORD PTR[40+rsp] mov r14,QWORD PTR[48+rsp] mov r15,QWORD PTR[56+rsp] call __rsaz_512_reducex add r8,QWORD PTR[64+rsp] adc r9,QWORD PTR[72+rsp] adc r10,QWORD PTR[80+rsp] adc r11,QWORD PTR[88+rsp] adc r12,QWORD PTR[96+rsp] adc r13,QWORD PTR[104+rsp] adc r14,QWORD PTR[112+rsp] adc r15,QWORD PTR[120+rsp] sbb rcx,rcx call __rsaz_512_subtract mov rdx,r8 mov rax,r9 mov r8d,DWORD PTR[((128+8))+rsp] mov rsi,rdi dec r8d jnz $L$oop_sqrx $L$sqr_tail:: lea rax,QWORD PTR[((128+24+48))+rsp] mov r15,QWORD PTR[((-48))+rax] mov r14,QWORD PTR[((-40))+rax] mov r13,QWORD PTR[((-32))+rax] mov r12,QWORD PTR[((-24))+rax] mov rbp,QWORD PTR[((-16))+rax] mov rbx,QWORD PTR[((-8))+rax] lea rsp,QWORD PTR[rax] $L$sqr_epilogue:: mov rdi,QWORD PTR[8+rsp] ;WIN64 epilogue mov rsi,QWORD PTR[16+rsp] DB 0F3h,0C3h ;repret $L$SEH_end_rsaz_512_sqr:: rsaz_512_sqr ENDP PUBLIC rsaz_512_mul ALIGN 32 rsaz_512_mul PROC PUBLIC mov QWORD PTR[8+rsp],rdi ;WIN64 prologue mov QWORD PTR[16+rsp],rsi mov rax,rsp $L$SEH_begin_rsaz_512_mul:: mov rdi,rcx mov rsi,rdx mov rdx,r8 mov rcx,r9 mov r8,QWORD PTR[40+rsp] push rbx push rbp push r12 push r13 push r14 push r15 sub rsp,128+24 $L$mul_body:: DB 102,72,15,110,199 DB 102,72,15,110,201 mov QWORD PTR[128+rsp],r8 mov r11d,080100h and r11d,DWORD PTR[((OPENSSL_ia32cap_P+8))] cmp r11d,080100h je $L$mulx mov rbx,QWORD PTR[rdx] mov rbp,rdx call __rsaz_512_mul DB 102,72,15,126,199 DB 102,72,15,126,205 mov r8,QWORD PTR[rsp] mov r9,QWORD PTR[8+rsp] mov r10,QWORD PTR[16+rsp] mov r11,QWORD PTR[24+rsp] mov r12,QWORD PTR[32+rsp] mov r13,QWORD PTR[40+rsp] mov r14,QWORD PTR[48+rsp] mov r15,QWORD PTR[56+rsp] call __rsaz_512_reduce jmp $L$mul_tail ALIGN 32 $L$mulx:: mov rbp,rdx mov rdx,QWORD PTR[rdx] call __rsaz_512_mulx DB 102,72,15,126,199 DB 102,72,15,126,205 mov rdx,QWORD PTR[128+rsp] mov r8,QWORD PTR[rsp] mov r9,QWORD PTR[8+rsp] mov r10,QWORD PTR[16+rsp] mov r11,QWORD PTR[24+rsp] mov r12,QWORD PTR[32+rsp] mov r13,QWORD PTR[40+rsp] mov r14,QWORD PTR[48+rsp] mov r15,QWORD PTR[56+rsp] call __rsaz_512_reducex $L$mul_tail:: add r8,QWORD PTR[64+rsp] adc r9,QWORD PTR[72+rsp] adc r10,QWORD PTR[80+rsp] adc r11,QWORD PTR[88+rsp] adc r12,QWORD PTR[96+rsp] adc r13,QWORD PTR[104+rsp] adc r14,QWORD PTR[112+rsp] adc r15,QWORD PTR[120+rsp] sbb rcx,rcx call __rsaz_512_subtract lea rax,QWORD PTR[((128+24+48))+rsp] mov r15,QWORD PTR[((-48))+rax] mov r14,QWORD PTR[((-40))+rax] mov r13,QWORD PTR[((-32))+rax] mov r12,QWORD PTR[((-24))+rax] mov rbp,QWORD PTR[((-16))+rax] mov rbx,QWORD PTR[((-8))+rax] lea rsp,QWORD PTR[rax] $L$mul_epilogue:: mov rdi,QWORD PTR[8+rsp] ;WIN64 epilogue mov rsi,QWORD PTR[16+rsp] DB 0F3h,0C3h ;repret $L$SEH_end_rsaz_512_mul:: rsaz_512_mul ENDP PUBLIC rsaz_512_mul_gather4 ALIGN 32 rsaz_512_mul_gather4 PROC PUBLIC mov QWORD PTR[8+rsp],rdi ;WIN64 prologue mov QWORD PTR[16+rsp],rsi mov rax,rsp $L$SEH_begin_rsaz_512_mul_gather4:: mov rdi,rcx mov rsi,rdx mov rdx,r8 mov rcx,r9 mov r8,QWORD PTR[40+rsp] mov r9,QWORD PTR[48+rsp] push rbx push rbp push r12 push r13 push r14 push r15 sub rsp,328 movaps XMMWORD PTR[160+rsp],xmm6 movaps XMMWORD PTR[176+rsp],xmm7 movaps XMMWORD PTR[192+rsp],xmm8 movaps XMMWORD PTR[208+rsp],xmm9 movaps XMMWORD PTR[224+rsp],xmm10 movaps XMMWORD PTR[240+rsp],xmm11 movaps XMMWORD PTR[256+rsp],xmm12 movaps XMMWORD PTR[272+rsp],xmm13 movaps XMMWORD PTR[288+rsp],xmm14 movaps XMMWORD PTR[304+rsp],xmm15 $L$mul_gather4_body:: movd xmm8,r9d movdqa xmm1,XMMWORD PTR[(($L$inc+16))] movdqa xmm0,XMMWORD PTR[$L$inc] pshufd xmm8,xmm8,0 movdqa xmm7,xmm1 movdqa xmm2,xmm1 paddd xmm1,xmm0 pcmpeqd xmm0,xmm8 movdqa xmm3,xmm7 paddd xmm2,xmm1 pcmpeqd xmm1,xmm8 movdqa xmm4,xmm7 paddd xmm3,xmm2 pcmpeqd xmm2,xmm8 movdqa xmm5,xmm7 paddd xmm4,xmm3 pcmpeqd xmm3,xmm8 movdqa xmm6,xmm7 paddd xmm5,xmm4 pcmpeqd xmm4,xmm8 paddd xmm6,xmm5 pcmpeqd xmm5,xmm8 paddd xmm7,xmm6 pcmpeqd xmm6,xmm8 pcmpeqd xmm7,xmm8 movdqa xmm8,XMMWORD PTR[rdx] movdqa xmm9,XMMWORD PTR[16+rdx] movdqa xmm10,XMMWORD PTR[32+rdx] movdqa xmm11,XMMWORD PTR[48+rdx] pand xmm8,xmm0 movdqa xmm12,XMMWORD PTR[64+rdx] pand xmm9,xmm1 movdqa xmm13,XMMWORD PTR[80+rdx] pand xmm10,xmm2 movdqa xmm14,XMMWORD PTR[96+rdx] pand xmm11,xmm3 movdqa xmm15,XMMWORD PTR[112+rdx] lea rbp,QWORD PTR[128+rdx] pand xmm12,xmm4 pand xmm13,xmm5 pand xmm14,xmm6 pand xmm15,xmm7 por xmm8,xmm10 por xmm9,xmm11 por xmm8,xmm12 por xmm9,xmm13 por xmm8,xmm14 por xmm9,xmm15 por xmm8,xmm9 pshufd xmm9,xmm8,04eh por xmm8,xmm9 mov r11d,080100h and r11d,DWORD PTR[((OPENSSL_ia32cap_P+8))] cmp r11d,080100h je $L$mulx_gather DB 102,76,15,126,195 mov QWORD PTR[128+rsp],r8 mov QWORD PTR[((128+8))+rsp],rdi mov QWORD PTR[((128+16))+rsp],rcx mov rax,QWORD PTR[rsi] mov rcx,QWORD PTR[8+rsi] mul rbx mov QWORD PTR[rsp],rax mov rax,rcx mov r8,rdx mul rbx add r8,rax mov rax,QWORD PTR[16+rsi] mov r9,rdx adc r9,0 mul rbx add r9,rax mov rax,QWORD PTR[24+rsi] mov r10,rdx adc r10,0 mul rbx add r10,rax mov rax,QWORD PTR[32+rsi] mov r11,rdx adc r11,0 mul rbx add r11,rax mov rax,QWORD PTR[40+rsi] mov r12,rdx adc r12,0 mul rbx add r12,rax mov rax,QWORD PTR[48+rsi] mov r13,rdx adc r13,0 mul rbx add r13,rax mov rax,QWORD PTR[56+rsi] mov r14,rdx adc r14,0 mul rbx add r14,rax mov rax,QWORD PTR[rsi] mov r15,rdx adc r15,0 lea rdi,QWORD PTR[8+rsp] mov ecx,7 jmp $L$oop_mul_gather ALIGN 32 $L$oop_mul_gather:: movdqa xmm8,XMMWORD PTR[rbp] movdqa xmm9,XMMWORD PTR[16+rbp] movdqa xmm10,XMMWORD PTR[32+rbp] movdqa xmm11,XMMWORD PTR[48+rbp] pand xmm8,xmm0 movdqa xmm12,XMMWORD PTR[64+rbp] pand xmm9,xmm1 movdqa xmm13,XMMWORD PTR[80+rbp] pand xmm10,xmm2 movdqa xmm14,XMMWORD PTR[96+rbp] pand xmm11,xmm3 movdqa xmm15,XMMWORD PTR[112+rbp] lea rbp,QWORD PTR[128+rbp] pand xmm12,xmm4 pand xmm13,xmm5 pand xmm14,xmm6 pand xmm15,xmm7 por xmm8,xmm10 por xmm9,xmm11 por xmm8,xmm12 por xmm9,xmm13 por xmm8,xmm14 por xmm9,xmm15 por xmm8,xmm9 pshufd xmm9,xmm8,04eh por xmm8,xmm9 DB 102,76,15,126,195 mul rbx add r8,rax mov rax,QWORD PTR[8+rsi] mov QWORD PTR[rdi],r8 mov r8,rdx adc r8,0 mul rbx add r9,rax mov rax,QWORD PTR[16+rsi] adc rdx,0 add r8,r9 mov r9,rdx adc r9,0 mul rbx add r10,rax mov rax,QWORD PTR[24+rsi] adc rdx,0 add r9,r10 mov r10,rdx adc r10,0 mul rbx add r11,rax mov rax,QWORD PTR[32+rsi] adc rdx,0 add r10,r11 mov r11,rdx adc r11,0 mul rbx add r12,rax mov rax,QWORD PTR[40+rsi] adc rdx,0 add r11,r12 mov r12,rdx adc r12,0 mul rbx add r13,rax mov rax,QWORD PTR[48+rsi] adc rdx,0 add r12,r13 mov r13,rdx adc r13,0 mul rbx add r14,rax mov rax,QWORD PTR[56+rsi] adc rdx,0 add r13,r14 mov r14,rdx adc r14,0 mul rbx add r15,rax mov rax,QWORD PTR[rsi] adc rdx,0 add r14,r15 mov r15,rdx adc r15,0 lea rdi,QWORD PTR[8+rdi] dec ecx jnz $L$oop_mul_gather mov QWORD PTR[rdi],r8 mov QWORD PTR[8+rdi],r9 mov QWORD PTR[16+rdi],r10 mov QWORD PTR[24+rdi],r11 mov QWORD PTR[32+rdi],r12 mov QWORD PTR[40+rdi],r13 mov QWORD PTR[48+rdi],r14 mov QWORD PTR[56+rdi],r15 mov rdi,QWORD PTR[((128+8))+rsp] mov rbp,QWORD PTR[((128+16))+rsp] mov r8,QWORD PTR[rsp] mov r9,QWORD PTR[8+rsp] mov r10,QWORD PTR[16+rsp] mov r11,QWORD PTR[24+rsp] mov r12,QWORD PTR[32+rsp] mov r13,QWORD PTR[40+rsp] mov r14,QWORD PTR[48+rsp] mov r15,QWORD PTR[56+rsp] call __rsaz_512_reduce jmp $L$mul_gather_tail ALIGN 32 $L$mulx_gather:: DB 102,76,15,126,194 mov QWORD PTR[128+rsp],r8 mov QWORD PTR[((128+8))+rsp],rdi mov QWORD PTR[((128+16))+rsp],rcx mulx r8,rbx,QWORD PTR[rsi] mov QWORD PTR[rsp],rbx xor edi,edi mulx r9,rax,QWORD PTR[8+rsi] mulx r10,rbx,QWORD PTR[16+rsi] adcx r8,rax mulx r11,rax,QWORD PTR[24+rsi] adcx r9,rbx mulx r12,rbx,QWORD PTR[32+rsi] adcx r10,rax mulx r13,rax,QWORD PTR[40+rsi] adcx r11,rbx mulx r14,rbx,QWORD PTR[48+rsi] adcx r12,rax mulx r15,rax,QWORD PTR[56+rsi] adcx r13,rbx adcx r14,rax DB 067h mov rbx,r8 adcx r15,rdi mov rcx,-7 jmp $L$oop_mulx_gather ALIGN 32 $L$oop_mulx_gather:: movdqa xmm8,XMMWORD PTR[rbp] movdqa xmm9,XMMWORD PTR[16+rbp] movdqa xmm10,XMMWORD PTR[32+rbp] movdqa xmm11,XMMWORD PTR[48+rbp] pand xmm8,xmm0 movdqa xmm12,XMMWORD PTR[64+rbp] pand xmm9,xmm1 movdqa xmm13,XMMWORD PTR[80+rbp] pand xmm10,xmm2 movdqa xmm14,XMMWORD PTR[96+rbp] pand xmm11,xmm3 movdqa xmm15,XMMWORD PTR[112+rbp] lea rbp,QWORD PTR[128+rbp] pand xmm12,xmm4 pand xmm13,xmm5 pand xmm14,xmm6 pand xmm15,xmm7 por xmm8,xmm10 por xmm9,xmm11 por xmm8,xmm12 por xmm9,xmm13 por xmm8,xmm14 por xmm9,xmm15 por xmm8,xmm9 pshufd xmm9,xmm8,04eh por xmm8,xmm9 DB 102,76,15,126,194 DB 0c4h,062h,0fbh,0f6h,086h,000h,000h,000h,000h adcx rbx,rax adox r8,r9 mulx r9,rax,QWORD PTR[8+rsi] adcx r8,rax adox r9,r10 mulx r10,rax,QWORD PTR[16+rsi] adcx r9,rax adox r10,r11 DB 0c4h,062h,0fbh,0f6h,09eh,018h,000h,000h,000h adcx r10,rax adox r11,r12 mulx r12,rax,QWORD PTR[32+rsi] adcx r11,rax adox r12,r13 mulx r13,rax,QWORD PTR[40+rsi] adcx r12,rax adox r13,r14 DB 0c4h,062h,0fbh,0f6h,0b6h,030h,000h,000h,000h adcx r13,rax DB 067h adox r14,r15 mulx r15,rax,QWORD PTR[56+rsi] mov QWORD PTR[64+rcx*8+rsp],rbx adcx r14,rax adox r15,rdi mov rbx,r8 adcx r15,rdi inc rcx jnz $L$oop_mulx_gather mov QWORD PTR[64+rsp],r8 mov QWORD PTR[((64+8))+rsp],r9 mov QWORD PTR[((64+16))+rsp],r10 mov QWORD PTR[((64+24))+rsp],r11 mov QWORD PTR[((64+32))+rsp],r12 mov QWORD PTR[((64+40))+rsp],r13 mov QWORD PTR[((64+48))+rsp],r14 mov QWORD PTR[((64+56))+rsp],r15 mov rdx,QWORD PTR[128+rsp] mov rdi,QWORD PTR[((128+8))+rsp] mov rbp,QWORD PTR[((128+16))+rsp] mov r8,QWORD PTR[rsp] mov r9,QWORD PTR[8+rsp] mov r10,QWORD PTR[16+rsp] mov r11,QWORD PTR[24+rsp] mov r12,QWORD PTR[32+rsp] mov r13,QWORD PTR[40+rsp] mov r14,QWORD PTR[48+rsp] mov r15,QWORD PTR[56+rsp] call __rsaz_512_reducex $L$mul_gather_tail:: add r8,QWORD PTR[64+rsp] adc r9,QWORD PTR[72+rsp] adc r10,QWORD PTR[80+rsp] adc r11,QWORD PTR[88+rsp] adc r12,QWORD PTR[96+rsp] adc r13,QWORD PTR[104+rsp] adc r14,QWORD PTR[112+rsp] adc r15,QWORD PTR[120+rsp] sbb rcx,rcx call __rsaz_512_subtract lea rax,QWORD PTR[((128+24+48))+rsp] movaps xmm6,XMMWORD PTR[((160-200))+rax] movaps xmm7,XMMWORD PTR[((176-200))+rax] movaps xmm8,XMMWORD PTR[((192-200))+rax] movaps xmm9,XMMWORD PTR[((208-200))+rax] movaps xmm10,XMMWORD PTR[((224-200))+rax] movaps xmm11,XMMWORD PTR[((240-200))+rax] movaps xmm12,XMMWORD PTR[((256-200))+rax] movaps xmm13,XMMWORD PTR[((272-200))+rax] movaps xmm14,XMMWORD PTR[((288-200))+rax] movaps xmm15,XMMWORD PTR[((304-200))+rax] lea rax,QWORD PTR[176+rax] mov r15,QWORD PTR[((-48))+rax] mov r14,QWORD PTR[((-40))+rax] mov r13,QWORD PTR[((-32))+rax] mov r12,QWORD PTR[((-24))+rax] mov rbp,QWORD PTR[((-16))+rax] mov rbx,QWORD PTR[((-8))+rax] lea rsp,QWORD PTR[rax] $L$mul_gather4_epilogue:: mov rdi,QWORD PTR[8+rsp] ;WIN64 epilogue mov rsi,QWORD PTR[16+rsp] DB 0F3h,0C3h ;repret $L$SEH_end_rsaz_512_mul_gather4:: rsaz_512_mul_gather4 ENDP PUBLIC rsaz_512_mul_scatter4 ALIGN 32 rsaz_512_mul_scatter4 PROC PUBLIC mov QWORD PTR[8+rsp],rdi ;WIN64 prologue mov QWORD PTR[16+rsp],rsi mov rax,rsp $L$SEH_begin_rsaz_512_mul_scatter4:: mov rdi,rcx mov rsi,rdx mov rdx,r8 mov rcx,r9 mov r8,QWORD PTR[40+rsp] mov r9,QWORD PTR[48+rsp] push rbx push rbp push r12 push r13 push r14 push r15 mov r9d,r9d sub rsp,128+24 $L$mul_scatter4_body:: lea r8,QWORD PTR[r9*8+r8] DB 102,72,15,110,199 DB 102,72,15,110,202 DB 102,73,15,110,208 mov QWORD PTR[128+rsp],rcx mov rbp,rdi mov r11d,080100h and r11d,DWORD PTR[((OPENSSL_ia32cap_P+8))] cmp r11d,080100h je $L$mulx_scatter mov rbx,QWORD PTR[rdi] call __rsaz_512_mul DB 102,72,15,126,199 DB 102,72,15,126,205 mov r8,QWORD PTR[rsp] mov r9,QWORD PTR[8+rsp] mov r10,QWORD PTR[16+rsp] mov r11,QWORD PTR[24+rsp] mov r12,QWORD PTR[32+rsp] mov r13,QWORD PTR[40+rsp] mov r14,QWORD PTR[48+rsp] mov r15,QWORD PTR[56+rsp] call __rsaz_512_reduce jmp $L$mul_scatter_tail ALIGN 32 $L$mulx_scatter:: mov rdx,QWORD PTR[rdi] call __rsaz_512_mulx DB 102,72,15,126,199 DB 102,72,15,126,205 mov rdx,QWORD PTR[128+rsp] mov r8,QWORD PTR[rsp] mov r9,QWORD PTR[8+rsp] mov r10,QWORD PTR[16+rsp] mov r11,QWORD PTR[24+rsp] mov r12,QWORD PTR[32+rsp] mov r13,QWORD PTR[40+rsp] mov r14,QWORD PTR[48+rsp] mov r15,QWORD PTR[56+rsp] call __rsaz_512_reducex $L$mul_scatter_tail:: add r8,QWORD PTR[64+rsp] adc r9,QWORD PTR[72+rsp] adc r10,QWORD PTR[80+rsp] adc r11,QWORD PTR[88+rsp] adc r12,QWORD PTR[96+rsp] adc r13,QWORD PTR[104+rsp] adc r14,QWORD PTR[112+rsp] adc r15,QWORD PTR[120+rsp] DB 102,72,15,126,214 sbb rcx,rcx call __rsaz_512_subtract mov QWORD PTR[rsi],r8 mov QWORD PTR[128+rsi],r9 mov QWORD PTR[256+rsi],r10 mov QWORD PTR[384+rsi],r11 mov QWORD PTR[512+rsi],r12 mov QWORD PTR[640+rsi],r13 mov QWORD PTR[768+rsi],r14 mov QWORD PTR[896+rsi],r15 lea rax,QWORD PTR[((128+24+48))+rsp] mov r15,QWORD PTR[((-48))+rax] mov r14,QWORD PTR[((-40))+rax] mov r13,QWORD PTR[((-32))+rax] mov r12,QWORD PTR[((-24))+rax] mov rbp,QWORD PTR[((-16))+rax] mov rbx,QWORD PTR[((-8))+rax] lea rsp,QWORD PTR[rax] $L$mul_scatter4_epilogue:: mov rdi,QWORD PTR[8+rsp] ;WIN64 epilogue mov rsi,QWORD PTR[16+rsp] DB 0F3h,0C3h ;repret $L$SEH_end_rsaz_512_mul_scatter4:: rsaz_512_mul_scatter4 ENDP PUBLIC rsaz_512_mul_by_one ALIGN 32 rsaz_512_mul_by_one PROC PUBLIC mov QWORD PTR[8+rsp],rdi ;WIN64 prologue mov QWORD PTR[16+rsp],rsi mov rax,rsp $L$SEH_begin_rsaz_512_mul_by_one:: mov rdi,rcx mov rsi,rdx mov rdx,r8 mov rcx,r9 push rbx push rbp push r12 push r13 push r14 push r15 sub rsp,128+24 $L$mul_by_one_body:: mov eax,DWORD PTR[((OPENSSL_ia32cap_P+8))] mov rbp,rdx mov QWORD PTR[128+rsp],rcx mov r8,QWORD PTR[rsi] pxor xmm0,xmm0 mov r9,QWORD PTR[8+rsi] mov r10,QWORD PTR[16+rsi] mov r11,QWORD PTR[24+rsi] mov r12,QWORD PTR[32+rsi] mov r13,QWORD PTR[40+rsi] mov r14,QWORD PTR[48+rsi] mov r15,QWORD PTR[56+rsi] movdqa XMMWORD PTR[rsp],xmm0 movdqa XMMWORD PTR[16+rsp],xmm0 movdqa XMMWORD PTR[32+rsp],xmm0 movdqa XMMWORD PTR[48+rsp],xmm0 movdqa XMMWORD PTR[64+rsp],xmm0 movdqa XMMWORD PTR[80+rsp],xmm0 movdqa XMMWORD PTR[96+rsp],xmm0 and eax,080100h cmp eax,080100h je $L$by_one_callx call __rsaz_512_reduce jmp $L$by_one_tail ALIGN 32 $L$by_one_callx:: mov rdx,QWORD PTR[128+rsp] call __rsaz_512_reducex $L$by_one_tail:: mov QWORD PTR[rdi],r8 mov QWORD PTR[8+rdi],r9 mov QWORD PTR[16+rdi],r10 mov QWORD PTR[24+rdi],r11 mov QWORD PTR[32+rdi],r12 mov QWORD PTR[40+rdi],r13 mov QWORD PTR[48+rdi],r14 mov QWORD PTR[56+rdi],r15 lea rax,QWORD PTR[((128+24+48))+rsp] mov r15,QWORD PTR[((-48))+rax] mov r14,QWORD PTR[((-40))+rax] mov r13,QWORD PTR[((-32))+rax] mov r12,QWORD PTR[((-24))+rax] mov rbp,QWORD PTR[((-16))+rax] mov rbx,QWORD PTR[((-8))+rax] lea rsp,QWORD PTR[rax] $L$mul_by_one_epilogue:: mov rdi,QWORD PTR[8+rsp] ;WIN64 epilogue mov rsi,QWORD PTR[16+rsp] DB 0F3h,0C3h ;repret $L$SEH_end_rsaz_512_mul_by_one:: rsaz_512_mul_by_one ENDP ALIGN 32 __rsaz_512_reduce PROC PRIVATE mov rbx,r8 imul rbx,QWORD PTR[((128+8))+rsp] mov rax,QWORD PTR[rbp] mov ecx,8 jmp $L$reduction_loop ALIGN 32 $L$reduction_loop:: mul rbx mov rax,QWORD PTR[8+rbp] neg r8 mov r8,rdx adc r8,0 mul rbx add r9,rax mov rax,QWORD PTR[16+rbp] adc rdx,0 add r8,r9 mov r9,rdx adc r9,0 mul rbx add r10,rax mov rax,QWORD PTR[24+rbp] adc rdx,0 add r9,r10 mov r10,rdx adc r10,0 mul rbx add r11,rax mov rax,QWORD PTR[32+rbp] adc rdx,0 add r10,r11 mov rsi,QWORD PTR[((128+8))+rsp] adc rdx,0 mov r11,rdx mul rbx add r12,rax mov rax,QWORD PTR[40+rbp] adc rdx,0 imul rsi,r8 add r11,r12 mov r12,rdx adc r12,0 mul rbx add r13,rax mov rax,QWORD PTR[48+rbp] adc rdx,0 add r12,r13 mov r13,rdx adc r13,0 mul rbx add r14,rax mov rax,QWORD PTR[56+rbp] adc rdx,0 add r13,r14 mov r14,rdx adc r14,0 mul rbx mov rbx,rsi add r15,rax mov rax,QWORD PTR[rbp] adc rdx,0 add r14,r15 mov r15,rdx adc r15,0 dec ecx jne $L$reduction_loop DB 0F3h,0C3h ;repret __rsaz_512_reduce ENDP ALIGN 32 __rsaz_512_reducex PROC PRIVATE imul rdx,r8 xor rsi,rsi mov ecx,8 jmp $L$reduction_loopx ALIGN 32 $L$reduction_loopx:: mov rbx,r8 mulx r8,rax,QWORD PTR[rbp] adcx rax,rbx adox r8,r9 mulx r9,rax,QWORD PTR[8+rbp] adcx r8,rax adox r9,r10 mulx r10,rbx,QWORD PTR[16+rbp] adcx r9,rbx adox r10,r11 mulx r11,rbx,QWORD PTR[24+rbp] adcx r10,rbx adox r11,r12 DB 0c4h,062h,0e3h,0f6h,0a5h,020h,000h,000h,000h mov rax,rdx mov rdx,r8 adcx r11,rbx adox r12,r13 mulx rdx,rbx,QWORD PTR[((128+8))+rsp] mov rdx,rax mulx r13,rax,QWORD PTR[40+rbp] adcx r12,rax adox r13,r14 DB 0c4h,062h,0fbh,0f6h,0b5h,030h,000h,000h,000h adcx r13,rax adox r14,r15 mulx r15,rax,QWORD PTR[56+rbp] mov rdx,rbx adcx r14,rax adox r15,rsi adcx r15,rsi dec ecx jne $L$reduction_loopx DB 0F3h,0C3h ;repret __rsaz_512_reducex ENDP ALIGN 32 __rsaz_512_subtract PROC PRIVATE mov QWORD PTR[rdi],r8 mov QWORD PTR[8+rdi],r9 mov QWORD PTR[16+rdi],r10 mov QWORD PTR[24+rdi],r11 mov QWORD PTR[32+rdi],r12 mov QWORD PTR[40+rdi],r13 mov QWORD PTR[48+rdi],r14 mov QWORD PTR[56+rdi],r15 mov r8,QWORD PTR[rbp] mov r9,QWORD PTR[8+rbp] neg r8 not r9 and r8,rcx mov r10,QWORD PTR[16+rbp] and r9,rcx not r10 mov r11,QWORD PTR[24+rbp] and r10,rcx not r11 mov r12,QWORD PTR[32+rbp] and r11,rcx not r12 mov r13,QWORD PTR[40+rbp] and r12,rcx not r13 mov r14,QWORD PTR[48+rbp] and r13,rcx not r14 mov r15,QWORD PTR[56+rbp] and r14,rcx not r15 and r15,rcx add r8,QWORD PTR[rdi] adc r9,QWORD PTR[8+rdi] adc r10,QWORD PTR[16+rdi] adc r11,QWORD PTR[24+rdi] adc r12,QWORD PTR[32+rdi] adc r13,QWORD PTR[40+rdi] adc r14,QWORD PTR[48+rdi] adc r15,QWORD PTR[56+rdi] mov QWORD PTR[rdi],r8 mov QWORD PTR[8+rdi],r9 mov QWORD PTR[16+rdi],r10 mov QWORD PTR[24+rdi],r11 mov QWORD PTR[32+rdi],r12 mov QWORD PTR[40+rdi],r13 mov QWORD PTR[48+rdi],r14 mov QWORD PTR[56+rdi],r15 DB 0F3h,0C3h ;repret __rsaz_512_subtract ENDP ALIGN 32 __rsaz_512_mul PROC PRIVATE lea rdi,QWORD PTR[8+rsp] mov rax,QWORD PTR[rsi] mul rbx mov QWORD PTR[rdi],rax mov rax,QWORD PTR[8+rsi] mov r8,rdx mul rbx add r8,rax mov rax,QWORD PTR[16+rsi] mov r9,rdx adc r9,0 mul rbx add r9,rax mov rax,QWORD PTR[24+rsi] mov r10,rdx adc r10,0 mul rbx add r10,rax mov rax,QWORD PTR[32+rsi] mov r11,rdx adc r11,0 mul rbx add r11,rax mov rax,QWORD PTR[40+rsi] mov r12,rdx adc r12,0 mul rbx add r12,rax mov rax,QWORD PTR[48+rsi] mov r13,rdx adc r13,0 mul rbx add r13,rax mov rax,QWORD PTR[56+rsi] mov r14,rdx adc r14,0 mul rbx add r14,rax mov rax,QWORD PTR[rsi] mov r15,rdx adc r15,0 lea rbp,QWORD PTR[8+rbp] lea rdi,QWORD PTR[8+rdi] mov ecx,7 jmp $L$oop_mul ALIGN 32 $L$oop_mul:: mov rbx,QWORD PTR[rbp] mul rbx add r8,rax mov rax,QWORD PTR[8+rsi] mov QWORD PTR[rdi],r8 mov r8,rdx adc r8,0 mul rbx add r9,rax mov rax,QWORD PTR[16+rsi] adc rdx,0 add r8,r9 mov r9,rdx adc r9,0 mul rbx add r10,rax mov rax,QWORD PTR[24+rsi] adc rdx,0 add r9,r10 mov r10,rdx adc r10,0 mul rbx add r11,rax mov rax,QWORD PTR[32+rsi] adc rdx,0 add r10,r11 mov r11,rdx adc r11,0 mul rbx add r12,rax mov rax,QWORD PTR[40+rsi] adc rdx,0 add r11,r12 mov r12,rdx adc r12,0 mul rbx add r13,rax mov rax,QWORD PTR[48+rsi] adc rdx,0 add r12,r13 mov r13,rdx adc r13,0 mul rbx add r14,rax mov rax,QWORD PTR[56+rsi] adc rdx,0 add r13,r14 mov r14,rdx lea rbp,QWORD PTR[8+rbp] adc r14,0 mul rbx add r15,rax mov rax,QWORD PTR[rsi] adc rdx,0 add r14,r15 mov r15,rdx adc r15,0 lea rdi,QWORD PTR[8+rdi] dec ecx jnz $L$oop_mul mov QWORD PTR[rdi],r8 mov QWORD PTR[8+rdi],r9 mov QWORD PTR[16+rdi],r10 mov QWORD PTR[24+rdi],r11 mov QWORD PTR[32+rdi],r12 mov QWORD PTR[40+rdi],r13 mov QWORD PTR[48+rdi],r14 mov QWORD PTR[56+rdi],r15 DB 0F3h,0C3h ;repret __rsaz_512_mul ENDP ALIGN 32 __rsaz_512_mulx PROC PRIVATE mulx r8,rbx,QWORD PTR[rsi] mov rcx,-6 mulx r9,rax,QWORD PTR[8+rsi] mov QWORD PTR[8+rsp],rbx mulx r10,rbx,QWORD PTR[16+rsi] adc r8,rax mulx r11,rax,QWORD PTR[24+rsi] adc r9,rbx mulx r12,rbx,QWORD PTR[32+rsi] adc r10,rax mulx r13,rax,QWORD PTR[40+rsi] adc r11,rbx mulx r14,rbx,QWORD PTR[48+rsi] adc r12,rax mulx r15,rax,QWORD PTR[56+rsi] mov rdx,QWORD PTR[8+rbp] adc r13,rbx adc r14,rax adc r15,0 xor rdi,rdi jmp $L$oop_mulx ALIGN 32 $L$oop_mulx:: mov rbx,r8 mulx r8,rax,QWORD PTR[rsi] adcx rbx,rax adox r8,r9 mulx r9,rax,QWORD PTR[8+rsi] adcx r8,rax adox r9,r10 mulx r10,rax,QWORD PTR[16+rsi] adcx r9,rax adox r10,r11 mulx r11,rax,QWORD PTR[24+rsi] adcx r10,rax adox r11,r12 DB 03eh,0c4h,062h,0fbh,0f6h,0a6h,020h,000h,000h,000h adcx r11,rax adox r12,r13 mulx r13,rax,QWORD PTR[40+rsi] adcx r12,rax adox r13,r14 mulx r14,rax,QWORD PTR[48+rsi] adcx r13,rax adox r14,r15 mulx r15,rax,QWORD PTR[56+rsi] mov rdx,QWORD PTR[64+rcx*8+rbp] mov QWORD PTR[((8+64-8))+rcx*8+rsp],rbx adcx r14,rax adox r15,rdi adcx r15,rdi inc rcx jnz $L$oop_mulx mov rbx,r8 mulx r8,rax,QWORD PTR[rsi] adcx rbx,rax adox r8,r9 DB 0c4h,062h,0fbh,0f6h,08eh,008h,000h,000h,000h adcx r8,rax adox r9,r10 DB 0c4h,062h,0fbh,0f6h,096h,010h,000h,000h,000h adcx r9,rax adox r10,r11 mulx r11,rax,QWORD PTR[24+rsi] adcx r10,rax adox r11,r12 mulx r12,rax,QWORD PTR[32+rsi] adcx r11,rax adox r12,r13 mulx r13,rax,QWORD PTR[40+rsi] adcx r12,rax adox r13,r14 DB 0c4h,062h,0fbh,0f6h,0b6h,030h,000h,000h,000h adcx r13,rax adox r14,r15 DB 0c4h,062h,0fbh,0f6h,0beh,038h,000h,000h,000h adcx r14,rax adox r15,rdi adcx r15,rdi mov QWORD PTR[((8+64-8))+rsp],rbx mov QWORD PTR[((8+64))+rsp],r8 mov QWORD PTR[((8+64+8))+rsp],r9 mov QWORD PTR[((8+64+16))+rsp],r10 mov QWORD PTR[((8+64+24))+rsp],r11 mov QWORD PTR[((8+64+32))+rsp],r12 mov QWORD PTR[((8+64+40))+rsp],r13 mov QWORD PTR[((8+64+48))+rsp],r14 mov QWORD PTR[((8+64+56))+rsp],r15 DB 0F3h,0C3h ;repret __rsaz_512_mulx ENDP PUBLIC rsaz_512_scatter4 ALIGN 16 rsaz_512_scatter4 PROC PUBLIC lea rcx,QWORD PTR[r8*8+rcx] mov r9d,8 jmp $L$oop_scatter ALIGN 16 $L$oop_scatter:: mov rax,QWORD PTR[rdx] lea rdx,QWORD PTR[8+rdx] mov QWORD PTR[rcx],rax lea rcx,QWORD PTR[128+rcx] dec r9d jnz $L$oop_scatter DB 0F3h,0C3h ;repret rsaz_512_scatter4 ENDP PUBLIC rsaz_512_gather4 ALIGN 16 rsaz_512_gather4 PROC PUBLIC $L$SEH_begin_rsaz_512_gather4:: DB 048h,081h,0ech,0a8h,000h,000h,000h DB 00fh,029h,034h,024h DB 00fh,029h,07ch,024h,010h DB 044h,00fh,029h,044h,024h,020h DB 044h,00fh,029h,04ch,024h,030h DB 044h,00fh,029h,054h,024h,040h DB 044h,00fh,029h,05ch,024h,050h DB 044h,00fh,029h,064h,024h,060h DB 044h,00fh,029h,06ch,024h,070h DB 044h,00fh,029h,0b4h,024h,080h,0,0,0 DB 044h,00fh,029h,0bch,024h,090h,0,0,0 movd xmm8,r8d movdqa xmm1,XMMWORD PTR[(($L$inc+16))] movdqa xmm0,XMMWORD PTR[$L$inc] pshufd xmm8,xmm8,0 movdqa xmm7,xmm1 movdqa xmm2,xmm1 paddd xmm1,xmm0 pcmpeqd xmm0,xmm8 movdqa xmm3,xmm7 paddd xmm2,xmm1 pcmpeqd xmm1,xmm8 movdqa xmm4,xmm7 paddd xmm3,xmm2 pcmpeqd xmm2,xmm8 movdqa xmm5,xmm7 paddd xmm4,xmm3 pcmpeqd xmm3,xmm8 movdqa xmm6,xmm7 paddd xmm5,xmm4 pcmpeqd xmm4,xmm8 paddd xmm6,xmm5 pcmpeqd xmm5,xmm8 paddd xmm7,xmm6 pcmpeqd xmm6,xmm8 pcmpeqd xmm7,xmm8 mov r9d,8 jmp $L$oop_gather ALIGN 16 $L$oop_gather:: movdqa xmm8,XMMWORD PTR[rdx] movdqa xmm9,XMMWORD PTR[16+rdx] movdqa xmm10,XMMWORD PTR[32+rdx] movdqa xmm11,XMMWORD PTR[48+rdx] pand xmm8,xmm0 movdqa xmm12,XMMWORD PTR[64+rdx] pand xmm9,xmm1 movdqa xmm13,XMMWORD PTR[80+rdx] pand xmm10,xmm2 movdqa xmm14,XMMWORD PTR[96+rdx] pand xmm11,xmm3 movdqa xmm15,XMMWORD PTR[112+rdx] lea rdx,QWORD PTR[128+rdx] pand xmm12,xmm4 pand xmm13,xmm5 pand xmm14,xmm6 pand xmm15,xmm7 por xmm8,xmm10 por xmm9,xmm11 por xmm8,xmm12 por xmm9,xmm13 por xmm8,xmm14 por xmm9,xmm15 por xmm8,xmm9 pshufd xmm9,xmm8,04eh por xmm8,xmm9 movq QWORD PTR[rcx],xmm8 lea rcx,QWORD PTR[8+rcx] dec r9d jnz $L$oop_gather movaps xmm6,XMMWORD PTR[rsp] movaps xmm7,XMMWORD PTR[16+rsp] movaps xmm8,XMMWORD PTR[32+rsp] movaps xmm9,XMMWORD PTR[48+rsp] movaps xmm10,XMMWORD PTR[64+rsp] movaps xmm11,XMMWORD PTR[80+rsp] movaps xmm12,XMMWORD PTR[96+rsp] movaps xmm13,XMMWORD PTR[112+rsp] movaps xmm14,XMMWORD PTR[128+rsp] movaps xmm15,XMMWORD PTR[144+rsp] add rsp,0a8h DB 0F3h,0C3h ;repret $L$SEH_end_rsaz_512_gather4:: rsaz_512_gather4 ENDP ALIGN 64 $L$inc:: DD 0,0,1,1 DD 2,2,2,2 EXTERN __imp_RtlVirtualUnwind:NEAR ALIGN 16 se_handler PROC PRIVATE push rsi push rdi push rbx push rbp push r12 push r13 push r14 push r15 pushfq sub rsp,64 mov rax,QWORD PTR[120+r8] mov rbx,QWORD PTR[248+r8] mov rsi,QWORD PTR[8+r9] mov r11,QWORD PTR[56+r9] mov r10d,DWORD PTR[r11] lea r10,QWORD PTR[r10*1+rsi] cmp rbx,r10 jb $L$common_seh_tail mov rax,QWORD PTR[152+r8] mov r10d,DWORD PTR[4+r11] lea r10,QWORD PTR[r10*1+rsi] cmp rbx,r10 jae $L$common_seh_tail lea rax,QWORD PTR[((128+24+48))+rax] lea rbx,QWORD PTR[$L$mul_gather4_epilogue] cmp rbx,r10 jne $L$se_not_in_mul_gather4 lea rax,QWORD PTR[176+rax] lea rsi,QWORD PTR[((-48-168))+rax] lea rdi,QWORD PTR[512+r8] mov ecx,20 DD 0a548f3fch $L$se_not_in_mul_gather4:: mov rbx,QWORD PTR[((-8))+rax] mov rbp,QWORD PTR[((-16))+rax] mov r12,QWORD PTR[((-24))+rax] mov r13,QWORD PTR[((-32))+rax] mov r14,QWORD PTR[((-40))+rax] mov r15,QWORD PTR[((-48))+rax] mov QWORD PTR[144+r8],rbx mov QWORD PTR[160+r8],rbp mov QWORD PTR[216+r8],r12 mov QWORD PTR[224+r8],r13 mov QWORD PTR[232+r8],r14 mov QWORD PTR[240+r8],r15 $L$common_seh_tail:: mov rdi,QWORD PTR[8+rax] mov rsi,QWORD PTR[16+rax] mov QWORD PTR[152+r8],rax mov QWORD PTR[168+r8],rsi mov QWORD PTR[176+r8],rdi mov rdi,QWORD PTR[40+r9] mov rsi,r8 mov ecx,154 DD 0a548f3fch mov rsi,r9 xor rcx,rcx mov rdx,QWORD PTR[8+rsi] mov r8,QWORD PTR[rsi] mov r9,QWORD PTR[16+rsi] mov r10,QWORD PTR[40+rsi] lea r11,QWORD PTR[56+rsi] lea r12,QWORD PTR[24+rsi] mov QWORD PTR[32+rsp],r10 mov QWORD PTR[40+rsp],r11 mov QWORD PTR[48+rsp],r12 mov QWORD PTR[56+rsp],rcx call QWORD PTR[__imp_RtlVirtualUnwind] mov eax,1 add rsp,64 popfq pop r15 pop r14 pop r13 pop r12 pop rbp pop rbx pop rdi pop rsi DB 0F3h,0C3h ;repret se_handler ENDP .text$ ENDS .pdata SEGMENT READONLY ALIGN(4) ALIGN 4 DD imagerel $L$SEH_begin_rsaz_512_sqr DD imagerel $L$SEH_end_rsaz_512_sqr DD imagerel $L$SEH_info_rsaz_512_sqr DD imagerel $L$SEH_begin_rsaz_512_mul DD imagerel $L$SEH_end_rsaz_512_mul DD imagerel $L$SEH_info_rsaz_512_mul DD imagerel $L$SEH_begin_rsaz_512_mul_gather4 DD imagerel $L$SEH_end_rsaz_512_mul_gather4 DD imagerel $L$SEH_info_rsaz_512_mul_gather4 DD imagerel $L$SEH_begin_rsaz_512_mul_scatter4 DD imagerel $L$SEH_end_rsaz_512_mul_scatter4 DD imagerel $L$SEH_info_rsaz_512_mul_scatter4 DD imagerel $L$SEH_begin_rsaz_512_mul_by_one DD imagerel $L$SEH_end_rsaz_512_mul_by_one DD imagerel $L$SEH_info_rsaz_512_mul_by_one DD imagerel $L$SEH_begin_rsaz_512_gather4 DD imagerel $L$SEH_end_rsaz_512_gather4 DD imagerel $L$SEH_info_rsaz_512_gather4 .pdata ENDS .xdata SEGMENT READONLY ALIGN(8) ALIGN 8 $L$SEH_info_rsaz_512_sqr:: DB 9,0,0,0 DD imagerel se_handler DD imagerel $L$sqr_body,imagerel $L$sqr_epilogue $L$SEH_info_rsaz_512_mul:: DB 9,0,0,0 DD imagerel se_handler DD imagerel $L$mul_body,imagerel $L$mul_epilogue $L$SEH_info_rsaz_512_mul_gather4:: DB 9,0,0,0 DD imagerel se_handler DD imagerel $L$mul_gather4_body,imagerel $L$mul_gather4_epilogue $L$SEH_info_rsaz_512_mul_scatter4:: DB 9,0,0,0 DD imagerel se_handler DD imagerel $L$mul_scatter4_body,imagerel $L$mul_scatter4_epilogue $L$SEH_info_rsaz_512_mul_by_one:: DB 9,0,0,0 DD imagerel se_handler DD imagerel $L$mul_by_one_body,imagerel $L$mul_by_one_epilogue $L$SEH_info_rsaz_512_gather4:: DB 001h,046h,016h,000h DB 046h,0f8h,009h,000h DB 03dh,0e8h,008h,000h DB 034h,0d8h,007h,000h DB 02eh,0c8h,006h,000h DB 028h,0b8h,005h,000h DB 022h,0a8h,004h,000h DB 01ch,098h,003h,000h DB 016h,088h,002h,000h DB 010h,078h,001h,000h DB 00bh,068h,000h,000h DB 007h,001h,015h,000h .xdata ENDS END