You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.
 
 
 
 
 
 

2155 lines
36 KiB

; Assembler setup for the code segment.
;   OPTION DOTNAME  - lets identifiers start with a dot (needed for ".text$").
;   .text$ SEGMENT  - code segment, 256-byte aligned.
;   OPENSSL_ia32cap_P is defined elsewhere; the routines in this file test
;   the dword at offset 8 of it against 080100h to choose between their
;   mul-based and mulx/adcx/adox-based code paths.
OPTION DOTNAME
.text$ SEGMENT ALIGN(256) 'CODE'
EXTERN OPENSSL_ia32cap_P:NEAR
PUBLIC rsaz_512_sqr
ALIGN 32
;-----------------------------------------------------------------------
; rsaz_512_sqr - repeated 8-limb (512-bit) squaring with reduction.
;
; ABI:  Microsoft x64 at entry. The prologue parks rdi/rsi in the caller's
;       home slots and moves the arguments into rdi, rsi, rdx, rcx, r8.
; In:   rcx -> rdi   result buffer, 8 qwords (written by __rsaz_512_subtract)
;       rdx -> rsi   input a[0..7], 8 qwords, least-significant limb first
;       r8  -> rdx   modulus pointer (kept in rbp for the helper routines)
;       r9  -> rcx   per-modulus multiplier consumed by the reduction
;                    helpers; stored at [128+rsp]
;       [40+rsp] -> r8d  number of squarings. The loop tests the counter
;                    only after the body, so a count of 0 is not handled.
; Out:  result buffer holds the value after the last iteration. After the
;       first pass rsi is pointed at the result buffer, so each further
;       pass squares the previous result.
; Frame (152 bytes): [0..127]  16-limb square
;                    [128]     multiplier for the reduction
;                    [136]     remaining iteration count (dword)
; Saves/restores: rbx, rbp, r12-r15 (push), rdi, rsi (home slots).
;
; Two code paths, selected by (OPENSSL_ia32cap_P[+8] & 080100h) == 080100h:
;   $L$oop_sqr   - mul/add/adc
;   $L$oop_sqrx  - mulx/adcx/adox
; Lines of the form "DB 0c4h,..." are VEX-encoded instructions emitted as
; raw bytes (presumably mulx forms with a 32-bit displacement - confirm
; with a disassembler). Lone "DB 066h" lines are prefix bytes attached to
; the following instruction.
;
; NOTE(review): the scalar path doubles the cross products with
; "lea r,[r*2+carry]" / "shr r,63", which looks like the upstream OpenSSL
; routine from before the CVE-2019-1551 fix ("overflow bug in
; rsaz_512_sqr"). Confirm the upstream version and consider regenerating
; this file from a patched rsaz-x86_64.pl.
;-----------------------------------------------------------------------
rsaz_512_sqr PROC PUBLIC
mov QWORD PTR[8+rsp],rdi ;WIN64 prologue
mov QWORD PTR[16+rsp],rsi
mov rax,rsp
$L$SEH_begin_rsaz_512_sqr::
; Re-home the Win64 arguments into rdi, rsi, rdx, rcx, r8.
mov rdi,rcx
mov rsi,rdx
mov rdx,r8
mov rcx,r9
mov r8,QWORD PTR[40+rsp]
push rbx
push rbp
push r12
push r13
push r14
push r15
sub rsp,128+24
$L$sqr_body::
mov rbp,rdx
; Both loops expect rdx = a[0] and rax = a[1] on entry.
mov rdx,QWORD PTR[rsi]
mov rax,QWORD PTR[8+rsi]
mov QWORD PTR[128+rsp],rcx
; Take the mulx/adcx/adox path only when both tested capability bits are set.
mov r11d,080100h
and r11d,DWORD PTR[((OPENSSL_ia32cap_P+8))]
cmp r11d,080100h
je $L$oop_sqrx
jmp $L$oop_sqr
ALIGN 32
$L$oop_sqr::
mov DWORD PTR[((128+8))+rsp],r8d
; ---- a[0] * a[1..7]: cross products accumulate in r8..r15 ----
mov rbx,rdx
mul rdx
mov r8,rax
mov rax,QWORD PTR[16+rsi]
mov r9,rdx
mul rbx
add r9,rax
mov rax,QWORD PTR[24+rsi]
mov r10,rdx
adc r10,0
mul rbx
add r10,rax
mov rax,QWORD PTR[32+rsi]
mov r11,rdx
adc r11,0
mul rbx
add r11,rax
mov rax,QWORD PTR[40+rsi]
mov r12,rdx
adc r12,0
mul rbx
add r12,rax
mov rax,QWORD PTR[48+rsi]
mov r13,rdx
adc r13,0
mul rbx
add r13,rax
mov rax,QWORD PTR[56+rsi]
mov r14,rdx
adc r14,0
mul rbx
add r14,rax
mov rax,rbx
mov r15,rdx
adc r15,0
; Double the two lowest cross-product limbs, add a[0]^2, emit limbs 0 and 1.
; rcx keeps the pre-doubling r9 so its top bit can feed the next doubling.
add r8,r8
mov rcx,r9
adc r9,r9
mul rax
mov QWORD PTR[rsp],rax
add r8,rdx
adc r9,0
mov QWORD PTR[8+rsp],r8
shr rcx,63
; ---- a[1] * a[2..7] ----
mov r8,QWORD PTR[8+rsi]
mov rax,QWORD PTR[16+rsi]
mul r8
add r10,rax
mov rax,QWORD PTR[24+rsi]
mov rbx,rdx
adc rbx,0
mul r8
add r11,rax
mov rax,QWORD PTR[32+rsi]
adc rdx,0
add r11,rbx
mov rbx,rdx
adc rbx,0
mul r8
add r12,rax
mov rax,QWORD PTR[40+rsi]
adc rdx,0
add r12,rbx
mov rbx,rdx
adc rbx,0
mul r8
add r13,rax
mov rax,QWORD PTR[48+rsi]
adc rdx,0
add r13,rbx
mov rbx,rdx
adc rbx,0
mul r8
add r14,rax
mov rax,QWORD PTR[56+rsi]
adc rdx,0
add r14,rbx
mov rbx,rdx
adc rbx,0
mul r8
add r15,rax
mov rax,r8
adc rdx,0
add r15,rbx
mov r8,rdx
mov rdx,r10
adc r8,0
; Double the next two limbs, add a[1]^2, emit limbs 2 and 3.
add rdx,rdx
lea r10,QWORD PTR[r10*2+rcx]
mov rbx,r11
adc r11,r11
mul rax
add r9,rax
adc r10,rdx
adc r11,0
mov QWORD PTR[16+rsp],r9
mov QWORD PTR[24+rsp],r10
shr rbx,63
; ---- a[2] * a[3..7] ----
mov r9,QWORD PTR[16+rsi]
mov rax,QWORD PTR[24+rsi]
mul r9
add r12,rax
mov rax,QWORD PTR[32+rsi]
mov rcx,rdx
adc rcx,0
mul r9
add r13,rax
mov rax,QWORD PTR[40+rsi]
adc rdx,0
add r13,rcx
mov rcx,rdx
adc rcx,0
mul r9
add r14,rax
mov rax,QWORD PTR[48+rsi]
adc rdx,0
add r14,rcx
mov rcx,rdx
adc rcx,0
mul r9
mov r10,r12
lea r12,QWORD PTR[r12*2+rbx]
add r15,rax
mov rax,QWORD PTR[56+rsi]
adc rdx,0
add r15,rcx
mov rcx,rdx
adc rcx,0
mul r9
shr r10,63
add r8,rax
mov rax,r9
adc rdx,0
add r8,rcx
mov r9,rdx
adc r9,0
mov rcx,r13
lea r13,QWORD PTR[r13*2+r10]
; Add a[2]^2, emit limbs 4 and 5.
mul rax
add r11,rax
adc r12,rdx
adc r13,0
mov QWORD PTR[32+rsp],r11
mov QWORD PTR[40+rsp],r12
shr rcx,63
; ---- a[3] * a[4..7] ----
mov r10,QWORD PTR[24+rsi]
mov rax,QWORD PTR[32+rsi]
mul r10
add r14,rax
mov rax,QWORD PTR[40+rsi]
mov rbx,rdx
adc rbx,0
mul r10
add r15,rax
mov rax,QWORD PTR[48+rsi]
adc rdx,0
add r15,rbx
mov rbx,rdx
adc rbx,0
mul r10
mov r12,r14
lea r14,QWORD PTR[r14*2+rcx]
add r8,rax
mov rax,QWORD PTR[56+rsi]
adc rdx,0
add r8,rbx
mov rbx,rdx
adc rbx,0
mul r10
shr r12,63
add r9,rax
mov rax,r10
adc rdx,0
add r9,rbx
mov r10,rdx
adc r10,0
mov rbx,r15
lea r15,QWORD PTR[r15*2+r12]
; Add a[3]^2, emit limbs 6 and 7.
mul rax
add r13,rax
adc r14,rdx
adc r15,0
mov QWORD PTR[48+rsp],r13
mov QWORD PTR[56+rsp],r14
shr rbx,63
; ---- a[4] * a[5..7] ----
mov r11,QWORD PTR[32+rsi]
mov rax,QWORD PTR[40+rsi]
mul r11
add r8,rax
mov rax,QWORD PTR[48+rsi]
mov rcx,rdx
adc rcx,0
mul r11
add r9,rax
mov rax,QWORD PTR[56+rsi]
adc rdx,0
mov r12,r8
lea r8,QWORD PTR[r8*2+rbx]
add r9,rcx
mov rcx,rdx
adc rcx,0
mul r11
shr r12,63
add r10,rax
mov rax,r11
adc rdx,0
add r10,rcx
mov r11,rdx
adc r11,0
mov rcx,r9
lea r9,QWORD PTR[r9*2+r12]
; Add a[4]^2, emit limbs 8 and 9.
mul rax
add r15,rax
adc r8,rdx
adc r9,0
mov QWORD PTR[64+rsp],r15
mov QWORD PTR[72+rsp],r8
shr rcx,63
; ---- a[5] * a[6..7] ----
mov r12,QWORD PTR[40+rsi]
mov rax,QWORD PTR[48+rsi]
mul r12
add r10,rax
mov rax,QWORD PTR[56+rsi]
mov rbx,rdx
adc rbx,0
mul r12
add r11,rax
mov rax,r12
mov r15,r10
lea r10,QWORD PTR[r10*2+rcx]
adc rdx,0
shr r15,63
add r11,rbx
mov r12,rdx
adc r12,0
mov rbx,r11
lea r11,QWORD PTR[r11*2+r15]
; Add a[5]^2, emit limbs 10 and 11.
mul rax
add r9,rax
adc r10,rdx
adc r11,0
mov QWORD PTR[80+rsp],r9
mov QWORD PTR[88+rsp],r10
; ---- a[6] * a[7] ----
mov r13,QWORD PTR[48+rsi]
mov rax,QWORD PTR[56+rsi]
mul r13
add r12,rax
mov rax,r13
mov r13,rdx
adc r13,0
; Final doubling: shift the top bit of rbx into r12:r13:r14.
xor r14,r14
shl rbx,1
adc r12,r12
adc r13,r13
adc r14,r14
; Add a[6]^2, emit limbs 12 and 13.
mul rax
add r11,rax
adc r12,rdx
adc r13,0
mov QWORD PTR[96+rsp],r11
mov QWORD PTR[104+rsp],r12
; Add a[7]^2, emit limbs 14 and 15.
mov rax,QWORD PTR[56+rsi]
mul rax
add r13,rax
adc rdx,0
add r14,rdx
mov QWORD PTR[112+rsp],r13
mov QWORD PTR[120+rsp],r14
; Reduce: low half in r8..r15 goes through __rsaz_512_reduce, then the
; high half is added and the modulus conditionally subtracted.
mov r8,QWORD PTR[rsp]
mov r9,QWORD PTR[8+rsp]
mov r10,QWORD PTR[16+rsp]
mov r11,QWORD PTR[24+rsp]
mov r12,QWORD PTR[32+rsp]
mov r13,QWORD PTR[40+rsp]
mov r14,QWORD PTR[48+rsp]
mov r15,QWORD PTR[56+rsp]
call __rsaz_512_reduce
add r8,QWORD PTR[64+rsp]
adc r9,QWORD PTR[72+rsp]
adc r10,QWORD PTR[80+rsp]
adc r11,QWORD PTR[88+rsp]
adc r12,QWORD PTR[96+rsp]
adc r13,QWORD PTR[104+rsp]
adc r14,QWORD PTR[112+rsp]
adc r15,QWORD PTR[120+rsp]
sbb rcx,rcx ; rcx = all-ones if the addition carried out, else 0
call __rsaz_512_subtract
; Set up the next pass: rdx/rax = result limbs 0/1, input = result buffer.
mov rdx,r8
mov rax,r9
mov r8d,DWORD PTR[((128+8))+rsp]
mov rsi,rdi
dec r8d
jnz $L$oop_sqr
jmp $L$sqr_tail
ALIGN 32
$L$oop_sqrx::
mov DWORD PTR[((128+8))+rsp],r8d
; rdi and rbp are used as scratch below; park them in xmm0/xmm1.
DB 102,72,15,110,199 ; movq xmm0,rdi
DB 102,72,15,110,205 ; movq xmm1,rbp
; ---- a[0] * a[1..7] (rdx = a[0], rax = a[1]) ----
mulx r9,r8,rax
mulx r10,rcx,QWORD PTR[16+rsi]
xor rbp,rbp
mulx r11,rax,QWORD PTR[24+rsi]
adcx r9,rcx
mulx r12,rcx,QWORD PTR[32+rsi]
adcx r10,rax
mulx r13,rax,QWORD PTR[40+rsi]
adcx r11,rcx
DB 0c4h,062h,0f3h,0f6h,0b6h,030h,000h,000h,000h
adcx r12,rax
adcx r13,rcx
DB 0c4h,062h,0fbh,0f6h,0beh,038h,000h,000h,000h
adcx r14,rax
adcx r15,rbp
; Double limbs 1..2, add a[0]^2, emit limbs 0 and 1.
mov rcx,r9
shld r9,r8,1
shl r8,1
xor ebp,ebp
mulx rdx,rax,rdx
adcx r8,rdx
mov rdx,QWORD PTR[8+rsi]
adcx r9,rbp
mov QWORD PTR[rsp],rax
mov QWORD PTR[8+rsp],r8
; ---- a[1] * a[2..7] ----
mulx rbx,rax,QWORD PTR[16+rsi]
adox r10,rax
adcx r11,rbx
DB 0c4h,062h,0c3h,0f6h,086h,018h,000h,000h,000h
adox r11,rdi
adcx r12,r8
mulx rbx,rax,QWORD PTR[32+rsi]
adox r12,rax
adcx r13,rbx
mulx r8,rdi,QWORD PTR[40+rsi]
adox r13,rdi
adcx r14,r8
DB 0c4h,0e2h,0fbh,0f6h,09eh,030h,000h,000h,000h
adox r14,rax
adcx r15,rbx
DB 0c4h,062h,0c3h,0f6h,086h,038h,000h,000h,000h
adox r15,rdi
adcx r8,rbp
adox r8,rbp
; Double, add a[1]^2, emit limbs 2 and 3.
mov rbx,r11
shld r11,r10,1
shld r10,rcx,1
xor ebp,ebp
mulx rcx,rax,rdx
mov rdx,QWORD PTR[16+rsi]
adcx r9,rax
adcx r10,rcx
adcx r11,rbp
mov QWORD PTR[16+rsp],r9
DB 04ch,089h,094h,024h,018h,000h,000h,000h ; mov QWORD PTR[24+rsp],r10
; ---- a[2] * a[3..7] ----
DB 0c4h,062h,0c3h,0f6h,08eh,018h,000h,000h,000h
adox r12,rdi
adcx r13,r9
mulx rcx,rax,QWORD PTR[32+rsi]
adox r13,rax
adcx r14,rcx
mulx r9,rdi,QWORD PTR[40+rsi]
adox r14,rdi
adcx r15,r9
DB 0c4h,0e2h,0fbh,0f6h,08eh,030h,000h,000h,000h
adox r15,rax
adcx r8,rcx
DB 0c4h,062h,0c3h,0f6h,08eh,038h,000h,000h,000h
adox r8,rdi
adcx r9,rbp
adox r9,rbp
; Double, add a[2]^2, emit limbs 4 and 5.
mov rcx,r13
shld r13,r12,1
shld r12,rbx,1
xor ebp,ebp
mulx rdx,rax,rdx
adcx r11,rax
adcx r12,rdx
mov rdx,QWORD PTR[24+rsi]
adcx r13,rbp
mov QWORD PTR[32+rsp],r11
DB 04ch,089h,0a4h,024h,028h,000h,000h,000h ; mov QWORD PTR[40+rsp],r12
; ---- a[3] * a[4..7] ----
DB 0c4h,0e2h,0fbh,0f6h,09eh,020h,000h,000h,000h
adox r14,rax
adcx r15,rbx
mulx r10,rdi,QWORD PTR[40+rsi]
adox r15,rdi
adcx r8,r10
mulx rbx,rax,QWORD PTR[48+rsi]
adox r8,rax
adcx r9,rbx
mulx r10,rdi,QWORD PTR[56+rsi]
adox r9,rdi
adcx r10,rbp
adox r10,rbp
; Double, add a[3]^2, emit limbs 6 and 7.
DB 066h
mov rbx,r15
shld r15,r14,1
shld r14,rcx,1
xor ebp,ebp
mulx rdx,rax,rdx
adcx r13,rax
adcx r14,rdx
mov rdx,QWORD PTR[32+rsi]
adcx r15,rbp
mov QWORD PTR[48+rsp],r13
mov QWORD PTR[56+rsp],r14
; ---- a[4] * a[5..7] ----
DB 0c4h,062h,0c3h,0f6h,09eh,028h,000h,000h,000h
adox r8,rdi
adcx r9,r11
mulx rcx,rax,QWORD PTR[48+rsi]
adox r9,rax
adcx r10,rcx
mulx r11,rdi,QWORD PTR[56+rsi]
adox r10,rdi
adcx r11,rbp
adox r11,rbp
; Double, add a[4]^2, emit limbs 8 and 9.
mov rcx,r9
shld r9,r8,1
shld r8,rbx,1
xor ebp,ebp
mulx rdx,rax,rdx
adcx r15,rax
adcx r8,rdx
mov rdx,QWORD PTR[40+rsi]
adcx r9,rbp
mov QWORD PTR[64+rsp],r15
mov QWORD PTR[72+rsp],r8
; ---- a[5] * a[6..7] ----
DB 0c4h,0e2h,0fbh,0f6h,09eh,030h,000h,000h,000h
adox r10,rax
adcx r11,rbx
DB 0c4h,062h,0c3h,0f6h,0a6h,038h,000h,000h,000h
adox r11,rdi
adcx r12,rbp
adox r12,rbp
; Double, add a[5]^2, emit limbs 10 and 11.
mov rbx,r11
shld r11,r10,1
shld r10,rcx,1
xor ebp,ebp
mulx rdx,rax,rdx
adcx r9,rax
adcx r10,rdx
mov rdx,QWORD PTR[48+rsi]
adcx r11,rbp
mov QWORD PTR[80+rsp],r9
mov QWORD PTR[88+rsp],r10
; ---- a[6] * a[7] ----
DB 0c4h,062h,0fbh,0f6h,0aeh,038h,000h,000h,000h
adox r12,rax
adox r13,rbp
; Double, add a[6]^2, emit limbs 12 and 13.
xor r14,r14
shld r14,r13,1
shld r13,r12,1
shld r12,rbx,1
xor ebp,ebp
mulx rdx,rax,rdx
adcx r11,rax
adcx r12,rdx
mov rdx,QWORD PTR[56+rsi]
adcx r13,rbp
DB 04ch,089h,09ch,024h,060h,000h,000h,000h ; mov QWORD PTR[96+rsp],r11
DB 04ch,089h,0a4h,024h,068h,000h,000h,000h ; mov QWORD PTR[104+rsp],r12
; Add a[7]^2, emit limbs 14 and 15.
mulx rdx,rax,rdx
adox r13,rax
adox rdx,rbp
DB 066h
add r14,rdx
mov QWORD PTR[112+rsp],r13
mov QWORD PTR[120+rsp],r14
; Recover the result pointer and modulus pointer saved at loop entry.
DB 102,72,15,126,199 ; movq rdi,xmm0
DB 102,72,15,126,205 ; movq rbp,xmm1
; __rsaz_512_reducex takes the multiplier in rdx.
mov rdx,QWORD PTR[128+rsp]
mov r8,QWORD PTR[rsp]
mov r9,QWORD PTR[8+rsp]
mov r10,QWORD PTR[16+rsp]
mov r11,QWORD PTR[24+rsp]
mov r12,QWORD PTR[32+rsp]
mov r13,QWORD PTR[40+rsp]
mov r14,QWORD PTR[48+rsp]
mov r15,QWORD PTR[56+rsp]
call __rsaz_512_reducex
add r8,QWORD PTR[64+rsp]
adc r9,QWORD PTR[72+rsp]
adc r10,QWORD PTR[80+rsp]
adc r11,QWORD PTR[88+rsp]
adc r12,QWORD PTR[96+rsp]
adc r13,QWORD PTR[104+rsp]
adc r14,QWORD PTR[112+rsp]
adc r15,QWORD PTR[120+rsp]
sbb rcx,rcx ; rcx = all-ones if the addition carried out, else 0
call __rsaz_512_subtract
; Set up the next pass: rdx/rax = result limbs 0/1, input = result buffer.
mov rdx,r8
mov rax,r9
mov r8d,DWORD PTR[((128+8))+rsp]
mov rsi,rdi
dec r8d
jnz $L$oop_sqrx
$L$sqr_tail::
; rax = stack pointer value at function entry (152-byte frame + 6 pushes).
lea rax,QWORD PTR[((128+24+48))+rsp]
mov r15,QWORD PTR[((-48))+rax]
mov r14,QWORD PTR[((-40))+rax]
mov r13,QWORD PTR[((-32))+rax]
mov r12,QWORD PTR[((-24))+rax]
mov rbp,QWORD PTR[((-16))+rax]
mov rbx,QWORD PTR[((-8))+rax]
lea rsp,QWORD PTR[rax]
$L$sqr_epilogue::
mov rdi,QWORD PTR[8+rsp] ;WIN64 epilogue
mov rsi,QWORD PTR[16+rsp]
DB 0F3h,0C3h ;repret
$L$SEH_end_rsaz_512_sqr::
rsaz_512_sqr ENDP
PUBLIC rsaz_512_mul
ALIGN 32
;-----------------------------------------------------------------------
; rsaz_512_mul - 8-limb (512-bit) multiplication with reduction.
;
; ABI:  Microsoft x64 at entry; arguments are re-homed into
;       rdi, rsi, rdx, rcx, r8 by the prologue.
; In:   rcx -> rdi   result buffer, 8 qwords
;       rdx -> rsi   first operand, 8 qwords
;       r8  -> rdx   second operand, 8 qwords
;       r9  -> rcx   modulus pointer
;       [40+rsp] -> r8  per-modulus multiplier for the reduction helpers
; Out:  result buffer written by __rsaz_512_subtract.
; Frame (152 bytes): [0..127] 16-limb product, [128] multiplier.
; Saves/restores: rbx, rbp, r12-r15 (push), rdi, rsi (home slots).
; xmm0 and xmm1 are used to carry the result pointer and modulus pointer
; across the multiplication helper, which overwrites rdi and rbp.
;-----------------------------------------------------------------------
rsaz_512_mul PROC PUBLIC
mov QWORD PTR[8+rsp],rdi ;WIN64 prologue
mov QWORD PTR[16+rsp],rsi
mov rax,rsp
$L$SEH_begin_rsaz_512_mul::
mov rdi,rcx
mov rsi,rdx
mov rdx,r8
mov rcx,r9
mov r8,QWORD PTR[40+rsp]
push rbx
push rbp
push r12
push r13
push r14
push r15
sub rsp,128+24
$L$mul_body::
DB 102,72,15,110,199 ; movq xmm0,rdi  (result pointer)
DB 102,72,15,110,201 ; movq xmm1,rcx  (modulus pointer)
mov QWORD PTR[128+rsp],r8
; Take the mulx path only when both tested capability bits are set.
mov r11d,080100h
and r11d,DWORD PTR[((OPENSSL_ia32cap_P+8))]
cmp r11d,080100h
je $L$mulx
; mul path: helper takes rbx = first limb of the second operand and
; rbp = pointer to the second operand.
mov rbx,QWORD PTR[rdx]
mov rbp,rdx
call __rsaz_512_mul
DB 102,72,15,126,199 ; movq rdi,xmm0
DB 102,72,15,126,205 ; movq rbp,xmm1  (rbp = modulus from here on)
mov r8,QWORD PTR[rsp]
mov r9,QWORD PTR[8+rsp]
mov r10,QWORD PTR[16+rsp]
mov r11,QWORD PTR[24+rsp]
mov r12,QWORD PTR[32+rsp]
mov r13,QWORD PTR[40+rsp]
mov r14,QWORD PTR[48+rsp]
mov r15,QWORD PTR[56+rsp]
call __rsaz_512_reduce
jmp $L$mul_tail
ALIGN 32
$L$mulx::
; mulx path: helper takes rdx = first limb of the second operand and
; rbp = pointer to the second operand. Only mov instructions sit between
; the cmp above and the call, so the helper is entered with CF clear.
mov rbp,rdx
mov rdx,QWORD PTR[rdx]
call __rsaz_512_mulx
DB 102,72,15,126,199 ; movq rdi,xmm0
DB 102,72,15,126,205 ; movq rbp,xmm1  (rbp = modulus from here on)
mov rdx,QWORD PTR[128+rsp]
mov r8,QWORD PTR[rsp]
mov r9,QWORD PTR[8+rsp]
mov r10,QWORD PTR[16+rsp]
mov r11,QWORD PTR[24+rsp]
mov r12,QWORD PTR[32+rsp]
mov r13,QWORD PTR[40+rsp]
mov r14,QWORD PTR[48+rsp]
mov r15,QWORD PTR[56+rsp]
call __rsaz_512_reducex
$L$mul_tail::
; Add the high half of the product to the reduced low half, then
; conditionally subtract the modulus (mask derived from the carry out).
add r8,QWORD PTR[64+rsp]
adc r9,QWORD PTR[72+rsp]
adc r10,QWORD PTR[80+rsp]
adc r11,QWORD PTR[88+rsp]
adc r12,QWORD PTR[96+rsp]
adc r13,QWORD PTR[104+rsp]
adc r14,QWORD PTR[112+rsp]
adc r15,QWORD PTR[120+rsp]
sbb rcx,rcx
call __rsaz_512_subtract
; rax = stack pointer value at function entry (152-byte frame + 6 pushes).
lea rax,QWORD PTR[((128+24+48))+rsp]
mov r15,QWORD PTR[((-48))+rax]
mov r14,QWORD PTR[((-40))+rax]
mov r13,QWORD PTR[((-32))+rax]
mov r12,QWORD PTR[((-24))+rax]
mov rbp,QWORD PTR[((-16))+rax]
mov rbx,QWORD PTR[((-8))+rax]
lea rsp,QWORD PTR[rax]
$L$mul_epilogue::
mov rdi,QWORD PTR[8+rsp] ;WIN64 epilogue
mov rsi,QWORD PTR[16+rsp]
DB 0F3h,0C3h ;repret
$L$SEH_end_rsaz_512_mul::
rsaz_512_mul ENDP
PUBLIC rsaz_512_mul_gather4
ALIGN 32
;-----------------------------------------------------------------------
; rsaz_512_mul_gather4 - multiply an 8-limb operand by a table entry that
; is selected with masks rather than indexed addressing, then reduce.
;
; ABI:  Microsoft x64 at entry; arguments are re-homed into
;       rdi, rsi, rdx, rcx, r8, r9 by the prologue.
; In:   rcx -> rdi   result buffer, 8 qwords
;       rdx -> rsi   first operand, 8 qwords
;       r8  -> rdx   table: 8 rows of 128 bytes (16 qwords per row; row k
;                    supplies limb k). Read with movdqa, so it must be
;                    16-byte aligned.
;       r9  -> rcx   modulus pointer
;       [40+rsp] -> r8   per-modulus multiplier for the reduction helpers
;       [48+rsp] -> r9d  table index (only the low 32 bits are used)
; Out:  result buffer written by __rsaz_512_subtract.
; Frame (328 bytes): [0..127]   16-limb product
;                    [128]      multiplier
;                    [136]      result pointer
;                    [144]      modulus pointer
;                    [160..319] saved xmm6-xmm15
; Saves/restores: rbx, rbp, r12-r15, rdi, rsi, xmm6-xmm15.
;
; Selection: xmm0..xmm7 become compare masks. Mask K has an all-ones
; 64-bit lane j exactly when index == 2*K + j. Every row is loaded in
; full, ANDed with the masks and OR-folded, so the addresses touched do
; not depend on the index.
;-----------------------------------------------------------------------
rsaz_512_mul_gather4 PROC PUBLIC
mov QWORD PTR[8+rsp],rdi ;WIN64 prologue
mov QWORD PTR[16+rsp],rsi
mov rax,rsp
$L$SEH_begin_rsaz_512_mul_gather4::
mov rdi,rcx
mov rsi,rdx
mov rdx,r8
mov rcx,r9
mov r8,QWORD PTR[40+rsp]
mov r9,QWORD PTR[48+rsp]
push rbx
push rbp
push r12
push r13
push r14
push r15
sub rsp,328
; xmm6-xmm15 are callee-saved under the Microsoft x64 ABI.
movaps XMMWORD PTR[160+rsp],xmm6
movaps XMMWORD PTR[176+rsp],xmm7
movaps XMMWORD PTR[192+rsp],xmm8
movaps XMMWORD PTR[208+rsp],xmm9
movaps XMMWORD PTR[224+rsp],xmm10
movaps XMMWORD PTR[240+rsp],xmm11
movaps XMMWORD PTR[256+rsp],xmm12
movaps XMMWORD PTR[272+rsp],xmm13
movaps XMMWORD PTR[288+rsp],xmm14
movaps XMMWORD PTR[304+rsp],xmm15
$L$mul_gather4_body::
; Build the eight masks: broadcast the index, generate the counters
; {0,0,1,1}, {2,2,3,3}, ... {14,14,15,15} by repeatedly adding {2,2,2,2},
; and compare each against the broadcast index.
movd xmm8,r9d
movdqa xmm1,XMMWORD PTR[(($L$inc+16))]
movdqa xmm0,XMMWORD PTR[$L$inc]
pshufd xmm8,xmm8,0
movdqa xmm7,xmm1
movdqa xmm2,xmm1
paddd xmm1,xmm0
pcmpeqd xmm0,xmm8
movdqa xmm3,xmm7
paddd xmm2,xmm1
pcmpeqd xmm1,xmm8
movdqa xmm4,xmm7
paddd xmm3,xmm2
pcmpeqd xmm2,xmm8
movdqa xmm5,xmm7
paddd xmm4,xmm3
pcmpeqd xmm3,xmm8
movdqa xmm6,xmm7
paddd xmm5,xmm4
pcmpeqd xmm4,xmm8
paddd xmm6,xmm5
pcmpeqd xmm5,xmm8
paddd xmm7,xmm6
pcmpeqd xmm6,xmm8
pcmpeqd xmm7,xmm8
; Select limb 0 of the table entry from row 0; rbp -> row 1 afterwards.
movdqa xmm8,XMMWORD PTR[rdx]
movdqa xmm9,XMMWORD PTR[16+rdx]
movdqa xmm10,XMMWORD PTR[32+rdx]
movdqa xmm11,XMMWORD PTR[48+rdx]
pand xmm8,xmm0
movdqa xmm12,XMMWORD PTR[64+rdx]
pand xmm9,xmm1
movdqa xmm13,XMMWORD PTR[80+rdx]
pand xmm10,xmm2
movdqa xmm14,XMMWORD PTR[96+rdx]
pand xmm11,xmm3
movdqa xmm15,XMMWORD PTR[112+rdx]
lea rbp,QWORD PTR[128+rdx]
pand xmm12,xmm4
pand xmm13,xmm5
pand xmm14,xmm6
pand xmm15,xmm7
por xmm8,xmm10
por xmm9,xmm11
por xmm8,xmm12
por xmm9,xmm13
por xmm8,xmm14
por xmm9,xmm15
por xmm8,xmm9
pshufd xmm9,xmm8,04eh ; swap the two qword halves
por xmm8,xmm9 ; low qword of xmm8 = selected limb
; Take the mulx path only when both tested capability bits are set.
mov r11d,080100h
and r11d,DWORD PTR[((OPENSSL_ia32cap_P+8))]
cmp r11d,080100h
je $L$mulx_gather
DB 102,76,15,126,195 ; movq rbx,xmm8  (selected limb 0)
mov QWORD PTR[128+rsp],r8
mov QWORD PTR[((128+8))+rsp],rdi
mov QWORD PTR[((128+16))+rsp],rcx
; First row of the product: operand[0..7] * limb 0.
mov rax,QWORD PTR[rsi]
mov rcx,QWORD PTR[8+rsi]
mul rbx
mov QWORD PTR[rsp],rax
mov rax,rcx
mov r8,rdx
mul rbx
add r8,rax
mov rax,QWORD PTR[16+rsi]
mov r9,rdx
adc r9,0
mul rbx
add r9,rax
mov rax,QWORD PTR[24+rsi]
mov r10,rdx
adc r10,0
mul rbx
add r10,rax
mov rax,QWORD PTR[32+rsi]
mov r11,rdx
adc r11,0
mul rbx
add r11,rax
mov rax,QWORD PTR[40+rsi]
mov r12,rdx
adc r12,0
mul rbx
add r12,rax
mov rax,QWORD PTR[48+rsi]
mov r13,rdx
adc r13,0
mul rbx
add r13,rax
mov rax,QWORD PTR[56+rsi]
mov r14,rdx
adc r14,0
mul rbx
add r14,rax
mov rax,QWORD PTR[rsi]
mov r15,rdx
adc r15,0
; rdi = write cursor for product limbs, ecx = remaining rows (7).
lea rdi,QWORD PTR[8+rsp]
mov ecx,7
jmp $L$oop_mul_gather
ALIGN 32
$L$oop_mul_gather::
; Select the next limb of the table entry from the row at rbp.
movdqa xmm8,XMMWORD PTR[rbp]
movdqa xmm9,XMMWORD PTR[16+rbp]
movdqa xmm10,XMMWORD PTR[32+rbp]
movdqa xmm11,XMMWORD PTR[48+rbp]
pand xmm8,xmm0
movdqa xmm12,XMMWORD PTR[64+rbp]
pand xmm9,xmm1
movdqa xmm13,XMMWORD PTR[80+rbp]
pand xmm10,xmm2
movdqa xmm14,XMMWORD PTR[96+rbp]
pand xmm11,xmm3
movdqa xmm15,XMMWORD PTR[112+rbp]
lea rbp,QWORD PTR[128+rbp]
pand xmm12,xmm4
pand xmm13,xmm5
pand xmm14,xmm6
pand xmm15,xmm7
por xmm8,xmm10
por xmm9,xmm11
por xmm8,xmm12
por xmm9,xmm13
por xmm8,xmm14
por xmm9,xmm15
por xmm8,xmm9
pshufd xmm9,xmm8,04eh
por xmm8,xmm9
DB 102,76,15,126,195 ; movq rbx,xmm8
; Multiply-accumulate this row; the finished low limb goes to [rdi].
mul rbx
add r8,rax
mov rax,QWORD PTR[8+rsi]
mov QWORD PTR[rdi],r8
mov r8,rdx
adc r8,0
mul rbx
add r9,rax
mov rax,QWORD PTR[16+rsi]
adc rdx,0
add r8,r9
mov r9,rdx
adc r9,0
mul rbx
add r10,rax
mov rax,QWORD PTR[24+rsi]
adc rdx,0
add r9,r10
mov r10,rdx
adc r10,0
mul rbx
add r11,rax
mov rax,QWORD PTR[32+rsi]
adc rdx,0
add r10,r11
mov r11,rdx
adc r11,0
mul rbx
add r12,rax
mov rax,QWORD PTR[40+rsi]
adc rdx,0
add r11,r12
mov r12,rdx
adc r12,0
mul rbx
add r13,rax
mov rax,QWORD PTR[48+rsi]
adc rdx,0
add r12,r13
mov r13,rdx
adc r13,0
mul rbx
add r14,rax
mov rax,QWORD PTR[56+rsi]
adc rdx,0
add r13,r14
mov r14,rdx
adc r14,0
mul rbx
add r15,rax
mov rax,QWORD PTR[rsi]
adc rdx,0
add r14,r15
mov r15,rdx
adc r15,0
lea rdi,QWORD PTR[8+rdi]
dec ecx
jnz $L$oop_mul_gather
; Flush the top eight limbs of the product.
mov QWORD PTR[rdi],r8
mov QWORD PTR[8+rdi],r9
mov QWORD PTR[16+rdi],r10
mov QWORD PTR[24+rdi],r11
mov QWORD PTR[32+rdi],r12
mov QWORD PTR[40+rdi],r13
mov QWORD PTR[48+rdi],r14
mov QWORD PTR[56+rdi],r15
; Reload result pointer and modulus pointer, then reduce the low half.
mov rdi,QWORD PTR[((128+8))+rsp]
mov rbp,QWORD PTR[((128+16))+rsp]
mov r8,QWORD PTR[rsp]
mov r9,QWORD PTR[8+rsp]
mov r10,QWORD PTR[16+rsp]
mov r11,QWORD PTR[24+rsp]
mov r12,QWORD PTR[32+rsp]
mov r13,QWORD PTR[40+rsp]
mov r14,QWORD PTR[48+rsp]
mov r15,QWORD PTR[56+rsp]
call __rsaz_512_reduce
jmp $L$mul_gather_tail
ALIGN 32
$L$mulx_gather::
DB 102,76,15,126,194 ; movq rdx,xmm8  (selected limb 0)
mov QWORD PTR[128+rsp],r8
mov QWORD PTR[((128+8))+rsp],rdi
mov QWORD PTR[((128+16))+rsp],rcx
; First row of the product: operand[0..7] * limb 0.
mulx r8,rbx,QWORD PTR[rsi]
mov QWORD PTR[rsp],rbx
xor edi,edi ; rdi = 0 for the carry folds; also clears CF and OF
mulx r9,rax,QWORD PTR[8+rsi]
mulx r10,rbx,QWORD PTR[16+rsi]
adcx r8,rax
mulx r11,rax,QWORD PTR[24+rsi]
adcx r9,rbx
mulx r12,rbx,QWORD PTR[32+rsi]
adcx r10,rax
mulx r13,rax,QWORD PTR[40+rsi]
adcx r11,rbx
mulx r14,rbx,QWORD PTR[48+rsi]
adcx r12,rax
mulx r15,rax,QWORD PTR[56+rsi]
adcx r13,rbx
adcx r14,rax
DB 067h
mov rbx,r8
adcx r15,rdi
; rcx counts -7..-1; finished limbs are stored at [64+rcx*8+rsp].
mov rcx,-7
jmp $L$oop_mulx_gather
ALIGN 32
$L$oop_mulx_gather::
; Select the next limb of the table entry from the row at rbp.
movdqa xmm8,XMMWORD PTR[rbp]
movdqa xmm9,XMMWORD PTR[16+rbp]
movdqa xmm10,XMMWORD PTR[32+rbp]
movdqa xmm11,XMMWORD PTR[48+rbp]
pand xmm8,xmm0
movdqa xmm12,XMMWORD PTR[64+rbp]
pand xmm9,xmm1
movdqa xmm13,XMMWORD PTR[80+rbp]
pand xmm10,xmm2
movdqa xmm14,XMMWORD PTR[96+rbp]
pand xmm11,xmm3
movdqa xmm15,XMMWORD PTR[112+rbp]
lea rbp,QWORD PTR[128+rbp]
pand xmm12,xmm4
pand xmm13,xmm5
pand xmm14,xmm6
pand xmm15,xmm7
por xmm8,xmm10
por xmm9,xmm11
por xmm8,xmm12
por xmm9,xmm13
por xmm8,xmm14
por xmm9,xmm15
por xmm8,xmm9
pshufd xmm9,xmm8,04eh
por xmm8,xmm9
DB 102,76,15,126,194 ; movq rdx,xmm8
; Multiply-accumulate this row using the CF (adcx) and OF (adox) chains.
DB 0c4h,062h,0fbh,0f6h,086h,000h,000h,000h,000h
adcx rbx,rax
adox r8,r9
mulx r9,rax,QWORD PTR[8+rsi]
adcx r8,rax
adox r9,r10
mulx r10,rax,QWORD PTR[16+rsi]
adcx r9,rax
adox r10,r11
DB 0c4h,062h,0fbh,0f6h,09eh,018h,000h,000h,000h
adcx r10,rax
adox r11,r12
mulx r12,rax,QWORD PTR[32+rsi]
adcx r11,rax
adox r12,r13
mulx r13,rax,QWORD PTR[40+rsi]
adcx r12,rax
adox r13,r14
DB 0c4h,062h,0fbh,0f6h,0b6h,030h,000h,000h,000h
adcx r13,rax
DB 067h
adox r14,r15
mulx r15,rax,QWORD PTR[56+rsi]
mov QWORD PTR[64+rcx*8+rsp],rbx
adcx r14,rax
adox r15,rdi
mov rbx,r8
adcx r15,rdi
inc rcx
jnz $L$oop_mulx_gather
; Flush the top eight limbs of the product.
mov QWORD PTR[64+rsp],r8
mov QWORD PTR[((64+8))+rsp],r9
mov QWORD PTR[((64+16))+rsp],r10
mov QWORD PTR[((64+24))+rsp],r11
mov QWORD PTR[((64+32))+rsp],r12
mov QWORD PTR[((64+40))+rsp],r13
mov QWORD PTR[((64+48))+rsp],r14
mov QWORD PTR[((64+56))+rsp],r15
; Reload multiplier, result pointer and modulus pointer, then reduce.
mov rdx,QWORD PTR[128+rsp]
mov rdi,QWORD PTR[((128+8))+rsp]
mov rbp,QWORD PTR[((128+16))+rsp]
mov r8,QWORD PTR[rsp]
mov r9,QWORD PTR[8+rsp]
mov r10,QWORD PTR[16+rsp]
mov r11,QWORD PTR[24+rsp]
mov r12,QWORD PTR[32+rsp]
mov r13,QWORD PTR[40+rsp]
mov r14,QWORD PTR[48+rsp]
mov r15,QWORD PTR[56+rsp]
call __rsaz_512_reducex
$L$mul_gather_tail::
; Add the high half of the product, then conditionally subtract the modulus.
add r8,QWORD PTR[64+rsp]
adc r9,QWORD PTR[72+rsp]
adc r10,QWORD PTR[80+rsp]
adc r11,QWORD PTR[88+rsp]
adc r12,QWORD PTR[96+rsp]
adc r13,QWORD PTR[104+rsp]
adc r14,QWORD PTR[112+rsp]
adc r15,QWORD PTR[120+rsp]
sbb rcx,rcx
call __rsaz_512_subtract
; Restore xmm6-xmm15 from [160..319+rsp], addressed relative to rsp+200.
lea rax,QWORD PTR[((128+24+48))+rsp]
movaps xmm6,XMMWORD PTR[((160-200))+rax]
movaps xmm7,XMMWORD PTR[((176-200))+rax]
movaps xmm8,XMMWORD PTR[((192-200))+rax]
movaps xmm9,XMMWORD PTR[((208-200))+rax]
movaps xmm10,XMMWORD PTR[((224-200))+rax]
movaps xmm11,XMMWORD PTR[((240-200))+rax]
movaps xmm12,XMMWORD PTR[((256-200))+rax]
movaps xmm13,XMMWORD PTR[((272-200))+rax]
movaps xmm14,XMMWORD PTR[((288-200))+rax]
movaps xmm15,XMMWORD PTR[((304-200))+rax]
; rax = stack pointer value at function entry (328-byte frame + 6 pushes).
lea rax,QWORD PTR[176+rax]
mov r15,QWORD PTR[((-48))+rax]
mov r14,QWORD PTR[((-40))+rax]
mov r13,QWORD PTR[((-32))+rax]
mov r12,QWORD PTR[((-24))+rax]
mov rbp,QWORD PTR[((-16))+rax]
mov rbx,QWORD PTR[((-8))+rax]
lea rsp,QWORD PTR[rax]
$L$mul_gather4_epilogue::
mov rdi,QWORD PTR[8+rsp] ;WIN64 epilogue
mov rsi,QWORD PTR[16+rsp]
DB 0F3h,0C3h ;repret
$L$SEH_end_rsaz_512_mul_gather4::
rsaz_512_mul_gather4 ENDP
PUBLIC rsaz_512_mul_scatter4
ALIGN 32
;-----------------------------------------------------------------------
; rsaz_512_mul_scatter4 - multiply the result buffer's current contents by
; a second operand, reduce, write the result back to the buffer, and also
; scatter it into a table column.
;
; ABI:  Microsoft x64 at entry; arguments are re-homed into
;       rdi, rsi, rdx, rcx, r8, r9 by the prologue.
; In:   rcx -> rdi   result buffer, 8 qwords. It is also read as one of
;                    the multiplication operands (rbp = rdi below).
;       rdx -> rsi   other operand, 8 qwords
;       r8  -> rdx   modulus pointer
;       r9  -> rcx   per-modulus multiplier for the reduction helpers
;       [40+rsp] -> r8   table base
;       [48+rsp] -> r9d  table index, zero-extended from 32 bits
; Out:  result buffer (via __rsaz_512_subtract), and limb k of the result
;       stored at table + index*8 + k*128 for k = 0..7.
; Frame (152 bytes): [0..127] 16-limb product, [128] multiplier.
; Saves/restores: rbx, rbp, r12-r15 (push), rdi, rsi (home slots).
; xmm0/xmm1/xmm2 carry the result pointer, modulus pointer and table
; cursor across the helpers.
;-----------------------------------------------------------------------
rsaz_512_mul_scatter4 PROC PUBLIC
mov QWORD PTR[8+rsp],rdi ;WIN64 prologue
mov QWORD PTR[16+rsp],rsi
mov rax,rsp
$L$SEH_begin_rsaz_512_mul_scatter4::
mov rdi,rcx
mov rsi,rdx
mov rdx,r8
mov rcx,r9
mov r8,QWORD PTR[40+rsp]
mov r9,QWORD PTR[48+rsp]
push rbx
push rbp
push r12
push r13
push r14
push r15
mov r9d,r9d ; zero-extend the 32-bit index before it is used in an address
sub rsp,128+24
$L$mul_scatter4_body::
lea r8,QWORD PTR[r9*8+r8] ; r8 = address of the first scatter slot
DB 102,72,15,110,199 ; movq xmm0,rdi  (result pointer)
DB 102,72,15,110,202 ; movq xmm1,rdx  (modulus pointer)
DB 102,73,15,110,208 ; movq xmm2,r8   (scatter cursor)
mov QWORD PTR[128+rsp],rcx
mov rbp,rdi
; Take the mulx path only when both tested capability bits are set.
mov r11d,080100h
and r11d,DWORD PTR[((OPENSSL_ia32cap_P+8))]
cmp r11d,080100h
je $L$mulx_scatter
mov rbx,QWORD PTR[rdi]
call __rsaz_512_mul
DB 102,72,15,126,199 ; movq rdi,xmm0
DB 102,72,15,126,205 ; movq rbp,xmm1  (rbp = modulus from here on)
mov r8,QWORD PTR[rsp]
mov r9,QWORD PTR[8+rsp]
mov r10,QWORD PTR[16+rsp]
mov r11,QWORD PTR[24+rsp]
mov r12,QWORD PTR[32+rsp]
mov r13,QWORD PTR[40+rsp]
mov r14,QWORD PTR[48+rsp]
mov r15,QWORD PTR[56+rsp]
call __rsaz_512_reduce
jmp $L$mul_scatter_tail
ALIGN 32
$L$mulx_scatter::
; Only a mov sits between the cmp above and the call, so the helper is
; entered with CF clear.
mov rdx,QWORD PTR[rdi]
call __rsaz_512_mulx
DB 102,72,15,126,199 ; movq rdi,xmm0
DB 102,72,15,126,205 ; movq rbp,xmm1  (rbp = modulus from here on)
mov rdx,QWORD PTR[128+rsp]
mov r8,QWORD PTR[rsp]
mov r9,QWORD PTR[8+rsp]
mov r10,QWORD PTR[16+rsp]
mov r11,QWORD PTR[24+rsp]
mov r12,QWORD PTR[32+rsp]
mov r13,QWORD PTR[40+rsp]
mov r14,QWORD PTR[48+rsp]
mov r15,QWORD PTR[56+rsp]
call __rsaz_512_reducex
$L$mul_scatter_tail::
; Add the high half of the product, then conditionally subtract the modulus.
add r8,QWORD PTR[64+rsp]
adc r9,QWORD PTR[72+rsp]
adc r10,QWORD PTR[80+rsp]
adc r11,QWORD PTR[88+rsp]
adc r12,QWORD PTR[96+rsp]
adc r13,QWORD PTR[104+rsp]
adc r14,QWORD PTR[112+rsp]
adc r15,QWORD PTR[120+rsp]
DB 102,72,15,126,214 ; movq rsi,xmm2  (scatter cursor; leaves CF untouched)
sbb rcx,rcx
call __rsaz_512_subtract
; Scatter the eight result limbs, one per 128-byte table row.
mov QWORD PTR[rsi],r8
mov QWORD PTR[128+rsi],r9
mov QWORD PTR[256+rsi],r10
mov QWORD PTR[384+rsi],r11
mov QWORD PTR[512+rsi],r12
mov QWORD PTR[640+rsi],r13
mov QWORD PTR[768+rsi],r14
mov QWORD PTR[896+rsi],r15
; rax = stack pointer value at function entry (152-byte frame + 6 pushes).
lea rax,QWORD PTR[((128+24+48))+rsp]
mov r15,QWORD PTR[((-48))+rax]
mov r14,QWORD PTR[((-40))+rax]
mov r13,QWORD PTR[((-32))+rax]
mov r12,QWORD PTR[((-24))+rax]
mov rbp,QWORD PTR[((-16))+rax]
mov rbx,QWORD PTR[((-8))+rax]
lea rsp,QWORD PTR[rax]
$L$mul_scatter4_epilogue::
mov rdi,QWORD PTR[8+rsp] ;WIN64 epilogue
mov rsi,QWORD PTR[16+rsp]
DB 0F3h,0C3h ;repret
$L$SEH_end_rsaz_512_mul_scatter4::
rsaz_512_mul_scatter4 ENDP
PUBLIC rsaz_512_mul_by_one
ALIGN 32
;-----------------------------------------------------------------------
; rsaz_512_mul_by_one - run the 8-step reduction on an 8-limb value
; without a preceding multiplication (the value is treated as the low
; half of a product whose high half is zero).
;
; ABI:  Microsoft x64 at entry; arguments are re-homed into
;       rdi, rsi, rdx, rcx by the prologue.
; In:   rcx -> rdi   result buffer, 8 qwords
;       rdx -> rsi   input, 8 qwords
;       r8  -> rdx   modulus pointer (moved to rbp)
;       r9  -> rcx   per-modulus multiplier (stored at [128+rsp])
; Out:  result buffer = r8..r15 as left by the reduction helper. Unlike
;       the multiply routines in this file, no conditional subtraction of
;       the modulus follows.
; Frame (152 bytes): [0..111] zero-filled scratch, [128] multiplier.
; Saves/restores: rbx, rbp, r12-r15 (push), rdi, rsi (home slots).
;-----------------------------------------------------------------------
rsaz_512_mul_by_one PROC PUBLIC
mov QWORD PTR[8+rsp],rdi ;WIN64 prologue
mov QWORD PTR[16+rsp],rsi
mov rax,rsp
$L$SEH_begin_rsaz_512_mul_by_one::
mov rdi,rcx
mov rsi,rdx
mov rdx,r8
mov rcx,r9
push rbx
push rbp
push r12
push r13
push r14
push r15
sub rsp,128+24
$L$mul_by_one_body::
mov eax,DWORD PTR[((OPENSSL_ia32cap_P+8))]
mov rbp,rdx
mov QWORD PTR[128+rsp],rcx
; Load the input limbs into r8..r15 and clear the scratch area.
mov r8,QWORD PTR[rsi]
pxor xmm0,xmm0
mov r9,QWORD PTR[8+rsi]
mov r10,QWORD PTR[16+rsi]
mov r11,QWORD PTR[24+rsi]
mov r12,QWORD PTR[32+rsi]
mov r13,QWORD PTR[40+rsi]
mov r14,QWORD PTR[48+rsi]
mov r15,QWORD PTR[56+rsi]
movdqa XMMWORD PTR[rsp],xmm0
movdqa XMMWORD PTR[16+rsp],xmm0
movdqa XMMWORD PTR[32+rsp],xmm0
movdqa XMMWORD PTR[48+rsp],xmm0
movdqa XMMWORD PTR[64+rsp],xmm0
movdqa XMMWORD PTR[80+rsp],xmm0
movdqa XMMWORD PTR[96+rsp],xmm0
; Take the mulx reduction only when both tested capability bits are set.
and eax,080100h
cmp eax,080100h
je $L$by_one_callx
call __rsaz_512_reduce
jmp $L$by_one_tail
ALIGN 32
$L$by_one_callx::
mov rdx,QWORD PTR[128+rsp] ; __rsaz_512_reducex takes the multiplier in rdx
call __rsaz_512_reducex
$L$by_one_tail::
mov QWORD PTR[rdi],r8
mov QWORD PTR[8+rdi],r9
mov QWORD PTR[16+rdi],r10
mov QWORD PTR[24+rdi],r11
mov QWORD PTR[32+rdi],r12
mov QWORD PTR[40+rdi],r13
mov QWORD PTR[48+rdi],r14
mov QWORD PTR[56+rdi],r15
; rax = stack pointer value at function entry (152-byte frame + 6 pushes).
lea rax,QWORD PTR[((128+24+48))+rsp]
mov r15,QWORD PTR[((-48))+rax]
mov r14,QWORD PTR[((-40))+rax]
mov r13,QWORD PTR[((-32))+rax]
mov r12,QWORD PTR[((-24))+rax]
mov rbp,QWORD PTR[((-16))+rax]
mov rbx,QWORD PTR[((-8))+rax]
lea rsp,QWORD PTR[rax]
$L$mul_by_one_epilogue::
mov rdi,QWORD PTR[8+rsp] ;WIN64 epilogue
mov rsi,QWORD PTR[16+rsp]
DB 0F3h,0C3h ;repret
$L$SEH_end_rsaz_512_mul_by_one::
rsaz_512_mul_by_one ENDP
ALIGN 32
;-----------------------------------------------------------------------
; __rsaz_512_reduce - eight rounds of word-by-word (Montgomery-style)
; reduction using mul/add/adc. Private helper with a register-based
; calling convention (not a Win64 ABI function).
;
; In:   r8..r15        8-limb value, r8 least significant
;       rbp            modulus pointer, 8 qwords
;       [128+8+rsp]    per-modulus multiplier. The +8 skips this
;                      routine's return address, i.e. the caller stored
;                      it at [128+rsp] in its own frame.
; Out:  r8..r15        value after eight rounds
; Clobbers: rax, rbx, rcx, rdx, rsi, flags.
;
; Each round: rbx = low limb * multiplier; rbx * modulus is added to the
; running value and the value is shifted down one limb.
;-----------------------------------------------------------------------
__rsaz_512_reduce PROC PRIVATE
mov rbx,r8
imul rbx,QWORD PTR[((128+8))+rsp]
mov rax,QWORD PTR[rbp]
mov ecx,8
jmp $L$reduction_loop
ALIGN 32
$L$reduction_loop::
mul rbx
mov rax,QWORD PTR[8+rbp]
; neg sets CF exactly when r8 != 0. The low product word itself is never
; added: presumably rbx is chosen so that r8 + low(rbx*modulus[0]) is 0
; mod 2^64, making this CF the carry out of that addition - confirm.
neg r8
mov r8,rdx
adc r8,0
mul rbx
add r9,rax
mov rax,QWORD PTR[16+rbp]
adc rdx,0
add r8,r9
mov r9,rdx
adc r9,0
mul rbx
add r10,rax
mov rax,QWORD PTR[24+rbp]
adc rdx,0
add r9,r10
mov r10,rdx
adc r10,0
mul rbx
add r11,rax
mov rax,QWORD PTR[32+rbp]
adc rdx,0
add r10,r11
; Start computing the next round's rbx early: rsi = multiplier * new r8.
; mov does not touch the carry consumed by the adc that follows.
mov rsi,QWORD PTR[((128+8))+rsp]
adc rdx,0
mov r11,rdx
mul rbx
add r12,rax
mov rax,QWORD PTR[40+rbp]
adc rdx,0
imul rsi,r8
add r11,r12
mov r12,rdx
adc r12,0
mul rbx
add r13,rax
mov rax,QWORD PTR[48+rbp]
adc rdx,0
add r12,r13
mov r13,rdx
adc r13,0
mul rbx
add r14,rax
mov rax,QWORD PTR[56+rbp]
adc rdx,0
add r13,r14
mov r14,rdx
adc r14,0
mul rbx
mov rbx,rsi ; rbx for the next round
add r15,rax
mov rax,QWORD PTR[rbp]
adc rdx,0
add r14,r15
mov r15,rdx
adc r15,0
dec ecx
jne $L$reduction_loop
DB 0F3h,0C3h ;repret
__rsaz_512_reduce ENDP
ALIGN 32
;-----------------------------------------------------------------------
; __rsaz_512_reducex - mulx/adcx/adox variant of the eight-round
; word-by-word reduction. Private helper with a register-based calling
; convention (not a Win64 ABI function).
;
; In:   r8..r15        8-limb value, r8 least significant
;       rbp            modulus pointer, 8 qwords
;       rdx            per-modulus multiplier
;       [128+8+rsp]    the same multiplier, re-read every round. The +8
;                      skips this routine's return address, i.e. the
;                      caller stored it at [128+rsp] in its own frame.
; Out:  r8..r15        value after eight rounds
; Clobbers: rax, rbx, rcx, rdx, rsi, flags.
;
; Two independent carry chains run in parallel: adcx uses CF, adox uses
; OF. rsi is held at zero and used to fold both chains into r15.
; Lines of the form "DB 0c4h,..." are VEX-encoded instructions emitted as
; raw bytes (presumably mulx forms with a 32-bit displacement - confirm
; with a disassembler).
;-----------------------------------------------------------------------
__rsaz_512_reducex PROC PRIVATE
imul rdx,r8 ; rdx = low limb * multiplier = this round's factor
xor rsi,rsi ; rsi = 0; also clears CF and OF
mov ecx,8
jmp $L$reduction_loopx
ALIGN 32
$L$reduction_loopx::
mov rbx,r8
mulx r8,rax,QWORD PTR[rbp]
adcx rax,rbx ; only the carry out of this addition is kept
adox r8,r9
mulx r9,rax,QWORD PTR[8+rbp]
adcx r8,rax
adox r9,r10
mulx r10,rbx,QWORD PTR[16+rbp]
adcx r9,rbx
adox r10,r11
mulx r11,rbx,QWORD PTR[24+rbp]
adcx r10,rbx
adox r11,r12
DB 0c4h,062h,0e3h,0f6h,0a5h,020h,000h,000h,000h
; Compute the next round's factor (multiplier * new r8) into rbx while
; temporarily parking the current factor in rax.
mov rax,rdx
mov rdx,r8
adcx r11,rbx
adox r12,r13
mulx rdx,rbx,QWORD PTR[((128+8))+rsp]
mov rdx,rax
mulx r13,rax,QWORD PTR[40+rbp]
adcx r12,rax
adox r13,r14
DB 0c4h,062h,0fbh,0f6h,0b5h,030h,000h,000h,000h
adcx r13,rax
adox r14,r15
mulx r15,rax,QWORD PTR[56+rbp]
mov rdx,rbx ; factor for the next round
adcx r14,rax
adox r15,rsi
adcx r15,rsi
dec ecx
jne $L$reduction_loopx
DB 0F3h,0C3h ;repret
__rsaz_512_reducex ENDP
ALIGN 32
;-----------------------------------------------------------------------
; __rsaz_512_subtract - store an 8-limb value and conditionally subtract
; the modulus from it, without branching on the condition.
; Private helper with a register-based calling convention.
;
; In:   r8..r15  8-limb value, r8 least significant
;       rdi      output buffer, 8 qwords
;       rbp      modulus pointer, 8 qwords
;       rcx      mask: all-ones to subtract the modulus, 0 to leave the
;                value unchanged
; Out:  [rdi]    value - (modulus AND mask), truncated to 512 bits
;       r8..r15  the same 8 limbs that were written to [rdi]
; Flags on return are those of the final adc.
;
; The subtraction is done as an addition of the masked two's complement:
; limb 0 is negated (NEG), limbs 1..7 are complemented (NOT). This only
; equals the true two's complement when limb 0 of the modulus is
; non-zero, so no carry has to ripple out of the "+1".
;-----------------------------------------------------------------------
__rsaz_512_subtract PROC PRIVATE
        ; Park the incoming value in the output buffer.
        mov     QWORD PTR[rdi],r8
        mov     QWORD PTR[rdi+8],r9
        mov     QWORD PTR[rdi+16],r10
        mov     QWORD PTR[rdi+24],r11
        mov     QWORD PTR[rdi+32],r12
        mov     QWORD PTR[rdi+40],r13
        mov     QWORD PTR[rdi+48],r14
        mov     QWORD PTR[rdi+56],r15

        ; Limb 0: masked negation.
        mov     r8,QWORD PTR[rbp]
        neg     r8
        and     r8,rcx

        ; Limbs 1..7: masked complement.
        mov     r9,QWORD PTR[rbp+8]
        not     r9
        and     r9,rcx

        mov     r10,QWORD PTR[rbp+16]
        not     r10
        and     r10,rcx

        mov     r11,QWORD PTR[rbp+24]
        not     r11
        and     r11,rcx

        mov     r12,QWORD PTR[rbp+32]
        not     r12
        and     r12,rcx

        mov     r13,QWORD PTR[rbp+40]
        not     r13
        and     r13,rcx

        mov     r14,QWORD PTR[rbp+48]
        not     r14
        and     r14,rcx

        mov     r15,QWORD PTR[rbp+56]
        not     r15
        and     r15,rcx

        ; value + masked complement, carry rippling upward.
        add     r8,QWORD PTR[rdi]
        adc     r9,QWORD PTR[rdi+8]
        adc     r10,QWORD PTR[rdi+16]
        adc     r11,QWORD PTR[rdi+24]
        adc     r12,QWORD PTR[rdi+32]
        adc     r13,QWORD PTR[rdi+40]
        adc     r14,QWORD PTR[rdi+48]
        adc     r15,QWORD PTR[rdi+56]

        ; Publish the final limbs.
        mov     QWORD PTR[rdi],r8
        mov     QWORD PTR[rdi+8],r9
        mov     QWORD PTR[rdi+16],r10
        mov     QWORD PTR[rdi+24],r11
        mov     QWORD PTR[rdi+32],r12
        mov     QWORD PTR[rdi+40],r13
        mov     QWORD PTR[rdi+48],r14
        mov     QWORD PTR[rdi+56],r15
DB 0F3h,0C3h ;repret
__rsaz_512_subtract ENDP
ALIGN 32
;-----------------------------------------------------------------------
; __rsaz_512_mul - 8x8-limb schoolbook multiplication using mul/add/adc.
; Private helper with a register-based calling convention.
;
; In:   rsi      first operand a[0..7]
;       rbp      second operand b[0..7]
;       rbx      b[0], preloaded by the caller
; Out:  16-limb product written starting at [8+rsp] as seen from here,
;       which is [rsp] in the caller's frame (the +8 skips the return
;       address). The caller must have 128 bytes reserved there.
; Clobbers: rax, rbx, rcx, rdx, rdi, rbp, r8-r15, flags.
;-----------------------------------------------------------------------
__rsaz_512_mul PROC PRIVATE
lea rdi,QWORD PTR[8+rsp]
; First row: a[0..7] * b[0]; the low limb is stored, the rest stays in
; r8..r15.
mov rax,QWORD PTR[rsi]
mul rbx
mov QWORD PTR[rdi],rax
mov rax,QWORD PTR[8+rsi]
mov r8,rdx
mul rbx
add r8,rax
mov rax,QWORD PTR[16+rsi]
mov r9,rdx
adc r9,0
mul rbx
add r9,rax
mov rax,QWORD PTR[24+rsi]
mov r10,rdx
adc r10,0
mul rbx
add r10,rax
mov rax,QWORD PTR[32+rsi]
mov r11,rdx
adc r11,0
mul rbx
add r11,rax
mov rax,QWORD PTR[40+rsi]
mov r12,rdx
adc r12,0
mul rbx
add r12,rax
mov rax,QWORD PTR[48+rsi]
mov r13,rdx
adc r13,0
mul rbx
add r13,rax
mov rax,QWORD PTR[56+rsi]
mov r14,rdx
adc r14,0
mul rbx
add r14,rax
mov rax,QWORD PTR[rsi]
mov r15,rdx
adc r15,0
; Advance to b[1] and to the next output limb; seven rows remain.
lea rbp,QWORD PTR[8+rbp]
lea rdi,QWORD PTR[8+rdi]
mov ecx,7
jmp $L$oop_mul
ALIGN 32
$L$oop_mul::
; Row i: accumulate a[0..7] * b[i]; the finished low limb goes to [rdi].
mov rbx,QWORD PTR[rbp]
mul rbx
add r8,rax
mov rax,QWORD PTR[8+rsi]
mov QWORD PTR[rdi],r8
mov r8,rdx
adc r8,0
mul rbx
add r9,rax
mov rax,QWORD PTR[16+rsi]
adc rdx,0
add r8,r9
mov r9,rdx
adc r9,0
mul rbx
add r10,rax
mov rax,QWORD PTR[24+rsi]
adc rdx,0
add r9,r10
mov r10,rdx
adc r10,0
mul rbx
add r11,rax
mov rax,QWORD PTR[32+rsi]
adc rdx,0
add r10,r11
mov r11,rdx
adc r11,0
mul rbx
add r12,rax
mov rax,QWORD PTR[40+rsi]
adc rdx,0
add r11,r12
mov r12,rdx
adc r12,0
mul rbx
add r13,rax
mov rax,QWORD PTR[48+rsi]
adc rdx,0
add r12,r13
mov r13,rdx
adc r13,0
mul rbx
add r14,rax
mov rax,QWORD PTR[56+rsi]
adc rdx,0
add r13,r14
mov r14,rdx
lea rbp,QWORD PTR[8+rbp] ; lea leaves CF intact for the adc below
adc r14,0
mul rbx
add r15,rax
mov rax,QWORD PTR[rsi]
adc rdx,0
add r14,r15
mov r15,rdx
adc r15,0
lea rdi,QWORD PTR[8+rdi]
dec ecx
jnz $L$oop_mul
; Flush the top eight limbs of the product.
mov QWORD PTR[rdi],r8
mov QWORD PTR[8+rdi],r9
mov QWORD PTR[16+rdi],r10
mov QWORD PTR[24+rdi],r11
mov QWORD PTR[32+rdi],r12
mov QWORD PTR[40+rdi],r13
mov QWORD PTR[48+rdi],r14
mov QWORD PTR[56+rdi],r15
DB 0F3h,0C3h ;repret
__rsaz_512_mul ENDP
ALIGN 32
;-----------------------------------------------------------------------
; __rsaz_512_mulx - 8x8-limb schoolbook multiplication using
; mulx/adcx/adox. Private helper with a register-based calling convention.
;
; In:   rsi      first operand a[0..7]
;       rbp      second operand b[0..7]
;       rdx      b[0], preloaded by the caller
; Out:  16-limb product written starting at [8+rsp] as seen from here,
;       which is [rsp] in the caller's frame (the +8 skips the return
;       address). The caller must have 128 bytes reserved there.
; Clobbers: rax, rbx, rcx, rdx, rdi, r8-r15, flags.
;
; The carry chain of the first row starts with ADD rather than ADC, so
; the routine does not depend on the carry flag left by the caller
; (mulx and mov do not modify flags, so nothing before that point would
; otherwise establish CF).
; Lines of the form "DB ...0c4h,..." are VEX-encoded instructions emitted
; as raw bytes (presumably mulx forms with a 32-bit displacement -
; confirm with a disassembler).
;-----------------------------------------------------------------------
__rsaz_512_mulx PROC PRIVATE
; First row: a[0..7] * b[0]; the low limb is stored, the rest stays in
; r8..r15.
mulx r8,rbx,QWORD PTR[rsi]
mov rcx,-6 ; loop counter for rows 1..6, counts up to 0
mulx r9,rax,QWORD PTR[8+rsi]
mov QWORD PTR[8+rsp],rbx
mulx r10,rbx,QWORD PTR[16+rsi]
add r8,rax ; start of the carry chain: ignore incoming CF
mulx r11,rax,QWORD PTR[24+rsi]
adc r9,rbx
mulx r12,rbx,QWORD PTR[32+rsi]
adc r10,rax
mulx r13,rax,QWORD PTR[40+rsi]
adc r11,rbx
mulx r14,rbx,QWORD PTR[48+rsi]
adc r12,rax
mulx r15,rax,QWORD PTR[56+rsi]
mov rdx,QWORD PTR[8+rbp] ; rdx = b[1]
adc r13,rbx
adc r14,rax
adc r15,0
xor rdi,rdi ; rdi = 0 for the carry folds; also clears CF and OF
jmp $L$oop_mulx
ALIGN 32
$L$oop_mulx::
; Rows 1..6: CF chain (adcx) adds the low product halves, OF chain (adox)
; shifts the accumulator down one limb.
mov rbx,r8
mulx r8,rax,QWORD PTR[rsi]
adcx rbx,rax
adox r8,r9
mulx r9,rax,QWORD PTR[8+rsi]
adcx r8,rax
adox r9,r10
mulx r10,rax,QWORD PTR[16+rsi]
adcx r9,rax
adox r10,r11
mulx r11,rax,QWORD PTR[24+rsi]
adcx r10,rax
adox r11,r12
DB 03eh,0c4h,062h,0fbh,0f6h,0a6h,020h,000h,000h,000h
adcx r11,rax
adox r12,r13
mulx r13,rax,QWORD PTR[40+rsi]
adcx r12,rax
adox r13,r14
mulx r14,rax,QWORD PTR[48+rsi]
adcx r13,rax
adox r14,r15
mulx r15,rax,QWORD PTR[56+rsi]
mov rdx,QWORD PTR[64+rcx*8+rbp] ; next b limb
mov QWORD PTR[((8+64-8))+rcx*8+rsp],rbx ; finished product limb
adcx r14,rax
adox r15,rdi
adcx r15,rdi
inc rcx
jnz $L$oop_mulx
; Row 7 (rdx = b[7]), unrolled because no further b limb is loaded.
mov rbx,r8
mulx r8,rax,QWORD PTR[rsi]
adcx rbx,rax
adox r8,r9
DB 0c4h,062h,0fbh,0f6h,08eh,008h,000h,000h,000h
adcx r8,rax
adox r9,r10
DB 0c4h,062h,0fbh,0f6h,096h,010h,000h,000h,000h
adcx r9,rax
adox r10,r11
mulx r11,rax,QWORD PTR[24+rsi]
adcx r10,rax
adox r11,r12
mulx r12,rax,QWORD PTR[32+rsi]
adcx r11,rax
adox r12,r13
mulx r13,rax,QWORD PTR[40+rsi]
adcx r12,rax
adox r13,r14
DB 0c4h,062h,0fbh,0f6h,0b6h,030h,000h,000h,000h
adcx r13,rax
adox r14,r15
DB 0c4h,062h,0fbh,0f6h,0beh,038h,000h,000h,000h
adcx r14,rax
adox r15,rdi
adcx r15,rdi
; Flush product limbs 7..15.
mov QWORD PTR[((8+64-8))+rsp],rbx
mov QWORD PTR[((8+64))+rsp],r8
mov QWORD PTR[((8+64+8))+rsp],r9
mov QWORD PTR[((8+64+16))+rsp],r10
mov QWORD PTR[((8+64+24))+rsp],r11
mov QWORD PTR[((8+64+32))+rsp],r12
mov QWORD PTR[((8+64+40))+rsp],r13
mov QWORD PTR[((8+64+48))+rsp],r14
mov QWORD PTR[((8+64+56))+rsp],r15
DB 0F3h,0C3h ;repret
__rsaz_512_mulx ENDP
PUBLIC rsaz_512_scatter4
ALIGN 16
;-----------------------------------------------------------------------
; rsaz_512_scatter4 - copy 8 qwords into one column of a table whose rows
; are 128 bytes apart.
;
; ABI:  Microsoft x64, leaf function (no stack use, no unwind data).
; In:   rcx   table base
;       rdx   source, 8 qwords
;       r8d   column index. Only the low 32 bits are used: the register
;             is zero-extended here because the ABI leaves the upper half
;             of a narrow integer argument undefined. This matches
;             rsaz_512_gather4, which reads r8d, and rsaz_512_mul_scatter4,
;             which zero-extends its index.
; Out:  table[index*8 + k*128] = source[k] for k = 0..7
; Clobbers: rax, rcx, rdx, r8, r9, flags.
;-----------------------------------------------------------------------
rsaz_512_scatter4 PROC PUBLIC
        mov     r8d,r8d                         ; discard bits 63..32 of the index
        lea     rcx,QWORD PTR[r8*8+rcx]         ; rcx = first destination slot
        mov     r9d,8                           ; limbs left to copy
        jmp     $L$oop_scatter
ALIGN 16
$L$oop_scatter::
        mov     rax,QWORD PTR[rdx]
        lea     rdx,QWORD PTR[8+rdx]            ; next source limb
        mov     QWORD PTR[rcx],rax
        lea     rcx,QWORD PTR[128+rcx]          ; next table row
        dec     r9d
        jnz     $L$oop_scatter
DB 0F3h,0C3h ;repret
rsaz_512_scatter4 ENDP
PUBLIC rsaz_512_gather4
ALIGN 16
;-----------------------------------------------------------------------
; rsaz_512_gather4 - read one column (8 qwords) out of a table whose rows
; are 128 bytes (16 qwords) wide, using compare masks instead of an
; index-dependent address.
;
; ABI:  Microsoft x64.
; In:   rcx   destination, 8 qwords
;       rdx   table base. Read with movdqa, so it must be 16-byte aligned.
;       r8d   column index (only the low 32 bits are read)
; Out:  destination[k] = table row k, column index, for k = 0..7
; Frame: 0a8h (168) bytes holding xmm6-xmm15, which are callee-saved.
; Clobbers: rcx, rdx, r9, xmm0-xmm5, flags.
;
; The prologue is emitted as raw bytes. The unwind codes for this function
; in .xdata record byte offsets into it (prologue size 046h), so the
; encodings must not change length.
;
; Every row is loaded in full and combined with the masks, so the
; addresses touched do not depend on the index.
;-----------------------------------------------------------------------
rsaz_512_gather4 PROC PUBLIC
$L$SEH_begin_rsaz_512_gather4::
DB 048h,081h,0ech,0a8h,000h,000h,000h ; sub rsp,0a8h
DB 00fh,029h,034h,024h ; movaps [rsp],xmm6
DB 00fh,029h,07ch,024h,010h ; movaps [16+rsp],xmm7
DB 044h,00fh,029h,044h,024h,020h ; movaps [32+rsp],xmm8
DB 044h,00fh,029h,04ch,024h,030h ; movaps [48+rsp],xmm9
DB 044h,00fh,029h,054h,024h,040h ; movaps [64+rsp],xmm10
DB 044h,00fh,029h,05ch,024h,050h ; movaps [80+rsp],xmm11
DB 044h,00fh,029h,064h,024h,060h ; movaps [96+rsp],xmm12
DB 044h,00fh,029h,06ch,024h,070h ; movaps [112+rsp],xmm13
DB 044h,00fh,029h,0b4h,024h,080h,0,0,0 ; movaps [128+rsp],xmm14
DB 044h,00fh,029h,0bch,024h,090h,0,0,0 ; movaps [144+rsp],xmm15
; Build the eight masks: broadcast the index, generate the counters
; {0,0,1,1}, {2,2,3,3}, ... {14,14,15,15} by repeatedly adding {2,2,2,2},
; and compare each against the broadcast index. Mask K ends up with an
; all-ones 64-bit lane j exactly when index == 2*K + j.
movd xmm8,r8d
movdqa xmm1,XMMWORD PTR[(($L$inc+16))]
movdqa xmm0,XMMWORD PTR[$L$inc]
pshufd xmm8,xmm8,0
movdqa xmm7,xmm1
movdqa xmm2,xmm1
paddd xmm1,xmm0
pcmpeqd xmm0,xmm8
movdqa xmm3,xmm7
paddd xmm2,xmm1
pcmpeqd xmm1,xmm8
movdqa xmm4,xmm7
paddd xmm3,xmm2
pcmpeqd xmm2,xmm8
movdqa xmm5,xmm7
paddd xmm4,xmm3
pcmpeqd xmm3,xmm8
movdqa xmm6,xmm7
paddd xmm5,xmm4
pcmpeqd xmm4,xmm8
paddd xmm6,xmm5
pcmpeqd xmm5,xmm8
paddd xmm7,xmm6
pcmpeqd xmm6,xmm8
pcmpeqd xmm7,xmm8
mov r9d,8 ; rows left
jmp $L$oop_gather
ALIGN 16
$L$oop_gather::
; Load the whole 128-byte row, mask it, and OR everything together.
movdqa xmm8,XMMWORD PTR[rdx]
movdqa xmm9,XMMWORD PTR[16+rdx]
movdqa xmm10,XMMWORD PTR[32+rdx]
movdqa xmm11,XMMWORD PTR[48+rdx]
pand xmm8,xmm0
movdqa xmm12,XMMWORD PTR[64+rdx]
pand xmm9,xmm1
movdqa xmm13,XMMWORD PTR[80+rdx]
pand xmm10,xmm2
movdqa xmm14,XMMWORD PTR[96+rdx]
pand xmm11,xmm3
movdqa xmm15,XMMWORD PTR[112+rdx]
lea rdx,QWORD PTR[128+rdx]
pand xmm12,xmm4
pand xmm13,xmm5
pand xmm14,xmm6
pand xmm15,xmm7
por xmm8,xmm10
por xmm9,xmm11
por xmm8,xmm12
por xmm9,xmm13
por xmm8,xmm14
por xmm9,xmm15
por xmm8,xmm9
pshufd xmm9,xmm8,04eh ; swap the two qword halves
por xmm8,xmm9 ; low qword of xmm8 = selected qword
movq QWORD PTR[rcx],xmm8
lea rcx,QWORD PTR[8+rcx]
dec r9d
jnz $L$oop_gather
; Restore the callee-saved vector registers and release the frame.
movaps xmm6,XMMWORD PTR[rsp]
movaps xmm7,XMMWORD PTR[16+rsp]
movaps xmm8,XMMWORD PTR[32+rsp]
movaps xmm9,XMMWORD PTR[48+rsp]
movaps xmm10,XMMWORD PTR[64+rsp]
movaps xmm11,XMMWORD PTR[80+rsp]
movaps xmm12,XMMWORD PTR[96+rsp]
movaps xmm13,XMMWORD PTR[112+rsp]
movaps xmm14,XMMWORD PTR[128+rsp]
movaps xmm15,XMMWORD PTR[144+rsp]
add rsp,0a8h
DB 0F3h,0C3h ;repret
$L$SEH_end_rsaz_512_gather4::
rsaz_512_gather4 ENDP
ALIGN 64
; Seed constants for the gather masks, loaded with movdqa (hence the
; alignment): the first vector is the starting counter {0,0,1,1}, the
; second is the per-step increment {2,2,2,2}.
$L$inc::
DD 0,0,1,1
DD 2,2,2,2
EXTERN __imp_RtlVirtualUnwind:NEAR
ALIGN 16
;-----------------------------------------------------------------------
; se_handler - language-specific exception handler shared by the five
; routines whose .xdata entries name it. It reconstructs the caller's
; non-volatile registers in the context record, lets RtlVirtualUnwind
; continue the unwind, and returns 1.
;
; In:   r8   context record pointer
;       r9   dispatcher context pointer
;       (rcx and rdx are not read before being overwritten.)
; The structure offsets used below are presumably those of the Win64
; CONTEXT and DISPATCHER_CONTEXT layouts (e.g. 120 = Rax, 152 = Rsp,
; 248 = Rip, 512 = Xmm6; [8+r9] = image base, [56+r9] = handler data) -
; verify against winnt.h.
;
; Handler data per function (see .xdata): two image-relative addresses,
; the end of the prologue ("body" label) and the start of the epilogue.
;   fault before body      -> nothing saved yet; use the value at [120+r8]
;                             (the prologue copies rsp into rax first)
;   fault at/after epilogue-> frame already torn down; use [152+r8]
;   otherwise              -> frame fully set up; recover the pushed
;                             registers (and for rsaz_512_mul_gather4 the
;                             saved xmm6-xmm15) from the stack
;-----------------------------------------------------------------------
se_handler PROC PRIVATE
push rsi
push rdi
push rbx
push rbp
push r12
push r13
push r14
push r15
pushfq
sub rsp,64
mov rax,QWORD PTR[120+r8]
mov rbx,QWORD PTR[248+r8]
mov rsi,QWORD PTR[8+r9]
mov r11,QWORD PTR[56+r9]
; r10 = absolute address of the body label; faulting address below it?
mov r10d,DWORD PTR[r11]
lea r10,QWORD PTR[r10*1+rsi]
cmp rbx,r10
jb $L$common_seh_tail
mov rax,QWORD PTR[152+r8]
; r10 = absolute address of the epilogue label; faulting address at or
; past it?
mov r10d,DWORD PTR[4+r11]
lea r10,QWORD PTR[r10*1+rsi]
cmp rbx,r10
jae $L$common_seh_tail
; Inside the body: step over the 152-byte frame and the six pushes.
lea rax,QWORD PTR[((128+24+48))+rax]
; rsaz_512_mul_gather4 is recognised by its epilogue address; its frame is
; 176 bytes larger and also holds xmm6-xmm15.
lea rbx,QWORD PTR[$L$mul_gather4_epilogue]
cmp rbx,r10
jne $L$se_not_in_mul_gather4
lea rax,QWORD PTR[176+rax]
; Copy the 10 saved vector registers (20 qwords) into the context record.
lea rsi,QWORD PTR[((-48-168))+rax]
lea rdi,QWORD PTR[512+r8]
mov ecx,20
DD 0a548f3fch ; cld; rep movsq
$L$se_not_in_mul_gather4::
; Recover the pushed registers and write them into the context record.
mov rbx,QWORD PTR[((-8))+rax]
mov rbp,QWORD PTR[((-16))+rax]
mov r12,QWORD PTR[((-24))+rax]
mov r13,QWORD PTR[((-32))+rax]
mov r14,QWORD PTR[((-40))+rax]
mov r15,QWORD PTR[((-48))+rax]
mov QWORD PTR[144+r8],rbx
mov QWORD PTR[160+r8],rbp
mov QWORD PTR[216+r8],r12
mov QWORD PTR[224+r8],r13
mov QWORD PTR[232+r8],r14
mov QWORD PTR[240+r8],r15
$L$common_seh_tail::
; rax = stack pointer at function entry; rdi/rsi were parked in the home
; slots at [8+rax] and [16+rax] by every prologue.
mov rdi,QWORD PTR[8+rax]
mov rsi,QWORD PTR[16+rax]
mov QWORD PTR[152+r8],rax
mov QWORD PTR[168+r8],rsi
mov QWORD PTR[176+r8],rdi
; Copy the updated context (154 qwords) to the buffer at [40+r9].
mov rdi,QWORD PTR[40+r9]
mov rsi,r8
mov ecx,154
DD 0a548f3fch ; cld; rep movsq
; Call RtlVirtualUnwind: four register arguments from the dispatcher
; context, four stack arguments at [32..56+rsp].
mov rsi,r9
xor rcx,rcx
mov rdx,QWORD PTR[8+rsi]
mov r8,QWORD PTR[rsi]
mov r9,QWORD PTR[16+rsi]
mov r10,QWORD PTR[40+rsi]
lea r11,QWORD PTR[56+rsi]
lea r12,QWORD PTR[24+rsi]
mov QWORD PTR[32+rsp],r10
mov QWORD PTR[40+rsp],r11
mov QWORD PTR[48+rsp],r12
mov QWORD PTR[56+rsp],rcx
call QWORD PTR[__imp_RtlVirtualUnwind]
mov eax,1 ; presumably ExceptionContinueSearch - confirm
add rsp,64
popfq
pop r15
pop r14
pop r13
pop r12
pop rbp
pop rbx
pop rdi
pop rsi
DB 0F3h,0C3h ;repret
se_handler ENDP
.text$ ENDS
; Function table: one entry of three image-relative addresses per
; function (begin label, end label, unwind-info label in .xdata).
; rsaz_512_scatter4 has no entry here.
.pdata SEGMENT READONLY ALIGN(4)
ALIGN 4
DD imagerel $L$SEH_begin_rsaz_512_sqr
DD imagerel $L$SEH_end_rsaz_512_sqr
DD imagerel $L$SEH_info_rsaz_512_sqr
DD imagerel $L$SEH_begin_rsaz_512_mul
DD imagerel $L$SEH_end_rsaz_512_mul
DD imagerel $L$SEH_info_rsaz_512_mul
DD imagerel $L$SEH_begin_rsaz_512_mul_gather4
DD imagerel $L$SEH_end_rsaz_512_mul_gather4
DD imagerel $L$SEH_info_rsaz_512_mul_gather4
DD imagerel $L$SEH_begin_rsaz_512_mul_scatter4
DD imagerel $L$SEH_end_rsaz_512_mul_scatter4
DD imagerel $L$SEH_info_rsaz_512_mul_scatter4
DD imagerel $L$SEH_begin_rsaz_512_mul_by_one
DD imagerel $L$SEH_end_rsaz_512_mul_by_one
DD imagerel $L$SEH_info_rsaz_512_mul_by_one
DD imagerel $L$SEH_begin_rsaz_512_gather4
DD imagerel $L$SEH_end_rsaz_512_gather4
DD imagerel $L$SEH_info_rsaz_512_gather4
.pdata ENDS
; Unwind information referenced from .pdata.
;
; The first five entries share one shape: a 4-byte header "9,0,0,0"
; (presumably version 1 with the exception-handler flag, no prologue
; bytes and no unwind codes - confirm against the UNWIND_INFO layout),
; then the handler address, then the handler data read by se_handler:
; the "body" label and the "epilogue" label of the function.
;
; rsaz_512_gather4 uses plain unwind codes and no handler. Its header
; gives a prologue size of 046h bytes and 016h code slots. Each following
; line starts with a byte offset into the raw-byte prologue; the lines
; appear to describe the ten xmm saves (xmm15 down to xmm6) and, last,
; the 0a8h-byte stack allocation (015h * 8) - confirm against the
; UNWIND_CODE encoding.
.xdata SEGMENT READONLY ALIGN(8)
ALIGN 8
$L$SEH_info_rsaz_512_sqr::
DB 9,0,0,0
DD imagerel se_handler
DD imagerel $L$sqr_body,imagerel $L$sqr_epilogue
$L$SEH_info_rsaz_512_mul::
DB 9,0,0,0
DD imagerel se_handler
DD imagerel $L$mul_body,imagerel $L$mul_epilogue
$L$SEH_info_rsaz_512_mul_gather4::
DB 9,0,0,0
DD imagerel se_handler
DD imagerel $L$mul_gather4_body,imagerel $L$mul_gather4_epilogue
$L$SEH_info_rsaz_512_mul_scatter4::
DB 9,0,0,0
DD imagerel se_handler
DD imagerel $L$mul_scatter4_body,imagerel $L$mul_scatter4_epilogue
$L$SEH_info_rsaz_512_mul_by_one::
DB 9,0,0,0
DD imagerel se_handler
DD imagerel $L$mul_by_one_body,imagerel $L$mul_by_one_epilogue
$L$SEH_info_rsaz_512_gather4::
DB 001h,046h,016h,000h
DB 046h,0f8h,009h,000h
DB 03dh,0e8h,008h,000h
DB 034h,0d8h,007h,000h
DB 02eh,0c8h,006h,000h
DB 028h,0b8h,005h,000h
DB 022h,0a8h,004h,000h
DB 01ch,098h,003h,000h
DB 016h,088h,002h,000h
DB 010h,078h,001h,000h
DB 00bh,068h,000h,000h
DB 007h,001h,015h,000h
.xdata ENDS
END