You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

2117 lines
35 KiB

; ---------------------------------------------------------------------
; 32-bit x86 word-level big-number primitives, MASM (Intel) syntax.
; Every routine below takes its arguments on the stack and returns its
; result (where it has one) in eax.
; ---------------------------------------------------------------------
TITLE ../openssl/crypto/bn/asm/x86.asm
; Warn (at assembly time only) when an assembler older than 8.00 is used.
IF @Version LT 800
ECHO MASM version 8.00 or later is strongly recommended.
ENDIF
; Pentium Pro instruction set, flat memory model.
.686
.MODEL FLAT
; DOTNAME allows identifiers that start with a dot, such as the
; segment name ".text$" used below.
OPTION DOTNAME
; Open the code segment. Older assemblers get PAGE alignment; newer
; ones get the explicit 64-byte ALIGN() form.
IF @Version LT 800
.text$ SEGMENT PAGE 'CODE'
ELSE
.text$ SEGMENT ALIGN(64) 'CODE'
ENDIF
; ---------------------------------------------------------------------
; _bn_mul_add_words -- r[i] += a[i] * w for i = 0 .. num-1, with carry
; propagation between words.
;
; Stack arguments (32-bit, caller cleans up):
;   arg1  r    pointer to num words, updated in place
;   arg2  a    pointer to num words, read only
;   arg3  num  number of words
;   arg4  w    32-bit multiplier
; Returns: eax = carry word out of the most significant position.
; Preserves ebx, ebp, esi, edi. Clobbers eax, ecx, edx and the flags.
;
; Register roles: edi = r, ebx = a, ebp = w, esi = running carry,
; ecx = words left in the current phase, edx:eax = 64-bit product.
; num is processed eight words at a time, then 1..7 tail words.
; ecx is not written inside the unrolled body, so the counter needs no
; stack slot.
; ---------------------------------------------------------------------
ALIGN 16
_bn_mul_add_words PROC PUBLIC
$L_bn_mul_add_words_begin::
        push    ebp
        push    ebx
        push    esi
        push    edi
        ;
        xor     esi,esi                         ; carry = 0
        mov     edi,DWORD PTR [esp+20]          ; r
        mov     ebx,DWORD PTR [esp+24]          ; a
        mov     ecx,DWORD PTR [esp+28]          ; num
        mov     ebp,DWORD PTR [esp+32]          ; w
        and     ecx,0FFFFFFF8h                  ; words handled by the unrolled loop
        jz      $Lmaw_tail
$Lmaw_unrolled:
        ; Eight words per iteration; disp is the byte offset of the word.
        FOR     disp,<0,4,8,12,16,20,24,28>
        mov     eax,DWORD PTR [ebx+disp]
        mul     ebp                             ; edx:eax = a[i] * w
        add     eax,esi                         ; + incoming carry
        adc     edx,0
        add     eax,DWORD PTR [edi+disp]        ; + r[i]
        adc     edx,0
        mov     DWORD PTR [edi+disp],eax
        mov     esi,edx                         ; high word is the next carry
        ENDM
        ;
        add     ebx,32
        add     edi,32
        sub     ecx,8
        jnz     $Lmaw_unrolled
$Lmaw_tail:
        mov     ecx,DWORD PTR [esp+28]
        and     ecx,7                           ; 0..7 words remain
        jz      $Lmaw_done
        ; Tail words 0..5: leave as soon as the remaining count hits zero.
        FOR     disp,<0,4,8,12,16,20>
        mov     eax,DWORD PTR [ebx+disp]
        mul     ebp
        add     eax,esi
        adc     edx,0
        add     eax,DWORD PTR [edi+disp]
        adc     edx,0
        mov     DWORD PTR [edi+disp],eax
        mov     esi,edx
        dec     ecx
        jz      $Lmaw_done
        ENDM
        ; Tail word 6: reached only when exactly seven words remained.
        mov     eax,DWORD PTR [ebx+24]
        mul     ebp
        add     eax,esi
        adc     edx,0
        add     eax,DWORD PTR [edi+24]
        adc     edx,0
        mov     DWORD PTR [edi+24],eax
        mov     esi,edx
$Lmaw_done:
        mov     eax,esi                         ; return the final carry
        pop     edi
        pop     esi
        pop     ebx
        pop     ebp
        ret
_bn_mul_add_words ENDP
; ---------------------------------------------------------------------
; _bn_mul_words -- r[i] = a[i] * w (plus carry from the previous word)
; for i = 0 .. num-1.
;
; Stack arguments (32-bit, caller cleans up):
;   arg1  r    pointer to num words, written
;   arg2  a    pointer to num words, read
;   arg3  num  number of words
;   arg4  w    32-bit multiplier
; Returns: eax = carry word out of the most significant position.
; Preserves ebx, ebp, esi, edi. Clobbers eax, ecx, edx and the flags.
;
; Register roles: edi = r, ebx = a, ecx = w, esi = running carry,
; ebp = words left in the current phase, edx:eax = 64-bit product.
; ---------------------------------------------------------------------
ALIGN 16
_bn_mul_words PROC PUBLIC
$L_bn_mul_words_begin::
        push    ebp
        push    ebx
        push    esi
        push    edi
        ;
        xor     esi,esi                         ; carry = 0
        mov     edi,DWORD PTR [esp+20]          ; r
        mov     ebx,DWORD PTR [esp+24]          ; a
        mov     ebp,DWORD PTR [esp+28]          ; num
        mov     ecx,DWORD PTR [esp+32]          ; w
        and     ebp,0FFFFFFF8h                  ; words handled by the unrolled loop
        jz      $Lmw_tail
$Lmw_unrolled:
        ; Eight words per iteration; disp is the byte offset of the word.
        FOR     disp,<0,4,8,12,16,20,24,28>
        mov     eax,DWORD PTR [ebx+disp]
        mul     ecx                             ; edx:eax = a[i] * w
        add     eax,esi                         ; + incoming carry
        adc     edx,0
        mov     DWORD PTR [edi+disp],eax
        mov     esi,edx                         ; high word is the next carry
        ENDM
        ;
        add     ebx,32
        add     edi,32
        sub     ebp,8
        jnz     $Lmw_unrolled
$Lmw_tail:
        mov     ebp,DWORD PTR [esp+28]
        and     ebp,7                           ; 0..7 words remain
        jz      $Lmw_done
        ; Tail words 0..5: leave as soon as the remaining count hits zero.
        FOR     disp,<0,4,8,12,16,20>
        mov     eax,DWORD PTR [ebx+disp]
        mul     ecx
        add     eax,esi
        adc     edx,0
        mov     DWORD PTR [edi+disp],eax
        mov     esi,edx
        dec     ebp
        jz      $Lmw_done
        ENDM
        ; Tail word 6: reached only when exactly seven words remained.
        mov     eax,DWORD PTR [ebx+24]
        mul     ecx
        add     eax,esi
        adc     edx,0
        mov     DWORD PTR [edi+24],eax
        mov     esi,edx
$Lmw_done:
        mov     eax,esi                         ; return the final carry
        pop     edi
        pop     esi
        pop     ebx
        pop     ebp
        ret
_bn_mul_words ENDP
; ---------------------------------------------------------------------
; _bn_sqr_words -- for i = 0 .. num-1 store the 64-bit square of a[i]
; as the word pair r[2*i] (low) and r[2*i+1] (high).
;
; Stack arguments (32-bit, caller cleans up):
;   arg1  r    pointer to 2*num words, written
;   arg2  a    pointer to num words, read
;   arg3  num  number of input words
; No return value is set up; eax holds whatever the last instruction
; executed left in it.
; Preserves ebx, ebp, esi, edi. Clobbers eax, edx and the flags.
;
; Register roles: esi = r, edi = a, ebx = words left in the current
; phase, edx:eax = 64-bit square.
; ---------------------------------------------------------------------
ALIGN 16
_bn_sqr_words PROC PUBLIC
$L_bn_sqr_words_begin::
        push    ebp
        push    ebx
        push    esi
        push    edi
        ;
        mov     esi,DWORD PTR [esp+20]          ; r
        mov     edi,DWORD PTR [esp+24]          ; a
        mov     ebx,DWORD PTR [esp+28]          ; num
        and     ebx,0FFFFFFF8h                  ; words handled by the unrolled loop
        jz      $Lsw_tail
$Lsw_unrolled:
        ; Eight inputs per iteration; disp is the byte offset into a,
        ; the result pair lives at twice that offset in r.
        FOR     disp,<0,4,8,12,16,20,24,28>
        mov     eax,DWORD PTR [edi+disp]
        mul     eax                             ; edx:eax = a[i] * a[i]
        mov     DWORD PTR [esi+(disp*2)],eax
        mov     DWORD PTR [esi+(disp*2)+4],edx
        ENDM
        ;
        add     edi,32
        add     esi,64
        sub     ebx,8
        jnz     $Lsw_unrolled
$Lsw_tail:
        mov     ebx,DWORD PTR [esp+28]
        and     ebx,7                           ; 0..7 inputs remain
        jz      $Lsw_done
        ; Tail inputs 0..5: leave as soon as the remaining count hits zero.
        FOR     disp,<0,4,8,12,16,20>
        mov     eax,DWORD PTR [edi+disp]
        mul     eax
        mov     DWORD PTR [esi+(disp*2)],eax
        mov     DWORD PTR [esi+(disp*2)+4],edx
        dec     ebx
        jz      $Lsw_done
        ENDM
        ; Tail input 6: reached only when exactly seven inputs remained.
        mov     eax,DWORD PTR [edi+24]
        mul     eax
        mov     DWORD PTR [esi+48],eax
        mov     DWORD PTR [esi+52],edx
$Lsw_done:
        pop     edi
        pop     esi
        pop     ebx
        pop     ebp
        ret
_bn_sqr_words ENDP
; ---------------------------------------------------------------------
; _bn_div_words -- unsigned divide of the 64-bit value h:l by d.
;
; Stack arguments (32-bit, caller cleans up):
;   arg1  h  high word of the dividend
;   arg2  l  low word of the dividend
;   arg3  d  divisor
; Returns: eax = quotient. The remainder is left in edx.
; Touches only eax, edx and the flags, so nothing needs saving.
;
; DIV raises a divide error when d is zero or when the quotient does
; not fit in 32 bits (that is, when h >= d); the caller has to rule
; both out.
; ---------------------------------------------------------------------
ALIGN 16
_bn_div_words PROC PUBLIC
$L_bn_div_words_begin::
        mov     edx,DWORD PTR [esp+4]           ; h
        mov     eax,DWORD PTR [esp+8]           ; l
        div     DWORD PTR [esp+12]              ; eax = h:l / d, edx = h:l mod d
        ret
_bn_div_words ENDP
; ---------------------------------------------------------------------
; _bn_add_words -- r[i] = a[i] + b[i] + carry for i = 0 .. num-1.
;
; Stack arguments (32-bit, caller cleans up):
;   arg1  r    pointer to num words, written
;   arg2  a    pointer to num words, read
;   arg3  b    pointer to num words, read
;   arg4  num  number of words
; Returns: eax = carry out of the most significant word (0 or 1).
; Preserves ebx, ebp, esi, edi. Clobbers eax, ecx, edx and the flags.
;
; Register roles: ebx = r, esi = a, edi = b, ebp = words left in the
; current phase, eax = carry between words, ecx/edx = the two operands.
; The carry is rebuilt in eax after each of the two additions; it is
; cleared with MOV rather than XOR because XOR would wipe the carry
; flag that the following ADC still needs.
; ---------------------------------------------------------------------
ALIGN 16
_bn_add_words PROC PUBLIC
$L_bn_add_words_begin::
        push    ebp
        push    ebx
        push    esi
        push    edi
        ;
        mov     ebx,DWORD PTR [esp+20]          ; r
        mov     esi,DWORD PTR [esp+24]          ; a
        mov     edi,DWORD PTR [esp+28]          ; b
        mov     ebp,DWORD PTR [esp+32]          ; num
        xor     eax,eax                         ; carry = 0
        and     ebp,0FFFFFFF8h                  ; words handled by the unrolled loop
        jz      $Law_tail
$Law_unrolled:
        ; Eight words per iteration; disp is the byte offset of the word.
        FOR     disp,<0,4,8,12,16,20,24,28>
        mov     ecx,DWORD PTR [esi+disp]
        mov     edx,DWORD PTR [edi+disp]
        add     ecx,eax                         ; a[i] + incoming carry
        mov     eax,0
        adc     eax,eax                         ; eax = carry of that addition
        add     ecx,edx                         ; + b[i]
        adc     eax,0                           ; fold in the second carry
        mov     DWORD PTR [ebx+disp],ecx
        ENDM
        ;
        add     esi,32
        add     edi,32
        add     ebx,32
        sub     ebp,8
        jnz     $Law_unrolled
$Law_tail:
        mov     ebp,DWORD PTR [esp+32]
        and     ebp,7                           ; 0..7 words remain
        jz      $Law_done
        ; Tail words 0..5: leave as soon as the remaining count hits zero.
        FOR     disp,<0,4,8,12,16,20>
        mov     ecx,DWORD PTR [esi+disp]
        mov     edx,DWORD PTR [edi+disp]
        add     ecx,eax
        mov     eax,0
        adc     eax,eax
        add     ecx,edx
        adc     eax,0
        mov     DWORD PTR [ebx+disp],ecx
        dec     ebp
        jz      $Law_done
        ENDM
        ; Tail word 6: reached only when exactly seven words remained.
        mov     ecx,DWORD PTR [esi+24]
        mov     edx,DWORD PTR [edi+24]
        add     ecx,eax
        mov     eax,0
        adc     eax,eax
        add     ecx,edx
        adc     eax,0
        mov     DWORD PTR [ebx+24],ecx
$Law_done:
        pop     edi
        pop     esi
        pop     ebx
        pop     ebp
        ret
_bn_add_words ENDP
; ---------------------------------------------------------------------
; _bn_sub_words -- r[i] = a[i] - b[i] - borrow for i = 0 .. num-1.
;
; Stack arguments (32-bit, caller cleans up):
;   arg1  r    pointer to num words, written
;   arg2  a    pointer to num words, read (minuend)
;   arg3  b    pointer to num words, read (subtrahend)
;   arg4  num  number of words
; Returns: eax = borrow out of the most significant word (0 or 1).
; Preserves ebx, ebp, esi, edi. Clobbers eax, ecx, edx and the flags.
;
; Register roles: ebx = r, esi = a, edi = b, ebp = words left in the
; current phase, eax = borrow between words, ecx/edx = the two operands.
; The borrow is rebuilt in eax after each of the two subtractions; it
; is cleared with MOV rather than XOR because XOR would wipe the carry
; flag that the following ADC still needs.
; ---------------------------------------------------------------------
ALIGN 16
_bn_sub_words PROC PUBLIC
$L_bn_sub_words_begin::
        push    ebp
        push    ebx
        push    esi
        push    edi
        ;
        mov     ebx,DWORD PTR [esp+20]          ; r
        mov     esi,DWORD PTR [esp+24]          ; a
        mov     edi,DWORD PTR [esp+28]          ; b
        mov     ebp,DWORD PTR [esp+32]          ; num
        xor     eax,eax                         ; borrow = 0
        and     ebp,0FFFFFFF8h                  ; words handled by the unrolled loop
        jz      $Lsbw_tail
$Lsbw_unrolled:
        ; Eight words per iteration; disp is the byte offset of the word.
        FOR     disp,<0,4,8,12,16,20,24,28>
        mov     ecx,DWORD PTR [esi+disp]
        mov     edx,DWORD PTR [edi+disp]
        sub     ecx,eax                         ; a[i] - incoming borrow
        mov     eax,0
        adc     eax,eax                         ; eax = borrow of that subtraction
        sub     ecx,edx                         ; - b[i]
        adc     eax,0                           ; fold in the second borrow
        mov     DWORD PTR [ebx+disp],ecx
        ENDM
        ;
        add     esi,32
        add     edi,32
        add     ebx,32
        sub     ebp,8
        jnz     $Lsbw_unrolled
$Lsbw_tail:
        mov     ebp,DWORD PTR [esp+32]
        and     ebp,7                           ; 0..7 words remain
        jz      $Lsbw_done
        ; Tail words 0..5: leave as soon as the remaining count hits zero.
        FOR     disp,<0,4,8,12,16,20>
        mov     ecx,DWORD PTR [esi+disp]
        mov     edx,DWORD PTR [edi+disp]
        sub     ecx,eax
        mov     eax,0
        adc     eax,eax
        sub     ecx,edx
        adc     eax,0
        mov     DWORD PTR [ebx+disp],ecx
        dec     ebp
        jz      $Lsbw_done
        ENDM
        ; Tail word 6: reached only when exactly seven words remained.
        mov     ecx,DWORD PTR [esi+24]
        mov     edx,DWORD PTR [edi+24]
        sub     ecx,eax
        mov     eax,0
        adc     eax,eax
        sub     ecx,edx
        adc     eax,0
        mov     DWORD PTR [ebx+24],ecx
$Lsbw_done:
        pop     edi
        pop     esi
        pop     ebx
        pop     ebp
        ret
_bn_sub_words ENDP
; ---------------------------------------------------------------------
; _bn_mul_comba8 -- fully unrolled 8 x 8 word multiply:
; r[0..15] = a[0..7] * b[0..7], computed one result word (column) at a
; time.
;
; Stack arguments (32-bit, caller cleans up):
;   arg1  r  pointer to 16 result words, written
;   arg2  a  pointer to 8 words, read
;   arg3  b  pointer to 8 words, read
; No meaningful return value; eax holds the r pointer on exit.
; Saves/restores ebx, ebp, esi, edi. Clobbers eax, ecx, edx, flags.
;
; Register roles after the prologue:
;   esi = a, edi = b, 20[esp] = r (reloaded into eax before each store)
;   ebx / ecx / ebp = three-word column accumulator; the roles rotate
;                     by one register for every result word
;   eax / edx       = MUL operands, then the 64-bit product edx:eax
; Loads for the next product are interleaved into the add/adc carry
; chain. That is safe because MOV does not modify the flags.
; ---------------------------------------------------------------------
ALIGN 16
_bn_mul_comba8 PROC PUBLIC
$L_bn_mul_comba8_begin::
; The argument offsets grow by 4 with every push below.
push esi
mov esi,DWORD PTR 12[esp]
push edi
mov edi,DWORD PTR 20[esp]
push ebp
push ebx
xor ebx,ebx
mov eax,DWORD PTR [esi]
xor ecx,ecx
mov edx,DWORD PTR [edi]
; ################## Calculate word 0
; accumulator low/mid/high = ebx/ecx/ebp
xor ebp,ebp
; mul a[0]*b[0]
mul edx
add ebx,eax
mov eax,DWORD PTR 20[esp]
adc ecx,edx
mov edx,DWORD PTR [edi]
adc ebp,0
mov DWORD PTR [eax],ebx
mov eax,DWORD PTR 4[esi]
; saved r[0]
; ################## Calculate word 1
; accumulator low/mid/high = ecx/ebp/ebx
xor ebx,ebx
; mul a[1]*b[0]
mul edx
add ecx,eax
mov eax,DWORD PTR [esi]
adc ebp,edx
mov edx,DWORD PTR 4[edi]
adc ebx,0
; mul a[0]*b[1]
mul edx
add ecx,eax
mov eax,DWORD PTR 20[esp]
adc ebp,edx
mov edx,DWORD PTR [edi]
adc ebx,0
mov DWORD PTR 4[eax],ecx
mov eax,DWORD PTR 8[esi]
; saved r[1]
; ################## Calculate word 2
; accumulator low/mid/high = ebp/ebx/ecx
xor ecx,ecx
; mul a[2]*b[0]
mul edx
add ebp,eax
mov eax,DWORD PTR 4[esi]
adc ebx,edx
mov edx,DWORD PTR 4[edi]
adc ecx,0
; mul a[1]*b[1]
mul edx
add ebp,eax
mov eax,DWORD PTR [esi]
adc ebx,edx
mov edx,DWORD PTR 8[edi]
adc ecx,0
; mul a[0]*b[2]
mul edx
add ebp,eax
mov eax,DWORD PTR 20[esp]
adc ebx,edx
mov edx,DWORD PTR [edi]
adc ecx,0
mov DWORD PTR 8[eax],ebp
mov eax,DWORD PTR 12[esi]
; saved r[2]
; ################## Calculate word 3
; accumulator low/mid/high = ebx/ecx/ebp
xor ebp,ebp
; mul a[3]*b[0]
mul edx
add ebx,eax
mov eax,DWORD PTR 8[esi]
adc ecx,edx
mov edx,DWORD PTR 4[edi]
adc ebp,0
; mul a[2]*b[1]
mul edx
add ebx,eax
mov eax,DWORD PTR 4[esi]
adc ecx,edx
mov edx,DWORD PTR 8[edi]
adc ebp,0
; mul a[1]*b[2]
mul edx
add ebx,eax
mov eax,DWORD PTR [esi]
adc ecx,edx
mov edx,DWORD PTR 12[edi]
adc ebp,0
; mul a[0]*b[3]
mul edx
add ebx,eax
mov eax,DWORD PTR 20[esp]
adc ecx,edx
mov edx,DWORD PTR [edi]
adc ebp,0
mov DWORD PTR 12[eax],ebx
mov eax,DWORD PTR 16[esi]
; saved r[3]
; ################## Calculate word 4
; accumulator low/mid/high = ecx/ebp/ebx
xor ebx,ebx
; mul a[4]*b[0]
mul edx
add ecx,eax
mov eax,DWORD PTR 12[esi]
adc ebp,edx
mov edx,DWORD PTR 4[edi]
adc ebx,0
; mul a[3]*b[1]
mul edx
add ecx,eax
mov eax,DWORD PTR 8[esi]
adc ebp,edx
mov edx,DWORD PTR 8[edi]
adc ebx,0
; mul a[2]*b[2]
mul edx
add ecx,eax
mov eax,DWORD PTR 4[esi]
adc ebp,edx
mov edx,DWORD PTR 12[edi]
adc ebx,0
; mul a[1]*b[3]
mul edx
add ecx,eax
mov eax,DWORD PTR [esi]
adc ebp,edx
mov edx,DWORD PTR 16[edi]
adc ebx,0
; mul a[0]*b[4]
mul edx
add ecx,eax
mov eax,DWORD PTR 20[esp]
adc ebp,edx
mov edx,DWORD PTR [edi]
adc ebx,0
mov DWORD PTR 16[eax],ecx
mov eax,DWORD PTR 20[esi]
; saved r[4]
; ################## Calculate word 5
; accumulator low/mid/high = ebp/ebx/ecx
xor ecx,ecx
; mul a[5]*b[0]
mul edx
add ebp,eax
mov eax,DWORD PTR 16[esi]
adc ebx,edx
mov edx,DWORD PTR 4[edi]
adc ecx,0
; mul a[4]*b[1]
mul edx
add ebp,eax
mov eax,DWORD PTR 12[esi]
adc ebx,edx
mov edx,DWORD PTR 8[edi]
adc ecx,0
; mul a[3]*b[2]
mul edx
add ebp,eax
mov eax,DWORD PTR 8[esi]
adc ebx,edx
mov edx,DWORD PTR 12[edi]
adc ecx,0
; mul a[2]*b[3]
mul edx
add ebp,eax
mov eax,DWORD PTR 4[esi]
adc ebx,edx
mov edx,DWORD PTR 16[edi]
adc ecx,0
; mul a[1]*b[4]
mul edx
add ebp,eax
mov eax,DWORD PTR [esi]
adc ebx,edx
mov edx,DWORD PTR 20[edi]
adc ecx,0
; mul a[0]*b[5]
mul edx
add ebp,eax
mov eax,DWORD PTR 20[esp]
adc ebx,edx
mov edx,DWORD PTR [edi]
adc ecx,0
mov DWORD PTR 20[eax],ebp
mov eax,DWORD PTR 24[esi]
; saved r[5]
; ################## Calculate word 6
; accumulator low/mid/high = ebx/ecx/ebp
xor ebp,ebp
; mul a[6]*b[0]
mul edx
add ebx,eax
mov eax,DWORD PTR 20[esi]
adc ecx,edx
mov edx,DWORD PTR 4[edi]
adc ebp,0
; mul a[5]*b[1]
mul edx
add ebx,eax
mov eax,DWORD PTR 16[esi]
adc ecx,edx
mov edx,DWORD PTR 8[edi]
adc ebp,0
; mul a[4]*b[2]
mul edx
add ebx,eax
mov eax,DWORD PTR 12[esi]
adc ecx,edx
mov edx,DWORD PTR 12[edi]
adc ebp,0
; mul a[3]*b[3]
mul edx
add ebx,eax
mov eax,DWORD PTR 8[esi]
adc ecx,edx
mov edx,DWORD PTR 16[edi]
adc ebp,0
; mul a[2]*b[4]
mul edx
add ebx,eax
mov eax,DWORD PTR 4[esi]
adc ecx,edx
mov edx,DWORD PTR 20[edi]
adc ebp,0
; mul a[1]*b[5]
mul edx
add ebx,eax
mov eax,DWORD PTR [esi]
adc ecx,edx
mov edx,DWORD PTR 24[edi]
adc ebp,0
; mul a[0]*b[6]
mul edx
add ebx,eax
mov eax,DWORD PTR 20[esp]
adc ecx,edx
mov edx,DWORD PTR [edi]
adc ebp,0
mov DWORD PTR 24[eax],ebx
mov eax,DWORD PTR 28[esi]
; saved r[6]
; ################## Calculate word 7
; accumulator low/mid/high = ecx/ebp/ebx
xor ebx,ebx
; mul a[7]*b[0]
mul edx
add ecx,eax
mov eax,DWORD PTR 24[esi]
adc ebp,edx
mov edx,DWORD PTR 4[edi]
adc ebx,0
; mul a[6]*b[1]
mul edx
add ecx,eax
mov eax,DWORD PTR 20[esi]
adc ebp,edx
mov edx,DWORD PTR 8[edi]
adc ebx,0
; mul a[5]*b[2]
mul edx
add ecx,eax
mov eax,DWORD PTR 16[esi]
adc ebp,edx
mov edx,DWORD PTR 12[edi]
adc ebx,0
; mul a[4]*b[3]
mul edx
add ecx,eax
mov eax,DWORD PTR 12[esi]
adc ebp,edx
mov edx,DWORD PTR 16[edi]
adc ebx,0
; mul a[3]*b[4]
mul edx
add ecx,eax
mov eax,DWORD PTR 8[esi]
adc ebp,edx
mov edx,DWORD PTR 20[edi]
adc ebx,0
; mul a[2]*b[5]
mul edx
add ecx,eax
mov eax,DWORD PTR 4[esi]
adc ebp,edx
mov edx,DWORD PTR 24[edi]
adc ebx,0
; mul a[1]*b[6]
mul edx
add ecx,eax
mov eax,DWORD PTR [esi]
adc ebp,edx
mov edx,DWORD PTR 28[edi]
adc ebx,0
; mul a[0]*b[7]
mul edx
add ecx,eax
mov eax,DWORD PTR 20[esp]
adc ebp,edx
mov edx,DWORD PTR 4[edi]
adc ebx,0
mov DWORD PTR 28[eax],ecx
mov eax,DWORD PTR 28[esi]
; saved r[7]
; ################## Calculate word 8
; accumulator low/mid/high = ebp/ebx/ecx
xor ecx,ecx
; mul a[7]*b[1]
mul edx
add ebp,eax
mov eax,DWORD PTR 24[esi]
adc ebx,edx
mov edx,DWORD PTR 8[edi]
adc ecx,0
; mul a[6]*b[2]
mul edx
add ebp,eax
mov eax,DWORD PTR 20[esi]
adc ebx,edx
mov edx,DWORD PTR 12[edi]
adc ecx,0
; mul a[5]*b[3]
mul edx
add ebp,eax
mov eax,DWORD PTR 16[esi]
adc ebx,edx
mov edx,DWORD PTR 16[edi]
adc ecx,0
; mul a[4]*b[4]
mul edx
add ebp,eax
mov eax,DWORD PTR 12[esi]
adc ebx,edx
mov edx,DWORD PTR 20[edi]
adc ecx,0
; mul a[3]*b[5]
mul edx
add ebp,eax
mov eax,DWORD PTR 8[esi]
adc ebx,edx
mov edx,DWORD PTR 24[edi]
adc ecx,0
; mul a[2]*b[6]
mul edx
add ebp,eax
mov eax,DWORD PTR 4[esi]
adc ebx,edx
mov edx,DWORD PTR 28[edi]
adc ecx,0
; mul a[1]*b[7]
mul edx
add ebp,eax
mov eax,DWORD PTR 20[esp]
adc ebx,edx
mov edx,DWORD PTR 8[edi]
adc ecx,0
mov DWORD PTR 32[eax],ebp
mov eax,DWORD PTR 28[esi]
; saved r[8]
; ################## Calculate word 9
; accumulator low/mid/high = ebx/ecx/ebp
xor ebp,ebp
; mul a[7]*b[2]
mul edx
add ebx,eax
mov eax,DWORD PTR 24[esi]
adc ecx,edx
mov edx,DWORD PTR 12[edi]
adc ebp,0
; mul a[6]*b[3]
mul edx
add ebx,eax
mov eax,DWORD PTR 20[esi]
adc ecx,edx
mov edx,DWORD PTR 16[edi]
adc ebp,0
; mul a[5]*b[4]
mul edx
add ebx,eax
mov eax,DWORD PTR 16[esi]
adc ecx,edx
mov edx,DWORD PTR 20[edi]
adc ebp,0
; mul a[4]*b[5]
mul edx
add ebx,eax
mov eax,DWORD PTR 12[esi]
adc ecx,edx
mov edx,DWORD PTR 24[edi]
adc ebp,0
; mul a[3]*b[6]
mul edx
add ebx,eax
mov eax,DWORD PTR 8[esi]
adc ecx,edx
mov edx,DWORD PTR 28[edi]
adc ebp,0
; mul a[2]*b[7]
mul edx
add ebx,eax
mov eax,DWORD PTR 20[esp]
adc ecx,edx
mov edx,DWORD PTR 12[edi]
adc ebp,0
mov DWORD PTR 36[eax],ebx
mov eax,DWORD PTR 28[esi]
; saved r[9]
; ################## Calculate word 10
; accumulator low/mid/high = ecx/ebp/ebx
xor ebx,ebx
; mul a[7]*b[3]
mul edx
add ecx,eax
mov eax,DWORD PTR 24[esi]
adc ebp,edx
mov edx,DWORD PTR 16[edi]
adc ebx,0
; mul a[6]*b[4]
mul edx
add ecx,eax
mov eax,DWORD PTR 20[esi]
adc ebp,edx
mov edx,DWORD PTR 20[edi]
adc ebx,0
; mul a[5]*b[5]
mul edx
add ecx,eax
mov eax,DWORD PTR 16[esi]
adc ebp,edx
mov edx,DWORD PTR 24[edi]
adc ebx,0
; mul a[4]*b[6]
mul edx
add ecx,eax
mov eax,DWORD PTR 12[esi]
adc ebp,edx
mov edx,DWORD PTR 28[edi]
adc ebx,0
; mul a[3]*b[7]
mul edx
add ecx,eax
mov eax,DWORD PTR 20[esp]
adc ebp,edx
mov edx,DWORD PTR 16[edi]
adc ebx,0
mov DWORD PTR 40[eax],ecx
mov eax,DWORD PTR 28[esi]
; saved r[10]
; ################## Calculate word 11
; accumulator low/mid/high = ebp/ebx/ecx
xor ecx,ecx
; mul a[7]*b[4]
mul edx
add ebp,eax
mov eax,DWORD PTR 24[esi]
adc ebx,edx
mov edx,DWORD PTR 20[edi]
adc ecx,0
; mul a[6]*b[5]
mul edx
add ebp,eax
mov eax,DWORD PTR 20[esi]
adc ebx,edx
mov edx,DWORD PTR 24[edi]
adc ecx,0
; mul a[5]*b[6]
mul edx
add ebp,eax
mov eax,DWORD PTR 16[esi]
adc ebx,edx
mov edx,DWORD PTR 28[edi]
adc ecx,0
; mul a[4]*b[7]
mul edx
add ebp,eax
mov eax,DWORD PTR 20[esp]
adc ebx,edx
mov edx,DWORD PTR 20[edi]
adc ecx,0
mov DWORD PTR 44[eax],ebp
mov eax,DWORD PTR 28[esi]
; saved r[11]
; ################## Calculate word 12
; accumulator low/mid/high = ebx/ecx/ebp
xor ebp,ebp
; mul a[7]*b[5]
mul edx
add ebx,eax
mov eax,DWORD PTR 24[esi]
adc ecx,edx
mov edx,DWORD PTR 24[edi]
adc ebp,0
; mul a[6]*b[6]
mul edx
add ebx,eax
mov eax,DWORD PTR 20[esi]
adc ecx,edx
mov edx,DWORD PTR 28[edi]
adc ebp,0
; mul a[5]*b[7]
mul edx
add ebx,eax
mov eax,DWORD PTR 20[esp]
adc ecx,edx
mov edx,DWORD PTR 24[edi]
adc ebp,0
mov DWORD PTR 48[eax],ebx
mov eax,DWORD PTR 28[esi]
; saved r[12]
; ################## Calculate word 13
; accumulator low/mid/high = ecx/ebp/ebx
xor ebx,ebx
; mul a[7]*b[6]
mul edx
add ecx,eax
mov eax,DWORD PTR 24[esi]
adc ebp,edx
mov edx,DWORD PTR 28[edi]
adc ebx,0
; mul a[6]*b[7]
mul edx
add ecx,eax
mov eax,DWORD PTR 20[esp]
adc ebp,edx
mov edx,DWORD PTR 28[edi]
adc ebx,0
mov DWORD PTR 52[eax],ecx
mov eax,DWORD PTR 28[esi]
; saved r[13]
; ################## Calculate word 14
; accumulator low/mid/high = ebp/ebx/ecx
xor ecx,ecx
; mul a[7]*b[7]
mul edx
add ebp,eax
mov eax,DWORD PTR 20[esp]
adc ebx,edx
; The carry collected into ecx here is never stored: r has only 16 words.
adc ecx,0
mov DWORD PTR 56[eax],ebp
; saved r[14]
; save r[15]
mov DWORD PTR 60[eax],ebx
; Restore the saved registers in reverse push order.
pop ebx
pop ebp
pop edi
pop esi
ret
_bn_mul_comba8 ENDP
; ---------------------------------------------------------------------
; _bn_mul_comba4 -- fully unrolled 4 x 4 word multiply:
; r[0..7] = a[0..3] * b[0..3], computed one result word (column) at a
; time.
;
; Stack arguments (32-bit, caller cleans up):
;   arg1  r  pointer to 8 result words, written
;   arg2  a  pointer to 4 words, read
;   arg3  b  pointer to 4 words, read
; No meaningful return value; eax holds the r pointer on exit.
; Saves/restores ebx, ebp, esi, edi. Clobbers eax, ecx, edx, flags.
;
; Register roles after the prologue:
;   esi = a, edi = b, 20[esp] = r (reloaded into eax before each store)
;   ebx / ecx / ebp = three-word column accumulator; the roles rotate
;                     by one register for every result word
;   eax / edx       = MUL operands, then the 64-bit product edx:eax
; Loads for the next product are interleaved into the add/adc carry
; chain. That is safe because MOV does not modify the flags.
; ---------------------------------------------------------------------
ALIGN 16
_bn_mul_comba4 PROC PUBLIC
$L_bn_mul_comba4_begin::
; The argument offsets grow by 4 with every push below.
push esi
mov esi,DWORD PTR 12[esp]
push edi
mov edi,DWORD PTR 20[esp]
push ebp
push ebx
xor ebx,ebx
mov eax,DWORD PTR [esi]
xor ecx,ecx
mov edx,DWORD PTR [edi]
; ################## Calculate word 0
; accumulator low/mid/high = ebx/ecx/ebp
xor ebp,ebp
; mul a[0]*b[0]
mul edx
add ebx,eax
mov eax,DWORD PTR 20[esp]
adc ecx,edx
mov edx,DWORD PTR [edi]
adc ebp,0
mov DWORD PTR [eax],ebx
mov eax,DWORD PTR 4[esi]
; saved r[0]
; ################## Calculate word 1
; accumulator low/mid/high = ecx/ebp/ebx
xor ebx,ebx
; mul a[1]*b[0]
mul edx
add ecx,eax
mov eax,DWORD PTR [esi]
adc ebp,edx
mov edx,DWORD PTR 4[edi]
adc ebx,0
; mul a[0]*b[1]
mul edx
add ecx,eax
mov eax,DWORD PTR 20[esp]
adc ebp,edx
mov edx,DWORD PTR [edi]
adc ebx,0
mov DWORD PTR 4[eax],ecx
mov eax,DWORD PTR 8[esi]
; saved r[1]
; ################## Calculate word 2
; accumulator low/mid/high = ebp/ebx/ecx
xor ecx,ecx
; mul a[2]*b[0]
mul edx
add ebp,eax
mov eax,DWORD PTR 4[esi]
adc ebx,edx
mov edx,DWORD PTR 4[edi]
adc ecx,0
; mul a[1]*b[1]
mul edx
add ebp,eax
mov eax,DWORD PTR [esi]
adc ebx,edx
mov edx,DWORD PTR 8[edi]
adc ecx,0
; mul a[0]*b[2]
mul edx
add ebp,eax
mov eax,DWORD PTR 20[esp]
adc ebx,edx
mov edx,DWORD PTR [edi]
adc ecx,0
mov DWORD PTR 8[eax],ebp
mov eax,DWORD PTR 12[esi]
; saved r[2]
; ################## Calculate word 3
; accumulator low/mid/high = ebx/ecx/ebp
xor ebp,ebp
; mul a[3]*b[0]
mul edx
add ebx,eax
mov eax,DWORD PTR 8[esi]
adc ecx,edx
mov edx,DWORD PTR 4[edi]
adc ebp,0
; mul a[2]*b[1]
mul edx
add ebx,eax
mov eax,DWORD PTR 4[esi]
adc ecx,edx
mov edx,DWORD PTR 8[edi]
adc ebp,0
; mul a[1]*b[2]
mul edx
add ebx,eax
mov eax,DWORD PTR [esi]
adc ecx,edx
mov edx,DWORD PTR 12[edi]
adc ebp,0
; mul a[0]*b[3]
mul edx
add ebx,eax
mov eax,DWORD PTR 20[esp]
adc ecx,edx
mov edx,DWORD PTR 4[edi]
adc ebp,0
mov DWORD PTR 12[eax],ebx
mov eax,DWORD PTR 12[esi]
; saved r[3]
; ################## Calculate word 4
; accumulator low/mid/high = ecx/ebp/ebx
xor ebx,ebx
; mul a[3]*b[1]
mul edx
add ecx,eax
mov eax,DWORD PTR 8[esi]
adc ebp,edx
mov edx,DWORD PTR 8[edi]
adc ebx,0
; mul a[2]*b[2]
mul edx
add ecx,eax
mov eax,DWORD PTR 4[esi]
adc ebp,edx
mov edx,DWORD PTR 12[edi]
adc ebx,0
; mul a[1]*b[3]
mul edx
add ecx,eax
mov eax,DWORD PTR 20[esp]
adc ebp,edx
mov edx,DWORD PTR 8[edi]
adc ebx,0
mov DWORD PTR 16[eax],ecx
mov eax,DWORD PTR 12[esi]
; saved r[4]
; ################## Calculate word 5
; accumulator low/mid/high = ebp/ebx/ecx
xor ecx,ecx
; mul a[3]*b[2]
mul edx
add ebp,eax
mov eax,DWORD PTR 8[esi]
adc ebx,edx
mov edx,DWORD PTR 12[edi]
adc ecx,0
; mul a[2]*b[3]
mul edx
add ebp,eax
mov eax,DWORD PTR 20[esp]
adc ebx,edx
mov edx,DWORD PTR 12[edi]
adc ecx,0
mov DWORD PTR 20[eax],ebp
mov eax,DWORD PTR 12[esi]
; saved r[5]
; ################## Calculate word 6
; accumulator low/mid/high = ebx/ecx/ebp
xor ebp,ebp
; mul a[3]*b[3]
mul edx
add ebx,eax
mov eax,DWORD PTR 20[esp]
adc ecx,edx
; The carry collected into ebp here is never stored: r has only 8 words.
adc ebp,0
mov DWORD PTR 24[eax],ebx
; saved r[6]
; save r[7]
mov DWORD PTR 28[eax],ecx
; Restore the saved registers in reverse push order.
pop ebx
pop ebp
pop edi
pop esi
ret
_bn_mul_comba4 ENDP
; ---------------------------------------------------------------------
; _bn_sqr_comba8 -- fully unrolled 8-word squaring:
; r[0..15] = a[0..7] * a[0..7], computed one result word (column) at a
; time.
;
; Stack arguments (32-bit, caller cleans up):
;   arg1  r  pointer to 16 result words, written
;   arg2  a  pointer to 8 words, read
; No meaningful return value is set up in eax.
; Saves/restores ebx, ebp, esi, edi. Clobbers eax, ecx, edx, flags.
;
; Register roles after the prologue:
;   edi = r, esi = a
;   ebx / ecx / ebp = three-word column accumulator; the roles rotate
;                     by one register for every result word
;   eax / edx       = MUL operands, then the 64-bit product edx:eax
; Each off-diagonal product a[i]*a[j] (i != j) is computed once and
; doubled (add eax,eax / adc edx,edx / adc high,0) before being
; accumulated. Diagonal products a[i]*a[i] are added once.
; Loads for the next product are interleaved into the add/adc carry
; chain. That is safe because MOV does not modify the flags.
; ---------------------------------------------------------------------
ALIGN 16
_bn_sqr_comba8 PROC PUBLIC
$L_bn_sqr_comba8_begin::
push esi
push edi
push ebp
push ebx
; Four pushes plus the return address: the first argument is at 20[esp].
mov edi,DWORD PTR 20[esp]
mov esi,DWORD PTR 24[esp]
xor ebx,ebx
xor ecx,ecx
mov eax,DWORD PTR [esi]
; ############### Calculate word 0
; accumulator low/mid/high = ebx/ecx/ebp
xor ebp,ebp
; sqr a[0]*a[0]
mul eax
add ebx,eax
adc ecx,edx
mov edx,DWORD PTR [esi]
adc ebp,0
mov DWORD PTR [edi],ebx
mov eax,DWORD PTR 4[esi]
; saved r[0]
; ############### Calculate word 1
; accumulator low/mid/high = ecx/ebp/ebx
xor ebx,ebx
; sqr a[1]*a[0]
mul edx
add eax,eax
adc edx,edx
adc ebx,0
add ecx,eax
adc ebp,edx
mov eax,DWORD PTR 8[esi]
adc ebx,0
mov DWORD PTR 4[edi],ecx
mov edx,DWORD PTR [esi]
; saved r[1]
; ############### Calculate word 2
; accumulator low/mid/high = ebp/ebx/ecx
xor ecx,ecx
; sqr a[2]*a[0]
mul edx
add eax,eax
adc edx,edx
adc ecx,0
add ebp,eax
adc ebx,edx
mov eax,DWORD PTR 4[esi]
adc ecx,0
; sqr a[1]*a[1]
mul eax
add ebp,eax
adc ebx,edx
mov edx,DWORD PTR [esi]
adc ecx,0
mov DWORD PTR 8[edi],ebp
mov eax,DWORD PTR 12[esi]
; saved r[2]
; ############### Calculate word 3
; accumulator low/mid/high = ebx/ecx/ebp
xor ebp,ebp
; sqr a[3]*a[0]
mul edx
add eax,eax
adc edx,edx
adc ebp,0
add ebx,eax
adc ecx,edx
mov eax,DWORD PTR 8[esi]
adc ebp,0
mov edx,DWORD PTR 4[esi]
; sqr a[2]*a[1]
mul edx
add eax,eax
adc edx,edx
adc ebp,0
add ebx,eax
adc ecx,edx
mov eax,DWORD PTR 16[esi]
adc ebp,0
mov DWORD PTR 12[edi],ebx
mov edx,DWORD PTR [esi]
; saved r[3]
; ############### Calculate word 4
; accumulator low/mid/high = ecx/ebp/ebx
xor ebx,ebx
; sqr a[4]*a[0]
mul edx
add eax,eax
adc edx,edx
adc ebx,0
add ecx,eax
adc ebp,edx
mov eax,DWORD PTR 12[esi]
adc ebx,0
mov edx,DWORD PTR 4[esi]
; sqr a[3]*a[1]
mul edx
add eax,eax
adc edx,edx
adc ebx,0
add ecx,eax
adc ebp,edx
mov eax,DWORD PTR 8[esi]
adc ebx,0
; sqr a[2]*a[2]
mul eax
add ecx,eax
adc ebp,edx
mov edx,DWORD PTR [esi]
adc ebx,0
mov DWORD PTR 16[edi],ecx
mov eax,DWORD PTR 20[esi]
; saved r[4]
; ############### Calculate word 5
; accumulator low/mid/high = ebp/ebx/ecx
xor ecx,ecx
; sqr a[5]*a[0]
mul edx
add eax,eax
adc edx,edx
adc ecx,0
add ebp,eax
adc ebx,edx
mov eax,DWORD PTR 16[esi]
adc ecx,0
mov edx,DWORD PTR 4[esi]
; sqr a[4]*a[1]
mul edx
add eax,eax
adc edx,edx
adc ecx,0
add ebp,eax
adc ebx,edx
mov eax,DWORD PTR 12[esi]
adc ecx,0
mov edx,DWORD PTR 8[esi]
; sqr a[3]*a[2]
mul edx
add eax,eax
adc edx,edx
adc ecx,0
add ebp,eax
adc ebx,edx
mov eax,DWORD PTR 24[esi]
adc ecx,0
mov DWORD PTR 20[edi],ebp
mov edx,DWORD PTR [esi]
; saved r[5]
; ############### Calculate word 6
; accumulator low/mid/high = ebx/ecx/ebp
xor ebp,ebp
; sqr a[6]*a[0]
mul edx
add eax,eax
adc edx,edx
adc ebp,0
add ebx,eax
adc ecx,edx
mov eax,DWORD PTR 20[esi]
adc ebp,0
mov edx,DWORD PTR 4[esi]
; sqr a[5]*a[1]
mul edx
add eax,eax
adc edx,edx
adc ebp,0
add ebx,eax
adc ecx,edx
mov eax,DWORD PTR 16[esi]
adc ebp,0
mov edx,DWORD PTR 8[esi]
; sqr a[4]*a[2]
mul edx
add eax,eax
adc edx,edx
adc ebp,0
add ebx,eax
adc ecx,edx
mov eax,DWORD PTR 12[esi]
adc ebp,0
; sqr a[3]*a[3]
mul eax
add ebx,eax
adc ecx,edx
mov edx,DWORD PTR [esi]
adc ebp,0
mov DWORD PTR 24[edi],ebx
mov eax,DWORD PTR 28[esi]
; saved r[6]
; ############### Calculate word 7
; accumulator low/mid/high = ecx/ebp/ebx
xor ebx,ebx
; sqr a[7]*a[0]
mul edx
add eax,eax
adc edx,edx
adc ebx,0
add ecx,eax
adc ebp,edx
mov eax,DWORD PTR 24[esi]
adc ebx,0
mov edx,DWORD PTR 4[esi]
; sqr a[6]*a[1]
mul edx
add eax,eax
adc edx,edx
adc ebx,0
add ecx,eax
adc ebp,edx
mov eax,DWORD PTR 20[esi]
adc ebx,0
mov edx,DWORD PTR 8[esi]
; sqr a[5]*a[2]
mul edx
add eax,eax
adc edx,edx
adc ebx,0
add ecx,eax
adc ebp,edx
mov eax,DWORD PTR 16[esi]
adc ebx,0
mov edx,DWORD PTR 12[esi]
; sqr a[4]*a[3]
mul edx
add eax,eax
adc edx,edx
adc ebx,0
add ecx,eax
adc ebp,edx
mov eax,DWORD PTR 28[esi]
adc ebx,0
mov DWORD PTR 28[edi],ecx
mov edx,DWORD PTR 4[esi]
; saved r[7]
; ############### Calculate word 8
; accumulator low/mid/high = ebp/ebx/ecx
xor ecx,ecx
; sqr a[7]*a[1]
mul edx
add eax,eax
adc edx,edx
adc ecx,0
add ebp,eax
adc ebx,edx
mov eax,DWORD PTR 24[esi]
adc ecx,0
mov edx,DWORD PTR 8[esi]
; sqr a[6]*a[2]
mul edx
add eax,eax
adc edx,edx
adc ecx,0
add ebp,eax
adc ebx,edx
mov eax,DWORD PTR 20[esi]
adc ecx,0
mov edx,DWORD PTR 12[esi]
; sqr a[5]*a[3]
mul edx
add eax,eax
adc edx,edx
adc ecx,0
add ebp,eax
adc ebx,edx
mov eax,DWORD PTR 16[esi]
adc ecx,0
; sqr a[4]*a[4]
mul eax
add ebp,eax
adc ebx,edx
mov edx,DWORD PTR 8[esi]
adc ecx,0
mov DWORD PTR 32[edi],ebp
mov eax,DWORD PTR 28[esi]
; saved r[8]
; ############### Calculate word 9
; accumulator low/mid/high = ebx/ecx/ebp
xor ebp,ebp
; sqr a[7]*a[2]
mul edx
add eax,eax
adc edx,edx
adc ebp,0
add ebx,eax
adc ecx,edx
mov eax,DWORD PTR 24[esi]
adc ebp,0
mov edx,DWORD PTR 12[esi]
; sqr a[6]*a[3]
mul edx
add eax,eax
adc edx,edx
adc ebp,0
add ebx,eax
adc ecx,edx
mov eax,DWORD PTR 20[esi]
adc ebp,0
mov edx,DWORD PTR 16[esi]
; sqr a[5]*a[4]
mul edx
add eax,eax
adc edx,edx
adc ebp,0
add ebx,eax
adc ecx,edx
mov eax,DWORD PTR 28[esi]
adc ebp,0
mov DWORD PTR 36[edi],ebx
mov edx,DWORD PTR 12[esi]
; saved r[9]
; ############### Calculate word 10
; accumulator low/mid/high = ecx/ebp/ebx
xor ebx,ebx
; sqr a[7]*a[3]
mul edx
add eax,eax
adc edx,edx
adc ebx,0
add ecx,eax
adc ebp,edx
mov eax,DWORD PTR 24[esi]
adc ebx,0
mov edx,DWORD PTR 16[esi]
; sqr a[6]*a[4]
mul edx
add eax,eax
adc edx,edx
adc ebx,0
add ecx,eax
adc ebp,edx
mov eax,DWORD PTR 20[esi]
adc ebx,0
; sqr a[5]*a[5]
mul eax
add ecx,eax
adc ebp,edx
mov edx,DWORD PTR 16[esi]
adc ebx,0
mov DWORD PTR 40[edi],ecx
mov eax,DWORD PTR 28[esi]
; saved r[10]
; ############### Calculate word 11
; accumulator low/mid/high = ebp/ebx/ecx
xor ecx,ecx
; sqr a[7]*a[4]
mul edx
add eax,eax
adc edx,edx
adc ecx,0
add ebp,eax
adc ebx,edx
mov eax,DWORD PTR 24[esi]
adc ecx,0
mov edx,DWORD PTR 20[esi]
; sqr a[6]*a[5]
mul edx
add eax,eax
adc edx,edx
adc ecx,0
add ebp,eax
adc ebx,edx
mov eax,DWORD PTR 28[esi]
adc ecx,0
mov DWORD PTR 44[edi],ebp
mov edx,DWORD PTR 20[esi]
; saved r[11]
; ############### Calculate word 12
; accumulator low/mid/high = ebx/ecx/ebp
xor ebp,ebp
; sqr a[7]*a[5]
mul edx
add eax,eax
adc edx,edx
adc ebp,0
add ebx,eax
adc ecx,edx
mov eax,DWORD PTR 24[esi]
adc ebp,0
; sqr a[6]*a[6]
mul eax
add ebx,eax
adc ecx,edx
mov edx,DWORD PTR 24[esi]
adc ebp,0
mov DWORD PTR 48[edi],ebx
mov eax,DWORD PTR 28[esi]
; saved r[12]
; ############### Calculate word 13
; accumulator low/mid/high = ecx/ebp/ebx
xor ebx,ebx
; sqr a[7]*a[6]
mul edx
add eax,eax
adc edx,edx
adc ebx,0
add ecx,eax
adc ebp,edx
mov eax,DWORD PTR 28[esi]
adc ebx,0
mov DWORD PTR 52[edi],ecx
; saved r[13]
; ############### Calculate word 14
; accumulator low/mid/high = ebp/ebx/ecx
xor ecx,ecx
; sqr a[7]*a[7]
mul eax
add ebp,eax
adc ebx,edx
; The carry collected into ecx here is never stored: r has only 16 words.
adc ecx,0
mov DWORD PTR 56[edi],ebp
; saved r[14]
; save r[15]
mov DWORD PTR 60[edi],ebx
; Restore the saved registers in reverse push order.
pop ebx
pop ebp
pop edi
pop esi
ret
_bn_sqr_comba8 ENDP
; ---------------------------------------------------------------------
; _bn_sqr_comba4 -- fully unrolled 4-word squaring:
; r[0..7] = a[0..3] * a[0..3], computed one result word (column) at a
; time.
;
; Stack arguments (32-bit, caller cleans up):
;   arg1  r  pointer to 8 result words, written
;   arg2  a  pointer to 4 words, read
; No meaningful return value is set up in eax.
; Saves/restores ebx, ebp, esi, edi. Clobbers eax, ecx, edx, flags.
;
; Register roles after the prologue:
;   edi = r, esi = a
;   ebx / ecx / ebp = three-word column accumulator; the roles rotate
;                     by one register for every result word
;   eax / edx       = MUL operands, then the 64-bit product edx:eax
; Each off-diagonal product a[i]*a[j] (i != j) is computed once and
; doubled (add eax,eax / adc edx,edx / adc high,0) before being
; accumulated. Diagonal products a[i]*a[i] are added once.
; Loads for the next product are interleaved into the add/adc carry
; chain. That is safe because MOV does not modify the flags.
; ---------------------------------------------------------------------
ALIGN 16
_bn_sqr_comba4 PROC PUBLIC
$L_bn_sqr_comba4_begin::
push esi
push edi
push ebp
push ebx
; Four pushes plus the return address: the first argument is at 20[esp].
mov edi,DWORD PTR 20[esp]
mov esi,DWORD PTR 24[esp]
xor ebx,ebx
xor ecx,ecx
mov eax,DWORD PTR [esi]
; ############### Calculate word 0
; accumulator low/mid/high = ebx/ecx/ebp
xor ebp,ebp
; sqr a[0]*a[0]
mul eax
add ebx,eax
adc ecx,edx
mov edx,DWORD PTR [esi]
adc ebp,0
mov DWORD PTR [edi],ebx
mov eax,DWORD PTR 4[esi]
; saved r[0]
; ############### Calculate word 1
; accumulator low/mid/high = ecx/ebp/ebx
xor ebx,ebx
; sqr a[1]*a[0]
mul edx
add eax,eax
adc edx,edx
adc ebx,0
add ecx,eax
adc ebp,edx
mov eax,DWORD PTR 8[esi]
adc ebx,0
mov DWORD PTR 4[edi],ecx
mov edx,DWORD PTR [esi]
; saved r[1]
; ############### Calculate word 2
; accumulator low/mid/high = ebp/ebx/ecx
xor ecx,ecx
; sqr a[2]*a[0]
mul edx
add eax,eax
adc edx,edx
adc ecx,0
add ebp,eax
adc ebx,edx
mov eax,DWORD PTR 4[esi]
adc ecx,0
; sqr a[1]*a[1]
mul eax
add ebp,eax
adc ebx,edx
mov edx,DWORD PTR [esi]
adc ecx,0
mov DWORD PTR 8[edi],ebp
mov eax,DWORD PTR 12[esi]
; saved r[2]
; ############### Calculate word 3
; accumulator low/mid/high = ebx/ecx/ebp
xor ebp,ebp
; sqr a[3]*a[0]
mul edx
add eax,eax
adc edx,edx
adc ebp,0
add ebx,eax
adc ecx,edx
mov eax,DWORD PTR 8[esi]
adc ebp,0
mov edx,DWORD PTR 4[esi]
; sqr a[2]*a[1]
mul edx
add eax,eax
adc edx,edx
adc ebp,0
add ebx,eax
adc ecx,edx
mov eax,DWORD PTR 12[esi]
adc ebp,0
mov DWORD PTR 12[edi],ebx
mov edx,DWORD PTR 4[esi]
; saved r[3]
; ############### Calculate word 4
; accumulator low/mid/high = ecx/ebp/ebx
xor ebx,ebx
; sqr a[3]*a[1]
mul edx
add eax,eax
adc edx,edx
adc ebx,0
add ecx,eax
adc ebp,edx
mov eax,DWORD PTR 8[esi]
adc ebx,0
; sqr a[2]*a[2]
mul eax
add ecx,eax
adc ebp,edx
mov edx,DWORD PTR 8[esi]
adc ebx,0
mov DWORD PTR 16[edi],ecx
mov eax,DWORD PTR 12[esi]
; saved r[4]
; ############### Calculate word 5
; accumulator low/mid/high = ebp/ebx/ecx
xor ecx,ecx
; sqr a[3]*a[2]
mul edx
add eax,eax
adc edx,edx
adc ecx,0
add ebp,eax
adc ebx,edx
mov eax,DWORD PTR 12[esi]
adc ecx,0
mov DWORD PTR 20[edi],ebp
; saved r[5]
; ############### Calculate word 6
; accumulator low/mid/high = ebx/ecx/ebp
xor ebp,ebp
; sqr a[3]*a[3]
mul eax
add ebx,eax
adc ecx,edx
; The carry collected into ebp here is never stored: r has only 8 words.
adc ebp,0
mov DWORD PTR 24[edi],ebx
; saved r[6]
; save r[7]
mov DWORD PTR 28[edi],ecx
; Restore the saved registers in reverse push order.
pop ebx
pop ebp
pop edi
pop esi
ret
_bn_sqr_comba4 ENDP
; Close the code segment opened at the top of the file and end the module.
.text$ ENDS
END