TITLE	../openssl/crypto/bn/asm/co-586.asm
; ----------------------------------------------------------------------
; Syntax: MASM (Intel operand order), 32-bit flat model, .686.
;
; Four fully unrolled routines are defined in this file:
;   _bn_mul_comba8   r[0..15] = a[0..7] * b[0..7]
;   _bn_mul_comba4   r[0..7]  = a[0..3] * b[0..3]
;   _bn_sqr_comba8   r[0..15] = a[0..7] * a[0..7]
;   _bn_sqr_comba4   r[0..7]  = a[0..3] * a[0..3]
; All operands are arrays of 32-bit words (DWORD PTR accesses).
;
; Common scheme: result word k is the sum of all products whose operand
; indices add up to k.  Three registers (ebx, ecx, ebp) hold a running
; low/middle/top accumulator.  For each word the register that becomes
; the new top is cleared, every 64-bit product edx:eax is added into
; low/middle with the carry collected in top, the low register is
; stored to r[k], and the three roles rotate by one for the next word.
;
; The MOV loads placed between ADD and ADC do not modify the flags, so
; the carry chain survives them.  The instruction order must therefore
; not be changed casually.
;
; Every routine saves and restores esi, edi, ebp and ebx; eax, ecx, edx
; and the flags are overwritten.  Each routine ends with a plain RET
; (no stack adjustment by the callee).
; ----------------------------------------------------------------------
IF @Version LT 800
ECHO MASM version 8.00 or later is strongly recommended.
ENDIF
.686
.MODEL	FLAT
OPTION	DOTNAME
IF @Version LT 800
.text$	SEGMENT PAGE 'CODE'
ELSE
.text$	SEGMENT ALIGN(64) 'CODE'
ENDIF
ALIGN	16
; ----------------------------------------------------------------------
; _bn_mul_comba8
;   Stack arguments (each 4 bytes):
;     1st = r  destination, r[0]..r[15] are written
;     2nd = a  source, a[0]..a[7] are read   (kept in esi)
;     3rd = b  source, b[0]..b[7] are read   (kept in edi)
;   r is not kept in a register; it is reloaded from 20[esp] into eax
;   before every store.
;   NOTE(review): presumably matches a C prototype of the form
;   void bn_mul_comba8(BN_ULONG *r, BN_ULONG *a, BN_ULONG *b) - confirm.
; ----------------------------------------------------------------------
_bn_mul_comba8	PROC PUBLIC
$L_bn_mul_comba8_begin::
	push	esi
	mov	esi,DWORD PTR 12[esp]	; esi = a (2nd argument, one push so far)
	push	edi
	mov	edi,DWORD PTR 20[esp]	; edi = b (3rd argument, two pushes so far)
	push	ebp
	push	ebx
	; from here on 20[esp] is the 1st argument (r): 4 pushes + return address
	xor	ebx,ebx
	mov	eax,DWORD PTR [esi]
	xor	ecx,ecx
	mov	edx,DWORD PTR [edi]
	; ################## Calculate word 0
	xor	ebp,ebp
	; mul a[0]*b[0]
	mul	edx
	add	ebx,eax
	mov	eax,DWORD PTR 20[esp]
	adc	ecx,edx
	mov	edx,DWORD PTR [edi]
	adc	ebp,0
	mov	DWORD PTR [eax],ebx
	mov	eax,DWORD PTR 4[esi]
	; saved r[0]
	; ################## Calculate word 1
	xor	ebx,ebx
	; mul a[1]*b[0]
	mul	edx
	add	ecx,eax
	mov	eax,DWORD PTR [esi]
	adc	ebp,edx
	mov	edx,DWORD PTR 4[edi]
	adc	ebx,0
	; mul a[0]*b[1]
	mul	edx
	add	ecx,eax
	mov	eax,DWORD PTR 20[esp]
	adc	ebp,edx
	mov	edx,DWORD PTR [edi]
	adc	ebx,0
	mov	DWORD PTR 4[eax],ecx
	mov	eax,DWORD PTR 8[esi]
	; saved r[1]
	; ################## Calculate word 2
	xor	ecx,ecx
	; mul a[2]*b[0]
	mul	edx
	add	ebp,eax
	mov	eax,DWORD PTR 4[esi]
	adc	ebx,edx
	mov	edx,DWORD PTR 4[edi]
	adc	ecx,0
	; mul a[1]*b[1]
	mul	edx
	add	ebp,eax
	mov	eax,DWORD PTR [esi]
	adc	ebx,edx
	mov	edx,DWORD PTR 8[edi]
	adc	ecx,0
	; mul a[0]*b[2]
	mul	edx
	add	ebp,eax
	mov	eax,DWORD PTR 20[esp]
	adc	ebx,edx
	mov	edx,DWORD PTR [edi]
	adc	ecx,0
	mov	DWORD PTR 8[eax],ebp
	mov	eax,DWORD PTR 12[esi]
	; saved r[2]
	; ################## Calculate word 3
	xor	ebp,ebp
	; mul a[3]*b[0]
	mul	edx
	add	ebx,eax
	mov	eax,DWORD PTR 8[esi]
	adc	ecx,edx
	mov	edx,DWORD PTR 4[edi]
	adc	ebp,0
	; mul a[2]*b[1]
	mul	edx
	add	ebx,eax
	mov	eax,DWORD PTR 4[esi]
	adc	ecx,edx
	mov	edx,DWORD PTR 8[edi]
	adc	ebp,0
	; mul a[1]*b[2]
	mul	edx
	add	ebx,eax
	mov	eax,DWORD PTR [esi]
	adc	ecx,edx
	mov	edx,DWORD PTR 12[edi]
	adc	ebp,0
	; mul a[0]*b[3]
	mul	edx
	add	ebx,eax
	mov	eax,DWORD PTR 20[esp]
	adc	ecx,edx
	mov	edx,DWORD PTR [edi]
	adc	ebp,0
	mov	DWORD PTR 12[eax],ebx
	mov	eax,DWORD PTR 16[esi]
	; saved r[3]
	; ################## Calculate word 4
	xor	ebx,ebx
	; mul a[4]*b[0]
	mul	edx
	add	ecx,eax
	mov	eax,DWORD PTR 12[esi]
	adc	ebp,edx
	mov	edx,DWORD PTR 4[edi]
	adc	ebx,0
	; mul a[3]*b[1]
	mul	edx
	add	ecx,eax
	mov	eax,DWORD PTR 8[esi]
	adc	ebp,edx
	mov	edx,DWORD PTR 8[edi]
	adc	ebx,0
	; mul a[2]*b[2]
	mul	edx
	add	ecx,eax
	mov	eax,DWORD PTR 4[esi]
	adc	ebp,edx
	mov	edx,DWORD PTR 12[edi]
	adc	ebx,0
	; mul a[1]*b[3]
	mul	edx
	add	ecx,eax
	mov	eax,DWORD PTR [esi]
	adc	ebp,edx
	mov	edx,DWORD PTR 16[edi]
	adc	ebx,0
	; mul a[0]*b[4]
	mul	edx
	add	ecx,eax
	mov	eax,DWORD PTR 20[esp]
	adc	ebp,edx
	mov	edx,DWORD PTR [edi]
	adc	ebx,0
	mov	DWORD PTR 16[eax],ecx
	mov	eax,DWORD PTR 20[esi]
	; saved r[4]
	; ################## Calculate word 5
	xor	ecx,ecx
	; mul a[5]*b[0]
	mul	edx
	add	ebp,eax
	mov	eax,DWORD PTR 16[esi]
	adc	ebx,edx
	mov	edx,DWORD PTR 4[edi]
	adc	ecx,0
	; mul a[4]*b[1]
	mul	edx
	add	ebp,eax
	mov	eax,DWORD PTR 12[esi]
	adc	ebx,edx
	mov	edx,DWORD PTR 8[edi]
	adc	ecx,0
	; mul a[3]*b[2]
	mul	edx
	add	ebp,eax
	mov	eax,DWORD PTR 8[esi]
	adc	ebx,edx
	mov	edx,DWORD PTR 12[edi]
	adc	ecx,0
	; mul a[2]*b[3]
	mul	edx
	add	ebp,eax
	mov	eax,DWORD PTR 4[esi]
	adc	ebx,edx
	mov	edx,DWORD PTR 16[edi]
	adc	ecx,0
	; mul a[1]*b[4]
	mul	edx
	add	ebp,eax
	mov	eax,DWORD PTR [esi]
	adc	ebx,edx
	mov	edx,DWORD PTR 20[edi]
	adc	ecx,0
	; mul a[0]*b[5]
	mul	edx
	add	ebp,eax
	mov	eax,DWORD PTR 20[esp]
	adc	ebx,edx
	mov	edx,DWORD PTR [edi]
	adc	ecx,0
	mov	DWORD PTR 20[eax],ebp
	mov	eax,DWORD PTR 24[esi]
	; saved r[5]
	; ################## Calculate word 6
	xor	ebp,ebp
	; mul a[6]*b[0]
	mul	edx
	add	ebx,eax
	mov	eax,DWORD PTR 20[esi]
	adc	ecx,edx
	mov	edx,DWORD PTR 4[edi]
	adc	ebp,0
	; mul a[5]*b[1]
	mul	edx
	add	ebx,eax
	mov	eax,DWORD PTR 16[esi]
	adc	ecx,edx
	mov	edx,DWORD PTR 8[edi]
	adc	ebp,0
	; mul a[4]*b[2]
	mul	edx
	add	ebx,eax
	mov	eax,DWORD PTR 12[esi]
	adc	ecx,edx
	mov	edx,DWORD PTR 12[edi]
	adc	ebp,0
	; mul a[3]*b[3]
	mul	edx
	add	ebx,eax
	mov	eax,DWORD PTR 8[esi]
	adc	ecx,edx
	mov	edx,DWORD PTR 16[edi]
	adc	ebp,0
	; mul a[2]*b[4]
	mul	edx
	add	ebx,eax
	mov	eax,DWORD PTR 4[esi]
	adc	ecx,edx
	mov	edx,DWORD PTR 20[edi]
	adc	ebp,0
	; mul a[1]*b[5]
	mul	edx
	add	ebx,eax
	mov	eax,DWORD PTR [esi]
	adc	ecx,edx
	mov	edx,DWORD PTR 24[edi]
	adc	ebp,0
	; mul a[0]*b[6]
	mul	edx
	add	ebx,eax
	mov	eax,DWORD PTR 20[esp]
	adc	ecx,edx
	mov	edx,DWORD PTR [edi]
	adc	ebp,0
	mov	DWORD PTR 24[eax],ebx
	mov	eax,DWORD PTR 28[esi]
	; saved r[6]
	; ################## Calculate word 7
	xor	ebx,ebx
	; mul a[7]*b[0]
	mul	edx
	add	ecx,eax
	mov	eax,DWORD PTR 24[esi]
	adc	ebp,edx
	mov	edx,DWORD PTR 4[edi]
	adc	ebx,0
	; mul a[6]*b[1]
	mul	edx
	add	ecx,eax
	mov	eax,DWORD PTR 20[esi]
	adc	ebp,edx
	mov	edx,DWORD PTR 8[edi]
	adc	ebx,0
	; mul a[5]*b[2]
	mul	edx
	add	ecx,eax
	mov	eax,DWORD PTR 16[esi]
	adc	ebp,edx
	mov	edx,DWORD PTR 12[edi]
	adc	ebx,0
	; mul a[4]*b[3]
	mul	edx
	add	ecx,eax
	mov	eax,DWORD PTR 12[esi]
	adc	ebp,edx
	mov	edx,DWORD PTR 16[edi]
	adc	ebx,0
	; mul a[3]*b[4]
	mul	edx
	add	ecx,eax
	mov	eax,DWORD PTR 8[esi]
	adc	ebp,edx
	mov	edx,DWORD PTR 20[edi]
	adc	ebx,0
	; mul a[2]*b[5]
	mul	edx
	add	ecx,eax
	mov	eax,DWORD PTR 4[esi]
	adc	ebp,edx
	mov	edx,DWORD PTR 24[edi]
	adc	ebx,0
	; mul a[1]*b[6]
	mul	edx
	add	ecx,eax
	mov	eax,DWORD PTR [esi]
	adc	ebp,edx
	mov	edx,DWORD PTR 28[edi]
	adc	ebx,0
	; mul a[0]*b[7]
	mul	edx
	add	ecx,eax
	mov	eax,DWORD PTR 20[esp]
	adc	ebp,edx
	mov	edx,DWORD PTR 4[edi]
	adc	ebx,0
	mov	DWORD PTR 28[eax],ecx
	mov	eax,DWORD PTR 28[esi]
	; saved r[7]
	; from word 8 on, each word starts at a[7] and the lowest b index rises
	; ################## Calculate word 8
	xor	ecx,ecx
	; mul a[7]*b[1]
	mul	edx
	add	ebp,eax
	mov	eax,DWORD PTR 24[esi]
	adc	ebx,edx
	mov	edx,DWORD PTR 8[edi]
	adc	ecx,0
	; mul a[6]*b[2]
	mul	edx
	add	ebp,eax
	mov	eax,DWORD PTR 20[esi]
	adc	ebx,edx
	mov	edx,DWORD PTR 12[edi]
	adc	ecx,0
	; mul a[5]*b[3]
	mul	edx
	add	ebp,eax
	mov	eax,DWORD PTR 16[esi]
	adc	ebx,edx
	mov	edx,DWORD PTR 16[edi]
	adc	ecx,0
	; mul a[4]*b[4]
	mul	edx
	add	ebp,eax
	mov	eax,DWORD PTR 12[esi]
	adc	ebx,edx
	mov	edx,DWORD PTR 20[edi]
	adc	ecx,0
	; mul a[3]*b[5]
	mul	edx
	add	ebp,eax
	mov	eax,DWORD PTR 8[esi]
	adc	ebx,edx
	mov	edx,DWORD PTR 24[edi]
	adc	ecx,0
	; mul a[2]*b[6]
	mul	edx
	add	ebp,eax
	mov	eax,DWORD PTR 4[esi]
	adc	ebx,edx
	mov	edx,DWORD PTR 28[edi]
	adc	ecx,0
	; mul a[1]*b[7]
	mul	edx
	add	ebp,eax
	mov	eax,DWORD PTR 20[esp]
	adc	ebx,edx
	mov	edx,DWORD PTR 8[edi]
	adc	ecx,0
	mov	DWORD PTR 32[eax],ebp
	mov	eax,DWORD PTR 28[esi]
	; saved r[8]
	; ################## Calculate word 9
	xor	ebp,ebp
	; mul a[7]*b[2]
	mul	edx
	add	ebx,eax
	mov	eax,DWORD PTR 24[esi]
	adc	ecx,edx
	mov	edx,DWORD PTR 12[edi]
	adc	ebp,0
	; mul a[6]*b[3]
	mul	edx
	add	ebx,eax
	mov	eax,DWORD PTR 20[esi]
	adc	ecx,edx
	mov	edx,DWORD PTR 16[edi]
	adc	ebp,0
	; mul a[5]*b[4]
	mul	edx
	add	ebx,eax
	mov	eax,DWORD PTR 16[esi]
	adc	ecx,edx
	mov	edx,DWORD PTR 20[edi]
	adc	ebp,0
	; mul a[4]*b[5]
	mul	edx
	add	ebx,eax
	mov	eax,DWORD PTR 12[esi]
	adc	ecx,edx
	mov	edx,DWORD PTR 24[edi]
	adc	ebp,0
	; mul a[3]*b[6]
	mul	edx
	add	ebx,eax
	mov	eax,DWORD PTR 8[esi]
	adc	ecx,edx
	mov	edx,DWORD PTR 28[edi]
	adc	ebp,0
	; mul a[2]*b[7]
	mul	edx
	add	ebx,eax
	mov	eax,DWORD PTR 20[esp]
	adc	ecx,edx
	mov	edx,DWORD PTR 12[edi]
	adc	ebp,0
	mov	DWORD PTR 36[eax],ebx
	mov	eax,DWORD PTR 28[esi]
	; saved r[9]
	; ################## Calculate word 10
	xor	ebx,ebx
	; mul a[7]*b[3]
	mul	edx
	add	ecx,eax
	mov	eax,DWORD PTR 24[esi]
	adc	ebp,edx
	mov	edx,DWORD PTR 16[edi]
	adc	ebx,0
	; mul a[6]*b[4]
	mul	edx
	add	ecx,eax
	mov	eax,DWORD PTR 20[esi]
	adc	ebp,edx
	mov	edx,DWORD PTR 20[edi]
	adc	ebx,0
	; mul a[5]*b[5]
	mul	edx
	add	ecx,eax
	mov	eax,DWORD PTR 16[esi]
	adc	ebp,edx
	mov	edx,DWORD PTR 24[edi]
	adc	ebx,0
	; mul a[4]*b[6]
	mul	edx
	add	ecx,eax
	mov	eax,DWORD PTR 12[esi]
	adc	ebp,edx
	mov	edx,DWORD PTR 28[edi]
	adc	ebx,0
	; mul a[3]*b[7]
	mul	edx
	add	ecx,eax
	mov	eax,DWORD PTR 20[esp]
	adc	ebp,edx
	mov	edx,DWORD PTR 16[edi]
	adc	ebx,0
	mov	DWORD PTR 40[eax],ecx
	mov	eax,DWORD PTR 28[esi]
	; saved r[10]
	; ################## Calculate word 11
	xor	ecx,ecx
	; mul a[7]*b[4]
	mul	edx
	add	ebp,eax
	mov	eax,DWORD PTR 24[esi]
	adc	ebx,edx
	mov	edx,DWORD PTR 20[edi]
	adc	ecx,0
	; mul a[6]*b[5]
	mul	edx
	add	ebp,eax
	mov	eax,DWORD PTR 20[esi]
	adc	ebx,edx
	mov	edx,DWORD PTR 24[edi]
	adc	ecx,0
	; mul a[5]*b[6]
	mul	edx
	add	ebp,eax
	mov	eax,DWORD PTR 16[esi]
	adc	ebx,edx
	mov	edx,DWORD PTR 28[edi]
	adc	ecx,0
	; mul a[4]*b[7]
	mul	edx
	add	ebp,eax
	mov	eax,DWORD PTR 20[esp]
	adc	ebx,edx
	mov	edx,DWORD PTR 20[edi]
	adc	ecx,0
	mov	DWORD PTR 44[eax],ebp
	mov	eax,DWORD PTR 28[esi]
	; saved r[11]
	; ################## Calculate word 12
	xor	ebp,ebp
	; mul a[7]*b[5]
	mul	edx
	add	ebx,eax
	mov	eax,DWORD PTR 24[esi]
	adc	ecx,edx
	mov	edx,DWORD PTR 24[edi]
	adc	ebp,0
	; mul a[6]*b[6]
	mul	edx
	add	ebx,eax
	mov	eax,DWORD PTR 20[esi]
	adc	ecx,edx
	mov	edx,DWORD PTR 28[edi]
	adc	ebp,0
	; mul a[5]*b[7]
	mul	edx
	add	ebx,eax
	mov	eax,DWORD PTR 20[esp]
	adc	ecx,edx
	mov	edx,DWORD PTR 24[edi]
	adc	ebp,0
	mov	DWORD PTR 48[eax],ebx
	mov	eax,DWORD PTR 28[esi]
	; saved r[12]
	; ################## Calculate word 13
	xor	ebx,ebx
	; mul a[7]*b[6]
	mul	edx
	add	ecx,eax
	mov	eax,DWORD PTR 24[esi]
	adc	ebp,edx
	mov	edx,DWORD PTR 28[edi]
	adc	ebx,0
	; mul a[6]*b[7]
	mul	edx
	add	ecx,eax
	mov	eax,DWORD PTR 20[esp]
	adc	ebp,edx
	mov	edx,DWORD PTR 28[edi]
	adc	ebx,0
	mov	DWORD PTR 52[eax],ecx
	mov	eax,DWORD PTR 28[esi]
	; saved r[13]
	; ################## Calculate word 14
	xor	ecx,ecx
	; mul a[7]*b[7]
	mul	edx
	add	ebp,eax
	mov	eax,DWORD PTR 20[esp]
	adc	ebx,edx
	adc	ecx,0			; ecx is not stored after this point
	mov	DWORD PTR 56[eax],ebp
	; saved r[14]
	; save r[15]
	mov	DWORD PTR 60[eax],ebx
	; restore the registers pushed on entry, in reverse order
	pop	ebx
	pop	ebp
	pop	edi
	pop	esi
	ret
_bn_mul_comba8 ENDP
ALIGN	16
; ----------------------------------------------------------------------
; _bn_mul_comba4
;   Same scheme and argument layout as _bn_mul_comba8, for 4-word inputs:
;     1st = r  destination, r[0]..r[7] are written (reloaded from 20[esp])
;     2nd = a  source, a[0]..a[3] are read   (kept in esi)
;     3rd = b  source, b[0]..b[3] are read   (kept in edi)
;   NOTE(review): presumably matches a C prototype of the form
;   void bn_mul_comba4(BN_ULONG *r, BN_ULONG *a, BN_ULONG *b) - confirm.
; ----------------------------------------------------------------------
_bn_mul_comba4	PROC PUBLIC
$L_bn_mul_comba4_begin::
	push	esi
	mov	esi,DWORD PTR 12[esp]	; esi = a (2nd argument, one push so far)
	push	edi
	mov	edi,DWORD PTR 20[esp]	; edi = b (3rd argument, two pushes so far)
	push	ebp
	push	ebx
	; from here on 20[esp] is the 1st argument (r)
	xor	ebx,ebx
	mov	eax,DWORD PTR [esi]
	xor	ecx,ecx
	mov	edx,DWORD PTR [edi]
	; ################## Calculate word 0
	xor	ebp,ebp
	; mul a[0]*b[0]
	mul	edx
	add	ebx,eax
	mov	eax,DWORD PTR 20[esp]
	adc	ecx,edx
	mov	edx,DWORD PTR [edi]
	adc	ebp,0
	mov	DWORD PTR [eax],ebx
	mov	eax,DWORD PTR 4[esi]
	; saved r[0]
	; ################## Calculate word 1
	xor	ebx,ebx
	; mul a[1]*b[0]
	mul	edx
	add	ecx,eax
	mov	eax,DWORD PTR [esi]
	adc	ebp,edx
	mov	edx,DWORD PTR 4[edi]
	adc	ebx,0
	; mul a[0]*b[1]
	mul	edx
	add	ecx,eax
	mov	eax,DWORD PTR 20[esp]
	adc	ebp,edx
	mov	edx,DWORD PTR [edi]
	adc	ebx,0
	mov	DWORD PTR 4[eax],ecx
	mov	eax,DWORD PTR 8[esi]
	; saved r[1]
	; ################## Calculate word 2
	xor	ecx,ecx
	; mul a[2]*b[0]
	mul	edx
	add	ebp,eax
	mov	eax,DWORD PTR 4[esi]
	adc	ebx,edx
	mov	edx,DWORD PTR 4[edi]
	adc	ecx,0
	; mul a[1]*b[1]
	mul	edx
	add	ebp,eax
	mov	eax,DWORD PTR [esi]
	adc	ebx,edx
	mov	edx,DWORD PTR 8[edi]
	adc	ecx,0
	; mul a[0]*b[2]
	mul	edx
	add	ebp,eax
	mov	eax,DWORD PTR 20[esp]
	adc	ebx,edx
	mov	edx,DWORD PTR [edi]
	adc	ecx,0
	mov	DWORD PTR 8[eax],ebp
	mov	eax,DWORD PTR 12[esi]
	; saved r[2]
	; ################## Calculate word 3
	xor	ebp,ebp
	; mul a[3]*b[0]
	mul	edx
	add	ebx,eax
	mov	eax,DWORD PTR 8[esi]
	adc	ecx,edx
	mov	edx,DWORD PTR 4[edi]
	adc	ebp,0
	; mul a[2]*b[1]
	mul	edx
	add	ebx,eax
	mov	eax,DWORD PTR 4[esi]
	adc	ecx,edx
	mov	edx,DWORD PTR 8[edi]
	adc	ebp,0
	; mul a[1]*b[2]
	mul	edx
	add	ebx,eax
	mov	eax,DWORD PTR [esi]
	adc	ecx,edx
	mov	edx,DWORD PTR 12[edi]
	adc	ebp,0
	; mul a[0]*b[3]
	mul	edx
	add	ebx,eax
	mov	eax,DWORD PTR 20[esp]
	adc	ecx,edx
	mov	edx,DWORD PTR 4[edi]
	adc	ebp,0
	mov	DWORD PTR 12[eax],ebx
	mov	eax,DWORD PTR 12[esi]
	; saved r[3]
	; ################## Calculate word 4
	xor	ebx,ebx
	; mul a[3]*b[1]
	mul	edx
	add	ecx,eax
	mov	eax,DWORD PTR 8[esi]
	adc	ebp,edx
	mov	edx,DWORD PTR 8[edi]
	adc	ebx,0
	; mul a[2]*b[2]
	mul	edx
	add	ecx,eax
	mov	eax,DWORD PTR 4[esi]
	adc	ebp,edx
	mov	edx,DWORD PTR 12[edi]
	adc	ebx,0
	; mul a[1]*b[3]
	mul	edx
	add	ecx,eax
	mov	eax,DWORD PTR 20[esp]
	adc	ebp,edx
	mov	edx,DWORD PTR 8[edi]
	adc	ebx,0
	mov	DWORD PTR 16[eax],ecx
	mov	eax,DWORD PTR 12[esi]
	; saved r[4]
	; ################## Calculate word 5
	xor	ecx,ecx
	; mul a[3]*b[2]
	mul	edx
	add	ebp,eax
	mov	eax,DWORD PTR 8[esi]
	adc	ebx,edx
	mov	edx,DWORD PTR 12[edi]
	adc	ecx,0
	; mul a[2]*b[3]
	mul	edx
	add	ebp,eax
	mov	eax,DWORD PTR 20[esp]
	adc	ebx,edx
	mov	edx,DWORD PTR 12[edi]
	adc	ecx,0
	mov	DWORD PTR 20[eax],ebp
	mov	eax,DWORD PTR 12[esi]
	; saved r[5]
	; ################## Calculate word 6
	xor	ebp,ebp
	; mul a[3]*b[3]
	mul	edx
	add	ebx,eax
	mov	eax,DWORD PTR 20[esp]
	adc	ecx,edx
	adc	ebp,0			; ebp is not stored after this point
	mov	DWORD PTR 24[eax],ebx
	; saved r[6]
	; save r[7]
	mov	DWORD PTR 28[eax],ecx
	; restore the registers pushed on entry, in reverse order
	pop	ebx
	pop	ebp
	pop	edi
	pop	esi
	ret
_bn_mul_comba4 ENDP
ALIGN	16
; ----------------------------------------------------------------------
; _bn_sqr_comba8
;   Stack arguments (each 4 bytes), read after all four pushes:
;     1st = r  destination, r[0]..r[15] are written  (kept in edi)
;     2nd = a  source, a[0]..a[7] are read           (kept in esi)
;   A cross product a[i]*a[j] with i != j is computed once and doubled
;   before it is accumulated:
;       add eax,eax / adc edx,edx / adc <top>,0
;   shifts the 64-bit product edx:eax left by one bit and adds the bit
;   shifted out to the top accumulator.  Diagonal products a[i]*a[i]
;   (mul eax) are accumulated once, without doubling.
;   NOTE(review): presumably matches a C prototype of the form
;   void bn_sqr_comba8(BN_ULONG *r, const BN_ULONG *a) - confirm.
; ----------------------------------------------------------------------
_bn_sqr_comba8	PROC PUBLIC
$L_bn_sqr_comba8_begin::
	push	esi
	push	edi
	push	ebp
	push	ebx
	mov	edi,DWORD PTR 20[esp]	; edi = r (1st argument)
	mov	esi,DWORD PTR 24[esp]	; esi = a (2nd argument)
	xor	ebx,ebx
	xor	ecx,ecx
	mov	eax,DWORD PTR [esi]
	; ############### Calculate word 0
	xor	ebp,ebp
	; sqr a[0]*a[0]
	mul	eax
	add	ebx,eax
	adc	ecx,edx
	mov	edx,DWORD PTR [esi]
	adc	ebp,0
	mov	DWORD PTR [edi],ebx
	mov	eax,DWORD PTR 4[esi]
	; saved r[0]
	; ############### Calculate word 1
	xor	ebx,ebx
	; sqr a[1]*a[0]
	mul	edx
	add	eax,eax			; double the cross product edx:eax ...
	adc	edx,edx
	adc	ebx,0			; ... and keep the bit shifted out
	add	ecx,eax
	adc	ebp,edx
	mov	eax,DWORD PTR 8[esi]
	adc	ebx,0
	mov	DWORD PTR 4[edi],ecx
	mov	edx,DWORD PTR [esi]
	; saved r[1]
	; ############### Calculate word 2
	xor	ecx,ecx
	; sqr a[2]*a[0]
	mul	edx
	add	eax,eax
	adc	edx,edx
	adc	ecx,0
	add	ebp,eax
	adc	ebx,edx
	mov	eax,DWORD PTR 4[esi]
	adc	ecx,0
	; sqr a[1]*a[1]
	mul	eax
	add	ebp,eax
	adc	ebx,edx
	mov	edx,DWORD PTR [esi]
	adc	ecx,0
	mov	DWORD PTR 8[edi],ebp
	mov	eax,DWORD PTR 12[esi]
	; saved r[2]
	; ############### Calculate word 3
	xor	ebp,ebp
	; sqr a[3]*a[0]
	mul	edx
	add	eax,eax
	adc	edx,edx
	adc	ebp,0
	add	ebx,eax
	adc	ecx,edx
	mov	eax,DWORD PTR 8[esi]
	adc	ebp,0
	mov	edx,DWORD PTR 4[esi]
	; sqr a[2]*a[1]
	mul	edx
	add	eax,eax
	adc	edx,edx
	adc	ebp,0
	add	ebx,eax
	adc	ecx,edx
	mov	eax,DWORD PTR 16[esi]
	adc	ebp,0
	mov	DWORD PTR 12[edi],ebx
	mov	edx,DWORD PTR [esi]
	; saved r[3]
	; ############### Calculate word 4
	xor	ebx,ebx
	; sqr a[4]*a[0]
	mul	edx
	add	eax,eax
	adc	edx,edx
	adc	ebx,0
	add	ecx,eax
	adc	ebp,edx
	mov	eax,DWORD PTR 12[esi]
	adc	ebx,0
	mov	edx,DWORD PTR 4[esi]
	; sqr a[3]*a[1]
	mul	edx
	add	eax,eax
	adc	edx,edx
	adc	ebx,0
	add	ecx,eax
	adc	ebp,edx
	mov	eax,DWORD PTR 8[esi]
	adc	ebx,0
	; sqr a[2]*a[2]
	mul	eax
	add	ecx,eax
	adc	ebp,edx
	mov	edx,DWORD PTR [esi]
	adc	ebx,0
	mov	DWORD PTR 16[edi],ecx
	mov	eax,DWORD PTR 20[esi]
	; saved r[4]
	; ############### Calculate word 5
	xor	ecx,ecx
	; sqr a[5]*a[0]
	mul	edx
	add	eax,eax
	adc	edx,edx
	adc	ecx,0
	add	ebp,eax
	adc	ebx,edx
	mov	eax,DWORD PTR 16[esi]
	adc	ecx,0
	mov	edx,DWORD PTR 4[esi]
	; sqr a[4]*a[1]
	mul	edx
	add	eax,eax
	adc	edx,edx
	adc	ecx,0
	add	ebp,eax
	adc	ebx,edx
	mov	eax,DWORD PTR 12[esi]
	adc	ecx,0
	mov	edx,DWORD PTR 8[esi]
	; sqr a[3]*a[2]
	mul	edx
	add	eax,eax
	adc	edx,edx
	adc	ecx,0
	add	ebp,eax
	adc	ebx,edx
	mov	eax,DWORD PTR 24[esi]
	adc	ecx,0
	mov	DWORD PTR 20[edi],ebp
	mov	edx,DWORD PTR [esi]
	; saved r[5]
	; ############### Calculate word 6
	xor	ebp,ebp
	; sqr a[6]*a[0]
	mul	edx
	add	eax,eax
	adc	edx,edx
	adc	ebp,0
	add	ebx,eax
	adc	ecx,edx
	mov	eax,DWORD PTR 20[esi]
	adc	ebp,0
	mov	edx,DWORD PTR 4[esi]
	; sqr a[5]*a[1]
	mul	edx
	add	eax,eax
	adc	edx,edx
	adc	ebp,0
	add	ebx,eax
	adc	ecx,edx
	mov	eax,DWORD PTR 16[esi]
	adc	ebp,0
	mov	edx,DWORD PTR 8[esi]
	; sqr a[4]*a[2]
	mul	edx
	add	eax,eax
	adc	edx,edx
	adc	ebp,0
	add	ebx,eax
	adc	ecx,edx
	mov	eax,DWORD PTR 12[esi]
	adc	ebp,0
	; sqr a[3]*a[3]
	mul	eax
	add	ebx,eax
	adc	ecx,edx
	mov	edx,DWORD PTR [esi]
	adc	ebp,0
	mov	DWORD PTR 24[edi],ebx
	mov	eax,DWORD PTR 28[esi]
	; saved r[6]
	; ############### Calculate word 7
	xor	ebx,ebx
	; sqr a[7]*a[0]
	mul	edx
	add	eax,eax
	adc	edx,edx
	adc	ebx,0
	add	ecx,eax
	adc	ebp,edx
	mov	eax,DWORD PTR 24[esi]
	adc	ebx,0
	mov	edx,DWORD PTR 4[esi]
	; sqr a[6]*a[1]
	mul	edx
	add	eax,eax
	adc	edx,edx
	adc	ebx,0
	add	ecx,eax
	adc	ebp,edx
	mov	eax,DWORD PTR 20[esi]
	adc	ebx,0
	mov	edx,DWORD PTR 8[esi]
	; sqr a[5]*a[2]
	mul	edx
	add	eax,eax
	adc	edx,edx
	adc	ebx,0
	add	ecx,eax
	adc	ebp,edx
	mov	eax,DWORD PTR 16[esi]
	adc	ebx,0
	mov	edx,DWORD PTR 12[esi]
	; sqr a[4]*a[3]
	mul	edx
	add	eax,eax
	adc	edx,edx
	adc	ebx,0
	add	ecx,eax
	adc	ebp,edx
	mov	eax,DWORD PTR 28[esi]
	adc	ebx,0
	mov	DWORD PTR 28[edi],ecx
	mov	edx,DWORD PTR 4[esi]
	; saved r[7]
	; ############### Calculate word 8
	xor	ecx,ecx
	; sqr a[7]*a[1]
	mul	edx
	add	eax,eax
	adc	edx,edx
	adc	ecx,0
	add	ebp,eax
	adc	ebx,edx
	mov	eax,DWORD PTR 24[esi]
	adc	ecx,0
	mov	edx,DWORD PTR 8[esi]
	; sqr a[6]*a[2]
	mul	edx
	add	eax,eax
	adc	edx,edx
	adc	ecx,0
	add	ebp,eax
	adc	ebx,edx
	mov	eax,DWORD PTR 20[esi]
	adc	ecx,0
	mov	edx,DWORD PTR 12[esi]
	; sqr a[5]*a[3]
	mul	edx
	add	eax,eax
	adc	edx,edx
	adc	ecx,0
	add	ebp,eax
	adc	ebx,edx
	mov	eax,DWORD PTR 16[esi]
	adc	ecx,0
	; sqr a[4]*a[4]
	mul	eax
	add	ebp,eax
	adc	ebx,edx
	mov	edx,DWORD PTR 8[esi]
	adc	ecx,0
	mov	DWORD PTR 32[edi],ebp
	mov	eax,DWORD PTR 28[esi]
	; saved r[8]
	; ############### Calculate word 9
	xor	ebp,ebp
	; sqr a[7]*a[2]
	mul	edx
	add	eax,eax
	adc	edx,edx
	adc	ebp,0
	add	ebx,eax
	adc	ecx,edx
	mov	eax,DWORD PTR 24[esi]
	adc	ebp,0
	mov	edx,DWORD PTR 12[esi]
	; sqr a[6]*a[3]
	mul	edx
	add	eax,eax
	adc	edx,edx
	adc	ebp,0
	add	ebx,eax
	adc	ecx,edx
	mov	eax,DWORD PTR 20[esi]
	adc	ebp,0
	mov	edx,DWORD PTR 16[esi]
	; sqr a[5]*a[4]
	mul	edx
	add	eax,eax
	adc	edx,edx
	adc	ebp,0
	add	ebx,eax
	adc	ecx,edx
	mov	eax,DWORD PTR 28[esi]
	adc	ebp,0
	mov	DWORD PTR 36[edi],ebx
	mov	edx,DWORD PTR 12[esi]
	; saved r[9]
	; ############### Calculate word 10
	xor	ebx,ebx
	; sqr a[7]*a[3]
	mul	edx
	add	eax,eax
	adc	edx,edx
	adc	ebx,0
	add	ecx,eax
	adc	ebp,edx
	mov	eax,DWORD PTR 24[esi]
	adc	ebx,0
	mov	edx,DWORD PTR 16[esi]
	; sqr a[6]*a[4]
	mul	edx
	add	eax,eax
	adc	edx,edx
	adc	ebx,0
	add	ecx,eax
	adc	ebp,edx
	mov	eax,DWORD PTR 20[esi]
	adc	ebx,0
	; sqr a[5]*a[5]
	mul	eax
	add	ecx,eax
	adc	ebp,edx
	mov	edx,DWORD PTR 16[esi]
	adc	ebx,0
	mov	DWORD PTR 40[edi],ecx
	mov	eax,DWORD PTR 28[esi]
	; saved r[10]
	; ############### Calculate word 11
	xor	ecx,ecx
	; sqr a[7]*a[4]
	mul	edx
	add	eax,eax
	adc	edx,edx
	adc	ecx,0
	add	ebp,eax
	adc	ebx,edx
	mov	eax,DWORD PTR 24[esi]
	adc	ecx,0
	mov	edx,DWORD PTR 20[esi]
	; sqr a[6]*a[5]
	mul	edx
	add	eax,eax
	adc	edx,edx
	adc	ecx,0
	add	ebp,eax
	adc	ebx,edx
	mov	eax,DWORD PTR 28[esi]
	adc	ecx,0
	mov	DWORD PTR 44[edi],ebp
	mov	edx,DWORD PTR 20[esi]
	; saved r[11]
	; ############### Calculate word 12
	xor	ebp,ebp
	; sqr a[7]*a[5]
	mul	edx
	add	eax,eax
	adc	edx,edx
	adc	ebp,0
	add	ebx,eax
	adc	ecx,edx
	mov	eax,DWORD PTR 24[esi]
	adc	ebp,0
	; sqr a[6]*a[6]
	mul	eax
	add	ebx,eax
	adc	ecx,edx
	mov	edx,DWORD PTR 24[esi]
	adc	ebp,0
	mov	DWORD PTR 48[edi],ebx
	mov	eax,DWORD PTR 28[esi]
	; saved r[12]
	; ############### Calculate word 13
	xor	ebx,ebx
	; sqr a[7]*a[6]
	mul	edx
	add	eax,eax
	adc	edx,edx
	adc	ebx,0
	add	ecx,eax
	adc	ebp,edx
	mov	eax,DWORD PTR 28[esi]
	adc	ebx,0
	mov	DWORD PTR 52[edi],ecx
	; saved r[13]
	; ############### Calculate word 14
	xor	ecx,ecx
	; sqr a[7]*a[7]
	mul	eax
	add	ebp,eax
	adc	ebx,edx
	adc	ecx,0			; ecx is not stored after this point
	mov	DWORD PTR 56[edi],ebp
	; saved r[14]
	; the middle accumulator becomes the top result word r[15]
	mov	DWORD PTR 60[edi],ebx
	; restore the registers pushed on entry, in reverse order
	pop	ebx
	pop	ebp
	pop	edi
	pop	esi
	ret
_bn_sqr_comba8 ENDP
ALIGN	16
; ----------------------------------------------------------------------
; _bn_sqr_comba4
;   Same scheme and argument layout as _bn_sqr_comba8, for a 4-word input:
;     1st = r  destination, r[0]..r[7] are written  (kept in edi)
;     2nd = a  source, a[0]..a[3] are read          (kept in esi)
;   Cross products are doubled via add eax,eax / adc edx,edx / adc <top>,0;
;   diagonal products (mul eax) are accumulated once.
;   NOTE(review): presumably matches a C prototype of the form
;   void bn_sqr_comba4(BN_ULONG *r, const BN_ULONG *a) - confirm.
; ----------------------------------------------------------------------
_bn_sqr_comba4	PROC PUBLIC
$L_bn_sqr_comba4_begin::
	push	esi
	push	edi
	push	ebp
	push	ebx
	mov	edi,DWORD PTR 20[esp]	; edi = r (1st argument)
	mov	esi,DWORD PTR 24[esp]	; esi = a (2nd argument)
	xor	ebx,ebx
	xor	ecx,ecx
	mov	eax,DWORD PTR [esi]
	; ############### Calculate word 0
	xor	ebp,ebp
	; sqr a[0]*a[0]
	mul	eax
	add	ebx,eax
	adc	ecx,edx
	mov	edx,DWORD PTR [esi]
	adc	ebp,0
	mov	DWORD PTR [edi],ebx
	mov	eax,DWORD PTR 4[esi]
	; saved r[0]
	; ############### Calculate word 1
	xor	ebx,ebx
	; sqr a[1]*a[0]
	mul	edx
	add	eax,eax			; double the cross product edx:eax ...
	adc	edx,edx
	adc	ebx,0			; ... and keep the bit shifted out
	add	ecx,eax
	adc	ebp,edx
	mov	eax,DWORD PTR 8[esi]
	adc	ebx,0
	mov	DWORD PTR 4[edi],ecx
	mov	edx,DWORD PTR [esi]
	; saved r[1]
	; ############### Calculate word 2
	xor	ecx,ecx
	; sqr a[2]*a[0]
	mul	edx
	add	eax,eax
	adc	edx,edx
	adc	ecx,0
	add	ebp,eax
	adc	ebx,edx
	mov	eax,DWORD PTR 4[esi]
	adc	ecx,0
	; sqr a[1]*a[1]
	mul	eax
	add	ebp,eax
	adc	ebx,edx
	mov	edx,DWORD PTR [esi]
	adc	ecx,0
	mov	DWORD PTR 8[edi],ebp
	mov	eax,DWORD PTR 12[esi]
	; saved r[2]
	; ############### Calculate word 3
	xor	ebp,ebp
	; sqr a[3]*a[0]
	mul	edx
	add	eax,eax
	adc	edx,edx
	adc	ebp,0
	add	ebx,eax
	adc	ecx,edx
	mov	eax,DWORD PTR 8[esi]
	adc	ebp,0
	mov	edx,DWORD PTR 4[esi]
	; sqr a[2]*a[1]
	mul	edx
	add	eax,eax
	adc	edx,edx
	adc	ebp,0
	add	ebx,eax
	adc	ecx,edx
	mov	eax,DWORD PTR 12[esi]
	adc	ebp,0
	mov	DWORD PTR 12[edi],ebx
	mov	edx,DWORD PTR 4[esi]
	; saved r[3]
	; ############### Calculate word 4
	xor	ebx,ebx
	; sqr a[3]*a[1]
	mul	edx
	add	eax,eax
	adc	edx,edx
	adc	ebx,0
	add	ecx,eax
	adc	ebp,edx
	mov	eax,DWORD PTR 8[esi]
	adc	ebx,0
	; sqr a[2]*a[2]
	mul	eax
	add	ecx,eax
	adc	ebp,edx
	mov	edx,DWORD PTR 8[esi]
	adc	ebx,0
	mov	DWORD PTR 16[edi],ecx
	mov	eax,DWORD PTR 12[esi]
	; saved r[4]
	; ############### Calculate word 5
	xor	ecx,ecx
	; sqr a[3]*a[2]
	mul	edx
	add	eax,eax
	adc	edx,edx
	adc	ecx,0
	add	ebp,eax
	adc	ebx,edx
	mov	eax,DWORD PTR 12[esi]
	adc	ecx,0
	mov	DWORD PTR 20[edi],ebp
	; saved r[5]
	; ############### Calculate word 6
	xor	ebp,ebp
	; sqr a[3]*a[3]
	mul	eax
	add	ebx,eax
	adc	ecx,edx
	adc	ebp,0			; ebp is not stored after this point
	mov	DWORD PTR 24[edi],ebx
	; saved r[6]
	; the middle accumulator becomes the top result word r[7]
	mov	DWORD PTR 28[edi],ecx
	; restore the registers pushed on entry, in reverse order
	pop	ebx
	pop	ebp
	pop	edi
	pop	esi
	ret
_bn_sqr_comba4 ENDP
.text$	ENDS
END