mirror of https://github.com/lukechilds/node.git
You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
2439 lines
52 KiB
2439 lines
52 KiB
TITLE ../openssl/crypto/aes/asm/aesni-x86.asm
|
|
IF @Version LT 800
|
|
ECHO MASM version 8.00 or later is strongly recommended.
|
|
ENDIF
|
|
.686
|
|
.XMM
|
|
IF @Version LT 800
|
|
XMMWORD STRUCT 16
|
|
DQ 2 dup (?)
|
|
XMMWORD ENDS
|
|
ENDIF
|
|
|
|
.MODEL FLAT
|
|
OPTION DOTNAME
|
|
IF @Version LT 800
|
|
.text$ SEGMENT PAGE 'CODE'
|
|
ELSE
|
|
.text$ SEGMENT ALIGN(64) 'CODE'
|
|
ENDIF
|
|
;EXTERN _OPENSSL_ia32cap_P:NEAR
|
|
ALIGN 16
|
|
_aesni_encrypt PROC PUBLIC
|
|
$L_aesni_encrypt_begin::
|
|
mov eax,DWORD PTR 4[esp]
|
|
mov edx,DWORD PTR 12[esp]
|
|
movups xmm2,XMMWORD PTR [eax]
|
|
mov ecx,DWORD PTR 240[edx]
|
|
mov eax,DWORD PTR 8[esp]
|
|
movups xmm0,XMMWORD PTR [edx]
|
|
movups xmm1,XMMWORD PTR 16[edx]
|
|
lea edx,DWORD PTR 32[edx]
|
|
xorps xmm2,xmm0
|
|
$L000enc1_loop_1:
|
|
DB 102,15,56,220,209
|
|
dec ecx
|
|
movups xmm1,XMMWORD PTR [edx]
|
|
lea edx,DWORD PTR 16[edx]
|
|
jnz $L000enc1_loop_1
|
|
DB 102,15,56,221,209
|
|
pxor xmm0,xmm0
|
|
pxor xmm1,xmm1
|
|
movups XMMWORD PTR [eax],xmm2
|
|
pxor xmm2,xmm2
|
|
ret
|
|
_aesni_encrypt ENDP
|
|
ALIGN 16
|
|
_aesni_decrypt PROC PUBLIC
|
|
$L_aesni_decrypt_begin::
|
|
mov eax,DWORD PTR 4[esp]
|
|
mov edx,DWORD PTR 12[esp]
|
|
movups xmm2,XMMWORD PTR [eax]
|
|
mov ecx,DWORD PTR 240[edx]
|
|
mov eax,DWORD PTR 8[esp]
|
|
movups xmm0,XMMWORD PTR [edx]
|
|
movups xmm1,XMMWORD PTR 16[edx]
|
|
lea edx,DWORD PTR 32[edx]
|
|
xorps xmm2,xmm0
|
|
$L001dec1_loop_2:
|
|
DB 102,15,56,222,209
|
|
dec ecx
|
|
movups xmm1,XMMWORD PTR [edx]
|
|
lea edx,DWORD PTR 16[edx]
|
|
jnz $L001dec1_loop_2
|
|
DB 102,15,56,223,209
|
|
pxor xmm0,xmm0
|
|
pxor xmm1,xmm1
|
|
movups XMMWORD PTR [eax],xmm2
|
|
pxor xmm2,xmm2
|
|
ret
|
|
_aesni_decrypt ENDP
|
|
ALIGN 16
|
|
__aesni_encrypt2 PROC PRIVATE
|
|
movups xmm0,XMMWORD PTR [edx]
|
|
shl ecx,4
|
|
movups xmm1,XMMWORD PTR 16[edx]
|
|
xorps xmm2,xmm0
|
|
pxor xmm3,xmm0
|
|
movups xmm0,XMMWORD PTR 32[edx]
|
|
lea edx,DWORD PTR 32[ecx*1+edx]
|
|
neg ecx
|
|
add ecx,16
|
|
$L002enc2_loop:
|
|
DB 102,15,56,220,209
|
|
DB 102,15,56,220,217
|
|
movups xmm1,XMMWORD PTR [ecx*1+edx]
|
|
add ecx,32
|
|
DB 102,15,56,220,208
|
|
DB 102,15,56,220,216
|
|
movups xmm0,XMMWORD PTR [ecx*1+edx-16]
|
|
jnz $L002enc2_loop
|
|
DB 102,15,56,220,209
|
|
DB 102,15,56,220,217
|
|
DB 102,15,56,221,208
|
|
DB 102,15,56,221,216
|
|
ret
|
|
__aesni_encrypt2 ENDP
|
|
ALIGN 16
|
|
__aesni_decrypt2 PROC PRIVATE
|
|
movups xmm0,XMMWORD PTR [edx]
|
|
shl ecx,4
|
|
movups xmm1,XMMWORD PTR 16[edx]
|
|
xorps xmm2,xmm0
|
|
pxor xmm3,xmm0
|
|
movups xmm0,XMMWORD PTR 32[edx]
|
|
lea edx,DWORD PTR 32[ecx*1+edx]
|
|
neg ecx
|
|
add ecx,16
|
|
$L003dec2_loop:
|
|
DB 102,15,56,222,209
|
|
DB 102,15,56,222,217
|
|
movups xmm1,XMMWORD PTR [ecx*1+edx]
|
|
add ecx,32
|
|
DB 102,15,56,222,208
|
|
DB 102,15,56,222,216
|
|
movups xmm0,XMMWORD PTR [ecx*1+edx-16]
|
|
jnz $L003dec2_loop
|
|
DB 102,15,56,222,209
|
|
DB 102,15,56,222,217
|
|
DB 102,15,56,223,208
|
|
DB 102,15,56,223,216
|
|
ret
|
|
__aesni_decrypt2 ENDP
|
|
ALIGN 16
|
|
__aesni_encrypt3 PROC PRIVATE
|
|
movups xmm0,XMMWORD PTR [edx]
|
|
shl ecx,4
|
|
movups xmm1,XMMWORD PTR 16[edx]
|
|
xorps xmm2,xmm0
|
|
pxor xmm3,xmm0
|
|
pxor xmm4,xmm0
|
|
movups xmm0,XMMWORD PTR 32[edx]
|
|
lea edx,DWORD PTR 32[ecx*1+edx]
|
|
neg ecx
|
|
add ecx,16
|
|
$L004enc3_loop:
|
|
DB 102,15,56,220,209
|
|
DB 102,15,56,220,217
|
|
DB 102,15,56,220,225
|
|
movups xmm1,XMMWORD PTR [ecx*1+edx]
|
|
add ecx,32
|
|
DB 102,15,56,220,208
|
|
DB 102,15,56,220,216
|
|
DB 102,15,56,220,224
|
|
movups xmm0,XMMWORD PTR [ecx*1+edx-16]
|
|
jnz $L004enc3_loop
|
|
DB 102,15,56,220,209
|
|
DB 102,15,56,220,217
|
|
DB 102,15,56,220,225
|
|
DB 102,15,56,221,208
|
|
DB 102,15,56,221,216
|
|
DB 102,15,56,221,224
|
|
ret
|
|
__aesni_encrypt3 ENDP
|
|
ALIGN 16
|
|
__aesni_decrypt3 PROC PRIVATE
|
|
movups xmm0,XMMWORD PTR [edx]
|
|
shl ecx,4
|
|
movups xmm1,XMMWORD PTR 16[edx]
|
|
xorps xmm2,xmm0
|
|
pxor xmm3,xmm0
|
|
pxor xmm4,xmm0
|
|
movups xmm0,XMMWORD PTR 32[edx]
|
|
lea edx,DWORD PTR 32[ecx*1+edx]
|
|
neg ecx
|
|
add ecx,16
|
|
$L005dec3_loop:
|
|
DB 102,15,56,222,209
|
|
DB 102,15,56,222,217
|
|
DB 102,15,56,222,225
|
|
movups xmm1,XMMWORD PTR [ecx*1+edx]
|
|
add ecx,32
|
|
DB 102,15,56,222,208
|
|
DB 102,15,56,222,216
|
|
DB 102,15,56,222,224
|
|
movups xmm0,XMMWORD PTR [ecx*1+edx-16]
|
|
jnz $L005dec3_loop
|
|
DB 102,15,56,222,209
|
|
DB 102,15,56,222,217
|
|
DB 102,15,56,222,225
|
|
DB 102,15,56,223,208
|
|
DB 102,15,56,223,216
|
|
DB 102,15,56,223,224
|
|
ret
|
|
__aesni_decrypt3 ENDP
|
|
ALIGN 16
|
|
__aesni_encrypt4 PROC PRIVATE
|
|
movups xmm0,XMMWORD PTR [edx]
|
|
movups xmm1,XMMWORD PTR 16[edx]
|
|
shl ecx,4
|
|
xorps xmm2,xmm0
|
|
pxor xmm3,xmm0
|
|
pxor xmm4,xmm0
|
|
pxor xmm5,xmm0
|
|
movups xmm0,XMMWORD PTR 32[edx]
|
|
lea edx,DWORD PTR 32[ecx*1+edx]
|
|
neg ecx
|
|
DB 15,31,64,0
|
|
add ecx,16
|
|
$L006enc4_loop:
|
|
DB 102,15,56,220,209
|
|
DB 102,15,56,220,217
|
|
DB 102,15,56,220,225
|
|
DB 102,15,56,220,233
|
|
movups xmm1,XMMWORD PTR [ecx*1+edx]
|
|
add ecx,32
|
|
DB 102,15,56,220,208
|
|
DB 102,15,56,220,216
|
|
DB 102,15,56,220,224
|
|
DB 102,15,56,220,232
|
|
movups xmm0,XMMWORD PTR [ecx*1+edx-16]
|
|
jnz $L006enc4_loop
|
|
DB 102,15,56,220,209
|
|
DB 102,15,56,220,217
|
|
DB 102,15,56,220,225
|
|
DB 102,15,56,220,233
|
|
DB 102,15,56,221,208
|
|
DB 102,15,56,221,216
|
|
DB 102,15,56,221,224
|
|
DB 102,15,56,221,232
|
|
ret
|
|
__aesni_encrypt4 ENDP
|
|
ALIGN 16
|
|
__aesni_decrypt4 PROC PRIVATE
|
|
movups xmm0,XMMWORD PTR [edx]
|
|
movups xmm1,XMMWORD PTR 16[edx]
|
|
shl ecx,4
|
|
xorps xmm2,xmm0
|
|
pxor xmm3,xmm0
|
|
pxor xmm4,xmm0
|
|
pxor xmm5,xmm0
|
|
movups xmm0,XMMWORD PTR 32[edx]
|
|
lea edx,DWORD PTR 32[ecx*1+edx]
|
|
neg ecx
|
|
DB 15,31,64,0
|
|
add ecx,16
|
|
$L007dec4_loop:
|
|
DB 102,15,56,222,209
|
|
DB 102,15,56,222,217
|
|
DB 102,15,56,222,225
|
|
DB 102,15,56,222,233
|
|
movups xmm1,XMMWORD PTR [ecx*1+edx]
|
|
add ecx,32
|
|
DB 102,15,56,222,208
|
|
DB 102,15,56,222,216
|
|
DB 102,15,56,222,224
|
|
DB 102,15,56,222,232
|
|
movups xmm0,XMMWORD PTR [ecx*1+edx-16]
|
|
jnz $L007dec4_loop
|
|
DB 102,15,56,222,209
|
|
DB 102,15,56,222,217
|
|
DB 102,15,56,222,225
|
|
DB 102,15,56,222,233
|
|
DB 102,15,56,223,208
|
|
DB 102,15,56,223,216
|
|
DB 102,15,56,223,224
|
|
DB 102,15,56,223,232
|
|
ret
|
|
__aesni_decrypt4 ENDP
|
|
ALIGN 16
|
|
__aesni_encrypt6 PROC PRIVATE
|
|
movups xmm0,XMMWORD PTR [edx]
|
|
shl ecx,4
|
|
movups xmm1,XMMWORD PTR 16[edx]
|
|
xorps xmm2,xmm0
|
|
pxor xmm3,xmm0
|
|
pxor xmm4,xmm0
|
|
DB 102,15,56,220,209
|
|
pxor xmm5,xmm0
|
|
pxor xmm6,xmm0
|
|
DB 102,15,56,220,217
|
|
lea edx,DWORD PTR 32[ecx*1+edx]
|
|
neg ecx
|
|
DB 102,15,56,220,225
|
|
pxor xmm7,xmm0
|
|
movups xmm0,XMMWORD PTR [ecx*1+edx]
|
|
add ecx,16
|
|
jmp $L008_aesni_encrypt6_inner
|
|
ALIGN 16
|
|
$L009enc6_loop:
|
|
DB 102,15,56,220,209
|
|
DB 102,15,56,220,217
|
|
DB 102,15,56,220,225
|
|
$L008_aesni_encrypt6_inner:
|
|
DB 102,15,56,220,233
|
|
DB 102,15,56,220,241
|
|
DB 102,15,56,220,249
|
|
$L_aesni_encrypt6_enter::
|
|
movups xmm1,XMMWORD PTR [ecx*1+edx]
|
|
add ecx,32
|
|
DB 102,15,56,220,208
|
|
DB 102,15,56,220,216
|
|
DB 102,15,56,220,224
|
|
DB 102,15,56,220,232
|
|
DB 102,15,56,220,240
|
|
DB 102,15,56,220,248
|
|
movups xmm0,XMMWORD PTR [ecx*1+edx-16]
|
|
jnz $L009enc6_loop
|
|
DB 102,15,56,220,209
|
|
DB 102,15,56,220,217
|
|
DB 102,15,56,220,225
|
|
DB 102,15,56,220,233
|
|
DB 102,15,56,220,241
|
|
DB 102,15,56,220,249
|
|
DB 102,15,56,221,208
|
|
DB 102,15,56,221,216
|
|
DB 102,15,56,221,224
|
|
DB 102,15,56,221,232
|
|
DB 102,15,56,221,240
|
|
DB 102,15,56,221,248
|
|
ret
|
|
__aesni_encrypt6 ENDP
|
|
ALIGN 16
|
|
__aesni_decrypt6 PROC PRIVATE
|
|
movups xmm0,XMMWORD PTR [edx]
|
|
shl ecx,4
|
|
movups xmm1,XMMWORD PTR 16[edx]
|
|
xorps xmm2,xmm0
|
|
pxor xmm3,xmm0
|
|
pxor xmm4,xmm0
|
|
DB 102,15,56,222,209
|
|
pxor xmm5,xmm0
|
|
pxor xmm6,xmm0
|
|
DB 102,15,56,222,217
|
|
lea edx,DWORD PTR 32[ecx*1+edx]
|
|
neg ecx
|
|
DB 102,15,56,222,225
|
|
pxor xmm7,xmm0
|
|
movups xmm0,XMMWORD PTR [ecx*1+edx]
|
|
add ecx,16
|
|
jmp $L010_aesni_decrypt6_inner
|
|
ALIGN 16
|
|
$L011dec6_loop:
|
|
DB 102,15,56,222,209
|
|
DB 102,15,56,222,217
|
|
DB 102,15,56,222,225
|
|
$L010_aesni_decrypt6_inner:
|
|
DB 102,15,56,222,233
|
|
DB 102,15,56,222,241
|
|
DB 102,15,56,222,249
|
|
$L_aesni_decrypt6_enter::
|
|
movups xmm1,XMMWORD PTR [ecx*1+edx]
|
|
add ecx,32
|
|
DB 102,15,56,222,208
|
|
DB 102,15,56,222,216
|
|
DB 102,15,56,222,224
|
|
DB 102,15,56,222,232
|
|
DB 102,15,56,222,240
|
|
DB 102,15,56,222,248
|
|
movups xmm0,XMMWORD PTR [ecx*1+edx-16]
|
|
jnz $L011dec6_loop
|
|
DB 102,15,56,222,209
|
|
DB 102,15,56,222,217
|
|
DB 102,15,56,222,225
|
|
DB 102,15,56,222,233
|
|
DB 102,15,56,222,241
|
|
DB 102,15,56,222,249
|
|
DB 102,15,56,223,208
|
|
DB 102,15,56,223,216
|
|
DB 102,15,56,223,224
|
|
DB 102,15,56,223,232
|
|
DB 102,15,56,223,240
|
|
DB 102,15,56,223,248
|
|
ret
|
|
__aesni_decrypt6 ENDP
|
|
ALIGN 16
|
|
_aesni_ecb_encrypt PROC PUBLIC
|
|
$L_aesni_ecb_encrypt_begin::
|
|
push ebp
|
|
push ebx
|
|
push esi
|
|
push edi
|
|
mov esi,DWORD PTR 20[esp]
|
|
mov edi,DWORD PTR 24[esp]
|
|
mov eax,DWORD PTR 28[esp]
|
|
mov edx,DWORD PTR 32[esp]
|
|
mov ebx,DWORD PTR 36[esp]
|
|
and eax,-16
|
|
jz $L012ecb_ret
|
|
mov ecx,DWORD PTR 240[edx]
|
|
test ebx,ebx
|
|
jz $L013ecb_decrypt
|
|
mov ebp,edx
|
|
mov ebx,ecx
|
|
cmp eax,96
|
|
jb $L014ecb_enc_tail
|
|
movdqu xmm2,XMMWORD PTR [esi]
|
|
movdqu xmm3,XMMWORD PTR 16[esi]
|
|
movdqu xmm4,XMMWORD PTR 32[esi]
|
|
movdqu xmm5,XMMWORD PTR 48[esi]
|
|
movdqu xmm6,XMMWORD PTR 64[esi]
|
|
movdqu xmm7,XMMWORD PTR 80[esi]
|
|
lea esi,DWORD PTR 96[esi]
|
|
sub eax,96
|
|
jmp $L015ecb_enc_loop6_enter
|
|
ALIGN 16
|
|
$L016ecb_enc_loop6:
|
|
movups XMMWORD PTR [edi],xmm2
|
|
movdqu xmm2,XMMWORD PTR [esi]
|
|
movups XMMWORD PTR 16[edi],xmm3
|
|
movdqu xmm3,XMMWORD PTR 16[esi]
|
|
movups XMMWORD PTR 32[edi],xmm4
|
|
movdqu xmm4,XMMWORD PTR 32[esi]
|
|
movups XMMWORD PTR 48[edi],xmm5
|
|
movdqu xmm5,XMMWORD PTR 48[esi]
|
|
movups XMMWORD PTR 64[edi],xmm6
|
|
movdqu xmm6,XMMWORD PTR 64[esi]
|
|
movups XMMWORD PTR 80[edi],xmm7
|
|
lea edi,DWORD PTR 96[edi]
|
|
movdqu xmm7,XMMWORD PTR 80[esi]
|
|
lea esi,DWORD PTR 96[esi]
|
|
$L015ecb_enc_loop6_enter:
|
|
call __aesni_encrypt6
|
|
mov edx,ebp
|
|
mov ecx,ebx
|
|
sub eax,96
|
|
jnc $L016ecb_enc_loop6
|
|
movups XMMWORD PTR [edi],xmm2
|
|
movups XMMWORD PTR 16[edi],xmm3
|
|
movups XMMWORD PTR 32[edi],xmm4
|
|
movups XMMWORD PTR 48[edi],xmm5
|
|
movups XMMWORD PTR 64[edi],xmm6
|
|
movups XMMWORD PTR 80[edi],xmm7
|
|
lea edi,DWORD PTR 96[edi]
|
|
add eax,96
|
|
jz $L012ecb_ret
|
|
$L014ecb_enc_tail:
|
|
movups xmm2,XMMWORD PTR [esi]
|
|
cmp eax,32
|
|
jb $L017ecb_enc_one
|
|
movups xmm3,XMMWORD PTR 16[esi]
|
|
je $L018ecb_enc_two
|
|
movups xmm4,XMMWORD PTR 32[esi]
|
|
cmp eax,64
|
|
jb $L019ecb_enc_three
|
|
movups xmm5,XMMWORD PTR 48[esi]
|
|
je $L020ecb_enc_four
|
|
movups xmm6,XMMWORD PTR 64[esi]
|
|
xorps xmm7,xmm7
|
|
call __aesni_encrypt6
|
|
movups XMMWORD PTR [edi],xmm2
|
|
movups XMMWORD PTR 16[edi],xmm3
|
|
movups XMMWORD PTR 32[edi],xmm4
|
|
movups XMMWORD PTR 48[edi],xmm5
|
|
movups XMMWORD PTR 64[edi],xmm6
|
|
jmp $L012ecb_ret
|
|
ALIGN 16
|
|
$L017ecb_enc_one:
|
|
movups xmm0,XMMWORD PTR [edx]
|
|
movups xmm1,XMMWORD PTR 16[edx]
|
|
lea edx,DWORD PTR 32[edx]
|
|
xorps xmm2,xmm0
|
|
$L021enc1_loop_3:
|
|
DB 102,15,56,220,209
|
|
dec ecx
|
|
movups xmm1,XMMWORD PTR [edx]
|
|
lea edx,DWORD PTR 16[edx]
|
|
jnz $L021enc1_loop_3
|
|
DB 102,15,56,221,209
|
|
movups XMMWORD PTR [edi],xmm2
|
|
jmp $L012ecb_ret
|
|
ALIGN 16
|
|
$L018ecb_enc_two:
|
|
call __aesni_encrypt2
|
|
movups XMMWORD PTR [edi],xmm2
|
|
movups XMMWORD PTR 16[edi],xmm3
|
|
jmp $L012ecb_ret
|
|
ALIGN 16
|
|
$L019ecb_enc_three:
|
|
call __aesni_encrypt3
|
|
movups XMMWORD PTR [edi],xmm2
|
|
movups XMMWORD PTR 16[edi],xmm3
|
|
movups XMMWORD PTR 32[edi],xmm4
|
|
jmp $L012ecb_ret
|
|
ALIGN 16
|
|
$L020ecb_enc_four:
|
|
call __aesni_encrypt4
|
|
movups XMMWORD PTR [edi],xmm2
|
|
movups XMMWORD PTR 16[edi],xmm3
|
|
movups XMMWORD PTR 32[edi],xmm4
|
|
movups XMMWORD PTR 48[edi],xmm5
|
|
jmp $L012ecb_ret
|
|
ALIGN 16
|
|
$L013ecb_decrypt:
|
|
mov ebp,edx
|
|
mov ebx,ecx
|
|
cmp eax,96
|
|
jb $L022ecb_dec_tail
|
|
movdqu xmm2,XMMWORD PTR [esi]
|
|
movdqu xmm3,XMMWORD PTR 16[esi]
|
|
movdqu xmm4,XMMWORD PTR 32[esi]
|
|
movdqu xmm5,XMMWORD PTR 48[esi]
|
|
movdqu xmm6,XMMWORD PTR 64[esi]
|
|
movdqu xmm7,XMMWORD PTR 80[esi]
|
|
lea esi,DWORD PTR 96[esi]
|
|
sub eax,96
|
|
jmp $L023ecb_dec_loop6_enter
|
|
ALIGN 16
|
|
$L024ecb_dec_loop6:
|
|
movups XMMWORD PTR [edi],xmm2
|
|
movdqu xmm2,XMMWORD PTR [esi]
|
|
movups XMMWORD PTR 16[edi],xmm3
|
|
movdqu xmm3,XMMWORD PTR 16[esi]
|
|
movups XMMWORD PTR 32[edi],xmm4
|
|
movdqu xmm4,XMMWORD PTR 32[esi]
|
|
movups XMMWORD PTR 48[edi],xmm5
|
|
movdqu xmm5,XMMWORD PTR 48[esi]
|
|
movups XMMWORD PTR 64[edi],xmm6
|
|
movdqu xmm6,XMMWORD PTR 64[esi]
|
|
movups XMMWORD PTR 80[edi],xmm7
|
|
lea edi,DWORD PTR 96[edi]
|
|
movdqu xmm7,XMMWORD PTR 80[esi]
|
|
lea esi,DWORD PTR 96[esi]
|
|
$L023ecb_dec_loop6_enter:
|
|
call __aesni_decrypt6
|
|
mov edx,ebp
|
|
mov ecx,ebx
|
|
sub eax,96
|
|
jnc $L024ecb_dec_loop6
|
|
movups XMMWORD PTR [edi],xmm2
|
|
movups XMMWORD PTR 16[edi],xmm3
|
|
movups XMMWORD PTR 32[edi],xmm4
|
|
movups XMMWORD PTR 48[edi],xmm5
|
|
movups XMMWORD PTR 64[edi],xmm6
|
|
movups XMMWORD PTR 80[edi],xmm7
|
|
lea edi,DWORD PTR 96[edi]
|
|
add eax,96
|
|
jz $L012ecb_ret
|
|
$L022ecb_dec_tail:
|
|
movups xmm2,XMMWORD PTR [esi]
|
|
cmp eax,32
|
|
jb $L025ecb_dec_one
|
|
movups xmm3,XMMWORD PTR 16[esi]
|
|
je $L026ecb_dec_two
|
|
movups xmm4,XMMWORD PTR 32[esi]
|
|
cmp eax,64
|
|
jb $L027ecb_dec_three
|
|
movups xmm5,XMMWORD PTR 48[esi]
|
|
je $L028ecb_dec_four
|
|
movups xmm6,XMMWORD PTR 64[esi]
|
|
xorps xmm7,xmm7
|
|
call __aesni_decrypt6
|
|
movups XMMWORD PTR [edi],xmm2
|
|
movups XMMWORD PTR 16[edi],xmm3
|
|
movups XMMWORD PTR 32[edi],xmm4
|
|
movups XMMWORD PTR 48[edi],xmm5
|
|
movups XMMWORD PTR 64[edi],xmm6
|
|
jmp $L012ecb_ret
|
|
ALIGN 16
|
|
$L025ecb_dec_one:
|
|
movups xmm0,XMMWORD PTR [edx]
|
|
movups xmm1,XMMWORD PTR 16[edx]
|
|
lea edx,DWORD PTR 32[edx]
|
|
xorps xmm2,xmm0
|
|
$L029dec1_loop_4:
|
|
DB 102,15,56,222,209
|
|
dec ecx
|
|
movups xmm1,XMMWORD PTR [edx]
|
|
lea edx,DWORD PTR 16[edx]
|
|
jnz $L029dec1_loop_4
|
|
DB 102,15,56,223,209
|
|
movups XMMWORD PTR [edi],xmm2
|
|
jmp $L012ecb_ret
|
|
ALIGN 16
|
|
$L026ecb_dec_two:
|
|
call __aesni_decrypt2
|
|
movups XMMWORD PTR [edi],xmm2
|
|
movups XMMWORD PTR 16[edi],xmm3
|
|
jmp $L012ecb_ret
|
|
ALIGN 16
|
|
$L027ecb_dec_three:
|
|
call __aesni_decrypt3
|
|
movups XMMWORD PTR [edi],xmm2
|
|
movups XMMWORD PTR 16[edi],xmm3
|
|
movups XMMWORD PTR 32[edi],xmm4
|
|
jmp $L012ecb_ret
|
|
ALIGN 16
|
|
$L028ecb_dec_four:
|
|
call __aesni_decrypt4
|
|
movups XMMWORD PTR [edi],xmm2
|
|
movups XMMWORD PTR 16[edi],xmm3
|
|
movups XMMWORD PTR 32[edi],xmm4
|
|
movups XMMWORD PTR 48[edi],xmm5
|
|
$L012ecb_ret:
|
|
pxor xmm0,xmm0
|
|
pxor xmm1,xmm1
|
|
pxor xmm2,xmm2
|
|
pxor xmm3,xmm3
|
|
pxor xmm4,xmm4
|
|
pxor xmm5,xmm5
|
|
pxor xmm6,xmm6
|
|
pxor xmm7,xmm7
|
|
pop edi
|
|
pop esi
|
|
pop ebx
|
|
pop ebp
|
|
ret
|
|
_aesni_ecb_encrypt ENDP
|
|
ALIGN 16
|
|
_aesni_ccm64_encrypt_blocks PROC PUBLIC
|
|
$L_aesni_ccm64_encrypt_blocks_begin::
|
|
push ebp
|
|
push ebx
|
|
push esi
|
|
push edi
|
|
mov esi,DWORD PTR 20[esp]
|
|
mov edi,DWORD PTR 24[esp]
|
|
mov eax,DWORD PTR 28[esp]
|
|
mov edx,DWORD PTR 32[esp]
|
|
mov ebx,DWORD PTR 36[esp]
|
|
mov ecx,DWORD PTR 40[esp]
|
|
mov ebp,esp
|
|
sub esp,60
|
|
and esp,-16
|
|
mov DWORD PTR 48[esp],ebp
|
|
movdqu xmm7,XMMWORD PTR [ebx]
|
|
movdqu xmm3,XMMWORD PTR [ecx]
|
|
mov ecx,DWORD PTR 240[edx]
|
|
mov DWORD PTR [esp],202182159
|
|
mov DWORD PTR 4[esp],134810123
|
|
mov DWORD PTR 8[esp],67438087
|
|
mov DWORD PTR 12[esp],66051
|
|
mov ebx,1
|
|
xor ebp,ebp
|
|
mov DWORD PTR 16[esp],ebx
|
|
mov DWORD PTR 20[esp],ebp
|
|
mov DWORD PTR 24[esp],ebp
|
|
mov DWORD PTR 28[esp],ebp
|
|
shl ecx,4
|
|
mov ebx,16
|
|
lea ebp,DWORD PTR [edx]
|
|
movdqa xmm5,XMMWORD PTR [esp]
|
|
movdqa xmm2,xmm7
|
|
lea edx,DWORD PTR 32[ecx*1+edx]
|
|
sub ebx,ecx
|
|
DB 102,15,56,0,253
|
|
$L030ccm64_enc_outer:
|
|
movups xmm0,XMMWORD PTR [ebp]
|
|
mov ecx,ebx
|
|
movups xmm6,XMMWORD PTR [esi]
|
|
xorps xmm2,xmm0
|
|
movups xmm1,XMMWORD PTR 16[ebp]
|
|
xorps xmm0,xmm6
|
|
xorps xmm3,xmm0
|
|
movups xmm0,XMMWORD PTR 32[ebp]
|
|
$L031ccm64_enc2_loop:
|
|
DB 102,15,56,220,209
|
|
DB 102,15,56,220,217
|
|
movups xmm1,XMMWORD PTR [ecx*1+edx]
|
|
add ecx,32
|
|
DB 102,15,56,220,208
|
|
DB 102,15,56,220,216
|
|
movups xmm0,XMMWORD PTR [ecx*1+edx-16]
|
|
jnz $L031ccm64_enc2_loop
|
|
DB 102,15,56,220,209
|
|
DB 102,15,56,220,217
|
|
paddq xmm7,XMMWORD PTR 16[esp]
|
|
dec eax
|
|
DB 102,15,56,221,208
|
|
DB 102,15,56,221,216
|
|
lea esi,DWORD PTR 16[esi]
|
|
xorps xmm6,xmm2
|
|
movdqa xmm2,xmm7
|
|
movups XMMWORD PTR [edi],xmm6
|
|
DB 102,15,56,0,213
|
|
lea edi,DWORD PTR 16[edi]
|
|
jnz $L030ccm64_enc_outer
|
|
mov esp,DWORD PTR 48[esp]
|
|
mov edi,DWORD PTR 40[esp]
|
|
movups XMMWORD PTR [edi],xmm3
|
|
pxor xmm0,xmm0
|
|
pxor xmm1,xmm1
|
|
pxor xmm2,xmm2
|
|
pxor xmm3,xmm3
|
|
pxor xmm4,xmm4
|
|
pxor xmm5,xmm5
|
|
pxor xmm6,xmm6
|
|
pxor xmm7,xmm7
|
|
pop edi
|
|
pop esi
|
|
pop ebx
|
|
pop ebp
|
|
ret
|
|
_aesni_ccm64_encrypt_blocks ENDP
|
|
ALIGN 16
|
|
_aesni_ccm64_decrypt_blocks PROC PUBLIC
|
|
$L_aesni_ccm64_decrypt_blocks_begin::
|
|
push ebp
|
|
push ebx
|
|
push esi
|
|
push edi
|
|
mov esi,DWORD PTR 20[esp]
|
|
mov edi,DWORD PTR 24[esp]
|
|
mov eax,DWORD PTR 28[esp]
|
|
mov edx,DWORD PTR 32[esp]
|
|
mov ebx,DWORD PTR 36[esp]
|
|
mov ecx,DWORD PTR 40[esp]
|
|
mov ebp,esp
|
|
sub esp,60
|
|
and esp,-16
|
|
mov DWORD PTR 48[esp],ebp
|
|
movdqu xmm7,XMMWORD PTR [ebx]
|
|
movdqu xmm3,XMMWORD PTR [ecx]
|
|
mov ecx,DWORD PTR 240[edx]
|
|
mov DWORD PTR [esp],202182159
|
|
mov DWORD PTR 4[esp],134810123
|
|
mov DWORD PTR 8[esp],67438087
|
|
mov DWORD PTR 12[esp],66051
|
|
mov ebx,1
|
|
xor ebp,ebp
|
|
mov DWORD PTR 16[esp],ebx
|
|
mov DWORD PTR 20[esp],ebp
|
|
mov DWORD PTR 24[esp],ebp
|
|
mov DWORD PTR 28[esp],ebp
|
|
movdqa xmm5,XMMWORD PTR [esp]
|
|
movdqa xmm2,xmm7
|
|
mov ebp,edx
|
|
mov ebx,ecx
|
|
DB 102,15,56,0,253
|
|
movups xmm0,XMMWORD PTR [edx]
|
|
movups xmm1,XMMWORD PTR 16[edx]
|
|
lea edx,DWORD PTR 32[edx]
|
|
xorps xmm2,xmm0
|
|
$L032enc1_loop_5:
|
|
DB 102,15,56,220,209
|
|
dec ecx
|
|
movups xmm1,XMMWORD PTR [edx]
|
|
lea edx,DWORD PTR 16[edx]
|
|
jnz $L032enc1_loop_5
|
|
DB 102,15,56,221,209
|
|
shl ebx,4
|
|
mov ecx,16
|
|
movups xmm6,XMMWORD PTR [esi]
|
|
paddq xmm7,XMMWORD PTR 16[esp]
|
|
lea esi,QWORD PTR 16[esi]
|
|
sub ecx,ebx
|
|
lea edx,DWORD PTR 32[ebx*1+ebp]
|
|
mov ebx,ecx
|
|
jmp $L033ccm64_dec_outer
|
|
ALIGN 16
|
|
$L033ccm64_dec_outer:
|
|
xorps xmm6,xmm2
|
|
movdqa xmm2,xmm7
|
|
movups XMMWORD PTR [edi],xmm6
|
|
lea edi,DWORD PTR 16[edi]
|
|
DB 102,15,56,0,213
|
|
sub eax,1
|
|
jz $L034ccm64_dec_break
|
|
movups xmm0,XMMWORD PTR [ebp]
|
|
mov ecx,ebx
|
|
movups xmm1,XMMWORD PTR 16[ebp]
|
|
xorps xmm6,xmm0
|
|
xorps xmm2,xmm0
|
|
xorps xmm3,xmm6
|
|
movups xmm0,XMMWORD PTR 32[ebp]
|
|
$L035ccm64_dec2_loop:
|
|
DB 102,15,56,220,209
|
|
DB 102,15,56,220,217
|
|
movups xmm1,XMMWORD PTR [ecx*1+edx]
|
|
add ecx,32
|
|
DB 102,15,56,220,208
|
|
DB 102,15,56,220,216
|
|
movups xmm0,XMMWORD PTR [ecx*1+edx-16]
|
|
jnz $L035ccm64_dec2_loop
|
|
movups xmm6,XMMWORD PTR [esi]
|
|
paddq xmm7,XMMWORD PTR 16[esp]
|
|
DB 102,15,56,220,209
|
|
DB 102,15,56,220,217
|
|
DB 102,15,56,221,208
|
|
DB 102,15,56,221,216
|
|
lea esi,QWORD PTR 16[esi]
|
|
jmp $L033ccm64_dec_outer
|
|
ALIGN 16
|
|
$L034ccm64_dec_break:
|
|
mov ecx,DWORD PTR 240[ebp]
|
|
mov edx,ebp
|
|
movups xmm0,XMMWORD PTR [edx]
|
|
movups xmm1,XMMWORD PTR 16[edx]
|
|
xorps xmm6,xmm0
|
|
lea edx,DWORD PTR 32[edx]
|
|
xorps xmm3,xmm6
|
|
$L036enc1_loop_6:
|
|
DB 102,15,56,220,217
|
|
dec ecx
|
|
movups xmm1,XMMWORD PTR [edx]
|
|
lea edx,DWORD PTR 16[edx]
|
|
jnz $L036enc1_loop_6
|
|
DB 102,15,56,221,217
|
|
mov esp,DWORD PTR 48[esp]
|
|
mov edi,DWORD PTR 40[esp]
|
|
movups XMMWORD PTR [edi],xmm3
|
|
pxor xmm0,xmm0
|
|
pxor xmm1,xmm1
|
|
pxor xmm2,xmm2
|
|
pxor xmm3,xmm3
|
|
pxor xmm4,xmm4
|
|
pxor xmm5,xmm5
|
|
pxor xmm6,xmm6
|
|
pxor xmm7,xmm7
|
|
pop edi
|
|
pop esi
|
|
pop ebx
|
|
pop ebp
|
|
ret
|
|
_aesni_ccm64_decrypt_blocks ENDP
|
|
ALIGN 16
|
|
_aesni_ctr32_encrypt_blocks PROC PUBLIC
|
|
$L_aesni_ctr32_encrypt_blocks_begin::
|
|
push ebp
|
|
push ebx
|
|
push esi
|
|
push edi
|
|
mov esi,DWORD PTR 20[esp]
|
|
mov edi,DWORD PTR 24[esp]
|
|
mov eax,DWORD PTR 28[esp]
|
|
mov edx,DWORD PTR 32[esp]
|
|
mov ebx,DWORD PTR 36[esp]
|
|
mov ebp,esp
|
|
sub esp,88
|
|
and esp,-16
|
|
mov DWORD PTR 80[esp],ebp
|
|
cmp eax,1
|
|
je $L037ctr32_one_shortcut
|
|
movdqu xmm7,XMMWORD PTR [ebx]
|
|
mov DWORD PTR [esp],202182159
|
|
mov DWORD PTR 4[esp],134810123
|
|
mov DWORD PTR 8[esp],67438087
|
|
mov DWORD PTR 12[esp],66051
|
|
mov ecx,6
|
|
xor ebp,ebp
|
|
mov DWORD PTR 16[esp],ecx
|
|
mov DWORD PTR 20[esp],ecx
|
|
mov DWORD PTR 24[esp],ecx
|
|
mov DWORD PTR 28[esp],ebp
|
|
DB 102,15,58,22,251,3
|
|
DB 102,15,58,34,253,3
|
|
mov ecx,DWORD PTR 240[edx]
|
|
bswap ebx
|
|
pxor xmm0,xmm0
|
|
pxor xmm1,xmm1
|
|
movdqa xmm2,XMMWORD PTR [esp]
|
|
DB 102,15,58,34,195,0
|
|
lea ebp,DWORD PTR 3[ebx]
|
|
DB 102,15,58,34,205,0
|
|
inc ebx
|
|
DB 102,15,58,34,195,1
|
|
inc ebp
|
|
DB 102,15,58,34,205,1
|
|
inc ebx
|
|
DB 102,15,58,34,195,2
|
|
inc ebp
|
|
DB 102,15,58,34,205,2
|
|
movdqa XMMWORD PTR 48[esp],xmm0
|
|
DB 102,15,56,0,194
|
|
movdqu xmm6,XMMWORD PTR [edx]
|
|
movdqa XMMWORD PTR 64[esp],xmm1
|
|
DB 102,15,56,0,202
|
|
pshufd xmm2,xmm0,192
|
|
pshufd xmm3,xmm0,128
|
|
cmp eax,6
|
|
jb $L038ctr32_tail
|
|
pxor xmm7,xmm6
|
|
shl ecx,4
|
|
mov ebx,16
|
|
movdqa XMMWORD PTR 32[esp],xmm7
|
|
mov ebp,edx
|
|
sub ebx,ecx
|
|
lea edx,DWORD PTR 32[ecx*1+edx]
|
|
sub eax,6
|
|
jmp $L039ctr32_loop6
|
|
ALIGN 16
|
|
$L039ctr32_loop6:
|
|
pshufd xmm4,xmm0,64
|
|
movdqa xmm0,XMMWORD PTR 32[esp]
|
|
pshufd xmm5,xmm1,192
|
|
pxor xmm2,xmm0
|
|
pshufd xmm6,xmm1,128
|
|
pxor xmm3,xmm0
|
|
pshufd xmm7,xmm1,64
|
|
movups xmm1,XMMWORD PTR 16[ebp]
|
|
pxor xmm4,xmm0
|
|
pxor xmm5,xmm0
|
|
DB 102,15,56,220,209
|
|
pxor xmm6,xmm0
|
|
pxor xmm7,xmm0
|
|
DB 102,15,56,220,217
|
|
movups xmm0,XMMWORD PTR 32[ebp]
|
|
mov ecx,ebx
|
|
DB 102,15,56,220,225
|
|
DB 102,15,56,220,233
|
|
DB 102,15,56,220,241
|
|
DB 102,15,56,220,249
|
|
call $L_aesni_encrypt6_enter
|
|
movups xmm1,XMMWORD PTR [esi]
|
|
movups xmm0,XMMWORD PTR 16[esi]
|
|
xorps xmm2,xmm1
|
|
movups xmm1,XMMWORD PTR 32[esi]
|
|
xorps xmm3,xmm0
|
|
movups XMMWORD PTR [edi],xmm2
|
|
movdqa xmm0,XMMWORD PTR 16[esp]
|
|
xorps xmm4,xmm1
|
|
movdqa xmm1,XMMWORD PTR 64[esp]
|
|
movups XMMWORD PTR 16[edi],xmm3
|
|
movups XMMWORD PTR 32[edi],xmm4
|
|
paddd xmm1,xmm0
|
|
paddd xmm0,XMMWORD PTR 48[esp]
|
|
movdqa xmm2,XMMWORD PTR [esp]
|
|
movups xmm3,XMMWORD PTR 48[esi]
|
|
movups xmm4,XMMWORD PTR 64[esi]
|
|
xorps xmm5,xmm3
|
|
movups xmm3,XMMWORD PTR 80[esi]
|
|
lea esi,DWORD PTR 96[esi]
|
|
movdqa XMMWORD PTR 48[esp],xmm0
|
|
DB 102,15,56,0,194
|
|
xorps xmm6,xmm4
|
|
movups XMMWORD PTR 48[edi],xmm5
|
|
xorps xmm7,xmm3
|
|
movdqa XMMWORD PTR 64[esp],xmm1
|
|
DB 102,15,56,0,202
|
|
movups XMMWORD PTR 64[edi],xmm6
|
|
pshufd xmm2,xmm0,192
|
|
movups XMMWORD PTR 80[edi],xmm7
|
|
lea edi,DWORD PTR 96[edi]
|
|
pshufd xmm3,xmm0,128
|
|
sub eax,6
|
|
jnc $L039ctr32_loop6
|
|
add eax,6
|
|
jz $L040ctr32_ret
|
|
movdqu xmm7,XMMWORD PTR [ebp]
|
|
mov edx,ebp
|
|
pxor xmm7,XMMWORD PTR 32[esp]
|
|
mov ecx,DWORD PTR 240[ebp]
|
|
$L038ctr32_tail:
|
|
por xmm2,xmm7
|
|
cmp eax,2
|
|
jb $L041ctr32_one
|
|
pshufd xmm4,xmm0,64
|
|
por xmm3,xmm7
|
|
je $L042ctr32_two
|
|
pshufd xmm5,xmm1,192
|
|
por xmm4,xmm7
|
|
cmp eax,4
|
|
jb $L043ctr32_three
|
|
pshufd xmm6,xmm1,128
|
|
por xmm5,xmm7
|
|
je $L044ctr32_four
|
|
por xmm6,xmm7
|
|
call __aesni_encrypt6
|
|
movups xmm1,XMMWORD PTR [esi]
|
|
movups xmm0,XMMWORD PTR 16[esi]
|
|
xorps xmm2,xmm1
|
|
movups xmm1,XMMWORD PTR 32[esi]
|
|
xorps xmm3,xmm0
|
|
movups xmm0,XMMWORD PTR 48[esi]
|
|
xorps xmm4,xmm1
|
|
movups xmm1,XMMWORD PTR 64[esi]
|
|
xorps xmm5,xmm0
|
|
movups XMMWORD PTR [edi],xmm2
|
|
xorps xmm6,xmm1
|
|
movups XMMWORD PTR 16[edi],xmm3
|
|
movups XMMWORD PTR 32[edi],xmm4
|
|
movups XMMWORD PTR 48[edi],xmm5
|
|
movups XMMWORD PTR 64[edi],xmm6
|
|
jmp $L040ctr32_ret
|
|
ALIGN 16
|
|
$L037ctr32_one_shortcut:
|
|
movups xmm2,XMMWORD PTR [ebx]
|
|
mov ecx,DWORD PTR 240[edx]
|
|
$L041ctr32_one:
|
|
movups xmm0,XMMWORD PTR [edx]
|
|
movups xmm1,XMMWORD PTR 16[edx]
|
|
lea edx,DWORD PTR 32[edx]
|
|
xorps xmm2,xmm0
|
|
$L045enc1_loop_7:
|
|
DB 102,15,56,220,209
|
|
dec ecx
|
|
movups xmm1,XMMWORD PTR [edx]
|
|
lea edx,DWORD PTR 16[edx]
|
|
jnz $L045enc1_loop_7
|
|
DB 102,15,56,221,209
|
|
movups xmm6,XMMWORD PTR [esi]
|
|
xorps xmm6,xmm2
|
|
movups XMMWORD PTR [edi],xmm6
|
|
jmp $L040ctr32_ret
|
|
ALIGN 16
|
|
$L042ctr32_two:
|
|
call __aesni_encrypt2
|
|
movups xmm5,XMMWORD PTR [esi]
|
|
movups xmm6,XMMWORD PTR 16[esi]
|
|
xorps xmm2,xmm5
|
|
xorps xmm3,xmm6
|
|
movups XMMWORD PTR [edi],xmm2
|
|
movups XMMWORD PTR 16[edi],xmm3
|
|
jmp $L040ctr32_ret
|
|
ALIGN 16
|
|
$L043ctr32_three:
|
|
call __aesni_encrypt3
|
|
movups xmm5,XMMWORD PTR [esi]
|
|
movups xmm6,XMMWORD PTR 16[esi]
|
|
xorps xmm2,xmm5
|
|
movups xmm7,XMMWORD PTR 32[esi]
|
|
xorps xmm3,xmm6
|
|
movups XMMWORD PTR [edi],xmm2
|
|
xorps xmm4,xmm7
|
|
movups XMMWORD PTR 16[edi],xmm3
|
|
movups XMMWORD PTR 32[edi],xmm4
|
|
jmp $L040ctr32_ret
|
|
ALIGN 16
|
|
$L044ctr32_four:
|
|
call __aesni_encrypt4
|
|
movups xmm6,XMMWORD PTR [esi]
|
|
movups xmm7,XMMWORD PTR 16[esi]
|
|
movups xmm1,XMMWORD PTR 32[esi]
|
|
xorps xmm2,xmm6
|
|
movups xmm0,XMMWORD PTR 48[esi]
|
|
xorps xmm3,xmm7
|
|
movups XMMWORD PTR [edi],xmm2
|
|
xorps xmm4,xmm1
|
|
movups XMMWORD PTR 16[edi],xmm3
|
|
xorps xmm5,xmm0
|
|
movups XMMWORD PTR 32[edi],xmm4
|
|
movups XMMWORD PTR 48[edi],xmm5
|
|
$L040ctr32_ret:
|
|
pxor xmm0,xmm0
|
|
pxor xmm1,xmm1
|
|
pxor xmm2,xmm2
|
|
pxor xmm3,xmm3
|
|
pxor xmm4,xmm4
|
|
movdqa XMMWORD PTR 32[esp],xmm0
|
|
pxor xmm5,xmm5
|
|
movdqa XMMWORD PTR 48[esp],xmm0
|
|
pxor xmm6,xmm6
|
|
movdqa XMMWORD PTR 64[esp],xmm0
|
|
pxor xmm7,xmm7
|
|
mov esp,DWORD PTR 80[esp]
|
|
pop edi
|
|
pop esi
|
|
pop ebx
|
|
pop ebp
|
|
ret
|
|
_aesni_ctr32_encrypt_blocks ENDP
|
|
ALIGN 16
|
|
_aesni_xts_encrypt PROC PUBLIC
|
|
$L_aesni_xts_encrypt_begin::
|
|
push ebp
|
|
push ebx
|
|
push esi
|
|
push edi
|
|
mov edx,DWORD PTR 36[esp]
|
|
mov esi,DWORD PTR 40[esp]
|
|
mov ecx,DWORD PTR 240[edx]
|
|
movups xmm2,XMMWORD PTR [esi]
|
|
movups xmm0,XMMWORD PTR [edx]
|
|
movups xmm1,XMMWORD PTR 16[edx]
|
|
lea edx,DWORD PTR 32[edx]
|
|
xorps xmm2,xmm0
|
|
$L046enc1_loop_8:
|
|
DB 102,15,56,220,209
|
|
dec ecx
|
|
movups xmm1,XMMWORD PTR [edx]
|
|
lea edx,DWORD PTR 16[edx]
|
|
jnz $L046enc1_loop_8
|
|
DB 102,15,56,221,209
|
|
mov esi,DWORD PTR 20[esp]
|
|
mov edi,DWORD PTR 24[esp]
|
|
mov eax,DWORD PTR 28[esp]
|
|
mov edx,DWORD PTR 32[esp]
|
|
mov ebp,esp
|
|
sub esp,120
|
|
mov ecx,DWORD PTR 240[edx]
|
|
and esp,-16
|
|
mov DWORD PTR 96[esp],135
|
|
mov DWORD PTR 100[esp],0
|
|
mov DWORD PTR 104[esp],1
|
|
mov DWORD PTR 108[esp],0
|
|
mov DWORD PTR 112[esp],eax
|
|
mov DWORD PTR 116[esp],ebp
|
|
movdqa xmm1,xmm2
|
|
pxor xmm0,xmm0
|
|
movdqa xmm3,XMMWORD PTR 96[esp]
|
|
pcmpgtd xmm0,xmm1
|
|
and eax,-16
|
|
mov ebp,edx
|
|
mov ebx,ecx
|
|
sub eax,96
|
|
jc $L047xts_enc_short
|
|
shl ecx,4
|
|
mov ebx,16
|
|
sub ebx,ecx
|
|
lea edx,DWORD PTR 32[ecx*1+edx]
|
|
jmp $L048xts_enc_loop6
|
|
ALIGN 16
|
|
$L048xts_enc_loop6:
|
|
pshufd xmm2,xmm0,19
|
|
pxor xmm0,xmm0
|
|
movdqa XMMWORD PTR [esp],xmm1
|
|
paddq xmm1,xmm1
|
|
pand xmm2,xmm3
|
|
pcmpgtd xmm0,xmm1
|
|
pxor xmm1,xmm2
|
|
pshufd xmm2,xmm0,19
|
|
pxor xmm0,xmm0
|
|
movdqa XMMWORD PTR 16[esp],xmm1
|
|
paddq xmm1,xmm1
|
|
pand xmm2,xmm3
|
|
pcmpgtd xmm0,xmm1
|
|
pxor xmm1,xmm2
|
|
pshufd xmm2,xmm0,19
|
|
pxor xmm0,xmm0
|
|
movdqa XMMWORD PTR 32[esp],xmm1
|
|
paddq xmm1,xmm1
|
|
pand xmm2,xmm3
|
|
pcmpgtd xmm0,xmm1
|
|
pxor xmm1,xmm2
|
|
pshufd xmm2,xmm0,19
|
|
pxor xmm0,xmm0
|
|
movdqa XMMWORD PTR 48[esp],xmm1
|
|
paddq xmm1,xmm1
|
|
pand xmm2,xmm3
|
|
pcmpgtd xmm0,xmm1
|
|
pxor xmm1,xmm2
|
|
pshufd xmm7,xmm0,19
|
|
movdqa XMMWORD PTR 64[esp],xmm1
|
|
paddq xmm1,xmm1
|
|
movups xmm0,XMMWORD PTR [ebp]
|
|
pand xmm7,xmm3
|
|
movups xmm2,XMMWORD PTR [esi]
|
|
pxor xmm7,xmm1
|
|
mov ecx,ebx
|
|
movdqu xmm3,XMMWORD PTR 16[esi]
|
|
xorps xmm2,xmm0
|
|
movdqu xmm4,XMMWORD PTR 32[esi]
|
|
pxor xmm3,xmm0
|
|
movdqu xmm5,XMMWORD PTR 48[esi]
|
|
pxor xmm4,xmm0
|
|
movdqu xmm6,XMMWORD PTR 64[esi]
|
|
pxor xmm5,xmm0
|
|
movdqu xmm1,XMMWORD PTR 80[esi]
|
|
pxor xmm6,xmm0
|
|
lea esi,DWORD PTR 96[esi]
|
|
pxor xmm2,XMMWORD PTR [esp]
|
|
movdqa XMMWORD PTR 80[esp],xmm7
|
|
pxor xmm7,xmm1
|
|
movups xmm1,XMMWORD PTR 16[ebp]
|
|
pxor xmm3,XMMWORD PTR 16[esp]
|
|
pxor xmm4,XMMWORD PTR 32[esp]
|
|
DB 102,15,56,220,209
|
|
pxor xmm5,XMMWORD PTR 48[esp]
|
|
pxor xmm6,XMMWORD PTR 64[esp]
|
|
DB 102,15,56,220,217
|
|
pxor xmm7,xmm0
|
|
movups xmm0,XMMWORD PTR 32[ebp]
|
|
DB 102,15,56,220,225
|
|
DB 102,15,56,220,233
|
|
DB 102,15,56,220,241
|
|
DB 102,15,56,220,249
|
|
call $L_aesni_encrypt6_enter
|
|
movdqa xmm1,XMMWORD PTR 80[esp]
|
|
pxor xmm0,xmm0
|
|
xorps xmm2,XMMWORD PTR [esp]
|
|
pcmpgtd xmm0,xmm1
|
|
xorps xmm3,XMMWORD PTR 16[esp]
|
|
movups XMMWORD PTR [edi],xmm2
|
|
xorps xmm4,XMMWORD PTR 32[esp]
|
|
movups XMMWORD PTR 16[edi],xmm3
|
|
xorps xmm5,XMMWORD PTR 48[esp]
|
|
movups XMMWORD PTR 32[edi],xmm4
|
|
xorps xmm6,XMMWORD PTR 64[esp]
|
|
movups XMMWORD PTR 48[edi],xmm5
|
|
xorps xmm7,xmm1
|
|
movups XMMWORD PTR 64[edi],xmm6
|
|
pshufd xmm2,xmm0,19
|
|
movups XMMWORD PTR 80[edi],xmm7
|
|
lea edi,DWORD PTR 96[edi]
|
|
movdqa xmm3,XMMWORD PTR 96[esp]
|
|
pxor xmm0,xmm0
|
|
paddq xmm1,xmm1
|
|
pand xmm2,xmm3
|
|
pcmpgtd xmm0,xmm1
|
|
pxor xmm1,xmm2
|
|
sub eax,96
|
|
jnc $L048xts_enc_loop6
|
|
mov ecx,DWORD PTR 240[ebp]
|
|
mov edx,ebp
|
|
mov ebx,ecx
|
|
$L047xts_enc_short:
|
|
add eax,96
|
|
jz $L049xts_enc_done6x
|
|
movdqa xmm5,xmm1
|
|
cmp eax,32
|
|
jb $L050xts_enc_one
|
|
pshufd xmm2,xmm0,19
|
|
pxor xmm0,xmm0
|
|
paddq xmm1,xmm1
|
|
pand xmm2,xmm3
|
|
pcmpgtd xmm0,xmm1
|
|
pxor xmm1,xmm2
|
|
je $L051xts_enc_two
|
|
pshufd xmm2,xmm0,19
|
|
pxor xmm0,xmm0
|
|
movdqa xmm6,xmm1
|
|
paddq xmm1,xmm1
|
|
pand xmm2,xmm3
|
|
pcmpgtd xmm0,xmm1
|
|
pxor xmm1,xmm2
|
|
cmp eax,64
|
|
jb $L052xts_enc_three
|
|
pshufd xmm2,xmm0,19
|
|
pxor xmm0,xmm0
|
|
movdqa xmm7,xmm1
|
|
paddq xmm1,xmm1
|
|
pand xmm2,xmm3
|
|
pcmpgtd xmm0,xmm1
|
|
pxor xmm1,xmm2
|
|
movdqa XMMWORD PTR [esp],xmm5
|
|
movdqa XMMWORD PTR 16[esp],xmm6
|
|
je $L053xts_enc_four
|
|
movdqa XMMWORD PTR 32[esp],xmm7
|
|
pshufd xmm7,xmm0,19
|
|
movdqa XMMWORD PTR 48[esp],xmm1
|
|
paddq xmm1,xmm1
|
|
pand xmm7,xmm3
|
|
pxor xmm7,xmm1
|
|
movdqu xmm2,XMMWORD PTR [esi]
|
|
movdqu xmm3,XMMWORD PTR 16[esi]
|
|
movdqu xmm4,XMMWORD PTR 32[esi]
|
|
pxor xmm2,XMMWORD PTR [esp]
|
|
movdqu xmm5,XMMWORD PTR 48[esi]
|
|
pxor xmm3,XMMWORD PTR 16[esp]
|
|
movdqu xmm6,XMMWORD PTR 64[esi]
|
|
pxor xmm4,XMMWORD PTR 32[esp]
|
|
lea esi,DWORD PTR 80[esi]
|
|
pxor xmm5,XMMWORD PTR 48[esp]
|
|
movdqa XMMWORD PTR 64[esp],xmm7
|
|
pxor xmm6,xmm7
|
|
call __aesni_encrypt6
|
|
movaps xmm1,XMMWORD PTR 64[esp]
|
|
xorps xmm2,XMMWORD PTR [esp]
|
|
xorps xmm3,XMMWORD PTR 16[esp]
|
|
xorps xmm4,XMMWORD PTR 32[esp]
|
|
movups XMMWORD PTR [edi],xmm2
|
|
xorps xmm5,XMMWORD PTR 48[esp]
|
|
movups XMMWORD PTR 16[edi],xmm3
|
|
xorps xmm6,xmm1
|
|
movups XMMWORD PTR 32[edi],xmm4
|
|
movups XMMWORD PTR 48[edi],xmm5
|
|
movups XMMWORD PTR 64[edi],xmm6
|
|
lea edi,DWORD PTR 80[edi]
|
|
jmp $L054xts_enc_done
|
|
ALIGN 16
|
|
$L050xts_enc_one:
|
|
movups xmm2,XMMWORD PTR [esi]
|
|
lea esi,DWORD PTR 16[esi]
|
|
xorps xmm2,xmm5
|
|
movups xmm0,XMMWORD PTR [edx]
|
|
movups xmm1,XMMWORD PTR 16[edx]
|
|
lea edx,DWORD PTR 32[edx]
|
|
xorps xmm2,xmm0
|
|
$L055enc1_loop_9:
|
|
DB 102,15,56,220,209
|
|
dec ecx
|
|
movups xmm1,XMMWORD PTR [edx]
|
|
lea edx,DWORD PTR 16[edx]
|
|
jnz $L055enc1_loop_9
|
|
DB 102,15,56,221,209
|
|
xorps xmm2,xmm5
|
|
movups XMMWORD PTR [edi],xmm2
|
|
lea edi,DWORD PTR 16[edi]
|
|
movdqa xmm1,xmm5
|
|
jmp $L054xts_enc_done
|
|
ALIGN 16
|
|
$L051xts_enc_two:
|
|
movaps xmm6,xmm1
|
|
movups xmm2,XMMWORD PTR [esi]
|
|
movups xmm3,XMMWORD PTR 16[esi]
|
|
lea esi,DWORD PTR 32[esi]
|
|
xorps xmm2,xmm5
|
|
xorps xmm3,xmm6
|
|
call __aesni_encrypt2
|
|
xorps xmm2,xmm5
|
|
xorps xmm3,xmm6
|
|
movups XMMWORD PTR [edi],xmm2
|
|
movups XMMWORD PTR 16[edi],xmm3
|
|
lea edi,DWORD PTR 32[edi]
|
|
movdqa xmm1,xmm6
|
|
jmp $L054xts_enc_done
|
|
ALIGN 16
|
|
$L052xts_enc_three:
|
|
movaps xmm7,xmm1
|
|
movups xmm2,XMMWORD PTR [esi]
|
|
movups xmm3,XMMWORD PTR 16[esi]
|
|
movups xmm4,XMMWORD PTR 32[esi]
|
|
lea esi,DWORD PTR 48[esi]
|
|
xorps xmm2,xmm5
|
|
xorps xmm3,xmm6
|
|
xorps xmm4,xmm7
|
|
call __aesni_encrypt3
|
|
xorps xmm2,xmm5
|
|
xorps xmm3,xmm6
|
|
xorps xmm4,xmm7
|
|
movups XMMWORD PTR [edi],xmm2
|
|
movups XMMWORD PTR 16[edi],xmm3
|
|
movups XMMWORD PTR 32[edi],xmm4
|
|
lea edi,DWORD PTR 48[edi]
|
|
movdqa xmm1,xmm7
|
|
jmp $L054xts_enc_done
|
|
ALIGN 16
|
|
$L053xts_enc_four:
|
|
movaps xmm6,xmm1
|
|
movups xmm2,XMMWORD PTR [esi]
|
|
movups xmm3,XMMWORD PTR 16[esi]
|
|
movups xmm4,XMMWORD PTR 32[esi]
|
|
xorps xmm2,XMMWORD PTR [esp]
|
|
movups xmm5,XMMWORD PTR 48[esi]
|
|
lea esi,DWORD PTR 64[esi]
|
|
xorps xmm3,XMMWORD PTR 16[esp]
|
|
xorps xmm4,xmm7
|
|
xorps xmm5,xmm6
|
|
call __aesni_encrypt4
|
|
xorps xmm2,XMMWORD PTR [esp]
|
|
xorps xmm3,XMMWORD PTR 16[esp]
|
|
xorps xmm4,xmm7
|
|
movups XMMWORD PTR [edi],xmm2
|
|
xorps xmm5,xmm6
|
|
movups XMMWORD PTR 16[edi],xmm3
|
|
movups XMMWORD PTR 32[edi],xmm4
|
|
movups XMMWORD PTR 48[edi],xmm5
|
|
lea edi,DWORD PTR 64[edi]
|
|
movdqa xmm1,xmm6
|
|
jmp $L054xts_enc_done
|
|
ALIGN 16
|
|
$L049xts_enc_done6x:
|
|
mov eax,DWORD PTR 112[esp]
|
|
and eax,15
|
|
jz $L056xts_enc_ret
|
|
movdqa xmm5,xmm1
|
|
mov DWORD PTR 112[esp],eax
|
|
jmp $L057xts_enc_steal
|
|
ALIGN 16
|
|
$L054xts_enc_done:
|
|
mov eax,DWORD PTR 112[esp]
|
|
pxor xmm0,xmm0
|
|
and eax,15
|
|
jz $L056xts_enc_ret
|
|
pcmpgtd xmm0,xmm1
|
|
mov DWORD PTR 112[esp],eax
|
|
pshufd xmm5,xmm0,19
|
|
paddq xmm1,xmm1
|
|
pand xmm5,XMMWORD PTR 96[esp]
|
|
pxor xmm5,xmm1
|
|
$L057xts_enc_steal:
|
|
movzx ecx,BYTE PTR [esi]
|
|
movzx edx,BYTE PTR [edi-16]
|
|
lea esi,DWORD PTR 1[esi]
|
|
mov BYTE PTR [edi-16],cl
|
|
mov BYTE PTR [edi],dl
|
|
lea edi,DWORD PTR 1[edi]
|
|
sub eax,1
|
|
jnz $L057xts_enc_steal
|
|
sub edi,DWORD PTR 112[esp]
|
|
mov edx,ebp
|
|
mov ecx,ebx
|
|
movups xmm2,XMMWORD PTR [edi-16]
|
|
xorps xmm2,xmm5
|
|
movups xmm0,XMMWORD PTR [edx]
|
|
movups xmm1,XMMWORD PTR 16[edx]
|
|
lea edx,DWORD PTR 32[edx]
|
|
xorps xmm2,xmm0
|
|
$L058enc1_loop_10:
|
|
DB 102,15,56,220,209
|
|
dec ecx
|
|
movups xmm1,XMMWORD PTR [edx]
|
|
lea edx,DWORD PTR 16[edx]
|
|
jnz $L058enc1_loop_10
|
|
DB 102,15,56,221,209
|
|
xorps xmm2,xmm5
|
|
movups XMMWORD PTR [edi-16],xmm2
|
|
$L056xts_enc_ret:
|
|
pxor xmm0,xmm0
|
|
pxor xmm1,xmm1
|
|
pxor xmm2,xmm2
|
|
movdqa XMMWORD PTR [esp],xmm0
|
|
pxor xmm3,xmm3
|
|
movdqa XMMWORD PTR 16[esp],xmm0
|
|
pxor xmm4,xmm4
|
|
movdqa XMMWORD PTR 32[esp],xmm0
|
|
pxor xmm5,xmm5
|
|
movdqa XMMWORD PTR 48[esp],xmm0
|
|
pxor xmm6,xmm6
|
|
movdqa XMMWORD PTR 64[esp],xmm0
|
|
pxor xmm7,xmm7
|
|
movdqa XMMWORD PTR 80[esp],xmm0
|
|
mov esp,DWORD PTR 116[esp]
|
|
pop edi
|
|
pop esi
|
|
pop ebx
|
|
pop ebp
|
|
ret
|
|
_aesni_xts_encrypt ENDP
|
|
ALIGN 16
|
|
_aesni_xts_decrypt PROC PUBLIC
|
|
$L_aesni_xts_decrypt_begin::
|
|
push ebp
|
|
push ebx
|
|
push esi
|
|
push edi
|
|
mov edx,DWORD PTR 36[esp]
|
|
mov esi,DWORD PTR 40[esp]
|
|
mov ecx,DWORD PTR 240[edx]
|
|
movups xmm2,XMMWORD PTR [esi]
|
|
movups xmm0,XMMWORD PTR [edx]
|
|
movups xmm1,XMMWORD PTR 16[edx]
|
|
lea edx,DWORD PTR 32[edx]
|
|
xorps xmm2,xmm0
|
|
$L059enc1_loop_11:
|
|
DB 102,15,56,220,209
|
|
dec ecx
|
|
movups xmm1,XMMWORD PTR [edx]
|
|
lea edx,DWORD PTR 16[edx]
|
|
jnz $L059enc1_loop_11
|
|
DB 102,15,56,221,209
|
|
mov esi,DWORD PTR 20[esp]
|
|
mov edi,DWORD PTR 24[esp]
|
|
mov eax,DWORD PTR 28[esp]
|
|
mov edx,DWORD PTR 32[esp]
|
|
mov ebp,esp
|
|
sub esp,120
|
|
and esp,-16
|
|
xor ebx,ebx
|
|
test eax,15
|
|
setnz bl
|
|
shl ebx,4
|
|
sub eax,ebx
|
|
mov DWORD PTR 96[esp],135
|
|
mov DWORD PTR 100[esp],0
|
|
mov DWORD PTR 104[esp],1
|
|
mov DWORD PTR 108[esp],0
|
|
mov DWORD PTR 112[esp],eax
|
|
mov DWORD PTR 116[esp],ebp
|
|
mov ecx,DWORD PTR 240[edx]
|
|
mov ebp,edx
|
|
mov ebx,ecx
|
|
movdqa xmm1,xmm2
|
|
pxor xmm0,xmm0
|
|
movdqa xmm3,XMMWORD PTR 96[esp]
|
|
pcmpgtd xmm0,xmm1
|
|
and eax,-16
|
|
sub eax,96
|
|
jc $L060xts_dec_short
|
|
shl ecx,4
|
|
mov ebx,16
|
|
sub ebx,ecx
|
|
lea edx,DWORD PTR 32[ecx*1+edx]
|
|
jmp $L061xts_dec_loop6
|
|
ALIGN 16
|
|
$L061xts_dec_loop6:
|
|
pshufd xmm2,xmm0,19
|
|
pxor xmm0,xmm0
|
|
movdqa XMMWORD PTR [esp],xmm1
|
|
paddq xmm1,xmm1
|
|
pand xmm2,xmm3
|
|
pcmpgtd xmm0,xmm1
|
|
pxor xmm1,xmm2
|
|
pshufd xmm2,xmm0,19
|
|
pxor xmm0,xmm0
|
|
movdqa XMMWORD PTR 16[esp],xmm1
|
|
paddq xmm1,xmm1
|
|
pand xmm2,xmm3
|
|
pcmpgtd xmm0,xmm1
|
|
pxor xmm1,xmm2
|
|
pshufd xmm2,xmm0,19
|
|
pxor xmm0,xmm0
|
|
movdqa XMMWORD PTR 32[esp],xmm1
|
|
paddq xmm1,xmm1
|
|
pand xmm2,xmm3
|
|
pcmpgtd xmm0,xmm1
|
|
pxor xmm1,xmm2
|
|
pshufd xmm2,xmm0,19
|
|
pxor xmm0,xmm0
|
|
movdqa XMMWORD PTR 48[esp],xmm1
|
|
paddq xmm1,xmm1
|
|
pand xmm2,xmm3
|
|
pcmpgtd xmm0,xmm1
|
|
pxor xmm1,xmm2
|
|
pshufd xmm7,xmm0,19
|
|
movdqa XMMWORD PTR 64[esp],xmm1
|
|
paddq xmm1,xmm1
|
|
movups xmm0,XMMWORD PTR [ebp]
|
|
pand xmm7,xmm3
|
|
movups xmm2,XMMWORD PTR [esi]
|
|
pxor xmm7,xmm1
|
|
mov ecx,ebx
|
|
movdqu xmm3,XMMWORD PTR 16[esi]
|
|
xorps xmm2,xmm0
|
|
movdqu xmm4,XMMWORD PTR 32[esi]
|
|
pxor xmm3,xmm0
|
|
movdqu xmm5,XMMWORD PTR 48[esi]
|
|
pxor xmm4,xmm0
|
|
movdqu xmm6,XMMWORD PTR 64[esi]
|
|
pxor xmm5,xmm0
|
|
movdqu xmm1,XMMWORD PTR 80[esi]
|
|
pxor xmm6,xmm0
|
|
lea esi,DWORD PTR 96[esi]
|
|
pxor xmm2,XMMWORD PTR [esp]
|
|
movdqa XMMWORD PTR 80[esp],xmm7
|
|
pxor xmm7,xmm1
|
|
movups xmm1,XMMWORD PTR 16[ebp]
|
|
pxor xmm3,XMMWORD PTR 16[esp]
|
|
pxor xmm4,XMMWORD PTR 32[esp]
|
|
DB 102,15,56,222,209
|
|
pxor xmm5,XMMWORD PTR 48[esp]
|
|
pxor xmm6,XMMWORD PTR 64[esp]
|
|
DB 102,15,56,222,217
|
|
pxor xmm7,xmm0
|
|
movups xmm0,XMMWORD PTR 32[ebp]
|
|
DB 102,15,56,222,225
|
|
DB 102,15,56,222,233
|
|
DB 102,15,56,222,241
|
|
DB 102,15,56,222,249
|
|
call $L_aesni_decrypt6_enter
|
|
movdqa xmm1,XMMWORD PTR 80[esp]
|
|
pxor xmm0,xmm0
|
|
xorps xmm2,XMMWORD PTR [esp]
|
|
pcmpgtd xmm0,xmm1
|
|
xorps xmm3,XMMWORD PTR 16[esp]
|
|
movups XMMWORD PTR [edi],xmm2
|
|
xorps xmm4,XMMWORD PTR 32[esp]
|
|
movups XMMWORD PTR 16[edi],xmm3
|
|
xorps xmm5,XMMWORD PTR 48[esp]
|
|
movups XMMWORD PTR 32[edi],xmm4
|
|
xorps xmm6,XMMWORD PTR 64[esp]
|
|
movups XMMWORD PTR 48[edi],xmm5
|
|
xorps xmm7,xmm1
|
|
movups XMMWORD PTR 64[edi],xmm6
|
|
pshufd xmm2,xmm0,19
|
|
movups XMMWORD PTR 80[edi],xmm7
|
|
lea edi,DWORD PTR 96[edi]
|
|
movdqa xmm3,XMMWORD PTR 96[esp]
|
|
pxor xmm0,xmm0
|
|
paddq xmm1,xmm1
|
|
pand xmm2,xmm3
|
|
pcmpgtd xmm0,xmm1
|
|
pxor xmm1,xmm2
|
|
sub eax,96
|
|
jnc $L061xts_dec_loop6
|
|
mov ecx,DWORD PTR 240[ebp]
|
|
mov edx,ebp
|
|
mov ebx,ecx
|
|
$L060xts_dec_short:
|
|
add eax,96
|
|
jz $L062xts_dec_done6x
|
|
movdqa xmm5,xmm1
|
|
cmp eax,32
|
|
jb $L063xts_dec_one
|
|
pshufd xmm2,xmm0,19
|
|
pxor xmm0,xmm0
|
|
paddq xmm1,xmm1
|
|
pand xmm2,xmm3
|
|
pcmpgtd xmm0,xmm1
|
|
pxor xmm1,xmm2
|
|
je $L064xts_dec_two
|
|
pshufd xmm2,xmm0,19
|
|
pxor xmm0,xmm0
|
|
movdqa xmm6,xmm1
|
|
paddq xmm1,xmm1
|
|
pand xmm2,xmm3
|
|
pcmpgtd xmm0,xmm1
|
|
pxor xmm1,xmm2
|
|
cmp eax,64
|
|
jb $L065xts_dec_three
|
|
pshufd xmm2,xmm0,19
|
|
pxor xmm0,xmm0
|
|
movdqa xmm7,xmm1
|
|
paddq xmm1,xmm1
|
|
pand xmm2,xmm3
|
|
pcmpgtd xmm0,xmm1
|
|
pxor xmm1,xmm2
|
|
movdqa XMMWORD PTR [esp],xmm5
|
|
movdqa XMMWORD PTR 16[esp],xmm6
|
|
je $L066xts_dec_four
|
|
movdqa XMMWORD PTR 32[esp],xmm7
|
|
pshufd xmm7,xmm0,19
|
|
movdqa XMMWORD PTR 48[esp],xmm1
|
|
paddq xmm1,xmm1
|
|
pand xmm7,xmm3
|
|
pxor xmm7,xmm1
|
|
movdqu xmm2,XMMWORD PTR [esi]
|
|
movdqu xmm3,XMMWORD PTR 16[esi]
|
|
movdqu xmm4,XMMWORD PTR 32[esi]
|
|
pxor xmm2,XMMWORD PTR [esp]
|
|
movdqu xmm5,XMMWORD PTR 48[esi]
|
|
pxor xmm3,XMMWORD PTR 16[esp]
|
|
movdqu xmm6,XMMWORD PTR 64[esi]
|
|
pxor xmm4,XMMWORD PTR 32[esp]
|
|
lea esi,DWORD PTR 80[esi]
|
|
pxor xmm5,XMMWORD PTR 48[esp]
|
|
movdqa XMMWORD PTR 64[esp],xmm7
|
|
pxor xmm6,xmm7
|
|
call __aesni_decrypt6
|
|
movaps xmm1,XMMWORD PTR 64[esp]
|
|
xorps xmm2,XMMWORD PTR [esp]
|
|
xorps xmm3,XMMWORD PTR 16[esp]
|
|
xorps xmm4,XMMWORD PTR 32[esp]
|
|
movups XMMWORD PTR [edi],xmm2
|
|
xorps xmm5,XMMWORD PTR 48[esp]
|
|
movups XMMWORD PTR 16[edi],xmm3
|
|
xorps xmm6,xmm1
|
|
movups XMMWORD PTR 32[edi],xmm4
|
|
movups XMMWORD PTR 48[edi],xmm5
|
|
movups XMMWORD PTR 64[edi],xmm6
|
|
lea edi,DWORD PTR 80[edi]
|
|
jmp $L067xts_dec_done
|
|
ALIGN 16
|
|
$L063xts_dec_one:
|
|
movups xmm2,XMMWORD PTR [esi]
|
|
lea esi,DWORD PTR 16[esi]
|
|
xorps xmm2,xmm5
|
|
movups xmm0,XMMWORD PTR [edx]
|
|
movups xmm1,XMMWORD PTR 16[edx]
|
|
lea edx,DWORD PTR 32[edx]
|
|
xorps xmm2,xmm0
|
|
$L068dec1_loop_12:
|
|
DB 102,15,56,222,209
|
|
dec ecx
|
|
movups xmm1,XMMWORD PTR [edx]
|
|
lea edx,DWORD PTR 16[edx]
|
|
jnz $L068dec1_loop_12
|
|
DB 102,15,56,223,209
|
|
xorps xmm2,xmm5
|
|
movups XMMWORD PTR [edi],xmm2
|
|
lea edi,DWORD PTR 16[edi]
|
|
movdqa xmm1,xmm5
|
|
jmp $L067xts_dec_done
|
|
ALIGN 16
|
|
$L064xts_dec_two:
|
|
movaps xmm6,xmm1
|
|
movups xmm2,XMMWORD PTR [esi]
|
|
movups xmm3,XMMWORD PTR 16[esi]
|
|
lea esi,DWORD PTR 32[esi]
|
|
xorps xmm2,xmm5
|
|
xorps xmm3,xmm6
|
|
call __aesni_decrypt2
|
|
xorps xmm2,xmm5
|
|
xorps xmm3,xmm6
|
|
movups XMMWORD PTR [edi],xmm2
|
|
movups XMMWORD PTR 16[edi],xmm3
|
|
lea edi,DWORD PTR 32[edi]
|
|
movdqa xmm1,xmm6
|
|
jmp $L067xts_dec_done
|
|
ALIGN 16
|
|
$L065xts_dec_three:
|
|
movaps xmm7,xmm1
|
|
movups xmm2,XMMWORD PTR [esi]
|
|
movups xmm3,XMMWORD PTR 16[esi]
|
|
movups xmm4,XMMWORD PTR 32[esi]
|
|
lea esi,DWORD PTR 48[esi]
|
|
xorps xmm2,xmm5
|
|
xorps xmm3,xmm6
|
|
xorps xmm4,xmm7
|
|
call __aesni_decrypt3
|
|
xorps xmm2,xmm5
|
|
xorps xmm3,xmm6
|
|
xorps xmm4,xmm7
|
|
movups XMMWORD PTR [edi],xmm2
|
|
movups XMMWORD PTR 16[edi],xmm3
|
|
movups XMMWORD PTR 32[edi],xmm4
|
|
lea edi,DWORD PTR 48[edi]
|
|
movdqa xmm1,xmm7
|
|
jmp $L067xts_dec_done
|
|
ALIGN 16
|
|
$L066xts_dec_four:
|
|
movaps xmm6,xmm1
|
|
movups xmm2,XMMWORD PTR [esi]
|
|
movups xmm3,XMMWORD PTR 16[esi]
|
|
movups xmm4,XMMWORD PTR 32[esi]
|
|
xorps xmm2,XMMWORD PTR [esp]
|
|
movups xmm5,XMMWORD PTR 48[esi]
|
|
lea esi,DWORD PTR 64[esi]
|
|
xorps xmm3,XMMWORD PTR 16[esp]
|
|
xorps xmm4,xmm7
|
|
xorps xmm5,xmm6
|
|
call __aesni_decrypt4
|
|
xorps xmm2,XMMWORD PTR [esp]
|
|
xorps xmm3,XMMWORD PTR 16[esp]
|
|
xorps xmm4,xmm7
|
|
movups XMMWORD PTR [edi],xmm2
|
|
xorps xmm5,xmm6
|
|
movups XMMWORD PTR 16[edi],xmm3
|
|
movups XMMWORD PTR 32[edi],xmm4
|
|
movups XMMWORD PTR 48[edi],xmm5
|
|
lea edi,DWORD PTR 64[edi]
|
|
movdqa xmm1,xmm6
|
|
jmp $L067xts_dec_done
|
|
ALIGN 16
|
|
$L062xts_dec_done6x:
|
|
mov eax,DWORD PTR 112[esp]
|
|
and eax,15
|
|
jz $L069xts_dec_ret
|
|
mov DWORD PTR 112[esp],eax
|
|
jmp $L070xts_dec_only_one_more
|
|
ALIGN 16
|
|
$L067xts_dec_done:
|
|
mov eax,DWORD PTR 112[esp]
|
|
pxor xmm0,xmm0
|
|
and eax,15
|
|
jz $L069xts_dec_ret
|
|
pcmpgtd xmm0,xmm1
|
|
mov DWORD PTR 112[esp],eax
|
|
pshufd xmm2,xmm0,19
|
|
pxor xmm0,xmm0
|
|
movdqa xmm3,XMMWORD PTR 96[esp]
|
|
paddq xmm1,xmm1
|
|
pand xmm2,xmm3
|
|
pcmpgtd xmm0,xmm1
|
|
pxor xmm1,xmm2
|
|
$L070xts_dec_only_one_more:
|
|
pshufd xmm5,xmm0,19
|
|
movdqa xmm6,xmm1
|
|
paddq xmm1,xmm1
|
|
pand xmm5,xmm3
|
|
pxor xmm5,xmm1
|
|
mov edx,ebp
|
|
mov ecx,ebx
|
|
movups xmm2,XMMWORD PTR [esi]
|
|
xorps xmm2,xmm5
|
|
movups xmm0,XMMWORD PTR [edx]
|
|
movups xmm1,XMMWORD PTR 16[edx]
|
|
lea edx,DWORD PTR 32[edx]
|
|
xorps xmm2,xmm0
|
|
$L071dec1_loop_13:
|
|
DB 102,15,56,222,209
|
|
dec ecx
|
|
movups xmm1,XMMWORD PTR [edx]
|
|
lea edx,DWORD PTR 16[edx]
|
|
jnz $L071dec1_loop_13
|
|
DB 102,15,56,223,209
|
|
xorps xmm2,xmm5
|
|
movups XMMWORD PTR [edi],xmm2
|
|
$L072xts_dec_steal:
|
|
movzx ecx,BYTE PTR 16[esi]
|
|
movzx edx,BYTE PTR [edi]
|
|
lea esi,DWORD PTR 1[esi]
|
|
mov BYTE PTR [edi],cl
|
|
mov BYTE PTR 16[edi],dl
|
|
lea edi,DWORD PTR 1[edi]
|
|
sub eax,1
|
|
jnz $L072xts_dec_steal
|
|
sub edi,DWORD PTR 112[esp]
|
|
mov edx,ebp
|
|
mov ecx,ebx
|
|
movups xmm2,XMMWORD PTR [edi]
|
|
xorps xmm2,xmm6
|
|
movups xmm0,XMMWORD PTR [edx]
|
|
movups xmm1,XMMWORD PTR 16[edx]
|
|
lea edx,DWORD PTR 32[edx]
|
|
xorps xmm2,xmm0
|
|
$L073dec1_loop_14:
|
|
DB 102,15,56,222,209
|
|
dec ecx
|
|
movups xmm1,XMMWORD PTR [edx]
|
|
lea edx,DWORD PTR 16[edx]
|
|
jnz $L073dec1_loop_14
|
|
DB 102,15,56,223,209
|
|
xorps xmm2,xmm6
|
|
movups XMMWORD PTR [edi],xmm2
|
|
$L069xts_dec_ret:
|
|
pxor xmm0,xmm0
|
|
pxor xmm1,xmm1
|
|
pxor xmm2,xmm2
|
|
movdqa XMMWORD PTR [esp],xmm0
|
|
pxor xmm3,xmm3
|
|
movdqa XMMWORD PTR 16[esp],xmm0
|
|
pxor xmm4,xmm4
|
|
movdqa XMMWORD PTR 32[esp],xmm0
|
|
pxor xmm5,xmm5
|
|
movdqa XMMWORD PTR 48[esp],xmm0
|
|
pxor xmm6,xmm6
|
|
movdqa XMMWORD PTR 64[esp],xmm0
|
|
pxor xmm7,xmm7
|
|
movdqa XMMWORD PTR 80[esp],xmm0
|
|
mov esp,DWORD PTR 116[esp]
|
|
pop edi
|
|
pop esi
|
|
pop ebx
|
|
pop ebp
|
|
ret
|
|
_aesni_xts_decrypt ENDP
|
|
ALIGN 16
|
|
_aesni_cbc_encrypt PROC PUBLIC
|
|
$L_aesni_cbc_encrypt_begin::
|
|
push ebp
|
|
push ebx
|
|
push esi
|
|
push edi
|
|
mov esi,DWORD PTR 20[esp]
|
|
mov ebx,esp
|
|
mov edi,DWORD PTR 24[esp]
|
|
sub ebx,24
|
|
mov eax,DWORD PTR 28[esp]
|
|
and ebx,-16
|
|
mov edx,DWORD PTR 32[esp]
|
|
mov ebp,DWORD PTR 36[esp]
|
|
test eax,eax
|
|
jz $L074cbc_abort
|
|
cmp DWORD PTR 40[esp],0
|
|
xchg ebx,esp
|
|
movups xmm7,XMMWORD PTR [ebp]
|
|
mov ecx,DWORD PTR 240[edx]
|
|
mov ebp,edx
|
|
mov DWORD PTR 16[esp],ebx
|
|
mov ebx,ecx
|
|
je $L075cbc_decrypt
|
|
movaps xmm2,xmm7
|
|
cmp eax,16
|
|
jb $L076cbc_enc_tail
|
|
sub eax,16
|
|
jmp $L077cbc_enc_loop
|
|
ALIGN 16
|
|
$L077cbc_enc_loop:
|
|
movups xmm7,XMMWORD PTR [esi]
|
|
lea esi,DWORD PTR 16[esi]
|
|
movups xmm0,XMMWORD PTR [edx]
|
|
movups xmm1,XMMWORD PTR 16[edx]
|
|
xorps xmm7,xmm0
|
|
lea edx,DWORD PTR 32[edx]
|
|
xorps xmm2,xmm7
|
|
$L078enc1_loop_15:
|
|
DB 102,15,56,220,209
|
|
dec ecx
|
|
movups xmm1,XMMWORD PTR [edx]
|
|
lea edx,DWORD PTR 16[edx]
|
|
jnz $L078enc1_loop_15
|
|
DB 102,15,56,221,209
|
|
mov ecx,ebx
|
|
mov edx,ebp
|
|
movups XMMWORD PTR [edi],xmm2
|
|
lea edi,DWORD PTR 16[edi]
|
|
sub eax,16
|
|
jnc $L077cbc_enc_loop
|
|
add eax,16
|
|
jnz $L076cbc_enc_tail
|
|
movaps xmm7,xmm2
|
|
pxor xmm2,xmm2
|
|
jmp $L079cbc_ret
|
|
$L076cbc_enc_tail:
|
|
mov ecx,eax
|
|
DD 2767451785
|
|
mov ecx,16
|
|
sub ecx,eax
|
|
xor eax,eax
|
|
DD 2868115081
|
|
lea edi,DWORD PTR [edi-16]
|
|
mov ecx,ebx
|
|
mov esi,edi
|
|
mov edx,ebp
|
|
jmp $L077cbc_enc_loop
|
|
ALIGN 16
|
|
$L075cbc_decrypt:
|
|
cmp eax,80
|
|
jbe $L080cbc_dec_tail
|
|
movaps XMMWORD PTR [esp],xmm7
|
|
sub eax,80
|
|
jmp $L081cbc_dec_loop6_enter
|
|
ALIGN 16
|
|
$L082cbc_dec_loop6:
|
|
movaps XMMWORD PTR [esp],xmm0
|
|
movups XMMWORD PTR [edi],xmm7
|
|
lea edi,DWORD PTR 16[edi]
|
|
$L081cbc_dec_loop6_enter:
|
|
movdqu xmm2,XMMWORD PTR [esi]
|
|
movdqu xmm3,XMMWORD PTR 16[esi]
|
|
movdqu xmm4,XMMWORD PTR 32[esi]
|
|
movdqu xmm5,XMMWORD PTR 48[esi]
|
|
movdqu xmm6,XMMWORD PTR 64[esi]
|
|
movdqu xmm7,XMMWORD PTR 80[esi]
|
|
call __aesni_decrypt6
|
|
movups xmm1,XMMWORD PTR [esi]
|
|
movups xmm0,XMMWORD PTR 16[esi]
|
|
xorps xmm2,XMMWORD PTR [esp]
|
|
xorps xmm3,xmm1
|
|
movups xmm1,XMMWORD PTR 32[esi]
|
|
xorps xmm4,xmm0
|
|
movups xmm0,XMMWORD PTR 48[esi]
|
|
xorps xmm5,xmm1
|
|
movups xmm1,XMMWORD PTR 64[esi]
|
|
xorps xmm6,xmm0
|
|
movups xmm0,XMMWORD PTR 80[esi]
|
|
xorps xmm7,xmm1
|
|
movups XMMWORD PTR [edi],xmm2
|
|
movups XMMWORD PTR 16[edi],xmm3
|
|
lea esi,DWORD PTR 96[esi]
|
|
movups XMMWORD PTR 32[edi],xmm4
|
|
mov ecx,ebx
|
|
movups XMMWORD PTR 48[edi],xmm5
|
|
mov edx,ebp
|
|
movups XMMWORD PTR 64[edi],xmm6
|
|
lea edi,DWORD PTR 80[edi]
|
|
sub eax,96
|
|
ja $L082cbc_dec_loop6
|
|
movaps xmm2,xmm7
|
|
movaps xmm7,xmm0
|
|
add eax,80
|
|
jle $L083cbc_dec_clear_tail_collected
|
|
movups XMMWORD PTR [edi],xmm2
|
|
lea edi,DWORD PTR 16[edi]
|
|
$L080cbc_dec_tail:
|
|
movups xmm2,XMMWORD PTR [esi]
|
|
movaps xmm6,xmm2
|
|
cmp eax,16
|
|
jbe $L084cbc_dec_one
|
|
movups xmm3,XMMWORD PTR 16[esi]
|
|
movaps xmm5,xmm3
|
|
cmp eax,32
|
|
jbe $L085cbc_dec_two
|
|
movups xmm4,XMMWORD PTR 32[esi]
|
|
cmp eax,48
|
|
jbe $L086cbc_dec_three
|
|
movups xmm5,XMMWORD PTR 48[esi]
|
|
cmp eax,64
|
|
jbe $L087cbc_dec_four
|
|
movups xmm6,XMMWORD PTR 64[esi]
|
|
movaps XMMWORD PTR [esp],xmm7
|
|
movups xmm2,XMMWORD PTR [esi]
|
|
xorps xmm7,xmm7
|
|
call __aesni_decrypt6
|
|
movups xmm1,XMMWORD PTR [esi]
|
|
movups xmm0,XMMWORD PTR 16[esi]
|
|
xorps xmm2,XMMWORD PTR [esp]
|
|
xorps xmm3,xmm1
|
|
movups xmm1,XMMWORD PTR 32[esi]
|
|
xorps xmm4,xmm0
|
|
movups xmm0,XMMWORD PTR 48[esi]
|
|
xorps xmm5,xmm1
|
|
movups xmm7,XMMWORD PTR 64[esi]
|
|
xorps xmm6,xmm0
|
|
movups XMMWORD PTR [edi],xmm2
|
|
movups XMMWORD PTR 16[edi],xmm3
|
|
pxor xmm3,xmm3
|
|
movups XMMWORD PTR 32[edi],xmm4
|
|
pxor xmm4,xmm4
|
|
movups XMMWORD PTR 48[edi],xmm5
|
|
pxor xmm5,xmm5
|
|
lea edi,DWORD PTR 64[edi]
|
|
movaps xmm2,xmm6
|
|
pxor xmm6,xmm6
|
|
sub eax,80
|
|
jmp $L088cbc_dec_tail_collected
|
|
ALIGN 16
|
|
$L084cbc_dec_one:
|
|
movups xmm0,XMMWORD PTR [edx]
|
|
movups xmm1,XMMWORD PTR 16[edx]
|
|
lea edx,DWORD PTR 32[edx]
|
|
xorps xmm2,xmm0
|
|
$L089dec1_loop_16:
|
|
DB 102,15,56,222,209
|
|
dec ecx
|
|
movups xmm1,XMMWORD PTR [edx]
|
|
lea edx,DWORD PTR 16[edx]
|
|
jnz $L089dec1_loop_16
|
|
DB 102,15,56,223,209
|
|
xorps xmm2,xmm7
|
|
movaps xmm7,xmm6
|
|
sub eax,16
|
|
jmp $L088cbc_dec_tail_collected
|
|
ALIGN 16
|
|
$L085cbc_dec_two:
|
|
call __aesni_decrypt2
|
|
xorps xmm2,xmm7
|
|
xorps xmm3,xmm6
|
|
movups XMMWORD PTR [edi],xmm2
|
|
movaps xmm2,xmm3
|
|
pxor xmm3,xmm3
|
|
lea edi,DWORD PTR 16[edi]
|
|
movaps xmm7,xmm5
|
|
sub eax,32
|
|
jmp $L088cbc_dec_tail_collected
|
|
ALIGN 16
|
|
$L086cbc_dec_three:
|
|
call __aesni_decrypt3
|
|
xorps xmm2,xmm7
|
|
xorps xmm3,xmm6
|
|
xorps xmm4,xmm5
|
|
movups XMMWORD PTR [edi],xmm2
|
|
movaps xmm2,xmm4
|
|
pxor xmm4,xmm4
|
|
movups XMMWORD PTR 16[edi],xmm3
|
|
pxor xmm3,xmm3
|
|
lea edi,DWORD PTR 32[edi]
|
|
movups xmm7,XMMWORD PTR 32[esi]
|
|
sub eax,48
|
|
jmp $L088cbc_dec_tail_collected
|
|
ALIGN 16
|
|
$L087cbc_dec_four:
|
|
call __aesni_decrypt4
|
|
movups xmm1,XMMWORD PTR 16[esi]
|
|
movups xmm0,XMMWORD PTR 32[esi]
|
|
xorps xmm2,xmm7
|
|
movups xmm7,XMMWORD PTR 48[esi]
|
|
xorps xmm3,xmm6
|
|
movups XMMWORD PTR [edi],xmm2
|
|
xorps xmm4,xmm1
|
|
movups XMMWORD PTR 16[edi],xmm3
|
|
pxor xmm3,xmm3
|
|
xorps xmm5,xmm0
|
|
movups XMMWORD PTR 32[edi],xmm4
|
|
pxor xmm4,xmm4
|
|
lea edi,DWORD PTR 48[edi]
|
|
movaps xmm2,xmm5
|
|
pxor xmm5,xmm5
|
|
sub eax,64
|
|
jmp $L088cbc_dec_tail_collected
|
|
ALIGN 16
|
|
$L083cbc_dec_clear_tail_collected:
|
|
pxor xmm3,xmm3
|
|
pxor xmm4,xmm4
|
|
pxor xmm5,xmm5
|
|
pxor xmm6,xmm6
|
|
$L088cbc_dec_tail_collected:
|
|
and eax,15
|
|
jnz $L090cbc_dec_tail_partial
|
|
movups XMMWORD PTR [edi],xmm2
|
|
pxor xmm0,xmm0
|
|
jmp $L079cbc_ret
|
|
ALIGN 16
|
|
$L090cbc_dec_tail_partial:
|
|
movaps XMMWORD PTR [esp],xmm2
|
|
pxor xmm0,xmm0
|
|
mov ecx,16
|
|
mov esi,esp
|
|
sub ecx,eax
|
|
DD 2767451785
|
|
movdqa XMMWORD PTR [esp],xmm2
|
|
$L079cbc_ret:
|
|
mov esp,DWORD PTR 16[esp]
|
|
mov ebp,DWORD PTR 36[esp]
|
|
pxor xmm2,xmm2
|
|
pxor xmm1,xmm1
|
|
movups XMMWORD PTR [ebp],xmm7
|
|
pxor xmm7,xmm7
|
|
$L074cbc_abort:
|
|
pop edi
|
|
pop esi
|
|
pop ebx
|
|
pop ebp
|
|
ret
|
|
_aesni_cbc_encrypt ENDP
|
|
ALIGN 16
|
|
__aesni_set_encrypt_key PROC PRIVATE
|
|
push ebp
|
|
push ebx
|
|
test eax,eax
|
|
jz $L091bad_pointer
|
|
test edx,edx
|
|
jz $L091bad_pointer
|
|
call $L092pic
|
|
$L092pic:
|
|
pop ebx
|
|
lea ebx,DWORD PTR ($Lkey_const-$L092pic)[ebx]
|
|
lea ebp,DWORD PTR _OPENSSL_ia32cap_P
|
|
movups xmm0,XMMWORD PTR [eax]
|
|
xorps xmm4,xmm4
|
|
mov ebp,DWORD PTR 4[ebp]
|
|
lea edx,DWORD PTR 16[edx]
|
|
and ebp,268437504
|
|
cmp ecx,256
|
|
je $L09314rounds
|
|
cmp ecx,192
|
|
je $L09412rounds
|
|
cmp ecx,128
|
|
jne $L095bad_keybits
|
|
ALIGN 16
|
|
$L09610rounds:
|
|
cmp ebp,268435456
|
|
je $L09710rounds_alt
|
|
mov ecx,9
|
|
movups XMMWORD PTR [edx-16],xmm0
|
|
DB 102,15,58,223,200,1
|
|
call $L098key_128_cold
|
|
DB 102,15,58,223,200,2
|
|
call $L099key_128
|
|
DB 102,15,58,223,200,4
|
|
call $L099key_128
|
|
DB 102,15,58,223,200,8
|
|
call $L099key_128
|
|
DB 102,15,58,223,200,16
|
|
call $L099key_128
|
|
DB 102,15,58,223,200,32
|
|
call $L099key_128
|
|
DB 102,15,58,223,200,64
|
|
call $L099key_128
|
|
DB 102,15,58,223,200,128
|
|
call $L099key_128
|
|
DB 102,15,58,223,200,27
|
|
call $L099key_128
|
|
DB 102,15,58,223,200,54
|
|
call $L099key_128
|
|
movups XMMWORD PTR [edx],xmm0
|
|
mov DWORD PTR 80[edx],ecx
|
|
jmp $L100good_key
|
|
ALIGN 16
|
|
$L099key_128:
|
|
movups XMMWORD PTR [edx],xmm0
|
|
lea edx,DWORD PTR 16[edx]
|
|
$L098key_128_cold:
|
|
shufps xmm4,xmm0,16
|
|
xorps xmm0,xmm4
|
|
shufps xmm4,xmm0,140
|
|
xorps xmm0,xmm4
|
|
shufps xmm1,xmm1,255
|
|
xorps xmm0,xmm1
|
|
ret
|
|
ALIGN 16
|
|
$L09710rounds_alt:
|
|
movdqa xmm5,XMMWORD PTR [ebx]
|
|
mov ecx,8
|
|
movdqa xmm4,XMMWORD PTR 32[ebx]
|
|
movdqa xmm2,xmm0
|
|
movdqu XMMWORD PTR [edx-16],xmm0
|
|
$L101loop_key128:
|
|
DB 102,15,56,0,197
|
|
DB 102,15,56,221,196
|
|
pslld xmm4,1
|
|
lea edx,DWORD PTR 16[edx]
|
|
movdqa xmm3,xmm2
|
|
pslldq xmm2,4
|
|
pxor xmm3,xmm2
|
|
pslldq xmm2,4
|
|
pxor xmm3,xmm2
|
|
pslldq xmm2,4
|
|
pxor xmm2,xmm3
|
|
pxor xmm0,xmm2
|
|
movdqu XMMWORD PTR [edx-16],xmm0
|
|
movdqa xmm2,xmm0
|
|
dec ecx
|
|
jnz $L101loop_key128
|
|
movdqa xmm4,XMMWORD PTR 48[ebx]
|
|
DB 102,15,56,0,197
|
|
DB 102,15,56,221,196
|
|
pslld xmm4,1
|
|
movdqa xmm3,xmm2
|
|
pslldq xmm2,4
|
|
pxor xmm3,xmm2
|
|
pslldq xmm2,4
|
|
pxor xmm3,xmm2
|
|
pslldq xmm2,4
|
|
pxor xmm2,xmm3
|
|
pxor xmm0,xmm2
|
|
movdqu XMMWORD PTR [edx],xmm0
|
|
movdqa xmm2,xmm0
|
|
DB 102,15,56,0,197
|
|
DB 102,15,56,221,196
|
|
movdqa xmm3,xmm2
|
|
pslldq xmm2,4
|
|
pxor xmm3,xmm2
|
|
pslldq xmm2,4
|
|
pxor xmm3,xmm2
|
|
pslldq xmm2,4
|
|
pxor xmm2,xmm3
|
|
pxor xmm0,xmm2
|
|
movdqu XMMWORD PTR 16[edx],xmm0
|
|
mov ecx,9
|
|
mov DWORD PTR 96[edx],ecx
|
|
jmp $L100good_key
|
|
ALIGN 16
|
|
$L09412rounds:
|
|
movq xmm2,QWORD PTR 16[eax]
|
|
cmp ebp,268435456
|
|
je $L10212rounds_alt
|
|
mov ecx,11
|
|
movups XMMWORD PTR [edx-16],xmm0
|
|
DB 102,15,58,223,202,1
|
|
call $L103key_192a_cold
|
|
DB 102,15,58,223,202,2
|
|
call $L104key_192b
|
|
DB 102,15,58,223,202,4
|
|
call $L105key_192a
|
|
DB 102,15,58,223,202,8
|
|
call $L104key_192b
|
|
DB 102,15,58,223,202,16
|
|
call $L105key_192a
|
|
DB 102,15,58,223,202,32
|
|
call $L104key_192b
|
|
DB 102,15,58,223,202,64
|
|
call $L105key_192a
|
|
DB 102,15,58,223,202,128
|
|
call $L104key_192b
|
|
movups XMMWORD PTR [edx],xmm0
|
|
mov DWORD PTR 48[edx],ecx
|
|
jmp $L100good_key
|
|
ALIGN 16
|
|
$L105key_192a:
|
|
movups XMMWORD PTR [edx],xmm0
|
|
lea edx,DWORD PTR 16[edx]
|
|
ALIGN 16
|
|
$L103key_192a_cold:
|
|
movaps xmm5,xmm2
|
|
$L106key_192b_warm:
|
|
shufps xmm4,xmm0,16
|
|
movdqa xmm3,xmm2
|
|
xorps xmm0,xmm4
|
|
shufps xmm4,xmm0,140
|
|
pslldq xmm3,4
|
|
xorps xmm0,xmm4
|
|
pshufd xmm1,xmm1,85
|
|
pxor xmm2,xmm3
|
|
pxor xmm0,xmm1
|
|
pshufd xmm3,xmm0,255
|
|
pxor xmm2,xmm3
|
|
ret
|
|
ALIGN 16
|
|
$L104key_192b:
|
|
movaps xmm3,xmm0
|
|
shufps xmm5,xmm0,68
|
|
movups XMMWORD PTR [edx],xmm5
|
|
shufps xmm3,xmm2,78
|
|
movups XMMWORD PTR 16[edx],xmm3
|
|
lea edx,DWORD PTR 32[edx]
|
|
jmp $L106key_192b_warm
|
|
ALIGN 16
|
|
$L10212rounds_alt:
|
|
movdqa xmm5,XMMWORD PTR 16[ebx]
|
|
movdqa xmm4,XMMWORD PTR 32[ebx]
|
|
mov ecx,8
|
|
movdqu XMMWORD PTR [edx-16],xmm0
|
|
$L107loop_key192:
|
|
movq QWORD PTR [edx],xmm2
|
|
movdqa xmm1,xmm2
|
|
DB 102,15,56,0,213
|
|
DB 102,15,56,221,212
|
|
pslld xmm4,1
|
|
lea edx,DWORD PTR 24[edx]
|
|
movdqa xmm3,xmm0
|
|
pslldq xmm0,4
|
|
pxor xmm3,xmm0
|
|
pslldq xmm0,4
|
|
pxor xmm3,xmm0
|
|
pslldq xmm0,4
|
|
pxor xmm0,xmm3
|
|
pshufd xmm3,xmm0,255
|
|
pxor xmm3,xmm1
|
|
pslldq xmm1,4
|
|
pxor xmm3,xmm1
|
|
pxor xmm0,xmm2
|
|
pxor xmm2,xmm3
|
|
movdqu XMMWORD PTR [edx-16],xmm0
|
|
dec ecx
|
|
jnz $L107loop_key192
|
|
mov ecx,11
|
|
mov DWORD PTR 32[edx],ecx
|
|
jmp $L100good_key
|
|
ALIGN 16
|
|
$L09314rounds:
|
|
movups xmm2,XMMWORD PTR 16[eax]
|
|
lea edx,DWORD PTR 16[edx]
|
|
cmp ebp,268435456
|
|
je $L10814rounds_alt
|
|
mov ecx,13
|
|
movups XMMWORD PTR [edx-32],xmm0
|
|
movups XMMWORD PTR [edx-16],xmm2
|
|
DB 102,15,58,223,202,1
|
|
call $L109key_256a_cold
|
|
DB 102,15,58,223,200,1
|
|
call $L110key_256b
|
|
DB 102,15,58,223,202,2
|
|
call $L111key_256a
|
|
DB 102,15,58,223,200,2
|
|
call $L110key_256b
|
|
DB 102,15,58,223,202,4
|
|
call $L111key_256a
|
|
DB 102,15,58,223,200,4
|
|
call $L110key_256b
|
|
DB 102,15,58,223,202,8
|
|
call $L111key_256a
|
|
DB 102,15,58,223,200,8
|
|
call $L110key_256b
|
|
DB 102,15,58,223,202,16
|
|
call $L111key_256a
|
|
DB 102,15,58,223,200,16
|
|
call $L110key_256b
|
|
DB 102,15,58,223,202,32
|
|
call $L111key_256a
|
|
DB 102,15,58,223,200,32
|
|
call $L110key_256b
|
|
DB 102,15,58,223,202,64
|
|
call $L111key_256a
|
|
movups XMMWORD PTR [edx],xmm0
|
|
mov DWORD PTR 16[edx],ecx
|
|
xor eax,eax
|
|
jmp $L100good_key
|
|
ALIGN 16
|
|
$L111key_256a:
|
|
movups XMMWORD PTR [edx],xmm2
|
|
lea edx,DWORD PTR 16[edx]
|
|
$L109key_256a_cold:
|
|
shufps xmm4,xmm0,16
|
|
xorps xmm0,xmm4
|
|
shufps xmm4,xmm0,140
|
|
xorps xmm0,xmm4
|
|
shufps xmm1,xmm1,255
|
|
xorps xmm0,xmm1
|
|
ret
|
|
ALIGN 16
|
|
$L110key_256b:
|
|
movups XMMWORD PTR [edx],xmm0
|
|
lea edx,DWORD PTR 16[edx]
|
|
shufps xmm4,xmm2,16
|
|
xorps xmm2,xmm4
|
|
shufps xmm4,xmm2,140
|
|
xorps xmm2,xmm4
|
|
shufps xmm1,xmm1,170
|
|
xorps xmm2,xmm1
|
|
ret
|
|
ALIGN 16
|
|
$L10814rounds_alt:
|
|
movdqa xmm5,XMMWORD PTR [ebx]
|
|
movdqa xmm4,XMMWORD PTR 32[ebx]
|
|
mov ecx,7
|
|
movdqu XMMWORD PTR [edx-32],xmm0
|
|
movdqa xmm1,xmm2
|
|
movdqu XMMWORD PTR [edx-16],xmm2
|
|
$L112loop_key256:
|
|
DB 102,15,56,0,213
|
|
DB 102,15,56,221,212
|
|
movdqa xmm3,xmm0
|
|
pslldq xmm0,4
|
|
pxor xmm3,xmm0
|
|
pslldq xmm0,4
|
|
pxor xmm3,xmm0
|
|
pslldq xmm0,4
|
|
pxor xmm0,xmm3
|
|
pslld xmm4,1
|
|
pxor xmm0,xmm2
|
|
movdqu XMMWORD PTR [edx],xmm0
|
|
dec ecx
|
|
jz $L113done_key256
|
|
pshufd xmm2,xmm0,255
|
|
pxor xmm3,xmm3
|
|
DB 102,15,56,221,211
|
|
movdqa xmm3,xmm1
|
|
pslldq xmm1,4
|
|
pxor xmm3,xmm1
|
|
pslldq xmm1,4
|
|
pxor xmm3,xmm1
|
|
pslldq xmm1,4
|
|
pxor xmm1,xmm3
|
|
pxor xmm2,xmm1
|
|
movdqu XMMWORD PTR 16[edx],xmm2
|
|
lea edx,DWORD PTR 32[edx]
|
|
movdqa xmm1,xmm2
|
|
jmp $L112loop_key256
|
|
$L113done_key256:
|
|
mov ecx,13
|
|
mov DWORD PTR 16[edx],ecx
|
|
$L100good_key:
|
|
pxor xmm0,xmm0
|
|
pxor xmm1,xmm1
|
|
pxor xmm2,xmm2
|
|
pxor xmm3,xmm3
|
|
pxor xmm4,xmm4
|
|
pxor xmm5,xmm5
|
|
xor eax,eax
|
|
pop ebx
|
|
pop ebp
|
|
ret
|
|
ALIGN 4
|
|
$L091bad_pointer:
|
|
mov eax,-1
|
|
pop ebx
|
|
pop ebp
|
|
ret
|
|
ALIGN 4
|
|
$L095bad_keybits:
|
|
pxor xmm0,xmm0
|
|
mov eax,-2
|
|
pop ebx
|
|
pop ebp
|
|
ret
|
|
__aesni_set_encrypt_key ENDP
|
|
ALIGN 16
|
|
_aesni_set_encrypt_key PROC PUBLIC
|
|
$L_aesni_set_encrypt_key_begin::
|
|
mov eax,DWORD PTR 4[esp]
|
|
mov ecx,DWORD PTR 8[esp]
|
|
mov edx,DWORD PTR 12[esp]
|
|
call __aesni_set_encrypt_key
|
|
ret
|
|
_aesni_set_encrypt_key ENDP
|
|
ALIGN 16
|
|
_aesni_set_decrypt_key PROC PUBLIC
|
|
$L_aesni_set_decrypt_key_begin::
|
|
mov eax,DWORD PTR 4[esp]
|
|
mov ecx,DWORD PTR 8[esp]
|
|
mov edx,DWORD PTR 12[esp]
|
|
call __aesni_set_encrypt_key
|
|
mov edx,DWORD PTR 12[esp]
|
|
shl ecx,4
|
|
test eax,eax
|
|
jnz $L114dec_key_ret
|
|
lea eax,DWORD PTR 16[ecx*1+edx]
|
|
movups xmm0,XMMWORD PTR [edx]
|
|
movups xmm1,XMMWORD PTR [eax]
|
|
movups XMMWORD PTR [eax],xmm0
|
|
movups XMMWORD PTR [edx],xmm1
|
|
lea edx,DWORD PTR 16[edx]
|
|
lea eax,DWORD PTR [eax-16]
|
|
$L115dec_key_inverse:
|
|
movups xmm0,XMMWORD PTR [edx]
|
|
movups xmm1,XMMWORD PTR [eax]
|
|
DB 102,15,56,219,192
|
|
DB 102,15,56,219,201
|
|
lea edx,DWORD PTR 16[edx]
|
|
lea eax,DWORD PTR [eax-16]
|
|
movups XMMWORD PTR 16[eax],xmm0
|
|
movups XMMWORD PTR [edx-16],xmm1
|
|
cmp eax,edx
|
|
ja $L115dec_key_inverse
|
|
movups xmm0,XMMWORD PTR [edx]
|
|
DB 102,15,56,219,192
|
|
movups XMMWORD PTR [edx],xmm0
|
|
pxor xmm0,xmm0
|
|
pxor xmm1,xmm1
|
|
xor eax,eax
|
|
$L114dec_key_ret:
|
|
ret
|
|
_aesni_set_decrypt_key ENDP
|
|
ALIGN 64
|
|
$Lkey_const::
|
|
DD 202313229,202313229,202313229,202313229
|
|
DD 67569157,67569157,67569157,67569157
|
|
DD 1,1,1,1
|
|
DD 27,27,27,27
|
|
DB 65,69,83,32,102,111,114,32,73,110,116,101,108,32,65,69
|
|
DB 83,45,78,73,44,32,67,82,89,80,84,79,71,65,77,83
|
|
DB 32,98,121,32,60,97,112,112,114,111,64,111,112,101,110,115
|
|
DB 115,108,46,111,114,103,62,0
|
|
.text$ ENDS
|
|
.bss SEGMENT 'BSS'
|
|
COMM _OPENSSL_ia32cap_P:DWORD:4
|
|
.bss ENDS
|
|
END
|
|
|